diff --git "a/checkpoint-85000/trainer_state.json" "b/checkpoint-85000/trainer_state.json" new file mode 100644--- /dev/null +++ "b/checkpoint-85000/trainer_state.json" @@ -0,0 +1,510019 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 2.17859339758048, + "eval_steps": 500, + "global_step": 85000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 1.7079419299743807e-09, + "loss": 2.8359, + "step": 1 + }, + { + "epoch": 0.0, + "learning_rate": 3.4158838599487614e-09, + "loss": 2.4531, + "step": 2 + }, + { + "epoch": 0.0, + "learning_rate": 5.123825789923143e-09, + "loss": 2.2266, + "step": 3 + }, + { + "epoch": 0.0, + "learning_rate": 6.831767719897523e-09, + "loss": 2.5566, + "step": 4 + }, + { + "epoch": 0.0, + "learning_rate": 8.539709649871904e-09, + "loss": 2.7461, + "step": 5 + }, + { + "epoch": 0.0, + "learning_rate": 1.0247651579846285e-08, + "loss": 2.5, + "step": 6 + }, + { + "epoch": 0.0, + "learning_rate": 1.1955593509820665e-08, + "loss": 2.4414, + "step": 7 + }, + { + "epoch": 0.0, + "learning_rate": 1.3663535439795045e-08, + "loss": 2.5781, + "step": 8 + }, + { + "epoch": 0.0, + "learning_rate": 1.5371477369769426e-08, + "loss": 2.8516, + "step": 9 + }, + { + "epoch": 0.0, + "learning_rate": 1.707941929974381e-08, + "loss": 2.3164, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 1.8787361229718188e-08, + "loss": 2.6289, + "step": 11 + }, + { + "epoch": 0.0, + "learning_rate": 2.049530315969257e-08, + "loss": 2.1953, + "step": 12 + }, + { + "epoch": 0.0, + "learning_rate": 2.220324508966695e-08, + "loss": 2.8398, + "step": 13 + }, + { + "epoch": 0.0, + "learning_rate": 2.391118701964133e-08, + "loss": 2.748, + "step": 14 + }, + { + "epoch": 0.0, + "learning_rate": 2.561912894961571e-08, + "loss": 2.5137, + "step": 15 + }, + { + "epoch": 0.0, + "learning_rate": 2.732707087959009e-08, + "loss": 2.5234, + "step": 16 + }, + { + "epoch": 0.0, + "learning_rate": 2.9035012809564473e-08, + "loss": 3.0508, + "step": 17 + }, + { + "epoch": 0.0, + "learning_rate": 3.074295473953885e-08, + "loss": 2.9062, + "step": 18 + }, + { + "epoch": 0.0, + "learning_rate": 3.2450896669513235e-08, + "loss": 2.25, + "step": 19 + }, + { + "epoch": 0.0, + "learning_rate": 3.415883859948762e-08, + "loss": 2.2539, + "step": 20 + }, + { + "epoch": 0.0, + "learning_rate": 3.5866780529461994e-08, + "loss": 2.1191, + "step": 21 + }, + { + "epoch": 0.0, + "learning_rate": 3.7574722459436376e-08, + "loss": 2.3359, + "step": 22 + }, + { + "epoch": 0.0, + "learning_rate": 3.928266438941076e-08, + "loss": 2.041, + "step": 23 + }, + { + "epoch": 0.0, + "learning_rate": 4.099060631938514e-08, + "loss": 2.2305, + "step": 24 + }, + { + "epoch": 0.0, + "learning_rate": 4.269854824935952e-08, + "loss": 2.4023, + "step": 25 + }, + { + "epoch": 0.0, + "learning_rate": 4.44064901793339e-08, + "loss": 3.2969, + "step": 26 + }, + { + "epoch": 0.0, + "learning_rate": 4.611443210930828e-08, + "loss": 2.0156, + "step": 27 + }, + { + "epoch": 0.0, + "learning_rate": 4.782237403928266e-08, + "loss": 2.4844, + "step": 28 + }, + { + "epoch": 0.0, + "learning_rate": 4.953031596925705e-08, + "loss": 2.8926, + "step": 29 + }, + { + "epoch": 0.0, + "learning_rate": 5.123825789923142e-08, + "loss": 2.2285, + "step": 30 + }, + { + "epoch": 0.0, + "learning_rate": 5.2946199829205806e-08, + "loss": 2.832, + "step": 31 + }, + { + "epoch": 0.0, + "learning_rate": 5.465414175918018e-08, + "loss": 2.7812, + "step": 32 + }, + { + "epoch": 0.0, + "learning_rate": 5.6362083689154564e-08, + "loss": 1.9473, + "step": 33 + }, + { + "epoch": 0.0, + "learning_rate": 5.807002561912895e-08, + "loss": 2.3086, + "step": 34 + }, + { + "epoch": 0.0, + "learning_rate": 5.977796754910333e-08, + "loss": 2.4219, + "step": 35 + }, + { + "epoch": 0.0, + "learning_rate": 6.14859094790777e-08, + "loss": 2.8789, + "step": 36 + }, + { + "epoch": 0.0, + "learning_rate": 6.31938514090521e-08, + "loss": 2.0215, + "step": 37 + }, + { + "epoch": 0.0, + "learning_rate": 6.490179333902647e-08, + "loss": 2.2305, + "step": 38 + }, + { + "epoch": 0.0, + "learning_rate": 6.660973526900085e-08, + "loss": 2.3164, + "step": 39 + }, + { + "epoch": 0.0, + "learning_rate": 6.831767719897524e-08, + "loss": 2.2891, + "step": 40 + }, + { + "epoch": 0.0, + "learning_rate": 7.002561912894961e-08, + "loss": 2.0488, + "step": 41 + }, + { + "epoch": 0.0, + "learning_rate": 7.173356105892399e-08, + "loss": 2.1172, + "step": 42 + }, + { + "epoch": 0.0, + "learning_rate": 7.344150298889836e-08, + "loss": 2.4062, + "step": 43 + }, + { + "epoch": 0.0, + "learning_rate": 7.514944491887275e-08, + "loss": 2.1133, + "step": 44 + }, + { + "epoch": 0.0, + "learning_rate": 7.685738684884714e-08, + "loss": 2.084, + "step": 45 + }, + { + "epoch": 0.0, + "learning_rate": 7.856532877882152e-08, + "loss": 2.0781, + "step": 46 + }, + { + "epoch": 0.0, + "learning_rate": 8.02732707087959e-08, + "loss": 1.7383, + "step": 47 + }, + { + "epoch": 0.0, + "learning_rate": 8.198121263877028e-08, + "loss": 1.9531, + "step": 48 + }, + { + "epoch": 0.0, + "learning_rate": 8.368915456874466e-08, + "loss": 1.916, + "step": 49 + }, + { + "epoch": 0.0, + "learning_rate": 8.539709649871903e-08, + "loss": 1.9609, + "step": 50 + }, + { + "epoch": 0.0, + "learning_rate": 8.710503842869342e-08, + "loss": 2.1758, + "step": 51 + }, + { + "epoch": 0.0, + "learning_rate": 8.88129803586678e-08, + "loss": 2.0781, + "step": 52 + }, + { + "epoch": 0.0, + "learning_rate": 9.052092228864218e-08, + "loss": 2.0742, + "step": 53 + }, + { + "epoch": 0.0, + "learning_rate": 9.222886421861656e-08, + "loss": 1.9629, + "step": 54 + }, + { + "epoch": 0.0, + "learning_rate": 9.393680614859094e-08, + "loss": 1.9492, + "step": 55 + }, + { + "epoch": 0.0, + "learning_rate": 9.564474807856532e-08, + "loss": 1.75, + "step": 56 + }, + { + "epoch": 0.0, + "learning_rate": 9.73526900085397e-08, + "loss": 1.7578, + "step": 57 + }, + { + "epoch": 0.0, + "learning_rate": 9.90606319385141e-08, + "loss": 1.707, + "step": 58 + }, + { + "epoch": 0.0, + "learning_rate": 1.0076857386848847e-07, + "loss": 1.9395, + "step": 59 + }, + { + "epoch": 0.0, + "learning_rate": 1.0247651579846285e-07, + "loss": 1.6738, + "step": 60 + }, + { + "epoch": 0.0, + "learning_rate": 1.0418445772843724e-07, + "loss": 1.8789, + "step": 61 + }, + { + "epoch": 0.0, + "learning_rate": 1.0589239965841161e-07, + "loss": 1.7871, + "step": 62 + }, + { + "epoch": 0.0, + "learning_rate": 1.0760034158838599e-07, + "loss": 1.6641, + "step": 63 + }, + { + "epoch": 0.0, + "learning_rate": 1.0930828351836036e-07, + "loss": 1.6641, + "step": 64 + }, + { + "epoch": 0.0, + "learning_rate": 1.1101622544833475e-07, + "loss": 1.7539, + "step": 65 + }, + { + "epoch": 0.0, + "learning_rate": 1.1272416737830913e-07, + "loss": 1.6777, + "step": 66 + }, + { + "epoch": 0.0, + "learning_rate": 1.144321093082835e-07, + "loss": 1.4297, + "step": 67 + }, + { + "epoch": 0.0, + "learning_rate": 1.161400512382579e-07, + "loss": 1.5352, + "step": 68 + }, + { + "epoch": 0.0, + "learning_rate": 1.1784799316823227e-07, + "loss": 1.6836, + "step": 69 + }, + { + "epoch": 0.0, + "learning_rate": 1.1955593509820666e-07, + "loss": 1.373, + "step": 70 + }, + { + "epoch": 0.0, + "learning_rate": 1.2126387702818105e-07, + "loss": 1.4453, + "step": 71 + }, + { + "epoch": 0.0, + "learning_rate": 1.229718189581554e-07, + "loss": 1.5762, + "step": 72 + }, + { + "epoch": 0.0, + "learning_rate": 1.246797608881298e-07, + "loss": 1.7363, + "step": 73 + }, + { + "epoch": 0.0, + "learning_rate": 1.263877028181042e-07, + "loss": 1.54, + "step": 74 + }, + { + "epoch": 0.0, + "learning_rate": 1.2809564474807855e-07, + "loss": 1.4727, + "step": 75 + }, + { + "epoch": 0.0, + "learning_rate": 1.2980358667805294e-07, + "loss": 1.5723, + "step": 76 + }, + { + "epoch": 0.0, + "learning_rate": 1.3151152860802733e-07, + "loss": 1.5781, + "step": 77 + }, + { + "epoch": 0.0, + "learning_rate": 1.332194705380017e-07, + "loss": 1.8008, + "step": 78 + }, + { + "epoch": 0.0, + "learning_rate": 1.3492741246797608e-07, + "loss": 1.4004, + "step": 79 + }, + { + "epoch": 0.0, + "learning_rate": 1.3663535439795047e-07, + "loss": 1.6807, + "step": 80 + }, + { + "epoch": 0.0, + "learning_rate": 1.3834329632792486e-07, + "loss": 1.4199, + "step": 81 + }, + { + "epoch": 0.0, + "learning_rate": 1.4005123825789922e-07, + "loss": 1.2354, + "step": 82 + }, + { + "epoch": 0.0, + "learning_rate": 1.417591801878736e-07, + "loss": 1.2344, + "step": 83 + }, + { + "epoch": 0.0, + "learning_rate": 1.4346712211784797e-07, + "loss": 1.6914, + "step": 84 + }, + { + "epoch": 0.0, + "learning_rate": 1.4517506404782236e-07, + "loss": 1.5156, + "step": 85 + }, + { + "epoch": 0.0, + "learning_rate": 1.4688300597779673e-07, + "loss": 1.3789, + "step": 86 + }, + { + "epoch": 0.0, + "learning_rate": 1.4859094790777114e-07, + "loss": 1.6191, + "step": 87 + }, + { + "epoch": 0.0, + "learning_rate": 1.502988898377455e-07, + "loss": 1.4922, + "step": 88 + }, + { + "epoch": 0.0, + "learning_rate": 1.520068317677199e-07, + "loss": 1.4766, + "step": 89 + }, + { + "epoch": 0.0, + "learning_rate": 1.5371477369769428e-07, + "loss": 1.165, + "step": 90 + }, + { + "epoch": 0.0, + "learning_rate": 1.5542271562766865e-07, + "loss": 1.3555, + "step": 91 + }, + { + "epoch": 0.0, + "learning_rate": 1.5713065755764303e-07, + "loss": 1.3516, + "step": 92 + }, + { + "epoch": 0.0, + "learning_rate": 1.588385994876174e-07, + "loss": 1.543, + "step": 93 + }, + { + "epoch": 0.0, + "learning_rate": 1.605465414175918e-07, + "loss": 1.416, + "step": 94 + }, + { + "epoch": 0.0, + "learning_rate": 1.6225448334756618e-07, + "loss": 1.4863, + "step": 95 + }, + { + "epoch": 0.0, + "learning_rate": 1.6396242527754057e-07, + "loss": 1.4414, + "step": 96 + }, + { + "epoch": 0.0, + "learning_rate": 1.6567036720751493e-07, + "loss": 1.3887, + "step": 97 + }, + { + "epoch": 0.0, + "learning_rate": 1.6737830913748932e-07, + "loss": 1.4336, + "step": 98 + }, + { + "epoch": 0.0, + "learning_rate": 1.6908625106746368e-07, + "loss": 1.3652, + "step": 99 + }, + { + "epoch": 0.0, + "learning_rate": 1.7079419299743807e-07, + "loss": 1.4316, + "step": 100 + }, + { + "epoch": 0.0, + "learning_rate": 1.7250213492741248e-07, + "loss": 1.0703, + "step": 101 + }, + { + "epoch": 0.0, + "learning_rate": 1.7421007685738685e-07, + "loss": 1.4082, + "step": 102 + }, + { + "epoch": 0.0, + "learning_rate": 1.7591801878736124e-07, + "loss": 1.1934, + "step": 103 + }, + { + "epoch": 0.0, + "learning_rate": 1.776259607173356e-07, + "loss": 1.4219, + "step": 104 + }, + { + "epoch": 0.0, + "learning_rate": 1.7933390264731e-07, + "loss": 1.3633, + "step": 105 + }, + { + "epoch": 0.0, + "learning_rate": 1.8104184457728435e-07, + "loss": 1.4551, + "step": 106 + }, + { + "epoch": 0.0, + "learning_rate": 1.8274978650725874e-07, + "loss": 1.0342, + "step": 107 + }, + { + "epoch": 0.0, + "learning_rate": 1.8445772843723313e-07, + "loss": 1.0078, + "step": 108 + }, + { + "epoch": 0.0, + "learning_rate": 1.8616567036720752e-07, + "loss": 1.3086, + "step": 109 + }, + { + "epoch": 0.0, + "learning_rate": 1.8787361229718188e-07, + "loss": 1.3477, + "step": 110 + }, + { + "epoch": 0.0, + "learning_rate": 1.8958155422715627e-07, + "loss": 1.2305, + "step": 111 + }, + { + "epoch": 0.0, + "learning_rate": 1.9128949615713063e-07, + "loss": 1.3457, + "step": 112 + }, + { + "epoch": 0.0, + "learning_rate": 1.9299743808710502e-07, + "loss": 1.2266, + "step": 113 + }, + { + "epoch": 0.0, + "learning_rate": 1.947053800170794e-07, + "loss": 0.9448, + "step": 114 + }, + { + "epoch": 0.0, + "learning_rate": 1.964133219470538e-07, + "loss": 1.0908, + "step": 115 + }, + { + "epoch": 0.0, + "learning_rate": 1.981212638770282e-07, + "loss": 1.1914, + "step": 116 + }, + { + "epoch": 0.0, + "learning_rate": 1.9982920580700255e-07, + "loss": 1.2041, + "step": 117 + }, + { + "epoch": 0.0, + "learning_rate": 2.0153714773697694e-07, + "loss": 1.498, + "step": 118 + }, + { + "epoch": 0.0, + "learning_rate": 2.032450896669513e-07, + "loss": 1.5176, + "step": 119 + }, + { + "epoch": 0.0, + "learning_rate": 2.049530315969257e-07, + "loss": 1.4189, + "step": 120 + }, + { + "epoch": 0.0, + "learning_rate": 2.0666097352690006e-07, + "loss": 1.3984, + "step": 121 + }, + { + "epoch": 0.0, + "learning_rate": 2.0836891545687447e-07, + "loss": 1.3066, + "step": 122 + }, + { + "epoch": 0.0, + "learning_rate": 2.1007685738684883e-07, + "loss": 1.1553, + "step": 123 + }, + { + "epoch": 0.0, + "learning_rate": 2.1178479931682322e-07, + "loss": 1.3281, + "step": 124 + }, + { + "epoch": 0.0, + "learning_rate": 2.1349274124679759e-07, + "loss": 1.1719, + "step": 125 + }, + { + "epoch": 0.0, + "learning_rate": 2.1520068317677198e-07, + "loss": 1.0166, + "step": 126 + }, + { + "epoch": 0.0, + "learning_rate": 2.1690862510674636e-07, + "loss": 1.0801, + "step": 127 + }, + { + "epoch": 0.0, + "learning_rate": 2.1861656703672073e-07, + "loss": 1.2656, + "step": 128 + }, + { + "epoch": 0.0, + "learning_rate": 2.2032450896669514e-07, + "loss": 1.1465, + "step": 129 + }, + { + "epoch": 0.0, + "learning_rate": 2.220324508966695e-07, + "loss": 1.0635, + "step": 130 + }, + { + "epoch": 0.0, + "learning_rate": 2.237403928266439e-07, + "loss": 1.2129, + "step": 131 + }, + { + "epoch": 0.0, + "learning_rate": 2.2544833475661826e-07, + "loss": 1.126, + "step": 132 + }, + { + "epoch": 0.0, + "learning_rate": 2.2715627668659265e-07, + "loss": 1.2422, + "step": 133 + }, + { + "epoch": 0.0, + "learning_rate": 2.28864218616567e-07, + "loss": 1.1582, + "step": 134 + }, + { + "epoch": 0.0, + "learning_rate": 2.305721605465414e-07, + "loss": 1.0537, + "step": 135 + }, + { + "epoch": 0.0, + "learning_rate": 2.322801024765158e-07, + "loss": 1.2129, + "step": 136 + }, + { + "epoch": 0.0, + "learning_rate": 2.3398804440649018e-07, + "loss": 1.1875, + "step": 137 + }, + { + "epoch": 0.0, + "learning_rate": 2.3569598633646454e-07, + "loss": 0.9678, + "step": 138 + }, + { + "epoch": 0.0, + "learning_rate": 2.3740392826643893e-07, + "loss": 1.2578, + "step": 139 + }, + { + "epoch": 0.0, + "learning_rate": 2.391118701964133e-07, + "loss": 1.1621, + "step": 140 + }, + { + "epoch": 0.0, + "learning_rate": 2.408198121263877e-07, + "loss": 1.2871, + "step": 141 + }, + { + "epoch": 0.0, + "learning_rate": 2.425277540563621e-07, + "loss": 1.0742, + "step": 142 + }, + { + "epoch": 0.0, + "learning_rate": 2.4423569598633643e-07, + "loss": 1.0781, + "step": 143 + }, + { + "epoch": 0.0, + "learning_rate": 2.459436379163108e-07, + "loss": 1.1885, + "step": 144 + }, + { + "epoch": 0.0, + "learning_rate": 2.476515798462852e-07, + "loss": 1.1855, + "step": 145 + }, + { + "epoch": 0.0, + "learning_rate": 2.493595217762596e-07, + "loss": 1.2354, + "step": 146 + }, + { + "epoch": 0.0, + "learning_rate": 2.51067463706234e-07, + "loss": 1.0176, + "step": 147 + }, + { + "epoch": 0.0, + "learning_rate": 2.527754056362084e-07, + "loss": 1.0557, + "step": 148 + }, + { + "epoch": 0.0, + "learning_rate": 2.544833475661827e-07, + "loss": 1.1113, + "step": 149 + }, + { + "epoch": 0.0, + "learning_rate": 2.561912894961571e-07, + "loss": 1.4492, + "step": 150 + }, + { + "epoch": 0.0, + "learning_rate": 2.578992314261315e-07, + "loss": 1.1611, + "step": 151 + }, + { + "epoch": 0.0, + "learning_rate": 2.596071733561059e-07, + "loss": 1.1807, + "step": 152 + }, + { + "epoch": 0.0, + "learning_rate": 2.6131511528608027e-07, + "loss": 1.25, + "step": 153 + }, + { + "epoch": 0.0, + "learning_rate": 2.6302305721605466e-07, + "loss": 1.1367, + "step": 154 + }, + { + "epoch": 0.0, + "learning_rate": 2.6473099914602905e-07, + "loss": 1.2207, + "step": 155 + }, + { + "epoch": 0.0, + "learning_rate": 2.664389410760034e-07, + "loss": 1.2891, + "step": 156 + }, + { + "epoch": 0.0, + "learning_rate": 2.681468830059778e-07, + "loss": 1.2412, + "step": 157 + }, + { + "epoch": 0.0, + "learning_rate": 2.6985482493595216e-07, + "loss": 0.9463, + "step": 158 + }, + { + "epoch": 0.0, + "learning_rate": 2.7156276686592655e-07, + "loss": 1.2891, + "step": 159 + }, + { + "epoch": 0.0, + "learning_rate": 2.7327070879590094e-07, + "loss": 1.2041, + "step": 160 + }, + { + "epoch": 0.0, + "learning_rate": 2.749786507258753e-07, + "loss": 1.0771, + "step": 161 + }, + { + "epoch": 0.0, + "learning_rate": 2.766865926558497e-07, + "loss": 1.2969, + "step": 162 + }, + { + "epoch": 0.0, + "learning_rate": 2.7839453458582406e-07, + "loss": 1.4609, + "step": 163 + }, + { + "epoch": 0.0, + "learning_rate": 2.8010247651579845e-07, + "loss": 0.9658, + "step": 164 + }, + { + "epoch": 0.0, + "learning_rate": 2.8181041844577283e-07, + "loss": 1.0439, + "step": 165 + }, + { + "epoch": 0.0, + "learning_rate": 2.835183603757472e-07, + "loss": 1.1113, + "step": 166 + }, + { + "epoch": 0.0, + "learning_rate": 2.852263023057216e-07, + "loss": 1.3906, + "step": 167 + }, + { + "epoch": 0.0, + "learning_rate": 2.8693424423569595e-07, + "loss": 1.0508, + "step": 168 + }, + { + "epoch": 0.0, + "learning_rate": 2.886421861656704e-07, + "loss": 1.1279, + "step": 169 + }, + { + "epoch": 0.0, + "learning_rate": 2.9035012809564473e-07, + "loss": 1.2852, + "step": 170 + }, + { + "epoch": 0.0, + "learning_rate": 2.920580700256191e-07, + "loss": 0.8525, + "step": 171 + }, + { + "epoch": 0.0, + "learning_rate": 2.9376601195559345e-07, + "loss": 1.25, + "step": 172 + }, + { + "epoch": 0.0, + "learning_rate": 2.954739538855679e-07, + "loss": 1.0869, + "step": 173 + }, + { + "epoch": 0.0, + "learning_rate": 2.971818958155423e-07, + "loss": 1.2266, + "step": 174 + }, + { + "epoch": 0.0, + "learning_rate": 2.988898377455166e-07, + "loss": 1.4424, + "step": 175 + }, + { + "epoch": 0.0, + "learning_rate": 3.00597779675491e-07, + "loss": 0.9077, + "step": 176 + }, + { + "epoch": 0.0, + "learning_rate": 3.023057216054654e-07, + "loss": 1.1211, + "step": 177 + }, + { + "epoch": 0.0, + "learning_rate": 3.040136635354398e-07, + "loss": 1.252, + "step": 178 + }, + { + "epoch": 0.0, + "learning_rate": 3.057216054654141e-07, + "loss": 1.0664, + "step": 179 + }, + { + "epoch": 0.0, + "learning_rate": 3.0742954739538857e-07, + "loss": 1.0996, + "step": 180 + }, + { + "epoch": 0.0, + "learning_rate": 3.0913748932536296e-07, + "loss": 1.1709, + "step": 181 + }, + { + "epoch": 0.0, + "learning_rate": 3.108454312553373e-07, + "loss": 0.8936, + "step": 182 + }, + { + "epoch": 0.0, + "learning_rate": 3.125533731853117e-07, + "loss": 1.2891, + "step": 183 + }, + { + "epoch": 0.0, + "learning_rate": 3.1426131511528607e-07, + "loss": 1.0977, + "step": 184 + }, + { + "epoch": 0.0, + "learning_rate": 3.1596925704526046e-07, + "loss": 1.4473, + "step": 185 + }, + { + "epoch": 0.0, + "learning_rate": 3.176771989752348e-07, + "loss": 1.3115, + "step": 186 + }, + { + "epoch": 0.0, + "learning_rate": 3.193851409052092e-07, + "loss": 1.0586, + "step": 187 + }, + { + "epoch": 0.0, + "learning_rate": 3.210930828351836e-07, + "loss": 1.3301, + "step": 188 + }, + { + "epoch": 0.0, + "learning_rate": 3.2280102476515796e-07, + "loss": 1.126, + "step": 189 + }, + { + "epoch": 0.0, + "learning_rate": 3.2450896669513235e-07, + "loss": 0.9668, + "step": 190 + }, + { + "epoch": 0.0, + "learning_rate": 3.2621690862510674e-07, + "loss": 1.1221, + "step": 191 + }, + { + "epoch": 0.0, + "learning_rate": 3.2792485055508113e-07, + "loss": 1.291, + "step": 192 + }, + { + "epoch": 0.0, + "learning_rate": 3.2963279248505547e-07, + "loss": 1.1934, + "step": 193 + }, + { + "epoch": 0.0, + "learning_rate": 3.3134073441502986e-07, + "loss": 1.1357, + "step": 194 + }, + { + "epoch": 0.0, + "learning_rate": 3.330486763450043e-07, + "loss": 1.1934, + "step": 195 + }, + { + "epoch": 0.01, + "learning_rate": 3.3475661827497863e-07, + "loss": 1.2578, + "step": 196 + }, + { + "epoch": 0.01, + "learning_rate": 3.36464560204953e-07, + "loss": 1.1631, + "step": 197 + }, + { + "epoch": 0.01, + "learning_rate": 3.3817250213492736e-07, + "loss": 1.1602, + "step": 198 + }, + { + "epoch": 0.01, + "learning_rate": 3.398804440649018e-07, + "loss": 1.248, + "step": 199 + }, + { + "epoch": 0.01, + "learning_rate": 3.4158838599487614e-07, + "loss": 1.1162, + "step": 200 + }, + { + "epoch": 0.01, + "learning_rate": 3.4329632792485053e-07, + "loss": 1.1123, + "step": 201 + }, + { + "epoch": 0.01, + "learning_rate": 3.4500426985482497e-07, + "loss": 1.1084, + "step": 202 + }, + { + "epoch": 0.01, + "learning_rate": 3.467122117847993e-07, + "loss": 1.2285, + "step": 203 + }, + { + "epoch": 0.01, + "learning_rate": 3.484201537147737e-07, + "loss": 1.1211, + "step": 204 + }, + { + "epoch": 0.01, + "learning_rate": 3.5012809564474803e-07, + "loss": 1.0586, + "step": 205 + }, + { + "epoch": 0.01, + "learning_rate": 3.5183603757472247e-07, + "loss": 1.1143, + "step": 206 + }, + { + "epoch": 0.01, + "learning_rate": 3.535439795046968e-07, + "loss": 1.2773, + "step": 207 + }, + { + "epoch": 0.01, + "learning_rate": 3.552519214346712e-07, + "loss": 1.0332, + "step": 208 + }, + { + "epoch": 0.01, + "learning_rate": 3.569598633646456e-07, + "loss": 1.0371, + "step": 209 + }, + { + "epoch": 0.01, + "learning_rate": 3.5866780529462e-07, + "loss": 0.8853, + "step": 210 + }, + { + "epoch": 0.01, + "learning_rate": 3.6037574722459437e-07, + "loss": 1.1816, + "step": 211 + }, + { + "epoch": 0.01, + "learning_rate": 3.620836891545687e-07, + "loss": 1.1865, + "step": 212 + }, + { + "epoch": 0.01, + "learning_rate": 3.637916310845431e-07, + "loss": 1.2402, + "step": 213 + }, + { + "epoch": 0.01, + "learning_rate": 3.654995730145175e-07, + "loss": 1.1846, + "step": 214 + }, + { + "epoch": 0.01, + "learning_rate": 3.6720751494449187e-07, + "loss": 1.2129, + "step": 215 + }, + { + "epoch": 0.01, + "learning_rate": 3.6891545687446626e-07, + "loss": 1.1211, + "step": 216 + }, + { + "epoch": 0.01, + "learning_rate": 3.7062339880444065e-07, + "loss": 1.002, + "step": 217 + }, + { + "epoch": 0.01, + "learning_rate": 3.7233134073441504e-07, + "loss": 0.915, + "step": 218 + }, + { + "epoch": 0.01, + "learning_rate": 3.7403928266438937e-07, + "loss": 1.1201, + "step": 219 + }, + { + "epoch": 0.01, + "learning_rate": 3.7574722459436376e-07, + "loss": 1.0869, + "step": 220 + }, + { + "epoch": 0.01, + "learning_rate": 3.7745516652433815e-07, + "loss": 1.0088, + "step": 221 + }, + { + "epoch": 0.01, + "learning_rate": 3.7916310845431254e-07, + "loss": 0.9395, + "step": 222 + }, + { + "epoch": 0.01, + "learning_rate": 3.8087105038428693e-07, + "loss": 1.1514, + "step": 223 + }, + { + "epoch": 0.01, + "learning_rate": 3.8257899231426127e-07, + "loss": 0.9434, + "step": 224 + }, + { + "epoch": 0.01, + "learning_rate": 3.842869342442357e-07, + "loss": 0.9873, + "step": 225 + }, + { + "epoch": 0.01, + "learning_rate": 3.8599487617421004e-07, + "loss": 1.1006, + "step": 226 + }, + { + "epoch": 0.01, + "learning_rate": 3.8770281810418443e-07, + "loss": 1.0166, + "step": 227 + }, + { + "epoch": 0.01, + "learning_rate": 3.894107600341588e-07, + "loss": 1.2129, + "step": 228 + }, + { + "epoch": 0.01, + "learning_rate": 3.911187019641332e-07, + "loss": 1.1572, + "step": 229 + }, + { + "epoch": 0.01, + "learning_rate": 3.928266438941076e-07, + "loss": 0.9033, + "step": 230 + }, + { + "epoch": 0.01, + "learning_rate": 3.9453458582408194e-07, + "loss": 0.959, + "step": 231 + }, + { + "epoch": 0.01, + "learning_rate": 3.962425277540564e-07, + "loss": 1.1064, + "step": 232 + }, + { + "epoch": 0.01, + "learning_rate": 3.979504696840307e-07, + "loss": 1.1416, + "step": 233 + }, + { + "epoch": 0.01, + "learning_rate": 3.996584116140051e-07, + "loss": 1.3711, + "step": 234 + }, + { + "epoch": 0.01, + "learning_rate": 4.0136635354397944e-07, + "loss": 1.043, + "step": 235 + }, + { + "epoch": 0.01, + "learning_rate": 4.030742954739539e-07, + "loss": 1.0303, + "step": 236 + }, + { + "epoch": 0.01, + "learning_rate": 4.0478223740392827e-07, + "loss": 0.8579, + "step": 237 + }, + { + "epoch": 0.01, + "learning_rate": 4.064901793339026e-07, + "loss": 1.1992, + "step": 238 + }, + { + "epoch": 0.01, + "learning_rate": 4.08198121263877e-07, + "loss": 0.8105, + "step": 239 + }, + { + "epoch": 0.01, + "learning_rate": 4.099060631938514e-07, + "loss": 1.0303, + "step": 240 + }, + { + "epoch": 0.01, + "learning_rate": 4.116140051238258e-07, + "loss": 1.0039, + "step": 241 + }, + { + "epoch": 0.01, + "learning_rate": 4.133219470538001e-07, + "loss": 1.3086, + "step": 242 + }, + { + "epoch": 0.01, + "learning_rate": 4.1502988898377455e-07, + "loss": 1.1338, + "step": 243 + }, + { + "epoch": 0.01, + "learning_rate": 4.1673783091374894e-07, + "loss": 1.0273, + "step": 244 + }, + { + "epoch": 0.01, + "learning_rate": 4.184457728437233e-07, + "loss": 0.9795, + "step": 245 + }, + { + "epoch": 0.01, + "learning_rate": 4.2015371477369767e-07, + "loss": 0.9775, + "step": 246 + }, + { + "epoch": 0.01, + "learning_rate": 4.2186165670367206e-07, + "loss": 1.1836, + "step": 247 + }, + { + "epoch": 0.01, + "learning_rate": 4.2356959863364645e-07, + "loss": 1.1309, + "step": 248 + }, + { + "epoch": 0.01, + "learning_rate": 4.252775405636208e-07, + "loss": 1.1484, + "step": 249 + }, + { + "epoch": 0.01, + "learning_rate": 4.2698548249359517e-07, + "loss": 0.7554, + "step": 250 + }, + { + "epoch": 0.01, + "learning_rate": 4.286934244235696e-07, + "loss": 0.9375, + "step": 251 + }, + { + "epoch": 0.01, + "learning_rate": 4.3040136635354395e-07, + "loss": 1.1152, + "step": 252 + }, + { + "epoch": 0.01, + "learning_rate": 4.3210930828351834e-07, + "loss": 0.9209, + "step": 253 + }, + { + "epoch": 0.01, + "learning_rate": 4.3381725021349273e-07, + "loss": 0.9922, + "step": 254 + }, + { + "epoch": 0.01, + "learning_rate": 4.355251921434671e-07, + "loss": 1.0566, + "step": 255 + }, + { + "epoch": 0.01, + "learning_rate": 4.3723313407344145e-07, + "loss": 1.0693, + "step": 256 + }, + { + "epoch": 0.01, + "learning_rate": 4.3894107600341584e-07, + "loss": 1.0098, + "step": 257 + }, + { + "epoch": 0.01, + "learning_rate": 4.406490179333903e-07, + "loss": 1.2002, + "step": 258 + }, + { + "epoch": 0.01, + "learning_rate": 4.423569598633646e-07, + "loss": 1.0488, + "step": 259 + }, + { + "epoch": 0.01, + "learning_rate": 4.44064901793339e-07, + "loss": 1.1133, + "step": 260 + }, + { + "epoch": 0.01, + "learning_rate": 4.4577284372331335e-07, + "loss": 1.0498, + "step": 261 + }, + { + "epoch": 0.01, + "learning_rate": 4.474807856532878e-07, + "loss": 0.9395, + "step": 262 + }, + { + "epoch": 0.01, + "learning_rate": 4.491887275832621e-07, + "loss": 1.0898, + "step": 263 + }, + { + "epoch": 0.01, + "learning_rate": 4.508966695132365e-07, + "loss": 1.3242, + "step": 264 + }, + { + "epoch": 0.01, + "learning_rate": 4.5260461144321096e-07, + "loss": 0.8994, + "step": 265 + }, + { + "epoch": 0.01, + "learning_rate": 4.543125533731853e-07, + "loss": 1.0664, + "step": 266 + }, + { + "epoch": 0.01, + "learning_rate": 4.560204953031597e-07, + "loss": 0.8447, + "step": 267 + }, + { + "epoch": 0.01, + "learning_rate": 4.57728437233134e-07, + "loss": 0.9893, + "step": 268 + }, + { + "epoch": 0.01, + "learning_rate": 4.5943637916310846e-07, + "loss": 1.0898, + "step": 269 + }, + { + "epoch": 0.01, + "learning_rate": 4.611443210930828e-07, + "loss": 1.2002, + "step": 270 + }, + { + "epoch": 0.01, + "learning_rate": 4.628522630230572e-07, + "loss": 0.9106, + "step": 271 + }, + { + "epoch": 0.01, + "learning_rate": 4.645602049530316e-07, + "loss": 1.2363, + "step": 272 + }, + { + "epoch": 0.01, + "learning_rate": 4.6626814688300596e-07, + "loss": 1.3057, + "step": 273 + }, + { + "epoch": 0.01, + "learning_rate": 4.6797608881298035e-07, + "loss": 0.9131, + "step": 274 + }, + { + "epoch": 0.01, + "learning_rate": 4.696840307429547e-07, + "loss": 1.0869, + "step": 275 + }, + { + "epoch": 0.01, + "learning_rate": 4.713919726729291e-07, + "loss": 1.0244, + "step": 276 + }, + { + "epoch": 0.01, + "learning_rate": 4.730999146029035e-07, + "loss": 1.0195, + "step": 277 + }, + { + "epoch": 0.01, + "learning_rate": 4.7480785653287786e-07, + "loss": 1.0977, + "step": 278 + }, + { + "epoch": 0.01, + "learning_rate": 4.7651579846285225e-07, + "loss": 0.9365, + "step": 279 + }, + { + "epoch": 0.01, + "learning_rate": 4.782237403928266e-07, + "loss": 1.2754, + "step": 280 + }, + { + "epoch": 0.01, + "learning_rate": 4.79931682322801e-07, + "loss": 1.0928, + "step": 281 + }, + { + "epoch": 0.01, + "learning_rate": 4.816396242527754e-07, + "loss": 1.1465, + "step": 282 + }, + { + "epoch": 0.01, + "learning_rate": 4.833475661827497e-07, + "loss": 0.856, + "step": 283 + }, + { + "epoch": 0.01, + "learning_rate": 4.850555081127242e-07, + "loss": 1.1621, + "step": 284 + }, + { + "epoch": 0.01, + "learning_rate": 4.867634500426985e-07, + "loss": 1.0645, + "step": 285 + }, + { + "epoch": 0.01, + "learning_rate": 4.884713919726729e-07, + "loss": 1.0635, + "step": 286 + }, + { + "epoch": 0.01, + "learning_rate": 4.901793339026473e-07, + "loss": 1.1826, + "step": 287 + }, + { + "epoch": 0.01, + "learning_rate": 4.918872758326216e-07, + "loss": 0.9922, + "step": 288 + }, + { + "epoch": 0.01, + "learning_rate": 4.935952177625961e-07, + "loss": 1.2051, + "step": 289 + }, + { + "epoch": 0.01, + "learning_rate": 4.953031596925704e-07, + "loss": 1.0996, + "step": 290 + }, + { + "epoch": 0.01, + "learning_rate": 4.970111016225449e-07, + "loss": 1.1465, + "step": 291 + }, + { + "epoch": 0.01, + "learning_rate": 4.987190435525192e-07, + "loss": 0.959, + "step": 292 + }, + { + "epoch": 0.01, + "learning_rate": 5.004269854824936e-07, + "loss": 1.0752, + "step": 293 + }, + { + "epoch": 0.01, + "learning_rate": 5.02134927412468e-07, + "loss": 1.0166, + "step": 294 + }, + { + "epoch": 0.01, + "learning_rate": 5.038428693424423e-07, + "loss": 1.1826, + "step": 295 + }, + { + "epoch": 0.01, + "learning_rate": 5.055508112724168e-07, + "loss": 1.1201, + "step": 296 + }, + { + "epoch": 0.01, + "learning_rate": 5.072587532023911e-07, + "loss": 1.1641, + "step": 297 + }, + { + "epoch": 0.01, + "learning_rate": 5.089666951323654e-07, + "loss": 0.9453, + "step": 298 + }, + { + "epoch": 0.01, + "learning_rate": 5.106746370623399e-07, + "loss": 1.1025, + "step": 299 + }, + { + "epoch": 0.01, + "learning_rate": 5.123825789923142e-07, + "loss": 1.1543, + "step": 300 + }, + { + "epoch": 0.01, + "learning_rate": 5.140905209222886e-07, + "loss": 1.0498, + "step": 301 + }, + { + "epoch": 0.01, + "learning_rate": 5.15798462852263e-07, + "loss": 0.9502, + "step": 302 + }, + { + "epoch": 0.01, + "learning_rate": 5.175064047822374e-07, + "loss": 1.1162, + "step": 303 + }, + { + "epoch": 0.01, + "learning_rate": 5.192143467122118e-07, + "loss": 0.8975, + "step": 304 + }, + { + "epoch": 0.01, + "learning_rate": 5.209222886421861e-07, + "loss": 1.4521, + "step": 305 + }, + { + "epoch": 0.01, + "learning_rate": 5.226302305721605e-07, + "loss": 1.1406, + "step": 306 + }, + { + "epoch": 0.01, + "learning_rate": 5.243381725021349e-07, + "loss": 1.1289, + "step": 307 + }, + { + "epoch": 0.01, + "learning_rate": 5.260461144321093e-07, + "loss": 1.064, + "step": 308 + }, + { + "epoch": 0.01, + "learning_rate": 5.277540563620837e-07, + "loss": 0.9507, + "step": 309 + }, + { + "epoch": 0.01, + "learning_rate": 5.294619982920581e-07, + "loss": 1.1094, + "step": 310 + }, + { + "epoch": 0.01, + "learning_rate": 5.311699402220324e-07, + "loss": 0.9355, + "step": 311 + }, + { + "epoch": 0.01, + "learning_rate": 5.328778821520068e-07, + "loss": 1.1289, + "step": 312 + }, + { + "epoch": 0.01, + "learning_rate": 5.345858240819812e-07, + "loss": 1.2461, + "step": 313 + }, + { + "epoch": 0.01, + "learning_rate": 5.362937660119555e-07, + "loss": 1.1348, + "step": 314 + }, + { + "epoch": 0.01, + "learning_rate": 5.3800170794193e-07, + "loss": 0.9053, + "step": 315 + }, + { + "epoch": 0.01, + "learning_rate": 5.397096498719043e-07, + "loss": 1.1006, + "step": 316 + }, + { + "epoch": 0.01, + "learning_rate": 5.414175918018788e-07, + "loss": 1.0391, + "step": 317 + }, + { + "epoch": 0.01, + "learning_rate": 5.431255337318531e-07, + "loss": 0.9883, + "step": 318 + }, + { + "epoch": 0.01, + "learning_rate": 5.448334756618274e-07, + "loss": 1.1436, + "step": 319 + }, + { + "epoch": 0.01, + "learning_rate": 5.465414175918019e-07, + "loss": 1.0342, + "step": 320 + }, + { + "epoch": 0.01, + "learning_rate": 5.482493595217762e-07, + "loss": 0.8926, + "step": 321 + }, + { + "epoch": 0.01, + "learning_rate": 5.499573014517506e-07, + "loss": 0.9258, + "step": 322 + }, + { + "epoch": 0.01, + "learning_rate": 5.51665243381725e-07, + "loss": 0.9902, + "step": 323 + }, + { + "epoch": 0.01, + "learning_rate": 5.533731853116994e-07, + "loss": 0.9766, + "step": 324 + }, + { + "epoch": 0.01, + "learning_rate": 5.550811272416738e-07, + "loss": 1.0791, + "step": 325 + }, + { + "epoch": 0.01, + "learning_rate": 5.567890691716481e-07, + "loss": 0.8574, + "step": 326 + }, + { + "epoch": 0.01, + "learning_rate": 5.584970111016226e-07, + "loss": 1.1416, + "step": 327 + }, + { + "epoch": 0.01, + "learning_rate": 5.602049530315969e-07, + "loss": 1.0605, + "step": 328 + }, + { + "epoch": 0.01, + "learning_rate": 5.619128949615712e-07, + "loss": 0.9629, + "step": 329 + }, + { + "epoch": 0.01, + "learning_rate": 5.636208368915457e-07, + "loss": 1.3828, + "step": 330 + }, + { + "epoch": 0.01, + "learning_rate": 5.653287788215201e-07, + "loss": 1.0889, + "step": 331 + }, + { + "epoch": 0.01, + "learning_rate": 5.670367207514944e-07, + "loss": 1.0586, + "step": 332 + }, + { + "epoch": 0.01, + "learning_rate": 5.687446626814688e-07, + "loss": 1.0518, + "step": 333 + }, + { + "epoch": 0.01, + "learning_rate": 5.704526046114432e-07, + "loss": 0.9277, + "step": 334 + }, + { + "epoch": 0.01, + "learning_rate": 5.721605465414176e-07, + "loss": 1.1211, + "step": 335 + }, + { + "epoch": 0.01, + "learning_rate": 5.738684884713919e-07, + "loss": 1.084, + "step": 336 + }, + { + "epoch": 0.01, + "learning_rate": 5.755764304013662e-07, + "loss": 0.9268, + "step": 337 + }, + { + "epoch": 0.01, + "learning_rate": 5.772843723313408e-07, + "loss": 1.1348, + "step": 338 + }, + { + "epoch": 0.01, + "learning_rate": 5.789923142613151e-07, + "loss": 1.0332, + "step": 339 + }, + { + "epoch": 0.01, + "learning_rate": 5.807002561912895e-07, + "loss": 0.8828, + "step": 340 + }, + { + "epoch": 0.01, + "learning_rate": 5.824081981212639e-07, + "loss": 0.8628, + "step": 341 + }, + { + "epoch": 0.01, + "learning_rate": 5.841161400512382e-07, + "loss": 1.0225, + "step": 342 + }, + { + "epoch": 0.01, + "learning_rate": 5.858240819812126e-07, + "loss": 0.6987, + "step": 343 + }, + { + "epoch": 0.01, + "learning_rate": 5.875320239111869e-07, + "loss": 0.9922, + "step": 344 + }, + { + "epoch": 0.01, + "learning_rate": 5.892399658411615e-07, + "loss": 0.9609, + "step": 345 + }, + { + "epoch": 0.01, + "learning_rate": 5.909479077711358e-07, + "loss": 1.0303, + "step": 346 + }, + { + "epoch": 0.01, + "learning_rate": 5.926558497011101e-07, + "loss": 1.0186, + "step": 347 + }, + { + "epoch": 0.01, + "learning_rate": 5.943637916310846e-07, + "loss": 0.9668, + "step": 348 + }, + { + "epoch": 0.01, + "learning_rate": 5.960717335610589e-07, + "loss": 1.0811, + "step": 349 + }, + { + "epoch": 0.01, + "learning_rate": 5.977796754910332e-07, + "loss": 1.0498, + "step": 350 + }, + { + "epoch": 0.01, + "learning_rate": 5.994876174210076e-07, + "loss": 1.2266, + "step": 351 + }, + { + "epoch": 0.01, + "learning_rate": 6.01195559350982e-07, + "loss": 1.1455, + "step": 352 + }, + { + "epoch": 0.01, + "learning_rate": 6.029035012809565e-07, + "loss": 0.8936, + "step": 353 + }, + { + "epoch": 0.01, + "learning_rate": 6.046114432109308e-07, + "loss": 0.9014, + "step": 354 + }, + { + "epoch": 0.01, + "learning_rate": 6.063193851409052e-07, + "loss": 0.9902, + "step": 355 + }, + { + "epoch": 0.01, + "learning_rate": 6.080273270708796e-07, + "loss": 1.1016, + "step": 356 + }, + { + "epoch": 0.01, + "learning_rate": 6.097352690008539e-07, + "loss": 0.9785, + "step": 357 + }, + { + "epoch": 0.01, + "learning_rate": 6.114432109308282e-07, + "loss": 0.9844, + "step": 358 + }, + { + "epoch": 0.01, + "learning_rate": 6.131511528608027e-07, + "loss": 1.0771, + "step": 359 + }, + { + "epoch": 0.01, + "learning_rate": 6.148590947907771e-07, + "loss": 0.9385, + "step": 360 + }, + { + "epoch": 0.01, + "learning_rate": 6.165670367207515e-07, + "loss": 0.9951, + "step": 361 + }, + { + "epoch": 0.01, + "learning_rate": 6.182749786507259e-07, + "loss": 1.0596, + "step": 362 + }, + { + "epoch": 0.01, + "learning_rate": 6.199829205807002e-07, + "loss": 0.8716, + "step": 363 + }, + { + "epoch": 0.01, + "learning_rate": 6.216908625106746e-07, + "loss": 0.9834, + "step": 364 + }, + { + "epoch": 0.01, + "learning_rate": 6.233988044406489e-07, + "loss": 1.1426, + "step": 365 + }, + { + "epoch": 0.01, + "learning_rate": 6.251067463706234e-07, + "loss": 1.0342, + "step": 366 + }, + { + "epoch": 0.01, + "learning_rate": 6.268146883005978e-07, + "loss": 1.1494, + "step": 367 + }, + { + "epoch": 0.01, + "learning_rate": 6.285226302305721e-07, + "loss": 1.1699, + "step": 368 + }, + { + "epoch": 0.01, + "learning_rate": 6.302305721605466e-07, + "loss": 1.1826, + "step": 369 + }, + { + "epoch": 0.01, + "learning_rate": 6.319385140905209e-07, + "loss": 0.9854, + "step": 370 + }, + { + "epoch": 0.01, + "learning_rate": 6.336464560204953e-07, + "loss": 0.8887, + "step": 371 + }, + { + "epoch": 0.01, + "learning_rate": 6.353543979504696e-07, + "loss": 0.7451, + "step": 372 + }, + { + "epoch": 0.01, + "learning_rate": 6.37062339880444e-07, + "loss": 0.9766, + "step": 373 + }, + { + "epoch": 0.01, + "learning_rate": 6.387702818104184e-07, + "loss": 1.3242, + "step": 374 + }, + { + "epoch": 0.01, + "learning_rate": 6.404782237403928e-07, + "loss": 1.0547, + "step": 375 + }, + { + "epoch": 0.01, + "learning_rate": 6.421861656703673e-07, + "loss": 0.9727, + "step": 376 + }, + { + "epoch": 0.01, + "learning_rate": 6.438941076003416e-07, + "loss": 0.6865, + "step": 377 + }, + { + "epoch": 0.01, + "learning_rate": 6.456020495303159e-07, + "loss": 0.9463, + "step": 378 + }, + { + "epoch": 0.01, + "learning_rate": 6.473099914602903e-07, + "loss": 0.9258, + "step": 379 + }, + { + "epoch": 0.01, + "learning_rate": 6.490179333902647e-07, + "loss": 1.1016, + "step": 380 + }, + { + "epoch": 0.01, + "learning_rate": 6.50725875320239e-07, + "loss": 0.9629, + "step": 381 + }, + { + "epoch": 0.01, + "learning_rate": 6.524338172502135e-07, + "loss": 0.9453, + "step": 382 + }, + { + "epoch": 0.01, + "learning_rate": 6.541417591801879e-07, + "loss": 0.8516, + "step": 383 + }, + { + "epoch": 0.01, + "learning_rate": 6.558497011101623e-07, + "loss": 0.9092, + "step": 384 + }, + { + "epoch": 0.01, + "learning_rate": 6.575576430401366e-07, + "loss": 1.1934, + "step": 385 + }, + { + "epoch": 0.01, + "learning_rate": 6.592655849701109e-07, + "loss": 1.0176, + "step": 386 + }, + { + "epoch": 0.01, + "learning_rate": 6.609735269000854e-07, + "loss": 0.9209, + "step": 387 + }, + { + "epoch": 0.01, + "learning_rate": 6.626814688300597e-07, + "loss": 0.8428, + "step": 388 + }, + { + "epoch": 0.01, + "learning_rate": 6.64389410760034e-07, + "loss": 1.083, + "step": 389 + }, + { + "epoch": 0.01, + "learning_rate": 6.660973526900086e-07, + "loss": 1.0059, + "step": 390 + }, + { + "epoch": 0.01, + "learning_rate": 6.678052946199829e-07, + "loss": 0.9551, + "step": 391 + }, + { + "epoch": 0.01, + "learning_rate": 6.695132365499573e-07, + "loss": 1.2363, + "step": 392 + }, + { + "epoch": 0.01, + "learning_rate": 6.712211784799316e-07, + "loss": 0.8877, + "step": 393 + }, + { + "epoch": 0.01, + "learning_rate": 6.72929120409906e-07, + "loss": 1.2549, + "step": 394 + }, + { + "epoch": 0.01, + "learning_rate": 6.746370623398804e-07, + "loss": 1.0254, + "step": 395 + }, + { + "epoch": 0.01, + "learning_rate": 6.763450042698547e-07, + "loss": 0.9619, + "step": 396 + }, + { + "epoch": 0.01, + "learning_rate": 6.780529461998293e-07, + "loss": 0.8408, + "step": 397 + }, + { + "epoch": 0.01, + "learning_rate": 6.797608881298036e-07, + "loss": 0.8213, + "step": 398 + }, + { + "epoch": 0.01, + "learning_rate": 6.814688300597779e-07, + "loss": 0.9805, + "step": 399 + }, + { + "epoch": 0.01, + "learning_rate": 6.831767719897523e-07, + "loss": 1.1094, + "step": 400 + }, + { + "epoch": 0.01, + "learning_rate": 6.848847139197267e-07, + "loss": 0.9609, + "step": 401 + }, + { + "epoch": 0.01, + "learning_rate": 6.865926558497011e-07, + "loss": 1.1543, + "step": 402 + }, + { + "epoch": 0.01, + "learning_rate": 6.883005977796754e-07, + "loss": 0.8228, + "step": 403 + }, + { + "epoch": 0.01, + "learning_rate": 6.900085397096499e-07, + "loss": 0.957, + "step": 404 + }, + { + "epoch": 0.01, + "learning_rate": 6.917164816396243e-07, + "loss": 0.9033, + "step": 405 + }, + { + "epoch": 0.01, + "learning_rate": 6.934244235695986e-07, + "loss": 1.1436, + "step": 406 + }, + { + "epoch": 0.01, + "learning_rate": 6.951323654995729e-07, + "loss": 1.1338, + "step": 407 + }, + { + "epoch": 0.01, + "learning_rate": 6.968403074295474e-07, + "loss": 0.9258, + "step": 408 + }, + { + "epoch": 0.01, + "learning_rate": 6.985482493595217e-07, + "loss": 1.0791, + "step": 409 + }, + { + "epoch": 0.01, + "learning_rate": 7.002561912894961e-07, + "loss": 1.166, + "step": 410 + }, + { + "epoch": 0.01, + "learning_rate": 7.019641332194705e-07, + "loss": 1.021, + "step": 411 + }, + { + "epoch": 0.01, + "learning_rate": 7.036720751494449e-07, + "loss": 1.0732, + "step": 412 + }, + { + "epoch": 0.01, + "learning_rate": 7.053800170794193e-07, + "loss": 1.0522, + "step": 413 + }, + { + "epoch": 0.01, + "learning_rate": 7.070879590093936e-07, + "loss": 1.0146, + "step": 414 + }, + { + "epoch": 0.01, + "learning_rate": 7.087959009393681e-07, + "loss": 0.9131, + "step": 415 + }, + { + "epoch": 0.01, + "learning_rate": 7.105038428693424e-07, + "loss": 1.0723, + "step": 416 + }, + { + "epoch": 0.01, + "learning_rate": 7.122117847993167e-07, + "loss": 0.814, + "step": 417 + }, + { + "epoch": 0.01, + "learning_rate": 7.139197267292912e-07, + "loss": 1.2051, + "step": 418 + }, + { + "epoch": 0.01, + "learning_rate": 7.156276686592656e-07, + "loss": 0.9053, + "step": 419 + }, + { + "epoch": 0.01, + "learning_rate": 7.1733561058924e-07, + "loss": 0.8457, + "step": 420 + }, + { + "epoch": 0.01, + "learning_rate": 7.190435525192143e-07, + "loss": 1.0205, + "step": 421 + }, + { + "epoch": 0.01, + "learning_rate": 7.207514944491887e-07, + "loss": 1.1445, + "step": 422 + }, + { + "epoch": 0.01, + "learning_rate": 7.224594363791631e-07, + "loss": 0.9727, + "step": 423 + }, + { + "epoch": 0.01, + "learning_rate": 7.241673783091374e-07, + "loss": 1.2812, + "step": 424 + }, + { + "epoch": 0.01, + "learning_rate": 7.258753202391118e-07, + "loss": 1.1436, + "step": 425 + }, + { + "epoch": 0.01, + "learning_rate": 7.275832621690862e-07, + "loss": 1.0098, + "step": 426 + }, + { + "epoch": 0.01, + "learning_rate": 7.292912040990606e-07, + "loss": 0.9795, + "step": 427 + }, + { + "epoch": 0.01, + "learning_rate": 7.30999146029035e-07, + "loss": 1.0107, + "step": 428 + }, + { + "epoch": 0.01, + "learning_rate": 7.327070879590094e-07, + "loss": 0.9326, + "step": 429 + }, + { + "epoch": 0.01, + "learning_rate": 7.344150298889837e-07, + "loss": 0.811, + "step": 430 + }, + { + "epoch": 0.01, + "learning_rate": 7.361229718189581e-07, + "loss": 1.0801, + "step": 431 + }, + { + "epoch": 0.01, + "learning_rate": 7.378309137489325e-07, + "loss": 1.0322, + "step": 432 + }, + { + "epoch": 0.01, + "learning_rate": 7.395388556789069e-07, + "loss": 0.8447, + "step": 433 + }, + { + "epoch": 0.01, + "learning_rate": 7.412467976088813e-07, + "loss": 0.916, + "step": 434 + }, + { + "epoch": 0.01, + "learning_rate": 7.429547395388556e-07, + "loss": 1.0225, + "step": 435 + }, + { + "epoch": 0.01, + "learning_rate": 7.446626814688301e-07, + "loss": 0.8467, + "step": 436 + }, + { + "epoch": 0.01, + "learning_rate": 7.463706233988044e-07, + "loss": 1.0645, + "step": 437 + }, + { + "epoch": 0.01, + "learning_rate": 7.480785653287787e-07, + "loss": 1.2012, + "step": 438 + }, + { + "epoch": 0.01, + "learning_rate": 7.497865072587532e-07, + "loss": 1.2334, + "step": 439 + }, + { + "epoch": 0.01, + "learning_rate": 7.514944491887275e-07, + "loss": 0.9316, + "step": 440 + }, + { + "epoch": 0.01, + "learning_rate": 7.53202391118702e-07, + "loss": 0.9658, + "step": 441 + }, + { + "epoch": 0.01, + "learning_rate": 7.549103330486763e-07, + "loss": 0.9922, + "step": 442 + }, + { + "epoch": 0.01, + "learning_rate": 7.566182749786507e-07, + "loss": 1.0156, + "step": 443 + }, + { + "epoch": 0.01, + "learning_rate": 7.583262169086251e-07, + "loss": 1.0127, + "step": 444 + }, + { + "epoch": 0.01, + "learning_rate": 7.600341588385994e-07, + "loss": 0.918, + "step": 445 + }, + { + "epoch": 0.01, + "learning_rate": 7.617421007685739e-07, + "loss": 1.0498, + "step": 446 + }, + { + "epoch": 0.01, + "learning_rate": 7.634500426985482e-07, + "loss": 0.959, + "step": 447 + }, + { + "epoch": 0.01, + "learning_rate": 7.651579846285225e-07, + "loss": 0.9277, + "step": 448 + }, + { + "epoch": 0.01, + "learning_rate": 7.66865926558497e-07, + "loss": 0.9609, + "step": 449 + }, + { + "epoch": 0.01, + "learning_rate": 7.685738684884714e-07, + "loss": 0.7563, + "step": 450 + }, + { + "epoch": 0.01, + "learning_rate": 7.702818104184458e-07, + "loss": 1.3008, + "step": 451 + }, + { + "epoch": 0.01, + "learning_rate": 7.719897523484201e-07, + "loss": 1.2383, + "step": 452 + }, + { + "epoch": 0.01, + "learning_rate": 7.736976942783945e-07, + "loss": 0.9932, + "step": 453 + }, + { + "epoch": 0.01, + "learning_rate": 7.754056362083689e-07, + "loss": 1.0752, + "step": 454 + }, + { + "epoch": 0.01, + "learning_rate": 7.771135781383432e-07, + "loss": 0.9736, + "step": 455 + }, + { + "epoch": 0.01, + "learning_rate": 7.788215200683176e-07, + "loss": 1.2686, + "step": 456 + }, + { + "epoch": 0.01, + "learning_rate": 7.805294619982921e-07, + "loss": 1.0439, + "step": 457 + }, + { + "epoch": 0.01, + "learning_rate": 7.822374039282664e-07, + "loss": 1.0811, + "step": 458 + }, + { + "epoch": 0.01, + "learning_rate": 7.839453458582408e-07, + "loss": 1.1406, + "step": 459 + }, + { + "epoch": 0.01, + "learning_rate": 7.856532877882152e-07, + "loss": 1.0122, + "step": 460 + }, + { + "epoch": 0.01, + "learning_rate": 7.873612297181895e-07, + "loss": 1.1104, + "step": 461 + }, + { + "epoch": 0.01, + "learning_rate": 7.890691716481639e-07, + "loss": 1.0459, + "step": 462 + }, + { + "epoch": 0.01, + "learning_rate": 7.907771135781382e-07, + "loss": 0.9883, + "step": 463 + }, + { + "epoch": 0.01, + "learning_rate": 7.924850555081128e-07, + "loss": 1.207, + "step": 464 + }, + { + "epoch": 0.01, + "learning_rate": 7.941929974380871e-07, + "loss": 0.9541, + "step": 465 + }, + { + "epoch": 0.01, + "learning_rate": 7.959009393680614e-07, + "loss": 1.0352, + "step": 466 + }, + { + "epoch": 0.01, + "learning_rate": 7.976088812980359e-07, + "loss": 0.9136, + "step": 467 + }, + { + "epoch": 0.01, + "learning_rate": 7.993168232280102e-07, + "loss": 1.0059, + "step": 468 + }, + { + "epoch": 0.01, + "learning_rate": 8.010247651579845e-07, + "loss": 0.8223, + "step": 469 + }, + { + "epoch": 0.01, + "learning_rate": 8.027327070879589e-07, + "loss": 0.8262, + "step": 470 + }, + { + "epoch": 0.01, + "learning_rate": 8.044406490179334e-07, + "loss": 1.0186, + "step": 471 + }, + { + "epoch": 0.01, + "learning_rate": 8.061485909479078e-07, + "loss": 0.7524, + "step": 472 + }, + { + "epoch": 0.01, + "learning_rate": 8.078565328778821e-07, + "loss": 0.8809, + "step": 473 + }, + { + "epoch": 0.01, + "learning_rate": 8.095644748078565e-07, + "loss": 0.8242, + "step": 474 + }, + { + "epoch": 0.01, + "learning_rate": 8.112724167378309e-07, + "loss": 1.0674, + "step": 475 + }, + { + "epoch": 0.01, + "learning_rate": 8.129803586678052e-07, + "loss": 1.0117, + "step": 476 + }, + { + "epoch": 0.01, + "learning_rate": 8.146883005977796e-07, + "loss": 1.0762, + "step": 477 + }, + { + "epoch": 0.01, + "learning_rate": 8.16396242527754e-07, + "loss": 0.9668, + "step": 478 + }, + { + "epoch": 0.01, + "learning_rate": 8.181041844577284e-07, + "loss": 1.0527, + "step": 479 + }, + { + "epoch": 0.01, + "learning_rate": 8.198121263877028e-07, + "loss": 1.0928, + "step": 480 + }, + { + "epoch": 0.01, + "learning_rate": 8.215200683176772e-07, + "loss": 1.1113, + "step": 481 + }, + { + "epoch": 0.01, + "learning_rate": 8.232280102476516e-07, + "loss": 0.8477, + "step": 482 + }, + { + "epoch": 0.01, + "learning_rate": 8.249359521776259e-07, + "loss": 0.9634, + "step": 483 + }, + { + "epoch": 0.01, + "learning_rate": 8.266438941076002e-07, + "loss": 0.9795, + "step": 484 + }, + { + "epoch": 0.01, + "learning_rate": 8.283518360375747e-07, + "loss": 1.0674, + "step": 485 + }, + { + "epoch": 0.01, + "learning_rate": 8.300597779675491e-07, + "loss": 1.0791, + "step": 486 + }, + { + "epoch": 0.01, + "learning_rate": 8.317677198975234e-07, + "loss": 1.0176, + "step": 487 + }, + { + "epoch": 0.01, + "learning_rate": 8.334756618274979e-07, + "loss": 0.9053, + "step": 488 + }, + { + "epoch": 0.01, + "learning_rate": 8.351836037574722e-07, + "loss": 0.9131, + "step": 489 + }, + { + "epoch": 0.01, + "learning_rate": 8.368915456874466e-07, + "loss": 1.2344, + "step": 490 + }, + { + "epoch": 0.01, + "learning_rate": 8.385994876174209e-07, + "loss": 1.0029, + "step": 491 + }, + { + "epoch": 0.01, + "learning_rate": 8.403074295473953e-07, + "loss": 1.0283, + "step": 492 + }, + { + "epoch": 0.01, + "learning_rate": 8.420153714773698e-07, + "loss": 0.9668, + "step": 493 + }, + { + "epoch": 0.01, + "learning_rate": 8.437233134073441e-07, + "loss": 1.2949, + "step": 494 + }, + { + "epoch": 0.01, + "learning_rate": 8.454312553373186e-07, + "loss": 1.0537, + "step": 495 + }, + { + "epoch": 0.01, + "learning_rate": 8.471391972672929e-07, + "loss": 1.0264, + "step": 496 + }, + { + "epoch": 0.01, + "learning_rate": 8.488471391972672e-07, + "loss": 0.9355, + "step": 497 + }, + { + "epoch": 0.01, + "learning_rate": 8.505550811272416e-07, + "loss": 1.123, + "step": 498 + }, + { + "epoch": 0.01, + "learning_rate": 8.52263023057216e-07, + "loss": 0.9248, + "step": 499 + }, + { + "epoch": 0.01, + "learning_rate": 8.539709649871903e-07, + "loss": 1.0684, + "step": 500 + }, + { + "epoch": 0.01, + "learning_rate": 8.556789069171648e-07, + "loss": 0.9834, + "step": 501 + }, + { + "epoch": 0.01, + "learning_rate": 8.573868488471392e-07, + "loss": 0.9893, + "step": 502 + }, + { + "epoch": 0.01, + "learning_rate": 8.590947907771136e-07, + "loss": 1.1426, + "step": 503 + }, + { + "epoch": 0.01, + "learning_rate": 8.608027327070879e-07, + "loss": 0.8242, + "step": 504 + }, + { + "epoch": 0.01, + "learning_rate": 8.625106746370622e-07, + "loss": 1.1387, + "step": 505 + }, + { + "epoch": 0.01, + "learning_rate": 8.642186165670367e-07, + "loss": 0.833, + "step": 506 + }, + { + "epoch": 0.01, + "learning_rate": 8.65926558497011e-07, + "loss": 1.1562, + "step": 507 + }, + { + "epoch": 0.01, + "learning_rate": 8.676345004269855e-07, + "loss": 0.9736, + "step": 508 + }, + { + "epoch": 0.01, + "learning_rate": 8.693424423569599e-07, + "loss": 1.168, + "step": 509 + }, + { + "epoch": 0.01, + "learning_rate": 8.710503842869342e-07, + "loss": 1.0205, + "step": 510 + }, + { + "epoch": 0.01, + "learning_rate": 8.727583262169086e-07, + "loss": 0.9839, + "step": 511 + }, + { + "epoch": 0.01, + "learning_rate": 8.744662681468829e-07, + "loss": 0.9004, + "step": 512 + }, + { + "epoch": 0.01, + "learning_rate": 8.761742100768573e-07, + "loss": 1.1885, + "step": 513 + }, + { + "epoch": 0.01, + "learning_rate": 8.778821520068317e-07, + "loss": 1.1719, + "step": 514 + }, + { + "epoch": 0.01, + "learning_rate": 8.79590093936806e-07, + "loss": 1.1523, + "step": 515 + }, + { + "epoch": 0.01, + "learning_rate": 8.812980358667806e-07, + "loss": 1.084, + "step": 516 + }, + { + "epoch": 0.01, + "learning_rate": 8.830059777967549e-07, + "loss": 1.209, + "step": 517 + }, + { + "epoch": 0.01, + "learning_rate": 8.847139197267292e-07, + "loss": 0.8115, + "step": 518 + }, + { + "epoch": 0.01, + "learning_rate": 8.864218616567036e-07, + "loss": 1.0215, + "step": 519 + }, + { + "epoch": 0.01, + "learning_rate": 8.88129803586678e-07, + "loss": 1.042, + "step": 520 + }, + { + "epoch": 0.01, + "learning_rate": 8.898377455166524e-07, + "loss": 1.0703, + "step": 521 + }, + { + "epoch": 0.01, + "learning_rate": 8.915456874466267e-07, + "loss": 0.9746, + "step": 522 + }, + { + "epoch": 0.01, + "learning_rate": 8.932536293766012e-07, + "loss": 0.9473, + "step": 523 + }, + { + "epoch": 0.01, + "learning_rate": 8.949615713065756e-07, + "loss": 0.9346, + "step": 524 + }, + { + "epoch": 0.01, + "learning_rate": 8.966695132365499e-07, + "loss": 0.9453, + "step": 525 + }, + { + "epoch": 0.01, + "learning_rate": 8.983774551665242e-07, + "loss": 1.0654, + "step": 526 + }, + { + "epoch": 0.01, + "learning_rate": 9.000853970964987e-07, + "loss": 1.0488, + "step": 527 + }, + { + "epoch": 0.01, + "learning_rate": 9.01793339026473e-07, + "loss": 0.9424, + "step": 528 + }, + { + "epoch": 0.01, + "learning_rate": 9.035012809564474e-07, + "loss": 0.8389, + "step": 529 + }, + { + "epoch": 0.01, + "learning_rate": 9.052092228864219e-07, + "loss": 1.1895, + "step": 530 + }, + { + "epoch": 0.01, + "learning_rate": 9.069171648163962e-07, + "loss": 1.0527, + "step": 531 + }, + { + "epoch": 0.01, + "learning_rate": 9.086251067463706e-07, + "loss": 0.9111, + "step": 532 + }, + { + "epoch": 0.01, + "learning_rate": 9.103330486763449e-07, + "loss": 0.9941, + "step": 533 + }, + { + "epoch": 0.01, + "learning_rate": 9.120409906063194e-07, + "loss": 1.0127, + "step": 534 + }, + { + "epoch": 0.01, + "learning_rate": 9.137489325362937e-07, + "loss": 1.0547, + "step": 535 + }, + { + "epoch": 0.01, + "learning_rate": 9.15456874466268e-07, + "loss": 0.9854, + "step": 536 + }, + { + "epoch": 0.01, + "learning_rate": 9.171648163962425e-07, + "loss": 0.9316, + "step": 537 + }, + { + "epoch": 0.01, + "learning_rate": 9.188727583262169e-07, + "loss": 0.9326, + "step": 538 + }, + { + "epoch": 0.01, + "learning_rate": 9.205807002561913e-07, + "loss": 1.0537, + "step": 539 + }, + { + "epoch": 0.01, + "learning_rate": 9.222886421861656e-07, + "loss": 0.917, + "step": 540 + }, + { + "epoch": 0.01, + "learning_rate": 9.2399658411614e-07, + "loss": 0.9658, + "step": 541 + }, + { + "epoch": 0.01, + "learning_rate": 9.257045260461144e-07, + "loss": 1.0029, + "step": 542 + }, + { + "epoch": 0.01, + "learning_rate": 9.274124679760887e-07, + "loss": 0.9424, + "step": 543 + }, + { + "epoch": 0.01, + "learning_rate": 9.291204099060631e-07, + "loss": 0.8638, + "step": 544 + }, + { + "epoch": 0.01, + "learning_rate": 9.308283518360376e-07, + "loss": 1.0195, + "step": 545 + }, + { + "epoch": 0.01, + "learning_rate": 9.325362937660119e-07, + "loss": 1.0195, + "step": 546 + }, + { + "epoch": 0.01, + "learning_rate": 9.342442356959863e-07, + "loss": 0.9619, + "step": 547 + }, + { + "epoch": 0.01, + "learning_rate": 9.359521776259607e-07, + "loss": 1.2627, + "step": 548 + }, + { + "epoch": 0.01, + "learning_rate": 9.37660119555935e-07, + "loss": 1.0508, + "step": 549 + }, + { + "epoch": 0.01, + "learning_rate": 9.393680614859094e-07, + "loss": 0.7354, + "step": 550 + }, + { + "epoch": 0.01, + "learning_rate": 9.410760034158838e-07, + "loss": 1.0186, + "step": 551 + }, + { + "epoch": 0.01, + "learning_rate": 9.427839453458582e-07, + "loss": 1.0352, + "step": 552 + }, + { + "epoch": 0.01, + "learning_rate": 9.444918872758326e-07, + "loss": 0.9785, + "step": 553 + }, + { + "epoch": 0.01, + "learning_rate": 9.46199829205807e-07, + "loss": 0.9395, + "step": 554 + }, + { + "epoch": 0.01, + "learning_rate": 9.479077711357814e-07, + "loss": 0.959, + "step": 555 + }, + { + "epoch": 0.01, + "learning_rate": 9.496157130657557e-07, + "loss": 0.9268, + "step": 556 + }, + { + "epoch": 0.01, + "learning_rate": 9.5132365499573e-07, + "loss": 0.9746, + "step": 557 + }, + { + "epoch": 0.01, + "learning_rate": 9.530315969257045e-07, + "loss": 0.7124, + "step": 558 + }, + { + "epoch": 0.01, + "learning_rate": 9.547395388556788e-07, + "loss": 0.8438, + "step": 559 + }, + { + "epoch": 0.01, + "learning_rate": 9.564474807856533e-07, + "loss": 1.1055, + "step": 560 + }, + { + "epoch": 0.01, + "learning_rate": 9.581554227156277e-07, + "loss": 0.8066, + "step": 561 + }, + { + "epoch": 0.01, + "learning_rate": 9.59863364645602e-07, + "loss": 0.8984, + "step": 562 + }, + { + "epoch": 0.01, + "learning_rate": 9.615713065755764e-07, + "loss": 0.9697, + "step": 563 + }, + { + "epoch": 0.01, + "learning_rate": 9.632792485055508e-07, + "loss": 0.9766, + "step": 564 + }, + { + "epoch": 0.01, + "learning_rate": 9.64987190435525e-07, + "loss": 1.0391, + "step": 565 + }, + { + "epoch": 0.01, + "learning_rate": 9.666951323654995e-07, + "loss": 0.8633, + "step": 566 + }, + { + "epoch": 0.01, + "learning_rate": 9.68403074295474e-07, + "loss": 1.002, + "step": 567 + }, + { + "epoch": 0.01, + "learning_rate": 9.701110162254484e-07, + "loss": 0.9912, + "step": 568 + }, + { + "epoch": 0.01, + "learning_rate": 9.718189581554226e-07, + "loss": 1.0107, + "step": 569 + }, + { + "epoch": 0.01, + "learning_rate": 9.73526900085397e-07, + "loss": 0.9365, + "step": 570 + }, + { + "epoch": 0.01, + "learning_rate": 9.752348420153715e-07, + "loss": 0.9604, + "step": 571 + }, + { + "epoch": 0.01, + "learning_rate": 9.769427839453457e-07, + "loss": 0.709, + "step": 572 + }, + { + "epoch": 0.01, + "learning_rate": 9.786507258753202e-07, + "loss": 0.8633, + "step": 573 + }, + { + "epoch": 0.01, + "learning_rate": 9.803586678052946e-07, + "loss": 1.0596, + "step": 574 + }, + { + "epoch": 0.01, + "learning_rate": 9.82066609735269e-07, + "loss": 1.1348, + "step": 575 + }, + { + "epoch": 0.01, + "learning_rate": 9.837745516652433e-07, + "loss": 1.0977, + "step": 576 + }, + { + "epoch": 0.01, + "learning_rate": 9.854824935952177e-07, + "loss": 0.7944, + "step": 577 + }, + { + "epoch": 0.01, + "learning_rate": 9.871904355251922e-07, + "loss": 0.9824, + "step": 578 + }, + { + "epoch": 0.01, + "learning_rate": 9.888983774551664e-07, + "loss": 1.0898, + "step": 579 + }, + { + "epoch": 0.01, + "learning_rate": 9.906063193851408e-07, + "loss": 0.8818, + "step": 580 + }, + { + "epoch": 0.01, + "learning_rate": 9.923142613151153e-07, + "loss": 1.1143, + "step": 581 + }, + { + "epoch": 0.01, + "learning_rate": 9.940222032450897e-07, + "loss": 0.8672, + "step": 582 + }, + { + "epoch": 0.01, + "learning_rate": 9.95730145175064e-07, + "loss": 1.0283, + "step": 583 + }, + { + "epoch": 0.01, + "learning_rate": 9.974380871050384e-07, + "loss": 0.8799, + "step": 584 + }, + { + "epoch": 0.01, + "learning_rate": 9.991460290350128e-07, + "loss": 1.1914, + "step": 585 + }, + { + "epoch": 0.02, + "learning_rate": 1.0008539709649873e-06, + "loss": 0.8599, + "step": 586 + }, + { + "epoch": 0.02, + "learning_rate": 1.0025619128949615e-06, + "loss": 1.0684, + "step": 587 + }, + { + "epoch": 0.02, + "learning_rate": 1.004269854824936e-06, + "loss": 1.001, + "step": 588 + }, + { + "epoch": 0.02, + "learning_rate": 1.0059777967549104e-06, + "loss": 0.9033, + "step": 589 + }, + { + "epoch": 0.02, + "learning_rate": 1.0076857386848846e-06, + "loss": 1.1318, + "step": 590 + }, + { + "epoch": 0.02, + "learning_rate": 1.009393680614859e-06, + "loss": 0.8853, + "step": 591 + }, + { + "epoch": 0.02, + "learning_rate": 1.0111016225448335e-06, + "loss": 0.9932, + "step": 592 + }, + { + "epoch": 0.02, + "learning_rate": 1.0128095644748077e-06, + "loss": 0.873, + "step": 593 + }, + { + "epoch": 0.02, + "learning_rate": 1.0145175064047822e-06, + "loss": 1.0547, + "step": 594 + }, + { + "epoch": 0.02, + "learning_rate": 1.0162254483347566e-06, + "loss": 0.9053, + "step": 595 + }, + { + "epoch": 0.02, + "learning_rate": 1.0179333902647309e-06, + "loss": 0.9551, + "step": 596 + }, + { + "epoch": 0.02, + "learning_rate": 1.0196413321947053e-06, + "loss": 1.0186, + "step": 597 + }, + { + "epoch": 0.02, + "learning_rate": 1.0213492741246797e-06, + "loss": 0.9121, + "step": 598 + }, + { + "epoch": 0.02, + "learning_rate": 1.023057216054654e-06, + "loss": 1.0146, + "step": 599 + }, + { + "epoch": 0.02, + "learning_rate": 1.0247651579846284e-06, + "loss": 1.1279, + "step": 600 + }, + { + "epoch": 0.02, + "learning_rate": 1.0264730999146029e-06, + "loss": 0.9238, + "step": 601 + }, + { + "epoch": 0.02, + "learning_rate": 1.0281810418445773e-06, + "loss": 1.0566, + "step": 602 + }, + { + "epoch": 0.02, + "learning_rate": 1.0298889837745517e-06, + "loss": 0.897, + "step": 603 + }, + { + "epoch": 0.02, + "learning_rate": 1.031596925704526e-06, + "loss": 0.9668, + "step": 604 + }, + { + "epoch": 0.02, + "learning_rate": 1.0333048676345004e-06, + "loss": 0.8691, + "step": 605 + }, + { + "epoch": 0.02, + "learning_rate": 1.0350128095644749e-06, + "loss": 0.8613, + "step": 606 + }, + { + "epoch": 0.02, + "learning_rate": 1.036720751494449e-06, + "loss": 1.1328, + "step": 607 + }, + { + "epoch": 0.02, + "learning_rate": 1.0384286934244235e-06, + "loss": 1.043, + "step": 608 + }, + { + "epoch": 0.02, + "learning_rate": 1.040136635354398e-06, + "loss": 0.7407, + "step": 609 + }, + { + "epoch": 0.02, + "learning_rate": 1.0418445772843722e-06, + "loss": 1.1055, + "step": 610 + }, + { + "epoch": 0.02, + "learning_rate": 1.0435525192143466e-06, + "loss": 1.042, + "step": 611 + }, + { + "epoch": 0.02, + "learning_rate": 1.045260461144321e-06, + "loss": 1.0234, + "step": 612 + }, + { + "epoch": 0.02, + "learning_rate": 1.0469684030742953e-06, + "loss": 1.0381, + "step": 613 + }, + { + "epoch": 0.02, + "learning_rate": 1.0486763450042698e-06, + "loss": 0.9014, + "step": 614 + }, + { + "epoch": 0.02, + "learning_rate": 1.050384286934244e-06, + "loss": 0.9463, + "step": 615 + }, + { + "epoch": 0.02, + "learning_rate": 1.0520922288642186e-06, + "loss": 1.1914, + "step": 616 + }, + { + "epoch": 0.02, + "learning_rate": 1.053800170794193e-06, + "loss": 0.9873, + "step": 617 + }, + { + "epoch": 0.02, + "learning_rate": 1.0555081127241673e-06, + "loss": 0.9131, + "step": 618 + }, + { + "epoch": 0.02, + "learning_rate": 1.0572160546541418e-06, + "loss": 1.1064, + "step": 619 + }, + { + "epoch": 0.02, + "learning_rate": 1.0589239965841162e-06, + "loss": 1.1885, + "step": 620 + }, + { + "epoch": 0.02, + "learning_rate": 1.0606319385140904e-06, + "loss": 0.9678, + "step": 621 + }, + { + "epoch": 0.02, + "learning_rate": 1.0623398804440649e-06, + "loss": 0.9121, + "step": 622 + }, + { + "epoch": 0.02, + "learning_rate": 1.0640478223740393e-06, + "loss": 0.9619, + "step": 623 + }, + { + "epoch": 0.02, + "learning_rate": 1.0657557643040135e-06, + "loss": 1.1855, + "step": 624 + }, + { + "epoch": 0.02, + "learning_rate": 1.067463706233988e-06, + "loss": 1.0947, + "step": 625 + }, + { + "epoch": 0.02, + "learning_rate": 1.0691716481639624e-06, + "loss": 1.0938, + "step": 626 + }, + { + "epoch": 0.02, + "learning_rate": 1.0708795900939367e-06, + "loss": 0.6758, + "step": 627 + }, + { + "epoch": 0.02, + "learning_rate": 1.072587532023911e-06, + "loss": 0.9932, + "step": 628 + }, + { + "epoch": 0.02, + "learning_rate": 1.0742954739538853e-06, + "loss": 0.9453, + "step": 629 + }, + { + "epoch": 0.02, + "learning_rate": 1.07600341588386e-06, + "loss": 0.9561, + "step": 630 + }, + { + "epoch": 0.02, + "learning_rate": 1.0777113578138344e-06, + "loss": 0.7319, + "step": 631 + }, + { + "epoch": 0.02, + "learning_rate": 1.0794192997438087e-06, + "loss": 0.9922, + "step": 632 + }, + { + "epoch": 0.02, + "learning_rate": 1.081127241673783e-06, + "loss": 1.0449, + "step": 633 + }, + { + "epoch": 0.02, + "learning_rate": 1.0828351836037575e-06, + "loss": 1.0742, + "step": 634 + }, + { + "epoch": 0.02, + "learning_rate": 1.0845431255337318e-06, + "loss": 1.1143, + "step": 635 + }, + { + "epoch": 0.02, + "learning_rate": 1.0862510674637062e-06, + "loss": 1.1494, + "step": 636 + }, + { + "epoch": 0.02, + "learning_rate": 1.0879590093936807e-06, + "loss": 0.8838, + "step": 637 + }, + { + "epoch": 0.02, + "learning_rate": 1.0896669513236549e-06, + "loss": 0.9619, + "step": 638 + }, + { + "epoch": 0.02, + "learning_rate": 1.0913748932536293e-06, + "loss": 0.915, + "step": 639 + }, + { + "epoch": 0.02, + "learning_rate": 1.0930828351836038e-06, + "loss": 0.9707, + "step": 640 + }, + { + "epoch": 0.02, + "learning_rate": 1.094790777113578e-06, + "loss": 1.0088, + "step": 641 + }, + { + "epoch": 0.02, + "learning_rate": 1.0964987190435524e-06, + "loss": 1.1182, + "step": 642 + }, + { + "epoch": 0.02, + "learning_rate": 1.0982066609735267e-06, + "loss": 1.1133, + "step": 643 + }, + { + "epoch": 0.02, + "learning_rate": 1.0999146029035011e-06, + "loss": 1.0312, + "step": 644 + }, + { + "epoch": 0.02, + "learning_rate": 1.1016225448334758e-06, + "loss": 0.9873, + "step": 645 + }, + { + "epoch": 0.02, + "learning_rate": 1.10333048676345e-06, + "loss": 1.1318, + "step": 646 + }, + { + "epoch": 0.02, + "learning_rate": 1.1050384286934244e-06, + "loss": 0.9844, + "step": 647 + }, + { + "epoch": 0.02, + "learning_rate": 1.1067463706233989e-06, + "loss": 0.9072, + "step": 648 + }, + { + "epoch": 0.02, + "learning_rate": 1.1084543125533731e-06, + "loss": 1.0332, + "step": 649 + }, + { + "epoch": 0.02, + "learning_rate": 1.1101622544833476e-06, + "loss": 0.8164, + "step": 650 + }, + { + "epoch": 0.02, + "learning_rate": 1.111870196413322e-06, + "loss": 0.9629, + "step": 651 + }, + { + "epoch": 0.02, + "learning_rate": 1.1135781383432962e-06, + "loss": 0.6284, + "step": 652 + }, + { + "epoch": 0.02, + "learning_rate": 1.1152860802732707e-06, + "loss": 0.8906, + "step": 653 + }, + { + "epoch": 0.02, + "learning_rate": 1.1169940222032451e-06, + "loss": 1.0557, + "step": 654 + }, + { + "epoch": 0.02, + "learning_rate": 1.1187019641332193e-06, + "loss": 1.0605, + "step": 655 + }, + { + "epoch": 0.02, + "learning_rate": 1.1204099060631938e-06, + "loss": 1.2363, + "step": 656 + }, + { + "epoch": 0.02, + "learning_rate": 1.122117847993168e-06, + "loss": 1.0537, + "step": 657 + }, + { + "epoch": 0.02, + "learning_rate": 1.1238257899231425e-06, + "loss": 0.9785, + "step": 658 + }, + { + "epoch": 0.02, + "learning_rate": 1.125533731853117e-06, + "loss": 0.9521, + "step": 659 + }, + { + "epoch": 0.02, + "learning_rate": 1.1272416737830913e-06, + "loss": 1.0654, + "step": 660 + }, + { + "epoch": 0.02, + "learning_rate": 1.1289496157130658e-06, + "loss": 0.6738, + "step": 661 + }, + { + "epoch": 0.02, + "learning_rate": 1.1306575576430402e-06, + "loss": 0.7402, + "step": 662 + }, + { + "epoch": 0.02, + "learning_rate": 1.1323654995730145e-06, + "loss": 1.084, + "step": 663 + }, + { + "epoch": 0.02, + "learning_rate": 1.134073441502989e-06, + "loss": 0.9072, + "step": 664 + }, + { + "epoch": 0.02, + "learning_rate": 1.1357813834329633e-06, + "loss": 1.0918, + "step": 665 + }, + { + "epoch": 0.02, + "learning_rate": 1.1374893253629376e-06, + "loss": 0.8584, + "step": 666 + }, + { + "epoch": 0.02, + "learning_rate": 1.139197267292912e-06, + "loss": 1.1641, + "step": 667 + }, + { + "epoch": 0.02, + "learning_rate": 1.1409052092228865e-06, + "loss": 0.8535, + "step": 668 + }, + { + "epoch": 0.02, + "learning_rate": 1.1426131511528607e-06, + "loss": 0.9209, + "step": 669 + }, + { + "epoch": 0.02, + "learning_rate": 1.1443210930828351e-06, + "loss": 0.9756, + "step": 670 + }, + { + "epoch": 0.02, + "learning_rate": 1.1460290350128094e-06, + "loss": 1.1562, + "step": 671 + }, + { + "epoch": 0.02, + "learning_rate": 1.1477369769427838e-06, + "loss": 0.9678, + "step": 672 + }, + { + "epoch": 0.02, + "learning_rate": 1.1494449188727582e-06, + "loss": 0.8994, + "step": 673 + }, + { + "epoch": 0.02, + "learning_rate": 1.1511528608027325e-06, + "loss": 0.9141, + "step": 674 + }, + { + "epoch": 0.02, + "learning_rate": 1.1528608027327071e-06, + "loss": 0.8994, + "step": 675 + }, + { + "epoch": 0.02, + "learning_rate": 1.1545687446626816e-06, + "loss": 1.166, + "step": 676 + }, + { + "epoch": 0.02, + "learning_rate": 1.1562766865926558e-06, + "loss": 0.9707, + "step": 677 + }, + { + "epoch": 0.02, + "learning_rate": 1.1579846285226302e-06, + "loss": 1.1758, + "step": 678 + }, + { + "epoch": 0.02, + "learning_rate": 1.1596925704526047e-06, + "loss": 0.9434, + "step": 679 + }, + { + "epoch": 0.02, + "learning_rate": 1.161400512382579e-06, + "loss": 1.0176, + "step": 680 + }, + { + "epoch": 0.02, + "learning_rate": 1.1631084543125534e-06, + "loss": 1.2666, + "step": 681 + }, + { + "epoch": 0.02, + "learning_rate": 1.1648163962425278e-06, + "loss": 1.0596, + "step": 682 + }, + { + "epoch": 0.02, + "learning_rate": 1.166524338172502e-06, + "loss": 0.9473, + "step": 683 + }, + { + "epoch": 0.02, + "learning_rate": 1.1682322801024765e-06, + "loss": 1.0088, + "step": 684 + }, + { + "epoch": 0.02, + "learning_rate": 1.1699402220324507e-06, + "loss": 0.9141, + "step": 685 + }, + { + "epoch": 0.02, + "learning_rate": 1.1716481639624251e-06, + "loss": 1.0713, + "step": 686 + }, + { + "epoch": 0.02, + "learning_rate": 1.1733561058923996e-06, + "loss": 0.9824, + "step": 687 + }, + { + "epoch": 0.02, + "learning_rate": 1.1750640478223738e-06, + "loss": 0.9385, + "step": 688 + }, + { + "epoch": 0.02, + "learning_rate": 1.1767719897523483e-06, + "loss": 1.0166, + "step": 689 + }, + { + "epoch": 0.02, + "learning_rate": 1.178479931682323e-06, + "loss": 0.8662, + "step": 690 + }, + { + "epoch": 0.02, + "learning_rate": 1.1801878736122971e-06, + "loss": 0.9346, + "step": 691 + }, + { + "epoch": 0.02, + "learning_rate": 1.1818958155422716e-06, + "loss": 0.7891, + "step": 692 + }, + { + "epoch": 0.02, + "learning_rate": 1.183603757472246e-06, + "loss": 1.0342, + "step": 693 + }, + { + "epoch": 0.02, + "learning_rate": 1.1853116994022203e-06, + "loss": 0.8042, + "step": 694 + }, + { + "epoch": 0.02, + "learning_rate": 1.1870196413321947e-06, + "loss": 1.0547, + "step": 695 + }, + { + "epoch": 0.02, + "learning_rate": 1.1887275832621691e-06, + "loss": 1.0205, + "step": 696 + }, + { + "epoch": 0.02, + "learning_rate": 1.1904355251921434e-06, + "loss": 0.9878, + "step": 697 + }, + { + "epoch": 0.02, + "learning_rate": 1.1921434671221178e-06, + "loss": 0.9795, + "step": 698 + }, + { + "epoch": 0.02, + "learning_rate": 1.193851409052092e-06, + "loss": 0.9092, + "step": 699 + }, + { + "epoch": 0.02, + "learning_rate": 1.1955593509820665e-06, + "loss": 0.8379, + "step": 700 + }, + { + "epoch": 0.02, + "learning_rate": 1.197267292912041e-06, + "loss": 0.9785, + "step": 701 + }, + { + "epoch": 0.02, + "learning_rate": 1.1989752348420152e-06, + "loss": 1.0195, + "step": 702 + }, + { + "epoch": 0.02, + "learning_rate": 1.2006831767719896e-06, + "loss": 0.8945, + "step": 703 + }, + { + "epoch": 0.02, + "learning_rate": 1.202391118701964e-06, + "loss": 1.0625, + "step": 704 + }, + { + "epoch": 0.02, + "learning_rate": 1.2040990606319385e-06, + "loss": 0.8818, + "step": 705 + }, + { + "epoch": 0.02, + "learning_rate": 1.205807002561913e-06, + "loss": 0.7749, + "step": 706 + }, + { + "epoch": 0.02, + "learning_rate": 1.2075149444918874e-06, + "loss": 1.0859, + "step": 707 + }, + { + "epoch": 0.02, + "learning_rate": 1.2092228864218616e-06, + "loss": 1.1035, + "step": 708 + }, + { + "epoch": 0.02, + "learning_rate": 1.210930828351836e-06, + "loss": 1.083, + "step": 709 + }, + { + "epoch": 0.02, + "learning_rate": 1.2126387702818105e-06, + "loss": 1.1172, + "step": 710 + }, + { + "epoch": 0.02, + "learning_rate": 1.2143467122117847e-06, + "loss": 0.8496, + "step": 711 + }, + { + "epoch": 0.02, + "learning_rate": 1.2160546541417592e-06, + "loss": 0.8213, + "step": 712 + }, + { + "epoch": 0.02, + "learning_rate": 1.2177625960717334e-06, + "loss": 1.0283, + "step": 713 + }, + { + "epoch": 0.02, + "learning_rate": 1.2194705380017078e-06, + "loss": 1.0127, + "step": 714 + }, + { + "epoch": 0.02, + "learning_rate": 1.2211784799316823e-06, + "loss": 0.998, + "step": 715 + }, + { + "epoch": 0.02, + "learning_rate": 1.2228864218616565e-06, + "loss": 1.0264, + "step": 716 + }, + { + "epoch": 0.02, + "learning_rate": 1.224594363791631e-06, + "loss": 0.9131, + "step": 717 + }, + { + "epoch": 0.02, + "learning_rate": 1.2263023057216054e-06, + "loss": 0.9854, + "step": 718 + }, + { + "epoch": 0.02, + "learning_rate": 1.2280102476515798e-06, + "loss": 0.9233, + "step": 719 + }, + { + "epoch": 0.02, + "learning_rate": 1.2297181895815543e-06, + "loss": 1.0811, + "step": 720 + }, + { + "epoch": 0.02, + "learning_rate": 1.2314261315115287e-06, + "loss": 0.8799, + "step": 721 + }, + { + "epoch": 0.02, + "learning_rate": 1.233134073441503e-06, + "loss": 1.0508, + "step": 722 + }, + { + "epoch": 0.02, + "learning_rate": 1.2348420153714774e-06, + "loss": 1.0869, + "step": 723 + }, + { + "epoch": 0.02, + "learning_rate": 1.2365499573014518e-06, + "loss": 1.002, + "step": 724 + }, + { + "epoch": 0.02, + "learning_rate": 1.238257899231426e-06, + "loss": 1.0117, + "step": 725 + }, + { + "epoch": 0.02, + "learning_rate": 1.2399658411614005e-06, + "loss": 0.8574, + "step": 726 + }, + { + "epoch": 0.02, + "learning_rate": 1.2416737830913747e-06, + "loss": 1.3379, + "step": 727 + }, + { + "epoch": 0.02, + "learning_rate": 1.2433817250213492e-06, + "loss": 0.9717, + "step": 728 + }, + { + "epoch": 0.02, + "learning_rate": 1.2450896669513236e-06, + "loss": 0.8809, + "step": 729 + }, + { + "epoch": 0.02, + "learning_rate": 1.2467976088812978e-06, + "loss": 0.8301, + "step": 730 + }, + { + "epoch": 0.02, + "learning_rate": 1.2485055508112723e-06, + "loss": 0.7637, + "step": 731 + }, + { + "epoch": 0.02, + "learning_rate": 1.2502134927412467e-06, + "loss": 0.6958, + "step": 732 + }, + { + "epoch": 0.02, + "learning_rate": 1.251921434671221e-06, + "loss": 1.1045, + "step": 733 + }, + { + "epoch": 0.02, + "learning_rate": 1.2536293766011956e-06, + "loss": 0.8911, + "step": 734 + }, + { + "epoch": 0.02, + "learning_rate": 1.25533731853117e-06, + "loss": 0.8438, + "step": 735 + }, + { + "epoch": 0.02, + "learning_rate": 1.2570452604611443e-06, + "loss": 1.1592, + "step": 736 + }, + { + "epoch": 0.02, + "learning_rate": 1.2587532023911187e-06, + "loss": 0.8154, + "step": 737 + }, + { + "epoch": 0.02, + "learning_rate": 1.2604611443210932e-06, + "loss": 0.9756, + "step": 738 + }, + { + "epoch": 0.02, + "learning_rate": 1.2621690862510674e-06, + "loss": 1.0635, + "step": 739 + }, + { + "epoch": 0.02, + "learning_rate": 1.2638770281810418e-06, + "loss": 0.9199, + "step": 740 + }, + { + "epoch": 0.02, + "learning_rate": 1.265584970111016e-06, + "loss": 0.7734, + "step": 741 + }, + { + "epoch": 0.02, + "learning_rate": 1.2672929120409905e-06, + "loss": 1.0293, + "step": 742 + }, + { + "epoch": 0.02, + "learning_rate": 1.269000853970965e-06, + "loss": 0.9814, + "step": 743 + }, + { + "epoch": 0.02, + "learning_rate": 1.2707087959009392e-06, + "loss": 0.9409, + "step": 744 + }, + { + "epoch": 0.02, + "learning_rate": 1.2724167378309136e-06, + "loss": 0.998, + "step": 745 + }, + { + "epoch": 0.02, + "learning_rate": 1.274124679760888e-06, + "loss": 1.0283, + "step": 746 + }, + { + "epoch": 0.02, + "learning_rate": 1.2758326216908623e-06, + "loss": 1.1074, + "step": 747 + }, + { + "epoch": 0.02, + "learning_rate": 1.2775405636208367e-06, + "loss": 0.6064, + "step": 748 + }, + { + "epoch": 0.02, + "learning_rate": 1.2792485055508114e-06, + "loss": 0.8022, + "step": 749 + }, + { + "epoch": 0.02, + "learning_rate": 1.2809564474807856e-06, + "loss": 1.0547, + "step": 750 + }, + { + "epoch": 0.02, + "learning_rate": 1.28266438941076e-06, + "loss": 0.9316, + "step": 751 + }, + { + "epoch": 0.02, + "learning_rate": 1.2843723313407345e-06, + "loss": 1.085, + "step": 752 + }, + { + "epoch": 0.02, + "learning_rate": 1.2860802732707087e-06, + "loss": 0.8472, + "step": 753 + }, + { + "epoch": 0.02, + "learning_rate": 1.2877882152006832e-06, + "loss": 1.0645, + "step": 754 + }, + { + "epoch": 0.02, + "learning_rate": 1.2894961571306574e-06, + "loss": 1.0449, + "step": 755 + }, + { + "epoch": 0.02, + "learning_rate": 1.2912040990606319e-06, + "loss": 1.0264, + "step": 756 + }, + { + "epoch": 0.02, + "learning_rate": 1.2929120409906063e-06, + "loss": 1.0244, + "step": 757 + }, + { + "epoch": 0.02, + "learning_rate": 1.2946199829205805e-06, + "loss": 0.8545, + "step": 758 + }, + { + "epoch": 0.02, + "learning_rate": 1.296327924850555e-06, + "loss": 1.1943, + "step": 759 + }, + { + "epoch": 0.02, + "learning_rate": 1.2980358667805294e-06, + "loss": 0.998, + "step": 760 + }, + { + "epoch": 0.02, + "learning_rate": 1.2997438087105036e-06, + "loss": 0.9805, + "step": 761 + }, + { + "epoch": 0.02, + "learning_rate": 1.301451750640478e-06, + "loss": 1.1426, + "step": 762 + }, + { + "epoch": 0.02, + "learning_rate": 1.3031596925704525e-06, + "loss": 1.1133, + "step": 763 + }, + { + "epoch": 0.02, + "learning_rate": 1.304867634500427e-06, + "loss": 1.1699, + "step": 764 + }, + { + "epoch": 0.02, + "learning_rate": 1.3065755764304014e-06, + "loss": 0.9077, + "step": 765 + }, + { + "epoch": 0.02, + "learning_rate": 1.3082835183603758e-06, + "loss": 0.8193, + "step": 766 + }, + { + "epoch": 0.02, + "learning_rate": 1.30999146029035e-06, + "loss": 0.7754, + "step": 767 + }, + { + "epoch": 0.02, + "learning_rate": 1.3116994022203245e-06, + "loss": 1.376, + "step": 768 + }, + { + "epoch": 0.02, + "learning_rate": 1.313407344150299e-06, + "loss": 1.0488, + "step": 769 + }, + { + "epoch": 0.02, + "learning_rate": 1.3151152860802732e-06, + "loss": 1.043, + "step": 770 + }, + { + "epoch": 0.02, + "learning_rate": 1.3168232280102476e-06, + "loss": 0.9512, + "step": 771 + }, + { + "epoch": 0.02, + "learning_rate": 1.3185311699402219e-06, + "loss": 0.9775, + "step": 772 + }, + { + "epoch": 0.02, + "learning_rate": 1.3202391118701963e-06, + "loss": 1.0596, + "step": 773 + }, + { + "epoch": 0.02, + "learning_rate": 1.3219470538001707e-06, + "loss": 1.1182, + "step": 774 + }, + { + "epoch": 0.02, + "learning_rate": 1.323654995730145e-06, + "loss": 0.9014, + "step": 775 + }, + { + "epoch": 0.02, + "learning_rate": 1.3253629376601194e-06, + "loss": 1.0137, + "step": 776 + }, + { + "epoch": 0.02, + "learning_rate": 1.3270708795900939e-06, + "loss": 1.1074, + "step": 777 + }, + { + "epoch": 0.02, + "learning_rate": 1.328778821520068e-06, + "loss": 0.8018, + "step": 778 + }, + { + "epoch": 0.02, + "learning_rate": 1.3304867634500427e-06, + "loss": 1.0273, + "step": 779 + }, + { + "epoch": 0.02, + "learning_rate": 1.3321947053800172e-06, + "loss": 1.123, + "step": 780 + }, + { + "epoch": 0.02, + "learning_rate": 1.3339026473099914e-06, + "loss": 1.1133, + "step": 781 + }, + { + "epoch": 0.02, + "learning_rate": 1.3356105892399659e-06, + "loss": 1.0449, + "step": 782 + }, + { + "epoch": 0.02, + "learning_rate": 1.3373185311699403e-06, + "loss": 1.001, + "step": 783 + }, + { + "epoch": 0.02, + "learning_rate": 1.3390264730999145e-06, + "loss": 0.8457, + "step": 784 + }, + { + "epoch": 0.02, + "learning_rate": 1.340734415029889e-06, + "loss": 1.0039, + "step": 785 + }, + { + "epoch": 0.02, + "learning_rate": 1.3424423569598632e-06, + "loss": 0.959, + "step": 786 + }, + { + "epoch": 0.02, + "learning_rate": 1.3441502988898376e-06, + "loss": 1.0107, + "step": 787 + }, + { + "epoch": 0.02, + "learning_rate": 1.345858240819812e-06, + "loss": 0.8447, + "step": 788 + }, + { + "epoch": 0.02, + "learning_rate": 1.3475661827497863e-06, + "loss": 1.0781, + "step": 789 + }, + { + "epoch": 0.02, + "learning_rate": 1.3492741246797608e-06, + "loss": 0.9902, + "step": 790 + }, + { + "epoch": 0.02, + "learning_rate": 1.3509820666097352e-06, + "loss": 1.0771, + "step": 791 + }, + { + "epoch": 0.02, + "learning_rate": 1.3526900085397094e-06, + "loss": 1.0342, + "step": 792 + }, + { + "epoch": 0.02, + "learning_rate": 1.3543979504696839e-06, + "loss": 1.0869, + "step": 793 + }, + { + "epoch": 0.02, + "learning_rate": 1.3561058923996585e-06, + "loss": 0.9365, + "step": 794 + }, + { + "epoch": 0.02, + "learning_rate": 1.3578138343296328e-06, + "loss": 1.0195, + "step": 795 + }, + { + "epoch": 0.02, + "learning_rate": 1.3595217762596072e-06, + "loss": 1.04, + "step": 796 + }, + { + "epoch": 0.02, + "learning_rate": 1.3612297181895816e-06, + "loss": 0.9233, + "step": 797 + }, + { + "epoch": 0.02, + "learning_rate": 1.3629376601195559e-06, + "loss": 1.1133, + "step": 798 + }, + { + "epoch": 0.02, + "learning_rate": 1.3646456020495303e-06, + "loss": 0.9268, + "step": 799 + }, + { + "epoch": 0.02, + "learning_rate": 1.3663535439795045e-06, + "loss": 1.1152, + "step": 800 + }, + { + "epoch": 0.02, + "learning_rate": 1.368061485909479e-06, + "loss": 0.9072, + "step": 801 + }, + { + "epoch": 0.02, + "learning_rate": 1.3697694278394534e-06, + "loss": 0.9512, + "step": 802 + }, + { + "epoch": 0.02, + "learning_rate": 1.3714773697694277e-06, + "loss": 1.0371, + "step": 803 + }, + { + "epoch": 0.02, + "learning_rate": 1.3731853116994021e-06, + "loss": 0.8809, + "step": 804 + }, + { + "epoch": 0.02, + "learning_rate": 1.3748932536293765e-06, + "loss": 0.7393, + "step": 805 + }, + { + "epoch": 0.02, + "learning_rate": 1.3766011955593508e-06, + "loss": 1.1621, + "step": 806 + }, + { + "epoch": 0.02, + "learning_rate": 1.3783091374893252e-06, + "loss": 0.9854, + "step": 807 + }, + { + "epoch": 0.02, + "learning_rate": 1.3800170794192999e-06, + "loss": 0.728, + "step": 808 + }, + { + "epoch": 0.02, + "learning_rate": 1.381725021349274e-06, + "loss": 0.8242, + "step": 809 + }, + { + "epoch": 0.02, + "learning_rate": 1.3834329632792485e-06, + "loss": 0.8809, + "step": 810 + }, + { + "epoch": 0.02, + "learning_rate": 1.385140905209223e-06, + "loss": 0.834, + "step": 811 + }, + { + "epoch": 0.02, + "learning_rate": 1.3868488471391972e-06, + "loss": 0.8906, + "step": 812 + }, + { + "epoch": 0.02, + "learning_rate": 1.3885567890691717e-06, + "loss": 0.9229, + "step": 813 + }, + { + "epoch": 0.02, + "learning_rate": 1.3902647309991459e-06, + "loss": 0.9111, + "step": 814 + }, + { + "epoch": 0.02, + "learning_rate": 1.3919726729291203e-06, + "loss": 0.9824, + "step": 815 + }, + { + "epoch": 0.02, + "learning_rate": 1.3936806148590948e-06, + "loss": 1.04, + "step": 816 + }, + { + "epoch": 0.02, + "learning_rate": 1.395388556789069e-06, + "loss": 0.8945, + "step": 817 + }, + { + "epoch": 0.02, + "learning_rate": 1.3970964987190434e-06, + "loss": 1.0371, + "step": 818 + }, + { + "epoch": 0.02, + "learning_rate": 1.3988044406490179e-06, + "loss": 1.0391, + "step": 819 + }, + { + "epoch": 0.02, + "learning_rate": 1.4005123825789921e-06, + "loss": 0.9834, + "step": 820 + }, + { + "epoch": 0.02, + "learning_rate": 1.4022203245089666e-06, + "loss": 1.0117, + "step": 821 + }, + { + "epoch": 0.02, + "learning_rate": 1.403928266438941e-06, + "loss": 1.1016, + "step": 822 + }, + { + "epoch": 0.02, + "learning_rate": 1.4056362083689154e-06, + "loss": 0.9141, + "step": 823 + }, + { + "epoch": 0.02, + "learning_rate": 1.4073441502988899e-06, + "loss": 0.8418, + "step": 824 + }, + { + "epoch": 0.02, + "learning_rate": 1.4090520922288643e-06, + "loss": 0.8779, + "step": 825 + }, + { + "epoch": 0.02, + "learning_rate": 1.4107600341588386e-06, + "loss": 0.9258, + "step": 826 + }, + { + "epoch": 0.02, + "learning_rate": 1.412467976088813e-06, + "loss": 1.0723, + "step": 827 + }, + { + "epoch": 0.02, + "learning_rate": 1.4141759180187872e-06, + "loss": 1.0674, + "step": 828 + }, + { + "epoch": 0.02, + "learning_rate": 1.4158838599487617e-06, + "loss": 1.2344, + "step": 829 + }, + { + "epoch": 0.02, + "learning_rate": 1.4175918018787361e-06, + "loss": 0.8555, + "step": 830 + }, + { + "epoch": 0.02, + "learning_rate": 1.4192997438087103e-06, + "loss": 1.168, + "step": 831 + }, + { + "epoch": 0.02, + "learning_rate": 1.4210076857386848e-06, + "loss": 0.8145, + "step": 832 + }, + { + "epoch": 0.02, + "learning_rate": 1.4227156276686592e-06, + "loss": 1.208, + "step": 833 + }, + { + "epoch": 0.02, + "learning_rate": 1.4244235695986335e-06, + "loss": 0.9678, + "step": 834 + }, + { + "epoch": 0.02, + "learning_rate": 1.426131511528608e-06, + "loss": 1.0273, + "step": 835 + }, + { + "epoch": 0.02, + "learning_rate": 1.4278394534585823e-06, + "loss": 1.0703, + "step": 836 + }, + { + "epoch": 0.02, + "learning_rate": 1.4295473953885566e-06, + "loss": 1.1152, + "step": 837 + }, + { + "epoch": 0.02, + "learning_rate": 1.4312553373185312e-06, + "loss": 1.001, + "step": 838 + }, + { + "epoch": 0.02, + "learning_rate": 1.4329632792485057e-06, + "loss": 1.0566, + "step": 839 + }, + { + "epoch": 0.02, + "learning_rate": 1.43467122117848e-06, + "loss": 0.8623, + "step": 840 + }, + { + "epoch": 0.02, + "learning_rate": 1.4363791631084543e-06, + "loss": 0.9131, + "step": 841 + }, + { + "epoch": 0.02, + "learning_rate": 1.4380871050384286e-06, + "loss": 1.0273, + "step": 842 + }, + { + "epoch": 0.02, + "learning_rate": 1.439795046968403e-06, + "loss": 0.9912, + "step": 843 + }, + { + "epoch": 0.02, + "learning_rate": 1.4415029888983775e-06, + "loss": 1.0156, + "step": 844 + }, + { + "epoch": 0.02, + "learning_rate": 1.4432109308283517e-06, + "loss": 0.7725, + "step": 845 + }, + { + "epoch": 0.02, + "learning_rate": 1.4449188727583261e-06, + "loss": 0.9414, + "step": 846 + }, + { + "epoch": 0.02, + "learning_rate": 1.4466268146883006e-06, + "loss": 0.8857, + "step": 847 + }, + { + "epoch": 0.02, + "learning_rate": 1.4483347566182748e-06, + "loss": 0.7764, + "step": 848 + }, + { + "epoch": 0.02, + "learning_rate": 1.4500426985482492e-06, + "loss": 1.0166, + "step": 849 + }, + { + "epoch": 0.02, + "learning_rate": 1.4517506404782237e-06, + "loss": 0.8965, + "step": 850 + }, + { + "epoch": 0.02, + "learning_rate": 1.453458582408198e-06, + "loss": 0.9111, + "step": 851 + }, + { + "epoch": 0.02, + "learning_rate": 1.4551665243381724e-06, + "loss": 0.9004, + "step": 852 + }, + { + "epoch": 0.02, + "learning_rate": 1.456874466268147e-06, + "loss": 1.082, + "step": 853 + }, + { + "epoch": 0.02, + "learning_rate": 1.4585824081981212e-06, + "loss": 0.8086, + "step": 854 + }, + { + "epoch": 0.02, + "learning_rate": 1.4602903501280957e-06, + "loss": 0.9932, + "step": 855 + }, + { + "epoch": 0.02, + "learning_rate": 1.46199829205807e-06, + "loss": 0.9355, + "step": 856 + }, + { + "epoch": 0.02, + "learning_rate": 1.4637062339880444e-06, + "loss": 1.0879, + "step": 857 + }, + { + "epoch": 0.02, + "learning_rate": 1.4654141759180188e-06, + "loss": 1.082, + "step": 858 + }, + { + "epoch": 0.02, + "learning_rate": 1.467122117847993e-06, + "loss": 0.834, + "step": 859 + }, + { + "epoch": 0.02, + "learning_rate": 1.4688300597779675e-06, + "loss": 0.8706, + "step": 860 + }, + { + "epoch": 0.02, + "learning_rate": 1.470538001707942e-06, + "loss": 1.0312, + "step": 861 + }, + { + "epoch": 0.02, + "learning_rate": 1.4722459436379161e-06, + "loss": 0.9141, + "step": 862 + }, + { + "epoch": 0.02, + "learning_rate": 1.4739538855678906e-06, + "loss": 1.3086, + "step": 863 + }, + { + "epoch": 0.02, + "learning_rate": 1.475661827497865e-06, + "loss": 0.9463, + "step": 864 + }, + { + "epoch": 0.02, + "learning_rate": 1.4773697694278393e-06, + "loss": 1.0088, + "step": 865 + }, + { + "epoch": 0.02, + "learning_rate": 1.4790777113578137e-06, + "loss": 1.1201, + "step": 866 + }, + { + "epoch": 0.02, + "learning_rate": 1.480785653287788e-06, + "loss": 1.0791, + "step": 867 + }, + { + "epoch": 0.02, + "learning_rate": 1.4824935952177626e-06, + "loss": 0.8369, + "step": 868 + }, + { + "epoch": 0.02, + "learning_rate": 1.484201537147737e-06, + "loss": 0.9839, + "step": 869 + }, + { + "epoch": 0.02, + "learning_rate": 1.4859094790777113e-06, + "loss": 0.9873, + "step": 870 + }, + { + "epoch": 0.02, + "learning_rate": 1.4876174210076857e-06, + "loss": 0.9912, + "step": 871 + }, + { + "epoch": 0.02, + "learning_rate": 1.4893253629376601e-06, + "loss": 1.0078, + "step": 872 + }, + { + "epoch": 0.02, + "learning_rate": 1.4910333048676344e-06, + "loss": 0.9521, + "step": 873 + }, + { + "epoch": 0.02, + "learning_rate": 1.4927412467976088e-06, + "loss": 1.0254, + "step": 874 + }, + { + "epoch": 0.02, + "learning_rate": 1.4944491887275833e-06, + "loss": 1.04, + "step": 875 + }, + { + "epoch": 0.02, + "learning_rate": 1.4961571306575575e-06, + "loss": 0.8369, + "step": 876 + }, + { + "epoch": 0.02, + "learning_rate": 1.497865072587532e-06, + "loss": 1.1191, + "step": 877 + }, + { + "epoch": 0.02, + "learning_rate": 1.4995730145175064e-06, + "loss": 0.9336, + "step": 878 + }, + { + "epoch": 0.02, + "learning_rate": 1.5012809564474806e-06, + "loss": 0.957, + "step": 879 + }, + { + "epoch": 0.02, + "learning_rate": 1.502988898377455e-06, + "loss": 0.8203, + "step": 880 + }, + { + "epoch": 0.02, + "learning_rate": 1.5046968403074293e-06, + "loss": 0.9077, + "step": 881 + }, + { + "epoch": 0.02, + "learning_rate": 1.506404782237404e-06, + "loss": 1.0049, + "step": 882 + }, + { + "epoch": 0.02, + "learning_rate": 1.5081127241673784e-06, + "loss": 1.0254, + "step": 883 + }, + { + "epoch": 0.02, + "learning_rate": 1.5098206660973526e-06, + "loss": 1.085, + "step": 884 + }, + { + "epoch": 0.02, + "learning_rate": 1.511528608027327e-06, + "loss": 0.8916, + "step": 885 + }, + { + "epoch": 0.02, + "learning_rate": 1.5132365499573015e-06, + "loss": 1.1279, + "step": 886 + }, + { + "epoch": 0.02, + "learning_rate": 1.5149444918872757e-06, + "loss": 1.1855, + "step": 887 + }, + { + "epoch": 0.02, + "learning_rate": 1.5166524338172502e-06, + "loss": 1.0742, + "step": 888 + }, + { + "epoch": 0.02, + "learning_rate": 1.5183603757472246e-06, + "loss": 1.0605, + "step": 889 + }, + { + "epoch": 0.02, + "learning_rate": 1.5200683176771988e-06, + "loss": 0.9053, + "step": 890 + }, + { + "epoch": 0.02, + "learning_rate": 1.5217762596071733e-06, + "loss": 1.0137, + "step": 891 + }, + { + "epoch": 0.02, + "learning_rate": 1.5234842015371477e-06, + "loss": 0.8271, + "step": 892 + }, + { + "epoch": 0.02, + "learning_rate": 1.525192143467122e-06, + "loss": 0.9521, + "step": 893 + }, + { + "epoch": 0.02, + "learning_rate": 1.5269000853970964e-06, + "loss": 1.1836, + "step": 894 + }, + { + "epoch": 0.02, + "learning_rate": 1.5286080273270708e-06, + "loss": 1.1328, + "step": 895 + }, + { + "epoch": 0.02, + "learning_rate": 1.530315969257045e-06, + "loss": 1.1211, + "step": 896 + }, + { + "epoch": 0.02, + "learning_rate": 1.5320239111870197e-06, + "loss": 0.8066, + "step": 897 + }, + { + "epoch": 0.02, + "learning_rate": 1.533731853116994e-06, + "loss": 1.124, + "step": 898 + }, + { + "epoch": 0.02, + "learning_rate": 1.5354397950469684e-06, + "loss": 0.9336, + "step": 899 + }, + { + "epoch": 0.02, + "learning_rate": 1.5371477369769428e-06, + "loss": 1.0684, + "step": 900 + }, + { + "epoch": 0.02, + "learning_rate": 1.538855678906917e-06, + "loss": 0.8394, + "step": 901 + }, + { + "epoch": 0.02, + "learning_rate": 1.5405636208368915e-06, + "loss": 0.7148, + "step": 902 + }, + { + "epoch": 0.02, + "learning_rate": 1.542271562766866e-06, + "loss": 0.8916, + "step": 903 + }, + { + "epoch": 0.02, + "learning_rate": 1.5439795046968402e-06, + "loss": 0.8721, + "step": 904 + }, + { + "epoch": 0.02, + "learning_rate": 1.5456874466268146e-06, + "loss": 1.0615, + "step": 905 + }, + { + "epoch": 0.02, + "learning_rate": 1.547395388556789e-06, + "loss": 1.0742, + "step": 906 + }, + { + "epoch": 0.02, + "learning_rate": 1.5491033304867633e-06, + "loss": 1.106, + "step": 907 + }, + { + "epoch": 0.02, + "learning_rate": 1.5508112724167377e-06, + "loss": 0.6533, + "step": 908 + }, + { + "epoch": 0.02, + "learning_rate": 1.5525192143467122e-06, + "loss": 0.8271, + "step": 909 + }, + { + "epoch": 0.02, + "learning_rate": 1.5542271562766864e-06, + "loss": 0.957, + "step": 910 + }, + { + "epoch": 0.02, + "learning_rate": 1.5559350982066608e-06, + "loss": 0.939, + "step": 911 + }, + { + "epoch": 0.02, + "learning_rate": 1.5576430401366353e-06, + "loss": 1.1309, + "step": 912 + }, + { + "epoch": 0.02, + "learning_rate": 1.5593509820666097e-06, + "loss": 0.9258, + "step": 913 + }, + { + "epoch": 0.02, + "learning_rate": 1.5610589239965842e-06, + "loss": 0.8096, + "step": 914 + }, + { + "epoch": 0.02, + "learning_rate": 1.5627668659265584e-06, + "loss": 0.9619, + "step": 915 + }, + { + "epoch": 0.02, + "learning_rate": 1.5644748078565328e-06, + "loss": 0.9287, + "step": 916 + }, + { + "epoch": 0.02, + "learning_rate": 1.5661827497865073e-06, + "loss": 0.8394, + "step": 917 + }, + { + "epoch": 0.02, + "learning_rate": 1.5678906917164815e-06, + "loss": 1.0352, + "step": 918 + }, + { + "epoch": 0.02, + "learning_rate": 1.569598633646456e-06, + "loss": 0.7988, + "step": 919 + }, + { + "epoch": 0.02, + "learning_rate": 1.5713065755764304e-06, + "loss": 1.0566, + "step": 920 + }, + { + "epoch": 0.02, + "learning_rate": 1.5730145175064046e-06, + "loss": 0.9941, + "step": 921 + }, + { + "epoch": 0.02, + "learning_rate": 1.574722459436379e-06, + "loss": 0.9443, + "step": 922 + }, + { + "epoch": 0.02, + "learning_rate": 1.5764304013663535e-06, + "loss": 1.1211, + "step": 923 + }, + { + "epoch": 0.02, + "learning_rate": 1.5781383432963277e-06, + "loss": 0.8564, + "step": 924 + }, + { + "epoch": 0.02, + "learning_rate": 1.5798462852263022e-06, + "loss": 1.1045, + "step": 925 + }, + { + "epoch": 0.02, + "learning_rate": 1.5815542271562764e-06, + "loss": 0.8726, + "step": 926 + }, + { + "epoch": 0.02, + "learning_rate": 1.583262169086251e-06, + "loss": 1.0859, + "step": 927 + }, + { + "epoch": 0.02, + "learning_rate": 1.5849701110162255e-06, + "loss": 1.3301, + "step": 928 + }, + { + "epoch": 0.02, + "learning_rate": 1.5866780529461997e-06, + "loss": 1.2305, + "step": 929 + }, + { + "epoch": 0.02, + "learning_rate": 1.5883859948761742e-06, + "loss": 0.9453, + "step": 930 + }, + { + "epoch": 0.02, + "learning_rate": 1.5900939368061486e-06, + "loss": 1.1299, + "step": 931 + }, + { + "epoch": 0.02, + "learning_rate": 1.5918018787361229e-06, + "loss": 0.8857, + "step": 932 + }, + { + "epoch": 0.02, + "learning_rate": 1.5935098206660973e-06, + "loss": 0.9326, + "step": 933 + }, + { + "epoch": 0.02, + "learning_rate": 1.5952177625960717e-06, + "loss": 0.8394, + "step": 934 + }, + { + "epoch": 0.02, + "learning_rate": 1.596925704526046e-06, + "loss": 1.1836, + "step": 935 + }, + { + "epoch": 0.02, + "learning_rate": 1.5986336464560204e-06, + "loss": 1.0166, + "step": 936 + }, + { + "epoch": 0.02, + "learning_rate": 1.6003415883859949e-06, + "loss": 1.0518, + "step": 937 + }, + { + "epoch": 0.02, + "learning_rate": 1.602049530315969e-06, + "loss": 0.9209, + "step": 938 + }, + { + "epoch": 0.02, + "learning_rate": 1.6037574722459435e-06, + "loss": 0.8721, + "step": 939 + }, + { + "epoch": 0.02, + "learning_rate": 1.6054654141759178e-06, + "loss": 1.1602, + "step": 940 + }, + { + "epoch": 0.02, + "learning_rate": 1.6071733561058922e-06, + "loss": 1.0078, + "step": 941 + }, + { + "epoch": 0.02, + "learning_rate": 1.6088812980358669e-06, + "loss": 0.8848, + "step": 942 + }, + { + "epoch": 0.02, + "learning_rate": 1.610589239965841e-06, + "loss": 0.833, + "step": 943 + }, + { + "epoch": 0.02, + "learning_rate": 1.6122971818958155e-06, + "loss": 0.8809, + "step": 944 + }, + { + "epoch": 0.02, + "learning_rate": 1.61400512382579e-06, + "loss": 0.9521, + "step": 945 + }, + { + "epoch": 0.02, + "learning_rate": 1.6157130657557642e-06, + "loss": 0.8433, + "step": 946 + }, + { + "epoch": 0.02, + "learning_rate": 1.6174210076857386e-06, + "loss": 0.6768, + "step": 947 + }, + { + "epoch": 0.02, + "learning_rate": 1.619128949615713e-06, + "loss": 0.9404, + "step": 948 + }, + { + "epoch": 0.02, + "learning_rate": 1.6208368915456873e-06, + "loss": 0.8823, + "step": 949 + }, + { + "epoch": 0.02, + "learning_rate": 1.6225448334756618e-06, + "loss": 0.9521, + "step": 950 + }, + { + "epoch": 0.02, + "learning_rate": 1.6242527754056362e-06, + "loss": 1.1934, + "step": 951 + }, + { + "epoch": 0.02, + "learning_rate": 1.6259607173356104e-06, + "loss": 1.041, + "step": 952 + }, + { + "epoch": 0.02, + "learning_rate": 1.6276686592655849e-06, + "loss": 1.0215, + "step": 953 + }, + { + "epoch": 0.02, + "learning_rate": 1.629376601195559e-06, + "loss": 0.8281, + "step": 954 + }, + { + "epoch": 0.02, + "learning_rate": 1.6310845431255335e-06, + "loss": 1.0557, + "step": 955 + }, + { + "epoch": 0.02, + "learning_rate": 1.632792485055508e-06, + "loss": 1.2266, + "step": 956 + }, + { + "epoch": 0.02, + "learning_rate": 1.6345004269854824e-06, + "loss": 1.0703, + "step": 957 + }, + { + "epoch": 0.02, + "learning_rate": 1.6362083689154569e-06, + "loss": 0.8506, + "step": 958 + }, + { + "epoch": 0.02, + "learning_rate": 1.6379163108454313e-06, + "loss": 1.1279, + "step": 959 + }, + { + "epoch": 0.02, + "learning_rate": 1.6396242527754055e-06, + "loss": 0.9316, + "step": 960 + }, + { + "epoch": 0.02, + "learning_rate": 1.64133219470538e-06, + "loss": 1.0254, + "step": 961 + }, + { + "epoch": 0.02, + "learning_rate": 1.6430401366353544e-06, + "loss": 0.8682, + "step": 962 + }, + { + "epoch": 0.02, + "learning_rate": 1.6447480785653287e-06, + "loss": 1.1543, + "step": 963 + }, + { + "epoch": 0.02, + "learning_rate": 1.646456020495303e-06, + "loss": 0.8853, + "step": 964 + }, + { + "epoch": 0.02, + "learning_rate": 1.6481639624252775e-06, + "loss": 0.9795, + "step": 965 + }, + { + "epoch": 0.02, + "learning_rate": 1.6498719043552518e-06, + "loss": 1.0537, + "step": 966 + }, + { + "epoch": 0.02, + "learning_rate": 1.6515798462852262e-06, + "loss": 1.0938, + "step": 967 + }, + { + "epoch": 0.02, + "learning_rate": 1.6532877882152004e-06, + "loss": 1.0791, + "step": 968 + }, + { + "epoch": 0.02, + "learning_rate": 1.6549957301451749e-06, + "loss": 0.7156, + "step": 969 + }, + { + "epoch": 0.02, + "learning_rate": 1.6567036720751493e-06, + "loss": 1.0244, + "step": 970 + }, + { + "epoch": 0.02, + "learning_rate": 1.6584116140051238e-06, + "loss": 1.0127, + "step": 971 + }, + { + "epoch": 0.02, + "learning_rate": 1.6601195559350982e-06, + "loss": 0.958, + "step": 972 + }, + { + "epoch": 0.02, + "learning_rate": 1.6618274978650727e-06, + "loss": 1.126, + "step": 973 + }, + { + "epoch": 0.02, + "learning_rate": 1.6635354397950469e-06, + "loss": 1.1924, + "step": 974 + }, + { + "epoch": 0.02, + "learning_rate": 1.6652433817250213e-06, + "loss": 1.1172, + "step": 975 + }, + { + "epoch": 0.03, + "learning_rate": 1.6669513236549958e-06, + "loss": 0.9131, + "step": 976 + }, + { + "epoch": 0.03, + "learning_rate": 1.66865926558497e-06, + "loss": 0.9766, + "step": 977 + }, + { + "epoch": 0.03, + "learning_rate": 1.6703672075149444e-06, + "loss": 0.7871, + "step": 978 + }, + { + "epoch": 0.03, + "learning_rate": 1.6720751494449189e-06, + "loss": 1.085, + "step": 979 + }, + { + "epoch": 0.03, + "learning_rate": 1.6737830913748931e-06, + "loss": 0.9561, + "step": 980 + }, + { + "epoch": 0.03, + "learning_rate": 1.6754910333048676e-06, + "loss": 0.7715, + "step": 981 + }, + { + "epoch": 0.03, + "learning_rate": 1.6771989752348418e-06, + "loss": 0.8154, + "step": 982 + }, + { + "epoch": 0.03, + "learning_rate": 1.6789069171648162e-06, + "loss": 1.0205, + "step": 983 + }, + { + "epoch": 0.03, + "learning_rate": 1.6806148590947907e-06, + "loss": 1.1289, + "step": 984 + }, + { + "epoch": 0.03, + "learning_rate": 1.682322801024765e-06, + "loss": 1.0391, + "step": 985 + }, + { + "epoch": 0.03, + "learning_rate": 1.6840307429547396e-06, + "loss": 1.0186, + "step": 986 + }, + { + "epoch": 0.03, + "learning_rate": 1.685738684884714e-06, + "loss": 0.959, + "step": 987 + }, + { + "epoch": 0.03, + "learning_rate": 1.6874466268146882e-06, + "loss": 1.0381, + "step": 988 + }, + { + "epoch": 0.03, + "learning_rate": 1.6891545687446627e-06, + "loss": 0.9844, + "step": 989 + }, + { + "epoch": 0.03, + "learning_rate": 1.6908625106746371e-06, + "loss": 1.123, + "step": 990 + }, + { + "epoch": 0.03, + "learning_rate": 1.6925704526046113e-06, + "loss": 1.1426, + "step": 991 + }, + { + "epoch": 0.03, + "learning_rate": 1.6942783945345858e-06, + "loss": 0.9521, + "step": 992 + }, + { + "epoch": 0.03, + "learning_rate": 1.6959863364645602e-06, + "loss": 0.7764, + "step": 993 + }, + { + "epoch": 0.03, + "learning_rate": 1.6976942783945345e-06, + "loss": 1.0537, + "step": 994 + }, + { + "epoch": 0.03, + "learning_rate": 1.699402220324509e-06, + "loss": 1.1094, + "step": 995 + }, + { + "epoch": 0.03, + "learning_rate": 1.7011101622544831e-06, + "loss": 0.9736, + "step": 996 + }, + { + "epoch": 0.03, + "learning_rate": 1.7028181041844576e-06, + "loss": 0.9883, + "step": 997 + }, + { + "epoch": 0.03, + "learning_rate": 1.704526046114432e-06, + "loss": 0.999, + "step": 998 + }, + { + "epoch": 0.03, + "learning_rate": 1.7062339880444062e-06, + "loss": 0.9941, + "step": 999 + }, + { + "epoch": 0.03, + "learning_rate": 1.7079419299743807e-06, + "loss": 0.9629, + "step": 1000 + }, + { + "epoch": 0.03, + "learning_rate": 1.7096498719043553e-06, + "loss": 0.9141, + "step": 1001 + }, + { + "epoch": 0.03, + "learning_rate": 1.7113578138343296e-06, + "loss": 0.759, + "step": 1002 + }, + { + "epoch": 0.03, + "learning_rate": 1.713065755764304e-06, + "loss": 1.0723, + "step": 1003 + }, + { + "epoch": 0.03, + "learning_rate": 1.7147736976942785e-06, + "loss": 0.8672, + "step": 1004 + }, + { + "epoch": 0.03, + "learning_rate": 1.7164816396242527e-06, + "loss": 1.1592, + "step": 1005 + }, + { + "epoch": 0.03, + "learning_rate": 1.7181895815542271e-06, + "loss": 1.0557, + "step": 1006 + }, + { + "epoch": 0.03, + "learning_rate": 1.7198975234842016e-06, + "loss": 0.8232, + "step": 1007 + }, + { + "epoch": 0.03, + "learning_rate": 1.7216054654141758e-06, + "loss": 0.8516, + "step": 1008 + }, + { + "epoch": 0.03, + "learning_rate": 1.7233134073441502e-06, + "loss": 0.8926, + "step": 1009 + }, + { + "epoch": 0.03, + "learning_rate": 1.7250213492741245e-06, + "loss": 0.8789, + "step": 1010 + }, + { + "epoch": 0.03, + "learning_rate": 1.726729291204099e-06, + "loss": 1.1182, + "step": 1011 + }, + { + "epoch": 0.03, + "learning_rate": 1.7284372331340734e-06, + "loss": 0.8672, + "step": 1012 + }, + { + "epoch": 0.03, + "learning_rate": 1.7301451750640476e-06, + "loss": 1.0625, + "step": 1013 + }, + { + "epoch": 0.03, + "learning_rate": 1.731853116994022e-06, + "loss": 1.0449, + "step": 1014 + }, + { + "epoch": 0.03, + "learning_rate": 1.7335610589239965e-06, + "loss": 0.8184, + "step": 1015 + }, + { + "epoch": 0.03, + "learning_rate": 1.735269000853971e-06, + "loss": 1.082, + "step": 1016 + }, + { + "epoch": 0.03, + "learning_rate": 1.7369769427839454e-06, + "loss": 1.1465, + "step": 1017 + }, + { + "epoch": 0.03, + "learning_rate": 1.7386848847139198e-06, + "loss": 0.6377, + "step": 1018 + }, + { + "epoch": 0.03, + "learning_rate": 1.740392826643894e-06, + "loss": 0.915, + "step": 1019 + }, + { + "epoch": 0.03, + "learning_rate": 1.7421007685738685e-06, + "loss": 1.0547, + "step": 1020 + }, + { + "epoch": 0.03, + "learning_rate": 1.743808710503843e-06, + "loss": 1.2793, + "step": 1021 + }, + { + "epoch": 0.03, + "learning_rate": 1.7455166524338171e-06, + "loss": 0.8604, + "step": 1022 + }, + { + "epoch": 0.03, + "learning_rate": 1.7472245943637916e-06, + "loss": 0.9111, + "step": 1023 + }, + { + "epoch": 0.03, + "learning_rate": 1.7489325362937658e-06, + "loss": 0.9062, + "step": 1024 + }, + { + "epoch": 0.03, + "learning_rate": 1.7506404782237403e-06, + "loss": 1.0752, + "step": 1025 + }, + { + "epoch": 0.03, + "learning_rate": 1.7523484201537147e-06, + "loss": 1.123, + "step": 1026 + }, + { + "epoch": 0.03, + "learning_rate": 1.754056362083689e-06, + "loss": 1.0762, + "step": 1027 + }, + { + "epoch": 0.03, + "learning_rate": 1.7557643040136634e-06, + "loss": 0.8467, + "step": 1028 + }, + { + "epoch": 0.03, + "learning_rate": 1.7574722459436378e-06, + "loss": 1.0283, + "step": 1029 + }, + { + "epoch": 0.03, + "learning_rate": 1.759180187873612e-06, + "loss": 0.9092, + "step": 1030 + }, + { + "epoch": 0.03, + "learning_rate": 1.7608881298035867e-06, + "loss": 0.8926, + "step": 1031 + }, + { + "epoch": 0.03, + "learning_rate": 1.7625960717335611e-06, + "loss": 0.9033, + "step": 1032 + }, + { + "epoch": 0.03, + "learning_rate": 1.7643040136635354e-06, + "loss": 0.8647, + "step": 1033 + }, + { + "epoch": 0.03, + "learning_rate": 1.7660119555935098e-06, + "loss": 1.1143, + "step": 1034 + }, + { + "epoch": 0.03, + "learning_rate": 1.7677198975234843e-06, + "loss": 0.9775, + "step": 1035 + }, + { + "epoch": 0.03, + "learning_rate": 1.7694278394534585e-06, + "loss": 0.9717, + "step": 1036 + }, + { + "epoch": 0.03, + "learning_rate": 1.771135781383433e-06, + "loss": 0.9805, + "step": 1037 + }, + { + "epoch": 0.03, + "learning_rate": 1.7728437233134072e-06, + "loss": 0.8062, + "step": 1038 + }, + { + "epoch": 0.03, + "learning_rate": 1.7745516652433816e-06, + "loss": 0.7954, + "step": 1039 + }, + { + "epoch": 0.03, + "learning_rate": 1.776259607173356e-06, + "loss": 0.9238, + "step": 1040 + }, + { + "epoch": 0.03, + "learning_rate": 1.7779675491033303e-06, + "loss": 0.9883, + "step": 1041 + }, + { + "epoch": 0.03, + "learning_rate": 1.7796754910333047e-06, + "loss": 1.0879, + "step": 1042 + }, + { + "epoch": 0.03, + "learning_rate": 1.7813834329632792e-06, + "loss": 1.127, + "step": 1043 + }, + { + "epoch": 0.03, + "learning_rate": 1.7830913748932534e-06, + "loss": 0.8008, + "step": 1044 + }, + { + "epoch": 0.03, + "learning_rate": 1.7847993168232278e-06, + "loss": 0.9463, + "step": 1045 + }, + { + "epoch": 0.03, + "learning_rate": 1.7865072587532025e-06, + "loss": 0.96, + "step": 1046 + }, + { + "epoch": 0.03, + "learning_rate": 1.7882152006831767e-06, + "loss": 1.0117, + "step": 1047 + }, + { + "epoch": 0.03, + "learning_rate": 1.7899231426131512e-06, + "loss": 0.8945, + "step": 1048 + }, + { + "epoch": 0.03, + "learning_rate": 1.7916310845431256e-06, + "loss": 0.7495, + "step": 1049 + }, + { + "epoch": 0.03, + "learning_rate": 1.7933390264730998e-06, + "loss": 1.0996, + "step": 1050 + }, + { + "epoch": 0.03, + "learning_rate": 1.7950469684030743e-06, + "loss": 1.1709, + "step": 1051 + }, + { + "epoch": 0.03, + "learning_rate": 1.7967549103330485e-06, + "loss": 1.0645, + "step": 1052 + }, + { + "epoch": 0.03, + "learning_rate": 1.798462852263023e-06, + "loss": 0.9971, + "step": 1053 + }, + { + "epoch": 0.03, + "learning_rate": 1.8001707941929974e-06, + "loss": 1.0469, + "step": 1054 + }, + { + "epoch": 0.03, + "learning_rate": 1.8018787361229716e-06, + "loss": 0.937, + "step": 1055 + }, + { + "epoch": 0.03, + "learning_rate": 1.803586678052946e-06, + "loss": 0.8828, + "step": 1056 + }, + { + "epoch": 0.03, + "learning_rate": 1.8052946199829205e-06, + "loss": 0.9277, + "step": 1057 + }, + { + "epoch": 0.03, + "learning_rate": 1.8070025619128947e-06, + "loss": 0.9805, + "step": 1058 + }, + { + "epoch": 0.03, + "learning_rate": 1.8087105038428692e-06, + "loss": 0.9165, + "step": 1059 + }, + { + "epoch": 0.03, + "learning_rate": 1.8104184457728438e-06, + "loss": 0.9912, + "step": 1060 + }, + { + "epoch": 0.03, + "learning_rate": 1.812126387702818e-06, + "loss": 0.7705, + "step": 1061 + }, + { + "epoch": 0.03, + "learning_rate": 1.8138343296327925e-06, + "loss": 0.8242, + "step": 1062 + }, + { + "epoch": 0.03, + "learning_rate": 1.815542271562767e-06, + "loss": 0.8877, + "step": 1063 + }, + { + "epoch": 0.03, + "learning_rate": 1.8172502134927412e-06, + "loss": 0.7451, + "step": 1064 + }, + { + "epoch": 0.03, + "learning_rate": 1.8189581554227156e-06, + "loss": 0.8818, + "step": 1065 + }, + { + "epoch": 0.03, + "learning_rate": 1.8206660973526898e-06, + "loss": 0.8135, + "step": 1066 + }, + { + "epoch": 0.03, + "learning_rate": 1.8223740392826643e-06, + "loss": 1.0557, + "step": 1067 + }, + { + "epoch": 0.03, + "learning_rate": 1.8240819812126387e-06, + "loss": 0.9028, + "step": 1068 + }, + { + "epoch": 0.03, + "learning_rate": 1.825789923142613e-06, + "loss": 0.6206, + "step": 1069 + }, + { + "epoch": 0.03, + "learning_rate": 1.8274978650725874e-06, + "loss": 1.1514, + "step": 1070 + }, + { + "epoch": 0.03, + "learning_rate": 1.8292058070025618e-06, + "loss": 0.9014, + "step": 1071 + }, + { + "epoch": 0.03, + "learning_rate": 1.830913748932536e-06, + "loss": 1.042, + "step": 1072 + }, + { + "epoch": 0.03, + "learning_rate": 1.8326216908625105e-06, + "loss": 0.9893, + "step": 1073 + }, + { + "epoch": 0.03, + "learning_rate": 1.834329632792485e-06, + "loss": 0.8906, + "step": 1074 + }, + { + "epoch": 0.03, + "learning_rate": 1.8360375747224594e-06, + "loss": 0.9561, + "step": 1075 + }, + { + "epoch": 0.03, + "learning_rate": 1.8377455166524338e-06, + "loss": 0.9414, + "step": 1076 + }, + { + "epoch": 0.03, + "learning_rate": 1.8394534585824083e-06, + "loss": 1.0771, + "step": 1077 + }, + { + "epoch": 0.03, + "learning_rate": 1.8411614005123825e-06, + "loss": 1.0557, + "step": 1078 + }, + { + "epoch": 0.03, + "learning_rate": 1.842869342442357e-06, + "loss": 1.0293, + "step": 1079 + }, + { + "epoch": 0.03, + "learning_rate": 1.8445772843723312e-06, + "loss": 0.9072, + "step": 1080 + }, + { + "epoch": 0.03, + "learning_rate": 1.8462852263023056e-06, + "loss": 1.0332, + "step": 1081 + }, + { + "epoch": 0.03, + "learning_rate": 1.84799316823228e-06, + "loss": 0.9111, + "step": 1082 + }, + { + "epoch": 0.03, + "learning_rate": 1.8497011101622543e-06, + "loss": 0.9839, + "step": 1083 + }, + { + "epoch": 0.03, + "learning_rate": 1.8514090520922287e-06, + "loss": 1.0654, + "step": 1084 + }, + { + "epoch": 0.03, + "learning_rate": 1.8531169940222032e-06, + "loss": 0.8013, + "step": 1085 + }, + { + "epoch": 0.03, + "learning_rate": 1.8548249359521774e-06, + "loss": 1.0381, + "step": 1086 + }, + { + "epoch": 0.03, + "learning_rate": 1.8565328778821519e-06, + "loss": 1.082, + "step": 1087 + }, + { + "epoch": 0.03, + "learning_rate": 1.8582408198121263e-06, + "loss": 0.9414, + "step": 1088 + }, + { + "epoch": 0.03, + "learning_rate": 1.8599487617421005e-06, + "loss": 1.0918, + "step": 1089 + }, + { + "epoch": 0.03, + "learning_rate": 1.8616567036720752e-06, + "loss": 0.8799, + "step": 1090 + }, + { + "epoch": 0.03, + "learning_rate": 1.8633646456020496e-06, + "loss": 0.9521, + "step": 1091 + }, + { + "epoch": 0.03, + "learning_rate": 1.8650725875320239e-06, + "loss": 1.0879, + "step": 1092 + }, + { + "epoch": 0.03, + "learning_rate": 1.8667805294619983e-06, + "loss": 1.041, + "step": 1093 + }, + { + "epoch": 0.03, + "learning_rate": 1.8684884713919725e-06, + "loss": 0.7607, + "step": 1094 + }, + { + "epoch": 0.03, + "learning_rate": 1.870196413321947e-06, + "loss": 0.9458, + "step": 1095 + }, + { + "epoch": 0.03, + "learning_rate": 1.8719043552519214e-06, + "loss": 1.0664, + "step": 1096 + }, + { + "epoch": 0.03, + "learning_rate": 1.8736122971818956e-06, + "loss": 1.0898, + "step": 1097 + }, + { + "epoch": 0.03, + "learning_rate": 1.87532023911187e-06, + "loss": 0.8857, + "step": 1098 + }, + { + "epoch": 0.03, + "learning_rate": 1.8770281810418445e-06, + "loss": 1.0527, + "step": 1099 + }, + { + "epoch": 0.03, + "learning_rate": 1.8787361229718188e-06, + "loss": 0.876, + "step": 1100 + }, + { + "epoch": 0.03, + "learning_rate": 1.8804440649017932e-06, + "loss": 1.0801, + "step": 1101 + }, + { + "epoch": 0.03, + "learning_rate": 1.8821520068317676e-06, + "loss": 0.8174, + "step": 1102 + }, + { + "epoch": 0.03, + "learning_rate": 1.8838599487617419e-06, + "loss": 0.9844, + "step": 1103 + }, + { + "epoch": 0.03, + "learning_rate": 1.8855678906917163e-06, + "loss": 1.2305, + "step": 1104 + }, + { + "epoch": 0.03, + "learning_rate": 1.887275832621691e-06, + "loss": 1.0312, + "step": 1105 + }, + { + "epoch": 0.03, + "learning_rate": 1.8889837745516652e-06, + "loss": 0.8306, + "step": 1106 + }, + { + "epoch": 0.03, + "learning_rate": 1.8906917164816396e-06, + "loss": 0.7549, + "step": 1107 + }, + { + "epoch": 0.03, + "learning_rate": 1.892399658411614e-06, + "loss": 0.9272, + "step": 1108 + }, + { + "epoch": 0.03, + "learning_rate": 1.8941076003415883e-06, + "loss": 0.8765, + "step": 1109 + }, + { + "epoch": 0.03, + "learning_rate": 1.8958155422715628e-06, + "loss": 1.0986, + "step": 1110 + }, + { + "epoch": 0.03, + "learning_rate": 1.897523484201537e-06, + "loss": 1.1367, + "step": 1111 + }, + { + "epoch": 0.03, + "learning_rate": 1.8992314261315114e-06, + "loss": 0.9619, + "step": 1112 + }, + { + "epoch": 0.03, + "learning_rate": 1.9009393680614859e-06, + "loss": 1.0088, + "step": 1113 + }, + { + "epoch": 0.03, + "learning_rate": 1.90264730999146e-06, + "loss": 1.0298, + "step": 1114 + }, + { + "epoch": 0.03, + "learning_rate": 1.9043552519214345e-06, + "loss": 0.9512, + "step": 1115 + }, + { + "epoch": 0.03, + "learning_rate": 1.906063193851409e-06, + "loss": 1.0615, + "step": 1116 + }, + { + "epoch": 0.03, + "learning_rate": 1.9077711357813834e-06, + "loss": 0.9092, + "step": 1117 + }, + { + "epoch": 0.03, + "learning_rate": 1.9094790777113577e-06, + "loss": 1.209, + "step": 1118 + }, + { + "epoch": 0.03, + "learning_rate": 1.911187019641332e-06, + "loss": 1.1641, + "step": 1119 + }, + { + "epoch": 0.03, + "learning_rate": 1.9128949615713065e-06, + "loss": 1.0791, + "step": 1120 + }, + { + "epoch": 0.03, + "learning_rate": 1.9146029035012808e-06, + "loss": 0.7524, + "step": 1121 + }, + { + "epoch": 0.03, + "learning_rate": 1.9163108454312554e-06, + "loss": 0.8574, + "step": 1122 + }, + { + "epoch": 0.03, + "learning_rate": 1.9180187873612297e-06, + "loss": 0.9902, + "step": 1123 + }, + { + "epoch": 0.03, + "learning_rate": 1.919726729291204e-06, + "loss": 1.2393, + "step": 1124 + }, + { + "epoch": 0.03, + "learning_rate": 1.9214346712211785e-06, + "loss": 0.958, + "step": 1125 + }, + { + "epoch": 0.03, + "learning_rate": 1.9231426131511528e-06, + "loss": 1.1992, + "step": 1126 + }, + { + "epoch": 0.03, + "learning_rate": 1.924850555081127e-06, + "loss": 0.9814, + "step": 1127 + }, + { + "epoch": 0.03, + "learning_rate": 1.9265584970111017e-06, + "loss": 1.0049, + "step": 1128 + }, + { + "epoch": 0.03, + "learning_rate": 1.928266438941076e-06, + "loss": 1.1299, + "step": 1129 + }, + { + "epoch": 0.03, + "learning_rate": 1.92997438087105e-06, + "loss": 0.8892, + "step": 1130 + }, + { + "epoch": 0.03, + "learning_rate": 1.9316823228010248e-06, + "loss": 0.9189, + "step": 1131 + }, + { + "epoch": 0.03, + "learning_rate": 1.933390264730999e-06, + "loss": 0.7764, + "step": 1132 + }, + { + "epoch": 0.03, + "learning_rate": 1.9350982066609732e-06, + "loss": 0.9619, + "step": 1133 + }, + { + "epoch": 0.03, + "learning_rate": 1.936806148590948e-06, + "loss": 0.9346, + "step": 1134 + }, + { + "epoch": 0.03, + "learning_rate": 1.938514090520922e-06, + "loss": 1.084, + "step": 1135 + }, + { + "epoch": 0.03, + "learning_rate": 1.9402220324508968e-06, + "loss": 0.9355, + "step": 1136 + }, + { + "epoch": 0.03, + "learning_rate": 1.941929974380871e-06, + "loss": 1.1738, + "step": 1137 + }, + { + "epoch": 0.03, + "learning_rate": 1.9436379163108452e-06, + "loss": 1.1045, + "step": 1138 + }, + { + "epoch": 0.03, + "learning_rate": 1.94534585824082e-06, + "loss": 0.9688, + "step": 1139 + }, + { + "epoch": 0.03, + "learning_rate": 1.947053800170794e-06, + "loss": 0.9932, + "step": 1140 + }, + { + "epoch": 0.03, + "learning_rate": 1.9487617421007683e-06, + "loss": 0.9414, + "step": 1141 + }, + { + "epoch": 0.03, + "learning_rate": 1.950469684030743e-06, + "loss": 1.0459, + "step": 1142 + }, + { + "epoch": 0.03, + "learning_rate": 1.9521776259607172e-06, + "loss": 1.126, + "step": 1143 + }, + { + "epoch": 0.03, + "learning_rate": 1.9538855678906915e-06, + "loss": 0.7808, + "step": 1144 + }, + { + "epoch": 0.03, + "learning_rate": 1.955593509820666e-06, + "loss": 0.916, + "step": 1145 + }, + { + "epoch": 0.03, + "learning_rate": 1.9573014517506403e-06, + "loss": 1.1494, + "step": 1146 + }, + { + "epoch": 0.03, + "learning_rate": 1.9590093936806146e-06, + "loss": 0.9453, + "step": 1147 + }, + { + "epoch": 0.03, + "learning_rate": 1.9607173356105892e-06, + "loss": 1.0137, + "step": 1148 + }, + { + "epoch": 0.03, + "learning_rate": 1.9624252775405635e-06, + "loss": 0.9766, + "step": 1149 + }, + { + "epoch": 0.03, + "learning_rate": 1.964133219470538e-06, + "loss": 1.1035, + "step": 1150 + }, + { + "epoch": 0.03, + "learning_rate": 1.9658411614005123e-06, + "loss": 1.1084, + "step": 1151 + }, + { + "epoch": 0.03, + "learning_rate": 1.9675491033304866e-06, + "loss": 0.9346, + "step": 1152 + }, + { + "epoch": 0.03, + "learning_rate": 1.9692570452604612e-06, + "loss": 1.0039, + "step": 1153 + }, + { + "epoch": 0.03, + "learning_rate": 1.9709649871904355e-06, + "loss": 1.1416, + "step": 1154 + }, + { + "epoch": 0.03, + "learning_rate": 1.9726729291204097e-06, + "loss": 0.957, + "step": 1155 + }, + { + "epoch": 0.03, + "learning_rate": 1.9743808710503843e-06, + "loss": 0.9189, + "step": 1156 + }, + { + "epoch": 0.03, + "learning_rate": 1.9760888129803586e-06, + "loss": 0.7988, + "step": 1157 + }, + { + "epoch": 0.03, + "learning_rate": 1.977796754910333e-06, + "loss": 0.9365, + "step": 1158 + }, + { + "epoch": 0.03, + "learning_rate": 1.9795046968403075e-06, + "loss": 0.6909, + "step": 1159 + }, + { + "epoch": 0.03, + "learning_rate": 1.9812126387702817e-06, + "loss": 1.2227, + "step": 1160 + }, + { + "epoch": 0.03, + "learning_rate": 1.982920580700256e-06, + "loss": 1.0127, + "step": 1161 + }, + { + "epoch": 0.03, + "learning_rate": 1.9846285226302306e-06, + "loss": 1.0625, + "step": 1162 + }, + { + "epoch": 0.03, + "learning_rate": 1.986336464560205e-06, + "loss": 1.0898, + "step": 1163 + }, + { + "epoch": 0.03, + "learning_rate": 1.9880444064901795e-06, + "loss": 0.9346, + "step": 1164 + }, + { + "epoch": 0.03, + "learning_rate": 1.9897523484201537e-06, + "loss": 0.9248, + "step": 1165 + }, + { + "epoch": 0.03, + "learning_rate": 1.991460290350128e-06, + "loss": 0.9502, + "step": 1166 + }, + { + "epoch": 0.03, + "learning_rate": 1.9931682322801026e-06, + "loss": 0.7476, + "step": 1167 + }, + { + "epoch": 0.03, + "learning_rate": 1.994876174210077e-06, + "loss": 1.0654, + "step": 1168 + }, + { + "epoch": 0.03, + "learning_rate": 1.996584116140051e-06, + "loss": 0.998, + "step": 1169 + }, + { + "epoch": 0.03, + "learning_rate": 1.9982920580700257e-06, + "loss": 1.2603, + "step": 1170 + }, + { + "epoch": 0.03, + "learning_rate": 2e-06, + "loss": 0.9443, + "step": 1171 + }, + { + "epoch": 0.03, + "learning_rate": 1.999999996554496e-06, + "loss": 0.918, + "step": 1172 + }, + { + "epoch": 0.03, + "learning_rate": 1.999999986217985e-06, + "loss": 0.9023, + "step": 1173 + }, + { + "epoch": 0.03, + "learning_rate": 1.999999968990466e-06, + "loss": 1.0205, + "step": 1174 + }, + { + "epoch": 0.03, + "learning_rate": 1.99999994487194e-06, + "loss": 0.7886, + "step": 1175 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999999138624065e-06, + "loss": 1.0078, + "step": 1176 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999998759618665e-06, + "loss": 0.9609, + "step": 1177 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999998311703195e-06, + "loss": 0.959, + "step": 1178 + }, + { + "epoch": 0.03, + "learning_rate": 1.999999779487766e-06, + "loss": 0.8906, + "step": 1179 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999997209142066e-06, + "loss": 1.1406, + "step": 1180 + }, + { + "epoch": 0.03, + "learning_rate": 1.999999655449642e-06, + "loss": 1.041, + "step": 1181 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999995830940713e-06, + "loss": 0.9463, + "step": 1182 + }, + { + "epoch": 0.03, + "learning_rate": 1.999999503847497e-06, + "loss": 0.8613, + "step": 1183 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999994177099176e-06, + "loss": 1.0049, + "step": 1184 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999993246813355e-06, + "loss": 0.9443, + "step": 1185 + }, + { + "epoch": 0.03, + "learning_rate": 1.99999922476175e-06, + "loss": 1.1504, + "step": 1186 + }, + { + "epoch": 0.03, + "learning_rate": 1.999999117951162e-06, + "loss": 0.9932, + "step": 1187 + }, + { + "epoch": 0.03, + "learning_rate": 1.999999004249573e-06, + "loss": 1.0068, + "step": 1188 + }, + { + "epoch": 0.03, + "learning_rate": 1.999998883656983e-06, + "loss": 1.0723, + "step": 1189 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999987561733936e-06, + "loss": 0.9795, + "step": 1190 + }, + { + "epoch": 0.03, + "learning_rate": 1.999998621798805e-06, + "loss": 1.0098, + "step": 1191 + }, + { + "epoch": 0.03, + "learning_rate": 1.999998480533218e-06, + "loss": 1.0654, + "step": 1192 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999983323766343e-06, + "loss": 0.7603, + "step": 1193 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999981773290545e-06, + "loss": 1.1143, + "step": 1194 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999980153904797e-06, + "loss": 0.8125, + "step": 1195 + }, + { + "epoch": 0.03, + "learning_rate": 1.999997846560911e-06, + "loss": 0.999, + "step": 1196 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999976708403496e-06, + "loss": 0.9111, + "step": 1197 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999974882287964e-06, + "loss": 1.0264, + "step": 1198 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999972987262533e-06, + "loss": 1.1074, + "step": 1199 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999971023327215e-06, + "loss": 1.0342, + "step": 1200 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999968990482015e-06, + "loss": 0.7637, + "step": 1201 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999966888726957e-06, + "loss": 1.0762, + "step": 1202 + }, + { + "epoch": 0.03, + "learning_rate": 1.999996471806205e-06, + "loss": 1.0103, + "step": 1203 + }, + { + "epoch": 0.03, + "learning_rate": 1.999996247848731e-06, + "loss": 0.9541, + "step": 1204 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999960170002755e-06, + "loss": 1.1533, + "step": 1205 + }, + { + "epoch": 0.03, + "learning_rate": 1.99999577926084e-06, + "loss": 0.6733, + "step": 1206 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999955346304255e-06, + "loss": 0.9844, + "step": 1207 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999952831090346e-06, + "loss": 0.7695, + "step": 1208 + }, + { + "epoch": 0.03, + "learning_rate": 1.999995024696669e-06, + "loss": 0.916, + "step": 1209 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999947593933296e-06, + "loss": 0.9863, + "step": 1210 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999944871990188e-06, + "loss": 0.9697, + "step": 1211 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999942081137384e-06, + "loss": 0.7896, + "step": 1212 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999939221374905e-06, + "loss": 1.0518, + "step": 1213 + }, + { + "epoch": 0.03, + "learning_rate": 1.999993629270277e-06, + "loss": 0.8398, + "step": 1214 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999933295120998e-06, + "loss": 0.894, + "step": 1215 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999930228629608e-06, + "loss": 0.6821, + "step": 1216 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999927093228627e-06, + "loss": 1.0898, + "step": 1217 + }, + { + "epoch": 0.03, + "learning_rate": 1.999992388891807e-06, + "loss": 1.0723, + "step": 1218 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999920615697963e-06, + "loss": 0.8779, + "step": 1219 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999917273568326e-06, + "loss": 0.877, + "step": 1220 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999913862529183e-06, + "loss": 1.0771, + "step": 1221 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999910382580564e-06, + "loss": 0.8574, + "step": 1222 + }, + { + "epoch": 0.03, + "learning_rate": 1.999990683372248e-06, + "loss": 0.9736, + "step": 1223 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999903215954966e-06, + "loss": 0.9453, + "step": 1224 + }, + { + "epoch": 0.03, + "learning_rate": 1.999989952927804e-06, + "loss": 0.8955, + "step": 1225 + }, + { + "epoch": 0.03, + "learning_rate": 1.999989577369174e-06, + "loss": 1.0928, + "step": 1226 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999891949196075e-06, + "loss": 0.9648, + "step": 1227 + }, + { + "epoch": 0.03, + "learning_rate": 1.999988805579108e-06, + "loss": 0.833, + "step": 1228 + }, + { + "epoch": 0.03, + "learning_rate": 1.999988409347678e-06, + "loss": 1.0234, + "step": 1229 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999880062253203e-06, + "loss": 0.8438, + "step": 1230 + }, + { + "epoch": 0.03, + "learning_rate": 1.999987596212038e-06, + "loss": 1.0664, + "step": 1231 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999871793078335e-06, + "loss": 0.8477, + "step": 1232 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999867555127097e-06, + "loss": 0.8809, + "step": 1233 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999863248266697e-06, + "loss": 1.1553, + "step": 1234 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999858872497164e-06, + "loss": 1.0635, + "step": 1235 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999854427818527e-06, + "loss": 0.8882, + "step": 1236 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999849914230817e-06, + "loss": 0.9727, + "step": 1237 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999845331734067e-06, + "loss": 1.084, + "step": 1238 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999840680328307e-06, + "loss": 1.1387, + "step": 1239 + }, + { + "epoch": 0.03, + "learning_rate": 1.999983596001357e-06, + "loss": 1.0928, + "step": 1240 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999831170789888e-06, + "loss": 1.1201, + "step": 1241 + }, + { + "epoch": 0.03, + "learning_rate": 1.999982631265729e-06, + "loss": 1.0059, + "step": 1242 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999821385615817e-06, + "loss": 0.7881, + "step": 1243 + }, + { + "epoch": 0.03, + "learning_rate": 1.99998163896655e-06, + "loss": 1.0986, + "step": 1244 + }, + { + "epoch": 0.03, + "learning_rate": 1.999981132480637e-06, + "loss": 0.9883, + "step": 1245 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999806191038467e-06, + "loss": 0.8926, + "step": 1246 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999800988361824e-06, + "loss": 1.0127, + "step": 1247 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999795716776476e-06, + "loss": 1.0391, + "step": 1248 + }, + { + "epoch": 0.03, + "learning_rate": 1.999979037628246e-06, + "loss": 0.9375, + "step": 1249 + }, + { + "epoch": 0.03, + "learning_rate": 1.999978496687981e-06, + "loss": 0.8613, + "step": 1250 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999779488568572e-06, + "loss": 0.7905, + "step": 1251 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999773941348776e-06, + "loss": 1.0049, + "step": 1252 + }, + { + "epoch": 0.03, + "learning_rate": 1.999976832522046e-06, + "loss": 1.0547, + "step": 1253 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999762640183664e-06, + "loss": 0.9321, + "step": 1254 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999756886238434e-06, + "loss": 1.0684, + "step": 1255 + }, + { + "epoch": 0.03, + "learning_rate": 1.99997510633848e-06, + "loss": 1.0352, + "step": 1256 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999745171622806e-06, + "loss": 1.0361, + "step": 1257 + }, + { + "epoch": 0.03, + "learning_rate": 1.999973921095249e-06, + "loss": 0.9629, + "step": 1258 + }, + { + "epoch": 0.03, + "learning_rate": 1.99997331813739e-06, + "loss": 0.96, + "step": 1259 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999727082887074e-06, + "loss": 0.9287, + "step": 1260 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999720915492047e-06, + "loss": 0.9653, + "step": 1261 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999714679188874e-06, + "loss": 0.8271, + "step": 1262 + }, + { + "epoch": 0.03, + "learning_rate": 1.999970837397759e-06, + "loss": 0.8311, + "step": 1263 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999701999858234e-06, + "loss": 1.1191, + "step": 1264 + }, + { + "epoch": 0.03, + "learning_rate": 1.999969555683086e-06, + "loss": 1.1191, + "step": 1265 + }, + { + "epoch": 0.03, + "learning_rate": 1.999968904489551e-06, + "loss": 1.0583, + "step": 1266 + }, + { + "epoch": 0.03, + "learning_rate": 1.999968246405223e-06, + "loss": 1.0273, + "step": 1267 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999675814301055e-06, + "loss": 0.769, + "step": 1268 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999669095642045e-06, + "loss": 0.7451, + "step": 1269 + }, + { + "epoch": 0.03, + "learning_rate": 1.999966230807524e-06, + "loss": 0.9219, + "step": 1270 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999655451600682e-06, + "loss": 1.041, + "step": 1271 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999648526218424e-06, + "loss": 1.1357, + "step": 1272 + }, + { + "epoch": 0.03, + "learning_rate": 1.999964153192851e-06, + "loss": 1.0693, + "step": 1273 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999634468730996e-06, + "loss": 0.6895, + "step": 1274 + }, + { + "epoch": 0.03, + "learning_rate": 1.999962733662592e-06, + "loss": 1.1719, + "step": 1275 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999620135613343e-06, + "loss": 1.0264, + "step": 1276 + }, + { + "epoch": 0.03, + "learning_rate": 1.99996128656933e-06, + "loss": 0.9707, + "step": 1277 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999605526865854e-06, + "loss": 1.2891, + "step": 1278 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999598119131052e-06, + "loss": 0.9844, + "step": 1279 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999590642488943e-06, + "loss": 0.8994, + "step": 1280 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999583096939578e-06, + "loss": 1.1836, + "step": 1281 + }, + { + "epoch": 0.03, + "learning_rate": 1.999957548248301e-06, + "loss": 0.9238, + "step": 1282 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999567799119296e-06, + "loss": 1.0645, + "step": 1283 + }, + { + "epoch": 0.03, + "learning_rate": 1.999956004684848e-06, + "loss": 0.9746, + "step": 1284 + }, + { + "epoch": 0.03, + "learning_rate": 1.999955222567062e-06, + "loss": 0.9033, + "step": 1285 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999544335585773e-06, + "loss": 0.9121, + "step": 1286 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999536376593992e-06, + "loss": 1.125, + "step": 1287 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999528348695324e-06, + "loss": 0.793, + "step": 1288 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999520251889835e-06, + "loss": 0.9561, + "step": 1289 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999512086177576e-06, + "loss": 0.9316, + "step": 1290 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999503851558602e-06, + "loss": 0.9229, + "step": 1291 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999495548032973e-06, + "loss": 0.9355, + "step": 1292 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999487175600744e-06, + "loss": 1.207, + "step": 1293 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999478734261974e-06, + "loss": 0.9131, + "step": 1294 + }, + { + "epoch": 0.03, + "learning_rate": 1.999947022401672e-06, + "loss": 0.7646, + "step": 1295 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999461644865042e-06, + "loss": 0.7559, + "step": 1296 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999452996806996e-06, + "loss": 1.0391, + "step": 1297 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999444279842646e-06, + "loss": 0.8662, + "step": 1298 + }, + { + "epoch": 0.03, + "learning_rate": 1.999943549397205e-06, + "loss": 0.9121, + "step": 1299 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999426639195267e-06, + "loss": 1.0693, + "step": 1300 + }, + { + "epoch": 0.03, + "learning_rate": 1.999941771551236e-06, + "loss": 0.8398, + "step": 1301 + }, + { + "epoch": 0.03, + "learning_rate": 1.999940872292339e-06, + "loss": 0.9824, + "step": 1302 + }, + { + "epoch": 0.03, + "learning_rate": 1.999939966142842e-06, + "loss": 1.1318, + "step": 1303 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999390531027512e-06, + "loss": 0.8726, + "step": 1304 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999381331720725e-06, + "loss": 1.002, + "step": 1305 + }, + { + "epoch": 0.03, + "learning_rate": 1.999937206350813e-06, + "loss": 0.8428, + "step": 1306 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999362726389783e-06, + "loss": 1.001, + "step": 1307 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999353320365753e-06, + "loss": 0.7402, + "step": 1308 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999343845436104e-06, + "loss": 0.9736, + "step": 1309 + }, + { + "epoch": 0.03, + "learning_rate": 1.99993343016009e-06, + "loss": 0.8823, + "step": 1310 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999324688860208e-06, + "loss": 0.9863, + "step": 1311 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999315007214095e-06, + "loss": 0.9883, + "step": 1312 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999305256662628e-06, + "loss": 1.1133, + "step": 1313 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999295437205873e-06, + "loss": 0.916, + "step": 1314 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999285548843898e-06, + "loss": 0.998, + "step": 1315 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999275591576767e-06, + "loss": 0.7402, + "step": 1316 + }, + { + "epoch": 0.03, + "learning_rate": 1.999926556540455e-06, + "loss": 1.0215, + "step": 1317 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999255470327325e-06, + "loss": 1.0527, + "step": 1318 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999245306345153e-06, + "loss": 0.7427, + "step": 1319 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999235073458105e-06, + "loss": 1.0127, + "step": 1320 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999224771666256e-06, + "loss": 1.1123, + "step": 1321 + }, + { + "epoch": 0.03, + "learning_rate": 1.999921440096967e-06, + "loss": 0.728, + "step": 1322 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999203961368424e-06, + "loss": 0.9824, + "step": 1323 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999193452862585e-06, + "loss": 0.6914, + "step": 1324 + }, + { + "epoch": 0.03, + "learning_rate": 1.999918287545223e-06, + "loss": 0.8369, + "step": 1325 + }, + { + "epoch": 0.03, + "learning_rate": 1.999917222913743e-06, + "loss": 1.0996, + "step": 1326 + }, + { + "epoch": 0.03, + "learning_rate": 1.999916151391826e-06, + "loss": 0.8389, + "step": 1327 + }, + { + "epoch": 0.03, + "learning_rate": 1.999915072979479e-06, + "loss": 0.9609, + "step": 1328 + }, + { + "epoch": 0.03, + "learning_rate": 1.99991398767671e-06, + "loss": 0.7471, + "step": 1329 + }, + { + "epoch": 0.03, + "learning_rate": 1.999912895483526e-06, + "loss": 1.0107, + "step": 1330 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999117963999348e-06, + "loss": 0.9326, + "step": 1331 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999106904259434e-06, + "loss": 0.876, + "step": 1332 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999095775615604e-06, + "loss": 1.207, + "step": 1333 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999084578067927e-06, + "loss": 0.9746, + "step": 1334 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999073311616483e-06, + "loss": 1.1729, + "step": 1335 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999061976261353e-06, + "loss": 1.0996, + "step": 1336 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999050572002603e-06, + "loss": 0.9258, + "step": 1337 + }, + { + "epoch": 0.03, + "learning_rate": 1.999903909884033e-06, + "loss": 0.9727, + "step": 1338 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999027556774595e-06, + "loss": 1.0723, + "step": 1339 + }, + { + "epoch": 0.03, + "learning_rate": 1.999901594580549e-06, + "loss": 0.7607, + "step": 1340 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999004265933086e-06, + "loss": 0.9971, + "step": 1341 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998992517157475e-06, + "loss": 0.916, + "step": 1342 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998980699478724e-06, + "loss": 1.124, + "step": 1343 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998968812896926e-06, + "loss": 0.6675, + "step": 1344 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998956857412157e-06, + "loss": 0.9834, + "step": 1345 + }, + { + "epoch": 0.03, + "learning_rate": 1.99989448330245e-06, + "loss": 0.7178, + "step": 1346 + }, + { + "epoch": 0.03, + "learning_rate": 1.999893273973404e-06, + "loss": 0.8975, + "step": 1347 + }, + { + "epoch": 0.03, + "learning_rate": 1.999892057754086e-06, + "loss": 0.916, + "step": 1348 + }, + { + "epoch": 0.03, + "learning_rate": 1.999890834644504e-06, + "loss": 0.9346, + "step": 1349 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998896046446667e-06, + "loss": 1.1758, + "step": 1350 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998883677545826e-06, + "loss": 0.9658, + "step": 1351 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998871239742604e-06, + "loss": 0.8965, + "step": 1352 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998858733037083e-06, + "loss": 0.8799, + "step": 1353 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998846157429355e-06, + "loss": 1.085, + "step": 1354 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998833512919498e-06, + "loss": 0.9307, + "step": 1355 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998820799507606e-06, + "loss": 0.8916, + "step": 1356 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998808017193764e-06, + "loss": 1.0518, + "step": 1357 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998795165978057e-06, + "loss": 1.1328, + "step": 1358 + }, + { + "epoch": 0.03, + "learning_rate": 1.999878224586058e-06, + "loss": 0.9863, + "step": 1359 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998769256841423e-06, + "loss": 0.8193, + "step": 1360 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998756198920666e-06, + "loss": 0.7339, + "step": 1361 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998743072098403e-06, + "loss": 1.0117, + "step": 1362 + }, + { + "epoch": 0.03, + "learning_rate": 1.999872987637473e-06, + "loss": 0.7773, + "step": 1363 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998716611749734e-06, + "loss": 1.0908, + "step": 1364 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998703278223506e-06, + "loss": 1.0107, + "step": 1365 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998689875796136e-06, + "loss": 0.8828, + "step": 1366 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998676404467722e-06, + "loss": 0.8174, + "step": 1367 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998662864238345e-06, + "loss": 1.1143, + "step": 1368 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998649255108115e-06, + "loss": 0.9473, + "step": 1369 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998635577077116e-06, + "loss": 0.9541, + "step": 1370 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998621830145442e-06, + "loss": 1.043, + "step": 1371 + }, + { + "epoch": 0.04, + "learning_rate": 1.999860801431319e-06, + "loss": 1.0986, + "step": 1372 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998594129580458e-06, + "loss": 1.0469, + "step": 1373 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998580175947334e-06, + "loss": 1.0, + "step": 1374 + }, + { + "epoch": 0.04, + "learning_rate": 1.999856615341392e-06, + "loss": 1.0068, + "step": 1375 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998552061980313e-06, + "loss": 0.8867, + "step": 1376 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998537901646607e-06, + "loss": 0.9561, + "step": 1377 + }, + { + "epoch": 0.04, + "learning_rate": 1.99985236724129e-06, + "loss": 0.8076, + "step": 1378 + }, + { + "epoch": 0.04, + "learning_rate": 1.999850937427929e-06, + "loss": 0.8545, + "step": 1379 + }, + { + "epoch": 0.04, + "learning_rate": 1.999849500724588e-06, + "loss": 0.9077, + "step": 1380 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998480571312758e-06, + "loss": 0.8906, + "step": 1381 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998466066480037e-06, + "loss": 0.9248, + "step": 1382 + }, + { + "epoch": 0.04, + "learning_rate": 1.999845149274781e-06, + "loss": 0.9844, + "step": 1383 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998436850116173e-06, + "loss": 0.7305, + "step": 1384 + }, + { + "epoch": 0.04, + "learning_rate": 1.999842213858524e-06, + "loss": 1.2217, + "step": 1385 + }, + { + "epoch": 0.04, + "learning_rate": 1.99984073581551e-06, + "loss": 0.5537, + "step": 1386 + }, + { + "epoch": 0.04, + "learning_rate": 1.999839250882586e-06, + "loss": 0.9404, + "step": 1387 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998377590597626e-06, + "loss": 0.8486, + "step": 1388 + }, + { + "epoch": 0.04, + "learning_rate": 1.999836260347049e-06, + "loss": 0.833, + "step": 1389 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998347547444564e-06, + "loss": 1.1914, + "step": 1390 + }, + { + "epoch": 0.04, + "learning_rate": 1.999833242251995e-06, + "loss": 0.9512, + "step": 1391 + }, + { + "epoch": 0.04, + "learning_rate": 1.999831722869675e-06, + "loss": 1.084, + "step": 1392 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998301965975074e-06, + "loss": 0.9863, + "step": 1393 + }, + { + "epoch": 0.04, + "learning_rate": 1.999828663435502e-06, + "loss": 1.0908, + "step": 1394 + }, + { + "epoch": 0.04, + "learning_rate": 1.99982712338367e-06, + "loss": 1.0332, + "step": 1395 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998255764420215e-06, + "loss": 0.877, + "step": 1396 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998240226105676e-06, + "loss": 0.8955, + "step": 1397 + }, + { + "epoch": 0.04, + "learning_rate": 1.999822461889319e-06, + "loss": 1.0156, + "step": 1398 + }, + { + "epoch": 0.04, + "learning_rate": 1.999820894278286e-06, + "loss": 0.8506, + "step": 1399 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998193197774795e-06, + "loss": 0.873, + "step": 1400 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998177383869108e-06, + "loss": 0.9932, + "step": 1401 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998161501065904e-06, + "loss": 1.0742, + "step": 1402 + }, + { + "epoch": 0.04, + "learning_rate": 1.999814554936529e-06, + "loss": 0.9756, + "step": 1403 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998129528767387e-06, + "loss": 0.9453, + "step": 1404 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998113439272297e-06, + "loss": 0.9238, + "step": 1405 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998097280880123e-06, + "loss": 1.0498, + "step": 1406 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998081053590996e-06, + "loss": 1.04, + "step": 1407 + }, + { + "epoch": 0.04, + "learning_rate": 1.999806475740501e-06, + "loss": 1.165, + "step": 1408 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998048392322287e-06, + "loss": 0.9717, + "step": 1409 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998031958342937e-06, + "loss": 0.9297, + "step": 1410 + }, + { + "epoch": 0.04, + "learning_rate": 1.999801545546707e-06, + "loss": 0.9258, + "step": 1411 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997998883694803e-06, + "loss": 1.0537, + "step": 1412 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997982243026256e-06, + "loss": 1.0371, + "step": 1413 + }, + { + "epoch": 0.04, + "learning_rate": 1.999796553346153e-06, + "loss": 1.0371, + "step": 1414 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997948755000756e-06, + "loss": 1.0049, + "step": 1415 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997931907644036e-06, + "loss": 0.9893, + "step": 1416 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997914991391494e-06, + "loss": 0.9556, + "step": 1417 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997898006243244e-06, + "loss": 1.1875, + "step": 1418 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997880952199406e-06, + "loss": 0.6499, + "step": 1419 + }, + { + "epoch": 0.04, + "learning_rate": 1.999786382926009e-06, + "loss": 0.7822, + "step": 1420 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997846637425424e-06, + "loss": 1.0264, + "step": 1421 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997829376695513e-06, + "loss": 0.8823, + "step": 1422 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997812047070492e-06, + "loss": 1.0352, + "step": 1423 + }, + { + "epoch": 0.04, + "learning_rate": 1.999779464855047e-06, + "loss": 0.7891, + "step": 1424 + }, + { + "epoch": 0.04, + "learning_rate": 1.999777718113557e-06, + "loss": 1.0459, + "step": 1425 + }, + { + "epoch": 0.04, + "learning_rate": 1.999775964482591e-06, + "loss": 0.8213, + "step": 1426 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997742039621613e-06, + "loss": 1.0518, + "step": 1427 + }, + { + "epoch": 0.04, + "learning_rate": 1.99977243655228e-06, + "loss": 1.042, + "step": 1428 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997706622529596e-06, + "loss": 0.6528, + "step": 1429 + }, + { + "epoch": 0.04, + "learning_rate": 1.999768881064212e-06, + "loss": 1.2793, + "step": 1430 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997670929860492e-06, + "loss": 1.0957, + "step": 1431 + }, + { + "epoch": 0.04, + "learning_rate": 1.999765298018484e-06, + "loss": 0.8369, + "step": 1432 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997634961615284e-06, + "loss": 1.1738, + "step": 1433 + }, + { + "epoch": 0.04, + "learning_rate": 1.999761687415195e-06, + "loss": 1.0186, + "step": 1434 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997598717794966e-06, + "loss": 1.1865, + "step": 1435 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997580492544454e-06, + "loss": 0.9385, + "step": 1436 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997562198400534e-06, + "loss": 1.0156, + "step": 1437 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997543835363338e-06, + "loss": 1.127, + "step": 1438 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997525403432996e-06, + "loss": 0.9453, + "step": 1439 + }, + { + "epoch": 0.04, + "learning_rate": 1.999750690260963e-06, + "loss": 1.0527, + "step": 1440 + }, + { + "epoch": 0.04, + "learning_rate": 1.999748833289337e-06, + "loss": 1.0205, + "step": 1441 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997469694284336e-06, + "loss": 1.3848, + "step": 1442 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997450986782667e-06, + "loss": 0.9551, + "step": 1443 + }, + { + "epoch": 0.04, + "learning_rate": 1.999743221038849e-06, + "loss": 1.127, + "step": 1444 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997413365101926e-06, + "loss": 0.9561, + "step": 1445 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997394450923117e-06, + "loss": 1.1621, + "step": 1446 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997375467852183e-06, + "loss": 0.9551, + "step": 1447 + }, + { + "epoch": 0.04, + "learning_rate": 1.999735641588926e-06, + "loss": 1.041, + "step": 1448 + }, + { + "epoch": 0.04, + "learning_rate": 1.999733729503448e-06, + "loss": 1.04, + "step": 1449 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997318105287972e-06, + "loss": 0.9551, + "step": 1450 + }, + { + "epoch": 0.04, + "learning_rate": 1.999729884664987e-06, + "loss": 0.7969, + "step": 1451 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997279519120304e-06, + "loss": 0.7788, + "step": 1452 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997260122699414e-06, + "loss": 1.0234, + "step": 1453 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997240657387326e-06, + "loss": 1.0186, + "step": 1454 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997221123184177e-06, + "loss": 0.9375, + "step": 1455 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997201520090102e-06, + "loss": 1.1514, + "step": 1456 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997181848105237e-06, + "loss": 0.9395, + "step": 1457 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997162107229717e-06, + "loss": 0.8613, + "step": 1458 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997142297463673e-06, + "loss": 0.9316, + "step": 1459 + }, + { + "epoch": 0.04, + "learning_rate": 1.999712241880725e-06, + "loss": 0.8242, + "step": 1460 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997102471260577e-06, + "loss": 1.0547, + "step": 1461 + }, + { + "epoch": 0.04, + "learning_rate": 1.99970824548238e-06, + "loss": 0.8408, + "step": 1462 + }, + { + "epoch": 0.04, + "learning_rate": 1.999706236949705e-06, + "loss": 0.8994, + "step": 1463 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997042215280467e-06, + "loss": 0.7217, + "step": 1464 + }, + { + "epoch": 0.04, + "learning_rate": 1.999702199217419e-06, + "loss": 0.7227, + "step": 1465 + }, + { + "epoch": 0.04, + "learning_rate": 1.999700170017836e-06, + "loss": 0.7627, + "step": 1466 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996981339293116e-06, + "loss": 0.9014, + "step": 1467 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996960909518597e-06, + "loss": 1.0273, + "step": 1468 + }, + { + "epoch": 0.04, + "learning_rate": 1.999694041085495e-06, + "loss": 0.8245, + "step": 1469 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996919843302304e-06, + "loss": 0.9795, + "step": 1470 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996899206860814e-06, + "loss": 0.9043, + "step": 1471 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996878501530613e-06, + "loss": 0.8486, + "step": 1472 + }, + { + "epoch": 0.04, + "learning_rate": 1.999685772731185e-06, + "loss": 0.8555, + "step": 1473 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996836884204657e-06, + "loss": 0.8545, + "step": 1474 + }, + { + "epoch": 0.04, + "learning_rate": 1.999681597220919e-06, + "loss": 0.9551, + "step": 1475 + }, + { + "epoch": 0.04, + "learning_rate": 1.999679499132559e-06, + "loss": 0.8506, + "step": 1476 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996773941554e-06, + "loss": 0.8989, + "step": 1477 + }, + { + "epoch": 0.04, + "learning_rate": 1.999675282289456e-06, + "loss": 0.8877, + "step": 1478 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996731635347427e-06, + "loss": 0.6934, + "step": 1479 + }, + { + "epoch": 0.04, + "learning_rate": 1.999671037891274e-06, + "loss": 1.0088, + "step": 1480 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996689053590643e-06, + "loss": 0.8633, + "step": 1481 + }, + { + "epoch": 0.04, + "learning_rate": 1.999666765938129e-06, + "loss": 0.8779, + "step": 1482 + }, + { + "epoch": 0.04, + "learning_rate": 1.999664619628482e-06, + "loss": 1.0723, + "step": 1483 + }, + { + "epoch": 0.04, + "learning_rate": 1.999662466430139e-06, + "loss": 1.0791, + "step": 1484 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996603063431143e-06, + "loss": 1.0684, + "step": 1485 + }, + { + "epoch": 0.04, + "learning_rate": 1.999658139367423e-06, + "loss": 0.8223, + "step": 1486 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996559655030795e-06, + "loss": 1.0176, + "step": 1487 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996537847500995e-06, + "loss": 1.0225, + "step": 1488 + }, + { + "epoch": 0.04, + "learning_rate": 1.999651597108498e-06, + "loss": 0.9043, + "step": 1489 + }, + { + "epoch": 0.04, + "learning_rate": 1.999649402578289e-06, + "loss": 0.8159, + "step": 1490 + }, + { + "epoch": 0.04, + "learning_rate": 1.999647201159489e-06, + "loss": 1.0518, + "step": 1491 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996449928521122e-06, + "loss": 1.0391, + "step": 1492 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996427776561748e-06, + "loss": 1.0928, + "step": 1493 + }, + { + "epoch": 0.04, + "learning_rate": 1.999640555571691e-06, + "loss": 0.8594, + "step": 1494 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996383265986763e-06, + "loss": 1.124, + "step": 1495 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996360907371467e-06, + "loss": 1.0605, + "step": 1496 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996338479871177e-06, + "loss": 0.8867, + "step": 1497 + }, + { + "epoch": 0.04, + "learning_rate": 1.999631598348604e-06, + "loss": 1.0967, + "step": 1498 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996293418216206e-06, + "loss": 0.7886, + "step": 1499 + }, + { + "epoch": 0.04, + "learning_rate": 1.999627078406185e-06, + "loss": 1.166, + "step": 1500 + }, + { + "epoch": 0.04, + "learning_rate": 1.999624808102311e-06, + "loss": 1.1758, + "step": 1501 + }, + { + "epoch": 0.04, + "learning_rate": 1.999622530910015e-06, + "loss": 0.9106, + "step": 1502 + }, + { + "epoch": 0.04, + "learning_rate": 1.999620246829313e-06, + "loss": 0.8818, + "step": 1503 + }, + { + "epoch": 0.04, + "learning_rate": 1.99961795586022e-06, + "loss": 1.0947, + "step": 1504 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996156580027517e-06, + "loss": 0.8105, + "step": 1505 + }, + { + "epoch": 0.04, + "learning_rate": 1.999613353256925e-06, + "loss": 1.0605, + "step": 1506 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996110416227547e-06, + "loss": 0.8506, + "step": 1507 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996087231002576e-06, + "loss": 0.877, + "step": 1508 + }, + { + "epoch": 0.04, + "learning_rate": 1.999606397689449e-06, + "loss": 0.958, + "step": 1509 + }, + { + "epoch": 0.04, + "learning_rate": 1.999604065390345e-06, + "loss": 0.959, + "step": 1510 + }, + { + "epoch": 0.04, + "learning_rate": 1.999601726202962e-06, + "loss": 0.9902, + "step": 1511 + }, + { + "epoch": 0.04, + "learning_rate": 1.999599380127316e-06, + "loss": 1.1445, + "step": 1512 + }, + { + "epoch": 0.04, + "learning_rate": 1.999597027163423e-06, + "loss": 0.915, + "step": 1513 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995946673112996e-06, + "loss": 1.0547, + "step": 1514 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995923005709615e-06, + "loss": 0.8569, + "step": 1515 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995899269424253e-06, + "loss": 0.9375, + "step": 1516 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995875464257076e-06, + "loss": 1.0537, + "step": 1517 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995851590208242e-06, + "loss": 0.9463, + "step": 1518 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995827647277923e-06, + "loss": 1.0273, + "step": 1519 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995803635466275e-06, + "loss": 0.835, + "step": 1520 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995779554773476e-06, + "loss": 1.1064, + "step": 1521 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995755405199678e-06, + "loss": 0.9014, + "step": 1522 + }, + { + "epoch": 0.04, + "learning_rate": 1.999573118674506e-06, + "loss": 0.8662, + "step": 1523 + }, + { + "epoch": 0.04, + "learning_rate": 1.999570689940978e-06, + "loss": 1.1318, + "step": 1524 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995682543194006e-06, + "loss": 0.8418, + "step": 1525 + }, + { + "epoch": 0.04, + "learning_rate": 1.999565811809791e-06, + "loss": 1.0977, + "step": 1526 + }, + { + "epoch": 0.04, + "learning_rate": 1.999563362412166e-06, + "loss": 0.9766, + "step": 1527 + }, + { + "epoch": 0.04, + "learning_rate": 1.999560906126542e-06, + "loss": 1.0645, + "step": 1528 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995584429529363e-06, + "loss": 0.9307, + "step": 1529 + }, + { + "epoch": 0.04, + "learning_rate": 1.999555972891366e-06, + "loss": 0.9482, + "step": 1530 + }, + { + "epoch": 0.04, + "learning_rate": 1.999553495941848e-06, + "loss": 0.8428, + "step": 1531 + }, + { + "epoch": 0.04, + "learning_rate": 1.999551012104399e-06, + "loss": 1.1367, + "step": 1532 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995485213790365e-06, + "loss": 0.9805, + "step": 1533 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995460237657778e-06, + "loss": 0.9844, + "step": 1534 + }, + { + "epoch": 0.04, + "learning_rate": 1.99954351926464e-06, + "loss": 1.0449, + "step": 1535 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995410078756397e-06, + "loss": 0.7256, + "step": 1536 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995384895987954e-06, + "loss": 1.0244, + "step": 1537 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995359644341235e-06, + "loss": 1.1416, + "step": 1538 + }, + { + "epoch": 0.04, + "learning_rate": 1.999533432381642e-06, + "loss": 0.9023, + "step": 1539 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995308934413675e-06, + "loss": 0.9844, + "step": 1540 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995283476133184e-06, + "loss": 0.9971, + "step": 1541 + }, + { + "epoch": 0.04, + "learning_rate": 1.999525794897512e-06, + "loss": 0.9946, + "step": 1542 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995232352939655e-06, + "loss": 0.8398, + "step": 1543 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995206688026972e-06, + "loss": 0.7612, + "step": 1544 + }, + { + "epoch": 0.04, + "learning_rate": 1.999518095423724e-06, + "loss": 1.0303, + "step": 1545 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995155151570646e-06, + "loss": 1.043, + "step": 1546 + }, + { + "epoch": 0.04, + "learning_rate": 1.999512928002736e-06, + "loss": 0.7935, + "step": 1547 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995103339607558e-06, + "loss": 0.9727, + "step": 1548 + }, + { + "epoch": 0.04, + "learning_rate": 1.999507733031143e-06, + "loss": 1.0918, + "step": 1549 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995051252139147e-06, + "loss": 0.9775, + "step": 1550 + }, + { + "epoch": 0.04, + "learning_rate": 1.999502510509089e-06, + "loss": 1.0801, + "step": 1551 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994998889166837e-06, + "loss": 0.9668, + "step": 1552 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994972604367174e-06, + "loss": 0.8999, + "step": 1553 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994946250692076e-06, + "loss": 1.0742, + "step": 1554 + }, + { + "epoch": 0.04, + "learning_rate": 1.999491982814173e-06, + "loss": 1.0664, + "step": 1555 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994893336716317e-06, + "loss": 0.9912, + "step": 1556 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994866776416016e-06, + "loss": 1.0098, + "step": 1557 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994840147241013e-06, + "loss": 1.0605, + "step": 1558 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994813449191495e-06, + "loss": 0.9033, + "step": 1559 + }, + { + "epoch": 0.04, + "learning_rate": 1.999478668226764e-06, + "loss": 1.2324, + "step": 1560 + }, + { + "epoch": 0.04, + "learning_rate": 1.999475984646963e-06, + "loss": 1.1172, + "step": 1561 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994732941797658e-06, + "loss": 0.918, + "step": 1562 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994705968251907e-06, + "loss": 0.7783, + "step": 1563 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994678925832564e-06, + "loss": 1.1055, + "step": 1564 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994651814539803e-06, + "loss": 0.8374, + "step": 1565 + }, + { + "epoch": 0.04, + "learning_rate": 1.999462463437383e-06, + "loss": 1.0898, + "step": 1566 + }, + { + "epoch": 0.04, + "learning_rate": 1.999459738533482e-06, + "loss": 1.1279, + "step": 1567 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994570067422962e-06, + "loss": 1.1543, + "step": 1568 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994542680638453e-06, + "loss": 0.8213, + "step": 1569 + }, + { + "epoch": 0.04, + "learning_rate": 1.999451522498147e-06, + "loss": 1.0059, + "step": 1570 + }, + { + "epoch": 0.04, + "learning_rate": 1.999448770045221e-06, + "loss": 1.1279, + "step": 1571 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994460107050856e-06, + "loss": 0.8525, + "step": 1572 + }, + { + "epoch": 0.04, + "learning_rate": 1.99944324447776e-06, + "loss": 1.1152, + "step": 1573 + }, + { + "epoch": 0.04, + "learning_rate": 1.999440471363264e-06, + "loss": 0.8008, + "step": 1574 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994376913616156e-06, + "loss": 0.9697, + "step": 1575 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994349044728352e-06, + "loss": 0.7773, + "step": 1576 + }, + { + "epoch": 0.04, + "learning_rate": 1.999432110696941e-06, + "loss": 0.9307, + "step": 1577 + }, + { + "epoch": 0.04, + "learning_rate": 1.999429310033952e-06, + "loss": 1.0098, + "step": 1578 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994265024838892e-06, + "loss": 1.125, + "step": 1579 + }, + { + "epoch": 0.04, + "learning_rate": 1.99942368804677e-06, + "loss": 1.125, + "step": 1580 + }, + { + "epoch": 0.04, + "learning_rate": 1.999420866722615e-06, + "loss": 1.1309, + "step": 1581 + }, + { + "epoch": 0.04, + "learning_rate": 1.999418038511443e-06, + "loss": 0.8936, + "step": 1582 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994152034132742e-06, + "loss": 0.7495, + "step": 1583 + }, + { + "epoch": 0.04, + "learning_rate": 1.999412361428127e-06, + "loss": 0.6406, + "step": 1584 + }, + { + "epoch": 0.04, + "learning_rate": 1.999409512556022e-06, + "loss": 1.0166, + "step": 1585 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994066567969787e-06, + "loss": 0.8389, + "step": 1586 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994037941510165e-06, + "loss": 0.8076, + "step": 1587 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994009246181547e-06, + "loss": 0.7783, + "step": 1588 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993980481984145e-06, + "loss": 0.9165, + "step": 1589 + }, + { + "epoch": 0.04, + "learning_rate": 1.999395164891814e-06, + "loss": 1.1572, + "step": 1590 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993922746983744e-06, + "loss": 0.7473, + "step": 1591 + }, + { + "epoch": 0.04, + "learning_rate": 1.999389377618115e-06, + "loss": 0.7969, + "step": 1592 + }, + { + "epoch": 0.04, + "learning_rate": 1.999386473651055e-06, + "loss": 0.9785, + "step": 1593 + }, + { + "epoch": 0.04, + "learning_rate": 1.999383562797216e-06, + "loss": 1.0273, + "step": 1594 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993806450566177e-06, + "loss": 0.7676, + "step": 1595 + }, + { + "epoch": 0.04, + "learning_rate": 1.999377720429279e-06, + "loss": 0.8628, + "step": 1596 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993747889152215e-06, + "loss": 1.1709, + "step": 1597 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993718505144645e-06, + "loss": 0.9492, + "step": 1598 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993689052270286e-06, + "loss": 1.0029, + "step": 1599 + }, + { + "epoch": 0.04, + "learning_rate": 1.999365953052934e-06, + "loss": 0.8291, + "step": 1600 + }, + { + "epoch": 0.04, + "learning_rate": 1.999362993992201e-06, + "loss": 1.042, + "step": 1601 + }, + { + "epoch": 0.04, + "learning_rate": 1.99936002804485e-06, + "loss": 1.0566, + "step": 1602 + }, + { + "epoch": 0.04, + "learning_rate": 1.999357055210902e-06, + "loss": 0.8452, + "step": 1603 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993540754903764e-06, + "loss": 1.0996, + "step": 1604 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993510888832947e-06, + "loss": 1.166, + "step": 1605 + }, + { + "epoch": 0.04, + "learning_rate": 1.999348095389677e-06, + "loss": 0.9253, + "step": 1606 + }, + { + "epoch": 0.04, + "learning_rate": 1.999345095009544e-06, + "loss": 0.8589, + "step": 1607 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993420877429165e-06, + "loss": 1.2207, + "step": 1608 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993390735898147e-06, + "loss": 0.8809, + "step": 1609 + }, + { + "epoch": 0.04, + "learning_rate": 1.99933605255026e-06, + "loss": 1.0078, + "step": 1610 + }, + { + "epoch": 0.04, + "learning_rate": 1.999333024624273e-06, + "loss": 0.9238, + "step": 1611 + }, + { + "epoch": 0.04, + "learning_rate": 1.999329989811875e-06, + "loss": 0.8311, + "step": 1612 + }, + { + "epoch": 0.04, + "learning_rate": 1.999326948113086e-06, + "loss": 0.9629, + "step": 1613 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993238995279277e-06, + "loss": 1.1055, + "step": 1614 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993208440564207e-06, + "loss": 0.8184, + "step": 1615 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993177816985863e-06, + "loss": 1.0654, + "step": 1616 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993147124544455e-06, + "loss": 0.8213, + "step": 1617 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993116363240193e-06, + "loss": 0.9639, + "step": 1618 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993085533073295e-06, + "loss": 0.9814, + "step": 1619 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993054634043965e-06, + "loss": 1.0938, + "step": 1620 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993023666152424e-06, + "loss": 0.8604, + "step": 1621 + }, + { + "epoch": 0.04, + "learning_rate": 1.999299262939888e-06, + "loss": 0.8472, + "step": 1622 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992961523783545e-06, + "loss": 0.9385, + "step": 1623 + }, + { + "epoch": 0.04, + "learning_rate": 1.999293034930664e-06, + "loss": 0.9717, + "step": 1624 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992899105968373e-06, + "loss": 0.7954, + "step": 1625 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992867793768963e-06, + "loss": 0.9414, + "step": 1626 + }, + { + "epoch": 0.04, + "learning_rate": 1.999283641270863e-06, + "loss": 0.938, + "step": 1627 + }, + { + "epoch": 0.04, + "learning_rate": 1.999280496278758e-06, + "loss": 0.896, + "step": 1628 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992773444006043e-06, + "loss": 1.1504, + "step": 1629 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992741856364224e-06, + "loss": 1.0752, + "step": 1630 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992710199862344e-06, + "loss": 1.1104, + "step": 1631 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992678474500625e-06, + "loss": 1.1387, + "step": 1632 + }, + { + "epoch": 0.04, + "learning_rate": 1.999264668027928e-06, + "loss": 0.9512, + "step": 1633 + }, + { + "epoch": 0.04, + "learning_rate": 1.999261481719854e-06, + "loss": 0.9375, + "step": 1634 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992582885258605e-06, + "loss": 1.1729, + "step": 1635 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992550884459715e-06, + "loss": 0.9688, + "step": 1636 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992518814802074e-06, + "loss": 0.8936, + "step": 1637 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992486676285915e-06, + "loss": 1.1064, + "step": 1638 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992454468911453e-06, + "loss": 0.9648, + "step": 1639 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992422192678913e-06, + "loss": 1.1211, + "step": 1640 + }, + { + "epoch": 0.04, + "learning_rate": 1.999238984758851e-06, + "loss": 0.8062, + "step": 1641 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992357433640484e-06, + "loss": 0.9414, + "step": 1642 + }, + { + "epoch": 0.04, + "learning_rate": 1.999232495083504e-06, + "loss": 1.1533, + "step": 1643 + }, + { + "epoch": 0.04, + "learning_rate": 1.999229239917241e-06, + "loss": 0.9775, + "step": 1644 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992259778652822e-06, + "loss": 1.0303, + "step": 1645 + }, + { + "epoch": 0.04, + "learning_rate": 1.999222708927649e-06, + "loss": 1.043, + "step": 1646 + }, + { + "epoch": 0.04, + "learning_rate": 1.999219433104365e-06, + "loss": 1.0879, + "step": 1647 + }, + { + "epoch": 0.04, + "learning_rate": 1.999216150395452e-06, + "loss": 0.9023, + "step": 1648 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992128608009335e-06, + "loss": 1.0557, + "step": 1649 + }, + { + "epoch": 0.04, + "learning_rate": 1.999209564320831e-06, + "loss": 1.1309, + "step": 1650 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992062609551682e-06, + "loss": 0.8105, + "step": 1651 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992029507039676e-06, + "loss": 1.1309, + "step": 1652 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991996335672517e-06, + "loss": 0.8496, + "step": 1653 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991963095450436e-06, + "loss": 0.9219, + "step": 1654 + }, + { + "epoch": 0.04, + "learning_rate": 1.999192978637366e-06, + "loss": 0.9717, + "step": 1655 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991896408442424e-06, + "loss": 0.9385, + "step": 1656 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991862961656954e-06, + "loss": 0.7324, + "step": 1657 + }, + { + "epoch": 0.04, + "learning_rate": 1.999182944601748e-06, + "loss": 1.084, + "step": 1658 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991795861524233e-06, + "loss": 0.8599, + "step": 1659 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991762208177447e-06, + "loss": 0.8389, + "step": 1660 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991728485977347e-06, + "loss": 0.9453, + "step": 1661 + }, + { + "epoch": 0.04, + "learning_rate": 1.999169469492418e-06, + "loss": 0.9941, + "step": 1662 + }, + { + "epoch": 0.04, + "learning_rate": 1.999166083501816e-06, + "loss": 1.2207, + "step": 1663 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991626906259534e-06, + "loss": 1.0576, + "step": 1664 + }, + { + "epoch": 0.04, + "learning_rate": 1.999159290864853e-06, + "loss": 0.958, + "step": 1665 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991558842185386e-06, + "loss": 0.8574, + "step": 1666 + }, + { + "epoch": 0.04, + "learning_rate": 1.999152470687033e-06, + "loss": 1.2197, + "step": 1667 + }, + { + "epoch": 0.04, + "learning_rate": 1.999149050270361e-06, + "loss": 0.9854, + "step": 1668 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991456229685446e-06, + "loss": 1.0791, + "step": 1669 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991421887816083e-06, + "loss": 1.1025, + "step": 1670 + }, + { + "epoch": 0.04, + "learning_rate": 1.999138747709576e-06, + "loss": 1.0205, + "step": 1671 + }, + { + "epoch": 0.04, + "learning_rate": 1.999135299752471e-06, + "loss": 0.8145, + "step": 1672 + }, + { + "epoch": 0.04, + "learning_rate": 1.999131844910317e-06, + "loss": 1.0859, + "step": 1673 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991283831831376e-06, + "loss": 1.1084, + "step": 1674 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991249145709574e-06, + "loss": 0.9141, + "step": 1675 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991214390737994e-06, + "loss": 0.6851, + "step": 1676 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991179566916883e-06, + "loss": 1.0488, + "step": 1677 + }, + { + "epoch": 0.04, + "learning_rate": 1.999114467424648e-06, + "loss": 0.8306, + "step": 1678 + }, + { + "epoch": 0.04, + "learning_rate": 1.999110971272702e-06, + "loss": 1.0273, + "step": 1679 + }, + { + "epoch": 0.04, + "learning_rate": 1.999107468235875e-06, + "loss": 0.915, + "step": 1680 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991039583141906e-06, + "loss": 0.8135, + "step": 1681 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991004415076733e-06, + "loss": 0.8157, + "step": 1682 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990969178163477e-06, + "loss": 0.9941, + "step": 1683 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990933872402375e-06, + "loss": 0.8926, + "step": 1684 + }, + { + "epoch": 0.04, + "learning_rate": 1.999089849779367e-06, + "loss": 0.9482, + "step": 1685 + }, + { + "epoch": 0.04, + "learning_rate": 1.999086305433761e-06, + "loss": 0.8691, + "step": 1686 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990827542034437e-06, + "loss": 1.2578, + "step": 1687 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990791960884395e-06, + "loss": 0.9639, + "step": 1688 + }, + { + "epoch": 0.04, + "learning_rate": 1.999075631088773e-06, + "loss": 1.1738, + "step": 1689 + }, + { + "epoch": 0.04, + "learning_rate": 1.999072059204469e-06, + "loss": 0.8311, + "step": 1690 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990684804355516e-06, + "loss": 1.0938, + "step": 1691 + }, + { + "epoch": 0.04, + "learning_rate": 1.999064894782046e-06, + "loss": 1.1533, + "step": 1692 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990613022439765e-06, + "loss": 0.9297, + "step": 1693 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990577028213684e-06, + "loss": 0.8062, + "step": 1694 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990540965142455e-06, + "loss": 0.6846, + "step": 1695 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990504833226337e-06, + "loss": 0.9062, + "step": 1696 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990468632465574e-06, + "loss": 0.9473, + "step": 1697 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990432362860417e-06, + "loss": 0.9629, + "step": 1698 + }, + { + "epoch": 0.04, + "learning_rate": 1.999039602441111e-06, + "loss": 1.1035, + "step": 1699 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990359617117916e-06, + "loss": 1.0391, + "step": 1700 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990323140981075e-06, + "loss": 1.0166, + "step": 1701 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990286596000844e-06, + "loss": 1.0264, + "step": 1702 + }, + { + "epoch": 0.04, + "learning_rate": 1.999024998217747e-06, + "loss": 1.0117, + "step": 1703 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990213299511206e-06, + "loss": 0.9824, + "step": 1704 + }, + { + "epoch": 0.04, + "learning_rate": 1.999017654800231e-06, + "loss": 0.687, + "step": 1705 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990139727651034e-06, + "loss": 0.873, + "step": 1706 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990102838457624e-06, + "loss": 1.0879, + "step": 1707 + }, + { + "epoch": 0.04, + "learning_rate": 1.999006588042234e-06, + "loss": 0.8877, + "step": 1708 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990028853545443e-06, + "loss": 1.0547, + "step": 1709 + }, + { + "epoch": 0.04, + "learning_rate": 1.9989991757827176e-06, + "loss": 0.8799, + "step": 1710 + }, + { + "epoch": 0.04, + "learning_rate": 1.9989954593267802e-06, + "loss": 0.9863, + "step": 1711 + }, + { + "epoch": 0.04, + "learning_rate": 1.9989917359867574e-06, + "loss": 0.7686, + "step": 1712 + }, + { + "epoch": 0.04, + "learning_rate": 1.9989880057626755e-06, + "loss": 0.6729, + "step": 1713 + }, + { + "epoch": 0.04, + "learning_rate": 1.998984268654559e-06, + "loss": 0.8477, + "step": 1714 + }, + { + "epoch": 0.04, + "learning_rate": 1.9989805246624347e-06, + "loss": 0.8809, + "step": 1715 + }, + { + "epoch": 0.04, + "learning_rate": 1.998976773786328e-06, + "loss": 0.6428, + "step": 1716 + }, + { + "epoch": 0.04, + "learning_rate": 1.998973016026265e-06, + "loss": 0.9922, + "step": 1717 + }, + { + "epoch": 0.04, + "learning_rate": 1.9989692513822713e-06, + "loss": 1.0752, + "step": 1718 + }, + { + "epoch": 0.04, + "learning_rate": 1.998965479854373e-06, + "loss": 1.0547, + "step": 1719 + }, + { + "epoch": 0.04, + "learning_rate": 1.998961701442596e-06, + "loss": 0.8896, + "step": 1720 + }, + { + "epoch": 0.04, + "learning_rate": 1.998957916146966e-06, + "loss": 1.1797, + "step": 1721 + }, + { + "epoch": 0.04, + "learning_rate": 1.99895412396751e-06, + "loss": 0.9365, + "step": 1722 + }, + { + "epoch": 0.04, + "learning_rate": 1.9989503249042535e-06, + "loss": 1.0645, + "step": 1723 + }, + { + "epoch": 0.04, + "learning_rate": 1.9989465189572226e-06, + "loss": 1.0713, + "step": 1724 + }, + { + "epoch": 0.04, + "learning_rate": 1.9989427061264435e-06, + "loss": 1.0586, + "step": 1725 + }, + { + "epoch": 0.04, + "learning_rate": 1.998938886411943e-06, + "loss": 0.8027, + "step": 1726 + }, + { + "epoch": 0.04, + "learning_rate": 1.998935059813747e-06, + "loss": 1.1504, + "step": 1727 + }, + { + "epoch": 0.04, + "learning_rate": 1.998931226331882e-06, + "loss": 1.1152, + "step": 1728 + }, + { + "epoch": 0.04, + "learning_rate": 1.998927385966374e-06, + "loss": 1.1221, + "step": 1729 + }, + { + "epoch": 0.04, + "learning_rate": 1.9989235387172502e-06, + "loss": 0.9307, + "step": 1730 + }, + { + "epoch": 0.04, + "learning_rate": 1.998919684584537e-06, + "loss": 0.7588, + "step": 1731 + }, + { + "epoch": 0.04, + "learning_rate": 1.9989158235682604e-06, + "loss": 0.8721, + "step": 1732 + }, + { + "epoch": 0.04, + "learning_rate": 1.998911955668447e-06, + "loss": 0.79, + "step": 1733 + }, + { + "epoch": 0.04, + "learning_rate": 1.998908080885124e-06, + "loss": 0.8198, + "step": 1734 + }, + { + "epoch": 0.04, + "learning_rate": 1.9989041992183182e-06, + "loss": 1.0439, + "step": 1735 + }, + { + "epoch": 0.04, + "learning_rate": 1.9989003106680554e-06, + "loss": 1.0967, + "step": 1736 + }, + { + "epoch": 0.04, + "learning_rate": 1.9988964152343637e-06, + "loss": 0.9146, + "step": 1737 + }, + { + "epoch": 0.04, + "learning_rate": 1.998892512917269e-06, + "loss": 0.9922, + "step": 1738 + }, + { + "epoch": 0.04, + "learning_rate": 1.998888603716798e-06, + "loss": 0.9307, + "step": 1739 + }, + { + "epoch": 0.04, + "learning_rate": 1.998884687632979e-06, + "loss": 1.0156, + "step": 1740 + }, + { + "epoch": 0.04, + "learning_rate": 1.9988807646658375e-06, + "loss": 1.0254, + "step": 1741 + }, + { + "epoch": 0.04, + "learning_rate": 1.998876834815401e-06, + "loss": 0.9307, + "step": 1742 + }, + { + "epoch": 0.04, + "learning_rate": 1.998872898081697e-06, + "loss": 0.9395, + "step": 1743 + }, + { + "epoch": 0.04, + "learning_rate": 1.998868954464752e-06, + "loss": 0.9395, + "step": 1744 + }, + { + "epoch": 0.04, + "learning_rate": 1.9988650039645937e-06, + "loss": 1.0781, + "step": 1745 + }, + { + "epoch": 0.04, + "learning_rate": 1.998861046581249e-06, + "loss": 0.9092, + "step": 1746 + }, + { + "epoch": 0.04, + "learning_rate": 1.998857082314745e-06, + "loss": 0.9619, + "step": 1747 + }, + { + "epoch": 0.04, + "learning_rate": 1.99885311116511e-06, + "loss": 0.8418, + "step": 1748 + }, + { + "epoch": 0.04, + "learning_rate": 1.99884913313237e-06, + "loss": 1.0107, + "step": 1749 + }, + { + "epoch": 0.04, + "learning_rate": 1.9988451482165534e-06, + "loss": 1.0693, + "step": 1750 + }, + { + "epoch": 0.04, + "learning_rate": 1.9988411564176877e-06, + "loss": 0.585, + "step": 1751 + }, + { + "epoch": 0.04, + "learning_rate": 1.9988371577357996e-06, + "loss": 1.1025, + "step": 1752 + }, + { + "epoch": 0.04, + "learning_rate": 1.998833152170917e-06, + "loss": 1.0127, + "step": 1753 + }, + { + "epoch": 0.04, + "learning_rate": 1.9988291397230677e-06, + "loss": 1.0195, + "step": 1754 + }, + { + "epoch": 0.04, + "learning_rate": 1.998825120392279e-06, + "loss": 1.0059, + "step": 1755 + }, + { + "epoch": 0.05, + "learning_rate": 1.9988210941785794e-06, + "loss": 0.813, + "step": 1756 + }, + { + "epoch": 0.05, + "learning_rate": 1.998817061081996e-06, + "loss": 0.9575, + "step": 1757 + }, + { + "epoch": 0.05, + "learning_rate": 1.9988130211025566e-06, + "loss": 0.874, + "step": 1758 + }, + { + "epoch": 0.05, + "learning_rate": 1.998808974240289e-06, + "loss": 0.9082, + "step": 1759 + }, + { + "epoch": 0.05, + "learning_rate": 1.9988049204952215e-06, + "loss": 0.9834, + "step": 1760 + }, + { + "epoch": 0.05, + "learning_rate": 1.9988008598673813e-06, + "loss": 0.9121, + "step": 1761 + }, + { + "epoch": 0.05, + "learning_rate": 1.998796792356797e-06, + "loss": 0.9648, + "step": 1762 + }, + { + "epoch": 0.05, + "learning_rate": 1.9987927179634966e-06, + "loss": 0.916, + "step": 1763 + }, + { + "epoch": 0.05, + "learning_rate": 1.998788636687508e-06, + "loss": 1.0762, + "step": 1764 + }, + { + "epoch": 0.05, + "learning_rate": 1.998784548528859e-06, + "loss": 0.7773, + "step": 1765 + }, + { + "epoch": 0.05, + "learning_rate": 1.998780453487579e-06, + "loss": 0.8271, + "step": 1766 + }, + { + "epoch": 0.05, + "learning_rate": 1.998776351563694e-06, + "loss": 0.9336, + "step": 1767 + }, + { + "epoch": 0.05, + "learning_rate": 1.998772242757235e-06, + "loss": 1.0684, + "step": 1768 + }, + { + "epoch": 0.05, + "learning_rate": 1.9987681270682284e-06, + "loss": 0.8691, + "step": 1769 + }, + { + "epoch": 0.05, + "learning_rate": 1.9987640044967028e-06, + "loss": 1.0322, + "step": 1770 + }, + { + "epoch": 0.05, + "learning_rate": 1.998759875042687e-06, + "loss": 1.0107, + "step": 1771 + }, + { + "epoch": 0.05, + "learning_rate": 1.99875573870621e-06, + "loss": 0.9771, + "step": 1772 + }, + { + "epoch": 0.05, + "learning_rate": 1.998751595487299e-06, + "loss": 1.0117, + "step": 1773 + }, + { + "epoch": 0.05, + "learning_rate": 1.9987474453859832e-06, + "loss": 1.1914, + "step": 1774 + }, + { + "epoch": 0.05, + "learning_rate": 1.9987432884022914e-06, + "loss": 0.7246, + "step": 1775 + }, + { + "epoch": 0.05, + "learning_rate": 1.998739124536252e-06, + "loss": 0.8457, + "step": 1776 + }, + { + "epoch": 0.05, + "learning_rate": 1.998734953787894e-06, + "loss": 0.998, + "step": 1777 + }, + { + "epoch": 0.05, + "learning_rate": 1.9987307761572456e-06, + "loss": 0.9697, + "step": 1778 + }, + { + "epoch": 0.05, + "learning_rate": 1.998726591644336e-06, + "loss": 1.0547, + "step": 1779 + }, + { + "epoch": 0.05, + "learning_rate": 1.9987224002491937e-06, + "loss": 0.8652, + "step": 1780 + }, + { + "epoch": 0.05, + "learning_rate": 1.998718201971848e-06, + "loss": 0.9814, + "step": 1781 + }, + { + "epoch": 0.05, + "learning_rate": 1.998713996812328e-06, + "loss": 0.999, + "step": 1782 + }, + { + "epoch": 0.05, + "learning_rate": 1.9987097847706614e-06, + "loss": 0.9629, + "step": 1783 + }, + { + "epoch": 0.05, + "learning_rate": 1.9987055658468786e-06, + "loss": 1.1191, + "step": 1784 + }, + { + "epoch": 0.05, + "learning_rate": 1.998701340041008e-06, + "loss": 1.0957, + "step": 1785 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986971073530796e-06, + "loss": 1.041, + "step": 1786 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986928677831214e-06, + "loss": 0.9502, + "step": 1787 + }, + { + "epoch": 0.05, + "learning_rate": 1.998688621331163e-06, + "loss": 1.0273, + "step": 1788 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986843679972337e-06, + "loss": 0.9521, + "step": 1789 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986801077813633e-06, + "loss": 1.0566, + "step": 1790 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986758406835806e-06, + "loss": 0.7463, + "step": 1791 + }, + { + "epoch": 0.05, + "learning_rate": 1.998671566703915e-06, + "loss": 0.9502, + "step": 1792 + }, + { + "epoch": 0.05, + "learning_rate": 1.998667285842396e-06, + "loss": 0.915, + "step": 1793 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986629980990536e-06, + "loss": 1.0508, + "step": 1794 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986587034739165e-06, + "loss": 1.0264, + "step": 1795 + }, + { + "epoch": 0.05, + "learning_rate": 1.998654401967015e-06, + "loss": 0.8252, + "step": 1796 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986500935783784e-06, + "loss": 0.9834, + "step": 1797 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986457783080363e-06, + "loss": 0.8604, + "step": 1798 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986414561560186e-06, + "loss": 0.7881, + "step": 1799 + }, + { + "epoch": 0.05, + "learning_rate": 1.998637127122355e-06, + "loss": 1.0645, + "step": 1800 + }, + { + "epoch": 0.05, + "learning_rate": 1.998632791207076e-06, + "loss": 0.8447, + "step": 1801 + }, + { + "epoch": 0.05, + "learning_rate": 1.99862844841021e-06, + "loss": 1.1025, + "step": 1802 + }, + { + "epoch": 0.05, + "learning_rate": 1.998624098731789e-06, + "loss": 1.124, + "step": 1803 + }, + { + "epoch": 0.05, + "learning_rate": 1.998619742171841e-06, + "loss": 0.9131, + "step": 1804 + }, + { + "epoch": 0.05, + "learning_rate": 1.998615378730397e-06, + "loss": 1.0791, + "step": 1805 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986110084074867e-06, + "loss": 0.9512, + "step": 1806 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986066312031403e-06, + "loss": 0.9814, + "step": 1807 + }, + { + "epoch": 0.05, + "learning_rate": 1.998602247117388e-06, + "loss": 1.0273, + "step": 1808 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985978561502608e-06, + "loss": 0.9604, + "step": 1809 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985934583017877e-06, + "loss": 0.7681, + "step": 1810 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985890535719995e-06, + "loss": 0.8281, + "step": 1811 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985846419609266e-06, + "loss": 1.3066, + "step": 1812 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985802234685995e-06, + "loss": 1.0215, + "step": 1813 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985757980950484e-06, + "loss": 0.5566, + "step": 1814 + }, + { + "epoch": 0.05, + "learning_rate": 1.998571365840304e-06, + "loss": 1.0391, + "step": 1815 + }, + { + "epoch": 0.05, + "learning_rate": 1.998566926704397e-06, + "loss": 0.8662, + "step": 1816 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985624806873576e-06, + "loss": 0.8203, + "step": 1817 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985580277892167e-06, + "loss": 0.9795, + "step": 1818 + }, + { + "epoch": 0.05, + "learning_rate": 1.998553568010005e-06, + "loss": 1.1699, + "step": 1819 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985491013497527e-06, + "loss": 1.043, + "step": 1820 + }, + { + "epoch": 0.05, + "learning_rate": 1.998544627808491e-06, + "loss": 1.208, + "step": 1821 + }, + { + "epoch": 0.05, + "learning_rate": 1.998540147386251e-06, + "loss": 0.9775, + "step": 1822 + }, + { + "epoch": 0.05, + "learning_rate": 1.998535660083063e-06, + "loss": 1.1777, + "step": 1823 + }, + { + "epoch": 0.05, + "learning_rate": 1.998531165898959e-06, + "loss": 0.8574, + "step": 1824 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985266648339685e-06, + "loss": 0.8652, + "step": 1825 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985221568881233e-06, + "loss": 1.126, + "step": 1826 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985176420614546e-06, + "loss": 0.9805, + "step": 1827 + }, + { + "epoch": 0.05, + "learning_rate": 1.998513120353993e-06, + "loss": 0.7686, + "step": 1828 + }, + { + "epoch": 0.05, + "learning_rate": 1.99850859176577e-06, + "loss": 0.918, + "step": 1829 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985040562968168e-06, + "loss": 0.8945, + "step": 1830 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984995139471644e-06, + "loss": 1.0869, + "step": 1831 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984949647168448e-06, + "loss": 0.8994, + "step": 1832 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984904086058885e-06, + "loss": 1.0, + "step": 1833 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984858456143274e-06, + "loss": 1.1719, + "step": 1834 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984812757421927e-06, + "loss": 0.9268, + "step": 1835 + }, + { + "epoch": 0.05, + "learning_rate": 1.998476698989516e-06, + "loss": 0.8589, + "step": 1836 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984721153563287e-06, + "loss": 1.1191, + "step": 1837 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984675248426626e-06, + "loss": 0.9199, + "step": 1838 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984629274485496e-06, + "loss": 1.0771, + "step": 1839 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984583231740205e-06, + "loss": 0.8047, + "step": 1840 + }, + { + "epoch": 0.05, + "learning_rate": 1.998453712019108e-06, + "loss": 1.0674, + "step": 1841 + }, + { + "epoch": 0.05, + "learning_rate": 1.998449093983843e-06, + "loss": 0.9473, + "step": 1842 + }, + { + "epoch": 0.05, + "learning_rate": 1.998444469068258e-06, + "loss": 0.9941, + "step": 1843 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984398372723844e-06, + "loss": 0.835, + "step": 1844 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984351985962546e-06, + "loss": 1.0693, + "step": 1845 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984305530399003e-06, + "loss": 0.874, + "step": 1846 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984259006033536e-06, + "loss": 0.9849, + "step": 1847 + }, + { + "epoch": 0.05, + "learning_rate": 1.998421241286646e-06, + "loss": 1.0693, + "step": 1848 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984165750898104e-06, + "loss": 1.1006, + "step": 1849 + }, + { + "epoch": 0.05, + "learning_rate": 1.998411902012879e-06, + "loss": 1.0557, + "step": 1850 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984072220558834e-06, + "loss": 1.084, + "step": 1851 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984025352188557e-06, + "loss": 1.0947, + "step": 1852 + }, + { + "epoch": 0.05, + "learning_rate": 1.998397841501829e-06, + "loss": 1.3066, + "step": 1853 + }, + { + "epoch": 0.05, + "learning_rate": 1.998393140904835e-06, + "loss": 1.2227, + "step": 1854 + }, + { + "epoch": 0.05, + "learning_rate": 1.9983884334279063e-06, + "loss": 1.0918, + "step": 1855 + }, + { + "epoch": 0.05, + "learning_rate": 1.9983837190710755e-06, + "loss": 0.9248, + "step": 1856 + }, + { + "epoch": 0.05, + "learning_rate": 1.9983789978343746e-06, + "loss": 1.0264, + "step": 1857 + }, + { + "epoch": 0.05, + "learning_rate": 1.998374269717837e-06, + "loss": 1.168, + "step": 1858 + }, + { + "epoch": 0.05, + "learning_rate": 1.9983695347214946e-06, + "loss": 0.8779, + "step": 1859 + }, + { + "epoch": 0.05, + "learning_rate": 1.9983647928453804e-06, + "loss": 0.9697, + "step": 1860 + }, + { + "epoch": 0.05, + "learning_rate": 1.9983600440895264e-06, + "loss": 1.0752, + "step": 1861 + }, + { + "epoch": 0.05, + "learning_rate": 1.9983552884539663e-06, + "loss": 0.7705, + "step": 1862 + }, + { + "epoch": 0.05, + "learning_rate": 1.9983505259387317e-06, + "loss": 1.3057, + "step": 1863 + }, + { + "epoch": 0.05, + "learning_rate": 1.998345756543857e-06, + "loss": 1.0225, + "step": 1864 + }, + { + "epoch": 0.05, + "learning_rate": 1.9983409802693734e-06, + "loss": 1.0498, + "step": 1865 + }, + { + "epoch": 0.05, + "learning_rate": 1.998336197115315e-06, + "loss": 0.9961, + "step": 1866 + }, + { + "epoch": 0.05, + "learning_rate": 1.998331407081714e-06, + "loss": 0.8359, + "step": 1867 + }, + { + "epoch": 0.05, + "learning_rate": 1.9983266101686038e-06, + "loss": 0.9185, + "step": 1868 + }, + { + "epoch": 0.05, + "learning_rate": 1.9983218063760175e-06, + "loss": 0.9854, + "step": 1869 + }, + { + "epoch": 0.05, + "learning_rate": 1.998316995703988e-06, + "loss": 0.9443, + "step": 1870 + }, + { + "epoch": 0.05, + "learning_rate": 1.9983121781525484e-06, + "loss": 1.0449, + "step": 1871 + }, + { + "epoch": 0.05, + "learning_rate": 1.9983073537217325e-06, + "loss": 1.1328, + "step": 1872 + }, + { + "epoch": 0.05, + "learning_rate": 1.9983025224115725e-06, + "loss": 1.0195, + "step": 1873 + }, + { + "epoch": 0.05, + "learning_rate": 1.9982976842221027e-06, + "loss": 0.7285, + "step": 1874 + }, + { + "epoch": 0.05, + "learning_rate": 1.9982928391533557e-06, + "loss": 0.8398, + "step": 1875 + }, + { + "epoch": 0.05, + "learning_rate": 1.998287987205366e-06, + "loss": 1.1318, + "step": 1876 + }, + { + "epoch": 0.05, + "learning_rate": 1.9982831283781653e-06, + "loss": 1.1074, + "step": 1877 + }, + { + "epoch": 0.05, + "learning_rate": 1.9982782626717883e-06, + "loss": 1.0146, + "step": 1878 + }, + { + "epoch": 0.05, + "learning_rate": 1.9982733900862684e-06, + "loss": 1.0439, + "step": 1879 + }, + { + "epoch": 0.05, + "learning_rate": 1.9982685106216387e-06, + "loss": 0.9531, + "step": 1880 + }, + { + "epoch": 0.05, + "learning_rate": 1.9982636242779333e-06, + "loss": 0.876, + "step": 1881 + }, + { + "epoch": 0.05, + "learning_rate": 1.998258731055186e-06, + "loss": 0.959, + "step": 1882 + }, + { + "epoch": 0.05, + "learning_rate": 1.99825383095343e-06, + "loss": 0.9707, + "step": 1883 + }, + { + "epoch": 0.05, + "learning_rate": 1.9982489239726995e-06, + "loss": 0.6416, + "step": 1884 + }, + { + "epoch": 0.05, + "learning_rate": 1.9982440101130276e-06, + "loss": 0.9312, + "step": 1885 + }, + { + "epoch": 0.05, + "learning_rate": 1.9982390893744496e-06, + "loss": 1.0459, + "step": 1886 + }, + { + "epoch": 0.05, + "learning_rate": 1.998234161756998e-06, + "loss": 0.8423, + "step": 1887 + }, + { + "epoch": 0.05, + "learning_rate": 1.998229227260707e-06, + "loss": 0.9473, + "step": 1888 + }, + { + "epoch": 0.05, + "learning_rate": 1.998224285885611e-06, + "loss": 0.8452, + "step": 1889 + }, + { + "epoch": 0.05, + "learning_rate": 1.9982193376317438e-06, + "loss": 0.96, + "step": 1890 + }, + { + "epoch": 0.05, + "learning_rate": 1.99821438249914e-06, + "loss": 0.9814, + "step": 1891 + }, + { + "epoch": 0.05, + "learning_rate": 1.998209420487833e-06, + "loss": 0.9297, + "step": 1892 + }, + { + "epoch": 0.05, + "learning_rate": 1.9982044515978574e-06, + "loss": 1.084, + "step": 1893 + }, + { + "epoch": 0.05, + "learning_rate": 1.998199475829248e-06, + "loss": 0.9932, + "step": 1894 + }, + { + "epoch": 0.05, + "learning_rate": 1.9981944931820376e-06, + "loss": 0.8604, + "step": 1895 + }, + { + "epoch": 0.05, + "learning_rate": 1.998189503656262e-06, + "loss": 0.8037, + "step": 1896 + }, + { + "epoch": 0.05, + "learning_rate": 1.9981845072519546e-06, + "loss": 0.8389, + "step": 1897 + }, + { + "epoch": 0.05, + "learning_rate": 1.99817950396915e-06, + "loss": 0.9941, + "step": 1898 + }, + { + "epoch": 0.05, + "learning_rate": 1.9981744938078834e-06, + "loss": 0.916, + "step": 1899 + }, + { + "epoch": 0.05, + "learning_rate": 1.9981694767681886e-06, + "loss": 0.9014, + "step": 1900 + }, + { + "epoch": 0.05, + "learning_rate": 1.9981644528501005e-06, + "loss": 1.002, + "step": 1901 + }, + { + "epoch": 0.05, + "learning_rate": 1.9981594220536538e-06, + "loss": 0.9463, + "step": 1902 + }, + { + "epoch": 0.05, + "learning_rate": 1.998154384378883e-06, + "loss": 0.9277, + "step": 1903 + }, + { + "epoch": 0.05, + "learning_rate": 1.9981493398258223e-06, + "loss": 0.9814, + "step": 1904 + }, + { + "epoch": 0.05, + "learning_rate": 1.9981442883945074e-06, + "loss": 0.8418, + "step": 1905 + }, + { + "epoch": 0.05, + "learning_rate": 1.998139230084972e-06, + "loss": 1.0977, + "step": 1906 + }, + { + "epoch": 0.05, + "learning_rate": 1.9981341648972525e-06, + "loss": 1.1152, + "step": 1907 + }, + { + "epoch": 0.05, + "learning_rate": 1.9981290928313824e-06, + "loss": 0.7014, + "step": 1908 + }, + { + "epoch": 0.05, + "learning_rate": 1.998124013887397e-06, + "loss": 0.8828, + "step": 1909 + }, + { + "epoch": 0.05, + "learning_rate": 1.998118928065332e-06, + "loss": 1.0664, + "step": 1910 + }, + { + "epoch": 0.05, + "learning_rate": 1.998113835365222e-06, + "loss": 0.9639, + "step": 1911 + }, + { + "epoch": 0.05, + "learning_rate": 1.9981087357871016e-06, + "loss": 1.0498, + "step": 1912 + }, + { + "epoch": 0.05, + "learning_rate": 1.9981036293310064e-06, + "loss": 1.082, + "step": 1913 + }, + { + "epoch": 0.05, + "learning_rate": 1.998098515996972e-06, + "loss": 0.7969, + "step": 1914 + }, + { + "epoch": 0.05, + "learning_rate": 1.9980933957850325e-06, + "loss": 1.0264, + "step": 1915 + }, + { + "epoch": 0.05, + "learning_rate": 1.998088268695224e-06, + "loss": 1.0986, + "step": 1916 + }, + { + "epoch": 0.05, + "learning_rate": 1.9980831347275822e-06, + "loss": 0.8838, + "step": 1917 + }, + { + "epoch": 0.05, + "learning_rate": 1.9980779938821417e-06, + "loss": 0.9014, + "step": 1918 + }, + { + "epoch": 0.05, + "learning_rate": 1.9980728461589385e-06, + "loss": 0.8623, + "step": 1919 + }, + { + "epoch": 0.05, + "learning_rate": 1.9980676915580073e-06, + "loss": 1.084, + "step": 1920 + }, + { + "epoch": 0.05, + "learning_rate": 1.998062530079384e-06, + "loss": 1.1387, + "step": 1921 + }, + { + "epoch": 0.05, + "learning_rate": 1.998057361723105e-06, + "loss": 1.0322, + "step": 1922 + }, + { + "epoch": 0.05, + "learning_rate": 1.9980521864892047e-06, + "loss": 1.1797, + "step": 1923 + }, + { + "epoch": 0.05, + "learning_rate": 1.998047004377719e-06, + "loss": 0.9424, + "step": 1924 + }, + { + "epoch": 0.05, + "learning_rate": 1.9980418153886843e-06, + "loss": 0.8262, + "step": 1925 + }, + { + "epoch": 0.05, + "learning_rate": 1.998036619522136e-06, + "loss": 1.0312, + "step": 1926 + }, + { + "epoch": 0.05, + "learning_rate": 1.9980314167781092e-06, + "loss": 1.0205, + "step": 1927 + }, + { + "epoch": 0.05, + "learning_rate": 1.9980262071566406e-06, + "loss": 0.8232, + "step": 1928 + }, + { + "epoch": 0.05, + "learning_rate": 1.9980209906577663e-06, + "loss": 0.9893, + "step": 1929 + }, + { + "epoch": 0.05, + "learning_rate": 1.9980157672815214e-06, + "loss": 1.0996, + "step": 1930 + }, + { + "epoch": 0.05, + "learning_rate": 1.998010537027942e-06, + "loss": 1.0566, + "step": 1931 + }, + { + "epoch": 0.05, + "learning_rate": 1.9980052998970655e-06, + "loss": 1.0439, + "step": 1932 + }, + { + "epoch": 0.05, + "learning_rate": 1.998000055888926e-06, + "loss": 1.0957, + "step": 1933 + }, + { + "epoch": 0.05, + "learning_rate": 1.997994805003561e-06, + "loss": 0.9131, + "step": 1934 + }, + { + "epoch": 0.05, + "learning_rate": 1.997989547241006e-06, + "loss": 1.0869, + "step": 1935 + }, + { + "epoch": 0.05, + "learning_rate": 1.9979842826012974e-06, + "loss": 0.9053, + "step": 1936 + }, + { + "epoch": 0.05, + "learning_rate": 1.997979011084472e-06, + "loss": 1.0254, + "step": 1937 + }, + { + "epoch": 0.05, + "learning_rate": 1.9979737326905654e-06, + "loss": 1.207, + "step": 1938 + }, + { + "epoch": 0.05, + "learning_rate": 1.9979684474196144e-06, + "loss": 0.9668, + "step": 1939 + }, + { + "epoch": 0.05, + "learning_rate": 1.9979631552716554e-06, + "loss": 0.8672, + "step": 1940 + }, + { + "epoch": 0.05, + "learning_rate": 1.9979578562467244e-06, + "loss": 1.041, + "step": 1941 + }, + { + "epoch": 0.05, + "learning_rate": 1.9979525503448587e-06, + "loss": 0.7715, + "step": 1942 + }, + { + "epoch": 0.05, + "learning_rate": 1.9979472375660943e-06, + "loss": 0.7002, + "step": 1943 + }, + { + "epoch": 0.05, + "learning_rate": 1.9979419179104675e-06, + "loss": 1.0566, + "step": 1944 + }, + { + "epoch": 0.05, + "learning_rate": 1.997936591378016e-06, + "loss": 1.0781, + "step": 1945 + }, + { + "epoch": 0.05, + "learning_rate": 1.997931257968776e-06, + "loss": 1.0645, + "step": 1946 + }, + { + "epoch": 0.05, + "learning_rate": 1.997925917682784e-06, + "loss": 1.0869, + "step": 1947 + }, + { + "epoch": 0.05, + "learning_rate": 1.9979205705200764e-06, + "loss": 0.9365, + "step": 1948 + }, + { + "epoch": 0.05, + "learning_rate": 1.997915216480691e-06, + "loss": 0.9248, + "step": 1949 + }, + { + "epoch": 0.05, + "learning_rate": 1.997909855564664e-06, + "loss": 0.7549, + "step": 1950 + }, + { + "epoch": 0.05, + "learning_rate": 1.9979044877720335e-06, + "loss": 1.0068, + "step": 1951 + }, + { + "epoch": 0.05, + "learning_rate": 1.997899113102835e-06, + "loss": 1.0469, + "step": 1952 + }, + { + "epoch": 0.05, + "learning_rate": 1.9978937315571065e-06, + "loss": 1.0752, + "step": 1953 + }, + { + "epoch": 0.05, + "learning_rate": 1.997888343134884e-06, + "loss": 0.9922, + "step": 1954 + }, + { + "epoch": 0.05, + "learning_rate": 1.9978829478362062e-06, + "loss": 1.0, + "step": 1955 + }, + { + "epoch": 0.05, + "learning_rate": 1.9978775456611094e-06, + "loss": 0.8057, + "step": 1956 + }, + { + "epoch": 0.05, + "learning_rate": 1.9978721366096305e-06, + "loss": 0.5181, + "step": 1957 + }, + { + "epoch": 0.05, + "learning_rate": 1.9978667206818073e-06, + "loss": 0.8486, + "step": 1958 + }, + { + "epoch": 0.05, + "learning_rate": 1.997861297877677e-06, + "loss": 0.9355, + "step": 1959 + }, + { + "epoch": 0.05, + "learning_rate": 1.997855868197277e-06, + "loss": 0.9873, + "step": 1960 + }, + { + "epoch": 0.05, + "learning_rate": 1.9978504316406447e-06, + "loss": 0.9863, + "step": 1961 + }, + { + "epoch": 0.05, + "learning_rate": 1.9978449882078177e-06, + "loss": 0.9854, + "step": 1962 + }, + { + "epoch": 0.05, + "learning_rate": 1.997839537898833e-06, + "loss": 0.957, + "step": 1963 + }, + { + "epoch": 0.05, + "learning_rate": 1.9978340807137287e-06, + "loss": 0.6782, + "step": 1964 + }, + { + "epoch": 0.05, + "learning_rate": 1.9978286166525425e-06, + "loss": 0.915, + "step": 1965 + }, + { + "epoch": 0.05, + "learning_rate": 1.997823145715311e-06, + "loss": 0.9185, + "step": 1966 + }, + { + "epoch": 0.05, + "learning_rate": 1.9978176679020736e-06, + "loss": 1.3047, + "step": 1967 + }, + { + "epoch": 0.05, + "learning_rate": 1.997812183212866e-06, + "loss": 1.0977, + "step": 1968 + }, + { + "epoch": 0.05, + "learning_rate": 1.997806691647728e-06, + "loss": 1.0107, + "step": 1969 + }, + { + "epoch": 0.05, + "learning_rate": 1.9978011932066965e-06, + "loss": 0.8652, + "step": 1970 + }, + { + "epoch": 0.05, + "learning_rate": 1.997795687889809e-06, + "loss": 0.9199, + "step": 1971 + }, + { + "epoch": 0.05, + "learning_rate": 1.997790175697104e-06, + "loss": 0.998, + "step": 1972 + }, + { + "epoch": 0.05, + "learning_rate": 1.9977846566286196e-06, + "loss": 0.8711, + "step": 1973 + }, + { + "epoch": 0.05, + "learning_rate": 1.9977791306843938e-06, + "loss": 1.1494, + "step": 1974 + }, + { + "epoch": 0.05, + "learning_rate": 1.997773597864464e-06, + "loss": 0.9609, + "step": 1975 + }, + { + "epoch": 0.05, + "learning_rate": 1.997768058168869e-06, + "loss": 1.125, + "step": 1976 + }, + { + "epoch": 0.05, + "learning_rate": 1.9977625115976468e-06, + "loss": 1.1738, + "step": 1977 + }, + { + "epoch": 0.05, + "learning_rate": 1.9977569581508355e-06, + "loss": 0.9297, + "step": 1978 + }, + { + "epoch": 0.05, + "learning_rate": 1.997751397828473e-06, + "loss": 1.1328, + "step": 1979 + }, + { + "epoch": 0.05, + "learning_rate": 1.997745830630599e-06, + "loss": 1.0459, + "step": 1980 + }, + { + "epoch": 0.05, + "learning_rate": 1.99774025655725e-06, + "loss": 1.0352, + "step": 1981 + }, + { + "epoch": 0.05, + "learning_rate": 1.997734675608466e-06, + "loss": 0.9395, + "step": 1982 + }, + { + "epoch": 0.05, + "learning_rate": 1.997729087784285e-06, + "loss": 0.834, + "step": 1983 + }, + { + "epoch": 0.05, + "learning_rate": 1.9977234930847447e-06, + "loss": 1.0449, + "step": 1984 + }, + { + "epoch": 0.05, + "learning_rate": 1.9977178915098848e-06, + "loss": 0.9941, + "step": 1985 + }, + { + "epoch": 0.05, + "learning_rate": 1.997712283059743e-06, + "loss": 0.6355, + "step": 1986 + }, + { + "epoch": 0.05, + "learning_rate": 1.997706667734358e-06, + "loss": 0.7588, + "step": 1987 + }, + { + "epoch": 0.05, + "learning_rate": 1.99770104553377e-06, + "loss": 1.0859, + "step": 1988 + }, + { + "epoch": 0.05, + "learning_rate": 1.997695416458016e-06, + "loss": 1.1895, + "step": 1989 + }, + { + "epoch": 0.05, + "learning_rate": 1.997689780507135e-06, + "loss": 0.9248, + "step": 1990 + }, + { + "epoch": 0.05, + "learning_rate": 1.997684137681166e-06, + "loss": 0.7959, + "step": 1991 + }, + { + "epoch": 0.05, + "learning_rate": 1.9976784879801488e-06, + "loss": 0.7959, + "step": 1992 + }, + { + "epoch": 0.05, + "learning_rate": 1.9976728314041213e-06, + "loss": 1.1064, + "step": 1993 + }, + { + "epoch": 0.05, + "learning_rate": 1.997667167953122e-06, + "loss": 0.8691, + "step": 1994 + }, + { + "epoch": 0.05, + "learning_rate": 1.997661497627192e-06, + "loss": 0.7659, + "step": 1995 + }, + { + "epoch": 0.05, + "learning_rate": 1.9976558204263686e-06, + "loss": 1.1172, + "step": 1996 + }, + { + "epoch": 0.05, + "learning_rate": 1.997650136350691e-06, + "loss": 0.8516, + "step": 1997 + }, + { + "epoch": 0.05, + "learning_rate": 1.9976444454001993e-06, + "loss": 0.9766, + "step": 1998 + }, + { + "epoch": 0.05, + "learning_rate": 1.997638747574932e-06, + "loss": 1.0088, + "step": 1999 + }, + { + "epoch": 0.05, + "learning_rate": 1.9976330428749282e-06, + "loss": 1.0693, + "step": 2000 + }, + { + "epoch": 0.05, + "learning_rate": 1.997627331300228e-06, + "loss": 1.0771, + "step": 2001 + }, + { + "epoch": 0.05, + "learning_rate": 1.9976216128508706e-06, + "loss": 0.9688, + "step": 2002 + }, + { + "epoch": 0.05, + "learning_rate": 1.9976158875268946e-06, + "loss": 0.9004, + "step": 2003 + }, + { + "epoch": 0.05, + "learning_rate": 1.99761015532834e-06, + "loss": 0.9932, + "step": 2004 + }, + { + "epoch": 0.05, + "learning_rate": 1.9976044162552467e-06, + "loss": 0.7998, + "step": 2005 + }, + { + "epoch": 0.05, + "learning_rate": 1.997598670307653e-06, + "loss": 0.9551, + "step": 2006 + }, + { + "epoch": 0.05, + "learning_rate": 1.9975929174856004e-06, + "loss": 0.9941, + "step": 2007 + }, + { + "epoch": 0.05, + "learning_rate": 1.997587157789127e-06, + "loss": 0.8818, + "step": 2008 + }, + { + "epoch": 0.05, + "learning_rate": 1.9975813912182724e-06, + "loss": 0.9062, + "step": 2009 + }, + { + "epoch": 0.05, + "learning_rate": 1.9975756177730778e-06, + "loss": 0.9902, + "step": 2010 + }, + { + "epoch": 0.05, + "learning_rate": 1.9975698374535814e-06, + "loss": 0.8374, + "step": 2011 + }, + { + "epoch": 0.05, + "learning_rate": 1.997564050259824e-06, + "loss": 0.96, + "step": 2012 + }, + { + "epoch": 0.05, + "learning_rate": 1.9975582561918453e-06, + "loss": 1.0664, + "step": 2013 + }, + { + "epoch": 0.05, + "learning_rate": 1.997552455249685e-06, + "loss": 0.7451, + "step": 2014 + }, + { + "epoch": 0.05, + "learning_rate": 1.9975466474333834e-06, + "loss": 0.8682, + "step": 2015 + }, + { + "epoch": 0.05, + "learning_rate": 1.9975408327429803e-06, + "loss": 0.9102, + "step": 2016 + }, + { + "epoch": 0.05, + "learning_rate": 1.9975350111785156e-06, + "loss": 0.8188, + "step": 2017 + }, + { + "epoch": 0.05, + "learning_rate": 1.9975291827400295e-06, + "loss": 0.9688, + "step": 2018 + }, + { + "epoch": 0.05, + "learning_rate": 1.9975233474275624e-06, + "loss": 0.9639, + "step": 2019 + }, + { + "epoch": 0.05, + "learning_rate": 1.9975175052411543e-06, + "loss": 0.9707, + "step": 2020 + }, + { + "epoch": 0.05, + "learning_rate": 1.997511656180845e-06, + "loss": 0.9756, + "step": 2021 + }, + { + "epoch": 0.05, + "learning_rate": 1.9975058002466765e-06, + "loss": 1.0352, + "step": 2022 + }, + { + "epoch": 0.05, + "learning_rate": 1.9974999374386873e-06, + "loss": 0.7651, + "step": 2023 + }, + { + "epoch": 0.05, + "learning_rate": 1.997494067756919e-06, + "loss": 0.9248, + "step": 2024 + }, + { + "epoch": 0.05, + "learning_rate": 1.997488191201411e-06, + "loss": 1.1104, + "step": 2025 + }, + { + "epoch": 0.05, + "learning_rate": 1.997482307772204e-06, + "loss": 1.0605, + "step": 2026 + }, + { + "epoch": 0.05, + "learning_rate": 1.9974764174693395e-06, + "loss": 1.0762, + "step": 2027 + }, + { + "epoch": 0.05, + "learning_rate": 1.9974705202928576e-06, + "loss": 0.9766, + "step": 2028 + }, + { + "epoch": 0.05, + "learning_rate": 1.997464616242799e-06, + "loss": 0.9561, + "step": 2029 + }, + { + "epoch": 0.05, + "learning_rate": 1.9974587053192035e-06, + "loss": 1.0439, + "step": 2030 + }, + { + "epoch": 0.05, + "learning_rate": 1.9974527875221127e-06, + "loss": 0.8906, + "step": 2031 + }, + { + "epoch": 0.05, + "learning_rate": 1.9974468628515676e-06, + "loss": 1.1406, + "step": 2032 + }, + { + "epoch": 0.05, + "learning_rate": 1.997440931307608e-06, + "loss": 1.1562, + "step": 2033 + }, + { + "epoch": 0.05, + "learning_rate": 1.9974349928902757e-06, + "loss": 1.0664, + "step": 2034 + }, + { + "epoch": 0.05, + "learning_rate": 1.997429047599612e-06, + "loss": 0.8252, + "step": 2035 + }, + { + "epoch": 0.05, + "learning_rate": 1.9974230954356563e-06, + "loss": 0.9199, + "step": 2036 + }, + { + "epoch": 0.05, + "learning_rate": 1.9974171363984507e-06, + "loss": 0.9434, + "step": 2037 + }, + { + "epoch": 0.05, + "learning_rate": 1.997411170488036e-06, + "loss": 0.9541, + "step": 2038 + }, + { + "epoch": 0.05, + "learning_rate": 1.997405197704454e-06, + "loss": 0.8125, + "step": 2039 + }, + { + "epoch": 0.05, + "learning_rate": 1.9973992180477443e-06, + "loss": 0.8369, + "step": 2040 + }, + { + "epoch": 0.05, + "learning_rate": 1.99739323151795e-06, + "loss": 0.9072, + "step": 2041 + }, + { + "epoch": 0.05, + "learning_rate": 1.9973872381151107e-06, + "loss": 1.2539, + "step": 2042 + }, + { + "epoch": 0.05, + "learning_rate": 1.9973812378392688e-06, + "loss": 0.9834, + "step": 2043 + }, + { + "epoch": 0.05, + "learning_rate": 1.997375230690465e-06, + "loss": 1.0635, + "step": 2044 + }, + { + "epoch": 0.05, + "learning_rate": 1.997369216668741e-06, + "loss": 1.2051, + "step": 2045 + }, + { + "epoch": 0.05, + "learning_rate": 1.9973631957741383e-06, + "loss": 1.2891, + "step": 2046 + }, + { + "epoch": 0.05, + "learning_rate": 1.997357168006698e-06, + "loss": 1.1719, + "step": 2047 + }, + { + "epoch": 0.05, + "learning_rate": 1.9973511333664627e-06, + "loss": 0.959, + "step": 2048 + }, + { + "epoch": 0.05, + "learning_rate": 1.9973450918534726e-06, + "loss": 0.897, + "step": 2049 + }, + { + "epoch": 0.05, + "learning_rate": 1.99733904346777e-06, + "loss": 0.8496, + "step": 2050 + }, + { + "epoch": 0.05, + "learning_rate": 1.9973329882093964e-06, + "loss": 0.8789, + "step": 2051 + }, + { + "epoch": 0.05, + "learning_rate": 1.997326926078394e-06, + "loss": 0.7881, + "step": 2052 + }, + { + "epoch": 0.05, + "learning_rate": 1.997320857074804e-06, + "loss": 0.9092, + "step": 2053 + }, + { + "epoch": 0.05, + "learning_rate": 1.9973147811986683e-06, + "loss": 1.0195, + "step": 2054 + }, + { + "epoch": 0.05, + "learning_rate": 1.997308698450029e-06, + "loss": 0.9492, + "step": 2055 + }, + { + "epoch": 0.05, + "learning_rate": 1.997302608828928e-06, + "loss": 0.958, + "step": 2056 + }, + { + "epoch": 0.05, + "learning_rate": 1.9972965123354072e-06, + "loss": 0.9248, + "step": 2057 + }, + { + "epoch": 0.05, + "learning_rate": 1.9972904089695087e-06, + "loss": 0.9355, + "step": 2058 + }, + { + "epoch": 0.05, + "learning_rate": 1.9972842987312744e-06, + "loss": 0.9629, + "step": 2059 + }, + { + "epoch": 0.05, + "learning_rate": 1.9972781816207463e-06, + "loss": 0.7534, + "step": 2060 + }, + { + "epoch": 0.05, + "learning_rate": 1.997272057637967e-06, + "loss": 0.9316, + "step": 2061 + }, + { + "epoch": 0.05, + "learning_rate": 1.997265926782978e-06, + "loss": 0.9932, + "step": 2062 + }, + { + "epoch": 0.05, + "learning_rate": 1.997259789055822e-06, + "loss": 1.1631, + "step": 2063 + }, + { + "epoch": 0.05, + "learning_rate": 1.9972536444565413e-06, + "loss": 0.9307, + "step": 2064 + }, + { + "epoch": 0.05, + "learning_rate": 1.9972474929851785e-06, + "loss": 1.1758, + "step": 2065 + }, + { + "epoch": 0.05, + "learning_rate": 1.9972413346417756e-06, + "loss": 0.8535, + "step": 2066 + }, + { + "epoch": 0.05, + "learning_rate": 1.9972351694263753e-06, + "loss": 0.8877, + "step": 2067 + }, + { + "epoch": 0.05, + "learning_rate": 1.9972289973390196e-06, + "loss": 0.9014, + "step": 2068 + }, + { + "epoch": 0.05, + "learning_rate": 1.9972228183797516e-06, + "loss": 0.9512, + "step": 2069 + }, + { + "epoch": 0.05, + "learning_rate": 1.9972166325486134e-06, + "loss": 1.0146, + "step": 2070 + }, + { + "epoch": 0.05, + "learning_rate": 1.9972104398456476e-06, + "loss": 1.0098, + "step": 2071 + }, + { + "epoch": 0.05, + "learning_rate": 1.997204240270898e-06, + "loss": 0.9961, + "step": 2072 + }, + { + "epoch": 0.05, + "learning_rate": 1.997198033824406e-06, + "loss": 1.0635, + "step": 2073 + }, + { + "epoch": 0.05, + "learning_rate": 1.9971918205062145e-06, + "loss": 0.6246, + "step": 2074 + }, + { + "epoch": 0.05, + "learning_rate": 1.9971856003163668e-06, + "loss": 0.9639, + "step": 2075 + }, + { + "epoch": 0.05, + "learning_rate": 1.9971793732549054e-06, + "loss": 0.9502, + "step": 2076 + }, + { + "epoch": 0.05, + "learning_rate": 1.997173139321874e-06, + "loss": 0.9287, + "step": 2077 + }, + { + "epoch": 0.05, + "learning_rate": 1.997166898517314e-06, + "loss": 1.1602, + "step": 2078 + }, + { + "epoch": 0.05, + "learning_rate": 1.9971606508412705e-06, + "loss": 0.6318, + "step": 2079 + }, + { + "epoch": 0.05, + "learning_rate": 1.9971543962937848e-06, + "loss": 0.9038, + "step": 2080 + }, + { + "epoch": 0.05, + "learning_rate": 1.9971481348749006e-06, + "loss": 1.1377, + "step": 2081 + }, + { + "epoch": 0.05, + "learning_rate": 1.9971418665846615e-06, + "loss": 0.8838, + "step": 2082 + }, + { + "epoch": 0.05, + "learning_rate": 1.9971355914231094e-06, + "loss": 1.0156, + "step": 2083 + }, + { + "epoch": 0.05, + "learning_rate": 1.9971293093902893e-06, + "loss": 1.1309, + "step": 2084 + }, + { + "epoch": 0.05, + "learning_rate": 1.997123020486243e-06, + "loss": 0.9854, + "step": 2085 + }, + { + "epoch": 0.05, + "learning_rate": 1.997116724711015e-06, + "loss": 1.0801, + "step": 2086 + }, + { + "epoch": 0.05, + "learning_rate": 1.997110422064648e-06, + "loss": 0.9336, + "step": 2087 + }, + { + "epoch": 0.05, + "learning_rate": 1.997104112547185e-06, + "loss": 0.6624, + "step": 2088 + }, + { + "epoch": 0.05, + "learning_rate": 1.9970977961586704e-06, + "loss": 1.0576, + "step": 2089 + }, + { + "epoch": 0.05, + "learning_rate": 1.9970914728991474e-06, + "loss": 0.9463, + "step": 2090 + }, + { + "epoch": 0.05, + "learning_rate": 1.9970851427686595e-06, + "loss": 0.9414, + "step": 2091 + }, + { + "epoch": 0.05, + "learning_rate": 1.9970788057672505e-06, + "loss": 0.79, + "step": 2092 + }, + { + "epoch": 0.05, + "learning_rate": 1.997072461894964e-06, + "loss": 0.7668, + "step": 2093 + }, + { + "epoch": 0.05, + "learning_rate": 1.997066111151843e-06, + "loss": 1.0605, + "step": 2094 + }, + { + "epoch": 0.05, + "learning_rate": 1.997059753537932e-06, + "loss": 1.0146, + "step": 2095 + }, + { + "epoch": 0.05, + "learning_rate": 1.997053389053275e-06, + "loss": 0.7148, + "step": 2096 + }, + { + "epoch": 0.05, + "learning_rate": 1.9970470176979156e-06, + "loss": 0.9971, + "step": 2097 + }, + { + "epoch": 0.05, + "learning_rate": 1.9970406394718975e-06, + "loss": 0.9053, + "step": 2098 + }, + { + "epoch": 0.05, + "learning_rate": 1.9970342543752653e-06, + "loss": 0.9482, + "step": 2099 + }, + { + "epoch": 0.05, + "learning_rate": 1.997027862408062e-06, + "loss": 1.0898, + "step": 2100 + }, + { + "epoch": 0.05, + "learning_rate": 1.9970214635703324e-06, + "loss": 0.9189, + "step": 2101 + }, + { + "epoch": 0.05, + "learning_rate": 1.9970150578621203e-06, + "loss": 1.1445, + "step": 2102 + }, + { + "epoch": 0.05, + "learning_rate": 1.9970086452834698e-06, + "loss": 0.9629, + "step": 2103 + }, + { + "epoch": 0.05, + "learning_rate": 1.9970022258344253e-06, + "loss": 0.8818, + "step": 2104 + }, + { + "epoch": 0.05, + "learning_rate": 1.996995799515031e-06, + "loss": 1.1348, + "step": 2105 + }, + { + "epoch": 0.05, + "learning_rate": 1.996989366325331e-06, + "loss": 0.958, + "step": 2106 + }, + { + "epoch": 0.05, + "learning_rate": 1.9969829262653697e-06, + "loss": 1.0303, + "step": 2107 + }, + { + "epoch": 0.05, + "learning_rate": 1.9969764793351917e-06, + "loss": 1.0791, + "step": 2108 + }, + { + "epoch": 0.05, + "learning_rate": 1.996970025534841e-06, + "loss": 0.9785, + "step": 2109 + }, + { + "epoch": 0.05, + "learning_rate": 1.9969635648643625e-06, + "loss": 0.8955, + "step": 2110 + }, + { + "epoch": 0.05, + "learning_rate": 1.9969570973238006e-06, + "loss": 1.1738, + "step": 2111 + }, + { + "epoch": 0.05, + "learning_rate": 1.9969506229131997e-06, + "loss": 1.1318, + "step": 2112 + }, + { + "epoch": 0.05, + "learning_rate": 1.9969441416326047e-06, + "loss": 0.9668, + "step": 2113 + }, + { + "epoch": 0.05, + "learning_rate": 1.99693765348206e-06, + "loss": 1.0234, + "step": 2114 + }, + { + "epoch": 0.05, + "learning_rate": 1.99693115846161e-06, + "loss": 0.9521, + "step": 2115 + }, + { + "epoch": 0.05, + "learning_rate": 1.9969246565713004e-06, + "loss": 1.1494, + "step": 2116 + }, + { + "epoch": 0.05, + "learning_rate": 1.9969181478111753e-06, + "loss": 0.6646, + "step": 2117 + }, + { + "epoch": 0.05, + "learning_rate": 1.9969116321812796e-06, + "loss": 1.0762, + "step": 2118 + }, + { + "epoch": 0.05, + "learning_rate": 1.9969051096816583e-06, + "loss": 0.7627, + "step": 2119 + }, + { + "epoch": 0.05, + "learning_rate": 1.9968985803123568e-06, + "loss": 1.0381, + "step": 2120 + }, + { + "epoch": 0.05, + "learning_rate": 1.996892044073419e-06, + "loss": 0.8838, + "step": 2121 + }, + { + "epoch": 0.05, + "learning_rate": 1.996885500964891e-06, + "loss": 1.2061, + "step": 2122 + }, + { + "epoch": 0.05, + "learning_rate": 1.9968789509868175e-06, + "loss": 0.9219, + "step": 2123 + }, + { + "epoch": 0.05, + "learning_rate": 1.9968723941392432e-06, + "loss": 1.1582, + "step": 2124 + }, + { + "epoch": 0.05, + "learning_rate": 1.996865830422214e-06, + "loss": 1.0596, + "step": 2125 + }, + { + "epoch": 0.05, + "learning_rate": 1.9968592598357746e-06, + "loss": 1.1299, + "step": 2126 + }, + { + "epoch": 0.05, + "learning_rate": 1.996852682379971e-06, + "loss": 0.8682, + "step": 2127 + }, + { + "epoch": 0.05, + "learning_rate": 1.9968460980548477e-06, + "loss": 1.1045, + "step": 2128 + }, + { + "epoch": 0.05, + "learning_rate": 1.9968395068604504e-06, + "loss": 0.957, + "step": 2129 + }, + { + "epoch": 0.05, + "learning_rate": 1.9968329087968247e-06, + "loss": 1.1406, + "step": 2130 + }, + { + "epoch": 0.05, + "learning_rate": 1.996826303864016e-06, + "loss": 1.0205, + "step": 2131 + }, + { + "epoch": 0.05, + "learning_rate": 1.9968196920620693e-06, + "loss": 0.707, + "step": 2132 + }, + { + "epoch": 0.05, + "learning_rate": 1.996813073391031e-06, + "loss": 0.7773, + "step": 2133 + }, + { + "epoch": 0.05, + "learning_rate": 1.9968064478509457e-06, + "loss": 0.9658, + "step": 2134 + }, + { + "epoch": 0.05, + "learning_rate": 1.99679981544186e-06, + "loss": 0.9121, + "step": 2135 + }, + { + "epoch": 0.05, + "learning_rate": 1.9967931761638195e-06, + "loss": 1.0078, + "step": 2136 + }, + { + "epoch": 0.05, + "learning_rate": 1.9967865300168692e-06, + "loss": 1.0527, + "step": 2137 + }, + { + "epoch": 0.05, + "learning_rate": 1.9967798770010557e-06, + "loss": 0.9834, + "step": 2138 + }, + { + "epoch": 0.05, + "learning_rate": 1.9967732171164245e-06, + "loss": 0.877, + "step": 2139 + }, + { + "epoch": 0.05, + "learning_rate": 1.9967665503630215e-06, + "loss": 1.1191, + "step": 2140 + }, + { + "epoch": 0.05, + "learning_rate": 1.9967598767408928e-06, + "loss": 1.21, + "step": 2141 + }, + { + "epoch": 0.05, + "learning_rate": 1.996753196250084e-06, + "loss": 1.082, + "step": 2142 + }, + { + "epoch": 0.05, + "learning_rate": 1.9967465088906416e-06, + "loss": 0.8076, + "step": 2143 + }, + { + "epoch": 0.05, + "learning_rate": 1.9967398146626115e-06, + "loss": 0.8706, + "step": 2144 + }, + { + "epoch": 0.05, + "learning_rate": 1.9967331135660395e-06, + "loss": 1.1289, + "step": 2145 + }, + { + "epoch": 0.06, + "learning_rate": 1.9967264056009727e-06, + "loss": 0.7769, + "step": 2146 + }, + { + "epoch": 0.06, + "learning_rate": 1.996719690767456e-06, + "loss": 0.9902, + "step": 2147 + }, + { + "epoch": 0.06, + "learning_rate": 1.996712969065537e-06, + "loss": 0.8926, + "step": 2148 + }, + { + "epoch": 0.06, + "learning_rate": 1.9967062404952607e-06, + "loss": 0.7456, + "step": 2149 + }, + { + "epoch": 0.06, + "learning_rate": 1.9966995050566746e-06, + "loss": 1.042, + "step": 2150 + }, + { + "epoch": 0.06, + "learning_rate": 1.9966927627498246e-06, + "loss": 0.8359, + "step": 2151 + }, + { + "epoch": 0.06, + "learning_rate": 1.996686013574757e-06, + "loss": 0.9746, + "step": 2152 + }, + { + "epoch": 0.06, + "learning_rate": 1.996679257531519e-06, + "loss": 0.8081, + "step": 2153 + }, + { + "epoch": 0.06, + "learning_rate": 1.9966724946201567e-06, + "loss": 1.1191, + "step": 2154 + }, + { + "epoch": 0.06, + "learning_rate": 1.9966657248407163e-06, + "loss": 0.8574, + "step": 2155 + }, + { + "epoch": 0.06, + "learning_rate": 1.996658948193245e-06, + "loss": 0.8428, + "step": 2156 + }, + { + "epoch": 0.06, + "learning_rate": 1.99665216467779e-06, + "loss": 0.9443, + "step": 2157 + }, + { + "epoch": 0.06, + "learning_rate": 1.9966453742943966e-06, + "loss": 0.6816, + "step": 2158 + }, + { + "epoch": 0.06, + "learning_rate": 1.996638577043113e-06, + "loss": 1.002, + "step": 2159 + }, + { + "epoch": 0.06, + "learning_rate": 1.996631772923985e-06, + "loss": 1.0254, + "step": 2160 + }, + { + "epoch": 0.06, + "learning_rate": 1.9966249619370597e-06, + "loss": 0.8799, + "step": 2161 + }, + { + "epoch": 0.06, + "learning_rate": 1.996618144082385e-06, + "loss": 0.7119, + "step": 2162 + }, + { + "epoch": 0.06, + "learning_rate": 1.9966113193600065e-06, + "loss": 0.9795, + "step": 2163 + }, + { + "epoch": 0.06, + "learning_rate": 1.996604487769972e-06, + "loss": 0.9365, + "step": 2164 + }, + { + "epoch": 0.06, + "learning_rate": 1.9965976493123285e-06, + "loss": 0.9502, + "step": 2165 + }, + { + "epoch": 0.06, + "learning_rate": 1.996590803987123e-06, + "loss": 0.8838, + "step": 2166 + }, + { + "epoch": 0.06, + "learning_rate": 1.996583951794403e-06, + "loss": 0.9932, + "step": 2167 + }, + { + "epoch": 0.06, + "learning_rate": 1.9965770927342158e-06, + "loss": 1.1201, + "step": 2168 + }, + { + "epoch": 0.06, + "learning_rate": 1.9965702268066073e-06, + "loss": 1.1016, + "step": 2169 + }, + { + "epoch": 0.06, + "learning_rate": 1.9965633540116267e-06, + "loss": 0.9053, + "step": 2170 + }, + { + "epoch": 0.06, + "learning_rate": 1.99655647434932e-06, + "loss": 1.0352, + "step": 2171 + }, + { + "epoch": 0.06, + "learning_rate": 1.9965495878197355e-06, + "loss": 1.1172, + "step": 2172 + }, + { + "epoch": 0.06, + "learning_rate": 1.9965426944229197e-06, + "loss": 1.1748, + "step": 2173 + }, + { + "epoch": 0.06, + "learning_rate": 1.9965357941589215e-06, + "loss": 0.729, + "step": 2174 + }, + { + "epoch": 0.06, + "learning_rate": 1.9965288870277866e-06, + "loss": 0.8936, + "step": 2175 + }, + { + "epoch": 0.06, + "learning_rate": 1.9965219730295643e-06, + "loss": 0.8086, + "step": 2176 + }, + { + "epoch": 0.06, + "learning_rate": 1.9965150521643013e-06, + "loss": 1.0576, + "step": 2177 + }, + { + "epoch": 0.06, + "learning_rate": 1.9965081244320458e-06, + "loss": 1.0488, + "step": 2178 + }, + { + "epoch": 0.06, + "learning_rate": 1.9965011898328454e-06, + "loss": 1.0312, + "step": 2179 + }, + { + "epoch": 0.06, + "learning_rate": 1.9964942483667472e-06, + "loss": 0.7231, + "step": 2180 + }, + { + "epoch": 0.06, + "learning_rate": 1.9964873000338e-06, + "loss": 0.8984, + "step": 2181 + }, + { + "epoch": 0.06, + "learning_rate": 1.9964803448340515e-06, + "loss": 0.8037, + "step": 2182 + }, + { + "epoch": 0.06, + "learning_rate": 1.9964733827675487e-06, + "loss": 1.1738, + "step": 2183 + }, + { + "epoch": 0.06, + "learning_rate": 1.996466413834341e-06, + "loss": 0.9873, + "step": 2184 + }, + { + "epoch": 0.06, + "learning_rate": 1.9964594380344754e-06, + "loss": 0.9072, + "step": 2185 + }, + { + "epoch": 0.06, + "learning_rate": 1.996452455368e-06, + "loss": 1.1377, + "step": 2186 + }, + { + "epoch": 0.06, + "learning_rate": 1.9964454658349637e-06, + "loss": 1.0645, + "step": 2187 + }, + { + "epoch": 0.06, + "learning_rate": 1.996438469435414e-06, + "loss": 0.7314, + "step": 2188 + }, + { + "epoch": 0.06, + "learning_rate": 1.9964314661693995e-06, + "loss": 0.9355, + "step": 2189 + }, + { + "epoch": 0.06, + "learning_rate": 1.9964244560369677e-06, + "loss": 0.9932, + "step": 2190 + }, + { + "epoch": 0.06, + "learning_rate": 1.9964174390381676e-06, + "loss": 1.0088, + "step": 2191 + }, + { + "epoch": 0.06, + "learning_rate": 1.996410415173048e-06, + "loss": 1.0576, + "step": 2192 + }, + { + "epoch": 0.06, + "learning_rate": 1.996403384441656e-06, + "loss": 0.9736, + "step": 2193 + }, + { + "epoch": 0.06, + "learning_rate": 1.996396346844041e-06, + "loss": 1.0098, + "step": 2194 + }, + { + "epoch": 0.06, + "learning_rate": 1.9963893023802513e-06, + "loss": 0.7744, + "step": 2195 + }, + { + "epoch": 0.06, + "learning_rate": 1.996382251050335e-06, + "loss": 0.8379, + "step": 2196 + }, + { + "epoch": 0.06, + "learning_rate": 1.996375192854342e-06, + "loss": 1.0088, + "step": 2197 + }, + { + "epoch": 0.06, + "learning_rate": 1.996368127792319e-06, + "loss": 0.7959, + "step": 2198 + }, + { + "epoch": 0.06, + "learning_rate": 1.9963610558643166e-06, + "loss": 0.8691, + "step": 2199 + }, + { + "epoch": 0.06, + "learning_rate": 1.996353977070382e-06, + "loss": 0.877, + "step": 2200 + }, + { + "epoch": 0.06, + "learning_rate": 1.9963468914105647e-06, + "loss": 0.7087, + "step": 2201 + }, + { + "epoch": 0.06, + "learning_rate": 1.9963397988849135e-06, + "loss": 0.999, + "step": 2202 + }, + { + "epoch": 0.06, + "learning_rate": 1.996332699493477e-06, + "loss": 0.9541, + "step": 2203 + }, + { + "epoch": 0.06, + "learning_rate": 1.996325593236305e-06, + "loss": 0.8262, + "step": 2204 + }, + { + "epoch": 0.06, + "learning_rate": 1.996318480113445e-06, + "loss": 1.1494, + "step": 2205 + }, + { + "epoch": 0.06, + "learning_rate": 1.9963113601249475e-06, + "loss": 1.0771, + "step": 2206 + }, + { + "epoch": 0.06, + "learning_rate": 1.9963042332708607e-06, + "loss": 0.9941, + "step": 2207 + }, + { + "epoch": 0.06, + "learning_rate": 1.996297099551234e-06, + "loss": 0.8926, + "step": 2208 + }, + { + "epoch": 0.06, + "learning_rate": 1.996289958966116e-06, + "loss": 0.9375, + "step": 2209 + }, + { + "epoch": 0.06, + "learning_rate": 1.9962828115155566e-06, + "loss": 0.8057, + "step": 2210 + }, + { + "epoch": 0.06, + "learning_rate": 1.996275657199605e-06, + "loss": 0.9219, + "step": 2211 + }, + { + "epoch": 0.06, + "learning_rate": 1.9962684960183102e-06, + "loss": 1.1777, + "step": 2212 + }, + { + "epoch": 0.06, + "learning_rate": 1.9962613279717215e-06, + "loss": 0.876, + "step": 2213 + }, + { + "epoch": 0.06, + "learning_rate": 1.996254153059889e-06, + "loss": 0.957, + "step": 2214 + }, + { + "epoch": 0.06, + "learning_rate": 1.996246971282861e-06, + "loss": 0.9863, + "step": 2215 + }, + { + "epoch": 0.06, + "learning_rate": 1.9962397826406882e-06, + "loss": 0.7559, + "step": 2216 + }, + { + "epoch": 0.06, + "learning_rate": 1.9962325871334193e-06, + "loss": 0.999, + "step": 2217 + }, + { + "epoch": 0.06, + "learning_rate": 1.996225384761104e-06, + "loss": 0.8477, + "step": 2218 + }, + { + "epoch": 0.06, + "learning_rate": 1.9962181755237916e-06, + "loss": 0.9551, + "step": 2219 + }, + { + "epoch": 0.06, + "learning_rate": 1.996210959421533e-06, + "loss": 0.79, + "step": 2220 + }, + { + "epoch": 0.06, + "learning_rate": 1.9962037364543765e-06, + "loss": 0.4814, + "step": 2221 + }, + { + "epoch": 0.06, + "learning_rate": 1.996196506622373e-06, + "loss": 1.0068, + "step": 2222 + }, + { + "epoch": 0.06, + "learning_rate": 1.9961892699255715e-06, + "loss": 0.9521, + "step": 2223 + }, + { + "epoch": 0.06, + "learning_rate": 1.9961820263640224e-06, + "loss": 1.0527, + "step": 2224 + }, + { + "epoch": 0.06, + "learning_rate": 1.9961747759377757e-06, + "loss": 0.9619, + "step": 2225 + }, + { + "epoch": 0.06, + "learning_rate": 1.9961675186468805e-06, + "loss": 1.0781, + "step": 2226 + }, + { + "epoch": 0.06, + "learning_rate": 1.996160254491388e-06, + "loss": 1.0156, + "step": 2227 + }, + { + "epoch": 0.06, + "learning_rate": 1.9961529834713474e-06, + "loss": 1.1602, + "step": 2228 + }, + { + "epoch": 0.06, + "learning_rate": 1.996145705586809e-06, + "loss": 0.9424, + "step": 2229 + }, + { + "epoch": 0.06, + "learning_rate": 1.996138420837823e-06, + "loss": 1.041, + "step": 2230 + }, + { + "epoch": 0.06, + "learning_rate": 1.99613112922444e-06, + "loss": 0.8896, + "step": 2231 + }, + { + "epoch": 0.06, + "learning_rate": 1.9961238307467096e-06, + "loss": 1.0098, + "step": 2232 + }, + { + "epoch": 0.06, + "learning_rate": 1.9961165254046822e-06, + "loss": 0.9756, + "step": 2233 + }, + { + "epoch": 0.06, + "learning_rate": 1.9961092131984083e-06, + "loss": 1.25, + "step": 2234 + }, + { + "epoch": 0.06, + "learning_rate": 1.9961018941279385e-06, + "loss": 0.8525, + "step": 2235 + }, + { + "epoch": 0.06, + "learning_rate": 1.9960945681933226e-06, + "loss": 0.6929, + "step": 2236 + }, + { + "epoch": 0.06, + "learning_rate": 1.996087235394612e-06, + "loss": 1.0459, + "step": 2237 + }, + { + "epoch": 0.06, + "learning_rate": 1.9960798957318566e-06, + "loss": 1.1016, + "step": 2238 + }, + { + "epoch": 0.06, + "learning_rate": 1.996072549205107e-06, + "loss": 0.9277, + "step": 2239 + }, + { + "epoch": 0.06, + "learning_rate": 1.996065195814414e-06, + "loss": 1.0322, + "step": 2240 + }, + { + "epoch": 0.06, + "learning_rate": 1.9960578355598285e-06, + "loss": 0.8436, + "step": 2241 + }, + { + "epoch": 0.06, + "learning_rate": 1.9960504684414004e-06, + "loss": 0.8682, + "step": 2242 + }, + { + "epoch": 0.06, + "learning_rate": 1.9960430944591815e-06, + "loss": 0.9482, + "step": 2243 + }, + { + "epoch": 0.06, + "learning_rate": 1.9960357136132217e-06, + "loss": 1.0342, + "step": 2244 + }, + { + "epoch": 0.06, + "learning_rate": 1.9960283259035726e-06, + "loss": 0.8721, + "step": 2245 + }, + { + "epoch": 0.06, + "learning_rate": 1.9960209313302847e-06, + "loss": 1.1348, + "step": 2246 + }, + { + "epoch": 0.06, + "learning_rate": 1.9960135298934087e-06, + "loss": 0.8447, + "step": 2247 + }, + { + "epoch": 0.06, + "learning_rate": 1.9960061215929964e-06, + "loss": 0.8643, + "step": 2248 + }, + { + "epoch": 0.06, + "learning_rate": 1.995998706429098e-06, + "loss": 0.9453, + "step": 2249 + }, + { + "epoch": 0.06, + "learning_rate": 1.9959912844017653e-06, + "loss": 1.2715, + "step": 2250 + }, + { + "epoch": 0.06, + "learning_rate": 1.995983855511049e-06, + "loss": 0.8945, + "step": 2251 + }, + { + "epoch": 0.06, + "learning_rate": 1.9959764197570007e-06, + "loss": 0.8193, + "step": 2252 + }, + { + "epoch": 0.06, + "learning_rate": 1.9959689771396707e-06, + "loss": 0.9775, + "step": 2253 + }, + { + "epoch": 0.06, + "learning_rate": 1.995961527659112e-06, + "loss": 0.9116, + "step": 2254 + }, + { + "epoch": 0.06, + "learning_rate": 1.995954071315374e-06, + "loss": 0.8623, + "step": 2255 + }, + { + "epoch": 0.06, + "learning_rate": 1.995946608108509e-06, + "loss": 0.9756, + "step": 2256 + }, + { + "epoch": 0.06, + "learning_rate": 1.995939138038569e-06, + "loss": 1.0811, + "step": 2257 + }, + { + "epoch": 0.06, + "learning_rate": 1.9959316611056045e-06, + "loss": 0.8818, + "step": 2258 + }, + { + "epoch": 0.06, + "learning_rate": 1.9959241773096674e-06, + "loss": 1.0742, + "step": 2259 + }, + { + "epoch": 0.06, + "learning_rate": 1.9959166866508093e-06, + "loss": 1.0498, + "step": 2260 + }, + { + "epoch": 0.06, + "learning_rate": 1.9959091891290815e-06, + "loss": 1.0469, + "step": 2261 + }, + { + "epoch": 0.06, + "learning_rate": 1.9959016847445364e-06, + "loss": 0.8135, + "step": 2262 + }, + { + "epoch": 0.06, + "learning_rate": 1.995894173497225e-06, + "loss": 0.8057, + "step": 2263 + }, + { + "epoch": 0.06, + "learning_rate": 1.9958866553871997e-06, + "loss": 1.0635, + "step": 2264 + }, + { + "epoch": 0.06, + "learning_rate": 1.9958791304145114e-06, + "loss": 1.0615, + "step": 2265 + }, + { + "epoch": 0.06, + "learning_rate": 1.995871598579213e-06, + "loss": 0.8926, + "step": 2266 + }, + { + "epoch": 0.06, + "learning_rate": 1.9958640598813556e-06, + "loss": 1.0391, + "step": 2267 + }, + { + "epoch": 0.06, + "learning_rate": 1.9958565143209914e-06, + "loss": 0.9883, + "step": 2268 + }, + { + "epoch": 0.06, + "learning_rate": 1.9958489618981726e-06, + "loss": 0.8838, + "step": 2269 + }, + { + "epoch": 0.06, + "learning_rate": 1.995841402612951e-06, + "loss": 0.9658, + "step": 2270 + }, + { + "epoch": 0.06, + "learning_rate": 1.9958338364653785e-06, + "loss": 1.1045, + "step": 2271 + }, + { + "epoch": 0.06, + "learning_rate": 1.9958262634555077e-06, + "loss": 0.8887, + "step": 2272 + }, + { + "epoch": 0.06, + "learning_rate": 1.995818683583391e-06, + "loss": 1.0703, + "step": 2273 + }, + { + "epoch": 0.06, + "learning_rate": 1.99581109684908e-06, + "loss": 0.8525, + "step": 2274 + }, + { + "epoch": 0.06, + "learning_rate": 1.995803503252627e-06, + "loss": 0.9668, + "step": 2275 + }, + { + "epoch": 0.06, + "learning_rate": 1.9957959027940847e-06, + "loss": 1.1445, + "step": 2276 + }, + { + "epoch": 0.06, + "learning_rate": 1.9957882954735054e-06, + "loss": 0.7466, + "step": 2277 + }, + { + "epoch": 0.06, + "learning_rate": 1.995780681290941e-06, + "loss": 1.0049, + "step": 2278 + }, + { + "epoch": 0.06, + "learning_rate": 1.9957730602464448e-06, + "loss": 0.9854, + "step": 2279 + }, + { + "epoch": 0.06, + "learning_rate": 1.995765432340069e-06, + "loss": 1.1113, + "step": 2280 + }, + { + "epoch": 0.06, + "learning_rate": 1.9957577975718655e-06, + "loss": 0.9307, + "step": 2281 + }, + { + "epoch": 0.06, + "learning_rate": 1.995750155941888e-06, + "loss": 0.8398, + "step": 2282 + }, + { + "epoch": 0.06, + "learning_rate": 1.9957425074501886e-06, + "loss": 0.9756, + "step": 2283 + }, + { + "epoch": 0.06, + "learning_rate": 1.99573485209682e-06, + "loss": 0.7549, + "step": 2284 + }, + { + "epoch": 0.06, + "learning_rate": 1.995727189881835e-06, + "loss": 0.8184, + "step": 2285 + }, + { + "epoch": 0.06, + "learning_rate": 1.995719520805287e-06, + "loss": 1.0244, + "step": 2286 + }, + { + "epoch": 0.06, + "learning_rate": 1.995711844867227e-06, + "loss": 1.0615, + "step": 2287 + }, + { + "epoch": 0.06, + "learning_rate": 1.9957041620677104e-06, + "loss": 0.7686, + "step": 2288 + }, + { + "epoch": 0.06, + "learning_rate": 1.995696472406788e-06, + "loss": 1.1123, + "step": 2289 + }, + { + "epoch": 0.06, + "learning_rate": 1.9956887758845144e-06, + "loss": 1.1699, + "step": 2290 + }, + { + "epoch": 0.06, + "learning_rate": 1.9956810725009414e-06, + "loss": 0.698, + "step": 2291 + }, + { + "epoch": 0.06, + "learning_rate": 1.995673362256123e-06, + "loss": 0.9854, + "step": 2292 + }, + { + "epoch": 0.06, + "learning_rate": 1.995665645150111e-06, + "loss": 1.0225, + "step": 2293 + }, + { + "epoch": 0.06, + "learning_rate": 1.9956579211829603e-06, + "loss": 0.9326, + "step": 2294 + }, + { + "epoch": 0.06, + "learning_rate": 1.9956501903547236e-06, + "loss": 0.9395, + "step": 2295 + }, + { + "epoch": 0.06, + "learning_rate": 1.9956424526654535e-06, + "loss": 1.002, + "step": 2296 + }, + { + "epoch": 0.06, + "learning_rate": 1.995634708115204e-06, + "loss": 0.9814, + "step": 2297 + }, + { + "epoch": 0.06, + "learning_rate": 1.995626956704028e-06, + "loss": 0.8896, + "step": 2298 + }, + { + "epoch": 0.06, + "learning_rate": 1.995619198431979e-06, + "loss": 0.9082, + "step": 2299 + }, + { + "epoch": 0.06, + "learning_rate": 1.995611433299111e-06, + "loss": 0.8267, + "step": 2300 + }, + { + "epoch": 0.06, + "learning_rate": 1.9956036613054766e-06, + "loss": 1.1543, + "step": 2301 + }, + { + "epoch": 0.06, + "learning_rate": 1.9955958824511303e-06, + "loss": 1.0537, + "step": 2302 + }, + { + "epoch": 0.06, + "learning_rate": 1.995588096736125e-06, + "loss": 1.0791, + "step": 2303 + }, + { + "epoch": 0.06, + "learning_rate": 1.9955803041605146e-06, + "loss": 0.9893, + "step": 2304 + }, + { + "epoch": 0.06, + "learning_rate": 1.9955725047243527e-06, + "loss": 0.9727, + "step": 2305 + }, + { + "epoch": 0.06, + "learning_rate": 1.9955646984276933e-06, + "loss": 1.0098, + "step": 2306 + }, + { + "epoch": 0.06, + "learning_rate": 1.9955568852705904e-06, + "loss": 0.8047, + "step": 2307 + }, + { + "epoch": 0.06, + "learning_rate": 1.9955490652530966e-06, + "loss": 0.8506, + "step": 2308 + }, + { + "epoch": 0.06, + "learning_rate": 1.995541238375267e-06, + "loss": 0.835, + "step": 2309 + }, + { + "epoch": 0.06, + "learning_rate": 1.995533404637156e-06, + "loss": 1.0127, + "step": 2310 + }, + { + "epoch": 0.06, + "learning_rate": 1.995525564038816e-06, + "loss": 1.0547, + "step": 2311 + }, + { + "epoch": 0.06, + "learning_rate": 1.995517716580302e-06, + "loss": 1.1191, + "step": 2312 + }, + { + "epoch": 0.06, + "learning_rate": 1.995509862261668e-06, + "loss": 1.001, + "step": 2313 + }, + { + "epoch": 0.06, + "learning_rate": 1.995502001082968e-06, + "loss": 0.9307, + "step": 2314 + }, + { + "epoch": 0.06, + "learning_rate": 1.9954941330442558e-06, + "loss": 1.0215, + "step": 2315 + }, + { + "epoch": 0.06, + "learning_rate": 1.9954862581455864e-06, + "loss": 0.9375, + "step": 2316 + }, + { + "epoch": 0.06, + "learning_rate": 1.9954783763870137e-06, + "loss": 0.9443, + "step": 2317 + }, + { + "epoch": 0.06, + "learning_rate": 1.9954704877685917e-06, + "loss": 0.6733, + "step": 2318 + }, + { + "epoch": 0.06, + "learning_rate": 1.995462592290375e-06, + "loss": 0.8398, + "step": 2319 + }, + { + "epoch": 0.06, + "learning_rate": 1.9954546899524187e-06, + "loss": 0.8809, + "step": 2320 + }, + { + "epoch": 0.06, + "learning_rate": 1.995446780754776e-06, + "loss": 0.8125, + "step": 2321 + }, + { + "epoch": 0.06, + "learning_rate": 1.9954388646975023e-06, + "loss": 0.9102, + "step": 2322 + }, + { + "epoch": 0.06, + "learning_rate": 1.9954309417806517e-06, + "loss": 1.0957, + "step": 2323 + }, + { + "epoch": 0.06, + "learning_rate": 1.995423012004279e-06, + "loss": 1.0527, + "step": 2324 + }, + { + "epoch": 0.06, + "learning_rate": 1.9954150753684387e-06, + "loss": 0.8975, + "step": 2325 + }, + { + "epoch": 0.06, + "learning_rate": 1.995407131873186e-06, + "loss": 0.9062, + "step": 2326 + }, + { + "epoch": 0.06, + "learning_rate": 1.995399181518575e-06, + "loss": 0.957, + "step": 2327 + }, + { + "epoch": 0.06, + "learning_rate": 1.9953912243046607e-06, + "loss": 1.1621, + "step": 2328 + }, + { + "epoch": 0.06, + "learning_rate": 1.9953832602314977e-06, + "loss": 0.9873, + "step": 2329 + }, + { + "epoch": 0.06, + "learning_rate": 1.9953752892991416e-06, + "loss": 0.8926, + "step": 2330 + }, + { + "epoch": 0.06, + "learning_rate": 1.9953673115076464e-06, + "loss": 1.1045, + "step": 2331 + }, + { + "epoch": 0.06, + "learning_rate": 1.995359326857068e-06, + "loss": 0.833, + "step": 2332 + }, + { + "epoch": 0.06, + "learning_rate": 1.9953513353474607e-06, + "loss": 1.248, + "step": 2333 + }, + { + "epoch": 0.06, + "learning_rate": 1.99534333697888e-06, + "loss": 0.9287, + "step": 2334 + }, + { + "epoch": 0.06, + "learning_rate": 1.9953353317513806e-06, + "loss": 0.9062, + "step": 2335 + }, + { + "epoch": 0.06, + "learning_rate": 1.995327319665018e-06, + "loss": 0.9199, + "step": 2336 + }, + { + "epoch": 0.06, + "learning_rate": 1.9953193007198475e-06, + "loss": 1.2217, + "step": 2337 + }, + { + "epoch": 0.06, + "learning_rate": 1.9953112749159236e-06, + "loss": 0.999, + "step": 2338 + }, + { + "epoch": 0.06, + "learning_rate": 1.995303242253303e-06, + "loss": 0.8936, + "step": 2339 + }, + { + "epoch": 0.06, + "learning_rate": 1.9952952027320397e-06, + "loss": 1.0186, + "step": 2340 + }, + { + "epoch": 0.06, + "learning_rate": 1.9952871563521897e-06, + "loss": 1.043, + "step": 2341 + }, + { + "epoch": 0.06, + "learning_rate": 1.9952791031138085e-06, + "loss": 0.8491, + "step": 2342 + }, + { + "epoch": 0.06, + "learning_rate": 1.9952710430169515e-06, + "loss": 1.1406, + "step": 2343 + }, + { + "epoch": 0.06, + "learning_rate": 1.9952629760616743e-06, + "loss": 1.1162, + "step": 2344 + }, + { + "epoch": 0.06, + "learning_rate": 1.9952549022480323e-06, + "loss": 0.917, + "step": 2345 + }, + { + "epoch": 0.06, + "learning_rate": 1.995246821576081e-06, + "loss": 1.0137, + "step": 2346 + }, + { + "epoch": 0.06, + "learning_rate": 1.995238734045877e-06, + "loss": 0.8096, + "step": 2347 + }, + { + "epoch": 0.06, + "learning_rate": 1.995230639657475e-06, + "loss": 0.7749, + "step": 2348 + }, + { + "epoch": 0.06, + "learning_rate": 1.995222538410931e-06, + "loss": 1.0176, + "step": 2349 + }, + { + "epoch": 0.06, + "learning_rate": 1.995214430306301e-06, + "loss": 0.8799, + "step": 2350 + }, + { + "epoch": 0.06, + "learning_rate": 1.995206315343641e-06, + "loss": 0.9961, + "step": 2351 + }, + { + "epoch": 0.06, + "learning_rate": 1.9951981935230065e-06, + "loss": 0.791, + "step": 2352 + }, + { + "epoch": 0.06, + "learning_rate": 1.9951900648444537e-06, + "loss": 1.0195, + "step": 2353 + }, + { + "epoch": 0.06, + "learning_rate": 1.995181929308039e-06, + "loss": 0.6948, + "step": 2354 + }, + { + "epoch": 0.06, + "learning_rate": 1.995173786913818e-06, + "loss": 1.0361, + "step": 2355 + }, + { + "epoch": 0.06, + "learning_rate": 1.9951656376618467e-06, + "loss": 0.8799, + "step": 2356 + }, + { + "epoch": 0.06, + "learning_rate": 1.995157481552182e-06, + "loss": 0.6646, + "step": 2357 + }, + { + "epoch": 0.06, + "learning_rate": 1.995149318584879e-06, + "loss": 0.9277, + "step": 2358 + }, + { + "epoch": 0.06, + "learning_rate": 1.9951411487599947e-06, + "loss": 0.96, + "step": 2359 + }, + { + "epoch": 0.06, + "learning_rate": 1.995132972077585e-06, + "loss": 0.9971, + "step": 2360 + }, + { + "epoch": 0.06, + "learning_rate": 1.995124788537707e-06, + "loss": 0.9961, + "step": 2361 + }, + { + "epoch": 0.06, + "learning_rate": 1.9951165981404165e-06, + "loss": 1.1084, + "step": 2362 + }, + { + "epoch": 0.06, + "learning_rate": 1.9951084008857696e-06, + "loss": 0.7422, + "step": 2363 + }, + { + "epoch": 0.06, + "learning_rate": 1.9951001967738235e-06, + "loss": 1.248, + "step": 2364 + }, + { + "epoch": 0.06, + "learning_rate": 1.995091985804634e-06, + "loss": 0.9854, + "step": 2365 + }, + { + "epoch": 0.06, + "learning_rate": 1.995083767978259e-06, + "loss": 1.085, + "step": 2366 + }, + { + "epoch": 0.06, + "learning_rate": 1.9950755432947536e-06, + "loss": 1.1084, + "step": 2367 + }, + { + "epoch": 0.06, + "learning_rate": 1.995067311754175e-06, + "loss": 0.9932, + "step": 2368 + }, + { + "epoch": 0.06, + "learning_rate": 1.9950590733565804e-06, + "loss": 1.1162, + "step": 2369 + }, + { + "epoch": 0.06, + "learning_rate": 1.995050828102026e-06, + "loss": 1.0127, + "step": 2370 + }, + { + "epoch": 0.06, + "learning_rate": 1.995042575990569e-06, + "loss": 0.7891, + "step": 2371 + }, + { + "epoch": 0.06, + "learning_rate": 1.9950343170222658e-06, + "loss": 0.9844, + "step": 2372 + }, + { + "epoch": 0.06, + "learning_rate": 1.9950260511971737e-06, + "loss": 1.1143, + "step": 2373 + }, + { + "epoch": 0.06, + "learning_rate": 1.9950177785153495e-06, + "loss": 1.0068, + "step": 2374 + }, + { + "epoch": 0.06, + "learning_rate": 1.995009498976851e-06, + "loss": 1.1152, + "step": 2375 + }, + { + "epoch": 0.06, + "learning_rate": 1.995001212581734e-06, + "loss": 0.9595, + "step": 2376 + }, + { + "epoch": 0.06, + "learning_rate": 1.9949929193300555e-06, + "loss": 0.9932, + "step": 2377 + }, + { + "epoch": 0.06, + "learning_rate": 1.994984619221874e-06, + "loss": 0.9434, + "step": 2378 + }, + { + "epoch": 0.06, + "learning_rate": 1.994976312257246e-06, + "loss": 1.0889, + "step": 2379 + }, + { + "epoch": 0.06, + "learning_rate": 1.994967998436228e-06, + "loss": 0.9785, + "step": 2380 + }, + { + "epoch": 0.06, + "learning_rate": 1.994959677758879e-06, + "loss": 1.1016, + "step": 2381 + }, + { + "epoch": 0.06, + "learning_rate": 1.9949513502252547e-06, + "loss": 0.9922, + "step": 2382 + }, + { + "epoch": 0.06, + "learning_rate": 1.9949430158354134e-06, + "loss": 0.8086, + "step": 2383 + }, + { + "epoch": 0.06, + "learning_rate": 1.994934674589412e-06, + "loss": 1.002, + "step": 2384 + }, + { + "epoch": 0.06, + "learning_rate": 1.994926326487309e-06, + "loss": 0.894, + "step": 2385 + }, + { + "epoch": 0.06, + "learning_rate": 1.9949179715291604e-06, + "loss": 0.8369, + "step": 2386 + }, + { + "epoch": 0.06, + "learning_rate": 1.9949096097150243e-06, + "loss": 1.0791, + "step": 2387 + }, + { + "epoch": 0.06, + "learning_rate": 1.994901241044959e-06, + "loss": 0.998, + "step": 2388 + }, + { + "epoch": 0.06, + "learning_rate": 1.994892865519022e-06, + "loss": 0.8984, + "step": 2389 + }, + { + "epoch": 0.06, + "learning_rate": 1.9948844831372705e-06, + "loss": 0.9697, + "step": 2390 + }, + { + "epoch": 0.06, + "learning_rate": 1.994876093899762e-06, + "loss": 0.9067, + "step": 2391 + }, + { + "epoch": 0.06, + "learning_rate": 1.9948676978065556e-06, + "loss": 1.0605, + "step": 2392 + }, + { + "epoch": 0.06, + "learning_rate": 1.994859294857708e-06, + "loss": 1.002, + "step": 2393 + }, + { + "epoch": 0.06, + "learning_rate": 1.9948508850532777e-06, + "loss": 1.1035, + "step": 2394 + }, + { + "epoch": 0.06, + "learning_rate": 1.994842468393322e-06, + "loss": 0.8354, + "step": 2395 + }, + { + "epoch": 0.06, + "learning_rate": 1.9948340448779e-06, + "loss": 0.9199, + "step": 2396 + }, + { + "epoch": 0.06, + "learning_rate": 1.9948256145070685e-06, + "loss": 0.9971, + "step": 2397 + }, + { + "epoch": 0.06, + "learning_rate": 1.9948171772808866e-06, + "loss": 1.1768, + "step": 2398 + }, + { + "epoch": 0.06, + "learning_rate": 1.9948087331994116e-06, + "loss": 1.1006, + "step": 2399 + }, + { + "epoch": 0.06, + "learning_rate": 1.9948002822627025e-06, + "loss": 1.0352, + "step": 2400 + }, + { + "epoch": 0.06, + "learning_rate": 1.994791824470817e-06, + "loss": 0.9961, + "step": 2401 + }, + { + "epoch": 0.06, + "learning_rate": 1.9947833598238135e-06, + "loss": 0.9492, + "step": 2402 + }, + { + "epoch": 0.06, + "learning_rate": 1.99477488832175e-06, + "loss": 0.6167, + "step": 2403 + }, + { + "epoch": 0.06, + "learning_rate": 1.9947664099646858e-06, + "loss": 0.9932, + "step": 2404 + }, + { + "epoch": 0.06, + "learning_rate": 1.9947579247526783e-06, + "loss": 0.9785, + "step": 2405 + }, + { + "epoch": 0.06, + "learning_rate": 1.9947494326857866e-06, + "loss": 1.0459, + "step": 2406 + }, + { + "epoch": 0.06, + "learning_rate": 1.9947409337640693e-06, + "loss": 0.9824, + "step": 2407 + }, + { + "epoch": 0.06, + "learning_rate": 1.9947324279875842e-06, + "loss": 0.957, + "step": 2408 + }, + { + "epoch": 0.06, + "learning_rate": 1.994723915356391e-06, + "loss": 0.9336, + "step": 2409 + }, + { + "epoch": 0.06, + "learning_rate": 1.9947153958705476e-06, + "loss": 1.2168, + "step": 2410 + }, + { + "epoch": 0.06, + "learning_rate": 1.9947068695301126e-06, + "loss": 1.0107, + "step": 2411 + }, + { + "epoch": 0.06, + "learning_rate": 1.994698336335145e-06, + "loss": 0.9209, + "step": 2412 + }, + { + "epoch": 0.06, + "learning_rate": 1.994689796285704e-06, + "loss": 1.1143, + "step": 2413 + }, + { + "epoch": 0.06, + "learning_rate": 1.994681249381848e-06, + "loss": 1.2363, + "step": 2414 + }, + { + "epoch": 0.06, + "learning_rate": 1.9946726956236364e-06, + "loss": 0.7778, + "step": 2415 + }, + { + "epoch": 0.06, + "learning_rate": 1.9946641350111272e-06, + "loss": 1.0508, + "step": 2416 + }, + { + "epoch": 0.06, + "learning_rate": 1.99465556754438e-06, + "loss": 0.9121, + "step": 2417 + }, + { + "epoch": 0.06, + "learning_rate": 1.994646993223454e-06, + "loss": 0.876, + "step": 2418 + }, + { + "epoch": 0.06, + "learning_rate": 1.994638412048408e-06, + "loss": 1.0195, + "step": 2419 + }, + { + "epoch": 0.06, + "learning_rate": 1.994629824019301e-06, + "loss": 1.0898, + "step": 2420 + }, + { + "epoch": 0.06, + "learning_rate": 1.994621229136192e-06, + "loss": 1.0039, + "step": 2421 + }, + { + "epoch": 0.06, + "learning_rate": 1.9946126273991415e-06, + "loss": 0.5532, + "step": 2422 + }, + { + "epoch": 0.06, + "learning_rate": 1.994604018808207e-06, + "loss": 1.0195, + "step": 2423 + }, + { + "epoch": 0.06, + "learning_rate": 1.9945954033634494e-06, + "loss": 0.9448, + "step": 2424 + }, + { + "epoch": 0.06, + "learning_rate": 1.994586781064927e-06, + "loss": 0.707, + "step": 2425 + }, + { + "epoch": 0.06, + "learning_rate": 1.9945781519127e-06, + "loss": 0.9785, + "step": 2426 + }, + { + "epoch": 0.06, + "learning_rate": 1.9945695159068267e-06, + "loss": 1.0322, + "step": 2427 + }, + { + "epoch": 0.06, + "learning_rate": 1.994560873047368e-06, + "loss": 0.9736, + "step": 2428 + }, + { + "epoch": 0.06, + "learning_rate": 1.9945522233343827e-06, + "loss": 1.0117, + "step": 2429 + }, + { + "epoch": 0.06, + "learning_rate": 1.9945435667679302e-06, + "loss": 0.9004, + "step": 2430 + }, + { + "epoch": 0.06, + "learning_rate": 1.9945349033480706e-06, + "loss": 1.043, + "step": 2431 + }, + { + "epoch": 0.06, + "learning_rate": 1.994526233074863e-06, + "loss": 0.9102, + "step": 2432 + }, + { + "epoch": 0.06, + "learning_rate": 1.9945175559483685e-06, + "loss": 0.9858, + "step": 2433 + }, + { + "epoch": 0.06, + "learning_rate": 1.994508871968646e-06, + "loss": 1.1143, + "step": 2434 + }, + { + "epoch": 0.06, + "learning_rate": 1.9945001811357547e-06, + "loss": 1.0098, + "step": 2435 + }, + { + "epoch": 0.06, + "learning_rate": 1.9944914834497557e-06, + "loss": 0.8867, + "step": 2436 + }, + { + "epoch": 0.06, + "learning_rate": 1.994482778910708e-06, + "loss": 1.0176, + "step": 2437 + }, + { + "epoch": 0.06, + "learning_rate": 1.994474067518672e-06, + "loss": 1.0547, + "step": 2438 + }, + { + "epoch": 0.06, + "learning_rate": 1.9944653492737074e-06, + "loss": 1.25, + "step": 2439 + }, + { + "epoch": 0.06, + "learning_rate": 1.9944566241758753e-06, + "loss": 0.915, + "step": 2440 + }, + { + "epoch": 0.06, + "learning_rate": 1.9944478922252345e-06, + "loss": 0.8887, + "step": 2441 + }, + { + "epoch": 0.06, + "learning_rate": 1.994439153421846e-06, + "loss": 1.0244, + "step": 2442 + }, + { + "epoch": 0.06, + "learning_rate": 1.99443040776577e-06, + "loss": 0.8955, + "step": 2443 + }, + { + "epoch": 0.06, + "learning_rate": 1.9944216552570663e-06, + "loss": 0.9277, + "step": 2444 + }, + { + "epoch": 0.06, + "learning_rate": 1.994412895895795e-06, + "loss": 0.874, + "step": 2445 + }, + { + "epoch": 0.06, + "learning_rate": 1.9944041296820178e-06, + "loss": 1.0215, + "step": 2446 + }, + { + "epoch": 0.06, + "learning_rate": 1.994395356615794e-06, + "loss": 1.0742, + "step": 2447 + }, + { + "epoch": 0.06, + "learning_rate": 1.994386576697184e-06, + "loss": 0.8887, + "step": 2448 + }, + { + "epoch": 0.06, + "learning_rate": 1.9943777899262484e-06, + "loss": 0.8193, + "step": 2449 + }, + { + "epoch": 0.06, + "learning_rate": 1.994368996303048e-06, + "loss": 0.9482, + "step": 2450 + }, + { + "epoch": 0.06, + "learning_rate": 1.9943601958276436e-06, + "loss": 0.7939, + "step": 2451 + }, + { + "epoch": 0.06, + "learning_rate": 1.9943513885000956e-06, + "loss": 0.9443, + "step": 2452 + }, + { + "epoch": 0.06, + "learning_rate": 1.994342574320465e-06, + "loss": 0.8525, + "step": 2453 + }, + { + "epoch": 0.06, + "learning_rate": 1.9943337532888116e-06, + "loss": 1.1572, + "step": 2454 + }, + { + "epoch": 0.06, + "learning_rate": 1.994324925405197e-06, + "loss": 1.085, + "step": 2455 + }, + { + "epoch": 0.06, + "learning_rate": 1.994316090669682e-06, + "loss": 0.8604, + "step": 2456 + }, + { + "epoch": 0.06, + "learning_rate": 1.994307249082327e-06, + "loss": 0.8896, + "step": 2457 + }, + { + "epoch": 0.06, + "learning_rate": 1.9942984006431934e-06, + "loss": 0.7378, + "step": 2458 + }, + { + "epoch": 0.06, + "learning_rate": 1.994289545352342e-06, + "loss": 1.0439, + "step": 2459 + }, + { + "epoch": 0.06, + "learning_rate": 1.994280683209834e-06, + "loss": 0.9248, + "step": 2460 + }, + { + "epoch": 0.06, + "learning_rate": 1.99427181421573e-06, + "loss": 0.8896, + "step": 2461 + }, + { + "epoch": 0.06, + "learning_rate": 1.9942629383700917e-06, + "loss": 1.2637, + "step": 2462 + }, + { + "epoch": 0.06, + "learning_rate": 1.9942540556729795e-06, + "loss": 1.0723, + "step": 2463 + }, + { + "epoch": 0.06, + "learning_rate": 1.994245166124456e-06, + "loss": 1.0732, + "step": 2464 + }, + { + "epoch": 0.06, + "learning_rate": 1.9942362697245804e-06, + "loss": 0.7988, + "step": 2465 + }, + { + "epoch": 0.06, + "learning_rate": 1.994227366473416e-06, + "loss": 0.9678, + "step": 2466 + }, + { + "epoch": 0.06, + "learning_rate": 1.994218456371023e-06, + "loss": 0.895, + "step": 2467 + }, + { + "epoch": 0.06, + "learning_rate": 1.994209539417463e-06, + "loss": 0.9727, + "step": 2468 + }, + { + "epoch": 0.06, + "learning_rate": 1.9942006156127975e-06, + "loss": 0.998, + "step": 2469 + }, + { + "epoch": 0.06, + "learning_rate": 1.9941916849570886e-06, + "loss": 1.1523, + "step": 2470 + }, + { + "epoch": 0.06, + "learning_rate": 1.9941827474503967e-06, + "loss": 0.9863, + "step": 2471 + }, + { + "epoch": 0.06, + "learning_rate": 1.9941738030927843e-06, + "loss": 1.0078, + "step": 2472 + }, + { + "epoch": 0.06, + "learning_rate": 1.9941648518843125e-06, + "loss": 1.1377, + "step": 2473 + }, + { + "epoch": 0.06, + "learning_rate": 1.9941558938250434e-06, + "loss": 1.0957, + "step": 2474 + }, + { + "epoch": 0.06, + "learning_rate": 1.9941469289150383e-06, + "loss": 1.0459, + "step": 2475 + }, + { + "epoch": 0.06, + "learning_rate": 1.9941379571543595e-06, + "loss": 0.9922, + "step": 2476 + }, + { + "epoch": 0.06, + "learning_rate": 1.9941289785430684e-06, + "loss": 1.0039, + "step": 2477 + }, + { + "epoch": 0.06, + "learning_rate": 1.9941199930812267e-06, + "loss": 0.9248, + "step": 2478 + }, + { + "epoch": 0.06, + "learning_rate": 1.994111000768897e-06, + "loss": 1.1348, + "step": 2479 + }, + { + "epoch": 0.06, + "learning_rate": 1.994102001606141e-06, + "loss": 0.9609, + "step": 2480 + }, + { + "epoch": 0.06, + "learning_rate": 1.9940929955930203e-06, + "loss": 0.8936, + "step": 2481 + }, + { + "epoch": 0.06, + "learning_rate": 1.9940839827295976e-06, + "loss": 0.8867, + "step": 2482 + }, + { + "epoch": 0.06, + "learning_rate": 1.994074963015934e-06, + "loss": 0.9521, + "step": 2483 + }, + { + "epoch": 0.06, + "learning_rate": 1.994065936452093e-06, + "loss": 1.0039, + "step": 2484 + }, + { + "epoch": 0.06, + "learning_rate": 1.9940569030381357e-06, + "loss": 0.8413, + "step": 2485 + }, + { + "epoch": 0.06, + "learning_rate": 1.9940478627741247e-06, + "loss": 0.8691, + "step": 2486 + }, + { + "epoch": 0.06, + "learning_rate": 1.9940388156601226e-06, + "loss": 0.9961, + "step": 2487 + }, + { + "epoch": 0.06, + "learning_rate": 1.9940297616961918e-06, + "loss": 0.9375, + "step": 2488 + }, + { + "epoch": 0.06, + "learning_rate": 1.994020700882394e-06, + "loss": 1.0498, + "step": 2489 + }, + { + "epoch": 0.06, + "learning_rate": 1.994011633218792e-06, + "loss": 1.123, + "step": 2490 + }, + { + "epoch": 0.06, + "learning_rate": 1.9940025587054485e-06, + "loss": 0.8787, + "step": 2491 + }, + { + "epoch": 0.06, + "learning_rate": 1.993993477342426e-06, + "loss": 0.6821, + "step": 2492 + }, + { + "epoch": 0.06, + "learning_rate": 1.9939843891297865e-06, + "loss": 0.8354, + "step": 2493 + }, + { + "epoch": 0.06, + "learning_rate": 1.9939752940675935e-06, + "loss": 0.918, + "step": 2494 + }, + { + "epoch": 0.06, + "learning_rate": 1.993966192155909e-06, + "loss": 0.9932, + "step": 2495 + }, + { + "epoch": 0.06, + "learning_rate": 1.993957083394796e-06, + "loss": 0.8574, + "step": 2496 + }, + { + "epoch": 0.06, + "learning_rate": 1.9939479677843175e-06, + "loss": 0.833, + "step": 2497 + }, + { + "epoch": 0.06, + "learning_rate": 1.9939388453245355e-06, + "loss": 0.9707, + "step": 2498 + }, + { + "epoch": 0.06, + "learning_rate": 1.993929716015514e-06, + "loss": 1.0742, + "step": 2499 + }, + { + "epoch": 0.06, + "learning_rate": 1.993920579857315e-06, + "loss": 0.854, + "step": 2500 + }, + { + "epoch": 0.06, + "learning_rate": 1.9939114368500014e-06, + "loss": 0.8633, + "step": 2501 + }, + { + "epoch": 0.06, + "learning_rate": 1.993902286993637e-06, + "loss": 1.1475, + "step": 2502 + }, + { + "epoch": 0.06, + "learning_rate": 1.9938931302882846e-06, + "loss": 0.9365, + "step": 2503 + }, + { + "epoch": 0.06, + "learning_rate": 1.993883966734007e-06, + "loss": 1.1084, + "step": 2504 + }, + { + "epoch": 0.06, + "learning_rate": 1.9938747963308677e-06, + "loss": 1.1514, + "step": 2505 + }, + { + "epoch": 0.06, + "learning_rate": 1.993865619078929e-06, + "loss": 0.8496, + "step": 2506 + }, + { + "epoch": 0.06, + "learning_rate": 1.9938564349782555e-06, + "loss": 0.9902, + "step": 2507 + }, + { + "epoch": 0.06, + "learning_rate": 1.9938472440289094e-06, + "loss": 1.0654, + "step": 2508 + }, + { + "epoch": 0.06, + "learning_rate": 1.9938380462309546e-06, + "loss": 0.9268, + "step": 2509 + }, + { + "epoch": 0.06, + "learning_rate": 1.993828841584454e-06, + "loss": 0.7979, + "step": 2510 + }, + { + "epoch": 0.06, + "learning_rate": 1.993819630089472e-06, + "loss": 0.9834, + "step": 2511 + }, + { + "epoch": 0.06, + "learning_rate": 1.993810411746071e-06, + "loss": 0.8584, + "step": 2512 + }, + { + "epoch": 0.06, + "learning_rate": 1.993801186554315e-06, + "loss": 0.917, + "step": 2513 + }, + { + "epoch": 0.06, + "learning_rate": 1.9937919545142673e-06, + "loss": 1.0713, + "step": 2514 + }, + { + "epoch": 0.06, + "learning_rate": 1.993782715625992e-06, + "loss": 0.9795, + "step": 2515 + }, + { + "epoch": 0.06, + "learning_rate": 1.9937734698895524e-06, + "loss": 1.0176, + "step": 2516 + }, + { + "epoch": 0.06, + "learning_rate": 1.9937642173050123e-06, + "loss": 1.0273, + "step": 2517 + }, + { + "epoch": 0.06, + "learning_rate": 1.9937549578724357e-06, + "loss": 0.8877, + "step": 2518 + }, + { + "epoch": 0.06, + "learning_rate": 1.9937456915918858e-06, + "loss": 0.9473, + "step": 2519 + }, + { + "epoch": 0.06, + "learning_rate": 1.9937364184634272e-06, + "loss": 0.79, + "step": 2520 + }, + { + "epoch": 0.06, + "learning_rate": 1.993727138487123e-06, + "loss": 1.0098, + "step": 2521 + }, + { + "epoch": 0.06, + "learning_rate": 1.993717851663038e-06, + "loss": 0.8105, + "step": 2522 + }, + { + "epoch": 0.06, + "learning_rate": 1.9937085579912357e-06, + "loss": 1.1084, + "step": 2523 + }, + { + "epoch": 0.06, + "learning_rate": 1.99369925747178e-06, + "loss": 1.0166, + "step": 2524 + }, + { + "epoch": 0.06, + "learning_rate": 1.9936899501047354e-06, + "loss": 0.9844, + "step": 2525 + }, + { + "epoch": 0.06, + "learning_rate": 1.993680635890166e-06, + "loss": 0.9639, + "step": 2526 + }, + { + "epoch": 0.06, + "learning_rate": 1.9936713148281356e-06, + "loss": 1.0537, + "step": 2527 + }, + { + "epoch": 0.06, + "learning_rate": 1.9936619869187085e-06, + "loss": 0.9824, + "step": 2528 + }, + { + "epoch": 0.06, + "learning_rate": 1.993652652161949e-06, + "loss": 0.9834, + "step": 2529 + }, + { + "epoch": 0.06, + "learning_rate": 1.993643310557922e-06, + "loss": 0.8809, + "step": 2530 + }, + { + "epoch": 0.06, + "learning_rate": 1.9936339621066914e-06, + "loss": 0.9199, + "step": 2531 + }, + { + "epoch": 0.06, + "learning_rate": 1.993624606808322e-06, + "loss": 0.9561, + "step": 2532 + }, + { + "epoch": 0.06, + "learning_rate": 1.993615244662877e-06, + "loss": 0.9805, + "step": 2533 + }, + { + "epoch": 0.06, + "learning_rate": 1.9936058756704224e-06, + "loss": 0.9199, + "step": 2534 + }, + { + "epoch": 0.06, + "learning_rate": 1.9935964998310223e-06, + "loss": 1.0049, + "step": 2535 + }, + { + "epoch": 0.06, + "learning_rate": 1.993587117144741e-06, + "loss": 0.6753, + "step": 2536 + }, + { + "epoch": 0.07, + "learning_rate": 1.9935777276116434e-06, + "loss": 1.0479, + "step": 2537 + }, + { + "epoch": 0.07, + "learning_rate": 1.9935683312317942e-06, + "loss": 1.125, + "step": 2538 + }, + { + "epoch": 0.07, + "learning_rate": 1.9935589280052583e-06, + "loss": 0.874, + "step": 2539 + }, + { + "epoch": 0.07, + "learning_rate": 1.9935495179321e-06, + "loss": 1.0654, + "step": 2540 + }, + { + "epoch": 0.07, + "learning_rate": 1.993540101012385e-06, + "loss": 0.874, + "step": 2541 + }, + { + "epoch": 0.07, + "learning_rate": 1.9935306772461773e-06, + "loss": 0.9121, + "step": 2542 + }, + { + "epoch": 0.07, + "learning_rate": 1.993521246633542e-06, + "loss": 0.8154, + "step": 2543 + }, + { + "epoch": 0.07, + "learning_rate": 1.9935118091745443e-06, + "loss": 0.9971, + "step": 2544 + }, + { + "epoch": 0.07, + "learning_rate": 1.9935023648692495e-06, + "loss": 0.7935, + "step": 2545 + }, + { + "epoch": 0.07, + "learning_rate": 1.9934929137177224e-06, + "loss": 1.001, + "step": 2546 + }, + { + "epoch": 0.07, + "learning_rate": 1.9934834557200283e-06, + "loss": 0.9414, + "step": 2547 + }, + { + "epoch": 0.07, + "learning_rate": 1.993473990876232e-06, + "loss": 0.959, + "step": 2548 + }, + { + "epoch": 0.07, + "learning_rate": 1.9934645191863987e-06, + "loss": 0.8457, + "step": 2549 + }, + { + "epoch": 0.07, + "learning_rate": 1.9934550406505937e-06, + "loss": 0.9072, + "step": 2550 + }, + { + "epoch": 0.07, + "learning_rate": 1.993445555268883e-06, + "loss": 1.0381, + "step": 2551 + }, + { + "epoch": 0.07, + "learning_rate": 1.9934360630413313e-06, + "loss": 0.9355, + "step": 2552 + }, + { + "epoch": 0.07, + "learning_rate": 1.9934265639680042e-06, + "loss": 1.0068, + "step": 2553 + }, + { + "epoch": 0.07, + "learning_rate": 1.9934170580489675e-06, + "loss": 1.0029, + "step": 2554 + }, + { + "epoch": 0.07, + "learning_rate": 1.993407545284286e-06, + "loss": 0.9121, + "step": 2555 + }, + { + "epoch": 0.07, + "learning_rate": 1.9933980256740254e-06, + "loss": 0.8259, + "step": 2556 + }, + { + "epoch": 0.07, + "learning_rate": 1.9933884992182517e-06, + "loss": 0.917, + "step": 2557 + }, + { + "epoch": 0.07, + "learning_rate": 1.9933789659170306e-06, + "loss": 1.0059, + "step": 2558 + }, + { + "epoch": 0.07, + "learning_rate": 1.993369425770427e-06, + "loss": 1.2354, + "step": 2559 + }, + { + "epoch": 0.07, + "learning_rate": 1.9933598787785073e-06, + "loss": 0.9912, + "step": 2560 + }, + { + "epoch": 0.07, + "learning_rate": 1.993350324941338e-06, + "loss": 0.8223, + "step": 2561 + }, + { + "epoch": 0.07, + "learning_rate": 1.993340764258983e-06, + "loss": 0.9639, + "step": 2562 + }, + { + "epoch": 0.07, + "learning_rate": 1.9933311967315096e-06, + "loss": 0.9717, + "step": 2563 + }, + { + "epoch": 0.07, + "learning_rate": 1.993321622358984e-06, + "loss": 0.9365, + "step": 2564 + }, + { + "epoch": 0.07, + "learning_rate": 1.993312041141471e-06, + "loss": 0.77, + "step": 2565 + }, + { + "epoch": 0.07, + "learning_rate": 1.9933024530790374e-06, + "loss": 1.1982, + "step": 2566 + }, + { + "epoch": 0.07, + "learning_rate": 1.993292858171749e-06, + "loss": 0.9932, + "step": 2567 + }, + { + "epoch": 0.07, + "learning_rate": 1.993283256419672e-06, + "loss": 0.998, + "step": 2568 + }, + { + "epoch": 0.07, + "learning_rate": 1.993273647822873e-06, + "loss": 1.0049, + "step": 2569 + }, + { + "epoch": 0.07, + "learning_rate": 1.9932640323814173e-06, + "loss": 1.1357, + "step": 2570 + }, + { + "epoch": 0.07, + "learning_rate": 1.9932544100953717e-06, + "loss": 1.0, + "step": 2571 + }, + { + "epoch": 0.07, + "learning_rate": 1.9932447809648028e-06, + "loss": 1.1094, + "step": 2572 + }, + { + "epoch": 0.07, + "learning_rate": 1.9932351449897765e-06, + "loss": 1.1562, + "step": 2573 + }, + { + "epoch": 0.07, + "learning_rate": 1.993225502170359e-06, + "loss": 0.6772, + "step": 2574 + }, + { + "epoch": 0.07, + "learning_rate": 1.9932158525066173e-06, + "loss": 1.085, + "step": 2575 + }, + { + "epoch": 0.07, + "learning_rate": 1.9932061959986175e-06, + "loss": 1.2236, + "step": 2576 + }, + { + "epoch": 0.07, + "learning_rate": 1.9931965326464263e-06, + "loss": 0.8228, + "step": 2577 + }, + { + "epoch": 0.07, + "learning_rate": 1.9931868624501106e-06, + "loss": 1.0332, + "step": 2578 + }, + { + "epoch": 0.07, + "learning_rate": 1.9931771854097365e-06, + "loss": 1.0264, + "step": 2579 + }, + { + "epoch": 0.07, + "learning_rate": 1.993167501525371e-06, + "loss": 0.9141, + "step": 2580 + }, + { + "epoch": 0.07, + "learning_rate": 1.9931578107970808e-06, + "loss": 1.0713, + "step": 2581 + }, + { + "epoch": 0.07, + "learning_rate": 1.9931481132249325e-06, + "loss": 0.999, + "step": 2582 + }, + { + "epoch": 0.07, + "learning_rate": 1.9931384088089927e-06, + "loss": 0.9131, + "step": 2583 + }, + { + "epoch": 0.07, + "learning_rate": 1.9931286975493295e-06, + "loss": 1.0488, + "step": 2584 + }, + { + "epoch": 0.07, + "learning_rate": 1.993118979446008e-06, + "loss": 1.0127, + "step": 2585 + }, + { + "epoch": 0.07, + "learning_rate": 1.9931092544990967e-06, + "loss": 0.9746, + "step": 2586 + }, + { + "epoch": 0.07, + "learning_rate": 1.993099522708662e-06, + "loss": 0.9346, + "step": 2587 + }, + { + "epoch": 0.07, + "learning_rate": 1.993089784074771e-06, + "loss": 1.0518, + "step": 2588 + }, + { + "epoch": 0.07, + "learning_rate": 1.9930800385974905e-06, + "loss": 0.9082, + "step": 2589 + }, + { + "epoch": 0.07, + "learning_rate": 1.993070286276888e-06, + "loss": 0.874, + "step": 2590 + }, + { + "epoch": 0.07, + "learning_rate": 1.9930605271130307e-06, + "loss": 0.791, + "step": 2591 + }, + { + "epoch": 0.07, + "learning_rate": 1.993050761105986e-06, + "loss": 0.8486, + "step": 2592 + }, + { + "epoch": 0.07, + "learning_rate": 1.9930409882558207e-06, + "loss": 1.2598, + "step": 2593 + }, + { + "epoch": 0.07, + "learning_rate": 1.9930312085626026e-06, + "loss": 0.9111, + "step": 2594 + }, + { + "epoch": 0.07, + "learning_rate": 1.993021422026399e-06, + "loss": 0.6909, + "step": 2595 + }, + { + "epoch": 0.07, + "learning_rate": 1.9930116286472772e-06, + "loss": 0.9863, + "step": 2596 + }, + { + "epoch": 0.07, + "learning_rate": 1.9930018284253046e-06, + "loss": 0.9404, + "step": 2597 + }, + { + "epoch": 0.07, + "learning_rate": 1.9929920213605493e-06, + "loss": 0.9746, + "step": 2598 + }, + { + "epoch": 0.07, + "learning_rate": 1.992982207453078e-06, + "loss": 1.0322, + "step": 2599 + }, + { + "epoch": 0.07, + "learning_rate": 1.9929723867029592e-06, + "loss": 1.0596, + "step": 2600 + }, + { + "epoch": 0.07, + "learning_rate": 1.99296255911026e-06, + "loss": 1.0146, + "step": 2601 + }, + { + "epoch": 0.07, + "learning_rate": 1.9929527246750487e-06, + "loss": 0.9619, + "step": 2602 + }, + { + "epoch": 0.07, + "learning_rate": 1.992942883397392e-06, + "loss": 1.0068, + "step": 2603 + }, + { + "epoch": 0.07, + "learning_rate": 1.992933035277359e-06, + "loss": 1.0747, + "step": 2604 + }, + { + "epoch": 0.07, + "learning_rate": 1.992923180315017e-06, + "loss": 1.0303, + "step": 2605 + }, + { + "epoch": 0.07, + "learning_rate": 1.9929133185104333e-06, + "loss": 0.8574, + "step": 2606 + }, + { + "epoch": 0.07, + "learning_rate": 1.9929034498636764e-06, + "loss": 1.0771, + "step": 2607 + }, + { + "epoch": 0.07, + "learning_rate": 1.992893574374815e-06, + "loss": 1.0488, + "step": 2608 + }, + { + "epoch": 0.07, + "learning_rate": 1.992883692043916e-06, + "loss": 0.8262, + "step": 2609 + }, + { + "epoch": 0.07, + "learning_rate": 1.992873802871048e-06, + "loss": 0.8408, + "step": 2610 + }, + { + "epoch": 0.07, + "learning_rate": 1.9928639068562793e-06, + "loss": 0.9258, + "step": 2611 + }, + { + "epoch": 0.07, + "learning_rate": 1.9928540039996777e-06, + "loss": 0.6797, + "step": 2612 + }, + { + "epoch": 0.07, + "learning_rate": 1.992844094301312e-06, + "loss": 0.7793, + "step": 2613 + }, + { + "epoch": 0.07, + "learning_rate": 1.9928341777612497e-06, + "loss": 1.0381, + "step": 2614 + }, + { + "epoch": 0.07, + "learning_rate": 1.9928242543795596e-06, + "loss": 1.0342, + "step": 2615 + }, + { + "epoch": 0.07, + "learning_rate": 1.9928143241563103e-06, + "loss": 1.0, + "step": 2616 + }, + { + "epoch": 0.07, + "learning_rate": 1.99280438709157e-06, + "loss": 0.9092, + "step": 2617 + }, + { + "epoch": 0.07, + "learning_rate": 1.992794443185407e-06, + "loss": 0.9019, + "step": 2618 + }, + { + "epoch": 0.07, + "learning_rate": 1.99278449243789e-06, + "loss": 0.8799, + "step": 2619 + }, + { + "epoch": 0.07, + "learning_rate": 1.992774534849088e-06, + "loss": 0.998, + "step": 2620 + }, + { + "epoch": 0.07, + "learning_rate": 1.992764570419069e-06, + "loss": 1.001, + "step": 2621 + }, + { + "epoch": 0.07, + "learning_rate": 1.9927545991479016e-06, + "loss": 0.9893, + "step": 2622 + }, + { + "epoch": 0.07, + "learning_rate": 1.9927446210356546e-06, + "loss": 1.0596, + "step": 2623 + }, + { + "epoch": 0.07, + "learning_rate": 1.9927346360823975e-06, + "loss": 0.9316, + "step": 2624 + }, + { + "epoch": 0.07, + "learning_rate": 1.992724644288198e-06, + "loss": 1.0391, + "step": 2625 + }, + { + "epoch": 0.07, + "learning_rate": 1.9927146456531256e-06, + "loss": 0.752, + "step": 2626 + }, + { + "epoch": 0.07, + "learning_rate": 1.992704640177249e-06, + "loss": 0.9053, + "step": 2627 + }, + { + "epoch": 0.07, + "learning_rate": 1.9926946278606372e-06, + "loss": 0.8521, + "step": 2628 + }, + { + "epoch": 0.07, + "learning_rate": 1.9926846087033597e-06, + "loss": 0.5986, + "step": 2629 + }, + { + "epoch": 0.07, + "learning_rate": 1.9926745827054848e-06, + "loss": 0.8047, + "step": 2630 + }, + { + "epoch": 0.07, + "learning_rate": 1.992664549867082e-06, + "loss": 0.5306, + "step": 2631 + }, + { + "epoch": 0.07, + "learning_rate": 1.99265451018822e-06, + "loss": 0.918, + "step": 2632 + }, + { + "epoch": 0.07, + "learning_rate": 1.9926444636689682e-06, + "loss": 0.9893, + "step": 2633 + }, + { + "epoch": 0.07, + "learning_rate": 1.992634410309396e-06, + "loss": 1.1016, + "step": 2634 + }, + { + "epoch": 0.07, + "learning_rate": 1.992624350109573e-06, + "loss": 0.8965, + "step": 2635 + }, + { + "epoch": 0.07, + "learning_rate": 1.9926142830695677e-06, + "loss": 1.0635, + "step": 2636 + }, + { + "epoch": 0.07, + "learning_rate": 1.9926042091894496e-06, + "loss": 0.9795, + "step": 2637 + }, + { + "epoch": 0.07, + "learning_rate": 1.992594128469289e-06, + "loss": 0.9688, + "step": 2638 + }, + { + "epoch": 0.07, + "learning_rate": 1.9925840409091542e-06, + "loss": 0.9688, + "step": 2639 + }, + { + "epoch": 0.07, + "learning_rate": 1.9925739465091154e-06, + "loss": 0.5957, + "step": 2640 + }, + { + "epoch": 0.07, + "learning_rate": 1.9925638452692428e-06, + "loss": 1.0, + "step": 2641 + }, + { + "epoch": 0.07, + "learning_rate": 1.9925537371896045e-06, + "loss": 1.0049, + "step": 2642 + }, + { + "epoch": 0.07, + "learning_rate": 1.992543622270271e-06, + "loss": 0.9336, + "step": 2643 + }, + { + "epoch": 0.07, + "learning_rate": 1.992533500511312e-06, + "loss": 1.0234, + "step": 2644 + }, + { + "epoch": 0.07, + "learning_rate": 1.9925233719127967e-06, + "loss": 1.1602, + "step": 2645 + }, + { + "epoch": 0.07, + "learning_rate": 1.992513236474796e-06, + "loss": 1.0117, + "step": 2646 + }, + { + "epoch": 0.07, + "learning_rate": 1.992503094197379e-06, + "loss": 0.8652, + "step": 2647 + }, + { + "epoch": 0.07, + "learning_rate": 1.992492945080615e-06, + "loss": 0.8965, + "step": 2648 + }, + { + "epoch": 0.07, + "learning_rate": 1.992482789124576e-06, + "loss": 1.082, + "step": 2649 + }, + { + "epoch": 0.07, + "learning_rate": 1.9924726263293294e-06, + "loss": 0.8281, + "step": 2650 + }, + { + "epoch": 0.07, + "learning_rate": 1.9924624566949467e-06, + "loss": 1.0605, + "step": 2651 + }, + { + "epoch": 0.07, + "learning_rate": 1.992452280221498e-06, + "loss": 1.0293, + "step": 2652 + }, + { + "epoch": 0.07, + "learning_rate": 1.9924420969090527e-06, + "loss": 0.8633, + "step": 2653 + }, + { + "epoch": 0.07, + "learning_rate": 1.9924319067576817e-06, + "loss": 0.7598, + "step": 2654 + }, + { + "epoch": 0.07, + "learning_rate": 1.9924217097674547e-06, + "loss": 0.7446, + "step": 2655 + }, + { + "epoch": 0.07, + "learning_rate": 1.9924115059384425e-06, + "loss": 1.1201, + "step": 2656 + }, + { + "epoch": 0.07, + "learning_rate": 1.992401295270715e-06, + "loss": 0.8218, + "step": 2657 + }, + { + "epoch": 0.07, + "learning_rate": 1.9923910777643425e-06, + "loss": 0.7305, + "step": 2658 + }, + { + "epoch": 0.07, + "learning_rate": 1.9923808534193957e-06, + "loss": 0.8691, + "step": 2659 + }, + { + "epoch": 0.07, + "learning_rate": 1.992370622235945e-06, + "loss": 0.7676, + "step": 2660 + }, + { + "epoch": 0.07, + "learning_rate": 1.992360384214061e-06, + "loss": 1.0156, + "step": 2661 + }, + { + "epoch": 0.07, + "learning_rate": 1.992350139353814e-06, + "loss": 0.8999, + "step": 2662 + }, + { + "epoch": 0.07, + "learning_rate": 1.9923398876552748e-06, + "loss": 0.8232, + "step": 2663 + }, + { + "epoch": 0.07, + "learning_rate": 1.9923296291185132e-06, + "loss": 0.9248, + "step": 2664 + }, + { + "epoch": 0.07, + "learning_rate": 1.9923193637436013e-06, + "loss": 0.6572, + "step": 2665 + }, + { + "epoch": 0.07, + "learning_rate": 1.9923090915306094e-06, + "loss": 1.1377, + "step": 2666 + }, + { + "epoch": 0.07, + "learning_rate": 1.9922988124796077e-06, + "loss": 1.0811, + "step": 2667 + }, + { + "epoch": 0.07, + "learning_rate": 1.992288526590667e-06, + "loss": 0.8804, + "step": 2668 + }, + { + "epoch": 0.07, + "learning_rate": 1.9922782338638594e-06, + "loss": 0.9697, + "step": 2669 + }, + { + "epoch": 0.07, + "learning_rate": 1.9922679342992545e-06, + "loss": 1.001, + "step": 2670 + }, + { + "epoch": 0.07, + "learning_rate": 1.9922576278969237e-06, + "loss": 0.9785, + "step": 2671 + }, + { + "epoch": 0.07, + "learning_rate": 1.9922473146569385e-06, + "loss": 0.9932, + "step": 2672 + }, + { + "epoch": 0.07, + "learning_rate": 1.992236994579369e-06, + "loss": 1.1768, + "step": 2673 + }, + { + "epoch": 0.07, + "learning_rate": 1.9922266676642873e-06, + "loss": 0.7588, + "step": 2674 + }, + { + "epoch": 0.07, + "learning_rate": 1.992216333911764e-06, + "loss": 1.083, + "step": 2675 + }, + { + "epoch": 0.07, + "learning_rate": 1.9922059933218706e-06, + "loss": 0.6689, + "step": 2676 + }, + { + "epoch": 0.07, + "learning_rate": 1.992195645894678e-06, + "loss": 0.8896, + "step": 2677 + }, + { + "epoch": 0.07, + "learning_rate": 1.9921852916302576e-06, + "loss": 1.1504, + "step": 2678 + }, + { + "epoch": 0.07, + "learning_rate": 1.992174930528681e-06, + "loss": 0.9834, + "step": 2679 + }, + { + "epoch": 0.07, + "learning_rate": 1.9921645625900196e-06, + "loss": 0.8516, + "step": 2680 + }, + { + "epoch": 0.07, + "learning_rate": 1.9921541878143448e-06, + "loss": 0.6638, + "step": 2681 + }, + { + "epoch": 0.07, + "learning_rate": 1.992143806201728e-06, + "loss": 0.8564, + "step": 2682 + }, + { + "epoch": 0.07, + "learning_rate": 1.99213341775224e-06, + "loss": 0.8521, + "step": 2683 + }, + { + "epoch": 0.07, + "learning_rate": 1.992123022465954e-06, + "loss": 1.1074, + "step": 2684 + }, + { + "epoch": 0.07, + "learning_rate": 1.9921126203429403e-06, + "loss": 1.1094, + "step": 2685 + }, + { + "epoch": 0.07, + "learning_rate": 1.9921022113832714e-06, + "loss": 0.8513, + "step": 2686 + }, + { + "epoch": 0.07, + "learning_rate": 1.9920917955870183e-06, + "loss": 1.1465, + "step": 2687 + }, + { + "epoch": 0.07, + "learning_rate": 1.992081372954253e-06, + "loss": 0.8242, + "step": 2688 + }, + { + "epoch": 0.07, + "learning_rate": 1.9920709434850476e-06, + "loss": 1.1416, + "step": 2689 + }, + { + "epoch": 0.07, + "learning_rate": 1.9920605071794744e-06, + "loss": 1.2217, + "step": 2690 + }, + { + "epoch": 0.07, + "learning_rate": 1.992050064037604e-06, + "loss": 0.9141, + "step": 2691 + }, + { + "epoch": 0.07, + "learning_rate": 1.9920396140595096e-06, + "loss": 0.9512, + "step": 2692 + }, + { + "epoch": 0.07, + "learning_rate": 1.9920291572452626e-06, + "loss": 0.9072, + "step": 2693 + }, + { + "epoch": 0.07, + "learning_rate": 1.992018693594935e-06, + "loss": 1.0381, + "step": 2694 + }, + { + "epoch": 0.07, + "learning_rate": 1.9920082231085994e-06, + "loss": 0.8955, + "step": 2695 + }, + { + "epoch": 0.07, + "learning_rate": 1.9919977457863273e-06, + "loss": 0.8379, + "step": 2696 + }, + { + "epoch": 0.07, + "learning_rate": 1.9919872616281914e-06, + "loss": 0.7734, + "step": 2697 + }, + { + "epoch": 0.07, + "learning_rate": 1.9919767706342637e-06, + "loss": 0.7817, + "step": 2698 + }, + { + "epoch": 0.07, + "learning_rate": 1.9919662728046167e-06, + "loss": 0.8916, + "step": 2699 + }, + { + "epoch": 0.07, + "learning_rate": 1.9919557681393227e-06, + "loss": 1.1318, + "step": 2700 + }, + { + "epoch": 0.07, + "learning_rate": 1.991945256638454e-06, + "loss": 0.9844, + "step": 2701 + }, + { + "epoch": 0.07, + "learning_rate": 1.9919347383020824e-06, + "loss": 0.7778, + "step": 2702 + }, + { + "epoch": 0.07, + "learning_rate": 1.9919242131302817e-06, + "loss": 1.0879, + "step": 2703 + }, + { + "epoch": 0.07, + "learning_rate": 1.9919136811231238e-06, + "loss": 0.78, + "step": 2704 + }, + { + "epoch": 0.07, + "learning_rate": 1.991903142280681e-06, + "loss": 1.041, + "step": 2705 + }, + { + "epoch": 0.07, + "learning_rate": 1.9918925966030262e-06, + "loss": 0.8848, + "step": 2706 + }, + { + "epoch": 0.07, + "learning_rate": 1.9918820440902323e-06, + "loss": 0.9443, + "step": 2707 + }, + { + "epoch": 0.07, + "learning_rate": 1.9918714847423713e-06, + "loss": 0.9316, + "step": 2708 + }, + { + "epoch": 0.07, + "learning_rate": 1.9918609185595163e-06, + "loss": 1.0205, + "step": 2709 + }, + { + "epoch": 0.07, + "learning_rate": 1.991850345541741e-06, + "loss": 0.9854, + "step": 2710 + }, + { + "epoch": 0.07, + "learning_rate": 1.9918397656891166e-06, + "loss": 0.9766, + "step": 2711 + }, + { + "epoch": 0.07, + "learning_rate": 1.9918291790017176e-06, + "loss": 0.8838, + "step": 2712 + }, + { + "epoch": 0.07, + "learning_rate": 1.9918185854796156e-06, + "loss": 1.0967, + "step": 2713 + }, + { + "epoch": 0.07, + "learning_rate": 1.9918079851228848e-06, + "loss": 1.0889, + "step": 2714 + }, + { + "epoch": 0.07, + "learning_rate": 1.991797377931597e-06, + "loss": 1.0898, + "step": 2715 + }, + { + "epoch": 0.07, + "learning_rate": 1.9917867639058264e-06, + "loss": 0.9473, + "step": 2716 + }, + { + "epoch": 0.07, + "learning_rate": 1.991776143045646e-06, + "loss": 0.9785, + "step": 2717 + }, + { + "epoch": 0.07, + "learning_rate": 1.9917655153511283e-06, + "loss": 0.7195, + "step": 2718 + }, + { + "epoch": 0.07, + "learning_rate": 1.991754880822347e-06, + "loss": 0.9473, + "step": 2719 + }, + { + "epoch": 0.07, + "learning_rate": 1.9917442394593756e-06, + "loss": 1.1348, + "step": 2720 + }, + { + "epoch": 0.07, + "learning_rate": 1.9917335912622866e-06, + "loss": 1.1631, + "step": 2721 + }, + { + "epoch": 0.07, + "learning_rate": 1.9917229362311546e-06, + "loss": 0.8623, + "step": 2722 + }, + { + "epoch": 0.07, + "learning_rate": 1.991712274366052e-06, + "loss": 0.7261, + "step": 2723 + }, + { + "epoch": 0.07, + "learning_rate": 1.9917016056670526e-06, + "loss": 0.959, + "step": 2724 + }, + { + "epoch": 0.07, + "learning_rate": 1.9916909301342296e-06, + "loss": 0.8516, + "step": 2725 + }, + { + "epoch": 0.07, + "learning_rate": 1.9916802477676574e-06, + "loss": 0.9932, + "step": 2726 + }, + { + "epoch": 0.07, + "learning_rate": 1.991669558567409e-06, + "loss": 1.0205, + "step": 2727 + }, + { + "epoch": 0.07, + "learning_rate": 1.9916588625335583e-06, + "loss": 1.0449, + "step": 2728 + }, + { + "epoch": 0.07, + "learning_rate": 1.991648159666179e-06, + "loss": 1.0859, + "step": 2729 + }, + { + "epoch": 0.07, + "learning_rate": 1.9916374499653443e-06, + "loss": 0.8633, + "step": 2730 + }, + { + "epoch": 0.07, + "learning_rate": 1.9916267334311288e-06, + "loss": 1.0225, + "step": 2731 + }, + { + "epoch": 0.07, + "learning_rate": 1.991616010063606e-06, + "loss": 0.9414, + "step": 2732 + }, + { + "epoch": 0.07, + "learning_rate": 1.9916052798628495e-06, + "loss": 0.9434, + "step": 2733 + }, + { + "epoch": 0.07, + "learning_rate": 1.9915945428289336e-06, + "loss": 0.8975, + "step": 2734 + }, + { + "epoch": 0.07, + "learning_rate": 1.991583798961932e-06, + "loss": 1.0264, + "step": 2735 + }, + { + "epoch": 0.07, + "learning_rate": 1.9915730482619197e-06, + "loss": 0.8662, + "step": 2736 + }, + { + "epoch": 0.07, + "learning_rate": 1.991562290728969e-06, + "loss": 0.9883, + "step": 2737 + }, + { + "epoch": 0.07, + "learning_rate": 1.991551526363156e-06, + "loss": 0.9414, + "step": 2738 + }, + { + "epoch": 0.07, + "learning_rate": 1.9915407551645536e-06, + "loss": 1.0029, + "step": 2739 + }, + { + "epoch": 0.07, + "learning_rate": 1.9915299771332363e-06, + "loss": 0.9795, + "step": 2740 + }, + { + "epoch": 0.07, + "learning_rate": 1.9915191922692786e-06, + "loss": 0.8477, + "step": 2741 + }, + { + "epoch": 0.07, + "learning_rate": 1.9915084005727547e-06, + "loss": 0.96, + "step": 2742 + }, + { + "epoch": 0.07, + "learning_rate": 1.9914976020437386e-06, + "loss": 0.7598, + "step": 2743 + }, + { + "epoch": 0.07, + "learning_rate": 1.991486796682305e-06, + "loss": 0.9414, + "step": 2744 + }, + { + "epoch": 0.07, + "learning_rate": 1.991475984488529e-06, + "loss": 0.915, + "step": 2745 + }, + { + "epoch": 0.07, + "learning_rate": 1.991465165462484e-06, + "loss": 0.8906, + "step": 2746 + }, + { + "epoch": 0.07, + "learning_rate": 1.991454339604245e-06, + "loss": 1.1064, + "step": 2747 + }, + { + "epoch": 0.07, + "learning_rate": 1.9914435069138865e-06, + "loss": 1.04, + "step": 2748 + }, + { + "epoch": 0.07, + "learning_rate": 1.9914326673914835e-06, + "loss": 0.5889, + "step": 2749 + }, + { + "epoch": 0.07, + "learning_rate": 1.9914218210371106e-06, + "loss": 0.9678, + "step": 2750 + }, + { + "epoch": 0.07, + "learning_rate": 1.9914109678508427e-06, + "loss": 0.9775, + "step": 2751 + }, + { + "epoch": 0.07, + "learning_rate": 1.991400107832754e-06, + "loss": 0.8169, + "step": 2752 + }, + { + "epoch": 0.07, + "learning_rate": 1.9913892409829195e-06, + "loss": 1.0615, + "step": 2753 + }, + { + "epoch": 0.07, + "learning_rate": 1.9913783673014146e-06, + "loss": 1.1777, + "step": 2754 + }, + { + "epoch": 0.07, + "learning_rate": 1.9913674867883138e-06, + "loss": 0.9404, + "step": 2755 + }, + { + "epoch": 0.07, + "learning_rate": 1.991356599443692e-06, + "loss": 1.2021, + "step": 2756 + }, + { + "epoch": 0.07, + "learning_rate": 1.9913457052676247e-06, + "loss": 0.9014, + "step": 2757 + }, + { + "epoch": 0.07, + "learning_rate": 1.9913348042601864e-06, + "loss": 1.0156, + "step": 2758 + }, + { + "epoch": 0.07, + "learning_rate": 1.9913238964214524e-06, + "loss": 0.6641, + "step": 2759 + }, + { + "epoch": 0.07, + "learning_rate": 1.9913129817514985e-06, + "loss": 0.8047, + "step": 2760 + }, + { + "epoch": 0.07, + "learning_rate": 1.9913020602503988e-06, + "loss": 0.896, + "step": 2761 + }, + { + "epoch": 0.07, + "learning_rate": 1.9912911319182295e-06, + "loss": 0.9785, + "step": 2762 + }, + { + "epoch": 0.07, + "learning_rate": 1.991280196755065e-06, + "loss": 0.6899, + "step": 2763 + }, + { + "epoch": 0.07, + "learning_rate": 1.9912692547609816e-06, + "loss": 0.9307, + "step": 2764 + }, + { + "epoch": 0.07, + "learning_rate": 1.9912583059360537e-06, + "loss": 0.9072, + "step": 2765 + }, + { + "epoch": 0.07, + "learning_rate": 1.991247350280358e-06, + "loss": 1.1201, + "step": 2766 + }, + { + "epoch": 0.07, + "learning_rate": 1.991236387793969e-06, + "loss": 1.0303, + "step": 2767 + }, + { + "epoch": 0.07, + "learning_rate": 1.9912254184769627e-06, + "loss": 0.7358, + "step": 2768 + }, + { + "epoch": 0.07, + "learning_rate": 1.9912144423294147e-06, + "loss": 0.8237, + "step": 2769 + }, + { + "epoch": 0.07, + "learning_rate": 1.9912034593514e-06, + "loss": 0.9199, + "step": 2770 + }, + { + "epoch": 0.07, + "learning_rate": 1.9911924695429953e-06, + "loss": 0.7891, + "step": 2771 + }, + { + "epoch": 0.07, + "learning_rate": 1.9911814729042757e-06, + "loss": 1.0371, + "step": 2772 + }, + { + "epoch": 0.07, + "learning_rate": 1.9911704694353165e-06, + "loss": 0.709, + "step": 2773 + }, + { + "epoch": 0.07, + "learning_rate": 1.991159459136195e-06, + "loss": 1.1152, + "step": 2774 + }, + { + "epoch": 0.07, + "learning_rate": 1.9911484420069855e-06, + "loss": 0.8335, + "step": 2775 + }, + { + "epoch": 0.07, + "learning_rate": 1.991137418047765e-06, + "loss": 0.8057, + "step": 2776 + }, + { + "epoch": 0.07, + "learning_rate": 1.991126387258609e-06, + "loss": 0.9956, + "step": 2777 + }, + { + "epoch": 0.07, + "learning_rate": 1.9911153496395933e-06, + "loss": 0.8457, + "step": 2778 + }, + { + "epoch": 0.07, + "learning_rate": 1.9911043051907943e-06, + "loss": 0.7085, + "step": 2779 + }, + { + "epoch": 0.07, + "learning_rate": 1.9910932539122882e-06, + "loss": 1.1826, + "step": 2780 + }, + { + "epoch": 0.07, + "learning_rate": 1.9910821958041512e-06, + "loss": 1.2158, + "step": 2781 + }, + { + "epoch": 0.07, + "learning_rate": 1.9910711308664588e-06, + "loss": 0.8164, + "step": 2782 + }, + { + "epoch": 0.07, + "learning_rate": 1.9910600590992883e-06, + "loss": 0.9238, + "step": 2783 + }, + { + "epoch": 0.07, + "learning_rate": 1.991048980502715e-06, + "loss": 0.4988, + "step": 2784 + }, + { + "epoch": 0.07, + "learning_rate": 1.9910378950768157e-06, + "loss": 0.6453, + "step": 2785 + }, + { + "epoch": 0.07, + "learning_rate": 1.991026802821667e-06, + "loss": 1.002, + "step": 2786 + }, + { + "epoch": 0.07, + "learning_rate": 1.991015703737345e-06, + "loss": 1.0254, + "step": 2787 + }, + { + "epoch": 0.07, + "learning_rate": 1.9910045978239264e-06, + "loss": 0.8467, + "step": 2788 + }, + { + "epoch": 0.07, + "learning_rate": 1.9909934850814876e-06, + "loss": 0.7847, + "step": 2789 + }, + { + "epoch": 0.07, + "learning_rate": 1.9909823655101052e-06, + "loss": 0.9619, + "step": 2790 + }, + { + "epoch": 0.07, + "learning_rate": 1.990971239109856e-06, + "loss": 1.1201, + "step": 2791 + }, + { + "epoch": 0.07, + "learning_rate": 1.990960105880816e-06, + "loss": 1.1172, + "step": 2792 + }, + { + "epoch": 0.07, + "learning_rate": 1.990948965823063e-06, + "loss": 0.9219, + "step": 2793 + }, + { + "epoch": 0.07, + "learning_rate": 1.9909378189366728e-06, + "loss": 1.1133, + "step": 2794 + }, + { + "epoch": 0.07, + "learning_rate": 1.990926665221723e-06, + "loss": 0.7793, + "step": 2795 + }, + { + "epoch": 0.07, + "learning_rate": 1.9909155046782894e-06, + "loss": 0.9932, + "step": 2796 + }, + { + "epoch": 0.07, + "learning_rate": 1.9909043373064504e-06, + "loss": 0.8877, + "step": 2797 + }, + { + "epoch": 0.07, + "learning_rate": 1.9908931631062816e-06, + "loss": 0.9014, + "step": 2798 + }, + { + "epoch": 0.07, + "learning_rate": 1.9908819820778605e-06, + "loss": 0.9912, + "step": 2799 + }, + { + "epoch": 0.07, + "learning_rate": 1.9908707942212645e-06, + "loss": 1.1729, + "step": 2800 + }, + { + "epoch": 0.07, + "learning_rate": 1.99085959953657e-06, + "loss": 0.854, + "step": 2801 + }, + { + "epoch": 0.07, + "learning_rate": 1.9908483980238546e-06, + "loss": 1.1289, + "step": 2802 + }, + { + "epoch": 0.07, + "learning_rate": 1.9908371896831958e-06, + "loss": 1.0498, + "step": 2803 + }, + { + "epoch": 0.07, + "learning_rate": 1.99082597451467e-06, + "loss": 0.9443, + "step": 2804 + }, + { + "epoch": 0.07, + "learning_rate": 1.990814752518355e-06, + "loss": 0.9658, + "step": 2805 + }, + { + "epoch": 0.07, + "learning_rate": 1.990803523694328e-06, + "loss": 1.1309, + "step": 2806 + }, + { + "epoch": 0.07, + "learning_rate": 1.9907922880426668e-06, + "loss": 1.0303, + "step": 2807 + }, + { + "epoch": 0.07, + "learning_rate": 1.9907810455634482e-06, + "loss": 0.9609, + "step": 2808 + }, + { + "epoch": 0.07, + "learning_rate": 1.99076979625675e-06, + "loss": 1.0527, + "step": 2809 + }, + { + "epoch": 0.07, + "learning_rate": 1.9907585401226495e-06, + "loss": 0.8833, + "step": 2810 + }, + { + "epoch": 0.07, + "learning_rate": 1.9907472771612244e-06, + "loss": 0.8955, + "step": 2811 + }, + { + "epoch": 0.07, + "learning_rate": 1.9907360073725527e-06, + "loss": 1.0625, + "step": 2812 + }, + { + "epoch": 0.07, + "learning_rate": 1.9907247307567113e-06, + "loss": 1.1543, + "step": 2813 + }, + { + "epoch": 0.07, + "learning_rate": 1.9907134473137783e-06, + "loss": 1.0146, + "step": 2814 + }, + { + "epoch": 0.07, + "learning_rate": 1.9907021570438318e-06, + "loss": 0.8799, + "step": 2815 + }, + { + "epoch": 0.07, + "learning_rate": 1.9906908599469488e-06, + "loss": 1.0352, + "step": 2816 + }, + { + "epoch": 0.07, + "learning_rate": 1.990679556023208e-06, + "loss": 0.9443, + "step": 2817 + }, + { + "epoch": 0.07, + "learning_rate": 1.9906682452726868e-06, + "loss": 1.0381, + "step": 2818 + }, + { + "epoch": 0.07, + "learning_rate": 1.990656927695463e-06, + "loss": 0.9854, + "step": 2819 + }, + { + "epoch": 0.07, + "learning_rate": 1.9906456032916152e-06, + "loss": 0.9873, + "step": 2820 + }, + { + "epoch": 0.07, + "learning_rate": 1.9906342720612204e-06, + "loss": 0.958, + "step": 2821 + }, + { + "epoch": 0.07, + "learning_rate": 1.990622934004358e-06, + "loss": 1.0127, + "step": 2822 + }, + { + "epoch": 0.07, + "learning_rate": 1.9906115891211054e-06, + "loss": 1.1191, + "step": 2823 + }, + { + "epoch": 0.07, + "learning_rate": 1.9906002374115407e-06, + "loss": 0.9043, + "step": 2824 + }, + { + "epoch": 0.07, + "learning_rate": 1.9905888788757424e-06, + "loss": 0.9941, + "step": 2825 + }, + { + "epoch": 0.07, + "learning_rate": 1.9905775135137887e-06, + "loss": 1.0859, + "step": 2826 + }, + { + "epoch": 0.07, + "learning_rate": 1.9905661413257574e-06, + "loss": 0.6499, + "step": 2827 + }, + { + "epoch": 0.07, + "learning_rate": 1.9905547623117277e-06, + "loss": 1.0049, + "step": 2828 + }, + { + "epoch": 0.07, + "learning_rate": 1.990543376471778e-06, + "loss": 1.1191, + "step": 2829 + }, + { + "epoch": 0.07, + "learning_rate": 1.9905319838059856e-06, + "loss": 1.0547, + "step": 2830 + }, + { + "epoch": 0.07, + "learning_rate": 1.9905205843144304e-06, + "loss": 1.2803, + "step": 2831 + }, + { + "epoch": 0.07, + "learning_rate": 1.9905091779971903e-06, + "loss": 0.9375, + "step": 2832 + }, + { + "epoch": 0.07, + "learning_rate": 1.990497764854344e-06, + "loss": 0.8008, + "step": 2833 + }, + { + "epoch": 0.07, + "learning_rate": 1.99048634488597e-06, + "loss": 1.1465, + "step": 2834 + }, + { + "epoch": 0.07, + "learning_rate": 1.990474918092147e-06, + "loss": 1.0498, + "step": 2835 + }, + { + "epoch": 0.07, + "learning_rate": 1.9904634844729543e-06, + "loss": 0.7744, + "step": 2836 + }, + { + "epoch": 0.07, + "learning_rate": 1.99045204402847e-06, + "loss": 0.8257, + "step": 2837 + }, + { + "epoch": 0.07, + "learning_rate": 1.990440596758773e-06, + "loss": 1.0859, + "step": 2838 + }, + { + "epoch": 0.07, + "learning_rate": 1.990429142663942e-06, + "loss": 0.895, + "step": 2839 + }, + { + "epoch": 0.07, + "learning_rate": 1.990417681744057e-06, + "loss": 0.9785, + "step": 2840 + }, + { + "epoch": 0.07, + "learning_rate": 1.990406213999196e-06, + "loss": 1.0342, + "step": 2841 + }, + { + "epoch": 0.07, + "learning_rate": 1.9903947394294386e-06, + "loss": 0.9424, + "step": 2842 + }, + { + "epoch": 0.07, + "learning_rate": 1.990383258034863e-06, + "loss": 0.917, + "step": 2843 + }, + { + "epoch": 0.07, + "learning_rate": 1.9903717698155496e-06, + "loss": 0.8408, + "step": 2844 + }, + { + "epoch": 0.07, + "learning_rate": 1.9903602747715764e-06, + "loss": 1.0234, + "step": 2845 + }, + { + "epoch": 0.07, + "learning_rate": 1.9903487729030232e-06, + "loss": 0.9824, + "step": 2846 + }, + { + "epoch": 0.07, + "learning_rate": 1.9903372642099688e-06, + "loss": 1.1123, + "step": 2847 + }, + { + "epoch": 0.07, + "learning_rate": 1.990325748692493e-06, + "loss": 0.8975, + "step": 2848 + }, + { + "epoch": 0.07, + "learning_rate": 1.9903142263506754e-06, + "loss": 0.9746, + "step": 2849 + }, + { + "epoch": 0.07, + "learning_rate": 1.9903026971845945e-06, + "loss": 0.7715, + "step": 2850 + }, + { + "epoch": 0.07, + "learning_rate": 1.9902911611943304e-06, + "loss": 1.1191, + "step": 2851 + }, + { + "epoch": 0.07, + "learning_rate": 1.9902796183799622e-06, + "loss": 0.6689, + "step": 2852 + }, + { + "epoch": 0.07, + "learning_rate": 1.99026806874157e-06, + "loss": 0.9463, + "step": 2853 + }, + { + "epoch": 0.07, + "learning_rate": 1.9902565122792333e-06, + "loss": 0.9277, + "step": 2854 + }, + { + "epoch": 0.07, + "learning_rate": 1.990244948993031e-06, + "loss": 0.9512, + "step": 2855 + }, + { + "epoch": 0.07, + "learning_rate": 1.9902333788830435e-06, + "loss": 1.0078, + "step": 2856 + }, + { + "epoch": 0.07, + "learning_rate": 1.99022180194935e-06, + "loss": 1.0889, + "step": 2857 + }, + { + "epoch": 0.07, + "learning_rate": 1.990210218192031e-06, + "loss": 0.9307, + "step": 2858 + }, + { + "epoch": 0.07, + "learning_rate": 1.9901986276111654e-06, + "loss": 1.0117, + "step": 2859 + }, + { + "epoch": 0.07, + "learning_rate": 1.990187030206834e-06, + "loss": 1.0576, + "step": 2860 + }, + { + "epoch": 0.07, + "learning_rate": 1.9901754259791164e-06, + "loss": 0.8926, + "step": 2861 + }, + { + "epoch": 0.07, + "learning_rate": 1.990163814928092e-06, + "loss": 1.0303, + "step": 2862 + }, + { + "epoch": 0.07, + "learning_rate": 1.990152197053842e-06, + "loss": 0.8892, + "step": 2863 + }, + { + "epoch": 0.07, + "learning_rate": 1.990140572356445e-06, + "loss": 0.9297, + "step": 2864 + }, + { + "epoch": 0.07, + "learning_rate": 1.990128940835982e-06, + "loss": 1.0732, + "step": 2865 + }, + { + "epoch": 0.07, + "learning_rate": 1.9901173024925332e-06, + "loss": 0.8799, + "step": 2866 + }, + { + "epoch": 0.07, + "learning_rate": 1.9901056573261787e-06, + "loss": 1.0234, + "step": 2867 + }, + { + "epoch": 0.07, + "learning_rate": 1.990094005336998e-06, + "loss": 1.0488, + "step": 2868 + }, + { + "epoch": 0.07, + "learning_rate": 1.9900823465250727e-06, + "loss": 0.9658, + "step": 2869 + }, + { + "epoch": 0.07, + "learning_rate": 1.990070680890482e-06, + "loss": 0.8081, + "step": 2870 + }, + { + "epoch": 0.07, + "learning_rate": 1.990059008433307e-06, + "loss": 0.8076, + "step": 2871 + }, + { + "epoch": 0.07, + "learning_rate": 1.990047329153628e-06, + "loss": 0.8071, + "step": 2872 + }, + { + "epoch": 0.07, + "learning_rate": 1.9900356430515252e-06, + "loss": 0.9336, + "step": 2873 + }, + { + "epoch": 0.07, + "learning_rate": 1.9900239501270794e-06, + "loss": 1.0605, + "step": 2874 + }, + { + "epoch": 0.07, + "learning_rate": 1.9900122503803705e-06, + "loss": 0.9482, + "step": 2875 + }, + { + "epoch": 0.07, + "learning_rate": 1.9900005438114804e-06, + "loss": 0.9102, + "step": 2876 + }, + { + "epoch": 0.07, + "learning_rate": 1.989988830420489e-06, + "loss": 0.8223, + "step": 2877 + }, + { + "epoch": 0.07, + "learning_rate": 1.989977110207477e-06, + "loss": 1.0254, + "step": 2878 + }, + { + "epoch": 0.07, + "learning_rate": 1.9899653831725253e-06, + "loss": 0.7896, + "step": 2879 + }, + { + "epoch": 0.07, + "learning_rate": 1.9899536493157145e-06, + "loss": 1.1357, + "step": 2880 + }, + { + "epoch": 0.07, + "learning_rate": 1.9899419086371257e-06, + "loss": 1.0254, + "step": 2881 + }, + { + "epoch": 0.07, + "learning_rate": 1.98993016113684e-06, + "loss": 1.0957, + "step": 2882 + }, + { + "epoch": 0.07, + "learning_rate": 1.989918406814938e-06, + "loss": 0.7412, + "step": 2883 + }, + { + "epoch": 0.07, + "learning_rate": 1.9899066456715003e-06, + "loss": 1.082, + "step": 2884 + }, + { + "epoch": 0.07, + "learning_rate": 1.9898948777066086e-06, + "loss": 0.8096, + "step": 2885 + }, + { + "epoch": 0.07, + "learning_rate": 1.989883102920344e-06, + "loss": 0.832, + "step": 2886 + }, + { + "epoch": 0.07, + "learning_rate": 1.9898713213127875e-06, + "loss": 0.9775, + "step": 2887 + }, + { + "epoch": 0.07, + "learning_rate": 1.9898595328840203e-06, + "loss": 1.0264, + "step": 2888 + }, + { + "epoch": 0.07, + "learning_rate": 1.9898477376341234e-06, + "loss": 0.9502, + "step": 2889 + }, + { + "epoch": 0.07, + "learning_rate": 1.9898359355631782e-06, + "loss": 0.9912, + "step": 2890 + }, + { + "epoch": 0.07, + "learning_rate": 1.9898241266712665e-06, + "loss": 1.0322, + "step": 2891 + }, + { + "epoch": 0.07, + "learning_rate": 1.989812310958469e-06, + "loss": 1.0068, + "step": 2892 + }, + { + "epoch": 0.07, + "learning_rate": 1.989800488424867e-06, + "loss": 0.875, + "step": 2893 + }, + { + "epoch": 0.07, + "learning_rate": 1.9897886590705426e-06, + "loss": 0.7861, + "step": 2894 + }, + { + "epoch": 0.07, + "learning_rate": 1.9897768228955772e-06, + "loss": 0.9414, + "step": 2895 + }, + { + "epoch": 0.07, + "learning_rate": 1.9897649799000527e-06, + "loss": 1.3027, + "step": 2896 + }, + { + "epoch": 0.07, + "learning_rate": 1.9897531300840494e-06, + "loss": 1.0273, + "step": 2897 + }, + { + "epoch": 0.07, + "learning_rate": 1.9897412734476504e-06, + "loss": 0.9131, + "step": 2898 + }, + { + "epoch": 0.07, + "learning_rate": 1.9897294099909367e-06, + "loss": 0.9678, + "step": 2899 + }, + { + "epoch": 0.07, + "learning_rate": 1.98971753971399e-06, + "loss": 1.0059, + "step": 2900 + }, + { + "epoch": 0.07, + "learning_rate": 1.989705662616892e-06, + "loss": 0.998, + "step": 2901 + }, + { + "epoch": 0.07, + "learning_rate": 1.9896937786997253e-06, + "loss": 0.9189, + "step": 2902 + }, + { + "epoch": 0.07, + "learning_rate": 1.989681887962571e-06, + "loss": 0.7532, + "step": 2903 + }, + { + "epoch": 0.07, + "learning_rate": 1.9896699904055115e-06, + "loss": 1.0059, + "step": 2904 + }, + { + "epoch": 0.07, + "learning_rate": 1.989658086028629e-06, + "loss": 0.9658, + "step": 2905 + }, + { + "epoch": 0.07, + "learning_rate": 1.9896461748320044e-06, + "loss": 0.71, + "step": 2906 + }, + { + "epoch": 0.07, + "learning_rate": 1.989634256815721e-06, + "loss": 0.9922, + "step": 2907 + }, + { + "epoch": 0.07, + "learning_rate": 1.98962233197986e-06, + "loss": 0.9512, + "step": 2908 + }, + { + "epoch": 0.07, + "learning_rate": 1.9896104003245043e-06, + "loss": 1.0264, + "step": 2909 + }, + { + "epoch": 0.07, + "learning_rate": 1.989598461849736e-06, + "loss": 1.1621, + "step": 2910 + }, + { + "epoch": 0.07, + "learning_rate": 1.9895865165556373e-06, + "loss": 1.0566, + "step": 2911 + }, + { + "epoch": 0.07, + "learning_rate": 1.98957456444229e-06, + "loss": 1.0469, + "step": 2912 + }, + { + "epoch": 0.07, + "learning_rate": 1.989562605509777e-06, + "loss": 0.875, + "step": 2913 + }, + { + "epoch": 0.07, + "learning_rate": 1.989550639758181e-06, + "loss": 0.96, + "step": 2914 + }, + { + "epoch": 0.07, + "learning_rate": 1.989538667187584e-06, + "loss": 0.9727, + "step": 2915 + }, + { + "epoch": 0.07, + "learning_rate": 1.989526687798068e-06, + "loss": 1.0088, + "step": 2916 + }, + { + "epoch": 0.07, + "learning_rate": 1.989514701589717e-06, + "loss": 0.8945, + "step": 2917 + }, + { + "epoch": 0.07, + "learning_rate": 1.9895027085626123e-06, + "loss": 1.0049, + "step": 2918 + }, + { + "epoch": 0.07, + "learning_rate": 1.9894907087168367e-06, + "loss": 1.0801, + "step": 2919 + }, + { + "epoch": 0.07, + "learning_rate": 1.9894787020524735e-06, + "loss": 1.1777, + "step": 2920 + }, + { + "epoch": 0.07, + "learning_rate": 1.989466688569605e-06, + "loss": 0.957, + "step": 2921 + }, + { + "epoch": 0.07, + "learning_rate": 1.989454668268314e-06, + "loss": 1.0713, + "step": 2922 + }, + { + "epoch": 0.07, + "learning_rate": 1.9894426411486835e-06, + "loss": 0.8789, + "step": 2923 + }, + { + "epoch": 0.07, + "learning_rate": 1.989430607210796e-06, + "loss": 1.0752, + "step": 2924 + }, + { + "epoch": 0.07, + "learning_rate": 1.989418566454735e-06, + "loss": 0.7412, + "step": 2925 + }, + { + "epoch": 0.07, + "learning_rate": 1.989406518880583e-06, + "loss": 1.0684, + "step": 2926 + }, + { + "epoch": 0.08, + "learning_rate": 1.9893944644884235e-06, + "loss": 0.9238, + "step": 2927 + }, + { + "epoch": 0.08, + "learning_rate": 1.989382403278339e-06, + "loss": 0.8013, + "step": 2928 + }, + { + "epoch": 0.08, + "learning_rate": 1.989370335250413e-06, + "loss": 0.9658, + "step": 2929 + }, + { + "epoch": 0.08, + "learning_rate": 1.9893582604047286e-06, + "loss": 0.8472, + "step": 2930 + }, + { + "epoch": 0.08, + "learning_rate": 1.9893461787413687e-06, + "loss": 0.7554, + "step": 2931 + }, + { + "epoch": 0.08, + "learning_rate": 1.989334090260417e-06, + "loss": 1.1611, + "step": 2932 + }, + { + "epoch": 0.08, + "learning_rate": 1.989321994961957e-06, + "loss": 0.8945, + "step": 2933 + }, + { + "epoch": 0.08, + "learning_rate": 1.9893098928460708e-06, + "loss": 1.0947, + "step": 2934 + }, + { + "epoch": 0.08, + "learning_rate": 1.989297783912843e-06, + "loss": 1.2236, + "step": 2935 + }, + { + "epoch": 0.08, + "learning_rate": 1.989285668162357e-06, + "loss": 0.9844, + "step": 2936 + }, + { + "epoch": 0.08, + "learning_rate": 1.9892735455946957e-06, + "loss": 1.002, + "step": 2937 + }, + { + "epoch": 0.08, + "learning_rate": 1.989261416209943e-06, + "loss": 0.8232, + "step": 2938 + }, + { + "epoch": 0.08, + "learning_rate": 1.9892492800081823e-06, + "loss": 0.9883, + "step": 2939 + }, + { + "epoch": 0.08, + "learning_rate": 1.9892371369894975e-06, + "loss": 1.0098, + "step": 2940 + }, + { + "epoch": 0.08, + "learning_rate": 1.9892249871539724e-06, + "loss": 0.8428, + "step": 2941 + }, + { + "epoch": 0.08, + "learning_rate": 1.98921283050169e-06, + "loss": 0.9111, + "step": 2942 + }, + { + "epoch": 0.08, + "learning_rate": 1.989200667032735e-06, + "loss": 0.9883, + "step": 2943 + }, + { + "epoch": 0.08, + "learning_rate": 1.98918849674719e-06, + "loss": 1.127, + "step": 2944 + }, + { + "epoch": 0.08, + "learning_rate": 1.98917631964514e-06, + "loss": 1.0273, + "step": 2945 + }, + { + "epoch": 0.08, + "learning_rate": 1.9891641357266683e-06, + "loss": 0.8584, + "step": 2946 + }, + { + "epoch": 0.08, + "learning_rate": 1.9891519449918596e-06, + "loss": 1.292, + "step": 2947 + }, + { + "epoch": 0.08, + "learning_rate": 1.989139747440797e-06, + "loss": 0.8364, + "step": 2948 + }, + { + "epoch": 0.08, + "learning_rate": 1.9891275430735646e-06, + "loss": 0.959, + "step": 2949 + }, + { + "epoch": 0.08, + "learning_rate": 1.9891153318902473e-06, + "loss": 1.0781, + "step": 2950 + }, + { + "epoch": 0.08, + "learning_rate": 1.9891031138909286e-06, + "loss": 1.0342, + "step": 2951 + }, + { + "epoch": 0.08, + "learning_rate": 1.989090889075693e-06, + "loss": 0.9619, + "step": 2952 + }, + { + "epoch": 0.08, + "learning_rate": 1.9890786574446247e-06, + "loss": 0.9316, + "step": 2953 + }, + { + "epoch": 0.08, + "learning_rate": 1.9890664189978074e-06, + "loss": 1.0361, + "step": 2954 + }, + { + "epoch": 0.08, + "learning_rate": 1.9890541737353265e-06, + "loss": 0.8838, + "step": 2955 + }, + { + "epoch": 0.08, + "learning_rate": 1.9890419216572652e-06, + "loss": 0.8984, + "step": 2956 + }, + { + "epoch": 0.08, + "learning_rate": 1.9890296627637092e-06, + "loss": 1.1406, + "step": 2957 + }, + { + "epoch": 0.08, + "learning_rate": 1.989017397054742e-06, + "loss": 0.8945, + "step": 2958 + }, + { + "epoch": 0.08, + "learning_rate": 1.9890051245304488e-06, + "loss": 0.7891, + "step": 2959 + }, + { + "epoch": 0.08, + "learning_rate": 1.9889928451909133e-06, + "loss": 0.9941, + "step": 2960 + }, + { + "epoch": 0.08, + "learning_rate": 1.9889805590362206e-06, + "loss": 0.9668, + "step": 2961 + }, + { + "epoch": 0.08, + "learning_rate": 1.988968266066456e-06, + "loss": 0.7515, + "step": 2962 + }, + { + "epoch": 0.08, + "learning_rate": 1.988955966281703e-06, + "loss": 0.9365, + "step": 2963 + }, + { + "epoch": 0.08, + "learning_rate": 1.9889436596820472e-06, + "loss": 0.8535, + "step": 2964 + }, + { + "epoch": 0.08, + "learning_rate": 1.988931346267573e-06, + "loss": 0.9922, + "step": 2965 + }, + { + "epoch": 0.08, + "learning_rate": 1.988919026038366e-06, + "loss": 0.96, + "step": 2966 + }, + { + "epoch": 0.08, + "learning_rate": 1.98890669899451e-06, + "loss": 0.7402, + "step": 2967 + }, + { + "epoch": 0.08, + "learning_rate": 1.9888943651360906e-06, + "loss": 0.8906, + "step": 2968 + }, + { + "epoch": 0.08, + "learning_rate": 1.9888820244631925e-06, + "loss": 0.8296, + "step": 2969 + }, + { + "epoch": 0.08, + "learning_rate": 1.9888696769759012e-06, + "loss": 0.6973, + "step": 2970 + }, + { + "epoch": 0.08, + "learning_rate": 1.9888573226743014e-06, + "loss": 1.0098, + "step": 2971 + }, + { + "epoch": 0.08, + "learning_rate": 1.9888449615584783e-06, + "loss": 0.7231, + "step": 2972 + }, + { + "epoch": 0.08, + "learning_rate": 1.988832593628517e-06, + "loss": 0.9717, + "step": 2973 + }, + { + "epoch": 0.08, + "learning_rate": 1.988820218884503e-06, + "loss": 0.875, + "step": 2974 + }, + { + "epoch": 0.08, + "learning_rate": 1.9888078373265213e-06, + "loss": 1.04, + "step": 2975 + }, + { + "epoch": 0.08, + "learning_rate": 1.9887954489546573e-06, + "loss": 0.9883, + "step": 2976 + }, + { + "epoch": 0.08, + "learning_rate": 1.9887830537689964e-06, + "loss": 0.8262, + "step": 2977 + }, + { + "epoch": 0.08, + "learning_rate": 1.9887706517696237e-06, + "loss": 0.9004, + "step": 2978 + }, + { + "epoch": 0.08, + "learning_rate": 1.9887582429566257e-06, + "loss": 0.9844, + "step": 2979 + }, + { + "epoch": 0.08, + "learning_rate": 1.9887458273300866e-06, + "loss": 0.8457, + "step": 2980 + }, + { + "epoch": 0.08, + "learning_rate": 1.988733404890093e-06, + "loss": 0.8315, + "step": 2981 + }, + { + "epoch": 0.08, + "learning_rate": 1.9887209756367296e-06, + "loss": 0.7615, + "step": 2982 + }, + { + "epoch": 0.08, + "learning_rate": 1.9887085395700823e-06, + "loss": 0.9316, + "step": 2983 + }, + { + "epoch": 0.08, + "learning_rate": 1.9886960966902373e-06, + "loss": 0.7651, + "step": 2984 + }, + { + "epoch": 0.08, + "learning_rate": 1.98868364699728e-06, + "loss": 0.75, + "step": 2985 + }, + { + "epoch": 0.08, + "learning_rate": 1.9886711904912965e-06, + "loss": 1.1426, + "step": 2986 + }, + { + "epoch": 0.08, + "learning_rate": 1.988658727172372e-06, + "loss": 0.9058, + "step": 2987 + }, + { + "epoch": 0.08, + "learning_rate": 1.9886462570405927e-06, + "loss": 1.042, + "step": 2988 + }, + { + "epoch": 0.08, + "learning_rate": 1.9886337800960447e-06, + "loss": 0.9932, + "step": 2989 + }, + { + "epoch": 0.08, + "learning_rate": 1.988621296338814e-06, + "loss": 1.1201, + "step": 2990 + }, + { + "epoch": 0.08, + "learning_rate": 1.9886088057689865e-06, + "loss": 0.9629, + "step": 2991 + }, + { + "epoch": 0.08, + "learning_rate": 1.9885963083866477e-06, + "loss": 0.9619, + "step": 2992 + }, + { + "epoch": 0.08, + "learning_rate": 1.988583804191885e-06, + "loss": 1.0273, + "step": 2993 + }, + { + "epoch": 0.08, + "learning_rate": 1.988571293184784e-06, + "loss": 1.0088, + "step": 2994 + }, + { + "epoch": 0.08, + "learning_rate": 1.98855877536543e-06, + "loss": 0.8584, + "step": 2995 + }, + { + "epoch": 0.08, + "learning_rate": 1.98854625073391e-06, + "loss": 1.0186, + "step": 2996 + }, + { + "epoch": 0.08, + "learning_rate": 1.9885337192903105e-06, + "loss": 0.9092, + "step": 2997 + }, + { + "epoch": 0.08, + "learning_rate": 1.9885211810347184e-06, + "loss": 0.9131, + "step": 2998 + }, + { + "epoch": 0.08, + "learning_rate": 1.9885086359672182e-06, + "loss": 0.9131, + "step": 2999 + }, + { + "epoch": 0.08, + "learning_rate": 1.988496084087898e-06, + "loss": 0.918, + "step": 3000 + }, + { + "epoch": 0.08, + "learning_rate": 1.988483525396844e-06, + "loss": 0.7183, + "step": 3001 + }, + { + "epoch": 0.08, + "learning_rate": 1.9884709598941427e-06, + "loss": 1.1016, + "step": 3002 + }, + { + "epoch": 0.08, + "learning_rate": 1.98845838757988e-06, + "loss": 0.9834, + "step": 3003 + }, + { + "epoch": 0.08, + "learning_rate": 1.9884458084541435e-06, + "loss": 1.0723, + "step": 3004 + }, + { + "epoch": 0.08, + "learning_rate": 1.9884332225170195e-06, + "loss": 0.832, + "step": 3005 + }, + { + "epoch": 0.08, + "learning_rate": 1.988420629768595e-06, + "loss": 1.1221, + "step": 3006 + }, + { + "epoch": 0.08, + "learning_rate": 1.9884080302089554e-06, + "loss": 1.0078, + "step": 3007 + }, + { + "epoch": 0.08, + "learning_rate": 1.9883954238381894e-06, + "loss": 1.084, + "step": 3008 + }, + { + "epoch": 0.08, + "learning_rate": 1.9883828106563828e-06, + "loss": 0.9556, + "step": 3009 + }, + { + "epoch": 0.08, + "learning_rate": 1.988370190663623e-06, + "loss": 1.2598, + "step": 3010 + }, + { + "epoch": 0.08, + "learning_rate": 1.9883575638599966e-06, + "loss": 0.8438, + "step": 3011 + }, + { + "epoch": 0.08, + "learning_rate": 1.9883449302455907e-06, + "loss": 1.0752, + "step": 3012 + }, + { + "epoch": 0.08, + "learning_rate": 1.9883322898204927e-06, + "loss": 1.0166, + "step": 3013 + }, + { + "epoch": 0.08, + "learning_rate": 1.988319642584789e-06, + "loss": 0.7588, + "step": 3014 + }, + { + "epoch": 0.08, + "learning_rate": 1.9883069885385673e-06, + "loss": 1.0791, + "step": 3015 + }, + { + "epoch": 0.08, + "learning_rate": 1.9882943276819153e-06, + "loss": 0.7661, + "step": 3016 + }, + { + "epoch": 0.08, + "learning_rate": 1.988281660014919e-06, + "loss": 1.168, + "step": 3017 + }, + { + "epoch": 0.08, + "learning_rate": 1.988268985537666e-06, + "loss": 0.9922, + "step": 3018 + }, + { + "epoch": 0.08, + "learning_rate": 1.988256304250245e-06, + "loss": 0.7769, + "step": 3019 + }, + { + "epoch": 0.08, + "learning_rate": 1.9882436161527413e-06, + "loss": 1.0811, + "step": 3020 + }, + { + "epoch": 0.08, + "learning_rate": 1.9882309212452437e-06, + "loss": 1.0225, + "step": 3021 + }, + { + "epoch": 0.08, + "learning_rate": 1.9882182195278396e-06, + "loss": 0.8896, + "step": 3022 + }, + { + "epoch": 0.08, + "learning_rate": 1.9882055110006163e-06, + "loss": 1.1553, + "step": 3023 + }, + { + "epoch": 0.08, + "learning_rate": 1.988192795663661e-06, + "loss": 0.8662, + "step": 3024 + }, + { + "epoch": 0.08, + "learning_rate": 1.988180073517062e-06, + "loss": 0.9863, + "step": 3025 + }, + { + "epoch": 0.08, + "learning_rate": 1.9881673445609065e-06, + "loss": 0.9277, + "step": 3026 + }, + { + "epoch": 0.08, + "learning_rate": 1.988154608795282e-06, + "loss": 0.9092, + "step": 3027 + }, + { + "epoch": 0.08, + "learning_rate": 1.9881418662202774e-06, + "loss": 0.9365, + "step": 3028 + }, + { + "epoch": 0.08, + "learning_rate": 1.9881291168359794e-06, + "loss": 1.1035, + "step": 3029 + }, + { + "epoch": 0.08, + "learning_rate": 1.988116360642476e-06, + "loss": 1.2432, + "step": 3030 + }, + { + "epoch": 0.08, + "learning_rate": 1.9881035976398554e-06, + "loss": 1.0527, + "step": 3031 + }, + { + "epoch": 0.08, + "learning_rate": 1.9880908278282055e-06, + "loss": 1.0098, + "step": 3032 + }, + { + "epoch": 0.08, + "learning_rate": 1.9880780512076143e-06, + "loss": 0.9434, + "step": 3033 + }, + { + "epoch": 0.08, + "learning_rate": 1.9880652677781696e-06, + "loss": 0.9805, + "step": 3034 + }, + { + "epoch": 0.08, + "learning_rate": 1.9880524775399597e-06, + "loss": 1.0381, + "step": 3035 + }, + { + "epoch": 0.08, + "learning_rate": 1.988039680493073e-06, + "loss": 1.0117, + "step": 3036 + }, + { + "epoch": 0.08, + "learning_rate": 1.9880268766375972e-06, + "loss": 1.0732, + "step": 3037 + }, + { + "epoch": 0.08, + "learning_rate": 1.9880140659736207e-06, + "loss": 0.9932, + "step": 3038 + }, + { + "epoch": 0.08, + "learning_rate": 1.988001248501232e-06, + "loss": 0.5859, + "step": 3039 + }, + { + "epoch": 0.08, + "learning_rate": 1.987988424220519e-06, + "loss": 0.9404, + "step": 3040 + }, + { + "epoch": 0.08, + "learning_rate": 1.98797559313157e-06, + "loss": 0.8506, + "step": 3041 + }, + { + "epoch": 0.08, + "learning_rate": 1.9879627552344743e-06, + "loss": 0.9756, + "step": 3042 + }, + { + "epoch": 0.08, + "learning_rate": 1.9879499105293194e-06, + "loss": 1.0381, + "step": 3043 + }, + { + "epoch": 0.08, + "learning_rate": 1.9879370590161948e-06, + "loss": 0.8311, + "step": 3044 + }, + { + "epoch": 0.08, + "learning_rate": 1.987924200695188e-06, + "loss": 0.958, + "step": 3045 + }, + { + "epoch": 0.08, + "learning_rate": 1.987911335566388e-06, + "loss": 0.7563, + "step": 3046 + }, + { + "epoch": 0.08, + "learning_rate": 1.987898463629884e-06, + "loss": 1.0742, + "step": 3047 + }, + { + "epoch": 0.08, + "learning_rate": 1.987885584885764e-06, + "loss": 0.7568, + "step": 3048 + }, + { + "epoch": 0.08, + "learning_rate": 1.987872699334116e-06, + "loss": 0.8818, + "step": 3049 + }, + { + "epoch": 0.08, + "learning_rate": 1.987859806975031e-06, + "loss": 0.917, + "step": 3050 + }, + { + "epoch": 0.08, + "learning_rate": 1.987846907808596e-06, + "loss": 0.8032, + "step": 3051 + }, + { + "epoch": 0.08, + "learning_rate": 1.9878340018349007e-06, + "loss": 1.2471, + "step": 3052 + }, + { + "epoch": 0.08, + "learning_rate": 1.987821089054034e-06, + "loss": 0.8525, + "step": 3053 + }, + { + "epoch": 0.08, + "learning_rate": 1.9878081694660847e-06, + "loss": 0.8027, + "step": 3054 + }, + { + "epoch": 0.08, + "learning_rate": 1.9877952430711415e-06, + "loss": 0.9883, + "step": 3055 + }, + { + "epoch": 0.08, + "learning_rate": 1.987782309869294e-06, + "loss": 0.873, + "step": 3056 + }, + { + "epoch": 0.08, + "learning_rate": 1.9877693698606316e-06, + "loss": 0.9307, + "step": 3057 + }, + { + "epoch": 0.08, + "learning_rate": 1.9877564230452424e-06, + "loss": 0.9541, + "step": 3058 + }, + { + "epoch": 0.08, + "learning_rate": 1.9877434694232163e-06, + "loss": 1.0898, + "step": 3059 + }, + { + "epoch": 0.08, + "learning_rate": 1.9877305089946426e-06, + "loss": 0.959, + "step": 3060 + }, + { + "epoch": 0.08, + "learning_rate": 1.9877175417596103e-06, + "loss": 1.0078, + "step": 3061 + }, + { + "epoch": 0.08, + "learning_rate": 1.987704567718209e-06, + "loss": 0.8857, + "step": 3062 + }, + { + "epoch": 0.08, + "learning_rate": 1.9876915868705286e-06, + "loss": 0.8984, + "step": 3063 + }, + { + "epoch": 0.08, + "learning_rate": 1.9876785992166575e-06, + "loss": 0.6851, + "step": 3064 + }, + { + "epoch": 0.08, + "learning_rate": 1.9876656047566857e-06, + "loss": 0.9609, + "step": 3065 + }, + { + "epoch": 0.08, + "learning_rate": 1.987652603490703e-06, + "loss": 1.0332, + "step": 3066 + }, + { + "epoch": 0.08, + "learning_rate": 1.987639595418799e-06, + "loss": 0.96, + "step": 3067 + }, + { + "epoch": 0.08, + "learning_rate": 1.9876265805410623e-06, + "loss": 1.0068, + "step": 3068 + }, + { + "epoch": 0.08, + "learning_rate": 1.987613558857584e-06, + "loss": 0.8779, + "step": 3069 + }, + { + "epoch": 0.08, + "learning_rate": 1.9876005303684532e-06, + "loss": 1.0859, + "step": 3070 + }, + { + "epoch": 0.08, + "learning_rate": 1.987587495073759e-06, + "loss": 0.8457, + "step": 3071 + }, + { + "epoch": 0.08, + "learning_rate": 1.9875744529735927e-06, + "loss": 1.1035, + "step": 3072 + }, + { + "epoch": 0.08, + "learning_rate": 1.987561404068043e-06, + "loss": 0.8066, + "step": 3073 + }, + { + "epoch": 0.08, + "learning_rate": 1.9875483483572002e-06, + "loss": 0.9883, + "step": 3074 + }, + { + "epoch": 0.08, + "learning_rate": 1.9875352858411546e-06, + "loss": 0.9014, + "step": 3075 + }, + { + "epoch": 0.08, + "learning_rate": 1.987522216519996e-06, + "loss": 0.9658, + "step": 3076 + }, + { + "epoch": 0.08, + "learning_rate": 1.9875091403938137e-06, + "loss": 1.0205, + "step": 3077 + }, + { + "epoch": 0.08, + "learning_rate": 1.9874960574626985e-06, + "loss": 0.7451, + "step": 3078 + }, + { + "epoch": 0.08, + "learning_rate": 1.987482967726741e-06, + "loss": 1.0986, + "step": 3079 + }, + { + "epoch": 0.08, + "learning_rate": 1.9874698711860306e-06, + "loss": 0.9277, + "step": 3080 + }, + { + "epoch": 0.08, + "learning_rate": 1.9874567678406578e-06, + "loss": 0.959, + "step": 3081 + }, + { + "epoch": 0.08, + "learning_rate": 1.987443657690713e-06, + "loss": 0.8799, + "step": 3082 + }, + { + "epoch": 0.08, + "learning_rate": 1.987430540736287e-06, + "loss": 0.8818, + "step": 3083 + }, + { + "epoch": 0.08, + "learning_rate": 1.987417416977469e-06, + "loss": 1.0889, + "step": 3084 + }, + { + "epoch": 0.08, + "learning_rate": 1.9874042864143506e-06, + "loss": 1.002, + "step": 3085 + }, + { + "epoch": 0.08, + "learning_rate": 1.9873911490470215e-06, + "loss": 0.812, + "step": 3086 + }, + { + "epoch": 0.08, + "learning_rate": 1.9873780048755725e-06, + "loss": 0.7695, + "step": 3087 + }, + { + "epoch": 0.08, + "learning_rate": 1.9873648539000946e-06, + "loss": 1.0557, + "step": 3088 + }, + { + "epoch": 0.08, + "learning_rate": 1.9873516961206776e-06, + "loss": 0.772, + "step": 3089 + }, + { + "epoch": 0.08, + "learning_rate": 1.987338531537413e-06, + "loss": 0.8403, + "step": 3090 + }, + { + "epoch": 0.08, + "learning_rate": 1.9873253601503904e-06, + "loss": 0.8594, + "step": 3091 + }, + { + "epoch": 0.08, + "learning_rate": 1.987312181959702e-06, + "loss": 0.7607, + "step": 3092 + }, + { + "epoch": 0.08, + "learning_rate": 1.9872989969654377e-06, + "loss": 1.0889, + "step": 3093 + }, + { + "epoch": 0.08, + "learning_rate": 1.9872858051676885e-06, + "loss": 0.9922, + "step": 3094 + }, + { + "epoch": 0.08, + "learning_rate": 1.987272606566545e-06, + "loss": 1.0107, + "step": 3095 + }, + { + "epoch": 0.08, + "learning_rate": 1.9872594011620993e-06, + "loss": 0.8613, + "step": 3096 + }, + { + "epoch": 0.08, + "learning_rate": 1.987246188954441e-06, + "loss": 1.0117, + "step": 3097 + }, + { + "epoch": 0.08, + "learning_rate": 1.987232969943662e-06, + "loss": 0.9609, + "step": 3098 + }, + { + "epoch": 0.08, + "learning_rate": 1.9872197441298534e-06, + "loss": 0.9365, + "step": 3099 + }, + { + "epoch": 0.08, + "learning_rate": 1.9872065115131057e-06, + "loss": 0.8657, + "step": 3100 + }, + { + "epoch": 0.08, + "learning_rate": 1.9871932720935103e-06, + "loss": 0.9648, + "step": 3101 + }, + { + "epoch": 0.08, + "learning_rate": 1.9871800258711586e-06, + "loss": 0.8789, + "step": 3102 + }, + { + "epoch": 0.08, + "learning_rate": 1.9871667728461427e-06, + "loss": 0.8555, + "step": 3103 + }, + { + "epoch": 0.08, + "learning_rate": 1.987153513018552e-06, + "loss": 0.9023, + "step": 3104 + }, + { + "epoch": 0.08, + "learning_rate": 1.98714024638848e-06, + "loss": 1.0361, + "step": 3105 + }, + { + "epoch": 0.08, + "learning_rate": 1.9871269729560164e-06, + "loss": 0.6875, + "step": 3106 + }, + { + "epoch": 0.08, + "learning_rate": 1.9871136927212538e-06, + "loss": 0.9385, + "step": 3107 + }, + { + "epoch": 0.08, + "learning_rate": 1.9871004056842833e-06, + "loss": 0.9941, + "step": 3108 + }, + { + "epoch": 0.08, + "learning_rate": 1.987087111845196e-06, + "loss": 0.604, + "step": 3109 + }, + { + "epoch": 0.08, + "learning_rate": 1.9870738112040845e-06, + "loss": 1.0596, + "step": 3110 + }, + { + "epoch": 0.08, + "learning_rate": 1.9870605037610396e-06, + "loss": 0.8696, + "step": 3111 + }, + { + "epoch": 0.08, + "learning_rate": 1.9870471895161533e-06, + "loss": 0.9336, + "step": 3112 + }, + { + "epoch": 0.08, + "learning_rate": 1.9870338684695174e-06, + "loss": 0.9424, + "step": 3113 + }, + { + "epoch": 0.08, + "learning_rate": 1.9870205406212235e-06, + "loss": 1.085, + "step": 3114 + }, + { + "epoch": 0.08, + "learning_rate": 1.987007205971364e-06, + "loss": 0.9434, + "step": 3115 + }, + { + "epoch": 0.08, + "learning_rate": 1.98699386452003e-06, + "loss": 1.0039, + "step": 3116 + }, + { + "epoch": 0.08, + "learning_rate": 1.9869805162673137e-06, + "loss": 0.8975, + "step": 3117 + }, + { + "epoch": 0.08, + "learning_rate": 1.9869671612133074e-06, + "loss": 0.9746, + "step": 3118 + }, + { + "epoch": 0.08, + "learning_rate": 1.9869537993581035e-06, + "loss": 1.0059, + "step": 3119 + }, + { + "epoch": 0.08, + "learning_rate": 1.9869404307017925e-06, + "loss": 1.1191, + "step": 3120 + }, + { + "epoch": 0.08, + "learning_rate": 1.9869270552444685e-06, + "loss": 1.0371, + "step": 3121 + }, + { + "epoch": 0.08, + "learning_rate": 1.986913672986222e-06, + "loss": 1.1426, + "step": 3122 + }, + { + "epoch": 0.08, + "learning_rate": 1.9869002839271464e-06, + "loss": 1.0234, + "step": 3123 + }, + { + "epoch": 0.08, + "learning_rate": 1.986886888067333e-06, + "loss": 0.9551, + "step": 3124 + }, + { + "epoch": 0.08, + "learning_rate": 1.986873485406875e-06, + "loss": 1.0537, + "step": 3125 + }, + { + "epoch": 0.08, + "learning_rate": 1.9868600759458644e-06, + "loss": 0.8486, + "step": 3126 + }, + { + "epoch": 0.08, + "learning_rate": 1.986846659684393e-06, + "loss": 0.8633, + "step": 3127 + }, + { + "epoch": 0.08, + "learning_rate": 1.9868332366225544e-06, + "loss": 0.8975, + "step": 3128 + }, + { + "epoch": 0.08, + "learning_rate": 1.98681980676044e-06, + "loss": 0.8994, + "step": 3129 + }, + { + "epoch": 0.08, + "learning_rate": 1.986806370098144e-06, + "loss": 0.7173, + "step": 3130 + }, + { + "epoch": 0.08, + "learning_rate": 1.9867929266357564e-06, + "loss": 0.9727, + "step": 3131 + }, + { + "epoch": 0.08, + "learning_rate": 1.986779476373372e-06, + "loss": 1.0381, + "step": 3132 + }, + { + "epoch": 0.08, + "learning_rate": 1.986766019311083e-06, + "loss": 1.0117, + "step": 3133 + }, + { + "epoch": 0.08, + "learning_rate": 1.9867525554489814e-06, + "loss": 0.8042, + "step": 3134 + }, + { + "epoch": 0.08, + "learning_rate": 1.9867390847871607e-06, + "loss": 0.957, + "step": 3135 + }, + { + "epoch": 0.08, + "learning_rate": 1.9867256073257136e-06, + "loss": 0.875, + "step": 3136 + }, + { + "epoch": 0.08, + "learning_rate": 1.986712123064733e-06, + "loss": 1.0723, + "step": 3137 + }, + { + "epoch": 0.08, + "learning_rate": 1.986698632004311e-06, + "loss": 1.0518, + "step": 3138 + }, + { + "epoch": 0.08, + "learning_rate": 1.986685134144542e-06, + "loss": 1.0625, + "step": 3139 + }, + { + "epoch": 0.08, + "learning_rate": 1.986671629485518e-06, + "loss": 0.6519, + "step": 3140 + }, + { + "epoch": 0.08, + "learning_rate": 1.9866581180273324e-06, + "loss": 0.7412, + "step": 3141 + }, + { + "epoch": 0.08, + "learning_rate": 1.986644599770078e-06, + "loss": 0.8452, + "step": 3142 + }, + { + "epoch": 0.08, + "learning_rate": 1.986631074713849e-06, + "loss": 0.8408, + "step": 3143 + }, + { + "epoch": 0.08, + "learning_rate": 1.986617542858737e-06, + "loss": 1.1816, + "step": 3144 + }, + { + "epoch": 0.08, + "learning_rate": 1.986604004204836e-06, + "loss": 1.04, + "step": 3145 + }, + { + "epoch": 0.08, + "learning_rate": 1.98659045875224e-06, + "loss": 0.9365, + "step": 3146 + }, + { + "epoch": 0.08, + "learning_rate": 1.986576906501041e-06, + "loss": 0.917, + "step": 3147 + }, + { + "epoch": 0.08, + "learning_rate": 1.9865633474513338e-06, + "loss": 1.0195, + "step": 3148 + }, + { + "epoch": 0.08, + "learning_rate": 1.9865497816032107e-06, + "loss": 1.0205, + "step": 3149 + }, + { + "epoch": 0.08, + "learning_rate": 1.9865362089567657e-06, + "loss": 0.9844, + "step": 3150 + }, + { + "epoch": 0.08, + "learning_rate": 1.9865226295120926e-06, + "loss": 0.8721, + "step": 3151 + }, + { + "epoch": 0.08, + "learning_rate": 1.986509043269284e-06, + "loss": 0.958, + "step": 3152 + }, + { + "epoch": 0.08, + "learning_rate": 1.9864954502284344e-06, + "loss": 1.1016, + "step": 3153 + }, + { + "epoch": 0.08, + "learning_rate": 1.9864818503896372e-06, + "loss": 0.9072, + "step": 3154 + }, + { + "epoch": 0.08, + "learning_rate": 1.986468243752986e-06, + "loss": 1.0371, + "step": 3155 + }, + { + "epoch": 0.08, + "learning_rate": 1.986454630318575e-06, + "loss": 0.9043, + "step": 3156 + }, + { + "epoch": 0.08, + "learning_rate": 1.9864410100864974e-06, + "loss": 1.0107, + "step": 3157 + }, + { + "epoch": 0.08, + "learning_rate": 1.9864273830568474e-06, + "loss": 0.9404, + "step": 3158 + }, + { + "epoch": 0.08, + "learning_rate": 1.9864137492297187e-06, + "loss": 0.7251, + "step": 3159 + }, + { + "epoch": 0.08, + "learning_rate": 1.986400108605205e-06, + "loss": 1.1445, + "step": 3160 + }, + { + "epoch": 0.08, + "learning_rate": 1.9863864611834018e-06, + "loss": 0.9609, + "step": 3161 + }, + { + "epoch": 0.08, + "learning_rate": 1.9863728069644016e-06, + "loss": 0.7861, + "step": 3162 + }, + { + "epoch": 0.08, + "learning_rate": 1.9863591459482988e-06, + "loss": 0.8867, + "step": 3163 + }, + { + "epoch": 0.08, + "learning_rate": 1.9863454781351877e-06, + "loss": 1.2627, + "step": 3164 + }, + { + "epoch": 0.08, + "learning_rate": 1.9863318035251623e-06, + "loss": 0.8125, + "step": 3165 + }, + { + "epoch": 0.08, + "learning_rate": 1.986318122118317e-06, + "loss": 0.9907, + "step": 3166 + }, + { + "epoch": 0.08, + "learning_rate": 1.9863044339147463e-06, + "loss": 1.0605, + "step": 3167 + }, + { + "epoch": 0.08, + "learning_rate": 1.9862907389145444e-06, + "loss": 0.8779, + "step": 3168 + }, + { + "epoch": 0.08, + "learning_rate": 1.9862770371178053e-06, + "loss": 0.8242, + "step": 3169 + }, + { + "epoch": 0.08, + "learning_rate": 1.986263328524624e-06, + "loss": 0.835, + "step": 3170 + }, + { + "epoch": 0.08, + "learning_rate": 1.986249613135094e-06, + "loss": 1.1562, + "step": 3171 + }, + { + "epoch": 0.08, + "learning_rate": 1.986235890949311e-06, + "loss": 0.8447, + "step": 3172 + }, + { + "epoch": 0.08, + "learning_rate": 1.9862221619673688e-06, + "loss": 0.8057, + "step": 3173 + }, + { + "epoch": 0.08, + "learning_rate": 1.9862084261893627e-06, + "loss": 0.8965, + "step": 3174 + }, + { + "epoch": 0.08, + "learning_rate": 1.9861946836153864e-06, + "loss": 1.126, + "step": 3175 + }, + { + "epoch": 0.08, + "learning_rate": 1.986180934245535e-06, + "loss": 1.1123, + "step": 3176 + }, + { + "epoch": 0.08, + "learning_rate": 1.986167178079904e-06, + "loss": 0.9248, + "step": 3177 + }, + { + "epoch": 0.08, + "learning_rate": 1.986153415118587e-06, + "loss": 0.9414, + "step": 3178 + }, + { + "epoch": 0.08, + "learning_rate": 1.9861396453616793e-06, + "loss": 1.0205, + "step": 3179 + }, + { + "epoch": 0.08, + "learning_rate": 1.986125868809276e-06, + "loss": 0.9067, + "step": 3180 + }, + { + "epoch": 0.08, + "learning_rate": 1.986112085461472e-06, + "loss": 0.9961, + "step": 3181 + }, + { + "epoch": 0.08, + "learning_rate": 1.986098295318362e-06, + "loss": 0.7607, + "step": 3182 + }, + { + "epoch": 0.08, + "learning_rate": 1.9860844983800415e-06, + "loss": 1.1641, + "step": 3183 + }, + { + "epoch": 0.08, + "learning_rate": 1.9860706946466048e-06, + "loss": 0.9355, + "step": 3184 + }, + { + "epoch": 0.08, + "learning_rate": 1.9860568841181478e-06, + "loss": 0.8818, + "step": 3185 + }, + { + "epoch": 0.08, + "learning_rate": 1.9860430667947654e-06, + "loss": 0.7275, + "step": 3186 + }, + { + "epoch": 0.08, + "learning_rate": 1.9860292426765524e-06, + "loss": 1.0098, + "step": 3187 + }, + { + "epoch": 0.08, + "learning_rate": 1.986015411763605e-06, + "loss": 0.8857, + "step": 3188 + }, + { + "epoch": 0.08, + "learning_rate": 1.986001574056018e-06, + "loss": 0.7896, + "step": 3189 + }, + { + "epoch": 0.08, + "learning_rate": 1.985987729553886e-06, + "loss": 0.7422, + "step": 3190 + }, + { + "epoch": 0.08, + "learning_rate": 1.9859738782573053e-06, + "loss": 0.9219, + "step": 3191 + }, + { + "epoch": 0.08, + "learning_rate": 1.9859600201663716e-06, + "loss": 0.9688, + "step": 3192 + }, + { + "epoch": 0.08, + "learning_rate": 1.9859461552811795e-06, + "loss": 0.666, + "step": 3193 + }, + { + "epoch": 0.08, + "learning_rate": 1.985932283601825e-06, + "loss": 0.8091, + "step": 3194 + }, + { + "epoch": 0.08, + "learning_rate": 1.985918405128404e-06, + "loss": 0.8887, + "step": 3195 + }, + { + "epoch": 0.08, + "learning_rate": 1.9859045198610114e-06, + "loss": 0.9834, + "step": 3196 + }, + { + "epoch": 0.08, + "learning_rate": 1.985890627799744e-06, + "loss": 1.0039, + "step": 3197 + }, + { + "epoch": 0.08, + "learning_rate": 1.9858767289446965e-06, + "loss": 0.9893, + "step": 3198 + }, + { + "epoch": 0.08, + "learning_rate": 1.9858628232959646e-06, + "loss": 0.9639, + "step": 3199 + }, + { + "epoch": 0.08, + "learning_rate": 1.985848910853645e-06, + "loss": 0.9043, + "step": 3200 + }, + { + "epoch": 0.08, + "learning_rate": 1.985834991617833e-06, + "loss": 0.7871, + "step": 3201 + }, + { + "epoch": 0.08, + "learning_rate": 1.9858210655886246e-06, + "loss": 0.7026, + "step": 3202 + }, + { + "epoch": 0.08, + "learning_rate": 1.985807132766116e-06, + "loss": 1.1328, + "step": 3203 + }, + { + "epoch": 0.08, + "learning_rate": 1.985793193150403e-06, + "loss": 0.8682, + "step": 3204 + }, + { + "epoch": 0.08, + "learning_rate": 1.985779246741581e-06, + "loss": 0.916, + "step": 3205 + }, + { + "epoch": 0.08, + "learning_rate": 1.9857652935397475e-06, + "loss": 0.6958, + "step": 3206 + }, + { + "epoch": 0.08, + "learning_rate": 1.9857513335449976e-06, + "loss": 0.7896, + "step": 3207 + }, + { + "epoch": 0.08, + "learning_rate": 1.9857373667574276e-06, + "loss": 1.0303, + "step": 3208 + }, + { + "epoch": 0.08, + "learning_rate": 1.9857233931771344e-06, + "loss": 0.9863, + "step": 3209 + }, + { + "epoch": 0.08, + "learning_rate": 1.985709412804214e-06, + "loss": 0.7676, + "step": 3210 + }, + { + "epoch": 0.08, + "learning_rate": 1.985695425638762e-06, + "loss": 0.8838, + "step": 3211 + }, + { + "epoch": 0.08, + "learning_rate": 1.9856814316808756e-06, + "loss": 1.0674, + "step": 3212 + }, + { + "epoch": 0.08, + "learning_rate": 1.985667430930651e-06, + "loss": 0.8101, + "step": 3213 + }, + { + "epoch": 0.08, + "learning_rate": 1.9856534233881846e-06, + "loss": 0.6655, + "step": 3214 + }, + { + "epoch": 0.08, + "learning_rate": 1.9856394090535734e-06, + "loss": 0.9443, + "step": 3215 + }, + { + "epoch": 0.08, + "learning_rate": 1.985625387926913e-06, + "loss": 0.8696, + "step": 3216 + }, + { + "epoch": 0.08, + "learning_rate": 1.985611360008301e-06, + "loss": 0.9023, + "step": 3217 + }, + { + "epoch": 0.08, + "learning_rate": 1.9855973252978338e-06, + "loss": 0.9639, + "step": 3218 + }, + { + "epoch": 0.08, + "learning_rate": 1.985583283795608e-06, + "loss": 0.8926, + "step": 3219 + }, + { + "epoch": 0.08, + "learning_rate": 1.98556923550172e-06, + "loss": 0.7139, + "step": 3220 + }, + { + "epoch": 0.08, + "learning_rate": 1.985555180416267e-06, + "loss": 0.8086, + "step": 3221 + }, + { + "epoch": 0.08, + "learning_rate": 1.985541118539346e-06, + "loss": 0.7598, + "step": 3222 + }, + { + "epoch": 0.08, + "learning_rate": 1.9855270498710536e-06, + "loss": 0.9248, + "step": 3223 + }, + { + "epoch": 0.08, + "learning_rate": 1.985512974411487e-06, + "loss": 0.6973, + "step": 3224 + }, + { + "epoch": 0.08, + "learning_rate": 1.985498892160743e-06, + "loss": 0.7969, + "step": 3225 + }, + { + "epoch": 0.08, + "learning_rate": 1.9854848031189183e-06, + "loss": 0.8638, + "step": 3226 + }, + { + "epoch": 0.08, + "learning_rate": 1.985470707286111e-06, + "loss": 1.0127, + "step": 3227 + }, + { + "epoch": 0.08, + "learning_rate": 1.985456604662417e-06, + "loss": 1.1738, + "step": 3228 + }, + { + "epoch": 0.08, + "learning_rate": 1.9854424952479343e-06, + "loss": 0.8657, + "step": 3229 + }, + { + "epoch": 0.08, + "learning_rate": 1.98542837904276e-06, + "loss": 0.7275, + "step": 3230 + }, + { + "epoch": 0.08, + "learning_rate": 1.9854142560469914e-06, + "loss": 0.8442, + "step": 3231 + }, + { + "epoch": 0.08, + "learning_rate": 1.9854001262607255e-06, + "loss": 0.9961, + "step": 3232 + }, + { + "epoch": 0.08, + "learning_rate": 1.98538598968406e-06, + "loss": 1.125, + "step": 3233 + }, + { + "epoch": 0.08, + "learning_rate": 1.9853718463170925e-06, + "loss": 1.0234, + "step": 3234 + }, + { + "epoch": 0.08, + "learning_rate": 1.9853576961599198e-06, + "loss": 1.0391, + "step": 3235 + }, + { + "epoch": 0.08, + "learning_rate": 1.9853435392126395e-06, + "loss": 1.0684, + "step": 3236 + }, + { + "epoch": 0.08, + "learning_rate": 1.98532937547535e-06, + "loss": 0.8672, + "step": 3237 + }, + { + "epoch": 0.08, + "learning_rate": 1.985315204948148e-06, + "loss": 1.0742, + "step": 3238 + }, + { + "epoch": 0.08, + "learning_rate": 1.9853010276311318e-06, + "loss": 0.9111, + "step": 3239 + }, + { + "epoch": 0.08, + "learning_rate": 1.9852868435243986e-06, + "loss": 0.8818, + "step": 3240 + }, + { + "epoch": 0.08, + "learning_rate": 1.9852726526280463e-06, + "loss": 1.0518, + "step": 3241 + }, + { + "epoch": 0.08, + "learning_rate": 1.9852584549421727e-06, + "loss": 0.8701, + "step": 3242 + }, + { + "epoch": 0.08, + "learning_rate": 1.9852442504668755e-06, + "loss": 0.9092, + "step": 3243 + }, + { + "epoch": 0.08, + "learning_rate": 1.985230039202253e-06, + "loss": 0.9404, + "step": 3244 + }, + { + "epoch": 0.08, + "learning_rate": 1.985215821148403e-06, + "loss": 0.8145, + "step": 3245 + }, + { + "epoch": 0.08, + "learning_rate": 1.9852015963054226e-06, + "loss": 0.8525, + "step": 3246 + }, + { + "epoch": 0.08, + "learning_rate": 1.985187364673411e-06, + "loss": 0.8701, + "step": 3247 + }, + { + "epoch": 0.08, + "learning_rate": 1.985173126252466e-06, + "loss": 0.9111, + "step": 3248 + }, + { + "epoch": 0.08, + "learning_rate": 1.9851588810426853e-06, + "loss": 1.0, + "step": 3249 + }, + { + "epoch": 0.08, + "learning_rate": 1.9851446290441675e-06, + "loss": 1.0293, + "step": 3250 + }, + { + "epoch": 0.08, + "learning_rate": 1.9851303702570102e-06, + "loss": 0.8877, + "step": 3251 + }, + { + "epoch": 0.08, + "learning_rate": 1.9851161046813125e-06, + "loss": 0.9023, + "step": 3252 + }, + { + "epoch": 0.08, + "learning_rate": 1.985101832317172e-06, + "loss": 0.8955, + "step": 3253 + }, + { + "epoch": 0.08, + "learning_rate": 1.9850875531646877e-06, + "loss": 0.6221, + "step": 3254 + }, + { + "epoch": 0.08, + "learning_rate": 1.9850732672239576e-06, + "loss": 0.8716, + "step": 3255 + }, + { + "epoch": 0.08, + "learning_rate": 1.98505897449508e-06, + "loss": 0.9668, + "step": 3256 + }, + { + "epoch": 0.08, + "learning_rate": 1.9850446749781533e-06, + "loss": 0.8262, + "step": 3257 + }, + { + "epoch": 0.08, + "learning_rate": 1.985030368673277e-06, + "loss": 0.8501, + "step": 3258 + }, + { + "epoch": 0.08, + "learning_rate": 1.9850160555805483e-06, + "loss": 0.9023, + "step": 3259 + }, + { + "epoch": 0.08, + "learning_rate": 1.985001735700067e-06, + "loss": 1.0498, + "step": 3260 + }, + { + "epoch": 0.08, + "learning_rate": 1.9849874090319306e-06, + "loss": 0.9395, + "step": 3261 + }, + { + "epoch": 0.08, + "learning_rate": 1.9849730755762394e-06, + "loss": 1.0752, + "step": 3262 + }, + { + "epoch": 0.08, + "learning_rate": 1.9849587353330906e-06, + "loss": 0.8926, + "step": 3263 + }, + { + "epoch": 0.08, + "learning_rate": 1.9849443883025842e-06, + "loss": 1.0176, + "step": 3264 + }, + { + "epoch": 0.08, + "learning_rate": 1.9849300344848185e-06, + "loss": 0.9248, + "step": 3265 + }, + { + "epoch": 0.08, + "learning_rate": 1.984915673879892e-06, + "loss": 0.7703, + "step": 3266 + }, + { + "epoch": 0.08, + "learning_rate": 1.9849013064879047e-06, + "loss": 0.9951, + "step": 3267 + }, + { + "epoch": 0.08, + "learning_rate": 1.984886932308955e-06, + "loss": 1.0205, + "step": 3268 + }, + { + "epoch": 0.08, + "learning_rate": 1.984872551343142e-06, + "loss": 1.1758, + "step": 3269 + }, + { + "epoch": 0.08, + "learning_rate": 1.9848581635905647e-06, + "loss": 1.0186, + "step": 3270 + }, + { + "epoch": 0.08, + "learning_rate": 1.984843769051322e-06, + "loss": 0.7812, + "step": 3271 + }, + { + "epoch": 0.08, + "learning_rate": 1.984829367725514e-06, + "loss": 0.8828, + "step": 3272 + }, + { + "epoch": 0.08, + "learning_rate": 1.9848149596132393e-06, + "loss": 0.8276, + "step": 3273 + }, + { + "epoch": 0.08, + "learning_rate": 1.984800544714597e-06, + "loss": 0.8643, + "step": 3274 + }, + { + "epoch": 0.08, + "learning_rate": 1.984786123029687e-06, + "loss": 1.0312, + "step": 3275 + }, + { + "epoch": 0.08, + "learning_rate": 1.9847716945586085e-06, + "loss": 0.998, + "step": 3276 + }, + { + "epoch": 0.08, + "learning_rate": 1.9847572593014604e-06, + "loss": 0.9189, + "step": 3277 + }, + { + "epoch": 0.08, + "learning_rate": 1.984742817258343e-06, + "loss": 1.2344, + "step": 3278 + }, + { + "epoch": 0.08, + "learning_rate": 1.984728368429355e-06, + "loss": 1.0449, + "step": 3279 + }, + { + "epoch": 0.08, + "learning_rate": 1.9847139128145966e-06, + "loss": 0.8521, + "step": 3280 + }, + { + "epoch": 0.08, + "learning_rate": 1.984699450414167e-06, + "loss": 1.0049, + "step": 3281 + }, + { + "epoch": 0.08, + "learning_rate": 1.9846849812281664e-06, + "loss": 0.8672, + "step": 3282 + }, + { + "epoch": 0.08, + "learning_rate": 1.984670505256694e-06, + "loss": 0.8438, + "step": 3283 + }, + { + "epoch": 0.08, + "learning_rate": 1.9846560224998496e-06, + "loss": 1.0605, + "step": 3284 + }, + { + "epoch": 0.08, + "learning_rate": 1.984641532957733e-06, + "loss": 1.0947, + "step": 3285 + }, + { + "epoch": 0.08, + "learning_rate": 1.9846270366304443e-06, + "loss": 0.5449, + "step": 3286 + }, + { + "epoch": 0.08, + "learning_rate": 1.9846125335180835e-06, + "loss": 1.2373, + "step": 3287 + }, + { + "epoch": 0.08, + "learning_rate": 1.98459802362075e-06, + "loss": 1.0996, + "step": 3288 + }, + { + "epoch": 0.08, + "learning_rate": 1.984583506938544e-06, + "loss": 0.9277, + "step": 3289 + }, + { + "epoch": 0.08, + "learning_rate": 1.984568983471566e-06, + "loss": 0.917, + "step": 3290 + }, + { + "epoch": 0.08, + "learning_rate": 1.9845544532199155e-06, + "loss": 0.9365, + "step": 3291 + }, + { + "epoch": 0.08, + "learning_rate": 1.984539916183693e-06, + "loss": 1.1699, + "step": 3292 + }, + { + "epoch": 0.08, + "learning_rate": 1.984525372362998e-06, + "loss": 0.8091, + "step": 3293 + }, + { + "epoch": 0.08, + "learning_rate": 1.9845108217579314e-06, + "loss": 0.8423, + "step": 3294 + }, + { + "epoch": 0.08, + "learning_rate": 1.984496264368594e-06, + "loss": 0.7661, + "step": 3295 + }, + { + "epoch": 0.08, + "learning_rate": 1.9844817001950843e-06, + "loss": 0.8066, + "step": 3296 + }, + { + "epoch": 0.08, + "learning_rate": 1.984467129237504e-06, + "loss": 0.8682, + "step": 3297 + }, + { + "epoch": 0.08, + "learning_rate": 1.9844525514959536e-06, + "loss": 0.8389, + "step": 3298 + }, + { + "epoch": 0.08, + "learning_rate": 1.9844379669705336e-06, + "loss": 0.8477, + "step": 3299 + }, + { + "epoch": 0.08, + "learning_rate": 1.9844233756613436e-06, + "loss": 1.127, + "step": 3300 + }, + { + "epoch": 0.08, + "learning_rate": 1.984408777568485e-06, + "loss": 0.9746, + "step": 3301 + }, + { + "epoch": 0.08, + "learning_rate": 1.9843941726920577e-06, + "loss": 1.208, + "step": 3302 + }, + { + "epoch": 0.08, + "learning_rate": 1.984379561032163e-06, + "loss": 1.166, + "step": 3303 + }, + { + "epoch": 0.08, + "learning_rate": 1.984364942588901e-06, + "loss": 0.8877, + "step": 3304 + }, + { + "epoch": 0.08, + "learning_rate": 1.984350317362373e-06, + "loss": 1.1562, + "step": 3305 + }, + { + "epoch": 0.08, + "learning_rate": 1.9843356853526795e-06, + "loss": 0.9668, + "step": 3306 + }, + { + "epoch": 0.08, + "learning_rate": 1.9843210465599215e-06, + "loss": 0.8662, + "step": 3307 + }, + { + "epoch": 0.08, + "learning_rate": 1.9843064009841995e-06, + "loss": 0.9365, + "step": 3308 + }, + { + "epoch": 0.08, + "learning_rate": 1.9842917486256146e-06, + "loss": 0.9268, + "step": 3309 + }, + { + "epoch": 0.08, + "learning_rate": 1.984277089484268e-06, + "loss": 0.9473, + "step": 3310 + }, + { + "epoch": 0.08, + "learning_rate": 1.9842624235602606e-06, + "loss": 0.8711, + "step": 3311 + }, + { + "epoch": 0.08, + "learning_rate": 1.9842477508536934e-06, + "loss": 1.1396, + "step": 3312 + }, + { + "epoch": 0.08, + "learning_rate": 1.984233071364667e-06, + "loss": 0.9805, + "step": 3313 + }, + { + "epoch": 0.08, + "learning_rate": 1.984218385093284e-06, + "loss": 0.8716, + "step": 3314 + }, + { + "epoch": 0.08, + "learning_rate": 1.984203692039644e-06, + "loss": 0.8896, + "step": 3315 + }, + { + "epoch": 0.08, + "learning_rate": 1.984188992203849e-06, + "loss": 0.8955, + "step": 3316 + }, + { + "epoch": 0.09, + "learning_rate": 1.984174285586e-06, + "loss": 0.9785, + "step": 3317 + }, + { + "epoch": 0.09, + "learning_rate": 1.9841595721861993e-06, + "loss": 0.8145, + "step": 3318 + }, + { + "epoch": 0.09, + "learning_rate": 1.984144852004547e-06, + "loss": 0.8926, + "step": 3319 + }, + { + "epoch": 0.09, + "learning_rate": 1.984130125041145e-06, + "loss": 0.9863, + "step": 3320 + }, + { + "epoch": 0.09, + "learning_rate": 1.984115391296095e-06, + "loss": 0.9766, + "step": 3321 + }, + { + "epoch": 0.09, + "learning_rate": 1.9841006507694987e-06, + "loss": 0.9287, + "step": 3322 + }, + { + "epoch": 0.09, + "learning_rate": 1.984085903461457e-06, + "loss": 1.1035, + "step": 3323 + }, + { + "epoch": 0.09, + "learning_rate": 1.984071149372072e-06, + "loss": 1.0615, + "step": 3324 + }, + { + "epoch": 0.09, + "learning_rate": 1.9840563885014456e-06, + "loss": 0.9932, + "step": 3325 + }, + { + "epoch": 0.09, + "learning_rate": 1.984041620849679e-06, + "loss": 0.8818, + "step": 3326 + }, + { + "epoch": 0.09, + "learning_rate": 1.9840268464168738e-06, + "loss": 0.9248, + "step": 3327 + }, + { + "epoch": 0.09, + "learning_rate": 1.9840120652031325e-06, + "loss": 0.9883, + "step": 3328 + }, + { + "epoch": 0.09, + "learning_rate": 1.9839972772085566e-06, + "loss": 0.9463, + "step": 3329 + }, + { + "epoch": 0.09, + "learning_rate": 1.983982482433248e-06, + "loss": 1.0312, + "step": 3330 + }, + { + "epoch": 0.09, + "learning_rate": 1.983967680877309e-06, + "loss": 0.8433, + "step": 3331 + }, + { + "epoch": 0.09, + "learning_rate": 1.983952872540841e-06, + "loss": 0.8613, + "step": 3332 + }, + { + "epoch": 0.09, + "learning_rate": 1.983938057423946e-06, + "loss": 1.041, + "step": 3333 + }, + { + "epoch": 0.09, + "learning_rate": 1.983923235526727e-06, + "loss": 0.874, + "step": 3334 + }, + { + "epoch": 0.09, + "learning_rate": 1.983908406849285e-06, + "loss": 0.8486, + "step": 3335 + }, + { + "epoch": 0.09, + "learning_rate": 1.9838935713917234e-06, + "loss": 0.7642, + "step": 3336 + }, + { + "epoch": 0.09, + "learning_rate": 1.983878729154143e-06, + "loss": 0.9082, + "step": 3337 + }, + { + "epoch": 0.09, + "learning_rate": 1.9838638801366476e-06, + "loss": 0.8296, + "step": 3338 + }, + { + "epoch": 0.09, + "learning_rate": 1.9838490243393383e-06, + "loss": 1.1025, + "step": 3339 + }, + { + "epoch": 0.09, + "learning_rate": 1.983834161762318e-06, + "loss": 0.9434, + "step": 3340 + }, + { + "epoch": 0.09, + "learning_rate": 1.983819292405689e-06, + "loss": 0.9658, + "step": 3341 + }, + { + "epoch": 0.09, + "learning_rate": 1.983804416269554e-06, + "loss": 0.7695, + "step": 3342 + }, + { + "epoch": 0.09, + "learning_rate": 1.9837895333540153e-06, + "loss": 0.8457, + "step": 3343 + }, + { + "epoch": 0.09, + "learning_rate": 1.983774643659175e-06, + "loss": 0.9414, + "step": 3344 + }, + { + "epoch": 0.09, + "learning_rate": 1.983759747185137e-06, + "loss": 1.1035, + "step": 3345 + }, + { + "epoch": 0.09, + "learning_rate": 1.9837448439320025e-06, + "loss": 1.0527, + "step": 3346 + }, + { + "epoch": 0.09, + "learning_rate": 1.9837299338998753e-06, + "loss": 0.9824, + "step": 3347 + }, + { + "epoch": 0.09, + "learning_rate": 1.9837150170888575e-06, + "loss": 0.9062, + "step": 3348 + }, + { + "epoch": 0.09, + "learning_rate": 1.9837000934990523e-06, + "loss": 0.9463, + "step": 3349 + }, + { + "epoch": 0.09, + "learning_rate": 1.983685163130562e-06, + "loss": 0.9443, + "step": 3350 + }, + { + "epoch": 0.09, + "learning_rate": 1.98367022598349e-06, + "loss": 1.0566, + "step": 3351 + }, + { + "epoch": 0.09, + "learning_rate": 1.9836552820579387e-06, + "loss": 0.8633, + "step": 3352 + }, + { + "epoch": 0.09, + "learning_rate": 1.983640331354012e-06, + "loss": 1.0088, + "step": 3353 + }, + { + "epoch": 0.09, + "learning_rate": 1.983625373871812e-06, + "loss": 1.1172, + "step": 3354 + }, + { + "epoch": 0.09, + "learning_rate": 1.983610409611442e-06, + "loss": 0.9316, + "step": 3355 + }, + { + "epoch": 0.09, + "learning_rate": 1.9835954385730056e-06, + "loss": 0.8877, + "step": 3356 + }, + { + "epoch": 0.09, + "learning_rate": 1.9835804607566056e-06, + "loss": 0.8691, + "step": 3357 + }, + { + "epoch": 0.09, + "learning_rate": 1.983565476162345e-06, + "loss": 0.9854, + "step": 3358 + }, + { + "epoch": 0.09, + "learning_rate": 1.9835504847903274e-06, + "loss": 0.8721, + "step": 3359 + }, + { + "epoch": 0.09, + "learning_rate": 1.983535486640656e-06, + "loss": 0.8423, + "step": 3360 + }, + { + "epoch": 0.09, + "learning_rate": 1.983520481713434e-06, + "loss": 1.0791, + "step": 3361 + }, + { + "epoch": 0.09, + "learning_rate": 1.983505470008765e-06, + "loss": 0.8301, + "step": 3362 + }, + { + "epoch": 0.09, + "learning_rate": 1.983490451526752e-06, + "loss": 1.0576, + "step": 3363 + }, + { + "epoch": 0.09, + "learning_rate": 1.9834754262674995e-06, + "loss": 1.0068, + "step": 3364 + }, + { + "epoch": 0.09, + "learning_rate": 1.98346039423111e-06, + "loss": 0.9512, + "step": 3365 + }, + { + "epoch": 0.09, + "learning_rate": 1.9834453554176874e-06, + "loss": 0.998, + "step": 3366 + }, + { + "epoch": 0.09, + "learning_rate": 1.9834303098273357e-06, + "loss": 0.9092, + "step": 3367 + }, + { + "epoch": 0.09, + "learning_rate": 1.9834152574601584e-06, + "loss": 0.8926, + "step": 3368 + }, + { + "epoch": 0.09, + "learning_rate": 1.983400198316259e-06, + "loss": 0.9404, + "step": 3369 + }, + { + "epoch": 0.09, + "learning_rate": 1.983385132395741e-06, + "loss": 0.8965, + "step": 3370 + }, + { + "epoch": 0.09, + "learning_rate": 1.9833700596987093e-06, + "loss": 0.9102, + "step": 3371 + }, + { + "epoch": 0.09, + "learning_rate": 1.983354980225267e-06, + "loss": 1.0439, + "step": 3372 + }, + { + "epoch": 0.09, + "learning_rate": 1.9833398939755176e-06, + "loss": 0.9551, + "step": 3373 + }, + { + "epoch": 0.09, + "learning_rate": 1.9833248009495658e-06, + "loss": 0.9688, + "step": 3374 + }, + { + "epoch": 0.09, + "learning_rate": 1.9833097011475155e-06, + "loss": 0.7656, + "step": 3375 + }, + { + "epoch": 0.09, + "learning_rate": 1.98329459456947e-06, + "loss": 0.8447, + "step": 3376 + }, + { + "epoch": 0.09, + "learning_rate": 1.9832794812155353e-06, + "loss": 1.0879, + "step": 3377 + }, + { + "epoch": 0.09, + "learning_rate": 1.9832643610858133e-06, + "loss": 1.123, + "step": 3378 + }, + { + "epoch": 0.09, + "learning_rate": 1.9832492341804095e-06, + "loss": 0.9346, + "step": 3379 + }, + { + "epoch": 0.09, + "learning_rate": 1.983234100499428e-06, + "loss": 0.9829, + "step": 3380 + }, + { + "epoch": 0.09, + "learning_rate": 1.983218960042972e-06, + "loss": 0.8594, + "step": 3381 + }, + { + "epoch": 0.09, + "learning_rate": 1.9832038128111473e-06, + "loss": 0.8994, + "step": 3382 + }, + { + "epoch": 0.09, + "learning_rate": 1.983188658804058e-06, + "loss": 1.0859, + "step": 3383 + }, + { + "epoch": 0.09, + "learning_rate": 1.983173498021808e-06, + "loss": 1.0703, + "step": 3384 + }, + { + "epoch": 0.09, + "learning_rate": 1.983158330464502e-06, + "loss": 1.0625, + "step": 3385 + }, + { + "epoch": 0.09, + "learning_rate": 1.983143156132244e-06, + "loss": 1.0137, + "step": 3386 + }, + { + "epoch": 0.09, + "learning_rate": 1.9831279750251396e-06, + "loss": 0.9873, + "step": 3387 + }, + { + "epoch": 0.09, + "learning_rate": 1.983112787143293e-06, + "loss": 0.9355, + "step": 3388 + }, + { + "epoch": 0.09, + "learning_rate": 1.9830975924868083e-06, + "loss": 0.7539, + "step": 3389 + }, + { + "epoch": 0.09, + "learning_rate": 1.9830823910557914e-06, + "loss": 0.8418, + "step": 3390 + }, + { + "epoch": 0.09, + "learning_rate": 1.9830671828503456e-06, + "loss": 0.7686, + "step": 3391 + }, + { + "epoch": 0.09, + "learning_rate": 1.9830519678705767e-06, + "loss": 0.9814, + "step": 3392 + }, + { + "epoch": 0.09, + "learning_rate": 1.983036746116589e-06, + "loss": 0.8325, + "step": 3393 + }, + { + "epoch": 0.09, + "learning_rate": 1.983021517588488e-06, + "loss": 0.7979, + "step": 3394 + }, + { + "epoch": 0.09, + "learning_rate": 1.983006282286378e-06, + "loss": 1.0898, + "step": 3395 + }, + { + "epoch": 0.09, + "learning_rate": 1.982991040210365e-06, + "loss": 0.9238, + "step": 3396 + }, + { + "epoch": 0.09, + "learning_rate": 1.9829757913605526e-06, + "loss": 0.9756, + "step": 3397 + }, + { + "epoch": 0.09, + "learning_rate": 1.9829605357370466e-06, + "loss": 0.9873, + "step": 3398 + }, + { + "epoch": 0.09, + "learning_rate": 1.9829452733399523e-06, + "loss": 0.6626, + "step": 3399 + }, + { + "epoch": 0.09, + "learning_rate": 1.982930004169375e-06, + "loss": 0.9766, + "step": 3400 + }, + { + "epoch": 0.09, + "learning_rate": 1.982914728225419e-06, + "loss": 0.6255, + "step": 3401 + }, + { + "epoch": 0.09, + "learning_rate": 1.9828994455081907e-06, + "loss": 0.9238, + "step": 3402 + }, + { + "epoch": 0.09, + "learning_rate": 1.9828841560177947e-06, + "loss": 1.0459, + "step": 3403 + }, + { + "epoch": 0.09, + "learning_rate": 1.9828688597543365e-06, + "loss": 1.1904, + "step": 3404 + }, + { + "epoch": 0.09, + "learning_rate": 1.9828535567179216e-06, + "loss": 0.897, + "step": 3405 + }, + { + "epoch": 0.09, + "learning_rate": 1.9828382469086554e-06, + "loss": 1.0635, + "step": 3406 + }, + { + "epoch": 0.09, + "learning_rate": 1.9828229303266437e-06, + "loss": 0.9521, + "step": 3407 + }, + { + "epoch": 0.09, + "learning_rate": 1.9828076069719916e-06, + "loss": 0.9014, + "step": 3408 + }, + { + "epoch": 0.09, + "learning_rate": 1.9827922768448046e-06, + "loss": 0.9609, + "step": 3409 + }, + { + "epoch": 0.09, + "learning_rate": 1.9827769399451886e-06, + "loss": 0.9697, + "step": 3410 + }, + { + "epoch": 0.09, + "learning_rate": 1.9827615962732498e-06, + "loss": 0.8291, + "step": 3411 + }, + { + "epoch": 0.09, + "learning_rate": 1.982746245829093e-06, + "loss": 0.8745, + "step": 3412 + }, + { + "epoch": 0.09, + "learning_rate": 1.9827308886128244e-06, + "loss": 1.0225, + "step": 3413 + }, + { + "epoch": 0.09, + "learning_rate": 1.9827155246245497e-06, + "loss": 0.7676, + "step": 3414 + }, + { + "epoch": 0.09, + "learning_rate": 1.9827001538643752e-06, + "loss": 0.9854, + "step": 3415 + }, + { + "epoch": 0.09, + "learning_rate": 1.9826847763324066e-06, + "loss": 1.0684, + "step": 3416 + }, + { + "epoch": 0.09, + "learning_rate": 1.9826693920287496e-06, + "loss": 0.8672, + "step": 3417 + }, + { + "epoch": 0.09, + "learning_rate": 1.98265400095351e-06, + "loss": 0.9668, + "step": 3418 + }, + { + "epoch": 0.09, + "learning_rate": 1.9826386031067946e-06, + "loss": 0.8311, + "step": 3419 + }, + { + "epoch": 0.09, + "learning_rate": 1.9826231984887096e-06, + "loss": 1.0596, + "step": 3420 + }, + { + "epoch": 0.09, + "learning_rate": 1.98260778709936e-06, + "loss": 0.8618, + "step": 3421 + }, + { + "epoch": 0.09, + "learning_rate": 1.982592368938853e-06, + "loss": 0.8994, + "step": 3422 + }, + { + "epoch": 0.09, + "learning_rate": 1.9825769440072947e-06, + "loss": 0.998, + "step": 3423 + }, + { + "epoch": 0.09, + "learning_rate": 1.9825615123047913e-06, + "loss": 0.8701, + "step": 3424 + }, + { + "epoch": 0.09, + "learning_rate": 1.9825460738314486e-06, + "loss": 1.0703, + "step": 3425 + }, + { + "epoch": 0.09, + "learning_rate": 1.9825306285873744e-06, + "loss": 0.9551, + "step": 3426 + }, + { + "epoch": 0.09, + "learning_rate": 1.982515176572673e-06, + "loss": 1.0049, + "step": 3427 + }, + { + "epoch": 0.09, + "learning_rate": 1.9824997177874533e-06, + "loss": 0.9814, + "step": 3428 + }, + { + "epoch": 0.09, + "learning_rate": 1.9824842522318195e-06, + "loss": 0.9756, + "step": 3429 + }, + { + "epoch": 0.09, + "learning_rate": 1.98246877990588e-06, + "loss": 0.9854, + "step": 3430 + }, + { + "epoch": 0.09, + "learning_rate": 1.9824533008097407e-06, + "loss": 0.8311, + "step": 3431 + }, + { + "epoch": 0.09, + "learning_rate": 1.9824378149435083e-06, + "loss": 0.7773, + "step": 3432 + }, + { + "epoch": 0.09, + "learning_rate": 1.9824223223072893e-06, + "loss": 1.0459, + "step": 3433 + }, + { + "epoch": 0.09, + "learning_rate": 1.982406822901191e-06, + "loss": 1.1885, + "step": 3434 + }, + { + "epoch": 0.09, + "learning_rate": 1.9823913167253195e-06, + "loss": 0.8291, + "step": 3435 + }, + { + "epoch": 0.09, + "learning_rate": 1.9823758037797818e-06, + "loss": 0.7935, + "step": 3436 + }, + { + "epoch": 0.09, + "learning_rate": 1.9823602840646856e-06, + "loss": 0.668, + "step": 3437 + }, + { + "epoch": 0.09, + "learning_rate": 1.9823447575801368e-06, + "loss": 0.8765, + "step": 3438 + }, + { + "epoch": 0.09, + "learning_rate": 1.982329224326243e-06, + "loss": 1.0137, + "step": 3439 + }, + { + "epoch": 0.09, + "learning_rate": 1.982313684303111e-06, + "loss": 1.083, + "step": 3440 + }, + { + "epoch": 0.09, + "learning_rate": 1.982298137510848e-06, + "loss": 0.9062, + "step": 3441 + }, + { + "epoch": 0.09, + "learning_rate": 1.9822825839495613e-06, + "loss": 0.9541, + "step": 3442 + }, + { + "epoch": 0.09, + "learning_rate": 1.982267023619358e-06, + "loss": 0.9253, + "step": 3443 + }, + { + "epoch": 0.09, + "learning_rate": 1.9822514565203448e-06, + "loss": 0.9795, + "step": 3444 + }, + { + "epoch": 0.09, + "learning_rate": 1.9822358826526298e-06, + "loss": 1.0156, + "step": 3445 + }, + { + "epoch": 0.09, + "learning_rate": 1.98222030201632e-06, + "loss": 0.8994, + "step": 3446 + }, + { + "epoch": 0.09, + "learning_rate": 1.982204714611522e-06, + "loss": 0.854, + "step": 3447 + }, + { + "epoch": 0.09, + "learning_rate": 1.9821891204383444e-06, + "loss": 1.0479, + "step": 3448 + }, + { + "epoch": 0.09, + "learning_rate": 1.982173519496894e-06, + "loss": 1.0957, + "step": 3449 + }, + { + "epoch": 0.09, + "learning_rate": 1.9821579117872787e-06, + "loss": 1.2402, + "step": 3450 + }, + { + "epoch": 0.09, + "learning_rate": 1.9821422973096054e-06, + "loss": 0.9775, + "step": 3451 + }, + { + "epoch": 0.09, + "learning_rate": 1.9821266760639826e-06, + "loss": 0.9121, + "step": 3452 + }, + { + "epoch": 0.09, + "learning_rate": 1.982111048050517e-06, + "loss": 1.1973, + "step": 3453 + }, + { + "epoch": 0.09, + "learning_rate": 1.982095413269317e-06, + "loss": 0.9146, + "step": 3454 + }, + { + "epoch": 0.09, + "learning_rate": 1.98207977172049e-06, + "loss": 0.7881, + "step": 3455 + }, + { + "epoch": 0.09, + "learning_rate": 1.982064123404144e-06, + "loss": 0.8799, + "step": 3456 + }, + { + "epoch": 0.09, + "learning_rate": 1.9820484683203867e-06, + "loss": 0.9336, + "step": 3457 + }, + { + "epoch": 0.09, + "learning_rate": 1.9820328064693257e-06, + "loss": 0.8975, + "step": 3458 + }, + { + "epoch": 0.09, + "learning_rate": 1.9820171378510695e-06, + "loss": 0.8398, + "step": 3459 + }, + { + "epoch": 0.09, + "learning_rate": 1.9820014624657257e-06, + "loss": 0.8477, + "step": 3460 + }, + { + "epoch": 0.09, + "learning_rate": 1.9819857803134025e-06, + "loss": 0.9717, + "step": 3461 + }, + { + "epoch": 0.09, + "learning_rate": 1.9819700913942077e-06, + "loss": 1.125, + "step": 3462 + }, + { + "epoch": 0.09, + "learning_rate": 1.9819543957082497e-06, + "loss": 0.9927, + "step": 3463 + }, + { + "epoch": 0.09, + "learning_rate": 1.9819386932556363e-06, + "loss": 0.9736, + "step": 3464 + }, + { + "epoch": 0.09, + "learning_rate": 1.981922984036476e-06, + "loss": 0.8535, + "step": 3465 + }, + { + "epoch": 0.09, + "learning_rate": 1.9819072680508776e-06, + "loss": 0.8262, + "step": 3466 + }, + { + "epoch": 0.09, + "learning_rate": 1.981891545298948e-06, + "loss": 1.2754, + "step": 3467 + }, + { + "epoch": 0.09, + "learning_rate": 1.9818758157807967e-06, + "loss": 0.6885, + "step": 3468 + }, + { + "epoch": 0.09, + "learning_rate": 1.9818600794965317e-06, + "loss": 0.8311, + "step": 3469 + }, + { + "epoch": 0.09, + "learning_rate": 1.9818443364462616e-06, + "loss": 0.7017, + "step": 3470 + }, + { + "epoch": 0.09, + "learning_rate": 1.9818285866300946e-06, + "loss": 1.0674, + "step": 3471 + }, + { + "epoch": 0.09, + "learning_rate": 1.9818128300481394e-06, + "loss": 1.0508, + "step": 3472 + }, + { + "epoch": 0.09, + "learning_rate": 1.9817970667005047e-06, + "loss": 1.0576, + "step": 3473 + }, + { + "epoch": 0.09, + "learning_rate": 1.981781296587299e-06, + "loss": 0.8584, + "step": 3474 + }, + { + "epoch": 0.09, + "learning_rate": 1.981765519708631e-06, + "loss": 1.0112, + "step": 3475 + }, + { + "epoch": 0.09, + "learning_rate": 1.9817497360646087e-06, + "loss": 0.9346, + "step": 3476 + }, + { + "epoch": 0.09, + "learning_rate": 1.9817339456553424e-06, + "loss": 0.9209, + "step": 3477 + }, + { + "epoch": 0.09, + "learning_rate": 1.9817181484809396e-06, + "loss": 0.8174, + "step": 3478 + }, + { + "epoch": 0.09, + "learning_rate": 1.9817023445415103e-06, + "loss": 0.9424, + "step": 3479 + }, + { + "epoch": 0.09, + "learning_rate": 1.9816865338371622e-06, + "loss": 0.9639, + "step": 3480 + }, + { + "epoch": 0.09, + "learning_rate": 1.9816707163680046e-06, + "loss": 0.9839, + "step": 3481 + }, + { + "epoch": 0.09, + "learning_rate": 1.981654892134147e-06, + "loss": 1.0654, + "step": 3482 + }, + { + "epoch": 0.09, + "learning_rate": 1.981639061135698e-06, + "loss": 0.9609, + "step": 3483 + }, + { + "epoch": 0.09, + "learning_rate": 1.9816232233727668e-06, + "loss": 0.9932, + "step": 3484 + }, + { + "epoch": 0.09, + "learning_rate": 1.9816073788454626e-06, + "loss": 0.853, + "step": 3485 + }, + { + "epoch": 0.09, + "learning_rate": 1.9815915275538944e-06, + "loss": 0.8066, + "step": 3486 + }, + { + "epoch": 0.09, + "learning_rate": 1.9815756694981718e-06, + "loss": 1.3145, + "step": 3487 + }, + { + "epoch": 0.09, + "learning_rate": 1.9815598046784036e-06, + "loss": 0.8789, + "step": 3488 + }, + { + "epoch": 0.09, + "learning_rate": 1.9815439330946996e-06, + "loss": 0.9424, + "step": 3489 + }, + { + "epoch": 0.09, + "learning_rate": 1.981528054747169e-06, + "loss": 1.0273, + "step": 3490 + }, + { + "epoch": 0.09, + "learning_rate": 1.981512169635921e-06, + "loss": 1.2324, + "step": 3491 + }, + { + "epoch": 0.09, + "learning_rate": 1.981496277761065e-06, + "loss": 0.9609, + "step": 3492 + }, + { + "epoch": 0.09, + "learning_rate": 1.9814803791227114e-06, + "loss": 0.8066, + "step": 3493 + }, + { + "epoch": 0.09, + "learning_rate": 1.9814644737209684e-06, + "loss": 0.9458, + "step": 3494 + }, + { + "epoch": 0.09, + "learning_rate": 1.9814485615559468e-06, + "loss": 1.0811, + "step": 3495 + }, + { + "epoch": 0.09, + "learning_rate": 1.9814326426277554e-06, + "loss": 0.9805, + "step": 3496 + }, + { + "epoch": 0.09, + "learning_rate": 1.981416716936504e-06, + "loss": 1.1035, + "step": 3497 + }, + { + "epoch": 0.09, + "learning_rate": 1.981400784482303e-06, + "loss": 0.9629, + "step": 3498 + }, + { + "epoch": 0.09, + "learning_rate": 1.981384845265262e-06, + "loss": 0.7427, + "step": 3499 + }, + { + "epoch": 0.09, + "learning_rate": 1.98136889928549e-06, + "loss": 1.1133, + "step": 3500 + }, + { + "epoch": 0.09, + "learning_rate": 1.9813529465430985e-06, + "loss": 1.1309, + "step": 3501 + }, + { + "epoch": 0.09, + "learning_rate": 1.9813369870381957e-06, + "loss": 0.9766, + "step": 3502 + }, + { + "epoch": 0.09, + "learning_rate": 1.9813210207708923e-06, + "loss": 1.0459, + "step": 3503 + }, + { + "epoch": 0.09, + "learning_rate": 1.9813050477412984e-06, + "loss": 0.9219, + "step": 3504 + }, + { + "epoch": 0.09, + "learning_rate": 1.981289067949524e-06, + "loss": 0.8691, + "step": 3505 + }, + { + "epoch": 0.09, + "learning_rate": 1.9812730813956792e-06, + "loss": 0.9092, + "step": 3506 + }, + { + "epoch": 0.09, + "learning_rate": 1.981257088079874e-06, + "loss": 1.0566, + "step": 3507 + }, + { + "epoch": 0.09, + "learning_rate": 1.9812410880022194e-06, + "loss": 0.9473, + "step": 3508 + }, + { + "epoch": 0.09, + "learning_rate": 1.9812250811628247e-06, + "loss": 0.7129, + "step": 3509 + }, + { + "epoch": 0.09, + "learning_rate": 1.9812090675618003e-06, + "loss": 0.7993, + "step": 3510 + }, + { + "epoch": 0.09, + "learning_rate": 1.981193047199257e-06, + "loss": 1.1602, + "step": 3511 + }, + { + "epoch": 0.09, + "learning_rate": 1.981177020075305e-06, + "loss": 1.0273, + "step": 3512 + }, + { + "epoch": 0.09, + "learning_rate": 1.981160986190055e-06, + "loss": 0.9531, + "step": 3513 + }, + { + "epoch": 0.09, + "learning_rate": 1.9811449455436167e-06, + "loss": 0.8975, + "step": 3514 + }, + { + "epoch": 0.09, + "learning_rate": 1.9811288981361017e-06, + "loss": 1.0117, + "step": 3515 + }, + { + "epoch": 0.09, + "learning_rate": 1.9811128439676196e-06, + "loss": 0.5906, + "step": 3516 + }, + { + "epoch": 0.09, + "learning_rate": 1.981096783038282e-06, + "loss": 1.0488, + "step": 3517 + }, + { + "epoch": 0.09, + "learning_rate": 1.9810807153481987e-06, + "loss": 0.6719, + "step": 3518 + }, + { + "epoch": 0.09, + "learning_rate": 1.9810646408974806e-06, + "loss": 0.9736, + "step": 3519 + }, + { + "epoch": 0.09, + "learning_rate": 1.981048559686239e-06, + "loss": 0.9824, + "step": 3520 + }, + { + "epoch": 0.09, + "learning_rate": 1.9810324717145844e-06, + "loss": 1.1797, + "step": 3521 + }, + { + "epoch": 0.09, + "learning_rate": 1.9810163769826275e-06, + "loss": 1.0225, + "step": 3522 + }, + { + "epoch": 0.09, + "learning_rate": 1.9810002754904795e-06, + "loss": 0.9707, + "step": 3523 + }, + { + "epoch": 0.09, + "learning_rate": 1.980984167238251e-06, + "loss": 1.0215, + "step": 3524 + }, + { + "epoch": 0.09, + "learning_rate": 1.980968052226053e-06, + "loss": 0.7119, + "step": 3525 + }, + { + "epoch": 0.09, + "learning_rate": 1.980951930453997e-06, + "loss": 0.8613, + "step": 3526 + }, + { + "epoch": 0.09, + "learning_rate": 1.9809358019221937e-06, + "loss": 0.6729, + "step": 3527 + }, + { + "epoch": 0.09, + "learning_rate": 1.9809196666307545e-06, + "loss": 0.9814, + "step": 3528 + }, + { + "epoch": 0.09, + "learning_rate": 1.9809035245797903e-06, + "loss": 0.8408, + "step": 3529 + }, + { + "epoch": 0.09, + "learning_rate": 1.980887375769413e-06, + "loss": 0.9688, + "step": 3530 + }, + { + "epoch": 0.09, + "learning_rate": 1.9808712201997327e-06, + "loss": 1.0371, + "step": 3531 + }, + { + "epoch": 0.09, + "learning_rate": 1.980855057870862e-06, + "loss": 0.8848, + "step": 3532 + }, + { + "epoch": 0.09, + "learning_rate": 1.9808388887829115e-06, + "loss": 0.9922, + "step": 3533 + }, + { + "epoch": 0.09, + "learning_rate": 1.9808227129359925e-06, + "loss": 1.127, + "step": 3534 + }, + { + "epoch": 0.09, + "learning_rate": 1.980806530330217e-06, + "loss": 0.8213, + "step": 3535 + }, + { + "epoch": 0.09, + "learning_rate": 1.980790340965696e-06, + "loss": 0.8018, + "step": 3536 + }, + { + "epoch": 0.09, + "learning_rate": 1.980774144842542e-06, + "loss": 0.9824, + "step": 3537 + }, + { + "epoch": 0.09, + "learning_rate": 1.9807579419608657e-06, + "loss": 0.8525, + "step": 3538 + }, + { + "epoch": 0.09, + "learning_rate": 1.9807417323207787e-06, + "loss": 0.6411, + "step": 3539 + }, + { + "epoch": 0.09, + "learning_rate": 1.9807255159223933e-06, + "loss": 0.8428, + "step": 3540 + }, + { + "epoch": 0.09, + "learning_rate": 1.980709292765821e-06, + "loss": 0.9795, + "step": 3541 + }, + { + "epoch": 0.09, + "learning_rate": 1.9806930628511732e-06, + "loss": 0.957, + "step": 3542 + }, + { + "epoch": 0.09, + "learning_rate": 1.9806768261785625e-06, + "loss": 0.8936, + "step": 3543 + }, + { + "epoch": 0.09, + "learning_rate": 1.9806605827481002e-06, + "loss": 1.041, + "step": 3544 + }, + { + "epoch": 0.09, + "learning_rate": 1.9806443325598985e-06, + "loss": 1.0479, + "step": 3545 + }, + { + "epoch": 0.09, + "learning_rate": 1.980628075614069e-06, + "loss": 1.0342, + "step": 3546 + }, + { + "epoch": 0.09, + "learning_rate": 1.9806118119107246e-06, + "loss": 1.1104, + "step": 3547 + }, + { + "epoch": 0.09, + "learning_rate": 1.980595541449976e-06, + "loss": 0.9688, + "step": 3548 + }, + { + "epoch": 0.09, + "learning_rate": 1.9805792642319366e-06, + "loss": 0.9521, + "step": 3549 + }, + { + "epoch": 0.09, + "learning_rate": 1.9805629802567184e-06, + "loss": 0.9111, + "step": 3550 + }, + { + "epoch": 0.09, + "learning_rate": 1.980546689524433e-06, + "loss": 0.8965, + "step": 3551 + }, + { + "epoch": 0.09, + "learning_rate": 1.9805303920351926e-06, + "loss": 0.9395, + "step": 3552 + }, + { + "epoch": 0.09, + "learning_rate": 1.9805140877891106e-06, + "loss": 1.0391, + "step": 3553 + }, + { + "epoch": 0.09, + "learning_rate": 1.980497776786298e-06, + "loss": 0.8467, + "step": 3554 + }, + { + "epoch": 0.09, + "learning_rate": 1.980481459026868e-06, + "loss": 0.9619, + "step": 3555 + }, + { + "epoch": 0.09, + "learning_rate": 1.9804651345109327e-06, + "loss": 1.1328, + "step": 3556 + }, + { + "epoch": 0.09, + "learning_rate": 1.9804488032386048e-06, + "loss": 0.8101, + "step": 3557 + }, + { + "epoch": 0.09, + "learning_rate": 1.980432465209997e-06, + "loss": 1.0, + "step": 3558 + }, + { + "epoch": 0.09, + "learning_rate": 1.9804161204252217e-06, + "loss": 0.8623, + "step": 3559 + }, + { + "epoch": 0.09, + "learning_rate": 1.9803997688843915e-06, + "loss": 0.8398, + "step": 3560 + }, + { + "epoch": 0.09, + "learning_rate": 1.980383410587619e-06, + "loss": 1.0117, + "step": 3561 + }, + { + "epoch": 0.09, + "learning_rate": 1.980367045535017e-06, + "loss": 0.7671, + "step": 3562 + }, + { + "epoch": 0.09, + "learning_rate": 1.9803506737266978e-06, + "loss": 0.9961, + "step": 3563 + }, + { + "epoch": 0.09, + "learning_rate": 1.9803342951627755e-06, + "loss": 1.1045, + "step": 3564 + }, + { + "epoch": 0.09, + "learning_rate": 1.980317909843362e-06, + "loss": 1.0381, + "step": 3565 + }, + { + "epoch": 0.09, + "learning_rate": 1.98030151776857e-06, + "loss": 0.9795, + "step": 3566 + }, + { + "epoch": 0.09, + "learning_rate": 1.980285118938513e-06, + "loss": 0.9883, + "step": 3567 + }, + { + "epoch": 0.09, + "learning_rate": 1.980268713353304e-06, + "loss": 0.998, + "step": 3568 + }, + { + "epoch": 0.09, + "learning_rate": 1.9802523010130557e-06, + "loss": 0.832, + "step": 3569 + }, + { + "epoch": 0.09, + "learning_rate": 1.9802358819178815e-06, + "loss": 1.1631, + "step": 3570 + }, + { + "epoch": 0.09, + "learning_rate": 1.9802194560678943e-06, + "loss": 0.8584, + "step": 3571 + }, + { + "epoch": 0.09, + "learning_rate": 1.9802030234632078e-06, + "loss": 1.1465, + "step": 3572 + }, + { + "epoch": 0.09, + "learning_rate": 1.980186584103934e-06, + "loss": 1.0527, + "step": 3573 + }, + { + "epoch": 0.09, + "learning_rate": 1.980170137990188e-06, + "loss": 1.1035, + "step": 3574 + }, + { + "epoch": 0.09, + "learning_rate": 1.9801536851220817e-06, + "loss": 0.7163, + "step": 3575 + }, + { + "epoch": 0.09, + "learning_rate": 1.9801372254997293e-06, + "loss": 0.9834, + "step": 3576 + }, + { + "epoch": 0.09, + "learning_rate": 1.9801207591232436e-06, + "loss": 0.9434, + "step": 3577 + }, + { + "epoch": 0.09, + "learning_rate": 1.980104285992738e-06, + "loss": 0.9004, + "step": 3578 + }, + { + "epoch": 0.09, + "learning_rate": 1.980087806108327e-06, + "loss": 0.9707, + "step": 3579 + }, + { + "epoch": 0.09, + "learning_rate": 1.9800713194701233e-06, + "loss": 0.916, + "step": 3580 + }, + { + "epoch": 0.09, + "learning_rate": 1.9800548260782406e-06, + "loss": 0.9883, + "step": 3581 + }, + { + "epoch": 0.09, + "learning_rate": 1.980038325932793e-06, + "loss": 1.0332, + "step": 3582 + }, + { + "epoch": 0.09, + "learning_rate": 1.9800218190338933e-06, + "loss": 0.8501, + "step": 3583 + }, + { + "epoch": 0.09, + "learning_rate": 1.9800053053816567e-06, + "loss": 0.769, + "step": 3584 + }, + { + "epoch": 0.09, + "learning_rate": 1.9799887849761954e-06, + "loss": 0.9287, + "step": 3585 + }, + { + "epoch": 0.09, + "learning_rate": 1.979972257817624e-06, + "loss": 1.1221, + "step": 3586 + }, + { + "epoch": 0.09, + "learning_rate": 1.979955723906057e-06, + "loss": 0.9307, + "step": 3587 + }, + { + "epoch": 0.09, + "learning_rate": 1.979939183241607e-06, + "loss": 0.9766, + "step": 3588 + }, + { + "epoch": 0.09, + "learning_rate": 1.979922635824389e-06, + "loss": 0.7964, + "step": 3589 + }, + { + "epoch": 0.09, + "learning_rate": 1.979906081654517e-06, + "loss": 0.9414, + "step": 3590 + }, + { + "epoch": 0.09, + "learning_rate": 1.9798895207321045e-06, + "loss": 0.7886, + "step": 3591 + }, + { + "epoch": 0.09, + "learning_rate": 1.9798729530572657e-06, + "loss": 0.8467, + "step": 3592 + }, + { + "epoch": 0.09, + "learning_rate": 1.9798563786301153e-06, + "loss": 0.9126, + "step": 3593 + }, + { + "epoch": 0.09, + "learning_rate": 1.979839797450767e-06, + "loss": 0.8506, + "step": 3594 + }, + { + "epoch": 0.09, + "learning_rate": 1.9798232095193353e-06, + "loss": 0.9785, + "step": 3595 + }, + { + "epoch": 0.09, + "learning_rate": 1.9798066148359344e-06, + "loss": 1.0801, + "step": 3596 + }, + { + "epoch": 0.09, + "learning_rate": 1.979790013400679e-06, + "loss": 1.1357, + "step": 3597 + }, + { + "epoch": 0.09, + "learning_rate": 1.979773405213683e-06, + "loss": 0.9746, + "step": 3598 + }, + { + "epoch": 0.09, + "learning_rate": 1.979756790275061e-06, + "loss": 1.0059, + "step": 3599 + }, + { + "epoch": 0.09, + "learning_rate": 1.979740168584928e-06, + "loss": 0.7754, + "step": 3600 + }, + { + "epoch": 0.09, + "learning_rate": 1.9797235401433973e-06, + "loss": 0.8628, + "step": 3601 + }, + { + "epoch": 0.09, + "learning_rate": 1.979706904950585e-06, + "loss": 0.9824, + "step": 3602 + }, + { + "epoch": 0.09, + "learning_rate": 1.9796902630066045e-06, + "loss": 0.8779, + "step": 3603 + }, + { + "epoch": 0.09, + "learning_rate": 1.9796736143115714e-06, + "loss": 0.9307, + "step": 3604 + }, + { + "epoch": 0.09, + "learning_rate": 1.9796569588656e-06, + "loss": 0.8379, + "step": 3605 + }, + { + "epoch": 0.09, + "learning_rate": 1.9796402966688046e-06, + "loss": 0.8311, + "step": 3606 + }, + { + "epoch": 0.09, + "learning_rate": 1.9796236277213014e-06, + "loss": 0.7515, + "step": 3607 + }, + { + "epoch": 0.09, + "learning_rate": 1.979606952023204e-06, + "loss": 0.9229, + "step": 3608 + }, + { + "epoch": 0.09, + "learning_rate": 1.9795902695746274e-06, + "loss": 0.6699, + "step": 3609 + }, + { + "epoch": 0.09, + "learning_rate": 1.9795735803756866e-06, + "loss": 1.2305, + "step": 3610 + }, + { + "epoch": 0.09, + "learning_rate": 1.9795568844264976e-06, + "loss": 0.8516, + "step": 3611 + }, + { + "epoch": 0.09, + "learning_rate": 1.979540181727174e-06, + "loss": 0.9365, + "step": 3612 + }, + { + "epoch": 0.09, + "learning_rate": 1.979523472277832e-06, + "loss": 0.9209, + "step": 3613 + }, + { + "epoch": 0.09, + "learning_rate": 1.9795067560785867e-06, + "loss": 1.0586, + "step": 3614 + }, + { + "epoch": 0.09, + "learning_rate": 1.9794900331295524e-06, + "loss": 1.0186, + "step": 3615 + }, + { + "epoch": 0.09, + "learning_rate": 1.979473303430845e-06, + "loss": 1.168, + "step": 3616 + }, + { + "epoch": 0.09, + "learning_rate": 1.97945656698258e-06, + "loss": 1.0156, + "step": 3617 + }, + { + "epoch": 0.09, + "learning_rate": 1.979439823784872e-06, + "loss": 1.0459, + "step": 3618 + }, + { + "epoch": 0.09, + "learning_rate": 1.979423073837837e-06, + "loss": 0.9873, + "step": 3619 + }, + { + "epoch": 0.09, + "learning_rate": 1.97940631714159e-06, + "loss": 1.1172, + "step": 3620 + }, + { + "epoch": 0.09, + "learning_rate": 1.979389553696247e-06, + "loss": 1.1152, + "step": 3621 + }, + { + "epoch": 0.09, + "learning_rate": 1.979372783501923e-06, + "loss": 1.1348, + "step": 3622 + }, + { + "epoch": 0.09, + "learning_rate": 1.9793560065587338e-06, + "loss": 1.0254, + "step": 3623 + }, + { + "epoch": 0.09, + "learning_rate": 1.9793392228667947e-06, + "loss": 0.9062, + "step": 3624 + }, + { + "epoch": 0.09, + "learning_rate": 1.979322432426222e-06, + "loss": 0.8447, + "step": 3625 + }, + { + "epoch": 0.09, + "learning_rate": 1.9793056352371303e-06, + "loss": 0.6501, + "step": 3626 + }, + { + "epoch": 0.09, + "learning_rate": 1.9792888312996367e-06, + "loss": 0.7432, + "step": 3627 + }, + { + "epoch": 0.09, + "learning_rate": 1.979272020613856e-06, + "loss": 0.8154, + "step": 3628 + }, + { + "epoch": 0.09, + "learning_rate": 1.979255203179905e-06, + "loss": 0.8408, + "step": 3629 + }, + { + "epoch": 0.09, + "learning_rate": 1.979238378997899e-06, + "loss": 1.1689, + "step": 3630 + }, + { + "epoch": 0.09, + "learning_rate": 1.979221548067953e-06, + "loss": 1.0488, + "step": 3631 + }, + { + "epoch": 0.09, + "learning_rate": 1.979204710390185e-06, + "loss": 1.3066, + "step": 3632 + }, + { + "epoch": 0.09, + "learning_rate": 1.979187865964709e-06, + "loss": 0.8789, + "step": 3633 + }, + { + "epoch": 0.09, + "learning_rate": 1.9791710147916426e-06, + "loss": 0.8496, + "step": 3634 + }, + { + "epoch": 0.09, + "learning_rate": 1.979154156871101e-06, + "loss": 0.9893, + "step": 3635 + }, + { + "epoch": 0.09, + "learning_rate": 1.979137292203201e-06, + "loss": 1.083, + "step": 3636 + }, + { + "epoch": 0.09, + "learning_rate": 1.9791204207880585e-06, + "loss": 0.7617, + "step": 3637 + }, + { + "epoch": 0.09, + "learning_rate": 1.97910354262579e-06, + "loss": 1.0557, + "step": 3638 + }, + { + "epoch": 0.09, + "learning_rate": 1.979086657716511e-06, + "loss": 1.0049, + "step": 3639 + }, + { + "epoch": 0.09, + "learning_rate": 1.979069766060339e-06, + "loss": 1.1094, + "step": 3640 + }, + { + "epoch": 0.09, + "learning_rate": 1.9790528676573895e-06, + "loss": 0.8398, + "step": 3641 + }, + { + "epoch": 0.09, + "learning_rate": 1.979035962507779e-06, + "loss": 0.8857, + "step": 3642 + }, + { + "epoch": 0.09, + "learning_rate": 1.979019050611625e-06, + "loss": 0.7837, + "step": 3643 + }, + { + "epoch": 0.09, + "learning_rate": 1.979002131969043e-06, + "loss": 0.7483, + "step": 3644 + }, + { + "epoch": 0.09, + "learning_rate": 1.97898520658015e-06, + "loss": 0.9727, + "step": 3645 + }, + { + "epoch": 0.09, + "learning_rate": 1.978968274445063e-06, + "loss": 1.0391, + "step": 3646 + }, + { + "epoch": 0.09, + "learning_rate": 1.9789513355638976e-06, + "loss": 0.8623, + "step": 3647 + }, + { + "epoch": 0.09, + "learning_rate": 1.978934389936771e-06, + "loss": 1.0908, + "step": 3648 + }, + { + "epoch": 0.09, + "learning_rate": 1.9789174375638002e-06, + "loss": 0.8848, + "step": 3649 + }, + { + "epoch": 0.09, + "learning_rate": 1.9789004784451023e-06, + "loss": 0.9619, + "step": 3650 + }, + { + "epoch": 0.09, + "learning_rate": 1.9788835125807933e-06, + "loss": 0.9473, + "step": 3651 + }, + { + "epoch": 0.09, + "learning_rate": 1.9788665399709912e-06, + "loss": 0.9629, + "step": 3652 + }, + { + "epoch": 0.09, + "learning_rate": 1.9788495606158122e-06, + "loss": 0.9316, + "step": 3653 + }, + { + "epoch": 0.09, + "learning_rate": 1.978832574515373e-06, + "loss": 0.9873, + "step": 3654 + }, + { + "epoch": 0.09, + "learning_rate": 1.978815581669792e-06, + "loss": 0.8789, + "step": 3655 + }, + { + "epoch": 0.09, + "learning_rate": 1.9787985820791846e-06, + "loss": 0.9248, + "step": 3656 + }, + { + "epoch": 0.09, + "learning_rate": 1.9787815757436693e-06, + "loss": 1.127, + "step": 3657 + }, + { + "epoch": 0.09, + "learning_rate": 1.9787645626633627e-06, + "loss": 0.8652, + "step": 3658 + }, + { + "epoch": 0.09, + "learning_rate": 1.978747542838382e-06, + "loss": 0.998, + "step": 3659 + }, + { + "epoch": 0.09, + "learning_rate": 1.9787305162688444e-06, + "loss": 0.96, + "step": 3660 + }, + { + "epoch": 0.09, + "learning_rate": 1.978713482954868e-06, + "loss": 1.165, + "step": 3661 + }, + { + "epoch": 0.09, + "learning_rate": 1.978696442896569e-06, + "loss": 0.9854, + "step": 3662 + }, + { + "epoch": 0.09, + "learning_rate": 1.9786793960940656e-06, + "loss": 1.0596, + "step": 3663 + }, + { + "epoch": 0.09, + "learning_rate": 1.9786623425474753e-06, + "loss": 1.0039, + "step": 3664 + }, + { + "epoch": 0.09, + "learning_rate": 1.9786452822569154e-06, + "loss": 0.9346, + "step": 3665 + }, + { + "epoch": 0.09, + "learning_rate": 1.9786282152225032e-06, + "loss": 0.9014, + "step": 3666 + }, + { + "epoch": 0.09, + "learning_rate": 1.9786111414443565e-06, + "loss": 1.0381, + "step": 3667 + }, + { + "epoch": 0.09, + "learning_rate": 1.9785940609225934e-06, + "loss": 0.957, + "step": 3668 + }, + { + "epoch": 0.09, + "learning_rate": 1.978576973657331e-06, + "loss": 0.9443, + "step": 3669 + }, + { + "epoch": 0.09, + "learning_rate": 1.9785598796486873e-06, + "loss": 0.9033, + "step": 3670 + }, + { + "epoch": 0.09, + "learning_rate": 1.97854277889678e-06, + "loss": 0.9331, + "step": 3671 + }, + { + "epoch": 0.09, + "learning_rate": 1.9785256714017272e-06, + "loss": 0.8008, + "step": 3672 + }, + { + "epoch": 0.09, + "learning_rate": 1.9785085571636466e-06, + "loss": 1.0693, + "step": 3673 + }, + { + "epoch": 0.09, + "learning_rate": 1.978491436182656e-06, + "loss": 0.7695, + "step": 3674 + }, + { + "epoch": 0.09, + "learning_rate": 1.978474308458874e-06, + "loss": 0.8545, + "step": 3675 + }, + { + "epoch": 0.09, + "learning_rate": 1.9784571739924174e-06, + "loss": 1.1025, + "step": 3676 + }, + { + "epoch": 0.09, + "learning_rate": 1.9784400327834055e-06, + "loss": 0.7803, + "step": 3677 + }, + { + "epoch": 0.09, + "learning_rate": 1.9784228848319557e-06, + "loss": 1.0234, + "step": 3678 + }, + { + "epoch": 0.09, + "learning_rate": 1.978405730138187e-06, + "loss": 0.9766, + "step": 3679 + }, + { + "epoch": 0.09, + "learning_rate": 1.978388568702216e-06, + "loss": 0.7783, + "step": 3680 + }, + { + "epoch": 0.09, + "learning_rate": 1.9783714005241626e-06, + "loss": 0.9697, + "step": 3681 + }, + { + "epoch": 0.09, + "learning_rate": 1.9783542256041444e-06, + "loss": 1.0332, + "step": 3682 + }, + { + "epoch": 0.09, + "learning_rate": 1.9783370439422797e-06, + "loss": 0.9961, + "step": 3683 + }, + { + "epoch": 0.09, + "learning_rate": 1.9783198555386874e-06, + "loss": 0.9785, + "step": 3684 + }, + { + "epoch": 0.09, + "learning_rate": 1.9783026603934854e-06, + "loss": 0.7075, + "step": 3685 + }, + { + "epoch": 0.09, + "learning_rate": 1.9782854585067923e-06, + "loss": 1.1289, + "step": 3686 + }, + { + "epoch": 0.09, + "learning_rate": 1.978268249878727e-06, + "loss": 0.6968, + "step": 3687 + }, + { + "epoch": 0.09, + "learning_rate": 1.9782510345094075e-06, + "loss": 1.0898, + "step": 3688 + }, + { + "epoch": 0.09, + "learning_rate": 1.9782338123989527e-06, + "loss": 1.0859, + "step": 3689 + }, + { + "epoch": 0.09, + "learning_rate": 1.9782165835474815e-06, + "loss": 0.79, + "step": 3690 + }, + { + "epoch": 0.09, + "learning_rate": 1.978199347955112e-06, + "loss": 0.915, + "step": 3691 + }, + { + "epoch": 0.09, + "learning_rate": 1.9781821056219638e-06, + "loss": 0.7925, + "step": 3692 + }, + { + "epoch": 0.09, + "learning_rate": 1.9781648565481556e-06, + "loss": 0.8066, + "step": 3693 + }, + { + "epoch": 0.09, + "learning_rate": 1.9781476007338054e-06, + "loss": 1.0156, + "step": 3694 + }, + { + "epoch": 0.09, + "learning_rate": 1.978130338179033e-06, + "loss": 1.124, + "step": 3695 + }, + { + "epoch": 0.09, + "learning_rate": 1.978113068883957e-06, + "loss": 0.9717, + "step": 3696 + }, + { + "epoch": 0.09, + "learning_rate": 1.9780957928486967e-06, + "loss": 1.168, + "step": 3697 + }, + { + "epoch": 0.09, + "learning_rate": 1.9780785100733708e-06, + "loss": 0.6641, + "step": 3698 + }, + { + "epoch": 0.09, + "learning_rate": 1.9780612205580983e-06, + "loss": 0.9961, + "step": 3699 + }, + { + "epoch": 0.09, + "learning_rate": 1.9780439243029986e-06, + "loss": 0.7305, + "step": 3700 + }, + { + "epoch": 0.09, + "learning_rate": 1.9780266213081907e-06, + "loss": 0.8867, + "step": 3701 + }, + { + "epoch": 0.09, + "learning_rate": 1.978009311573794e-06, + "loss": 0.8936, + "step": 3702 + }, + { + "epoch": 0.09, + "learning_rate": 1.977991995099928e-06, + "loss": 0.7646, + "step": 3703 + }, + { + "epoch": 0.09, + "learning_rate": 1.9779746718867114e-06, + "loss": 0.856, + "step": 3704 + }, + { + "epoch": 0.09, + "learning_rate": 1.9779573419342643e-06, + "loss": 0.792, + "step": 3705 + }, + { + "epoch": 0.09, + "learning_rate": 1.9779400052427053e-06, + "loss": 0.8894, + "step": 3706 + }, + { + "epoch": 0.1, + "learning_rate": 1.9779226618121548e-06, + "loss": 0.8242, + "step": 3707 + }, + { + "epoch": 0.1, + "learning_rate": 1.9779053116427316e-06, + "loss": 0.8091, + "step": 3708 + }, + { + "epoch": 0.1, + "learning_rate": 1.9778879547345557e-06, + "loss": 0.9805, + "step": 3709 + }, + { + "epoch": 0.1, + "learning_rate": 1.9778705910877466e-06, + "loss": 0.7881, + "step": 3710 + }, + { + "epoch": 0.1, + "learning_rate": 1.977853220702424e-06, + "loss": 0.8789, + "step": 3711 + }, + { + "epoch": 0.1, + "learning_rate": 1.977835843578707e-06, + "loss": 0.9951, + "step": 3712 + }, + { + "epoch": 0.1, + "learning_rate": 1.9778184597167157e-06, + "loss": 0.8535, + "step": 3713 + }, + { + "epoch": 0.1, + "learning_rate": 1.9778010691165707e-06, + "loss": 1.0898, + "step": 3714 + }, + { + "epoch": 0.1, + "learning_rate": 1.9777836717783908e-06, + "loss": 0.9424, + "step": 3715 + }, + { + "epoch": 0.1, + "learning_rate": 1.9777662677022963e-06, + "loss": 0.793, + "step": 3716 + }, + { + "epoch": 0.1, + "learning_rate": 1.9777488568884066e-06, + "loss": 0.832, + "step": 3717 + }, + { + "epoch": 0.1, + "learning_rate": 1.9777314393368425e-06, + "loss": 1.0088, + "step": 3718 + }, + { + "epoch": 0.1, + "learning_rate": 1.977714015047724e-06, + "loss": 1.0449, + "step": 3719 + }, + { + "epoch": 0.1, + "learning_rate": 1.9776965840211703e-06, + "loss": 0.9414, + "step": 3720 + }, + { + "epoch": 0.1, + "learning_rate": 1.977679146257302e-06, + "loss": 0.6611, + "step": 3721 + }, + { + "epoch": 0.1, + "learning_rate": 1.9776617017562395e-06, + "loss": 0.7129, + "step": 3722 + }, + { + "epoch": 0.1, + "learning_rate": 1.977644250518103e-06, + "loss": 1.1094, + "step": 3723 + }, + { + "epoch": 0.1, + "learning_rate": 1.9776267925430126e-06, + "loss": 0.9404, + "step": 3724 + }, + { + "epoch": 0.1, + "learning_rate": 1.9776093278310884e-06, + "loss": 1.0654, + "step": 3725 + }, + { + "epoch": 0.1, + "learning_rate": 1.977591856382451e-06, + "loss": 1.0811, + "step": 3726 + }, + { + "epoch": 0.1, + "learning_rate": 1.9775743781972205e-06, + "loss": 0.7852, + "step": 3727 + }, + { + "epoch": 0.1, + "learning_rate": 1.9775568932755184e-06, + "loss": 0.8833, + "step": 3728 + }, + { + "epoch": 0.1, + "learning_rate": 1.9775394016174635e-06, + "loss": 0.8271, + "step": 3729 + }, + { + "epoch": 0.1, + "learning_rate": 1.977521903223177e-06, + "loss": 0.9199, + "step": 3730 + }, + { + "epoch": 0.1, + "learning_rate": 1.9775043980927804e-06, + "loss": 1.0264, + "step": 3731 + }, + { + "epoch": 0.1, + "learning_rate": 1.9774868862263935e-06, + "loss": 1.0127, + "step": 3732 + }, + { + "epoch": 0.1, + "learning_rate": 1.977469367624137e-06, + "loss": 1.0791, + "step": 3733 + }, + { + "epoch": 0.1, + "learning_rate": 1.9774518422861317e-06, + "loss": 0.9199, + "step": 3734 + }, + { + "epoch": 0.1, + "learning_rate": 1.9774343102124986e-06, + "loss": 0.9575, + "step": 3735 + }, + { + "epoch": 0.1, + "learning_rate": 1.977416771403358e-06, + "loss": 0.7998, + "step": 3736 + }, + { + "epoch": 0.1, + "learning_rate": 1.977399225858831e-06, + "loss": 0.9448, + "step": 3737 + }, + { + "epoch": 0.1, + "learning_rate": 1.9773816735790383e-06, + "loss": 0.8604, + "step": 3738 + }, + { + "epoch": 0.1, + "learning_rate": 1.9773641145641015e-06, + "loss": 1.0996, + "step": 3739 + }, + { + "epoch": 0.1, + "learning_rate": 1.977346548814141e-06, + "loss": 0.9238, + "step": 3740 + }, + { + "epoch": 0.1, + "learning_rate": 1.9773289763292783e-06, + "loss": 1.0986, + "step": 3741 + }, + { + "epoch": 0.1, + "learning_rate": 1.977311397109634e-06, + "loss": 1.0186, + "step": 3742 + }, + { + "epoch": 0.1, + "learning_rate": 1.9772938111553295e-06, + "loss": 0.9746, + "step": 3743 + }, + { + "epoch": 0.1, + "learning_rate": 1.977276218466486e-06, + "loss": 1.0029, + "step": 3744 + }, + { + "epoch": 0.1, + "learning_rate": 1.977258619043225e-06, + "loss": 0.9932, + "step": 3745 + }, + { + "epoch": 0.1, + "learning_rate": 1.977241012885667e-06, + "loss": 0.6455, + "step": 3746 + }, + { + "epoch": 0.1, + "learning_rate": 1.9772233999939345e-06, + "loss": 0.8579, + "step": 3747 + }, + { + "epoch": 0.1, + "learning_rate": 1.9772057803681473e-06, + "loss": 0.9912, + "step": 3748 + }, + { + "epoch": 0.1, + "learning_rate": 1.977188154008428e-06, + "loss": 0.999, + "step": 3749 + }, + { + "epoch": 0.1, + "learning_rate": 1.9771705209148978e-06, + "loss": 0.8613, + "step": 3750 + }, + { + "epoch": 0.1, + "learning_rate": 1.9771528810876785e-06, + "loss": 1.0586, + "step": 3751 + }, + { + "epoch": 0.1, + "learning_rate": 1.9771352345268907e-06, + "loss": 0.8877, + "step": 3752 + }, + { + "epoch": 0.1, + "learning_rate": 1.977117581232657e-06, + "loss": 0.7451, + "step": 3753 + }, + { + "epoch": 0.1, + "learning_rate": 1.9770999212050986e-06, + "loss": 0.9238, + "step": 3754 + }, + { + "epoch": 0.1, + "learning_rate": 1.9770822544443373e-06, + "loss": 0.9521, + "step": 3755 + }, + { + "epoch": 0.1, + "learning_rate": 1.9770645809504946e-06, + "loss": 0.822, + "step": 3756 + }, + { + "epoch": 0.1, + "learning_rate": 1.977046900723693e-06, + "loss": 0.8496, + "step": 3757 + }, + { + "epoch": 0.1, + "learning_rate": 1.9770292137640532e-06, + "loss": 1.1211, + "step": 3758 + }, + { + "epoch": 0.1, + "learning_rate": 1.977011520071698e-06, + "loss": 0.9736, + "step": 3759 + }, + { + "epoch": 0.1, + "learning_rate": 1.9769938196467486e-06, + "loss": 0.6973, + "step": 3760 + }, + { + "epoch": 0.1, + "learning_rate": 1.976976112489328e-06, + "loss": 1.0176, + "step": 3761 + }, + { + "epoch": 0.1, + "learning_rate": 1.9769583985995574e-06, + "loss": 1.0283, + "step": 3762 + }, + { + "epoch": 0.1, + "learning_rate": 1.976940677977559e-06, + "loss": 0.5742, + "step": 3763 + }, + { + "epoch": 0.1, + "learning_rate": 1.9769229506234553e-06, + "loss": 0.9648, + "step": 3764 + }, + { + "epoch": 0.1, + "learning_rate": 1.9769052165373682e-06, + "loss": 0.9326, + "step": 3765 + }, + { + "epoch": 0.1, + "learning_rate": 1.97688747571942e-06, + "loss": 0.8574, + "step": 3766 + }, + { + "epoch": 0.1, + "learning_rate": 1.9768697281697322e-06, + "loss": 0.8145, + "step": 3767 + }, + { + "epoch": 0.1, + "learning_rate": 1.976851973888428e-06, + "loss": 1.1182, + "step": 3768 + }, + { + "epoch": 0.1, + "learning_rate": 1.9768342128756295e-06, + "loss": 1.0312, + "step": 3769 + }, + { + "epoch": 0.1, + "learning_rate": 1.976816445131459e-06, + "loss": 1.002, + "step": 3770 + }, + { + "epoch": 0.1, + "learning_rate": 1.976798670656039e-06, + "loss": 1.0244, + "step": 3771 + }, + { + "epoch": 0.1, + "learning_rate": 1.9767808894494923e-06, + "loss": 0.9922, + "step": 3772 + }, + { + "epoch": 0.1, + "learning_rate": 1.9767631015119405e-06, + "loss": 1.0879, + "step": 3773 + }, + { + "epoch": 0.1, + "learning_rate": 1.9767453068435075e-06, + "loss": 0.9453, + "step": 3774 + }, + { + "epoch": 0.1, + "learning_rate": 1.9767275054443147e-06, + "loss": 1.0098, + "step": 3775 + }, + { + "epoch": 0.1, + "learning_rate": 1.9767096973144855e-06, + "loss": 0.77, + "step": 3776 + }, + { + "epoch": 0.1, + "learning_rate": 1.9766918824541423e-06, + "loss": 1.0498, + "step": 3777 + }, + { + "epoch": 0.1, + "learning_rate": 1.976674060863408e-06, + "loss": 1.0684, + "step": 3778 + }, + { + "epoch": 0.1, + "learning_rate": 1.9766562325424053e-06, + "loss": 0.9658, + "step": 3779 + }, + { + "epoch": 0.1, + "learning_rate": 1.976638397491257e-06, + "loss": 1.0195, + "step": 3780 + }, + { + "epoch": 0.1, + "learning_rate": 1.9766205557100868e-06, + "loss": 1.0234, + "step": 3781 + }, + { + "epoch": 0.1, + "learning_rate": 1.9766027071990164e-06, + "loss": 0.9033, + "step": 3782 + }, + { + "epoch": 0.1, + "learning_rate": 1.9765848519581692e-06, + "loss": 1.0156, + "step": 3783 + }, + { + "epoch": 0.1, + "learning_rate": 1.9765669899876686e-06, + "loss": 1.0908, + "step": 3784 + }, + { + "epoch": 0.1, + "learning_rate": 1.976549121287638e-06, + "loss": 0.7427, + "step": 3785 + }, + { + "epoch": 0.1, + "learning_rate": 1.976531245858199e-06, + "loss": 0.6909, + "step": 3786 + }, + { + "epoch": 0.1, + "learning_rate": 1.9765133636994768e-06, + "loss": 0.8516, + "step": 3787 + }, + { + "epoch": 0.1, + "learning_rate": 1.976495474811593e-06, + "loss": 0.9834, + "step": 3788 + }, + { + "epoch": 0.1, + "learning_rate": 1.976477579194672e-06, + "loss": 0.8945, + "step": 3789 + }, + { + "epoch": 0.1, + "learning_rate": 1.976459676848836e-06, + "loss": 0.9639, + "step": 3790 + }, + { + "epoch": 0.1, + "learning_rate": 1.9764417677742095e-06, + "loss": 0.7886, + "step": 3791 + }, + { + "epoch": 0.1, + "learning_rate": 1.9764238519709154e-06, + "loss": 0.5181, + "step": 3792 + }, + { + "epoch": 0.1, + "learning_rate": 1.976405929439077e-06, + "loss": 1.1582, + "step": 3793 + }, + { + "epoch": 0.1, + "learning_rate": 1.976388000178818e-06, + "loss": 0.9111, + "step": 3794 + }, + { + "epoch": 0.1, + "learning_rate": 1.976370064190262e-06, + "loss": 1.0, + "step": 3795 + }, + { + "epoch": 0.1, + "learning_rate": 1.976352121473532e-06, + "loss": 0.855, + "step": 3796 + }, + { + "epoch": 0.1, + "learning_rate": 1.976334172028753e-06, + "loss": 0.9062, + "step": 3797 + }, + { + "epoch": 0.1, + "learning_rate": 1.976316215856047e-06, + "loss": 0.7915, + "step": 3798 + }, + { + "epoch": 0.1, + "learning_rate": 1.976298252955539e-06, + "loss": 1.0098, + "step": 3799 + }, + { + "epoch": 0.1, + "learning_rate": 1.9762802833273526e-06, + "loss": 0.8057, + "step": 3800 + }, + { + "epoch": 0.1, + "learning_rate": 1.976262306971611e-06, + "loss": 1.0459, + "step": 3801 + }, + { + "epoch": 0.1, + "learning_rate": 1.9762443238884386e-06, + "loss": 0.9053, + "step": 3802 + }, + { + "epoch": 0.1, + "learning_rate": 1.9762263340779595e-06, + "loss": 1.0508, + "step": 3803 + }, + { + "epoch": 0.1, + "learning_rate": 1.976208337540297e-06, + "loss": 0.9121, + "step": 3804 + }, + { + "epoch": 0.1, + "learning_rate": 1.9761903342755755e-06, + "loss": 0.8271, + "step": 3805 + }, + { + "epoch": 0.1, + "learning_rate": 1.976172324283919e-06, + "loss": 0.7041, + "step": 3806 + }, + { + "epoch": 0.1, + "learning_rate": 1.976154307565452e-06, + "loss": 1.0488, + "step": 3807 + }, + { + "epoch": 0.1, + "learning_rate": 1.9761362841202977e-06, + "loss": 0.9189, + "step": 3808 + }, + { + "epoch": 0.1, + "learning_rate": 1.9761182539485812e-06, + "loss": 0.8799, + "step": 3809 + }, + { + "epoch": 0.1, + "learning_rate": 1.9761002170504263e-06, + "loss": 1.0928, + "step": 3810 + }, + { + "epoch": 0.1, + "learning_rate": 1.9760821734259577e-06, + "loss": 1.0576, + "step": 3811 + }, + { + "epoch": 0.1, + "learning_rate": 1.976064123075299e-06, + "loss": 1.0557, + "step": 3812 + }, + { + "epoch": 0.1, + "learning_rate": 1.9760460659985755e-06, + "loss": 0.9053, + "step": 3813 + }, + { + "epoch": 0.1, + "learning_rate": 1.9760280021959115e-06, + "loss": 0.918, + "step": 3814 + }, + { + "epoch": 0.1, + "learning_rate": 1.9760099316674306e-06, + "loss": 0.9824, + "step": 3815 + }, + { + "epoch": 0.1, + "learning_rate": 1.9759918544132577e-06, + "loss": 0.9766, + "step": 3816 + }, + { + "epoch": 0.1, + "learning_rate": 1.975973770433518e-06, + "loss": 1.0664, + "step": 3817 + }, + { + "epoch": 0.1, + "learning_rate": 1.9759556797283357e-06, + "loss": 1.0635, + "step": 3818 + }, + { + "epoch": 0.1, + "learning_rate": 1.975937582297835e-06, + "loss": 0.8203, + "step": 3819 + }, + { + "epoch": 0.1, + "learning_rate": 1.9759194781421416e-06, + "loss": 0.8423, + "step": 3820 + }, + { + "epoch": 0.1, + "learning_rate": 1.9759013672613795e-06, + "loss": 0.8413, + "step": 3821 + }, + { + "epoch": 0.1, + "learning_rate": 1.9758832496556735e-06, + "loss": 0.7852, + "step": 3822 + }, + { + "epoch": 0.1, + "learning_rate": 1.975865125325149e-06, + "loss": 0.686, + "step": 3823 + }, + { + "epoch": 0.1, + "learning_rate": 1.97584699426993e-06, + "loss": 1.1602, + "step": 3824 + }, + { + "epoch": 0.1, + "learning_rate": 1.9758288564901427e-06, + "loss": 0.8428, + "step": 3825 + }, + { + "epoch": 0.1, + "learning_rate": 1.975810711985911e-06, + "loss": 0.9307, + "step": 3826 + }, + { + "epoch": 0.1, + "learning_rate": 1.9757925607573604e-06, + "loss": 1.0664, + "step": 3827 + }, + { + "epoch": 0.1, + "learning_rate": 1.9757744028046155e-06, + "loss": 1.0195, + "step": 3828 + }, + { + "epoch": 0.1, + "learning_rate": 1.9757562381278025e-06, + "loss": 1.1914, + "step": 3829 + }, + { + "epoch": 0.1, + "learning_rate": 1.9757380667270454e-06, + "loss": 0.8672, + "step": 3830 + }, + { + "epoch": 0.1, + "learning_rate": 1.97571988860247e-06, + "loss": 0.9707, + "step": 3831 + }, + { + "epoch": 0.1, + "learning_rate": 1.9757017037542014e-06, + "loss": 0.7891, + "step": 3832 + }, + { + "epoch": 0.1, + "learning_rate": 1.9756835121823652e-06, + "loss": 0.9746, + "step": 3833 + }, + { + "epoch": 0.1, + "learning_rate": 1.975665313887087e-06, + "loss": 1.124, + "step": 3834 + }, + { + "epoch": 0.1, + "learning_rate": 1.975647108868491e-06, + "loss": 1.0225, + "step": 3835 + }, + { + "epoch": 0.1, + "learning_rate": 1.9756288971267033e-06, + "loss": 1.0117, + "step": 3836 + }, + { + "epoch": 0.1, + "learning_rate": 1.9756106786618497e-06, + "loss": 0.8232, + "step": 3837 + }, + { + "epoch": 0.1, + "learning_rate": 1.9755924534740558e-06, + "loss": 1.0967, + "step": 3838 + }, + { + "epoch": 0.1, + "learning_rate": 1.975574221563447e-06, + "loss": 0.9443, + "step": 3839 + }, + { + "epoch": 0.1, + "learning_rate": 1.975555982930149e-06, + "loss": 0.8965, + "step": 3840 + }, + { + "epoch": 0.1, + "learning_rate": 1.9755377375742866e-06, + "loss": 0.8413, + "step": 3841 + }, + { + "epoch": 0.1, + "learning_rate": 1.9755194854959867e-06, + "loss": 0.8203, + "step": 3842 + }, + { + "epoch": 0.1, + "learning_rate": 1.9755012266953746e-06, + "loss": 1.0498, + "step": 3843 + }, + { + "epoch": 0.1, + "learning_rate": 1.975482961172576e-06, + "loss": 1.0635, + "step": 3844 + }, + { + "epoch": 0.1, + "learning_rate": 1.9754646889277177e-06, + "loss": 1.124, + "step": 3845 + }, + { + "epoch": 0.1, + "learning_rate": 1.975446409960924e-06, + "loss": 1.1738, + "step": 3846 + }, + { + "epoch": 0.1, + "learning_rate": 1.975428124272322e-06, + "loss": 1.1123, + "step": 3847 + }, + { + "epoch": 0.1, + "learning_rate": 1.9754098318620377e-06, + "loss": 0.8955, + "step": 3848 + }, + { + "epoch": 0.1, + "learning_rate": 1.9753915327301966e-06, + "loss": 1.0967, + "step": 3849 + }, + { + "epoch": 0.1, + "learning_rate": 1.975373226876925e-06, + "loss": 0.8691, + "step": 3850 + }, + { + "epoch": 0.1, + "learning_rate": 1.9753549143023496e-06, + "loss": 0.9639, + "step": 3851 + }, + { + "epoch": 0.1, + "learning_rate": 1.9753365950065957e-06, + "loss": 1.1211, + "step": 3852 + }, + { + "epoch": 0.1, + "learning_rate": 1.97531826898979e-06, + "loss": 1.0068, + "step": 3853 + }, + { + "epoch": 0.1, + "learning_rate": 1.975299936252059e-06, + "loss": 1.0361, + "step": 3854 + }, + { + "epoch": 0.1, + "learning_rate": 1.9752815967935285e-06, + "loss": 0.9033, + "step": 3855 + }, + { + "epoch": 0.1, + "learning_rate": 1.9752632506143253e-06, + "loss": 1.1719, + "step": 3856 + }, + { + "epoch": 0.1, + "learning_rate": 1.9752448977145755e-06, + "loss": 0.6787, + "step": 3857 + }, + { + "epoch": 0.1, + "learning_rate": 1.9752265380944057e-06, + "loss": 0.9475, + "step": 3858 + }, + { + "epoch": 0.1, + "learning_rate": 1.9752081717539426e-06, + "loss": 0.8574, + "step": 3859 + }, + { + "epoch": 0.1, + "learning_rate": 1.9751897986933128e-06, + "loss": 0.9268, + "step": 3860 + }, + { + "epoch": 0.1, + "learning_rate": 1.9751714189126425e-06, + "loss": 0.8833, + "step": 3861 + }, + { + "epoch": 0.1, + "learning_rate": 1.9751530324120583e-06, + "loss": 0.8853, + "step": 3862 + }, + { + "epoch": 0.1, + "learning_rate": 1.9751346391916877e-06, + "loss": 0.8984, + "step": 3863 + }, + { + "epoch": 0.1, + "learning_rate": 1.9751162392516565e-06, + "loss": 0.9351, + "step": 3864 + }, + { + "epoch": 0.1, + "learning_rate": 1.9750978325920923e-06, + "loss": 0.7559, + "step": 3865 + }, + { + "epoch": 0.1, + "learning_rate": 1.9750794192131215e-06, + "loss": 1.1113, + "step": 3866 + }, + { + "epoch": 0.1, + "learning_rate": 1.975060999114871e-06, + "loss": 0.7617, + "step": 3867 + }, + { + "epoch": 0.1, + "learning_rate": 1.975042572297468e-06, + "loss": 0.8345, + "step": 3868 + }, + { + "epoch": 0.1, + "learning_rate": 1.975024138761039e-06, + "loss": 0.6475, + "step": 3869 + }, + { + "epoch": 0.1, + "learning_rate": 1.975005698505711e-06, + "loss": 1.0059, + "step": 3870 + }, + { + "epoch": 0.1, + "learning_rate": 1.974987251531612e-06, + "loss": 1.041, + "step": 3871 + }, + { + "epoch": 0.1, + "learning_rate": 1.9749687978388683e-06, + "loss": 0.6875, + "step": 3872 + }, + { + "epoch": 0.1, + "learning_rate": 1.9749503374276067e-06, + "loss": 0.7793, + "step": 3873 + }, + { + "epoch": 0.1, + "learning_rate": 1.9749318702979554e-06, + "loss": 0.8242, + "step": 3874 + }, + { + "epoch": 0.1, + "learning_rate": 1.9749133964500416e-06, + "loss": 0.918, + "step": 3875 + }, + { + "epoch": 0.1, + "learning_rate": 1.9748949158839918e-06, + "loss": 1.001, + "step": 3876 + }, + { + "epoch": 0.1, + "learning_rate": 1.974876428599934e-06, + "loss": 1.085, + "step": 3877 + }, + { + "epoch": 0.1, + "learning_rate": 1.974857934597995e-06, + "loss": 0.8164, + "step": 3878 + }, + { + "epoch": 0.1, + "learning_rate": 1.9748394338783028e-06, + "loss": 0.7246, + "step": 3879 + }, + { + "epoch": 0.1, + "learning_rate": 1.974820926440985e-06, + "loss": 1.04, + "step": 3880 + }, + { + "epoch": 0.1, + "learning_rate": 1.9748024122861684e-06, + "loss": 0.8857, + "step": 3881 + }, + { + "epoch": 0.1, + "learning_rate": 1.974783891413981e-06, + "loss": 0.9473, + "step": 3882 + }, + { + "epoch": 0.1, + "learning_rate": 1.9747653638245505e-06, + "loss": 0.9448, + "step": 3883 + }, + { + "epoch": 0.1, + "learning_rate": 1.9747468295180045e-06, + "loss": 0.9111, + "step": 3884 + }, + { + "epoch": 0.1, + "learning_rate": 1.9747282884944708e-06, + "loss": 0.9209, + "step": 3885 + }, + { + "epoch": 0.1, + "learning_rate": 1.9747097407540775e-06, + "loss": 1.1074, + "step": 3886 + }, + { + "epoch": 0.1, + "learning_rate": 1.9746911862969515e-06, + "loss": 0.8193, + "step": 3887 + }, + { + "epoch": 0.1, + "learning_rate": 1.9746726251232213e-06, + "loss": 0.8555, + "step": 3888 + }, + { + "epoch": 0.1, + "learning_rate": 1.974654057233015e-06, + "loss": 0.9639, + "step": 3889 + }, + { + "epoch": 0.1, + "learning_rate": 1.97463548262646e-06, + "loss": 0.9346, + "step": 3890 + }, + { + "epoch": 0.1, + "learning_rate": 1.974616901303684e-06, + "loss": 0.8291, + "step": 3891 + }, + { + "epoch": 0.1, + "learning_rate": 1.974598313264816e-06, + "loss": 0.8179, + "step": 3892 + }, + { + "epoch": 0.1, + "learning_rate": 1.9745797185099837e-06, + "loss": 1.0742, + "step": 3893 + }, + { + "epoch": 0.1, + "learning_rate": 1.9745611170393155e-06, + "loss": 1.0947, + "step": 3894 + }, + { + "epoch": 0.1, + "learning_rate": 1.974542508852939e-06, + "loss": 0.7578, + "step": 3895 + }, + { + "epoch": 0.1, + "learning_rate": 1.9745238939509826e-06, + "loss": 0.6943, + "step": 3896 + }, + { + "epoch": 0.1, + "learning_rate": 1.9745052723335742e-06, + "loss": 0.5601, + "step": 3897 + }, + { + "epoch": 0.1, + "learning_rate": 1.9744866440008434e-06, + "loss": 0.8633, + "step": 3898 + }, + { + "epoch": 0.1, + "learning_rate": 1.974468008952918e-06, + "loss": 1.1123, + "step": 3899 + }, + { + "epoch": 0.1, + "learning_rate": 1.9744493671899253e-06, + "loss": 0.8223, + "step": 3900 + }, + { + "epoch": 0.1, + "learning_rate": 1.974430718711995e-06, + "loss": 0.8613, + "step": 3901 + }, + { + "epoch": 0.1, + "learning_rate": 1.9744120635192557e-06, + "loss": 0.585, + "step": 3902 + }, + { + "epoch": 0.1, + "learning_rate": 1.974393401611835e-06, + "loss": 0.7217, + "step": 3903 + }, + { + "epoch": 0.1, + "learning_rate": 1.974374732989862e-06, + "loss": 0.9531, + "step": 3904 + }, + { + "epoch": 0.1, + "learning_rate": 1.974356057653466e-06, + "loss": 0.8887, + "step": 3905 + }, + { + "epoch": 0.1, + "learning_rate": 1.974337375602774e-06, + "loss": 1.1221, + "step": 3906 + }, + { + "epoch": 0.1, + "learning_rate": 1.9743186868379164e-06, + "loss": 1.1699, + "step": 3907 + }, + { + "epoch": 0.1, + "learning_rate": 1.9742999913590212e-06, + "loss": 0.8867, + "step": 3908 + }, + { + "epoch": 0.1, + "learning_rate": 1.9742812891662176e-06, + "loss": 0.7773, + "step": 3909 + }, + { + "epoch": 0.1, + "learning_rate": 1.9742625802596343e-06, + "loss": 1.0039, + "step": 3910 + }, + { + "epoch": 0.1, + "learning_rate": 1.9742438646394e-06, + "loss": 1.0684, + "step": 3911 + }, + { + "epoch": 0.1, + "learning_rate": 1.974225142305644e-06, + "loss": 0.729, + "step": 3912 + }, + { + "epoch": 0.1, + "learning_rate": 1.974206413258495e-06, + "loss": 0.5249, + "step": 3913 + }, + { + "epoch": 0.1, + "learning_rate": 1.9741876774980827e-06, + "loss": 1.0332, + "step": 3914 + }, + { + "epoch": 0.1, + "learning_rate": 1.9741689350245353e-06, + "loss": 0.9268, + "step": 3915 + }, + { + "epoch": 0.1, + "learning_rate": 1.9741501858379825e-06, + "loss": 0.7861, + "step": 3916 + }, + { + "epoch": 0.1, + "learning_rate": 1.9741314299385534e-06, + "loss": 0.9463, + "step": 3917 + }, + { + "epoch": 0.1, + "learning_rate": 1.9741126673263776e-06, + "loss": 0.9219, + "step": 3918 + }, + { + "epoch": 0.1, + "learning_rate": 1.9740938980015835e-06, + "loss": 0.9414, + "step": 3919 + }, + { + "epoch": 0.1, + "learning_rate": 1.9740751219643014e-06, + "loss": 0.8174, + "step": 3920 + }, + { + "epoch": 0.1, + "learning_rate": 1.97405633921466e-06, + "loss": 0.8809, + "step": 3921 + }, + { + "epoch": 0.1, + "learning_rate": 1.9740375497527893e-06, + "loss": 0.7959, + "step": 3922 + }, + { + "epoch": 0.1, + "learning_rate": 1.9740187535788185e-06, + "loss": 1.0479, + "step": 3923 + }, + { + "epoch": 0.1, + "learning_rate": 1.973999950692877e-06, + "loss": 0.9932, + "step": 3924 + }, + { + "epoch": 0.1, + "learning_rate": 1.973981141095094e-06, + "loss": 0.8838, + "step": 3925 + }, + { + "epoch": 0.1, + "learning_rate": 1.9739623247856e-06, + "loss": 0.8867, + "step": 3926 + }, + { + "epoch": 0.1, + "learning_rate": 1.9739435017645243e-06, + "loss": 0.9346, + "step": 3927 + }, + { + "epoch": 0.1, + "learning_rate": 1.9739246720319967e-06, + "loss": 1.1387, + "step": 3928 + }, + { + "epoch": 0.1, + "learning_rate": 1.973905835588147e-06, + "loss": 1.126, + "step": 3929 + }, + { + "epoch": 0.1, + "learning_rate": 1.973886992433104e-06, + "loss": 1.0039, + "step": 3930 + }, + { + "epoch": 0.1, + "learning_rate": 1.973868142566999e-06, + "loss": 0.8716, + "step": 3931 + }, + { + "epoch": 0.1, + "learning_rate": 1.9738492859899613e-06, + "loss": 1.0859, + "step": 3932 + }, + { + "epoch": 0.1, + "learning_rate": 1.973830422702121e-06, + "loss": 0.8306, + "step": 3933 + }, + { + "epoch": 0.1, + "learning_rate": 1.973811552703607e-06, + "loss": 1.1133, + "step": 3934 + }, + { + "epoch": 0.1, + "learning_rate": 1.9737926759945508e-06, + "loss": 0.6754, + "step": 3935 + }, + { + "epoch": 0.1, + "learning_rate": 1.9737737925750823e-06, + "loss": 0.9805, + "step": 3936 + }, + { + "epoch": 0.1, + "learning_rate": 1.9737549024453307e-06, + "loss": 0.8906, + "step": 3937 + }, + { + "epoch": 0.1, + "learning_rate": 1.973736005605427e-06, + "loss": 0.791, + "step": 3938 + }, + { + "epoch": 0.1, + "learning_rate": 1.973717102055501e-06, + "loss": 0.8301, + "step": 3939 + }, + { + "epoch": 0.1, + "learning_rate": 1.973698191795683e-06, + "loss": 0.8838, + "step": 3940 + }, + { + "epoch": 0.1, + "learning_rate": 1.973679274826104e-06, + "loss": 0.8711, + "step": 3941 + }, + { + "epoch": 0.1, + "learning_rate": 1.973660351146893e-06, + "loss": 0.8984, + "step": 3942 + }, + { + "epoch": 0.1, + "learning_rate": 1.9736414207581813e-06, + "loss": 1.0605, + "step": 3943 + }, + { + "epoch": 0.1, + "learning_rate": 1.973622483660099e-06, + "loss": 0.9648, + "step": 3944 + }, + { + "epoch": 0.1, + "learning_rate": 1.9736035398527774e-06, + "loss": 0.9365, + "step": 3945 + }, + { + "epoch": 0.1, + "learning_rate": 1.973584589336346e-06, + "loss": 0.8994, + "step": 3946 + }, + { + "epoch": 0.1, + "learning_rate": 1.9735656321109362e-06, + "loss": 1.0713, + "step": 3947 + }, + { + "epoch": 0.1, + "learning_rate": 1.9735466681766785e-06, + "loss": 1.0352, + "step": 3948 + }, + { + "epoch": 0.1, + "learning_rate": 1.973527697533703e-06, + "loss": 0.7363, + "step": 3949 + }, + { + "epoch": 0.1, + "learning_rate": 1.9735087201821406e-06, + "loss": 0.875, + "step": 3950 + }, + { + "epoch": 0.1, + "learning_rate": 1.9734897361221225e-06, + "loss": 0.9492, + "step": 3951 + }, + { + "epoch": 0.1, + "learning_rate": 1.9734707453537793e-06, + "loss": 0.959, + "step": 3952 + }, + { + "epoch": 0.1, + "learning_rate": 1.9734517478772418e-06, + "loss": 0.9004, + "step": 3953 + }, + { + "epoch": 0.1, + "learning_rate": 1.9734327436926408e-06, + "loss": 0.7739, + "step": 3954 + }, + { + "epoch": 0.1, + "learning_rate": 1.9734137328001076e-06, + "loss": 1.2988, + "step": 3955 + }, + { + "epoch": 0.1, + "learning_rate": 1.9733947151997723e-06, + "loss": 0.8765, + "step": 3956 + }, + { + "epoch": 0.1, + "learning_rate": 1.9733756908917674e-06, + "loss": 0.8779, + "step": 3957 + }, + { + "epoch": 0.1, + "learning_rate": 1.9733566598762234e-06, + "loss": 0.9619, + "step": 3958 + }, + { + "epoch": 0.1, + "learning_rate": 1.9733376221532707e-06, + "loss": 1.0342, + "step": 3959 + }, + { + "epoch": 0.1, + "learning_rate": 1.9733185777230415e-06, + "loss": 1.0391, + "step": 3960 + }, + { + "epoch": 0.1, + "learning_rate": 1.973299526585667e-06, + "loss": 0.6128, + "step": 3961 + }, + { + "epoch": 0.1, + "learning_rate": 1.9732804687412776e-06, + "loss": 0.8564, + "step": 3962 + }, + { + "epoch": 0.1, + "learning_rate": 1.973261404190005e-06, + "loss": 1.1143, + "step": 3963 + }, + { + "epoch": 0.1, + "learning_rate": 1.973242332931981e-06, + "loss": 0.9326, + "step": 3964 + }, + { + "epoch": 0.1, + "learning_rate": 1.9732232549673365e-06, + "loss": 1.0537, + "step": 3965 + }, + { + "epoch": 0.1, + "learning_rate": 1.9732041702962037e-06, + "loss": 0.8398, + "step": 3966 + }, + { + "epoch": 0.1, + "learning_rate": 1.9731850789187134e-06, + "loss": 0.9482, + "step": 3967 + }, + { + "epoch": 0.1, + "learning_rate": 1.973165980834997e-06, + "loss": 0.8462, + "step": 3968 + }, + { + "epoch": 0.1, + "learning_rate": 1.9731468760451867e-06, + "loss": 0.6079, + "step": 3969 + }, + { + "epoch": 0.1, + "learning_rate": 1.9731277645494137e-06, + "loss": 0.6143, + "step": 3970 + }, + { + "epoch": 0.1, + "learning_rate": 1.9731086463478104e-06, + "loss": 0.9658, + "step": 3971 + }, + { + "epoch": 0.1, + "learning_rate": 1.9730895214405077e-06, + "loss": 0.915, + "step": 3972 + }, + { + "epoch": 0.1, + "learning_rate": 1.973070389827638e-06, + "loss": 0.9629, + "step": 3973 + }, + { + "epoch": 0.1, + "learning_rate": 1.973051251509333e-06, + "loss": 0.8066, + "step": 3974 + }, + { + "epoch": 0.1, + "learning_rate": 1.973032106485724e-06, + "loss": 0.9629, + "step": 3975 + }, + { + "epoch": 0.1, + "learning_rate": 1.973012954756944e-06, + "loss": 1.0137, + "step": 3976 + }, + { + "epoch": 0.1, + "learning_rate": 1.972993796323124e-06, + "loss": 0.8545, + "step": 3977 + }, + { + "epoch": 0.1, + "learning_rate": 1.972974631184396e-06, + "loss": 0.8154, + "step": 3978 + }, + { + "epoch": 0.1, + "learning_rate": 1.972955459340893e-06, + "loss": 1.0625, + "step": 3979 + }, + { + "epoch": 0.1, + "learning_rate": 1.9729362807927467e-06, + "loss": 0.9111, + "step": 3980 + }, + { + "epoch": 0.1, + "learning_rate": 1.972917095540089e-06, + "loss": 1.0439, + "step": 3981 + }, + { + "epoch": 0.1, + "learning_rate": 1.972897903583052e-06, + "loss": 0.8623, + "step": 3982 + }, + { + "epoch": 0.1, + "learning_rate": 1.9728787049217684e-06, + "loss": 0.876, + "step": 3983 + }, + { + "epoch": 0.1, + "learning_rate": 1.97285949955637e-06, + "loss": 0.96, + "step": 3984 + }, + { + "epoch": 0.1, + "learning_rate": 1.97284028748699e-06, + "loss": 0.7756, + "step": 3985 + }, + { + "epoch": 0.1, + "learning_rate": 1.9728210687137597e-06, + "loss": 0.9248, + "step": 3986 + }, + { + "epoch": 0.1, + "learning_rate": 1.972801843236812e-06, + "loss": 0.8652, + "step": 3987 + }, + { + "epoch": 0.1, + "learning_rate": 1.9727826110562804e-06, + "loss": 1.0176, + "step": 3988 + }, + { + "epoch": 0.1, + "learning_rate": 1.9727633721722955e-06, + "loss": 1.0732, + "step": 3989 + }, + { + "epoch": 0.1, + "learning_rate": 1.9727441265849914e-06, + "loss": 0.9336, + "step": 3990 + }, + { + "epoch": 0.1, + "learning_rate": 1.9727248742945e-06, + "loss": 0.9473, + "step": 3991 + }, + { + "epoch": 0.1, + "learning_rate": 1.972705615300954e-06, + "loss": 1.0498, + "step": 3992 + }, + { + "epoch": 0.1, + "learning_rate": 1.9726863496044864e-06, + "loss": 0.8486, + "step": 3993 + }, + { + "epoch": 0.1, + "learning_rate": 1.97266707720523e-06, + "loss": 1.0439, + "step": 3994 + }, + { + "epoch": 0.1, + "learning_rate": 1.9726477981033168e-06, + "loss": 1.0156, + "step": 3995 + }, + { + "epoch": 0.1, + "learning_rate": 1.9726285122988807e-06, + "loss": 0.9375, + "step": 3996 + }, + { + "epoch": 0.1, + "learning_rate": 1.9726092197920542e-06, + "loss": 0.9775, + "step": 3997 + }, + { + "epoch": 0.1, + "learning_rate": 1.9725899205829703e-06, + "loss": 0.9082, + "step": 3998 + }, + { + "epoch": 0.1, + "learning_rate": 1.9725706146717614e-06, + "loss": 0.9697, + "step": 3999 + }, + { + "epoch": 0.1, + "learning_rate": 1.972551302058562e-06, + "loss": 0.9521, + "step": 4000 + }, + { + "epoch": 0.1, + "learning_rate": 1.9725319827435034e-06, + "loss": 1.0049, + "step": 4001 + }, + { + "epoch": 0.1, + "learning_rate": 1.9725126567267195e-06, + "loss": 0.999, + "step": 4002 + }, + { + "epoch": 0.1, + "learning_rate": 1.9724933240083442e-06, + "loss": 0.8613, + "step": 4003 + }, + { + "epoch": 0.1, + "learning_rate": 1.97247398458851e-06, + "loss": 1.0322, + "step": 4004 + }, + { + "epoch": 0.1, + "learning_rate": 1.9724546384673493e-06, + "loss": 0.8623, + "step": 4005 + }, + { + "epoch": 0.1, + "learning_rate": 1.9724352856449973e-06, + "loss": 1.0869, + "step": 4006 + }, + { + "epoch": 0.1, + "learning_rate": 1.972415926121586e-06, + "loss": 1.0791, + "step": 4007 + }, + { + "epoch": 0.1, + "learning_rate": 1.972396559897249e-06, + "loss": 0.8252, + "step": 4008 + }, + { + "epoch": 0.1, + "learning_rate": 1.9723771869721206e-06, + "loss": 0.9951, + "step": 4009 + }, + { + "epoch": 0.1, + "learning_rate": 1.972357807346333e-06, + "loss": 0.9033, + "step": 4010 + }, + { + "epoch": 0.1, + "learning_rate": 1.972338421020021e-06, + "loss": 0.9199, + "step": 4011 + }, + { + "epoch": 0.1, + "learning_rate": 1.972319027993317e-06, + "loss": 0.8018, + "step": 4012 + }, + { + "epoch": 0.1, + "learning_rate": 1.972299628266356e-06, + "loss": 1.0283, + "step": 4013 + }, + { + "epoch": 0.1, + "learning_rate": 1.97228022183927e-06, + "loss": 0.8584, + "step": 4014 + }, + { + "epoch": 0.1, + "learning_rate": 1.9722608087121945e-06, + "loss": 0.8135, + "step": 4015 + }, + { + "epoch": 0.1, + "learning_rate": 1.972241388885262e-06, + "loss": 1.1162, + "step": 4016 + }, + { + "epoch": 0.1, + "learning_rate": 1.972221962358607e-06, + "loss": 0.7607, + "step": 4017 + }, + { + "epoch": 0.1, + "learning_rate": 1.9722025291323626e-06, + "loss": 1.0449, + "step": 4018 + }, + { + "epoch": 0.1, + "learning_rate": 1.9721830892066637e-06, + "loss": 0.7881, + "step": 4019 + }, + { + "epoch": 0.1, + "learning_rate": 1.972163642581643e-06, + "loss": 0.7793, + "step": 4020 + }, + { + "epoch": 0.1, + "learning_rate": 1.972144189257436e-06, + "loss": 0.8369, + "step": 4021 + }, + { + "epoch": 0.1, + "learning_rate": 1.972124729234176e-06, + "loss": 0.915, + "step": 4022 + }, + { + "epoch": 0.1, + "learning_rate": 1.9721052625119975e-06, + "loss": 0.9043, + "step": 4023 + }, + { + "epoch": 0.1, + "learning_rate": 1.9720857890910338e-06, + "loss": 0.9961, + "step": 4024 + }, + { + "epoch": 0.1, + "learning_rate": 1.972066308971419e-06, + "loss": 0.9932, + "step": 4025 + }, + { + "epoch": 0.1, + "learning_rate": 1.972046822153289e-06, + "loss": 0.8838, + "step": 4026 + }, + { + "epoch": 0.1, + "learning_rate": 1.9720273286367765e-06, + "loss": 0.6909, + "step": 4027 + }, + { + "epoch": 0.1, + "learning_rate": 1.9720078284220167e-06, + "loss": 1.1221, + "step": 4028 + }, + { + "epoch": 0.1, + "learning_rate": 1.9719883215091433e-06, + "loss": 0.9902, + "step": 4029 + }, + { + "epoch": 0.1, + "learning_rate": 1.971968807898291e-06, + "loss": 0.7812, + "step": 4030 + }, + { + "epoch": 0.1, + "learning_rate": 1.971949287589594e-06, + "loss": 1.0889, + "step": 4031 + }, + { + "epoch": 0.1, + "learning_rate": 1.9719297605831878e-06, + "loss": 0.8228, + "step": 4032 + }, + { + "epoch": 0.1, + "learning_rate": 1.971910226879206e-06, + "loss": 0.9961, + "step": 4033 + }, + { + "epoch": 0.1, + "learning_rate": 1.9718906864777838e-06, + "loss": 1.0088, + "step": 4034 + }, + { + "epoch": 0.1, + "learning_rate": 1.971871139379055e-06, + "loss": 0.8945, + "step": 4035 + }, + { + "epoch": 0.1, + "learning_rate": 1.971851585583155e-06, + "loss": 0.8877, + "step": 4036 + }, + { + "epoch": 0.1, + "learning_rate": 1.9718320250902183e-06, + "loss": 0.9531, + "step": 4037 + }, + { + "epoch": 0.1, + "learning_rate": 1.97181245790038e-06, + "loss": 0.873, + "step": 4038 + }, + { + "epoch": 0.1, + "learning_rate": 1.9717928840137744e-06, + "loss": 0.8281, + "step": 4039 + }, + { + "epoch": 0.1, + "learning_rate": 1.971773303430537e-06, + "loss": 0.6963, + "step": 4040 + }, + { + "epoch": 0.1, + "learning_rate": 1.971753716150802e-06, + "loss": 1.0762, + "step": 4041 + }, + { + "epoch": 0.1, + "learning_rate": 1.9717341221747056e-06, + "loss": 1.0059, + "step": 4042 + }, + { + "epoch": 0.1, + "learning_rate": 1.9717145215023818e-06, + "loss": 0.8906, + "step": 4043 + }, + { + "epoch": 0.1, + "learning_rate": 1.971694914133965e-06, + "loss": 1.123, + "step": 4044 + }, + { + "epoch": 0.1, + "learning_rate": 1.971675300069592e-06, + "loss": 1.1104, + "step": 4045 + }, + { + "epoch": 0.1, + "learning_rate": 1.9716556793093974e-06, + "loss": 1.0596, + "step": 4046 + }, + { + "epoch": 0.1, + "learning_rate": 1.9716360518535156e-06, + "loss": 0.833, + "step": 4047 + }, + { + "epoch": 0.1, + "learning_rate": 1.9716164177020828e-06, + "loss": 1.042, + "step": 4048 + }, + { + "epoch": 0.1, + "learning_rate": 1.9715967768552336e-06, + "loss": 0.915, + "step": 4049 + }, + { + "epoch": 0.1, + "learning_rate": 1.9715771293131034e-06, + "loss": 0.9639, + "step": 4050 + }, + { + "epoch": 0.1, + "learning_rate": 1.9715574750758284e-06, + "loss": 0.9453, + "step": 4051 + }, + { + "epoch": 0.1, + "learning_rate": 1.9715378141435435e-06, + "loss": 0.9893, + "step": 4052 + }, + { + "epoch": 0.1, + "learning_rate": 1.971518146516384e-06, + "loss": 0.9365, + "step": 4053 + }, + { + "epoch": 0.1, + "learning_rate": 1.9714984721944856e-06, + "loss": 0.9258, + "step": 4054 + }, + { + "epoch": 0.1, + "learning_rate": 1.9714787911779844e-06, + "loss": 1.1602, + "step": 4055 + }, + { + "epoch": 0.1, + "learning_rate": 1.9714591034670147e-06, + "loss": 1.1182, + "step": 4056 + }, + { + "epoch": 0.1, + "learning_rate": 1.9714394090617136e-06, + "loss": 0.8574, + "step": 4057 + }, + { + "epoch": 0.1, + "learning_rate": 1.9714197079622158e-06, + "loss": 0.9287, + "step": 4058 + }, + { + "epoch": 0.1, + "learning_rate": 1.9714000001686577e-06, + "loss": 0.9258, + "step": 4059 + }, + { + "epoch": 0.1, + "learning_rate": 1.9713802856811744e-06, + "loss": 0.9521, + "step": 4060 + }, + { + "epoch": 0.1, + "learning_rate": 1.971360564499903e-06, + "loss": 0.874, + "step": 4061 + }, + { + "epoch": 0.1, + "learning_rate": 1.971340836624978e-06, + "loss": 0.793, + "step": 4062 + }, + { + "epoch": 0.1, + "learning_rate": 1.9713211020565362e-06, + "loss": 1.1494, + "step": 4063 + }, + { + "epoch": 0.1, + "learning_rate": 1.971301360794713e-06, + "loss": 0.79, + "step": 4064 + }, + { + "epoch": 0.1, + "learning_rate": 1.9712816128396454e-06, + "loss": 0.8965, + "step": 4065 + }, + { + "epoch": 0.1, + "learning_rate": 1.9712618581914684e-06, + "loss": 1.0332, + "step": 4066 + }, + { + "epoch": 0.1, + "learning_rate": 1.971242096850319e-06, + "loss": 0.8359, + "step": 4067 + }, + { + "epoch": 0.1, + "learning_rate": 1.9712223288163326e-06, + "loss": 0.8838, + "step": 4068 + }, + { + "epoch": 0.1, + "learning_rate": 1.971202554089646e-06, + "loss": 0.9189, + "step": 4069 + }, + { + "epoch": 0.1, + "learning_rate": 1.971182772670395e-06, + "loss": 0.7852, + "step": 4070 + }, + { + "epoch": 0.1, + "learning_rate": 1.9711629845587163e-06, + "loss": 0.8828, + "step": 4071 + }, + { + "epoch": 0.1, + "learning_rate": 1.971143189754746e-06, + "loss": 0.8164, + "step": 4072 + }, + { + "epoch": 0.1, + "learning_rate": 1.971123388258621e-06, + "loss": 0.8032, + "step": 4073 + }, + { + "epoch": 0.1, + "learning_rate": 1.9711035800704773e-06, + "loss": 0.8345, + "step": 4074 + }, + { + "epoch": 0.1, + "learning_rate": 1.9710837651904515e-06, + "loss": 0.9355, + "step": 4075 + }, + { + "epoch": 0.1, + "learning_rate": 1.97106394361868e-06, + "loss": 1.042, + "step": 4076 + }, + { + "epoch": 0.1, + "learning_rate": 1.9710441153552993e-06, + "loss": 1.0791, + "step": 4077 + }, + { + "epoch": 0.1, + "learning_rate": 1.971024280400447e-06, + "loss": 0.7861, + "step": 4078 + }, + { + "epoch": 0.1, + "learning_rate": 1.9710044387542583e-06, + "loss": 0.8501, + "step": 4079 + }, + { + "epoch": 0.1, + "learning_rate": 1.970984590416871e-06, + "loss": 0.5171, + "step": 4080 + }, + { + "epoch": 0.1, + "learning_rate": 1.9709647353884217e-06, + "loss": 0.9697, + "step": 4081 + }, + { + "epoch": 0.1, + "learning_rate": 1.970944873669047e-06, + "loss": 0.7319, + "step": 4082 + }, + { + "epoch": 0.1, + "learning_rate": 1.9709250052588838e-06, + "loss": 0.7734, + "step": 4083 + }, + { + "epoch": 0.1, + "learning_rate": 1.970905130158069e-06, + "loss": 0.8809, + "step": 4084 + }, + { + "epoch": 0.1, + "learning_rate": 1.9708852483667393e-06, + "loss": 0.8789, + "step": 4085 + }, + { + "epoch": 0.1, + "learning_rate": 1.970865359885033e-06, + "loss": 0.9688, + "step": 4086 + }, + { + "epoch": 0.1, + "learning_rate": 1.970845464713085e-06, + "loss": 0.7573, + "step": 4087 + }, + { + "epoch": 0.1, + "learning_rate": 1.9708255628510344e-06, + "loss": 1.1367, + "step": 4088 + }, + { + "epoch": 0.1, + "learning_rate": 1.970805654299017e-06, + "loss": 1.0801, + "step": 4089 + }, + { + "epoch": 0.1, + "learning_rate": 1.970785739057171e-06, + "loss": 1.0654, + "step": 4090 + }, + { + "epoch": 0.1, + "learning_rate": 1.9707658171256326e-06, + "loss": 0.8672, + "step": 4091 + }, + { + "epoch": 0.1, + "learning_rate": 1.9707458885045395e-06, + "loss": 1.0713, + "step": 4092 + }, + { + "epoch": 0.1, + "learning_rate": 1.9707259531940295e-06, + "loss": 0.9482, + "step": 4093 + }, + { + "epoch": 0.1, + "learning_rate": 1.97070601119424e-06, + "loss": 0.8809, + "step": 4094 + }, + { + "epoch": 0.1, + "learning_rate": 1.9706860625053078e-06, + "loss": 1.1396, + "step": 4095 + }, + { + "epoch": 0.1, + "learning_rate": 1.97066610712737e-06, + "loss": 0.9102, + "step": 4096 + }, + { + "epoch": 0.11, + "learning_rate": 1.970646145060565e-06, + "loss": 0.8091, + "step": 4097 + }, + { + "epoch": 0.11, + "learning_rate": 1.970626176305031e-06, + "loss": 0.8896, + "step": 4098 + }, + { + "epoch": 0.11, + "learning_rate": 1.970606200860904e-06, + "loss": 0.8682, + "step": 4099 + }, + { + "epoch": 0.11, + "learning_rate": 1.970586218728322e-06, + "loss": 0.7229, + "step": 4100 + }, + { + "epoch": 0.11, + "learning_rate": 1.9705662299074235e-06, + "loss": 0.9893, + "step": 4101 + }, + { + "epoch": 0.11, + "learning_rate": 1.9705462343983454e-06, + "loss": 1.0615, + "step": 4102 + }, + { + "epoch": 0.11, + "learning_rate": 1.970526232201226e-06, + "loss": 1.0566, + "step": 4103 + }, + { + "epoch": 0.11, + "learning_rate": 1.970506223316203e-06, + "loss": 0.8394, + "step": 4104 + }, + { + "epoch": 0.11, + "learning_rate": 1.9704862077434146e-06, + "loss": 0.8198, + "step": 4105 + }, + { + "epoch": 0.11, + "learning_rate": 1.970466185482998e-06, + "loss": 0.7607, + "step": 4106 + }, + { + "epoch": 0.11, + "learning_rate": 1.9704461565350923e-06, + "loss": 0.7827, + "step": 4107 + }, + { + "epoch": 0.11, + "learning_rate": 1.9704261208998337e-06, + "loss": 0.874, + "step": 4108 + }, + { + "epoch": 0.11, + "learning_rate": 1.9704060785773623e-06, + "loss": 0.9248, + "step": 4109 + }, + { + "epoch": 0.11, + "learning_rate": 1.9703860295678147e-06, + "loss": 1.0449, + "step": 4110 + }, + { + "epoch": 0.11, + "learning_rate": 1.97036597387133e-06, + "loss": 1.0264, + "step": 4111 + }, + { + "epoch": 0.11, + "learning_rate": 1.9703459114880458e-06, + "loss": 0.8535, + "step": 4112 + }, + { + "epoch": 0.11, + "learning_rate": 1.970325842418101e-06, + "loss": 0.9912, + "step": 4113 + }, + { + "epoch": 0.11, + "learning_rate": 1.970305766661633e-06, + "loss": 0.917, + "step": 4114 + }, + { + "epoch": 0.11, + "learning_rate": 1.9702856842187807e-06, + "loss": 0.8306, + "step": 4115 + }, + { + "epoch": 0.11, + "learning_rate": 1.970265595089683e-06, + "loss": 0.9561, + "step": 4116 + }, + { + "epoch": 0.11, + "learning_rate": 1.970245499274477e-06, + "loss": 1.0127, + "step": 4117 + }, + { + "epoch": 0.11, + "learning_rate": 1.970225396773302e-06, + "loss": 0.9302, + "step": 4118 + }, + { + "epoch": 0.11, + "learning_rate": 1.9702052875862967e-06, + "loss": 0.6108, + "step": 4119 + }, + { + "epoch": 0.11, + "learning_rate": 1.9701851717135997e-06, + "loss": 1.166, + "step": 4120 + }, + { + "epoch": 0.11, + "learning_rate": 1.970165049155349e-06, + "loss": 0.8994, + "step": 4121 + }, + { + "epoch": 0.11, + "learning_rate": 1.970144919911684e-06, + "loss": 0.9668, + "step": 4122 + }, + { + "epoch": 0.11, + "learning_rate": 1.9701247839827427e-06, + "loss": 0.875, + "step": 4123 + }, + { + "epoch": 0.11, + "learning_rate": 1.970104641368664e-06, + "loss": 0.5879, + "step": 4124 + }, + { + "epoch": 0.11, + "learning_rate": 1.970084492069587e-06, + "loss": 1.083, + "step": 4125 + }, + { + "epoch": 0.11, + "learning_rate": 1.970064336085651e-06, + "loss": 0.9561, + "step": 4126 + }, + { + "epoch": 0.11, + "learning_rate": 1.9700441734169937e-06, + "loss": 0.8184, + "step": 4127 + }, + { + "epoch": 0.11, + "learning_rate": 1.970024004063755e-06, + "loss": 0.8857, + "step": 4128 + }, + { + "epoch": 0.11, + "learning_rate": 1.970003828026073e-06, + "loss": 0.8442, + "step": 4129 + }, + { + "epoch": 0.11, + "learning_rate": 1.969983645304088e-06, + "loss": 0.8438, + "step": 4130 + }, + { + "epoch": 0.11, + "learning_rate": 1.969963455897938e-06, + "loss": 0.9004, + "step": 4131 + }, + { + "epoch": 0.11, + "learning_rate": 1.9699432598077627e-06, + "loss": 0.9053, + "step": 4132 + }, + { + "epoch": 0.11, + "learning_rate": 1.969923057033701e-06, + "loss": 1.0908, + "step": 4133 + }, + { + "epoch": 0.11, + "learning_rate": 1.969902847575892e-06, + "loss": 0.8467, + "step": 4134 + }, + { + "epoch": 0.11, + "learning_rate": 1.9698826314344756e-06, + "loss": 1.0869, + "step": 4135 + }, + { + "epoch": 0.11, + "learning_rate": 1.96986240860959e-06, + "loss": 1.0703, + "step": 4136 + }, + { + "epoch": 0.11, + "learning_rate": 1.969842179101376e-06, + "loss": 1.1797, + "step": 4137 + }, + { + "epoch": 0.11, + "learning_rate": 1.9698219429099713e-06, + "loss": 0.8652, + "step": 4138 + }, + { + "epoch": 0.11, + "learning_rate": 1.969801700035517e-06, + "loss": 0.7227, + "step": 4139 + }, + { + "epoch": 0.11, + "learning_rate": 1.9697814504781514e-06, + "loss": 0.8379, + "step": 4140 + }, + { + "epoch": 0.11, + "learning_rate": 1.969761194238015e-06, + "loss": 0.8564, + "step": 4141 + }, + { + "epoch": 0.11, + "learning_rate": 1.9697409313152465e-06, + "loss": 0.9795, + "step": 4142 + }, + { + "epoch": 0.11, + "learning_rate": 1.969720661709986e-06, + "loss": 0.8955, + "step": 4143 + }, + { + "epoch": 0.11, + "learning_rate": 1.969700385422373e-06, + "loss": 1.0068, + "step": 4144 + }, + { + "epoch": 0.11, + "learning_rate": 1.9696801024525472e-06, + "loss": 1.0479, + "step": 4145 + }, + { + "epoch": 0.11, + "learning_rate": 1.969659812800649e-06, + "loss": 1.0615, + "step": 4146 + }, + { + "epoch": 0.11, + "learning_rate": 1.969639516466817e-06, + "loss": 0.9736, + "step": 4147 + }, + { + "epoch": 0.11, + "learning_rate": 1.9696192134511923e-06, + "loss": 0.8096, + "step": 4148 + }, + { + "epoch": 0.11, + "learning_rate": 1.969598903753914e-06, + "loss": 0.9844, + "step": 4149 + }, + { + "epoch": 0.11, + "learning_rate": 1.969578587375123e-06, + "loss": 0.9385, + "step": 4150 + }, + { + "epoch": 0.11, + "learning_rate": 1.969558264314958e-06, + "loss": 1.0068, + "step": 4151 + }, + { + "epoch": 0.11, + "learning_rate": 1.9695379345735596e-06, + "loss": 0.8867, + "step": 4152 + }, + { + "epoch": 0.11, + "learning_rate": 1.9695175981510684e-06, + "loss": 0.9043, + "step": 4153 + }, + { + "epoch": 0.11, + "learning_rate": 1.969497255047624e-06, + "loss": 0.8574, + "step": 4154 + }, + { + "epoch": 0.11, + "learning_rate": 1.9694769052633666e-06, + "loss": 1.0039, + "step": 4155 + }, + { + "epoch": 0.11, + "learning_rate": 1.9694565487984364e-06, + "loss": 0.9297, + "step": 4156 + }, + { + "epoch": 0.11, + "learning_rate": 1.969436185652974e-06, + "loss": 0.9844, + "step": 4157 + }, + { + "epoch": 0.11, + "learning_rate": 1.9694158158271192e-06, + "loss": 0.96, + "step": 4158 + }, + { + "epoch": 0.11, + "learning_rate": 1.969395439321013e-06, + "loss": 1.0469, + "step": 4159 + }, + { + "epoch": 0.11, + "learning_rate": 1.9693750561347954e-06, + "loss": 0.9756, + "step": 4160 + }, + { + "epoch": 0.11, + "learning_rate": 1.969354666268607e-06, + "loss": 1.0986, + "step": 4161 + }, + { + "epoch": 0.11, + "learning_rate": 1.969334269722588e-06, + "loss": 0.7256, + "step": 4162 + }, + { + "epoch": 0.11, + "learning_rate": 1.9693138664968797e-06, + "loss": 0.9614, + "step": 4163 + }, + { + "epoch": 0.11, + "learning_rate": 1.9692934565916215e-06, + "loss": 0.9912, + "step": 4164 + }, + { + "epoch": 0.11, + "learning_rate": 1.969273040006956e-06, + "loss": 1.1162, + "step": 4165 + }, + { + "epoch": 0.11, + "learning_rate": 1.9692526167430215e-06, + "loss": 0.8979, + "step": 4166 + }, + { + "epoch": 0.11, + "learning_rate": 1.96923218679996e-06, + "loss": 0.877, + "step": 4167 + }, + { + "epoch": 0.11, + "learning_rate": 1.9692117501779127e-06, + "loss": 0.9385, + "step": 4168 + }, + { + "epoch": 0.11, + "learning_rate": 1.9691913068770198e-06, + "loss": 0.731, + "step": 4169 + }, + { + "epoch": 0.11, + "learning_rate": 1.9691708568974224e-06, + "loss": 1.1953, + "step": 4170 + }, + { + "epoch": 0.11, + "learning_rate": 1.9691504002392608e-06, + "loss": 1.0586, + "step": 4171 + }, + { + "epoch": 0.11, + "learning_rate": 1.9691299369026767e-06, + "loss": 0.9844, + "step": 4172 + }, + { + "epoch": 0.11, + "learning_rate": 1.969109466887811e-06, + "loss": 0.9229, + "step": 4173 + }, + { + "epoch": 0.11, + "learning_rate": 1.969088990194805e-06, + "loss": 1.0283, + "step": 4174 + }, + { + "epoch": 0.11, + "learning_rate": 1.9690685068237986e-06, + "loss": 0.8535, + "step": 4175 + }, + { + "epoch": 0.11, + "learning_rate": 1.9690480167749346e-06, + "loss": 0.875, + "step": 4176 + }, + { + "epoch": 0.11, + "learning_rate": 1.969027520048353e-06, + "loss": 0.9121, + "step": 4177 + }, + { + "epoch": 0.11, + "learning_rate": 1.9690070166441954e-06, + "loss": 0.9619, + "step": 4178 + }, + { + "epoch": 0.11, + "learning_rate": 1.968986506562603e-06, + "loss": 0.9756, + "step": 4179 + }, + { + "epoch": 0.11, + "learning_rate": 1.9689659898037173e-06, + "loss": 0.9092, + "step": 4180 + }, + { + "epoch": 0.11, + "learning_rate": 1.96894546636768e-06, + "loss": 0.7373, + "step": 4181 + }, + { + "epoch": 0.11, + "learning_rate": 1.968924936254632e-06, + "loss": 0.9287, + "step": 4182 + }, + { + "epoch": 0.11, + "learning_rate": 1.9689043994647148e-06, + "loss": 0.9824, + "step": 4183 + }, + { + "epoch": 0.11, + "learning_rate": 1.9688838559980702e-06, + "loss": 0.9951, + "step": 4184 + }, + { + "epoch": 0.11, + "learning_rate": 1.9688633058548397e-06, + "loss": 0.9268, + "step": 4185 + }, + { + "epoch": 0.11, + "learning_rate": 1.968842749035165e-06, + "loss": 0.9668, + "step": 4186 + }, + { + "epoch": 0.11, + "learning_rate": 1.9688221855391873e-06, + "loss": 0.8438, + "step": 4187 + }, + { + "epoch": 0.11, + "learning_rate": 1.9688016153670483e-06, + "loss": 0.7729, + "step": 4188 + }, + { + "epoch": 0.11, + "learning_rate": 1.9687810385188904e-06, + "loss": 0.7739, + "step": 4189 + }, + { + "epoch": 0.11, + "learning_rate": 1.968760454994855e-06, + "loss": 0.8457, + "step": 4190 + }, + { + "epoch": 0.11, + "learning_rate": 1.968739864795084e-06, + "loss": 0.6318, + "step": 4191 + }, + { + "epoch": 0.11, + "learning_rate": 1.9687192679197194e-06, + "loss": 0.7949, + "step": 4192 + }, + { + "epoch": 0.11, + "learning_rate": 1.9686986643689033e-06, + "loss": 0.9941, + "step": 4193 + }, + { + "epoch": 0.11, + "learning_rate": 1.968678054142777e-06, + "loss": 0.7578, + "step": 4194 + }, + { + "epoch": 0.11, + "learning_rate": 1.9686574372414827e-06, + "loss": 0.7505, + "step": 4195 + }, + { + "epoch": 0.11, + "learning_rate": 1.968636813665163e-06, + "loss": 1.0195, + "step": 4196 + }, + { + "epoch": 0.11, + "learning_rate": 1.9686161834139594e-06, + "loss": 0.9824, + "step": 4197 + }, + { + "epoch": 0.11, + "learning_rate": 1.9685955464880145e-06, + "loss": 1.0107, + "step": 4198 + }, + { + "epoch": 0.11, + "learning_rate": 1.9685749028874706e-06, + "loss": 0.9053, + "step": 4199 + }, + { + "epoch": 0.11, + "learning_rate": 1.9685542526124698e-06, + "loss": 0.7881, + "step": 4200 + }, + { + "epoch": 0.11, + "learning_rate": 1.968533595663154e-06, + "loss": 0.7734, + "step": 4201 + }, + { + "epoch": 0.11, + "learning_rate": 1.968512932039666e-06, + "loss": 1.0234, + "step": 4202 + }, + { + "epoch": 0.11, + "learning_rate": 1.968492261742148e-06, + "loss": 0.9424, + "step": 4203 + }, + { + "epoch": 0.11, + "learning_rate": 1.9684715847707425e-06, + "loss": 0.9141, + "step": 4204 + }, + { + "epoch": 0.11, + "learning_rate": 1.968450901125592e-06, + "loss": 1.0635, + "step": 4205 + }, + { + "epoch": 0.11, + "learning_rate": 1.9684302108068393e-06, + "loss": 1.0596, + "step": 4206 + }, + { + "epoch": 0.11, + "learning_rate": 1.968409513814626e-06, + "loss": 0.8389, + "step": 4207 + }, + { + "epoch": 0.11, + "learning_rate": 1.9683888101490964e-06, + "loss": 1.0693, + "step": 4208 + }, + { + "epoch": 0.11, + "learning_rate": 1.9683680998103912e-06, + "loss": 0.8076, + "step": 4209 + }, + { + "epoch": 0.11, + "learning_rate": 1.9683473827986547e-06, + "loss": 0.9678, + "step": 4210 + }, + { + "epoch": 0.11, + "learning_rate": 1.968326659114029e-06, + "loss": 1.0166, + "step": 4211 + }, + { + "epoch": 0.11, + "learning_rate": 1.968305928756657e-06, + "loss": 0.877, + "step": 4212 + }, + { + "epoch": 0.11, + "learning_rate": 1.9682851917266815e-06, + "loss": 0.9639, + "step": 4213 + }, + { + "epoch": 0.11, + "learning_rate": 1.968264448024245e-06, + "loss": 0.9414, + "step": 4214 + }, + { + "epoch": 0.11, + "learning_rate": 1.968243697649492e-06, + "loss": 0.9199, + "step": 4215 + }, + { + "epoch": 0.11, + "learning_rate": 1.9682229406025634e-06, + "loss": 0.8164, + "step": 4216 + }, + { + "epoch": 0.11, + "learning_rate": 1.968202176883603e-06, + "loss": 0.9258, + "step": 4217 + }, + { + "epoch": 0.11, + "learning_rate": 1.968181406492755e-06, + "loss": 0.8662, + "step": 4218 + }, + { + "epoch": 0.11, + "learning_rate": 1.968160629430161e-06, + "loss": 0.894, + "step": 4219 + }, + { + "epoch": 0.11, + "learning_rate": 1.968139845695965e-06, + "loss": 1.1016, + "step": 4220 + }, + { + "epoch": 0.11, + "learning_rate": 1.9681190552903096e-06, + "loss": 0.8984, + "step": 4221 + }, + { + "epoch": 0.11, + "learning_rate": 1.968098258213339e-06, + "loss": 1.0225, + "step": 4222 + }, + { + "epoch": 0.11, + "learning_rate": 1.9680774544651956e-06, + "loss": 0.7485, + "step": 4223 + }, + { + "epoch": 0.11, + "learning_rate": 1.9680566440460237e-06, + "loss": 0.7822, + "step": 4224 + }, + { + "epoch": 0.11, + "learning_rate": 1.968035826955966e-06, + "loss": 0.8774, + "step": 4225 + }, + { + "epoch": 0.11, + "learning_rate": 1.9680150031951657e-06, + "loss": 1.0625, + "step": 4226 + }, + { + "epoch": 0.11, + "learning_rate": 1.9679941727637667e-06, + "loss": 1.0195, + "step": 4227 + }, + { + "epoch": 0.11, + "learning_rate": 1.967973335661913e-06, + "loss": 0.8022, + "step": 4228 + }, + { + "epoch": 0.11, + "learning_rate": 1.9679524918897473e-06, + "loss": 0.606, + "step": 4229 + }, + { + "epoch": 0.11, + "learning_rate": 1.967931641447414e-06, + "loss": 1.0977, + "step": 4230 + }, + { + "epoch": 0.11, + "learning_rate": 1.967910784335056e-06, + "loss": 0.9805, + "step": 4231 + }, + { + "epoch": 0.11, + "learning_rate": 1.967889920552818e-06, + "loss": 0.9307, + "step": 4232 + }, + { + "epoch": 0.11, + "learning_rate": 1.967869050100843e-06, + "loss": 0.9131, + "step": 4233 + }, + { + "epoch": 0.11, + "learning_rate": 1.967848172979275e-06, + "loss": 0.999, + "step": 4234 + }, + { + "epoch": 0.11, + "learning_rate": 1.967827289188258e-06, + "loss": 0.9873, + "step": 4235 + }, + { + "epoch": 0.11, + "learning_rate": 1.967806398727936e-06, + "loss": 0.8105, + "step": 4236 + }, + { + "epoch": 0.11, + "learning_rate": 1.9677855015984528e-06, + "loss": 0.9258, + "step": 4237 + }, + { + "epoch": 0.11, + "learning_rate": 1.967764597799952e-06, + "loss": 0.8042, + "step": 4238 + }, + { + "epoch": 0.11, + "learning_rate": 1.967743687332578e-06, + "loss": 0.959, + "step": 4239 + }, + { + "epoch": 0.11, + "learning_rate": 1.9677227701964757e-06, + "loss": 0.9199, + "step": 4240 + }, + { + "epoch": 0.11, + "learning_rate": 1.967701846391788e-06, + "loss": 0.8174, + "step": 4241 + }, + { + "epoch": 0.11, + "learning_rate": 1.9676809159186595e-06, + "loss": 1.0625, + "step": 4242 + }, + { + "epoch": 0.11, + "learning_rate": 1.9676599787772346e-06, + "loss": 0.9053, + "step": 4243 + }, + { + "epoch": 0.11, + "learning_rate": 1.9676390349676576e-06, + "loss": 1.0273, + "step": 4244 + }, + { + "epoch": 0.11, + "learning_rate": 1.9676180844900725e-06, + "loss": 0.8516, + "step": 4245 + }, + { + "epoch": 0.11, + "learning_rate": 1.9675971273446237e-06, + "loss": 0.8772, + "step": 4246 + }, + { + "epoch": 0.11, + "learning_rate": 1.967576163531456e-06, + "loss": 1.1572, + "step": 4247 + }, + { + "epoch": 0.11, + "learning_rate": 1.967555193050714e-06, + "loss": 0.917, + "step": 4248 + }, + { + "epoch": 0.11, + "learning_rate": 1.967534215902541e-06, + "loss": 1.0107, + "step": 4249 + }, + { + "epoch": 0.11, + "learning_rate": 1.967513232087083e-06, + "loss": 1.0303, + "step": 4250 + }, + { + "epoch": 0.11, + "learning_rate": 1.967492241604484e-06, + "loss": 0.9229, + "step": 4251 + }, + { + "epoch": 0.11, + "learning_rate": 1.967471244454889e-06, + "loss": 1.0859, + "step": 4252 + }, + { + "epoch": 0.11, + "learning_rate": 1.9674502406384415e-06, + "loss": 1.0605, + "step": 4253 + }, + { + "epoch": 0.11, + "learning_rate": 1.9674292301552878e-06, + "loss": 0.9468, + "step": 4254 + }, + { + "epoch": 0.11, + "learning_rate": 1.9674082130055714e-06, + "loss": 1.291, + "step": 4255 + }, + { + "epoch": 0.11, + "learning_rate": 1.967387189189438e-06, + "loss": 1.082, + "step": 4256 + }, + { + "epoch": 0.11, + "learning_rate": 1.9673661587070326e-06, + "loss": 1.0449, + "step": 4257 + }, + { + "epoch": 0.11, + "learning_rate": 1.967345121558499e-06, + "loss": 0.9941, + "step": 4258 + }, + { + "epoch": 0.11, + "learning_rate": 1.967324077743983e-06, + "loss": 1.1279, + "step": 4259 + }, + { + "epoch": 0.11, + "learning_rate": 1.9673030272636295e-06, + "loss": 0.7354, + "step": 4260 + }, + { + "epoch": 0.11, + "learning_rate": 1.9672819701175837e-06, + "loss": 0.9336, + "step": 4261 + }, + { + "epoch": 0.11, + "learning_rate": 1.9672609063059907e-06, + "loss": 0.9531, + "step": 4262 + }, + { + "epoch": 0.11, + "learning_rate": 1.967239835828995e-06, + "loss": 0.7742, + "step": 4263 + }, + { + "epoch": 0.11, + "learning_rate": 1.9672187586867426e-06, + "loss": 0.752, + "step": 4264 + }, + { + "epoch": 0.11, + "learning_rate": 1.9671976748793784e-06, + "loss": 0.8975, + "step": 4265 + }, + { + "epoch": 0.11, + "learning_rate": 1.9671765844070478e-06, + "loss": 0.9912, + "step": 4266 + }, + { + "epoch": 0.11, + "learning_rate": 1.967155487269896e-06, + "loss": 0.7002, + "step": 4267 + }, + { + "epoch": 0.11, + "learning_rate": 1.967134383468068e-06, + "loss": 0.9795, + "step": 4268 + }, + { + "epoch": 0.11, + "learning_rate": 1.96711327300171e-06, + "loss": 1.043, + "step": 4269 + }, + { + "epoch": 0.11, + "learning_rate": 1.9670921558709673e-06, + "loss": 0.7002, + "step": 4270 + }, + { + "epoch": 0.11, + "learning_rate": 1.967071032075985e-06, + "loss": 1.1182, + "step": 4271 + }, + { + "epoch": 0.11, + "learning_rate": 1.967049901616909e-06, + "loss": 0.9805, + "step": 4272 + }, + { + "epoch": 0.11, + "learning_rate": 1.967028764493885e-06, + "loss": 1.2305, + "step": 4273 + }, + { + "epoch": 0.11, + "learning_rate": 1.9670076207070583e-06, + "loss": 0.8701, + "step": 4274 + }, + { + "epoch": 0.11, + "learning_rate": 1.9669864702565746e-06, + "loss": 1.0898, + "step": 4275 + }, + { + "epoch": 0.11, + "learning_rate": 1.96696531314258e-06, + "loss": 0.7871, + "step": 4276 + }, + { + "epoch": 0.11, + "learning_rate": 1.9669441493652204e-06, + "loss": 0.9797, + "step": 4277 + }, + { + "epoch": 0.11, + "learning_rate": 1.966922978924641e-06, + "loss": 0.9766, + "step": 4278 + }, + { + "epoch": 0.11, + "learning_rate": 1.966901801820988e-06, + "loss": 0.8799, + "step": 4279 + }, + { + "epoch": 0.11, + "learning_rate": 1.9668806180544074e-06, + "loss": 1.0547, + "step": 4280 + }, + { + "epoch": 0.11, + "learning_rate": 1.9668594276250456e-06, + "loss": 0.7957, + "step": 4281 + }, + { + "epoch": 0.11, + "learning_rate": 1.966838230533048e-06, + "loss": 0.9912, + "step": 4282 + }, + { + "epoch": 0.11, + "learning_rate": 1.9668170267785606e-06, + "loss": 1.0234, + "step": 4283 + }, + { + "epoch": 0.11, + "learning_rate": 1.9667958163617297e-06, + "loss": 0.9336, + "step": 4284 + }, + { + "epoch": 0.11, + "learning_rate": 1.9667745992827017e-06, + "loss": 0.918, + "step": 4285 + }, + { + "epoch": 0.11, + "learning_rate": 1.9667533755416224e-06, + "loss": 0.7212, + "step": 4286 + }, + { + "epoch": 0.11, + "learning_rate": 1.9667321451386387e-06, + "loss": 0.5596, + "step": 4287 + }, + { + "epoch": 0.11, + "learning_rate": 1.9667109080738963e-06, + "loss": 0.9756, + "step": 4288 + }, + { + "epoch": 0.11, + "learning_rate": 1.966689664347542e-06, + "loss": 0.8882, + "step": 4289 + }, + { + "epoch": 0.11, + "learning_rate": 1.966668413959721e-06, + "loss": 1.0371, + "step": 4290 + }, + { + "epoch": 0.11, + "learning_rate": 1.966647156910582e-06, + "loss": 0.8398, + "step": 4291 + }, + { + "epoch": 0.11, + "learning_rate": 1.9666258932002692e-06, + "loss": 0.9688, + "step": 4292 + }, + { + "epoch": 0.11, + "learning_rate": 1.9666046228289306e-06, + "loss": 0.9736, + "step": 4293 + }, + { + "epoch": 0.11, + "learning_rate": 1.9665833457967115e-06, + "loss": 1.0684, + "step": 4294 + }, + { + "epoch": 0.11, + "learning_rate": 1.96656206210376e-06, + "loss": 0.7754, + "step": 4295 + }, + { + "epoch": 0.11, + "learning_rate": 1.9665407717502217e-06, + "loss": 0.8623, + "step": 4296 + }, + { + "epoch": 0.11, + "learning_rate": 1.966519474736244e-06, + "loss": 1.0107, + "step": 4297 + }, + { + "epoch": 0.11, + "learning_rate": 1.9664981710619727e-06, + "loss": 1.0234, + "step": 4298 + }, + { + "epoch": 0.11, + "learning_rate": 1.9664768607275556e-06, + "loss": 1.043, + "step": 4299 + }, + { + "epoch": 0.11, + "learning_rate": 1.966455543733139e-06, + "loss": 0.8408, + "step": 4300 + }, + { + "epoch": 0.11, + "learning_rate": 1.9664342200788697e-06, + "loss": 0.9243, + "step": 4301 + }, + { + "epoch": 0.11, + "learning_rate": 1.9664128897648953e-06, + "loss": 0.9922, + "step": 4302 + }, + { + "epoch": 0.11, + "learning_rate": 1.9663915527913623e-06, + "loss": 0.9316, + "step": 4303 + }, + { + "epoch": 0.11, + "learning_rate": 1.966370209158418e-06, + "loss": 1.0244, + "step": 4304 + }, + { + "epoch": 0.11, + "learning_rate": 1.966348858866209e-06, + "loss": 0.9316, + "step": 4305 + }, + { + "epoch": 0.11, + "learning_rate": 1.9663275019148827e-06, + "loss": 1.0107, + "step": 4306 + }, + { + "epoch": 0.11, + "learning_rate": 1.9663061383045864e-06, + "loss": 1.0469, + "step": 4307 + }, + { + "epoch": 0.11, + "learning_rate": 1.966284768035467e-06, + "loss": 0.7871, + "step": 4308 + }, + { + "epoch": 0.11, + "learning_rate": 1.9662633911076723e-06, + "loss": 0.9307, + "step": 4309 + }, + { + "epoch": 0.11, + "learning_rate": 1.966242007521349e-06, + "loss": 1.0068, + "step": 4310 + }, + { + "epoch": 0.11, + "learning_rate": 1.966220617276645e-06, + "loss": 0.9229, + "step": 4311 + }, + { + "epoch": 0.11, + "learning_rate": 1.966199220373707e-06, + "loss": 0.7954, + "step": 4312 + }, + { + "epoch": 0.11, + "learning_rate": 1.966177816812683e-06, + "loss": 1.0498, + "step": 4313 + }, + { + "epoch": 0.11, + "learning_rate": 1.9661564065937205e-06, + "loss": 0.8594, + "step": 4314 + }, + { + "epoch": 0.11, + "learning_rate": 1.966134989716967e-06, + "loss": 0.832, + "step": 4315 + }, + { + "epoch": 0.11, + "learning_rate": 1.96611356618257e-06, + "loss": 1.0068, + "step": 4316 + }, + { + "epoch": 0.11, + "learning_rate": 1.966092135990677e-06, + "loss": 0.981, + "step": 4317 + }, + { + "epoch": 0.11, + "learning_rate": 1.966070699141436e-06, + "loss": 0.915, + "step": 4318 + }, + { + "epoch": 0.11, + "learning_rate": 1.9660492556349943e-06, + "loss": 0.7178, + "step": 4319 + }, + { + "epoch": 0.11, + "learning_rate": 1.9660278054714995e-06, + "loss": 0.9521, + "step": 4320 + }, + { + "epoch": 0.11, + "learning_rate": 1.9660063486511003e-06, + "loss": 0.8682, + "step": 4321 + }, + { + "epoch": 0.11, + "learning_rate": 1.965984885173944e-06, + "loss": 0.7876, + "step": 4322 + }, + { + "epoch": 0.11, + "learning_rate": 1.9659634150401784e-06, + "loss": 1.0752, + "step": 4323 + }, + { + "epoch": 0.11, + "learning_rate": 1.9659419382499518e-06, + "loss": 0.873, + "step": 4324 + }, + { + "epoch": 0.11, + "learning_rate": 1.965920454803412e-06, + "loss": 0.9727, + "step": 4325 + }, + { + "epoch": 0.11, + "learning_rate": 1.965898964700707e-06, + "loss": 1.0068, + "step": 4326 + }, + { + "epoch": 0.11, + "learning_rate": 1.965877467941985e-06, + "loss": 0.8013, + "step": 4327 + }, + { + "epoch": 0.11, + "learning_rate": 1.9658559645273937e-06, + "loss": 0.7939, + "step": 4328 + }, + { + "epoch": 0.11, + "learning_rate": 1.965834454457082e-06, + "loss": 0.8613, + "step": 4329 + }, + { + "epoch": 0.11, + "learning_rate": 1.9658129377311975e-06, + "loss": 0.8359, + "step": 4330 + }, + { + "epoch": 0.11, + "learning_rate": 1.9657914143498893e-06, + "loss": 0.75, + "step": 4331 + }, + { + "epoch": 0.11, + "learning_rate": 1.9657698843133047e-06, + "loss": 0.833, + "step": 4332 + }, + { + "epoch": 0.11, + "learning_rate": 1.965748347621593e-06, + "loss": 0.7847, + "step": 4333 + }, + { + "epoch": 0.11, + "learning_rate": 1.9657268042749015e-06, + "loss": 0.9785, + "step": 4334 + }, + { + "epoch": 0.11, + "learning_rate": 1.9657052542733793e-06, + "loss": 0.9102, + "step": 4335 + }, + { + "epoch": 0.11, + "learning_rate": 1.9656836976171754e-06, + "loss": 1.335, + "step": 4336 + }, + { + "epoch": 0.11, + "learning_rate": 1.9656621343064376e-06, + "loss": 0.9014, + "step": 4337 + }, + { + "epoch": 0.11, + "learning_rate": 1.965640564341315e-06, + "loss": 0.9253, + "step": 4338 + }, + { + "epoch": 0.11, + "learning_rate": 1.9656189877219556e-06, + "loss": 0.9023, + "step": 4339 + }, + { + "epoch": 0.11, + "learning_rate": 1.965597404448509e-06, + "loss": 0.8857, + "step": 4340 + }, + { + "epoch": 0.11, + "learning_rate": 1.9655758145211226e-06, + "loss": 0.7158, + "step": 4341 + }, + { + "epoch": 0.11, + "learning_rate": 1.9655542179399467e-06, + "loss": 1.0186, + "step": 4342 + }, + { + "epoch": 0.11, + "learning_rate": 1.9655326147051287e-06, + "loss": 1.1797, + "step": 4343 + }, + { + "epoch": 0.11, + "learning_rate": 1.9655110048168186e-06, + "loss": 0.8462, + "step": 4344 + }, + { + "epoch": 0.11, + "learning_rate": 1.9654893882751647e-06, + "loss": 1.0371, + "step": 4345 + }, + { + "epoch": 0.11, + "learning_rate": 1.965467765080316e-06, + "loss": 0.749, + "step": 4346 + }, + { + "epoch": 0.11, + "learning_rate": 1.965446135232422e-06, + "loss": 0.8506, + "step": 4347 + }, + { + "epoch": 0.11, + "learning_rate": 1.9654244987316315e-06, + "loss": 1.0898, + "step": 4348 + }, + { + "epoch": 0.11, + "learning_rate": 1.9654028555780934e-06, + "loss": 0.7068, + "step": 4349 + }, + { + "epoch": 0.11, + "learning_rate": 1.9653812057719564e-06, + "loss": 0.9102, + "step": 4350 + }, + { + "epoch": 0.11, + "learning_rate": 1.965359549313371e-06, + "loss": 0.9521, + "step": 4351 + }, + { + "epoch": 0.11, + "learning_rate": 1.965337886202485e-06, + "loss": 0.9463, + "step": 4352 + }, + { + "epoch": 0.11, + "learning_rate": 1.9653162164394487e-06, + "loss": 0.7939, + "step": 4353 + }, + { + "epoch": 0.11, + "learning_rate": 1.965294540024411e-06, + "loss": 0.915, + "step": 4354 + }, + { + "epoch": 0.11, + "learning_rate": 1.965272856957521e-06, + "loss": 0.9463, + "step": 4355 + }, + { + "epoch": 0.11, + "learning_rate": 1.9652511672389286e-06, + "loss": 1.0742, + "step": 4356 + }, + { + "epoch": 0.11, + "learning_rate": 1.9652294708687833e-06, + "loss": 0.8271, + "step": 4357 + }, + { + "epoch": 0.11, + "learning_rate": 1.9652077678472347e-06, + "loss": 1.1113, + "step": 4358 + }, + { + "epoch": 0.11, + "learning_rate": 1.9651860581744315e-06, + "loss": 1.0225, + "step": 4359 + }, + { + "epoch": 0.11, + "learning_rate": 1.965164341850524e-06, + "loss": 0.8398, + "step": 4360 + }, + { + "epoch": 0.11, + "learning_rate": 1.965142618875662e-06, + "loss": 0.8193, + "step": 4361 + }, + { + "epoch": 0.11, + "learning_rate": 1.9651208892499945e-06, + "loss": 1.0479, + "step": 4362 + }, + { + "epoch": 0.11, + "learning_rate": 1.9650991529736723e-06, + "loss": 0.8623, + "step": 4363 + }, + { + "epoch": 0.11, + "learning_rate": 1.965077410046844e-06, + "loss": 0.8809, + "step": 4364 + }, + { + "epoch": 0.11, + "learning_rate": 1.96505566046966e-06, + "loss": 0.7996, + "step": 4365 + }, + { + "epoch": 0.11, + "learning_rate": 1.9650339042422705e-06, + "loss": 0.9121, + "step": 4366 + }, + { + "epoch": 0.11, + "learning_rate": 1.965012141364825e-06, + "loss": 0.6411, + "step": 4367 + }, + { + "epoch": 0.11, + "learning_rate": 1.9649903718374735e-06, + "loss": 0.8315, + "step": 4368 + }, + { + "epoch": 0.11, + "learning_rate": 1.964968595660366e-06, + "loss": 1.0449, + "step": 4369 + }, + { + "epoch": 0.11, + "learning_rate": 1.964946812833653e-06, + "loss": 0.9277, + "step": 4370 + }, + { + "epoch": 0.11, + "learning_rate": 1.9649250233574833e-06, + "loss": 1.0576, + "step": 4371 + }, + { + "epoch": 0.11, + "learning_rate": 1.9649032272320087e-06, + "loss": 1.083, + "step": 4372 + }, + { + "epoch": 0.11, + "learning_rate": 1.9648814244573783e-06, + "loss": 1.0371, + "step": 4373 + }, + { + "epoch": 0.11, + "learning_rate": 1.964859615033743e-06, + "loss": 0.9893, + "step": 4374 + }, + { + "epoch": 0.11, + "learning_rate": 1.9648377989612527e-06, + "loss": 0.9736, + "step": 4375 + }, + { + "epoch": 0.11, + "learning_rate": 1.9648159762400578e-06, + "loss": 0.9004, + "step": 4376 + }, + { + "epoch": 0.11, + "learning_rate": 1.9647941468703085e-06, + "loss": 1.0762, + "step": 4377 + }, + { + "epoch": 0.11, + "learning_rate": 1.9647723108521557e-06, + "loss": 1.0322, + "step": 4378 + }, + { + "epoch": 0.11, + "learning_rate": 1.96475046818575e-06, + "loss": 0.9692, + "step": 4379 + }, + { + "epoch": 0.11, + "learning_rate": 1.964728618871241e-06, + "loss": 0.8643, + "step": 4380 + }, + { + "epoch": 0.11, + "learning_rate": 1.96470676290878e-06, + "loss": 1.0488, + "step": 4381 + }, + { + "epoch": 0.11, + "learning_rate": 1.964684900298517e-06, + "loss": 1.001, + "step": 4382 + }, + { + "epoch": 0.11, + "learning_rate": 1.9646630310406036e-06, + "loss": 0.9492, + "step": 4383 + }, + { + "epoch": 0.11, + "learning_rate": 1.96464115513519e-06, + "loss": 0.6587, + "step": 4384 + }, + { + "epoch": 0.11, + "learning_rate": 1.9646192725824265e-06, + "loss": 0.958, + "step": 4385 + }, + { + "epoch": 0.11, + "learning_rate": 1.9645973833824647e-06, + "loss": 0.9258, + "step": 4386 + }, + { + "epoch": 0.11, + "learning_rate": 1.964575487535455e-06, + "loss": 0.6914, + "step": 4387 + }, + { + "epoch": 0.11, + "learning_rate": 1.964553585041548e-06, + "loss": 1.1113, + "step": 4388 + }, + { + "epoch": 0.11, + "learning_rate": 1.964531675900895e-06, + "loss": 1.0508, + "step": 4389 + }, + { + "epoch": 0.11, + "learning_rate": 1.9645097601136475e-06, + "loss": 0.998, + "step": 4390 + }, + { + "epoch": 0.11, + "learning_rate": 1.9644878376799555e-06, + "loss": 1.001, + "step": 4391 + }, + { + "epoch": 0.11, + "learning_rate": 1.9644659085999704e-06, + "loss": 1.04, + "step": 4392 + }, + { + "epoch": 0.11, + "learning_rate": 1.9644439728738437e-06, + "loss": 1.0615, + "step": 4393 + }, + { + "epoch": 0.11, + "learning_rate": 1.9644220305017263e-06, + "loss": 0.9648, + "step": 4394 + }, + { + "epoch": 0.11, + "learning_rate": 1.9644000814837693e-06, + "loss": 1.0234, + "step": 4395 + }, + { + "epoch": 0.11, + "learning_rate": 1.964378125820124e-06, + "loss": 1.0264, + "step": 4396 + }, + { + "epoch": 0.11, + "learning_rate": 1.9643561635109414e-06, + "loss": 0.8701, + "step": 4397 + }, + { + "epoch": 0.11, + "learning_rate": 1.964334194556374e-06, + "loss": 0.8916, + "step": 4398 + }, + { + "epoch": 0.11, + "learning_rate": 1.964312218956572e-06, + "loss": 1.0205, + "step": 4399 + }, + { + "epoch": 0.11, + "learning_rate": 1.964290236711687e-06, + "loss": 0.7769, + "step": 4400 + }, + { + "epoch": 0.11, + "learning_rate": 1.964268247821871e-06, + "loss": 0.6143, + "step": 4401 + }, + { + "epoch": 0.11, + "learning_rate": 1.9642462522872753e-06, + "loss": 1.0361, + "step": 4402 + }, + { + "epoch": 0.11, + "learning_rate": 1.964224250108051e-06, + "loss": 0.9717, + "step": 4403 + }, + { + "epoch": 0.11, + "learning_rate": 1.9642022412843504e-06, + "loss": 0.9336, + "step": 4404 + }, + { + "epoch": 0.11, + "learning_rate": 1.9641802258163245e-06, + "loss": 1.0068, + "step": 4405 + }, + { + "epoch": 0.11, + "learning_rate": 1.9641582037041257e-06, + "loss": 1.0283, + "step": 4406 + }, + { + "epoch": 0.11, + "learning_rate": 1.9641361749479054e-06, + "loss": 1.0059, + "step": 4407 + }, + { + "epoch": 0.11, + "learning_rate": 1.9641141395478157e-06, + "loss": 0.8994, + "step": 4408 + }, + { + "epoch": 0.11, + "learning_rate": 1.964092097504008e-06, + "loss": 1.207, + "step": 4409 + }, + { + "epoch": 0.11, + "learning_rate": 1.9640700488166344e-06, + "loss": 0.9023, + "step": 4410 + }, + { + "epoch": 0.11, + "learning_rate": 1.9640479934858463e-06, + "loss": 1.0703, + "step": 4411 + }, + { + "epoch": 0.11, + "learning_rate": 1.9640259315117967e-06, + "loss": 0.9844, + "step": 4412 + }, + { + "epoch": 0.11, + "learning_rate": 1.964003862894637e-06, + "loss": 1.0625, + "step": 4413 + }, + { + "epoch": 0.11, + "learning_rate": 1.9639817876345194e-06, + "loss": 0.9414, + "step": 4414 + }, + { + "epoch": 0.11, + "learning_rate": 1.9639597057315963e-06, + "loss": 1.0703, + "step": 4415 + }, + { + "epoch": 0.11, + "learning_rate": 1.963937617186019e-06, + "loss": 0.8267, + "step": 4416 + }, + { + "epoch": 0.11, + "learning_rate": 1.963915521997941e-06, + "loss": 0.6824, + "step": 4417 + }, + { + "epoch": 0.11, + "learning_rate": 1.9638934201675133e-06, + "loss": 1.0137, + "step": 4418 + }, + { + "epoch": 0.11, + "learning_rate": 1.9638713116948886e-06, + "loss": 1.0693, + "step": 4419 + }, + { + "epoch": 0.11, + "learning_rate": 1.96384919658022e-06, + "loss": 1.04, + "step": 4420 + }, + { + "epoch": 0.11, + "learning_rate": 1.963827074823659e-06, + "loss": 0.833, + "step": 4421 + }, + { + "epoch": 0.11, + "learning_rate": 1.9638049464253584e-06, + "loss": 1.0342, + "step": 4422 + }, + { + "epoch": 0.11, + "learning_rate": 1.963782811385471e-06, + "loss": 1.1064, + "step": 4423 + }, + { + "epoch": 0.11, + "learning_rate": 1.9637606697041483e-06, + "loss": 0.8237, + "step": 4424 + }, + { + "epoch": 0.11, + "learning_rate": 1.9637385213815437e-06, + "loss": 0.7256, + "step": 4425 + }, + { + "epoch": 0.11, + "learning_rate": 1.96371636641781e-06, + "loss": 1.0205, + "step": 4426 + }, + { + "epoch": 0.11, + "learning_rate": 1.963694204813099e-06, + "loss": 0.876, + "step": 4427 + }, + { + "epoch": 0.11, + "learning_rate": 1.9636720365675647e-06, + "loss": 0.9658, + "step": 4428 + }, + { + "epoch": 0.11, + "learning_rate": 1.963649861681359e-06, + "loss": 0.6602, + "step": 4429 + }, + { + "epoch": 0.11, + "learning_rate": 1.963627680154634e-06, + "loss": 0.7637, + "step": 4430 + }, + { + "epoch": 0.11, + "learning_rate": 1.963605491987544e-06, + "loss": 1.0029, + "step": 4431 + }, + { + "epoch": 0.11, + "learning_rate": 1.9635832971802414e-06, + "loss": 1.0508, + "step": 4432 + }, + { + "epoch": 0.11, + "learning_rate": 1.963561095732879e-06, + "loss": 0.9639, + "step": 4433 + }, + { + "epoch": 0.11, + "learning_rate": 1.9635388876456094e-06, + "loss": 0.6597, + "step": 4434 + }, + { + "epoch": 0.11, + "learning_rate": 1.9635166729185863e-06, + "loss": 0.9248, + "step": 4435 + }, + { + "epoch": 0.11, + "learning_rate": 1.9634944515519625e-06, + "loss": 0.707, + "step": 4436 + }, + { + "epoch": 0.11, + "learning_rate": 1.963472223545891e-06, + "loss": 1.0088, + "step": 4437 + }, + { + "epoch": 0.11, + "learning_rate": 1.963449988900526e-06, + "loss": 0.8848, + "step": 4438 + }, + { + "epoch": 0.11, + "learning_rate": 1.9634277476160188e-06, + "loss": 1.0073, + "step": 4439 + }, + { + "epoch": 0.11, + "learning_rate": 1.963405499692524e-06, + "loss": 1.0625, + "step": 4440 + }, + { + "epoch": 0.11, + "learning_rate": 1.9633832451301947e-06, + "loss": 0.8135, + "step": 4441 + }, + { + "epoch": 0.11, + "learning_rate": 1.963360983929184e-06, + "loss": 0.7588, + "step": 4442 + }, + { + "epoch": 0.11, + "learning_rate": 1.9633387160896455e-06, + "loss": 0.9355, + "step": 4443 + }, + { + "epoch": 0.11, + "learning_rate": 1.963316441611733e-06, + "loss": 0.6941, + "step": 4444 + }, + { + "epoch": 0.11, + "learning_rate": 1.9632941604955993e-06, + "loss": 0.9043, + "step": 4445 + }, + { + "epoch": 0.11, + "learning_rate": 1.9632718727413986e-06, + "loss": 1.0498, + "step": 4446 + }, + { + "epoch": 0.11, + "learning_rate": 1.9632495783492835e-06, + "loss": 0.9453, + "step": 4447 + }, + { + "epoch": 0.11, + "learning_rate": 1.9632272773194088e-06, + "loss": 0.957, + "step": 4448 + }, + { + "epoch": 0.11, + "learning_rate": 1.9632049696519276e-06, + "loss": 0.9434, + "step": 4449 + }, + { + "epoch": 0.11, + "learning_rate": 1.963182655346994e-06, + "loss": 0.7002, + "step": 4450 + }, + { + "epoch": 0.11, + "learning_rate": 1.9631603344047606e-06, + "loss": 0.9961, + "step": 4451 + }, + { + "epoch": 0.11, + "learning_rate": 1.9631380068253827e-06, + "loss": 0.9492, + "step": 4452 + }, + { + "epoch": 0.11, + "learning_rate": 1.9631156726090133e-06, + "loss": 0.793, + "step": 4453 + }, + { + "epoch": 0.11, + "learning_rate": 1.9630933317558066e-06, + "loss": 0.9873, + "step": 4454 + }, + { + "epoch": 0.11, + "learning_rate": 1.9630709842659163e-06, + "loss": 0.9268, + "step": 4455 + }, + { + "epoch": 0.11, + "learning_rate": 1.9630486301394967e-06, + "loss": 1.0215, + "step": 4456 + }, + { + "epoch": 0.11, + "learning_rate": 1.963026269376702e-06, + "loss": 1.002, + "step": 4457 + }, + { + "epoch": 0.11, + "learning_rate": 1.963003901977686e-06, + "loss": 0.9766, + "step": 4458 + }, + { + "epoch": 0.11, + "learning_rate": 1.962981527942602e-06, + "loss": 0.8613, + "step": 4459 + }, + { + "epoch": 0.11, + "learning_rate": 1.962959147271606e-06, + "loss": 0.6514, + "step": 4460 + }, + { + "epoch": 0.11, + "learning_rate": 1.9629367599648505e-06, + "loss": 0.7637, + "step": 4461 + }, + { + "epoch": 0.11, + "learning_rate": 1.962914366022491e-06, + "loss": 1.084, + "step": 4462 + }, + { + "epoch": 0.11, + "learning_rate": 1.962891965444681e-06, + "loss": 0.8633, + "step": 4463 + }, + { + "epoch": 0.11, + "learning_rate": 1.9628695582315756e-06, + "loss": 1.0732, + "step": 4464 + }, + { + "epoch": 0.11, + "learning_rate": 1.962847144383328e-06, + "loss": 0.9131, + "step": 4465 + }, + { + "epoch": 0.11, + "learning_rate": 1.962824723900094e-06, + "loss": 0.9961, + "step": 4466 + }, + { + "epoch": 0.11, + "learning_rate": 1.962802296782028e-06, + "loss": 0.6755, + "step": 4467 + }, + { + "epoch": 0.11, + "learning_rate": 1.9627798630292836e-06, + "loss": 0.8174, + "step": 4468 + }, + { + "epoch": 0.11, + "learning_rate": 1.9627574226420162e-06, + "loss": 0.8286, + "step": 4469 + }, + { + "epoch": 0.11, + "learning_rate": 1.96273497562038e-06, + "loss": 0.9111, + "step": 4470 + }, + { + "epoch": 0.11, + "learning_rate": 1.9627125219645294e-06, + "loss": 0.9121, + "step": 4471 + }, + { + "epoch": 0.11, + "learning_rate": 1.96269006167462e-06, + "loss": 1.0605, + "step": 4472 + }, + { + "epoch": 0.11, + "learning_rate": 1.962667594750806e-06, + "loss": 0.7646, + "step": 4473 + }, + { + "epoch": 0.11, + "learning_rate": 1.9626451211932423e-06, + "loss": 0.998, + "step": 4474 + }, + { + "epoch": 0.11, + "learning_rate": 1.962622641002084e-06, + "loss": 0.9463, + "step": 4475 + }, + { + "epoch": 0.11, + "learning_rate": 1.9626001541774856e-06, + "loss": 0.8877, + "step": 4476 + }, + { + "epoch": 0.11, + "learning_rate": 1.9625776607196023e-06, + "loss": 0.9512, + "step": 4477 + }, + { + "epoch": 0.11, + "learning_rate": 1.9625551606285887e-06, + "loss": 0.877, + "step": 4478 + }, + { + "epoch": 0.11, + "learning_rate": 1.9625326539046007e-06, + "loss": 0.9922, + "step": 4479 + }, + { + "epoch": 0.11, + "learning_rate": 1.9625101405477925e-06, + "loss": 1.1797, + "step": 4480 + }, + { + "epoch": 0.11, + "learning_rate": 1.96248762055832e-06, + "loss": 0.9199, + "step": 4481 + }, + { + "epoch": 0.11, + "learning_rate": 1.962465093936338e-06, + "loss": 0.8574, + "step": 4482 + }, + { + "epoch": 0.11, + "learning_rate": 1.962442560682002e-06, + "loss": 0.8701, + "step": 4483 + }, + { + "epoch": 0.11, + "learning_rate": 1.9624200207954663e-06, + "loss": 1.0703, + "step": 4484 + }, + { + "epoch": 0.11, + "learning_rate": 1.9623974742768874e-06, + "loss": 0.8379, + "step": 4485 + }, + { + "epoch": 0.11, + "learning_rate": 1.9623749211264205e-06, + "loss": 0.957, + "step": 4486 + }, + { + "epoch": 0.12, + "learning_rate": 1.9623523613442206e-06, + "loss": 0.835, + "step": 4487 + }, + { + "epoch": 0.12, + "learning_rate": 1.962329794930443e-06, + "loss": 0.8184, + "step": 4488 + }, + { + "epoch": 0.12, + "learning_rate": 1.962307221885244e-06, + "loss": 0.8652, + "step": 4489 + }, + { + "epoch": 0.12, + "learning_rate": 1.962284642208778e-06, + "loss": 0.9028, + "step": 4490 + }, + { + "epoch": 0.12, + "learning_rate": 1.962262055901202e-06, + "loss": 0.9019, + "step": 4491 + }, + { + "epoch": 0.12, + "learning_rate": 1.9622394629626706e-06, + "loss": 0.9492, + "step": 4492 + }, + { + "epoch": 0.12, + "learning_rate": 1.9622168633933396e-06, + "loss": 0.918, + "step": 4493 + }, + { + "epoch": 0.12, + "learning_rate": 1.9621942571933648e-06, + "loss": 0.8682, + "step": 4494 + }, + { + "epoch": 0.12, + "learning_rate": 1.9621716443629025e-06, + "loss": 0.8271, + "step": 4495 + }, + { + "epoch": 0.12, + "learning_rate": 1.962149024902108e-06, + "loss": 1.0273, + "step": 4496 + }, + { + "epoch": 0.12, + "learning_rate": 1.9621263988111375e-06, + "loss": 1.0195, + "step": 4497 + }, + { + "epoch": 0.12, + "learning_rate": 1.962103766090147e-06, + "loss": 0.9287, + "step": 4498 + }, + { + "epoch": 0.12, + "learning_rate": 1.9620811267392914e-06, + "loss": 0.8516, + "step": 4499 + }, + { + "epoch": 0.12, + "learning_rate": 1.9620584807587276e-06, + "loss": 1.0, + "step": 4500 + }, + { + "epoch": 0.12, + "learning_rate": 1.962035828148612e-06, + "loss": 0.9326, + "step": 4501 + }, + { + "epoch": 0.12, + "learning_rate": 1.9620131689090996e-06, + "loss": 0.7256, + "step": 4502 + }, + { + "epoch": 0.12, + "learning_rate": 1.961990503040348e-06, + "loss": 0.9453, + "step": 4503 + }, + { + "epoch": 0.12, + "learning_rate": 1.961967830542512e-06, + "loss": 1.0264, + "step": 4504 + }, + { + "epoch": 0.12, + "learning_rate": 1.9619451514157485e-06, + "loss": 0.6426, + "step": 4505 + }, + { + "epoch": 0.12, + "learning_rate": 1.9619224656602138e-06, + "loss": 0.9912, + "step": 4506 + }, + { + "epoch": 0.12, + "learning_rate": 1.961899773276064e-06, + "loss": 0.9922, + "step": 4507 + }, + { + "epoch": 0.12, + "learning_rate": 1.9618770742634555e-06, + "loss": 0.7822, + "step": 4508 + }, + { + "epoch": 0.12, + "learning_rate": 1.9618543686225454e-06, + "loss": 0.7827, + "step": 4509 + }, + { + "epoch": 0.12, + "learning_rate": 1.961831656353489e-06, + "loss": 0.958, + "step": 4510 + }, + { + "epoch": 0.12, + "learning_rate": 1.9618089374564433e-06, + "loss": 0.8789, + "step": 4511 + }, + { + "epoch": 0.12, + "learning_rate": 1.9617862119315656e-06, + "loss": 0.999, + "step": 4512 + }, + { + "epoch": 0.12, + "learning_rate": 1.9617634797790113e-06, + "loss": 1.0166, + "step": 4513 + }, + { + "epoch": 0.12, + "learning_rate": 1.961740740998938e-06, + "loss": 0.9014, + "step": 4514 + }, + { + "epoch": 0.12, + "learning_rate": 1.9617179955915017e-06, + "loss": 1.0967, + "step": 4515 + }, + { + "epoch": 0.12, + "learning_rate": 1.9616952435568594e-06, + "loss": 1.0166, + "step": 4516 + }, + { + "epoch": 0.12, + "learning_rate": 1.961672484895168e-06, + "loss": 0.8887, + "step": 4517 + }, + { + "epoch": 0.12, + "learning_rate": 1.961649719606584e-06, + "loss": 1.0703, + "step": 4518 + }, + { + "epoch": 0.12, + "learning_rate": 1.961626947691265e-06, + "loss": 0.9277, + "step": 4519 + }, + { + "epoch": 0.12, + "learning_rate": 1.961604169149367e-06, + "loss": 1.0, + "step": 4520 + }, + { + "epoch": 0.12, + "learning_rate": 1.9615813839810474e-06, + "loss": 1.0, + "step": 4521 + }, + { + "epoch": 0.12, + "learning_rate": 1.9615585921864634e-06, + "loss": 1.0752, + "step": 4522 + }, + { + "epoch": 0.12, + "learning_rate": 1.9615357937657723e-06, + "loss": 0.7461, + "step": 4523 + }, + { + "epoch": 0.12, + "learning_rate": 1.96151298871913e-06, + "loss": 0.7222, + "step": 4524 + }, + { + "epoch": 0.12, + "learning_rate": 1.961490177046695e-06, + "loss": 1.0684, + "step": 4525 + }, + { + "epoch": 0.12, + "learning_rate": 1.9614673587486235e-06, + "loss": 0.9727, + "step": 4526 + }, + { + "epoch": 0.12, + "learning_rate": 1.9614445338250737e-06, + "loss": 0.9453, + "step": 4527 + }, + { + "epoch": 0.12, + "learning_rate": 1.961421702276202e-06, + "loss": 0.8232, + "step": 4528 + }, + { + "epoch": 0.12, + "learning_rate": 1.9613988641021662e-06, + "loss": 1.0752, + "step": 4529 + }, + { + "epoch": 0.12, + "learning_rate": 1.9613760193031234e-06, + "loss": 1.0098, + "step": 4530 + }, + { + "epoch": 0.12, + "learning_rate": 1.9613531678792312e-06, + "loss": 0.8506, + "step": 4531 + }, + { + "epoch": 0.12, + "learning_rate": 1.961330309830647e-06, + "loss": 1.0498, + "step": 4532 + }, + { + "epoch": 0.12, + "learning_rate": 1.9613074451575286e-06, + "loss": 0.8496, + "step": 4533 + }, + { + "epoch": 0.12, + "learning_rate": 1.9612845738600332e-06, + "loss": 0.9551, + "step": 4534 + }, + { + "epoch": 0.12, + "learning_rate": 1.9612616959383188e-06, + "loss": 0.7803, + "step": 4535 + }, + { + "epoch": 0.12, + "learning_rate": 1.961238811392543e-06, + "loss": 0.7969, + "step": 4536 + }, + { + "epoch": 0.12, + "learning_rate": 1.9612159202228625e-06, + "loss": 0.9014, + "step": 4537 + }, + { + "epoch": 0.12, + "learning_rate": 1.9611930224294362e-06, + "loss": 1.0986, + "step": 4538 + }, + { + "epoch": 0.12, + "learning_rate": 1.9611701180124215e-06, + "loss": 1.0234, + "step": 4539 + }, + { + "epoch": 0.12, + "learning_rate": 1.9611472069719763e-06, + "loss": 1.0361, + "step": 4540 + }, + { + "epoch": 0.12, + "learning_rate": 1.9611242893082587e-06, + "loss": 0.9512, + "step": 4541 + }, + { + "epoch": 0.12, + "learning_rate": 1.9611013650214256e-06, + "loss": 0.9189, + "step": 4542 + }, + { + "epoch": 0.12, + "learning_rate": 1.9610784341116365e-06, + "loss": 0.9688, + "step": 4543 + }, + { + "epoch": 0.12, + "learning_rate": 1.9610554965790483e-06, + "loss": 0.9199, + "step": 4544 + }, + { + "epoch": 0.12, + "learning_rate": 1.9610325524238196e-06, + "loss": 0.8848, + "step": 4545 + }, + { + "epoch": 0.12, + "learning_rate": 1.961009601646108e-06, + "loss": 0.998, + "step": 4546 + }, + { + "epoch": 0.12, + "learning_rate": 1.960986644246072e-06, + "loss": 0.4448, + "step": 4547 + }, + { + "epoch": 0.12, + "learning_rate": 1.96096368022387e-06, + "loss": 1.0, + "step": 4548 + }, + { + "epoch": 0.12, + "learning_rate": 1.96094070957966e-06, + "loss": 0.834, + "step": 4549 + }, + { + "epoch": 0.12, + "learning_rate": 1.9609177323136005e-06, + "loss": 1.167, + "step": 4550 + }, + { + "epoch": 0.12, + "learning_rate": 1.9608947484258494e-06, + "loss": 0.918, + "step": 4551 + }, + { + "epoch": 0.12, + "learning_rate": 1.9608717579165655e-06, + "loss": 1.0176, + "step": 4552 + }, + { + "epoch": 0.12, + "learning_rate": 1.9608487607859066e-06, + "loss": 0.8828, + "step": 4553 + }, + { + "epoch": 0.12, + "learning_rate": 1.960825757034032e-06, + "loss": 1.0127, + "step": 4554 + }, + { + "epoch": 0.12, + "learning_rate": 1.9608027466611e-06, + "loss": 0.9287, + "step": 4555 + }, + { + "epoch": 0.12, + "learning_rate": 1.960779729667269e-06, + "loss": 0.9219, + "step": 4556 + }, + { + "epoch": 0.12, + "learning_rate": 1.960756706052697e-06, + "loss": 0.9053, + "step": 4557 + }, + { + "epoch": 0.12, + "learning_rate": 1.960733675817544e-06, + "loss": 0.9766, + "step": 4558 + }, + { + "epoch": 0.12, + "learning_rate": 1.9607106389619672e-06, + "loss": 1.0508, + "step": 4559 + }, + { + "epoch": 0.12, + "learning_rate": 1.960687595486127e-06, + "loss": 0.7871, + "step": 4560 + }, + { + "epoch": 0.12, + "learning_rate": 1.960664545390181e-06, + "loss": 0.8428, + "step": 4561 + }, + { + "epoch": 0.12, + "learning_rate": 1.9606414886742883e-06, + "loss": 1.0293, + "step": 4562 + }, + { + "epoch": 0.12, + "learning_rate": 1.960618425338608e-06, + "loss": 0.9014, + "step": 4563 + }, + { + "epoch": 0.12, + "learning_rate": 1.9605953553832986e-06, + "loss": 0.9375, + "step": 4564 + }, + { + "epoch": 0.12, + "learning_rate": 1.9605722788085196e-06, + "loss": 0.6968, + "step": 4565 + }, + { + "epoch": 0.12, + "learning_rate": 1.9605491956144296e-06, + "loss": 1.0156, + "step": 4566 + }, + { + "epoch": 0.12, + "learning_rate": 1.960526105801188e-06, + "loss": 0.8848, + "step": 4567 + }, + { + "epoch": 0.12, + "learning_rate": 1.9605030093689535e-06, + "loss": 0.8506, + "step": 4568 + }, + { + "epoch": 0.12, + "learning_rate": 1.960479906317886e-06, + "loss": 1.0742, + "step": 4569 + }, + { + "epoch": 0.12, + "learning_rate": 1.9604567966481434e-06, + "loss": 0.8174, + "step": 4570 + }, + { + "epoch": 0.12, + "learning_rate": 1.960433680359886e-06, + "loss": 0.9629, + "step": 4571 + }, + { + "epoch": 0.12, + "learning_rate": 1.9604105574532736e-06, + "loss": 0.9609, + "step": 4572 + }, + { + "epoch": 0.12, + "learning_rate": 1.960387427928464e-06, + "loss": 1.0059, + "step": 4573 + }, + { + "epoch": 0.12, + "learning_rate": 1.9603642917856176e-06, + "loss": 0.9287, + "step": 4574 + }, + { + "epoch": 0.12, + "learning_rate": 1.9603411490248936e-06, + "loss": 1.2695, + "step": 4575 + }, + { + "epoch": 0.12, + "learning_rate": 1.9603179996464516e-06, + "loss": 0.7305, + "step": 4576 + }, + { + "epoch": 0.12, + "learning_rate": 1.960294843650451e-06, + "loss": 0.8643, + "step": 4577 + }, + { + "epoch": 0.12, + "learning_rate": 1.9602716810370515e-06, + "loss": 1.0205, + "step": 4578 + }, + { + "epoch": 0.12, + "learning_rate": 1.9602485118064124e-06, + "loss": 0.96, + "step": 4579 + }, + { + "epoch": 0.12, + "learning_rate": 1.9602253359586935e-06, + "loss": 1.0107, + "step": 4580 + }, + { + "epoch": 0.12, + "learning_rate": 1.9602021534940544e-06, + "loss": 0.9839, + "step": 4581 + }, + { + "epoch": 0.12, + "learning_rate": 1.960178964412655e-06, + "loss": 0.8647, + "step": 4582 + }, + { + "epoch": 0.12, + "learning_rate": 1.9601557687146556e-06, + "loss": 0.8672, + "step": 4583 + }, + { + "epoch": 0.12, + "learning_rate": 1.9601325664002157e-06, + "loss": 1.1592, + "step": 4584 + }, + { + "epoch": 0.12, + "learning_rate": 1.9601093574694943e-06, + "loss": 1.0381, + "step": 4585 + }, + { + "epoch": 0.12, + "learning_rate": 1.9600861419226528e-06, + "loss": 1.2871, + "step": 4586 + }, + { + "epoch": 0.12, + "learning_rate": 1.96006291975985e-06, + "loss": 0.917, + "step": 4587 + }, + { + "epoch": 0.12, + "learning_rate": 1.960039690981246e-06, + "loss": 0.9746, + "step": 4588 + }, + { + "epoch": 0.12, + "learning_rate": 1.960016455587002e-06, + "loss": 0.9868, + "step": 4589 + }, + { + "epoch": 0.12, + "learning_rate": 1.959993213577277e-06, + "loss": 0.8584, + "step": 4590 + }, + { + "epoch": 0.12, + "learning_rate": 1.9599699649522312e-06, + "loss": 1.0684, + "step": 4591 + }, + { + "epoch": 0.12, + "learning_rate": 1.9599467097120256e-06, + "loss": 0.9443, + "step": 4592 + }, + { + "epoch": 0.12, + "learning_rate": 1.9599234478568197e-06, + "loss": 0.7471, + "step": 4593 + }, + { + "epoch": 0.12, + "learning_rate": 1.9599001793867743e-06, + "loss": 0.9893, + "step": 4594 + }, + { + "epoch": 0.12, + "learning_rate": 1.959876904302049e-06, + "loss": 0.7896, + "step": 4595 + }, + { + "epoch": 0.12, + "learning_rate": 1.959853622602805e-06, + "loss": 0.835, + "step": 4596 + }, + { + "epoch": 0.12, + "learning_rate": 1.959830334289203e-06, + "loss": 0.8828, + "step": 4597 + }, + { + "epoch": 0.12, + "learning_rate": 1.959807039361402e-06, + "loss": 0.9775, + "step": 4598 + }, + { + "epoch": 0.12, + "learning_rate": 1.959783737819564e-06, + "loss": 0.8535, + "step": 4599 + }, + { + "epoch": 0.12, + "learning_rate": 1.959760429663849e-06, + "loss": 0.9766, + "step": 4600 + }, + { + "epoch": 0.12, + "learning_rate": 1.9597371148944175e-06, + "loss": 0.8906, + "step": 4601 + }, + { + "epoch": 0.12, + "learning_rate": 1.9597137935114305e-06, + "loss": 0.9326, + "step": 4602 + }, + { + "epoch": 0.12, + "learning_rate": 1.9596904655150482e-06, + "loss": 0.9297, + "step": 4603 + }, + { + "epoch": 0.12, + "learning_rate": 1.9596671309054317e-06, + "loss": 0.9971, + "step": 4604 + }, + { + "epoch": 0.12, + "learning_rate": 1.9596437896827418e-06, + "loss": 1.1973, + "step": 4605 + }, + { + "epoch": 0.12, + "learning_rate": 1.9596204418471394e-06, + "loss": 0.959, + "step": 4606 + }, + { + "epoch": 0.12, + "learning_rate": 1.959597087398785e-06, + "loss": 1.2051, + "step": 4607 + }, + { + "epoch": 0.12, + "learning_rate": 1.9595737263378404e-06, + "loss": 1.1426, + "step": 4608 + }, + { + "epoch": 0.12, + "learning_rate": 1.959550358664465e-06, + "loss": 0.8188, + "step": 4609 + }, + { + "epoch": 0.12, + "learning_rate": 1.9595269843788216e-06, + "loss": 1.0508, + "step": 4610 + }, + { + "epoch": 0.12, + "learning_rate": 1.9595036034810708e-06, + "loss": 1.0742, + "step": 4611 + }, + { + "epoch": 0.12, + "learning_rate": 1.9594802159713727e-06, + "loss": 1.0391, + "step": 4612 + }, + { + "epoch": 0.12, + "learning_rate": 1.959456821849889e-06, + "loss": 0.9619, + "step": 4613 + }, + { + "epoch": 0.12, + "learning_rate": 1.959433421116782e-06, + "loss": 1.001, + "step": 4614 + }, + { + "epoch": 0.12, + "learning_rate": 1.959410013772211e-06, + "loss": 0.8486, + "step": 4615 + }, + { + "epoch": 0.12, + "learning_rate": 1.9593865998163395e-06, + "loss": 0.9424, + "step": 4616 + }, + { + "epoch": 0.12, + "learning_rate": 1.959363179249327e-06, + "loss": 0.9287, + "step": 4617 + }, + { + "epoch": 0.12, + "learning_rate": 1.9593397520713357e-06, + "loss": 0.8184, + "step": 4618 + }, + { + "epoch": 0.12, + "learning_rate": 1.959316318282527e-06, + "loss": 0.9648, + "step": 4619 + }, + { + "epoch": 0.12, + "learning_rate": 1.9592928778830623e-06, + "loss": 0.998, + "step": 4620 + }, + { + "epoch": 0.12, + "learning_rate": 1.9592694308731032e-06, + "loss": 0.6064, + "step": 4621 + }, + { + "epoch": 0.12, + "learning_rate": 1.959245977252811e-06, + "loss": 0.9189, + "step": 4622 + }, + { + "epoch": 0.12, + "learning_rate": 1.9592225170223473e-06, + "loss": 0.6179, + "step": 4623 + }, + { + "epoch": 0.12, + "learning_rate": 1.9591990501818745e-06, + "loss": 0.8438, + "step": 4624 + }, + { + "epoch": 0.12, + "learning_rate": 1.9591755767315537e-06, + "loss": 1.1123, + "step": 4625 + }, + { + "epoch": 0.12, + "learning_rate": 1.959152096671547e-06, + "loss": 0.9131, + "step": 4626 + }, + { + "epoch": 0.12, + "learning_rate": 1.9591286100020153e-06, + "loss": 0.8779, + "step": 4627 + }, + { + "epoch": 0.12, + "learning_rate": 1.9591051167231213e-06, + "loss": 0.9531, + "step": 4628 + }, + { + "epoch": 0.12, + "learning_rate": 1.959081616835027e-06, + "loss": 0.8369, + "step": 4629 + }, + { + "epoch": 0.12, + "learning_rate": 1.9590581103378936e-06, + "loss": 0.8218, + "step": 4630 + }, + { + "epoch": 0.12, + "learning_rate": 1.959034597231884e-06, + "loss": 0.7534, + "step": 4631 + }, + { + "epoch": 0.12, + "learning_rate": 1.9590110775171594e-06, + "loss": 0.9355, + "step": 4632 + }, + { + "epoch": 0.12, + "learning_rate": 1.958987551193882e-06, + "loss": 0.9912, + "step": 4633 + }, + { + "epoch": 0.12, + "learning_rate": 1.9589640182622146e-06, + "loss": 0.9355, + "step": 4634 + }, + { + "epoch": 0.12, + "learning_rate": 1.958940478722319e-06, + "loss": 1.002, + "step": 4635 + }, + { + "epoch": 0.12, + "learning_rate": 1.958916932574357e-06, + "loss": 0.9697, + "step": 4636 + }, + { + "epoch": 0.12, + "learning_rate": 1.958893379818491e-06, + "loss": 0.9014, + "step": 4637 + }, + { + "epoch": 0.12, + "learning_rate": 1.958869820454884e-06, + "loss": 1.0049, + "step": 4638 + }, + { + "epoch": 0.12, + "learning_rate": 1.9588462544836974e-06, + "loss": 1.082, + "step": 4639 + }, + { + "epoch": 0.12, + "learning_rate": 1.9588226819050943e-06, + "loss": 1.0547, + "step": 4640 + }, + { + "epoch": 0.12, + "learning_rate": 1.9587991027192365e-06, + "loss": 0.6802, + "step": 4641 + }, + { + "epoch": 0.12, + "learning_rate": 1.958775516926287e-06, + "loss": 0.8682, + "step": 4642 + }, + { + "epoch": 0.12, + "learning_rate": 1.9587519245264084e-06, + "loss": 1.0996, + "step": 4643 + }, + { + "epoch": 0.12, + "learning_rate": 1.958728325519763e-06, + "loss": 0.8994, + "step": 4644 + }, + { + "epoch": 0.12, + "learning_rate": 1.9587047199065136e-06, + "loss": 0.9009, + "step": 4645 + }, + { + "epoch": 0.12, + "learning_rate": 1.9586811076868223e-06, + "loss": 0.7886, + "step": 4646 + }, + { + "epoch": 0.12, + "learning_rate": 1.9586574888608522e-06, + "loss": 1.1826, + "step": 4647 + }, + { + "epoch": 0.12, + "learning_rate": 1.9586338634287663e-06, + "loss": 0.999, + "step": 4648 + }, + { + "epoch": 0.12, + "learning_rate": 1.9586102313907275e-06, + "loss": 0.8564, + "step": 4649 + }, + { + "epoch": 0.12, + "learning_rate": 1.9585865927468982e-06, + "loss": 1.0635, + "step": 4650 + }, + { + "epoch": 0.12, + "learning_rate": 1.9585629474974414e-06, + "loss": 0.7344, + "step": 4651 + }, + { + "epoch": 0.12, + "learning_rate": 1.9585392956425197e-06, + "loss": 0.9814, + "step": 4652 + }, + { + "epoch": 0.12, + "learning_rate": 1.958515637182297e-06, + "loss": 0.8462, + "step": 4653 + }, + { + "epoch": 0.12, + "learning_rate": 1.9584919721169355e-06, + "loss": 0.8906, + "step": 4654 + }, + { + "epoch": 0.12, + "learning_rate": 1.9584683004465987e-06, + "loss": 1.1426, + "step": 4655 + }, + { + "epoch": 0.12, + "learning_rate": 1.9584446221714497e-06, + "loss": 1.0361, + "step": 4656 + }, + { + "epoch": 0.12, + "learning_rate": 1.9584209372916514e-06, + "loss": 0.8989, + "step": 4657 + }, + { + "epoch": 0.12, + "learning_rate": 1.958397245807367e-06, + "loss": 1.0293, + "step": 4658 + }, + { + "epoch": 0.12, + "learning_rate": 1.9583735477187604e-06, + "loss": 0.6797, + "step": 4659 + }, + { + "epoch": 0.12, + "learning_rate": 1.958349843025994e-06, + "loss": 0.9639, + "step": 4660 + }, + { + "epoch": 0.12, + "learning_rate": 1.958326131729232e-06, + "loss": 0.8169, + "step": 4661 + }, + { + "epoch": 0.12, + "learning_rate": 1.9583024138286372e-06, + "loss": 0.9238, + "step": 4662 + }, + { + "epoch": 0.12, + "learning_rate": 1.9582786893243734e-06, + "loss": 0.8262, + "step": 4663 + }, + { + "epoch": 0.12, + "learning_rate": 1.9582549582166035e-06, + "loss": 1.0879, + "step": 4664 + }, + { + "epoch": 0.12, + "learning_rate": 1.958231220505492e-06, + "loss": 1.0332, + "step": 4665 + }, + { + "epoch": 0.12, + "learning_rate": 1.9582074761912013e-06, + "loss": 0.875, + "step": 4666 + }, + { + "epoch": 0.12, + "learning_rate": 1.958183725273896e-06, + "loss": 0.583, + "step": 4667 + }, + { + "epoch": 0.12, + "learning_rate": 1.9581599677537394e-06, + "loss": 1.0625, + "step": 4668 + }, + { + "epoch": 0.12, + "learning_rate": 1.958136203630895e-06, + "loss": 1.1504, + "step": 4669 + }, + { + "epoch": 0.12, + "learning_rate": 1.958112432905527e-06, + "loss": 0.9893, + "step": 4670 + }, + { + "epoch": 0.12, + "learning_rate": 1.9580886555777993e-06, + "loss": 0.9219, + "step": 4671 + }, + { + "epoch": 0.12, + "learning_rate": 1.958064871647875e-06, + "loss": 1.0254, + "step": 4672 + }, + { + "epoch": 0.12, + "learning_rate": 1.9580410811159186e-06, + "loss": 0.7803, + "step": 4673 + }, + { + "epoch": 0.12, + "learning_rate": 1.9580172839820935e-06, + "loss": 0.9102, + "step": 4674 + }, + { + "epoch": 0.12, + "learning_rate": 1.9579934802465647e-06, + "loss": 0.9814, + "step": 4675 + }, + { + "epoch": 0.12, + "learning_rate": 1.9579696699094954e-06, + "loss": 0.8037, + "step": 4676 + }, + { + "epoch": 0.12, + "learning_rate": 1.9579458529710494e-06, + "loss": 0.7871, + "step": 4677 + }, + { + "epoch": 0.12, + "learning_rate": 1.9579220294313914e-06, + "loss": 0.8799, + "step": 4678 + }, + { + "epoch": 0.12, + "learning_rate": 1.957898199290686e-06, + "loss": 0.7114, + "step": 4679 + }, + { + "epoch": 0.12, + "learning_rate": 1.957874362549096e-06, + "loss": 0.915, + "step": 4680 + }, + { + "epoch": 0.12, + "learning_rate": 1.9578505192067875e-06, + "loss": 0.8535, + "step": 4681 + }, + { + "epoch": 0.12, + "learning_rate": 1.9578266692639234e-06, + "loss": 1.1543, + "step": 4682 + }, + { + "epoch": 0.12, + "learning_rate": 1.9578028127206685e-06, + "loss": 0.8857, + "step": 4683 + }, + { + "epoch": 0.12, + "learning_rate": 1.957778949577187e-06, + "loss": 0.7671, + "step": 4684 + }, + { + "epoch": 0.12, + "learning_rate": 1.957755079833644e-06, + "loss": 0.9873, + "step": 4685 + }, + { + "epoch": 0.12, + "learning_rate": 1.957731203490203e-06, + "loss": 1.0654, + "step": 4686 + }, + { + "epoch": 0.12, + "learning_rate": 1.9577073205470293e-06, + "loss": 0.9287, + "step": 4687 + }, + { + "epoch": 0.12, + "learning_rate": 1.9576834310042873e-06, + "loss": 0.8613, + "step": 4688 + }, + { + "epoch": 0.12, + "learning_rate": 1.9576595348621413e-06, + "loss": 1.1543, + "step": 4689 + }, + { + "epoch": 0.12, + "learning_rate": 1.957635632120756e-06, + "loss": 0.8032, + "step": 4690 + }, + { + "epoch": 0.12, + "learning_rate": 1.957611722780297e-06, + "loss": 1.1348, + "step": 4691 + }, + { + "epoch": 0.12, + "learning_rate": 1.957587806840928e-06, + "loss": 1.1133, + "step": 4692 + }, + { + "epoch": 0.12, + "learning_rate": 1.9575638843028142e-06, + "loss": 0.7556, + "step": 4693 + }, + { + "epoch": 0.12, + "learning_rate": 1.9575399551661206e-06, + "loss": 1.0049, + "step": 4694 + }, + { + "epoch": 0.12, + "learning_rate": 1.9575160194310115e-06, + "loss": 0.7139, + "step": 4695 + }, + { + "epoch": 0.12, + "learning_rate": 1.957492077097653e-06, + "loss": 0.7769, + "step": 4696 + }, + { + "epoch": 0.12, + "learning_rate": 1.9574681281662085e-06, + "loss": 1.1074, + "step": 4697 + }, + { + "epoch": 0.12, + "learning_rate": 1.9574441726368445e-06, + "loss": 0.9717, + "step": 4698 + }, + { + "epoch": 0.12, + "learning_rate": 1.9574202105097253e-06, + "loss": 0.9502, + "step": 4699 + }, + { + "epoch": 0.12, + "learning_rate": 1.957396241785016e-06, + "loss": 0.918, + "step": 4700 + }, + { + "epoch": 0.12, + "learning_rate": 1.9573722664628824e-06, + "loss": 0.8145, + "step": 4701 + }, + { + "epoch": 0.12, + "learning_rate": 1.957348284543489e-06, + "loss": 1.0107, + "step": 4702 + }, + { + "epoch": 0.12, + "learning_rate": 1.9573242960270012e-06, + "loss": 0.8828, + "step": 4703 + }, + { + "epoch": 0.12, + "learning_rate": 1.957300300913585e-06, + "loss": 1.0674, + "step": 4704 + }, + { + "epoch": 0.12, + "learning_rate": 1.9572762992034048e-06, + "loss": 0.6616, + "step": 4705 + }, + { + "epoch": 0.12, + "learning_rate": 1.957252290896626e-06, + "loss": 1.1553, + "step": 4706 + }, + { + "epoch": 0.12, + "learning_rate": 1.9572282759934153e-06, + "loss": 0.9678, + "step": 4707 + }, + { + "epoch": 0.12, + "learning_rate": 1.9572042544939367e-06, + "loss": 0.9834, + "step": 4708 + }, + { + "epoch": 0.12, + "learning_rate": 1.9571802263983568e-06, + "loss": 0.9922, + "step": 4709 + }, + { + "epoch": 0.12, + "learning_rate": 1.9571561917068406e-06, + "loss": 1.0732, + "step": 4710 + }, + { + "epoch": 0.12, + "learning_rate": 1.9571321504195534e-06, + "loss": 0.9922, + "step": 4711 + }, + { + "epoch": 0.12, + "learning_rate": 1.9571081025366617e-06, + "loss": 0.9248, + "step": 4712 + }, + { + "epoch": 0.12, + "learning_rate": 1.9570840480583305e-06, + "loss": 1.0625, + "step": 4713 + }, + { + "epoch": 0.12, + "learning_rate": 1.9570599869847264e-06, + "loss": 0.6919, + "step": 4714 + }, + { + "epoch": 0.12, + "learning_rate": 1.9570359193160145e-06, + "loss": 0.8511, + "step": 4715 + }, + { + "epoch": 0.12, + "learning_rate": 1.9570118450523608e-06, + "loss": 1.1348, + "step": 4716 + }, + { + "epoch": 0.12, + "learning_rate": 1.9569877641939313e-06, + "loss": 0.959, + "step": 4717 + }, + { + "epoch": 0.12, + "learning_rate": 1.9569636767408917e-06, + "loss": 0.9609, + "step": 4718 + }, + { + "epoch": 0.12, + "learning_rate": 1.9569395826934083e-06, + "loss": 0.917, + "step": 4719 + }, + { + "epoch": 0.12, + "learning_rate": 1.956915482051647e-06, + "loss": 1.1621, + "step": 4720 + }, + { + "epoch": 0.12, + "learning_rate": 1.956891374815774e-06, + "loss": 0.9238, + "step": 4721 + }, + { + "epoch": 0.12, + "learning_rate": 1.9568672609859553e-06, + "loss": 0.9062, + "step": 4722 + }, + { + "epoch": 0.12, + "learning_rate": 1.956843140562357e-06, + "loss": 1.0615, + "step": 4723 + }, + { + "epoch": 0.12, + "learning_rate": 1.956819013545145e-06, + "loss": 0.8062, + "step": 4724 + }, + { + "epoch": 0.12, + "learning_rate": 1.9567948799344868e-06, + "loss": 0.8086, + "step": 4725 + }, + { + "epoch": 0.12, + "learning_rate": 1.956770739730547e-06, + "loss": 0.7227, + "step": 4726 + }, + { + "epoch": 0.12, + "learning_rate": 1.9567465929334933e-06, + "loss": 0.8799, + "step": 4727 + }, + { + "epoch": 0.12, + "learning_rate": 1.9567224395434915e-06, + "loss": 1.0381, + "step": 4728 + }, + { + "epoch": 0.12, + "learning_rate": 1.956698279560708e-06, + "loss": 1.0557, + "step": 4729 + }, + { + "epoch": 0.12, + "learning_rate": 1.9566741129853098e-06, + "loss": 1.0244, + "step": 4730 + }, + { + "epoch": 0.12, + "learning_rate": 1.956649939817463e-06, + "loss": 1.0986, + "step": 4731 + }, + { + "epoch": 0.12, + "learning_rate": 1.956625760057334e-06, + "loss": 0.6719, + "step": 4732 + }, + { + "epoch": 0.12, + "learning_rate": 1.9566015737050894e-06, + "loss": 0.8057, + "step": 4733 + }, + { + "epoch": 0.12, + "learning_rate": 1.9565773807608966e-06, + "loss": 0.8848, + "step": 4734 + }, + { + "epoch": 0.12, + "learning_rate": 1.9565531812249215e-06, + "loss": 1.1465, + "step": 4735 + }, + { + "epoch": 0.12, + "learning_rate": 1.9565289750973317e-06, + "loss": 0.9331, + "step": 4736 + }, + { + "epoch": 0.12, + "learning_rate": 1.956504762378293e-06, + "loss": 0.8955, + "step": 4737 + }, + { + "epoch": 0.12, + "learning_rate": 1.956480543067973e-06, + "loss": 0.9248, + "step": 4738 + }, + { + "epoch": 0.12, + "learning_rate": 1.9564563171665386e-06, + "loss": 0.7402, + "step": 4739 + }, + { + "epoch": 0.12, + "learning_rate": 1.956432084674156e-06, + "loss": 0.9512, + "step": 4740 + }, + { + "epoch": 0.12, + "learning_rate": 1.956407845590993e-06, + "loss": 1.0938, + "step": 4741 + }, + { + "epoch": 0.12, + "learning_rate": 1.9563835999172163e-06, + "loss": 1.0098, + "step": 4742 + }, + { + "epoch": 0.12, + "learning_rate": 1.956359347652993e-06, + "loss": 1.0762, + "step": 4743 + }, + { + "epoch": 0.12, + "learning_rate": 1.95633508879849e-06, + "loss": 1.0986, + "step": 4744 + }, + { + "epoch": 0.12, + "learning_rate": 1.9563108233538745e-06, + "loss": 1.0938, + "step": 4745 + }, + { + "epoch": 0.12, + "learning_rate": 1.9562865513193143e-06, + "loss": 0.917, + "step": 4746 + }, + { + "epoch": 0.12, + "learning_rate": 1.956262272694976e-06, + "loss": 1.0586, + "step": 4747 + }, + { + "epoch": 0.12, + "learning_rate": 1.9562379874810273e-06, + "loss": 0.9238, + "step": 4748 + }, + { + "epoch": 0.12, + "learning_rate": 1.9562136956776355e-06, + "loss": 0.9365, + "step": 4749 + }, + { + "epoch": 0.12, + "learning_rate": 1.9561893972849677e-06, + "loss": 0.9438, + "step": 4750 + }, + { + "epoch": 0.12, + "learning_rate": 1.9561650923031916e-06, + "loss": 0.9053, + "step": 4751 + }, + { + "epoch": 0.12, + "learning_rate": 1.9561407807324746e-06, + "loss": 0.9023, + "step": 4752 + }, + { + "epoch": 0.12, + "learning_rate": 1.9561164625729843e-06, + "loss": 0.7988, + "step": 4753 + }, + { + "epoch": 0.12, + "learning_rate": 1.9560921378248885e-06, + "loss": 0.9229, + "step": 4754 + }, + { + "epoch": 0.12, + "learning_rate": 1.9560678064883544e-06, + "loss": 0.8467, + "step": 4755 + }, + { + "epoch": 0.12, + "learning_rate": 1.9560434685635494e-06, + "loss": 0.9932, + "step": 4756 + }, + { + "epoch": 0.12, + "learning_rate": 1.956019124050642e-06, + "loss": 1.1113, + "step": 4757 + }, + { + "epoch": 0.12, + "learning_rate": 1.9559947729497997e-06, + "loss": 0.8516, + "step": 4758 + }, + { + "epoch": 0.12, + "learning_rate": 1.95597041526119e-06, + "loss": 1.0107, + "step": 4759 + }, + { + "epoch": 0.12, + "learning_rate": 1.955946050984981e-06, + "loss": 0.7876, + "step": 4760 + }, + { + "epoch": 0.12, + "learning_rate": 1.9559216801213405e-06, + "loss": 1.0537, + "step": 4761 + }, + { + "epoch": 0.12, + "learning_rate": 1.9558973026704367e-06, + "loss": 0.9014, + "step": 4762 + }, + { + "epoch": 0.12, + "learning_rate": 1.955872918632437e-06, + "loss": 0.7114, + "step": 4763 + }, + { + "epoch": 0.12, + "learning_rate": 1.95584852800751e-06, + "loss": 0.9658, + "step": 4764 + }, + { + "epoch": 0.12, + "learning_rate": 1.9558241307958235e-06, + "loss": 0.7617, + "step": 4765 + }, + { + "epoch": 0.12, + "learning_rate": 1.955799726997546e-06, + "loss": 1.0488, + "step": 4766 + }, + { + "epoch": 0.12, + "learning_rate": 1.955775316612845e-06, + "loss": 1.0801, + "step": 4767 + }, + { + "epoch": 0.12, + "learning_rate": 1.955750899641889e-06, + "loss": 1.0605, + "step": 4768 + }, + { + "epoch": 0.12, + "learning_rate": 1.9557264760848465e-06, + "loss": 1.332, + "step": 4769 + }, + { + "epoch": 0.12, + "learning_rate": 1.9557020459418857e-06, + "loss": 0.915, + "step": 4770 + }, + { + "epoch": 0.12, + "learning_rate": 1.955677609213175e-06, + "loss": 0.9707, + "step": 4771 + }, + { + "epoch": 0.12, + "learning_rate": 1.9556531658988824e-06, + "loss": 0.7236, + "step": 4772 + }, + { + "epoch": 0.12, + "learning_rate": 1.9556287159991766e-06, + "loss": 0.6362, + "step": 4773 + }, + { + "epoch": 0.12, + "learning_rate": 1.9556042595142263e-06, + "loss": 0.9648, + "step": 4774 + }, + { + "epoch": 0.12, + "learning_rate": 1.9555797964442e-06, + "loss": 0.9248, + "step": 4775 + }, + { + "epoch": 0.12, + "learning_rate": 1.9555553267892656e-06, + "loss": 0.876, + "step": 4776 + }, + { + "epoch": 0.12, + "learning_rate": 1.9555308505495923e-06, + "loss": 0.9043, + "step": 4777 + }, + { + "epoch": 0.12, + "learning_rate": 1.955506367725349e-06, + "loss": 1.083, + "step": 4778 + }, + { + "epoch": 0.12, + "learning_rate": 1.9554818783167038e-06, + "loss": 1.0527, + "step": 4779 + }, + { + "epoch": 0.12, + "learning_rate": 1.955457382323826e-06, + "loss": 1.0234, + "step": 4780 + }, + { + "epoch": 0.12, + "learning_rate": 1.9554328797468843e-06, + "loss": 0.9131, + "step": 4781 + }, + { + "epoch": 0.12, + "learning_rate": 1.9554083705860473e-06, + "loss": 0.8047, + "step": 4782 + }, + { + "epoch": 0.12, + "learning_rate": 1.9553838548414836e-06, + "loss": 0.9053, + "step": 4783 + }, + { + "epoch": 0.12, + "learning_rate": 1.955359332513363e-06, + "loss": 1.124, + "step": 4784 + }, + { + "epoch": 0.12, + "learning_rate": 1.955334803601854e-06, + "loss": 0.8135, + "step": 4785 + }, + { + "epoch": 0.12, + "learning_rate": 1.9553102681071257e-06, + "loss": 0.9951, + "step": 4786 + }, + { + "epoch": 0.12, + "learning_rate": 1.9552857260293466e-06, + "loss": 0.8604, + "step": 4787 + }, + { + "epoch": 0.12, + "learning_rate": 1.955261177368687e-06, + "loss": 1.042, + "step": 4788 + }, + { + "epoch": 0.12, + "learning_rate": 1.9552366221253147e-06, + "loss": 1.0703, + "step": 4789 + }, + { + "epoch": 0.12, + "learning_rate": 1.9552120602994004e-06, + "loss": 0.8887, + "step": 4790 + }, + { + "epoch": 0.12, + "learning_rate": 1.955187491891112e-06, + "loss": 0.9756, + "step": 4791 + }, + { + "epoch": 0.12, + "learning_rate": 1.9551629169006197e-06, + "loss": 0.9824, + "step": 4792 + }, + { + "epoch": 0.12, + "learning_rate": 1.9551383353280922e-06, + "loss": 1.0107, + "step": 4793 + }, + { + "epoch": 0.12, + "learning_rate": 1.9551137471736995e-06, + "loss": 1.0557, + "step": 4794 + }, + { + "epoch": 0.12, + "learning_rate": 1.955089152437611e-06, + "loss": 0.7991, + "step": 4795 + }, + { + "epoch": 0.12, + "learning_rate": 1.9550645511199953e-06, + "loss": 1.1338, + "step": 4796 + }, + { + "epoch": 0.12, + "learning_rate": 1.9550399432210227e-06, + "loss": 0.9893, + "step": 4797 + }, + { + "epoch": 0.12, + "learning_rate": 1.955015328740863e-06, + "loss": 0.8052, + "step": 4798 + }, + { + "epoch": 0.12, + "learning_rate": 1.9549907076796853e-06, + "loss": 0.7949, + "step": 4799 + }, + { + "epoch": 0.12, + "learning_rate": 1.954966080037659e-06, + "loss": 0.9951, + "step": 4800 + }, + { + "epoch": 0.12, + "learning_rate": 1.954941445814955e-06, + "loss": 0.9209, + "step": 4801 + }, + { + "epoch": 0.12, + "learning_rate": 1.954916805011742e-06, + "loss": 1.0576, + "step": 4802 + }, + { + "epoch": 0.12, + "learning_rate": 1.9548921576281896e-06, + "loss": 0.6929, + "step": 4803 + }, + { + "epoch": 0.12, + "learning_rate": 1.954867503664469e-06, + "loss": 1.0703, + "step": 4804 + }, + { + "epoch": 0.12, + "learning_rate": 1.9548428431207483e-06, + "loss": 0.8975, + "step": 4805 + }, + { + "epoch": 0.12, + "learning_rate": 1.954818175997199e-06, + "loss": 0.8262, + "step": 4806 + }, + { + "epoch": 0.12, + "learning_rate": 1.95479350229399e-06, + "loss": 0.8262, + "step": 4807 + }, + { + "epoch": 0.12, + "learning_rate": 1.9547688220112923e-06, + "loss": 1.0352, + "step": 4808 + }, + { + "epoch": 0.12, + "learning_rate": 1.954744135149275e-06, + "loss": 0.9238, + "step": 4809 + }, + { + "epoch": 0.12, + "learning_rate": 1.9547194417081088e-06, + "loss": 0.7949, + "step": 4810 + }, + { + "epoch": 0.12, + "learning_rate": 1.9546947416879635e-06, + "loss": 0.9805, + "step": 4811 + }, + { + "epoch": 0.12, + "learning_rate": 1.9546700350890095e-06, + "loss": 1.0635, + "step": 4812 + }, + { + "epoch": 0.12, + "learning_rate": 1.9546453219114175e-06, + "loss": 1.0527, + "step": 4813 + }, + { + "epoch": 0.12, + "learning_rate": 1.954620602155357e-06, + "loss": 1.0352, + "step": 4814 + }, + { + "epoch": 0.12, + "learning_rate": 1.9545958758209992e-06, + "loss": 0.8496, + "step": 4815 + }, + { + "epoch": 0.12, + "learning_rate": 1.9545711429085136e-06, + "loss": 0.6333, + "step": 4816 + }, + { + "epoch": 0.12, + "learning_rate": 1.954546403418071e-06, + "loss": 0.9424, + "step": 4817 + }, + { + "epoch": 0.12, + "learning_rate": 1.954521657349842e-06, + "loss": 0.8101, + "step": 4818 + }, + { + "epoch": 0.12, + "learning_rate": 1.9544969047039973e-06, + "loss": 1.1484, + "step": 4819 + }, + { + "epoch": 0.12, + "learning_rate": 1.954472145480707e-06, + "loss": 1.0176, + "step": 4820 + }, + { + "epoch": 0.12, + "learning_rate": 1.954447379680142e-06, + "loss": 1.0684, + "step": 4821 + }, + { + "epoch": 0.12, + "learning_rate": 1.9544226073024727e-06, + "loss": 0.9951, + "step": 4822 + }, + { + "epoch": 0.12, + "learning_rate": 1.9543978283478705e-06, + "loss": 0.8633, + "step": 4823 + }, + { + "epoch": 0.12, + "learning_rate": 1.954373042816505e-06, + "loss": 0.916, + "step": 4824 + }, + { + "epoch": 0.12, + "learning_rate": 1.954348250708548e-06, + "loss": 0.9805, + "step": 4825 + }, + { + "epoch": 0.12, + "learning_rate": 1.95432345202417e-06, + "loss": 1.0361, + "step": 4826 + }, + { + "epoch": 0.12, + "learning_rate": 1.954298646763542e-06, + "loss": 1.0293, + "step": 4827 + }, + { + "epoch": 0.12, + "learning_rate": 1.9542738349268343e-06, + "loss": 1.0889, + "step": 4828 + }, + { + "epoch": 0.12, + "learning_rate": 1.954249016514219e-06, + "loss": 0.9961, + "step": 4829 + }, + { + "epoch": 0.12, + "learning_rate": 1.954224191525866e-06, + "loss": 0.8555, + "step": 4830 + }, + { + "epoch": 0.12, + "learning_rate": 1.954199359961947e-06, + "loss": 1.0273, + "step": 4831 + }, + { + "epoch": 0.12, + "learning_rate": 1.9541745218226334e-06, + "loss": 0.873, + "step": 4832 + }, + { + "epoch": 0.12, + "learning_rate": 1.954149677108096e-06, + "loss": 0.8945, + "step": 4833 + }, + { + "epoch": 0.12, + "learning_rate": 1.9541248258185055e-06, + "loss": 0.8555, + "step": 4834 + }, + { + "epoch": 0.12, + "learning_rate": 1.954099967954034e-06, + "loss": 1.0723, + "step": 4835 + }, + { + "epoch": 0.12, + "learning_rate": 1.954075103514852e-06, + "loss": 0.9971, + "step": 4836 + }, + { + "epoch": 0.12, + "learning_rate": 1.9540502325011317e-06, + "loss": 0.8037, + "step": 4837 + }, + { + "epoch": 0.12, + "learning_rate": 1.9540253549130436e-06, + "loss": 0.8809, + "step": 4838 + }, + { + "epoch": 0.12, + "learning_rate": 1.9540004707507597e-06, + "loss": 0.9277, + "step": 4839 + }, + { + "epoch": 0.12, + "learning_rate": 1.953975580014452e-06, + "loss": 0.8271, + "step": 4840 + }, + { + "epoch": 0.12, + "learning_rate": 1.9539506827042904e-06, + "loss": 0.6279, + "step": 4841 + }, + { + "epoch": 0.12, + "learning_rate": 1.953925778820448e-06, + "loss": 0.9736, + "step": 4842 + }, + { + "epoch": 0.12, + "learning_rate": 1.9539008683630957e-06, + "loss": 1.0596, + "step": 4843 + }, + { + "epoch": 0.12, + "learning_rate": 1.953875951332405e-06, + "loss": 1.0557, + "step": 4844 + }, + { + "epoch": 0.12, + "learning_rate": 1.9538510277285487e-06, + "loss": 0.9365, + "step": 4845 + }, + { + "epoch": 0.12, + "learning_rate": 1.953826097551697e-06, + "loss": 0.7783, + "step": 4846 + }, + { + "epoch": 0.12, + "learning_rate": 1.9538011608020227e-06, + "loss": 1.1475, + "step": 4847 + }, + { + "epoch": 0.12, + "learning_rate": 1.9537762174796975e-06, + "loss": 0.7998, + "step": 4848 + }, + { + "epoch": 0.12, + "learning_rate": 1.953751267584893e-06, + "loss": 0.8745, + "step": 4849 + }, + { + "epoch": 0.12, + "learning_rate": 1.9537263111177815e-06, + "loss": 1.0049, + "step": 4850 + }, + { + "epoch": 0.12, + "learning_rate": 1.9537013480785346e-06, + "loss": 0.7881, + "step": 4851 + }, + { + "epoch": 0.12, + "learning_rate": 1.9536763784673247e-06, + "loss": 0.6265, + "step": 4852 + }, + { + "epoch": 0.12, + "learning_rate": 1.9536514022843237e-06, + "loss": 0.9121, + "step": 4853 + }, + { + "epoch": 0.12, + "learning_rate": 1.9536264195297035e-06, + "loss": 0.916, + "step": 4854 + }, + { + "epoch": 0.12, + "learning_rate": 1.9536014302036366e-06, + "loss": 0.832, + "step": 4855 + }, + { + "epoch": 0.12, + "learning_rate": 1.953576434306295e-06, + "loss": 1.0371, + "step": 4856 + }, + { + "epoch": 0.12, + "learning_rate": 1.9535514318378506e-06, + "loss": 0.7466, + "step": 4857 + }, + { + "epoch": 0.12, + "learning_rate": 1.9535264227984767e-06, + "loss": 0.9502, + "step": 4858 + }, + { + "epoch": 0.12, + "learning_rate": 1.9535014071883447e-06, + "loss": 0.8115, + "step": 4859 + }, + { + "epoch": 0.12, + "learning_rate": 1.9534763850076273e-06, + "loss": 0.9243, + "step": 4860 + }, + { + "epoch": 0.12, + "learning_rate": 1.953451356256497e-06, + "loss": 0.9844, + "step": 4861 + }, + { + "epoch": 0.12, + "learning_rate": 1.9534263209351265e-06, + "loss": 0.9971, + "step": 4862 + }, + { + "epoch": 0.12, + "learning_rate": 1.9534012790436877e-06, + "loss": 0.9541, + "step": 4863 + }, + { + "epoch": 0.12, + "learning_rate": 1.953376230582353e-06, + "loss": 0.7859, + "step": 4864 + }, + { + "epoch": 0.12, + "learning_rate": 1.9533511755512963e-06, + "loss": 1.0, + "step": 4865 + }, + { + "epoch": 0.12, + "learning_rate": 1.9533261139506888e-06, + "loss": 1.1523, + "step": 4866 + }, + { + "epoch": 0.12, + "learning_rate": 1.9533010457807046e-06, + "loss": 1.0869, + "step": 4867 + }, + { + "epoch": 0.12, + "learning_rate": 1.9532759710415154e-06, + "loss": 1.0195, + "step": 4868 + }, + { + "epoch": 0.12, + "learning_rate": 1.953250889733294e-06, + "loss": 0.8398, + "step": 4869 + }, + { + "epoch": 0.12, + "learning_rate": 1.9532258018562136e-06, + "loss": 0.812, + "step": 4870 + }, + { + "epoch": 0.12, + "learning_rate": 1.9532007074104467e-06, + "loss": 0.9531, + "step": 4871 + }, + { + "epoch": 0.12, + "learning_rate": 1.953175606396167e-06, + "loss": 0.8853, + "step": 4872 + }, + { + "epoch": 0.12, + "learning_rate": 1.953150498813547e-06, + "loss": 0.9746, + "step": 4873 + }, + { + "epoch": 0.12, + "learning_rate": 1.9531253846627594e-06, + "loss": 1.0469, + "step": 4874 + }, + { + "epoch": 0.12, + "learning_rate": 1.953100263943978e-06, + "loss": 0.7832, + "step": 4875 + }, + { + "epoch": 0.12, + "learning_rate": 1.953075136657375e-06, + "loss": 0.7559, + "step": 4876 + }, + { + "epoch": 0.12, + "learning_rate": 1.9530500028031245e-06, + "loss": 1.0391, + "step": 4877 + }, + { + "epoch": 0.13, + "learning_rate": 1.953024862381399e-06, + "loss": 1.0439, + "step": 4878 + }, + { + "epoch": 0.13, + "learning_rate": 1.952999715392372e-06, + "loss": 0.8232, + "step": 4879 + }, + { + "epoch": 0.13, + "learning_rate": 1.952974561836217e-06, + "loss": 0.8379, + "step": 4880 + }, + { + "epoch": 0.13, + "learning_rate": 1.9529494017131064e-06, + "loss": 0.8291, + "step": 4881 + }, + { + "epoch": 0.13, + "learning_rate": 1.952924235023215e-06, + "loss": 1.0752, + "step": 4882 + }, + { + "epoch": 0.13, + "learning_rate": 1.952899061766715e-06, + "loss": 1.1074, + "step": 4883 + }, + { + "epoch": 0.13, + "learning_rate": 1.952873881943781e-06, + "loss": 0.9385, + "step": 4884 + }, + { + "epoch": 0.13, + "learning_rate": 1.9528486955545854e-06, + "loss": 0.6804, + "step": 4885 + }, + { + "epoch": 0.13, + "learning_rate": 1.952823502599302e-06, + "loss": 0.9824, + "step": 4886 + }, + { + "epoch": 0.13, + "learning_rate": 1.9527983030781054e-06, + "loss": 0.8164, + "step": 4887 + }, + { + "epoch": 0.13, + "learning_rate": 1.952773096991168e-06, + "loss": 0.8877, + "step": 4888 + }, + { + "epoch": 0.13, + "learning_rate": 1.9527478843386637e-06, + "loss": 1.0732, + "step": 4889 + }, + { + "epoch": 0.13, + "learning_rate": 1.952722665120767e-06, + "loss": 0.8857, + "step": 4890 + }, + { + "epoch": 0.13, + "learning_rate": 1.952697439337651e-06, + "loss": 0.79, + "step": 4891 + }, + { + "epoch": 0.13, + "learning_rate": 1.95267220698949e-06, + "loss": 0.8584, + "step": 4892 + }, + { + "epoch": 0.13, + "learning_rate": 1.9526469680764573e-06, + "loss": 0.917, + "step": 4893 + }, + { + "epoch": 0.13, + "learning_rate": 1.9526217225987273e-06, + "loss": 1.0332, + "step": 4894 + }, + { + "epoch": 0.13, + "learning_rate": 1.952596470556474e-06, + "loss": 0.9053, + "step": 4895 + }, + { + "epoch": 0.13, + "learning_rate": 1.952571211949871e-06, + "loss": 0.8145, + "step": 4896 + }, + { + "epoch": 0.13, + "learning_rate": 1.9525459467790924e-06, + "loss": 0.9531, + "step": 4897 + }, + { + "epoch": 0.13, + "learning_rate": 1.952520675044313e-06, + "loss": 1.0576, + "step": 4898 + }, + { + "epoch": 0.13, + "learning_rate": 1.952495396745706e-06, + "loss": 0.999, + "step": 4899 + }, + { + "epoch": 0.13, + "learning_rate": 1.9524701118834465e-06, + "loss": 1.0303, + "step": 4900 + }, + { + "epoch": 0.13, + "learning_rate": 1.952444820457708e-06, + "loss": 0.9131, + "step": 4901 + }, + { + "epoch": 0.13, + "learning_rate": 1.9524195224686646e-06, + "loss": 0.9795, + "step": 4902 + }, + { + "epoch": 0.13, + "learning_rate": 1.9523942179164916e-06, + "loss": 1.0859, + "step": 4903 + }, + { + "epoch": 0.13, + "learning_rate": 1.952368906801363e-06, + "loss": 0.9082, + "step": 4904 + }, + { + "epoch": 0.13, + "learning_rate": 1.9523435891234525e-06, + "loss": 0.8135, + "step": 4905 + }, + { + "epoch": 0.13, + "learning_rate": 1.9523182648829354e-06, + "loss": 0.9873, + "step": 4906 + }, + { + "epoch": 0.13, + "learning_rate": 1.952292934079986e-06, + "loss": 0.873, + "step": 4907 + }, + { + "epoch": 0.13, + "learning_rate": 1.9522675967147786e-06, + "loss": 0.804, + "step": 4908 + }, + { + "epoch": 0.13, + "learning_rate": 1.9522422527874883e-06, + "loss": 0.8818, + "step": 4909 + }, + { + "epoch": 0.13, + "learning_rate": 1.9522169022982892e-06, + "loss": 0.6587, + "step": 4910 + }, + { + "epoch": 0.13, + "learning_rate": 1.9521915452473563e-06, + "loss": 1.0029, + "step": 4911 + }, + { + "epoch": 0.13, + "learning_rate": 1.9521661816348645e-06, + "loss": 1.2744, + "step": 4912 + }, + { + "epoch": 0.13, + "learning_rate": 1.952140811460988e-06, + "loss": 0.8184, + "step": 4913 + }, + { + "epoch": 0.13, + "learning_rate": 1.952115434725902e-06, + "loss": 1.0098, + "step": 4914 + }, + { + "epoch": 0.13, + "learning_rate": 1.952090051429782e-06, + "loss": 0.9834, + "step": 4915 + }, + { + "epoch": 0.13, + "learning_rate": 1.9520646615728013e-06, + "loss": 0.9058, + "step": 4916 + }, + { + "epoch": 0.13, + "learning_rate": 1.9520392651551363e-06, + "loss": 0.9385, + "step": 4917 + }, + { + "epoch": 0.13, + "learning_rate": 1.9520138621769615e-06, + "loss": 0.999, + "step": 4918 + }, + { + "epoch": 0.13, + "learning_rate": 1.951988452638452e-06, + "loss": 0.8896, + "step": 4919 + }, + { + "epoch": 0.13, + "learning_rate": 1.9519630365397826e-06, + "loss": 0.8584, + "step": 4920 + }, + { + "epoch": 0.13, + "learning_rate": 1.9519376138811293e-06, + "loss": 0.9258, + "step": 4921 + }, + { + "epoch": 0.13, + "learning_rate": 1.9519121846626665e-06, + "loss": 0.8184, + "step": 4922 + }, + { + "epoch": 0.13, + "learning_rate": 1.9518867488845693e-06, + "loss": 0.9492, + "step": 4923 + }, + { + "epoch": 0.13, + "learning_rate": 1.9518613065470134e-06, + "loss": 1.1582, + "step": 4924 + }, + { + "epoch": 0.13, + "learning_rate": 1.9518358576501745e-06, + "loss": 0.9111, + "step": 4925 + }, + { + "epoch": 0.13, + "learning_rate": 1.951810402194227e-06, + "loss": 1.166, + "step": 4926 + }, + { + "epoch": 0.13, + "learning_rate": 1.951784940179347e-06, + "loss": 1.0293, + "step": 4927 + }, + { + "epoch": 0.13, + "learning_rate": 1.95175947160571e-06, + "loss": 0.958, + "step": 4928 + }, + { + "epoch": 0.13, + "learning_rate": 1.951733996473491e-06, + "loss": 1.1025, + "step": 4929 + }, + { + "epoch": 0.13, + "learning_rate": 1.9517085147828665e-06, + "loss": 0.856, + "step": 4930 + }, + { + "epoch": 0.13, + "learning_rate": 1.9516830265340106e-06, + "loss": 0.8232, + "step": 4931 + }, + { + "epoch": 0.13, + "learning_rate": 1.9516575317271e-06, + "loss": 0.918, + "step": 4932 + }, + { + "epoch": 0.13, + "learning_rate": 1.9516320303623103e-06, + "loss": 0.7419, + "step": 4933 + }, + { + "epoch": 0.13, + "learning_rate": 1.951606522439817e-06, + "loss": 0.8706, + "step": 4934 + }, + { + "epoch": 0.13, + "learning_rate": 1.9515810079597962e-06, + "loss": 1.04, + "step": 4935 + }, + { + "epoch": 0.13, + "learning_rate": 1.9515554869224233e-06, + "loss": 0.6313, + "step": 4936 + }, + { + "epoch": 0.13, + "learning_rate": 1.9515299593278744e-06, + "loss": 0.9355, + "step": 4937 + }, + { + "epoch": 0.13, + "learning_rate": 1.951504425176325e-06, + "loss": 1.0703, + "step": 4938 + }, + { + "epoch": 0.13, + "learning_rate": 1.9514788844679517e-06, + "loss": 0.9072, + "step": 4939 + }, + { + "epoch": 0.13, + "learning_rate": 1.9514533372029304e-06, + "loss": 1.0391, + "step": 4940 + }, + { + "epoch": 0.13, + "learning_rate": 1.951427783381437e-06, + "loss": 0.9121, + "step": 4941 + }, + { + "epoch": 0.13, + "learning_rate": 1.9514022230036475e-06, + "loss": 1.0957, + "step": 4942 + }, + { + "epoch": 0.13, + "learning_rate": 1.9513766560697376e-06, + "loss": 0.9062, + "step": 4943 + }, + { + "epoch": 0.13, + "learning_rate": 1.9513510825798845e-06, + "loss": 0.9355, + "step": 4944 + }, + { + "epoch": 0.13, + "learning_rate": 1.9513255025342637e-06, + "loss": 0.9243, + "step": 4945 + }, + { + "epoch": 0.13, + "learning_rate": 1.9512999159330518e-06, + "loss": 1.0723, + "step": 4946 + }, + { + "epoch": 0.13, + "learning_rate": 1.951274322776425e-06, + "loss": 1.0498, + "step": 4947 + }, + { + "epoch": 0.13, + "learning_rate": 1.9512487230645595e-06, + "loss": 0.9453, + "step": 4948 + }, + { + "epoch": 0.13, + "learning_rate": 1.9512231167976315e-06, + "loss": 0.916, + "step": 4949 + }, + { + "epoch": 0.13, + "learning_rate": 1.9511975039758184e-06, + "loss": 0.8035, + "step": 4950 + }, + { + "epoch": 0.13, + "learning_rate": 1.951171884599296e-06, + "loss": 0.8203, + "step": 4951 + }, + { + "epoch": 0.13, + "learning_rate": 1.951146258668241e-06, + "loss": 0.9717, + "step": 4952 + }, + { + "epoch": 0.13, + "learning_rate": 1.95112062618283e-06, + "loss": 1.0596, + "step": 4953 + }, + { + "epoch": 0.13, + "learning_rate": 1.9510949871432396e-06, + "loss": 1.0479, + "step": 4954 + }, + { + "epoch": 0.13, + "learning_rate": 1.951069341549646e-06, + "loss": 0.9463, + "step": 4955 + }, + { + "epoch": 0.13, + "learning_rate": 1.9510436894022267e-06, + "loss": 0.9912, + "step": 4956 + }, + { + "epoch": 0.13, + "learning_rate": 1.951018030701158e-06, + "loss": 1.0049, + "step": 4957 + }, + { + "epoch": 0.13, + "learning_rate": 1.9509923654466174e-06, + "loss": 0.9619, + "step": 4958 + }, + { + "epoch": 0.13, + "learning_rate": 1.9509666936387804e-06, + "loss": 1.0312, + "step": 4959 + }, + { + "epoch": 0.13, + "learning_rate": 1.9509410152778256e-06, + "loss": 0.748, + "step": 4960 + }, + { + "epoch": 0.13, + "learning_rate": 1.9509153303639283e-06, + "loss": 0.8862, + "step": 4961 + }, + { + "epoch": 0.13, + "learning_rate": 1.950889638897267e-06, + "loss": 0.8525, + "step": 4962 + }, + { + "epoch": 0.13, + "learning_rate": 1.9508639408780173e-06, + "loss": 0.7832, + "step": 4963 + }, + { + "epoch": 0.13, + "learning_rate": 1.9508382363063572e-06, + "loss": 1.0703, + "step": 4964 + }, + { + "epoch": 0.13, + "learning_rate": 1.950812525182464e-06, + "loss": 1.0908, + "step": 4965 + }, + { + "epoch": 0.13, + "learning_rate": 1.950786807506514e-06, + "loss": 0.9717, + "step": 4966 + }, + { + "epoch": 0.13, + "learning_rate": 1.9507610832786853e-06, + "loss": 0.9424, + "step": 4967 + }, + { + "epoch": 0.13, + "learning_rate": 1.9507353524991545e-06, + "loss": 1.0547, + "step": 4968 + }, + { + "epoch": 0.13, + "learning_rate": 1.9507096151680997e-06, + "loss": 0.8984, + "step": 4969 + }, + { + "epoch": 0.13, + "learning_rate": 1.9506838712856973e-06, + "loss": 0.9072, + "step": 4970 + }, + { + "epoch": 0.13, + "learning_rate": 1.9506581208521252e-06, + "loss": 1.0518, + "step": 4971 + }, + { + "epoch": 0.13, + "learning_rate": 1.950632363867561e-06, + "loss": 0.6567, + "step": 4972 + }, + { + "epoch": 0.13, + "learning_rate": 1.950606600332182e-06, + "loss": 0.7812, + "step": 4973 + }, + { + "epoch": 0.13, + "learning_rate": 1.9505808302461653e-06, + "loss": 1.04, + "step": 4974 + }, + { + "epoch": 0.13, + "learning_rate": 1.9505550536096896e-06, + "loss": 0.7524, + "step": 4975 + }, + { + "epoch": 0.13, + "learning_rate": 1.9505292704229315e-06, + "loss": 0.9727, + "step": 4976 + }, + { + "epoch": 0.13, + "learning_rate": 1.950503480686069e-06, + "loss": 1.0908, + "step": 4977 + }, + { + "epoch": 0.13, + "learning_rate": 1.95047768439928e-06, + "loss": 1.0566, + "step": 4978 + }, + { + "epoch": 0.13, + "learning_rate": 1.950451881562742e-06, + "loss": 0.9873, + "step": 4979 + }, + { + "epoch": 0.13, + "learning_rate": 1.9504260721766328e-06, + "loss": 0.9414, + "step": 4980 + }, + { + "epoch": 0.13, + "learning_rate": 1.9504002562411305e-06, + "loss": 1.1328, + "step": 4981 + }, + { + "epoch": 0.13, + "learning_rate": 1.9503744337564126e-06, + "loss": 1.1367, + "step": 4982 + }, + { + "epoch": 0.13, + "learning_rate": 1.9503486047226575e-06, + "loss": 0.9619, + "step": 4983 + }, + { + "epoch": 0.13, + "learning_rate": 1.950322769140043e-06, + "loss": 1.0234, + "step": 4984 + }, + { + "epoch": 0.13, + "learning_rate": 1.950296927008747e-06, + "loss": 0.7251, + "step": 4985 + }, + { + "epoch": 0.13, + "learning_rate": 1.950271078328948e-06, + "loss": 0.9648, + "step": 4986 + }, + { + "epoch": 0.13, + "learning_rate": 1.9502452231008234e-06, + "loss": 1.0918, + "step": 4987 + }, + { + "epoch": 0.13, + "learning_rate": 1.950219361324552e-06, + "loss": 0.9961, + "step": 4988 + }, + { + "epoch": 0.13, + "learning_rate": 1.950193493000312e-06, + "loss": 0.9492, + "step": 4989 + }, + { + "epoch": 0.13, + "learning_rate": 1.9501676181282815e-06, + "loss": 1.042, + "step": 4990 + }, + { + "epoch": 0.13, + "learning_rate": 1.9501417367086383e-06, + "loss": 0.8633, + "step": 4991 + }, + { + "epoch": 0.13, + "learning_rate": 1.9501158487415613e-06, + "loss": 0.8525, + "step": 4992 + }, + { + "epoch": 0.13, + "learning_rate": 1.9500899542272292e-06, + "loss": 1.0811, + "step": 4993 + }, + { + "epoch": 0.13, + "learning_rate": 1.9500640531658195e-06, + "loss": 0.7583, + "step": 4994 + }, + { + "epoch": 0.13, + "learning_rate": 1.9500381455575117e-06, + "loss": 0.9961, + "step": 4995 + }, + { + "epoch": 0.13, + "learning_rate": 1.9500122314024838e-06, + "loss": 1.0859, + "step": 4996 + }, + { + "epoch": 0.13, + "learning_rate": 1.9499863107009143e-06, + "loss": 0.7959, + "step": 4997 + }, + { + "epoch": 0.13, + "learning_rate": 1.949960383452982e-06, + "loss": 0.792, + "step": 4998 + }, + { + "epoch": 0.13, + "learning_rate": 1.9499344496588655e-06, + "loss": 0.9727, + "step": 4999 + }, + { + "epoch": 0.13, + "learning_rate": 1.9499085093187436e-06, + "loss": 0.5552, + "step": 5000 + }, + { + "epoch": 0.13, + "learning_rate": 1.999151346260752e-06, + "loss": 1.1875, + "step": 5001 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991502061419393e-06, + "loss": 1.3135, + "step": 5002 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991490652581228e-06, + "loss": 0.833, + "step": 5003 + }, + { + "epoch": 0.13, + "learning_rate": 1.999147923609304e-06, + "loss": 0.96, + "step": 5004 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991467811954844e-06, + "loss": 0.8867, + "step": 5005 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991456380166635e-06, + "loss": 0.9023, + "step": 5006 + }, + { + "epoch": 0.13, + "learning_rate": 1.999144494072842e-06, + "loss": 0.8223, + "step": 5007 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991433493640226e-06, + "loss": 0.915, + "step": 5008 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991422038902045e-06, + "loss": 0.918, + "step": 5009 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991410576513897e-06, + "loss": 0.9062, + "step": 5010 + }, + { + "epoch": 0.13, + "learning_rate": 1.999139910647578e-06, + "loss": 0.8828, + "step": 5011 + }, + { + "epoch": 0.13, + "learning_rate": 1.999138762878771e-06, + "loss": 1.0586, + "step": 5012 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991376143449693e-06, + "loss": 0.8301, + "step": 5013 + }, + { + "epoch": 0.13, + "learning_rate": 1.999136465046174e-06, + "loss": 0.9434, + "step": 5014 + }, + { + "epoch": 0.13, + "learning_rate": 1.999135314982386e-06, + "loss": 1.0273, + "step": 5015 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991341641536055e-06, + "loss": 1.0654, + "step": 5016 + }, + { + "epoch": 0.13, + "learning_rate": 1.999133012559834e-06, + "loss": 0.9531, + "step": 5017 + }, + { + "epoch": 0.13, + "learning_rate": 1.999131860201073e-06, + "loss": 1.04, + "step": 5018 + }, + { + "epoch": 0.13, + "learning_rate": 1.999130707077322e-06, + "loss": 1.0762, + "step": 5019 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991295531885826e-06, + "loss": 0.9863, + "step": 5020 + }, + { + "epoch": 0.13, + "learning_rate": 1.999128398534856e-06, + "loss": 0.9482, + "step": 5021 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991272431161425e-06, + "loss": 0.7305, + "step": 5022 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991260869324427e-06, + "loss": 0.9287, + "step": 5023 + }, + { + "epoch": 0.13, + "learning_rate": 1.999124929983759e-06, + "loss": 0.8789, + "step": 5024 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991237722700907e-06, + "loss": 0.917, + "step": 5025 + }, + { + "epoch": 0.13, + "learning_rate": 1.999122613791439e-06, + "loss": 1.1738, + "step": 5026 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991214545478056e-06, + "loss": 0.8887, + "step": 5027 + }, + { + "epoch": 0.13, + "learning_rate": 1.999120294539191e-06, + "loss": 1.3105, + "step": 5028 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991191337655953e-06, + "loss": 0.9297, + "step": 5029 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991179722270205e-06, + "loss": 0.9941, + "step": 5030 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991168099234666e-06, + "loss": 0.9365, + "step": 5031 + }, + { + "epoch": 0.13, + "learning_rate": 1.999115646854935e-06, + "loss": 0.9414, + "step": 5032 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991144830214267e-06, + "loss": 0.6777, + "step": 5033 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991133184229425e-06, + "loss": 0.8989, + "step": 5034 + }, + { + "epoch": 0.13, + "learning_rate": 1.999112153059483e-06, + "loss": 1.0195, + "step": 5035 + }, + { + "epoch": 0.13, + "learning_rate": 1.999110986931049e-06, + "loss": 0.957, + "step": 5036 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991098200376422e-06, + "loss": 0.8501, + "step": 5037 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991086523792625e-06, + "loss": 0.9111, + "step": 5038 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991074839559116e-06, + "loss": 0.9072, + "step": 5039 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991063147675896e-06, + "loss": 1.0996, + "step": 5040 + }, + { + "epoch": 0.13, + "learning_rate": 1.999105144814298e-06, + "loss": 0.8662, + "step": 5041 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991039740960377e-06, + "loss": 0.8857, + "step": 5042 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991028026128095e-06, + "loss": 0.8481, + "step": 5043 + }, + { + "epoch": 0.13, + "learning_rate": 1.9991016303646136e-06, + "loss": 0.6938, + "step": 5044 + }, + { + "epoch": 0.13, + "learning_rate": 1.999100457351452e-06, + "loss": 1.002, + "step": 5045 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990992835733254e-06, + "loss": 0.9062, + "step": 5046 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990981090302343e-06, + "loss": 0.8906, + "step": 5047 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990969337221793e-06, + "loss": 1.0195, + "step": 5048 + }, + { + "epoch": 0.13, + "learning_rate": 1.999095757649162e-06, + "loss": 0.8633, + "step": 5049 + }, + { + "epoch": 0.13, + "learning_rate": 1.999094580811183e-06, + "loss": 0.8569, + "step": 5050 + }, + { + "epoch": 0.13, + "learning_rate": 1.999093403208243e-06, + "loss": 1.0654, + "step": 5051 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990922248403433e-06, + "loss": 0.7432, + "step": 5052 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990910457074848e-06, + "loss": 0.957, + "step": 5053 + }, + { + "epoch": 0.13, + "learning_rate": 1.999089865809668e-06, + "loss": 1.1035, + "step": 5054 + }, + { + "epoch": 0.13, + "learning_rate": 1.999088685146894e-06, + "loss": 1.0107, + "step": 5055 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990875037191637e-06, + "loss": 0.9521, + "step": 5056 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990863215264783e-06, + "loss": 0.9678, + "step": 5057 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990851385688382e-06, + "loss": 0.8965, + "step": 5058 + }, + { + "epoch": 0.13, + "learning_rate": 1.999083954846245e-06, + "loss": 1.041, + "step": 5059 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990827703586986e-06, + "loss": 0.7783, + "step": 5060 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990815851062006e-06, + "loss": 1.3086, + "step": 5061 + }, + { + "epoch": 0.13, + "learning_rate": 1.999080399088752e-06, + "loss": 0.8311, + "step": 5062 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990792123063532e-06, + "loss": 1.0273, + "step": 5063 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990780247590054e-06, + "loss": 0.8848, + "step": 5064 + }, + { + "epoch": 0.13, + "learning_rate": 1.99907683644671e-06, + "loss": 1.0615, + "step": 5065 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990756473694664e-06, + "loss": 0.7148, + "step": 5066 + }, + { + "epoch": 0.13, + "learning_rate": 1.999074457527277e-06, + "loss": 1.0596, + "step": 5067 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990732669201423e-06, + "loss": 1.0107, + "step": 5068 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990720755480634e-06, + "loss": 0.9238, + "step": 5069 + }, + { + "epoch": 0.13, + "learning_rate": 1.999070883411041e-06, + "loss": 0.7217, + "step": 5070 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990696905090757e-06, + "loss": 0.8779, + "step": 5071 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990684968421686e-06, + "loss": 0.8701, + "step": 5072 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990673024103208e-06, + "loss": 1.1138, + "step": 5073 + }, + { + "epoch": 0.13, + "learning_rate": 1.999066107213533e-06, + "loss": 0.834, + "step": 5074 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990649112518063e-06, + "loss": 0.9551, + "step": 5075 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990637145251413e-06, + "loss": 0.8857, + "step": 5076 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990625170335395e-06, + "loss": 1.0332, + "step": 5077 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990613187770012e-06, + "loss": 1.1074, + "step": 5078 + }, + { + "epoch": 0.13, + "learning_rate": 1.999060119755528e-06, + "loss": 1.0127, + "step": 5079 + }, + { + "epoch": 0.13, + "learning_rate": 1.99905891996912e-06, + "loss": 0.5747, + "step": 5080 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990577194177783e-06, + "loss": 0.9941, + "step": 5081 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990565181015047e-06, + "loss": 0.7622, + "step": 5082 + }, + { + "epoch": 0.13, + "learning_rate": 1.999055316020299e-06, + "loss": 0.9561, + "step": 5083 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990541131741626e-06, + "loss": 0.9453, + "step": 5084 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990529095630967e-06, + "loss": 0.8276, + "step": 5085 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990517051871016e-06, + "loss": 0.8887, + "step": 5086 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990505000461786e-06, + "loss": 1.1504, + "step": 5087 + }, + { + "epoch": 0.13, + "learning_rate": 1.999049294140329e-06, + "loss": 0.9961, + "step": 5088 + }, + { + "epoch": 0.13, + "learning_rate": 1.999048087469553e-06, + "loss": 0.4961, + "step": 5089 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990468800338517e-06, + "loss": 0.9307, + "step": 5090 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990456718332263e-06, + "loss": 1.0977, + "step": 5091 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990444628676777e-06, + "loss": 0.9434, + "step": 5092 + }, + { + "epoch": 0.13, + "learning_rate": 1.999043253137206e-06, + "loss": 0.9688, + "step": 5093 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990420426418135e-06, + "loss": 0.8867, + "step": 5094 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990408313815005e-06, + "loss": 1.0264, + "step": 5095 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990396193562672e-06, + "loss": 0.9961, + "step": 5096 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990384065661158e-06, + "loss": 1.0078, + "step": 5097 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990371930110465e-06, + "loss": 0.7246, + "step": 5098 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990359786910604e-06, + "loss": 0.9688, + "step": 5099 + }, + { + "epoch": 0.13, + "learning_rate": 1.999034763606158e-06, + "loss": 0.7329, + "step": 5100 + }, + { + "epoch": 0.13, + "learning_rate": 1.999033547756341e-06, + "loss": 1.0234, + "step": 5101 + }, + { + "epoch": 0.13, + "learning_rate": 1.99903233114161e-06, + "loss": 0.8496, + "step": 5102 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990311137619654e-06, + "loss": 1.123, + "step": 5103 + }, + { + "epoch": 0.13, + "learning_rate": 1.999029895617409e-06, + "loss": 0.6885, + "step": 5104 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990286767079418e-06, + "loss": 0.9697, + "step": 5105 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990274570335635e-06, + "loss": 0.8306, + "step": 5106 + }, + { + "epoch": 0.13, + "learning_rate": 1.999026236594276e-06, + "loss": 0.8926, + "step": 5107 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990250153900803e-06, + "loss": 1.0654, + "step": 5108 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990237934209767e-06, + "loss": 0.8208, + "step": 5109 + }, + { + "epoch": 0.13, + "learning_rate": 1.999022570686967e-06, + "loss": 1.1445, + "step": 5110 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990213471880514e-06, + "loss": 0.9023, + "step": 5111 + }, + { + "epoch": 0.13, + "learning_rate": 1.999020122924231e-06, + "loss": 0.9727, + "step": 5112 + }, + { + "epoch": 0.13, + "learning_rate": 1.999018897895507e-06, + "loss": 0.8115, + "step": 5113 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990176721018803e-06, + "loss": 1.0293, + "step": 5114 + }, + { + "epoch": 0.13, + "learning_rate": 1.999016445543351e-06, + "loss": 1.0439, + "step": 5115 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990152182199213e-06, + "loss": 1.0586, + "step": 5116 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990139901315916e-06, + "loss": 0.9893, + "step": 5117 + }, + { + "epoch": 0.13, + "learning_rate": 1.999012761278363e-06, + "loss": 1.0605, + "step": 5118 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990115316602358e-06, + "loss": 1.1885, + "step": 5119 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990103012772117e-06, + "loss": 0.957, + "step": 5120 + }, + { + "epoch": 0.13, + "learning_rate": 1.999009070129291e-06, + "loss": 0.8291, + "step": 5121 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990078382164755e-06, + "loss": 1.0938, + "step": 5122 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990066055387654e-06, + "loss": 0.9775, + "step": 5123 + }, + { + "epoch": 0.13, + "learning_rate": 1.999005372096162e-06, + "loss": 0.6768, + "step": 5124 + }, + { + "epoch": 0.13, + "learning_rate": 1.9990041378886654e-06, + "loss": 1.0635, + "step": 5125 + }, + { + "epoch": 0.13, + "learning_rate": 1.999002902916278e-06, + "loss": 0.8721, + "step": 5126 + }, + { + "epoch": 0.13, + "learning_rate": 1.999001667179e-06, + "loss": 0.8867, + "step": 5127 + }, + { + "epoch": 0.13, + "learning_rate": 1.999000430676832e-06, + "loss": 0.7139, + "step": 5128 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989991934097757e-06, + "loss": 0.9941, + "step": 5129 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989979553778315e-06, + "loss": 1.0684, + "step": 5130 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989967165810004e-06, + "loss": 0.8125, + "step": 5131 + }, + { + "epoch": 0.13, + "learning_rate": 1.998995477019284e-06, + "loss": 1.0098, + "step": 5132 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989942366926816e-06, + "loss": 0.9238, + "step": 5133 + }, + { + "epoch": 0.13, + "learning_rate": 1.998992995601196e-06, + "loss": 1.0391, + "step": 5134 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989917537448273e-06, + "loss": 0.679, + "step": 5135 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989905111235764e-06, + "loss": 1.0059, + "step": 5136 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989892677374446e-06, + "loss": 0.8535, + "step": 5137 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989880235864324e-06, + "loss": 1.0225, + "step": 5138 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989867786705413e-06, + "loss": 0.9316, + "step": 5139 + }, + { + "epoch": 0.13, + "learning_rate": 1.998985532989772e-06, + "loss": 0.8936, + "step": 5140 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989842865441253e-06, + "loss": 0.8604, + "step": 5141 + }, + { + "epoch": 0.13, + "learning_rate": 1.998983039333602e-06, + "loss": 0.8896, + "step": 5142 + }, + { + "epoch": 0.13, + "learning_rate": 1.998981791358204e-06, + "loss": 0.7856, + "step": 5143 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989805426179306e-06, + "loss": 0.8516, + "step": 5144 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989792931127846e-06, + "loss": 0.8115, + "step": 5145 + }, + { + "epoch": 0.13, + "learning_rate": 1.998978042842765e-06, + "loss": 0.9619, + "step": 5146 + }, + { + "epoch": 0.13, + "learning_rate": 1.998976791807875e-06, + "loss": 0.9111, + "step": 5147 + }, + { + "epoch": 0.13, + "learning_rate": 1.998975540008114e-06, + "loss": 0.8252, + "step": 5148 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989742874434834e-06, + "loss": 0.7056, + "step": 5149 + }, + { + "epoch": 0.13, + "learning_rate": 1.998973034113984e-06, + "loss": 0.9131, + "step": 5150 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989717800196172e-06, + "loss": 1.1348, + "step": 5151 + }, + { + "epoch": 0.13, + "learning_rate": 1.998970525160383e-06, + "loss": 0.8862, + "step": 5152 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989692695362837e-06, + "loss": 1.082, + "step": 5153 + }, + { + "epoch": 0.13, + "learning_rate": 1.998968013147319e-06, + "loss": 0.8203, + "step": 5154 + }, + { + "epoch": 0.13, + "learning_rate": 1.998966755993491e-06, + "loss": 0.9731, + "step": 5155 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989654980747996e-06, + "loss": 0.9243, + "step": 5156 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989642393912464e-06, + "loss": 0.9189, + "step": 5157 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989629799428323e-06, + "loss": 0.9048, + "step": 5158 + }, + { + "epoch": 0.13, + "learning_rate": 1.998961719729558e-06, + "loss": 0.8735, + "step": 5159 + }, + { + "epoch": 0.13, + "learning_rate": 1.998960458751425e-06, + "loss": 1.0127, + "step": 5160 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989591970084334e-06, + "loss": 1.1953, + "step": 5161 + }, + { + "epoch": 0.13, + "learning_rate": 1.998957934500585e-06, + "loss": 1.0674, + "step": 5162 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989566712278806e-06, + "loss": 0.9531, + "step": 5163 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989554071903206e-06, + "loss": 0.9424, + "step": 5164 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989541423879065e-06, + "loss": 0.8711, + "step": 5165 + }, + { + "epoch": 0.13, + "learning_rate": 1.99895287682064e-06, + "loss": 0.9297, + "step": 5166 + }, + { + "epoch": 0.13, + "learning_rate": 1.99895161048852e-06, + "loss": 0.8135, + "step": 5167 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989503433915493e-06, + "loss": 0.9141, + "step": 5168 + }, + { + "epoch": 0.13, + "learning_rate": 1.998949075529728e-06, + "loss": 0.8662, + "step": 5169 + }, + { + "epoch": 0.13, + "learning_rate": 1.998947806903057e-06, + "loss": 0.8525, + "step": 5170 + }, + { + "epoch": 0.13, + "learning_rate": 1.998946537511538e-06, + "loss": 0.7568, + "step": 5171 + }, + { + "epoch": 0.13, + "learning_rate": 1.998945267355172e-06, + "loss": 1.1768, + "step": 5172 + }, + { + "epoch": 0.13, + "learning_rate": 1.998943996433959e-06, + "loss": 1.0293, + "step": 5173 + }, + { + "epoch": 0.13, + "learning_rate": 1.998942724747901e-06, + "loss": 0.9697, + "step": 5174 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989414522969978e-06, + "loss": 1.0391, + "step": 5175 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989401790812514e-06, + "loss": 1.2441, + "step": 5176 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989389051006623e-06, + "loss": 0.9453, + "step": 5177 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989376303552316e-06, + "loss": 1.0361, + "step": 5178 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989363548449607e-06, + "loss": 0.9062, + "step": 5179 + }, + { + "epoch": 0.13, + "learning_rate": 1.99893507856985e-06, + "loss": 1.0674, + "step": 5180 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989338015299e-06, + "loss": 0.845, + "step": 5181 + }, + { + "epoch": 0.13, + "learning_rate": 1.998932523725113e-06, + "loss": 0.814, + "step": 5182 + }, + { + "epoch": 0.13, + "learning_rate": 1.998931245155489e-06, + "loss": 0.998, + "step": 5183 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989299658210297e-06, + "loss": 0.9375, + "step": 5184 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989286857217354e-06, + "loss": 0.8691, + "step": 5185 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989274048576077e-06, + "loss": 0.9512, + "step": 5186 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989261232286464e-06, + "loss": 0.7051, + "step": 5187 + }, + { + "epoch": 0.13, + "learning_rate": 1.998924840834854e-06, + "loss": 0.7319, + "step": 5188 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989235576762303e-06, + "loss": 0.9736, + "step": 5189 + }, + { + "epoch": 0.13, + "learning_rate": 1.998922273752777e-06, + "loss": 0.834, + "step": 5190 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989209890644946e-06, + "loss": 1.1523, + "step": 5191 + }, + { + "epoch": 0.13, + "learning_rate": 1.998919703611385e-06, + "loss": 1.1191, + "step": 5192 + }, + { + "epoch": 0.13, + "learning_rate": 1.998918417393448e-06, + "loss": 0.72, + "step": 5193 + }, + { + "epoch": 0.13, + "learning_rate": 1.998917130410685e-06, + "loss": 0.9922, + "step": 5194 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989158426630973e-06, + "loss": 1.0303, + "step": 5195 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989145541506856e-06, + "loss": 0.8623, + "step": 5196 + }, + { + "epoch": 0.13, + "learning_rate": 1.998913264873451e-06, + "loss": 1.166, + "step": 5197 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989119748313942e-06, + "loss": 0.8062, + "step": 5198 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989106840245168e-06, + "loss": 0.9648, + "step": 5199 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989093924528194e-06, + "loss": 0.8638, + "step": 5200 + }, + { + "epoch": 0.13, + "learning_rate": 1.998908100116303e-06, + "loss": 0.835, + "step": 5201 + }, + { + "epoch": 0.13, + "learning_rate": 1.998906807014968e-06, + "loss": 0.8535, + "step": 5202 + }, + { + "epoch": 0.13, + "learning_rate": 1.998905513148817e-06, + "loss": 0.917, + "step": 5203 + }, + { + "epoch": 0.13, + "learning_rate": 1.998904218517849e-06, + "loss": 0.7212, + "step": 5204 + }, + { + "epoch": 0.13, + "learning_rate": 1.998902923122067e-06, + "loss": 1.1143, + "step": 5205 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989016269614703e-06, + "loss": 0.7993, + "step": 5206 + }, + { + "epoch": 0.13, + "learning_rate": 1.9989003300360605e-06, + "loss": 0.7148, + "step": 5207 + }, + { + "epoch": 0.13, + "learning_rate": 1.998899032345839e-06, + "loss": 0.6194, + "step": 5208 + }, + { + "epoch": 0.13, + "learning_rate": 1.998897733890806e-06, + "loss": 0.9814, + "step": 5209 + }, + { + "epoch": 0.13, + "learning_rate": 1.998896434670963e-06, + "loss": 0.9277, + "step": 5210 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988951346863114e-06, + "loss": 0.9619, + "step": 5211 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988938339368515e-06, + "loss": 1.0195, + "step": 5212 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988925324225844e-06, + "loss": 0.9141, + "step": 5213 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988912301435113e-06, + "loss": 0.8066, + "step": 5214 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988899270996327e-06, + "loss": 0.9033, + "step": 5215 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988886232909507e-06, + "loss": 0.8545, + "step": 5216 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988873187174653e-06, + "loss": 1.083, + "step": 5217 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988860133791777e-06, + "loss": 0.9805, + "step": 5218 + }, + { + "epoch": 0.13, + "learning_rate": 1.998884707276089e-06, + "loss": 0.9697, + "step": 5219 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988834004082004e-06, + "loss": 1.0488, + "step": 5220 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988820927755127e-06, + "loss": 0.8789, + "step": 5221 + }, + { + "epoch": 0.13, + "learning_rate": 1.998880784378027e-06, + "loss": 0.9629, + "step": 5222 + }, + { + "epoch": 0.13, + "learning_rate": 1.998879475215744e-06, + "loss": 0.5991, + "step": 5223 + }, + { + "epoch": 0.13, + "learning_rate": 1.998878165288665e-06, + "loss": 0.9229, + "step": 5224 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988768545967908e-06, + "loss": 1.2188, + "step": 5225 + }, + { + "epoch": 0.13, + "learning_rate": 1.998875543140123e-06, + "loss": 0.7983, + "step": 5226 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988742309186614e-06, + "loss": 0.9033, + "step": 5227 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988729179324083e-06, + "loss": 0.6704, + "step": 5228 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988716041813637e-06, + "loss": 1.1797, + "step": 5229 + }, + { + "epoch": 0.13, + "learning_rate": 1.998870289665529e-06, + "loss": 1.0195, + "step": 5230 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988689743849057e-06, + "loss": 1.0186, + "step": 5231 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988676583394944e-06, + "loss": 0.915, + "step": 5232 + }, + { + "epoch": 0.13, + "learning_rate": 1.998866341529296e-06, + "loss": 0.7568, + "step": 5233 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988650239543113e-06, + "loss": 0.8887, + "step": 5234 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988637056145414e-06, + "loss": 1.0342, + "step": 5235 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988623865099877e-06, + "loss": 0.666, + "step": 5236 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988610666406513e-06, + "loss": 0.5898, + "step": 5237 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988597460065327e-06, + "loss": 0.9668, + "step": 5238 + }, + { + "epoch": 0.13, + "learning_rate": 1.998858424607633e-06, + "loss": 0.999, + "step": 5239 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988571024439538e-06, + "loss": 0.9727, + "step": 5240 + }, + { + "epoch": 0.13, + "learning_rate": 1.998855779515495e-06, + "loss": 0.8564, + "step": 5241 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988544558222586e-06, + "loss": 0.748, + "step": 5242 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988531313642453e-06, + "loss": 1.0518, + "step": 5243 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988518061414557e-06, + "loss": 1.1045, + "step": 5244 + }, + { + "epoch": 0.13, + "learning_rate": 1.998850480153892e-06, + "loss": 0.8564, + "step": 5245 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988491534015535e-06, + "loss": 0.401, + "step": 5246 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988478258844426e-06, + "loss": 1.1318, + "step": 5247 + }, + { + "epoch": 0.13, + "learning_rate": 1.99884649760256e-06, + "loss": 1.0654, + "step": 5248 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988451685559062e-06, + "loss": 0.8896, + "step": 5249 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988438387444825e-06, + "loss": 0.9336, + "step": 5250 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988425081682905e-06, + "loss": 0.8652, + "step": 5251 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988411768273306e-06, + "loss": 0.6875, + "step": 5252 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988398447216034e-06, + "loss": 1.0332, + "step": 5253 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988385118511113e-06, + "loss": 0.9346, + "step": 5254 + }, + { + "epoch": 0.13, + "learning_rate": 1.998837178215854e-06, + "loss": 0.9316, + "step": 5255 + }, + { + "epoch": 0.13, + "learning_rate": 1.998835843815833e-06, + "loss": 1.0645, + "step": 5256 + }, + { + "epoch": 0.13, + "learning_rate": 1.998834508651049e-06, + "loss": 1.0781, + "step": 5257 + }, + { + "epoch": 0.13, + "learning_rate": 1.998833172721504e-06, + "loss": 0.731, + "step": 5258 + }, + { + "epoch": 0.13, + "learning_rate": 1.998831836027198e-06, + "loss": 0.7827, + "step": 5259 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988304985681322e-06, + "loss": 0.9932, + "step": 5260 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988291603443084e-06, + "loss": 1.0088, + "step": 5261 + }, + { + "epoch": 0.13, + "learning_rate": 1.998827821355727e-06, + "loss": 0.8564, + "step": 5262 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988264816023883e-06, + "loss": 0.8955, + "step": 5263 + }, + { + "epoch": 0.13, + "learning_rate": 1.998825141084295e-06, + "loss": 0.6968, + "step": 5264 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988237998014468e-06, + "loss": 0.7283, + "step": 5265 + }, + { + "epoch": 0.13, + "learning_rate": 1.9988224577538448e-06, + "loss": 0.8438, + "step": 5266 + }, + { + "epoch": 0.13, + "learning_rate": 1.998821114941491e-06, + "loss": 0.9668, + "step": 5267 + }, + { + "epoch": 0.14, + "learning_rate": 1.998819771364385e-06, + "loss": 0.9409, + "step": 5268 + }, + { + "epoch": 0.14, + "learning_rate": 1.9988184270225292e-06, + "loss": 0.9512, + "step": 5269 + }, + { + "epoch": 0.14, + "learning_rate": 1.998817081915924e-06, + "loss": 0.8022, + "step": 5270 + }, + { + "epoch": 0.14, + "learning_rate": 1.9988157360445706e-06, + "loss": 0.8857, + "step": 5271 + }, + { + "epoch": 0.14, + "learning_rate": 1.9988143894084696e-06, + "loss": 0.959, + "step": 5272 + }, + { + "epoch": 0.14, + "learning_rate": 1.9988130420076228e-06, + "loss": 0.936, + "step": 5273 + }, + { + "epoch": 0.14, + "learning_rate": 1.99881169384203e-06, + "loss": 0.6899, + "step": 5274 + }, + { + "epoch": 0.14, + "learning_rate": 1.998810344911694e-06, + "loss": 0.8799, + "step": 5275 + }, + { + "epoch": 0.14, + "learning_rate": 1.9988089952166142e-06, + "loss": 1.0625, + "step": 5276 + }, + { + "epoch": 0.14, + "learning_rate": 1.9988076447567926e-06, + "loss": 0.9053, + "step": 5277 + }, + { + "epoch": 0.14, + "learning_rate": 1.99880629353223e-06, + "loss": 1.0547, + "step": 5278 + }, + { + "epoch": 0.14, + "learning_rate": 1.998804941542927e-06, + "loss": 1.0176, + "step": 5279 + }, + { + "epoch": 0.14, + "learning_rate": 1.998803588788885e-06, + "loss": 0.7144, + "step": 5280 + }, + { + "epoch": 0.14, + "learning_rate": 1.9988022352701052e-06, + "loss": 1.0137, + "step": 5281 + }, + { + "epoch": 0.14, + "learning_rate": 1.998800880986588e-06, + "loss": 1.0049, + "step": 5282 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987995259383356e-06, + "loss": 0.6733, + "step": 5283 + }, + { + "epoch": 0.14, + "learning_rate": 1.998798170125348e-06, + "loss": 0.9434, + "step": 5284 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987968135476267e-06, + "loss": 0.9404, + "step": 5285 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987954562051724e-06, + "loss": 0.9014, + "step": 5286 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987940980979863e-06, + "loss": 0.8105, + "step": 5287 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987927392260695e-06, + "loss": 1.0078, + "step": 5288 + }, + { + "epoch": 0.14, + "learning_rate": 1.998791379589423e-06, + "loss": 0.9346, + "step": 5289 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987900191880482e-06, + "loss": 1.0098, + "step": 5290 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987886580219453e-06, + "loss": 0.8857, + "step": 5291 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987872960911165e-06, + "loss": 1.0547, + "step": 5292 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987859333955618e-06, + "loss": 0.8125, + "step": 5293 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987845699352824e-06, + "loss": 1.0117, + "step": 5294 + }, + { + "epoch": 0.14, + "learning_rate": 1.99878320571028e-06, + "loss": 0.9355, + "step": 5295 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987818407205553e-06, + "loss": 1.0229, + "step": 5296 + }, + { + "epoch": 0.14, + "learning_rate": 1.998780474966109e-06, + "loss": 0.8984, + "step": 5297 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987791084469423e-06, + "loss": 0.9014, + "step": 5298 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987777411630567e-06, + "loss": 1.0762, + "step": 5299 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987763731144528e-06, + "loss": 0.7231, + "step": 5300 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987750043011314e-06, + "loss": 0.7188, + "step": 5301 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987736347230943e-06, + "loss": 0.8174, + "step": 5302 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987722643803424e-06, + "loss": 0.8193, + "step": 5303 + }, + { + "epoch": 0.14, + "learning_rate": 1.998770893272876e-06, + "loss": 0.9229, + "step": 5304 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987695214006967e-06, + "loss": 0.6689, + "step": 5305 + }, + { + "epoch": 0.14, + "learning_rate": 1.998768148763806e-06, + "loss": 0.9971, + "step": 5306 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987667753622037e-06, + "loss": 0.9502, + "step": 5307 + }, + { + "epoch": 0.14, + "learning_rate": 1.998765401195892e-06, + "loss": 0.8848, + "step": 5308 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987640262648714e-06, + "loss": 0.9492, + "step": 5309 + }, + { + "epoch": 0.14, + "learning_rate": 1.998762650569143e-06, + "loss": 0.6956, + "step": 5310 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987612741087084e-06, + "loss": 1.1416, + "step": 5311 + }, + { + "epoch": 0.14, + "learning_rate": 1.998759896883568e-06, + "loss": 0.9463, + "step": 5312 + }, + { + "epoch": 0.14, + "learning_rate": 1.998758518893723e-06, + "loss": 0.7988, + "step": 5313 + }, + { + "epoch": 0.14, + "learning_rate": 1.998757140139175e-06, + "loss": 1.084, + "step": 5314 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987557606199238e-06, + "loss": 0.9727, + "step": 5315 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987543803359717e-06, + "loss": 0.9912, + "step": 5316 + }, + { + "epoch": 0.14, + "learning_rate": 1.998752999287319e-06, + "loss": 1.0469, + "step": 5317 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987516174739674e-06, + "loss": 1.041, + "step": 5318 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987502348959177e-06, + "loss": 1.1094, + "step": 5319 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987488515531704e-06, + "loss": 0.708, + "step": 5320 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987474674457273e-06, + "loss": 0.7935, + "step": 5321 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987460825735892e-06, + "loss": 1.1152, + "step": 5322 + }, + { + "epoch": 0.14, + "learning_rate": 1.998744696936757e-06, + "loss": 0.9707, + "step": 5323 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987433105352323e-06, + "loss": 0.959, + "step": 5324 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987419233690156e-06, + "loss": 0.8125, + "step": 5325 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987405354381077e-06, + "loss": 0.9131, + "step": 5326 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987391467425107e-06, + "loss": 0.9795, + "step": 5327 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987377572822247e-06, + "loss": 1.0371, + "step": 5328 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987363670572513e-06, + "loss": 0.7822, + "step": 5329 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987349760675914e-06, + "loss": 0.8706, + "step": 5330 + }, + { + "epoch": 0.14, + "learning_rate": 1.998733584313246e-06, + "loss": 0.9199, + "step": 5331 + }, + { + "epoch": 0.14, + "learning_rate": 1.998732191794216e-06, + "loss": 1.1055, + "step": 5332 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987307985105027e-06, + "loss": 0.8398, + "step": 5333 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987294044621073e-06, + "loss": 1.0762, + "step": 5334 + }, + { + "epoch": 0.14, + "learning_rate": 1.998728009649031e-06, + "loss": 1.0205, + "step": 5335 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987266140712742e-06, + "loss": 0.8765, + "step": 5336 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987252177288383e-06, + "loss": 0.8394, + "step": 5337 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987238206217243e-06, + "loss": 0.8989, + "step": 5338 + }, + { + "epoch": 0.14, + "learning_rate": 1.998722422749934e-06, + "loss": 0.8579, + "step": 5339 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987210241134673e-06, + "loss": 0.8887, + "step": 5340 + }, + { + "epoch": 0.14, + "learning_rate": 1.998719624712326e-06, + "loss": 0.9131, + "step": 5341 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987182245465112e-06, + "loss": 0.6753, + "step": 5342 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987168236160235e-06, + "loss": 1.0342, + "step": 5343 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987154219208645e-06, + "loss": 1.0459, + "step": 5344 + }, + { + "epoch": 0.14, + "learning_rate": 1.998714019461035e-06, + "loss": 0.8184, + "step": 5345 + }, + { + "epoch": 0.14, + "learning_rate": 1.998712616236536e-06, + "loss": 0.9688, + "step": 5346 + }, + { + "epoch": 0.14, + "learning_rate": 1.998711212247369e-06, + "loss": 1.0986, + "step": 5347 + }, + { + "epoch": 0.14, + "learning_rate": 1.998709807493534e-06, + "loss": 0.9639, + "step": 5348 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987084019750335e-06, + "loss": 0.6875, + "step": 5349 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987069956918676e-06, + "loss": 0.9004, + "step": 5350 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987055886440377e-06, + "loss": 0.6086, + "step": 5351 + }, + { + "epoch": 0.14, + "learning_rate": 1.998704180831545e-06, + "loss": 1.084, + "step": 5352 + }, + { + "epoch": 0.14, + "learning_rate": 1.99870277225439e-06, + "loss": 0.9907, + "step": 5353 + }, + { + "epoch": 0.14, + "learning_rate": 1.9987013629125748e-06, + "loss": 0.8525, + "step": 5354 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986999528060995e-06, + "loss": 0.8813, + "step": 5355 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986985419349657e-06, + "loss": 0.9346, + "step": 5356 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986971302991746e-06, + "loss": 0.9766, + "step": 5357 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986957178987266e-06, + "loss": 0.9443, + "step": 5358 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986943047336234e-06, + "loss": 0.9043, + "step": 5359 + }, + { + "epoch": 0.14, + "learning_rate": 1.998692890803866e-06, + "loss": 0.8301, + "step": 5360 + }, + { + "epoch": 0.14, + "learning_rate": 1.998691476109455e-06, + "loss": 0.9766, + "step": 5361 + }, + { + "epoch": 0.14, + "learning_rate": 1.998690060650392e-06, + "loss": 0.9453, + "step": 5362 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986886444266784e-06, + "loss": 0.9365, + "step": 5363 + }, + { + "epoch": 0.14, + "learning_rate": 1.998687227438314e-06, + "loss": 1.0352, + "step": 5364 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986858096853014e-06, + "loss": 1.0312, + "step": 5365 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986843911676408e-06, + "loss": 0.9023, + "step": 5366 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986829718853334e-06, + "loss": 0.8721, + "step": 5367 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986815518383806e-06, + "loss": 0.9893, + "step": 5368 + }, + { + "epoch": 0.14, + "learning_rate": 1.998680131026783e-06, + "loss": 0.957, + "step": 5369 + }, + { + "epoch": 0.14, + "learning_rate": 1.998678709450542e-06, + "loss": 1.0078, + "step": 5370 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986772871096585e-06, + "loss": 0.9746, + "step": 5371 + }, + { + "epoch": 0.14, + "learning_rate": 1.998675864004134e-06, + "loss": 1.0918, + "step": 5372 + }, + { + "epoch": 0.14, + "learning_rate": 1.998674440133969e-06, + "loss": 0.6768, + "step": 5373 + }, + { + "epoch": 0.14, + "learning_rate": 1.998673015499165e-06, + "loss": 0.877, + "step": 5374 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986715900997234e-06, + "loss": 0.8271, + "step": 5375 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986701639356443e-06, + "loss": 0.9312, + "step": 5376 + }, + { + "epoch": 0.14, + "learning_rate": 1.99866873700693e-06, + "loss": 1.0034, + "step": 5377 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986673093135804e-06, + "loss": 0.7661, + "step": 5378 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986658808555972e-06, + "loss": 0.9971, + "step": 5379 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986644516329817e-06, + "loss": 0.8545, + "step": 5380 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986630216457348e-06, + "loss": 0.8262, + "step": 5381 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986615908938576e-06, + "loss": 1.1045, + "step": 5382 + }, + { + "epoch": 0.14, + "learning_rate": 1.998660159377351e-06, + "loss": 0.958, + "step": 5383 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986587270962157e-06, + "loss": 1.0908, + "step": 5384 + }, + { + "epoch": 0.14, + "learning_rate": 1.998657294050454e-06, + "loss": 0.8262, + "step": 5385 + }, + { + "epoch": 0.14, + "learning_rate": 1.998655860240066e-06, + "loss": 1.001, + "step": 5386 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986544256650536e-06, + "loss": 0.8408, + "step": 5387 + }, + { + "epoch": 0.14, + "learning_rate": 1.998652990325417e-06, + "loss": 0.7534, + "step": 5388 + }, + { + "epoch": 0.14, + "learning_rate": 1.998651554221158e-06, + "loss": 0.957, + "step": 5389 + }, + { + "epoch": 0.14, + "learning_rate": 1.998650117352277e-06, + "loss": 0.8857, + "step": 5390 + }, + { + "epoch": 0.14, + "learning_rate": 1.998648679718776e-06, + "loss": 0.9648, + "step": 5391 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986472413206553e-06, + "loss": 0.6479, + "step": 5392 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986458021579163e-06, + "loss": 1.001, + "step": 5393 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986443622305603e-06, + "loss": 1.0361, + "step": 5394 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986429215385884e-06, + "loss": 0.8916, + "step": 5395 + }, + { + "epoch": 0.14, + "learning_rate": 1.998641480082001e-06, + "loss": 0.9043, + "step": 5396 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986400378608003e-06, + "loss": 0.8037, + "step": 5397 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986385948749866e-06, + "loss": 0.9355, + "step": 5398 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986371511245613e-06, + "loss": 0.9023, + "step": 5399 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986357066095253e-06, + "loss": 1.0752, + "step": 5400 + }, + { + "epoch": 0.14, + "learning_rate": 1.99863426132988e-06, + "loss": 0.8086, + "step": 5401 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986328152856262e-06, + "loss": 0.8662, + "step": 5402 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986313684767653e-06, + "loss": 0.9707, + "step": 5403 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986299209032983e-06, + "loss": 0.7422, + "step": 5404 + }, + { + "epoch": 0.14, + "learning_rate": 1.998628472565226e-06, + "loss": 0.8965, + "step": 5405 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986270234625504e-06, + "loss": 0.699, + "step": 5406 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986255735952716e-06, + "loss": 0.9805, + "step": 5407 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986241229633914e-06, + "loss": 1.0352, + "step": 5408 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986226715669102e-06, + "loss": 1.084, + "step": 5409 + }, + { + "epoch": 0.14, + "learning_rate": 1.99862121940583e-06, + "loss": 1.1396, + "step": 5410 + }, + { + "epoch": 0.14, + "learning_rate": 1.998619766480151e-06, + "loss": 0.6528, + "step": 5411 + }, + { + "epoch": 0.14, + "learning_rate": 1.998618312789875e-06, + "loss": 0.9102, + "step": 5412 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986168583350026e-06, + "loss": 0.7998, + "step": 5413 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986154031155356e-06, + "loss": 0.9316, + "step": 5414 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986139471314744e-06, + "loss": 0.8887, + "step": 5415 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986124903828204e-06, + "loss": 0.875, + "step": 5416 + }, + { + "epoch": 0.14, + "learning_rate": 1.998611032869575e-06, + "loss": 0.8901, + "step": 5417 + }, + { + "epoch": 0.14, + "learning_rate": 1.998609574591739e-06, + "loss": 0.8252, + "step": 5418 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986081155493137e-06, + "loss": 0.96, + "step": 5419 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986066557422998e-06, + "loss": 1.0254, + "step": 5420 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986051951706984e-06, + "loss": 1.0195, + "step": 5421 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986037338345114e-06, + "loss": 0.8428, + "step": 5422 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986022717337394e-06, + "loss": 0.9297, + "step": 5423 + }, + { + "epoch": 0.14, + "learning_rate": 1.9986008088683835e-06, + "loss": 0.7266, + "step": 5424 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985993452384447e-06, + "loss": 0.835, + "step": 5425 + }, + { + "epoch": 0.14, + "learning_rate": 1.998597880843925e-06, + "loss": 1.1396, + "step": 5426 + }, + { + "epoch": 0.14, + "learning_rate": 1.998596415684824e-06, + "loss": 0.8252, + "step": 5427 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985949497611442e-06, + "loss": 0.8721, + "step": 5428 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985934830728855e-06, + "loss": 1.0879, + "step": 5429 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985920156200503e-06, + "loss": 0.7671, + "step": 5430 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985905474026387e-06, + "loss": 0.8169, + "step": 5431 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985890784206524e-06, + "loss": 0.9951, + "step": 5432 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985876086740923e-06, + "loss": 0.9424, + "step": 5433 + }, + { + "epoch": 0.14, + "learning_rate": 1.99858613816296e-06, + "loss": 0.8037, + "step": 5434 + }, + { + "epoch": 0.14, + "learning_rate": 1.998584666887256e-06, + "loss": 0.8408, + "step": 5435 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985831948469813e-06, + "loss": 0.8062, + "step": 5436 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985817220421376e-06, + "loss": 0.7637, + "step": 5437 + }, + { + "epoch": 0.14, + "learning_rate": 1.998580248472726e-06, + "loss": 0.8789, + "step": 5438 + }, + { + "epoch": 0.14, + "learning_rate": 1.998578774138747e-06, + "loss": 0.9609, + "step": 5439 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985772990402024e-06, + "loss": 0.9297, + "step": 5440 + }, + { + "epoch": 0.14, + "learning_rate": 1.998575823177093e-06, + "loss": 1.1426, + "step": 5441 + }, + { + "epoch": 0.14, + "learning_rate": 1.99857434654942e-06, + "loss": 0.917, + "step": 5442 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985728691571847e-06, + "loss": 0.7798, + "step": 5443 + }, + { + "epoch": 0.14, + "learning_rate": 1.998571391000388e-06, + "loss": 0.8818, + "step": 5444 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985699120790306e-06, + "loss": 0.8193, + "step": 5445 + }, + { + "epoch": 0.14, + "learning_rate": 1.998568432393115e-06, + "loss": 0.791, + "step": 5446 + }, + { + "epoch": 0.14, + "learning_rate": 1.998566951942641e-06, + "loss": 0.8403, + "step": 5447 + }, + { + "epoch": 0.14, + "learning_rate": 1.99856547072761e-06, + "loss": 1.165, + "step": 5448 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985639887480233e-06, + "loss": 0.9658, + "step": 5449 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985625060038823e-06, + "loss": 0.7969, + "step": 5450 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985610224951882e-06, + "loss": 0.8955, + "step": 5451 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985595382219415e-06, + "loss": 1.0391, + "step": 5452 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985580531841437e-06, + "loss": 0.9541, + "step": 5453 + }, + { + "epoch": 0.14, + "learning_rate": 1.998556567381796e-06, + "loss": 0.9727, + "step": 5454 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985550808149e-06, + "loss": 0.8975, + "step": 5455 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985535934834554e-06, + "loss": 0.7158, + "step": 5456 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985521053874642e-06, + "loss": 0.8071, + "step": 5457 + }, + { + "epoch": 0.14, + "learning_rate": 1.998550616526928e-06, + "loss": 0.9307, + "step": 5458 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985491269018475e-06, + "loss": 1.166, + "step": 5459 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985476365122237e-06, + "loss": 0.8457, + "step": 5460 + }, + { + "epoch": 0.14, + "learning_rate": 1.998546145358058e-06, + "loss": 1.0645, + "step": 5461 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985446534393514e-06, + "loss": 0.4753, + "step": 5462 + }, + { + "epoch": 0.14, + "learning_rate": 1.998543160756105e-06, + "loss": 0.9912, + "step": 5463 + }, + { + "epoch": 0.14, + "learning_rate": 1.99854166730832e-06, + "loss": 0.9922, + "step": 5464 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985401730959976e-06, + "loss": 0.8828, + "step": 5465 + }, + { + "epoch": 0.14, + "learning_rate": 1.998538678119139e-06, + "loss": 1.0098, + "step": 5466 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985371823777454e-06, + "loss": 0.9883, + "step": 5467 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985356858718173e-06, + "loss": 0.8828, + "step": 5468 + }, + { + "epoch": 0.14, + "learning_rate": 1.998534188601357e-06, + "loss": 1.0322, + "step": 5469 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985326905663646e-06, + "loss": 0.9497, + "step": 5470 + }, + { + "epoch": 0.14, + "learning_rate": 1.998531191766841e-06, + "loss": 1.0654, + "step": 5471 + }, + { + "epoch": 0.14, + "learning_rate": 1.998529692202789e-06, + "loss": 0.9316, + "step": 5472 + }, + { + "epoch": 0.14, + "learning_rate": 1.998528191874208e-06, + "loss": 0.7969, + "step": 5473 + }, + { + "epoch": 0.14, + "learning_rate": 1.998526690781101e-06, + "loss": 0.9639, + "step": 5474 + }, + { + "epoch": 0.14, + "learning_rate": 1.998525188923467e-06, + "loss": 1.1572, + "step": 5475 + }, + { + "epoch": 0.14, + "learning_rate": 1.998523686301308e-06, + "loss": 1.0684, + "step": 5476 + }, + { + "epoch": 0.14, + "learning_rate": 1.998522182914626e-06, + "loss": 1.0635, + "step": 5477 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985206787634213e-06, + "loss": 0.877, + "step": 5478 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985191738476953e-06, + "loss": 0.9668, + "step": 5479 + }, + { + "epoch": 0.14, + "learning_rate": 1.998517668167449e-06, + "loss": 1.0098, + "step": 5480 + }, + { + "epoch": 0.14, + "learning_rate": 1.998516161722683e-06, + "loss": 0.7876, + "step": 5481 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985146545134e-06, + "loss": 0.6973, + "step": 5482 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985131465396e-06, + "loss": 1.0674, + "step": 5483 + }, + { + "epoch": 0.14, + "learning_rate": 1.998511637801284e-06, + "loss": 1.166, + "step": 5484 + }, + { + "epoch": 0.14, + "learning_rate": 1.998510128298454e-06, + "loss": 0.7439, + "step": 5485 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985086180311104e-06, + "loss": 1.0371, + "step": 5486 + }, + { + "epoch": 0.14, + "learning_rate": 1.998507106999255e-06, + "loss": 0.9521, + "step": 5487 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985055952028886e-06, + "loss": 0.8633, + "step": 5488 + }, + { + "epoch": 0.14, + "learning_rate": 1.998504082642012e-06, + "loss": 0.9434, + "step": 5489 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985025693166267e-06, + "loss": 0.8823, + "step": 5490 + }, + { + "epoch": 0.14, + "learning_rate": 1.9985010552267343e-06, + "loss": 0.918, + "step": 5491 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984995403723354e-06, + "loss": 0.918, + "step": 5492 + }, + { + "epoch": 0.14, + "learning_rate": 1.998498024753431e-06, + "loss": 1.0908, + "step": 5493 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984965083700234e-06, + "loss": 0.9575, + "step": 5494 + }, + { + "epoch": 0.14, + "learning_rate": 1.998494991222112e-06, + "loss": 0.8467, + "step": 5495 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984934733096998e-06, + "loss": 0.999, + "step": 5496 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984919546327864e-06, + "loss": 0.8945, + "step": 5497 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984904351913737e-06, + "loss": 1.0918, + "step": 5498 + }, + { + "epoch": 0.14, + "learning_rate": 1.998488914985463e-06, + "loss": 0.9238, + "step": 5499 + }, + { + "epoch": 0.14, + "learning_rate": 1.998487394015055e-06, + "loss": 1.0068, + "step": 5500 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984858722801515e-06, + "loss": 0.8564, + "step": 5501 + }, + { + "epoch": 0.14, + "learning_rate": 1.998484349780753e-06, + "loss": 0.9951, + "step": 5502 + }, + { + "epoch": 0.14, + "learning_rate": 1.998482826516861e-06, + "loss": 0.7705, + "step": 5503 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984813024884764e-06, + "loss": 0.8604, + "step": 5504 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984797776956006e-06, + "loss": 0.8228, + "step": 5505 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984782521382352e-06, + "loss": 0.9932, + "step": 5506 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984767258163807e-06, + "loss": 0.8555, + "step": 5507 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984751987300387e-06, + "loss": 0.9336, + "step": 5508 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984736708792096e-06, + "loss": 0.9326, + "step": 5509 + }, + { + "epoch": 0.14, + "learning_rate": 1.998472142263895e-06, + "loss": 0.8608, + "step": 5510 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984706128840967e-06, + "loss": 0.917, + "step": 5511 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984690827398154e-06, + "loss": 1.0439, + "step": 5512 + }, + { + "epoch": 0.14, + "learning_rate": 1.998467551831052e-06, + "loss": 0.9316, + "step": 5513 + }, + { + "epoch": 0.14, + "learning_rate": 1.998466020157808e-06, + "loss": 0.9375, + "step": 5514 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984644877200843e-06, + "loss": 0.7876, + "step": 5515 + }, + { + "epoch": 0.14, + "learning_rate": 1.998462954517883e-06, + "loss": 1.2334, + "step": 5516 + }, + { + "epoch": 0.14, + "learning_rate": 1.998461420551204e-06, + "loss": 0.8081, + "step": 5517 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984598858200487e-06, + "loss": 0.7246, + "step": 5518 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984583503244186e-06, + "loss": 1.0703, + "step": 5519 + }, + { + "epoch": 0.14, + "learning_rate": 1.998456814064315e-06, + "loss": 1.1152, + "step": 5520 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984552770397393e-06, + "loss": 0.6763, + "step": 5521 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984537392506917e-06, + "loss": 0.9507, + "step": 5522 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984522006971744e-06, + "loss": 0.8491, + "step": 5523 + }, + { + "epoch": 0.14, + "learning_rate": 1.998450661379188e-06, + "loss": 1.0059, + "step": 5524 + }, + { + "epoch": 0.14, + "learning_rate": 1.998449121296734e-06, + "loss": 1.1943, + "step": 5525 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984475804498135e-06, + "loss": 0.9531, + "step": 5526 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984460388384272e-06, + "loss": 0.8242, + "step": 5527 + }, + { + "epoch": 0.14, + "learning_rate": 1.998444496462577e-06, + "loss": 0.8633, + "step": 5528 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984429533222635e-06, + "loss": 0.8447, + "step": 5529 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984414094174885e-06, + "loss": 0.9863, + "step": 5530 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984398647482524e-06, + "loss": 0.626, + "step": 5531 + }, + { + "epoch": 0.14, + "learning_rate": 1.998438319314557e-06, + "loss": 0.9214, + "step": 5532 + }, + { + "epoch": 0.14, + "learning_rate": 1.998436773116403e-06, + "loss": 0.9619, + "step": 5533 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984352261537923e-06, + "loss": 0.9077, + "step": 5534 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984336784267257e-06, + "loss": 0.9272, + "step": 5535 + }, + { + "epoch": 0.14, + "learning_rate": 1.998432129935204e-06, + "loss": 0.9697, + "step": 5536 + }, + { + "epoch": 0.14, + "learning_rate": 1.998430580679229e-06, + "loss": 1.0459, + "step": 5537 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984290306588013e-06, + "loss": 0.9111, + "step": 5538 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984274798739225e-06, + "loss": 0.8916, + "step": 5539 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984259283245943e-06, + "loss": 1.0645, + "step": 5540 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984243760108167e-06, + "loss": 0.8398, + "step": 5541 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984228229325915e-06, + "loss": 0.916, + "step": 5542 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984212690899195e-06, + "loss": 0.9541, + "step": 5543 + }, + { + "epoch": 0.14, + "learning_rate": 1.998419714482803e-06, + "loss": 0.9697, + "step": 5544 + }, + { + "epoch": 0.14, + "learning_rate": 1.998418159111242e-06, + "loss": 0.8975, + "step": 5545 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984166029752382e-06, + "loss": 0.9561, + "step": 5546 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984150460747925e-06, + "loss": 0.9531, + "step": 5547 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984134884099064e-06, + "loss": 0.7285, + "step": 5548 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984119299805814e-06, + "loss": 0.8232, + "step": 5549 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984103707868177e-06, + "loss": 0.9297, + "step": 5550 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984088108286174e-06, + "loss": 0.9902, + "step": 5551 + }, + { + "epoch": 0.14, + "learning_rate": 1.9984072501059812e-06, + "loss": 1.1172, + "step": 5552 + }, + { + "epoch": 0.14, + "learning_rate": 1.998405688618911e-06, + "loss": 0.9609, + "step": 5553 + }, + { + "epoch": 0.14, + "learning_rate": 1.998404126367407e-06, + "loss": 0.8799, + "step": 5554 + }, + { + "epoch": 0.14, + "learning_rate": 1.998402563351471e-06, + "loss": 1.0371, + "step": 5555 + }, + { + "epoch": 0.14, + "learning_rate": 1.998400999571104e-06, + "loss": 1.0469, + "step": 5556 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983994350263075e-06, + "loss": 0.8721, + "step": 5557 + }, + { + "epoch": 0.14, + "learning_rate": 1.998397869717082e-06, + "loss": 0.7549, + "step": 5558 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983963036434296e-06, + "loss": 1.0674, + "step": 5559 + }, + { + "epoch": 0.14, + "learning_rate": 1.998394736805351e-06, + "loss": 0.7539, + "step": 5560 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983931692028473e-06, + "loss": 1.0107, + "step": 5561 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983916008359197e-06, + "loss": 0.6118, + "step": 5562 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983900317045698e-06, + "loss": 0.7656, + "step": 5563 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983884618087985e-06, + "loss": 1.0869, + "step": 5564 + }, + { + "epoch": 0.14, + "learning_rate": 1.998386891148607e-06, + "loss": 0.9062, + "step": 5565 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983853197239968e-06, + "loss": 0.8682, + "step": 5566 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983837475349685e-06, + "loss": 1.0068, + "step": 5567 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983821745815243e-06, + "loss": 0.7998, + "step": 5568 + }, + { + "epoch": 0.14, + "learning_rate": 1.998380600863664e-06, + "loss": 0.9658, + "step": 5569 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983790263813903e-06, + "loss": 0.9502, + "step": 5570 + }, + { + "epoch": 0.14, + "learning_rate": 1.998377451134703e-06, + "loss": 1.1582, + "step": 5571 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983758751236046e-06, + "loss": 0.686, + "step": 5572 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983742983480953e-06, + "loss": 1.0137, + "step": 5573 + }, + { + "epoch": 0.14, + "learning_rate": 1.998372720808177e-06, + "loss": 0.6724, + "step": 5574 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983711425038503e-06, + "loss": 0.8145, + "step": 5575 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983695634351166e-06, + "loss": 0.7446, + "step": 5576 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983679836019776e-06, + "loss": 1.0244, + "step": 5577 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983664030044342e-06, + "loss": 1.0752, + "step": 5578 + }, + { + "epoch": 0.14, + "learning_rate": 1.998364821642487e-06, + "loss": 0.7764, + "step": 5579 + }, + { + "epoch": 0.14, + "learning_rate": 1.998363239516138e-06, + "loss": 0.8948, + "step": 5580 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983616566253886e-06, + "loss": 0.6699, + "step": 5581 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983600729702396e-06, + "loss": 0.6992, + "step": 5582 + }, + { + "epoch": 0.14, + "learning_rate": 1.998358488550692e-06, + "loss": 1.0996, + "step": 5583 + }, + { + "epoch": 0.14, + "learning_rate": 1.998356903366747e-06, + "loss": 0.7119, + "step": 5584 + }, + { + "epoch": 0.14, + "learning_rate": 1.998355317418406e-06, + "loss": 0.9736, + "step": 5585 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983537307056702e-06, + "loss": 0.8557, + "step": 5586 + }, + { + "epoch": 0.14, + "learning_rate": 1.998352143228541e-06, + "loss": 0.9141, + "step": 5587 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983505549870197e-06, + "loss": 1.0527, + "step": 5588 + }, + { + "epoch": 0.14, + "learning_rate": 1.998348965981107e-06, + "loss": 0.8164, + "step": 5589 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983473762108044e-06, + "loss": 0.8193, + "step": 5590 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983457856761135e-06, + "loss": 0.9102, + "step": 5591 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983441943770347e-06, + "loss": 0.7759, + "step": 5592 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983426023135696e-06, + "loss": 0.9277, + "step": 5593 + }, + { + "epoch": 0.14, + "learning_rate": 1.99834100948572e-06, + "loss": 1.0654, + "step": 5594 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983394158934863e-06, + "loss": 0.8208, + "step": 5595 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983378215368697e-06, + "loss": 0.915, + "step": 5596 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983362264158723e-06, + "loss": 0.9414, + "step": 5597 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983346305304942e-06, + "loss": 1.1396, + "step": 5598 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983330338807375e-06, + "loss": 0.8125, + "step": 5599 + }, + { + "epoch": 0.14, + "learning_rate": 1.998331436466603e-06, + "loss": 0.7285, + "step": 5600 + }, + { + "epoch": 0.14, + "learning_rate": 1.998329838288092e-06, + "loss": 0.9951, + "step": 5601 + }, + { + "epoch": 0.14, + "learning_rate": 1.998328239345206e-06, + "loss": 0.9697, + "step": 5602 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983266396379456e-06, + "loss": 0.8652, + "step": 5603 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983250391663127e-06, + "loss": 0.7734, + "step": 5604 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983234379303083e-06, + "loss": 0.918, + "step": 5605 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983218359299334e-06, + "loss": 1.0449, + "step": 5606 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983202331651892e-06, + "loss": 0.9121, + "step": 5607 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983186296360774e-06, + "loss": 0.8613, + "step": 5608 + }, + { + "epoch": 0.14, + "learning_rate": 1.998317025342599e-06, + "loss": 0.7646, + "step": 5609 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983154202847547e-06, + "loss": 0.8799, + "step": 5610 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983138144625464e-06, + "loss": 0.9004, + "step": 5611 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983122078759747e-06, + "loss": 0.9292, + "step": 5612 + }, + { + "epoch": 0.14, + "learning_rate": 1.998310600525042e-06, + "loss": 1.0225, + "step": 5613 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983089924097484e-06, + "loss": 1.0674, + "step": 5614 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983073835300954e-06, + "loss": 1.0449, + "step": 5615 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983057738860846e-06, + "loss": 1.0361, + "step": 5616 + }, + { + "epoch": 0.14, + "learning_rate": 1.998304163477717e-06, + "loss": 0.9658, + "step": 5617 + }, + { + "epoch": 0.14, + "learning_rate": 1.9983025523049936e-06, + "loss": 0.8838, + "step": 5618 + }, + { + "epoch": 0.14, + "learning_rate": 1.998300940367916e-06, + "loss": 0.8496, + "step": 5619 + }, + { + "epoch": 0.14, + "learning_rate": 1.998299327666485e-06, + "loss": 0.8604, + "step": 5620 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982977142007023e-06, + "loss": 0.769, + "step": 5621 + }, + { + "epoch": 0.14, + "learning_rate": 1.998296099970569e-06, + "loss": 1.0312, + "step": 5622 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982944849760864e-06, + "loss": 0.8682, + "step": 5623 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982928692172553e-06, + "loss": 1.0703, + "step": 5624 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982912526940775e-06, + "loss": 0.8555, + "step": 5625 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982896354065536e-06, + "loss": 0.6973, + "step": 5626 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982880173546858e-06, + "loss": 1.002, + "step": 5627 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982863985384745e-06, + "loss": 0.9424, + "step": 5628 + }, + { + "epoch": 0.14, + "learning_rate": 1.998284778957921e-06, + "loss": 0.9043, + "step": 5629 + }, + { + "epoch": 0.14, + "learning_rate": 1.998283158613027e-06, + "loss": 0.6655, + "step": 5630 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982815375037934e-06, + "loss": 0.749, + "step": 5631 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982799156302214e-06, + "loss": 1.082, + "step": 5632 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982782929923127e-06, + "loss": 1.1934, + "step": 5633 + }, + { + "epoch": 0.14, + "learning_rate": 1.998276669590068e-06, + "loss": 0.7783, + "step": 5634 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982750454234885e-06, + "loss": 1.043, + "step": 5635 + }, + { + "epoch": 0.14, + "learning_rate": 1.998273420492576e-06, + "loss": 0.9629, + "step": 5636 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982717947973316e-06, + "loss": 0.9248, + "step": 5637 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982701683377563e-06, + "loss": 1.0654, + "step": 5638 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982685411138515e-06, + "loss": 0.7686, + "step": 5639 + }, + { + "epoch": 0.14, + "learning_rate": 1.998266913125618e-06, + "loss": 0.9639, + "step": 5640 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982652843730577e-06, + "loss": 0.9844, + "step": 5641 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982636548561717e-06, + "loss": 1.1621, + "step": 5642 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982620245749608e-06, + "loss": 0.8892, + "step": 5643 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982603935294267e-06, + "loss": 1.1348, + "step": 5644 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982587617195704e-06, + "loss": 0.7651, + "step": 5645 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982571291453934e-06, + "loss": 0.8701, + "step": 5646 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982554958068967e-06, + "loss": 0.9258, + "step": 5647 + }, + { + "epoch": 0.14, + "learning_rate": 1.998253861704082e-06, + "loss": 0.9941, + "step": 5648 + }, + { + "epoch": 0.14, + "learning_rate": 1.99825222683695e-06, + "loss": 1.0898, + "step": 5649 + }, + { + "epoch": 0.14, + "learning_rate": 1.998250591205502e-06, + "loss": 1.001, + "step": 5650 + }, + { + "epoch": 0.14, + "learning_rate": 1.99824895480974e-06, + "loss": 0.9238, + "step": 5651 + }, + { + "epoch": 0.14, + "learning_rate": 1.998247317649664e-06, + "loss": 0.814, + "step": 5652 + }, + { + "epoch": 0.14, + "learning_rate": 1.998245679725276e-06, + "loss": 1.0332, + "step": 5653 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982440410365776e-06, + "loss": 0.8652, + "step": 5654 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982424015835694e-06, + "loss": 0.8906, + "step": 5655 + }, + { + "epoch": 0.14, + "learning_rate": 1.998240761366253e-06, + "loss": 0.8398, + "step": 5656 + }, + { + "epoch": 0.14, + "learning_rate": 1.9982391203846294e-06, + "loss": 0.9912, + "step": 5657 + }, + { + "epoch": 0.15, + "learning_rate": 1.9982374786387e-06, + "loss": 0.8174, + "step": 5658 + }, + { + "epoch": 0.15, + "learning_rate": 1.9982358361284663e-06, + "loss": 1.0352, + "step": 5659 + }, + { + "epoch": 0.15, + "learning_rate": 1.998234192853929e-06, + "loss": 0.9736, + "step": 5660 + }, + { + "epoch": 0.15, + "learning_rate": 1.99823254881509e-06, + "loss": 0.918, + "step": 5661 + }, + { + "epoch": 0.15, + "learning_rate": 1.99823090401195e-06, + "loss": 0.9609, + "step": 5662 + }, + { + "epoch": 0.15, + "learning_rate": 1.9982292584445104e-06, + "loss": 0.9065, + "step": 5663 + }, + { + "epoch": 0.15, + "learning_rate": 1.9982276121127727e-06, + "loss": 0.7937, + "step": 5664 + }, + { + "epoch": 0.15, + "learning_rate": 1.998225965016738e-06, + "loss": 1.0566, + "step": 5665 + }, + { + "epoch": 0.15, + "learning_rate": 1.998224317156408e-06, + "loss": 0.8208, + "step": 5666 + }, + { + "epoch": 0.15, + "learning_rate": 1.998222668531783e-06, + "loss": 0.7832, + "step": 5667 + }, + { + "epoch": 0.15, + "learning_rate": 1.998221019142865e-06, + "loss": 0.8389, + "step": 5668 + }, + { + "epoch": 0.15, + "learning_rate": 1.998219368989655e-06, + "loss": 0.9092, + "step": 5669 + }, + { + "epoch": 0.15, + "learning_rate": 1.9982177180721544e-06, + "loss": 0.8916, + "step": 5670 + }, + { + "epoch": 0.15, + "learning_rate": 1.9982160663903643e-06, + "loss": 1.0381, + "step": 5671 + }, + { + "epoch": 0.15, + "learning_rate": 1.998214413944286e-06, + "loss": 1.1406, + "step": 5672 + }, + { + "epoch": 0.15, + "learning_rate": 1.9982127607339213e-06, + "loss": 0.7715, + "step": 5673 + }, + { + "epoch": 0.15, + "learning_rate": 1.99821110675927e-06, + "loss": 1.082, + "step": 5674 + }, + { + "epoch": 0.15, + "learning_rate": 1.9982094520203353e-06, + "loss": 0.9482, + "step": 5675 + }, + { + "epoch": 0.15, + "learning_rate": 1.9982077965171175e-06, + "loss": 0.9092, + "step": 5676 + }, + { + "epoch": 0.15, + "learning_rate": 1.9982061402496172e-06, + "loss": 0.9675, + "step": 5677 + }, + { + "epoch": 0.15, + "learning_rate": 1.998204483217837e-06, + "loss": 1.1006, + "step": 5678 + }, + { + "epoch": 0.15, + "learning_rate": 1.9982028254217773e-06, + "loss": 0.7075, + "step": 5679 + }, + { + "epoch": 0.15, + "learning_rate": 1.9982011668614393e-06, + "loss": 0.8594, + "step": 5680 + }, + { + "epoch": 0.15, + "learning_rate": 1.998199507536825e-06, + "loss": 0.8931, + "step": 5681 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981978474479353e-06, + "loss": 0.835, + "step": 5682 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981961865947706e-06, + "loss": 0.9268, + "step": 5683 + }, + { + "epoch": 0.15, + "learning_rate": 1.998194524977334e-06, + "loss": 0.9727, + "step": 5684 + }, + { + "epoch": 0.15, + "learning_rate": 1.998192862595625e-06, + "loss": 0.875, + "step": 5685 + }, + { + "epoch": 0.15, + "learning_rate": 1.998191199449646e-06, + "loss": 0.9863, + "step": 5686 + }, + { + "epoch": 0.15, + "learning_rate": 1.998189535539398e-06, + "loss": 0.959, + "step": 5687 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981878708648817e-06, + "loss": 1.0586, + "step": 5688 + }, + { + "epoch": 0.15, + "learning_rate": 1.998186205426099e-06, + "loss": 1.0186, + "step": 5689 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981845392230514e-06, + "loss": 0.8906, + "step": 5690 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981828722557395e-06, + "loss": 0.9004, + "step": 5691 + }, + { + "epoch": 0.15, + "learning_rate": 1.998181204524165e-06, + "loss": 0.8311, + "step": 5692 + }, + { + "epoch": 0.15, + "learning_rate": 1.998179536028329e-06, + "loss": 0.8716, + "step": 5693 + }, + { + "epoch": 0.15, + "learning_rate": 1.998177866768233e-06, + "loss": 0.8711, + "step": 5694 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981761967438773e-06, + "loss": 0.9189, + "step": 5695 + }, + { + "epoch": 0.15, + "learning_rate": 1.998174525955265e-06, + "loss": 1.0, + "step": 5696 + }, + { + "epoch": 0.15, + "learning_rate": 1.998172854402396e-06, + "loss": 1.0029, + "step": 5697 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981711820852717e-06, + "loss": 0.9834, + "step": 5698 + }, + { + "epoch": 0.15, + "learning_rate": 1.998169509003894e-06, + "loss": 1.0547, + "step": 5699 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981678351582635e-06, + "loss": 0.9883, + "step": 5700 + }, + { + "epoch": 0.15, + "learning_rate": 1.998166160548382e-06, + "loss": 1.0166, + "step": 5701 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981644851742504e-06, + "loss": 0.7046, + "step": 5702 + }, + { + "epoch": 0.15, + "learning_rate": 1.99816280903587e-06, + "loss": 0.8657, + "step": 5703 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981611321332428e-06, + "loss": 1.1777, + "step": 5704 + }, + { + "epoch": 0.15, + "learning_rate": 1.998159454466369e-06, + "loss": 0.9902, + "step": 5705 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981577760352505e-06, + "loss": 0.9043, + "step": 5706 + }, + { + "epoch": 0.15, + "learning_rate": 1.998156096839889e-06, + "loss": 0.9639, + "step": 5707 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981544168802845e-06, + "loss": 0.9302, + "step": 5708 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981527361564396e-06, + "loss": 0.9004, + "step": 5709 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981510546683546e-06, + "loss": 0.793, + "step": 5710 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981493724160316e-06, + "loss": 0.8105, + "step": 5711 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981476893994714e-06, + "loss": 0.9912, + "step": 5712 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981460056186753e-06, + "loss": 0.9531, + "step": 5713 + }, + { + "epoch": 0.15, + "learning_rate": 1.998144321073645e-06, + "loss": 0.7188, + "step": 5714 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981426357643813e-06, + "loss": 0.999, + "step": 5715 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981409496908856e-06, + "loss": 1.0771, + "step": 5716 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981392628531594e-06, + "loss": 0.9629, + "step": 5717 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981375752512037e-06, + "loss": 0.9766, + "step": 5718 + }, + { + "epoch": 0.15, + "learning_rate": 1.99813588688502e-06, + "loss": 0.9941, + "step": 5719 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981341977546096e-06, + "loss": 0.9932, + "step": 5720 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981325078599738e-06, + "loss": 0.916, + "step": 5721 + }, + { + "epoch": 0.15, + "learning_rate": 1.998130817201114e-06, + "loss": 1.0947, + "step": 5722 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981291257780307e-06, + "loss": 0.8359, + "step": 5723 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981274335907266e-06, + "loss": 0.7358, + "step": 5724 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981257406392017e-06, + "loss": 1.042, + "step": 5725 + }, + { + "epoch": 0.15, + "learning_rate": 1.998124046923458e-06, + "loss": 1.0703, + "step": 5726 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981223524434965e-06, + "loss": 1.0811, + "step": 5727 + }, + { + "epoch": 0.15, + "learning_rate": 1.998120657199319e-06, + "loss": 0.7292, + "step": 5728 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981189611909255e-06, + "loss": 0.5605, + "step": 5729 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981172644183194e-06, + "loss": 0.9463, + "step": 5730 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981155668815e-06, + "loss": 0.9688, + "step": 5731 + }, + { + "epoch": 0.15, + "learning_rate": 1.99811386858047e-06, + "loss": 0.8096, + "step": 5732 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981121695152294e-06, + "loss": 1.0918, + "step": 5733 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981104696857805e-06, + "loss": 0.7705, + "step": 5734 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981087690921245e-06, + "loss": 1.0625, + "step": 5735 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981070677342623e-06, + "loss": 1.0537, + "step": 5736 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981053656121955e-06, + "loss": 1.0029, + "step": 5737 + }, + { + "epoch": 0.15, + "learning_rate": 1.998103662725925e-06, + "loss": 1.083, + "step": 5738 + }, + { + "epoch": 0.15, + "learning_rate": 1.998101959075453e-06, + "loss": 0.8877, + "step": 5739 + }, + { + "epoch": 0.15, + "learning_rate": 1.9981002546607796e-06, + "loss": 0.6938, + "step": 5740 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980985494819072e-06, + "loss": 0.8203, + "step": 5741 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980968435388363e-06, + "loss": 0.8184, + "step": 5742 + }, + { + "epoch": 0.15, + "learning_rate": 1.998095136831569e-06, + "loss": 0.7871, + "step": 5743 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980934293601056e-06, + "loss": 0.9902, + "step": 5744 + }, + { + "epoch": 0.15, + "learning_rate": 1.998091721124448e-06, + "loss": 0.9121, + "step": 5745 + }, + { + "epoch": 0.15, + "learning_rate": 1.998090012124598e-06, + "loss": 0.9688, + "step": 5746 + }, + { + "epoch": 0.15, + "learning_rate": 1.998088302360556e-06, + "loss": 0.9014, + "step": 5747 + }, + { + "epoch": 0.15, + "learning_rate": 1.998086591832324e-06, + "loss": 0.8398, + "step": 5748 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980848805399024e-06, + "loss": 0.8623, + "step": 5749 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980831684832936e-06, + "loss": 0.9814, + "step": 5750 + }, + { + "epoch": 0.15, + "learning_rate": 1.998081455662498e-06, + "loss": 0.7002, + "step": 5751 + }, + { + "epoch": 0.15, + "learning_rate": 1.998079742077518e-06, + "loss": 1.1357, + "step": 5752 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980780277283535e-06, + "loss": 0.8818, + "step": 5753 + }, + { + "epoch": 0.15, + "learning_rate": 1.998076312615007e-06, + "loss": 0.8652, + "step": 5754 + }, + { + "epoch": 0.15, + "learning_rate": 1.998074596737479e-06, + "loss": 0.7339, + "step": 5755 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980728800957713e-06, + "loss": 0.999, + "step": 5756 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980711626898852e-06, + "loss": 0.9707, + "step": 5757 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980694445198217e-06, + "loss": 1.145, + "step": 5758 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980677255855828e-06, + "loss": 1.0674, + "step": 5759 + }, + { + "epoch": 0.15, + "learning_rate": 1.998066005887169e-06, + "loss": 0.9795, + "step": 5760 + }, + { + "epoch": 0.15, + "learning_rate": 1.998064285424582e-06, + "loss": 0.9717, + "step": 5761 + }, + { + "epoch": 0.15, + "learning_rate": 1.998062564197823e-06, + "loss": 1.125, + "step": 5762 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980608422068933e-06, + "loss": 0.9326, + "step": 5763 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980591194517947e-06, + "loss": 0.8506, + "step": 5764 + }, + { + "epoch": 0.15, + "learning_rate": 1.998057395932528e-06, + "loss": 0.8726, + "step": 5765 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980556716490943e-06, + "loss": 0.6884, + "step": 5766 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980539466014955e-06, + "loss": 0.657, + "step": 5767 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980522207897327e-06, + "loss": 0.9351, + "step": 5768 + }, + { + "epoch": 0.15, + "learning_rate": 1.998050494213807e-06, + "loss": 0.6743, + "step": 5769 + }, + { + "epoch": 0.15, + "learning_rate": 1.99804876687372e-06, + "loss": 1.0264, + "step": 5770 + }, + { + "epoch": 0.15, + "learning_rate": 1.998047038769473e-06, + "loss": 0.843, + "step": 5771 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980453099010674e-06, + "loss": 0.9971, + "step": 5772 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980435802685042e-06, + "loss": 0.9609, + "step": 5773 + }, + { + "epoch": 0.15, + "learning_rate": 1.998041849871785e-06, + "loss": 1.0547, + "step": 5774 + }, + { + "epoch": 0.15, + "learning_rate": 1.998040118710911e-06, + "loss": 1.0732, + "step": 5775 + }, + { + "epoch": 0.15, + "learning_rate": 1.998038386785884e-06, + "loss": 0.7661, + "step": 5776 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980366540967044e-06, + "loss": 0.9004, + "step": 5777 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980349206433743e-06, + "loss": 0.8403, + "step": 5778 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980331864258946e-06, + "loss": 0.8955, + "step": 5779 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980314514442667e-06, + "loss": 1.2197, + "step": 5780 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980297156984923e-06, + "loss": 0.9902, + "step": 5781 + }, + { + "epoch": 0.15, + "learning_rate": 1.998027979188572e-06, + "loss": 0.9453, + "step": 5782 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980262419145076e-06, + "loss": 0.8555, + "step": 5783 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980245038763007e-06, + "loss": 0.9766, + "step": 5784 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980227650739524e-06, + "loss": 0.8027, + "step": 5785 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980210255074635e-06, + "loss": 0.9697, + "step": 5786 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980192851768365e-06, + "loss": 1.1484, + "step": 5787 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980175440820714e-06, + "loss": 0.8652, + "step": 5788 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980158022231704e-06, + "loss": 1.0176, + "step": 5789 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980140596001343e-06, + "loss": 0.9639, + "step": 5790 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980123162129652e-06, + "loss": 1.0664, + "step": 5791 + }, + { + "epoch": 0.15, + "learning_rate": 1.998010572061664e-06, + "loss": 0.9658, + "step": 5792 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980088271462315e-06, + "loss": 0.8262, + "step": 5793 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980070814666698e-06, + "loss": 0.832, + "step": 5794 + }, + { + "epoch": 0.15, + "learning_rate": 1.99800533502298e-06, + "loss": 0.9404, + "step": 5795 + }, + { + "epoch": 0.15, + "learning_rate": 1.9980035878151635e-06, + "loss": 0.957, + "step": 5796 + }, + { + "epoch": 0.15, + "learning_rate": 1.998001839843221e-06, + "loss": 0.96, + "step": 5797 + }, + { + "epoch": 0.15, + "learning_rate": 1.998000091107155e-06, + "loss": 1.0234, + "step": 5798 + }, + { + "epoch": 0.15, + "learning_rate": 1.997998341606966e-06, + "loss": 0.8574, + "step": 5799 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979965913426555e-06, + "loss": 0.7944, + "step": 5800 + }, + { + "epoch": 0.15, + "learning_rate": 1.997994840314225e-06, + "loss": 0.8198, + "step": 5801 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979930885216754e-06, + "loss": 0.9746, + "step": 5802 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979913359650087e-06, + "loss": 1.1738, + "step": 5803 + }, + { + "epoch": 0.15, + "learning_rate": 1.997989582644226e-06, + "loss": 1.0107, + "step": 5804 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979878285593285e-06, + "loss": 0.8584, + "step": 5805 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979860737103175e-06, + "loss": 0.8906, + "step": 5806 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979843180971943e-06, + "loss": 0.938, + "step": 5807 + }, + { + "epoch": 0.15, + "learning_rate": 1.997982561719961e-06, + "loss": 0.998, + "step": 5808 + }, + { + "epoch": 0.15, + "learning_rate": 1.997980804578618e-06, + "loss": 0.9404, + "step": 5809 + }, + { + "epoch": 0.15, + "learning_rate": 1.997979046673167e-06, + "loss": 1.0811, + "step": 5810 + }, + { + "epoch": 0.15, + "learning_rate": 1.997977288003609e-06, + "loss": 0.7686, + "step": 5811 + }, + { + "epoch": 0.15, + "learning_rate": 1.997975528569946e-06, + "loss": 0.9199, + "step": 5812 + }, + { + "epoch": 0.15, + "learning_rate": 1.997973768372179e-06, + "loss": 0.8555, + "step": 5813 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979720074103095e-06, + "loss": 1.0078, + "step": 5814 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979702456843384e-06, + "loss": 1.3057, + "step": 5815 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979684831942673e-06, + "loss": 0.8164, + "step": 5816 + }, + { + "epoch": 0.15, + "learning_rate": 1.997966719940098e-06, + "loss": 0.7744, + "step": 5817 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979649559218313e-06, + "loss": 1.1133, + "step": 5818 + }, + { + "epoch": 0.15, + "learning_rate": 1.997963191139469e-06, + "loss": 0.8906, + "step": 5819 + }, + { + "epoch": 0.15, + "learning_rate": 1.997961425593012e-06, + "loss": 0.6958, + "step": 5820 + }, + { + "epoch": 0.15, + "learning_rate": 1.997959659282462e-06, + "loss": 0.8047, + "step": 5821 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979578922078194e-06, + "loss": 0.7695, + "step": 5822 + }, + { + "epoch": 0.15, + "learning_rate": 1.997956124369087e-06, + "loss": 1.0596, + "step": 5823 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979543557662653e-06, + "loss": 0.9346, + "step": 5824 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979525863993556e-06, + "loss": 0.8818, + "step": 5825 + }, + { + "epoch": 0.15, + "learning_rate": 1.99795081626836e-06, + "loss": 1.041, + "step": 5826 + }, + { + "epoch": 0.15, + "learning_rate": 1.997949045373279e-06, + "loss": 0.9365, + "step": 5827 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979472737141147e-06, + "loss": 0.9507, + "step": 5828 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979455012908675e-06, + "loss": 0.9238, + "step": 5829 + }, + { + "epoch": 0.15, + "learning_rate": 1.99794372810354e-06, + "loss": 0.8428, + "step": 5830 + }, + { + "epoch": 0.15, + "learning_rate": 1.997941954152132e-06, + "loss": 0.752, + "step": 5831 + }, + { + "epoch": 0.15, + "learning_rate": 1.997940179436646e-06, + "loss": 0.8003, + "step": 5832 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979384039570837e-06, + "loss": 0.9834, + "step": 5833 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979366277134452e-06, + "loss": 0.792, + "step": 5834 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979348507057326e-06, + "loss": 0.9385, + "step": 5835 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979330729339475e-06, + "loss": 1.0068, + "step": 5836 + }, + { + "epoch": 0.15, + "learning_rate": 1.997931294398091e-06, + "loss": 0.9053, + "step": 5837 + }, + { + "epoch": 0.15, + "learning_rate": 1.997929515098164e-06, + "loss": 0.4937, + "step": 5838 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979277350341683e-06, + "loss": 0.8457, + "step": 5839 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979259542061054e-06, + "loss": 0.854, + "step": 5840 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979241726139765e-06, + "loss": 0.7764, + "step": 5841 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979223902577827e-06, + "loss": 0.9517, + "step": 5842 + }, + { + "epoch": 0.15, + "learning_rate": 1.997920607137526e-06, + "loss": 0.752, + "step": 5843 + }, + { + "epoch": 0.15, + "learning_rate": 1.997918823253207e-06, + "loss": 0.9385, + "step": 5844 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979170386048274e-06, + "loss": 1.2168, + "step": 5845 + }, + { + "epoch": 0.15, + "learning_rate": 1.997915253192389e-06, + "loss": 0.9678, + "step": 5846 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979134670158927e-06, + "loss": 1.0557, + "step": 5847 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979116800753397e-06, + "loss": 0.855, + "step": 5848 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979098923707318e-06, + "loss": 1.1055, + "step": 5849 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979081039020696e-06, + "loss": 1.1562, + "step": 5850 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979063146693557e-06, + "loss": 0.9775, + "step": 5851 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979045246725906e-06, + "loss": 0.9141, + "step": 5852 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979027339117764e-06, + "loss": 0.9473, + "step": 5853 + }, + { + "epoch": 0.15, + "learning_rate": 1.9979009423869134e-06, + "loss": 0.8447, + "step": 5854 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978991500980035e-06, + "loss": 0.8174, + "step": 5855 + }, + { + "epoch": 0.15, + "learning_rate": 1.997897357045048e-06, + "loss": 0.7744, + "step": 5856 + }, + { + "epoch": 0.15, + "learning_rate": 1.997895563228049e-06, + "loss": 1.0127, + "step": 5857 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978937686470068e-06, + "loss": 0.8984, + "step": 5858 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978919733019236e-06, + "loss": 1.042, + "step": 5859 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978901771927997e-06, + "loss": 1.001, + "step": 5860 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978883803196378e-06, + "loss": 0.9902, + "step": 5861 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978865826824386e-06, + "loss": 1.0078, + "step": 5862 + }, + { + "epoch": 0.15, + "learning_rate": 1.997884784281203e-06, + "loss": 0.9844, + "step": 5863 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978829851159334e-06, + "loss": 0.9707, + "step": 5864 + }, + { + "epoch": 0.15, + "learning_rate": 1.997881185186631e-06, + "loss": 1.0605, + "step": 5865 + }, + { + "epoch": 0.15, + "learning_rate": 1.997879384493296e-06, + "loss": 1.001, + "step": 5866 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978775830359308e-06, + "loss": 0.9121, + "step": 5867 + }, + { + "epoch": 0.15, + "learning_rate": 1.997875780814537e-06, + "loss": 0.8418, + "step": 5868 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978739778291156e-06, + "loss": 0.9551, + "step": 5869 + }, + { + "epoch": 0.15, + "learning_rate": 1.997872174079668e-06, + "loss": 0.9023, + "step": 5870 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978703695661953e-06, + "loss": 0.8081, + "step": 5871 + }, + { + "epoch": 0.15, + "learning_rate": 1.997868564288699e-06, + "loss": 1.0547, + "step": 5872 + }, + { + "epoch": 0.15, + "learning_rate": 1.997866758247181e-06, + "loss": 0.8564, + "step": 5873 + }, + { + "epoch": 0.15, + "learning_rate": 1.997864951441642e-06, + "loss": 0.8228, + "step": 5874 + }, + { + "epoch": 0.15, + "learning_rate": 1.997863143872084e-06, + "loss": 0.8438, + "step": 5875 + }, + { + "epoch": 0.15, + "learning_rate": 1.997861335538508e-06, + "loss": 0.8701, + "step": 5876 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978595264409157e-06, + "loss": 1.123, + "step": 5877 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978577165793077e-06, + "loss": 1.1562, + "step": 5878 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978559059536862e-06, + "loss": 0.8613, + "step": 5879 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978540945640525e-06, + "loss": 0.9834, + "step": 5880 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978522824104072e-06, + "loss": 1.0273, + "step": 5881 + }, + { + "epoch": 0.15, + "learning_rate": 1.997850469492753e-06, + "loss": 0.9648, + "step": 5882 + }, + { + "epoch": 0.15, + "learning_rate": 1.99784865581109e-06, + "loss": 1.0996, + "step": 5883 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978468413654207e-06, + "loss": 1.1465, + "step": 5884 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978450261557455e-06, + "loss": 0.981, + "step": 5885 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978432101820663e-06, + "loss": 0.9346, + "step": 5886 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978413934443847e-06, + "loss": 0.9648, + "step": 5887 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978395759427018e-06, + "loss": 1.2129, + "step": 5888 + }, + { + "epoch": 0.15, + "learning_rate": 1.997837757677019e-06, + "loss": 1.0273, + "step": 5889 + }, + { + "epoch": 0.15, + "learning_rate": 1.997835938647337e-06, + "loss": 0.9297, + "step": 5890 + }, + { + "epoch": 0.15, + "learning_rate": 1.997834118853659e-06, + "loss": 1.1816, + "step": 5891 + }, + { + "epoch": 0.15, + "learning_rate": 1.997832298295985e-06, + "loss": 0.9365, + "step": 5892 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978304769743163e-06, + "loss": 0.8877, + "step": 5893 + }, + { + "epoch": 0.15, + "learning_rate": 1.997828654888655e-06, + "loss": 1.0811, + "step": 5894 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978268320390017e-06, + "loss": 0.9639, + "step": 5895 + }, + { + "epoch": 0.15, + "learning_rate": 1.997825008425359e-06, + "loss": 0.9375, + "step": 5896 + }, + { + "epoch": 0.15, + "learning_rate": 1.997823184047727e-06, + "loss": 1.2168, + "step": 5897 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978213589061083e-06, + "loss": 1.1064, + "step": 5898 + }, + { + "epoch": 0.15, + "learning_rate": 1.997819533000503e-06, + "loss": 0.8052, + "step": 5899 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978177063309136e-06, + "loss": 0.6492, + "step": 5900 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978158788973407e-06, + "loss": 0.7031, + "step": 5901 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978140506997865e-06, + "loss": 0.8032, + "step": 5902 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978122217382514e-06, + "loss": 0.895, + "step": 5903 + }, + { + "epoch": 0.15, + "learning_rate": 1.997810392012738e-06, + "loss": 0.9844, + "step": 5904 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978085615232463e-06, + "loss": 1.1484, + "step": 5905 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978067302697794e-06, + "loss": 0.9219, + "step": 5906 + }, + { + "epoch": 0.15, + "learning_rate": 1.997804898252337e-06, + "loss": 0.9756, + "step": 5907 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978030654709217e-06, + "loss": 0.9463, + "step": 5908 + }, + { + "epoch": 0.15, + "learning_rate": 1.9978012319255343e-06, + "loss": 0.8813, + "step": 5909 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977993976161767e-06, + "loss": 0.8008, + "step": 5910 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977975625428494e-06, + "loss": 0.9531, + "step": 5911 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977957267055544e-06, + "loss": 1.0938, + "step": 5912 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977938901042933e-06, + "loss": 0.8271, + "step": 5913 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977920527390673e-06, + "loss": 0.9688, + "step": 5914 + }, + { + "epoch": 0.15, + "learning_rate": 1.997790214609878e-06, + "loss": 0.8584, + "step": 5915 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977883757167263e-06, + "loss": 1.0342, + "step": 5916 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977865360596146e-06, + "loss": 0.9688, + "step": 5917 + }, + { + "epoch": 0.15, + "learning_rate": 1.997784695638543e-06, + "loss": 0.9238, + "step": 5918 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977828544535137e-06, + "loss": 0.9443, + "step": 5919 + }, + { + "epoch": 0.15, + "learning_rate": 1.997781012504528e-06, + "loss": 0.8359, + "step": 5920 + }, + { + "epoch": 0.15, + "learning_rate": 1.997779169791587e-06, + "loss": 0.7622, + "step": 5921 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977773263146925e-06, + "loss": 0.9736, + "step": 5922 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977754820738456e-06, + "loss": 0.9834, + "step": 5923 + }, + { + "epoch": 0.15, + "learning_rate": 1.997773637069048e-06, + "loss": 0.6057, + "step": 5924 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977717913003016e-06, + "loss": 0.771, + "step": 5925 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977699447676062e-06, + "loss": 0.9561, + "step": 5926 + }, + { + "epoch": 0.15, + "learning_rate": 1.997768097470965e-06, + "loss": 1.1084, + "step": 5927 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977662494103786e-06, + "loss": 0.9824, + "step": 5928 + }, + { + "epoch": 0.15, + "learning_rate": 1.997764400585848e-06, + "loss": 1.1426, + "step": 5929 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977625509973754e-06, + "loss": 0.8076, + "step": 5930 + }, + { + "epoch": 0.15, + "learning_rate": 1.997760700644962e-06, + "loss": 0.8037, + "step": 5931 + }, + { + "epoch": 0.15, + "learning_rate": 1.997758849528609e-06, + "loss": 0.8643, + "step": 5932 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977569976483177e-06, + "loss": 1.002, + "step": 5933 + }, + { + "epoch": 0.15, + "learning_rate": 1.99775514500409e-06, + "loss": 1.1338, + "step": 5934 + }, + { + "epoch": 0.15, + "learning_rate": 1.997753291595927e-06, + "loss": 0.9238, + "step": 5935 + }, + { + "epoch": 0.15, + "learning_rate": 1.99775143742383e-06, + "loss": 1.0869, + "step": 5936 + }, + { + "epoch": 0.15, + "learning_rate": 1.997749582487801e-06, + "loss": 1.1289, + "step": 5937 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977477267878402e-06, + "loss": 1.041, + "step": 5938 + }, + { + "epoch": 0.15, + "learning_rate": 1.997745870323951e-06, + "loss": 1.1162, + "step": 5939 + }, + { + "epoch": 0.15, + "learning_rate": 1.997744013096133e-06, + "loss": 1.0361, + "step": 5940 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977421551043884e-06, + "loss": 0.8281, + "step": 5941 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977402963487184e-06, + "loss": 1.1104, + "step": 5942 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977384368291246e-06, + "loss": 0.7705, + "step": 5943 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977365765456083e-06, + "loss": 0.9414, + "step": 5944 + }, + { + "epoch": 0.15, + "learning_rate": 1.997734715498171e-06, + "loss": 1.0469, + "step": 5945 + }, + { + "epoch": 0.15, + "learning_rate": 1.997732853686814e-06, + "loss": 0.7827, + "step": 5946 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977309911115392e-06, + "loss": 1.0264, + "step": 5947 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977291277723473e-06, + "loss": 0.9541, + "step": 5948 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977272636692406e-06, + "loss": 0.8125, + "step": 5949 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977253988022194e-06, + "loss": 0.8887, + "step": 5950 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977235331712862e-06, + "loss": 0.998, + "step": 5951 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977216667764416e-06, + "loss": 0.7949, + "step": 5952 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977197996176876e-06, + "loss": 0.7363, + "step": 5953 + }, + { + "epoch": 0.15, + "learning_rate": 1.997717931695025e-06, + "loss": 0.8057, + "step": 5954 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977160630084562e-06, + "loss": 0.8076, + "step": 5955 + }, + { + "epoch": 0.15, + "learning_rate": 1.997714193557982e-06, + "loss": 0.9863, + "step": 5956 + }, + { + "epoch": 0.15, + "learning_rate": 1.997712323343604e-06, + "loss": 0.8623, + "step": 5957 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977104523653234e-06, + "loss": 0.9287, + "step": 5958 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977085806231415e-06, + "loss": 0.8789, + "step": 5959 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977067081170605e-06, + "loss": 0.9131, + "step": 5960 + }, + { + "epoch": 0.15, + "learning_rate": 1.997704834847081e-06, + "loss": 0.9805, + "step": 5961 + }, + { + "epoch": 0.15, + "learning_rate": 1.997702960813205e-06, + "loss": 1.127, + "step": 5962 + }, + { + "epoch": 0.15, + "learning_rate": 1.9977010860154337e-06, + "loss": 1.1543, + "step": 5963 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976992104537685e-06, + "loss": 0.9863, + "step": 5964 + }, + { + "epoch": 0.15, + "learning_rate": 1.997697334128211e-06, + "loss": 0.9434, + "step": 5965 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976954570387622e-06, + "loss": 0.7144, + "step": 5966 + }, + { + "epoch": 0.15, + "learning_rate": 1.997693579185424e-06, + "loss": 0.8506, + "step": 5967 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976917005681977e-06, + "loss": 0.9248, + "step": 5968 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976898211870848e-06, + "loss": 1.1562, + "step": 5969 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976879410420867e-06, + "loss": 1.0156, + "step": 5970 + }, + { + "epoch": 0.15, + "learning_rate": 1.997686060133205e-06, + "loss": 0.9707, + "step": 5971 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976841784604407e-06, + "loss": 1.0186, + "step": 5972 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976822960237954e-06, + "loss": 0.7423, + "step": 5973 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976804128232708e-06, + "loss": 1.1357, + "step": 5974 + }, + { + "epoch": 0.15, + "learning_rate": 1.997678528858868e-06, + "loss": 0.7515, + "step": 5975 + }, + { + "epoch": 0.15, + "learning_rate": 1.997676644130589e-06, + "loss": 0.8828, + "step": 5976 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976747586384346e-06, + "loss": 1.0527, + "step": 5977 + }, + { + "epoch": 0.15, + "learning_rate": 1.997672872382407e-06, + "loss": 0.9688, + "step": 5978 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976709853625064e-06, + "loss": 0.9043, + "step": 5979 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976690975787352e-06, + "loss": 0.7217, + "step": 5980 + }, + { + "epoch": 0.15, + "learning_rate": 1.997667209031095e-06, + "loss": 1.0508, + "step": 5981 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976653197195867e-06, + "loss": 0.7021, + "step": 5982 + }, + { + "epoch": 0.15, + "learning_rate": 1.997663429644212e-06, + "loss": 1.0781, + "step": 5983 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976615388049722e-06, + "loss": 0.8633, + "step": 5984 + }, + { + "epoch": 0.15, + "learning_rate": 1.997659647201869e-06, + "loss": 0.9258, + "step": 5985 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976577548349032e-06, + "loss": 0.8369, + "step": 5986 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976558617040773e-06, + "loss": 0.8179, + "step": 5987 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976539678093916e-06, + "loss": 0.9912, + "step": 5988 + }, + { + "epoch": 0.15, + "learning_rate": 1.997652073150849e-06, + "loss": 0.9473, + "step": 5989 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976501777284496e-06, + "loss": 1.0928, + "step": 5990 + }, + { + "epoch": 0.15, + "learning_rate": 1.997648281542195e-06, + "loss": 0.7959, + "step": 5991 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976463845920873e-06, + "loss": 0.9805, + "step": 5992 + }, + { + "epoch": 0.15, + "learning_rate": 1.997644486878128e-06, + "loss": 0.7324, + "step": 5993 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976425884003176e-06, + "loss": 0.7036, + "step": 5994 + }, + { + "epoch": 0.15, + "learning_rate": 1.997640689158658e-06, + "loss": 0.7578, + "step": 5995 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976387891531513e-06, + "loss": 1.0557, + "step": 5996 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976368883837984e-06, + "loss": 1.083, + "step": 5997 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976349868506004e-06, + "loss": 0.752, + "step": 5998 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976330845535596e-06, + "loss": 0.9023, + "step": 5999 + }, + { + "epoch": 0.15, + "learning_rate": 1.997631181492677e-06, + "loss": 1.207, + "step": 6000 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976292776679536e-06, + "loss": 0.8984, + "step": 6001 + }, + { + "epoch": 0.15, + "learning_rate": 1.997627373079392e-06, + "loss": 1.1162, + "step": 6002 + }, + { + "epoch": 0.15, + "learning_rate": 1.997625467726992e-06, + "loss": 0.9453, + "step": 6003 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976235616107573e-06, + "loss": 0.8877, + "step": 6004 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976216547306876e-06, + "loss": 1.084, + "step": 6005 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976197470867848e-06, + "loss": 0.9902, + "step": 6006 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976178386790505e-06, + "loss": 1.0879, + "step": 6007 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976159295074856e-06, + "loss": 0.8984, + "step": 6008 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976140195720927e-06, + "loss": 0.9736, + "step": 6009 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976121088728726e-06, + "loss": 0.7651, + "step": 6010 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976101974098265e-06, + "loss": 0.8232, + "step": 6011 + }, + { + "epoch": 0.15, + "learning_rate": 1.997608285182956e-06, + "loss": 0.5034, + "step": 6012 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976063721922633e-06, + "loss": 1.1406, + "step": 6013 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976044584377488e-06, + "loss": 0.8652, + "step": 6014 + }, + { + "epoch": 0.15, + "learning_rate": 1.997602543919414e-06, + "loss": 1.0342, + "step": 6015 + }, + { + "epoch": 0.15, + "learning_rate": 1.9976006286372617e-06, + "loss": 1.1182, + "step": 6016 + }, + { + "epoch": 0.15, + "learning_rate": 1.9975987125912922e-06, + "loss": 1.0283, + "step": 6017 + }, + { + "epoch": 0.15, + "learning_rate": 1.9975967957815074e-06, + "loss": 0.6411, + "step": 6018 + }, + { + "epoch": 0.15, + "learning_rate": 1.997594878207908e-06, + "loss": 0.835, + "step": 6019 + }, + { + "epoch": 0.15, + "learning_rate": 1.9975929598704967e-06, + "loss": 0.6238, + "step": 6020 + }, + { + "epoch": 0.15, + "learning_rate": 1.997591040769274e-06, + "loss": 0.8291, + "step": 6021 + }, + { + "epoch": 0.15, + "learning_rate": 1.9975891209042416e-06, + "loss": 0.9355, + "step": 6022 + }, + { + "epoch": 0.15, + "learning_rate": 1.9975872002754012e-06, + "loss": 0.8369, + "step": 6023 + }, + { + "epoch": 0.15, + "learning_rate": 1.9975852788827543e-06, + "loss": 0.9453, + "step": 6024 + }, + { + "epoch": 0.15, + "learning_rate": 1.9975833567263023e-06, + "loss": 1.2227, + "step": 6025 + }, + { + "epoch": 0.15, + "learning_rate": 1.9975814338060463e-06, + "loss": 1.2393, + "step": 6026 + }, + { + "epoch": 0.15, + "learning_rate": 1.997579510121988e-06, + "loss": 1.1514, + "step": 6027 + }, + { + "epoch": 0.15, + "learning_rate": 1.9975775856741294e-06, + "loss": 1.0146, + "step": 6028 + }, + { + "epoch": 0.15, + "learning_rate": 1.997575660462471e-06, + "loss": 0.9941, + "step": 6029 + }, + { + "epoch": 0.15, + "learning_rate": 1.997573734487015e-06, + "loss": 0.9287, + "step": 6030 + }, + { + "epoch": 0.15, + "learning_rate": 1.997571807747763e-06, + "loss": 0.918, + "step": 6031 + }, + { + "epoch": 0.15, + "learning_rate": 1.9975698802447156e-06, + "loss": 1.0469, + "step": 6032 + }, + { + "epoch": 0.15, + "learning_rate": 1.997567951977875e-06, + "loss": 0.8262, + "step": 6033 + }, + { + "epoch": 0.15, + "learning_rate": 1.997566022947243e-06, + "loss": 0.7939, + "step": 6034 + }, + { + "epoch": 0.15, + "learning_rate": 1.99756409315282e-06, + "loss": 1.5156, + "step": 6035 + }, + { + "epoch": 0.15, + "learning_rate": 1.997562162594608e-06, + "loss": 0.7715, + "step": 6036 + }, + { + "epoch": 0.15, + "learning_rate": 1.9975602312726087e-06, + "loss": 0.917, + "step": 6037 + }, + { + "epoch": 0.15, + "learning_rate": 1.9975582991868235e-06, + "loss": 0.9785, + "step": 6038 + }, + { + "epoch": 0.15, + "learning_rate": 1.9975563663372534e-06, + "loss": 1.1123, + "step": 6039 + }, + { + "epoch": 0.15, + "learning_rate": 1.9975544327239006e-06, + "loss": 0.9365, + "step": 6040 + }, + { + "epoch": 0.15, + "learning_rate": 1.9975524983467664e-06, + "loss": 0.8003, + "step": 6041 + }, + { + "epoch": 0.15, + "learning_rate": 1.9975505632058515e-06, + "loss": 0.6558, + "step": 6042 + }, + { + "epoch": 0.15, + "learning_rate": 1.997548627301158e-06, + "loss": 0.9121, + "step": 6043 + }, + { + "epoch": 0.15, + "learning_rate": 1.997546690632688e-06, + "loss": 0.9473, + "step": 6044 + }, + { + "epoch": 0.15, + "learning_rate": 1.9975447532004423e-06, + "loss": 0.9512, + "step": 6045 + }, + { + "epoch": 0.15, + "learning_rate": 1.9975428150044223e-06, + "loss": 0.8652, + "step": 6046 + }, + { + "epoch": 0.15, + "learning_rate": 1.9975408760446293e-06, + "loss": 0.7344, + "step": 6047 + }, + { + "epoch": 0.16, + "learning_rate": 1.9975389363210654e-06, + "loss": 0.6387, + "step": 6048 + }, + { + "epoch": 0.16, + "learning_rate": 1.997536995833732e-06, + "loss": 0.9805, + "step": 6049 + }, + { + "epoch": 0.16, + "learning_rate": 1.9975350545826306e-06, + "loss": 0.9082, + "step": 6050 + }, + { + "epoch": 0.16, + "learning_rate": 1.9975331125677617e-06, + "loss": 0.7764, + "step": 6051 + }, + { + "epoch": 0.16, + "learning_rate": 1.997531169789128e-06, + "loss": 0.7139, + "step": 6052 + }, + { + "epoch": 0.16, + "learning_rate": 1.9975292262467304e-06, + "loss": 0.7407, + "step": 6053 + }, + { + "epoch": 0.16, + "learning_rate": 1.9975272819405705e-06, + "loss": 1.0215, + "step": 6054 + }, + { + "epoch": 0.16, + "learning_rate": 1.9975253368706503e-06, + "loss": 0.6831, + "step": 6055 + }, + { + "epoch": 0.16, + "learning_rate": 1.9975233910369706e-06, + "loss": 0.9609, + "step": 6056 + }, + { + "epoch": 0.16, + "learning_rate": 1.997521444439533e-06, + "loss": 0.8252, + "step": 6057 + }, + { + "epoch": 0.16, + "learning_rate": 1.997519497078339e-06, + "loss": 1.0186, + "step": 6058 + }, + { + "epoch": 0.16, + "learning_rate": 1.99751754895339e-06, + "loss": 0.8232, + "step": 6059 + }, + { + "epoch": 0.16, + "learning_rate": 1.997515600064688e-06, + "loss": 0.833, + "step": 6060 + }, + { + "epoch": 0.16, + "learning_rate": 1.997513650412234e-06, + "loss": 0.9502, + "step": 6061 + }, + { + "epoch": 0.16, + "learning_rate": 1.99751169999603e-06, + "loss": 0.8306, + "step": 6062 + }, + { + "epoch": 0.16, + "learning_rate": 1.997509748816077e-06, + "loss": 0.8267, + "step": 6063 + }, + { + "epoch": 0.16, + "learning_rate": 1.9975077968723764e-06, + "loss": 0.873, + "step": 6064 + }, + { + "epoch": 0.16, + "learning_rate": 1.99750584416493e-06, + "loss": 0.9688, + "step": 6065 + }, + { + "epoch": 0.16, + "learning_rate": 1.9975038906937397e-06, + "loss": 0.7876, + "step": 6066 + }, + { + "epoch": 0.16, + "learning_rate": 1.997501936458806e-06, + "loss": 1.0996, + "step": 6067 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974999814601313e-06, + "loss": 0.8438, + "step": 6068 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974980256977166e-06, + "loss": 0.9287, + "step": 6069 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974960691715635e-06, + "loss": 0.8984, + "step": 6070 + }, + { + "epoch": 0.16, + "learning_rate": 1.997494111881674e-06, + "loss": 0.9111, + "step": 6071 + }, + { + "epoch": 0.16, + "learning_rate": 1.997492153828048e-06, + "loss": 0.8896, + "step": 6072 + }, + { + "epoch": 0.16, + "learning_rate": 1.997490195010689e-06, + "loss": 0.8926, + "step": 6073 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974882354295975e-06, + "loss": 0.9497, + "step": 6074 + }, + { + "epoch": 0.16, + "learning_rate": 1.997486275084775e-06, + "loss": 1.0039, + "step": 6075 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974843139762234e-06, + "loss": 0.8687, + "step": 6076 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974823521039435e-06, + "loss": 0.8877, + "step": 6077 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974803894679377e-06, + "loss": 1.0664, + "step": 6078 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974784260682063e-06, + "loss": 1.0508, + "step": 6079 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974764619047523e-06, + "loss": 0.8857, + "step": 6080 + }, + { + "epoch": 0.16, + "learning_rate": 1.997474496977576e-06, + "loss": 1.1621, + "step": 6081 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974725312866795e-06, + "loss": 0.9443, + "step": 6082 + }, + { + "epoch": 0.16, + "learning_rate": 1.997470564832064e-06, + "loss": 0.812, + "step": 6083 + }, + { + "epoch": 0.16, + "learning_rate": 1.997468597613731e-06, + "loss": 0.9893, + "step": 6084 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974666296316828e-06, + "loss": 1.0479, + "step": 6085 + }, + { + "epoch": 0.16, + "learning_rate": 1.99746466088592e-06, + "loss": 0.8945, + "step": 6086 + }, + { + "epoch": 0.16, + "learning_rate": 1.997462691376444e-06, + "loss": 0.8916, + "step": 6087 + }, + { + "epoch": 0.16, + "learning_rate": 1.997460721103257e-06, + "loss": 0.7891, + "step": 6088 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974587500663604e-06, + "loss": 0.9385, + "step": 6089 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974567782657554e-06, + "loss": 1.002, + "step": 6090 + }, + { + "epoch": 0.16, + "learning_rate": 1.997454805701443e-06, + "loss": 0.8818, + "step": 6091 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974528323734263e-06, + "loss": 0.9033, + "step": 6092 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974508582817047e-06, + "loss": 0.8086, + "step": 6093 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974488834262817e-06, + "loss": 1.0479, + "step": 6094 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974469078071577e-06, + "loss": 0.9492, + "step": 6095 + }, + { + "epoch": 0.16, + "learning_rate": 1.997444931424335e-06, + "loss": 1.0381, + "step": 6096 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974429542778136e-06, + "loss": 0.6196, + "step": 6097 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974409763675968e-06, + "loss": 0.9922, + "step": 6098 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974389976936844e-06, + "loss": 0.9248, + "step": 6099 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974370182560796e-06, + "loss": 1.0166, + "step": 6100 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974350380547827e-06, + "loss": 1.0244, + "step": 6101 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974330570897957e-06, + "loss": 0.8926, + "step": 6102 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974310753611205e-06, + "loss": 0.9668, + "step": 6103 + }, + { + "epoch": 0.16, + "learning_rate": 1.997429092868758e-06, + "loss": 0.8682, + "step": 6104 + }, + { + "epoch": 0.16, + "learning_rate": 1.99742710961271e-06, + "loss": 0.9619, + "step": 6105 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974251255929774e-06, + "loss": 1.1807, + "step": 6106 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974231408095625e-06, + "loss": 0.8633, + "step": 6107 + }, + { + "epoch": 0.16, + "learning_rate": 1.997421155262467e-06, + "loss": 0.8838, + "step": 6108 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974191689516913e-06, + "loss": 0.9248, + "step": 6109 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974171818772382e-06, + "loss": 1.0469, + "step": 6110 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974151940391083e-06, + "loss": 0.8906, + "step": 6111 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974132054373037e-06, + "loss": 1.1123, + "step": 6112 + }, + { + "epoch": 0.16, + "learning_rate": 1.997411216071825e-06, + "loss": 0.8789, + "step": 6113 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974092259426753e-06, + "loss": 0.915, + "step": 6114 + }, + { + "epoch": 0.16, + "learning_rate": 1.997407235049855e-06, + "loss": 1.1377, + "step": 6115 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974052433933653e-06, + "loss": 0.9229, + "step": 6116 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974032509732085e-06, + "loss": 0.7988, + "step": 6117 + }, + { + "epoch": 0.16, + "learning_rate": 1.9974012577893864e-06, + "loss": 1.042, + "step": 6118 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973992638418996e-06, + "loss": 1.1035, + "step": 6119 + }, + { + "epoch": 0.16, + "learning_rate": 1.99739726913075e-06, + "loss": 0.9531, + "step": 6120 + }, + { + "epoch": 0.16, + "learning_rate": 1.997395273655939e-06, + "loss": 0.7847, + "step": 6121 + }, + { + "epoch": 0.16, + "learning_rate": 1.997393277417469e-06, + "loss": 1.0, + "step": 6122 + }, + { + "epoch": 0.16, + "learning_rate": 1.99739128041534e-06, + "loss": 0.8086, + "step": 6123 + }, + { + "epoch": 0.16, + "learning_rate": 1.997389282649555e-06, + "loss": 0.9512, + "step": 6124 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973872841201145e-06, + "loss": 1.0156, + "step": 6125 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973852848270206e-06, + "loss": 0.8906, + "step": 6126 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973832847702745e-06, + "loss": 0.7642, + "step": 6127 + }, + { + "epoch": 0.16, + "learning_rate": 1.997381283949878e-06, + "loss": 1.0859, + "step": 6128 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973792823658324e-06, + "loss": 0.8135, + "step": 6129 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973772800181395e-06, + "loss": 0.873, + "step": 6130 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973752769068003e-06, + "loss": 0.8418, + "step": 6131 + }, + { + "epoch": 0.16, + "learning_rate": 1.997373273031817e-06, + "loss": 1.0645, + "step": 6132 + }, + { + "epoch": 0.16, + "learning_rate": 1.997371268393191e-06, + "loss": 0.877, + "step": 6133 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973692629909237e-06, + "loss": 0.8857, + "step": 6134 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973672568250164e-06, + "loss": 1.0557, + "step": 6135 + }, + { + "epoch": 0.16, + "learning_rate": 1.997365249895471e-06, + "loss": 0.6982, + "step": 6136 + }, + { + "epoch": 0.16, + "learning_rate": 1.997363242202289e-06, + "loss": 0.8804, + "step": 6137 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973612337454716e-06, + "loss": 0.9961, + "step": 6138 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973592245250203e-06, + "loss": 0.9365, + "step": 6139 + }, + { + "epoch": 0.16, + "learning_rate": 1.997357214540937e-06, + "loss": 0.8926, + "step": 6140 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973552037932234e-06, + "loss": 0.8828, + "step": 6141 + }, + { + "epoch": 0.16, + "learning_rate": 1.997353192281881e-06, + "loss": 0.8301, + "step": 6142 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973511800069106e-06, + "loss": 0.8477, + "step": 6143 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973491669683143e-06, + "loss": 0.895, + "step": 6144 + }, + { + "epoch": 0.16, + "learning_rate": 1.997347153166094e-06, + "loss": 0.8037, + "step": 6145 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973451386002507e-06, + "loss": 1.3008, + "step": 6146 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973431232707856e-06, + "loss": 1.083, + "step": 6147 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973411071777016e-06, + "loss": 1.1016, + "step": 6148 + }, + { + "epoch": 0.16, + "learning_rate": 1.997339090320999e-06, + "loss": 0.9375, + "step": 6149 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973370727006793e-06, + "loss": 1.1846, + "step": 6150 + }, + { + "epoch": 0.16, + "learning_rate": 1.997335054316745e-06, + "loss": 0.9932, + "step": 6151 + }, + { + "epoch": 0.16, + "learning_rate": 1.997333035169197e-06, + "loss": 0.9473, + "step": 6152 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973310152580366e-06, + "loss": 0.9326, + "step": 6153 + }, + { + "epoch": 0.16, + "learning_rate": 1.997328994583266e-06, + "loss": 0.6665, + "step": 6154 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973269731448865e-06, + "loss": 0.9951, + "step": 6155 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973249509428997e-06, + "loss": 0.9639, + "step": 6156 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973229279773064e-06, + "loss": 0.7725, + "step": 6157 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973209042481094e-06, + "loss": 1.1455, + "step": 6158 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973188797553093e-06, + "loss": 1.0137, + "step": 6159 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973168544989086e-06, + "loss": 1.0, + "step": 6160 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973148284789077e-06, + "loss": 0.9482, + "step": 6161 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973128016953087e-06, + "loss": 1.0342, + "step": 6162 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973107741481133e-06, + "loss": 0.9854, + "step": 6163 + }, + { + "epoch": 0.16, + "learning_rate": 1.9973087458373228e-06, + "loss": 0.9062, + "step": 6164 + }, + { + "epoch": 0.16, + "learning_rate": 1.997306716762939e-06, + "loss": 0.9648, + "step": 6165 + }, + { + "epoch": 0.16, + "learning_rate": 1.997304686924963e-06, + "loss": 1.0986, + "step": 6166 + }, + { + "epoch": 0.16, + "learning_rate": 1.997302656323397e-06, + "loss": 0.9268, + "step": 6167 + }, + { + "epoch": 0.16, + "learning_rate": 1.997300624958242e-06, + "loss": 1.2861, + "step": 6168 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972985928294997e-06, + "loss": 0.9307, + "step": 6169 + }, + { + "epoch": 0.16, + "learning_rate": 1.997296559937172e-06, + "loss": 0.8818, + "step": 6170 + }, + { + "epoch": 0.16, + "learning_rate": 1.99729452628126e-06, + "loss": 0.8252, + "step": 6171 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972924918617657e-06, + "loss": 1.0098, + "step": 6172 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972904566786903e-06, + "loss": 0.7153, + "step": 6173 + }, + { + "epoch": 0.16, + "learning_rate": 1.997288420732035e-06, + "loss": 1.21, + "step": 6174 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972863840218023e-06, + "loss": 1.0703, + "step": 6175 + }, + { + "epoch": 0.16, + "learning_rate": 1.997284346547993e-06, + "loss": 0.918, + "step": 6176 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972823083106092e-06, + "loss": 0.9233, + "step": 6177 + }, + { + "epoch": 0.16, + "learning_rate": 1.997280269309652e-06, + "loss": 0.999, + "step": 6178 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972782295451233e-06, + "loss": 1.0225, + "step": 6179 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972761890170244e-06, + "loss": 0.875, + "step": 6180 + }, + { + "epoch": 0.16, + "learning_rate": 1.997274147725357e-06, + "loss": 0.832, + "step": 6181 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972721056701223e-06, + "loss": 1.0156, + "step": 6182 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972700628513227e-06, + "loss": 0.9941, + "step": 6183 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972680192689593e-06, + "loss": 1.1543, + "step": 6184 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972659749230333e-06, + "loss": 1.04, + "step": 6185 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972639298135466e-06, + "loss": 0.8623, + "step": 6186 + }, + { + "epoch": 0.16, + "learning_rate": 1.997261883940501e-06, + "loss": 1.0137, + "step": 6187 + }, + { + "epoch": 0.16, + "learning_rate": 1.997259837303898e-06, + "loss": 1.0996, + "step": 6188 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972577899037384e-06, + "loss": 1.0791, + "step": 6189 + }, + { + "epoch": 0.16, + "learning_rate": 1.997255741740025e-06, + "loss": 0.918, + "step": 6190 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972536928127583e-06, + "loss": 0.9785, + "step": 6191 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972516431219405e-06, + "loss": 0.9453, + "step": 6192 + }, + { + "epoch": 0.16, + "learning_rate": 1.997249592667573e-06, + "loss": 0.9268, + "step": 6193 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972475414496573e-06, + "loss": 1.0303, + "step": 6194 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972454894681948e-06, + "loss": 0.9648, + "step": 6195 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972434367231876e-06, + "loss": 0.9238, + "step": 6196 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972413832146365e-06, + "loss": 0.8821, + "step": 6197 + }, + { + "epoch": 0.16, + "learning_rate": 1.997239328942544e-06, + "loss": 0.7886, + "step": 6198 + }, + { + "epoch": 0.16, + "learning_rate": 1.997237273906911e-06, + "loss": 0.8242, + "step": 6199 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972352181077394e-06, + "loss": 1.0586, + "step": 6200 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972331615450306e-06, + "loss": 1.0195, + "step": 6201 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972311042187864e-06, + "loss": 1.0439, + "step": 6202 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972290461290076e-06, + "loss": 0.7812, + "step": 6203 + }, + { + "epoch": 0.16, + "learning_rate": 1.997226987275697e-06, + "loss": 1.0732, + "step": 6204 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972249276588553e-06, + "loss": 0.877, + "step": 6205 + }, + { + "epoch": 0.16, + "learning_rate": 1.997222867278484e-06, + "loss": 0.7075, + "step": 6206 + }, + { + "epoch": 0.16, + "learning_rate": 1.997220806134585e-06, + "loss": 0.9482, + "step": 6207 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972187442271606e-06, + "loss": 0.7344, + "step": 6208 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972166815562113e-06, + "loss": 0.96, + "step": 6209 + }, + { + "epoch": 0.16, + "learning_rate": 1.997214618121739e-06, + "loss": 1.0605, + "step": 6210 + }, + { + "epoch": 0.16, + "learning_rate": 1.997212553923745e-06, + "loss": 1.0645, + "step": 6211 + }, + { + "epoch": 0.16, + "learning_rate": 1.997210488962232e-06, + "loss": 0.894, + "step": 6212 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972084232372e-06, + "loss": 0.9043, + "step": 6213 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972063567486517e-06, + "loss": 1.1406, + "step": 6214 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972042894965882e-06, + "loss": 0.9023, + "step": 6215 + }, + { + "epoch": 0.16, + "learning_rate": 1.9972022214810114e-06, + "loss": 0.9233, + "step": 6216 + }, + { + "epoch": 0.16, + "learning_rate": 1.997200152701923e-06, + "loss": 0.9424, + "step": 6217 + }, + { + "epoch": 0.16, + "learning_rate": 1.997198083159324e-06, + "loss": 1.1523, + "step": 6218 + }, + { + "epoch": 0.16, + "learning_rate": 1.997196012853216e-06, + "loss": 1.0303, + "step": 6219 + }, + { + "epoch": 0.16, + "learning_rate": 1.997193941783601e-06, + "loss": 0.9385, + "step": 6220 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971918699504804e-06, + "loss": 0.8931, + "step": 6221 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971897973538563e-06, + "loss": 0.8115, + "step": 6222 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971877239937295e-06, + "loss": 0.707, + "step": 6223 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971856498701015e-06, + "loss": 0.7227, + "step": 6224 + }, + { + "epoch": 0.16, + "learning_rate": 1.997183574982975e-06, + "loss": 0.8389, + "step": 6225 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971814993323508e-06, + "loss": 0.9854, + "step": 6226 + }, + { + "epoch": 0.16, + "learning_rate": 1.99717942291823e-06, + "loss": 0.8657, + "step": 6227 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971773457406155e-06, + "loss": 1.1572, + "step": 6228 + }, + { + "epoch": 0.16, + "learning_rate": 1.997175267799508e-06, + "loss": 0.8472, + "step": 6229 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971731890949085e-06, + "loss": 0.9844, + "step": 6230 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971711096268203e-06, + "loss": 1.1318, + "step": 6231 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971690293952433e-06, + "loss": 0.9883, + "step": 6232 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971669484001804e-06, + "loss": 0.7383, + "step": 6233 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971648666416325e-06, + "loss": 1.0439, + "step": 6234 + }, + { + "epoch": 0.16, + "learning_rate": 1.997162784119601e-06, + "loss": 0.8867, + "step": 6235 + }, + { + "epoch": 0.16, + "learning_rate": 1.997160700834088e-06, + "loss": 0.9307, + "step": 6236 + }, + { + "epoch": 0.16, + "learning_rate": 1.997158616785095e-06, + "loss": 1.1113, + "step": 6237 + }, + { + "epoch": 0.16, + "learning_rate": 1.997156531972623e-06, + "loss": 0.9028, + "step": 6238 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971544463966747e-06, + "loss": 0.9814, + "step": 6239 + }, + { + "epoch": 0.16, + "learning_rate": 1.997152360057251e-06, + "loss": 0.8213, + "step": 6240 + }, + { + "epoch": 0.16, + "learning_rate": 1.997150272954353e-06, + "loss": 0.8311, + "step": 6241 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971481850879835e-06, + "loss": 0.8252, + "step": 6242 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971460964581434e-06, + "loss": 1.0547, + "step": 6243 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971440070648344e-06, + "loss": 1.0742, + "step": 6244 + }, + { + "epoch": 0.16, + "learning_rate": 1.997141916908058e-06, + "loss": 0.9111, + "step": 6245 + }, + { + "epoch": 0.16, + "learning_rate": 1.997139825987816e-06, + "loss": 0.877, + "step": 6246 + }, + { + "epoch": 0.16, + "learning_rate": 1.99713773430411e-06, + "loss": 1.2109, + "step": 6247 + }, + { + "epoch": 0.16, + "learning_rate": 1.997135641856941e-06, + "loss": 1.0264, + "step": 6248 + }, + { + "epoch": 0.16, + "learning_rate": 1.997133548646311e-06, + "loss": 0.8447, + "step": 6249 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971314546722226e-06, + "loss": 1.0107, + "step": 6250 + }, + { + "epoch": 0.16, + "learning_rate": 1.997129359934676e-06, + "loss": 0.8008, + "step": 6251 + }, + { + "epoch": 0.16, + "learning_rate": 1.997127264433673e-06, + "loss": 0.9072, + "step": 6252 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971251681692157e-06, + "loss": 1.1299, + "step": 6253 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971230711413057e-06, + "loss": 0.7422, + "step": 6254 + }, + { + "epoch": 0.16, + "learning_rate": 1.997120973349944e-06, + "loss": 0.9316, + "step": 6255 + }, + { + "epoch": 0.16, + "learning_rate": 1.997118874795133e-06, + "loss": 1.041, + "step": 6256 + }, + { + "epoch": 0.16, + "learning_rate": 1.997116775476874e-06, + "loss": 0.7578, + "step": 6257 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971146753951683e-06, + "loss": 1.0781, + "step": 6258 + }, + { + "epoch": 0.16, + "learning_rate": 1.997112574550018e-06, + "loss": 0.9863, + "step": 6259 + }, + { + "epoch": 0.16, + "learning_rate": 1.997110472941424e-06, + "loss": 0.9199, + "step": 6260 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971083705693882e-06, + "loss": 0.9238, + "step": 6261 + }, + { + "epoch": 0.16, + "learning_rate": 1.997106267433913e-06, + "loss": 0.8672, + "step": 6262 + }, + { + "epoch": 0.16, + "learning_rate": 1.997104163534999e-06, + "loss": 0.8906, + "step": 6263 + }, + { + "epoch": 0.16, + "learning_rate": 1.9971020588726485e-06, + "loss": 0.8848, + "step": 6264 + }, + { + "epoch": 0.16, + "learning_rate": 1.997099953446863e-06, + "loss": 1.0127, + "step": 6265 + }, + { + "epoch": 0.16, + "learning_rate": 1.997097847257643e-06, + "loss": 0.9326, + "step": 6266 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970957403049917e-06, + "loss": 0.7383, + "step": 6267 + }, + { + "epoch": 0.16, + "learning_rate": 1.99709363258891e-06, + "loss": 1.0166, + "step": 6268 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970915241093995e-06, + "loss": 0.8174, + "step": 6269 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970894148664616e-06, + "loss": 0.6146, + "step": 6270 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970873048600984e-06, + "loss": 0.9229, + "step": 6271 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970851940903117e-06, + "loss": 0.8159, + "step": 6272 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970830825571018e-06, + "loss": 1.0537, + "step": 6273 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970809702604716e-06, + "loss": 0.8779, + "step": 6274 + }, + { + "epoch": 0.16, + "learning_rate": 1.997078857200423e-06, + "loss": 1.1484, + "step": 6275 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970767433769563e-06, + "loss": 0.9824, + "step": 6276 + }, + { + "epoch": 0.16, + "learning_rate": 1.997074628790074e-06, + "loss": 0.8208, + "step": 6277 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970725134397774e-06, + "loss": 1.0469, + "step": 6278 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970703973260683e-06, + "loss": 0.6956, + "step": 6279 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970682804489483e-06, + "loss": 0.8428, + "step": 6280 + }, + { + "epoch": 0.16, + "learning_rate": 1.997066162808419e-06, + "loss": 0.8516, + "step": 6281 + }, + { + "epoch": 0.16, + "learning_rate": 1.997064044404482e-06, + "loss": 0.9736, + "step": 6282 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970619252371385e-06, + "loss": 0.8154, + "step": 6283 + }, + { + "epoch": 0.16, + "learning_rate": 1.997059805306391e-06, + "loss": 0.875, + "step": 6284 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970576846122402e-06, + "loss": 1.001, + "step": 6285 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970555631546887e-06, + "loss": 0.7803, + "step": 6286 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970534409337373e-06, + "loss": 0.8389, + "step": 6287 + }, + { + "epoch": 0.16, + "learning_rate": 1.997051317949388e-06, + "loss": 0.8105, + "step": 6288 + }, + { + "epoch": 0.16, + "learning_rate": 1.997049194201642e-06, + "loss": 0.8633, + "step": 6289 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970470696905017e-06, + "loss": 0.9004, + "step": 6290 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970449444159682e-06, + "loss": 1.0557, + "step": 6291 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970428183780433e-06, + "loss": 0.8716, + "step": 6292 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970406915767282e-06, + "loss": 0.9473, + "step": 6293 + }, + { + "epoch": 0.16, + "learning_rate": 1.997038564012025e-06, + "loss": 1.0986, + "step": 6294 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970364356839357e-06, + "loss": 1.0342, + "step": 6295 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970343065924613e-06, + "loss": 1.0957, + "step": 6296 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970321767376034e-06, + "loss": 1.0996, + "step": 6297 + }, + { + "epoch": 0.16, + "learning_rate": 1.997030046119364e-06, + "loss": 0.7466, + "step": 6298 + }, + { + "epoch": 0.16, + "learning_rate": 1.997027914737744e-06, + "loss": 0.8574, + "step": 6299 + }, + { + "epoch": 0.16, + "learning_rate": 1.997025782592746e-06, + "loss": 0.7256, + "step": 6300 + }, + { + "epoch": 0.16, + "learning_rate": 1.997023649684371e-06, + "loss": 0.8271, + "step": 6301 + }, + { + "epoch": 0.16, + "learning_rate": 1.997021516012621e-06, + "loss": 0.9551, + "step": 6302 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970193815774977e-06, + "loss": 1.0371, + "step": 6303 + }, + { + "epoch": 0.16, + "learning_rate": 1.997017246379002e-06, + "loss": 0.9912, + "step": 6304 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970151104171363e-06, + "loss": 0.9609, + "step": 6305 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970129736919023e-06, + "loss": 1.0068, + "step": 6306 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970108362033006e-06, + "loss": 0.7581, + "step": 6307 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970086979513343e-06, + "loss": 0.835, + "step": 6308 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970065589360036e-06, + "loss": 0.9326, + "step": 6309 + }, + { + "epoch": 0.16, + "learning_rate": 1.997004419157311e-06, + "loss": 1.0117, + "step": 6310 + }, + { + "epoch": 0.16, + "learning_rate": 1.997002278615258e-06, + "loss": 0.7842, + "step": 6311 + }, + { + "epoch": 0.16, + "learning_rate": 1.9970001373098464e-06, + "loss": 0.8525, + "step": 6312 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969979952410776e-06, + "loss": 0.9297, + "step": 6313 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969958524089533e-06, + "loss": 0.8848, + "step": 6314 + }, + { + "epoch": 0.16, + "learning_rate": 1.996993708813475e-06, + "loss": 0.9424, + "step": 6315 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969915644546445e-06, + "loss": 0.9619, + "step": 6316 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969894193324633e-06, + "loss": 0.7539, + "step": 6317 + }, + { + "epoch": 0.16, + "learning_rate": 1.996987273446933e-06, + "loss": 0.874, + "step": 6318 + }, + { + "epoch": 0.16, + "learning_rate": 1.996985126798056e-06, + "loss": 0.9834, + "step": 6319 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969829793858327e-06, + "loss": 0.7891, + "step": 6320 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969808312102655e-06, + "loss": 0.875, + "step": 6321 + }, + { + "epoch": 0.16, + "learning_rate": 1.996978682271356e-06, + "loss": 0.8232, + "step": 6322 + }, + { + "epoch": 0.16, + "learning_rate": 1.996976532569106e-06, + "loss": 0.9346, + "step": 6323 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969743821035165e-06, + "loss": 1.0186, + "step": 6324 + }, + { + "epoch": 0.16, + "learning_rate": 1.99697223087459e-06, + "loss": 0.877, + "step": 6325 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969700788823273e-06, + "loss": 0.9902, + "step": 6326 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969679261267305e-06, + "loss": 1.0928, + "step": 6327 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969657726078017e-06, + "loss": 1.041, + "step": 6328 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969636183255415e-06, + "loss": 0.7871, + "step": 6329 + }, + { + "epoch": 0.16, + "learning_rate": 1.996961463279952e-06, + "loss": 0.9082, + "step": 6330 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969593074710354e-06, + "loss": 0.9932, + "step": 6331 + }, + { + "epoch": 0.16, + "learning_rate": 1.996957150898793e-06, + "loss": 0.9141, + "step": 6332 + }, + { + "epoch": 0.16, + "learning_rate": 1.996954993563226e-06, + "loss": 1.0479, + "step": 6333 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969528354643365e-06, + "loss": 1.0488, + "step": 6334 + }, + { + "epoch": 0.16, + "learning_rate": 1.996950676602126e-06, + "loss": 0.8613, + "step": 6335 + }, + { + "epoch": 0.16, + "learning_rate": 1.996948516976596e-06, + "loss": 0.7979, + "step": 6336 + }, + { + "epoch": 0.16, + "learning_rate": 1.996946356587749e-06, + "loss": 0.9268, + "step": 6337 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969441954355856e-06, + "loss": 1.0605, + "step": 6338 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969420335201077e-06, + "loss": 0.9688, + "step": 6339 + }, + { + "epoch": 0.16, + "learning_rate": 1.996939870841317e-06, + "loss": 1.0615, + "step": 6340 + }, + { + "epoch": 0.16, + "learning_rate": 1.996937707399216e-06, + "loss": 0.8652, + "step": 6341 + }, + { + "epoch": 0.16, + "learning_rate": 1.996935543193805e-06, + "loss": 0.915, + "step": 6342 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969333782250864e-06, + "loss": 1.1572, + "step": 6343 + }, + { + "epoch": 0.16, + "learning_rate": 1.996931212493062e-06, + "loss": 0.8389, + "step": 6344 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969290459977333e-06, + "loss": 0.7471, + "step": 6345 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969268787391017e-06, + "loss": 1.0117, + "step": 6346 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969247107171688e-06, + "loss": 0.8779, + "step": 6347 + }, + { + "epoch": 0.16, + "learning_rate": 1.996922541931937e-06, + "loss": 0.8154, + "step": 6348 + }, + { + "epoch": 0.16, + "learning_rate": 1.996920372383407e-06, + "loss": 0.9561, + "step": 6349 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969182020715807e-06, + "loss": 1.124, + "step": 6350 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969160309964604e-06, + "loss": 1.0205, + "step": 6351 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969138591580473e-06, + "loss": 0.9395, + "step": 6352 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969116865563432e-06, + "loss": 0.8706, + "step": 6353 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969095131913494e-06, + "loss": 0.9092, + "step": 6354 + }, + { + "epoch": 0.16, + "learning_rate": 1.996907339063068e-06, + "loss": 0.8008, + "step": 6355 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969051641715004e-06, + "loss": 0.9756, + "step": 6356 + }, + { + "epoch": 0.16, + "learning_rate": 1.9969029885166483e-06, + "loss": 0.8838, + "step": 6357 + }, + { + "epoch": 0.16, + "learning_rate": 1.996900812098513e-06, + "loss": 0.9741, + "step": 6358 + }, + { + "epoch": 0.16, + "learning_rate": 1.996898634917097e-06, + "loss": 1.1738, + "step": 6359 + }, + { + "epoch": 0.16, + "learning_rate": 1.996896456972402e-06, + "loss": 0.7871, + "step": 6360 + }, + { + "epoch": 0.16, + "learning_rate": 1.996894278264429e-06, + "loss": 0.8726, + "step": 6361 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968920987931797e-06, + "loss": 0.8018, + "step": 6362 + }, + { + "epoch": 0.16, + "learning_rate": 1.996889918558656e-06, + "loss": 1.0713, + "step": 6363 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968877375608597e-06, + "loss": 1.0811, + "step": 6364 + }, + { + "epoch": 0.16, + "learning_rate": 1.996885555799792e-06, + "loss": 0.9482, + "step": 6365 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968833732754547e-06, + "loss": 1.0879, + "step": 6366 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968811899878502e-06, + "loss": 0.9551, + "step": 6367 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968790059369792e-06, + "loss": 0.9316, + "step": 6368 + }, + { + "epoch": 0.16, + "learning_rate": 1.996876821122844e-06, + "loss": 0.8623, + "step": 6369 + }, + { + "epoch": 0.16, + "learning_rate": 1.996874635545446e-06, + "loss": 0.8101, + "step": 6370 + }, + { + "epoch": 0.16, + "learning_rate": 1.996872449204787e-06, + "loss": 1.1143, + "step": 6371 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968702621008683e-06, + "loss": 0.645, + "step": 6372 + }, + { + "epoch": 0.16, + "learning_rate": 1.996868074233692e-06, + "loss": 0.8955, + "step": 6373 + }, + { + "epoch": 0.16, + "learning_rate": 1.99686588560326e-06, + "loss": 1.1309, + "step": 6374 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968636962095732e-06, + "loss": 0.8711, + "step": 6375 + }, + { + "epoch": 0.16, + "learning_rate": 1.996861506052634e-06, + "loss": 0.9092, + "step": 6376 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968593151324436e-06, + "loss": 1.0264, + "step": 6377 + }, + { + "epoch": 0.16, + "learning_rate": 1.996857123449004e-06, + "loss": 0.916, + "step": 6378 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968549310023166e-06, + "loss": 0.9902, + "step": 6379 + }, + { + "epoch": 0.16, + "learning_rate": 1.996852737792383e-06, + "loss": 1.123, + "step": 6380 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968505438192055e-06, + "loss": 0.8965, + "step": 6381 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968483490827852e-06, + "loss": 0.8457, + "step": 6382 + }, + { + "epoch": 0.16, + "learning_rate": 1.996846153583124e-06, + "loss": 0.8975, + "step": 6383 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968439573202235e-06, + "loss": 1.0332, + "step": 6384 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968417602940856e-06, + "loss": 0.8154, + "step": 6385 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968395625047116e-06, + "loss": 0.9316, + "step": 6386 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968373639521034e-06, + "loss": 1.0498, + "step": 6387 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968351646362625e-06, + "loss": 1.0127, + "step": 6388 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968329645571912e-06, + "loss": 0.8799, + "step": 6389 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968307637148903e-06, + "loss": 0.8184, + "step": 6390 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968285621093623e-06, + "loss": 0.9658, + "step": 6391 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968263597406084e-06, + "loss": 0.876, + "step": 6392 + }, + { + "epoch": 0.16, + "learning_rate": 1.99682415660863e-06, + "loss": 0.8955, + "step": 6393 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968219527134297e-06, + "loss": 0.918, + "step": 6394 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968197480550086e-06, + "loss": 0.9355, + "step": 6395 + }, + { + "epoch": 0.16, + "learning_rate": 1.996817542633368e-06, + "loss": 0.7949, + "step": 6396 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968153364485105e-06, + "loss": 0.9604, + "step": 6397 + }, + { + "epoch": 0.16, + "learning_rate": 1.996813129500437e-06, + "loss": 1.1455, + "step": 6398 + }, + { + "epoch": 0.16, + "learning_rate": 1.99681092178915e-06, + "loss": 0.9883, + "step": 6399 + }, + { + "epoch": 0.16, + "learning_rate": 1.99680871331465e-06, + "loss": 1.0557, + "step": 6400 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968065040769398e-06, + "loss": 1.1699, + "step": 6401 + }, + { + "epoch": 0.16, + "learning_rate": 1.996804294076021e-06, + "loss": 1.043, + "step": 6402 + }, + { + "epoch": 0.16, + "learning_rate": 1.9968020833118946e-06, + "loss": 0.8438, + "step": 6403 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967998717845627e-06, + "loss": 0.9814, + "step": 6404 + }, + { + "epoch": 0.16, + "learning_rate": 1.996797659494027e-06, + "loss": 1.1953, + "step": 6405 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967954464402893e-06, + "loss": 0.9336, + "step": 6406 + }, + { + "epoch": 0.16, + "learning_rate": 1.996793232623351e-06, + "loss": 0.959, + "step": 6407 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967910180432143e-06, + "loss": 0.8877, + "step": 6408 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967888026998804e-06, + "loss": 0.998, + "step": 6409 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967865865933507e-06, + "loss": 0.8799, + "step": 6410 + }, + { + "epoch": 0.16, + "learning_rate": 1.996784369723628e-06, + "loss": 0.9597, + "step": 6411 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967821520907127e-06, + "loss": 0.8857, + "step": 6412 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967799336946073e-06, + "loss": 0.8716, + "step": 6413 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967777145353137e-06, + "loss": 0.873, + "step": 6414 + }, + { + "epoch": 0.16, + "learning_rate": 1.996775494612833e-06, + "loss": 0.9395, + "step": 6415 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967732739271674e-06, + "loss": 0.8901, + "step": 6416 + }, + { + "epoch": 0.16, + "learning_rate": 1.996771052478318e-06, + "loss": 0.9326, + "step": 6417 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967688302662867e-06, + "loss": 0.9912, + "step": 6418 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967666072910754e-06, + "loss": 0.8301, + "step": 6419 + }, + { + "epoch": 0.16, + "learning_rate": 1.996764383552686e-06, + "loss": 1.0166, + "step": 6420 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967621590511203e-06, + "loss": 1.1211, + "step": 6421 + }, + { + "epoch": 0.16, + "learning_rate": 1.996759933786379e-06, + "loss": 0.896, + "step": 6422 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967577077584647e-06, + "loss": 0.6357, + "step": 6423 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967554809673785e-06, + "loss": 0.959, + "step": 6424 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967532534131228e-06, + "loss": 0.75, + "step": 6425 + }, + { + "epoch": 0.16, + "learning_rate": 1.996751025095699e-06, + "loss": 0.8955, + "step": 6426 + }, + { + "epoch": 0.16, + "learning_rate": 1.996748796015109e-06, + "loss": 0.8506, + "step": 6427 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967465661713535e-06, + "loss": 0.8428, + "step": 6428 + }, + { + "epoch": 0.16, + "learning_rate": 1.996744335564436e-06, + "loss": 0.8545, + "step": 6429 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967421041943565e-06, + "loss": 0.8237, + "step": 6430 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967398720611173e-06, + "loss": 0.7686, + "step": 6431 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967376391647205e-06, + "loss": 0.8018, + "step": 6432 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967354055051678e-06, + "loss": 1.1006, + "step": 6433 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967331710824604e-06, + "loss": 0.7974, + "step": 6434 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967309358966e-06, + "loss": 0.7788, + "step": 6435 + }, + { + "epoch": 0.16, + "learning_rate": 1.9967286999475888e-06, + "loss": 1.001, + "step": 6436 + }, + { + "epoch": 0.16, + "learning_rate": 1.996726463235428e-06, + "loss": 1.0625, + "step": 6437 + }, + { + "epoch": 0.17, + "learning_rate": 1.9967242257601197e-06, + "loss": 0.8262, + "step": 6438 + }, + { + "epoch": 0.17, + "learning_rate": 1.9967219875216657e-06, + "loss": 0.6118, + "step": 6439 + }, + { + "epoch": 0.17, + "learning_rate": 1.996719748520067e-06, + "loss": 1.0381, + "step": 6440 + }, + { + "epoch": 0.17, + "learning_rate": 1.9967175087553267e-06, + "loss": 0.9844, + "step": 6441 + }, + { + "epoch": 0.17, + "learning_rate": 1.996715268227445e-06, + "loss": 0.9404, + "step": 6442 + }, + { + "epoch": 0.17, + "learning_rate": 1.9967130269364245e-06, + "loss": 0.6919, + "step": 6443 + }, + { + "epoch": 0.17, + "learning_rate": 1.9967107848822666e-06, + "loss": 1.0918, + "step": 6444 + }, + { + "epoch": 0.17, + "learning_rate": 1.9967085420649727e-06, + "loss": 0.7017, + "step": 6445 + }, + { + "epoch": 0.17, + "learning_rate": 1.9967062984845453e-06, + "loss": 1.125, + "step": 6446 + }, + { + "epoch": 0.17, + "learning_rate": 1.9967040541409856e-06, + "loss": 0.7422, + "step": 6447 + }, + { + "epoch": 0.17, + "learning_rate": 1.9967018090342955e-06, + "loss": 0.8975, + "step": 6448 + }, + { + "epoch": 0.17, + "learning_rate": 1.996699563164477e-06, + "loss": 0.9033, + "step": 6449 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966973165315304e-06, + "loss": 0.9717, + "step": 6450 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966950691354593e-06, + "loss": 0.9268, + "step": 6451 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966928209762644e-06, + "loss": 1.1016, + "step": 6452 + }, + { + "epoch": 0.17, + "learning_rate": 1.996690572053948e-06, + "loss": 0.8779, + "step": 6453 + }, + { + "epoch": 0.17, + "learning_rate": 1.996688322368511e-06, + "loss": 1.0664, + "step": 6454 + }, + { + "epoch": 0.17, + "learning_rate": 1.996686071919956e-06, + "loss": 0.9004, + "step": 6455 + }, + { + "epoch": 0.17, + "learning_rate": 1.996683820708284e-06, + "loss": 0.8984, + "step": 6456 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966815687334974e-06, + "loss": 0.9014, + "step": 6457 + }, + { + "epoch": 0.17, + "learning_rate": 1.996679315995597e-06, + "loss": 0.8501, + "step": 6458 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966770624945854e-06, + "loss": 0.96, + "step": 6459 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966748082304637e-06, + "loss": 0.9805, + "step": 6460 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966725532032343e-06, + "loss": 0.9482, + "step": 6461 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966702974128985e-06, + "loss": 1.0703, + "step": 6462 + }, + { + "epoch": 0.17, + "learning_rate": 1.996668040859458e-06, + "loss": 1.0303, + "step": 6463 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966657835429146e-06, + "loss": 0.9668, + "step": 6464 + }, + { + "epoch": 0.17, + "learning_rate": 1.99666352546327e-06, + "loss": 0.915, + "step": 6465 + }, + { + "epoch": 0.17, + "learning_rate": 1.996661266620526e-06, + "loss": 0.8291, + "step": 6466 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966590070146845e-06, + "loss": 0.8877, + "step": 6467 + }, + { + "epoch": 0.17, + "learning_rate": 1.996656746645747e-06, + "loss": 0.8838, + "step": 6468 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966544855137147e-06, + "loss": 1.1133, + "step": 6469 + }, + { + "epoch": 0.17, + "learning_rate": 1.99665222361859e-06, + "loss": 1.0146, + "step": 6470 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966499609603753e-06, + "loss": 0.9326, + "step": 6471 + }, + { + "epoch": 0.17, + "learning_rate": 1.996647697539071e-06, + "loss": 0.9346, + "step": 6472 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966454333546794e-06, + "loss": 0.9844, + "step": 6473 + }, + { + "epoch": 0.17, + "learning_rate": 1.996643168407202e-06, + "loss": 0.9541, + "step": 6474 + }, + { + "epoch": 0.17, + "learning_rate": 1.996640902696641e-06, + "loss": 0.9165, + "step": 6475 + }, + { + "epoch": 0.17, + "learning_rate": 1.996638636222998e-06, + "loss": 0.8203, + "step": 6476 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966363689862744e-06, + "loss": 0.957, + "step": 6477 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966341009864725e-06, + "loss": 0.8901, + "step": 6478 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966318322235933e-06, + "loss": 0.833, + "step": 6479 + }, + { + "epoch": 0.17, + "learning_rate": 1.996629562697639e-06, + "loss": 1.0762, + "step": 6480 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966272924086116e-06, + "loss": 0.9014, + "step": 6481 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966250213565125e-06, + "loss": 1.1367, + "step": 6482 + }, + { + "epoch": 0.17, + "learning_rate": 1.996622749541343e-06, + "loss": 0.6929, + "step": 6483 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966204769631055e-06, + "loss": 0.8105, + "step": 6484 + }, + { + "epoch": 0.17, + "learning_rate": 1.996618203621802e-06, + "loss": 0.7129, + "step": 6485 + }, + { + "epoch": 0.17, + "learning_rate": 1.996615929517433e-06, + "loss": 1.1006, + "step": 6486 + }, + { + "epoch": 0.17, + "learning_rate": 1.996613654650001e-06, + "loss": 1.1992, + "step": 6487 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966113790195084e-06, + "loss": 1.0059, + "step": 6488 + }, + { + "epoch": 0.17, + "learning_rate": 1.996609102625956e-06, + "loss": 0.9121, + "step": 6489 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966068254693454e-06, + "loss": 0.832, + "step": 6490 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966045475496792e-06, + "loss": 0.9077, + "step": 6491 + }, + { + "epoch": 0.17, + "learning_rate": 1.9966022688669592e-06, + "loss": 0.791, + "step": 6492 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965999894211862e-06, + "loss": 0.8594, + "step": 6493 + }, + { + "epoch": 0.17, + "learning_rate": 1.996597709212362e-06, + "loss": 0.9971, + "step": 6494 + }, + { + "epoch": 0.17, + "learning_rate": 1.996595428240489e-06, + "loss": 1.0986, + "step": 6495 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965931465055694e-06, + "loss": 0.9072, + "step": 6496 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965908640076034e-06, + "loss": 0.8477, + "step": 6497 + }, + { + "epoch": 0.17, + "learning_rate": 1.996588580746594e-06, + "loss": 0.8984, + "step": 6498 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965862967225423e-06, + "loss": 0.6973, + "step": 6499 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965840119354503e-06, + "loss": 1.0225, + "step": 6500 + }, + { + "epoch": 0.17, + "learning_rate": 1.99658172638532e-06, + "loss": 0.9058, + "step": 6501 + }, + { + "epoch": 0.17, + "learning_rate": 1.996579440072153e-06, + "loss": 0.8584, + "step": 6502 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965771529959504e-06, + "loss": 0.6104, + "step": 6503 + }, + { + "epoch": 0.17, + "learning_rate": 1.996574865156715e-06, + "loss": 0.8447, + "step": 6504 + }, + { + "epoch": 0.17, + "learning_rate": 1.996572576554448e-06, + "loss": 0.6143, + "step": 6505 + }, + { + "epoch": 0.17, + "learning_rate": 1.996570287189151e-06, + "loss": 0.9668, + "step": 6506 + }, + { + "epoch": 0.17, + "learning_rate": 1.996567997060826e-06, + "loss": 0.7373, + "step": 6507 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965657061694748e-06, + "loss": 0.8442, + "step": 6508 + }, + { + "epoch": 0.17, + "learning_rate": 1.996563414515099e-06, + "loss": 0.6055, + "step": 6509 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965611220977005e-06, + "loss": 0.9355, + "step": 6510 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965588289172806e-06, + "loss": 1.0137, + "step": 6511 + }, + { + "epoch": 0.17, + "learning_rate": 1.996556534973842e-06, + "loss": 1.0029, + "step": 6512 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965542402673855e-06, + "loss": 0.8228, + "step": 6513 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965519447979133e-06, + "loss": 0.7617, + "step": 6514 + }, + { + "epoch": 0.17, + "learning_rate": 1.996549648565427e-06, + "loss": 0.9053, + "step": 6515 + }, + { + "epoch": 0.17, + "learning_rate": 1.996547351569929e-06, + "loss": 0.8662, + "step": 6516 + }, + { + "epoch": 0.17, + "learning_rate": 1.99654505381142e-06, + "loss": 1.1113, + "step": 6517 + }, + { + "epoch": 0.17, + "learning_rate": 1.996542755289902e-06, + "loss": 0.959, + "step": 6518 + }, + { + "epoch": 0.17, + "learning_rate": 1.996540456005378e-06, + "loss": 0.9854, + "step": 6519 + }, + { + "epoch": 0.17, + "learning_rate": 1.996538155957848e-06, + "loss": 0.8896, + "step": 6520 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965358551473147e-06, + "loss": 1.0771, + "step": 6521 + }, + { + "epoch": 0.17, + "learning_rate": 1.99653355357378e-06, + "loss": 1.042, + "step": 6522 + }, + { + "epoch": 0.17, + "learning_rate": 1.996531251237245e-06, + "loss": 0.8857, + "step": 6523 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965289481377117e-06, + "loss": 1.0039, + "step": 6524 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965266442751827e-06, + "loss": 0.8174, + "step": 6525 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965243396496583e-06, + "loss": 0.8916, + "step": 6526 + }, + { + "epoch": 0.17, + "learning_rate": 1.996522034261142e-06, + "loss": 0.8667, + "step": 6527 + }, + { + "epoch": 0.17, + "learning_rate": 1.996519728109634e-06, + "loss": 0.9131, + "step": 6528 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965174211951363e-06, + "loss": 0.6948, + "step": 6529 + }, + { + "epoch": 0.17, + "learning_rate": 1.996515113517652e-06, + "loss": 0.8213, + "step": 6530 + }, + { + "epoch": 0.17, + "learning_rate": 1.996512805077181e-06, + "loss": 1.1201, + "step": 6531 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965104958737263e-06, + "loss": 1.0059, + "step": 6532 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965081859072894e-06, + "loss": 0.957, + "step": 6533 + }, + { + "epoch": 0.17, + "learning_rate": 1.996505875177872e-06, + "loss": 1.0039, + "step": 6534 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965035636854756e-06, + "loss": 1.0137, + "step": 6535 + }, + { + "epoch": 0.17, + "learning_rate": 1.9965012514301024e-06, + "loss": 1.0156, + "step": 6536 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964989384117538e-06, + "loss": 0.7607, + "step": 6537 + }, + { + "epoch": 0.17, + "learning_rate": 1.996496624630432e-06, + "loss": 0.8857, + "step": 6538 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964943100861388e-06, + "loss": 0.7485, + "step": 6539 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964919947788754e-06, + "loss": 1.1875, + "step": 6540 + }, + { + "epoch": 0.17, + "learning_rate": 1.996489678708644e-06, + "loss": 1.0137, + "step": 6541 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964873618754467e-06, + "loss": 0.9453, + "step": 6542 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964850442792844e-06, + "loss": 1.0039, + "step": 6543 + }, + { + "epoch": 0.17, + "learning_rate": 1.996482725920159e-06, + "loss": 0.8579, + "step": 6544 + }, + { + "epoch": 0.17, + "learning_rate": 1.996480406798073e-06, + "loss": 1.0586, + "step": 6545 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964780869130276e-06, + "loss": 0.8389, + "step": 6546 + }, + { + "epoch": 0.17, + "learning_rate": 1.996475766265025e-06, + "loss": 1.3164, + "step": 6547 + }, + { + "epoch": 0.17, + "learning_rate": 1.996473444854067e-06, + "loss": 0.8145, + "step": 6548 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964711226801547e-06, + "loss": 0.8389, + "step": 6549 + }, + { + "epoch": 0.17, + "learning_rate": 1.99646879974329e-06, + "loss": 1.0762, + "step": 6550 + }, + { + "epoch": 0.17, + "learning_rate": 1.996466476043475e-06, + "loss": 1.0264, + "step": 6551 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964641515807118e-06, + "loss": 0.9404, + "step": 6552 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964618263550018e-06, + "loss": 0.7397, + "step": 6553 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964595003663467e-06, + "loss": 0.9473, + "step": 6554 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964571736147484e-06, + "loss": 0.873, + "step": 6555 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964548461002084e-06, + "loss": 0.9961, + "step": 6556 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964525178227293e-06, + "loss": 0.9014, + "step": 6557 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964501887823116e-06, + "loss": 0.9873, + "step": 6558 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964478589789586e-06, + "loss": 0.8423, + "step": 6559 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964455284126707e-06, + "loss": 0.9336, + "step": 6560 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964431970834505e-06, + "loss": 0.9727, + "step": 6561 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964408649912997e-06, + "loss": 1.1426, + "step": 6562 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964385321362195e-06, + "loss": 0.7136, + "step": 6563 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964361985182125e-06, + "loss": 1.0742, + "step": 6564 + }, + { + "epoch": 0.17, + "learning_rate": 1.99643386413728e-06, + "loss": 0.8398, + "step": 6565 + }, + { + "epoch": 0.17, + "learning_rate": 1.996431528993424e-06, + "loss": 1.0449, + "step": 6566 + }, + { + "epoch": 0.17, + "learning_rate": 1.996429193086646e-06, + "loss": 0.8555, + "step": 6567 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964268564169482e-06, + "loss": 0.9033, + "step": 6568 + }, + { + "epoch": 0.17, + "learning_rate": 1.996424518984332e-06, + "loss": 1.1035, + "step": 6569 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964221807888e-06, + "loss": 0.9482, + "step": 6570 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964198418303523e-06, + "loss": 1.0615, + "step": 6571 + }, + { + "epoch": 0.17, + "learning_rate": 1.996417502108992e-06, + "loss": 1.0762, + "step": 6572 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964151616247214e-06, + "loss": 0.8154, + "step": 6573 + }, + { + "epoch": 0.17, + "learning_rate": 1.996412820377541e-06, + "loss": 0.7856, + "step": 6574 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964104783674532e-06, + "loss": 0.8926, + "step": 6575 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964081355944596e-06, + "loss": 1.1016, + "step": 6576 + }, + { + "epoch": 0.17, + "learning_rate": 1.996405792058562e-06, + "loss": 0.9014, + "step": 6577 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964034477597623e-06, + "loss": 0.8018, + "step": 6578 + }, + { + "epoch": 0.17, + "learning_rate": 1.9964011026980628e-06, + "loss": 0.9951, + "step": 6579 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963987568734644e-06, + "loss": 0.959, + "step": 6580 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963964102859693e-06, + "loss": 0.9346, + "step": 6581 + }, + { + "epoch": 0.17, + "learning_rate": 1.996394062935579e-06, + "loss": 0.9424, + "step": 6582 + }, + { + "epoch": 0.17, + "learning_rate": 1.996391714822296e-06, + "loss": 0.8545, + "step": 6583 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963893659461217e-06, + "loss": 0.937, + "step": 6584 + }, + { + "epoch": 0.17, + "learning_rate": 1.996387016307058e-06, + "loss": 0.9502, + "step": 6585 + }, + { + "epoch": 0.17, + "learning_rate": 1.996384665905106e-06, + "loss": 0.9941, + "step": 6586 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963823147402683e-06, + "loss": 1.0098, + "step": 6587 + }, + { + "epoch": 0.17, + "learning_rate": 1.996379962812547e-06, + "loss": 0.9014, + "step": 6588 + }, + { + "epoch": 0.17, + "learning_rate": 1.996377610121943e-06, + "loss": 0.9961, + "step": 6589 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963752566684586e-06, + "loss": 0.8774, + "step": 6590 + }, + { + "epoch": 0.17, + "learning_rate": 1.996372902452095e-06, + "loss": 0.8892, + "step": 6591 + }, + { + "epoch": 0.17, + "learning_rate": 1.996370547472855e-06, + "loss": 0.96, + "step": 6592 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963681917307395e-06, + "loss": 1.002, + "step": 6593 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963658352257507e-06, + "loss": 0.876, + "step": 6594 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963634779578905e-06, + "loss": 0.8013, + "step": 6595 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963611199271607e-06, + "loss": 0.9932, + "step": 6596 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963587611335634e-06, + "loss": 1.0645, + "step": 6597 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963564015770994e-06, + "loss": 0.8672, + "step": 6598 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963540412577713e-06, + "loss": 0.9658, + "step": 6599 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963516801755807e-06, + "loss": 1.0684, + "step": 6600 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963493183305294e-06, + "loss": 1.0293, + "step": 6601 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963469557226195e-06, + "loss": 0.8496, + "step": 6602 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963445923518522e-06, + "loss": 0.8779, + "step": 6603 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963422282182297e-06, + "loss": 0.9053, + "step": 6604 + }, + { + "epoch": 0.17, + "learning_rate": 1.996339863321754e-06, + "loss": 0.9258, + "step": 6605 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963374976624266e-06, + "loss": 1.083, + "step": 6606 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963351312402494e-06, + "loss": 0.8184, + "step": 6607 + }, + { + "epoch": 0.17, + "learning_rate": 1.996332764055224e-06, + "loss": 0.7705, + "step": 6608 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963303961073525e-06, + "loss": 0.6948, + "step": 6609 + }, + { + "epoch": 0.17, + "learning_rate": 1.996328027396637e-06, + "loss": 0.7383, + "step": 6610 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963256579230784e-06, + "loss": 0.9258, + "step": 6611 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963232876866796e-06, + "loss": 0.8945, + "step": 6612 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963209166874413e-06, + "loss": 1.0166, + "step": 6613 + }, + { + "epoch": 0.17, + "learning_rate": 1.996318544925366e-06, + "loss": 0.876, + "step": 6614 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963161724004556e-06, + "loss": 1.1016, + "step": 6615 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963137991127117e-06, + "loss": 0.7764, + "step": 6616 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963114250621363e-06, + "loss": 1.0664, + "step": 6617 + }, + { + "epoch": 0.17, + "learning_rate": 1.996309050248731e-06, + "loss": 1.1133, + "step": 6618 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963066746724973e-06, + "loss": 0.8018, + "step": 6619 + }, + { + "epoch": 0.17, + "learning_rate": 1.996304298333438e-06, + "loss": 0.7847, + "step": 6620 + }, + { + "epoch": 0.17, + "learning_rate": 1.9963019212315533e-06, + "loss": 0.8906, + "step": 6621 + }, + { + "epoch": 0.17, + "learning_rate": 1.996299543366847e-06, + "loss": 0.9932, + "step": 6622 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962971647393197e-06, + "loss": 0.9609, + "step": 6623 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962947853489732e-06, + "loss": 0.8926, + "step": 6624 + }, + { + "epoch": 0.17, + "learning_rate": 1.99629240519581e-06, + "loss": 0.6577, + "step": 6625 + }, + { + "epoch": 0.17, + "learning_rate": 1.996290024279831e-06, + "loss": 1.002, + "step": 6626 + }, + { + "epoch": 0.17, + "learning_rate": 1.996287642601039e-06, + "loss": 1.0479, + "step": 6627 + }, + { + "epoch": 0.17, + "learning_rate": 1.996285260159435e-06, + "loss": 1.0371, + "step": 6628 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962828769550216e-06, + "loss": 1.0391, + "step": 6629 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962804929878e-06, + "loss": 0.9004, + "step": 6630 + }, + { + "epoch": 0.17, + "learning_rate": 1.996278108257772e-06, + "loss": 0.8223, + "step": 6631 + }, + { + "epoch": 0.17, + "learning_rate": 1.99627572276494e-06, + "loss": 0.7305, + "step": 6632 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962733365093058e-06, + "loss": 0.8799, + "step": 6633 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962709494908702e-06, + "loss": 1.1211, + "step": 6634 + }, + { + "epoch": 0.17, + "learning_rate": 1.996268561709636e-06, + "loss": 0.8755, + "step": 6635 + }, + { + "epoch": 0.17, + "learning_rate": 1.996266173165605e-06, + "loss": 0.7661, + "step": 6636 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962637838587786e-06, + "loss": 1.0527, + "step": 6637 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962613937891584e-06, + "loss": 1.0781, + "step": 6638 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962590029567474e-06, + "loss": 1.0586, + "step": 6639 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962566113615464e-06, + "loss": 0.916, + "step": 6640 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962542190035574e-06, + "loss": 0.9131, + "step": 6641 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962518258827827e-06, + "loss": 0.6523, + "step": 6642 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962494319992235e-06, + "loss": 0.9883, + "step": 6643 + }, + { + "epoch": 0.17, + "learning_rate": 1.996247037352882e-06, + "loss": 0.832, + "step": 6644 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962446419437595e-06, + "loss": 0.9111, + "step": 6645 + }, + { + "epoch": 0.17, + "learning_rate": 1.996242245771859e-06, + "loss": 0.9482, + "step": 6646 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962398488371813e-06, + "loss": 0.8008, + "step": 6647 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962374511397287e-06, + "loss": 1.0186, + "step": 6648 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962350526795027e-06, + "loss": 0.8516, + "step": 6649 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962326534565057e-06, + "loss": 0.8857, + "step": 6650 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962302534707386e-06, + "loss": 0.9404, + "step": 6651 + }, + { + "epoch": 0.17, + "learning_rate": 1.996227852722204e-06, + "loss": 0.9072, + "step": 6652 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962254512109037e-06, + "loss": 1.0166, + "step": 6653 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962230489368394e-06, + "loss": 0.9004, + "step": 6654 + }, + { + "epoch": 0.17, + "learning_rate": 1.996220645900013e-06, + "loss": 0.9473, + "step": 6655 + }, + { + "epoch": 0.17, + "learning_rate": 1.996218242100426e-06, + "loss": 0.5815, + "step": 6656 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962158375380804e-06, + "loss": 0.8896, + "step": 6657 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962134322129785e-06, + "loss": 0.9814, + "step": 6658 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962110261251216e-06, + "loss": 0.8418, + "step": 6659 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962086192745116e-06, + "loss": 1.0615, + "step": 6660 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962062116611505e-06, + "loss": 0.9717, + "step": 6661 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962038032850405e-06, + "loss": 1.0303, + "step": 6662 + }, + { + "epoch": 0.17, + "learning_rate": 1.9962013941461825e-06, + "loss": 0.9092, + "step": 6663 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961989842445792e-06, + "loss": 0.8994, + "step": 6664 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961965735802318e-06, + "loss": 0.833, + "step": 6665 + }, + { + "epoch": 0.17, + "learning_rate": 1.996194162153143e-06, + "loss": 0.8945, + "step": 6666 + }, + { + "epoch": 0.17, + "learning_rate": 1.996191749963314e-06, + "loss": 1.1377, + "step": 6667 + }, + { + "epoch": 0.17, + "learning_rate": 1.996189337010747e-06, + "loss": 0.8018, + "step": 6668 + }, + { + "epoch": 0.17, + "learning_rate": 1.996186923295443e-06, + "loss": 0.916, + "step": 6669 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961845088174048e-06, + "loss": 0.8525, + "step": 6670 + }, + { + "epoch": 0.17, + "learning_rate": 1.996182093576634e-06, + "loss": 0.7646, + "step": 6671 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961796775731325e-06, + "loss": 0.8887, + "step": 6672 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961772608069015e-06, + "loss": 0.9189, + "step": 6673 + }, + { + "epoch": 0.17, + "learning_rate": 1.996174843277944e-06, + "loss": 0.8721, + "step": 6674 + }, + { + "epoch": 0.17, + "learning_rate": 1.996172424986261e-06, + "loss": 0.8467, + "step": 6675 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961700059318544e-06, + "loss": 0.9854, + "step": 6676 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961675861147264e-06, + "loss": 1.0059, + "step": 6677 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961651655348786e-06, + "loss": 0.8311, + "step": 6678 + }, + { + "epoch": 0.17, + "learning_rate": 1.996162744192313e-06, + "loss": 0.9434, + "step": 6679 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961603220870313e-06, + "loss": 0.9863, + "step": 6680 + }, + { + "epoch": 0.17, + "learning_rate": 1.996157899219036e-06, + "loss": 0.7812, + "step": 6681 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961554755883275e-06, + "loss": 1.166, + "step": 6682 + }, + { + "epoch": 0.17, + "learning_rate": 1.996153051194909e-06, + "loss": 1.0332, + "step": 6683 + }, + { + "epoch": 0.17, + "learning_rate": 1.996150626038782e-06, + "loss": 0.9102, + "step": 6684 + }, + { + "epoch": 0.17, + "learning_rate": 1.996148200119948e-06, + "loss": 0.8403, + "step": 6685 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961457734384096e-06, + "loss": 0.9434, + "step": 6686 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961433459941675e-06, + "loss": 1.0762, + "step": 6687 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961409177872247e-06, + "loss": 0.9736, + "step": 6688 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961384888175826e-06, + "loss": 1.2139, + "step": 6689 + }, + { + "epoch": 0.17, + "learning_rate": 1.996136059085243e-06, + "loss": 0.8682, + "step": 6690 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961336285902077e-06, + "loss": 0.8281, + "step": 6691 + }, + { + "epoch": 0.17, + "learning_rate": 1.996131197332479e-06, + "loss": 0.8413, + "step": 6692 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961287653120583e-06, + "loss": 0.75, + "step": 6693 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961263325289476e-06, + "loss": 1.0264, + "step": 6694 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961238989831485e-06, + "loss": 1.0576, + "step": 6695 + }, + { + "epoch": 0.17, + "learning_rate": 1.996121464674663e-06, + "loss": 1.0088, + "step": 6696 + }, + { + "epoch": 0.17, + "learning_rate": 1.996119029603494e-06, + "loss": 0.7788, + "step": 6697 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961165937696414e-06, + "loss": 0.9004, + "step": 6698 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961141571731092e-06, + "loss": 1.0332, + "step": 6699 + }, + { + "epoch": 0.17, + "learning_rate": 1.996111719813897e-06, + "loss": 0.8955, + "step": 6700 + }, + { + "epoch": 0.17, + "learning_rate": 1.996109281692009e-06, + "loss": 0.9209, + "step": 6701 + }, + { + "epoch": 0.17, + "learning_rate": 1.996106842807445e-06, + "loss": 1.0049, + "step": 6702 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961044031602085e-06, + "loss": 0.8115, + "step": 6703 + }, + { + "epoch": 0.17, + "learning_rate": 1.9961019627503005e-06, + "loss": 0.8579, + "step": 6704 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960995215777227e-06, + "loss": 0.7529, + "step": 6705 + }, + { + "epoch": 0.17, + "learning_rate": 1.996097079642478e-06, + "loss": 0.8369, + "step": 6706 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960946369445665e-06, + "loss": 0.9121, + "step": 6707 + }, + { + "epoch": 0.17, + "learning_rate": 1.996092193483992e-06, + "loss": 0.9644, + "step": 6708 + }, + { + "epoch": 0.17, + "learning_rate": 1.996089749260755e-06, + "loss": 1.0078, + "step": 6709 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960873042748583e-06, + "loss": 0.9521, + "step": 6710 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960848585263032e-06, + "loss": 0.8652, + "step": 6711 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960824120150916e-06, + "loss": 0.9199, + "step": 6712 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960799647412254e-06, + "loss": 1.002, + "step": 6713 + }, + { + "epoch": 0.17, + "learning_rate": 1.996077516704707e-06, + "loss": 0.9258, + "step": 6714 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960750679055372e-06, + "loss": 0.8594, + "step": 6715 + }, + { + "epoch": 0.17, + "learning_rate": 1.996072618343719e-06, + "loss": 0.7705, + "step": 6716 + }, + { + "epoch": 0.17, + "learning_rate": 1.996070168019254e-06, + "loss": 0.959, + "step": 6717 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960677169321433e-06, + "loss": 0.9766, + "step": 6718 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960652650823896e-06, + "loss": 0.8457, + "step": 6719 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960628124699945e-06, + "loss": 0.9814, + "step": 6720 + }, + { + "epoch": 0.17, + "learning_rate": 1.99606035909496e-06, + "loss": 0.9404, + "step": 6721 + }, + { + "epoch": 0.17, + "learning_rate": 1.996057904957288e-06, + "loss": 0.7598, + "step": 6722 + }, + { + "epoch": 0.17, + "learning_rate": 1.99605545005698e-06, + "loss": 0.9453, + "step": 6723 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960529943940382e-06, + "loss": 1.0889, + "step": 6724 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960505379684643e-06, + "loss": 0.7617, + "step": 6725 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960480807802604e-06, + "loss": 0.8945, + "step": 6726 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960456228294284e-06, + "loss": 0.8848, + "step": 6727 + }, + { + "epoch": 0.17, + "learning_rate": 1.99604316411597e-06, + "loss": 0.9199, + "step": 6728 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960407046398875e-06, + "loss": 0.9756, + "step": 6729 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960382444011818e-06, + "loss": 0.9609, + "step": 6730 + }, + { + "epoch": 0.17, + "learning_rate": 1.996035783399856e-06, + "loss": 0.7988, + "step": 6731 + }, + { + "epoch": 0.17, + "learning_rate": 1.996033321635911e-06, + "loss": 0.9463, + "step": 6732 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960308591093493e-06, + "loss": 0.7773, + "step": 6733 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960283958201725e-06, + "loss": 0.7422, + "step": 6734 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960259317683823e-06, + "loss": 0.876, + "step": 6735 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960234669539813e-06, + "loss": 0.9775, + "step": 6736 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960210013769706e-06, + "loss": 0.9482, + "step": 6737 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960185350373525e-06, + "loss": 0.8862, + "step": 6738 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960160679351286e-06, + "loss": 1.1367, + "step": 6739 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960136000703014e-06, + "loss": 0.8428, + "step": 6740 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960111314428723e-06, + "loss": 0.8613, + "step": 6741 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960086620528433e-06, + "loss": 0.8643, + "step": 6742 + }, + { + "epoch": 0.17, + "learning_rate": 1.996006191900216e-06, + "loss": 0.9932, + "step": 6743 + }, + { + "epoch": 0.17, + "learning_rate": 1.9960037209849926e-06, + "loss": 1.0557, + "step": 6744 + }, + { + "epoch": 0.17, + "learning_rate": 1.996001249307175e-06, + "loss": 0.8042, + "step": 6745 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959987768667653e-06, + "loss": 0.9707, + "step": 6746 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959963036637645e-06, + "loss": 1.0312, + "step": 6747 + }, + { + "epoch": 0.17, + "learning_rate": 1.995993829698176e-06, + "loss": 0.833, + "step": 6748 + }, + { + "epoch": 0.17, + "learning_rate": 1.99599135497e-06, + "loss": 1.0615, + "step": 6749 + }, + { + "epoch": 0.17, + "learning_rate": 1.99598887947924e-06, + "loss": 1.0908, + "step": 6750 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959864032258964e-06, + "loss": 0.8369, + "step": 6751 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959839262099722e-06, + "loss": 1.1025, + "step": 6752 + }, + { + "epoch": 0.17, + "learning_rate": 1.995981448431469e-06, + "loss": 0.6089, + "step": 6753 + }, + { + "epoch": 0.17, + "learning_rate": 1.995978969890388e-06, + "loss": 0.9414, + "step": 6754 + }, + { + "epoch": 0.17, + "learning_rate": 1.995976490586732e-06, + "loss": 1.0537, + "step": 6755 + }, + { + "epoch": 0.17, + "learning_rate": 1.995974010520503e-06, + "loss": 1.0283, + "step": 6756 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959715296917023e-06, + "loss": 1.0908, + "step": 6757 + }, + { + "epoch": 0.17, + "learning_rate": 1.995969048100332e-06, + "loss": 1.001, + "step": 6758 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959665657463938e-06, + "loss": 0.9434, + "step": 6759 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959640826298897e-06, + "loss": 0.9092, + "step": 6760 + }, + { + "epoch": 0.17, + "learning_rate": 1.995961598750822e-06, + "loss": 0.8887, + "step": 6761 + }, + { + "epoch": 0.17, + "learning_rate": 1.995959114109192e-06, + "loss": 0.6328, + "step": 6762 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959566287050023e-06, + "loss": 0.9473, + "step": 6763 + }, + { + "epoch": 0.17, + "learning_rate": 1.995954142538254e-06, + "loss": 0.9062, + "step": 6764 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959516556089495e-06, + "loss": 0.7866, + "step": 6765 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959491679170906e-06, + "loss": 1.0811, + "step": 6766 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959466794626797e-06, + "loss": 0.9688, + "step": 6767 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959441902457177e-06, + "loss": 1.0791, + "step": 6768 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959417002662075e-06, + "loss": 0.8955, + "step": 6769 + }, + { + "epoch": 0.17, + "learning_rate": 1.99593920952415e-06, + "loss": 0.8271, + "step": 6770 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959367180195476e-06, + "loss": 0.7935, + "step": 6771 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959342257524026e-06, + "loss": 0.7725, + "step": 6772 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959317327227166e-06, + "loss": 0.9043, + "step": 6773 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959292389304913e-06, + "loss": 0.9619, + "step": 6774 + }, + { + "epoch": 0.17, + "learning_rate": 1.995926744375729e-06, + "loss": 0.9014, + "step": 6775 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959242490584313e-06, + "loss": 0.7729, + "step": 6776 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959217529786e-06, + "loss": 0.8857, + "step": 6777 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959192561362374e-06, + "loss": 1.0605, + "step": 6778 + }, + { + "epoch": 0.17, + "learning_rate": 1.995916758531345e-06, + "loss": 0.9746, + "step": 6779 + }, + { + "epoch": 0.17, + "learning_rate": 1.995914260163925e-06, + "loss": 0.6294, + "step": 6780 + }, + { + "epoch": 0.17, + "learning_rate": 1.995911761033979e-06, + "loss": 1.04, + "step": 6781 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959092611415094e-06, + "loss": 0.7773, + "step": 6782 + }, + { + "epoch": 0.17, + "learning_rate": 1.995906760486518e-06, + "loss": 0.875, + "step": 6783 + }, + { + "epoch": 0.17, + "learning_rate": 1.9959042590690066e-06, + "loss": 1.0566, + "step": 6784 + }, + { + "epoch": 0.17, + "learning_rate": 1.995901756888977e-06, + "loss": 0.6748, + "step": 6785 + }, + { + "epoch": 0.17, + "learning_rate": 1.9958992539464314e-06, + "loss": 0.9912, + "step": 6786 + }, + { + "epoch": 0.17, + "learning_rate": 1.9958967502413714e-06, + "loss": 0.7979, + "step": 6787 + }, + { + "epoch": 0.17, + "learning_rate": 1.995894245773799e-06, + "loss": 0.9482, + "step": 6788 + }, + { + "epoch": 0.17, + "learning_rate": 1.995891740543716e-06, + "loss": 0.9248, + "step": 6789 + }, + { + "epoch": 0.17, + "learning_rate": 1.995889234551125e-06, + "loss": 1.2266, + "step": 6790 + }, + { + "epoch": 0.17, + "learning_rate": 1.995886727796027e-06, + "loss": 1.002, + "step": 6791 + }, + { + "epoch": 0.17, + "learning_rate": 1.995884220278424e-06, + "loss": 0.9414, + "step": 6792 + }, + { + "epoch": 0.17, + "learning_rate": 1.9958817119983186e-06, + "loss": 0.916, + "step": 6793 + }, + { + "epoch": 0.17, + "learning_rate": 1.9958792029557127e-06, + "loss": 1.082, + "step": 6794 + }, + { + "epoch": 0.17, + "learning_rate": 1.9958766931506074e-06, + "loss": 0.8037, + "step": 6795 + }, + { + "epoch": 0.17, + "learning_rate": 1.995874182583005e-06, + "loss": 0.6543, + "step": 6796 + }, + { + "epoch": 0.17, + "learning_rate": 1.995871671252908e-06, + "loss": 0.8264, + "step": 6797 + }, + { + "epoch": 0.17, + "learning_rate": 1.9958691591603178e-06, + "loss": 0.8584, + "step": 6798 + }, + { + "epoch": 0.17, + "learning_rate": 1.995866646305236e-06, + "loss": 0.833, + "step": 6799 + }, + { + "epoch": 0.17, + "learning_rate": 1.995864132687665e-06, + "loss": 1.1445, + "step": 6800 + }, + { + "epoch": 0.17, + "learning_rate": 1.9958616183076073e-06, + "loss": 0.6812, + "step": 6801 + }, + { + "epoch": 0.17, + "learning_rate": 1.9958591031650636e-06, + "loss": 0.7637, + "step": 6802 + }, + { + "epoch": 0.17, + "learning_rate": 1.9958565872600366e-06, + "loss": 0.9111, + "step": 6803 + }, + { + "epoch": 0.17, + "learning_rate": 1.9958540705925274e-06, + "loss": 0.8857, + "step": 6804 + }, + { + "epoch": 0.17, + "learning_rate": 1.995851553162539e-06, + "loss": 1.1641, + "step": 6805 + }, + { + "epoch": 0.17, + "learning_rate": 1.9958490349700728e-06, + "loss": 0.6763, + "step": 6806 + }, + { + "epoch": 0.17, + "learning_rate": 1.9958465160151307e-06, + "loss": 0.7061, + "step": 6807 + }, + { + "epoch": 0.17, + "learning_rate": 1.995843996297715e-06, + "loss": 0.9385, + "step": 6808 + }, + { + "epoch": 0.17, + "learning_rate": 1.995841475817827e-06, + "loss": 0.9834, + "step": 6809 + }, + { + "epoch": 0.17, + "learning_rate": 1.995838954575469e-06, + "loss": 0.8657, + "step": 6810 + }, + { + "epoch": 0.17, + "learning_rate": 1.995836432570643e-06, + "loss": 0.8799, + "step": 6811 + }, + { + "epoch": 0.17, + "learning_rate": 1.995833909803351e-06, + "loss": 0.8174, + "step": 6812 + }, + { + "epoch": 0.17, + "learning_rate": 1.9958313862735948e-06, + "loss": 1.0234, + "step": 6813 + }, + { + "epoch": 0.17, + "learning_rate": 1.9958288619813758e-06, + "loss": 0.9175, + "step": 6814 + }, + { + "epoch": 0.17, + "learning_rate": 1.9958263369266967e-06, + "loss": 0.9033, + "step": 6815 + }, + { + "epoch": 0.17, + "learning_rate": 1.995823811109559e-06, + "loss": 1.0391, + "step": 6816 + }, + { + "epoch": 0.17, + "learning_rate": 1.9958212845299654e-06, + "loss": 0.8223, + "step": 6817 + }, + { + "epoch": 0.17, + "learning_rate": 1.995818757187917e-06, + "loss": 0.9258, + "step": 6818 + }, + { + "epoch": 0.17, + "learning_rate": 1.9958162290834157e-06, + "loss": 0.7725, + "step": 6819 + }, + { + "epoch": 0.17, + "learning_rate": 1.9958137002164637e-06, + "loss": 0.7998, + "step": 6820 + }, + { + "epoch": 0.17, + "learning_rate": 1.995811170587063e-06, + "loss": 1.0156, + "step": 6821 + }, + { + "epoch": 0.17, + "learning_rate": 1.9958086401952157e-06, + "loss": 0.748, + "step": 6822 + }, + { + "epoch": 0.17, + "learning_rate": 1.995806109040923e-06, + "loss": 0.5327, + "step": 6823 + }, + { + "epoch": 0.17, + "learning_rate": 1.995803577124188e-06, + "loss": 1.1523, + "step": 6824 + }, + { + "epoch": 0.17, + "learning_rate": 1.995801044445011e-06, + "loss": 0.957, + "step": 6825 + }, + { + "epoch": 0.17, + "learning_rate": 1.995798511003396e-06, + "loss": 0.7397, + "step": 6826 + }, + { + "epoch": 0.17, + "learning_rate": 1.9957959767993435e-06, + "loss": 0.8174, + "step": 6827 + }, + { + "epoch": 0.18, + "learning_rate": 1.995793441832856e-06, + "loss": 0.915, + "step": 6828 + }, + { + "epoch": 0.18, + "learning_rate": 1.995790906103935e-06, + "loss": 0.8252, + "step": 6829 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957883696125823e-06, + "loss": 1.1699, + "step": 6830 + }, + { + "epoch": 0.18, + "learning_rate": 1.995785832358801e-06, + "loss": 1.0635, + "step": 6831 + }, + { + "epoch": 0.18, + "learning_rate": 1.995783294342592e-06, + "loss": 1.0068, + "step": 6832 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957807555639573e-06, + "loss": 0.917, + "step": 6833 + }, + { + "epoch": 0.18, + "learning_rate": 1.995778216022899e-06, + "loss": 0.8682, + "step": 6834 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957756757194194e-06, + "loss": 0.9229, + "step": 6835 + }, + { + "epoch": 0.18, + "learning_rate": 1.99577313465352e-06, + "loss": 1.1426, + "step": 6836 + }, + { + "epoch": 0.18, + "learning_rate": 1.995770592825203e-06, + "loss": 1.0576, + "step": 6837 + }, + { + "epoch": 0.18, + "learning_rate": 1.99576805023447e-06, + "loss": 0.9395, + "step": 6838 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957655068813234e-06, + "loss": 0.7998, + "step": 6839 + }, + { + "epoch": 0.18, + "learning_rate": 1.995762962765765e-06, + "loss": 0.897, + "step": 6840 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957604178877967e-06, + "loss": 1.1846, + "step": 6841 + }, + { + "epoch": 0.18, + "learning_rate": 1.99575787224742e-06, + "loss": 0.916, + "step": 6842 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957553258446376e-06, + "loss": 1.1016, + "step": 6843 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957527786794513e-06, + "loss": 0.9033, + "step": 6844 + }, + { + "epoch": 0.18, + "learning_rate": 1.995750230751863e-06, + "loss": 0.855, + "step": 6845 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957476820618742e-06, + "loss": 1.0049, + "step": 6846 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957451326094873e-06, + "loss": 0.7783, + "step": 6847 + }, + { + "epoch": 0.18, + "learning_rate": 1.995742582394704e-06, + "loss": 1.0312, + "step": 6848 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957400314175265e-06, + "loss": 0.9531, + "step": 6849 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957374796779566e-06, + "loss": 0.7256, + "step": 6850 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957349271759965e-06, + "loss": 0.9688, + "step": 6851 + }, + { + "epoch": 0.18, + "learning_rate": 1.995732373911648e-06, + "loss": 1.0889, + "step": 6852 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957298198849128e-06, + "loss": 0.9004, + "step": 6853 + }, + { + "epoch": 0.18, + "learning_rate": 1.995727265095793e-06, + "loss": 0.9326, + "step": 6854 + }, + { + "epoch": 0.18, + "learning_rate": 1.99572470954429e-06, + "loss": 0.6863, + "step": 6855 + }, + { + "epoch": 0.18, + "learning_rate": 1.995722153230408e-06, + "loss": 0.9912, + "step": 6856 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957195961541458e-06, + "loss": 1.0615, + "step": 6857 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957170383155075e-06, + "loss": 1.0176, + "step": 6858 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957144797144942e-06, + "loss": 0.9619, + "step": 6859 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957119203511085e-06, + "loss": 1.0615, + "step": 6860 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957093602253517e-06, + "loss": 0.7285, + "step": 6861 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957067993372263e-06, + "loss": 0.7402, + "step": 6862 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957042376867335e-06, + "loss": 0.96, + "step": 6863 + }, + { + "epoch": 0.18, + "learning_rate": 1.9957016752738763e-06, + "loss": 0.8965, + "step": 6864 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956991120986556e-06, + "loss": 0.8677, + "step": 6865 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956965481610743e-06, + "loss": 0.6758, + "step": 6866 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956939834611337e-06, + "loss": 0.9912, + "step": 6867 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956914179988364e-06, + "loss": 1.0762, + "step": 6868 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956888517741836e-06, + "loss": 0.8555, + "step": 6869 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956862847871774e-06, + "loss": 0.958, + "step": 6870 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956837170378204e-06, + "loss": 1.002, + "step": 6871 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956811485261138e-06, + "loss": 0.6783, + "step": 6872 + }, + { + "epoch": 0.18, + "learning_rate": 1.99567857925206e-06, + "loss": 1.0459, + "step": 6873 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956760092156613e-06, + "loss": 1.001, + "step": 6874 + }, + { + "epoch": 0.18, + "learning_rate": 1.995673438416919e-06, + "loss": 1.0166, + "step": 6875 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956708668558355e-06, + "loss": 0.9219, + "step": 6876 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956682945324125e-06, + "loss": 0.8047, + "step": 6877 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956657214466518e-06, + "loss": 0.9727, + "step": 6878 + }, + { + "epoch": 0.18, + "learning_rate": 1.995663147598556e-06, + "loss": 0.9307, + "step": 6879 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956605729881265e-06, + "loss": 0.9814, + "step": 6880 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956579976153654e-06, + "loss": 1.0908, + "step": 6881 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956554214802746e-06, + "loss": 0.9746, + "step": 6882 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956528445828568e-06, + "loss": 0.917, + "step": 6883 + }, + { + "epoch": 0.18, + "learning_rate": 1.995650266923113e-06, + "loss": 0.8003, + "step": 6884 + }, + { + "epoch": 0.18, + "learning_rate": 1.995647688501046e-06, + "loss": 0.7876, + "step": 6885 + }, + { + "epoch": 0.18, + "learning_rate": 1.995645109316657e-06, + "loss": 1.1377, + "step": 6886 + }, + { + "epoch": 0.18, + "learning_rate": 1.995642529369948e-06, + "loss": 0.7495, + "step": 6887 + }, + { + "epoch": 0.18, + "learning_rate": 1.995639948660922e-06, + "loss": 1.0527, + "step": 6888 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956373671895797e-06, + "loss": 1.043, + "step": 6889 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956347849559237e-06, + "loss": 1.1318, + "step": 6890 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956322019599562e-06, + "loss": 1.1699, + "step": 6891 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956296182016786e-06, + "loss": 0.8506, + "step": 6892 + }, + { + "epoch": 0.18, + "learning_rate": 1.995627033681094e-06, + "loss": 0.6597, + "step": 6893 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956244483982026e-06, + "loss": 0.9746, + "step": 6894 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956218623530077e-06, + "loss": 0.8818, + "step": 6895 + }, + { + "epoch": 0.18, + "learning_rate": 1.995619275545511e-06, + "loss": 1.0781, + "step": 6896 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956166879757143e-06, + "loss": 1.0537, + "step": 6897 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956140996436197e-06, + "loss": 1.0195, + "step": 6898 + }, + { + "epoch": 0.18, + "learning_rate": 1.995611510549229e-06, + "loss": 0.8101, + "step": 6899 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956089206925445e-06, + "loss": 0.6479, + "step": 6900 + }, + { + "epoch": 0.18, + "learning_rate": 1.995606330073568e-06, + "loss": 0.7568, + "step": 6901 + }, + { + "epoch": 0.18, + "learning_rate": 1.9956037386923014e-06, + "loss": 0.7002, + "step": 6902 + }, + { + "epoch": 0.18, + "learning_rate": 1.995601146548747e-06, + "loss": 0.9277, + "step": 6903 + }, + { + "epoch": 0.18, + "learning_rate": 1.995598553642906e-06, + "loss": 0.8271, + "step": 6904 + }, + { + "epoch": 0.18, + "learning_rate": 1.995595959974782e-06, + "loss": 0.8599, + "step": 6905 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955933655443753e-06, + "loss": 0.7793, + "step": 6906 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955907703516887e-06, + "loss": 0.877, + "step": 6907 + }, + { + "epoch": 0.18, + "learning_rate": 1.995588174396724e-06, + "loss": 0.9482, + "step": 6908 + }, + { + "epoch": 0.18, + "learning_rate": 1.995585577679483e-06, + "loss": 0.8623, + "step": 6909 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955829801999685e-06, + "loss": 0.835, + "step": 6910 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955803819581813e-06, + "loss": 0.7461, + "step": 6911 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955777829541243e-06, + "loss": 0.8789, + "step": 6912 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955751831877985e-06, + "loss": 0.9795, + "step": 6913 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955725826592075e-06, + "loss": 0.9668, + "step": 6914 + }, + { + "epoch": 0.18, + "learning_rate": 1.995569981368352e-06, + "loss": 0.9199, + "step": 6915 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955673793152343e-06, + "loss": 0.915, + "step": 6916 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955647764998563e-06, + "loss": 1.0107, + "step": 6917 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955621729222203e-06, + "loss": 0.9219, + "step": 6918 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955595685823282e-06, + "loss": 1.0098, + "step": 6919 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955569634801816e-06, + "loss": 0.689, + "step": 6920 + }, + { + "epoch": 0.18, + "learning_rate": 1.995554357615783e-06, + "loss": 0.7676, + "step": 6921 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955517509891343e-06, + "loss": 0.9873, + "step": 6922 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955491436002375e-06, + "loss": 1.2285, + "step": 6923 + }, + { + "epoch": 0.18, + "learning_rate": 1.995546535449094e-06, + "loss": 1.1064, + "step": 6924 + }, + { + "epoch": 0.18, + "learning_rate": 1.995543926535707e-06, + "loss": 0.9453, + "step": 6925 + }, + { + "epoch": 0.18, + "learning_rate": 1.995541316860077e-06, + "loss": 1.1211, + "step": 6926 + }, + { + "epoch": 0.18, + "learning_rate": 1.995538706422207e-06, + "loss": 0.874, + "step": 6927 + }, + { + "epoch": 0.18, + "learning_rate": 1.995536095222099e-06, + "loss": 0.8975, + "step": 6928 + }, + { + "epoch": 0.18, + "learning_rate": 1.995533483259755e-06, + "loss": 1.0654, + "step": 6929 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955308705351763e-06, + "loss": 0.8301, + "step": 6930 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955282570483657e-06, + "loss": 0.8447, + "step": 6931 + }, + { + "epoch": 0.18, + "learning_rate": 1.995525642799325e-06, + "loss": 0.9609, + "step": 6932 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955230277880557e-06, + "loss": 0.8989, + "step": 6933 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955204120145606e-06, + "loss": 0.7607, + "step": 6934 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955177954788413e-06, + "loss": 0.7568, + "step": 6935 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955151781808996e-06, + "loss": 0.9521, + "step": 6936 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955125601207374e-06, + "loss": 1.04, + "step": 6937 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955099412983578e-06, + "loss": 0.8076, + "step": 6938 + }, + { + "epoch": 0.18, + "learning_rate": 1.995507321713761e-06, + "loss": 1.2461, + "step": 6939 + }, + { + "epoch": 0.18, + "learning_rate": 1.9955047013669506e-06, + "loss": 0.8564, + "step": 6940 + }, + { + "epoch": 0.18, + "learning_rate": 1.995502080257928e-06, + "loss": 0.9912, + "step": 6941 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954994583866953e-06, + "loss": 0.8232, + "step": 6942 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954968357532544e-06, + "loss": 0.9229, + "step": 6943 + }, + { + "epoch": 0.18, + "learning_rate": 1.995494212357607e-06, + "loss": 0.6648, + "step": 6944 + }, + { + "epoch": 0.18, + "learning_rate": 1.995491588199756e-06, + "loss": 0.9688, + "step": 6945 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954889632797026e-06, + "loss": 0.916, + "step": 6946 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954863375974493e-06, + "loss": 1.0469, + "step": 6947 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954837111529975e-06, + "loss": 0.957, + "step": 6948 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954810839463496e-06, + "loss": 0.79, + "step": 6949 + }, + { + "epoch": 0.18, + "learning_rate": 1.995478455977508e-06, + "loss": 0.6865, + "step": 6950 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954758272464738e-06, + "loss": 1.0439, + "step": 6951 + }, + { + "epoch": 0.18, + "learning_rate": 1.99547319775325e-06, + "loss": 0.9463, + "step": 6952 + }, + { + "epoch": 0.18, + "learning_rate": 1.995470567497838e-06, + "loss": 1.0039, + "step": 6953 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954679364802397e-06, + "loss": 0.8799, + "step": 6954 + }, + { + "epoch": 0.18, + "learning_rate": 1.995465304700458e-06, + "loss": 1.0098, + "step": 6955 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954626721584933e-06, + "loss": 0.9438, + "step": 6956 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954600388543495e-06, + "loss": 0.9678, + "step": 6957 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954574047880276e-06, + "loss": 0.8896, + "step": 6958 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954547699595294e-06, + "loss": 0.7705, + "step": 6959 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954521343688574e-06, + "loss": 0.8389, + "step": 6960 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954494980160133e-06, + "loss": 0.8779, + "step": 6961 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954468609009997e-06, + "loss": 0.9893, + "step": 6962 + }, + { + "epoch": 0.18, + "learning_rate": 1.995444223023818e-06, + "loss": 0.8398, + "step": 6963 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954415843844704e-06, + "loss": 0.875, + "step": 6964 + }, + { + "epoch": 0.18, + "learning_rate": 1.995438944982959e-06, + "loss": 1.0039, + "step": 6965 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954363048192854e-06, + "loss": 1.0557, + "step": 6966 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954336638934523e-06, + "loss": 0.8657, + "step": 6967 + }, + { + "epoch": 0.18, + "learning_rate": 1.995431022205462e-06, + "loss": 0.8799, + "step": 6968 + }, + { + "epoch": 0.18, + "learning_rate": 1.995428379755315e-06, + "loss": 0.9316, + "step": 6969 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954257365430144e-06, + "loss": 0.7437, + "step": 6970 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954230925685627e-06, + "loss": 0.958, + "step": 6971 + }, + { + "epoch": 0.18, + "learning_rate": 1.995420447831961e-06, + "loss": 0.8008, + "step": 6972 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954178023332113e-06, + "loss": 1.1416, + "step": 6973 + }, + { + "epoch": 0.18, + "learning_rate": 1.995415156072316e-06, + "loss": 0.8613, + "step": 6974 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954125090492778e-06, + "loss": 0.8828, + "step": 6975 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954098612640973e-06, + "loss": 0.7534, + "step": 6976 + }, + { + "epoch": 0.18, + "learning_rate": 1.9954072127167774e-06, + "loss": 0.9336, + "step": 6977 + }, + { + "epoch": 0.18, + "learning_rate": 1.99540456340732e-06, + "loss": 1.1201, + "step": 6978 + }, + { + "epoch": 0.18, + "learning_rate": 1.995401913335727e-06, + "loss": 0.8652, + "step": 6979 + }, + { + "epoch": 0.18, + "learning_rate": 1.995399262502001e-06, + "loss": 1.0762, + "step": 6980 + }, + { + "epoch": 0.18, + "learning_rate": 1.995396610906143e-06, + "loss": 0.8213, + "step": 6981 + }, + { + "epoch": 0.18, + "learning_rate": 1.995393958548156e-06, + "loss": 1.0088, + "step": 6982 + }, + { + "epoch": 0.18, + "learning_rate": 1.995391305428041e-06, + "loss": 0.5601, + "step": 6983 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953886515458014e-06, + "loss": 0.9199, + "step": 6984 + }, + { + "epoch": 0.18, + "learning_rate": 1.995385996901438e-06, + "loss": 0.7734, + "step": 6985 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953833414949536e-06, + "loss": 1.1084, + "step": 6986 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953806853263496e-06, + "loss": 1.0635, + "step": 6987 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953780283956287e-06, + "loss": 0.873, + "step": 6988 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953753707027923e-06, + "loss": 1.0547, + "step": 6989 + }, + { + "epoch": 0.18, + "learning_rate": 1.995372712247843e-06, + "loss": 0.9106, + "step": 6990 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953700530307825e-06, + "loss": 0.9443, + "step": 6991 + }, + { + "epoch": 0.18, + "learning_rate": 1.995367393051613e-06, + "loss": 0.8184, + "step": 6992 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953647323103363e-06, + "loss": 0.8018, + "step": 6993 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953620708069546e-06, + "loss": 0.9912, + "step": 6994 + }, + { + "epoch": 0.18, + "learning_rate": 1.99535940854147e-06, + "loss": 0.8154, + "step": 6995 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953567455138844e-06, + "loss": 1.0557, + "step": 6996 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953540817242002e-06, + "loss": 1.0098, + "step": 6997 + }, + { + "epoch": 0.18, + "learning_rate": 1.995351417172419e-06, + "loss": 1.0166, + "step": 6998 + }, + { + "epoch": 0.18, + "learning_rate": 1.995348751858543e-06, + "loss": 0.9814, + "step": 6999 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953460857825737e-06, + "loss": 1.0566, + "step": 7000 + }, + { + "epoch": 0.18, + "learning_rate": 1.995343418944514e-06, + "loss": 0.9453, + "step": 7001 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953407513443662e-06, + "loss": 0.7954, + "step": 7002 + }, + { + "epoch": 0.18, + "learning_rate": 1.995338082982131e-06, + "loss": 0.9316, + "step": 7003 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953354138578117e-06, + "loss": 0.8838, + "step": 7004 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953327439714096e-06, + "loss": 1.0303, + "step": 7005 + }, + { + "epoch": 0.18, + "learning_rate": 1.995330073322927e-06, + "loss": 0.8828, + "step": 7006 + }, + { + "epoch": 0.18, + "learning_rate": 1.995327401912366e-06, + "loss": 1.0205, + "step": 7007 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953247297397283e-06, + "loss": 0.8809, + "step": 7008 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953220568050165e-06, + "loss": 1.0391, + "step": 7009 + }, + { + "epoch": 0.18, + "learning_rate": 1.995319383108232e-06, + "loss": 0.9043, + "step": 7010 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953167086493776e-06, + "loss": 0.9492, + "step": 7011 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953140334284553e-06, + "loss": 0.7075, + "step": 7012 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953113574454663e-06, + "loss": 0.9512, + "step": 7013 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953086807004127e-06, + "loss": 0.7505, + "step": 7014 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953060031932976e-06, + "loss": 0.875, + "step": 7015 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953033249241227e-06, + "loss": 0.6748, + "step": 7016 + }, + { + "epoch": 0.18, + "learning_rate": 1.9953006458928895e-06, + "loss": 0.9043, + "step": 7017 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952979660996003e-06, + "loss": 1.1992, + "step": 7018 + }, + { + "epoch": 0.18, + "learning_rate": 1.995295285544257e-06, + "loss": 0.813, + "step": 7019 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952926042268626e-06, + "loss": 0.7881, + "step": 7020 + }, + { + "epoch": 0.18, + "learning_rate": 1.995289922147418e-06, + "loss": 0.8633, + "step": 7021 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952872393059256e-06, + "loss": 0.8291, + "step": 7022 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952845557023874e-06, + "loss": 0.5107, + "step": 7023 + }, + { + "epoch": 0.18, + "learning_rate": 1.995281871336806e-06, + "loss": 1.0156, + "step": 7024 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952791862091827e-06, + "loss": 1.0176, + "step": 7025 + }, + { + "epoch": 0.18, + "learning_rate": 1.99527650031952e-06, + "loss": 0.8389, + "step": 7026 + }, + { + "epoch": 0.18, + "learning_rate": 1.99527381366782e-06, + "loss": 0.8599, + "step": 7027 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952711262540843e-06, + "loss": 0.916, + "step": 7028 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952684380783152e-06, + "loss": 0.9717, + "step": 7029 + }, + { + "epoch": 0.18, + "learning_rate": 1.995265749140515e-06, + "loss": 0.79, + "step": 7030 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952630594406855e-06, + "loss": 1.0303, + "step": 7031 + }, + { + "epoch": 0.18, + "learning_rate": 1.995260368978829e-06, + "loss": 0.8184, + "step": 7032 + }, + { + "epoch": 0.18, + "learning_rate": 1.995257677754947e-06, + "loss": 0.7476, + "step": 7033 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952549857690427e-06, + "loss": 0.6899, + "step": 7034 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952522930211168e-06, + "loss": 0.9414, + "step": 7035 + }, + { + "epoch": 0.18, + "learning_rate": 1.995249599511172e-06, + "loss": 0.9385, + "step": 7036 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952469052392108e-06, + "loss": 0.791, + "step": 7037 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952442102052344e-06, + "loss": 0.8965, + "step": 7038 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952415144092452e-06, + "loss": 0.8906, + "step": 7039 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952388178512457e-06, + "loss": 0.9561, + "step": 7040 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952361205312376e-06, + "loss": 0.8633, + "step": 7041 + }, + { + "epoch": 0.18, + "learning_rate": 1.995233422449223e-06, + "loss": 0.9346, + "step": 7042 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952307236052035e-06, + "loss": 0.9727, + "step": 7043 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952280239991818e-06, + "loss": 0.9873, + "step": 7044 + }, + { + "epoch": 0.18, + "learning_rate": 1.99522532363116e-06, + "loss": 0.8281, + "step": 7045 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952226225011395e-06, + "loss": 0.9033, + "step": 7046 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952199206091232e-06, + "loss": 0.9209, + "step": 7047 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952172179551127e-06, + "loss": 0.9756, + "step": 7048 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952145145391097e-06, + "loss": 0.7114, + "step": 7049 + }, + { + "epoch": 0.18, + "learning_rate": 1.995211810361117e-06, + "loss": 0.8398, + "step": 7050 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952091054211366e-06, + "loss": 0.9062, + "step": 7051 + }, + { + "epoch": 0.18, + "learning_rate": 1.9952063997191704e-06, + "loss": 0.9512, + "step": 7052 + }, + { + "epoch": 0.18, + "learning_rate": 1.99520369325522e-06, + "loss": 1.1426, + "step": 7053 + }, + { + "epoch": 0.18, + "learning_rate": 1.995200986029288e-06, + "loss": 0.9473, + "step": 7054 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951982780413766e-06, + "loss": 0.9941, + "step": 7055 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951955692914876e-06, + "loss": 0.9092, + "step": 7056 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951928597796227e-06, + "loss": 0.8154, + "step": 7057 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951901495057847e-06, + "loss": 1.0791, + "step": 7058 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951874384699753e-06, + "loss": 0.8726, + "step": 7059 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951847266721967e-06, + "loss": 0.8818, + "step": 7060 + }, + { + "epoch": 0.18, + "learning_rate": 1.995182014112451e-06, + "loss": 0.9902, + "step": 7061 + }, + { + "epoch": 0.18, + "learning_rate": 1.99517930079074e-06, + "loss": 0.9395, + "step": 7062 + }, + { + "epoch": 0.18, + "learning_rate": 1.995176586707066e-06, + "loss": 0.8213, + "step": 7063 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951738718614314e-06, + "loss": 0.7573, + "step": 7064 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951711562538375e-06, + "loss": 0.8237, + "step": 7065 + }, + { + "epoch": 0.18, + "learning_rate": 1.995168439884287e-06, + "loss": 0.9629, + "step": 7066 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951657227527814e-06, + "loss": 0.9609, + "step": 7067 + }, + { + "epoch": 0.18, + "learning_rate": 1.995163004859324e-06, + "loss": 0.8652, + "step": 7068 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951602862039153e-06, + "loss": 0.8086, + "step": 7069 + }, + { + "epoch": 0.18, + "learning_rate": 1.995157566786558e-06, + "loss": 0.8369, + "step": 7070 + }, + { + "epoch": 0.18, + "learning_rate": 1.995154846607255e-06, + "loss": 0.6631, + "step": 7071 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951521256660074e-06, + "loss": 0.7676, + "step": 7072 + }, + { + "epoch": 0.18, + "learning_rate": 1.995149403962817e-06, + "loss": 0.8218, + "step": 7073 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951466814976878e-06, + "loss": 0.9121, + "step": 7074 + }, + { + "epoch": 0.18, + "learning_rate": 1.995143958270619e-06, + "loss": 1.0596, + "step": 7075 + }, + { + "epoch": 0.18, + "learning_rate": 1.995141234281615e-06, + "loss": 0.9072, + "step": 7076 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951385095306776e-06, + "loss": 0.9326, + "step": 7077 + }, + { + "epoch": 0.18, + "learning_rate": 1.995135784017808e-06, + "loss": 0.7854, + "step": 7078 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951330577430085e-06, + "loss": 1.1006, + "step": 7079 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951303307062814e-06, + "loss": 0.563, + "step": 7080 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951276029076286e-06, + "loss": 1.0605, + "step": 7081 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951248743470527e-06, + "loss": 0.748, + "step": 7082 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951221450245554e-06, + "loss": 0.8906, + "step": 7083 + }, + { + "epoch": 0.18, + "learning_rate": 1.995119414940139e-06, + "loss": 0.9375, + "step": 7084 + }, + { + "epoch": 0.18, + "learning_rate": 1.995116684093805e-06, + "loss": 0.6401, + "step": 7085 + }, + { + "epoch": 0.18, + "learning_rate": 1.995113952485556e-06, + "loss": 0.8809, + "step": 7086 + }, + { + "epoch": 0.18, + "learning_rate": 1.995111220115394e-06, + "loss": 1.1152, + "step": 7087 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951084869833212e-06, + "loss": 0.8447, + "step": 7088 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951057530893393e-06, + "loss": 0.9277, + "step": 7089 + }, + { + "epoch": 0.18, + "learning_rate": 1.995103018433451e-06, + "loss": 1.1357, + "step": 7090 + }, + { + "epoch": 0.18, + "learning_rate": 1.9951002830156583e-06, + "loss": 0.8564, + "step": 7091 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950975468359626e-06, + "loss": 0.9121, + "step": 7092 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950948098943667e-06, + "loss": 0.7568, + "step": 7093 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950920721908723e-06, + "loss": 0.9619, + "step": 7094 + }, + { + "epoch": 0.18, + "learning_rate": 1.995089333725482e-06, + "loss": 0.8184, + "step": 7095 + }, + { + "epoch": 0.18, + "learning_rate": 1.995086594498197e-06, + "loss": 0.9932, + "step": 7096 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950838545090205e-06, + "loss": 0.8848, + "step": 7097 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950811137579536e-06, + "loss": 0.7493, + "step": 7098 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950783722449993e-06, + "loss": 0.8135, + "step": 7099 + }, + { + "epoch": 0.18, + "learning_rate": 1.995075629970159e-06, + "loss": 0.75, + "step": 7100 + }, + { + "epoch": 0.18, + "learning_rate": 1.995072886933435e-06, + "loss": 1.2041, + "step": 7101 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950701431348294e-06, + "loss": 1.0693, + "step": 7102 + }, + { + "epoch": 0.18, + "learning_rate": 1.995067398574344e-06, + "loss": 0.7173, + "step": 7103 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950646532519823e-06, + "loss": 0.7988, + "step": 7104 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950619071677445e-06, + "loss": 1.0146, + "step": 7105 + }, + { + "epoch": 0.18, + "learning_rate": 1.995059160321634e-06, + "loss": 1.0312, + "step": 7106 + }, + { + "epoch": 0.18, + "learning_rate": 1.995056412713652e-06, + "loss": 1.04, + "step": 7107 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950536643438016e-06, + "loss": 0.959, + "step": 7108 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950509152120836e-06, + "loss": 0.8564, + "step": 7109 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950481653185014e-06, + "loss": 0.8662, + "step": 7110 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950454146630567e-06, + "loss": 1.0713, + "step": 7111 + }, + { + "epoch": 0.18, + "learning_rate": 1.995042663245751e-06, + "loss": 0.7812, + "step": 7112 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950399110665874e-06, + "loss": 0.874, + "step": 7113 + }, + { + "epoch": 0.18, + "learning_rate": 1.995037158125567e-06, + "loss": 1.1416, + "step": 7114 + }, + { + "epoch": 0.18, + "learning_rate": 1.995034404422693e-06, + "loss": 0.8652, + "step": 7115 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950316499579666e-06, + "loss": 1.0664, + "step": 7116 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950288947313905e-06, + "loss": 0.7529, + "step": 7117 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950261387429657e-06, + "loss": 1.002, + "step": 7118 + }, + { + "epoch": 0.18, + "learning_rate": 1.995023381992696e-06, + "loss": 1.0205, + "step": 7119 + }, + { + "epoch": 0.18, + "learning_rate": 1.995020624480582e-06, + "loss": 0.8364, + "step": 7120 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950178662066267e-06, + "loss": 1.0166, + "step": 7121 + }, + { + "epoch": 0.18, + "learning_rate": 1.995015107170832e-06, + "loss": 0.7754, + "step": 7122 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950123473732e-06, + "loss": 0.9766, + "step": 7123 + }, + { + "epoch": 0.18, + "learning_rate": 1.995009586813733e-06, + "loss": 0.833, + "step": 7124 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950068254924324e-06, + "loss": 0.8438, + "step": 7125 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950040634093015e-06, + "loss": 0.8965, + "step": 7126 + }, + { + "epoch": 0.18, + "learning_rate": 1.9950013005643412e-06, + "loss": 0.7837, + "step": 7127 + }, + { + "epoch": 0.18, + "learning_rate": 1.994998536957555e-06, + "loss": 1.1055, + "step": 7128 + }, + { + "epoch": 0.18, + "learning_rate": 1.994995772588943e-06, + "loss": 0.8145, + "step": 7129 + }, + { + "epoch": 0.18, + "learning_rate": 1.994993007458509e-06, + "loss": 0.8496, + "step": 7130 + }, + { + "epoch": 0.18, + "learning_rate": 1.9949902415662547e-06, + "loss": 0.7461, + "step": 7131 + }, + { + "epoch": 0.18, + "learning_rate": 1.994987474912182e-06, + "loss": 0.8174, + "step": 7132 + }, + { + "epoch": 0.18, + "learning_rate": 1.994984707496293e-06, + "loss": 1.0664, + "step": 7133 + }, + { + "epoch": 0.18, + "learning_rate": 1.9949819393185905e-06, + "loss": 0.9561, + "step": 7134 + }, + { + "epoch": 0.18, + "learning_rate": 1.9949791703790756e-06, + "loss": 0.9453, + "step": 7135 + }, + { + "epoch": 0.18, + "learning_rate": 1.9949764006777508e-06, + "loss": 1.04, + "step": 7136 + }, + { + "epoch": 0.18, + "learning_rate": 1.994973630214619e-06, + "loss": 1.0078, + "step": 7137 + }, + { + "epoch": 0.18, + "learning_rate": 1.994970858989681e-06, + "loss": 0.9229, + "step": 7138 + }, + { + "epoch": 0.18, + "learning_rate": 1.9949680870029395e-06, + "loss": 0.8486, + "step": 7139 + }, + { + "epoch": 0.18, + "learning_rate": 1.994965314254397e-06, + "loss": 1.0635, + "step": 7140 + }, + { + "epoch": 0.18, + "learning_rate": 1.9949625407440554e-06, + "loss": 0.834, + "step": 7141 + }, + { + "epoch": 0.18, + "learning_rate": 1.9949597664719167e-06, + "loss": 0.8262, + "step": 7142 + }, + { + "epoch": 0.18, + "learning_rate": 1.994956991437983e-06, + "loss": 0.8408, + "step": 7143 + }, + { + "epoch": 0.18, + "learning_rate": 1.9949542156422564e-06, + "loss": 0.9033, + "step": 7144 + }, + { + "epoch": 0.18, + "learning_rate": 1.994951439084739e-06, + "loss": 1.0947, + "step": 7145 + }, + { + "epoch": 0.18, + "learning_rate": 1.994948661765433e-06, + "loss": 0.8262, + "step": 7146 + }, + { + "epoch": 0.18, + "learning_rate": 1.9949458836843406e-06, + "loss": 0.7266, + "step": 7147 + }, + { + "epoch": 0.18, + "learning_rate": 1.994943104841464e-06, + "loss": 0.9121, + "step": 7148 + }, + { + "epoch": 0.18, + "learning_rate": 1.9949403252368052e-06, + "loss": 0.9111, + "step": 7149 + }, + { + "epoch": 0.18, + "learning_rate": 1.9949375448703666e-06, + "loss": 0.9023, + "step": 7150 + }, + { + "epoch": 0.18, + "learning_rate": 1.9949347637421497e-06, + "loss": 0.8794, + "step": 7151 + }, + { + "epoch": 0.18, + "learning_rate": 1.994931981852157e-06, + "loss": 0.9229, + "step": 7152 + }, + { + "epoch": 0.18, + "learning_rate": 1.9949291992003905e-06, + "loss": 0.8164, + "step": 7153 + }, + { + "epoch": 0.18, + "learning_rate": 1.994926415786853e-06, + "loss": 1.0439, + "step": 7154 + }, + { + "epoch": 0.18, + "learning_rate": 1.994923631611546e-06, + "loss": 1.0391, + "step": 7155 + }, + { + "epoch": 0.18, + "learning_rate": 1.9949208466744713e-06, + "loss": 0.521, + "step": 7156 + }, + { + "epoch": 0.18, + "learning_rate": 1.9949180609756316e-06, + "loss": 0.9307, + "step": 7157 + }, + { + "epoch": 0.18, + "learning_rate": 1.994915274515029e-06, + "loss": 0.9014, + "step": 7158 + }, + { + "epoch": 0.18, + "learning_rate": 1.9949124872926654e-06, + "loss": 0.9453, + "step": 7159 + }, + { + "epoch": 0.18, + "learning_rate": 1.994909699308543e-06, + "loss": 0.7358, + "step": 7160 + }, + { + "epoch": 0.18, + "learning_rate": 1.9949069105626645e-06, + "loss": 0.9111, + "step": 7161 + }, + { + "epoch": 0.18, + "learning_rate": 1.994904121055031e-06, + "loss": 0.9932, + "step": 7162 + }, + { + "epoch": 0.18, + "learning_rate": 1.9949013307856456e-06, + "loss": 1.0146, + "step": 7163 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948985397545095e-06, + "loss": 0.8325, + "step": 7164 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948957479616256e-06, + "loss": 0.8965, + "step": 7165 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948929554069956e-06, + "loss": 1.0391, + "step": 7166 + }, + { + "epoch": 0.18, + "learning_rate": 1.994890162090622e-06, + "loss": 0.6484, + "step": 7167 + }, + { + "epoch": 0.18, + "learning_rate": 1.994887368012507e-06, + "loss": 0.7886, + "step": 7168 + }, + { + "epoch": 0.18, + "learning_rate": 1.994884573172652e-06, + "loss": 0.8848, + "step": 7169 + }, + { + "epoch": 0.18, + "learning_rate": 1.99488177757106e-06, + "loss": 0.96, + "step": 7170 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948789812077323e-06, + "loss": 0.9023, + "step": 7171 + }, + { + "epoch": 0.18, + "learning_rate": 1.994876184082672e-06, + "loss": 0.8535, + "step": 7172 + }, + { + "epoch": 0.18, + "learning_rate": 1.99487338619588e-06, + "loss": 0.9541, + "step": 7173 + }, + { + "epoch": 0.18, + "learning_rate": 1.99487058754736e-06, + "loss": 0.9487, + "step": 7174 + }, + { + "epoch": 0.18, + "learning_rate": 1.994867788137113e-06, + "loss": 0.8975, + "step": 7175 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948649879651414e-06, + "loss": 0.8369, + "step": 7176 + }, + { + "epoch": 0.18, + "learning_rate": 1.994862187031448e-06, + "loss": 0.8005, + "step": 7177 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948593853360337e-06, + "loss": 0.9316, + "step": 7178 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948565828789013e-06, + "loss": 0.7136, + "step": 7179 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948537796600533e-06, + "loss": 0.8613, + "step": 7180 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948509756794914e-06, + "loss": 1.0352, + "step": 7181 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948481709372182e-06, + "loss": 0.8926, + "step": 7182 + }, + { + "epoch": 0.18, + "learning_rate": 1.994845365433235e-06, + "loss": 0.8857, + "step": 7183 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948425591675447e-06, + "loss": 0.9629, + "step": 7184 + }, + { + "epoch": 0.18, + "learning_rate": 1.994839752140149e-06, + "loss": 0.9014, + "step": 7185 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948369443510504e-06, + "loss": 1.1328, + "step": 7186 + }, + { + "epoch": 0.18, + "learning_rate": 1.994834135800251e-06, + "loss": 0.719, + "step": 7187 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948313264877524e-06, + "loss": 0.9141, + "step": 7188 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948285164135575e-06, + "loss": 0.9414, + "step": 7189 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948257055776683e-06, + "loss": 0.9443, + "step": 7190 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948228939800864e-06, + "loss": 0.9404, + "step": 7191 + }, + { + "epoch": 0.18, + "learning_rate": 1.994820081620815e-06, + "loss": 0.9492, + "step": 7192 + }, + { + "epoch": 0.18, + "learning_rate": 1.994817268499855e-06, + "loss": 0.9619, + "step": 7193 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948144546172093e-06, + "loss": 0.8218, + "step": 7194 + }, + { + "epoch": 0.18, + "learning_rate": 1.99481163997288e-06, + "loss": 0.793, + "step": 7195 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948088245668694e-06, + "loss": 0.9922, + "step": 7196 + }, + { + "epoch": 0.18, + "learning_rate": 1.994806008399179e-06, + "loss": 1.0967, + "step": 7197 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948031914698117e-06, + "loss": 0.8188, + "step": 7198 + }, + { + "epoch": 0.18, + "learning_rate": 1.9948003737787688e-06, + "loss": 1.0088, + "step": 7199 + }, + { + "epoch": 0.18, + "learning_rate": 1.9947975553260535e-06, + "loss": 0.9053, + "step": 7200 + }, + { + "epoch": 0.18, + "learning_rate": 1.9947947361116672e-06, + "loss": 0.9307, + "step": 7201 + }, + { + "epoch": 0.18, + "learning_rate": 1.9947919161356128e-06, + "loss": 0.9033, + "step": 7202 + }, + { + "epoch": 0.18, + "learning_rate": 1.9947890953978915e-06, + "loss": 0.8857, + "step": 7203 + }, + { + "epoch": 0.18, + "learning_rate": 1.994786273898506e-06, + "loss": 0.8311, + "step": 7204 + }, + { + "epoch": 0.18, + "learning_rate": 1.9947834516374585e-06, + "loss": 1.0156, + "step": 7205 + }, + { + "epoch": 0.18, + "learning_rate": 1.9947806286147507e-06, + "loss": 1.1172, + "step": 7206 + }, + { + "epoch": 0.18, + "learning_rate": 1.9947778048303857e-06, + "loss": 0.8281, + "step": 7207 + }, + { + "epoch": 0.18, + "learning_rate": 1.994774980284365e-06, + "loss": 0.915, + "step": 7208 + }, + { + "epoch": 0.18, + "learning_rate": 1.9947721549766903e-06, + "loss": 0.8955, + "step": 7209 + }, + { + "epoch": 0.18, + "learning_rate": 1.9947693289073646e-06, + "loss": 0.7788, + "step": 7210 + }, + { + "epoch": 0.18, + "learning_rate": 1.99476650207639e-06, + "loss": 0.7622, + "step": 7211 + }, + { + "epoch": 0.18, + "learning_rate": 1.994763674483768e-06, + "loss": 0.8833, + "step": 7212 + }, + { + "epoch": 0.18, + "learning_rate": 1.9947608461295016e-06, + "loss": 0.7998, + "step": 7213 + }, + { + "epoch": 0.18, + "learning_rate": 1.9947580170135923e-06, + "loss": 0.8906, + "step": 7214 + }, + { + "epoch": 0.18, + "learning_rate": 1.9947551871360425e-06, + "loss": 0.8906, + "step": 7215 + }, + { + "epoch": 0.18, + "learning_rate": 1.9947523564968546e-06, + "loss": 0.9287, + "step": 7216 + }, + { + "epoch": 0.18, + "learning_rate": 1.9947495250960308e-06, + "loss": 0.8115, + "step": 7217 + }, + { + "epoch": 0.19, + "learning_rate": 1.9947466929335723e-06, + "loss": 0.7881, + "step": 7218 + }, + { + "epoch": 0.19, + "learning_rate": 1.9947438600094825e-06, + "loss": 0.9492, + "step": 7219 + }, + { + "epoch": 0.19, + "learning_rate": 1.9947410263237628e-06, + "loss": 1.0107, + "step": 7220 + }, + { + "epoch": 0.19, + "learning_rate": 1.994738191876416e-06, + "loss": 0.7556, + "step": 7221 + }, + { + "epoch": 0.19, + "learning_rate": 1.994735356667444e-06, + "loss": 0.874, + "step": 7222 + }, + { + "epoch": 0.19, + "learning_rate": 1.994732520696848e-06, + "loss": 0.689, + "step": 7223 + }, + { + "epoch": 0.19, + "learning_rate": 1.994729683964632e-06, + "loss": 0.8447, + "step": 7224 + }, + { + "epoch": 0.19, + "learning_rate": 1.9947268464707965e-06, + "loss": 0.6499, + "step": 7225 + }, + { + "epoch": 0.19, + "learning_rate": 1.994724008215345e-06, + "loss": 1.0762, + "step": 7226 + }, + { + "epoch": 0.19, + "learning_rate": 1.9947211691982787e-06, + "loss": 0.7109, + "step": 7227 + }, + { + "epoch": 0.19, + "learning_rate": 1.9947183294196003e-06, + "loss": 0.8511, + "step": 7228 + }, + { + "epoch": 0.19, + "learning_rate": 1.9947154888793117e-06, + "loss": 0.877, + "step": 7229 + }, + { + "epoch": 0.19, + "learning_rate": 1.994712647577415e-06, + "loss": 1.0337, + "step": 7230 + }, + { + "epoch": 0.19, + "learning_rate": 1.994709805513913e-06, + "loss": 0.875, + "step": 7231 + }, + { + "epoch": 0.19, + "learning_rate": 1.994706962688807e-06, + "loss": 1.1074, + "step": 7232 + }, + { + "epoch": 0.19, + "learning_rate": 1.9947041191021e-06, + "loss": 0.9453, + "step": 7233 + }, + { + "epoch": 0.19, + "learning_rate": 1.994701274753794e-06, + "loss": 0.9209, + "step": 7234 + }, + { + "epoch": 0.19, + "learning_rate": 1.99469842964389e-06, + "loss": 1.0293, + "step": 7235 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946955837723923e-06, + "loss": 0.8037, + "step": 7236 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946927371393013e-06, + "loss": 0.8916, + "step": 7237 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946898897446197e-06, + "loss": 0.707, + "step": 7238 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946870415883504e-06, + "loss": 0.8994, + "step": 7239 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946841926704943e-06, + "loss": 0.8955, + "step": 7240 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946813429910544e-06, + "loss": 0.7695, + "step": 7241 + }, + { + "epoch": 0.19, + "learning_rate": 1.994678492550033e-06, + "loss": 0.7661, + "step": 7242 + }, + { + "epoch": 0.19, + "learning_rate": 1.994675641347432e-06, + "loss": 0.8838, + "step": 7243 + }, + { + "epoch": 0.19, + "learning_rate": 1.994672789383253e-06, + "loss": 0.876, + "step": 7244 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946699366574995e-06, + "loss": 0.877, + "step": 7245 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946670831701726e-06, + "loss": 0.9756, + "step": 7246 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946642289212754e-06, + "loss": 0.9648, + "step": 7247 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946613739108087e-06, + "loss": 0.7588, + "step": 7248 + }, + { + "epoch": 0.19, + "learning_rate": 1.994658518138776e-06, + "loss": 0.8223, + "step": 7249 + }, + { + "epoch": 0.19, + "learning_rate": 1.994655661605179e-06, + "loss": 1.0186, + "step": 7250 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946528043100196e-06, + "loss": 1.0996, + "step": 7251 + }, + { + "epoch": 0.19, + "learning_rate": 1.994649946253301e-06, + "loss": 0.9053, + "step": 7252 + }, + { + "epoch": 0.19, + "learning_rate": 1.994647087435024e-06, + "loss": 0.9951, + "step": 7253 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946442278551915e-06, + "loss": 0.9541, + "step": 7254 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946413675138057e-06, + "loss": 0.8594, + "step": 7255 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946385064108686e-06, + "loss": 0.8604, + "step": 7256 + }, + { + "epoch": 0.19, + "learning_rate": 1.994635644546383e-06, + "loss": 0.833, + "step": 7257 + }, + { + "epoch": 0.19, + "learning_rate": 1.99463278192035e-06, + "loss": 0.8291, + "step": 7258 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946299185327734e-06, + "loss": 1.0762, + "step": 7259 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946270543836534e-06, + "loss": 0.916, + "step": 7260 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946241894729937e-06, + "loss": 0.8955, + "step": 7261 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946213238007963e-06, + "loss": 1.0254, + "step": 7262 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946184573670624e-06, + "loss": 0.96, + "step": 7263 + }, + { + "epoch": 0.19, + "learning_rate": 1.994615590171795e-06, + "loss": 0.7593, + "step": 7264 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946127222149966e-06, + "loss": 0.8069, + "step": 7265 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946098534966683e-06, + "loss": 0.8857, + "step": 7266 + }, + { + "epoch": 0.19, + "learning_rate": 1.994606984016814e-06, + "loss": 0.915, + "step": 7267 + }, + { + "epoch": 0.19, + "learning_rate": 1.994604113775434e-06, + "loss": 0.7969, + "step": 7268 + }, + { + "epoch": 0.19, + "learning_rate": 1.9946012427725317e-06, + "loss": 0.9639, + "step": 7269 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945983710081087e-06, + "loss": 0.9639, + "step": 7270 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945954984821675e-06, + "loss": 0.7949, + "step": 7271 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945926251947106e-06, + "loss": 0.8667, + "step": 7272 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945897511457393e-06, + "loss": 0.8604, + "step": 7273 + }, + { + "epoch": 0.19, + "learning_rate": 1.994586876335257e-06, + "loss": 0.7852, + "step": 7274 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945840007632647e-06, + "loss": 0.8643, + "step": 7275 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945811244297655e-06, + "loss": 0.9043, + "step": 7276 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945782473347613e-06, + "loss": 0.8428, + "step": 7277 + }, + { + "epoch": 0.19, + "learning_rate": 1.994575369478254e-06, + "loss": 1.0312, + "step": 7278 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945724908602465e-06, + "loss": 0.8804, + "step": 7279 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945696114807402e-06, + "loss": 0.9688, + "step": 7280 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945667313397378e-06, + "loss": 0.9893, + "step": 7281 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945638504372412e-06, + "loss": 0.9072, + "step": 7282 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945609687732528e-06, + "loss": 0.9717, + "step": 7283 + }, + { + "epoch": 0.19, + "learning_rate": 1.994558086347775e-06, + "loss": 1.0977, + "step": 7284 + }, + { + "epoch": 0.19, + "learning_rate": 1.99455520316081e-06, + "loss": 0.8975, + "step": 7285 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945523192123595e-06, + "loss": 0.9971, + "step": 7286 + }, + { + "epoch": 0.19, + "learning_rate": 1.994549434502426e-06, + "loss": 0.9355, + "step": 7287 + }, + { + "epoch": 0.19, + "learning_rate": 1.994546549031012e-06, + "loss": 0.8955, + "step": 7288 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945436627981192e-06, + "loss": 1.1318, + "step": 7289 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945407758037503e-06, + "loss": 0.8936, + "step": 7290 + }, + { + "epoch": 0.19, + "learning_rate": 1.994537888047907e-06, + "loss": 0.71, + "step": 7291 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945349995305917e-06, + "loss": 0.9395, + "step": 7292 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945321102518067e-06, + "loss": 1.0449, + "step": 7293 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945292202115543e-06, + "loss": 0.8389, + "step": 7294 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945263294098367e-06, + "loss": 0.6997, + "step": 7295 + }, + { + "epoch": 0.19, + "learning_rate": 1.994523437846656e-06, + "loss": 1.0391, + "step": 7296 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945205455220146e-06, + "loss": 0.9619, + "step": 7297 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945176524359143e-06, + "loss": 0.8037, + "step": 7298 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945147585883576e-06, + "loss": 0.9805, + "step": 7299 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945118639793463e-06, + "loss": 0.7705, + "step": 7300 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945089686088833e-06, + "loss": 0.9082, + "step": 7301 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945060724769707e-06, + "loss": 0.7349, + "step": 7302 + }, + { + "epoch": 0.19, + "learning_rate": 1.9945031755836107e-06, + "loss": 0.9961, + "step": 7303 + }, + { + "epoch": 0.19, + "learning_rate": 1.994500277928805e-06, + "loss": 1.0137, + "step": 7304 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944973795125558e-06, + "loss": 0.959, + "step": 7305 + }, + { + "epoch": 0.19, + "learning_rate": 1.994494480334866e-06, + "loss": 1.0039, + "step": 7306 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944915803957377e-06, + "loss": 1.0146, + "step": 7307 + }, + { + "epoch": 0.19, + "learning_rate": 1.994488679695173e-06, + "loss": 1.083, + "step": 7308 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944857782331738e-06, + "loss": 0.6694, + "step": 7309 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944828760097424e-06, + "loss": 0.998, + "step": 7310 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944799730248814e-06, + "loss": 0.7983, + "step": 7311 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944770692785932e-06, + "loss": 0.7266, + "step": 7312 + }, + { + "epoch": 0.19, + "learning_rate": 1.994474164770879e-06, + "loss": 0.9531, + "step": 7313 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944712595017422e-06, + "loss": 0.6921, + "step": 7314 + }, + { + "epoch": 0.19, + "learning_rate": 1.994468353471184e-06, + "loss": 1.0596, + "step": 7315 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944654466792073e-06, + "loss": 0.8262, + "step": 7316 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944625391258143e-06, + "loss": 0.9326, + "step": 7317 + }, + { + "epoch": 0.19, + "learning_rate": 1.994459630811007e-06, + "loss": 1.0967, + "step": 7318 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944567217347873e-06, + "loss": 1.082, + "step": 7319 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944538118971582e-06, + "loss": 1.0322, + "step": 7320 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944509012981215e-06, + "loss": 0.8164, + "step": 7321 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944479899376793e-06, + "loss": 0.9023, + "step": 7322 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944450778158345e-06, + "loss": 0.8965, + "step": 7323 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944421649325883e-06, + "loss": 0.9541, + "step": 7324 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944392512879434e-06, + "loss": 0.7109, + "step": 7325 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944363368819028e-06, + "loss": 1.0537, + "step": 7326 + }, + { + "epoch": 0.19, + "learning_rate": 1.994433421714467e-06, + "loss": 0.8486, + "step": 7327 + }, + { + "epoch": 0.19, + "learning_rate": 1.99443050578564e-06, + "loss": 0.8633, + "step": 7328 + }, + { + "epoch": 0.19, + "learning_rate": 1.994427589095423e-06, + "loss": 0.8267, + "step": 7329 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944246716438185e-06, + "loss": 1.0576, + "step": 7330 + }, + { + "epoch": 0.19, + "learning_rate": 1.994421753430829e-06, + "loss": 0.7739, + "step": 7331 + }, + { + "epoch": 0.19, + "learning_rate": 1.994418834456456e-06, + "loss": 0.8457, + "step": 7332 + }, + { + "epoch": 0.19, + "learning_rate": 1.994415914720703e-06, + "loss": 0.9775, + "step": 7333 + }, + { + "epoch": 0.19, + "learning_rate": 1.994412994223571e-06, + "loss": 0.582, + "step": 7334 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944100729650628e-06, + "loss": 0.9688, + "step": 7335 + }, + { + "epoch": 0.19, + "learning_rate": 1.99440715094518e-06, + "loss": 0.8457, + "step": 7336 + }, + { + "epoch": 0.19, + "learning_rate": 1.9944042281639263e-06, + "loss": 1.0566, + "step": 7337 + }, + { + "epoch": 0.19, + "learning_rate": 1.994401304621302e-06, + "loss": 1.25, + "step": 7338 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943983803173112e-06, + "loss": 0.9736, + "step": 7339 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943954552519547e-06, + "loss": 1.0752, + "step": 7340 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943925294252358e-06, + "loss": 0.9326, + "step": 7341 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943896028371562e-06, + "loss": 1.0645, + "step": 7342 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943866754877177e-06, + "loss": 0.6782, + "step": 7343 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943837473769232e-06, + "loss": 0.7925, + "step": 7344 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943808185047753e-06, + "loss": 0.7178, + "step": 7345 + }, + { + "epoch": 0.19, + "learning_rate": 1.994377888871275e-06, + "loss": 1.0166, + "step": 7346 + }, + { + "epoch": 0.19, + "learning_rate": 1.994374958476426e-06, + "loss": 0.9385, + "step": 7347 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943720273202295e-06, + "loss": 1.1289, + "step": 7348 + }, + { + "epoch": 0.19, + "learning_rate": 1.994369095402688e-06, + "loss": 0.9521, + "step": 7349 + }, + { + "epoch": 0.19, + "learning_rate": 1.994366162723804e-06, + "loss": 1.1465, + "step": 7350 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943632292835797e-06, + "loss": 0.8701, + "step": 7351 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943602950820165e-06, + "loss": 0.7788, + "step": 7352 + }, + { + "epoch": 0.19, + "learning_rate": 1.994357360119118e-06, + "loss": 0.8955, + "step": 7353 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943544243948852e-06, + "loss": 1.0029, + "step": 7354 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943514879093214e-06, + "loss": 1.001, + "step": 7355 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943485506624283e-06, + "loss": 0.8691, + "step": 7356 + }, + { + "epoch": 0.19, + "learning_rate": 1.994345612654208e-06, + "loss": 0.9512, + "step": 7357 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943426738846635e-06, + "loss": 1.0195, + "step": 7358 + }, + { + "epoch": 0.19, + "learning_rate": 1.994339734353796e-06, + "loss": 0.917, + "step": 7359 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943367940616085e-06, + "loss": 1.0186, + "step": 7360 + }, + { + "epoch": 0.19, + "learning_rate": 1.994333853008103e-06, + "loss": 0.9756, + "step": 7361 + }, + { + "epoch": 0.19, + "learning_rate": 1.994330911193282e-06, + "loss": 0.6533, + "step": 7362 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943279686171473e-06, + "loss": 0.7783, + "step": 7363 + }, + { + "epoch": 0.19, + "learning_rate": 1.994325025279702e-06, + "loss": 1.5605, + "step": 7364 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943220811809466e-06, + "loss": 0.834, + "step": 7365 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943191363208854e-06, + "loss": 0.9365, + "step": 7366 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943161906995194e-06, + "loss": 0.8403, + "step": 7367 + }, + { + "epoch": 0.19, + "learning_rate": 1.994313244316851e-06, + "loss": 0.9189, + "step": 7368 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943102971728833e-06, + "loss": 1.0781, + "step": 7369 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943073492676175e-06, + "loss": 0.8613, + "step": 7370 + }, + { + "epoch": 0.19, + "learning_rate": 1.9943044006010563e-06, + "loss": 1.0049, + "step": 7371 + }, + { + "epoch": 0.19, + "learning_rate": 1.994301451173202e-06, + "loss": 0.8955, + "step": 7372 + }, + { + "epoch": 0.19, + "learning_rate": 1.994298500984057e-06, + "loss": 0.9014, + "step": 7373 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942955500336233e-06, + "loss": 0.7783, + "step": 7374 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942925983219027e-06, + "loss": 0.6914, + "step": 7375 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942896458488987e-06, + "loss": 1.0244, + "step": 7376 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942866926146123e-06, + "loss": 0.8857, + "step": 7377 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942837386190466e-06, + "loss": 0.9277, + "step": 7378 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942807838622033e-06, + "loss": 0.9038, + "step": 7379 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942778283440853e-06, + "loss": 0.9028, + "step": 7380 + }, + { + "epoch": 0.19, + "learning_rate": 1.994274872064694e-06, + "loss": 0.9639, + "step": 7381 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942719150240324e-06, + "loss": 0.9912, + "step": 7382 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942689572221027e-06, + "loss": 0.8687, + "step": 7383 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942659986589067e-06, + "loss": 0.9717, + "step": 7384 + }, + { + "epoch": 0.19, + "learning_rate": 1.994263039334447e-06, + "loss": 0.7974, + "step": 7385 + }, + { + "epoch": 0.19, + "learning_rate": 1.994260079248726e-06, + "loss": 0.6245, + "step": 7386 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942571184017454e-06, + "loss": 1.1426, + "step": 7387 + }, + { + "epoch": 0.19, + "learning_rate": 1.994254156793508e-06, + "loss": 0.8594, + "step": 7388 + }, + { + "epoch": 0.19, + "learning_rate": 1.994251194424016e-06, + "loss": 0.8174, + "step": 7389 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942482312932717e-06, + "loss": 0.9873, + "step": 7390 + }, + { + "epoch": 0.19, + "learning_rate": 1.994245267401277e-06, + "loss": 0.6895, + "step": 7391 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942423027480345e-06, + "loss": 1.0361, + "step": 7392 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942393373335465e-06, + "loss": 0.9521, + "step": 7393 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942363711578147e-06, + "loss": 0.8557, + "step": 7394 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942334042208426e-06, + "loss": 0.7202, + "step": 7395 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942304365226314e-06, + "loss": 0.7256, + "step": 7396 + }, + { + "epoch": 0.19, + "learning_rate": 1.994227468063183e-06, + "loss": 0.9971, + "step": 7397 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942244988425014e-06, + "loss": 0.9131, + "step": 7398 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942215288605872e-06, + "loss": 0.9756, + "step": 7399 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942185581174433e-06, + "loss": 1.0547, + "step": 7400 + }, + { + "epoch": 0.19, + "learning_rate": 1.994215586613072e-06, + "loss": 0.8662, + "step": 7401 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942126143474755e-06, + "loss": 0.9355, + "step": 7402 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942096413206562e-06, + "loss": 0.9717, + "step": 7403 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942066675326165e-06, + "loss": 0.877, + "step": 7404 + }, + { + "epoch": 0.19, + "learning_rate": 1.9942036929833584e-06, + "loss": 0.9004, + "step": 7405 + }, + { + "epoch": 0.19, + "learning_rate": 1.994200717672884e-06, + "loss": 1.0322, + "step": 7406 + }, + { + "epoch": 0.19, + "learning_rate": 1.994197741601196e-06, + "loss": 1.0264, + "step": 7407 + }, + { + "epoch": 0.19, + "learning_rate": 1.9941947647682965e-06, + "loss": 0.8984, + "step": 7408 + }, + { + "epoch": 0.19, + "learning_rate": 1.994191787174188e-06, + "loss": 0.7466, + "step": 7409 + }, + { + "epoch": 0.19, + "learning_rate": 1.994188808818872e-06, + "loss": 0.9873, + "step": 7410 + }, + { + "epoch": 0.19, + "learning_rate": 1.9941858297023517e-06, + "loss": 0.8062, + "step": 7411 + }, + { + "epoch": 0.19, + "learning_rate": 1.9941828498246288e-06, + "loss": 0.7295, + "step": 7412 + }, + { + "epoch": 0.19, + "learning_rate": 1.994179869185706e-06, + "loss": 0.6675, + "step": 7413 + }, + { + "epoch": 0.19, + "learning_rate": 1.9941768877855854e-06, + "loss": 0.7119, + "step": 7414 + }, + { + "epoch": 0.19, + "learning_rate": 1.994173905624269e-06, + "loss": 0.8906, + "step": 7415 + }, + { + "epoch": 0.19, + "learning_rate": 1.9941709227017597e-06, + "loss": 0.8887, + "step": 7416 + }, + { + "epoch": 0.19, + "learning_rate": 1.9941679390180598e-06, + "loss": 0.647, + "step": 7417 + }, + { + "epoch": 0.19, + "learning_rate": 1.9941649545731703e-06, + "loss": 0.9014, + "step": 7418 + }, + { + "epoch": 0.19, + "learning_rate": 1.994161969367095e-06, + "loss": 0.8574, + "step": 7419 + }, + { + "epoch": 0.19, + "learning_rate": 1.9941589833998354e-06, + "loss": 0.8516, + "step": 7420 + }, + { + "epoch": 0.19, + "learning_rate": 1.9941559966713943e-06, + "loss": 0.9648, + "step": 7421 + }, + { + "epoch": 0.19, + "learning_rate": 1.9941530091817733e-06, + "loss": 0.752, + "step": 7422 + }, + { + "epoch": 0.19, + "learning_rate": 1.994150020930975e-06, + "loss": 0.9902, + "step": 7423 + }, + { + "epoch": 0.19, + "learning_rate": 1.994147031919002e-06, + "loss": 0.9414, + "step": 7424 + }, + { + "epoch": 0.19, + "learning_rate": 1.994144042145856e-06, + "loss": 0.8643, + "step": 7425 + }, + { + "epoch": 0.19, + "learning_rate": 1.99414105161154e-06, + "loss": 0.748, + "step": 7426 + }, + { + "epoch": 0.19, + "learning_rate": 1.9941380603160556e-06, + "loss": 1.002, + "step": 7427 + }, + { + "epoch": 0.19, + "learning_rate": 1.994135068259406e-06, + "loss": 1.0176, + "step": 7428 + }, + { + "epoch": 0.19, + "learning_rate": 1.994132075441592e-06, + "loss": 0.8223, + "step": 7429 + }, + { + "epoch": 0.19, + "learning_rate": 1.9941290818626175e-06, + "loss": 0.9873, + "step": 7430 + }, + { + "epoch": 0.19, + "learning_rate": 1.9941260875224838e-06, + "loss": 0.9893, + "step": 7431 + }, + { + "epoch": 0.19, + "learning_rate": 1.9941230924211935e-06, + "loss": 0.8389, + "step": 7432 + }, + { + "epoch": 0.19, + "learning_rate": 1.9941200965587484e-06, + "loss": 1.0654, + "step": 7433 + }, + { + "epoch": 0.19, + "learning_rate": 1.994117099935152e-06, + "loss": 1.0889, + "step": 7434 + }, + { + "epoch": 0.19, + "learning_rate": 1.994114102550405e-06, + "loss": 1.0, + "step": 7435 + }, + { + "epoch": 0.19, + "learning_rate": 1.9941111044045113e-06, + "loss": 0.8447, + "step": 7436 + }, + { + "epoch": 0.19, + "learning_rate": 1.9941081054974724e-06, + "loss": 0.8379, + "step": 7437 + }, + { + "epoch": 0.19, + "learning_rate": 1.9941051058292905e-06, + "loss": 0.8301, + "step": 7438 + }, + { + "epoch": 0.19, + "learning_rate": 1.9941021053999677e-06, + "loss": 0.9785, + "step": 7439 + }, + { + "epoch": 0.19, + "learning_rate": 1.994099104209507e-06, + "loss": 1.0283, + "step": 7440 + }, + { + "epoch": 0.19, + "learning_rate": 1.9940961022579102e-06, + "loss": 0.877, + "step": 7441 + }, + { + "epoch": 0.19, + "learning_rate": 1.99409309954518e-06, + "loss": 0.8828, + "step": 7442 + }, + { + "epoch": 0.19, + "learning_rate": 1.994090096071318e-06, + "loss": 0.8896, + "step": 7443 + }, + { + "epoch": 0.19, + "learning_rate": 1.9940870918363273e-06, + "loss": 0.958, + "step": 7444 + }, + { + "epoch": 0.19, + "learning_rate": 1.9940840868402094e-06, + "loss": 0.8154, + "step": 7445 + }, + { + "epoch": 0.19, + "learning_rate": 1.9940810810829673e-06, + "loss": 0.9277, + "step": 7446 + }, + { + "epoch": 0.19, + "learning_rate": 1.994078074564603e-06, + "loss": 0.7729, + "step": 7447 + }, + { + "epoch": 0.19, + "learning_rate": 1.9940750672851185e-06, + "loss": 0.9639, + "step": 7448 + }, + { + "epoch": 0.19, + "learning_rate": 1.994072059244517e-06, + "loss": 1.041, + "step": 7449 + }, + { + "epoch": 0.19, + "learning_rate": 1.9940690504428e-06, + "loss": 0.9199, + "step": 7450 + }, + { + "epoch": 0.19, + "learning_rate": 1.9940660408799696e-06, + "loss": 1.0669, + "step": 7451 + }, + { + "epoch": 0.19, + "learning_rate": 1.994063030556029e-06, + "loss": 0.9043, + "step": 7452 + }, + { + "epoch": 0.19, + "learning_rate": 1.99406001947098e-06, + "loss": 0.7607, + "step": 7453 + }, + { + "epoch": 0.19, + "learning_rate": 1.994057007624825e-06, + "loss": 0.9385, + "step": 7454 + }, + { + "epoch": 0.19, + "learning_rate": 1.994053995017566e-06, + "loss": 0.9775, + "step": 7455 + }, + { + "epoch": 0.19, + "learning_rate": 1.994050981649206e-06, + "loss": 0.7441, + "step": 7456 + }, + { + "epoch": 0.19, + "learning_rate": 1.9940479675197465e-06, + "loss": 0.9658, + "step": 7457 + }, + { + "epoch": 0.19, + "learning_rate": 1.9940449526291904e-06, + "loss": 0.8457, + "step": 7458 + }, + { + "epoch": 0.19, + "learning_rate": 1.9940419369775395e-06, + "loss": 1.1104, + "step": 7459 + }, + { + "epoch": 0.19, + "learning_rate": 1.9940389205647965e-06, + "loss": 1.1836, + "step": 7460 + }, + { + "epoch": 0.19, + "learning_rate": 1.994035903390964e-06, + "loss": 1.0303, + "step": 7461 + }, + { + "epoch": 0.19, + "learning_rate": 1.9940328854560434e-06, + "loss": 0.9443, + "step": 7462 + }, + { + "epoch": 0.19, + "learning_rate": 1.9940298667600376e-06, + "loss": 1.1094, + "step": 7463 + }, + { + "epoch": 0.19, + "learning_rate": 1.994026847302949e-06, + "loss": 0.8555, + "step": 7464 + }, + { + "epoch": 0.19, + "learning_rate": 1.99402382708478e-06, + "loss": 0.9473, + "step": 7465 + }, + { + "epoch": 0.19, + "learning_rate": 1.994020806105532e-06, + "loss": 0.9502, + "step": 7466 + }, + { + "epoch": 0.19, + "learning_rate": 1.9940177843652084e-06, + "loss": 1.0439, + "step": 7467 + }, + { + "epoch": 0.19, + "learning_rate": 1.994014761863811e-06, + "loss": 0.7959, + "step": 7468 + }, + { + "epoch": 0.19, + "learning_rate": 1.9940117386013425e-06, + "loss": 0.96, + "step": 7469 + }, + { + "epoch": 0.19, + "learning_rate": 1.9940087145778043e-06, + "loss": 1.0293, + "step": 7470 + }, + { + "epoch": 0.19, + "learning_rate": 1.9940056897932e-06, + "loss": 0.7441, + "step": 7471 + }, + { + "epoch": 0.19, + "learning_rate": 1.9940026642475308e-06, + "loss": 0.9111, + "step": 7472 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939996379407996e-06, + "loss": 0.8877, + "step": 7473 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939966108730086e-06, + "loss": 1.0498, + "step": 7474 + }, + { + "epoch": 0.19, + "learning_rate": 1.99399358304416e-06, + "loss": 1.0127, + "step": 7475 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939905544542563e-06, + "loss": 0.9961, + "step": 7476 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939875251032997e-06, + "loss": 0.8228, + "step": 7477 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939844949912926e-06, + "loss": 1.1348, + "step": 7478 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939814641182373e-06, + "loss": 0.9082, + "step": 7479 + }, + { + "epoch": 0.19, + "learning_rate": 1.993978432484136e-06, + "loss": 1.0264, + "step": 7480 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939754000889914e-06, + "loss": 0.9473, + "step": 7481 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939723669328054e-06, + "loss": 0.8496, + "step": 7482 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939693330155802e-06, + "loss": 1.04, + "step": 7483 + }, + { + "epoch": 0.19, + "learning_rate": 1.993966298337319e-06, + "loss": 0.8682, + "step": 7484 + }, + { + "epoch": 0.19, + "learning_rate": 1.993963262898023e-06, + "loss": 0.8789, + "step": 7485 + }, + { + "epoch": 0.19, + "learning_rate": 1.993960226697695e-06, + "loss": 1.0908, + "step": 7486 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939571897363375e-06, + "loss": 0.8169, + "step": 7487 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939541520139523e-06, + "loss": 0.6921, + "step": 7488 + }, + { + "epoch": 0.19, + "learning_rate": 1.993951113530543e-06, + "loss": 0.999, + "step": 7489 + }, + { + "epoch": 0.19, + "learning_rate": 1.99394807428611e-06, + "loss": 0.877, + "step": 7490 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939450342806573e-06, + "loss": 0.7354, + "step": 7491 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939419935141865e-06, + "loss": 1.0332, + "step": 7492 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939389519867002e-06, + "loss": 0.8486, + "step": 7493 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939359096982e-06, + "loss": 0.9082, + "step": 7494 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939328666486893e-06, + "loss": 0.8667, + "step": 7495 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939298228381697e-06, + "loss": 0.8711, + "step": 7496 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939267782666435e-06, + "loss": 0.9961, + "step": 7497 + }, + { + "epoch": 0.19, + "learning_rate": 1.993923732934114e-06, + "loss": 1.002, + "step": 7498 + }, + { + "epoch": 0.19, + "learning_rate": 1.993920686840582e-06, + "loss": 1.0225, + "step": 7499 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939176399860508e-06, + "loss": 1.0195, + "step": 7500 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939145923705228e-06, + "loss": 0.8218, + "step": 7501 + }, + { + "epoch": 0.19, + "learning_rate": 1.993911543994e-06, + "loss": 0.9629, + "step": 7502 + }, + { + "epoch": 0.19, + "learning_rate": 1.9939084948564848e-06, + "loss": 1.1094, + "step": 7503 + }, + { + "epoch": 0.19, + "learning_rate": 1.99390544495798e-06, + "loss": 0.9727, + "step": 7504 + }, + { + "epoch": 0.19, + "learning_rate": 1.993902394298487e-06, + "loss": 0.9658, + "step": 7505 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938993428780085e-06, + "loss": 0.9619, + "step": 7506 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938962906965473e-06, + "loss": 0.8838, + "step": 7507 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938932377541054e-06, + "loss": 0.876, + "step": 7508 + }, + { + "epoch": 0.19, + "learning_rate": 1.993890184050685e-06, + "loss": 0.9385, + "step": 7509 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938871295862886e-06, + "loss": 0.8809, + "step": 7510 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938840743609187e-06, + "loss": 0.8579, + "step": 7511 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938810183745775e-06, + "loss": 0.6924, + "step": 7512 + }, + { + "epoch": 0.19, + "learning_rate": 1.993877961627267e-06, + "loss": 0.9336, + "step": 7513 + }, + { + "epoch": 0.19, + "learning_rate": 1.99387490411899e-06, + "loss": 0.9761, + "step": 7514 + }, + { + "epoch": 0.19, + "learning_rate": 1.993871845849749e-06, + "loss": 1.04, + "step": 7515 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938687868195456e-06, + "loss": 0.814, + "step": 7516 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938657270283823e-06, + "loss": 0.7646, + "step": 7517 + }, + { + "epoch": 0.19, + "learning_rate": 1.993862666476262e-06, + "loss": 0.7485, + "step": 7518 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938596051631872e-06, + "loss": 0.7847, + "step": 7519 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938565430891592e-06, + "loss": 1.0908, + "step": 7520 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938534802541814e-06, + "loss": 0.8213, + "step": 7521 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938504166582554e-06, + "loss": 1.1855, + "step": 7522 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938473523013838e-06, + "loss": 0.8867, + "step": 7523 + }, + { + "epoch": 0.19, + "learning_rate": 1.993844287183569e-06, + "loss": 0.9268, + "step": 7524 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938412213048135e-06, + "loss": 1.0293, + "step": 7525 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938381546651195e-06, + "loss": 0.7129, + "step": 7526 + }, + { + "epoch": 0.19, + "learning_rate": 1.993835087264489e-06, + "loss": 0.7842, + "step": 7527 + }, + { + "epoch": 0.19, + "learning_rate": 1.993832019102925e-06, + "loss": 1.0938, + "step": 7528 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938289501804295e-06, + "loss": 0.9336, + "step": 7529 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938258804970048e-06, + "loss": 0.9209, + "step": 7530 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938228100526535e-06, + "loss": 1.0977, + "step": 7531 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938197388473774e-06, + "loss": 1.0957, + "step": 7532 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938166668811794e-06, + "loss": 0.8789, + "step": 7533 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938135941540616e-06, + "loss": 1.0234, + "step": 7534 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938105206660266e-06, + "loss": 1.0132, + "step": 7535 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938074464170765e-06, + "loss": 0.8574, + "step": 7536 + }, + { + "epoch": 0.19, + "learning_rate": 1.993804371407214e-06, + "loss": 0.8525, + "step": 7537 + }, + { + "epoch": 0.19, + "learning_rate": 1.9938012956364407e-06, + "loss": 1.2109, + "step": 7538 + }, + { + "epoch": 0.19, + "learning_rate": 1.9937982191047596e-06, + "loss": 0.9805, + "step": 7539 + }, + { + "epoch": 0.19, + "learning_rate": 1.993795141812173e-06, + "loss": 0.9863, + "step": 7540 + }, + { + "epoch": 0.19, + "learning_rate": 1.993792063758683e-06, + "loss": 0.7451, + "step": 7541 + }, + { + "epoch": 0.19, + "learning_rate": 1.993788984944292e-06, + "loss": 0.8193, + "step": 7542 + }, + { + "epoch": 0.19, + "learning_rate": 1.993785905369003e-06, + "loss": 0.8154, + "step": 7543 + }, + { + "epoch": 0.19, + "learning_rate": 1.9937828250328176e-06, + "loss": 0.7625, + "step": 7544 + }, + { + "epoch": 0.19, + "learning_rate": 1.9937797439357382e-06, + "loss": 0.8931, + "step": 7545 + }, + { + "epoch": 0.19, + "learning_rate": 1.9937766620777675e-06, + "loss": 0.833, + "step": 7546 + }, + { + "epoch": 0.19, + "learning_rate": 1.9937735794589075e-06, + "loss": 0.7761, + "step": 7547 + }, + { + "epoch": 0.19, + "learning_rate": 1.993770496079161e-06, + "loss": 0.9268, + "step": 7548 + }, + { + "epoch": 0.19, + "learning_rate": 1.9937674119385298e-06, + "loss": 0.6821, + "step": 7549 + }, + { + "epoch": 0.19, + "learning_rate": 1.993764327037017e-06, + "loss": 0.8516, + "step": 7550 + }, + { + "epoch": 0.19, + "learning_rate": 1.9937612413746242e-06, + "loss": 0.7202, + "step": 7551 + }, + { + "epoch": 0.19, + "learning_rate": 1.9937581549513543e-06, + "loss": 0.7627, + "step": 7552 + }, + { + "epoch": 0.19, + "learning_rate": 1.99375506776721e-06, + "loss": 0.8574, + "step": 7553 + }, + { + "epoch": 0.19, + "learning_rate": 1.9937519798221923e-06, + "loss": 0.8896, + "step": 7554 + }, + { + "epoch": 0.19, + "learning_rate": 1.993748891116305e-06, + "loss": 0.7217, + "step": 7555 + }, + { + "epoch": 0.19, + "learning_rate": 1.9937458016495494e-06, + "loss": 0.7354, + "step": 7556 + }, + { + "epoch": 0.19, + "learning_rate": 1.9937427114219284e-06, + "loss": 1.1484, + "step": 7557 + }, + { + "epoch": 0.19, + "learning_rate": 1.9937396204334443e-06, + "loss": 0.7231, + "step": 7558 + }, + { + "epoch": 0.19, + "learning_rate": 1.9937365286841e-06, + "loss": 0.915, + "step": 7559 + }, + { + "epoch": 0.19, + "learning_rate": 1.9937334361738965e-06, + "loss": 0.9111, + "step": 7560 + }, + { + "epoch": 0.19, + "learning_rate": 1.9937303429028374e-06, + "loss": 0.8486, + "step": 7561 + }, + { + "epoch": 0.19, + "learning_rate": 1.993727248870925e-06, + "loss": 0.9082, + "step": 7562 + }, + { + "epoch": 0.19, + "learning_rate": 1.993724154078161e-06, + "loss": 0.8853, + "step": 7563 + }, + { + "epoch": 0.19, + "learning_rate": 1.993721058524548e-06, + "loss": 0.9258, + "step": 7564 + }, + { + "epoch": 0.19, + "learning_rate": 1.9937179622100885e-06, + "loss": 1.0195, + "step": 7565 + }, + { + "epoch": 0.19, + "learning_rate": 1.993714865134785e-06, + "loss": 0.8613, + "step": 7566 + }, + { + "epoch": 0.19, + "learning_rate": 1.9937117672986398e-06, + "loss": 0.5889, + "step": 7567 + }, + { + "epoch": 0.19, + "learning_rate": 1.9937086687016547e-06, + "loss": 0.8091, + "step": 7568 + }, + { + "epoch": 0.19, + "learning_rate": 1.993705569343833e-06, + "loss": 0.7026, + "step": 7569 + }, + { + "epoch": 0.19, + "learning_rate": 1.9937024692251765e-06, + "loss": 0.9756, + "step": 7570 + }, + { + "epoch": 0.19, + "learning_rate": 1.993699368345688e-06, + "loss": 0.9385, + "step": 7571 + }, + { + "epoch": 0.19, + "learning_rate": 1.9936962667053695e-06, + "loss": 0.9189, + "step": 7572 + }, + { + "epoch": 0.19, + "learning_rate": 1.993693164304223e-06, + "loss": 0.6958, + "step": 7573 + }, + { + "epoch": 0.19, + "learning_rate": 1.993690061142252e-06, + "loss": 1.1611, + "step": 7574 + }, + { + "epoch": 0.19, + "learning_rate": 1.993686957219458e-06, + "loss": 1.0537, + "step": 7575 + }, + { + "epoch": 0.19, + "learning_rate": 1.993683852535843e-06, + "loss": 0.9297, + "step": 7576 + }, + { + "epoch": 0.19, + "learning_rate": 1.9936807470914107e-06, + "loss": 0.8281, + "step": 7577 + }, + { + "epoch": 0.19, + "learning_rate": 1.9936776408861623e-06, + "loss": 0.7202, + "step": 7578 + }, + { + "epoch": 0.19, + "learning_rate": 1.993674533920101e-06, + "loss": 0.6978, + "step": 7579 + }, + { + "epoch": 0.19, + "learning_rate": 1.9936714261932285e-06, + "loss": 1.0078, + "step": 7580 + }, + { + "epoch": 0.19, + "learning_rate": 1.9936683177055478e-06, + "loss": 1.1035, + "step": 7581 + }, + { + "epoch": 0.19, + "learning_rate": 1.9936652084570603e-06, + "loss": 1.0137, + "step": 7582 + }, + { + "epoch": 0.19, + "learning_rate": 1.9936620984477696e-06, + "loss": 0.7036, + "step": 7583 + }, + { + "epoch": 0.19, + "learning_rate": 1.9936589876776772e-06, + "loss": 0.749, + "step": 7584 + }, + { + "epoch": 0.19, + "learning_rate": 1.9936558761467863e-06, + "loss": 1.0049, + "step": 7585 + }, + { + "epoch": 0.19, + "learning_rate": 1.9936527638550983e-06, + "loss": 0.8452, + "step": 7586 + }, + { + "epoch": 0.19, + "learning_rate": 1.993649650802616e-06, + "loss": 0.8818, + "step": 7587 + }, + { + "epoch": 0.19, + "learning_rate": 1.993646536989342e-06, + "loss": 0.8887, + "step": 7588 + }, + { + "epoch": 0.19, + "learning_rate": 1.993643422415279e-06, + "loss": 0.7583, + "step": 7589 + }, + { + "epoch": 0.19, + "learning_rate": 1.993640307080429e-06, + "loss": 0.7622, + "step": 7590 + }, + { + "epoch": 0.19, + "learning_rate": 1.9936371909847934e-06, + "loss": 1.3301, + "step": 7591 + }, + { + "epoch": 0.19, + "learning_rate": 1.993634074128376e-06, + "loss": 0.9873, + "step": 7592 + }, + { + "epoch": 0.19, + "learning_rate": 1.993630956511179e-06, + "loss": 1.0977, + "step": 7593 + }, + { + "epoch": 0.19, + "learning_rate": 1.993627838133204e-06, + "loss": 1.0986, + "step": 7594 + }, + { + "epoch": 0.19, + "learning_rate": 1.993624718994454e-06, + "loss": 0.8262, + "step": 7595 + }, + { + "epoch": 0.19, + "learning_rate": 1.9936215990949308e-06, + "loss": 0.9673, + "step": 7596 + }, + { + "epoch": 0.19, + "learning_rate": 1.9936184784346378e-06, + "loss": 0.7715, + "step": 7597 + }, + { + "epoch": 0.19, + "learning_rate": 1.9936153570135766e-06, + "loss": 0.9102, + "step": 7598 + }, + { + "epoch": 0.19, + "learning_rate": 1.9936122348317495e-06, + "loss": 0.9736, + "step": 7599 + }, + { + "epoch": 0.19, + "learning_rate": 1.9936091118891597e-06, + "loss": 0.9883, + "step": 7600 + }, + { + "epoch": 0.19, + "learning_rate": 1.9936059881858085e-06, + "loss": 0.7705, + "step": 7601 + }, + { + "epoch": 0.19, + "learning_rate": 1.9936028637216998e-06, + "loss": 0.728, + "step": 7602 + }, + { + "epoch": 0.19, + "learning_rate": 1.9935997384968343e-06, + "loss": 1.0303, + "step": 7603 + }, + { + "epoch": 0.19, + "learning_rate": 1.9935966125112156e-06, + "loss": 0.7861, + "step": 7604 + }, + { + "epoch": 0.19, + "learning_rate": 1.9935934857648456e-06, + "loss": 0.8818, + "step": 7605 + }, + { + "epoch": 0.19, + "learning_rate": 1.9935903582577265e-06, + "loss": 0.9443, + "step": 7606 + }, + { + "epoch": 0.19, + "learning_rate": 1.993587229989861e-06, + "loss": 1.0977, + "step": 7607 + }, + { + "epoch": 0.19, + "learning_rate": 1.9935841009612517e-06, + "loss": 0.8057, + "step": 7608 + }, + { + "epoch": 0.2, + "learning_rate": 1.9935809711719006e-06, + "loss": 0.8545, + "step": 7609 + }, + { + "epoch": 0.2, + "learning_rate": 1.9935778406218106e-06, + "loss": 0.6428, + "step": 7610 + }, + { + "epoch": 0.2, + "learning_rate": 1.993574709310983e-06, + "loss": 1.0625, + "step": 7611 + }, + { + "epoch": 0.2, + "learning_rate": 1.9935715772394215e-06, + "loss": 0.8813, + "step": 7612 + }, + { + "epoch": 0.2, + "learning_rate": 1.993568444407128e-06, + "loss": 0.8467, + "step": 7613 + }, + { + "epoch": 0.2, + "learning_rate": 1.993565310814104e-06, + "loss": 0.6943, + "step": 7614 + }, + { + "epoch": 0.2, + "learning_rate": 1.9935621764603534e-06, + "loss": 1.082, + "step": 7615 + }, + { + "epoch": 0.2, + "learning_rate": 1.9935590413458777e-06, + "loss": 1.0879, + "step": 7616 + }, + { + "epoch": 0.2, + "learning_rate": 1.99355590547068e-06, + "loss": 1.3418, + "step": 7617 + }, + { + "epoch": 0.2, + "learning_rate": 1.9935527688347616e-06, + "loss": 1.0107, + "step": 7618 + }, + { + "epoch": 0.2, + "learning_rate": 1.993549631438126e-06, + "loss": 0.9961, + "step": 7619 + }, + { + "epoch": 0.2, + "learning_rate": 1.9935464932807745e-06, + "loss": 1.0469, + "step": 7620 + }, + { + "epoch": 0.2, + "learning_rate": 1.993543354362711e-06, + "loss": 1.2129, + "step": 7621 + }, + { + "epoch": 0.2, + "learning_rate": 1.9935402146839364e-06, + "loss": 0.8018, + "step": 7622 + }, + { + "epoch": 0.2, + "learning_rate": 1.9935370742444538e-06, + "loss": 1.0801, + "step": 7623 + }, + { + "epoch": 0.2, + "learning_rate": 1.993533933044266e-06, + "loss": 0.9404, + "step": 7624 + }, + { + "epoch": 0.2, + "learning_rate": 1.9935307910833743e-06, + "loss": 0.9414, + "step": 7625 + }, + { + "epoch": 0.2, + "learning_rate": 1.993527648361782e-06, + "loss": 0.8481, + "step": 7626 + }, + { + "epoch": 0.2, + "learning_rate": 1.9935245048794917e-06, + "loss": 1.1602, + "step": 7627 + }, + { + "epoch": 0.2, + "learning_rate": 1.993521360636505e-06, + "loss": 1.043, + "step": 7628 + }, + { + "epoch": 0.2, + "learning_rate": 1.993518215632825e-06, + "loss": 0.8921, + "step": 7629 + }, + { + "epoch": 0.2, + "learning_rate": 1.993515069868453e-06, + "loss": 0.9258, + "step": 7630 + }, + { + "epoch": 0.2, + "learning_rate": 1.993511923343393e-06, + "loss": 0.5981, + "step": 7631 + }, + { + "epoch": 0.2, + "learning_rate": 1.9935087760576462e-06, + "loss": 0.7261, + "step": 7632 + }, + { + "epoch": 0.2, + "learning_rate": 1.9935056280112153e-06, + "loss": 0.6523, + "step": 7633 + }, + { + "epoch": 0.2, + "learning_rate": 1.9935024792041034e-06, + "loss": 1.0098, + "step": 7634 + }, + { + "epoch": 0.2, + "learning_rate": 1.993499329636312e-06, + "loss": 1.0146, + "step": 7635 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934961793078434e-06, + "loss": 1.0684, + "step": 7636 + }, + { + "epoch": 0.2, + "learning_rate": 1.993493028218701e-06, + "loss": 0.9824, + "step": 7637 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934898763688864e-06, + "loss": 0.7939, + "step": 7638 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934867237584027e-06, + "loss": 1.1719, + "step": 7639 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934835703872516e-06, + "loss": 0.9072, + "step": 7640 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934804162554357e-06, + "loss": 0.9951, + "step": 7641 + }, + { + "epoch": 0.2, + "learning_rate": 1.993477261362958e-06, + "loss": 0.9668, + "step": 7642 + }, + { + "epoch": 0.2, + "learning_rate": 1.99347410570982e-06, + "loss": 0.7773, + "step": 7643 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934709492960245e-06, + "loss": 1.0264, + "step": 7644 + }, + { + "epoch": 0.2, + "learning_rate": 1.993467792121574e-06, + "loss": 0.9248, + "step": 7645 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934646341864712e-06, + "loss": 1.0742, + "step": 7646 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934614754907177e-06, + "loss": 1.0117, + "step": 7647 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934583160343167e-06, + "loss": 0.9844, + "step": 7648 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934551558172704e-06, + "loss": 0.8916, + "step": 7649 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934519948395814e-06, + "loss": 0.7622, + "step": 7650 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934488331012516e-06, + "loss": 0.8345, + "step": 7651 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934456706022837e-06, + "loss": 0.896, + "step": 7652 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934425073426803e-06, + "loss": 0.8779, + "step": 7653 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934393433224438e-06, + "loss": 0.875, + "step": 7654 + }, + { + "epoch": 0.2, + "learning_rate": 1.993436178541576e-06, + "loss": 0.8955, + "step": 7655 + }, + { + "epoch": 0.2, + "learning_rate": 1.99343301300008e-06, + "loss": 1.0996, + "step": 7656 + }, + { + "epoch": 0.2, + "learning_rate": 1.993429846697958e-06, + "loss": 0.7637, + "step": 7657 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934266796352126e-06, + "loss": 0.3926, + "step": 7658 + }, + { + "epoch": 0.2, + "learning_rate": 1.993423511811846e-06, + "loss": 0.9941, + "step": 7659 + }, + { + "epoch": 0.2, + "learning_rate": 1.993420343227861e-06, + "loss": 0.9014, + "step": 7660 + }, + { + "epoch": 0.2, + "learning_rate": 1.993417173883259e-06, + "loss": 0.6885, + "step": 7661 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934140037780437e-06, + "loss": 1.0312, + "step": 7662 + }, + { + "epoch": 0.2, + "learning_rate": 1.993410832912217e-06, + "loss": 0.8086, + "step": 7663 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934076612857804e-06, + "loss": 0.8765, + "step": 7664 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934044888987384e-06, + "loss": 1.0996, + "step": 7665 + }, + { + "epoch": 0.2, + "learning_rate": 1.9934013157510917e-06, + "loss": 0.8442, + "step": 7666 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933981418428433e-06, + "loss": 0.6479, + "step": 7667 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933949671739957e-06, + "loss": 1.0205, + "step": 7668 + }, + { + "epoch": 0.2, + "learning_rate": 1.993391791744551e-06, + "loss": 0.9004, + "step": 7669 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933886155545124e-06, + "loss": 0.8813, + "step": 7670 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933854386038817e-06, + "loss": 0.7908, + "step": 7671 + }, + { + "epoch": 0.2, + "learning_rate": 1.993382260892661e-06, + "loss": 0.9775, + "step": 7672 + }, + { + "epoch": 0.2, + "learning_rate": 1.993379082420854e-06, + "loss": 0.8691, + "step": 7673 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933759031884616e-06, + "loss": 0.77, + "step": 7674 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933727231954873e-06, + "loss": 1.0059, + "step": 7675 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933695424419328e-06, + "loss": 0.6592, + "step": 7676 + }, + { + "epoch": 0.2, + "learning_rate": 1.993366360927801e-06, + "loss": 0.7876, + "step": 7677 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933631786530945e-06, + "loss": 1.0254, + "step": 7678 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933599956178153e-06, + "loss": 0.6318, + "step": 7679 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933568118219663e-06, + "loss": 0.9727, + "step": 7680 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933536272655498e-06, + "loss": 0.9268, + "step": 7681 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933504419485676e-06, + "loss": 0.9502, + "step": 7682 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933472558710227e-06, + "loss": 0.8877, + "step": 7683 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933440690329175e-06, + "loss": 1.1348, + "step": 7684 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933408814342547e-06, + "loss": 1.1367, + "step": 7685 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933376930750364e-06, + "loss": 0.7573, + "step": 7686 + }, + { + "epoch": 0.2, + "learning_rate": 1.993334503955265e-06, + "loss": 0.749, + "step": 7687 + }, + { + "epoch": 0.2, + "learning_rate": 1.993331314074943e-06, + "loss": 0.8428, + "step": 7688 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933281234340727e-06, + "loss": 0.958, + "step": 7689 + }, + { + "epoch": 0.2, + "learning_rate": 1.993324932032657e-06, + "loss": 1.0088, + "step": 7690 + }, + { + "epoch": 0.2, + "learning_rate": 1.993321739870698e-06, + "loss": 0.8555, + "step": 7691 + }, + { + "epoch": 0.2, + "learning_rate": 1.993318546948198e-06, + "loss": 0.9229, + "step": 7692 + }, + { + "epoch": 0.2, + "learning_rate": 1.99331535326516e-06, + "loss": 0.6309, + "step": 7693 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933121588215863e-06, + "loss": 0.9287, + "step": 7694 + }, + { + "epoch": 0.2, + "learning_rate": 1.993308963617479e-06, + "loss": 0.728, + "step": 7695 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933057676528404e-06, + "loss": 0.9355, + "step": 7696 + }, + { + "epoch": 0.2, + "learning_rate": 1.9933025709276733e-06, + "loss": 0.8867, + "step": 7697 + }, + { + "epoch": 0.2, + "learning_rate": 1.9932993734419803e-06, + "loss": 0.7249, + "step": 7698 + }, + { + "epoch": 0.2, + "learning_rate": 1.9932961751957635e-06, + "loss": 1.1113, + "step": 7699 + }, + { + "epoch": 0.2, + "learning_rate": 1.9932929761890255e-06, + "loss": 0.8193, + "step": 7700 + }, + { + "epoch": 0.2, + "learning_rate": 1.993289776421769e-06, + "loss": 0.8789, + "step": 7701 + }, + { + "epoch": 0.2, + "learning_rate": 1.993286575893996e-06, + "loss": 1.0537, + "step": 7702 + }, + { + "epoch": 0.2, + "learning_rate": 1.993283374605709e-06, + "loss": 1.0615, + "step": 7703 + }, + { + "epoch": 0.2, + "learning_rate": 1.9932801725569107e-06, + "loss": 0.9316, + "step": 7704 + }, + { + "epoch": 0.2, + "learning_rate": 1.9932769697476034e-06, + "loss": 0.8428, + "step": 7705 + }, + { + "epoch": 0.2, + "learning_rate": 1.99327376617779e-06, + "loss": 0.749, + "step": 7706 + }, + { + "epoch": 0.2, + "learning_rate": 1.993270561847472e-06, + "loss": 0.7554, + "step": 7707 + }, + { + "epoch": 0.2, + "learning_rate": 1.9932673567566526e-06, + "loss": 1.0176, + "step": 7708 + }, + { + "epoch": 0.2, + "learning_rate": 1.993264150905334e-06, + "loss": 0.7839, + "step": 7709 + }, + { + "epoch": 0.2, + "learning_rate": 1.9932609442935188e-06, + "loss": 0.8398, + "step": 7710 + }, + { + "epoch": 0.2, + "learning_rate": 1.9932577369212094e-06, + "loss": 1.0322, + "step": 7711 + }, + { + "epoch": 0.2, + "learning_rate": 1.993254528788408e-06, + "loss": 1.0625, + "step": 7712 + }, + { + "epoch": 0.2, + "learning_rate": 1.9932513198951175e-06, + "loss": 0.9307, + "step": 7713 + }, + { + "epoch": 0.2, + "learning_rate": 1.99324811024134e-06, + "loss": 0.9717, + "step": 7714 + }, + { + "epoch": 0.2, + "learning_rate": 1.9932448998270783e-06, + "loss": 0.9766, + "step": 7715 + }, + { + "epoch": 0.2, + "learning_rate": 1.9932416886523347e-06, + "loss": 0.9395, + "step": 7716 + }, + { + "epoch": 0.2, + "learning_rate": 1.9932384767171113e-06, + "loss": 1.0537, + "step": 7717 + }, + { + "epoch": 0.2, + "learning_rate": 1.993235264021411e-06, + "loss": 1.0273, + "step": 7718 + }, + { + "epoch": 0.2, + "learning_rate": 1.993232050565236e-06, + "loss": 0.7852, + "step": 7719 + }, + { + "epoch": 0.2, + "learning_rate": 1.993228836348589e-06, + "loss": 0.7793, + "step": 7720 + }, + { + "epoch": 0.2, + "learning_rate": 1.9932256213714726e-06, + "loss": 1.2559, + "step": 7721 + }, + { + "epoch": 0.2, + "learning_rate": 1.9932224056338886e-06, + "loss": 0.8447, + "step": 7722 + }, + { + "epoch": 0.2, + "learning_rate": 1.9932191891358402e-06, + "loss": 0.7266, + "step": 7723 + }, + { + "epoch": 0.2, + "learning_rate": 1.9932159718773295e-06, + "loss": 1.0488, + "step": 7724 + }, + { + "epoch": 0.2, + "learning_rate": 1.9932127538583584e-06, + "loss": 0.8296, + "step": 7725 + }, + { + "epoch": 0.2, + "learning_rate": 1.9932095350789306e-06, + "loss": 1.0225, + "step": 7726 + }, + { + "epoch": 0.2, + "learning_rate": 1.993206315539048e-06, + "loss": 0.8281, + "step": 7727 + }, + { + "epoch": 0.2, + "learning_rate": 1.9932030952387127e-06, + "loss": 0.7461, + "step": 7728 + }, + { + "epoch": 0.2, + "learning_rate": 1.9931998741779273e-06, + "loss": 1.125, + "step": 7729 + }, + { + "epoch": 0.2, + "learning_rate": 1.993196652356695e-06, + "loss": 0.9717, + "step": 7730 + }, + { + "epoch": 0.2, + "learning_rate": 1.993193429775017e-06, + "loss": 0.9727, + "step": 7731 + }, + { + "epoch": 0.2, + "learning_rate": 1.993190206432897e-06, + "loss": 1.1777, + "step": 7732 + }, + { + "epoch": 0.2, + "learning_rate": 1.9931869823303367e-06, + "loss": 0.6738, + "step": 7733 + }, + { + "epoch": 0.2, + "learning_rate": 1.9931837574673387e-06, + "loss": 0.8496, + "step": 7734 + }, + { + "epoch": 0.2, + "learning_rate": 1.9931805318439057e-06, + "loss": 0.8408, + "step": 7735 + }, + { + "epoch": 0.2, + "learning_rate": 1.99317730546004e-06, + "loss": 1.0244, + "step": 7736 + }, + { + "epoch": 0.2, + "learning_rate": 1.9931740783157443e-06, + "loss": 1.0732, + "step": 7737 + }, + { + "epoch": 0.2, + "learning_rate": 1.993170850411021e-06, + "loss": 1.0459, + "step": 7738 + }, + { + "epoch": 0.2, + "learning_rate": 1.993167621745872e-06, + "loss": 0.7803, + "step": 7739 + }, + { + "epoch": 0.2, + "learning_rate": 1.9931643923203003e-06, + "loss": 0.9824, + "step": 7740 + }, + { + "epoch": 0.2, + "learning_rate": 1.9931611621343083e-06, + "loss": 0.9766, + "step": 7741 + }, + { + "epoch": 0.2, + "learning_rate": 1.9931579311878984e-06, + "loss": 0.8691, + "step": 7742 + }, + { + "epoch": 0.2, + "learning_rate": 1.9931546994810736e-06, + "loss": 0.9639, + "step": 7743 + }, + { + "epoch": 0.2, + "learning_rate": 1.9931514670138355e-06, + "loss": 0.7578, + "step": 7744 + }, + { + "epoch": 0.2, + "learning_rate": 1.9931482337861867e-06, + "loss": 0.9883, + "step": 7745 + }, + { + "epoch": 0.2, + "learning_rate": 1.9931449997981302e-06, + "loss": 1.124, + "step": 7746 + }, + { + "epoch": 0.2, + "learning_rate": 1.993141765049669e-06, + "loss": 1.0391, + "step": 7747 + }, + { + "epoch": 0.2, + "learning_rate": 1.993138529540804e-06, + "loss": 0.8682, + "step": 7748 + }, + { + "epoch": 0.2, + "learning_rate": 1.9931352932715385e-06, + "loss": 0.9697, + "step": 7749 + }, + { + "epoch": 0.2, + "learning_rate": 1.993132056241875e-06, + "loss": 0.9185, + "step": 7750 + }, + { + "epoch": 0.2, + "learning_rate": 1.9931288184518164e-06, + "loss": 1.04, + "step": 7751 + }, + { + "epoch": 0.2, + "learning_rate": 1.9931255799013644e-06, + "loss": 1.0449, + "step": 7752 + }, + { + "epoch": 0.2, + "learning_rate": 1.993122340590522e-06, + "loss": 0.645, + "step": 7753 + }, + { + "epoch": 0.2, + "learning_rate": 1.993119100519291e-06, + "loss": 0.9717, + "step": 7754 + }, + { + "epoch": 0.2, + "learning_rate": 1.9931158596876748e-06, + "loss": 1.0127, + "step": 7755 + }, + { + "epoch": 0.2, + "learning_rate": 1.9931126180956756e-06, + "loss": 0.7959, + "step": 7756 + }, + { + "epoch": 0.2, + "learning_rate": 1.9931093757432954e-06, + "loss": 0.8994, + "step": 7757 + }, + { + "epoch": 0.2, + "learning_rate": 1.993106132630537e-06, + "loss": 0.9307, + "step": 7758 + }, + { + "epoch": 0.2, + "learning_rate": 1.9931028887574032e-06, + "loss": 1.1133, + "step": 7759 + }, + { + "epoch": 0.2, + "learning_rate": 1.993099644123896e-06, + "loss": 0.8457, + "step": 7760 + }, + { + "epoch": 0.2, + "learning_rate": 1.9930963987300178e-06, + "loss": 1.1172, + "step": 7761 + }, + { + "epoch": 0.2, + "learning_rate": 1.9930931525757717e-06, + "loss": 0.8057, + "step": 7762 + }, + { + "epoch": 0.2, + "learning_rate": 1.9930899056611598e-06, + "loss": 0.9912, + "step": 7763 + }, + { + "epoch": 0.2, + "learning_rate": 1.9930866579861846e-06, + "loss": 1.1367, + "step": 7764 + }, + { + "epoch": 0.2, + "learning_rate": 1.9930834095508483e-06, + "loss": 0.8975, + "step": 7765 + }, + { + "epoch": 0.2, + "learning_rate": 1.993080160355154e-06, + "loss": 0.5972, + "step": 7766 + }, + { + "epoch": 0.2, + "learning_rate": 1.993076910399104e-06, + "loss": 0.8662, + "step": 7767 + }, + { + "epoch": 0.2, + "learning_rate": 1.9930736596827004e-06, + "loss": 0.9824, + "step": 7768 + }, + { + "epoch": 0.2, + "learning_rate": 1.993070408205946e-06, + "loss": 1.1523, + "step": 7769 + }, + { + "epoch": 0.2, + "learning_rate": 1.9930671559688435e-06, + "loss": 0.9482, + "step": 7770 + }, + { + "epoch": 0.2, + "learning_rate": 1.993063902971395e-06, + "loss": 0.8955, + "step": 7771 + }, + { + "epoch": 0.2, + "learning_rate": 1.993060649213603e-06, + "loss": 1.1592, + "step": 7772 + }, + { + "epoch": 0.2, + "learning_rate": 1.9930573946954702e-06, + "loss": 0.9297, + "step": 7773 + }, + { + "epoch": 0.2, + "learning_rate": 1.993054139416999e-06, + "loss": 1.0781, + "step": 7774 + }, + { + "epoch": 0.2, + "learning_rate": 1.993050883378192e-06, + "loss": 0.8125, + "step": 7775 + }, + { + "epoch": 0.2, + "learning_rate": 1.9930476265790516e-06, + "loss": 0.8828, + "step": 7776 + }, + { + "epoch": 0.2, + "learning_rate": 1.9930443690195806e-06, + "loss": 1.2207, + "step": 7777 + }, + { + "epoch": 0.2, + "learning_rate": 1.9930411106997806e-06, + "loss": 0.9365, + "step": 7778 + }, + { + "epoch": 0.2, + "learning_rate": 1.993037851619655e-06, + "loss": 0.8848, + "step": 7779 + }, + { + "epoch": 0.2, + "learning_rate": 1.9930345917792055e-06, + "loss": 0.8086, + "step": 7780 + }, + { + "epoch": 0.2, + "learning_rate": 1.9930313311784356e-06, + "loss": 1.166, + "step": 7781 + }, + { + "epoch": 0.2, + "learning_rate": 1.9930280698173473e-06, + "loss": 0.7744, + "step": 7782 + }, + { + "epoch": 0.2, + "learning_rate": 1.9930248076959427e-06, + "loss": 0.7322, + "step": 7783 + }, + { + "epoch": 0.2, + "learning_rate": 1.993021544814225e-06, + "loss": 0.8462, + "step": 7784 + }, + { + "epoch": 0.2, + "learning_rate": 1.9930182811721962e-06, + "loss": 1.0127, + "step": 7785 + }, + { + "epoch": 0.2, + "learning_rate": 1.993015016769859e-06, + "loss": 0.7891, + "step": 7786 + }, + { + "epoch": 0.2, + "learning_rate": 1.993011751607216e-06, + "loss": 0.8955, + "step": 7787 + }, + { + "epoch": 0.2, + "learning_rate": 1.993008485684269e-06, + "loss": 1.1992, + "step": 7788 + }, + { + "epoch": 0.2, + "learning_rate": 1.9930052190010217e-06, + "loss": 0.9512, + "step": 7789 + }, + { + "epoch": 0.2, + "learning_rate": 1.993001951557476e-06, + "loss": 1.0361, + "step": 7790 + }, + { + "epoch": 0.2, + "learning_rate": 1.992998683353634e-06, + "loss": 0.9697, + "step": 7791 + }, + { + "epoch": 0.2, + "learning_rate": 1.9929954143894987e-06, + "loss": 1.2949, + "step": 7792 + }, + { + "epoch": 0.2, + "learning_rate": 1.992992144665072e-06, + "loss": 0.8877, + "step": 7793 + }, + { + "epoch": 0.2, + "learning_rate": 1.9929888741803578e-06, + "loss": 0.9023, + "step": 7794 + }, + { + "epoch": 0.2, + "learning_rate": 1.992985602935357e-06, + "loss": 0.7646, + "step": 7795 + }, + { + "epoch": 0.2, + "learning_rate": 1.992982330930073e-06, + "loss": 0.7959, + "step": 7796 + }, + { + "epoch": 0.2, + "learning_rate": 1.9929790581645085e-06, + "loss": 1.0547, + "step": 7797 + }, + { + "epoch": 0.2, + "learning_rate": 1.992975784638665e-06, + "loss": 0.9863, + "step": 7798 + }, + { + "epoch": 0.2, + "learning_rate": 1.9929725103525455e-06, + "loss": 0.9697, + "step": 7799 + }, + { + "epoch": 0.2, + "learning_rate": 1.992969235306153e-06, + "loss": 0.5564, + "step": 7800 + }, + { + "epoch": 0.2, + "learning_rate": 1.9929659594994895e-06, + "loss": 0.7539, + "step": 7801 + }, + { + "epoch": 0.2, + "learning_rate": 1.9929626829325576e-06, + "loss": 0.9434, + "step": 7802 + }, + { + "epoch": 0.2, + "learning_rate": 1.99295940560536e-06, + "loss": 0.8691, + "step": 7803 + }, + { + "epoch": 0.2, + "learning_rate": 1.992956127517899e-06, + "loss": 0.9785, + "step": 7804 + }, + { + "epoch": 0.2, + "learning_rate": 1.9929528486701766e-06, + "loss": 1.1084, + "step": 7805 + }, + { + "epoch": 0.2, + "learning_rate": 1.9929495690621965e-06, + "loss": 0.9121, + "step": 7806 + }, + { + "epoch": 0.2, + "learning_rate": 1.9929462886939603e-06, + "loss": 0.8535, + "step": 7807 + }, + { + "epoch": 0.2, + "learning_rate": 1.9929430075654706e-06, + "loss": 0.9248, + "step": 7808 + }, + { + "epoch": 0.2, + "learning_rate": 1.9929397256767306e-06, + "loss": 0.8691, + "step": 7809 + }, + { + "epoch": 0.2, + "learning_rate": 1.992936443027742e-06, + "loss": 0.9648, + "step": 7810 + }, + { + "epoch": 0.2, + "learning_rate": 1.992933159618508e-06, + "loss": 0.9854, + "step": 7811 + }, + { + "epoch": 0.2, + "learning_rate": 1.9929298754490304e-06, + "loss": 0.9697, + "step": 7812 + }, + { + "epoch": 0.2, + "learning_rate": 1.9929265905193118e-06, + "loss": 1.0254, + "step": 7813 + }, + { + "epoch": 0.2, + "learning_rate": 1.9929233048293552e-06, + "loss": 0.8545, + "step": 7814 + }, + { + "epoch": 0.2, + "learning_rate": 1.992920018379163e-06, + "loss": 0.7227, + "step": 7815 + }, + { + "epoch": 0.2, + "learning_rate": 1.9929167311687373e-06, + "loss": 1.0166, + "step": 7816 + }, + { + "epoch": 0.2, + "learning_rate": 1.9929134431980814e-06, + "loss": 0.6182, + "step": 7817 + }, + { + "epoch": 0.2, + "learning_rate": 1.992910154467197e-06, + "loss": 0.8477, + "step": 7818 + }, + { + "epoch": 0.2, + "learning_rate": 1.992906864976087e-06, + "loss": 0.9531, + "step": 7819 + }, + { + "epoch": 0.2, + "learning_rate": 1.9929035747247536e-06, + "loss": 0.9355, + "step": 7820 + }, + { + "epoch": 0.2, + "learning_rate": 1.9929002837132e-06, + "loss": 0.9834, + "step": 7821 + }, + { + "epoch": 0.2, + "learning_rate": 1.992896991941428e-06, + "loss": 1.1465, + "step": 7822 + }, + { + "epoch": 0.2, + "learning_rate": 1.9928936994094406e-06, + "loss": 0.7935, + "step": 7823 + }, + { + "epoch": 0.2, + "learning_rate": 1.99289040611724e-06, + "loss": 0.75, + "step": 7824 + }, + { + "epoch": 0.2, + "learning_rate": 1.992887112064829e-06, + "loss": 0.9746, + "step": 7825 + }, + { + "epoch": 0.2, + "learning_rate": 1.99288381725221e-06, + "loss": 1.0332, + "step": 7826 + }, + { + "epoch": 0.2, + "learning_rate": 1.9928805216793856e-06, + "loss": 1.1416, + "step": 7827 + }, + { + "epoch": 0.2, + "learning_rate": 1.9928772253463584e-06, + "loss": 0.9658, + "step": 7828 + }, + { + "epoch": 0.2, + "learning_rate": 1.9928739282531306e-06, + "loss": 0.9912, + "step": 7829 + }, + { + "epoch": 0.2, + "learning_rate": 1.9928706303997047e-06, + "loss": 0.7046, + "step": 7830 + }, + { + "epoch": 0.2, + "learning_rate": 1.9928673317860836e-06, + "loss": 0.9463, + "step": 7831 + }, + { + "epoch": 0.2, + "learning_rate": 1.9928640324122696e-06, + "loss": 0.6748, + "step": 7832 + }, + { + "epoch": 0.2, + "learning_rate": 1.992860732278265e-06, + "loss": 0.7695, + "step": 7833 + }, + { + "epoch": 0.2, + "learning_rate": 1.992857431384073e-06, + "loss": 0.9512, + "step": 7834 + }, + { + "epoch": 0.2, + "learning_rate": 1.9928541297296955e-06, + "loss": 0.9414, + "step": 7835 + }, + { + "epoch": 0.2, + "learning_rate": 1.9928508273151353e-06, + "loss": 0.8193, + "step": 7836 + }, + { + "epoch": 0.2, + "learning_rate": 1.9928475241403947e-06, + "loss": 0.8721, + "step": 7837 + }, + { + "epoch": 0.2, + "learning_rate": 1.9928442202054768e-06, + "loss": 0.918, + "step": 7838 + }, + { + "epoch": 0.2, + "learning_rate": 1.992840915510383e-06, + "loss": 0.9707, + "step": 7839 + }, + { + "epoch": 0.2, + "learning_rate": 1.9928376100551173e-06, + "loss": 0.7158, + "step": 7840 + }, + { + "epoch": 0.2, + "learning_rate": 1.9928343038396814e-06, + "loss": 0.9561, + "step": 7841 + }, + { + "epoch": 0.2, + "learning_rate": 1.9928309968640774e-06, + "loss": 0.656, + "step": 7842 + }, + { + "epoch": 0.2, + "learning_rate": 1.992827689128309e-06, + "loss": 1.0508, + "step": 7843 + }, + { + "epoch": 0.2, + "learning_rate": 1.9928243806323776e-06, + "loss": 0.8467, + "step": 7844 + }, + { + "epoch": 0.2, + "learning_rate": 1.992821071376287e-06, + "loss": 0.9102, + "step": 7845 + }, + { + "epoch": 0.2, + "learning_rate": 1.9928177613600383e-06, + "loss": 1.1172, + "step": 7846 + }, + { + "epoch": 0.2, + "learning_rate": 1.9928144505836344e-06, + "loss": 0.9678, + "step": 7847 + }, + { + "epoch": 0.2, + "learning_rate": 1.9928111390470786e-06, + "loss": 0.7988, + "step": 7848 + }, + { + "epoch": 0.2, + "learning_rate": 1.992807826750373e-06, + "loss": 1.0645, + "step": 7849 + }, + { + "epoch": 0.2, + "learning_rate": 1.99280451369352e-06, + "loss": 0.8926, + "step": 7850 + }, + { + "epoch": 0.2, + "learning_rate": 1.992801199876522e-06, + "loss": 0.7915, + "step": 7851 + }, + { + "epoch": 0.2, + "learning_rate": 1.992797885299382e-06, + "loss": 0.8506, + "step": 7852 + }, + { + "epoch": 0.2, + "learning_rate": 1.9927945699621023e-06, + "loss": 1.0508, + "step": 7853 + }, + { + "epoch": 0.2, + "learning_rate": 1.9927912538646857e-06, + "loss": 0.9512, + "step": 7854 + }, + { + "epoch": 0.2, + "learning_rate": 1.9927879370071337e-06, + "loss": 0.8564, + "step": 7855 + }, + { + "epoch": 0.2, + "learning_rate": 1.9927846193894505e-06, + "loss": 0.9453, + "step": 7856 + }, + { + "epoch": 0.2, + "learning_rate": 1.9927813010116374e-06, + "loss": 0.957, + "step": 7857 + }, + { + "epoch": 0.2, + "learning_rate": 1.992777981873697e-06, + "loss": 1.0195, + "step": 7858 + }, + { + "epoch": 0.2, + "learning_rate": 1.9927746619756325e-06, + "loss": 0.8682, + "step": 7859 + }, + { + "epoch": 0.2, + "learning_rate": 1.9927713413174463e-06, + "loss": 0.9404, + "step": 7860 + }, + { + "epoch": 0.2, + "learning_rate": 1.9927680198991402e-06, + "loss": 1.1758, + "step": 7861 + }, + { + "epoch": 0.2, + "learning_rate": 1.992764697720718e-06, + "loss": 0.9629, + "step": 7862 + }, + { + "epoch": 0.2, + "learning_rate": 1.992761374782181e-06, + "loss": 0.6934, + "step": 7863 + }, + { + "epoch": 0.2, + "learning_rate": 1.992758051083532e-06, + "loss": 0.9463, + "step": 7864 + }, + { + "epoch": 0.2, + "learning_rate": 1.9927547266247746e-06, + "loss": 0.916, + "step": 7865 + }, + { + "epoch": 0.2, + "learning_rate": 1.99275140140591e-06, + "loss": 0.6348, + "step": 7866 + }, + { + "epoch": 0.2, + "learning_rate": 1.992748075426941e-06, + "loss": 1.0879, + "step": 7867 + }, + { + "epoch": 0.2, + "learning_rate": 1.9927447486878713e-06, + "loss": 1.0312, + "step": 7868 + }, + { + "epoch": 0.2, + "learning_rate": 1.9927414211887022e-06, + "loss": 0.8086, + "step": 7869 + }, + { + "epoch": 0.2, + "learning_rate": 1.9927380929294362e-06, + "loss": 0.832, + "step": 7870 + }, + { + "epoch": 0.2, + "learning_rate": 1.9927347639100768e-06, + "loss": 1.0244, + "step": 7871 + }, + { + "epoch": 0.2, + "learning_rate": 1.992731434130626e-06, + "loss": 0.9531, + "step": 7872 + }, + { + "epoch": 0.2, + "learning_rate": 1.9927281035910863e-06, + "loss": 0.9229, + "step": 7873 + }, + { + "epoch": 0.2, + "learning_rate": 1.9927247722914603e-06, + "loss": 1.2012, + "step": 7874 + }, + { + "epoch": 0.2, + "learning_rate": 1.9927214402317506e-06, + "loss": 1.0488, + "step": 7875 + }, + { + "epoch": 0.2, + "learning_rate": 1.9927181074119597e-06, + "loss": 0.957, + "step": 7876 + }, + { + "epoch": 0.2, + "learning_rate": 1.9927147738320906e-06, + "loss": 0.8677, + "step": 7877 + }, + { + "epoch": 0.2, + "learning_rate": 1.992711439492145e-06, + "loss": 0.9463, + "step": 7878 + }, + { + "epoch": 0.2, + "learning_rate": 1.992708104392126e-06, + "loss": 1.0049, + "step": 7879 + }, + { + "epoch": 0.2, + "learning_rate": 1.992704768532036e-06, + "loss": 1.0596, + "step": 7880 + }, + { + "epoch": 0.2, + "learning_rate": 1.9927014319118778e-06, + "loss": 0.8633, + "step": 7881 + }, + { + "epoch": 0.2, + "learning_rate": 1.9926980945316534e-06, + "loss": 0.8594, + "step": 7882 + }, + { + "epoch": 0.2, + "learning_rate": 1.992694756391366e-06, + "loss": 0.9814, + "step": 7883 + }, + { + "epoch": 0.2, + "learning_rate": 1.992691417491018e-06, + "loss": 1.1025, + "step": 7884 + }, + { + "epoch": 0.2, + "learning_rate": 1.9926880778306114e-06, + "loss": 1.2188, + "step": 7885 + }, + { + "epoch": 0.2, + "learning_rate": 1.9926847374101495e-06, + "loss": 0.6938, + "step": 7886 + }, + { + "epoch": 0.2, + "learning_rate": 1.9926813962296343e-06, + "loss": 0.9072, + "step": 7887 + }, + { + "epoch": 0.2, + "learning_rate": 1.992678054289069e-06, + "loss": 0.7349, + "step": 7888 + }, + { + "epoch": 0.2, + "learning_rate": 1.9926747115884557e-06, + "loss": 0.7964, + "step": 7889 + }, + { + "epoch": 0.2, + "learning_rate": 1.992671368127797e-06, + "loss": 0.8652, + "step": 7890 + }, + { + "epoch": 0.2, + "learning_rate": 1.992668023907095e-06, + "loss": 0.9424, + "step": 7891 + }, + { + "epoch": 0.2, + "learning_rate": 1.992664678926353e-06, + "loss": 0.751, + "step": 7892 + }, + { + "epoch": 0.2, + "learning_rate": 1.9926613331855733e-06, + "loss": 0.8359, + "step": 7893 + }, + { + "epoch": 0.2, + "learning_rate": 1.9926579866847586e-06, + "loss": 0.8936, + "step": 7894 + }, + { + "epoch": 0.2, + "learning_rate": 1.992654639423911e-06, + "loss": 0.9414, + "step": 7895 + }, + { + "epoch": 0.2, + "learning_rate": 1.9926512914030335e-06, + "loss": 0.7412, + "step": 7896 + }, + { + "epoch": 0.2, + "learning_rate": 1.992647942622129e-06, + "loss": 1.0723, + "step": 7897 + }, + { + "epoch": 0.2, + "learning_rate": 1.992644593081199e-06, + "loss": 0.9766, + "step": 7898 + }, + { + "epoch": 0.2, + "learning_rate": 1.9926412427802475e-06, + "loss": 0.6621, + "step": 7899 + }, + { + "epoch": 0.2, + "learning_rate": 1.9926378917192755e-06, + "loss": 1.1191, + "step": 7900 + }, + { + "epoch": 0.2, + "learning_rate": 1.9926345398982863e-06, + "loss": 0.9668, + "step": 7901 + }, + { + "epoch": 0.2, + "learning_rate": 1.992631187317283e-06, + "loss": 1.0381, + "step": 7902 + }, + { + "epoch": 0.2, + "learning_rate": 1.992627833976267e-06, + "loss": 0.7043, + "step": 7903 + }, + { + "epoch": 0.2, + "learning_rate": 1.992624479875242e-06, + "loss": 1.0303, + "step": 7904 + }, + { + "epoch": 0.2, + "learning_rate": 1.99262112501421e-06, + "loss": 0.998, + "step": 7905 + }, + { + "epoch": 0.2, + "learning_rate": 1.9926177693931734e-06, + "loss": 0.9014, + "step": 7906 + }, + { + "epoch": 0.2, + "learning_rate": 1.9926144130121353e-06, + "loss": 1.0156, + "step": 7907 + }, + { + "epoch": 0.2, + "learning_rate": 1.9926110558710978e-06, + "loss": 0.8613, + "step": 7908 + }, + { + "epoch": 0.2, + "learning_rate": 1.9926076979700637e-06, + "loss": 1.082, + "step": 7909 + }, + { + "epoch": 0.2, + "learning_rate": 1.9926043393090357e-06, + "loss": 0.8457, + "step": 7910 + }, + { + "epoch": 0.2, + "learning_rate": 1.992600979888016e-06, + "loss": 0.915, + "step": 7911 + }, + { + "epoch": 0.2, + "learning_rate": 1.9925976197070075e-06, + "loss": 0.8213, + "step": 7912 + }, + { + "epoch": 0.2, + "learning_rate": 1.9925942587660125e-06, + "loss": 0.6411, + "step": 7913 + }, + { + "epoch": 0.2, + "learning_rate": 1.9925908970650336e-06, + "loss": 0.9082, + "step": 7914 + }, + { + "epoch": 0.2, + "learning_rate": 1.9925875346040735e-06, + "loss": 1.0107, + "step": 7915 + }, + { + "epoch": 0.2, + "learning_rate": 1.992584171383135e-06, + "loss": 0.832, + "step": 7916 + }, + { + "epoch": 0.2, + "learning_rate": 1.9925808074022205e-06, + "loss": 1.0415, + "step": 7917 + }, + { + "epoch": 0.2, + "learning_rate": 1.9925774426613323e-06, + "loss": 0.8525, + "step": 7918 + }, + { + "epoch": 0.2, + "learning_rate": 1.9925740771604734e-06, + "loss": 1.083, + "step": 7919 + }, + { + "epoch": 0.2, + "learning_rate": 1.992570710899646e-06, + "loss": 1.0098, + "step": 7920 + }, + { + "epoch": 0.2, + "learning_rate": 1.992567343878853e-06, + "loss": 0.8516, + "step": 7921 + }, + { + "epoch": 0.2, + "learning_rate": 1.9925639760980965e-06, + "loss": 1.0693, + "step": 7922 + }, + { + "epoch": 0.2, + "learning_rate": 1.9925606075573796e-06, + "loss": 0.8564, + "step": 7923 + }, + { + "epoch": 0.2, + "learning_rate": 1.9925572382567046e-06, + "loss": 0.812, + "step": 7924 + }, + { + "epoch": 0.2, + "learning_rate": 1.9925538681960747e-06, + "loss": 0.8965, + "step": 7925 + }, + { + "epoch": 0.2, + "learning_rate": 1.9925504973754915e-06, + "loss": 1.1162, + "step": 7926 + }, + { + "epoch": 0.2, + "learning_rate": 1.992547125794958e-06, + "loss": 0.771, + "step": 7927 + }, + { + "epoch": 0.2, + "learning_rate": 1.9925437534544766e-06, + "loss": 1.0322, + "step": 7928 + }, + { + "epoch": 0.2, + "learning_rate": 1.9925403803540504e-06, + "loss": 1.1221, + "step": 7929 + }, + { + "epoch": 0.2, + "learning_rate": 1.9925370064936815e-06, + "loss": 0.7432, + "step": 7930 + }, + { + "epoch": 0.2, + "learning_rate": 1.992533631873373e-06, + "loss": 0.9814, + "step": 7931 + }, + { + "epoch": 0.2, + "learning_rate": 1.9925302564931265e-06, + "loss": 0.9473, + "step": 7932 + }, + { + "epoch": 0.2, + "learning_rate": 1.992526880352946e-06, + "loss": 0.9531, + "step": 7933 + }, + { + "epoch": 0.2, + "learning_rate": 1.9925235034528325e-06, + "loss": 0.7305, + "step": 7934 + }, + { + "epoch": 0.2, + "learning_rate": 1.99252012579279e-06, + "loss": 0.8438, + "step": 7935 + }, + { + "epoch": 0.2, + "learning_rate": 1.99251674737282e-06, + "loss": 1.0312, + "step": 7936 + }, + { + "epoch": 0.2, + "learning_rate": 1.992513368192926e-06, + "loss": 0.9385, + "step": 7937 + }, + { + "epoch": 0.2, + "learning_rate": 1.99250998825311e-06, + "loss": 1.1953, + "step": 7938 + }, + { + "epoch": 0.2, + "learning_rate": 1.9925066075533746e-06, + "loss": 0.9971, + "step": 7939 + }, + { + "epoch": 0.2, + "learning_rate": 1.992503226093723e-06, + "loss": 0.7983, + "step": 7940 + }, + { + "epoch": 0.2, + "learning_rate": 1.9924998438741566e-06, + "loss": 0.6494, + "step": 7941 + }, + { + "epoch": 0.2, + "learning_rate": 1.9924964608946792e-06, + "loss": 0.9834, + "step": 7942 + }, + { + "epoch": 0.2, + "learning_rate": 1.9924930771552927e-06, + "loss": 0.814, + "step": 7943 + }, + { + "epoch": 0.2, + "learning_rate": 1.9924896926559998e-06, + "loss": 0.8174, + "step": 7944 + }, + { + "epoch": 0.2, + "learning_rate": 1.9924863073968036e-06, + "loss": 1.0469, + "step": 7945 + }, + { + "epoch": 0.2, + "learning_rate": 1.9924829213777057e-06, + "loss": 0.9014, + "step": 7946 + }, + { + "epoch": 0.2, + "learning_rate": 1.99247953459871e-06, + "loss": 0.9668, + "step": 7947 + }, + { + "epoch": 0.2, + "learning_rate": 1.992476147059818e-06, + "loss": 1.1182, + "step": 7948 + }, + { + "epoch": 0.2, + "learning_rate": 1.9924727587610325e-06, + "loss": 0.9082, + "step": 7949 + }, + { + "epoch": 0.2, + "learning_rate": 1.992469369702356e-06, + "loss": 0.752, + "step": 7950 + }, + { + "epoch": 0.2, + "learning_rate": 1.992465979883792e-06, + "loss": 0.9648, + "step": 7951 + }, + { + "epoch": 0.2, + "learning_rate": 1.992462589305342e-06, + "loss": 0.7842, + "step": 7952 + }, + { + "epoch": 0.2, + "learning_rate": 1.9924591979670093e-06, + "loss": 1.0088, + "step": 7953 + }, + { + "epoch": 0.2, + "learning_rate": 1.992455805868796e-06, + "loss": 0.9072, + "step": 7954 + }, + { + "epoch": 0.2, + "learning_rate": 1.992452413010705e-06, + "loss": 0.7559, + "step": 7955 + }, + { + "epoch": 0.2, + "learning_rate": 1.9924490193927385e-06, + "loss": 0.7046, + "step": 7956 + }, + { + "epoch": 0.2, + "learning_rate": 1.9924456250148997e-06, + "loss": 1.124, + "step": 7957 + }, + { + "epoch": 0.2, + "learning_rate": 1.992442229877191e-06, + "loss": 0.8623, + "step": 7958 + }, + { + "epoch": 0.2, + "learning_rate": 1.992438833979615e-06, + "loss": 0.7188, + "step": 7959 + }, + { + "epoch": 0.2, + "learning_rate": 1.992435437322174e-06, + "loss": 0.8945, + "step": 7960 + }, + { + "epoch": 0.2, + "learning_rate": 1.992432039904871e-06, + "loss": 0.9043, + "step": 7961 + }, + { + "epoch": 0.2, + "learning_rate": 1.9924286417277082e-06, + "loss": 0.5986, + "step": 7962 + }, + { + "epoch": 0.2, + "learning_rate": 1.9924252427906884e-06, + "loss": 0.8657, + "step": 7963 + }, + { + "epoch": 0.2, + "learning_rate": 1.9924218430938143e-06, + "loss": 1.0166, + "step": 7964 + }, + { + "epoch": 0.2, + "learning_rate": 1.9924184426370886e-06, + "loss": 0.8242, + "step": 7965 + }, + { + "epoch": 0.2, + "learning_rate": 1.9924150414205137e-06, + "loss": 0.7017, + "step": 7966 + }, + { + "epoch": 0.2, + "learning_rate": 1.992411639444092e-06, + "loss": 0.832, + "step": 7967 + }, + { + "epoch": 0.2, + "learning_rate": 1.9924082367078265e-06, + "loss": 0.7437, + "step": 7968 + }, + { + "epoch": 0.2, + "learning_rate": 1.9924048332117195e-06, + "loss": 0.957, + "step": 7969 + }, + { + "epoch": 0.2, + "learning_rate": 1.992401428955774e-06, + "loss": 0.8711, + "step": 7970 + }, + { + "epoch": 0.2, + "learning_rate": 1.992398023939992e-06, + "loss": 0.7881, + "step": 7971 + }, + { + "epoch": 0.2, + "learning_rate": 1.992394618164377e-06, + "loss": 1.0996, + "step": 7972 + }, + { + "epoch": 0.2, + "learning_rate": 1.9923912116289306e-06, + "loss": 0.8496, + "step": 7973 + }, + { + "epoch": 0.2, + "learning_rate": 1.9923878043336564e-06, + "loss": 0.9082, + "step": 7974 + }, + { + "epoch": 0.2, + "learning_rate": 1.992384396278556e-06, + "loss": 0.8369, + "step": 7975 + }, + { + "epoch": 0.2, + "learning_rate": 1.9923809874636327e-06, + "loss": 0.8545, + "step": 7976 + }, + { + "epoch": 0.2, + "learning_rate": 1.992377577888889e-06, + "loss": 0.9922, + "step": 7977 + }, + { + "epoch": 0.2, + "learning_rate": 1.992374167554327e-06, + "loss": 1.0117, + "step": 7978 + }, + { + "epoch": 0.2, + "learning_rate": 1.9923707564599503e-06, + "loss": 0.8936, + "step": 7979 + }, + { + "epoch": 0.2, + "learning_rate": 1.9923673446057606e-06, + "loss": 0.8311, + "step": 7980 + }, + { + "epoch": 0.2, + "learning_rate": 1.9923639319917607e-06, + "loss": 0.9365, + "step": 7981 + }, + { + "epoch": 0.2, + "learning_rate": 1.9923605186179536e-06, + "loss": 1.0273, + "step": 7982 + }, + { + "epoch": 0.2, + "learning_rate": 1.9923571044843415e-06, + "loss": 0.9302, + "step": 7983 + }, + { + "epoch": 0.2, + "learning_rate": 1.9923536895909273e-06, + "loss": 0.9102, + "step": 7984 + }, + { + "epoch": 0.2, + "learning_rate": 1.992350273937714e-06, + "loss": 0.9902, + "step": 7985 + }, + { + "epoch": 0.2, + "learning_rate": 1.992346857524703e-06, + "loss": 0.875, + "step": 7986 + }, + { + "epoch": 0.2, + "learning_rate": 1.992343440351898e-06, + "loss": 1.0352, + "step": 7987 + }, + { + "epoch": 0.2, + "learning_rate": 1.992340022419301e-06, + "loss": 0.9697, + "step": 7988 + }, + { + "epoch": 0.2, + "learning_rate": 1.992336603726915e-06, + "loss": 0.9707, + "step": 7989 + }, + { + "epoch": 0.2, + "learning_rate": 1.992333184274743e-06, + "loss": 0.9434, + "step": 7990 + }, + { + "epoch": 0.2, + "learning_rate": 1.9923297640627867e-06, + "loss": 1.0381, + "step": 7991 + }, + { + "epoch": 0.2, + "learning_rate": 1.9923263430910488e-06, + "loss": 0.8784, + "step": 7992 + }, + { + "epoch": 0.2, + "learning_rate": 1.9923229213595324e-06, + "loss": 0.8311, + "step": 7993 + }, + { + "epoch": 0.2, + "learning_rate": 1.9923194988682403e-06, + "loss": 0.8408, + "step": 7994 + }, + { + "epoch": 0.2, + "learning_rate": 1.9923160756171744e-06, + "loss": 1.0732, + "step": 7995 + }, + { + "epoch": 0.2, + "learning_rate": 1.992312651606338e-06, + "loss": 0.8271, + "step": 7996 + }, + { + "epoch": 0.2, + "learning_rate": 1.9923092268357333e-06, + "loss": 1.0371, + "step": 7997 + }, + { + "epoch": 0.2, + "learning_rate": 1.992305801305363e-06, + "loss": 0.8193, + "step": 7998 + }, + { + "epoch": 0.21, + "learning_rate": 1.99230237501523e-06, + "loss": 0.9004, + "step": 7999 + }, + { + "epoch": 0.21, + "learning_rate": 1.9922989479653364e-06, + "loss": 0.7939, + "step": 8000 + }, + { + "epoch": 0.21, + "learning_rate": 1.9922955201556853e-06, + "loss": 0.8057, + "step": 8001 + }, + { + "epoch": 0.21, + "learning_rate": 1.992292091586279e-06, + "loss": 0.9766, + "step": 8002 + }, + { + "epoch": 0.21, + "learning_rate": 1.9922886622571204e-06, + "loss": 0.9658, + "step": 8003 + }, + { + "epoch": 0.21, + "learning_rate": 1.992285232168212e-06, + "loss": 0.75, + "step": 8004 + }, + { + "epoch": 0.21, + "learning_rate": 1.9922818013195566e-06, + "loss": 0.9785, + "step": 8005 + }, + { + "epoch": 0.21, + "learning_rate": 1.9922783697111563e-06, + "loss": 0.8662, + "step": 8006 + }, + { + "epoch": 0.21, + "learning_rate": 1.9922749373430145e-06, + "loss": 0.6714, + "step": 8007 + }, + { + "epoch": 0.21, + "learning_rate": 1.992271504215133e-06, + "loss": 1.0996, + "step": 8008 + }, + { + "epoch": 0.21, + "learning_rate": 1.992268070327515e-06, + "loss": 0.8213, + "step": 8009 + }, + { + "epoch": 0.21, + "learning_rate": 1.992264635680163e-06, + "loss": 0.8545, + "step": 8010 + }, + { + "epoch": 0.21, + "learning_rate": 1.9922612002730794e-06, + "loss": 1.041, + "step": 8011 + }, + { + "epoch": 0.21, + "learning_rate": 1.992257764106267e-06, + "loss": 1.0723, + "step": 8012 + }, + { + "epoch": 0.21, + "learning_rate": 1.992254327179729e-06, + "loss": 1.001, + "step": 8013 + }, + { + "epoch": 0.21, + "learning_rate": 1.992250889493467e-06, + "loss": 1.2529, + "step": 8014 + }, + { + "epoch": 0.21, + "learning_rate": 1.992247451047484e-06, + "loss": 0.8394, + "step": 8015 + }, + { + "epoch": 0.21, + "learning_rate": 1.9922440118417833e-06, + "loss": 1.0225, + "step": 8016 + }, + { + "epoch": 0.21, + "learning_rate": 1.9922405718763666e-06, + "loss": 0.9512, + "step": 8017 + }, + { + "epoch": 0.21, + "learning_rate": 1.9922371311512368e-06, + "loss": 1.0469, + "step": 8018 + }, + { + "epoch": 0.21, + "learning_rate": 1.992233689666397e-06, + "loss": 0.9316, + "step": 8019 + }, + { + "epoch": 0.21, + "learning_rate": 1.9922302474218494e-06, + "loss": 0.9663, + "step": 8020 + }, + { + "epoch": 0.21, + "learning_rate": 1.9922268044175966e-06, + "loss": 1.0283, + "step": 8021 + }, + { + "epoch": 0.21, + "learning_rate": 1.992223360653641e-06, + "loss": 0.9014, + "step": 8022 + }, + { + "epoch": 0.21, + "learning_rate": 1.9922199161299865e-06, + "loss": 0.9111, + "step": 8023 + }, + { + "epoch": 0.21, + "learning_rate": 1.992216470846634e-06, + "loss": 0.7363, + "step": 8024 + }, + { + "epoch": 0.21, + "learning_rate": 1.9922130248035873e-06, + "loss": 0.874, + "step": 8025 + }, + { + "epoch": 0.21, + "learning_rate": 1.9922095780008487e-06, + "loss": 0.9521, + "step": 8026 + }, + { + "epoch": 0.21, + "learning_rate": 1.992206130438421e-06, + "loss": 0.9209, + "step": 8027 + }, + { + "epoch": 0.21, + "learning_rate": 1.992202682116307e-06, + "loss": 0.8184, + "step": 8028 + }, + { + "epoch": 0.21, + "learning_rate": 1.9921992330345084e-06, + "loss": 0.7949, + "step": 8029 + }, + { + "epoch": 0.21, + "learning_rate": 1.9921957831930284e-06, + "loss": 0.853, + "step": 8030 + }, + { + "epoch": 0.21, + "learning_rate": 1.99219233259187e-06, + "loss": 0.8652, + "step": 8031 + }, + { + "epoch": 0.21, + "learning_rate": 1.9921888812310354e-06, + "loss": 0.8818, + "step": 8032 + }, + { + "epoch": 0.21, + "learning_rate": 1.9921854291105274e-06, + "loss": 0.7266, + "step": 8033 + }, + { + "epoch": 0.21, + "learning_rate": 1.992181976230349e-06, + "loss": 1.2266, + "step": 8034 + }, + { + "epoch": 0.21, + "learning_rate": 1.9921785225905022e-06, + "loss": 0.8906, + "step": 8035 + }, + { + "epoch": 0.21, + "learning_rate": 1.99217506819099e-06, + "loss": 1.1748, + "step": 8036 + }, + { + "epoch": 0.21, + "learning_rate": 1.992171613031815e-06, + "loss": 1.0283, + "step": 8037 + }, + { + "epoch": 0.21, + "learning_rate": 1.99216815711298e-06, + "loss": 1.0146, + "step": 8038 + }, + { + "epoch": 0.21, + "learning_rate": 1.992164700434487e-06, + "loss": 1.0869, + "step": 8039 + }, + { + "epoch": 0.21, + "learning_rate": 1.9921612429963394e-06, + "loss": 0.7754, + "step": 8040 + }, + { + "epoch": 0.21, + "learning_rate": 1.992157784798539e-06, + "loss": 0.6963, + "step": 8041 + }, + { + "epoch": 0.21, + "learning_rate": 1.9921543258410897e-06, + "loss": 0.8291, + "step": 8042 + }, + { + "epoch": 0.21, + "learning_rate": 1.9921508661239934e-06, + "loss": 1.0674, + "step": 8043 + }, + { + "epoch": 0.21, + "learning_rate": 1.992147405647253e-06, + "loss": 0.7642, + "step": 8044 + }, + { + "epoch": 0.21, + "learning_rate": 1.9921439444108704e-06, + "loss": 0.7529, + "step": 8045 + }, + { + "epoch": 0.21, + "learning_rate": 1.992140482414849e-06, + "loss": 0.9082, + "step": 8046 + }, + { + "epoch": 0.21, + "learning_rate": 1.992137019659191e-06, + "loss": 1.0596, + "step": 8047 + }, + { + "epoch": 0.21, + "learning_rate": 1.9921335561438996e-06, + "loss": 0.8501, + "step": 8048 + }, + { + "epoch": 0.21, + "learning_rate": 1.992130091868977e-06, + "loss": 0.957, + "step": 8049 + }, + { + "epoch": 0.21, + "learning_rate": 1.9921266268344263e-06, + "loss": 1.209, + "step": 8050 + }, + { + "epoch": 0.21, + "learning_rate": 1.9921231610402497e-06, + "loss": 0.835, + "step": 8051 + }, + { + "epoch": 0.21, + "learning_rate": 1.9921196944864498e-06, + "loss": 0.6782, + "step": 8052 + }, + { + "epoch": 0.21, + "learning_rate": 1.99211622717303e-06, + "loss": 1.0127, + "step": 8053 + }, + { + "epoch": 0.21, + "learning_rate": 1.9921127590999916e-06, + "loss": 0.8955, + "step": 8054 + }, + { + "epoch": 0.21, + "learning_rate": 1.992109290267339e-06, + "loss": 0.7397, + "step": 8055 + }, + { + "epoch": 0.21, + "learning_rate": 1.9921058206750733e-06, + "loss": 1.0557, + "step": 8056 + }, + { + "epoch": 0.21, + "learning_rate": 1.992102350323198e-06, + "loss": 1.1055, + "step": 8057 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920988792117157e-06, + "loss": 0.6382, + "step": 8058 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920954073406287e-06, + "loss": 1.0977, + "step": 8059 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920919347099395e-06, + "loss": 1.1797, + "step": 8060 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920884613196515e-06, + "loss": 0.896, + "step": 8061 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920849871697672e-06, + "loss": 1.1133, + "step": 8062 + }, + { + "epoch": 0.21, + "learning_rate": 1.992081512260289e-06, + "loss": 1.0254, + "step": 8063 + }, + { + "epoch": 0.21, + "learning_rate": 1.992078036591219e-06, + "loss": 0.9219, + "step": 8064 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920745601625613e-06, + "loss": 0.666, + "step": 8065 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920710829743173e-06, + "loss": 0.9111, + "step": 8066 + }, + { + "epoch": 0.21, + "learning_rate": 1.99206760502649e-06, + "loss": 0.9756, + "step": 8067 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920641263190824e-06, + "loss": 1.0127, + "step": 8068 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920606468520966e-06, + "loss": 0.9619, + "step": 8069 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920571666255357e-06, + "loss": 0.8535, + "step": 8070 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920536856394027e-06, + "loss": 0.752, + "step": 8071 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920502038936996e-06, + "loss": 0.9883, + "step": 8072 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920467213884287e-06, + "loss": 1.0732, + "step": 8073 + }, + { + "epoch": 0.21, + "learning_rate": 1.992043238123594e-06, + "loss": 0.7256, + "step": 8074 + }, + { + "epoch": 0.21, + "learning_rate": 1.992039754099197e-06, + "loss": 1.1094, + "step": 8075 + }, + { + "epoch": 0.21, + "learning_rate": 1.992036269315241e-06, + "loss": 0.8452, + "step": 8076 + }, + { + "epoch": 0.21, + "learning_rate": 1.992032783771728e-06, + "loss": 0.7515, + "step": 8077 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920292974686612e-06, + "loss": 0.9248, + "step": 8078 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920258104060434e-06, + "loss": 0.8223, + "step": 8079 + }, + { + "epoch": 0.21, + "learning_rate": 1.992022322583877e-06, + "loss": 0.6875, + "step": 8080 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920188340021647e-06, + "loss": 0.7139, + "step": 8081 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920153446609092e-06, + "loss": 1.0894, + "step": 8082 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920118545601134e-06, + "loss": 0.8701, + "step": 8083 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920083636997798e-06, + "loss": 0.8105, + "step": 8084 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920048720799104e-06, + "loss": 0.9727, + "step": 8085 + }, + { + "epoch": 0.21, + "learning_rate": 1.9920013797005087e-06, + "loss": 0.8604, + "step": 8086 + }, + { + "epoch": 0.21, + "learning_rate": 1.9919978865615772e-06, + "loss": 0.709, + "step": 8087 + }, + { + "epoch": 0.21, + "learning_rate": 1.991994392663119e-06, + "loss": 1.3594, + "step": 8088 + }, + { + "epoch": 0.21, + "learning_rate": 1.991990898005136e-06, + "loss": 0.9873, + "step": 8089 + }, + { + "epoch": 0.21, + "learning_rate": 1.991987402587631e-06, + "loss": 0.8179, + "step": 8090 + }, + { + "epoch": 0.21, + "learning_rate": 1.991983906410607e-06, + "loss": 1.0439, + "step": 8091 + }, + { + "epoch": 0.21, + "learning_rate": 1.9919804094740663e-06, + "loss": 0.8594, + "step": 8092 + }, + { + "epoch": 0.21, + "learning_rate": 1.9919769117780124e-06, + "loss": 0.7881, + "step": 8093 + }, + { + "epoch": 0.21, + "learning_rate": 1.991973413322447e-06, + "loss": 0.9629, + "step": 8094 + }, + { + "epoch": 0.21, + "learning_rate": 1.991969914107373e-06, + "loss": 0.8789, + "step": 8095 + }, + { + "epoch": 0.21, + "learning_rate": 1.9919664141327933e-06, + "loss": 0.957, + "step": 8096 + }, + { + "epoch": 0.21, + "learning_rate": 1.991962913398711e-06, + "loss": 1.1064, + "step": 8097 + }, + { + "epoch": 0.21, + "learning_rate": 1.9919594119051275e-06, + "loss": 0.9658, + "step": 8098 + }, + { + "epoch": 0.21, + "learning_rate": 1.991955909652047e-06, + "loss": 0.9531, + "step": 8099 + }, + { + "epoch": 0.21, + "learning_rate": 1.9919524066394714e-06, + "loss": 0.8311, + "step": 8100 + }, + { + "epoch": 0.21, + "learning_rate": 1.991948902867403e-06, + "loss": 0.7354, + "step": 8101 + }, + { + "epoch": 0.21, + "learning_rate": 1.9919453983358453e-06, + "loss": 0.876, + "step": 8102 + }, + { + "epoch": 0.21, + "learning_rate": 1.9919418930448006e-06, + "loss": 1.1562, + "step": 8103 + }, + { + "epoch": 0.21, + "learning_rate": 1.9919383869942715e-06, + "loss": 0.7207, + "step": 8104 + }, + { + "epoch": 0.21, + "learning_rate": 1.991934880184261e-06, + "loss": 0.8721, + "step": 8105 + }, + { + "epoch": 0.21, + "learning_rate": 1.9919313726147712e-06, + "loss": 1.0186, + "step": 8106 + }, + { + "epoch": 0.21, + "learning_rate": 1.9919278642858052e-06, + "loss": 1.0332, + "step": 8107 + }, + { + "epoch": 0.21, + "learning_rate": 1.9919243551973658e-06, + "loss": 1.1494, + "step": 8108 + }, + { + "epoch": 0.21, + "learning_rate": 1.9919208453494558e-06, + "loss": 1.1309, + "step": 8109 + }, + { + "epoch": 0.21, + "learning_rate": 1.9919173347420774e-06, + "loss": 0.9307, + "step": 8110 + }, + { + "epoch": 0.21, + "learning_rate": 1.9919138233752333e-06, + "loss": 0.8467, + "step": 8111 + }, + { + "epoch": 0.21, + "learning_rate": 1.9919103112489262e-06, + "loss": 0.8936, + "step": 8112 + }, + { + "epoch": 0.21, + "learning_rate": 1.9919067983631597e-06, + "loss": 0.8057, + "step": 8113 + }, + { + "epoch": 0.21, + "learning_rate": 1.9919032847179354e-06, + "loss": 0.9043, + "step": 8114 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918997703132562e-06, + "loss": 0.8242, + "step": 8115 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918962551491252e-06, + "loss": 0.8071, + "step": 8116 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918927392255445e-06, + "loss": 0.9277, + "step": 8117 + }, + { + "epoch": 0.21, + "learning_rate": 1.991889222542518e-06, + "loss": 0.625, + "step": 8118 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918857051000465e-06, + "loss": 0.7041, + "step": 8119 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918821868981343e-06, + "loss": 0.7625, + "step": 8120 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918786679367834e-06, + "loss": 0.7959, + "step": 8121 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918751482159964e-06, + "loss": 1.1445, + "step": 8122 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918716277357765e-06, + "loss": 0.8276, + "step": 8123 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918681064961263e-06, + "loss": 0.876, + "step": 8124 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918645844970476e-06, + "loss": 0.9932, + "step": 8125 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918610617385446e-06, + "loss": 0.707, + "step": 8126 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918575382206185e-06, + "loss": 0.9775, + "step": 8127 + }, + { + "epoch": 0.21, + "learning_rate": 1.991854013943273e-06, + "loss": 0.8589, + "step": 8128 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918504889065107e-06, + "loss": 1.0469, + "step": 8129 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918469631103336e-06, + "loss": 0.9775, + "step": 8130 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918434365547453e-06, + "loss": 1.0781, + "step": 8131 + }, + { + "epoch": 0.21, + "learning_rate": 1.991839909239748e-06, + "loss": 0.8945, + "step": 8132 + }, + { + "epoch": 0.21, + "learning_rate": 1.991836381165344e-06, + "loss": 0.918, + "step": 8133 + }, + { + "epoch": 0.21, + "learning_rate": 1.991832852331537e-06, + "loss": 1.0264, + "step": 8134 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918293227383294e-06, + "loss": 0.8662, + "step": 8135 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918257923857232e-06, + "loss": 0.9277, + "step": 8136 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918222612737216e-06, + "loss": 0.9492, + "step": 8137 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918187294023277e-06, + "loss": 0.8223, + "step": 8138 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918151967715435e-06, + "loss": 0.8042, + "step": 8139 + }, + { + "epoch": 0.21, + "learning_rate": 1.991811663381372e-06, + "loss": 0.7676, + "step": 8140 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918081292318163e-06, + "loss": 0.7969, + "step": 8141 + }, + { + "epoch": 0.21, + "learning_rate": 1.9918045943228784e-06, + "loss": 1.002, + "step": 8142 + }, + { + "epoch": 0.21, + "learning_rate": 1.991801058654561e-06, + "loss": 1.1504, + "step": 8143 + }, + { + "epoch": 0.21, + "learning_rate": 1.991797522226868e-06, + "loss": 0.9043, + "step": 8144 + }, + { + "epoch": 0.21, + "learning_rate": 1.9917939850398006e-06, + "loss": 0.6736, + "step": 8145 + }, + { + "epoch": 0.21, + "learning_rate": 1.991790447093362e-06, + "loss": 0.7134, + "step": 8146 + }, + { + "epoch": 0.21, + "learning_rate": 1.9917869083875558e-06, + "loss": 1.0957, + "step": 8147 + }, + { + "epoch": 0.21, + "learning_rate": 1.9917833689223833e-06, + "loss": 0.9678, + "step": 8148 + }, + { + "epoch": 0.21, + "learning_rate": 1.991779828697848e-06, + "loss": 0.9453, + "step": 8149 + }, + { + "epoch": 0.21, + "learning_rate": 1.9917762877139524e-06, + "loss": 0.7793, + "step": 8150 + }, + { + "epoch": 0.21, + "learning_rate": 1.9917727459706996e-06, + "loss": 0.9775, + "step": 8151 + }, + { + "epoch": 0.21, + "learning_rate": 1.991769203468092e-06, + "loss": 0.9639, + "step": 8152 + }, + { + "epoch": 0.21, + "learning_rate": 1.9917656602061323e-06, + "loss": 0.75, + "step": 8153 + }, + { + "epoch": 0.21, + "learning_rate": 1.991762116184823e-06, + "loss": 0.6724, + "step": 8154 + }, + { + "epoch": 0.21, + "learning_rate": 1.991758571404167e-06, + "loss": 1.1475, + "step": 8155 + }, + { + "epoch": 0.21, + "learning_rate": 1.9917550258641675e-06, + "loss": 1.0518, + "step": 8156 + }, + { + "epoch": 0.21, + "learning_rate": 1.991751479564826e-06, + "loss": 1.0938, + "step": 8157 + }, + { + "epoch": 0.21, + "learning_rate": 1.9917479325061472e-06, + "loss": 1.1475, + "step": 8158 + }, + { + "epoch": 0.21, + "learning_rate": 1.9917443846881317e-06, + "loss": 0.9536, + "step": 8159 + }, + { + "epoch": 0.21, + "learning_rate": 1.9917408361107833e-06, + "loss": 0.8506, + "step": 8160 + }, + { + "epoch": 0.21, + "learning_rate": 1.9917372867741045e-06, + "loss": 0.9541, + "step": 8161 + }, + { + "epoch": 0.21, + "learning_rate": 1.9917337366780985e-06, + "loss": 0.8994, + "step": 8162 + }, + { + "epoch": 0.21, + "learning_rate": 1.991730185822767e-06, + "loss": 0.9023, + "step": 8163 + }, + { + "epoch": 0.21, + "learning_rate": 1.9917266342081136e-06, + "loss": 0.8643, + "step": 8164 + }, + { + "epoch": 0.21, + "learning_rate": 1.991723081834141e-06, + "loss": 0.8945, + "step": 8165 + }, + { + "epoch": 0.21, + "learning_rate": 1.9917195287008508e-06, + "loss": 1.1543, + "step": 8166 + }, + { + "epoch": 0.21, + "learning_rate": 1.9917159748082474e-06, + "loss": 0.8555, + "step": 8167 + }, + { + "epoch": 0.21, + "learning_rate": 1.991712420156332e-06, + "loss": 0.7251, + "step": 8168 + }, + { + "epoch": 0.21, + "learning_rate": 1.9917088647451085e-06, + "loss": 0.6892, + "step": 8169 + }, + { + "epoch": 0.21, + "learning_rate": 1.991705308574579e-06, + "loss": 0.9229, + "step": 8170 + }, + { + "epoch": 0.21, + "learning_rate": 1.9917017516447463e-06, + "loss": 0.7617, + "step": 8171 + }, + { + "epoch": 0.21, + "learning_rate": 1.9916981939556133e-06, + "loss": 0.7363, + "step": 8172 + }, + { + "epoch": 0.21, + "learning_rate": 1.991694635507182e-06, + "loss": 0.9131, + "step": 8173 + }, + { + "epoch": 0.21, + "learning_rate": 1.9916910762994564e-06, + "loss": 1.0146, + "step": 8174 + }, + { + "epoch": 0.21, + "learning_rate": 1.9916875163324384e-06, + "loss": 0.8516, + "step": 8175 + }, + { + "epoch": 0.21, + "learning_rate": 1.9916839556061307e-06, + "loss": 0.9346, + "step": 8176 + }, + { + "epoch": 0.21, + "learning_rate": 1.9916803941205363e-06, + "loss": 0.6929, + "step": 8177 + }, + { + "epoch": 0.21, + "learning_rate": 1.991676831875658e-06, + "loss": 0.7659, + "step": 8178 + }, + { + "epoch": 0.21, + "learning_rate": 1.9916732688714977e-06, + "loss": 0.7939, + "step": 8179 + }, + { + "epoch": 0.21, + "learning_rate": 1.9916697051080594e-06, + "loss": 0.7644, + "step": 8180 + }, + { + "epoch": 0.21, + "learning_rate": 1.9916661405853454e-06, + "loss": 0.7583, + "step": 8181 + }, + { + "epoch": 0.21, + "learning_rate": 1.9916625753033574e-06, + "loss": 0.8613, + "step": 8182 + }, + { + "epoch": 0.21, + "learning_rate": 1.9916590092620997e-06, + "loss": 0.917, + "step": 8183 + }, + { + "epoch": 0.21, + "learning_rate": 1.991655442461574e-06, + "loss": 0.9082, + "step": 8184 + }, + { + "epoch": 0.21, + "learning_rate": 1.9916518749017835e-06, + "loss": 0.751, + "step": 8185 + }, + { + "epoch": 0.21, + "learning_rate": 1.99164830658273e-06, + "loss": 1.1953, + "step": 8186 + }, + { + "epoch": 0.21, + "learning_rate": 1.991644737504418e-06, + "loss": 0.8516, + "step": 8187 + }, + { + "epoch": 0.21, + "learning_rate": 1.9916411676668488e-06, + "loss": 1.0576, + "step": 8188 + }, + { + "epoch": 0.21, + "learning_rate": 1.9916375970700255e-06, + "loss": 1.041, + "step": 8189 + }, + { + "epoch": 0.21, + "learning_rate": 1.991634025713951e-06, + "loss": 0.9463, + "step": 8190 + }, + { + "epoch": 0.21, + "learning_rate": 1.991630453598628e-06, + "loss": 1.0146, + "step": 8191 + }, + { + "epoch": 0.21, + "learning_rate": 1.9916268807240592e-06, + "loss": 0.9287, + "step": 8192 + }, + { + "epoch": 0.21, + "learning_rate": 1.991623307090247e-06, + "loss": 0.9111, + "step": 8193 + }, + { + "epoch": 0.21, + "learning_rate": 1.9916197326971942e-06, + "loss": 1.0986, + "step": 8194 + }, + { + "epoch": 0.21, + "learning_rate": 1.9916161575449045e-06, + "loss": 0.7168, + "step": 8195 + }, + { + "epoch": 0.21, + "learning_rate": 1.9916125816333794e-06, + "loss": 0.7607, + "step": 8196 + }, + { + "epoch": 0.21, + "learning_rate": 1.991609004962622e-06, + "loss": 0.9766, + "step": 8197 + }, + { + "epoch": 0.21, + "learning_rate": 1.991605427532636e-06, + "loss": 0.9082, + "step": 8198 + }, + { + "epoch": 0.21, + "learning_rate": 1.9916018493434227e-06, + "loss": 0.7344, + "step": 8199 + }, + { + "epoch": 0.21, + "learning_rate": 1.9915982703949854e-06, + "loss": 0.915, + "step": 8200 + }, + { + "epoch": 0.21, + "learning_rate": 1.991594690687327e-06, + "loss": 0.8281, + "step": 8201 + }, + { + "epoch": 0.21, + "learning_rate": 1.99159111022045e-06, + "loss": 1.0146, + "step": 8202 + }, + { + "epoch": 0.21, + "learning_rate": 1.9915875289943576e-06, + "loss": 0.749, + "step": 8203 + }, + { + "epoch": 0.21, + "learning_rate": 1.9915839470090523e-06, + "loss": 0.9072, + "step": 8204 + }, + { + "epoch": 0.21, + "learning_rate": 1.9915803642645365e-06, + "loss": 0.689, + "step": 8205 + }, + { + "epoch": 0.21, + "learning_rate": 1.9915767807608132e-06, + "loss": 1.0322, + "step": 8206 + }, + { + "epoch": 0.21, + "learning_rate": 1.9915731964978854e-06, + "loss": 0.7505, + "step": 8207 + }, + { + "epoch": 0.21, + "learning_rate": 1.9915696114757552e-06, + "loss": 0.918, + "step": 8208 + }, + { + "epoch": 0.21, + "learning_rate": 1.991566025694426e-06, + "loss": 0.9268, + "step": 8209 + }, + { + "epoch": 0.21, + "learning_rate": 1.9915624391539003e-06, + "loss": 0.9697, + "step": 8210 + }, + { + "epoch": 0.21, + "learning_rate": 1.9915588518541807e-06, + "loss": 1.0342, + "step": 8211 + }, + { + "epoch": 0.21, + "learning_rate": 1.99155526379527e-06, + "loss": 0.7822, + "step": 8212 + }, + { + "epoch": 0.21, + "learning_rate": 1.991551674977171e-06, + "loss": 1.1123, + "step": 8213 + }, + { + "epoch": 0.21, + "learning_rate": 1.991548085399887e-06, + "loss": 0.7744, + "step": 8214 + }, + { + "epoch": 0.21, + "learning_rate": 1.9915444950634195e-06, + "loss": 0.9336, + "step": 8215 + }, + { + "epoch": 0.21, + "learning_rate": 1.9915409039677726e-06, + "loss": 1.0615, + "step": 8216 + }, + { + "epoch": 0.21, + "learning_rate": 1.9915373121129486e-06, + "loss": 0.9551, + "step": 8217 + }, + { + "epoch": 0.21, + "learning_rate": 1.9915337194989493e-06, + "loss": 1.0723, + "step": 8218 + }, + { + "epoch": 0.21, + "learning_rate": 1.9915301261257786e-06, + "loss": 0.8506, + "step": 8219 + }, + { + "epoch": 0.21, + "learning_rate": 1.991526531993439e-06, + "loss": 0.9951, + "step": 8220 + }, + { + "epoch": 0.21, + "learning_rate": 1.9915229371019328e-06, + "loss": 0.8877, + "step": 8221 + }, + { + "epoch": 0.21, + "learning_rate": 1.9915193414512632e-06, + "loss": 0.7739, + "step": 8222 + }, + { + "epoch": 0.21, + "learning_rate": 1.991515745041433e-06, + "loss": 0.7705, + "step": 8223 + }, + { + "epoch": 0.21, + "learning_rate": 1.9915121478724444e-06, + "loss": 0.9678, + "step": 8224 + }, + { + "epoch": 0.21, + "learning_rate": 1.991508549944301e-06, + "loss": 0.7607, + "step": 8225 + }, + { + "epoch": 0.21, + "learning_rate": 1.9915049512570052e-06, + "loss": 0.9004, + "step": 8226 + }, + { + "epoch": 0.21, + "learning_rate": 1.991501351810559e-06, + "loss": 1.084, + "step": 8227 + }, + { + "epoch": 0.21, + "learning_rate": 1.991497751604966e-06, + "loss": 0.6821, + "step": 8228 + }, + { + "epoch": 0.21, + "learning_rate": 1.991494150640229e-06, + "loss": 0.9287, + "step": 8229 + }, + { + "epoch": 0.21, + "learning_rate": 1.9914905489163507e-06, + "loss": 0.6323, + "step": 8230 + }, + { + "epoch": 0.21, + "learning_rate": 1.9914869464333334e-06, + "loss": 0.9561, + "step": 8231 + }, + { + "epoch": 0.21, + "learning_rate": 1.99148334319118e-06, + "loss": 1.0176, + "step": 8232 + }, + { + "epoch": 0.21, + "learning_rate": 1.9914797391898936e-06, + "loss": 0.7373, + "step": 8233 + }, + { + "epoch": 0.21, + "learning_rate": 1.9914761344294766e-06, + "loss": 0.8857, + "step": 8234 + }, + { + "epoch": 0.21, + "learning_rate": 1.991472528909932e-06, + "loss": 1.0557, + "step": 8235 + }, + { + "epoch": 0.21, + "learning_rate": 1.9914689226312624e-06, + "loss": 0.9814, + "step": 8236 + }, + { + "epoch": 0.21, + "learning_rate": 1.9914653155934706e-06, + "loss": 1.0254, + "step": 8237 + }, + { + "epoch": 0.21, + "learning_rate": 1.9914617077965595e-06, + "loss": 0.6997, + "step": 8238 + }, + { + "epoch": 0.21, + "learning_rate": 1.991458099240532e-06, + "loss": 0.7012, + "step": 8239 + }, + { + "epoch": 0.21, + "learning_rate": 1.9914544899253906e-06, + "loss": 0.8159, + "step": 8240 + }, + { + "epoch": 0.21, + "learning_rate": 1.9914508798511374e-06, + "loss": 0.8535, + "step": 8241 + }, + { + "epoch": 0.21, + "learning_rate": 1.991447269017776e-06, + "loss": 0.8916, + "step": 8242 + }, + { + "epoch": 0.21, + "learning_rate": 1.99144365742531e-06, + "loss": 0.874, + "step": 8243 + }, + { + "epoch": 0.21, + "learning_rate": 1.9914400450737406e-06, + "loss": 0.9453, + "step": 8244 + }, + { + "epoch": 0.21, + "learning_rate": 1.9914364319630708e-06, + "loss": 0.6169, + "step": 8245 + }, + { + "epoch": 0.21, + "learning_rate": 1.991432818093304e-06, + "loss": 1.0771, + "step": 8246 + }, + { + "epoch": 0.21, + "learning_rate": 1.991429203464443e-06, + "loss": 0.6748, + "step": 8247 + }, + { + "epoch": 0.21, + "learning_rate": 1.99142558807649e-06, + "loss": 0.9775, + "step": 8248 + }, + { + "epoch": 0.21, + "learning_rate": 1.9914219719294474e-06, + "loss": 0.7437, + "step": 8249 + }, + { + "epoch": 0.21, + "learning_rate": 1.991418355023319e-06, + "loss": 0.9404, + "step": 8250 + }, + { + "epoch": 0.21, + "learning_rate": 1.9914147373581074e-06, + "loss": 0.7734, + "step": 8251 + }, + { + "epoch": 0.21, + "learning_rate": 1.991411118933815e-06, + "loss": 0.9658, + "step": 8252 + }, + { + "epoch": 0.21, + "learning_rate": 1.991407499750445e-06, + "loss": 1.1846, + "step": 8253 + }, + { + "epoch": 0.21, + "learning_rate": 1.9914038798079994e-06, + "loss": 0.9736, + "step": 8254 + }, + { + "epoch": 0.21, + "learning_rate": 1.9914002591064812e-06, + "loss": 0.8699, + "step": 8255 + }, + { + "epoch": 0.21, + "learning_rate": 1.991396637645894e-06, + "loss": 0.9971, + "step": 8256 + }, + { + "epoch": 0.21, + "learning_rate": 1.9913930154262396e-06, + "loss": 1.1465, + "step": 8257 + }, + { + "epoch": 0.21, + "learning_rate": 1.9913893924475216e-06, + "loss": 0.937, + "step": 8258 + }, + { + "epoch": 0.21, + "learning_rate": 1.9913857687097418e-06, + "loss": 0.9912, + "step": 8259 + }, + { + "epoch": 0.21, + "learning_rate": 1.9913821442129036e-06, + "loss": 0.875, + "step": 8260 + }, + { + "epoch": 0.21, + "learning_rate": 1.99137851895701e-06, + "loss": 0.9844, + "step": 8261 + }, + { + "epoch": 0.21, + "learning_rate": 1.9913748929420634e-06, + "loss": 1.1055, + "step": 8262 + }, + { + "epoch": 0.21, + "learning_rate": 1.991371266168066e-06, + "loss": 1.0674, + "step": 8263 + }, + { + "epoch": 0.21, + "learning_rate": 1.991367638635022e-06, + "loss": 0.9824, + "step": 8264 + }, + { + "epoch": 0.21, + "learning_rate": 1.991364010342933e-06, + "loss": 0.8037, + "step": 8265 + }, + { + "epoch": 0.21, + "learning_rate": 1.9913603812918023e-06, + "loss": 0.7632, + "step": 8266 + }, + { + "epoch": 0.21, + "learning_rate": 1.9913567514816327e-06, + "loss": 1.002, + "step": 8267 + }, + { + "epoch": 0.21, + "learning_rate": 1.9913531209124263e-06, + "loss": 0.7412, + "step": 8268 + }, + { + "epoch": 0.21, + "learning_rate": 1.991349489584187e-06, + "loss": 0.9404, + "step": 8269 + }, + { + "epoch": 0.21, + "learning_rate": 1.9913458574969162e-06, + "loss": 0.8672, + "step": 8270 + }, + { + "epoch": 0.21, + "learning_rate": 1.991342224650618e-06, + "loss": 0.8008, + "step": 8271 + }, + { + "epoch": 0.21, + "learning_rate": 1.9913385910452945e-06, + "loss": 0.9385, + "step": 8272 + }, + { + "epoch": 0.21, + "learning_rate": 1.991334956680949e-06, + "loss": 1.0371, + "step": 8273 + }, + { + "epoch": 0.21, + "learning_rate": 1.9913313215575835e-06, + "loss": 0.9912, + "step": 8274 + }, + { + "epoch": 0.21, + "learning_rate": 1.9913276856752016e-06, + "loss": 1.0137, + "step": 8275 + }, + { + "epoch": 0.21, + "learning_rate": 1.991324049033805e-06, + "loss": 0.8506, + "step": 8276 + }, + { + "epoch": 0.21, + "learning_rate": 1.9913204116333976e-06, + "loss": 0.6814, + "step": 8277 + }, + { + "epoch": 0.21, + "learning_rate": 1.991316773473982e-06, + "loss": 1.0811, + "step": 8278 + }, + { + "epoch": 0.21, + "learning_rate": 1.9913131345555603e-06, + "loss": 0.9014, + "step": 8279 + }, + { + "epoch": 0.21, + "learning_rate": 1.991309494878136e-06, + "loss": 1.0176, + "step": 8280 + }, + { + "epoch": 0.21, + "learning_rate": 1.9913058544417113e-06, + "loss": 0.96, + "step": 8281 + }, + { + "epoch": 0.21, + "learning_rate": 1.991302213246289e-06, + "loss": 0.8994, + "step": 8282 + }, + { + "epoch": 0.21, + "learning_rate": 1.991298571291873e-06, + "loss": 1.042, + "step": 8283 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912949285784648e-06, + "loss": 0.8965, + "step": 8284 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912912851060675e-06, + "loss": 0.6812, + "step": 8285 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912876408746843e-06, + "loss": 0.8296, + "step": 8286 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912839958843176e-06, + "loss": 1.0537, + "step": 8287 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912803501349704e-06, + "loss": 0.6904, + "step": 8288 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912767036266453e-06, + "loss": 0.8652, + "step": 8289 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912730563593457e-06, + "loss": 1.04, + "step": 8290 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912694083330736e-06, + "loss": 0.7061, + "step": 8291 + }, + { + "epoch": 0.21, + "learning_rate": 1.991265759547832e-06, + "loss": 0.8926, + "step": 8292 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912621100036235e-06, + "loss": 0.7725, + "step": 8293 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912584597004514e-06, + "loss": 0.8662, + "step": 8294 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912548086383184e-06, + "loss": 0.9402, + "step": 8295 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912511568172273e-06, + "loss": 0.7788, + "step": 8296 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912475042371807e-06, + "loss": 0.9844, + "step": 8297 + }, + { + "epoch": 0.21, + "learning_rate": 1.991243850898181e-06, + "loss": 0.6172, + "step": 8298 + }, + { + "epoch": 0.21, + "learning_rate": 1.991240196800232e-06, + "loss": 0.9609, + "step": 8299 + }, + { + "epoch": 0.21, + "learning_rate": 1.991236541943336e-06, + "loss": 0.8677, + "step": 8300 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912328863274953e-06, + "loss": 0.9014, + "step": 8301 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912292299527136e-06, + "loss": 0.7817, + "step": 8302 + }, + { + "epoch": 0.21, + "learning_rate": 1.991225572818993e-06, + "loss": 0.9121, + "step": 8303 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912219149263366e-06, + "loss": 1.1172, + "step": 8304 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912182562747472e-06, + "loss": 0.813, + "step": 8305 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912145968642274e-06, + "loss": 1.0986, + "step": 8306 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912109366947804e-06, + "loss": 0.6729, + "step": 8307 + }, + { + "epoch": 0.21, + "learning_rate": 1.991207275766409e-06, + "loss": 1.1035, + "step": 8308 + }, + { + "epoch": 0.21, + "learning_rate": 1.9912036140791153e-06, + "loss": 0.6245, + "step": 8309 + }, + { + "epoch": 0.21, + "learning_rate": 1.9911999516329026e-06, + "loss": 0.8379, + "step": 8310 + }, + { + "epoch": 0.21, + "learning_rate": 1.991196288427774e-06, + "loss": 0.8701, + "step": 8311 + }, + { + "epoch": 0.21, + "learning_rate": 1.9911926244637315e-06, + "loss": 1.1504, + "step": 8312 + }, + { + "epoch": 0.21, + "learning_rate": 1.9911889597407786e-06, + "loss": 1.0996, + "step": 8313 + }, + { + "epoch": 0.21, + "learning_rate": 1.991185294258918e-06, + "loss": 0.8223, + "step": 8314 + }, + { + "epoch": 0.21, + "learning_rate": 1.9911816280181523e-06, + "loss": 1.0195, + "step": 8315 + }, + { + "epoch": 0.21, + "learning_rate": 1.9911779610184845e-06, + "loss": 0.9121, + "step": 8316 + }, + { + "epoch": 0.21, + "learning_rate": 1.991174293259917e-06, + "loss": 0.9336, + "step": 8317 + }, + { + "epoch": 0.21, + "learning_rate": 1.9911706247424534e-06, + "loss": 0.96, + "step": 8318 + }, + { + "epoch": 0.21, + "learning_rate": 1.9911669554660957e-06, + "loss": 0.7017, + "step": 8319 + }, + { + "epoch": 0.21, + "learning_rate": 1.991163285430847e-06, + "loss": 0.915, + "step": 8320 + }, + { + "epoch": 0.21, + "learning_rate": 1.9911596146367104e-06, + "loss": 0.8701, + "step": 8321 + }, + { + "epoch": 0.21, + "learning_rate": 1.9911559430836886e-06, + "loss": 0.8809, + "step": 8322 + }, + { + "epoch": 0.21, + "learning_rate": 1.9911522707717838e-06, + "loss": 0.8496, + "step": 8323 + }, + { + "epoch": 0.21, + "learning_rate": 1.9911485977009993e-06, + "loss": 0.9121, + "step": 8324 + }, + { + "epoch": 0.21, + "learning_rate": 1.9911449238713384e-06, + "loss": 0.8135, + "step": 8325 + }, + { + "epoch": 0.21, + "learning_rate": 1.9911412492828026e-06, + "loss": 0.7778, + "step": 8326 + }, + { + "epoch": 0.21, + "learning_rate": 1.991137573935396e-06, + "loss": 0.9805, + "step": 8327 + }, + { + "epoch": 0.21, + "learning_rate": 1.991133897829121e-06, + "loss": 0.9189, + "step": 8328 + }, + { + "epoch": 0.21, + "learning_rate": 1.9911302209639805e-06, + "loss": 0.9473, + "step": 8329 + }, + { + "epoch": 0.21, + "learning_rate": 1.9911265433399767e-06, + "loss": 0.77, + "step": 8330 + }, + { + "epoch": 0.21, + "learning_rate": 1.991122864957113e-06, + "loss": 0.9883, + "step": 8331 + }, + { + "epoch": 0.21, + "learning_rate": 1.9911191858153928e-06, + "loss": 0.9756, + "step": 8332 + }, + { + "epoch": 0.21, + "learning_rate": 1.9911155059148173e-06, + "loss": 0.8428, + "step": 8333 + }, + { + "epoch": 0.21, + "learning_rate": 1.9911118252553905e-06, + "loss": 0.9375, + "step": 8334 + }, + { + "epoch": 0.21, + "learning_rate": 1.991108143837115e-06, + "loss": 0.8662, + "step": 8335 + }, + { + "epoch": 0.21, + "learning_rate": 1.9911044616599935e-06, + "loss": 0.7402, + "step": 8336 + }, + { + "epoch": 0.21, + "learning_rate": 1.991100778724029e-06, + "loss": 1.2109, + "step": 8337 + }, + { + "epoch": 0.21, + "learning_rate": 1.9910970950292244e-06, + "loss": 0.835, + "step": 8338 + }, + { + "epoch": 0.21, + "learning_rate": 1.991093410575582e-06, + "loss": 1.1143, + "step": 8339 + }, + { + "epoch": 0.21, + "learning_rate": 1.991089725363105e-06, + "loss": 0.9326, + "step": 8340 + }, + { + "epoch": 0.21, + "learning_rate": 1.991086039391796e-06, + "loss": 0.791, + "step": 8341 + }, + { + "epoch": 0.21, + "learning_rate": 1.9910823526616583e-06, + "loss": 0.7998, + "step": 8342 + }, + { + "epoch": 0.21, + "learning_rate": 1.9910786651726947e-06, + "loss": 0.9805, + "step": 8343 + }, + { + "epoch": 0.21, + "learning_rate": 1.9910749769249068e-06, + "loss": 0.8174, + "step": 8344 + }, + { + "epoch": 0.21, + "learning_rate": 1.9910712879182993e-06, + "loss": 0.8223, + "step": 8345 + }, + { + "epoch": 0.21, + "learning_rate": 1.9910675981528736e-06, + "loss": 0.9521, + "step": 8346 + }, + { + "epoch": 0.21, + "learning_rate": 1.991063907628633e-06, + "loss": 0.9023, + "step": 8347 + }, + { + "epoch": 0.21, + "learning_rate": 1.9910602163455805e-06, + "loss": 0.9766, + "step": 8348 + }, + { + "epoch": 0.21, + "learning_rate": 1.9910565243037186e-06, + "loss": 0.8867, + "step": 8349 + }, + { + "epoch": 0.21, + "learning_rate": 1.9910528315030503e-06, + "loss": 0.998, + "step": 8350 + }, + { + "epoch": 0.21, + "learning_rate": 1.9910491379435785e-06, + "loss": 0.9248, + "step": 8351 + }, + { + "epoch": 0.21, + "learning_rate": 1.991045443625306e-06, + "loss": 0.6685, + "step": 8352 + }, + { + "epoch": 0.21, + "learning_rate": 1.9910417485482356e-06, + "loss": 0.6826, + "step": 8353 + }, + { + "epoch": 0.21, + "learning_rate": 1.99103805271237e-06, + "loss": 1.1162, + "step": 8354 + }, + { + "epoch": 0.21, + "learning_rate": 1.991034356117712e-06, + "loss": 0.874, + "step": 8355 + }, + { + "epoch": 0.21, + "learning_rate": 1.991030658764265e-06, + "loss": 0.8721, + "step": 8356 + }, + { + "epoch": 0.21, + "learning_rate": 1.9910269606520308e-06, + "loss": 0.8506, + "step": 8357 + }, + { + "epoch": 0.21, + "learning_rate": 1.9910232617810136e-06, + "loss": 1.1592, + "step": 8358 + }, + { + "epoch": 0.21, + "learning_rate": 1.9910195621512145e-06, + "loss": 0.811, + "step": 8359 + }, + { + "epoch": 0.21, + "learning_rate": 1.991015861762638e-06, + "loss": 0.9463, + "step": 8360 + }, + { + "epoch": 0.21, + "learning_rate": 1.9910121606152857e-06, + "loss": 1.0596, + "step": 8361 + }, + { + "epoch": 0.21, + "learning_rate": 1.9910084587091615e-06, + "loss": 0.915, + "step": 8362 + }, + { + "epoch": 0.21, + "learning_rate": 1.9910047560442676e-06, + "loss": 0.8501, + "step": 8363 + }, + { + "epoch": 0.21, + "learning_rate": 1.9910010526206067e-06, + "loss": 1.0576, + "step": 8364 + }, + { + "epoch": 0.21, + "learning_rate": 1.9909973484381818e-06, + "loss": 1.0166, + "step": 8365 + }, + { + "epoch": 0.21, + "learning_rate": 1.990993643496996e-06, + "loss": 0.9458, + "step": 8366 + }, + { + "epoch": 0.21, + "learning_rate": 1.990989937797052e-06, + "loss": 0.8438, + "step": 8367 + }, + { + "epoch": 0.21, + "learning_rate": 1.990986231338352e-06, + "loss": 0.8047, + "step": 8368 + }, + { + "epoch": 0.21, + "learning_rate": 1.9909825241209e-06, + "loss": 0.9365, + "step": 8369 + }, + { + "epoch": 0.21, + "learning_rate": 1.9909788161446985e-06, + "loss": 1.0107, + "step": 8370 + }, + { + "epoch": 0.21, + "learning_rate": 1.9909751074097497e-06, + "loss": 1.1514, + "step": 8371 + }, + { + "epoch": 0.21, + "learning_rate": 1.990971397916057e-06, + "loss": 0.915, + "step": 8372 + }, + { + "epoch": 0.21, + "learning_rate": 1.9909676876636226e-06, + "loss": 0.7808, + "step": 8373 + }, + { + "epoch": 0.21, + "learning_rate": 1.9909639766524503e-06, + "loss": 1.0, + "step": 8374 + }, + { + "epoch": 0.21, + "learning_rate": 1.9909602648825418e-06, + "loss": 0.9209, + "step": 8375 + }, + { + "epoch": 0.21, + "learning_rate": 1.9909565523539014e-06, + "loss": 0.8564, + "step": 8376 + }, + { + "epoch": 0.21, + "learning_rate": 1.9909528390665304e-06, + "loss": 1.0977, + "step": 8377 + }, + { + "epoch": 0.21, + "learning_rate": 1.990949125020433e-06, + "loss": 0.998, + "step": 8378 + }, + { + "epoch": 0.21, + "learning_rate": 1.990945410215611e-06, + "loss": 0.7964, + "step": 8379 + }, + { + "epoch": 0.21, + "learning_rate": 1.990941694652068e-06, + "loss": 0.9058, + "step": 8380 + }, + { + "epoch": 0.21, + "learning_rate": 1.990937978329806e-06, + "loss": 0.7168, + "step": 8381 + }, + { + "epoch": 0.21, + "learning_rate": 1.990934261248829e-06, + "loss": 1.0156, + "step": 8382 + }, + { + "epoch": 0.21, + "learning_rate": 1.9909305434091387e-06, + "loss": 1.1191, + "step": 8383 + }, + { + "epoch": 0.21, + "learning_rate": 1.9909268248107386e-06, + "loss": 0.8091, + "step": 8384 + }, + { + "epoch": 0.21, + "learning_rate": 1.9909231054536316e-06, + "loss": 0.6785, + "step": 8385 + }, + { + "epoch": 0.21, + "learning_rate": 1.9909193853378202e-06, + "loss": 0.7217, + "step": 8386 + }, + { + "epoch": 0.21, + "learning_rate": 1.9909156644633075e-06, + "loss": 0.8594, + "step": 8387 + }, + { + "epoch": 0.21, + "learning_rate": 1.990911942830096e-06, + "loss": 1.0547, + "step": 8388 + }, + { + "epoch": 0.22, + "learning_rate": 1.990908220438189e-06, + "loss": 0.9326, + "step": 8389 + }, + { + "epoch": 0.22, + "learning_rate": 1.990904497287589e-06, + "loss": 0.8887, + "step": 8390 + }, + { + "epoch": 0.22, + "learning_rate": 1.990900773378299e-06, + "loss": 0.8438, + "step": 8391 + }, + { + "epoch": 0.22, + "learning_rate": 1.990897048710322e-06, + "loss": 0.9238, + "step": 8392 + }, + { + "epoch": 0.22, + "learning_rate": 1.9908933232836606e-06, + "loss": 0.8594, + "step": 8393 + }, + { + "epoch": 0.22, + "learning_rate": 1.9908895970983174e-06, + "loss": 0.8213, + "step": 8394 + }, + { + "epoch": 0.22, + "learning_rate": 1.990885870154296e-06, + "loss": 0.9873, + "step": 8395 + }, + { + "epoch": 0.22, + "learning_rate": 1.9908821424515987e-06, + "loss": 0.9688, + "step": 8396 + }, + { + "epoch": 0.22, + "learning_rate": 1.9908784139902287e-06, + "loss": 0.8169, + "step": 8397 + }, + { + "epoch": 0.22, + "learning_rate": 1.9908746847701884e-06, + "loss": 0.6599, + "step": 8398 + }, + { + "epoch": 0.22, + "learning_rate": 1.990870954791481e-06, + "loss": 0.9023, + "step": 8399 + }, + { + "epoch": 0.22, + "learning_rate": 1.9908672240541093e-06, + "loss": 1.1543, + "step": 8400 + }, + { + "epoch": 0.22, + "learning_rate": 1.990863492558076e-06, + "loss": 0.7109, + "step": 8401 + }, + { + "epoch": 0.22, + "learning_rate": 1.990859760303384e-06, + "loss": 0.8467, + "step": 8402 + }, + { + "epoch": 0.22, + "learning_rate": 1.990856027290037e-06, + "loss": 0.8965, + "step": 8403 + }, + { + "epoch": 0.22, + "learning_rate": 1.9908522935180364e-06, + "loss": 0.8926, + "step": 8404 + }, + { + "epoch": 0.22, + "learning_rate": 1.9908485589873857e-06, + "loss": 0.6917, + "step": 8405 + }, + { + "epoch": 0.22, + "learning_rate": 1.990844823698088e-06, + "loss": 0.9473, + "step": 8406 + }, + { + "epoch": 0.22, + "learning_rate": 1.990841087650146e-06, + "loss": 1.0254, + "step": 8407 + }, + { + "epoch": 0.22, + "learning_rate": 1.9908373508435625e-06, + "loss": 0.9873, + "step": 8408 + }, + { + "epoch": 0.22, + "learning_rate": 1.990833613278341e-06, + "loss": 0.9238, + "step": 8409 + }, + { + "epoch": 0.22, + "learning_rate": 1.9908298749544827e-06, + "loss": 0.9014, + "step": 8410 + }, + { + "epoch": 0.22, + "learning_rate": 1.990826135871992e-06, + "loss": 1.0947, + "step": 8411 + }, + { + "epoch": 0.22, + "learning_rate": 1.9908223960308714e-06, + "loss": 1.1416, + "step": 8412 + }, + { + "epoch": 0.22, + "learning_rate": 1.9908186554311233e-06, + "loss": 0.7837, + "step": 8413 + }, + { + "epoch": 0.22, + "learning_rate": 1.9908149140727514e-06, + "loss": 0.9492, + "step": 8414 + }, + { + "epoch": 0.22, + "learning_rate": 1.9908111719557577e-06, + "loss": 0.8496, + "step": 8415 + }, + { + "epoch": 0.22, + "learning_rate": 1.9908074290801456e-06, + "loss": 0.9541, + "step": 8416 + }, + { + "epoch": 0.22, + "learning_rate": 1.990803685445918e-06, + "loss": 0.9141, + "step": 8417 + }, + { + "epoch": 0.22, + "learning_rate": 1.9907999410530774e-06, + "loss": 0.9648, + "step": 8418 + }, + { + "epoch": 0.22, + "learning_rate": 1.9907961959016267e-06, + "loss": 0.7979, + "step": 8419 + }, + { + "epoch": 0.22, + "learning_rate": 1.9907924499915695e-06, + "loss": 1.0195, + "step": 8420 + }, + { + "epoch": 0.22, + "learning_rate": 1.9907887033229074e-06, + "loss": 0.8604, + "step": 8421 + }, + { + "epoch": 0.22, + "learning_rate": 1.9907849558956444e-06, + "loss": 0.8301, + "step": 8422 + }, + { + "epoch": 0.22, + "learning_rate": 1.9907812077097825e-06, + "loss": 0.9092, + "step": 8423 + }, + { + "epoch": 0.22, + "learning_rate": 1.990777458765325e-06, + "loss": 0.7646, + "step": 8424 + }, + { + "epoch": 0.22, + "learning_rate": 1.990773709062275e-06, + "loss": 1.043, + "step": 8425 + }, + { + "epoch": 0.22, + "learning_rate": 1.9907699586006354e-06, + "loss": 0.8135, + "step": 8426 + }, + { + "epoch": 0.22, + "learning_rate": 1.990766207380408e-06, + "loss": 0.9941, + "step": 8427 + }, + { + "epoch": 0.22, + "learning_rate": 1.9907624554015973e-06, + "loss": 0.9189, + "step": 8428 + }, + { + "epoch": 0.22, + "learning_rate": 1.990758702664205e-06, + "loss": 1.0596, + "step": 8429 + }, + { + "epoch": 0.22, + "learning_rate": 1.990754949168234e-06, + "loss": 0.9355, + "step": 8430 + }, + { + "epoch": 0.22, + "learning_rate": 1.9907511949136884e-06, + "loss": 0.8062, + "step": 8431 + }, + { + "epoch": 0.22, + "learning_rate": 1.990747439900569e-06, + "loss": 1.0557, + "step": 8432 + }, + { + "epoch": 0.22, + "learning_rate": 1.9907436841288806e-06, + "loss": 1.0801, + "step": 8433 + }, + { + "epoch": 0.22, + "learning_rate": 1.990739927598625e-06, + "loss": 1.1729, + "step": 8434 + }, + { + "epoch": 0.22, + "learning_rate": 1.9907361703098057e-06, + "loss": 0.8057, + "step": 8435 + }, + { + "epoch": 0.22, + "learning_rate": 1.990732412262425e-06, + "loss": 0.8633, + "step": 8436 + }, + { + "epoch": 0.22, + "learning_rate": 1.990728653456486e-06, + "loss": 0.7568, + "step": 8437 + }, + { + "epoch": 0.22, + "learning_rate": 1.990724893891992e-06, + "loss": 0.8564, + "step": 8438 + }, + { + "epoch": 0.22, + "learning_rate": 1.990721133568945e-06, + "loss": 1.0234, + "step": 8439 + }, + { + "epoch": 0.22, + "learning_rate": 1.9907173724873486e-06, + "loss": 0.8613, + "step": 8440 + }, + { + "epoch": 0.22, + "learning_rate": 1.9907136106472055e-06, + "loss": 0.9209, + "step": 8441 + }, + { + "epoch": 0.22, + "learning_rate": 1.990709848048519e-06, + "loss": 0.8242, + "step": 8442 + }, + { + "epoch": 0.22, + "learning_rate": 1.9907060846912906e-06, + "loss": 1.0371, + "step": 8443 + }, + { + "epoch": 0.22, + "learning_rate": 1.990702320575525e-06, + "loss": 0.917, + "step": 8444 + }, + { + "epoch": 0.22, + "learning_rate": 1.9906985557012236e-06, + "loss": 0.8525, + "step": 8445 + }, + { + "epoch": 0.22, + "learning_rate": 1.99069479006839e-06, + "loss": 0.9746, + "step": 8446 + }, + { + "epoch": 0.22, + "learning_rate": 1.990691023677027e-06, + "loss": 1.0508, + "step": 8447 + }, + { + "epoch": 0.22, + "learning_rate": 1.990687256527137e-06, + "loss": 0.8477, + "step": 8448 + }, + { + "epoch": 0.22, + "learning_rate": 1.990683488618724e-06, + "loss": 0.8115, + "step": 8449 + }, + { + "epoch": 0.22, + "learning_rate": 1.99067971995179e-06, + "loss": 0.7705, + "step": 8450 + }, + { + "epoch": 0.22, + "learning_rate": 1.990675950526338e-06, + "loss": 0.8799, + "step": 8451 + }, + { + "epoch": 0.22, + "learning_rate": 1.990672180342371e-06, + "loss": 0.9922, + "step": 8452 + }, + { + "epoch": 0.22, + "learning_rate": 1.990668409399892e-06, + "loss": 0.918, + "step": 8453 + }, + { + "epoch": 0.22, + "learning_rate": 1.9906646376989036e-06, + "loss": 0.8252, + "step": 8454 + }, + { + "epoch": 0.22, + "learning_rate": 1.990660865239409e-06, + "loss": 0.9541, + "step": 8455 + }, + { + "epoch": 0.22, + "learning_rate": 1.9906570920214105e-06, + "loss": 0.8564, + "step": 8456 + }, + { + "epoch": 0.22, + "learning_rate": 1.9906533180449115e-06, + "loss": 0.7817, + "step": 8457 + }, + { + "epoch": 0.22, + "learning_rate": 1.9906495433099153e-06, + "loss": 0.9453, + "step": 8458 + }, + { + "epoch": 0.22, + "learning_rate": 1.990645767816424e-06, + "loss": 1.0771, + "step": 8459 + }, + { + "epoch": 0.22, + "learning_rate": 1.9906419915644407e-06, + "loss": 0.8174, + "step": 8460 + }, + { + "epoch": 0.22, + "learning_rate": 1.9906382145539684e-06, + "loss": 0.9561, + "step": 8461 + }, + { + "epoch": 0.22, + "learning_rate": 1.9906344367850103e-06, + "loss": 0.8369, + "step": 8462 + }, + { + "epoch": 0.22, + "learning_rate": 1.990630658257569e-06, + "loss": 0.6333, + "step": 8463 + }, + { + "epoch": 0.22, + "learning_rate": 1.9906268789716467e-06, + "loss": 1.0645, + "step": 8464 + }, + { + "epoch": 0.22, + "learning_rate": 1.990623098927247e-06, + "loss": 0.8867, + "step": 8465 + }, + { + "epoch": 0.22, + "learning_rate": 1.9906193181243733e-06, + "loss": 0.8779, + "step": 8466 + }, + { + "epoch": 0.22, + "learning_rate": 1.9906155365630275e-06, + "loss": 1.0195, + "step": 8467 + }, + { + "epoch": 0.22, + "learning_rate": 1.9906117542432134e-06, + "loss": 0.7412, + "step": 8468 + }, + { + "epoch": 0.22, + "learning_rate": 1.9906079711649333e-06, + "loss": 0.9463, + "step": 8469 + }, + { + "epoch": 0.22, + "learning_rate": 1.99060418732819e-06, + "loss": 0.9932, + "step": 8470 + }, + { + "epoch": 0.22, + "learning_rate": 1.9906004027329868e-06, + "loss": 0.9189, + "step": 8471 + }, + { + "epoch": 0.22, + "learning_rate": 1.990596617379326e-06, + "loss": 0.9375, + "step": 8472 + }, + { + "epoch": 0.22, + "learning_rate": 1.9905928312672114e-06, + "loss": 1.0, + "step": 8473 + }, + { + "epoch": 0.22, + "learning_rate": 1.9905890443966453e-06, + "loss": 1.0791, + "step": 8474 + }, + { + "epoch": 0.22, + "learning_rate": 1.9905852567676303e-06, + "loss": 0.7695, + "step": 8475 + }, + { + "epoch": 0.22, + "learning_rate": 1.99058146838017e-06, + "loss": 0.9658, + "step": 8476 + }, + { + "epoch": 0.22, + "learning_rate": 1.9905776792342674e-06, + "loss": 1.0771, + "step": 8477 + }, + { + "epoch": 0.22, + "learning_rate": 1.9905738893299245e-06, + "loss": 0.999, + "step": 8478 + }, + { + "epoch": 0.22, + "learning_rate": 1.9905700986671454e-06, + "loss": 0.8887, + "step": 8479 + }, + { + "epoch": 0.22, + "learning_rate": 1.9905663072459317e-06, + "loss": 0.9668, + "step": 8480 + }, + { + "epoch": 0.22, + "learning_rate": 1.9905625150662872e-06, + "loss": 1.1006, + "step": 8481 + }, + { + "epoch": 0.22, + "learning_rate": 1.990558722128214e-06, + "loss": 0.9697, + "step": 8482 + }, + { + "epoch": 0.22, + "learning_rate": 1.990554928431716e-06, + "loss": 1.1328, + "step": 8483 + }, + { + "epoch": 0.22, + "learning_rate": 1.9905511339767956e-06, + "loss": 0.6729, + "step": 8484 + }, + { + "epoch": 0.22, + "learning_rate": 1.990547338763456e-06, + "loss": 0.9736, + "step": 8485 + }, + { + "epoch": 0.22, + "learning_rate": 1.9905435427916997e-06, + "loss": 0.7842, + "step": 8486 + }, + { + "epoch": 0.22, + "learning_rate": 1.9905397460615295e-06, + "loss": 0.8926, + "step": 8487 + }, + { + "epoch": 0.22, + "learning_rate": 1.990535948572949e-06, + "loss": 1.0967, + "step": 8488 + }, + { + "epoch": 0.22, + "learning_rate": 1.99053215032596e-06, + "loss": 1.0029, + "step": 8489 + }, + { + "epoch": 0.22, + "learning_rate": 1.9905283513205667e-06, + "loss": 1.0098, + "step": 8490 + }, + { + "epoch": 0.22, + "learning_rate": 1.990524551556771e-06, + "loss": 1.1494, + "step": 8491 + }, + { + "epoch": 0.22, + "learning_rate": 1.990520751034576e-06, + "loss": 1.0664, + "step": 8492 + }, + { + "epoch": 0.22, + "learning_rate": 1.9905169497539858e-06, + "loss": 0.8096, + "step": 8493 + }, + { + "epoch": 0.22, + "learning_rate": 1.9905131477150015e-06, + "loss": 0.8945, + "step": 8494 + }, + { + "epoch": 0.22, + "learning_rate": 1.990509344917627e-06, + "loss": 0.9004, + "step": 8495 + }, + { + "epoch": 0.22, + "learning_rate": 1.990505541361865e-06, + "loss": 1.0576, + "step": 8496 + }, + { + "epoch": 0.22, + "learning_rate": 1.9905017370477185e-06, + "loss": 1.1602, + "step": 8497 + }, + { + "epoch": 0.22, + "learning_rate": 1.9904979319751904e-06, + "loss": 0.8447, + "step": 8498 + }, + { + "epoch": 0.22, + "learning_rate": 1.9904941261442835e-06, + "loss": 0.9028, + "step": 8499 + }, + { + "epoch": 0.22, + "learning_rate": 1.990490319555001e-06, + "loss": 1.2139, + "step": 8500 + }, + { + "epoch": 0.22, + "learning_rate": 1.9904865122073452e-06, + "loss": 0.7651, + "step": 8501 + }, + { + "epoch": 0.22, + "learning_rate": 1.9904827041013197e-06, + "loss": 0.8555, + "step": 8502 + }, + { + "epoch": 0.22, + "learning_rate": 1.990478895236927e-06, + "loss": 0.9424, + "step": 8503 + }, + { + "epoch": 0.22, + "learning_rate": 1.9904750856141704e-06, + "loss": 0.958, + "step": 8504 + }, + { + "epoch": 0.22, + "learning_rate": 1.990471275233052e-06, + "loss": 0.9785, + "step": 8505 + }, + { + "epoch": 0.22, + "learning_rate": 1.990467464093576e-06, + "loss": 1.0566, + "step": 8506 + }, + { + "epoch": 0.22, + "learning_rate": 1.9904636521957443e-06, + "loss": 0.9102, + "step": 8507 + }, + { + "epoch": 0.22, + "learning_rate": 1.99045983953956e-06, + "loss": 1.0137, + "step": 8508 + }, + { + "epoch": 0.22, + "learning_rate": 1.9904560261250265e-06, + "loss": 0.8071, + "step": 8509 + }, + { + "epoch": 0.22, + "learning_rate": 1.9904522119521457e-06, + "loss": 0.6309, + "step": 8510 + }, + { + "epoch": 0.22, + "learning_rate": 1.990448397020922e-06, + "loss": 0.8379, + "step": 8511 + }, + { + "epoch": 0.22, + "learning_rate": 1.990444581331357e-06, + "loss": 0.748, + "step": 8512 + }, + { + "epoch": 0.22, + "learning_rate": 1.990440764883454e-06, + "loss": 0.957, + "step": 8513 + }, + { + "epoch": 0.22, + "learning_rate": 1.9904369476772163e-06, + "loss": 0.9629, + "step": 8514 + }, + { + "epoch": 0.22, + "learning_rate": 1.9904331297126468e-06, + "loss": 0.9766, + "step": 8515 + }, + { + "epoch": 0.22, + "learning_rate": 1.9904293109897477e-06, + "loss": 1.1738, + "step": 8516 + }, + { + "epoch": 0.22, + "learning_rate": 1.990425491508523e-06, + "loss": 0.8662, + "step": 8517 + }, + { + "epoch": 0.22, + "learning_rate": 1.990421671268975e-06, + "loss": 0.7451, + "step": 8518 + }, + { + "epoch": 0.22, + "learning_rate": 1.9904178502711062e-06, + "loss": 0.9111, + "step": 8519 + }, + { + "epoch": 0.22, + "learning_rate": 1.99041402851492e-06, + "loss": 0.9053, + "step": 8520 + }, + { + "epoch": 0.22, + "learning_rate": 1.9904102060004197e-06, + "loss": 0.6328, + "step": 8521 + }, + { + "epoch": 0.22, + "learning_rate": 1.9904063827276073e-06, + "loss": 1.0049, + "step": 8522 + }, + { + "epoch": 0.22, + "learning_rate": 1.9904025586964866e-06, + "loss": 0.9785, + "step": 8523 + }, + { + "epoch": 0.22, + "learning_rate": 1.9903987339070605e-06, + "loss": 1.0508, + "step": 8524 + }, + { + "epoch": 0.22, + "learning_rate": 1.9903949083593315e-06, + "loss": 0.9033, + "step": 8525 + }, + { + "epoch": 0.22, + "learning_rate": 1.990391082053302e-06, + "loss": 0.7344, + "step": 8526 + }, + { + "epoch": 0.22, + "learning_rate": 1.9903872549889764e-06, + "loss": 0.6831, + "step": 8527 + }, + { + "epoch": 0.22, + "learning_rate": 1.9903834271663566e-06, + "loss": 0.8682, + "step": 8528 + }, + { + "epoch": 0.22, + "learning_rate": 1.9903795985854454e-06, + "loss": 0.8418, + "step": 8529 + }, + { + "epoch": 0.22, + "learning_rate": 1.9903757692462466e-06, + "loss": 0.7979, + "step": 8530 + }, + { + "epoch": 0.22, + "learning_rate": 1.9903719391487623e-06, + "loss": 0.9199, + "step": 8531 + }, + { + "epoch": 0.22, + "learning_rate": 1.990368108292996e-06, + "loss": 1.0547, + "step": 8532 + }, + { + "epoch": 0.22, + "learning_rate": 1.99036427667895e-06, + "loss": 1.1504, + "step": 8533 + }, + { + "epoch": 0.22, + "learning_rate": 1.9903604443066277e-06, + "loss": 1.0322, + "step": 8534 + }, + { + "epoch": 0.22, + "learning_rate": 1.990356611176032e-06, + "loss": 0.8232, + "step": 8535 + }, + { + "epoch": 0.22, + "learning_rate": 1.990352777287166e-06, + "loss": 0.9795, + "step": 8536 + }, + { + "epoch": 0.22, + "learning_rate": 1.990348942640032e-06, + "loss": 1.0283, + "step": 8537 + }, + { + "epoch": 0.22, + "learning_rate": 1.9903451072346337e-06, + "loss": 0.7808, + "step": 8538 + }, + { + "epoch": 0.22, + "learning_rate": 1.9903412710709734e-06, + "loss": 1.0195, + "step": 8539 + }, + { + "epoch": 0.22, + "learning_rate": 1.990337434149055e-06, + "loss": 0.9321, + "step": 8540 + }, + { + "epoch": 0.22, + "learning_rate": 1.99033359646888e-06, + "loss": 0.9629, + "step": 8541 + }, + { + "epoch": 0.22, + "learning_rate": 1.990329758030452e-06, + "loss": 0.8203, + "step": 8542 + }, + { + "epoch": 0.22, + "learning_rate": 1.990325918833775e-06, + "loss": 0.999, + "step": 8543 + }, + { + "epoch": 0.22, + "learning_rate": 1.99032207887885e-06, + "loss": 0.9727, + "step": 8544 + }, + { + "epoch": 0.22, + "learning_rate": 1.9903182381656815e-06, + "loss": 0.8066, + "step": 8545 + }, + { + "epoch": 0.22, + "learning_rate": 1.9903143966942713e-06, + "loss": 0.7305, + "step": 8546 + }, + { + "epoch": 0.22, + "learning_rate": 1.9903105544646236e-06, + "loss": 0.8906, + "step": 8547 + }, + { + "epoch": 0.22, + "learning_rate": 1.99030671147674e-06, + "loss": 0.7673, + "step": 8548 + }, + { + "epoch": 0.22, + "learning_rate": 1.9903028677306245e-06, + "loss": 0.7578, + "step": 8549 + }, + { + "epoch": 0.22, + "learning_rate": 1.9902990232262795e-06, + "loss": 0.7344, + "step": 8550 + }, + { + "epoch": 0.22, + "learning_rate": 1.9902951779637084e-06, + "loss": 0.6953, + "step": 8551 + }, + { + "epoch": 0.22, + "learning_rate": 1.9902913319429135e-06, + "loss": 0.8994, + "step": 8552 + }, + { + "epoch": 0.22, + "learning_rate": 1.990287485163898e-06, + "loss": 1.042, + "step": 8553 + }, + { + "epoch": 0.22, + "learning_rate": 1.990283637626665e-06, + "loss": 0.8516, + "step": 8554 + }, + { + "epoch": 0.22, + "learning_rate": 1.9902797893312175e-06, + "loss": 0.8154, + "step": 8555 + }, + { + "epoch": 0.22, + "learning_rate": 1.990275940277558e-06, + "loss": 0.9492, + "step": 8556 + }, + { + "epoch": 0.22, + "learning_rate": 1.9902720904656894e-06, + "loss": 0.8186, + "step": 8557 + }, + { + "epoch": 0.22, + "learning_rate": 1.9902682398956157e-06, + "loss": 0.9404, + "step": 8558 + }, + { + "epoch": 0.22, + "learning_rate": 1.990264388567339e-06, + "loss": 0.9751, + "step": 8559 + }, + { + "epoch": 0.22, + "learning_rate": 1.9902605364808625e-06, + "loss": 0.811, + "step": 8560 + }, + { + "epoch": 0.22, + "learning_rate": 1.9902566836361886e-06, + "loss": 0.8877, + "step": 8561 + }, + { + "epoch": 0.22, + "learning_rate": 1.990252830033321e-06, + "loss": 0.8721, + "step": 8562 + }, + { + "epoch": 0.22, + "learning_rate": 1.9902489756722624e-06, + "loss": 1.0312, + "step": 8563 + }, + { + "epoch": 0.22, + "learning_rate": 1.9902451205530153e-06, + "loss": 1.1191, + "step": 8564 + }, + { + "epoch": 0.22, + "learning_rate": 1.9902412646755835e-06, + "loss": 0.9717, + "step": 8565 + }, + { + "epoch": 0.22, + "learning_rate": 1.990237408039969e-06, + "loss": 1.0127, + "step": 8566 + }, + { + "epoch": 0.22, + "learning_rate": 1.990233550646176e-06, + "loss": 1.2324, + "step": 8567 + }, + { + "epoch": 0.22, + "learning_rate": 1.990229692494206e-06, + "loss": 0.8369, + "step": 8568 + }, + { + "epoch": 0.22, + "learning_rate": 1.990225833584063e-06, + "loss": 0.8506, + "step": 8569 + }, + { + "epoch": 0.22, + "learning_rate": 1.9902219739157493e-06, + "loss": 0.9746, + "step": 8570 + }, + { + "epoch": 0.22, + "learning_rate": 1.9902181134892687e-06, + "loss": 1.1689, + "step": 8571 + }, + { + "epoch": 0.22, + "learning_rate": 1.990214252304623e-06, + "loss": 0.8501, + "step": 8572 + }, + { + "epoch": 0.22, + "learning_rate": 1.9902103903618163e-06, + "loss": 0.7725, + "step": 8573 + }, + { + "epoch": 0.22, + "learning_rate": 1.990206527660851e-06, + "loss": 1.0879, + "step": 8574 + }, + { + "epoch": 0.22, + "learning_rate": 1.99020266420173e-06, + "loss": 1.0547, + "step": 8575 + }, + { + "epoch": 0.22, + "learning_rate": 1.9901987999844564e-06, + "loss": 0.8535, + "step": 8576 + }, + { + "epoch": 0.22, + "learning_rate": 1.9901949350090327e-06, + "loss": 1.0713, + "step": 8577 + }, + { + "epoch": 0.22, + "learning_rate": 1.9901910692754624e-06, + "loss": 0.9062, + "step": 8578 + }, + { + "epoch": 0.22, + "learning_rate": 1.9901872027837485e-06, + "loss": 0.7256, + "step": 8579 + }, + { + "epoch": 0.22, + "learning_rate": 1.990183335533894e-06, + "loss": 0.9678, + "step": 8580 + }, + { + "epoch": 0.22, + "learning_rate": 1.9901794675259013e-06, + "loss": 0.8672, + "step": 8581 + }, + { + "epoch": 0.22, + "learning_rate": 1.990175598759774e-06, + "loss": 0.9526, + "step": 8582 + }, + { + "epoch": 0.22, + "learning_rate": 1.990171729235515e-06, + "loss": 0.9189, + "step": 8583 + }, + { + "epoch": 0.22, + "learning_rate": 1.9901678589531265e-06, + "loss": 0.9722, + "step": 8584 + }, + { + "epoch": 0.22, + "learning_rate": 1.990163987912612e-06, + "loss": 1.1699, + "step": 8585 + }, + { + "epoch": 0.22, + "learning_rate": 1.9901601161139744e-06, + "loss": 0.8311, + "step": 8586 + }, + { + "epoch": 0.22, + "learning_rate": 1.990156243557217e-06, + "loss": 0.9736, + "step": 8587 + }, + { + "epoch": 0.22, + "learning_rate": 1.9901523702423423e-06, + "loss": 1.0195, + "step": 8588 + }, + { + "epoch": 0.22, + "learning_rate": 1.9901484961693536e-06, + "loss": 0.7905, + "step": 8589 + }, + { + "epoch": 0.22, + "learning_rate": 1.990144621338254e-06, + "loss": 0.9961, + "step": 8590 + }, + { + "epoch": 0.22, + "learning_rate": 1.9901407457490457e-06, + "loss": 0.999, + "step": 8591 + }, + { + "epoch": 0.22, + "learning_rate": 1.9901368694017325e-06, + "loss": 0.8535, + "step": 8592 + }, + { + "epoch": 0.22, + "learning_rate": 1.9901329922963167e-06, + "loss": 0.7939, + "step": 8593 + }, + { + "epoch": 0.22, + "learning_rate": 1.990129114432802e-06, + "loss": 0.8701, + "step": 8594 + }, + { + "epoch": 0.22, + "learning_rate": 1.9901252358111907e-06, + "loss": 0.9639, + "step": 8595 + }, + { + "epoch": 0.22, + "learning_rate": 1.990121356431486e-06, + "loss": 0.9404, + "step": 8596 + }, + { + "epoch": 0.22, + "learning_rate": 1.990117476293691e-06, + "loss": 0.9062, + "step": 8597 + }, + { + "epoch": 0.22, + "learning_rate": 1.9901135953978087e-06, + "loss": 0.8711, + "step": 8598 + }, + { + "epoch": 0.22, + "learning_rate": 1.9901097137438417e-06, + "loss": 0.9697, + "step": 8599 + }, + { + "epoch": 0.22, + "learning_rate": 1.9901058313317933e-06, + "loss": 0.8042, + "step": 8600 + }, + { + "epoch": 0.22, + "learning_rate": 1.9901019481616665e-06, + "loss": 0.9404, + "step": 8601 + }, + { + "epoch": 0.22, + "learning_rate": 1.990098064233464e-06, + "loss": 0.9795, + "step": 8602 + }, + { + "epoch": 0.22, + "learning_rate": 1.990094179547189e-06, + "loss": 0.9785, + "step": 8603 + }, + { + "epoch": 0.22, + "learning_rate": 1.9900902941028446e-06, + "loss": 0.8984, + "step": 8604 + }, + { + "epoch": 0.22, + "learning_rate": 1.990086407900433e-06, + "loss": 0.6182, + "step": 8605 + }, + { + "epoch": 0.22, + "learning_rate": 1.9900825209399583e-06, + "loss": 0.8569, + "step": 8606 + }, + { + "epoch": 0.22, + "learning_rate": 1.990078633221423e-06, + "loss": 0.8691, + "step": 8607 + }, + { + "epoch": 0.22, + "learning_rate": 1.99007474474483e-06, + "loss": 0.6846, + "step": 8608 + }, + { + "epoch": 0.22, + "learning_rate": 1.990070855510182e-06, + "loss": 0.9023, + "step": 8609 + }, + { + "epoch": 0.22, + "learning_rate": 1.9900669655174826e-06, + "loss": 0.9922, + "step": 8610 + }, + { + "epoch": 0.22, + "learning_rate": 1.990063074766734e-06, + "loss": 0.957, + "step": 8611 + }, + { + "epoch": 0.22, + "learning_rate": 1.99005918325794e-06, + "loss": 0.9873, + "step": 8612 + }, + { + "epoch": 0.22, + "learning_rate": 1.990055290991103e-06, + "loss": 0.9072, + "step": 8613 + }, + { + "epoch": 0.22, + "learning_rate": 1.990051397966226e-06, + "loss": 1.0156, + "step": 8614 + }, + { + "epoch": 0.22, + "learning_rate": 1.9900475041833127e-06, + "loss": 0.9541, + "step": 8615 + }, + { + "epoch": 0.22, + "learning_rate": 1.9900436096423653e-06, + "loss": 0.9473, + "step": 8616 + }, + { + "epoch": 0.22, + "learning_rate": 1.990039714343387e-06, + "loss": 0.9292, + "step": 8617 + }, + { + "epoch": 0.22, + "learning_rate": 1.9900358182863807e-06, + "loss": 1.1035, + "step": 8618 + }, + { + "epoch": 0.22, + "learning_rate": 1.9900319214713498e-06, + "loss": 0.635, + "step": 8619 + }, + { + "epoch": 0.22, + "learning_rate": 1.9900280238982968e-06, + "loss": 0.9297, + "step": 8620 + }, + { + "epoch": 0.22, + "learning_rate": 1.990024125567225e-06, + "loss": 0.8818, + "step": 8621 + }, + { + "epoch": 0.22, + "learning_rate": 1.990020226478137e-06, + "loss": 0.9629, + "step": 8622 + }, + { + "epoch": 0.22, + "learning_rate": 1.9900163266310363e-06, + "loss": 1.0098, + "step": 8623 + }, + { + "epoch": 0.22, + "learning_rate": 1.990012426025925e-06, + "loss": 0.7712, + "step": 8624 + }, + { + "epoch": 0.22, + "learning_rate": 1.9900085246628075e-06, + "loss": 0.8457, + "step": 8625 + }, + { + "epoch": 0.22, + "learning_rate": 1.9900046225416857e-06, + "loss": 0.9316, + "step": 8626 + }, + { + "epoch": 0.22, + "learning_rate": 1.990000719662563e-06, + "loss": 0.9883, + "step": 8627 + }, + { + "epoch": 0.22, + "learning_rate": 1.989996816025442e-06, + "loss": 0.833, + "step": 8628 + }, + { + "epoch": 0.22, + "learning_rate": 1.989992911630326e-06, + "loss": 0.9023, + "step": 8629 + }, + { + "epoch": 0.22, + "learning_rate": 1.989989006477218e-06, + "loss": 0.5591, + "step": 8630 + }, + { + "epoch": 0.22, + "learning_rate": 1.989985100566121e-06, + "loss": 0.9146, + "step": 8631 + }, + { + "epoch": 0.22, + "learning_rate": 1.9899811938970382e-06, + "loss": 0.9463, + "step": 8632 + }, + { + "epoch": 0.22, + "learning_rate": 1.9899772864699716e-06, + "loss": 0.9062, + "step": 8633 + }, + { + "epoch": 0.22, + "learning_rate": 1.9899733782849256e-06, + "loss": 0.833, + "step": 8634 + }, + { + "epoch": 0.22, + "learning_rate": 1.9899694693419024e-06, + "loss": 1.0137, + "step": 8635 + }, + { + "epoch": 0.22, + "learning_rate": 1.989965559640905e-06, + "loss": 0.875, + "step": 8636 + }, + { + "epoch": 0.22, + "learning_rate": 1.989961649181936e-06, + "loss": 0.751, + "step": 8637 + }, + { + "epoch": 0.22, + "learning_rate": 1.9899577379649996e-06, + "loss": 0.9111, + "step": 8638 + }, + { + "epoch": 0.22, + "learning_rate": 1.9899538259900978e-06, + "loss": 1.1406, + "step": 8639 + }, + { + "epoch": 0.22, + "learning_rate": 1.989949913257234e-06, + "loss": 0.6367, + "step": 8640 + }, + { + "epoch": 0.22, + "learning_rate": 1.989945999766411e-06, + "loss": 0.8955, + "step": 8641 + }, + { + "epoch": 0.22, + "learning_rate": 1.9899420855176315e-06, + "loss": 1.0576, + "step": 8642 + }, + { + "epoch": 0.22, + "learning_rate": 1.9899381705108993e-06, + "loss": 0.9355, + "step": 8643 + }, + { + "epoch": 0.22, + "learning_rate": 1.9899342547462167e-06, + "loss": 0.9502, + "step": 8644 + }, + { + "epoch": 0.22, + "learning_rate": 1.9899303382235874e-06, + "loss": 0.6582, + "step": 8645 + }, + { + "epoch": 0.22, + "learning_rate": 1.9899264209430135e-06, + "loss": 0.9624, + "step": 8646 + }, + { + "epoch": 0.22, + "learning_rate": 1.989922502904499e-06, + "loss": 0.8789, + "step": 8647 + }, + { + "epoch": 0.22, + "learning_rate": 1.9899185841080457e-06, + "loss": 0.918, + "step": 8648 + }, + { + "epoch": 0.22, + "learning_rate": 1.9899146645536576e-06, + "loss": 1.1162, + "step": 8649 + }, + { + "epoch": 0.22, + "learning_rate": 1.9899107442413373e-06, + "loss": 0.9619, + "step": 8650 + }, + { + "epoch": 0.22, + "learning_rate": 1.9899068231710876e-06, + "loss": 0.8145, + "step": 8651 + }, + { + "epoch": 0.22, + "learning_rate": 1.989902901342912e-06, + "loss": 0.8467, + "step": 8652 + }, + { + "epoch": 0.22, + "learning_rate": 1.9898989787568135e-06, + "loss": 0.7344, + "step": 8653 + }, + { + "epoch": 0.22, + "learning_rate": 1.9898950554127945e-06, + "loss": 0.8516, + "step": 8654 + }, + { + "epoch": 0.22, + "learning_rate": 1.9898911313108585e-06, + "loss": 0.9326, + "step": 8655 + }, + { + "epoch": 0.22, + "learning_rate": 1.989887206451009e-06, + "loss": 0.7969, + "step": 8656 + }, + { + "epoch": 0.22, + "learning_rate": 1.989883280833247e-06, + "loss": 0.7949, + "step": 8657 + }, + { + "epoch": 0.22, + "learning_rate": 1.989879354457578e-06, + "loss": 0.8359, + "step": 8658 + }, + { + "epoch": 0.22, + "learning_rate": 1.9898754273240033e-06, + "loss": 0.9551, + "step": 8659 + }, + { + "epoch": 0.22, + "learning_rate": 1.989871499432527e-06, + "loss": 0.9697, + "step": 8660 + }, + { + "epoch": 0.22, + "learning_rate": 1.9898675707831515e-06, + "loss": 1.0137, + "step": 8661 + }, + { + "epoch": 0.22, + "learning_rate": 1.9898636413758797e-06, + "loss": 1.0, + "step": 8662 + }, + { + "epoch": 0.22, + "learning_rate": 1.9898597112107145e-06, + "loss": 0.8857, + "step": 8663 + }, + { + "epoch": 0.22, + "learning_rate": 1.98985578028766e-06, + "loss": 0.8662, + "step": 8664 + }, + { + "epoch": 0.22, + "learning_rate": 1.989851848606718e-06, + "loss": 0.8291, + "step": 8665 + }, + { + "epoch": 0.22, + "learning_rate": 1.9898479161678923e-06, + "loss": 0.9043, + "step": 8666 + }, + { + "epoch": 0.22, + "learning_rate": 1.989843982971185e-06, + "loss": 0.79, + "step": 8667 + }, + { + "epoch": 0.22, + "learning_rate": 1.9898400490166e-06, + "loss": 0.9385, + "step": 8668 + }, + { + "epoch": 0.22, + "learning_rate": 1.9898361143041402e-06, + "loss": 0.834, + "step": 8669 + }, + { + "epoch": 0.22, + "learning_rate": 1.989832178833808e-06, + "loss": 0.9233, + "step": 8670 + }, + { + "epoch": 0.22, + "learning_rate": 1.989828242605607e-06, + "loss": 1.1445, + "step": 8671 + }, + { + "epoch": 0.22, + "learning_rate": 1.98982430561954e-06, + "loss": 0.7607, + "step": 8672 + }, + { + "epoch": 0.22, + "learning_rate": 1.9898203678756104e-06, + "loss": 1.2188, + "step": 8673 + }, + { + "epoch": 0.22, + "learning_rate": 1.9898164293738204e-06, + "loss": 0.917, + "step": 8674 + }, + { + "epoch": 0.22, + "learning_rate": 1.9898124901141735e-06, + "loss": 0.9326, + "step": 8675 + }, + { + "epoch": 0.22, + "learning_rate": 1.9898085500966726e-06, + "loss": 0.8018, + "step": 8676 + }, + { + "epoch": 0.22, + "learning_rate": 1.989804609321321e-06, + "loss": 0.9346, + "step": 8677 + }, + { + "epoch": 0.22, + "learning_rate": 1.9898006677881218e-06, + "loss": 1.0918, + "step": 8678 + }, + { + "epoch": 0.22, + "learning_rate": 1.9897967254970773e-06, + "loss": 0.9131, + "step": 8679 + }, + { + "epoch": 0.22, + "learning_rate": 1.9897927824481912e-06, + "loss": 0.834, + "step": 8680 + }, + { + "epoch": 0.22, + "learning_rate": 1.989788838641466e-06, + "loss": 0.9844, + "step": 8681 + }, + { + "epoch": 0.22, + "learning_rate": 1.989784894076905e-06, + "loss": 0.999, + "step": 8682 + }, + { + "epoch": 0.22, + "learning_rate": 1.9897809487545115e-06, + "loss": 1.0146, + "step": 8683 + }, + { + "epoch": 0.22, + "learning_rate": 1.9897770026742884e-06, + "loss": 0.7725, + "step": 8684 + }, + { + "epoch": 0.22, + "learning_rate": 1.989773055836238e-06, + "loss": 1.1777, + "step": 8685 + }, + { + "epoch": 0.22, + "learning_rate": 1.9897691082403644e-06, + "loss": 0.8643, + "step": 8686 + }, + { + "epoch": 0.22, + "learning_rate": 1.9897651598866698e-06, + "loss": 0.8975, + "step": 8687 + }, + { + "epoch": 0.22, + "learning_rate": 1.9897612107751576e-06, + "loss": 0.9648, + "step": 8688 + }, + { + "epoch": 0.22, + "learning_rate": 1.989757260905831e-06, + "loss": 0.8867, + "step": 8689 + }, + { + "epoch": 0.22, + "learning_rate": 1.9897533102786923e-06, + "loss": 0.6387, + "step": 8690 + }, + { + "epoch": 0.22, + "learning_rate": 1.9897493588937454e-06, + "loss": 0.96, + "step": 8691 + }, + { + "epoch": 0.22, + "learning_rate": 1.989745406750993e-06, + "loss": 0.7822, + "step": 8692 + }, + { + "epoch": 0.22, + "learning_rate": 1.9897414538504377e-06, + "loss": 1.0244, + "step": 8693 + }, + { + "epoch": 0.22, + "learning_rate": 1.9897375001920828e-06, + "loss": 0.9453, + "step": 8694 + }, + { + "epoch": 0.22, + "learning_rate": 1.9897335457759315e-06, + "loss": 1.1924, + "step": 8695 + }, + { + "epoch": 0.22, + "learning_rate": 1.989729590601987e-06, + "loss": 0.8623, + "step": 8696 + }, + { + "epoch": 0.22, + "learning_rate": 1.989725634670252e-06, + "loss": 0.7881, + "step": 8697 + }, + { + "epoch": 0.22, + "learning_rate": 1.9897216779807294e-06, + "loss": 0.8853, + "step": 8698 + }, + { + "epoch": 0.22, + "learning_rate": 1.9897177205334225e-06, + "loss": 0.9521, + "step": 8699 + }, + { + "epoch": 0.22, + "learning_rate": 1.989713762328334e-06, + "loss": 1.0137, + "step": 8700 + }, + { + "epoch": 0.22, + "learning_rate": 1.989709803365468e-06, + "loss": 0.916, + "step": 8701 + }, + { + "epoch": 0.22, + "learning_rate": 1.9897058436448258e-06, + "loss": 0.8564, + "step": 8702 + }, + { + "epoch": 0.22, + "learning_rate": 1.989701883166412e-06, + "loss": 0.9365, + "step": 8703 + }, + { + "epoch": 0.22, + "learning_rate": 1.9896979219302287e-06, + "loss": 0.8281, + "step": 8704 + }, + { + "epoch": 0.22, + "learning_rate": 1.989693959936279e-06, + "loss": 1.2402, + "step": 8705 + }, + { + "epoch": 0.22, + "learning_rate": 1.989689997184566e-06, + "loss": 0.8711, + "step": 8706 + }, + { + "epoch": 0.22, + "learning_rate": 1.9896860336750936e-06, + "loss": 1.0254, + "step": 8707 + }, + { + "epoch": 0.22, + "learning_rate": 1.9896820694078636e-06, + "loss": 0.9268, + "step": 8708 + }, + { + "epoch": 0.22, + "learning_rate": 1.9896781043828796e-06, + "loss": 0.9346, + "step": 8709 + }, + { + "epoch": 0.22, + "learning_rate": 1.9896741386001446e-06, + "loss": 0.7163, + "step": 8710 + }, + { + "epoch": 0.22, + "learning_rate": 1.9896701720596616e-06, + "loss": 0.8359, + "step": 8711 + }, + { + "epoch": 0.22, + "learning_rate": 1.989666204761434e-06, + "loss": 0.8809, + "step": 8712 + }, + { + "epoch": 0.22, + "learning_rate": 1.989662236705464e-06, + "loss": 0.6641, + "step": 8713 + }, + { + "epoch": 0.22, + "learning_rate": 1.989658267891755e-06, + "loss": 1.0029, + "step": 8714 + }, + { + "epoch": 0.22, + "learning_rate": 1.989654298320311e-06, + "loss": 0.8232, + "step": 8715 + }, + { + "epoch": 0.22, + "learning_rate": 1.9896503279911337e-06, + "loss": 0.9141, + "step": 8716 + }, + { + "epoch": 0.22, + "learning_rate": 1.9896463569042267e-06, + "loss": 0.9648, + "step": 8717 + }, + { + "epoch": 0.22, + "learning_rate": 1.989642385059593e-06, + "loss": 1.0674, + "step": 8718 + }, + { + "epoch": 0.22, + "learning_rate": 1.9896384124572356e-06, + "loss": 0.8799, + "step": 8719 + }, + { + "epoch": 0.22, + "learning_rate": 1.9896344390971573e-06, + "loss": 1.0, + "step": 8720 + }, + { + "epoch": 0.22, + "learning_rate": 1.9896304649793615e-06, + "loss": 0.958, + "step": 8721 + }, + { + "epoch": 0.22, + "learning_rate": 1.9896264901038515e-06, + "loss": 0.9961, + "step": 8722 + }, + { + "epoch": 0.22, + "learning_rate": 1.98962251447063e-06, + "loss": 0.9395, + "step": 8723 + }, + { + "epoch": 0.22, + "learning_rate": 1.9896185380797e-06, + "loss": 0.9814, + "step": 8724 + }, + { + "epoch": 0.22, + "learning_rate": 1.989614560931064e-06, + "loss": 0.9536, + "step": 8725 + }, + { + "epoch": 0.22, + "learning_rate": 1.989610583024726e-06, + "loss": 1.0391, + "step": 8726 + }, + { + "epoch": 0.22, + "learning_rate": 1.9896066043606893e-06, + "loss": 0.9492, + "step": 8727 + }, + { + "epoch": 0.22, + "learning_rate": 1.9896026249389557e-06, + "loss": 0.7646, + "step": 8728 + }, + { + "epoch": 0.22, + "learning_rate": 1.9895986447595287e-06, + "loss": 0.9912, + "step": 8729 + }, + { + "epoch": 0.22, + "learning_rate": 1.989594663822412e-06, + "loss": 0.6636, + "step": 8730 + }, + { + "epoch": 0.22, + "learning_rate": 1.989590682127608e-06, + "loss": 0.8926, + "step": 8731 + }, + { + "epoch": 0.22, + "learning_rate": 1.9895866996751197e-06, + "loss": 1.123, + "step": 8732 + }, + { + "epoch": 0.22, + "learning_rate": 1.9895827164649507e-06, + "loss": 1.0566, + "step": 8733 + }, + { + "epoch": 0.22, + "learning_rate": 1.9895787324971036e-06, + "loss": 0.7632, + "step": 8734 + }, + { + "epoch": 0.22, + "learning_rate": 1.9895747477715817e-06, + "loss": 0.4839, + "step": 8735 + }, + { + "epoch": 0.22, + "learning_rate": 1.9895707622883876e-06, + "loss": 0.7407, + "step": 8736 + }, + { + "epoch": 0.22, + "learning_rate": 1.9895667760475246e-06, + "loss": 0.9414, + "step": 8737 + }, + { + "epoch": 0.22, + "learning_rate": 1.989562789048996e-06, + "loss": 0.874, + "step": 8738 + }, + { + "epoch": 0.22, + "learning_rate": 1.9895588012928052e-06, + "loss": 0.873, + "step": 8739 + }, + { + "epoch": 0.22, + "learning_rate": 1.989554812778954e-06, + "loss": 0.6748, + "step": 8740 + }, + { + "epoch": 0.22, + "learning_rate": 1.9895508235074464e-06, + "loss": 1.166, + "step": 8741 + }, + { + "epoch": 0.22, + "learning_rate": 1.9895468334782853e-06, + "loss": 1.084, + "step": 8742 + }, + { + "epoch": 0.22, + "learning_rate": 1.9895428426914736e-06, + "loss": 0.7529, + "step": 8743 + }, + { + "epoch": 0.22, + "learning_rate": 1.9895388511470146e-06, + "loss": 0.8213, + "step": 8744 + }, + { + "epoch": 0.22, + "learning_rate": 1.989534858844911e-06, + "loss": 0.7275, + "step": 8745 + }, + { + "epoch": 0.22, + "learning_rate": 1.9895308657851663e-06, + "loss": 0.96, + "step": 8746 + }, + { + "epoch": 0.22, + "learning_rate": 1.989526871967783e-06, + "loss": 0.918, + "step": 8747 + }, + { + "epoch": 0.22, + "learning_rate": 1.9895228773927646e-06, + "loss": 1.1074, + "step": 8748 + }, + { + "epoch": 0.22, + "learning_rate": 1.989518882060114e-06, + "loss": 0.875, + "step": 8749 + }, + { + "epoch": 0.22, + "learning_rate": 1.9895148859698344e-06, + "loss": 0.7515, + "step": 8750 + }, + { + "epoch": 0.22, + "learning_rate": 1.989510889121929e-06, + "loss": 1.0205, + "step": 8751 + }, + { + "epoch": 0.22, + "learning_rate": 1.9895068915164003e-06, + "loss": 0.8711, + "step": 8752 + }, + { + "epoch": 0.22, + "learning_rate": 1.9895028931532515e-06, + "loss": 1.2109, + "step": 8753 + }, + { + "epoch": 0.22, + "learning_rate": 1.989498894032486e-06, + "loss": 0.8584, + "step": 8754 + }, + { + "epoch": 0.22, + "learning_rate": 1.9894948941541067e-06, + "loss": 0.6992, + "step": 8755 + }, + { + "epoch": 0.22, + "learning_rate": 1.9894908935181166e-06, + "loss": 0.8237, + "step": 8756 + }, + { + "epoch": 0.22, + "learning_rate": 1.989486892124519e-06, + "loss": 0.876, + "step": 8757 + }, + { + "epoch": 0.22, + "learning_rate": 1.989482889973317e-06, + "loss": 0.9707, + "step": 8758 + }, + { + "epoch": 0.22, + "learning_rate": 1.989478887064513e-06, + "loss": 0.9023, + "step": 8759 + }, + { + "epoch": 0.22, + "learning_rate": 1.9894748833981104e-06, + "loss": 0.9502, + "step": 8760 + }, + { + "epoch": 0.22, + "learning_rate": 1.9894708789741127e-06, + "loss": 0.9141, + "step": 8761 + }, + { + "epoch": 0.22, + "learning_rate": 1.9894668737925227e-06, + "loss": 1.0273, + "step": 8762 + }, + { + "epoch": 0.22, + "learning_rate": 1.989462867853343e-06, + "loss": 0.8672, + "step": 8763 + }, + { + "epoch": 0.22, + "learning_rate": 1.9894588611565778e-06, + "loss": 0.791, + "step": 8764 + }, + { + "epoch": 0.22, + "learning_rate": 1.989454853702229e-06, + "loss": 0.8169, + "step": 8765 + }, + { + "epoch": 0.22, + "learning_rate": 1.9894508454903e-06, + "loss": 0.7939, + "step": 8766 + }, + { + "epoch": 0.22, + "learning_rate": 1.989446836520794e-06, + "loss": 1.2529, + "step": 8767 + }, + { + "epoch": 0.22, + "learning_rate": 1.9894428267937144e-06, + "loss": 0.9199, + "step": 8768 + }, + { + "epoch": 0.22, + "learning_rate": 1.9894388163090634e-06, + "loss": 0.8037, + "step": 8769 + }, + { + "epoch": 0.22, + "learning_rate": 1.989434805066845e-06, + "loss": 0.8809, + "step": 8770 + }, + { + "epoch": 0.22, + "learning_rate": 1.989430793067062e-06, + "loss": 0.9941, + "step": 8771 + }, + { + "epoch": 0.22, + "learning_rate": 1.9894267803097173e-06, + "loss": 0.677, + "step": 8772 + }, + { + "epoch": 0.22, + "learning_rate": 1.9894227667948135e-06, + "loss": 0.9375, + "step": 8773 + }, + { + "epoch": 0.22, + "learning_rate": 1.9894187525223544e-06, + "loss": 0.7764, + "step": 8774 + }, + { + "epoch": 0.22, + "learning_rate": 1.989414737492343e-06, + "loss": 1.0225, + "step": 8775 + }, + { + "epoch": 0.22, + "learning_rate": 1.989410721704782e-06, + "loss": 0.8467, + "step": 8776 + }, + { + "epoch": 0.22, + "learning_rate": 1.989406705159675e-06, + "loss": 0.6572, + "step": 8777 + }, + { + "epoch": 0.22, + "learning_rate": 1.9894026878570246e-06, + "loss": 0.7974, + "step": 8778 + }, + { + "epoch": 0.23, + "learning_rate": 1.989398669796834e-06, + "loss": 0.769, + "step": 8779 + }, + { + "epoch": 0.23, + "learning_rate": 1.989394650979107e-06, + "loss": 0.6606, + "step": 8780 + }, + { + "epoch": 0.23, + "learning_rate": 1.989390631403845e-06, + "loss": 0.8496, + "step": 8781 + }, + { + "epoch": 0.23, + "learning_rate": 1.9893866110710523e-06, + "loss": 1.0693, + "step": 8782 + }, + { + "epoch": 0.23, + "learning_rate": 1.9893825899807322e-06, + "loss": 0.9883, + "step": 8783 + }, + { + "epoch": 0.23, + "learning_rate": 1.9893785681328873e-06, + "loss": 0.9648, + "step": 8784 + }, + { + "epoch": 0.23, + "learning_rate": 1.9893745455275205e-06, + "loss": 1.001, + "step": 8785 + }, + { + "epoch": 0.23, + "learning_rate": 1.9893705221646352e-06, + "loss": 0.8594, + "step": 8786 + }, + { + "epoch": 0.23, + "learning_rate": 1.9893664980442344e-06, + "loss": 1.0361, + "step": 8787 + }, + { + "epoch": 0.23, + "learning_rate": 1.989362473166321e-06, + "loss": 0.825, + "step": 8788 + }, + { + "epoch": 0.23, + "learning_rate": 1.9893584475308983e-06, + "loss": 0.9922, + "step": 8789 + }, + { + "epoch": 0.23, + "learning_rate": 1.9893544211379695e-06, + "loss": 1.043, + "step": 8790 + }, + { + "epoch": 0.23, + "learning_rate": 1.9893503939875374e-06, + "loss": 0.6387, + "step": 8791 + }, + { + "epoch": 0.23, + "learning_rate": 1.9893463660796054e-06, + "loss": 0.9814, + "step": 8792 + }, + { + "epoch": 0.23, + "learning_rate": 1.989342337414176e-06, + "loss": 0.9092, + "step": 8793 + }, + { + "epoch": 0.23, + "learning_rate": 1.989338307991253e-06, + "loss": 0.7793, + "step": 8794 + }, + { + "epoch": 0.23, + "learning_rate": 1.9893342778108387e-06, + "loss": 1.001, + "step": 8795 + }, + { + "epoch": 0.23, + "learning_rate": 1.989330246872937e-06, + "loss": 0.6812, + "step": 8796 + }, + { + "epoch": 0.23, + "learning_rate": 1.9893262151775505e-06, + "loss": 0.8428, + "step": 8797 + }, + { + "epoch": 0.23, + "learning_rate": 1.9893221827246824e-06, + "loss": 0.834, + "step": 8798 + }, + { + "epoch": 0.23, + "learning_rate": 1.989318149514336e-06, + "loss": 0.8662, + "step": 8799 + }, + { + "epoch": 0.23, + "learning_rate": 1.989314115546514e-06, + "loss": 0.8369, + "step": 8800 + }, + { + "epoch": 0.23, + "learning_rate": 1.98931008082122e-06, + "loss": 0.7808, + "step": 8801 + }, + { + "epoch": 0.23, + "learning_rate": 1.989306045338456e-06, + "loss": 0.9902, + "step": 8802 + }, + { + "epoch": 0.23, + "learning_rate": 1.9893020090982263e-06, + "loss": 0.7793, + "step": 8803 + }, + { + "epoch": 0.23, + "learning_rate": 1.989297972100534e-06, + "loss": 0.9824, + "step": 8804 + }, + { + "epoch": 0.23, + "learning_rate": 1.989293934345381e-06, + "loss": 0.9268, + "step": 8805 + }, + { + "epoch": 0.23, + "learning_rate": 1.9892898958327715e-06, + "loss": 0.8916, + "step": 8806 + }, + { + "epoch": 0.23, + "learning_rate": 1.989285856562708e-06, + "loss": 0.9043, + "step": 8807 + }, + { + "epoch": 0.23, + "learning_rate": 1.9892818165351942e-06, + "loss": 0.9473, + "step": 8808 + }, + { + "epoch": 0.23, + "learning_rate": 1.9892777757502324e-06, + "loss": 0.9932, + "step": 8809 + }, + { + "epoch": 0.23, + "learning_rate": 1.9892737342078263e-06, + "loss": 0.8857, + "step": 8810 + }, + { + "epoch": 0.23, + "learning_rate": 1.9892696919079787e-06, + "loss": 0.7578, + "step": 8811 + }, + { + "epoch": 0.23, + "learning_rate": 1.9892656488506926e-06, + "loss": 0.8125, + "step": 8812 + }, + { + "epoch": 0.23, + "learning_rate": 1.9892616050359715e-06, + "loss": 0.9346, + "step": 8813 + }, + { + "epoch": 0.23, + "learning_rate": 1.9892575604638183e-06, + "loss": 0.8672, + "step": 8814 + }, + { + "epoch": 0.23, + "learning_rate": 1.9892535151342363e-06, + "loss": 0.9424, + "step": 8815 + }, + { + "epoch": 0.23, + "learning_rate": 1.9892494690472277e-06, + "loss": 0.8193, + "step": 8816 + }, + { + "epoch": 0.23, + "learning_rate": 1.989245422202797e-06, + "loss": 0.8838, + "step": 8817 + }, + { + "epoch": 0.23, + "learning_rate": 1.989241374600946e-06, + "loss": 1.0146, + "step": 8818 + }, + { + "epoch": 0.23, + "learning_rate": 1.9892373262416784e-06, + "loss": 1.0283, + "step": 8819 + }, + { + "epoch": 0.23, + "learning_rate": 1.9892332771249978e-06, + "loss": 0.9863, + "step": 8820 + }, + { + "epoch": 0.23, + "learning_rate": 1.989229227250906e-06, + "loss": 0.7998, + "step": 8821 + }, + { + "epoch": 0.23, + "learning_rate": 1.989225176619408e-06, + "loss": 0.9023, + "step": 8822 + }, + { + "epoch": 0.23, + "learning_rate": 1.9892211252305046e-06, + "loss": 1.0791, + "step": 8823 + }, + { + "epoch": 0.23, + "learning_rate": 1.989217073084201e-06, + "loss": 0.5728, + "step": 8824 + }, + { + "epoch": 0.23, + "learning_rate": 1.9892130201804987e-06, + "loss": 0.9697, + "step": 8825 + }, + { + "epoch": 0.23, + "learning_rate": 1.9892089665194015e-06, + "loss": 1.1338, + "step": 8826 + }, + { + "epoch": 0.23, + "learning_rate": 1.989204912100913e-06, + "loss": 1.0273, + "step": 8827 + }, + { + "epoch": 0.23, + "learning_rate": 1.989200856925035e-06, + "loss": 0.7637, + "step": 8828 + }, + { + "epoch": 0.23, + "learning_rate": 1.989196800991772e-06, + "loss": 1.0371, + "step": 8829 + }, + { + "epoch": 0.23, + "learning_rate": 1.9891927443011264e-06, + "loss": 1.1943, + "step": 8830 + }, + { + "epoch": 0.23, + "learning_rate": 1.9891886868531013e-06, + "loss": 1.0918, + "step": 8831 + }, + { + "epoch": 0.23, + "learning_rate": 1.9891846286477e-06, + "loss": 1.0352, + "step": 8832 + }, + { + "epoch": 0.23, + "learning_rate": 1.9891805696849257e-06, + "loss": 1.0029, + "step": 8833 + }, + { + "epoch": 0.23, + "learning_rate": 1.989176509964781e-06, + "loss": 1.1289, + "step": 8834 + }, + { + "epoch": 0.23, + "learning_rate": 1.989172449487269e-06, + "loss": 0.9639, + "step": 8835 + }, + { + "epoch": 0.23, + "learning_rate": 1.989168388252394e-06, + "loss": 0.9648, + "step": 8836 + }, + { + "epoch": 0.23, + "learning_rate": 1.9891643262601576e-06, + "loss": 0.9053, + "step": 8837 + }, + { + "epoch": 0.23, + "learning_rate": 1.989160263510564e-06, + "loss": 0.9219, + "step": 8838 + }, + { + "epoch": 0.23, + "learning_rate": 1.9891562000036154e-06, + "loss": 0.8311, + "step": 8839 + }, + { + "epoch": 0.23, + "learning_rate": 1.9891521357393154e-06, + "loss": 0.7231, + "step": 8840 + }, + { + "epoch": 0.23, + "learning_rate": 1.9891480707176675e-06, + "loss": 0.8169, + "step": 8841 + }, + { + "epoch": 0.23, + "learning_rate": 1.9891440049386744e-06, + "loss": 1.1465, + "step": 8842 + }, + { + "epoch": 0.23, + "learning_rate": 1.989139938402339e-06, + "loss": 1.1562, + "step": 8843 + }, + { + "epoch": 0.23, + "learning_rate": 1.9891358711086645e-06, + "loss": 0.7529, + "step": 8844 + }, + { + "epoch": 0.23, + "learning_rate": 1.989131803057654e-06, + "loss": 0.8091, + "step": 8845 + }, + { + "epoch": 0.23, + "learning_rate": 1.989127734249311e-06, + "loss": 1.082, + "step": 8846 + }, + { + "epoch": 0.23, + "learning_rate": 1.989123664683639e-06, + "loss": 0.7505, + "step": 8847 + }, + { + "epoch": 0.23, + "learning_rate": 1.98911959436064e-06, + "loss": 0.8252, + "step": 8848 + }, + { + "epoch": 0.23, + "learning_rate": 1.9891155232803173e-06, + "loss": 0.8916, + "step": 8849 + }, + { + "epoch": 0.23, + "learning_rate": 1.9891114514426745e-06, + "loss": 0.9268, + "step": 8850 + }, + { + "epoch": 0.23, + "learning_rate": 1.989107378847715e-06, + "loss": 0.8911, + "step": 8851 + }, + { + "epoch": 0.23, + "learning_rate": 1.9891033054954403e-06, + "loss": 1.1719, + "step": 8852 + }, + { + "epoch": 0.23, + "learning_rate": 1.9890992313858557e-06, + "loss": 0.9717, + "step": 8853 + }, + { + "epoch": 0.23, + "learning_rate": 1.989095156518963e-06, + "loss": 0.9346, + "step": 8854 + }, + { + "epoch": 0.23, + "learning_rate": 1.9890910808947658e-06, + "loss": 0.998, + "step": 8855 + }, + { + "epoch": 0.23, + "learning_rate": 1.989087004513267e-06, + "loss": 0.6006, + "step": 8856 + }, + { + "epoch": 0.23, + "learning_rate": 1.989082927374469e-06, + "loss": 0.7793, + "step": 8857 + }, + { + "epoch": 0.23, + "learning_rate": 1.9890788494783767e-06, + "loss": 0.6191, + "step": 8858 + }, + { + "epoch": 0.23, + "learning_rate": 1.9890747708249918e-06, + "loss": 1.1904, + "step": 8859 + }, + { + "epoch": 0.23, + "learning_rate": 1.989070691414318e-06, + "loss": 0.9248, + "step": 8860 + }, + { + "epoch": 0.23, + "learning_rate": 1.989066611246358e-06, + "loss": 0.8076, + "step": 8861 + }, + { + "epoch": 0.23, + "learning_rate": 1.9890625303211157e-06, + "loss": 0.9355, + "step": 8862 + }, + { + "epoch": 0.23, + "learning_rate": 1.9890584486385927e-06, + "loss": 0.7852, + "step": 8863 + }, + { + "epoch": 0.23, + "learning_rate": 1.989054366198794e-06, + "loss": 0.7642, + "step": 8864 + }, + { + "epoch": 0.23, + "learning_rate": 1.9890502830017215e-06, + "loss": 0.9561, + "step": 8865 + }, + { + "epoch": 0.23, + "learning_rate": 1.9890461990473787e-06, + "loss": 0.8174, + "step": 8866 + }, + { + "epoch": 0.23, + "learning_rate": 1.9890421143357685e-06, + "loss": 0.9971, + "step": 8867 + }, + { + "epoch": 0.23, + "learning_rate": 1.989038028866895e-06, + "loss": 0.7598, + "step": 8868 + }, + { + "epoch": 0.23, + "learning_rate": 1.9890339426407597e-06, + "loss": 0.9243, + "step": 8869 + }, + { + "epoch": 0.23, + "learning_rate": 1.989029855657367e-06, + "loss": 0.9072, + "step": 8870 + }, + { + "epoch": 0.23, + "learning_rate": 1.9890257679167195e-06, + "loss": 0.9785, + "step": 8871 + }, + { + "epoch": 0.23, + "learning_rate": 1.9890216794188204e-06, + "loss": 0.9028, + "step": 8872 + }, + { + "epoch": 0.23, + "learning_rate": 1.989017590163673e-06, + "loss": 0.7422, + "step": 8873 + }, + { + "epoch": 0.23, + "learning_rate": 1.9890135001512803e-06, + "loss": 0.6768, + "step": 8874 + }, + { + "epoch": 0.23, + "learning_rate": 1.9890094093816456e-06, + "loss": 0.7676, + "step": 8875 + }, + { + "epoch": 0.23, + "learning_rate": 1.9890053178547715e-06, + "loss": 0.853, + "step": 8876 + }, + { + "epoch": 0.23, + "learning_rate": 1.989001225570662e-06, + "loss": 1.0752, + "step": 8877 + }, + { + "epoch": 0.23, + "learning_rate": 1.988997132529319e-06, + "loss": 0.7222, + "step": 8878 + }, + { + "epoch": 0.23, + "learning_rate": 1.9889930387307466e-06, + "loss": 0.8662, + "step": 8879 + }, + { + "epoch": 0.23, + "learning_rate": 1.988988944174948e-06, + "loss": 0.8242, + "step": 8880 + }, + { + "epoch": 0.23, + "learning_rate": 1.988984848861926e-06, + "loss": 0.6709, + "step": 8881 + }, + { + "epoch": 0.23, + "learning_rate": 1.9889807527916836e-06, + "loss": 0.8896, + "step": 8882 + }, + { + "epoch": 0.23, + "learning_rate": 1.9889766559642242e-06, + "loss": 0.9521, + "step": 8883 + }, + { + "epoch": 0.23, + "learning_rate": 1.988972558379551e-06, + "loss": 0.959, + "step": 8884 + }, + { + "epoch": 0.23, + "learning_rate": 1.988968460037667e-06, + "loss": 0.834, + "step": 8885 + }, + { + "epoch": 0.23, + "learning_rate": 1.988964360938575e-06, + "loss": 0.915, + "step": 8886 + }, + { + "epoch": 0.23, + "learning_rate": 1.9889602610822788e-06, + "loss": 0.7803, + "step": 8887 + }, + { + "epoch": 0.23, + "learning_rate": 1.988956160468781e-06, + "loss": 1.0967, + "step": 8888 + }, + { + "epoch": 0.23, + "learning_rate": 1.988952059098085e-06, + "loss": 0.9307, + "step": 8889 + }, + { + "epoch": 0.23, + "learning_rate": 1.9889479569701937e-06, + "loss": 0.9492, + "step": 8890 + }, + { + "epoch": 0.23, + "learning_rate": 1.9889438540851105e-06, + "loss": 0.8184, + "step": 8891 + }, + { + "epoch": 0.23, + "learning_rate": 1.9889397504428387e-06, + "loss": 0.8711, + "step": 8892 + }, + { + "epoch": 0.23, + "learning_rate": 1.988935646043381e-06, + "loss": 0.7944, + "step": 8893 + }, + { + "epoch": 0.23, + "learning_rate": 1.9889315408867408e-06, + "loss": 0.9102, + "step": 8894 + }, + { + "epoch": 0.23, + "learning_rate": 1.9889274349729214e-06, + "loss": 0.9697, + "step": 8895 + }, + { + "epoch": 0.23, + "learning_rate": 1.9889233283019254e-06, + "loss": 0.7744, + "step": 8896 + }, + { + "epoch": 0.23, + "learning_rate": 1.9889192208737564e-06, + "loss": 1.0, + "step": 8897 + }, + { + "epoch": 0.23, + "learning_rate": 1.9889151126884175e-06, + "loss": 0.9697, + "step": 8898 + }, + { + "epoch": 0.23, + "learning_rate": 1.988911003745912e-06, + "loss": 1.0605, + "step": 8899 + }, + { + "epoch": 0.23, + "learning_rate": 1.9889068940462424e-06, + "loss": 1.0078, + "step": 8900 + }, + { + "epoch": 0.23, + "learning_rate": 1.9889027835894123e-06, + "loss": 0.875, + "step": 8901 + }, + { + "epoch": 0.23, + "learning_rate": 1.988898672375425e-06, + "loss": 0.9736, + "step": 8902 + }, + { + "epoch": 0.23, + "learning_rate": 1.988894560404283e-06, + "loss": 0.627, + "step": 8903 + }, + { + "epoch": 0.23, + "learning_rate": 1.9888904476759906e-06, + "loss": 0.9434, + "step": 8904 + }, + { + "epoch": 0.23, + "learning_rate": 1.9888863341905497e-06, + "loss": 1.0098, + "step": 8905 + }, + { + "epoch": 0.23, + "learning_rate": 1.988882219947964e-06, + "loss": 0.9727, + "step": 8906 + }, + { + "epoch": 0.23, + "learning_rate": 1.988878104948237e-06, + "loss": 0.6646, + "step": 8907 + }, + { + "epoch": 0.23, + "learning_rate": 1.988873989191371e-06, + "loss": 0.9932, + "step": 8908 + }, + { + "epoch": 0.23, + "learning_rate": 1.9888698726773707e-06, + "loss": 1.0576, + "step": 8909 + }, + { + "epoch": 0.23, + "learning_rate": 1.988865755406237e-06, + "loss": 0.9385, + "step": 8910 + }, + { + "epoch": 0.23, + "learning_rate": 1.988861637377975e-06, + "loss": 0.6936, + "step": 8911 + }, + { + "epoch": 0.23, + "learning_rate": 1.9888575185925868e-06, + "loss": 0.9893, + "step": 8912 + }, + { + "epoch": 0.23, + "learning_rate": 1.9888533990500763e-06, + "loss": 1.1094, + "step": 8913 + }, + { + "epoch": 0.23, + "learning_rate": 1.988849278750446e-06, + "loss": 0.8076, + "step": 8914 + }, + { + "epoch": 0.23, + "learning_rate": 1.988845157693699e-06, + "loss": 0.9023, + "step": 8915 + }, + { + "epoch": 0.23, + "learning_rate": 1.9888410358798388e-06, + "loss": 0.9395, + "step": 8916 + }, + { + "epoch": 0.23, + "learning_rate": 1.9888369133088683e-06, + "loss": 1.0244, + "step": 8917 + }, + { + "epoch": 0.23, + "learning_rate": 1.9888327899807915e-06, + "loss": 0.8066, + "step": 8918 + }, + { + "epoch": 0.23, + "learning_rate": 1.9888286658956103e-06, + "loss": 1.1074, + "step": 8919 + }, + { + "epoch": 0.23, + "learning_rate": 1.9888245410533287e-06, + "loss": 0.6292, + "step": 8920 + }, + { + "epoch": 0.23, + "learning_rate": 1.98882041545395e-06, + "loss": 0.8408, + "step": 8921 + }, + { + "epoch": 0.23, + "learning_rate": 1.9888162890974766e-06, + "loss": 0.7258, + "step": 8922 + }, + { + "epoch": 0.23, + "learning_rate": 1.9888121619839117e-06, + "loss": 0.9961, + "step": 8923 + }, + { + "epoch": 0.23, + "learning_rate": 1.988808034113259e-06, + "loss": 0.6824, + "step": 8924 + }, + { + "epoch": 0.23, + "learning_rate": 1.988803905485522e-06, + "loss": 0.7637, + "step": 8925 + }, + { + "epoch": 0.23, + "learning_rate": 1.9887997761007024e-06, + "loss": 0.9248, + "step": 8926 + }, + { + "epoch": 0.23, + "learning_rate": 1.988795645958805e-06, + "loss": 1.0283, + "step": 8927 + }, + { + "epoch": 0.23, + "learning_rate": 1.988791515059832e-06, + "loss": 1.0459, + "step": 8928 + }, + { + "epoch": 0.23, + "learning_rate": 1.9887873834037865e-06, + "loss": 0.8975, + "step": 8929 + }, + { + "epoch": 0.23, + "learning_rate": 1.9887832509906727e-06, + "loss": 1.1592, + "step": 8930 + }, + { + "epoch": 0.23, + "learning_rate": 1.9887791178204923e-06, + "loss": 0.8311, + "step": 8931 + }, + { + "epoch": 0.23, + "learning_rate": 1.9887749838932495e-06, + "loss": 1.0557, + "step": 8932 + }, + { + "epoch": 0.23, + "learning_rate": 1.9887708492089473e-06, + "loss": 1.0781, + "step": 8933 + }, + { + "epoch": 0.23, + "learning_rate": 1.9887667137675886e-06, + "loss": 0.855, + "step": 8934 + }, + { + "epoch": 0.23, + "learning_rate": 1.988762577569177e-06, + "loss": 0.9727, + "step": 8935 + }, + { + "epoch": 0.23, + "learning_rate": 1.9887584406137147e-06, + "loss": 0.9199, + "step": 8936 + }, + { + "epoch": 0.23, + "learning_rate": 1.9887543029012057e-06, + "loss": 0.791, + "step": 8937 + }, + { + "epoch": 0.23, + "learning_rate": 1.9887501644316535e-06, + "loss": 0.9258, + "step": 8938 + }, + { + "epoch": 0.23, + "learning_rate": 1.98874602520506e-06, + "loss": 0.9766, + "step": 8939 + }, + { + "epoch": 0.23, + "learning_rate": 1.98874188522143e-06, + "loss": 0.9375, + "step": 8940 + }, + { + "epoch": 0.23, + "learning_rate": 1.988737744480765e-06, + "loss": 0.9453, + "step": 8941 + }, + { + "epoch": 0.23, + "learning_rate": 1.9887336029830697e-06, + "loss": 0.9531, + "step": 8942 + }, + { + "epoch": 0.23, + "learning_rate": 1.9887294607283457e-06, + "loss": 0.9268, + "step": 8943 + }, + { + "epoch": 0.23, + "learning_rate": 1.988725317716598e-06, + "loss": 0.9336, + "step": 8944 + }, + { + "epoch": 0.23, + "learning_rate": 1.988721173947828e-06, + "loss": 1.0869, + "step": 8945 + }, + { + "epoch": 0.23, + "learning_rate": 1.98871702942204e-06, + "loss": 0.7227, + "step": 8946 + }, + { + "epoch": 0.23, + "learning_rate": 1.988712884139237e-06, + "loss": 0.9219, + "step": 8947 + }, + { + "epoch": 0.23, + "learning_rate": 1.9887087380994216e-06, + "loss": 0.7529, + "step": 8948 + }, + { + "epoch": 0.23, + "learning_rate": 1.9887045913025974e-06, + "loss": 0.8433, + "step": 8949 + }, + { + "epoch": 0.23, + "learning_rate": 1.9887004437487675e-06, + "loss": 0.8853, + "step": 8950 + }, + { + "epoch": 0.23, + "learning_rate": 1.9886962954379354e-06, + "loss": 0.9307, + "step": 8951 + }, + { + "epoch": 0.23, + "learning_rate": 1.988692146370104e-06, + "loss": 0.8809, + "step": 8952 + }, + { + "epoch": 0.23, + "learning_rate": 1.9886879965452764e-06, + "loss": 0.96, + "step": 8953 + }, + { + "epoch": 0.23, + "learning_rate": 1.9886838459634562e-06, + "loss": 1.0005, + "step": 8954 + }, + { + "epoch": 0.23, + "learning_rate": 1.9886796946246457e-06, + "loss": 0.7349, + "step": 8955 + }, + { + "epoch": 0.23, + "learning_rate": 1.988675542528849e-06, + "loss": 0.7949, + "step": 8956 + }, + { + "epoch": 0.23, + "learning_rate": 1.9886713896760687e-06, + "loss": 0.8955, + "step": 8957 + }, + { + "epoch": 0.23, + "learning_rate": 1.988667236066308e-06, + "loss": 0.9883, + "step": 8958 + }, + { + "epoch": 0.23, + "learning_rate": 1.9886630816995704e-06, + "loss": 1.0664, + "step": 8959 + }, + { + "epoch": 0.23, + "learning_rate": 1.988658926575859e-06, + "loss": 0.9727, + "step": 8960 + }, + { + "epoch": 0.23, + "learning_rate": 1.9886547706951775e-06, + "loss": 0.8213, + "step": 8961 + }, + { + "epoch": 0.23, + "learning_rate": 1.988650614057528e-06, + "loss": 1.0059, + "step": 8962 + }, + { + "epoch": 0.23, + "learning_rate": 1.9886464566629137e-06, + "loss": 0.9417, + "step": 8963 + }, + { + "epoch": 0.23, + "learning_rate": 1.9886422985113388e-06, + "loss": 0.6252, + "step": 8964 + }, + { + "epoch": 0.23, + "learning_rate": 1.9886381396028057e-06, + "loss": 1.0137, + "step": 8965 + }, + { + "epoch": 0.23, + "learning_rate": 1.9886339799373178e-06, + "loss": 0.8682, + "step": 8966 + }, + { + "epoch": 0.23, + "learning_rate": 1.988629819514879e-06, + "loss": 1.0957, + "step": 8967 + }, + { + "epoch": 0.23, + "learning_rate": 1.988625658335491e-06, + "loss": 0.8081, + "step": 8968 + }, + { + "epoch": 0.23, + "learning_rate": 1.9886214963991583e-06, + "loss": 0.5977, + "step": 8969 + }, + { + "epoch": 0.23, + "learning_rate": 1.988617333705883e-06, + "loss": 0.9219, + "step": 8970 + }, + { + "epoch": 0.23, + "learning_rate": 1.9886131702556693e-06, + "loss": 1.1387, + "step": 8971 + }, + { + "epoch": 0.23, + "learning_rate": 1.98860900604852e-06, + "loss": 1.1836, + "step": 8972 + }, + { + "epoch": 0.23, + "learning_rate": 1.988604841084438e-06, + "loss": 0.8916, + "step": 8973 + }, + { + "epoch": 0.23, + "learning_rate": 1.988600675363427e-06, + "loss": 0.812, + "step": 8974 + }, + { + "epoch": 0.23, + "learning_rate": 1.98859650888549e-06, + "loss": 0.5825, + "step": 8975 + }, + { + "epoch": 0.23, + "learning_rate": 1.9885923416506297e-06, + "loss": 1.0, + "step": 8976 + }, + { + "epoch": 0.23, + "learning_rate": 1.98858817365885e-06, + "loss": 1.126, + "step": 8977 + }, + { + "epoch": 0.23, + "learning_rate": 1.9885840049101533e-06, + "loss": 1.0801, + "step": 8978 + }, + { + "epoch": 0.23, + "learning_rate": 1.988579835404544e-06, + "loss": 0.7852, + "step": 8979 + }, + { + "epoch": 0.23, + "learning_rate": 1.988575665142024e-06, + "loss": 0.9736, + "step": 8980 + }, + { + "epoch": 0.23, + "learning_rate": 1.9885714941225975e-06, + "loss": 0.8066, + "step": 8981 + }, + { + "epoch": 0.23, + "learning_rate": 1.9885673223462672e-06, + "loss": 0.9131, + "step": 8982 + }, + { + "epoch": 0.23, + "learning_rate": 1.9885631498130364e-06, + "loss": 1.0059, + "step": 8983 + }, + { + "epoch": 0.23, + "learning_rate": 1.988558976522908e-06, + "loss": 0.8047, + "step": 8984 + }, + { + "epoch": 0.23, + "learning_rate": 1.988554802475885e-06, + "loss": 0.6328, + "step": 8985 + }, + { + "epoch": 0.23, + "learning_rate": 1.988550627671972e-06, + "loss": 1.126, + "step": 8986 + }, + { + "epoch": 0.23, + "learning_rate": 1.9885464521111706e-06, + "loss": 0.8496, + "step": 8987 + }, + { + "epoch": 0.23, + "learning_rate": 1.988542275793485e-06, + "loss": 0.998, + "step": 8988 + }, + { + "epoch": 0.23, + "learning_rate": 1.988538098718918e-06, + "loss": 0.5942, + "step": 8989 + }, + { + "epoch": 0.23, + "learning_rate": 1.9885339208874727e-06, + "loss": 1.1025, + "step": 8990 + }, + { + "epoch": 0.23, + "learning_rate": 1.9885297422991523e-06, + "loss": 0.9658, + "step": 8991 + }, + { + "epoch": 0.23, + "learning_rate": 1.98852556295396e-06, + "loss": 0.8496, + "step": 8992 + }, + { + "epoch": 0.23, + "learning_rate": 1.9885213828519e-06, + "loss": 0.7386, + "step": 8993 + }, + { + "epoch": 0.23, + "learning_rate": 1.9885172019929735e-06, + "loss": 0.8745, + "step": 8994 + }, + { + "epoch": 0.23, + "learning_rate": 1.988513020377186e-06, + "loss": 0.8, + "step": 8995 + }, + { + "epoch": 0.23, + "learning_rate": 1.9885088380045386e-06, + "loss": 0.7332, + "step": 8996 + }, + { + "epoch": 0.23, + "learning_rate": 1.9885046548750357e-06, + "loss": 0.9219, + "step": 8997 + }, + { + "epoch": 0.23, + "learning_rate": 1.98850047098868e-06, + "loss": 0.8525, + "step": 8998 + }, + { + "epoch": 0.23, + "learning_rate": 1.9884962863454755e-06, + "loss": 1.0957, + "step": 8999 + }, + { + "epoch": 0.23, + "learning_rate": 1.9884921009454245e-06, + "loss": 1.0293, + "step": 9000 + }, + { + "epoch": 0.23, + "learning_rate": 1.9884879147885306e-06, + "loss": 0.8711, + "step": 9001 + }, + { + "epoch": 0.23, + "learning_rate": 1.988483727874797e-06, + "loss": 0.8857, + "step": 9002 + }, + { + "epoch": 0.23, + "learning_rate": 1.988479540204227e-06, + "loss": 1.0088, + "step": 9003 + }, + { + "epoch": 0.23, + "learning_rate": 1.9884753517768234e-06, + "loss": 0.916, + "step": 9004 + }, + { + "epoch": 0.23, + "learning_rate": 1.9884711625925896e-06, + "loss": 0.9268, + "step": 9005 + }, + { + "epoch": 0.23, + "learning_rate": 1.9884669726515294e-06, + "loss": 0.8232, + "step": 9006 + }, + { + "epoch": 0.23, + "learning_rate": 1.988462781953645e-06, + "loss": 0.8389, + "step": 9007 + }, + { + "epoch": 0.23, + "learning_rate": 1.98845859049894e-06, + "loss": 0.9805, + "step": 9008 + }, + { + "epoch": 0.23, + "learning_rate": 1.988454398287418e-06, + "loss": 0.9541, + "step": 9009 + }, + { + "epoch": 0.23, + "learning_rate": 1.9884502053190818e-06, + "loss": 0.7974, + "step": 9010 + }, + { + "epoch": 0.23, + "learning_rate": 1.988446011593935e-06, + "loss": 1.0381, + "step": 9011 + }, + { + "epoch": 0.23, + "learning_rate": 1.98844181711198e-06, + "loss": 1.0781, + "step": 9012 + }, + { + "epoch": 0.23, + "learning_rate": 1.9884376218732214e-06, + "loss": 0.9219, + "step": 9013 + }, + { + "epoch": 0.23, + "learning_rate": 1.988433425877661e-06, + "loss": 0.9238, + "step": 9014 + }, + { + "epoch": 0.23, + "learning_rate": 1.9884292291253028e-06, + "loss": 0.9893, + "step": 9015 + }, + { + "epoch": 0.23, + "learning_rate": 1.9884250316161493e-06, + "loss": 0.647, + "step": 9016 + }, + { + "epoch": 0.23, + "learning_rate": 1.9884208333502045e-06, + "loss": 0.8467, + "step": 9017 + }, + { + "epoch": 0.23, + "learning_rate": 1.9884166343274713e-06, + "loss": 0.918, + "step": 9018 + }, + { + "epoch": 0.23, + "learning_rate": 1.988412434547953e-06, + "loss": 0.6909, + "step": 9019 + }, + { + "epoch": 0.23, + "learning_rate": 1.988408234011653e-06, + "loss": 0.9854, + "step": 9020 + }, + { + "epoch": 0.23, + "learning_rate": 1.9884040327185737e-06, + "loss": 1.1836, + "step": 9021 + }, + { + "epoch": 0.23, + "learning_rate": 1.9883998306687193e-06, + "loss": 0.9121, + "step": 9022 + }, + { + "epoch": 0.23, + "learning_rate": 1.9883956278620926e-06, + "loss": 0.7378, + "step": 9023 + }, + { + "epoch": 0.23, + "learning_rate": 1.9883914242986965e-06, + "loss": 0.8525, + "step": 9024 + }, + { + "epoch": 0.23, + "learning_rate": 1.9883872199785346e-06, + "loss": 0.8887, + "step": 9025 + }, + { + "epoch": 0.23, + "learning_rate": 1.98838301490161e-06, + "loss": 0.8284, + "step": 9026 + }, + { + "epoch": 0.23, + "learning_rate": 1.9883788090679265e-06, + "loss": 0.8497, + "step": 9027 + }, + { + "epoch": 0.23, + "learning_rate": 1.9883746024774863e-06, + "loss": 0.8145, + "step": 9028 + }, + { + "epoch": 0.23, + "learning_rate": 1.988370395130293e-06, + "loss": 1.002, + "step": 9029 + }, + { + "epoch": 0.23, + "learning_rate": 1.9883661870263505e-06, + "loss": 0.6392, + "step": 9030 + }, + { + "epoch": 0.23, + "learning_rate": 1.9883619781656612e-06, + "loss": 0.6111, + "step": 9031 + }, + { + "epoch": 0.23, + "learning_rate": 1.988357768548228e-06, + "loss": 0.8975, + "step": 9032 + }, + { + "epoch": 0.23, + "learning_rate": 1.9883535581740553e-06, + "loss": 0.7441, + "step": 9033 + }, + { + "epoch": 0.23, + "learning_rate": 1.988349347043146e-06, + "loss": 0.957, + "step": 9034 + }, + { + "epoch": 0.23, + "learning_rate": 1.9883451351555026e-06, + "loss": 0.8093, + "step": 9035 + }, + { + "epoch": 0.23, + "learning_rate": 1.9883409225111286e-06, + "loss": 0.8936, + "step": 9036 + }, + { + "epoch": 0.23, + "learning_rate": 1.9883367091100276e-06, + "loss": 0.9307, + "step": 9037 + }, + { + "epoch": 0.23, + "learning_rate": 1.9883324949522027e-06, + "loss": 0.8438, + "step": 9038 + }, + { + "epoch": 0.23, + "learning_rate": 1.988328280037657e-06, + "loss": 0.7598, + "step": 9039 + }, + { + "epoch": 0.23, + "learning_rate": 1.988324064366394e-06, + "loss": 0.864, + "step": 9040 + }, + { + "epoch": 0.23, + "learning_rate": 1.9883198479384166e-06, + "loss": 0.8203, + "step": 9041 + }, + { + "epoch": 0.23, + "learning_rate": 1.988315630753728e-06, + "loss": 0.8984, + "step": 9042 + }, + { + "epoch": 0.23, + "learning_rate": 1.9883114128123317e-06, + "loss": 0.8369, + "step": 9043 + }, + { + "epoch": 0.23, + "learning_rate": 1.9883071941142306e-06, + "loss": 0.999, + "step": 9044 + }, + { + "epoch": 0.23, + "learning_rate": 1.9883029746594284e-06, + "loss": 0.7842, + "step": 9045 + }, + { + "epoch": 0.23, + "learning_rate": 1.988298754447928e-06, + "loss": 1.0186, + "step": 9046 + }, + { + "epoch": 0.23, + "learning_rate": 1.9882945334797324e-06, + "loss": 0.7549, + "step": 9047 + }, + { + "epoch": 0.23, + "learning_rate": 1.9882903117548455e-06, + "loss": 1.0664, + "step": 9048 + }, + { + "epoch": 0.23, + "learning_rate": 1.9882860892732697e-06, + "loss": 0.8672, + "step": 9049 + }, + { + "epoch": 0.23, + "learning_rate": 1.9882818660350093e-06, + "loss": 0.9395, + "step": 9050 + }, + { + "epoch": 0.23, + "learning_rate": 1.9882776420400664e-06, + "loss": 0.9287, + "step": 9051 + }, + { + "epoch": 0.23, + "learning_rate": 1.988273417288445e-06, + "loss": 0.8955, + "step": 9052 + }, + { + "epoch": 0.23, + "learning_rate": 1.988269191780148e-06, + "loss": 0.748, + "step": 9053 + }, + { + "epoch": 0.23, + "learning_rate": 1.9882649655151785e-06, + "loss": 0.8662, + "step": 9054 + }, + { + "epoch": 0.23, + "learning_rate": 1.9882607384935404e-06, + "loss": 0.9922, + "step": 9055 + }, + { + "epoch": 0.23, + "learning_rate": 1.988256510715236e-06, + "loss": 1.0508, + "step": 9056 + }, + { + "epoch": 0.23, + "learning_rate": 1.9882522821802694e-06, + "loss": 0.9463, + "step": 9057 + }, + { + "epoch": 0.23, + "learning_rate": 1.9882480528886436e-06, + "loss": 1.0742, + "step": 9058 + }, + { + "epoch": 0.23, + "learning_rate": 1.988243822840361e-06, + "loss": 1.0146, + "step": 9059 + }, + { + "epoch": 0.23, + "learning_rate": 1.9882395920354266e-06, + "loss": 0.959, + "step": 9060 + }, + { + "epoch": 0.23, + "learning_rate": 1.988235360473842e-06, + "loss": 0.8496, + "step": 9061 + }, + { + "epoch": 0.23, + "learning_rate": 1.9882311281556107e-06, + "loss": 0.9531, + "step": 9062 + }, + { + "epoch": 0.23, + "learning_rate": 1.9882268950807368e-06, + "loss": 0.918, + "step": 9063 + }, + { + "epoch": 0.23, + "learning_rate": 1.9882226612492227e-06, + "loss": 0.8555, + "step": 9064 + }, + { + "epoch": 0.23, + "learning_rate": 1.988218426661072e-06, + "loss": 0.8496, + "step": 9065 + }, + { + "epoch": 0.23, + "learning_rate": 1.988214191316288e-06, + "loss": 0.833, + "step": 9066 + }, + { + "epoch": 0.23, + "learning_rate": 1.9882099552148737e-06, + "loss": 0.9854, + "step": 9067 + }, + { + "epoch": 0.23, + "learning_rate": 1.9882057183568326e-06, + "loss": 0.75, + "step": 9068 + }, + { + "epoch": 0.23, + "learning_rate": 1.988201480742168e-06, + "loss": 0.8701, + "step": 9069 + }, + { + "epoch": 0.23, + "learning_rate": 1.9881972423708825e-06, + "loss": 1.0342, + "step": 9070 + }, + { + "epoch": 0.23, + "learning_rate": 1.9881930032429803e-06, + "loss": 0.9424, + "step": 9071 + }, + { + "epoch": 0.23, + "learning_rate": 1.988188763358464e-06, + "loss": 1.0693, + "step": 9072 + }, + { + "epoch": 0.23, + "learning_rate": 1.988184522717337e-06, + "loss": 0.874, + "step": 9073 + }, + { + "epoch": 0.23, + "learning_rate": 1.988180281319602e-06, + "loss": 1.2021, + "step": 9074 + }, + { + "epoch": 0.23, + "learning_rate": 1.988176039165263e-06, + "loss": 0.9492, + "step": 9075 + }, + { + "epoch": 0.23, + "learning_rate": 1.988171796254324e-06, + "loss": 1.2012, + "step": 9076 + }, + { + "epoch": 0.23, + "learning_rate": 1.9881675525867862e-06, + "loss": 0.8799, + "step": 9077 + }, + { + "epoch": 0.23, + "learning_rate": 1.9881633081626542e-06, + "loss": 0.8516, + "step": 9078 + }, + { + "epoch": 0.23, + "learning_rate": 1.9881590629819312e-06, + "loss": 0.9541, + "step": 9079 + }, + { + "epoch": 0.23, + "learning_rate": 1.98815481704462e-06, + "loss": 0.7065, + "step": 9080 + }, + { + "epoch": 0.23, + "learning_rate": 1.9881505703507245e-06, + "loss": 1.0264, + "step": 9081 + }, + { + "epoch": 0.23, + "learning_rate": 1.988146322900247e-06, + "loss": 0.9502, + "step": 9082 + }, + { + "epoch": 0.23, + "learning_rate": 1.988142074693192e-06, + "loss": 0.9424, + "step": 9083 + }, + { + "epoch": 0.23, + "learning_rate": 1.9881378257295617e-06, + "loss": 0.9199, + "step": 9084 + }, + { + "epoch": 0.23, + "learning_rate": 1.9881335760093596e-06, + "loss": 1.0176, + "step": 9085 + }, + { + "epoch": 0.23, + "learning_rate": 1.988129325532589e-06, + "loss": 0.9414, + "step": 9086 + }, + { + "epoch": 0.23, + "learning_rate": 1.9881250742992535e-06, + "loss": 1.0586, + "step": 9087 + }, + { + "epoch": 0.23, + "learning_rate": 1.988120822309356e-06, + "loss": 0.8457, + "step": 9088 + }, + { + "epoch": 0.23, + "learning_rate": 1.9881165695628995e-06, + "loss": 0.9473, + "step": 9089 + }, + { + "epoch": 0.23, + "learning_rate": 1.9881123160598876e-06, + "loss": 0.9541, + "step": 9090 + }, + { + "epoch": 0.23, + "learning_rate": 1.9881080618003237e-06, + "loss": 0.9531, + "step": 9091 + }, + { + "epoch": 0.23, + "learning_rate": 1.988103806784211e-06, + "loss": 0.592, + "step": 9092 + }, + { + "epoch": 0.23, + "learning_rate": 1.988099551011553e-06, + "loss": 0.7852, + "step": 9093 + }, + { + "epoch": 0.23, + "learning_rate": 1.9880952944823515e-06, + "loss": 0.8975, + "step": 9094 + }, + { + "epoch": 0.23, + "learning_rate": 1.9880910371966117e-06, + "loss": 0.9336, + "step": 9095 + }, + { + "epoch": 0.23, + "learning_rate": 1.9880867791543363e-06, + "loss": 1.1074, + "step": 9096 + }, + { + "epoch": 0.23, + "learning_rate": 1.9880825203555274e-06, + "loss": 1.0879, + "step": 9097 + }, + { + "epoch": 0.23, + "learning_rate": 1.98807826080019e-06, + "loss": 0.8042, + "step": 9098 + }, + { + "epoch": 0.23, + "learning_rate": 1.9880740004883257e-06, + "loss": 1.0781, + "step": 9099 + }, + { + "epoch": 0.23, + "learning_rate": 1.988069739419939e-06, + "loss": 0.9062, + "step": 9100 + }, + { + "epoch": 0.23, + "learning_rate": 1.988065477595033e-06, + "loss": 0.7451, + "step": 9101 + }, + { + "epoch": 0.23, + "learning_rate": 1.9880612150136102e-06, + "loss": 0.7354, + "step": 9102 + }, + { + "epoch": 0.23, + "learning_rate": 1.9880569516756747e-06, + "loss": 1.0254, + "step": 9103 + }, + { + "epoch": 0.23, + "learning_rate": 1.9880526875812294e-06, + "loss": 0.8799, + "step": 9104 + }, + { + "epoch": 0.23, + "learning_rate": 1.9880484227302775e-06, + "loss": 0.8984, + "step": 9105 + }, + { + "epoch": 0.23, + "learning_rate": 1.988044157122822e-06, + "loss": 0.8789, + "step": 9106 + }, + { + "epoch": 0.23, + "learning_rate": 1.9880398907588673e-06, + "loss": 0.8184, + "step": 9107 + }, + { + "epoch": 0.23, + "learning_rate": 1.988035623638415e-06, + "loss": 0.9756, + "step": 9108 + }, + { + "epoch": 0.23, + "learning_rate": 1.9880313557614697e-06, + "loss": 0.8018, + "step": 9109 + }, + { + "epoch": 0.23, + "learning_rate": 1.988027087128034e-06, + "loss": 0.8994, + "step": 9110 + }, + { + "epoch": 0.23, + "learning_rate": 1.988022817738112e-06, + "loss": 1.0098, + "step": 9111 + }, + { + "epoch": 0.23, + "learning_rate": 1.9880185475917058e-06, + "loss": 0.9082, + "step": 9112 + }, + { + "epoch": 0.23, + "learning_rate": 1.9880142766888194e-06, + "loss": 0.915, + "step": 9113 + }, + { + "epoch": 0.23, + "learning_rate": 1.988010005029456e-06, + "loss": 0.9492, + "step": 9114 + }, + { + "epoch": 0.23, + "learning_rate": 1.9880057326136185e-06, + "loss": 1.0859, + "step": 9115 + }, + { + "epoch": 0.23, + "learning_rate": 1.9880014594413107e-06, + "loss": 0.9766, + "step": 9116 + }, + { + "epoch": 0.23, + "learning_rate": 1.9879971855125355e-06, + "loss": 0.7783, + "step": 9117 + }, + { + "epoch": 0.23, + "learning_rate": 1.9879929108272964e-06, + "loss": 0.9795, + "step": 9118 + }, + { + "epoch": 0.23, + "learning_rate": 1.9879886353855967e-06, + "loss": 0.916, + "step": 9119 + }, + { + "epoch": 0.23, + "learning_rate": 1.987984359187439e-06, + "loss": 0.9922, + "step": 9120 + }, + { + "epoch": 0.23, + "learning_rate": 1.9879800822328276e-06, + "loss": 0.9541, + "step": 9121 + }, + { + "epoch": 0.23, + "learning_rate": 1.987975804521765e-06, + "loss": 0.7598, + "step": 9122 + }, + { + "epoch": 0.23, + "learning_rate": 1.9879715260542547e-06, + "loss": 0.8037, + "step": 9123 + }, + { + "epoch": 0.23, + "learning_rate": 1.9879672468303e-06, + "loss": 1.1074, + "step": 9124 + }, + { + "epoch": 0.23, + "learning_rate": 1.9879629668499044e-06, + "loss": 0.7017, + "step": 9125 + }, + { + "epoch": 0.23, + "learning_rate": 1.987958686113071e-06, + "loss": 0.8389, + "step": 9126 + }, + { + "epoch": 0.23, + "learning_rate": 1.9879544046198033e-06, + "loss": 0.9844, + "step": 9127 + }, + { + "epoch": 0.23, + "learning_rate": 1.987950122370104e-06, + "loss": 0.79, + "step": 9128 + }, + { + "epoch": 0.23, + "learning_rate": 1.9879458393639764e-06, + "loss": 0.8262, + "step": 9129 + }, + { + "epoch": 0.23, + "learning_rate": 1.9879415556014244e-06, + "loss": 0.9316, + "step": 9130 + }, + { + "epoch": 0.23, + "learning_rate": 1.9879372710824513e-06, + "loss": 0.9238, + "step": 9131 + }, + { + "epoch": 0.23, + "learning_rate": 1.9879329858070595e-06, + "loss": 1.1885, + "step": 9132 + }, + { + "epoch": 0.23, + "learning_rate": 1.9879286997752533e-06, + "loss": 0.833, + "step": 9133 + }, + { + "epoch": 0.23, + "learning_rate": 1.9879244129870357e-06, + "loss": 0.8335, + "step": 9134 + }, + { + "epoch": 0.23, + "learning_rate": 1.9879201254424092e-06, + "loss": 1.0273, + "step": 9135 + }, + { + "epoch": 0.23, + "learning_rate": 1.987915837141378e-06, + "loss": 1.001, + "step": 9136 + }, + { + "epoch": 0.23, + "learning_rate": 1.9879115480839452e-06, + "loss": 0.8174, + "step": 9137 + }, + { + "epoch": 0.23, + "learning_rate": 1.9879072582701136e-06, + "loss": 0.7651, + "step": 9138 + }, + { + "epoch": 0.23, + "learning_rate": 1.9879029676998867e-06, + "loss": 0.8828, + "step": 9139 + }, + { + "epoch": 0.23, + "learning_rate": 1.9878986763732683e-06, + "loss": 0.9219, + "step": 9140 + }, + { + "epoch": 0.23, + "learning_rate": 1.9878943842902617e-06, + "loss": 1.0576, + "step": 9141 + }, + { + "epoch": 0.23, + "learning_rate": 1.987890091450869e-06, + "loss": 0.9258, + "step": 9142 + }, + { + "epoch": 0.23, + "learning_rate": 1.9878857978550947e-06, + "loss": 0.9658, + "step": 9143 + }, + { + "epoch": 0.23, + "learning_rate": 1.987881503502942e-06, + "loss": 0.8594, + "step": 9144 + }, + { + "epoch": 0.23, + "learning_rate": 1.987877208394413e-06, + "loss": 0.8242, + "step": 9145 + }, + { + "epoch": 0.23, + "learning_rate": 1.987872912529512e-06, + "loss": 0.9658, + "step": 9146 + }, + { + "epoch": 0.23, + "learning_rate": 1.9878686159082428e-06, + "loss": 0.8564, + "step": 9147 + }, + { + "epoch": 0.23, + "learning_rate": 1.9878643185306077e-06, + "loss": 0.9043, + "step": 9148 + }, + { + "epoch": 0.23, + "learning_rate": 1.98786002039661e-06, + "loss": 0.7559, + "step": 9149 + }, + { + "epoch": 0.23, + "learning_rate": 1.9878557215062536e-06, + "loss": 1.001, + "step": 9150 + }, + { + "epoch": 0.23, + "learning_rate": 1.9878514218595414e-06, + "loss": 1.0381, + "step": 9151 + }, + { + "epoch": 0.23, + "learning_rate": 1.987847121456477e-06, + "loss": 0.6719, + "step": 9152 + }, + { + "epoch": 0.23, + "learning_rate": 1.987842820297063e-06, + "loss": 0.79, + "step": 9153 + }, + { + "epoch": 0.23, + "learning_rate": 1.987838518381304e-06, + "loss": 0.8828, + "step": 9154 + }, + { + "epoch": 0.23, + "learning_rate": 1.987834215709202e-06, + "loss": 0.7593, + "step": 9155 + }, + { + "epoch": 0.23, + "learning_rate": 1.987829912280761e-06, + "loss": 0.959, + "step": 9156 + }, + { + "epoch": 0.23, + "learning_rate": 1.9878256080959832e-06, + "loss": 0.8799, + "step": 9157 + }, + { + "epoch": 0.23, + "learning_rate": 1.9878213031548733e-06, + "loss": 0.9775, + "step": 9158 + }, + { + "epoch": 0.23, + "learning_rate": 1.987816997457434e-06, + "loss": 0.8643, + "step": 9159 + }, + { + "epoch": 0.23, + "learning_rate": 1.987812691003669e-06, + "loss": 0.9189, + "step": 9160 + }, + { + "epoch": 0.23, + "learning_rate": 1.9878083837935812e-06, + "loss": 0.8281, + "step": 9161 + }, + { + "epoch": 0.23, + "learning_rate": 1.9878040758271733e-06, + "loss": 1.0, + "step": 9162 + }, + { + "epoch": 0.23, + "learning_rate": 1.98779976710445e-06, + "loss": 1.042, + "step": 9163 + }, + { + "epoch": 0.23, + "learning_rate": 1.9877954576254133e-06, + "loss": 0.8555, + "step": 9164 + }, + { + "epoch": 0.23, + "learning_rate": 1.987791147390067e-06, + "loss": 1.0088, + "step": 9165 + }, + { + "epoch": 0.23, + "learning_rate": 1.987786836398415e-06, + "loss": 0.8711, + "step": 9166 + }, + { + "epoch": 0.23, + "learning_rate": 1.98778252465046e-06, + "loss": 0.7246, + "step": 9167 + }, + { + "epoch": 0.23, + "learning_rate": 1.987778212146205e-06, + "loss": 0.7979, + "step": 9168 + }, + { + "epoch": 0.24, + "learning_rate": 1.9877738988856536e-06, + "loss": 0.9697, + "step": 9169 + }, + { + "epoch": 0.24, + "learning_rate": 1.9877695848688094e-06, + "loss": 1.04, + "step": 9170 + }, + { + "epoch": 0.24, + "learning_rate": 1.987765270095675e-06, + "loss": 0.918, + "step": 9171 + }, + { + "epoch": 0.24, + "learning_rate": 1.9877609545662545e-06, + "loss": 0.959, + "step": 9172 + }, + { + "epoch": 0.24, + "learning_rate": 1.9877566382805507e-06, + "loss": 0.8701, + "step": 9173 + }, + { + "epoch": 0.24, + "learning_rate": 1.9877523212385673e-06, + "loss": 1.0298, + "step": 9174 + }, + { + "epoch": 0.24, + "learning_rate": 1.9877480034403074e-06, + "loss": 0.9067, + "step": 9175 + }, + { + "epoch": 0.24, + "learning_rate": 1.987743684885774e-06, + "loss": 0.9365, + "step": 9176 + }, + { + "epoch": 0.24, + "learning_rate": 1.9877393655749706e-06, + "loss": 0.8018, + "step": 9177 + }, + { + "epoch": 0.24, + "learning_rate": 1.987735045507901e-06, + "loss": 0.8906, + "step": 9178 + }, + { + "epoch": 0.24, + "learning_rate": 1.987730724684568e-06, + "loss": 0.8262, + "step": 9179 + }, + { + "epoch": 0.24, + "learning_rate": 1.9877264031049747e-06, + "loss": 0.8389, + "step": 9180 + }, + { + "epoch": 0.24, + "learning_rate": 1.9877220807691246e-06, + "loss": 1.0137, + "step": 9181 + }, + { + "epoch": 0.24, + "learning_rate": 1.9877177576770216e-06, + "loss": 0.9521, + "step": 9182 + }, + { + "epoch": 0.24, + "learning_rate": 1.9877134338286684e-06, + "loss": 1.1621, + "step": 9183 + }, + { + "epoch": 0.24, + "learning_rate": 1.987709109224068e-06, + "loss": 0.8799, + "step": 9184 + }, + { + "epoch": 0.24, + "learning_rate": 1.987704783863225e-06, + "loss": 1.0957, + "step": 9185 + }, + { + "epoch": 0.24, + "learning_rate": 1.987700457746141e-06, + "loss": 0.8438, + "step": 9186 + }, + { + "epoch": 0.24, + "learning_rate": 1.9876961308728206e-06, + "loss": 0.877, + "step": 9187 + }, + { + "epoch": 0.24, + "learning_rate": 1.9876918032432667e-06, + "loss": 0.644, + "step": 9188 + }, + { + "epoch": 0.24, + "learning_rate": 1.9876874748574825e-06, + "loss": 0.6123, + "step": 9189 + }, + { + "epoch": 0.24, + "learning_rate": 1.9876831457154716e-06, + "loss": 0.8301, + "step": 9190 + }, + { + "epoch": 0.24, + "learning_rate": 1.987678815817237e-06, + "loss": 0.9609, + "step": 9191 + }, + { + "epoch": 0.24, + "learning_rate": 1.987674485162782e-06, + "loss": 0.6943, + "step": 9192 + }, + { + "epoch": 0.24, + "learning_rate": 1.9876701537521103e-06, + "loss": 0.9229, + "step": 9193 + }, + { + "epoch": 0.24, + "learning_rate": 1.987665821585225e-06, + "loss": 0.8662, + "step": 9194 + }, + { + "epoch": 0.24, + "learning_rate": 1.987661488662129e-06, + "loss": 1.0166, + "step": 9195 + }, + { + "epoch": 0.24, + "learning_rate": 1.987657154982826e-06, + "loss": 1.001, + "step": 9196 + }, + { + "epoch": 0.24, + "learning_rate": 1.98765282054732e-06, + "loss": 0.7109, + "step": 9197 + }, + { + "epoch": 0.24, + "learning_rate": 1.987648485355613e-06, + "loss": 1.0928, + "step": 9198 + }, + { + "epoch": 0.24, + "learning_rate": 1.9876441494077093e-06, + "loss": 0.9287, + "step": 9199 + }, + { + "epoch": 0.24, + "learning_rate": 1.987639812703612e-06, + "loss": 0.9482, + "step": 9200 + }, + { + "epoch": 0.24, + "learning_rate": 1.987635475243324e-06, + "loss": 1.1084, + "step": 9201 + }, + { + "epoch": 0.24, + "learning_rate": 1.987631137026849e-06, + "loss": 0.6577, + "step": 9202 + }, + { + "epoch": 0.24, + "learning_rate": 1.9876267980541905e-06, + "loss": 0.9121, + "step": 9203 + }, + { + "epoch": 0.24, + "learning_rate": 1.9876224583253515e-06, + "loss": 0.8877, + "step": 9204 + }, + { + "epoch": 0.24, + "learning_rate": 1.9876181178403353e-06, + "loss": 1.1387, + "step": 9205 + }, + { + "epoch": 0.24, + "learning_rate": 1.9876137765991448e-06, + "loss": 0.7637, + "step": 9206 + }, + { + "epoch": 0.24, + "learning_rate": 1.9876094346017843e-06, + "loss": 0.9473, + "step": 9207 + }, + { + "epoch": 0.24, + "learning_rate": 1.9876050918482567e-06, + "loss": 0.9473, + "step": 9208 + }, + { + "epoch": 0.24, + "learning_rate": 1.9876007483385654e-06, + "loss": 0.9043, + "step": 9209 + }, + { + "epoch": 0.24, + "learning_rate": 1.9875964040727135e-06, + "loss": 1.2295, + "step": 9210 + }, + { + "epoch": 0.24, + "learning_rate": 1.9875920590507046e-06, + "loss": 0.958, + "step": 9211 + }, + { + "epoch": 0.24, + "learning_rate": 1.9875877132725418e-06, + "loss": 1.0127, + "step": 9212 + }, + { + "epoch": 0.24, + "learning_rate": 1.9875833667382284e-06, + "loss": 0.8945, + "step": 9213 + }, + { + "epoch": 0.24, + "learning_rate": 1.987579019447768e-06, + "loss": 0.8936, + "step": 9214 + }, + { + "epoch": 0.24, + "learning_rate": 1.9875746714011632e-06, + "loss": 1.0, + "step": 9215 + }, + { + "epoch": 0.24, + "learning_rate": 1.9875703225984186e-06, + "loss": 0.7671, + "step": 9216 + }, + { + "epoch": 0.24, + "learning_rate": 1.9875659730395365e-06, + "loss": 0.8027, + "step": 9217 + }, + { + "epoch": 0.24, + "learning_rate": 1.9875616227245204e-06, + "loss": 1.0098, + "step": 9218 + }, + { + "epoch": 0.24, + "learning_rate": 1.9875572716533736e-06, + "loss": 0.8408, + "step": 9219 + }, + { + "epoch": 0.24, + "learning_rate": 1.9875529198261e-06, + "loss": 0.6987, + "step": 9220 + }, + { + "epoch": 0.24, + "learning_rate": 1.9875485672427026e-06, + "loss": 1.0186, + "step": 9221 + }, + { + "epoch": 0.24, + "learning_rate": 1.9875442139031847e-06, + "loss": 0.9766, + "step": 9222 + }, + { + "epoch": 0.24, + "learning_rate": 1.9875398598075492e-06, + "loss": 1.0371, + "step": 9223 + }, + { + "epoch": 0.24, + "learning_rate": 1.9875355049558e-06, + "loss": 0.7357, + "step": 9224 + }, + { + "epoch": 0.24, + "learning_rate": 1.9875311493479406e-06, + "loss": 1.0713, + "step": 9225 + }, + { + "epoch": 0.24, + "learning_rate": 1.987526792983974e-06, + "loss": 1.0684, + "step": 9226 + }, + { + "epoch": 0.24, + "learning_rate": 1.987522435863903e-06, + "loss": 0.9346, + "step": 9227 + }, + { + "epoch": 0.24, + "learning_rate": 1.9875180779877317e-06, + "loss": 0.8643, + "step": 9228 + }, + { + "epoch": 0.24, + "learning_rate": 1.9875137193554632e-06, + "loss": 0.7808, + "step": 9229 + }, + { + "epoch": 0.24, + "learning_rate": 1.987509359967101e-06, + "loss": 1.0566, + "step": 9230 + }, + { + "epoch": 0.24, + "learning_rate": 1.987504999822648e-06, + "loss": 0.9668, + "step": 9231 + }, + { + "epoch": 0.24, + "learning_rate": 1.9875006389221085e-06, + "loss": 0.6887, + "step": 9232 + }, + { + "epoch": 0.24, + "learning_rate": 1.9874962772654842e-06, + "loss": 0.8027, + "step": 9233 + }, + { + "epoch": 0.24, + "learning_rate": 1.9874919148527806e-06, + "loss": 0.9199, + "step": 9234 + }, + { + "epoch": 0.24, + "learning_rate": 1.987487551683999e-06, + "loss": 0.832, + "step": 9235 + }, + { + "epoch": 0.24, + "learning_rate": 1.9874831877591437e-06, + "loss": 0.7275, + "step": 9236 + }, + { + "epoch": 0.24, + "learning_rate": 1.987478823078218e-06, + "loss": 0.8545, + "step": 9237 + }, + { + "epoch": 0.24, + "learning_rate": 1.987474457641225e-06, + "loss": 0.9023, + "step": 9238 + }, + { + "epoch": 0.24, + "learning_rate": 1.9874700914481686e-06, + "loss": 1.1055, + "step": 9239 + }, + { + "epoch": 0.24, + "learning_rate": 1.9874657244990513e-06, + "loss": 0.79, + "step": 9240 + }, + { + "epoch": 0.24, + "learning_rate": 1.987461356793877e-06, + "loss": 0.8789, + "step": 9241 + }, + { + "epoch": 0.24, + "learning_rate": 1.987456988332649e-06, + "loss": 1.0352, + "step": 9242 + }, + { + "epoch": 0.24, + "learning_rate": 1.987452619115371e-06, + "loss": 0.8164, + "step": 9243 + }, + { + "epoch": 0.24, + "learning_rate": 1.9874482491420455e-06, + "loss": 1.0518, + "step": 9244 + }, + { + "epoch": 0.24, + "learning_rate": 1.9874438784126765e-06, + "loss": 1.0557, + "step": 9245 + }, + { + "epoch": 0.24, + "learning_rate": 1.987439506927267e-06, + "loss": 1.0381, + "step": 9246 + }, + { + "epoch": 0.24, + "learning_rate": 1.9874351346858205e-06, + "loss": 0.792, + "step": 9247 + }, + { + "epoch": 0.24, + "learning_rate": 1.98743076168834e-06, + "loss": 0.9609, + "step": 9248 + }, + { + "epoch": 0.24, + "learning_rate": 1.9874263879348295e-06, + "loss": 0.8232, + "step": 9249 + }, + { + "epoch": 0.24, + "learning_rate": 1.9874220134252922e-06, + "loss": 0.8604, + "step": 9250 + }, + { + "epoch": 0.24, + "learning_rate": 1.987417638159731e-06, + "loss": 0.9805, + "step": 9251 + }, + { + "epoch": 0.24, + "learning_rate": 1.9874132621381497e-06, + "loss": 0.9043, + "step": 9252 + }, + { + "epoch": 0.24, + "learning_rate": 1.987408885360551e-06, + "loss": 0.9893, + "step": 9253 + }, + { + "epoch": 0.24, + "learning_rate": 1.9874045078269394e-06, + "loss": 0.5669, + "step": 9254 + }, + { + "epoch": 0.24, + "learning_rate": 1.9874001295373172e-06, + "loss": 0.7163, + "step": 9255 + }, + { + "epoch": 0.24, + "learning_rate": 1.987395750491688e-06, + "loss": 0.9707, + "step": 9256 + }, + { + "epoch": 0.24, + "learning_rate": 1.9873913706900558e-06, + "loss": 0.751, + "step": 9257 + }, + { + "epoch": 0.24, + "learning_rate": 1.987386990132423e-06, + "loss": 0.8354, + "step": 9258 + }, + { + "epoch": 0.24, + "learning_rate": 1.987382608818793e-06, + "loss": 0.916, + "step": 9259 + }, + { + "epoch": 0.24, + "learning_rate": 1.98737822674917e-06, + "loss": 0.8135, + "step": 9260 + }, + { + "epoch": 0.24, + "learning_rate": 1.987373843923557e-06, + "loss": 0.9482, + "step": 9261 + }, + { + "epoch": 0.24, + "learning_rate": 1.987369460341957e-06, + "loss": 1.1562, + "step": 9262 + }, + { + "epoch": 0.24, + "learning_rate": 1.987365076004374e-06, + "loss": 0.9854, + "step": 9263 + }, + { + "epoch": 0.24, + "learning_rate": 1.9873606909108104e-06, + "loss": 0.9385, + "step": 9264 + }, + { + "epoch": 0.24, + "learning_rate": 1.9873563050612706e-06, + "loss": 0.7842, + "step": 9265 + }, + { + "epoch": 0.24, + "learning_rate": 1.987351918455757e-06, + "loss": 0.8491, + "step": 9266 + }, + { + "epoch": 0.24, + "learning_rate": 1.987347531094274e-06, + "loss": 0.6943, + "step": 9267 + }, + { + "epoch": 0.24, + "learning_rate": 1.9873431429768243e-06, + "loss": 0.9883, + "step": 9268 + }, + { + "epoch": 0.24, + "learning_rate": 1.987338754103411e-06, + "loss": 0.835, + "step": 9269 + }, + { + "epoch": 0.24, + "learning_rate": 1.987334364474038e-06, + "loss": 0.9775, + "step": 9270 + }, + { + "epoch": 0.24, + "learning_rate": 1.9873299740887086e-06, + "loss": 0.876, + "step": 9271 + }, + { + "epoch": 0.24, + "learning_rate": 1.9873255829474257e-06, + "loss": 0.7861, + "step": 9272 + }, + { + "epoch": 0.24, + "learning_rate": 1.987321191050193e-06, + "loss": 1.123, + "step": 9273 + }, + { + "epoch": 0.24, + "learning_rate": 1.9873167983970143e-06, + "loss": 1.1172, + "step": 9274 + }, + { + "epoch": 0.24, + "learning_rate": 1.987312404987892e-06, + "loss": 0.9531, + "step": 9275 + }, + { + "epoch": 0.24, + "learning_rate": 1.9873080108228307e-06, + "loss": 0.7893, + "step": 9276 + }, + { + "epoch": 0.24, + "learning_rate": 1.9873036159018323e-06, + "loss": 0.9531, + "step": 9277 + }, + { + "epoch": 0.24, + "learning_rate": 1.9872992202249014e-06, + "loss": 0.9062, + "step": 9278 + }, + { + "epoch": 0.24, + "learning_rate": 1.9872948237920406e-06, + "loss": 1.1621, + "step": 9279 + }, + { + "epoch": 0.24, + "learning_rate": 1.9872904266032537e-06, + "loss": 1.0234, + "step": 9280 + }, + { + "epoch": 0.24, + "learning_rate": 1.987286028658544e-06, + "loss": 0.9395, + "step": 9281 + }, + { + "epoch": 0.24, + "learning_rate": 1.9872816299579144e-06, + "loss": 0.917, + "step": 9282 + }, + { + "epoch": 0.24, + "learning_rate": 1.987277230501369e-06, + "loss": 1.123, + "step": 9283 + }, + { + "epoch": 0.24, + "learning_rate": 1.987272830288911e-06, + "loss": 1.0654, + "step": 9284 + }, + { + "epoch": 0.24, + "learning_rate": 1.9872684293205433e-06, + "loss": 0.9053, + "step": 9285 + }, + { + "epoch": 0.24, + "learning_rate": 1.9872640275962693e-06, + "loss": 0.7354, + "step": 9286 + }, + { + "epoch": 0.24, + "learning_rate": 1.987259625116093e-06, + "loss": 0.916, + "step": 9287 + }, + { + "epoch": 0.24, + "learning_rate": 1.9872552218800178e-06, + "loss": 0.9609, + "step": 9288 + }, + { + "epoch": 0.24, + "learning_rate": 1.987250817888046e-06, + "loss": 1.0615, + "step": 9289 + }, + { + "epoch": 0.24, + "learning_rate": 1.9872464131401818e-06, + "loss": 0.917, + "step": 9290 + }, + { + "epoch": 0.24, + "learning_rate": 1.9872420076364286e-06, + "loss": 0.8633, + "step": 9291 + }, + { + "epoch": 0.24, + "learning_rate": 1.987237601376789e-06, + "loss": 0.9072, + "step": 9292 + }, + { + "epoch": 0.24, + "learning_rate": 1.9872331943612677e-06, + "loss": 1.0273, + "step": 9293 + }, + { + "epoch": 0.24, + "learning_rate": 1.9872287865898668e-06, + "loss": 0.793, + "step": 9294 + }, + { + "epoch": 0.24, + "learning_rate": 1.987224378062591e-06, + "loss": 0.7305, + "step": 9295 + }, + { + "epoch": 0.24, + "learning_rate": 1.987219968779442e-06, + "loss": 0.9668, + "step": 9296 + }, + { + "epoch": 0.24, + "learning_rate": 1.9872155587404246e-06, + "loss": 1.0049, + "step": 9297 + }, + { + "epoch": 0.24, + "learning_rate": 1.9872111479455413e-06, + "loss": 1.0283, + "step": 9298 + }, + { + "epoch": 0.24, + "learning_rate": 1.987206736394796e-06, + "loss": 0.5579, + "step": 9299 + }, + { + "epoch": 0.24, + "learning_rate": 1.987202324088192e-06, + "loss": 1.0264, + "step": 9300 + }, + { + "epoch": 0.24, + "learning_rate": 1.9871979110257324e-06, + "loss": 0.8145, + "step": 9301 + }, + { + "epoch": 0.24, + "learning_rate": 1.987193497207421e-06, + "loss": 0.8574, + "step": 9302 + }, + { + "epoch": 0.24, + "learning_rate": 1.9871890826332603e-06, + "loss": 1.082, + "step": 9303 + }, + { + "epoch": 0.24, + "learning_rate": 1.987184667303255e-06, + "loss": 1.0439, + "step": 9304 + }, + { + "epoch": 0.24, + "learning_rate": 1.9871802512174074e-06, + "loss": 0.624, + "step": 9305 + }, + { + "epoch": 0.24, + "learning_rate": 1.9871758343757214e-06, + "loss": 1.082, + "step": 9306 + }, + { + "epoch": 0.24, + "learning_rate": 1.9871714167782004e-06, + "loss": 1.1514, + "step": 9307 + }, + { + "epoch": 0.24, + "learning_rate": 1.9871669984248473e-06, + "loss": 0.8154, + "step": 9308 + }, + { + "epoch": 0.24, + "learning_rate": 1.987162579315666e-06, + "loss": 0.7529, + "step": 9309 + }, + { + "epoch": 0.24, + "learning_rate": 1.98715815945066e-06, + "loss": 1.0615, + "step": 9310 + }, + { + "epoch": 0.24, + "learning_rate": 1.9871537388298317e-06, + "loss": 0.9199, + "step": 9311 + }, + { + "epoch": 0.24, + "learning_rate": 1.9871493174531856e-06, + "loss": 1.1094, + "step": 9312 + }, + { + "epoch": 0.24, + "learning_rate": 1.9871448953207247e-06, + "loss": 0.9697, + "step": 9313 + }, + { + "epoch": 0.24, + "learning_rate": 1.987140472432452e-06, + "loss": 0.7871, + "step": 9314 + }, + { + "epoch": 0.24, + "learning_rate": 1.987136048788372e-06, + "loss": 0.9033, + "step": 9315 + }, + { + "epoch": 0.24, + "learning_rate": 1.987131624388487e-06, + "loss": 1.0146, + "step": 9316 + }, + { + "epoch": 0.24, + "learning_rate": 1.9871271992328003e-06, + "loss": 1.166, + "step": 9317 + }, + { + "epoch": 0.24, + "learning_rate": 1.987122773321316e-06, + "loss": 0.8799, + "step": 9318 + }, + { + "epoch": 0.24, + "learning_rate": 1.987118346654037e-06, + "loss": 0.832, + "step": 9319 + }, + { + "epoch": 0.24, + "learning_rate": 1.987113919230967e-06, + "loss": 0.6704, + "step": 9320 + }, + { + "epoch": 0.24, + "learning_rate": 1.9871094910521093e-06, + "loss": 1.2793, + "step": 9321 + }, + { + "epoch": 0.24, + "learning_rate": 1.9871050621174673e-06, + "loss": 1.0957, + "step": 9322 + }, + { + "epoch": 0.24, + "learning_rate": 1.9871006324270437e-06, + "loss": 0.8252, + "step": 9323 + }, + { + "epoch": 0.24, + "learning_rate": 1.987096201980843e-06, + "loss": 0.8174, + "step": 9324 + }, + { + "epoch": 0.24, + "learning_rate": 1.9870917707788684e-06, + "loss": 1.2246, + "step": 9325 + }, + { + "epoch": 0.24, + "learning_rate": 1.987087338821123e-06, + "loss": 0.9785, + "step": 9326 + }, + { + "epoch": 0.24, + "learning_rate": 1.98708290610761e-06, + "loss": 0.75, + "step": 9327 + }, + { + "epoch": 0.24, + "learning_rate": 1.987078472638333e-06, + "loss": 0.9092, + "step": 9328 + }, + { + "epoch": 0.24, + "learning_rate": 1.9870740384132954e-06, + "loss": 0.9053, + "step": 9329 + }, + { + "epoch": 0.24, + "learning_rate": 1.987069603432501e-06, + "loss": 1.0098, + "step": 9330 + }, + { + "epoch": 0.24, + "learning_rate": 1.987065167695952e-06, + "loss": 0.8613, + "step": 9331 + }, + { + "epoch": 0.24, + "learning_rate": 1.987060731203653e-06, + "loss": 0.9404, + "step": 9332 + }, + { + "epoch": 0.24, + "learning_rate": 1.987056293955607e-06, + "loss": 0.9707, + "step": 9333 + }, + { + "epoch": 0.24, + "learning_rate": 1.9870518559518176e-06, + "loss": 0.8223, + "step": 9334 + }, + { + "epoch": 0.24, + "learning_rate": 1.9870474171922876e-06, + "loss": 0.9766, + "step": 9335 + }, + { + "epoch": 0.24, + "learning_rate": 1.987042977677021e-06, + "loss": 0.8154, + "step": 9336 + }, + { + "epoch": 0.24, + "learning_rate": 1.987038537406021e-06, + "loss": 0.8447, + "step": 9337 + }, + { + "epoch": 0.24, + "learning_rate": 1.9870340963792906e-06, + "loss": 0.8418, + "step": 9338 + }, + { + "epoch": 0.24, + "learning_rate": 1.9870296545968342e-06, + "loss": 0.9268, + "step": 9339 + }, + { + "epoch": 0.24, + "learning_rate": 1.9870252120586542e-06, + "loss": 0.9404, + "step": 9340 + }, + { + "epoch": 0.24, + "learning_rate": 1.987020768764754e-06, + "loss": 1.0303, + "step": 9341 + }, + { + "epoch": 0.24, + "learning_rate": 1.9870163247151378e-06, + "loss": 1.0381, + "step": 9342 + }, + { + "epoch": 0.24, + "learning_rate": 1.987011879909809e-06, + "loss": 0.8018, + "step": 9343 + }, + { + "epoch": 0.24, + "learning_rate": 1.98700743434877e-06, + "loss": 0.8672, + "step": 9344 + }, + { + "epoch": 0.24, + "learning_rate": 1.987002988032025e-06, + "loss": 0.8066, + "step": 9345 + }, + { + "epoch": 0.24, + "learning_rate": 1.986998540959577e-06, + "loss": 0.8408, + "step": 9346 + }, + { + "epoch": 0.24, + "learning_rate": 1.9869940931314297e-06, + "loss": 1.1885, + "step": 9347 + }, + { + "epoch": 0.24, + "learning_rate": 1.986989644547587e-06, + "loss": 1.1172, + "step": 9348 + }, + { + "epoch": 0.24, + "learning_rate": 1.9869851952080507e-06, + "loss": 1.1416, + "step": 9349 + }, + { + "epoch": 0.24, + "learning_rate": 1.986980745112826e-06, + "loss": 1.2637, + "step": 9350 + }, + { + "epoch": 0.24, + "learning_rate": 1.986976294261915e-06, + "loss": 1.1592, + "step": 9351 + }, + { + "epoch": 0.24, + "learning_rate": 1.9869718426553218e-06, + "loss": 0.9277, + "step": 9352 + }, + { + "epoch": 0.24, + "learning_rate": 1.9869673902930495e-06, + "loss": 1.1191, + "step": 9353 + }, + { + "epoch": 0.24, + "learning_rate": 1.986962937175102e-06, + "loss": 0.5625, + "step": 9354 + }, + { + "epoch": 0.24, + "learning_rate": 1.9869584833014824e-06, + "loss": 0.9355, + "step": 9355 + }, + { + "epoch": 0.24, + "learning_rate": 1.986954028672194e-06, + "loss": 0.7939, + "step": 9356 + }, + { + "epoch": 0.24, + "learning_rate": 1.98694957328724e-06, + "loss": 0.9551, + "step": 9357 + }, + { + "epoch": 0.24, + "learning_rate": 1.9869451171466244e-06, + "loss": 1.084, + "step": 9358 + }, + { + "epoch": 0.24, + "learning_rate": 1.98694066025035e-06, + "loss": 1.0234, + "step": 9359 + }, + { + "epoch": 0.24, + "learning_rate": 1.9869362025984205e-06, + "loss": 0.6665, + "step": 9360 + }, + { + "epoch": 0.24, + "learning_rate": 1.98693174419084e-06, + "loss": 0.8535, + "step": 9361 + }, + { + "epoch": 0.24, + "learning_rate": 1.9869272850276105e-06, + "loss": 0.8193, + "step": 9362 + }, + { + "epoch": 0.24, + "learning_rate": 1.9869228251087363e-06, + "loss": 0.9844, + "step": 9363 + }, + { + "epoch": 0.24, + "learning_rate": 1.986918364434221e-06, + "loss": 1.0059, + "step": 9364 + }, + { + "epoch": 0.24, + "learning_rate": 1.986913903004067e-06, + "loss": 0.9834, + "step": 9365 + }, + { + "epoch": 0.24, + "learning_rate": 1.986909440818279e-06, + "loss": 1.0332, + "step": 9366 + }, + { + "epoch": 0.24, + "learning_rate": 1.9869049778768597e-06, + "loss": 0.8799, + "step": 9367 + }, + { + "epoch": 0.24, + "learning_rate": 1.9869005141798128e-06, + "loss": 0.9756, + "step": 9368 + }, + { + "epoch": 0.24, + "learning_rate": 1.9868960497271413e-06, + "loss": 1.0527, + "step": 9369 + }, + { + "epoch": 0.24, + "learning_rate": 1.986891584518849e-06, + "loss": 0.8906, + "step": 9370 + }, + { + "epoch": 0.24, + "learning_rate": 1.986887118554939e-06, + "loss": 1.0176, + "step": 9371 + }, + { + "epoch": 0.24, + "learning_rate": 1.9868826518354153e-06, + "loss": 0.9458, + "step": 9372 + }, + { + "epoch": 0.24, + "learning_rate": 1.986878184360281e-06, + "loss": 0.96, + "step": 9373 + }, + { + "epoch": 0.24, + "learning_rate": 1.986873716129539e-06, + "loss": 0.7852, + "step": 9374 + }, + { + "epoch": 0.24, + "learning_rate": 1.986869247143193e-06, + "loss": 1.0645, + "step": 9375 + }, + { + "epoch": 0.24, + "learning_rate": 1.986864777401247e-06, + "loss": 0.7744, + "step": 9376 + }, + { + "epoch": 0.24, + "learning_rate": 1.986860306903704e-06, + "loss": 0.9883, + "step": 9377 + }, + { + "epoch": 0.24, + "learning_rate": 1.9868558356505674e-06, + "loss": 0.9473, + "step": 9378 + }, + { + "epoch": 0.24, + "learning_rate": 1.9868513636418408e-06, + "loss": 0.7764, + "step": 9379 + }, + { + "epoch": 0.24, + "learning_rate": 1.9868468908775272e-06, + "loss": 0.8057, + "step": 9380 + }, + { + "epoch": 0.24, + "learning_rate": 1.9868424173576302e-06, + "loss": 0.8643, + "step": 9381 + }, + { + "epoch": 0.24, + "learning_rate": 1.9868379430821536e-06, + "loss": 1.0352, + "step": 9382 + }, + { + "epoch": 0.24, + "learning_rate": 1.9868334680511007e-06, + "loss": 0.916, + "step": 9383 + }, + { + "epoch": 0.24, + "learning_rate": 1.9868289922644745e-06, + "loss": 1.0547, + "step": 9384 + }, + { + "epoch": 0.24, + "learning_rate": 1.986824515722279e-06, + "loss": 0.7979, + "step": 9385 + }, + { + "epoch": 0.24, + "learning_rate": 1.986820038424517e-06, + "loss": 0.958, + "step": 9386 + }, + { + "epoch": 0.24, + "learning_rate": 1.9868155603711926e-06, + "loss": 0.9297, + "step": 9387 + }, + { + "epoch": 0.24, + "learning_rate": 1.986811081562309e-06, + "loss": 0.8633, + "step": 9388 + }, + { + "epoch": 0.24, + "learning_rate": 1.986806601997869e-06, + "loss": 1.0117, + "step": 9389 + }, + { + "epoch": 0.24, + "learning_rate": 1.986802121677877e-06, + "loss": 0.9678, + "step": 9390 + }, + { + "epoch": 0.24, + "learning_rate": 1.986797640602336e-06, + "loss": 0.7827, + "step": 9391 + }, + { + "epoch": 0.24, + "learning_rate": 1.986793158771249e-06, + "loss": 0.959, + "step": 9392 + }, + { + "epoch": 0.24, + "learning_rate": 1.98678867618462e-06, + "loss": 1.0352, + "step": 9393 + }, + { + "epoch": 0.24, + "learning_rate": 1.9867841928424526e-06, + "loss": 0.9404, + "step": 9394 + }, + { + "epoch": 0.24, + "learning_rate": 1.9867797087447498e-06, + "loss": 0.9092, + "step": 9395 + }, + { + "epoch": 0.24, + "learning_rate": 1.9867752238915147e-06, + "loss": 0.9482, + "step": 9396 + }, + { + "epoch": 0.24, + "learning_rate": 1.9867707382827516e-06, + "loss": 0.8096, + "step": 9397 + }, + { + "epoch": 0.24, + "learning_rate": 1.9867662519184635e-06, + "loss": 0.9863, + "step": 9398 + }, + { + "epoch": 0.24, + "learning_rate": 1.986761764798654e-06, + "loss": 0.8135, + "step": 9399 + }, + { + "epoch": 0.24, + "learning_rate": 1.9867572769233263e-06, + "loss": 0.8486, + "step": 9400 + }, + { + "epoch": 0.24, + "learning_rate": 1.986752788292484e-06, + "loss": 0.9209, + "step": 9401 + }, + { + "epoch": 0.24, + "learning_rate": 1.98674829890613e-06, + "loss": 0.9502, + "step": 9402 + }, + { + "epoch": 0.24, + "learning_rate": 1.9867438087642686e-06, + "loss": 0.8838, + "step": 9403 + }, + { + "epoch": 0.24, + "learning_rate": 1.9867393178669024e-06, + "loss": 0.9668, + "step": 9404 + }, + { + "epoch": 0.24, + "learning_rate": 1.986734826214036e-06, + "loss": 1.1484, + "step": 9405 + }, + { + "epoch": 0.24, + "learning_rate": 1.9867303338056717e-06, + "loss": 1.0195, + "step": 9406 + }, + { + "epoch": 0.24, + "learning_rate": 1.986725840641813e-06, + "loss": 0.9463, + "step": 9407 + }, + { + "epoch": 0.24, + "learning_rate": 1.986721346722464e-06, + "loss": 1.0439, + "step": 9408 + }, + { + "epoch": 0.24, + "learning_rate": 1.9867168520476284e-06, + "loss": 0.876, + "step": 9409 + }, + { + "epoch": 0.24, + "learning_rate": 1.986712356617308e-06, + "loss": 0.9463, + "step": 9410 + }, + { + "epoch": 0.24, + "learning_rate": 1.9867078604315083e-06, + "loss": 0.9785, + "step": 9411 + }, + { + "epoch": 0.24, + "learning_rate": 1.9867033634902313e-06, + "loss": 1.0635, + "step": 9412 + }, + { + "epoch": 0.24, + "learning_rate": 1.986698865793481e-06, + "loss": 0.9131, + "step": 9413 + }, + { + "epoch": 0.24, + "learning_rate": 1.9866943673412607e-06, + "loss": 0.8428, + "step": 9414 + }, + { + "epoch": 0.24, + "learning_rate": 1.9866898681335738e-06, + "loss": 0.8467, + "step": 9415 + }, + { + "epoch": 0.24, + "learning_rate": 1.986685368170424e-06, + "loss": 0.9004, + "step": 9416 + }, + { + "epoch": 0.24, + "learning_rate": 1.9866808674518147e-06, + "loss": 0.9014, + "step": 9417 + }, + { + "epoch": 0.24, + "learning_rate": 1.986676365977749e-06, + "loss": 1.1855, + "step": 9418 + }, + { + "epoch": 0.24, + "learning_rate": 1.9866718637482304e-06, + "loss": 0.8496, + "step": 9419 + }, + { + "epoch": 0.24, + "learning_rate": 1.986667360763263e-06, + "loss": 0.8994, + "step": 9420 + }, + { + "epoch": 0.24, + "learning_rate": 1.9866628570228494e-06, + "loss": 0.7085, + "step": 9421 + }, + { + "epoch": 0.24, + "learning_rate": 1.9866583525269935e-06, + "loss": 0.8643, + "step": 9422 + }, + { + "epoch": 0.24, + "learning_rate": 1.986653847275699e-06, + "loss": 1.0352, + "step": 9423 + }, + { + "epoch": 0.24, + "learning_rate": 1.9866493412689684e-06, + "loss": 0.833, + "step": 9424 + }, + { + "epoch": 0.24, + "learning_rate": 1.9866448345068065e-06, + "loss": 1.0312, + "step": 9425 + }, + { + "epoch": 0.24, + "learning_rate": 1.986640326989215e-06, + "loss": 0.9072, + "step": 9426 + }, + { + "epoch": 0.24, + "learning_rate": 1.9866358187161993e-06, + "loss": 0.833, + "step": 9427 + }, + { + "epoch": 0.24, + "learning_rate": 1.9866313096877617e-06, + "loss": 1.1279, + "step": 9428 + }, + { + "epoch": 0.24, + "learning_rate": 1.9866267999039058e-06, + "loss": 0.9961, + "step": 9429 + }, + { + "epoch": 0.24, + "learning_rate": 1.986622289364635e-06, + "loss": 1.0146, + "step": 9430 + }, + { + "epoch": 0.24, + "learning_rate": 1.9866177780699527e-06, + "loss": 0.9297, + "step": 9431 + }, + { + "epoch": 0.24, + "learning_rate": 1.986613266019863e-06, + "loss": 0.8823, + "step": 9432 + }, + { + "epoch": 0.24, + "learning_rate": 1.986608753214369e-06, + "loss": 0.771, + "step": 9433 + }, + { + "epoch": 0.24, + "learning_rate": 1.9866042396534736e-06, + "loss": 0.7119, + "step": 9434 + }, + { + "epoch": 0.24, + "learning_rate": 1.986599725337181e-06, + "loss": 0.7178, + "step": 9435 + }, + { + "epoch": 0.24, + "learning_rate": 1.986595210265494e-06, + "loss": 0.9395, + "step": 9436 + }, + { + "epoch": 0.24, + "learning_rate": 1.9865906944384167e-06, + "loss": 0.7607, + "step": 9437 + }, + { + "epoch": 0.24, + "learning_rate": 1.986586177855952e-06, + "loss": 1.0088, + "step": 9438 + }, + { + "epoch": 0.24, + "learning_rate": 1.986581660518104e-06, + "loss": 0.9766, + "step": 9439 + }, + { + "epoch": 0.24, + "learning_rate": 1.9865771424248756e-06, + "loss": 0.897, + "step": 9440 + }, + { + "epoch": 0.24, + "learning_rate": 1.9865726235762705e-06, + "loss": 1.0654, + "step": 9441 + }, + { + "epoch": 0.24, + "learning_rate": 1.9865681039722915e-06, + "loss": 0.9521, + "step": 9442 + }, + { + "epoch": 0.24, + "learning_rate": 1.9865635836129434e-06, + "loss": 0.9092, + "step": 9443 + }, + { + "epoch": 0.24, + "learning_rate": 1.9865590624982287e-06, + "loss": 1.0947, + "step": 9444 + }, + { + "epoch": 0.24, + "learning_rate": 1.9865545406281516e-06, + "loss": 0.876, + "step": 9445 + }, + { + "epoch": 0.24, + "learning_rate": 1.9865500180027142e-06, + "loss": 0.8052, + "step": 9446 + }, + { + "epoch": 0.24, + "learning_rate": 1.9865454946219213e-06, + "loss": 0.8525, + "step": 9447 + }, + { + "epoch": 0.24, + "learning_rate": 1.9865409704857756e-06, + "loss": 1.0068, + "step": 9448 + }, + { + "epoch": 0.24, + "learning_rate": 1.986536445594281e-06, + "loss": 0.7773, + "step": 9449 + }, + { + "epoch": 0.24, + "learning_rate": 1.986531919947441e-06, + "loss": 0.7542, + "step": 9450 + }, + { + "epoch": 0.24, + "learning_rate": 1.9865273935452585e-06, + "loss": 0.9346, + "step": 9451 + }, + { + "epoch": 0.24, + "learning_rate": 1.986522866387738e-06, + "loss": 0.8506, + "step": 9452 + }, + { + "epoch": 0.24, + "learning_rate": 1.9865183384748816e-06, + "loss": 0.9521, + "step": 9453 + }, + { + "epoch": 0.24, + "learning_rate": 1.9865138098066934e-06, + "loss": 0.9336, + "step": 9454 + }, + { + "epoch": 0.24, + "learning_rate": 1.9865092803831775e-06, + "loss": 0.8535, + "step": 9455 + }, + { + "epoch": 0.24, + "learning_rate": 1.9865047502043366e-06, + "loss": 1.0996, + "step": 9456 + }, + { + "epoch": 0.24, + "learning_rate": 1.9865002192701743e-06, + "loss": 0.916, + "step": 9457 + }, + { + "epoch": 0.24, + "learning_rate": 1.986495687580694e-06, + "loss": 1.001, + "step": 9458 + }, + { + "epoch": 0.24, + "learning_rate": 1.9864911551358994e-06, + "loss": 0.958, + "step": 9459 + }, + { + "epoch": 0.24, + "learning_rate": 1.986486621935794e-06, + "loss": 1.3447, + "step": 9460 + }, + { + "epoch": 0.24, + "learning_rate": 1.9864820879803812e-06, + "loss": 0.918, + "step": 9461 + }, + { + "epoch": 0.24, + "learning_rate": 1.986477553269664e-06, + "loss": 0.8623, + "step": 9462 + }, + { + "epoch": 0.24, + "learning_rate": 1.986473017803647e-06, + "loss": 0.8828, + "step": 9463 + }, + { + "epoch": 0.24, + "learning_rate": 1.9864684815823325e-06, + "loss": 1.084, + "step": 9464 + }, + { + "epoch": 0.24, + "learning_rate": 1.9864639446057247e-06, + "loss": 0.8242, + "step": 9465 + }, + { + "epoch": 0.24, + "learning_rate": 1.9864594068738266e-06, + "loss": 0.9658, + "step": 9466 + }, + { + "epoch": 0.24, + "learning_rate": 1.986454868386642e-06, + "loss": 1.1035, + "step": 9467 + }, + { + "epoch": 0.24, + "learning_rate": 1.986450329144174e-06, + "loss": 0.6523, + "step": 9468 + }, + { + "epoch": 0.24, + "learning_rate": 1.9864457891464267e-06, + "loss": 1.0381, + "step": 9469 + }, + { + "epoch": 0.24, + "learning_rate": 1.986441248393403e-06, + "loss": 0.7769, + "step": 9470 + }, + { + "epoch": 0.24, + "learning_rate": 1.9864367068851068e-06, + "loss": 0.957, + "step": 9471 + }, + { + "epoch": 0.24, + "learning_rate": 1.986432164621541e-06, + "loss": 1.1064, + "step": 9472 + }, + { + "epoch": 0.24, + "learning_rate": 1.9864276216027096e-06, + "loss": 0.8657, + "step": 9473 + }, + { + "epoch": 0.24, + "learning_rate": 1.9864230778286162e-06, + "loss": 0.7979, + "step": 9474 + }, + { + "epoch": 0.24, + "learning_rate": 1.986418533299264e-06, + "loss": 0.8359, + "step": 9475 + }, + { + "epoch": 0.24, + "learning_rate": 1.986413988014656e-06, + "loss": 1.1172, + "step": 9476 + }, + { + "epoch": 0.24, + "learning_rate": 1.9864094419747964e-06, + "loss": 0.8008, + "step": 9477 + }, + { + "epoch": 0.24, + "learning_rate": 1.986404895179689e-06, + "loss": 1.1816, + "step": 9478 + }, + { + "epoch": 0.24, + "learning_rate": 1.986400347629336e-06, + "loss": 1.0869, + "step": 9479 + }, + { + "epoch": 0.24, + "learning_rate": 1.9863957993237418e-06, + "loss": 0.6968, + "step": 9480 + }, + { + "epoch": 0.24, + "learning_rate": 1.9863912502629097e-06, + "loss": 1.1426, + "step": 9481 + }, + { + "epoch": 0.24, + "learning_rate": 1.986386700446843e-06, + "loss": 1.0332, + "step": 9482 + }, + { + "epoch": 0.24, + "learning_rate": 1.986382149875546e-06, + "loss": 0.8643, + "step": 9483 + }, + { + "epoch": 0.24, + "learning_rate": 1.986377598549021e-06, + "loss": 0.9072, + "step": 9484 + }, + { + "epoch": 0.24, + "learning_rate": 1.986373046467272e-06, + "loss": 0.7617, + "step": 9485 + }, + { + "epoch": 0.24, + "learning_rate": 1.9863684936303027e-06, + "loss": 0.9658, + "step": 9486 + }, + { + "epoch": 0.24, + "learning_rate": 1.9863639400381163e-06, + "loss": 0.9258, + "step": 9487 + }, + { + "epoch": 0.24, + "learning_rate": 1.9863593856907165e-06, + "loss": 0.6582, + "step": 9488 + }, + { + "epoch": 0.24, + "learning_rate": 1.9863548305881064e-06, + "loss": 0.958, + "step": 9489 + }, + { + "epoch": 0.24, + "learning_rate": 1.98635027473029e-06, + "loss": 1.0557, + "step": 9490 + }, + { + "epoch": 0.24, + "learning_rate": 1.986345718117271e-06, + "loss": 0.7773, + "step": 9491 + }, + { + "epoch": 0.24, + "learning_rate": 1.9863411607490517e-06, + "loss": 0.9756, + "step": 9492 + }, + { + "epoch": 0.24, + "learning_rate": 1.9863366026256367e-06, + "loss": 0.9648, + "step": 9493 + }, + { + "epoch": 0.24, + "learning_rate": 1.986332043747029e-06, + "loss": 0.8945, + "step": 9494 + }, + { + "epoch": 0.24, + "learning_rate": 1.986327484113232e-06, + "loss": 0.8037, + "step": 9495 + }, + { + "epoch": 0.24, + "learning_rate": 1.9863229237242498e-06, + "loss": 0.8877, + "step": 9496 + }, + { + "epoch": 0.24, + "learning_rate": 1.9863183625800853e-06, + "loss": 0.9443, + "step": 9497 + }, + { + "epoch": 0.24, + "learning_rate": 1.986313800680742e-06, + "loss": 0.834, + "step": 9498 + }, + { + "epoch": 0.24, + "learning_rate": 1.986309238026224e-06, + "loss": 0.8896, + "step": 9499 + }, + { + "epoch": 0.24, + "learning_rate": 1.986304674616534e-06, + "loss": 1.0518, + "step": 9500 + }, + { + "epoch": 0.24, + "learning_rate": 1.9863001104516758e-06, + "loss": 1.0762, + "step": 9501 + }, + { + "epoch": 0.24, + "learning_rate": 1.986295545531653e-06, + "loss": 0.9766, + "step": 9502 + }, + { + "epoch": 0.24, + "learning_rate": 1.9862909798564697e-06, + "loss": 0.8706, + "step": 9503 + }, + { + "epoch": 0.24, + "learning_rate": 1.986286413426128e-06, + "loss": 0.9062, + "step": 9504 + }, + { + "epoch": 0.24, + "learning_rate": 1.9862818462406327e-06, + "loss": 1.0205, + "step": 9505 + }, + { + "epoch": 0.24, + "learning_rate": 1.9862772782999863e-06, + "loss": 0.8096, + "step": 9506 + }, + { + "epoch": 0.24, + "learning_rate": 1.9862727096041928e-06, + "loss": 0.9854, + "step": 9507 + }, + { + "epoch": 0.24, + "learning_rate": 1.9862681401532554e-06, + "loss": 0.6694, + "step": 9508 + }, + { + "epoch": 0.24, + "learning_rate": 1.9862635699471783e-06, + "loss": 0.9053, + "step": 9509 + }, + { + "epoch": 0.24, + "learning_rate": 1.986258998985964e-06, + "loss": 0.9658, + "step": 9510 + }, + { + "epoch": 0.24, + "learning_rate": 1.9862544272696173e-06, + "loss": 1.0303, + "step": 9511 + }, + { + "epoch": 0.24, + "learning_rate": 1.9862498547981404e-06, + "loss": 0.8574, + "step": 9512 + }, + { + "epoch": 0.24, + "learning_rate": 1.9862452815715376e-06, + "loss": 0.9102, + "step": 9513 + }, + { + "epoch": 0.24, + "learning_rate": 1.986240707589812e-06, + "loss": 0.7461, + "step": 9514 + }, + { + "epoch": 0.24, + "learning_rate": 1.986236132852967e-06, + "loss": 0.8594, + "step": 9515 + }, + { + "epoch": 0.24, + "learning_rate": 1.986231557361007e-06, + "loss": 0.9492, + "step": 9516 + }, + { + "epoch": 0.24, + "learning_rate": 1.9862269811139345e-06, + "loss": 0.8682, + "step": 9517 + }, + { + "epoch": 0.24, + "learning_rate": 1.986222404111753e-06, + "loss": 0.8799, + "step": 9518 + }, + { + "epoch": 0.24, + "learning_rate": 1.986217826354467e-06, + "loss": 0.9199, + "step": 9519 + }, + { + "epoch": 0.24, + "learning_rate": 1.9862132478420787e-06, + "loss": 1.0293, + "step": 9520 + }, + { + "epoch": 0.24, + "learning_rate": 1.9862086685745927e-06, + "loss": 0.5576, + "step": 9521 + }, + { + "epoch": 0.24, + "learning_rate": 1.9862040885520115e-06, + "loss": 0.7969, + "step": 9522 + }, + { + "epoch": 0.24, + "learning_rate": 1.98619950777434e-06, + "loss": 0.8999, + "step": 9523 + }, + { + "epoch": 0.24, + "learning_rate": 1.9861949262415803e-06, + "loss": 0.7305, + "step": 9524 + }, + { + "epoch": 0.24, + "learning_rate": 1.9861903439537366e-06, + "loss": 0.8223, + "step": 9525 + }, + { + "epoch": 0.24, + "learning_rate": 1.9861857609108126e-06, + "loss": 0.5046, + "step": 9526 + }, + { + "epoch": 0.24, + "learning_rate": 1.986181177112811e-06, + "loss": 1.001, + "step": 9527 + }, + { + "epoch": 0.24, + "learning_rate": 1.9861765925597362e-06, + "loss": 0.8135, + "step": 9528 + }, + { + "epoch": 0.24, + "learning_rate": 1.9861720072515916e-06, + "loss": 0.9463, + "step": 9529 + }, + { + "epoch": 0.24, + "learning_rate": 1.9861674211883797e-06, + "loss": 1.0742, + "step": 9530 + }, + { + "epoch": 0.24, + "learning_rate": 1.9861628343701053e-06, + "loss": 1.084, + "step": 9531 + }, + { + "epoch": 0.24, + "learning_rate": 1.986158246796771e-06, + "loss": 0.7549, + "step": 9532 + }, + { + "epoch": 0.24, + "learning_rate": 1.986153658468381e-06, + "loss": 0.834, + "step": 9533 + }, + { + "epoch": 0.24, + "learning_rate": 1.9861490693849383e-06, + "loss": 1.0527, + "step": 9534 + }, + { + "epoch": 0.24, + "learning_rate": 1.986144479546447e-06, + "loss": 0.8828, + "step": 9535 + }, + { + "epoch": 0.24, + "learning_rate": 1.9861398889529097e-06, + "loss": 1.0449, + "step": 9536 + }, + { + "epoch": 0.24, + "learning_rate": 1.9861352976043304e-06, + "loss": 0.9863, + "step": 9537 + }, + { + "epoch": 0.24, + "learning_rate": 1.986130705500713e-06, + "loss": 0.9492, + "step": 9538 + }, + { + "epoch": 0.24, + "learning_rate": 1.9861261126420605e-06, + "loss": 0.7227, + "step": 9539 + }, + { + "epoch": 0.24, + "learning_rate": 1.9861215190283766e-06, + "loss": 0.7803, + "step": 9540 + }, + { + "epoch": 0.24, + "learning_rate": 1.986116924659665e-06, + "loss": 1.0527, + "step": 9541 + }, + { + "epoch": 0.24, + "learning_rate": 1.9861123295359284e-06, + "loss": 0.6318, + "step": 9542 + }, + { + "epoch": 0.24, + "learning_rate": 1.9861077336571713e-06, + "loss": 1.125, + "step": 9543 + }, + { + "epoch": 0.24, + "learning_rate": 1.986103137023397e-06, + "loss": 0.8438, + "step": 9544 + }, + { + "epoch": 0.24, + "learning_rate": 1.9860985396346088e-06, + "loss": 0.8887, + "step": 9545 + }, + { + "epoch": 0.24, + "learning_rate": 1.98609394149081e-06, + "loss": 0.7842, + "step": 9546 + }, + { + "epoch": 0.24, + "learning_rate": 1.986089342592005e-06, + "loss": 0.8398, + "step": 9547 + }, + { + "epoch": 0.24, + "learning_rate": 1.986084742938196e-06, + "loss": 0.8464, + "step": 9548 + }, + { + "epoch": 0.24, + "learning_rate": 1.986080142529388e-06, + "loss": 0.834, + "step": 9549 + }, + { + "epoch": 0.24, + "learning_rate": 1.9860755413655833e-06, + "loss": 0.9043, + "step": 9550 + }, + { + "epoch": 0.24, + "learning_rate": 1.9860709394467862e-06, + "loss": 0.9629, + "step": 9551 + }, + { + "epoch": 0.24, + "learning_rate": 1.9860663367729995e-06, + "loss": 0.8809, + "step": 9552 + }, + { + "epoch": 0.24, + "learning_rate": 1.9860617333442273e-06, + "loss": 0.9609, + "step": 9553 + }, + { + "epoch": 0.24, + "learning_rate": 1.986057129160473e-06, + "loss": 0.8076, + "step": 9554 + }, + { + "epoch": 0.24, + "learning_rate": 1.98605252422174e-06, + "loss": 0.8018, + "step": 9555 + }, + { + "epoch": 0.24, + "learning_rate": 1.9860479185280324e-06, + "loss": 1.1982, + "step": 9556 + }, + { + "epoch": 0.24, + "learning_rate": 1.986043312079353e-06, + "loss": 0.8643, + "step": 9557 + }, + { + "epoch": 0.24, + "learning_rate": 1.9860387048757054e-06, + "loss": 0.8301, + "step": 9558 + }, + { + "epoch": 0.25, + "learning_rate": 1.9860340969170933e-06, + "loss": 0.8965, + "step": 9559 + }, + { + "epoch": 0.25, + "learning_rate": 1.9860294882035204e-06, + "loss": 0.8525, + "step": 9560 + }, + { + "epoch": 0.25, + "learning_rate": 1.98602487873499e-06, + "loss": 0.9307, + "step": 9561 + }, + { + "epoch": 0.25, + "learning_rate": 1.986020268511506e-06, + "loss": 1.001, + "step": 9562 + }, + { + "epoch": 0.25, + "learning_rate": 1.986015657533071e-06, + "loss": 1.043, + "step": 9563 + }, + { + "epoch": 0.25, + "learning_rate": 1.9860110457996896e-06, + "loss": 0.8364, + "step": 9564 + }, + { + "epoch": 0.25, + "learning_rate": 1.9860064333113647e-06, + "loss": 0.6614, + "step": 9565 + }, + { + "epoch": 0.25, + "learning_rate": 1.9860018200680997e-06, + "loss": 0.6748, + "step": 9566 + }, + { + "epoch": 0.25, + "learning_rate": 1.9859972060698992e-06, + "loss": 0.9717, + "step": 9567 + }, + { + "epoch": 0.25, + "learning_rate": 1.9859925913167654e-06, + "loss": 1.0039, + "step": 9568 + }, + { + "epoch": 0.25, + "learning_rate": 1.9859879758087024e-06, + "loss": 0.8643, + "step": 9569 + }, + { + "epoch": 0.25, + "learning_rate": 1.985983359545714e-06, + "loss": 0.8281, + "step": 9570 + }, + { + "epoch": 0.25, + "learning_rate": 1.9859787425278035e-06, + "loss": 1.0693, + "step": 9571 + }, + { + "epoch": 0.25, + "learning_rate": 1.9859741247549743e-06, + "loss": 0.9316, + "step": 9572 + }, + { + "epoch": 0.25, + "learning_rate": 1.98596950622723e-06, + "loss": 1.042, + "step": 9573 + }, + { + "epoch": 0.25, + "learning_rate": 1.9859648869445743e-06, + "loss": 0.8643, + "step": 9574 + }, + { + "epoch": 0.25, + "learning_rate": 1.9859602669070107e-06, + "loss": 0.9854, + "step": 9575 + }, + { + "epoch": 0.25, + "learning_rate": 1.9859556461145425e-06, + "loss": 1.0586, + "step": 9576 + }, + { + "epoch": 0.25, + "learning_rate": 1.985951024567173e-06, + "loss": 0.71, + "step": 9577 + }, + { + "epoch": 0.25, + "learning_rate": 1.985946402264907e-06, + "loss": 1.082, + "step": 9578 + }, + { + "epoch": 0.25, + "learning_rate": 1.9859417792077462e-06, + "loss": 0.7676, + "step": 9579 + }, + { + "epoch": 0.25, + "learning_rate": 1.985937155395696e-06, + "loss": 0.8564, + "step": 9580 + }, + { + "epoch": 0.25, + "learning_rate": 1.9859325308287586e-06, + "loss": 1.0146, + "step": 9581 + }, + { + "epoch": 0.25, + "learning_rate": 1.985927905506938e-06, + "loss": 0.7969, + "step": 9582 + }, + { + "epoch": 0.25, + "learning_rate": 1.985923279430238e-06, + "loss": 0.9229, + "step": 9583 + }, + { + "epoch": 0.25, + "learning_rate": 1.9859186525986615e-06, + "loss": 0.9482, + "step": 9584 + }, + { + "epoch": 0.25, + "learning_rate": 1.985914025012213e-06, + "loss": 0.9492, + "step": 9585 + }, + { + "epoch": 0.25, + "learning_rate": 1.9859093966708947e-06, + "loss": 0.8682, + "step": 9586 + }, + { + "epoch": 0.25, + "learning_rate": 1.9859047675747114e-06, + "loss": 1.0166, + "step": 9587 + }, + { + "epoch": 0.25, + "learning_rate": 1.9859001377236663e-06, + "loss": 0.9375, + "step": 9588 + }, + { + "epoch": 0.25, + "learning_rate": 1.9858955071177624e-06, + "loss": 0.8154, + "step": 9589 + }, + { + "epoch": 0.25, + "learning_rate": 1.9858908757570035e-06, + "loss": 0.8848, + "step": 9590 + }, + { + "epoch": 0.25, + "learning_rate": 1.9858862436413938e-06, + "loss": 0.7988, + "step": 9591 + }, + { + "epoch": 0.25, + "learning_rate": 1.985881610770936e-06, + "loss": 1.0029, + "step": 9592 + }, + { + "epoch": 0.25, + "learning_rate": 1.9858769771456343e-06, + "loss": 0.8975, + "step": 9593 + }, + { + "epoch": 0.25, + "learning_rate": 1.9858723427654914e-06, + "loss": 1.1973, + "step": 9594 + }, + { + "epoch": 0.25, + "learning_rate": 1.985867707630512e-06, + "loss": 1.0625, + "step": 9595 + }, + { + "epoch": 0.25, + "learning_rate": 1.985863071740699e-06, + "loss": 0.9756, + "step": 9596 + }, + { + "epoch": 0.25, + "learning_rate": 1.9858584350960552e-06, + "loss": 1.0254, + "step": 9597 + }, + { + "epoch": 0.25, + "learning_rate": 1.985853797696586e-06, + "loss": 0.6426, + "step": 9598 + }, + { + "epoch": 0.25, + "learning_rate": 1.985849159542293e-06, + "loss": 0.8682, + "step": 9599 + }, + { + "epoch": 0.25, + "learning_rate": 1.985844520633181e-06, + "loss": 0.8406, + "step": 9600 + }, + { + "epoch": 0.25, + "learning_rate": 1.985839880969253e-06, + "loss": 1.0967, + "step": 9601 + }, + { + "epoch": 0.25, + "learning_rate": 1.985835240550513e-06, + "loss": 0.7356, + "step": 9602 + }, + { + "epoch": 0.25, + "learning_rate": 1.985830599376964e-06, + "loss": 0.998, + "step": 9603 + }, + { + "epoch": 0.25, + "learning_rate": 1.98582595744861e-06, + "loss": 0.916, + "step": 9604 + }, + { + "epoch": 0.25, + "learning_rate": 1.9858213147654545e-06, + "loss": 0.6084, + "step": 9605 + }, + { + "epoch": 0.25, + "learning_rate": 1.9858166713275008e-06, + "loss": 0.877, + "step": 9606 + }, + { + "epoch": 0.25, + "learning_rate": 1.9858120271347526e-06, + "loss": 0.6006, + "step": 9607 + }, + { + "epoch": 0.25, + "learning_rate": 1.9858073821872133e-06, + "loss": 0.8916, + "step": 9608 + }, + { + "epoch": 0.25, + "learning_rate": 1.985802736484887e-06, + "loss": 0.9492, + "step": 9609 + }, + { + "epoch": 0.25, + "learning_rate": 1.9857980900277765e-06, + "loss": 1.0117, + "step": 9610 + }, + { + "epoch": 0.25, + "learning_rate": 1.985793442815886e-06, + "loss": 1.0732, + "step": 9611 + }, + { + "epoch": 0.25, + "learning_rate": 1.9857887948492186e-06, + "loss": 0.7246, + "step": 9612 + }, + { + "epoch": 0.25, + "learning_rate": 1.9857841461277783e-06, + "loss": 0.8633, + "step": 9613 + }, + { + "epoch": 0.25, + "learning_rate": 1.985779496651568e-06, + "loss": 0.5659, + "step": 9614 + }, + { + "epoch": 0.25, + "learning_rate": 1.9857748464205922e-06, + "loss": 1.1445, + "step": 9615 + }, + { + "epoch": 0.25, + "learning_rate": 1.9857701954348537e-06, + "loss": 0.9707, + "step": 9616 + }, + { + "epoch": 0.25, + "learning_rate": 1.9857655436943563e-06, + "loss": 1.0244, + "step": 9617 + }, + { + "epoch": 0.25, + "learning_rate": 1.9857608911991034e-06, + "loss": 1.0088, + "step": 9618 + }, + { + "epoch": 0.25, + "learning_rate": 1.985756237949099e-06, + "loss": 0.7681, + "step": 9619 + }, + { + "epoch": 0.25, + "learning_rate": 1.985751583944346e-06, + "loss": 0.9092, + "step": 9620 + }, + { + "epoch": 0.25, + "learning_rate": 1.9857469291848486e-06, + "loss": 0.8877, + "step": 9621 + }, + { + "epoch": 0.25, + "learning_rate": 1.9857422736706098e-06, + "loss": 0.8682, + "step": 9622 + }, + { + "epoch": 0.25, + "learning_rate": 1.9857376174016337e-06, + "loss": 1.0859, + "step": 9623 + }, + { + "epoch": 0.25, + "learning_rate": 1.9857329603779237e-06, + "loss": 0.9009, + "step": 9624 + }, + { + "epoch": 0.25, + "learning_rate": 1.985728302599483e-06, + "loss": 0.8047, + "step": 9625 + }, + { + "epoch": 0.25, + "learning_rate": 1.985723644066316e-06, + "loss": 0.7139, + "step": 9626 + }, + { + "epoch": 0.25, + "learning_rate": 1.985718984778425e-06, + "loss": 0.9805, + "step": 9627 + }, + { + "epoch": 0.25, + "learning_rate": 1.985714324735815e-06, + "loss": 1.0615, + "step": 9628 + }, + { + "epoch": 0.25, + "learning_rate": 1.9857096639384887e-06, + "loss": 0.9688, + "step": 9629 + }, + { + "epoch": 0.25, + "learning_rate": 1.9857050023864495e-06, + "loss": 0.915, + "step": 9630 + }, + { + "epoch": 0.25, + "learning_rate": 1.985700340079702e-06, + "loss": 0.8564, + "step": 9631 + }, + { + "epoch": 0.25, + "learning_rate": 1.9856956770182483e-06, + "loss": 0.8047, + "step": 9632 + }, + { + "epoch": 0.25, + "learning_rate": 1.985691013202093e-06, + "loss": 0.7314, + "step": 9633 + }, + { + "epoch": 0.25, + "learning_rate": 1.9856863486312394e-06, + "loss": 0.96, + "step": 9634 + }, + { + "epoch": 0.25, + "learning_rate": 1.9856816833056913e-06, + "loss": 0.9736, + "step": 9635 + }, + { + "epoch": 0.25, + "learning_rate": 1.9856770172254516e-06, + "loss": 0.7871, + "step": 9636 + }, + { + "epoch": 0.25, + "learning_rate": 1.9856723503905247e-06, + "loss": 0.8242, + "step": 9637 + }, + { + "epoch": 0.25, + "learning_rate": 1.985667682800914e-06, + "loss": 0.9375, + "step": 9638 + }, + { + "epoch": 0.25, + "learning_rate": 1.985663014456622e-06, + "loss": 0.8945, + "step": 9639 + }, + { + "epoch": 0.25, + "learning_rate": 1.985658345357654e-06, + "loss": 0.9287, + "step": 9640 + }, + { + "epoch": 0.25, + "learning_rate": 1.9856536755040126e-06, + "loss": 1.1426, + "step": 9641 + }, + { + "epoch": 0.25, + "learning_rate": 1.9856490048957013e-06, + "loss": 0.8623, + "step": 9642 + }, + { + "epoch": 0.25, + "learning_rate": 1.985644333532724e-06, + "loss": 0.7964, + "step": 9643 + }, + { + "epoch": 0.25, + "learning_rate": 1.985639661415084e-06, + "loss": 0.9922, + "step": 9644 + }, + { + "epoch": 0.25, + "learning_rate": 1.985634988542785e-06, + "loss": 0.8594, + "step": 9645 + }, + { + "epoch": 0.25, + "learning_rate": 1.9856303149158312e-06, + "loss": 0.8809, + "step": 9646 + }, + { + "epoch": 0.25, + "learning_rate": 1.985625640534225e-06, + "loss": 0.7393, + "step": 9647 + }, + { + "epoch": 0.25, + "learning_rate": 1.9856209653979706e-06, + "loss": 0.833, + "step": 9648 + }, + { + "epoch": 0.25, + "learning_rate": 1.9856162895070714e-06, + "loss": 1.0801, + "step": 9649 + }, + { + "epoch": 0.25, + "learning_rate": 1.9856116128615315e-06, + "loss": 0.8838, + "step": 9650 + }, + { + "epoch": 0.25, + "learning_rate": 1.9856069354613542e-06, + "loss": 0.959, + "step": 9651 + }, + { + "epoch": 0.25, + "learning_rate": 1.9856022573065426e-06, + "loss": 0.9111, + "step": 9652 + }, + { + "epoch": 0.25, + "learning_rate": 1.985597578397101e-06, + "loss": 0.8613, + "step": 9653 + }, + { + "epoch": 0.25, + "learning_rate": 1.9855928987330324e-06, + "loss": 0.9844, + "step": 9654 + }, + { + "epoch": 0.25, + "learning_rate": 1.9855882183143406e-06, + "loss": 0.8311, + "step": 9655 + }, + { + "epoch": 0.25, + "learning_rate": 1.9855835371410293e-06, + "loss": 0.9365, + "step": 9656 + }, + { + "epoch": 0.25, + "learning_rate": 1.9855788552131022e-06, + "loss": 0.9287, + "step": 9657 + }, + { + "epoch": 0.25, + "learning_rate": 1.985574172530563e-06, + "loss": 0.9238, + "step": 9658 + }, + { + "epoch": 0.25, + "learning_rate": 1.985569489093414e-06, + "loss": 0.688, + "step": 9659 + }, + { + "epoch": 0.25, + "learning_rate": 1.9855648049016605e-06, + "loss": 0.8535, + "step": 9660 + }, + { + "epoch": 0.25, + "learning_rate": 1.9855601199553053e-06, + "loss": 1.0059, + "step": 9661 + }, + { + "epoch": 0.25, + "learning_rate": 1.9855554342543517e-06, + "loss": 0.874, + "step": 9662 + }, + { + "epoch": 0.25, + "learning_rate": 1.9855507477988036e-06, + "loss": 0.7598, + "step": 9663 + }, + { + "epoch": 0.25, + "learning_rate": 1.985546060588665e-06, + "loss": 0.8413, + "step": 9664 + }, + { + "epoch": 0.25, + "learning_rate": 1.985541372623939e-06, + "loss": 0.7529, + "step": 9665 + }, + { + "epoch": 0.25, + "learning_rate": 1.985536683904629e-06, + "loss": 1.0127, + "step": 9666 + }, + { + "epoch": 0.25, + "learning_rate": 1.985531994430739e-06, + "loss": 0.9844, + "step": 9667 + }, + { + "epoch": 0.25, + "learning_rate": 1.9855273042022726e-06, + "loss": 0.8174, + "step": 9668 + }, + { + "epoch": 0.25, + "learning_rate": 1.985522613219233e-06, + "loss": 0.7163, + "step": 9669 + }, + { + "epoch": 0.25, + "learning_rate": 1.9855179214816246e-06, + "loss": 0.9805, + "step": 9670 + }, + { + "epoch": 0.25, + "learning_rate": 1.9855132289894497e-06, + "loss": 1.1084, + "step": 9671 + }, + { + "epoch": 0.25, + "learning_rate": 1.9855085357427132e-06, + "loss": 1.249, + "step": 9672 + }, + { + "epoch": 0.25, + "learning_rate": 1.985503841741418e-06, + "loss": 0.9375, + "step": 9673 + }, + { + "epoch": 0.25, + "learning_rate": 1.9854991469855677e-06, + "loss": 0.4714, + "step": 9674 + }, + { + "epoch": 0.25, + "learning_rate": 1.985494451475166e-06, + "loss": 0.7324, + "step": 9675 + }, + { + "epoch": 0.25, + "learning_rate": 1.9854897552102167e-06, + "loss": 1.0967, + "step": 9676 + }, + { + "epoch": 0.25, + "learning_rate": 1.985485058190723e-06, + "loss": 0.8623, + "step": 9677 + }, + { + "epoch": 0.25, + "learning_rate": 1.9854803604166888e-06, + "loss": 1.04, + "step": 9678 + }, + { + "epoch": 0.25, + "learning_rate": 1.985475661888118e-06, + "loss": 0.7583, + "step": 9679 + }, + { + "epoch": 0.25, + "learning_rate": 1.9854709626050134e-06, + "loss": 0.8486, + "step": 9680 + }, + { + "epoch": 0.25, + "learning_rate": 1.9854662625673788e-06, + "loss": 1.0801, + "step": 9681 + }, + { + "epoch": 0.25, + "learning_rate": 1.985461561775218e-06, + "loss": 0.9141, + "step": 9682 + }, + { + "epoch": 0.25, + "learning_rate": 1.9854568602285347e-06, + "loss": 0.7109, + "step": 9683 + }, + { + "epoch": 0.25, + "learning_rate": 1.985452157927333e-06, + "loss": 0.7915, + "step": 9684 + }, + { + "epoch": 0.25, + "learning_rate": 1.985447454871615e-06, + "loss": 0.582, + "step": 9685 + }, + { + "epoch": 0.25, + "learning_rate": 1.985442751061386e-06, + "loss": 0.7012, + "step": 9686 + }, + { + "epoch": 0.25, + "learning_rate": 1.985438046496648e-06, + "loss": 0.8345, + "step": 9687 + }, + { + "epoch": 0.25, + "learning_rate": 1.9854333411774058e-06, + "loss": 1.0732, + "step": 9688 + }, + { + "epoch": 0.25, + "learning_rate": 1.9854286351036627e-06, + "loss": 1.1338, + "step": 9689 + }, + { + "epoch": 0.25, + "learning_rate": 1.985423928275422e-06, + "loss": 0.9951, + "step": 9690 + }, + { + "epoch": 0.25, + "learning_rate": 1.9854192206926874e-06, + "loss": 0.8291, + "step": 9691 + }, + { + "epoch": 0.25, + "learning_rate": 1.9854145123554627e-06, + "loss": 0.9209, + "step": 9692 + }, + { + "epoch": 0.25, + "learning_rate": 1.985409803263752e-06, + "loss": 1.0361, + "step": 9693 + }, + { + "epoch": 0.25, + "learning_rate": 1.985405093417558e-06, + "loss": 0.7808, + "step": 9694 + }, + { + "epoch": 0.25, + "learning_rate": 1.985400382816884e-06, + "loss": 0.603, + "step": 9695 + }, + { + "epoch": 0.25, + "learning_rate": 1.9853956714617348e-06, + "loss": 0.7021, + "step": 9696 + }, + { + "epoch": 0.25, + "learning_rate": 1.9853909593521133e-06, + "loss": 0.8105, + "step": 9697 + }, + { + "epoch": 0.25, + "learning_rate": 1.9853862464880235e-06, + "loss": 0.9463, + "step": 9698 + }, + { + "epoch": 0.25, + "learning_rate": 1.9853815328694683e-06, + "loss": 0.8652, + "step": 9699 + }, + { + "epoch": 0.25, + "learning_rate": 1.9853768184964524e-06, + "loss": 1.0381, + "step": 9700 + }, + { + "epoch": 0.25, + "learning_rate": 1.9853721033689784e-06, + "loss": 1.0898, + "step": 9701 + }, + { + "epoch": 0.25, + "learning_rate": 1.9853673874870503e-06, + "loss": 1.043, + "step": 9702 + }, + { + "epoch": 0.25, + "learning_rate": 1.9853626708506718e-06, + "loss": 1.0254, + "step": 9703 + }, + { + "epoch": 0.25, + "learning_rate": 1.985357953459846e-06, + "loss": 0.9922, + "step": 9704 + }, + { + "epoch": 0.25, + "learning_rate": 1.9853532353145774e-06, + "loss": 1.082, + "step": 9705 + }, + { + "epoch": 0.25, + "learning_rate": 1.985348516414869e-06, + "loss": 0.96, + "step": 9706 + }, + { + "epoch": 0.25, + "learning_rate": 1.9853437967607244e-06, + "loss": 0.6548, + "step": 9707 + }, + { + "epoch": 0.25, + "learning_rate": 1.9853390763521478e-06, + "loss": 0.5996, + "step": 9708 + }, + { + "epoch": 0.25, + "learning_rate": 1.985334355189142e-06, + "loss": 1.085, + "step": 9709 + }, + { + "epoch": 0.25, + "learning_rate": 1.985329633271711e-06, + "loss": 0.873, + "step": 9710 + }, + { + "epoch": 0.25, + "learning_rate": 1.9853249105998584e-06, + "loss": 0.9082, + "step": 9711 + }, + { + "epoch": 0.25, + "learning_rate": 1.985320187173588e-06, + "loss": 0.832, + "step": 9712 + }, + { + "epoch": 0.25, + "learning_rate": 1.985315462992903e-06, + "loss": 1.1104, + "step": 9713 + }, + { + "epoch": 0.25, + "learning_rate": 1.9853107380578075e-06, + "loss": 0.9795, + "step": 9714 + }, + { + "epoch": 0.25, + "learning_rate": 1.9853060123683044e-06, + "loss": 1.0322, + "step": 9715 + }, + { + "epoch": 0.25, + "learning_rate": 1.9853012859243986e-06, + "loss": 0.7207, + "step": 9716 + }, + { + "epoch": 0.25, + "learning_rate": 1.985296558726092e-06, + "loss": 0.8252, + "step": 9717 + }, + { + "epoch": 0.25, + "learning_rate": 1.98529183077339e-06, + "loss": 0.9238, + "step": 9718 + }, + { + "epoch": 0.25, + "learning_rate": 1.985287102066295e-06, + "loss": 0.9189, + "step": 9719 + }, + { + "epoch": 0.25, + "learning_rate": 1.9852823726048106e-06, + "loss": 0.7373, + "step": 9720 + }, + { + "epoch": 0.25, + "learning_rate": 1.985277642388941e-06, + "loss": 0.8096, + "step": 9721 + }, + { + "epoch": 0.25, + "learning_rate": 1.98527291141869e-06, + "loss": 1.0371, + "step": 9722 + }, + { + "epoch": 0.25, + "learning_rate": 1.9852681796940607e-06, + "loss": 0.8125, + "step": 9723 + }, + { + "epoch": 0.25, + "learning_rate": 1.9852634472150565e-06, + "loss": 0.8833, + "step": 9724 + }, + { + "epoch": 0.25, + "learning_rate": 1.9852587139816815e-06, + "loss": 0.9033, + "step": 9725 + }, + { + "epoch": 0.25, + "learning_rate": 1.9852539799939393e-06, + "loss": 0.9404, + "step": 9726 + }, + { + "epoch": 0.25, + "learning_rate": 1.9852492452518334e-06, + "loss": 1.0742, + "step": 9727 + }, + { + "epoch": 0.25, + "learning_rate": 1.9852445097553675e-06, + "loss": 0.8647, + "step": 9728 + }, + { + "epoch": 0.25, + "learning_rate": 1.985239773504545e-06, + "loss": 0.9053, + "step": 9729 + }, + { + "epoch": 0.25, + "learning_rate": 1.98523503649937e-06, + "loss": 0.8779, + "step": 9730 + }, + { + "epoch": 0.25, + "learning_rate": 1.9852302987398457e-06, + "loss": 0.9795, + "step": 9731 + }, + { + "epoch": 0.25, + "learning_rate": 1.985225560225976e-06, + "loss": 0.6963, + "step": 9732 + }, + { + "epoch": 0.25, + "learning_rate": 1.9852208209577645e-06, + "loss": 0.8867, + "step": 9733 + }, + { + "epoch": 0.25, + "learning_rate": 1.985216080935214e-06, + "loss": 0.6108, + "step": 9734 + }, + { + "epoch": 0.25, + "learning_rate": 1.9852113401583296e-06, + "loss": 1.0225, + "step": 9735 + }, + { + "epoch": 0.25, + "learning_rate": 1.9852065986271136e-06, + "loss": 0.8633, + "step": 9736 + }, + { + "epoch": 0.25, + "learning_rate": 1.9852018563415707e-06, + "loss": 0.9414, + "step": 9737 + }, + { + "epoch": 0.25, + "learning_rate": 1.985197113301704e-06, + "loss": 0.7415, + "step": 9738 + }, + { + "epoch": 0.25, + "learning_rate": 1.985192369507517e-06, + "loss": 0.8999, + "step": 9739 + }, + { + "epoch": 0.25, + "learning_rate": 1.9851876249590137e-06, + "loss": 0.7119, + "step": 9740 + }, + { + "epoch": 0.25, + "learning_rate": 1.985182879656197e-06, + "loss": 0.9092, + "step": 9741 + }, + { + "epoch": 0.25, + "learning_rate": 1.9851781335990715e-06, + "loss": 1.0312, + "step": 9742 + }, + { + "epoch": 0.25, + "learning_rate": 1.98517338678764e-06, + "loss": 0.9473, + "step": 9743 + }, + { + "epoch": 0.25, + "learning_rate": 1.9851686392219073e-06, + "loss": 0.9297, + "step": 9744 + }, + { + "epoch": 0.25, + "learning_rate": 1.985163890901876e-06, + "loss": 0.9248, + "step": 9745 + }, + { + "epoch": 0.25, + "learning_rate": 1.9851591418275495e-06, + "loss": 0.7666, + "step": 9746 + }, + { + "epoch": 0.25, + "learning_rate": 1.9851543919989325e-06, + "loss": 0.7891, + "step": 9747 + }, + { + "epoch": 0.25, + "learning_rate": 1.9851496414160277e-06, + "loss": 0.8271, + "step": 9748 + }, + { + "epoch": 0.25, + "learning_rate": 1.9851448900788396e-06, + "loss": 0.9536, + "step": 9749 + }, + { + "epoch": 0.25, + "learning_rate": 1.9851401379873707e-06, + "loss": 0.7583, + "step": 9750 + }, + { + "epoch": 0.25, + "learning_rate": 1.985135385141626e-06, + "loss": 0.8311, + "step": 9751 + }, + { + "epoch": 0.25, + "learning_rate": 1.985130631541608e-06, + "loss": 1.0186, + "step": 9752 + }, + { + "epoch": 0.25, + "learning_rate": 1.985125877187321e-06, + "loss": 0.9414, + "step": 9753 + }, + { + "epoch": 0.25, + "learning_rate": 1.985121122078768e-06, + "loss": 0.9434, + "step": 9754 + }, + { + "epoch": 0.25, + "learning_rate": 1.9851163662159533e-06, + "loss": 0.7927, + "step": 9755 + }, + { + "epoch": 0.25, + "learning_rate": 1.9851116095988806e-06, + "loss": 0.8003, + "step": 9756 + }, + { + "epoch": 0.25, + "learning_rate": 1.9851068522275526e-06, + "loss": 1.1436, + "step": 9757 + }, + { + "epoch": 0.25, + "learning_rate": 1.985102094101974e-06, + "loss": 0.9053, + "step": 9758 + }, + { + "epoch": 0.25, + "learning_rate": 1.985097335222148e-06, + "loss": 0.9961, + "step": 9759 + }, + { + "epoch": 0.25, + "learning_rate": 1.985092575588078e-06, + "loss": 0.958, + "step": 9760 + }, + { + "epoch": 0.25, + "learning_rate": 1.9850878151997683e-06, + "loss": 0.7378, + "step": 9761 + }, + { + "epoch": 0.25, + "learning_rate": 1.985083054057222e-06, + "loss": 0.8799, + "step": 9762 + }, + { + "epoch": 0.25, + "learning_rate": 1.985078292160443e-06, + "loss": 1.0361, + "step": 9763 + }, + { + "epoch": 0.25, + "learning_rate": 1.9850735295094347e-06, + "loss": 0.876, + "step": 9764 + }, + { + "epoch": 0.25, + "learning_rate": 1.985068766104201e-06, + "loss": 0.9102, + "step": 9765 + }, + { + "epoch": 0.25, + "learning_rate": 1.985064001944745e-06, + "loss": 0.8892, + "step": 9766 + }, + { + "epoch": 0.25, + "learning_rate": 1.9850592370310714e-06, + "loss": 0.8213, + "step": 9767 + }, + { + "epoch": 0.25, + "learning_rate": 1.985054471363183e-06, + "loss": 0.957, + "step": 9768 + }, + { + "epoch": 0.25, + "learning_rate": 1.9850497049410836e-06, + "loss": 0.8486, + "step": 9769 + }, + { + "epoch": 0.25, + "learning_rate": 1.985044937764777e-06, + "loss": 0.8643, + "step": 9770 + }, + { + "epoch": 0.25, + "learning_rate": 1.985040169834267e-06, + "loss": 0.8237, + "step": 9771 + }, + { + "epoch": 0.25, + "learning_rate": 1.985035401149557e-06, + "loss": 1.0322, + "step": 9772 + }, + { + "epoch": 0.25, + "learning_rate": 1.9850306317106504e-06, + "loss": 1.1445, + "step": 9773 + }, + { + "epoch": 0.25, + "learning_rate": 1.985025861517551e-06, + "loss": 0.7529, + "step": 9774 + }, + { + "epoch": 0.25, + "learning_rate": 1.985021090570263e-06, + "loss": 0.9736, + "step": 9775 + }, + { + "epoch": 0.25, + "learning_rate": 1.9850163188687896e-06, + "loss": 0.9531, + "step": 9776 + }, + { + "epoch": 0.25, + "learning_rate": 1.985011546413134e-06, + "loss": 0.9146, + "step": 9777 + }, + { + "epoch": 0.25, + "learning_rate": 1.985006773203301e-06, + "loss": 1.0605, + "step": 9778 + }, + { + "epoch": 0.25, + "learning_rate": 1.9850019992392934e-06, + "loss": 0.9575, + "step": 9779 + }, + { + "epoch": 0.25, + "learning_rate": 1.9849972245211147e-06, + "loss": 1.0605, + "step": 9780 + }, + { + "epoch": 0.25, + "learning_rate": 1.9849924490487693e-06, + "loss": 0.9365, + "step": 9781 + }, + { + "epoch": 0.25, + "learning_rate": 1.9849876728222604e-06, + "loss": 1.0625, + "step": 9782 + }, + { + "epoch": 0.25, + "learning_rate": 1.984982895841592e-06, + "loss": 0.8525, + "step": 9783 + }, + { + "epoch": 0.25, + "learning_rate": 1.984978118106767e-06, + "loss": 1.0088, + "step": 9784 + }, + { + "epoch": 0.25, + "learning_rate": 1.98497333961779e-06, + "loss": 1.0801, + "step": 9785 + }, + { + "epoch": 0.25, + "learning_rate": 1.9849685603746638e-06, + "loss": 0.9453, + "step": 9786 + }, + { + "epoch": 0.25, + "learning_rate": 1.9849637803773925e-06, + "loss": 0.8103, + "step": 9787 + }, + { + "epoch": 0.25, + "learning_rate": 1.98495899962598e-06, + "loss": 0.5916, + "step": 9788 + }, + { + "epoch": 0.25, + "learning_rate": 1.9849542181204292e-06, + "loss": 0.9414, + "step": 9789 + }, + { + "epoch": 0.25, + "learning_rate": 1.984949435860745e-06, + "loss": 0.707, + "step": 9790 + }, + { + "epoch": 0.25, + "learning_rate": 1.9849446528469296e-06, + "loss": 0.9756, + "step": 9791 + }, + { + "epoch": 0.25, + "learning_rate": 1.984939869078988e-06, + "loss": 1.0195, + "step": 9792 + }, + { + "epoch": 0.25, + "learning_rate": 1.9849350845569225e-06, + "loss": 1.0107, + "step": 9793 + }, + { + "epoch": 0.25, + "learning_rate": 1.984930299280738e-06, + "loss": 0.8623, + "step": 9794 + }, + { + "epoch": 0.25, + "learning_rate": 1.9849255132504375e-06, + "loss": 0.9805, + "step": 9795 + }, + { + "epoch": 0.25, + "learning_rate": 1.9849207264660247e-06, + "loss": 0.9883, + "step": 9796 + }, + { + "epoch": 0.25, + "learning_rate": 1.9849159389275035e-06, + "loss": 0.998, + "step": 9797 + }, + { + "epoch": 0.25, + "learning_rate": 1.9849111506348777e-06, + "loss": 0.877, + "step": 9798 + }, + { + "epoch": 0.25, + "learning_rate": 1.9849063615881504e-06, + "loss": 0.8237, + "step": 9799 + }, + { + "epoch": 0.25, + "learning_rate": 1.9849015717873257e-06, + "loss": 0.9873, + "step": 9800 + }, + { + "epoch": 0.25, + "learning_rate": 1.9848967812324075e-06, + "loss": 1.1543, + "step": 9801 + }, + { + "epoch": 0.25, + "learning_rate": 1.9848919899233984e-06, + "loss": 0.9316, + "step": 9802 + }, + { + "epoch": 0.25, + "learning_rate": 1.9848871978603033e-06, + "loss": 0.8936, + "step": 9803 + }, + { + "epoch": 0.25, + "learning_rate": 1.9848824050431253e-06, + "loss": 0.9717, + "step": 9804 + }, + { + "epoch": 0.25, + "learning_rate": 1.984877611471868e-06, + "loss": 0.9038, + "step": 9805 + }, + { + "epoch": 0.25, + "learning_rate": 1.9848728171465352e-06, + "loss": 1.123, + "step": 9806 + }, + { + "epoch": 0.25, + "learning_rate": 1.984868022067131e-06, + "loss": 0.9482, + "step": 9807 + }, + { + "epoch": 0.25, + "learning_rate": 1.984863226233658e-06, + "loss": 1.0381, + "step": 9808 + }, + { + "epoch": 0.25, + "learning_rate": 1.9848584296461207e-06, + "loss": 1.0801, + "step": 9809 + }, + { + "epoch": 0.25, + "learning_rate": 1.9848536323045225e-06, + "loss": 1.0166, + "step": 9810 + }, + { + "epoch": 0.25, + "learning_rate": 1.9848488342088677e-06, + "loss": 0.6909, + "step": 9811 + }, + { + "epoch": 0.25, + "learning_rate": 1.9848440353591587e-06, + "loss": 0.8545, + "step": 9812 + }, + { + "epoch": 0.25, + "learning_rate": 1.9848392357554007e-06, + "loss": 0.9434, + "step": 9813 + }, + { + "epoch": 0.25, + "learning_rate": 1.9848344353975957e-06, + "loss": 0.9893, + "step": 9814 + }, + { + "epoch": 0.25, + "learning_rate": 1.984829634285749e-06, + "loss": 0.8105, + "step": 9815 + }, + { + "epoch": 0.25, + "learning_rate": 1.984824832419863e-06, + "loss": 1.1211, + "step": 9816 + }, + { + "epoch": 0.25, + "learning_rate": 1.9848200297999423e-06, + "loss": 0.9678, + "step": 9817 + }, + { + "epoch": 0.25, + "learning_rate": 1.9848152264259902e-06, + "loss": 0.624, + "step": 9818 + }, + { + "epoch": 0.25, + "learning_rate": 1.98481042229801e-06, + "loss": 1.2012, + "step": 9819 + }, + { + "epoch": 0.25, + "learning_rate": 1.984805617416006e-06, + "loss": 1.0557, + "step": 9820 + }, + { + "epoch": 0.25, + "learning_rate": 1.9848008117799815e-06, + "loss": 0.9922, + "step": 9821 + }, + { + "epoch": 0.25, + "learning_rate": 1.9847960053899404e-06, + "loss": 0.7622, + "step": 9822 + }, + { + "epoch": 0.25, + "learning_rate": 1.984791198245886e-06, + "loss": 0.7114, + "step": 9823 + }, + { + "epoch": 0.25, + "learning_rate": 1.9847863903478227e-06, + "loss": 0.9189, + "step": 9824 + }, + { + "epoch": 0.25, + "learning_rate": 1.9847815816957537e-06, + "loss": 1.001, + "step": 9825 + }, + { + "epoch": 0.25, + "learning_rate": 1.9847767722896824e-06, + "loss": 0.9404, + "step": 9826 + }, + { + "epoch": 0.25, + "learning_rate": 1.984771962129613e-06, + "loss": 1.0, + "step": 9827 + }, + { + "epoch": 0.25, + "learning_rate": 1.9847671512155487e-06, + "loss": 0.8779, + "step": 9828 + }, + { + "epoch": 0.25, + "learning_rate": 1.984762339547494e-06, + "loss": 1.0088, + "step": 9829 + }, + { + "epoch": 0.25, + "learning_rate": 1.9847575271254517e-06, + "loss": 0.873, + "step": 9830 + }, + { + "epoch": 0.25, + "learning_rate": 1.984752713949426e-06, + "loss": 0.8706, + "step": 9831 + }, + { + "epoch": 0.25, + "learning_rate": 1.9847479000194203e-06, + "loss": 1.0234, + "step": 9832 + }, + { + "epoch": 0.25, + "learning_rate": 1.9847430853354387e-06, + "loss": 0.4941, + "step": 9833 + }, + { + "epoch": 0.25, + "learning_rate": 1.984738269897484e-06, + "loss": 1.0977, + "step": 9834 + }, + { + "epoch": 0.25, + "learning_rate": 1.984733453705561e-06, + "loss": 0.9902, + "step": 9835 + }, + { + "epoch": 0.25, + "learning_rate": 1.984728636759673e-06, + "loss": 0.9219, + "step": 9836 + }, + { + "epoch": 0.25, + "learning_rate": 1.984723819059823e-06, + "loss": 1.1699, + "step": 9837 + }, + { + "epoch": 0.25, + "learning_rate": 1.9847190006060154e-06, + "loss": 0.7988, + "step": 9838 + }, + { + "epoch": 0.25, + "learning_rate": 1.984714181398254e-06, + "loss": 1.0137, + "step": 9839 + }, + { + "epoch": 0.25, + "learning_rate": 1.984709361436542e-06, + "loss": 0.8281, + "step": 9840 + }, + { + "epoch": 0.25, + "learning_rate": 1.9847045407208837e-06, + "loss": 0.8633, + "step": 9841 + }, + { + "epoch": 0.25, + "learning_rate": 1.984699719251282e-06, + "loss": 0.9893, + "step": 9842 + }, + { + "epoch": 0.25, + "learning_rate": 1.984694897027741e-06, + "loss": 0.833, + "step": 9843 + }, + { + "epoch": 0.25, + "learning_rate": 1.9846900740502647e-06, + "loss": 1.1484, + "step": 9844 + }, + { + "epoch": 0.25, + "learning_rate": 1.9846852503188565e-06, + "loss": 0.8975, + "step": 9845 + }, + { + "epoch": 0.25, + "learning_rate": 1.9846804258335197e-06, + "loss": 0.751, + "step": 9846 + }, + { + "epoch": 0.25, + "learning_rate": 1.9846756005942587e-06, + "loss": 0.9287, + "step": 9847 + }, + { + "epoch": 0.25, + "learning_rate": 1.9846707746010765e-06, + "loss": 0.9336, + "step": 9848 + }, + { + "epoch": 0.25, + "learning_rate": 1.9846659478539774e-06, + "loss": 0.8882, + "step": 9849 + }, + { + "epoch": 0.25, + "learning_rate": 1.9846611203529652e-06, + "loss": 1.1914, + "step": 9850 + }, + { + "epoch": 0.25, + "learning_rate": 1.984656292098043e-06, + "loss": 0.8647, + "step": 9851 + }, + { + "epoch": 0.25, + "learning_rate": 1.984651463089214e-06, + "loss": 0.9824, + "step": 9852 + }, + { + "epoch": 0.25, + "learning_rate": 1.984646633326484e-06, + "loss": 0.9219, + "step": 9853 + }, + { + "epoch": 0.25, + "learning_rate": 1.9846418028098544e-06, + "loss": 1.0986, + "step": 9854 + }, + { + "epoch": 0.25, + "learning_rate": 1.9846369715393304e-06, + "loss": 1.0557, + "step": 9855 + }, + { + "epoch": 0.25, + "learning_rate": 1.9846321395149145e-06, + "loss": 0.9697, + "step": 9856 + }, + { + "epoch": 0.25, + "learning_rate": 1.984627306736612e-06, + "loss": 0.8945, + "step": 9857 + }, + { + "epoch": 0.25, + "learning_rate": 1.9846224732044247e-06, + "loss": 0.96, + "step": 9858 + }, + { + "epoch": 0.25, + "learning_rate": 1.9846176389183576e-06, + "loss": 1.0977, + "step": 9859 + }, + { + "epoch": 0.25, + "learning_rate": 1.9846128038784142e-06, + "loss": 0.9355, + "step": 9860 + }, + { + "epoch": 0.25, + "learning_rate": 1.9846079680845975e-06, + "loss": 0.9941, + "step": 9861 + }, + { + "epoch": 0.25, + "learning_rate": 1.9846031315369126e-06, + "loss": 1.1016, + "step": 9862 + }, + { + "epoch": 0.25, + "learning_rate": 1.984598294235362e-06, + "loss": 0.9463, + "step": 9863 + }, + { + "epoch": 0.25, + "learning_rate": 1.9845934561799496e-06, + "loss": 0.7002, + "step": 9864 + }, + { + "epoch": 0.25, + "learning_rate": 1.984588617370679e-06, + "loss": 1.0166, + "step": 9865 + }, + { + "epoch": 0.25, + "learning_rate": 1.984583777807555e-06, + "loss": 1.0801, + "step": 9866 + }, + { + "epoch": 0.25, + "learning_rate": 1.9845789374905796e-06, + "loss": 0.8809, + "step": 9867 + }, + { + "epoch": 0.25, + "learning_rate": 1.984574096419758e-06, + "loss": 0.7832, + "step": 9868 + }, + { + "epoch": 0.25, + "learning_rate": 1.984569254595093e-06, + "loss": 1.041, + "step": 9869 + }, + { + "epoch": 0.25, + "learning_rate": 1.9845644120165884e-06, + "loss": 0.9443, + "step": 9870 + }, + { + "epoch": 0.25, + "learning_rate": 1.9845595686842484e-06, + "loss": 0.7676, + "step": 9871 + }, + { + "epoch": 0.25, + "learning_rate": 1.9845547245980765e-06, + "loss": 0.9189, + "step": 9872 + }, + { + "epoch": 0.25, + "learning_rate": 1.984549879758076e-06, + "loss": 1.0371, + "step": 9873 + }, + { + "epoch": 0.25, + "learning_rate": 1.984545034164251e-06, + "loss": 0.874, + "step": 9874 + }, + { + "epoch": 0.25, + "learning_rate": 1.9845401878166054e-06, + "loss": 1.041, + "step": 9875 + }, + { + "epoch": 0.25, + "learning_rate": 1.9845353407151424e-06, + "loss": 1.001, + "step": 9876 + }, + { + "epoch": 0.25, + "learning_rate": 1.9845304928598662e-06, + "loss": 0.8955, + "step": 9877 + }, + { + "epoch": 0.25, + "learning_rate": 1.98452564425078e-06, + "loss": 1.0068, + "step": 9878 + }, + { + "epoch": 0.25, + "learning_rate": 1.984520794887888e-06, + "loss": 0.9658, + "step": 9879 + }, + { + "epoch": 0.25, + "learning_rate": 1.9845159447711935e-06, + "loss": 0.9038, + "step": 9880 + }, + { + "epoch": 0.25, + "learning_rate": 1.9845110939007007e-06, + "loss": 0.8945, + "step": 9881 + }, + { + "epoch": 0.25, + "learning_rate": 1.984506242276413e-06, + "loss": 1.0693, + "step": 9882 + }, + { + "epoch": 0.25, + "learning_rate": 1.984501389898334e-06, + "loss": 0.7183, + "step": 9883 + }, + { + "epoch": 0.25, + "learning_rate": 1.9844965367664674e-06, + "loss": 1.1465, + "step": 9884 + }, + { + "epoch": 0.25, + "learning_rate": 1.9844916828808168e-06, + "loss": 0.832, + "step": 9885 + }, + { + "epoch": 0.25, + "learning_rate": 1.984486828241387e-06, + "loss": 0.6868, + "step": 9886 + }, + { + "epoch": 0.25, + "learning_rate": 1.9844819728481803e-06, + "loss": 0.9111, + "step": 9887 + }, + { + "epoch": 0.25, + "learning_rate": 1.984477116701201e-06, + "loss": 0.666, + "step": 9888 + }, + { + "epoch": 0.25, + "learning_rate": 1.9844722598004534e-06, + "loss": 0.7856, + "step": 9889 + }, + { + "epoch": 0.25, + "learning_rate": 1.9844674021459403e-06, + "loss": 0.9961, + "step": 9890 + }, + { + "epoch": 0.25, + "learning_rate": 1.9844625437376657e-06, + "loss": 0.8652, + "step": 9891 + }, + { + "epoch": 0.25, + "learning_rate": 1.9844576845756335e-06, + "loss": 0.8203, + "step": 9892 + }, + { + "epoch": 0.25, + "learning_rate": 1.984452824659847e-06, + "loss": 0.8398, + "step": 9893 + }, + { + "epoch": 0.25, + "learning_rate": 1.9844479639903107e-06, + "loss": 0.7646, + "step": 9894 + }, + { + "epoch": 0.25, + "learning_rate": 1.984443102567028e-06, + "loss": 0.9233, + "step": 9895 + }, + { + "epoch": 0.25, + "learning_rate": 1.984438240390002e-06, + "loss": 0.9814, + "step": 9896 + }, + { + "epoch": 0.25, + "learning_rate": 1.984433377459237e-06, + "loss": 0.8887, + "step": 9897 + }, + { + "epoch": 0.25, + "learning_rate": 1.9844285137747366e-06, + "loss": 0.7207, + "step": 9898 + }, + { + "epoch": 0.25, + "learning_rate": 1.984423649336505e-06, + "loss": 1.041, + "step": 9899 + }, + { + "epoch": 0.25, + "learning_rate": 1.984418784144545e-06, + "loss": 0.7065, + "step": 9900 + }, + { + "epoch": 0.25, + "learning_rate": 1.9844139181988608e-06, + "loss": 1.0391, + "step": 9901 + }, + { + "epoch": 0.25, + "learning_rate": 1.9844090514994563e-06, + "loss": 0.6558, + "step": 9902 + }, + { + "epoch": 0.25, + "learning_rate": 1.984404184046335e-06, + "loss": 0.9619, + "step": 9903 + }, + { + "epoch": 0.25, + "learning_rate": 1.984399315839501e-06, + "loss": 0.916, + "step": 9904 + }, + { + "epoch": 0.25, + "learning_rate": 1.984394446878957e-06, + "loss": 0.9746, + "step": 9905 + }, + { + "epoch": 0.25, + "learning_rate": 1.9843895771647083e-06, + "loss": 0.9404, + "step": 9906 + }, + { + "epoch": 0.25, + "learning_rate": 1.984384706696757e-06, + "loss": 0.936, + "step": 9907 + }, + { + "epoch": 0.25, + "learning_rate": 1.984379835475108e-06, + "loss": 0.8428, + "step": 9908 + }, + { + "epoch": 0.25, + "learning_rate": 1.9843749634997646e-06, + "loss": 0.8828, + "step": 9909 + }, + { + "epoch": 0.25, + "learning_rate": 1.9843700907707302e-06, + "loss": 0.8838, + "step": 9910 + }, + { + "epoch": 0.25, + "learning_rate": 1.9843652172880093e-06, + "loss": 0.7754, + "step": 9911 + }, + { + "epoch": 0.25, + "learning_rate": 1.9843603430516053e-06, + "loss": 0.8662, + "step": 9912 + }, + { + "epoch": 0.25, + "learning_rate": 1.9843554680615215e-06, + "loss": 0.8857, + "step": 9913 + }, + { + "epoch": 0.25, + "learning_rate": 1.984350592317762e-06, + "loss": 0.8843, + "step": 9914 + }, + { + "epoch": 0.25, + "learning_rate": 1.9843457158203308e-06, + "loss": 0.7432, + "step": 9915 + }, + { + "epoch": 0.25, + "learning_rate": 1.984340838569231e-06, + "loss": 1.1094, + "step": 9916 + }, + { + "epoch": 0.25, + "learning_rate": 1.9843359605644668e-06, + "loss": 0.9766, + "step": 9917 + }, + { + "epoch": 0.25, + "learning_rate": 1.984331081806042e-06, + "loss": 0.9668, + "step": 9918 + }, + { + "epoch": 0.25, + "learning_rate": 1.98432620229396e-06, + "loss": 0.8799, + "step": 9919 + }, + { + "epoch": 0.25, + "learning_rate": 1.9843213220282247e-06, + "loss": 0.7783, + "step": 9920 + }, + { + "epoch": 0.25, + "learning_rate": 1.9843164410088397e-06, + "loss": 1.1426, + "step": 9921 + }, + { + "epoch": 0.25, + "learning_rate": 1.984311559235809e-06, + "loss": 0.8047, + "step": 9922 + }, + { + "epoch": 0.25, + "learning_rate": 1.9843066767091363e-06, + "loss": 0.9482, + "step": 9923 + }, + { + "epoch": 0.25, + "learning_rate": 1.984301793428825e-06, + "loss": 0.9424, + "step": 9924 + }, + { + "epoch": 0.25, + "learning_rate": 1.9842969093948795e-06, + "loss": 0.8071, + "step": 9925 + }, + { + "epoch": 0.25, + "learning_rate": 1.984292024607303e-06, + "loss": 0.8279, + "step": 9926 + }, + { + "epoch": 0.25, + "learning_rate": 1.984287139066099e-06, + "loss": 0.917, + "step": 9927 + }, + { + "epoch": 0.25, + "learning_rate": 1.9842822527712716e-06, + "loss": 1.0234, + "step": 9928 + }, + { + "epoch": 0.25, + "learning_rate": 1.9842773657228246e-06, + "loss": 0.9404, + "step": 9929 + }, + { + "epoch": 0.25, + "learning_rate": 1.984272477920762e-06, + "loss": 0.9551, + "step": 9930 + }, + { + "epoch": 0.25, + "learning_rate": 1.9842675893650867e-06, + "loss": 0.9648, + "step": 9931 + }, + { + "epoch": 0.25, + "learning_rate": 1.9842627000558034e-06, + "loss": 0.9717, + "step": 9932 + }, + { + "epoch": 0.25, + "learning_rate": 1.9842578099929153e-06, + "loss": 0.96, + "step": 9933 + }, + { + "epoch": 0.25, + "learning_rate": 1.984252919176426e-06, + "loss": 0.8604, + "step": 9934 + }, + { + "epoch": 0.25, + "learning_rate": 1.98424802760634e-06, + "loss": 0.8145, + "step": 9935 + }, + { + "epoch": 0.25, + "learning_rate": 1.9842431352826603e-06, + "loss": 0.8604, + "step": 9936 + }, + { + "epoch": 0.25, + "learning_rate": 1.9842382422053907e-06, + "loss": 1.0244, + "step": 9937 + }, + { + "epoch": 0.25, + "learning_rate": 1.9842333483745354e-06, + "loss": 0.8262, + "step": 9938 + }, + { + "epoch": 0.25, + "learning_rate": 1.9842284537900977e-06, + "loss": 0.8721, + "step": 9939 + }, + { + "epoch": 0.25, + "learning_rate": 1.9842235584520815e-06, + "loss": 0.6067, + "step": 9940 + }, + { + "epoch": 0.25, + "learning_rate": 1.984218662360491e-06, + "loss": 0.9639, + "step": 9941 + }, + { + "epoch": 0.25, + "learning_rate": 1.984213765515329e-06, + "loss": 1.0078, + "step": 9942 + }, + { + "epoch": 0.25, + "learning_rate": 1.9842088679166e-06, + "loss": 1.0107, + "step": 9943 + }, + { + "epoch": 0.25, + "learning_rate": 1.984203969564307e-06, + "loss": 1.0469, + "step": 9944 + }, + { + "epoch": 0.25, + "learning_rate": 1.984199070458455e-06, + "loss": 0.7285, + "step": 9945 + }, + { + "epoch": 0.25, + "learning_rate": 1.9841941705990473e-06, + "loss": 0.9336, + "step": 9946 + }, + { + "epoch": 0.25, + "learning_rate": 1.984189269986087e-06, + "loss": 1.0244, + "step": 9947 + }, + { + "epoch": 0.25, + "learning_rate": 1.984184368619578e-06, + "loss": 0.918, + "step": 9948 + }, + { + "epoch": 0.25, + "learning_rate": 1.984179466499524e-06, + "loss": 0.9043, + "step": 9949 + }, + { + "epoch": 0.26, + "learning_rate": 1.9841745636259295e-06, + "loss": 0.6816, + "step": 9950 + }, + { + "epoch": 0.26, + "learning_rate": 1.9841696599987977e-06, + "loss": 0.7852, + "step": 9951 + }, + { + "epoch": 0.26, + "learning_rate": 1.9841647556181326e-06, + "loss": 0.9639, + "step": 9952 + }, + { + "epoch": 0.26, + "learning_rate": 1.9841598504839377e-06, + "loss": 0.9248, + "step": 9953 + }, + { + "epoch": 0.26, + "learning_rate": 1.9841549445962168e-06, + "loss": 0.96, + "step": 9954 + }, + { + "epoch": 0.26, + "learning_rate": 1.9841500379549737e-06, + "loss": 0.8345, + "step": 9955 + }, + { + "epoch": 0.26, + "learning_rate": 1.984145130560212e-06, + "loss": 0.9121, + "step": 9956 + }, + { + "epoch": 0.26, + "learning_rate": 1.984140222411936e-06, + "loss": 0.9717, + "step": 9957 + }, + { + "epoch": 0.26, + "learning_rate": 1.984135313510149e-06, + "loss": 0.9082, + "step": 9958 + }, + { + "epoch": 0.26, + "learning_rate": 1.984130403854855e-06, + "loss": 1.0498, + "step": 9959 + }, + { + "epoch": 0.26, + "learning_rate": 1.984125493446057e-06, + "loss": 0.8691, + "step": 9960 + }, + { + "epoch": 0.26, + "learning_rate": 1.98412058228376e-06, + "loss": 0.9126, + "step": 9961 + }, + { + "epoch": 0.26, + "learning_rate": 1.984115670367967e-06, + "loss": 0.9102, + "step": 9962 + }, + { + "epoch": 0.26, + "learning_rate": 1.984110757698681e-06, + "loss": 0.917, + "step": 9963 + }, + { + "epoch": 0.26, + "learning_rate": 1.9841058442759077e-06, + "loss": 0.8867, + "step": 9964 + }, + { + "epoch": 0.26, + "learning_rate": 1.9841009300996496e-06, + "loss": 0.7539, + "step": 9965 + }, + { + "epoch": 0.26, + "learning_rate": 1.984096015169911e-06, + "loss": 0.6943, + "step": 9966 + }, + { + "epoch": 0.26, + "learning_rate": 1.9840910994866943e-06, + "loss": 1.0908, + "step": 9967 + }, + { + "epoch": 0.26, + "learning_rate": 1.9840861830500047e-06, + "loss": 0.834, + "step": 9968 + }, + { + "epoch": 0.26, + "learning_rate": 1.984081265859846e-06, + "loss": 0.6274, + "step": 9969 + }, + { + "epoch": 0.26, + "learning_rate": 1.984076347916221e-06, + "loss": 0.9307, + "step": 9970 + }, + { + "epoch": 0.26, + "learning_rate": 1.9840714292191344e-06, + "loss": 1.0996, + "step": 9971 + }, + { + "epoch": 0.26, + "learning_rate": 1.9840665097685894e-06, + "loss": 0.8945, + "step": 9972 + }, + { + "epoch": 0.26, + "learning_rate": 1.98406158956459e-06, + "loss": 0.7686, + "step": 9973 + }, + { + "epoch": 0.26, + "learning_rate": 1.98405666860714e-06, + "loss": 1.1143, + "step": 9974 + }, + { + "epoch": 0.26, + "learning_rate": 1.9840517468962425e-06, + "loss": 1.1055, + "step": 9975 + }, + { + "epoch": 0.26, + "learning_rate": 1.9840468244319025e-06, + "loss": 1.1602, + "step": 9976 + }, + { + "epoch": 0.26, + "learning_rate": 1.9840419012141226e-06, + "loss": 1.0293, + "step": 9977 + }, + { + "epoch": 0.26, + "learning_rate": 1.984036977242907e-06, + "loss": 0.8281, + "step": 9978 + }, + { + "epoch": 0.26, + "learning_rate": 1.98403205251826e-06, + "loss": 0.7861, + "step": 9979 + }, + { + "epoch": 0.26, + "learning_rate": 1.9840271270401847e-06, + "loss": 0.8525, + "step": 9980 + }, + { + "epoch": 0.26, + "learning_rate": 1.9840222008086853e-06, + "loss": 0.623, + "step": 9981 + }, + { + "epoch": 0.26, + "learning_rate": 1.984017273823765e-06, + "loss": 1.0342, + "step": 9982 + }, + { + "epoch": 0.26, + "learning_rate": 1.984012346085428e-06, + "loss": 0.9492, + "step": 9983 + }, + { + "epoch": 0.26, + "learning_rate": 1.984007417593678e-06, + "loss": 0.7852, + "step": 9984 + }, + { + "epoch": 0.26, + "learning_rate": 1.9840024883485186e-06, + "loss": 0.9531, + "step": 9985 + }, + { + "epoch": 0.26, + "learning_rate": 1.983997558349954e-06, + "loss": 0.9023, + "step": 9986 + }, + { + "epoch": 0.26, + "learning_rate": 1.9839926275979875e-06, + "loss": 1.0781, + "step": 9987 + }, + { + "epoch": 0.26, + "learning_rate": 1.9839876960926233e-06, + "loss": 0.7373, + "step": 9988 + }, + { + "epoch": 0.26, + "learning_rate": 1.983982763833865e-06, + "loss": 1.0713, + "step": 9989 + }, + { + "epoch": 0.26, + "learning_rate": 1.9839778308217162e-06, + "loss": 0.8223, + "step": 9990 + }, + { + "epoch": 0.26, + "learning_rate": 1.983972897056181e-06, + "loss": 0.9902, + "step": 9991 + }, + { + "epoch": 0.26, + "learning_rate": 1.983967962537263e-06, + "loss": 1.0117, + "step": 9992 + }, + { + "epoch": 0.26, + "learning_rate": 1.9839630272649653e-06, + "loss": 0.9824, + "step": 9993 + }, + { + "epoch": 0.26, + "learning_rate": 1.9839580912392933e-06, + "loss": 0.8672, + "step": 9994 + }, + { + "epoch": 0.26, + "learning_rate": 1.9839531544602494e-06, + "loss": 1.2695, + "step": 9995 + }, + { + "epoch": 0.26, + "learning_rate": 1.9839482169278375e-06, + "loss": 1.1426, + "step": 9996 + }, + { + "epoch": 0.26, + "learning_rate": 1.9839432786420622e-06, + "loss": 1.0713, + "step": 9997 + }, + { + "epoch": 0.26, + "learning_rate": 1.9839383396029265e-06, + "loss": 0.8125, + "step": 9998 + }, + { + "epoch": 0.26, + "learning_rate": 1.9839333998104347e-06, + "loss": 0.9385, + "step": 9999 + }, + { + "epoch": 0.26, + "learning_rate": 1.98392845926459e-06, + "loss": 0.8252, + "step": 10000 + }, + { + "epoch": 0.26, + "learning_rate": 1.9839235179653967e-06, + "loss": 0.8003, + "step": 10001 + }, + { + "epoch": 0.26, + "learning_rate": 1.9839185759128587e-06, + "loss": 0.7197, + "step": 10002 + }, + { + "epoch": 0.26, + "learning_rate": 1.983913633106979e-06, + "loss": 0.9688, + "step": 10003 + }, + { + "epoch": 0.26, + "learning_rate": 1.983908689547762e-06, + "loss": 1.041, + "step": 10004 + }, + { + "epoch": 0.26, + "learning_rate": 1.9839037452352114e-06, + "loss": 0.9365, + "step": 10005 + }, + { + "epoch": 0.26, + "learning_rate": 1.9838988001693313e-06, + "loss": 0.7334, + "step": 10006 + }, + { + "epoch": 0.26, + "learning_rate": 1.9838938543501246e-06, + "loss": 0.7178, + "step": 10007 + }, + { + "epoch": 0.26, + "learning_rate": 1.983888907777596e-06, + "loss": 0.8301, + "step": 10008 + }, + { + "epoch": 0.26, + "learning_rate": 1.983883960451749e-06, + "loss": 0.9375, + "step": 10009 + }, + { + "epoch": 0.26, + "learning_rate": 1.9838790123725868e-06, + "loss": 1.0332, + "step": 10010 + }, + { + "epoch": 0.26, + "learning_rate": 1.9838740635401137e-06, + "loss": 0.9736, + "step": 10011 + }, + { + "epoch": 0.26, + "learning_rate": 1.9838691139543337e-06, + "loss": 1.0303, + "step": 10012 + }, + { + "epoch": 0.26, + "learning_rate": 1.9838641636152503e-06, + "loss": 0.9448, + "step": 10013 + }, + { + "epoch": 0.26, + "learning_rate": 1.9838592125228675e-06, + "loss": 1.0264, + "step": 10014 + }, + { + "epoch": 0.26, + "learning_rate": 1.9838542606771887e-06, + "loss": 1.1133, + "step": 10015 + }, + { + "epoch": 0.26, + "learning_rate": 1.983849308078218e-06, + "loss": 0.7732, + "step": 10016 + }, + { + "epoch": 0.26, + "learning_rate": 1.983844354725959e-06, + "loss": 0.75, + "step": 10017 + }, + { + "epoch": 0.26, + "learning_rate": 1.983839400620416e-06, + "loss": 1.0098, + "step": 10018 + }, + { + "epoch": 0.26, + "learning_rate": 1.983834445761592e-06, + "loss": 0.8257, + "step": 10019 + }, + { + "epoch": 0.26, + "learning_rate": 1.9838294901494916e-06, + "loss": 1.0498, + "step": 10020 + }, + { + "epoch": 0.26, + "learning_rate": 1.983824533784118e-06, + "loss": 0.9375, + "step": 10021 + }, + { + "epoch": 0.26, + "learning_rate": 1.983819576665475e-06, + "loss": 0.9043, + "step": 10022 + }, + { + "epoch": 0.26, + "learning_rate": 1.9838146187935672e-06, + "loss": 1.0283, + "step": 10023 + }, + { + "epoch": 0.26, + "learning_rate": 1.983809660168397e-06, + "loss": 0.7183, + "step": 10024 + }, + { + "epoch": 0.26, + "learning_rate": 1.9838047007899697e-06, + "loss": 0.9434, + "step": 10025 + }, + { + "epoch": 0.26, + "learning_rate": 1.9837997406582876e-06, + "loss": 0.793, + "step": 10026 + }, + { + "epoch": 0.26, + "learning_rate": 1.983794779773356e-06, + "loss": 0.9502, + "step": 10027 + }, + { + "epoch": 0.26, + "learning_rate": 1.9837898181351777e-06, + "loss": 0.7549, + "step": 10028 + }, + { + "epoch": 0.26, + "learning_rate": 1.9837848557437565e-06, + "loss": 0.8564, + "step": 10029 + }, + { + "epoch": 0.26, + "learning_rate": 1.983779892599097e-06, + "loss": 1.001, + "step": 10030 + }, + { + "epoch": 0.26, + "learning_rate": 1.983774928701202e-06, + "loss": 0.9629, + "step": 10031 + }, + { + "epoch": 0.26, + "learning_rate": 1.983769964050076e-06, + "loss": 0.7061, + "step": 10032 + }, + { + "epoch": 0.26, + "learning_rate": 1.9837649986457227e-06, + "loss": 0.9229, + "step": 10033 + }, + { + "epoch": 0.26, + "learning_rate": 1.9837600324881453e-06, + "loss": 0.916, + "step": 10034 + }, + { + "epoch": 0.26, + "learning_rate": 1.9837550655773486e-06, + "loss": 0.7119, + "step": 10035 + }, + { + "epoch": 0.26, + "learning_rate": 1.983750097913336e-06, + "loss": 0.9004, + "step": 10036 + }, + { + "epoch": 0.26, + "learning_rate": 1.9837451294961105e-06, + "loss": 0.7559, + "step": 10037 + }, + { + "epoch": 0.26, + "learning_rate": 1.9837401603256767e-06, + "loss": 0.9707, + "step": 10038 + }, + { + "epoch": 0.26, + "learning_rate": 1.983735190402039e-06, + "loss": 1.0566, + "step": 10039 + }, + { + "epoch": 0.26, + "learning_rate": 1.9837302197251997e-06, + "loss": 0.9678, + "step": 10040 + }, + { + "epoch": 0.26, + "learning_rate": 1.9837252482951637e-06, + "loss": 0.8438, + "step": 10041 + }, + { + "epoch": 0.26, + "learning_rate": 1.9837202761119346e-06, + "loss": 1.0264, + "step": 10042 + }, + { + "epoch": 0.26, + "learning_rate": 1.9837153031755157e-06, + "loss": 0.8252, + "step": 10043 + }, + { + "epoch": 0.26, + "learning_rate": 1.9837103294859117e-06, + "loss": 0.7646, + "step": 10044 + }, + { + "epoch": 0.26, + "learning_rate": 1.983705355043126e-06, + "loss": 0.9316, + "step": 10045 + }, + { + "epoch": 0.26, + "learning_rate": 1.983700379847162e-06, + "loss": 0.8047, + "step": 10046 + }, + { + "epoch": 0.26, + "learning_rate": 1.9836954038980244e-06, + "loss": 0.9814, + "step": 10047 + }, + { + "epoch": 0.26, + "learning_rate": 1.9836904271957157e-06, + "loss": 0.9346, + "step": 10048 + }, + { + "epoch": 0.26, + "learning_rate": 1.983685449740241e-06, + "loss": 0.7183, + "step": 10049 + }, + { + "epoch": 0.26, + "learning_rate": 1.9836804715316035e-06, + "loss": 1.0146, + "step": 10050 + }, + { + "epoch": 0.26, + "learning_rate": 1.983675492569807e-06, + "loss": 1.0898, + "step": 10051 + }, + { + "epoch": 0.26, + "learning_rate": 1.9836705128548552e-06, + "loss": 0.8613, + "step": 10052 + }, + { + "epoch": 0.26, + "learning_rate": 1.9836655323867524e-06, + "loss": 0.916, + "step": 10053 + }, + { + "epoch": 0.26, + "learning_rate": 1.983660551165502e-06, + "loss": 0.9873, + "step": 10054 + }, + { + "epoch": 0.26, + "learning_rate": 1.9836555691911082e-06, + "loss": 1.0205, + "step": 10055 + }, + { + "epoch": 0.26, + "learning_rate": 1.983650586463574e-06, + "loss": 1.1758, + "step": 10056 + }, + { + "epoch": 0.26, + "learning_rate": 1.9836456029829046e-06, + "loss": 0.834, + "step": 10057 + }, + { + "epoch": 0.26, + "learning_rate": 1.9836406187491025e-06, + "loss": 0.8359, + "step": 10058 + }, + { + "epoch": 0.26, + "learning_rate": 1.983635633762172e-06, + "loss": 0.9346, + "step": 10059 + }, + { + "epoch": 0.26, + "learning_rate": 1.983630648022117e-06, + "loss": 0.917, + "step": 10060 + }, + { + "epoch": 0.26, + "learning_rate": 1.983625661528941e-06, + "loss": 0.7803, + "step": 10061 + }, + { + "epoch": 0.26, + "learning_rate": 1.9836206742826483e-06, + "loss": 1.0859, + "step": 10062 + }, + { + "epoch": 0.26, + "learning_rate": 1.9836156862832426e-06, + "loss": 0.8691, + "step": 10063 + }, + { + "epoch": 0.26, + "learning_rate": 1.9836106975307272e-06, + "loss": 0.9453, + "step": 10064 + }, + { + "epoch": 0.26, + "learning_rate": 1.983605708025107e-06, + "loss": 0.7979, + "step": 10065 + }, + { + "epoch": 0.26, + "learning_rate": 1.9836007177663843e-06, + "loss": 0.8428, + "step": 10066 + }, + { + "epoch": 0.26, + "learning_rate": 1.9835957267545644e-06, + "loss": 0.8594, + "step": 10067 + }, + { + "epoch": 0.26, + "learning_rate": 1.98359073498965e-06, + "loss": 0.793, + "step": 10068 + }, + { + "epoch": 0.26, + "learning_rate": 1.983585742471646e-06, + "loss": 0.8325, + "step": 10069 + }, + { + "epoch": 0.26, + "learning_rate": 1.9835807492005553e-06, + "loss": 0.9043, + "step": 10070 + }, + { + "epoch": 0.26, + "learning_rate": 1.9835757551763817e-06, + "loss": 0.731, + "step": 10071 + }, + { + "epoch": 0.26, + "learning_rate": 1.9835707603991297e-06, + "loss": 0.9854, + "step": 10072 + }, + { + "epoch": 0.26, + "learning_rate": 1.983565764868803e-06, + "loss": 0.9629, + "step": 10073 + }, + { + "epoch": 0.26, + "learning_rate": 1.9835607685854047e-06, + "loss": 1.1221, + "step": 10074 + }, + { + "epoch": 0.26, + "learning_rate": 1.9835557715489393e-06, + "loss": 0.8926, + "step": 10075 + }, + { + "epoch": 0.26, + "learning_rate": 1.9835507737594108e-06, + "loss": 0.8486, + "step": 10076 + }, + { + "epoch": 0.26, + "learning_rate": 1.9835457752168225e-06, + "loss": 1.0625, + "step": 10077 + }, + { + "epoch": 0.26, + "learning_rate": 1.9835407759211783e-06, + "loss": 0.918, + "step": 10078 + }, + { + "epoch": 0.26, + "learning_rate": 1.9835357758724825e-06, + "loss": 1.0762, + "step": 10079 + }, + { + "epoch": 0.26, + "learning_rate": 1.9835307750707383e-06, + "loss": 0.7852, + "step": 10080 + }, + { + "epoch": 0.26, + "learning_rate": 1.9835257735159497e-06, + "loss": 0.9648, + "step": 10081 + }, + { + "epoch": 0.26, + "learning_rate": 1.983520771208121e-06, + "loss": 1.0605, + "step": 10082 + }, + { + "epoch": 0.26, + "learning_rate": 1.9835157681472556e-06, + "loss": 0.8481, + "step": 10083 + }, + { + "epoch": 0.26, + "learning_rate": 1.9835107643333573e-06, + "loss": 0.9102, + "step": 10084 + }, + { + "epoch": 0.26, + "learning_rate": 1.9835057597664297e-06, + "loss": 0.8623, + "step": 10085 + }, + { + "epoch": 0.26, + "learning_rate": 1.9835007544464776e-06, + "loss": 0.9619, + "step": 10086 + }, + { + "epoch": 0.26, + "learning_rate": 1.983495748373504e-06, + "loss": 0.8994, + "step": 10087 + }, + { + "epoch": 0.26, + "learning_rate": 1.9834907415475123e-06, + "loss": 0.9087, + "step": 10088 + }, + { + "epoch": 0.26, + "learning_rate": 1.9834857339685076e-06, + "loss": 1.0078, + "step": 10089 + }, + { + "epoch": 0.26, + "learning_rate": 1.983480725636493e-06, + "loss": 0.9424, + "step": 10090 + }, + { + "epoch": 0.26, + "learning_rate": 1.9834757165514724e-06, + "loss": 0.8174, + "step": 10091 + }, + { + "epoch": 0.26, + "learning_rate": 1.9834707067134495e-06, + "loss": 1.0947, + "step": 10092 + }, + { + "epoch": 0.26, + "learning_rate": 1.9834656961224287e-06, + "loss": 1.0283, + "step": 10093 + }, + { + "epoch": 0.26, + "learning_rate": 1.983460684778413e-06, + "loss": 0.8916, + "step": 10094 + }, + { + "epoch": 0.26, + "learning_rate": 1.983455672681407e-06, + "loss": 1.0078, + "step": 10095 + }, + { + "epoch": 0.26, + "learning_rate": 1.983450659831414e-06, + "loss": 0.7437, + "step": 10096 + }, + { + "epoch": 0.26, + "learning_rate": 1.983445646228438e-06, + "loss": 1.1309, + "step": 10097 + }, + { + "epoch": 0.26, + "learning_rate": 1.983440631872483e-06, + "loss": 1.002, + "step": 10098 + }, + { + "epoch": 0.26, + "learning_rate": 1.9834356167635527e-06, + "loss": 0.873, + "step": 10099 + }, + { + "epoch": 0.26, + "learning_rate": 1.9834306009016513e-06, + "loss": 0.9106, + "step": 10100 + }, + { + "epoch": 0.26, + "learning_rate": 1.983425584286782e-06, + "loss": 1.0049, + "step": 10101 + }, + { + "epoch": 0.26, + "learning_rate": 1.983420566918949e-06, + "loss": 1.1025, + "step": 10102 + }, + { + "epoch": 0.26, + "learning_rate": 1.983415548798156e-06, + "loss": 0.9033, + "step": 10103 + }, + { + "epoch": 0.26, + "learning_rate": 1.983410529924407e-06, + "loss": 1.04, + "step": 10104 + }, + { + "epoch": 0.26, + "learning_rate": 1.9834055102977056e-06, + "loss": 0.8027, + "step": 10105 + }, + { + "epoch": 0.26, + "learning_rate": 1.983400489918056e-06, + "loss": 1.0518, + "step": 10106 + }, + { + "epoch": 0.26, + "learning_rate": 1.983395468785462e-06, + "loss": 1.082, + "step": 10107 + }, + { + "epoch": 0.26, + "learning_rate": 1.983390446899927e-06, + "loss": 0.7646, + "step": 10108 + }, + { + "epoch": 0.26, + "learning_rate": 1.9833854242614554e-06, + "loss": 1.0596, + "step": 10109 + }, + { + "epoch": 0.26, + "learning_rate": 1.9833804008700506e-06, + "loss": 0.8011, + "step": 10110 + }, + { + "epoch": 0.26, + "learning_rate": 1.983375376725717e-06, + "loss": 0.9814, + "step": 10111 + }, + { + "epoch": 0.26, + "learning_rate": 1.9833703518284576e-06, + "loss": 0.7432, + "step": 10112 + }, + { + "epoch": 0.26, + "learning_rate": 1.983365326178277e-06, + "loss": 1.0078, + "step": 10113 + }, + { + "epoch": 0.26, + "learning_rate": 1.9833602997751787e-06, + "loss": 0.9609, + "step": 10114 + }, + { + "epoch": 0.26, + "learning_rate": 1.9833552726191666e-06, + "loss": 0.9609, + "step": 10115 + }, + { + "epoch": 0.26, + "learning_rate": 1.983350244710245e-06, + "loss": 0.9756, + "step": 10116 + }, + { + "epoch": 0.26, + "learning_rate": 1.9833452160484167e-06, + "loss": 0.8867, + "step": 10117 + }, + { + "epoch": 0.26, + "learning_rate": 1.9833401866336865e-06, + "loss": 0.8877, + "step": 10118 + }, + { + "epoch": 0.26, + "learning_rate": 1.983335156466058e-06, + "loss": 1.167, + "step": 10119 + }, + { + "epoch": 0.26, + "learning_rate": 1.983330125545535e-06, + "loss": 0.8008, + "step": 10120 + }, + { + "epoch": 0.26, + "learning_rate": 1.9833250938721212e-06, + "loss": 0.8047, + "step": 10121 + }, + { + "epoch": 0.26, + "learning_rate": 1.983320061445821e-06, + "loss": 0.8398, + "step": 10122 + }, + { + "epoch": 0.26, + "learning_rate": 1.983315028266637e-06, + "loss": 0.5034, + "step": 10123 + }, + { + "epoch": 0.26, + "learning_rate": 1.9833099943345744e-06, + "loss": 1.0859, + "step": 10124 + }, + { + "epoch": 0.26, + "learning_rate": 1.9833049596496366e-06, + "loss": 0.8252, + "step": 10125 + }, + { + "epoch": 0.26, + "learning_rate": 1.9832999242118276e-06, + "loss": 0.6182, + "step": 10126 + }, + { + "epoch": 0.26, + "learning_rate": 1.9832948880211506e-06, + "loss": 0.8428, + "step": 10127 + }, + { + "epoch": 0.26, + "learning_rate": 1.98328985107761e-06, + "loss": 0.7676, + "step": 10128 + }, + { + "epoch": 0.26, + "learning_rate": 1.9832848133812097e-06, + "loss": 1.0068, + "step": 10129 + }, + { + "epoch": 0.26, + "learning_rate": 1.9832797749319538e-06, + "loss": 0.8452, + "step": 10130 + }, + { + "epoch": 0.26, + "learning_rate": 1.983274735729845e-06, + "loss": 0.9082, + "step": 10131 + }, + { + "epoch": 0.26, + "learning_rate": 1.9832696957748886e-06, + "loss": 0.9453, + "step": 10132 + }, + { + "epoch": 0.26, + "learning_rate": 1.983264655067088e-06, + "loss": 0.7085, + "step": 10133 + }, + { + "epoch": 0.26, + "learning_rate": 1.983259613606446e-06, + "loss": 0.9688, + "step": 10134 + }, + { + "epoch": 0.26, + "learning_rate": 1.983254571392968e-06, + "loss": 1.0, + "step": 10135 + }, + { + "epoch": 0.26, + "learning_rate": 1.983249528426657e-06, + "loss": 1.127, + "step": 10136 + }, + { + "epoch": 0.26, + "learning_rate": 1.983244484707517e-06, + "loss": 1.0039, + "step": 10137 + }, + { + "epoch": 0.26, + "learning_rate": 1.9832394402355517e-06, + "loss": 0.77, + "step": 10138 + }, + { + "epoch": 0.26, + "learning_rate": 1.9832343950107652e-06, + "loss": 0.7734, + "step": 10139 + }, + { + "epoch": 0.26, + "learning_rate": 1.9832293490331617e-06, + "loss": 0.834, + "step": 10140 + }, + { + "epoch": 0.26, + "learning_rate": 1.9832243023027446e-06, + "loss": 1.209, + "step": 10141 + }, + { + "epoch": 0.26, + "learning_rate": 1.9832192548195176e-06, + "loss": 0.9224, + "step": 10142 + }, + { + "epoch": 0.26, + "learning_rate": 1.983214206583485e-06, + "loss": 1.1025, + "step": 10143 + }, + { + "epoch": 0.26, + "learning_rate": 1.9832091575946506e-06, + "loss": 0.9023, + "step": 10144 + }, + { + "epoch": 0.26, + "learning_rate": 1.9832041078530178e-06, + "loss": 0.5852, + "step": 10145 + }, + { + "epoch": 0.26, + "learning_rate": 1.983199057358591e-06, + "loss": 0.9521, + "step": 10146 + }, + { + "epoch": 0.26, + "learning_rate": 1.9831940061113742e-06, + "loss": 0.9307, + "step": 10147 + }, + { + "epoch": 0.26, + "learning_rate": 1.9831889541113703e-06, + "loss": 0.8369, + "step": 10148 + }, + { + "epoch": 0.26, + "learning_rate": 1.9831839013585845e-06, + "loss": 0.9561, + "step": 10149 + }, + { + "epoch": 0.26, + "learning_rate": 1.9831788478530197e-06, + "loss": 0.7988, + "step": 10150 + }, + { + "epoch": 0.26, + "learning_rate": 1.9831737935946803e-06, + "loss": 1.042, + "step": 10151 + }, + { + "epoch": 0.26, + "learning_rate": 1.9831687385835695e-06, + "loss": 0.8125, + "step": 10152 + }, + { + "epoch": 0.26, + "learning_rate": 1.983163682819692e-06, + "loss": 1.0264, + "step": 10153 + }, + { + "epoch": 0.26, + "learning_rate": 1.983158626303051e-06, + "loss": 0.9512, + "step": 10154 + }, + { + "epoch": 0.26, + "learning_rate": 1.983153569033651e-06, + "loss": 0.8975, + "step": 10155 + }, + { + "epoch": 0.26, + "learning_rate": 1.983148511011495e-06, + "loss": 1.0381, + "step": 10156 + }, + { + "epoch": 0.26, + "learning_rate": 1.983143452236588e-06, + "loss": 0.9043, + "step": 10157 + }, + { + "epoch": 0.26, + "learning_rate": 1.9831383927089327e-06, + "loss": 0.918, + "step": 10158 + }, + { + "epoch": 0.26, + "learning_rate": 1.9831333324285338e-06, + "loss": 1.0898, + "step": 10159 + }, + { + "epoch": 0.26, + "learning_rate": 1.983128271395395e-06, + "loss": 0.9473, + "step": 10160 + }, + { + "epoch": 0.26, + "learning_rate": 1.9831232096095198e-06, + "loss": 0.8945, + "step": 10161 + }, + { + "epoch": 0.26, + "learning_rate": 1.9831181470709123e-06, + "loss": 1.0781, + "step": 10162 + }, + { + "epoch": 0.26, + "learning_rate": 1.9831130837795768e-06, + "loss": 0.96, + "step": 10163 + }, + { + "epoch": 0.26, + "learning_rate": 1.983108019735517e-06, + "loss": 1.0791, + "step": 10164 + }, + { + "epoch": 0.26, + "learning_rate": 1.983102954938736e-06, + "loss": 0.9404, + "step": 10165 + }, + { + "epoch": 0.26, + "learning_rate": 1.9830978893892383e-06, + "loss": 0.6255, + "step": 10166 + }, + { + "epoch": 0.26, + "learning_rate": 1.9830928230870284e-06, + "loss": 1.1006, + "step": 10167 + }, + { + "epoch": 0.26, + "learning_rate": 1.983087756032109e-06, + "loss": 0.959, + "step": 10168 + }, + { + "epoch": 0.26, + "learning_rate": 1.9830826882244845e-06, + "loss": 0.8838, + "step": 10169 + }, + { + "epoch": 0.26, + "learning_rate": 1.9830776196641593e-06, + "loss": 0.9512, + "step": 10170 + }, + { + "epoch": 0.26, + "learning_rate": 1.983072550351136e-06, + "loss": 1.0977, + "step": 10171 + }, + { + "epoch": 0.26, + "learning_rate": 1.98306748028542e-06, + "loss": 0.9658, + "step": 10172 + }, + { + "epoch": 0.26, + "learning_rate": 1.9830624094670138e-06, + "loss": 1.0352, + "step": 10173 + }, + { + "epoch": 0.26, + "learning_rate": 1.9830573378959223e-06, + "loss": 0.71, + "step": 10174 + }, + { + "epoch": 0.26, + "learning_rate": 1.983052265572149e-06, + "loss": 0.7783, + "step": 10175 + }, + { + "epoch": 0.26, + "learning_rate": 1.9830471924956976e-06, + "loss": 1.2266, + "step": 10176 + }, + { + "epoch": 0.26, + "learning_rate": 1.983042118666572e-06, + "loss": 1.0488, + "step": 10177 + }, + { + "epoch": 0.26, + "learning_rate": 1.9830370440847766e-06, + "loss": 0.7393, + "step": 10178 + }, + { + "epoch": 0.26, + "learning_rate": 1.983031968750315e-06, + "loss": 1.0078, + "step": 10179 + }, + { + "epoch": 0.26, + "learning_rate": 1.983026892663191e-06, + "loss": 0.7935, + "step": 10180 + }, + { + "epoch": 0.26, + "learning_rate": 1.9830218158234083e-06, + "loss": 0.8682, + "step": 10181 + }, + { + "epoch": 0.26, + "learning_rate": 1.983016738230971e-06, + "loss": 0.8994, + "step": 10182 + }, + { + "epoch": 0.26, + "learning_rate": 1.983011659885883e-06, + "loss": 1.1191, + "step": 10183 + }, + { + "epoch": 0.26, + "learning_rate": 1.983006580788148e-06, + "loss": 0.8408, + "step": 10184 + }, + { + "epoch": 0.26, + "learning_rate": 1.9830015009377703e-06, + "loss": 0.8926, + "step": 10185 + }, + { + "epoch": 0.26, + "learning_rate": 1.982996420334754e-06, + "loss": 1.0801, + "step": 10186 + }, + { + "epoch": 0.26, + "learning_rate": 1.982991338979102e-06, + "loss": 0.917, + "step": 10187 + }, + { + "epoch": 0.26, + "learning_rate": 1.9829862568708185e-06, + "loss": 0.8926, + "step": 10188 + }, + { + "epoch": 0.26, + "learning_rate": 1.982981174009908e-06, + "loss": 0.9922, + "step": 10189 + }, + { + "epoch": 0.26, + "learning_rate": 1.9829760903963744e-06, + "loss": 0.9795, + "step": 10190 + }, + { + "epoch": 0.26, + "learning_rate": 1.9829710060302204e-06, + "loss": 1.0068, + "step": 10191 + }, + { + "epoch": 0.26, + "learning_rate": 1.982965920911451e-06, + "loss": 0.9307, + "step": 10192 + }, + { + "epoch": 0.26, + "learning_rate": 1.9829608350400696e-06, + "loss": 1.0371, + "step": 10193 + }, + { + "epoch": 0.26, + "learning_rate": 1.9829557484160807e-06, + "loss": 0.9336, + "step": 10194 + }, + { + "epoch": 0.26, + "learning_rate": 1.982950661039488e-06, + "loss": 0.8452, + "step": 10195 + }, + { + "epoch": 0.26, + "learning_rate": 1.9829455729102947e-06, + "loss": 0.8223, + "step": 10196 + }, + { + "epoch": 0.26, + "learning_rate": 1.9829404840285048e-06, + "loss": 0.9053, + "step": 10197 + }, + { + "epoch": 0.26, + "learning_rate": 1.9829353943941235e-06, + "loss": 1.0371, + "step": 10198 + }, + { + "epoch": 0.26, + "learning_rate": 1.982930304007153e-06, + "loss": 0.9473, + "step": 10199 + }, + { + "epoch": 0.26, + "learning_rate": 1.9829252128675986e-06, + "loss": 1.0283, + "step": 10200 + }, + { + "epoch": 0.26, + "learning_rate": 1.982920120975463e-06, + "loss": 0.7871, + "step": 10201 + }, + { + "epoch": 0.26, + "learning_rate": 1.9829150283307507e-06, + "loss": 0.9385, + "step": 10202 + }, + { + "epoch": 0.26, + "learning_rate": 1.982909934933466e-06, + "loss": 0.9307, + "step": 10203 + }, + { + "epoch": 0.26, + "learning_rate": 1.982904840783612e-06, + "loss": 0.9604, + "step": 10204 + }, + { + "epoch": 0.26, + "learning_rate": 1.982899745881193e-06, + "loss": 0.8291, + "step": 10205 + }, + { + "epoch": 0.26, + "learning_rate": 1.982894650226213e-06, + "loss": 0.9341, + "step": 10206 + }, + { + "epoch": 0.26, + "learning_rate": 1.9828895538186754e-06, + "loss": 0.8789, + "step": 10207 + }, + { + "epoch": 0.26, + "learning_rate": 1.9828844566585847e-06, + "loss": 0.9746, + "step": 10208 + }, + { + "epoch": 0.26, + "learning_rate": 1.9828793587459446e-06, + "loss": 1.043, + "step": 10209 + }, + { + "epoch": 0.26, + "learning_rate": 1.982874260080759e-06, + "loss": 0.8735, + "step": 10210 + }, + { + "epoch": 0.26, + "learning_rate": 1.9828691606630316e-06, + "loss": 0.8926, + "step": 10211 + }, + { + "epoch": 0.26, + "learning_rate": 1.9828640604927667e-06, + "loss": 0.9766, + "step": 10212 + }, + { + "epoch": 0.26, + "learning_rate": 1.982858959569968e-06, + "loss": 1.0723, + "step": 10213 + }, + { + "epoch": 0.26, + "learning_rate": 1.982853857894639e-06, + "loss": 0.9473, + "step": 10214 + }, + { + "epoch": 0.26, + "learning_rate": 1.9828487554667844e-06, + "loss": 1.0439, + "step": 10215 + }, + { + "epoch": 0.26, + "learning_rate": 1.982843652286408e-06, + "loss": 0.8301, + "step": 10216 + }, + { + "epoch": 0.26, + "learning_rate": 1.982838548353513e-06, + "loss": 0.8809, + "step": 10217 + }, + { + "epoch": 0.26, + "learning_rate": 1.9828334436681033e-06, + "loss": 0.8623, + "step": 10218 + }, + { + "epoch": 0.26, + "learning_rate": 1.9828283382301837e-06, + "loss": 1.2178, + "step": 10219 + }, + { + "epoch": 0.26, + "learning_rate": 1.9828232320397575e-06, + "loss": 0.9033, + "step": 10220 + }, + { + "epoch": 0.26, + "learning_rate": 1.982818125096829e-06, + "loss": 0.8965, + "step": 10221 + }, + { + "epoch": 0.26, + "learning_rate": 1.9828130174014017e-06, + "loss": 1.0215, + "step": 10222 + }, + { + "epoch": 0.26, + "learning_rate": 1.9828079089534794e-06, + "loss": 0.915, + "step": 10223 + }, + { + "epoch": 0.26, + "learning_rate": 1.9828027997530665e-06, + "loss": 0.9111, + "step": 10224 + }, + { + "epoch": 0.26, + "learning_rate": 1.982797689800167e-06, + "loss": 0.8594, + "step": 10225 + }, + { + "epoch": 0.26, + "learning_rate": 1.982792579094784e-06, + "loss": 0.8677, + "step": 10226 + }, + { + "epoch": 0.26, + "learning_rate": 1.982787467636922e-06, + "loss": 0.9365, + "step": 10227 + }, + { + "epoch": 0.26, + "learning_rate": 1.9827823554265848e-06, + "loss": 0.9404, + "step": 10228 + }, + { + "epoch": 0.26, + "learning_rate": 1.9827772424637765e-06, + "loss": 0.4443, + "step": 10229 + }, + { + "epoch": 0.26, + "learning_rate": 1.982772128748501e-06, + "loss": 0.8965, + "step": 10230 + }, + { + "epoch": 0.26, + "learning_rate": 1.9827670142807617e-06, + "loss": 0.8848, + "step": 10231 + }, + { + "epoch": 0.26, + "learning_rate": 1.982761899060563e-06, + "loss": 0.9424, + "step": 10232 + }, + { + "epoch": 0.26, + "learning_rate": 1.982756783087909e-06, + "loss": 0.8418, + "step": 10233 + }, + { + "epoch": 0.26, + "learning_rate": 1.982751666362803e-06, + "loss": 1.0098, + "step": 10234 + }, + { + "epoch": 0.26, + "learning_rate": 1.9827465488852493e-06, + "loss": 0.9209, + "step": 10235 + }, + { + "epoch": 0.26, + "learning_rate": 1.982741430655252e-06, + "loss": 0.9248, + "step": 10236 + }, + { + "epoch": 0.26, + "learning_rate": 1.982736311672814e-06, + "loss": 1.0117, + "step": 10237 + }, + { + "epoch": 0.26, + "learning_rate": 1.9827311919379406e-06, + "loss": 1.0283, + "step": 10238 + }, + { + "epoch": 0.26, + "learning_rate": 1.982726071450635e-06, + "loss": 0.9863, + "step": 10239 + }, + { + "epoch": 0.26, + "learning_rate": 1.9827209502109015e-06, + "loss": 0.9668, + "step": 10240 + }, + { + "epoch": 0.26, + "learning_rate": 1.9827158282187436e-06, + "loss": 1.0254, + "step": 10241 + }, + { + "epoch": 0.26, + "learning_rate": 1.982710705474165e-06, + "loss": 0.9131, + "step": 10242 + }, + { + "epoch": 0.26, + "learning_rate": 1.9827055819771706e-06, + "loss": 0.8281, + "step": 10243 + }, + { + "epoch": 0.26, + "learning_rate": 1.9827004577277635e-06, + "loss": 0.8438, + "step": 10244 + }, + { + "epoch": 0.26, + "learning_rate": 1.9826953327259476e-06, + "loss": 1.04, + "step": 10245 + }, + { + "epoch": 0.26, + "learning_rate": 1.9826902069717276e-06, + "loss": 0.8633, + "step": 10246 + }, + { + "epoch": 0.26, + "learning_rate": 1.9826850804651064e-06, + "loss": 1.082, + "step": 10247 + }, + { + "epoch": 0.26, + "learning_rate": 1.9826799532060887e-06, + "loss": 0.752, + "step": 10248 + }, + { + "epoch": 0.26, + "learning_rate": 1.982674825194678e-06, + "loss": 0.8828, + "step": 10249 + }, + { + "epoch": 0.26, + "learning_rate": 1.9826696964308783e-06, + "loss": 1.002, + "step": 10250 + }, + { + "epoch": 0.26, + "learning_rate": 1.9826645669146936e-06, + "loss": 0.9736, + "step": 10251 + }, + { + "epoch": 0.26, + "learning_rate": 1.982659436646128e-06, + "loss": 1.085, + "step": 10252 + }, + { + "epoch": 0.26, + "learning_rate": 1.982654305625185e-06, + "loss": 0.9883, + "step": 10253 + }, + { + "epoch": 0.26, + "learning_rate": 1.9826491738518693e-06, + "loss": 0.8818, + "step": 10254 + }, + { + "epoch": 0.26, + "learning_rate": 1.9826440413261838e-06, + "loss": 0.9043, + "step": 10255 + }, + { + "epoch": 0.26, + "learning_rate": 1.982638908048133e-06, + "loss": 0.8408, + "step": 10256 + }, + { + "epoch": 0.26, + "learning_rate": 1.982633774017721e-06, + "loss": 0.8501, + "step": 10257 + }, + { + "epoch": 0.26, + "learning_rate": 1.982628639234951e-06, + "loss": 0.811, + "step": 10258 + }, + { + "epoch": 0.26, + "learning_rate": 1.982623503699828e-06, + "loss": 0.8521, + "step": 10259 + }, + { + "epoch": 0.26, + "learning_rate": 1.9826183674123552e-06, + "loss": 0.7627, + "step": 10260 + }, + { + "epoch": 0.26, + "learning_rate": 1.9826132303725367e-06, + "loss": 0.9355, + "step": 10261 + }, + { + "epoch": 0.26, + "learning_rate": 1.9826080925803764e-06, + "loss": 0.9033, + "step": 10262 + }, + { + "epoch": 0.26, + "learning_rate": 1.982602954035878e-06, + "loss": 1.0557, + "step": 10263 + }, + { + "epoch": 0.26, + "learning_rate": 1.982597814739046e-06, + "loss": 0.8955, + "step": 10264 + }, + { + "epoch": 0.26, + "learning_rate": 1.9825926746898844e-06, + "loss": 1.0049, + "step": 10265 + }, + { + "epoch": 0.26, + "learning_rate": 1.982587533888396e-06, + "loss": 0.7205, + "step": 10266 + }, + { + "epoch": 0.26, + "learning_rate": 1.982582392334586e-06, + "loss": 0.7046, + "step": 10267 + }, + { + "epoch": 0.26, + "learning_rate": 1.982577250028458e-06, + "loss": 1.0439, + "step": 10268 + }, + { + "epoch": 0.26, + "learning_rate": 1.982572106970015e-06, + "loss": 1.0205, + "step": 10269 + }, + { + "epoch": 0.26, + "learning_rate": 1.9825669631592625e-06, + "loss": 0.9746, + "step": 10270 + }, + { + "epoch": 0.26, + "learning_rate": 1.9825618185962033e-06, + "loss": 0.7451, + "step": 10271 + }, + { + "epoch": 0.26, + "learning_rate": 1.982556673280842e-06, + "loss": 0.7002, + "step": 10272 + }, + { + "epoch": 0.26, + "learning_rate": 1.982551527213182e-06, + "loss": 1.0439, + "step": 10273 + }, + { + "epoch": 0.26, + "learning_rate": 1.982546380393227e-06, + "loss": 0.8877, + "step": 10274 + }, + { + "epoch": 0.26, + "learning_rate": 1.982541232820982e-06, + "loss": 0.8906, + "step": 10275 + }, + { + "epoch": 0.26, + "learning_rate": 1.9825360844964504e-06, + "loss": 0.9883, + "step": 10276 + }, + { + "epoch": 0.26, + "learning_rate": 1.982530935419636e-06, + "loss": 1.0225, + "step": 10277 + }, + { + "epoch": 0.26, + "learning_rate": 1.982525785590543e-06, + "loss": 1.0381, + "step": 10278 + }, + { + "epoch": 0.26, + "learning_rate": 1.9825206350091747e-06, + "loss": 0.8848, + "step": 10279 + }, + { + "epoch": 0.26, + "learning_rate": 1.982515483675536e-06, + "loss": 0.9756, + "step": 10280 + }, + { + "epoch": 0.26, + "learning_rate": 1.9825103315896298e-06, + "loss": 0.8145, + "step": 10281 + }, + { + "epoch": 0.26, + "learning_rate": 1.9825051787514614e-06, + "loss": 0.7739, + "step": 10282 + }, + { + "epoch": 0.26, + "learning_rate": 1.9825000251610333e-06, + "loss": 0.7622, + "step": 10283 + }, + { + "epoch": 0.26, + "learning_rate": 1.9824948708183506e-06, + "loss": 0.8115, + "step": 10284 + }, + { + "epoch": 0.26, + "learning_rate": 1.9824897157234163e-06, + "loss": 0.8896, + "step": 10285 + }, + { + "epoch": 0.26, + "learning_rate": 1.982484559876235e-06, + "loss": 0.833, + "step": 10286 + }, + { + "epoch": 0.26, + "learning_rate": 1.9824794032768104e-06, + "loss": 0.9062, + "step": 10287 + }, + { + "epoch": 0.26, + "learning_rate": 1.9824742459251465e-06, + "loss": 0.8154, + "step": 10288 + }, + { + "epoch": 0.26, + "learning_rate": 1.9824690878212474e-06, + "loss": 0.9463, + "step": 10289 + }, + { + "epoch": 0.26, + "learning_rate": 1.9824639289651166e-06, + "loss": 0.7402, + "step": 10290 + }, + { + "epoch": 0.26, + "learning_rate": 1.9824587693567587e-06, + "loss": 0.9629, + "step": 10291 + }, + { + "epoch": 0.26, + "learning_rate": 1.982453608996177e-06, + "loss": 1.2344, + "step": 10292 + }, + { + "epoch": 0.26, + "learning_rate": 1.982448447883376e-06, + "loss": 0.8008, + "step": 10293 + }, + { + "epoch": 0.26, + "learning_rate": 1.9824432860183594e-06, + "loss": 1.1494, + "step": 10294 + }, + { + "epoch": 0.26, + "learning_rate": 1.982438123401131e-06, + "loss": 0.7915, + "step": 10295 + }, + { + "epoch": 0.26, + "learning_rate": 1.9824329600316947e-06, + "loss": 0.8662, + "step": 10296 + }, + { + "epoch": 0.26, + "learning_rate": 1.982427795910055e-06, + "loss": 0.8608, + "step": 10297 + }, + { + "epoch": 0.26, + "learning_rate": 1.9824226310362152e-06, + "loss": 0.9395, + "step": 10298 + }, + { + "epoch": 0.26, + "learning_rate": 1.98241746541018e-06, + "loss": 1.0684, + "step": 10299 + }, + { + "epoch": 0.26, + "learning_rate": 1.9824122990319523e-06, + "loss": 1.0322, + "step": 10300 + }, + { + "epoch": 0.26, + "learning_rate": 1.9824071319015374e-06, + "loss": 1.1611, + "step": 10301 + }, + { + "epoch": 0.26, + "learning_rate": 1.982401964018938e-06, + "loss": 0.7871, + "step": 10302 + }, + { + "epoch": 0.26, + "learning_rate": 1.982396795384159e-06, + "loss": 0.9326, + "step": 10303 + }, + { + "epoch": 0.26, + "learning_rate": 1.9823916259972037e-06, + "loss": 0.8701, + "step": 10304 + }, + { + "epoch": 0.26, + "learning_rate": 1.982386455858076e-06, + "loss": 0.7422, + "step": 10305 + }, + { + "epoch": 0.26, + "learning_rate": 1.982381284966781e-06, + "loss": 0.6772, + "step": 10306 + }, + { + "epoch": 0.26, + "learning_rate": 1.9823761133233213e-06, + "loss": 0.7617, + "step": 10307 + }, + { + "epoch": 0.26, + "learning_rate": 1.9823709409277013e-06, + "loss": 1.0337, + "step": 10308 + }, + { + "epoch": 0.26, + "learning_rate": 1.982365767779925e-06, + "loss": 1.001, + "step": 10309 + }, + { + "epoch": 0.26, + "learning_rate": 1.9823605938799965e-06, + "loss": 0.8994, + "step": 10310 + }, + { + "epoch": 0.26, + "learning_rate": 1.9823554192279197e-06, + "loss": 0.8213, + "step": 10311 + }, + { + "epoch": 0.26, + "learning_rate": 1.9823502438236983e-06, + "loss": 0.7253, + "step": 10312 + }, + { + "epoch": 0.26, + "learning_rate": 1.982345067667337e-06, + "loss": 0.8403, + "step": 10313 + }, + { + "epoch": 0.26, + "learning_rate": 1.9823398907588387e-06, + "loss": 0.8047, + "step": 10314 + }, + { + "epoch": 0.26, + "learning_rate": 1.982334713098208e-06, + "loss": 1.2227, + "step": 10315 + }, + { + "epoch": 0.26, + "learning_rate": 1.982329534685449e-06, + "loss": 0.9482, + "step": 10316 + }, + { + "epoch": 0.26, + "learning_rate": 1.9823243555205657e-06, + "loss": 0.7639, + "step": 10317 + }, + { + "epoch": 0.26, + "learning_rate": 1.9823191756035612e-06, + "loss": 0.9609, + "step": 10318 + }, + { + "epoch": 0.26, + "learning_rate": 1.9823139949344406e-06, + "loss": 0.9834, + "step": 10319 + }, + { + "epoch": 0.26, + "learning_rate": 1.9823088135132073e-06, + "loss": 0.9883, + "step": 10320 + }, + { + "epoch": 0.26, + "learning_rate": 1.982303631339865e-06, + "loss": 0.7153, + "step": 10321 + }, + { + "epoch": 0.26, + "learning_rate": 1.982298448414418e-06, + "loss": 1.1318, + "step": 10322 + }, + { + "epoch": 0.26, + "learning_rate": 1.9822932647368706e-06, + "loss": 0.9102, + "step": 10323 + }, + { + "epoch": 0.26, + "learning_rate": 1.982288080307226e-06, + "loss": 0.7764, + "step": 10324 + }, + { + "epoch": 0.26, + "learning_rate": 1.9822828951254887e-06, + "loss": 0.9316, + "step": 10325 + }, + { + "epoch": 0.26, + "learning_rate": 1.982277709191663e-06, + "loss": 0.7441, + "step": 10326 + }, + { + "epoch": 0.26, + "learning_rate": 1.9822725225057516e-06, + "loss": 1.0029, + "step": 10327 + }, + { + "epoch": 0.26, + "learning_rate": 1.98226733506776e-06, + "loss": 0.646, + "step": 10328 + }, + { + "epoch": 0.26, + "learning_rate": 1.982262146877691e-06, + "loss": 0.5181, + "step": 10329 + }, + { + "epoch": 0.26, + "learning_rate": 1.9822569579355493e-06, + "loss": 0.9561, + "step": 10330 + }, + { + "epoch": 0.26, + "learning_rate": 1.9822517682413383e-06, + "loss": 0.8525, + "step": 10331 + }, + { + "epoch": 0.26, + "learning_rate": 1.982246577795063e-06, + "loss": 0.9336, + "step": 10332 + }, + { + "epoch": 0.26, + "learning_rate": 1.9822413865967257e-06, + "loss": 0.8052, + "step": 10333 + }, + { + "epoch": 0.26, + "learning_rate": 1.9822361946463324e-06, + "loss": 1.0352, + "step": 10334 + }, + { + "epoch": 0.26, + "learning_rate": 1.982231001943885e-06, + "loss": 0.79, + "step": 10335 + }, + { + "epoch": 0.26, + "learning_rate": 1.982225808489389e-06, + "loss": 0.6455, + "step": 10336 + }, + { + "epoch": 0.26, + "learning_rate": 1.982220614282848e-06, + "loss": 1.0977, + "step": 10337 + }, + { + "epoch": 0.26, + "learning_rate": 1.9822154193242654e-06, + "loss": 0.7891, + "step": 10338 + }, + { + "epoch": 0.26, + "learning_rate": 1.982210223613646e-06, + "loss": 1.0293, + "step": 10339 + }, + { + "epoch": 0.27, + "learning_rate": 1.982205027150993e-06, + "loss": 0.8867, + "step": 10340 + }, + { + "epoch": 0.27, + "learning_rate": 1.982199829936311e-06, + "loss": 0.8877, + "step": 10341 + }, + { + "epoch": 0.27, + "learning_rate": 1.982194631969604e-06, + "loss": 0.8599, + "step": 10342 + }, + { + "epoch": 0.27, + "learning_rate": 1.9821894332508754e-06, + "loss": 0.8652, + "step": 10343 + }, + { + "epoch": 0.27, + "learning_rate": 1.9821842337801298e-06, + "loss": 0.8223, + "step": 10344 + }, + { + "epoch": 0.27, + "learning_rate": 1.9821790335573705e-06, + "loss": 0.8701, + "step": 10345 + }, + { + "epoch": 0.27, + "learning_rate": 1.9821738325826018e-06, + "loss": 0.9551, + "step": 10346 + }, + { + "epoch": 0.27, + "learning_rate": 1.982168630855828e-06, + "loss": 0.9775, + "step": 10347 + }, + { + "epoch": 0.27, + "learning_rate": 1.982163428377053e-06, + "loss": 0.958, + "step": 10348 + }, + { + "epoch": 0.27, + "learning_rate": 1.9821582251462807e-06, + "loss": 0.9209, + "step": 10349 + }, + { + "epoch": 0.27, + "learning_rate": 1.9821530211635146e-06, + "loss": 0.8193, + "step": 10350 + }, + { + "epoch": 0.27, + "learning_rate": 1.9821478164287595e-06, + "loss": 0.9775, + "step": 10351 + }, + { + "epoch": 0.27, + "learning_rate": 1.9821426109420186e-06, + "loss": 0.6221, + "step": 10352 + }, + { + "epoch": 0.27, + "learning_rate": 1.9821374047032963e-06, + "loss": 1.1152, + "step": 10353 + }, + { + "epoch": 0.27, + "learning_rate": 1.982132197712597e-06, + "loss": 0.9053, + "step": 10354 + }, + { + "epoch": 0.27, + "learning_rate": 1.982126989969924e-06, + "loss": 1.1475, + "step": 10355 + }, + { + "epoch": 0.27, + "learning_rate": 1.9821217814752814e-06, + "loss": 0.8799, + "step": 10356 + }, + { + "epoch": 0.27, + "learning_rate": 1.982116572228673e-06, + "loss": 0.7275, + "step": 10357 + }, + { + "epoch": 0.27, + "learning_rate": 1.9821113622301037e-06, + "loss": 0.8936, + "step": 10358 + }, + { + "epoch": 0.27, + "learning_rate": 1.9821061514795765e-06, + "loss": 0.9102, + "step": 10359 + }, + { + "epoch": 0.27, + "learning_rate": 1.982100939977096e-06, + "loss": 0.9365, + "step": 10360 + }, + { + "epoch": 0.27, + "learning_rate": 1.982095727722666e-06, + "loss": 0.6919, + "step": 10361 + }, + { + "epoch": 0.27, + "learning_rate": 1.98209051471629e-06, + "loss": 1.1367, + "step": 10362 + }, + { + "epoch": 0.27, + "learning_rate": 1.982085300957973e-06, + "loss": 1.1172, + "step": 10363 + }, + { + "epoch": 0.27, + "learning_rate": 1.9820800864477183e-06, + "loss": 1.0527, + "step": 10364 + }, + { + "epoch": 0.27, + "learning_rate": 1.9820748711855303e-06, + "loss": 0.6191, + "step": 10365 + }, + { + "epoch": 0.27, + "learning_rate": 1.982069655171412e-06, + "loss": 1.0273, + "step": 10366 + }, + { + "epoch": 0.27, + "learning_rate": 1.982064438405369e-06, + "loss": 0.9707, + "step": 10367 + }, + { + "epoch": 0.27, + "learning_rate": 1.9820592208874037e-06, + "loss": 1.0596, + "step": 10368 + }, + { + "epoch": 0.27, + "learning_rate": 1.982054002617521e-06, + "loss": 0.7534, + "step": 10369 + }, + { + "epoch": 0.27, + "learning_rate": 1.982048783595725e-06, + "loss": 0.8369, + "step": 10370 + }, + { + "epoch": 0.27, + "learning_rate": 1.9820435638220188e-06, + "loss": 0.5999, + "step": 10371 + }, + { + "epoch": 0.27, + "learning_rate": 1.9820383432964074e-06, + "loss": 1.0391, + "step": 10372 + }, + { + "epoch": 0.27, + "learning_rate": 1.9820331220188943e-06, + "loss": 0.7764, + "step": 10373 + }, + { + "epoch": 0.27, + "learning_rate": 1.982027899989484e-06, + "loss": 0.7363, + "step": 10374 + }, + { + "epoch": 0.27, + "learning_rate": 1.9820226772081793e-06, + "loss": 0.6836, + "step": 10375 + }, + { + "epoch": 0.27, + "learning_rate": 1.9820174536749857e-06, + "loss": 0.9834, + "step": 10376 + }, + { + "epoch": 0.27, + "learning_rate": 1.9820122293899062e-06, + "loss": 0.9194, + "step": 10377 + }, + { + "epoch": 0.27, + "learning_rate": 1.982007004352945e-06, + "loss": 1.0879, + "step": 10378 + }, + { + "epoch": 0.27, + "learning_rate": 1.9820017785641063e-06, + "loss": 1.1309, + "step": 10379 + }, + { + "epoch": 0.27, + "learning_rate": 1.9819965520233942e-06, + "loss": 0.8037, + "step": 10380 + }, + { + "epoch": 0.27, + "learning_rate": 1.981991324730812e-06, + "loss": 0.8301, + "step": 10381 + }, + { + "epoch": 0.27, + "learning_rate": 1.9819860966863646e-06, + "loss": 0.9902, + "step": 10382 + }, + { + "epoch": 0.27, + "learning_rate": 1.9819808678900554e-06, + "loss": 0.4985, + "step": 10383 + }, + { + "epoch": 0.27, + "learning_rate": 1.981975638341889e-06, + "loss": 0.7568, + "step": 10384 + }, + { + "epoch": 0.27, + "learning_rate": 1.9819704080418685e-06, + "loss": 0.7842, + "step": 10385 + }, + { + "epoch": 0.27, + "learning_rate": 1.9819651769899987e-06, + "loss": 0.8672, + "step": 10386 + }, + { + "epoch": 0.27, + "learning_rate": 1.981959945186283e-06, + "loss": 0.8359, + "step": 10387 + }, + { + "epoch": 0.27, + "learning_rate": 1.981954712630726e-06, + "loss": 0.9658, + "step": 10388 + }, + { + "epoch": 0.27, + "learning_rate": 1.9819494793233316e-06, + "loss": 0.7188, + "step": 10389 + }, + { + "epoch": 0.27, + "learning_rate": 1.9819442452641035e-06, + "loss": 0.834, + "step": 10390 + }, + { + "epoch": 0.27, + "learning_rate": 1.9819390104530456e-06, + "loss": 0.9824, + "step": 10391 + }, + { + "epoch": 0.27, + "learning_rate": 1.9819337748901625e-06, + "loss": 0.8916, + "step": 10392 + }, + { + "epoch": 0.27, + "learning_rate": 1.9819285385754572e-06, + "loss": 0.8584, + "step": 10393 + }, + { + "epoch": 0.27, + "learning_rate": 1.9819233015089353e-06, + "loss": 1.0098, + "step": 10394 + }, + { + "epoch": 0.27, + "learning_rate": 1.981918063690599e-06, + "loss": 0.8828, + "step": 10395 + }, + { + "epoch": 0.27, + "learning_rate": 1.981912825120454e-06, + "loss": 1.0068, + "step": 10396 + }, + { + "epoch": 0.27, + "learning_rate": 1.981907585798503e-06, + "loss": 0.9736, + "step": 10397 + }, + { + "epoch": 0.27, + "learning_rate": 1.98190234572475e-06, + "loss": 0.79, + "step": 10398 + }, + { + "epoch": 0.27, + "learning_rate": 1.9818971048992006e-06, + "loss": 0.8848, + "step": 10399 + }, + { + "epoch": 0.27, + "learning_rate": 1.981891863321857e-06, + "loss": 0.8223, + "step": 10400 + }, + { + "epoch": 0.27, + "learning_rate": 1.9818866209927245e-06, + "loss": 0.8467, + "step": 10401 + }, + { + "epoch": 0.27, + "learning_rate": 1.981881377911806e-06, + "loss": 0.9893, + "step": 10402 + }, + { + "epoch": 0.27, + "learning_rate": 1.9818761340791066e-06, + "loss": 1.0293, + "step": 10403 + }, + { + "epoch": 0.27, + "learning_rate": 1.9818708894946298e-06, + "loss": 0.9346, + "step": 10404 + }, + { + "epoch": 0.27, + "learning_rate": 1.981865644158379e-06, + "loss": 0.793, + "step": 10405 + }, + { + "epoch": 0.27, + "learning_rate": 1.9818603980703594e-06, + "loss": 0.8926, + "step": 10406 + }, + { + "epoch": 0.27, + "learning_rate": 1.9818551512305743e-06, + "loss": 1.0918, + "step": 10407 + }, + { + "epoch": 0.27, + "learning_rate": 1.9818499036390276e-06, + "loss": 0.9248, + "step": 10408 + }, + { + "epoch": 0.27, + "learning_rate": 1.9818446552957235e-06, + "loss": 0.9375, + "step": 10409 + }, + { + "epoch": 0.27, + "learning_rate": 1.9818394062006666e-06, + "loss": 0.9453, + "step": 10410 + }, + { + "epoch": 0.27, + "learning_rate": 1.98183415635386e-06, + "loss": 0.8828, + "step": 10411 + }, + { + "epoch": 0.27, + "learning_rate": 1.9818289057553085e-06, + "loss": 0.751, + "step": 10412 + }, + { + "epoch": 0.27, + "learning_rate": 1.9818236544050154e-06, + "loss": 0.8594, + "step": 10413 + }, + { + "epoch": 0.27, + "learning_rate": 1.9818184023029852e-06, + "loss": 1.0, + "step": 10414 + }, + { + "epoch": 0.27, + "learning_rate": 1.9818131494492218e-06, + "loss": 0.8408, + "step": 10415 + }, + { + "epoch": 0.27, + "learning_rate": 1.9818078958437293e-06, + "loss": 1.0254, + "step": 10416 + }, + { + "epoch": 0.27, + "learning_rate": 1.9818026414865116e-06, + "loss": 1.0723, + "step": 10417 + }, + { + "epoch": 0.27, + "learning_rate": 1.981797386377573e-06, + "loss": 0.5859, + "step": 10418 + }, + { + "epoch": 0.27, + "learning_rate": 1.9817921305169165e-06, + "loss": 0.9326, + "step": 10419 + }, + { + "epoch": 0.27, + "learning_rate": 1.9817868739045477e-06, + "loss": 0.9512, + "step": 10420 + }, + { + "epoch": 0.27, + "learning_rate": 1.9817816165404693e-06, + "loss": 1.0908, + "step": 10421 + }, + { + "epoch": 0.27, + "learning_rate": 1.9817763584246865e-06, + "loss": 0.8394, + "step": 10422 + }, + { + "epoch": 0.27, + "learning_rate": 1.981771099557202e-06, + "loss": 1.0508, + "step": 10423 + }, + { + "epoch": 0.27, + "learning_rate": 1.981765839938021e-06, + "loss": 0.8218, + "step": 10424 + }, + { + "epoch": 0.27, + "learning_rate": 1.9817605795671466e-06, + "loss": 0.9263, + "step": 10425 + }, + { + "epoch": 0.27, + "learning_rate": 1.9817553184445836e-06, + "loss": 0.8848, + "step": 10426 + }, + { + "epoch": 0.27, + "learning_rate": 1.9817500565703356e-06, + "loss": 0.6201, + "step": 10427 + }, + { + "epoch": 0.27, + "learning_rate": 1.9817447939444068e-06, + "loss": 0.8779, + "step": 10428 + }, + { + "epoch": 0.27, + "learning_rate": 1.981739530566801e-06, + "loss": 0.8555, + "step": 10429 + }, + { + "epoch": 0.27, + "learning_rate": 1.9817342664375226e-06, + "loss": 0.8374, + "step": 10430 + }, + { + "epoch": 0.27, + "learning_rate": 1.9817290015565753e-06, + "loss": 0.897, + "step": 10431 + }, + { + "epoch": 0.27, + "learning_rate": 1.9817237359239633e-06, + "loss": 0.9248, + "step": 10432 + }, + { + "epoch": 0.27, + "learning_rate": 1.9817184695396904e-06, + "loss": 1.1494, + "step": 10433 + }, + { + "epoch": 0.27, + "learning_rate": 1.981713202403761e-06, + "loss": 0.9219, + "step": 10434 + }, + { + "epoch": 0.27, + "learning_rate": 1.9817079345161787e-06, + "loss": 0.8799, + "step": 10435 + }, + { + "epoch": 0.27, + "learning_rate": 1.981702665876948e-06, + "loss": 0.9385, + "step": 10436 + }, + { + "epoch": 0.27, + "learning_rate": 1.9816973964860727e-06, + "loss": 1.0215, + "step": 10437 + }, + { + "epoch": 0.27, + "learning_rate": 1.9816921263435566e-06, + "loss": 0.9238, + "step": 10438 + }, + { + "epoch": 0.27, + "learning_rate": 1.9816868554494042e-06, + "loss": 0.7822, + "step": 10439 + }, + { + "epoch": 0.27, + "learning_rate": 1.9816815838036194e-06, + "loss": 1.0078, + "step": 10440 + }, + { + "epoch": 0.27, + "learning_rate": 1.981676311406206e-06, + "loss": 0.9121, + "step": 10441 + }, + { + "epoch": 0.27, + "learning_rate": 1.981671038257168e-06, + "loss": 1.0718, + "step": 10442 + }, + { + "epoch": 0.27, + "learning_rate": 1.98166576435651e-06, + "loss": 0.9775, + "step": 10443 + }, + { + "epoch": 0.27, + "learning_rate": 1.9816604897042356e-06, + "loss": 0.689, + "step": 10444 + }, + { + "epoch": 0.27, + "learning_rate": 1.9816552143003485e-06, + "loss": 0.9053, + "step": 10445 + }, + { + "epoch": 0.27, + "learning_rate": 1.9816499381448535e-06, + "loss": 0.9443, + "step": 10446 + }, + { + "epoch": 0.27, + "learning_rate": 1.9816446612377544e-06, + "loss": 1.1562, + "step": 10447 + }, + { + "epoch": 0.27, + "learning_rate": 1.9816393835790546e-06, + "loss": 0.958, + "step": 10448 + }, + { + "epoch": 0.27, + "learning_rate": 1.981634105168759e-06, + "loss": 0.9346, + "step": 10449 + }, + { + "epoch": 0.27, + "learning_rate": 1.9816288260068715e-06, + "loss": 0.9844, + "step": 10450 + }, + { + "epoch": 0.27, + "learning_rate": 1.981623546093396e-06, + "loss": 0.7563, + "step": 10451 + }, + { + "epoch": 0.27, + "learning_rate": 1.981618265428336e-06, + "loss": 0.9023, + "step": 10452 + }, + { + "epoch": 0.27, + "learning_rate": 1.981612984011696e-06, + "loss": 0.7944, + "step": 10453 + }, + { + "epoch": 0.27, + "learning_rate": 1.9816077018434806e-06, + "loss": 0.9893, + "step": 10454 + }, + { + "epoch": 0.27, + "learning_rate": 1.981602418923693e-06, + "loss": 0.999, + "step": 10455 + }, + { + "epoch": 0.27, + "learning_rate": 1.9815971352523376e-06, + "loss": 0.8774, + "step": 10456 + }, + { + "epoch": 0.27, + "learning_rate": 1.9815918508294186e-06, + "loss": 1.0791, + "step": 10457 + }, + { + "epoch": 0.27, + "learning_rate": 1.9815865656549395e-06, + "loss": 0.9307, + "step": 10458 + }, + { + "epoch": 0.27, + "learning_rate": 1.981581279728905e-06, + "loss": 1.0234, + "step": 10459 + }, + { + "epoch": 0.27, + "learning_rate": 1.9815759930513186e-06, + "loss": 0.8926, + "step": 10460 + }, + { + "epoch": 0.27, + "learning_rate": 1.981570705622185e-06, + "loss": 1.0586, + "step": 10461 + }, + { + "epoch": 0.27, + "learning_rate": 1.9815654174415075e-06, + "loss": 1.043, + "step": 10462 + }, + { + "epoch": 0.27, + "learning_rate": 1.9815601285092904e-06, + "loss": 1.0312, + "step": 10463 + }, + { + "epoch": 0.27, + "learning_rate": 1.981554838825538e-06, + "loss": 0.7996, + "step": 10464 + }, + { + "epoch": 0.27, + "learning_rate": 1.981549548390254e-06, + "loss": 0.8315, + "step": 10465 + }, + { + "epoch": 0.27, + "learning_rate": 1.9815442572034433e-06, + "loss": 0.8125, + "step": 10466 + }, + { + "epoch": 0.27, + "learning_rate": 1.981538965265109e-06, + "loss": 0.9346, + "step": 10467 + }, + { + "epoch": 0.27, + "learning_rate": 1.981533672575255e-06, + "loss": 0.9824, + "step": 10468 + }, + { + "epoch": 0.27, + "learning_rate": 1.981528379133886e-06, + "loss": 1.0947, + "step": 10469 + }, + { + "epoch": 0.27, + "learning_rate": 1.9815230849410056e-06, + "loss": 1.1025, + "step": 10470 + }, + { + "epoch": 0.27, + "learning_rate": 1.981517789996619e-06, + "loss": 1.1113, + "step": 10471 + }, + { + "epoch": 0.27, + "learning_rate": 1.9815124943007287e-06, + "loss": 0.8633, + "step": 10472 + }, + { + "epoch": 0.27, + "learning_rate": 1.9815071978533397e-06, + "loss": 0.7578, + "step": 10473 + }, + { + "epoch": 0.27, + "learning_rate": 1.9815019006544555e-06, + "loss": 1.0986, + "step": 10474 + }, + { + "epoch": 0.27, + "learning_rate": 1.9814966027040802e-06, + "loss": 0.8799, + "step": 10475 + }, + { + "epoch": 0.27, + "learning_rate": 1.9814913040022186e-06, + "loss": 1.0596, + "step": 10476 + }, + { + "epoch": 0.27, + "learning_rate": 1.981486004548874e-06, + "loss": 0.8613, + "step": 10477 + }, + { + "epoch": 0.27, + "learning_rate": 1.9814807043440507e-06, + "loss": 0.6587, + "step": 10478 + }, + { + "epoch": 0.27, + "learning_rate": 1.981475403387753e-06, + "loss": 1.0059, + "step": 10479 + }, + { + "epoch": 0.27, + "learning_rate": 1.9814701016799844e-06, + "loss": 0.7305, + "step": 10480 + }, + { + "epoch": 0.27, + "learning_rate": 1.9814647992207494e-06, + "loss": 1.0527, + "step": 10481 + }, + { + "epoch": 0.27, + "learning_rate": 1.9814594960100518e-06, + "loss": 1.0859, + "step": 10482 + }, + { + "epoch": 0.27, + "learning_rate": 1.981454192047896e-06, + "loss": 0.7754, + "step": 10483 + }, + { + "epoch": 0.27, + "learning_rate": 1.9814488873342856e-06, + "loss": 0.7202, + "step": 10484 + }, + { + "epoch": 0.27, + "learning_rate": 1.981443581869225e-06, + "loss": 0.7979, + "step": 10485 + }, + { + "epoch": 0.27, + "learning_rate": 1.9814382756527183e-06, + "loss": 0.9141, + "step": 10486 + }, + { + "epoch": 0.27, + "learning_rate": 1.9814329686847693e-06, + "loss": 0.9404, + "step": 10487 + }, + { + "epoch": 0.27, + "learning_rate": 1.9814276609653823e-06, + "loss": 0.9404, + "step": 10488 + }, + { + "epoch": 0.27, + "learning_rate": 1.9814223524945613e-06, + "loss": 0.8018, + "step": 10489 + }, + { + "epoch": 0.27, + "learning_rate": 1.9814170432723104e-06, + "loss": 0.9258, + "step": 10490 + }, + { + "epoch": 0.27, + "learning_rate": 1.981411733298633e-06, + "loss": 1.1484, + "step": 10491 + }, + { + "epoch": 0.27, + "learning_rate": 1.9814064225735345e-06, + "loss": 0.9385, + "step": 10492 + }, + { + "epoch": 0.27, + "learning_rate": 1.981401111097018e-06, + "loss": 0.958, + "step": 10493 + }, + { + "epoch": 0.27, + "learning_rate": 1.9813957988690876e-06, + "loss": 1.0576, + "step": 10494 + }, + { + "epoch": 0.27, + "learning_rate": 1.9813904858897483e-06, + "loss": 0.8521, + "step": 10495 + }, + { + "epoch": 0.27, + "learning_rate": 1.9813851721590023e-06, + "loss": 0.9697, + "step": 10496 + }, + { + "epoch": 0.27, + "learning_rate": 1.981379857676856e-06, + "loss": 0.9824, + "step": 10497 + }, + { + "epoch": 0.27, + "learning_rate": 1.981374542443311e-06, + "loss": 0.6826, + "step": 10498 + }, + { + "epoch": 0.27, + "learning_rate": 1.9813692264583733e-06, + "loss": 0.5854, + "step": 10499 + }, + { + "epoch": 0.27, + "learning_rate": 1.9813639097220465e-06, + "loss": 0.834, + "step": 10500 + }, + { + "epoch": 0.27, + "learning_rate": 1.981358592234334e-06, + "loss": 0.6577, + "step": 10501 + }, + { + "epoch": 0.27, + "learning_rate": 1.981353273995241e-06, + "loss": 0.8481, + "step": 10502 + }, + { + "epoch": 0.27, + "learning_rate": 1.98134795500477e-06, + "loss": 1.1094, + "step": 10503 + }, + { + "epoch": 0.27, + "learning_rate": 1.981342635262927e-06, + "loss": 0.9209, + "step": 10504 + }, + { + "epoch": 0.27, + "learning_rate": 1.9813373147697145e-06, + "loss": 0.9814, + "step": 10505 + }, + { + "epoch": 0.27, + "learning_rate": 1.981331993525137e-06, + "loss": 0.9062, + "step": 10506 + }, + { + "epoch": 0.27, + "learning_rate": 1.981326671529199e-06, + "loss": 0.877, + "step": 10507 + }, + { + "epoch": 0.27, + "learning_rate": 1.981321348781904e-06, + "loss": 1.0156, + "step": 10508 + }, + { + "epoch": 0.27, + "learning_rate": 1.9813160252832567e-06, + "loss": 0.7354, + "step": 10509 + }, + { + "epoch": 0.27, + "learning_rate": 1.9813107010332606e-06, + "loss": 1.1396, + "step": 10510 + }, + { + "epoch": 0.27, + "learning_rate": 1.9813053760319204e-06, + "loss": 1.0225, + "step": 10511 + }, + { + "epoch": 0.27, + "learning_rate": 1.9813000502792396e-06, + "loss": 0.9678, + "step": 10512 + }, + { + "epoch": 0.27, + "learning_rate": 1.9812947237752223e-06, + "loss": 1.0166, + "step": 10513 + }, + { + "epoch": 0.27, + "learning_rate": 1.9812893965198733e-06, + "loss": 0.8711, + "step": 10514 + }, + { + "epoch": 0.27, + "learning_rate": 1.9812840685131955e-06, + "loss": 1.0234, + "step": 10515 + }, + { + "epoch": 0.27, + "learning_rate": 1.981278739755194e-06, + "loss": 0.9443, + "step": 10516 + }, + { + "epoch": 0.27, + "learning_rate": 1.981273410245872e-06, + "loss": 1.0859, + "step": 10517 + }, + { + "epoch": 0.27, + "learning_rate": 1.9812680799852343e-06, + "loss": 1.0703, + "step": 10518 + }, + { + "epoch": 0.27, + "learning_rate": 1.981262748973285e-06, + "loss": 0.8115, + "step": 10519 + }, + { + "epoch": 0.27, + "learning_rate": 1.9812574172100277e-06, + "loss": 0.8779, + "step": 10520 + }, + { + "epoch": 0.27, + "learning_rate": 1.981252084695467e-06, + "loss": 0.9248, + "step": 10521 + }, + { + "epoch": 0.27, + "learning_rate": 1.9812467514296063e-06, + "loss": 0.9824, + "step": 10522 + }, + { + "epoch": 0.27, + "learning_rate": 1.98124141741245e-06, + "loss": 0.9824, + "step": 10523 + }, + { + "epoch": 0.27, + "learning_rate": 1.9812360826440025e-06, + "loss": 0.9795, + "step": 10524 + }, + { + "epoch": 0.27, + "learning_rate": 1.981230747124268e-06, + "loss": 1.0908, + "step": 10525 + }, + { + "epoch": 0.27, + "learning_rate": 1.98122541085325e-06, + "loss": 0.9531, + "step": 10526 + }, + { + "epoch": 0.27, + "learning_rate": 1.9812200738309525e-06, + "loss": 0.875, + "step": 10527 + }, + { + "epoch": 0.27, + "learning_rate": 1.98121473605738e-06, + "loss": 0.8799, + "step": 10528 + }, + { + "epoch": 0.27, + "learning_rate": 1.9812093975325367e-06, + "loss": 0.8672, + "step": 10529 + }, + { + "epoch": 0.27, + "learning_rate": 1.9812040582564264e-06, + "loss": 0.8916, + "step": 10530 + }, + { + "epoch": 0.27, + "learning_rate": 1.9811987182290534e-06, + "loss": 0.916, + "step": 10531 + }, + { + "epoch": 0.27, + "learning_rate": 1.9811933774504214e-06, + "loss": 0.8525, + "step": 10532 + }, + { + "epoch": 0.27, + "learning_rate": 1.9811880359205347e-06, + "loss": 0.9863, + "step": 10533 + }, + { + "epoch": 0.27, + "learning_rate": 1.9811826936393976e-06, + "loss": 1.1143, + "step": 10534 + }, + { + "epoch": 0.27, + "learning_rate": 1.9811773506070143e-06, + "loss": 0.833, + "step": 10535 + }, + { + "epoch": 0.27, + "learning_rate": 1.9811720068233885e-06, + "loss": 0.957, + "step": 10536 + }, + { + "epoch": 0.27, + "learning_rate": 1.981166662288524e-06, + "loss": 0.9854, + "step": 10537 + }, + { + "epoch": 0.27, + "learning_rate": 1.981161317002426e-06, + "loss": 0.8682, + "step": 10538 + }, + { + "epoch": 0.27, + "learning_rate": 1.981155970965097e-06, + "loss": 0.792, + "step": 10539 + }, + { + "epoch": 0.27, + "learning_rate": 1.9811506241765426e-06, + "loss": 1.1172, + "step": 10540 + }, + { + "epoch": 0.27, + "learning_rate": 1.981145276636766e-06, + "loss": 0.9785, + "step": 10541 + }, + { + "epoch": 0.27, + "learning_rate": 1.981139928345772e-06, + "loss": 0.9971, + "step": 10542 + }, + { + "epoch": 0.27, + "learning_rate": 1.981134579303564e-06, + "loss": 0.9551, + "step": 10543 + }, + { + "epoch": 0.27, + "learning_rate": 1.981129229510146e-06, + "loss": 0.9248, + "step": 10544 + }, + { + "epoch": 0.27, + "learning_rate": 1.981123878965523e-06, + "loss": 0.959, + "step": 10545 + }, + { + "epoch": 0.27, + "learning_rate": 1.9811185276696985e-06, + "loss": 0.7686, + "step": 10546 + }, + { + "epoch": 0.27, + "learning_rate": 1.9811131756226764e-06, + "loss": 0.8813, + "step": 10547 + }, + { + "epoch": 0.27, + "learning_rate": 1.981107822824461e-06, + "loss": 0.8408, + "step": 10548 + }, + { + "epoch": 0.27, + "learning_rate": 1.981102469275057e-06, + "loss": 0.8643, + "step": 10549 + }, + { + "epoch": 0.27, + "learning_rate": 1.9810971149744672e-06, + "loss": 0.9551, + "step": 10550 + }, + { + "epoch": 0.27, + "learning_rate": 1.981091759922697e-06, + "loss": 0.9863, + "step": 10551 + }, + { + "epoch": 0.27, + "learning_rate": 1.98108640411975e-06, + "loss": 0.9463, + "step": 10552 + }, + { + "epoch": 0.27, + "learning_rate": 1.98108104756563e-06, + "loss": 1.0391, + "step": 10553 + }, + { + "epoch": 0.27, + "learning_rate": 1.981075690260341e-06, + "loss": 0.8857, + "step": 10554 + }, + { + "epoch": 0.27, + "learning_rate": 1.9810703322038884e-06, + "loss": 0.7388, + "step": 10555 + }, + { + "epoch": 0.27, + "learning_rate": 1.9810649733962745e-06, + "loss": 1.0215, + "step": 10556 + }, + { + "epoch": 0.27, + "learning_rate": 1.9810596138375046e-06, + "loss": 0.6738, + "step": 10557 + }, + { + "epoch": 0.27, + "learning_rate": 1.9810542535275825e-06, + "loss": 0.6782, + "step": 10558 + }, + { + "epoch": 0.27, + "learning_rate": 1.981048892466512e-06, + "loss": 0.5791, + "step": 10559 + }, + { + "epoch": 0.27, + "learning_rate": 1.9810435306542977e-06, + "loss": 0.9746, + "step": 10560 + }, + { + "epoch": 0.27, + "learning_rate": 1.9810381680909435e-06, + "loss": 1.0557, + "step": 10561 + }, + { + "epoch": 0.27, + "learning_rate": 1.9810328047764537e-06, + "loss": 0.9639, + "step": 10562 + }, + { + "epoch": 0.27, + "learning_rate": 1.981027440710832e-06, + "loss": 0.8262, + "step": 10563 + }, + { + "epoch": 0.27, + "learning_rate": 1.981022075894082e-06, + "loss": 0.7852, + "step": 10564 + }, + { + "epoch": 0.27, + "learning_rate": 1.9810167103262093e-06, + "loss": 0.9023, + "step": 10565 + }, + { + "epoch": 0.27, + "learning_rate": 1.9810113440072174e-06, + "loss": 0.7744, + "step": 10566 + }, + { + "epoch": 0.27, + "learning_rate": 1.9810059769371097e-06, + "loss": 0.8799, + "step": 10567 + }, + { + "epoch": 0.27, + "learning_rate": 1.9810006091158908e-06, + "loss": 0.8203, + "step": 10568 + }, + { + "epoch": 0.27, + "learning_rate": 1.980995240543565e-06, + "loss": 0.959, + "step": 10569 + }, + { + "epoch": 0.27, + "learning_rate": 1.9809898712201366e-06, + "loss": 0.8838, + "step": 10570 + }, + { + "epoch": 0.27, + "learning_rate": 1.980984501145609e-06, + "loss": 0.9189, + "step": 10571 + }, + { + "epoch": 0.27, + "learning_rate": 1.9809791303199867e-06, + "loss": 0.834, + "step": 10572 + }, + { + "epoch": 0.27, + "learning_rate": 1.9809737587432736e-06, + "loss": 1.0234, + "step": 10573 + }, + { + "epoch": 0.27, + "learning_rate": 1.9809683864154744e-06, + "loss": 0.8857, + "step": 10574 + }, + { + "epoch": 0.27, + "learning_rate": 1.980963013336593e-06, + "loss": 1.1973, + "step": 10575 + }, + { + "epoch": 0.27, + "learning_rate": 1.9809576395066324e-06, + "loss": 0.875, + "step": 10576 + }, + { + "epoch": 0.27, + "learning_rate": 1.9809522649255985e-06, + "loss": 0.9248, + "step": 10577 + }, + { + "epoch": 0.27, + "learning_rate": 1.980946889593494e-06, + "loss": 1.0703, + "step": 10578 + }, + { + "epoch": 0.27, + "learning_rate": 1.980941513510324e-06, + "loss": 0.9736, + "step": 10579 + }, + { + "epoch": 0.27, + "learning_rate": 1.980936136676092e-06, + "loss": 0.8916, + "step": 10580 + }, + { + "epoch": 0.27, + "learning_rate": 1.980930759090802e-06, + "loss": 0.9463, + "step": 10581 + }, + { + "epoch": 0.27, + "learning_rate": 1.980925380754459e-06, + "loss": 0.9961, + "step": 10582 + }, + { + "epoch": 0.27, + "learning_rate": 1.9809200016670664e-06, + "loss": 0.8857, + "step": 10583 + }, + { + "epoch": 0.27, + "learning_rate": 1.980914621828628e-06, + "loss": 0.6204, + "step": 10584 + }, + { + "epoch": 0.27, + "learning_rate": 1.980909241239149e-06, + "loss": 0.9561, + "step": 10585 + }, + { + "epoch": 0.27, + "learning_rate": 1.9809038598986326e-06, + "loss": 0.7666, + "step": 10586 + }, + { + "epoch": 0.27, + "learning_rate": 1.980898477807083e-06, + "loss": 0.9463, + "step": 10587 + }, + { + "epoch": 0.27, + "learning_rate": 1.9808930949645047e-06, + "loss": 0.9756, + "step": 10588 + }, + { + "epoch": 0.27, + "learning_rate": 1.980887711370902e-06, + "loss": 0.9297, + "step": 10589 + }, + { + "epoch": 0.27, + "learning_rate": 1.9808823270262783e-06, + "loss": 1.207, + "step": 10590 + }, + { + "epoch": 0.27, + "learning_rate": 1.980876941930638e-06, + "loss": 1.0205, + "step": 10591 + }, + { + "epoch": 0.27, + "learning_rate": 1.9808715560839855e-06, + "loss": 0.7939, + "step": 10592 + }, + { + "epoch": 0.27, + "learning_rate": 1.980866169486325e-06, + "loss": 0.8906, + "step": 10593 + }, + { + "epoch": 0.27, + "learning_rate": 1.98086078213766e-06, + "loss": 1.0664, + "step": 10594 + }, + { + "epoch": 0.27, + "learning_rate": 1.9808553940379955e-06, + "loss": 0.9443, + "step": 10595 + }, + { + "epoch": 0.27, + "learning_rate": 1.9808500051873346e-06, + "loss": 0.8921, + "step": 10596 + }, + { + "epoch": 0.27, + "learning_rate": 1.980844615585682e-06, + "loss": 0.8965, + "step": 10597 + }, + { + "epoch": 0.27, + "learning_rate": 1.980839225233042e-06, + "loss": 0.8105, + "step": 10598 + }, + { + "epoch": 0.27, + "learning_rate": 1.9808338341294184e-06, + "loss": 0.7417, + "step": 10599 + }, + { + "epoch": 0.27, + "learning_rate": 1.980828442274816e-06, + "loss": 0.9033, + "step": 10600 + }, + { + "epoch": 0.27, + "learning_rate": 1.9808230496692376e-06, + "loss": 1.0225, + "step": 10601 + }, + { + "epoch": 0.27, + "learning_rate": 1.980817656312688e-06, + "loss": 1.1035, + "step": 10602 + }, + { + "epoch": 0.27, + "learning_rate": 1.980812262205172e-06, + "loss": 0.9395, + "step": 10603 + }, + { + "epoch": 0.27, + "learning_rate": 1.980806867346693e-06, + "loss": 0.6216, + "step": 10604 + }, + { + "epoch": 0.27, + "learning_rate": 1.980801471737255e-06, + "loss": 0.9219, + "step": 10605 + }, + { + "epoch": 0.27, + "learning_rate": 1.9807960753768623e-06, + "loss": 0.958, + "step": 10606 + }, + { + "epoch": 0.27, + "learning_rate": 1.9807906782655194e-06, + "loss": 0.7266, + "step": 10607 + }, + { + "epoch": 0.27, + "learning_rate": 1.98078528040323e-06, + "loss": 0.9863, + "step": 10608 + }, + { + "epoch": 0.27, + "learning_rate": 1.980779881789999e-06, + "loss": 0.8535, + "step": 10609 + }, + { + "epoch": 0.27, + "learning_rate": 1.9807744824258294e-06, + "loss": 1.1914, + "step": 10610 + }, + { + "epoch": 0.27, + "learning_rate": 1.980769082310726e-06, + "loss": 0.9229, + "step": 10611 + }, + { + "epoch": 0.27, + "learning_rate": 1.980763681444693e-06, + "loss": 0.7285, + "step": 10612 + }, + { + "epoch": 0.27, + "learning_rate": 1.980758279827734e-06, + "loss": 0.9541, + "step": 10613 + }, + { + "epoch": 0.27, + "learning_rate": 1.980752877459854e-06, + "loss": 1.1641, + "step": 10614 + }, + { + "epoch": 0.27, + "learning_rate": 1.980747474341056e-06, + "loss": 0.9854, + "step": 10615 + }, + { + "epoch": 0.27, + "learning_rate": 1.980742070471345e-06, + "loss": 1.0049, + "step": 10616 + }, + { + "epoch": 0.27, + "learning_rate": 1.980736665850725e-06, + "loss": 0.9492, + "step": 10617 + }, + { + "epoch": 0.27, + "learning_rate": 1.9807312604792e-06, + "loss": 0.7822, + "step": 10618 + }, + { + "epoch": 0.27, + "learning_rate": 1.980725854356774e-06, + "loss": 1.1279, + "step": 10619 + }, + { + "epoch": 0.27, + "learning_rate": 1.9807204474834514e-06, + "loss": 0.7456, + "step": 10620 + }, + { + "epoch": 0.27, + "learning_rate": 1.980715039859236e-06, + "loss": 0.916, + "step": 10621 + }, + { + "epoch": 0.27, + "learning_rate": 1.980709631484133e-06, + "loss": 0.7778, + "step": 10622 + }, + { + "epoch": 0.27, + "learning_rate": 1.980704222358145e-06, + "loss": 0.8438, + "step": 10623 + }, + { + "epoch": 0.27, + "learning_rate": 1.9806988124812772e-06, + "loss": 0.9023, + "step": 10624 + }, + { + "epoch": 0.27, + "learning_rate": 1.980693401853533e-06, + "loss": 1.043, + "step": 10625 + }, + { + "epoch": 0.27, + "learning_rate": 1.9806879904749176e-06, + "loss": 0.9111, + "step": 10626 + }, + { + "epoch": 0.27, + "learning_rate": 1.980682578345434e-06, + "loss": 1.0869, + "step": 10627 + }, + { + "epoch": 0.27, + "learning_rate": 1.9806771654650867e-06, + "loss": 0.9717, + "step": 10628 + }, + { + "epoch": 0.27, + "learning_rate": 1.9806717518338803e-06, + "loss": 0.8311, + "step": 10629 + }, + { + "epoch": 0.27, + "learning_rate": 1.9806663374518185e-06, + "loss": 0.915, + "step": 10630 + }, + { + "epoch": 0.27, + "learning_rate": 1.980660922318906e-06, + "loss": 0.6211, + "step": 10631 + }, + { + "epoch": 0.27, + "learning_rate": 1.9806555064351463e-06, + "loss": 0.7217, + "step": 10632 + }, + { + "epoch": 0.27, + "learning_rate": 1.9806500898005436e-06, + "loss": 0.8965, + "step": 10633 + }, + { + "epoch": 0.27, + "learning_rate": 1.980644672415102e-06, + "loss": 0.9238, + "step": 10634 + }, + { + "epoch": 0.27, + "learning_rate": 1.9806392542788263e-06, + "loss": 0.7446, + "step": 10635 + }, + { + "epoch": 0.27, + "learning_rate": 1.98063383539172e-06, + "loss": 0.6826, + "step": 10636 + }, + { + "epoch": 0.27, + "learning_rate": 1.9806284157537877e-06, + "loss": 0.9736, + "step": 10637 + }, + { + "epoch": 0.27, + "learning_rate": 1.980622995365033e-06, + "loss": 1.0156, + "step": 10638 + }, + { + "epoch": 0.27, + "learning_rate": 1.9806175742254604e-06, + "loss": 0.8135, + "step": 10639 + }, + { + "epoch": 0.27, + "learning_rate": 1.980612152335074e-06, + "loss": 0.9219, + "step": 10640 + }, + { + "epoch": 0.27, + "learning_rate": 1.9806067296938783e-06, + "loss": 0.4023, + "step": 10641 + }, + { + "epoch": 0.27, + "learning_rate": 1.980601306301877e-06, + "loss": 1.1582, + "step": 10642 + }, + { + "epoch": 0.27, + "learning_rate": 1.9805958821590743e-06, + "loss": 0.9502, + "step": 10643 + }, + { + "epoch": 0.27, + "learning_rate": 1.9805904572654743e-06, + "loss": 0.873, + "step": 10644 + }, + { + "epoch": 0.27, + "learning_rate": 1.980585031621081e-06, + "loss": 0.9961, + "step": 10645 + }, + { + "epoch": 0.27, + "learning_rate": 1.9805796052258996e-06, + "loss": 0.958, + "step": 10646 + }, + { + "epoch": 0.27, + "learning_rate": 1.980574178079933e-06, + "loss": 0.9883, + "step": 10647 + }, + { + "epoch": 0.27, + "learning_rate": 1.980568750183186e-06, + "loss": 0.915, + "step": 10648 + }, + { + "epoch": 0.27, + "learning_rate": 1.9805633215356623e-06, + "loss": 0.7598, + "step": 10649 + }, + { + "epoch": 0.27, + "learning_rate": 1.9805578921373666e-06, + "loss": 1.0205, + "step": 10650 + }, + { + "epoch": 0.27, + "learning_rate": 1.9805524619883028e-06, + "loss": 0.999, + "step": 10651 + }, + { + "epoch": 0.27, + "learning_rate": 1.980547031088475e-06, + "loss": 1.0127, + "step": 10652 + }, + { + "epoch": 0.27, + "learning_rate": 1.9805415994378874e-06, + "loss": 0.8438, + "step": 10653 + }, + { + "epoch": 0.27, + "learning_rate": 1.9805361670365443e-06, + "loss": 0.8701, + "step": 10654 + }, + { + "epoch": 0.27, + "learning_rate": 1.9805307338844497e-06, + "loss": 0.834, + "step": 10655 + }, + { + "epoch": 0.27, + "learning_rate": 1.980525299981608e-06, + "loss": 0.6772, + "step": 10656 + }, + { + "epoch": 0.27, + "learning_rate": 1.9805198653280227e-06, + "loss": 0.6511, + "step": 10657 + }, + { + "epoch": 0.27, + "learning_rate": 1.980514429923699e-06, + "loss": 0.9023, + "step": 10658 + }, + { + "epoch": 0.27, + "learning_rate": 1.9805089937686403e-06, + "loss": 0.731, + "step": 10659 + }, + { + "epoch": 0.27, + "learning_rate": 1.9805035568628506e-06, + "loss": 1.0654, + "step": 10660 + }, + { + "epoch": 0.27, + "learning_rate": 1.9804981192063347e-06, + "loss": 0.9258, + "step": 10661 + }, + { + "epoch": 0.27, + "learning_rate": 1.9804926807990964e-06, + "loss": 0.9382, + "step": 10662 + }, + { + "epoch": 0.27, + "learning_rate": 1.9804872416411397e-06, + "loss": 0.8242, + "step": 10663 + }, + { + "epoch": 0.27, + "learning_rate": 1.9804818017324695e-06, + "loss": 1.0801, + "step": 10664 + }, + { + "epoch": 0.27, + "learning_rate": 1.980476361073089e-06, + "loss": 1.0312, + "step": 10665 + }, + { + "epoch": 0.27, + "learning_rate": 1.980470919663003e-06, + "loss": 0.8545, + "step": 10666 + }, + { + "epoch": 0.27, + "learning_rate": 1.9804654775022155e-06, + "loss": 0.9004, + "step": 10667 + }, + { + "epoch": 0.27, + "learning_rate": 1.980460034590731e-06, + "loss": 0.9541, + "step": 10668 + }, + { + "epoch": 0.27, + "learning_rate": 1.9804545909285533e-06, + "loss": 0.9688, + "step": 10669 + }, + { + "epoch": 0.27, + "learning_rate": 1.980449146515686e-06, + "loss": 0.9531, + "step": 10670 + }, + { + "epoch": 0.27, + "learning_rate": 1.980443701352134e-06, + "loss": 0.8574, + "step": 10671 + }, + { + "epoch": 0.27, + "learning_rate": 1.9804382554379017e-06, + "loss": 1.0654, + "step": 10672 + }, + { + "epoch": 0.27, + "learning_rate": 1.980432808772993e-06, + "loss": 0.9678, + "step": 10673 + }, + { + "epoch": 0.27, + "learning_rate": 1.9804273613574117e-06, + "loss": 0.8262, + "step": 10674 + }, + { + "epoch": 0.27, + "learning_rate": 1.980421913191162e-06, + "loss": 0.9424, + "step": 10675 + }, + { + "epoch": 0.27, + "learning_rate": 1.9804164642742487e-06, + "loss": 1.1562, + "step": 10676 + }, + { + "epoch": 0.27, + "learning_rate": 1.9804110146066756e-06, + "loss": 0.6128, + "step": 10677 + }, + { + "epoch": 0.27, + "learning_rate": 1.9804055641884466e-06, + "loss": 1.0293, + "step": 10678 + }, + { + "epoch": 0.27, + "learning_rate": 1.9804001130195665e-06, + "loss": 0.707, + "step": 10679 + }, + { + "epoch": 0.27, + "learning_rate": 1.980394661100039e-06, + "loss": 1.0732, + "step": 10680 + }, + { + "epoch": 0.27, + "learning_rate": 1.9803892084298683e-06, + "loss": 0.7646, + "step": 10681 + }, + { + "epoch": 0.27, + "learning_rate": 1.9803837550090583e-06, + "loss": 0.8552, + "step": 10682 + }, + { + "epoch": 0.27, + "learning_rate": 1.980378300837614e-06, + "loss": 0.9272, + "step": 10683 + }, + { + "epoch": 0.27, + "learning_rate": 1.9803728459155395e-06, + "loss": 0.9473, + "step": 10684 + }, + { + "epoch": 0.27, + "learning_rate": 1.9803673902428378e-06, + "loss": 0.8799, + "step": 10685 + }, + { + "epoch": 0.27, + "learning_rate": 1.980361933819514e-06, + "loss": 1.1592, + "step": 10686 + }, + { + "epoch": 0.27, + "learning_rate": 1.9803564766455727e-06, + "loss": 0.8516, + "step": 10687 + }, + { + "epoch": 0.27, + "learning_rate": 1.9803510187210174e-06, + "loss": 0.8242, + "step": 10688 + }, + { + "epoch": 0.27, + "learning_rate": 1.980345560045852e-06, + "loss": 0.688, + "step": 10689 + }, + { + "epoch": 0.27, + "learning_rate": 1.980340100620081e-06, + "loss": 0.9014, + "step": 10690 + }, + { + "epoch": 0.27, + "learning_rate": 1.980334640443709e-06, + "loss": 0.8311, + "step": 10691 + }, + { + "epoch": 0.27, + "learning_rate": 1.9803291795167396e-06, + "loss": 1.0029, + "step": 10692 + }, + { + "epoch": 0.27, + "learning_rate": 1.9803237178391774e-06, + "loss": 0.6018, + "step": 10693 + }, + { + "epoch": 0.27, + "learning_rate": 1.9803182554110267e-06, + "loss": 1.0859, + "step": 10694 + }, + { + "epoch": 0.27, + "learning_rate": 1.980312792232291e-06, + "loss": 0.8682, + "step": 10695 + }, + { + "epoch": 0.27, + "learning_rate": 1.980307328302975e-06, + "loss": 0.8926, + "step": 10696 + }, + { + "epoch": 0.27, + "learning_rate": 1.9803018636230825e-06, + "loss": 0.7026, + "step": 10697 + }, + { + "epoch": 0.27, + "learning_rate": 1.9802963981926184e-06, + "loss": 0.9893, + "step": 10698 + }, + { + "epoch": 0.27, + "learning_rate": 1.980290932011586e-06, + "loss": 0.8242, + "step": 10699 + }, + { + "epoch": 0.27, + "learning_rate": 1.9802854650799904e-06, + "loss": 1.0176, + "step": 10700 + }, + { + "epoch": 0.27, + "learning_rate": 1.980279997397835e-06, + "loss": 0.9307, + "step": 10701 + }, + { + "epoch": 0.27, + "learning_rate": 1.980274528965124e-06, + "loss": 1.126, + "step": 10702 + }, + { + "epoch": 0.27, + "learning_rate": 1.9802690597818622e-06, + "loss": 0.8848, + "step": 10703 + }, + { + "epoch": 0.27, + "learning_rate": 1.9802635898480535e-06, + "loss": 0.5903, + "step": 10704 + }, + { + "epoch": 0.27, + "learning_rate": 1.9802581191637015e-06, + "loss": 0.9932, + "step": 10705 + }, + { + "epoch": 0.27, + "learning_rate": 1.9802526477288115e-06, + "loss": 1.0469, + "step": 10706 + }, + { + "epoch": 0.27, + "learning_rate": 1.980247175543387e-06, + "loss": 0.9854, + "step": 10707 + }, + { + "epoch": 0.27, + "learning_rate": 1.980241702607432e-06, + "loss": 0.8223, + "step": 10708 + }, + { + "epoch": 0.27, + "learning_rate": 1.9802362289209516e-06, + "loss": 0.814, + "step": 10709 + }, + { + "epoch": 0.27, + "learning_rate": 1.980230754483949e-06, + "loss": 0.7461, + "step": 10710 + }, + { + "epoch": 0.27, + "learning_rate": 1.980225279296429e-06, + "loss": 0.9326, + "step": 10711 + }, + { + "epoch": 0.27, + "learning_rate": 1.9802198033583954e-06, + "loss": 0.8438, + "step": 10712 + }, + { + "epoch": 0.27, + "learning_rate": 1.9802143266698525e-06, + "loss": 0.7168, + "step": 10713 + }, + { + "epoch": 0.27, + "learning_rate": 1.9802088492308045e-06, + "loss": 0.728, + "step": 10714 + }, + { + "epoch": 0.27, + "learning_rate": 1.9802033710412558e-06, + "loss": 1.0107, + "step": 10715 + }, + { + "epoch": 0.27, + "learning_rate": 1.9801978921012104e-06, + "loss": 0.832, + "step": 10716 + }, + { + "epoch": 0.27, + "learning_rate": 1.9801924124106726e-06, + "loss": 0.7754, + "step": 10717 + }, + { + "epoch": 0.27, + "learning_rate": 1.9801869319696467e-06, + "loss": 1.1289, + "step": 10718 + }, + { + "epoch": 0.27, + "learning_rate": 1.9801814507781365e-06, + "loss": 0.958, + "step": 10719 + }, + { + "epoch": 0.27, + "learning_rate": 1.9801759688361466e-06, + "loss": 0.8774, + "step": 10720 + }, + { + "epoch": 0.27, + "learning_rate": 1.980170486143681e-06, + "loss": 0.8354, + "step": 10721 + }, + { + "epoch": 0.27, + "learning_rate": 1.980165002700744e-06, + "loss": 1.1582, + "step": 10722 + }, + { + "epoch": 0.27, + "learning_rate": 1.9801595185073393e-06, + "loss": 0.9102, + "step": 10723 + }, + { + "epoch": 0.27, + "learning_rate": 1.9801540335634723e-06, + "loss": 0.708, + "step": 10724 + }, + { + "epoch": 0.27, + "learning_rate": 1.980148547869146e-06, + "loss": 0.9766, + "step": 10725 + }, + { + "epoch": 0.27, + "learning_rate": 1.9801430614243645e-06, + "loss": 0.9736, + "step": 10726 + }, + { + "epoch": 0.27, + "learning_rate": 1.980137574229133e-06, + "loss": 0.7041, + "step": 10727 + }, + { + "epoch": 0.27, + "learning_rate": 1.9801320862834554e-06, + "loss": 0.8354, + "step": 10728 + }, + { + "epoch": 0.27, + "learning_rate": 1.9801265975873353e-06, + "loss": 0.9043, + "step": 10729 + }, + { + "epoch": 0.28, + "learning_rate": 1.9801211081407775e-06, + "loss": 0.9155, + "step": 10730 + }, + { + "epoch": 0.28, + "learning_rate": 1.9801156179437862e-06, + "loss": 0.8213, + "step": 10731 + }, + { + "epoch": 0.28, + "learning_rate": 1.9801101269963657e-06, + "loss": 0.7065, + "step": 10732 + }, + { + "epoch": 0.28, + "learning_rate": 1.9801046352985193e-06, + "loss": 1.0791, + "step": 10733 + }, + { + "epoch": 0.28, + "learning_rate": 1.980099142850252e-06, + "loss": 1.0342, + "step": 10734 + }, + { + "epoch": 0.28, + "learning_rate": 1.9800936496515683e-06, + "loss": 1.0781, + "step": 10735 + }, + { + "epoch": 0.28, + "learning_rate": 1.9800881557024718e-06, + "loss": 0.9316, + "step": 10736 + }, + { + "epoch": 0.28, + "learning_rate": 1.9800826610029667e-06, + "loss": 0.8662, + "step": 10737 + }, + { + "epoch": 0.28, + "learning_rate": 1.9800771655530574e-06, + "loss": 0.9033, + "step": 10738 + }, + { + "epoch": 0.28, + "learning_rate": 1.980071669352748e-06, + "loss": 0.833, + "step": 10739 + }, + { + "epoch": 0.28, + "learning_rate": 1.980066172402043e-06, + "loss": 0.7676, + "step": 10740 + }, + { + "epoch": 0.28, + "learning_rate": 1.980060674700946e-06, + "loss": 0.9502, + "step": 10741 + }, + { + "epoch": 0.28, + "learning_rate": 1.980055176249462e-06, + "loss": 0.8799, + "step": 10742 + }, + { + "epoch": 0.28, + "learning_rate": 1.9800496770475946e-06, + "loss": 0.9551, + "step": 10743 + }, + { + "epoch": 0.28, + "learning_rate": 1.9800441770953485e-06, + "loss": 1.0605, + "step": 10744 + }, + { + "epoch": 0.28, + "learning_rate": 1.9800386763927275e-06, + "loss": 0.9707, + "step": 10745 + }, + { + "epoch": 0.28, + "learning_rate": 1.9800331749397356e-06, + "loss": 0.9814, + "step": 10746 + }, + { + "epoch": 0.28, + "learning_rate": 1.980027672736378e-06, + "loss": 0.8662, + "step": 10747 + }, + { + "epoch": 0.28, + "learning_rate": 1.9800221697826575e-06, + "loss": 1.1064, + "step": 10748 + }, + { + "epoch": 0.28, + "learning_rate": 1.98001666607858e-06, + "loss": 1.0859, + "step": 10749 + }, + { + "epoch": 0.28, + "learning_rate": 1.980011161624148e-06, + "loss": 0.8574, + "step": 10750 + }, + { + "epoch": 0.28, + "learning_rate": 1.980005656419367e-06, + "loss": 0.8838, + "step": 10751 + }, + { + "epoch": 0.28, + "learning_rate": 1.9800001504642406e-06, + "loss": 0.8447, + "step": 10752 + }, + { + "epoch": 0.28, + "learning_rate": 1.979994643758773e-06, + "loss": 0.7378, + "step": 10753 + }, + { + "epoch": 0.28, + "learning_rate": 1.9799891363029685e-06, + "loss": 0.7124, + "step": 10754 + }, + { + "epoch": 0.28, + "learning_rate": 1.9799836280968315e-06, + "loss": 0.8271, + "step": 10755 + }, + { + "epoch": 0.28, + "learning_rate": 1.9799781191403665e-06, + "loss": 0.6528, + "step": 10756 + }, + { + "epoch": 0.28, + "learning_rate": 1.979972609433577e-06, + "loss": 0.8232, + "step": 10757 + }, + { + "epoch": 0.28, + "learning_rate": 1.979967098976467e-06, + "loss": 0.6895, + "step": 10758 + }, + { + "epoch": 0.28, + "learning_rate": 1.979961587769042e-06, + "loss": 1.1191, + "step": 10759 + }, + { + "epoch": 0.28, + "learning_rate": 1.979956075811305e-06, + "loss": 0.957, + "step": 10760 + }, + { + "epoch": 0.28, + "learning_rate": 1.979950563103261e-06, + "loss": 0.8594, + "step": 10761 + }, + { + "epoch": 0.28, + "learning_rate": 1.979945049644914e-06, + "loss": 0.7451, + "step": 10762 + }, + { + "epoch": 0.28, + "learning_rate": 1.979939535436268e-06, + "loss": 0.874, + "step": 10763 + }, + { + "epoch": 0.28, + "learning_rate": 1.9799340204773273e-06, + "loss": 0.916, + "step": 10764 + }, + { + "epoch": 0.28, + "learning_rate": 1.979928504768096e-06, + "loss": 0.9043, + "step": 10765 + }, + { + "epoch": 0.28, + "learning_rate": 1.979922988308579e-06, + "loss": 1.001, + "step": 10766 + }, + { + "epoch": 0.28, + "learning_rate": 1.9799174710987795e-06, + "loss": 1.0029, + "step": 10767 + }, + { + "epoch": 0.28, + "learning_rate": 1.9799119531387024e-06, + "loss": 0.8906, + "step": 10768 + }, + { + "epoch": 0.28, + "learning_rate": 1.979906434428352e-06, + "loss": 1.0195, + "step": 10769 + }, + { + "epoch": 0.28, + "learning_rate": 1.979900914967732e-06, + "loss": 0.752, + "step": 10770 + }, + { + "epoch": 0.28, + "learning_rate": 1.979895394756847e-06, + "loss": 1.0146, + "step": 10771 + }, + { + "epoch": 0.28, + "learning_rate": 1.9798898737957014e-06, + "loss": 0.8154, + "step": 10772 + }, + { + "epoch": 0.28, + "learning_rate": 1.979884352084299e-06, + "loss": 0.8379, + "step": 10773 + }, + { + "epoch": 0.28, + "learning_rate": 1.9798788296226447e-06, + "loss": 0.8203, + "step": 10774 + }, + { + "epoch": 0.28, + "learning_rate": 1.9798733064107418e-06, + "loss": 0.7744, + "step": 10775 + }, + { + "epoch": 0.28, + "learning_rate": 1.9798677824485947e-06, + "loss": 0.8525, + "step": 10776 + }, + { + "epoch": 0.28, + "learning_rate": 1.979862257736208e-06, + "loss": 0.9785, + "step": 10777 + }, + { + "epoch": 0.28, + "learning_rate": 1.9798567322735858e-06, + "loss": 0.8535, + "step": 10778 + }, + { + "epoch": 0.28, + "learning_rate": 1.979851206060733e-06, + "loss": 1.1855, + "step": 10779 + }, + { + "epoch": 0.28, + "learning_rate": 1.979845679097652e-06, + "loss": 0.7964, + "step": 10780 + }, + { + "epoch": 0.28, + "learning_rate": 1.9798401513843494e-06, + "loss": 0.9883, + "step": 10781 + }, + { + "epoch": 0.28, + "learning_rate": 1.9798346229208274e-06, + "loss": 0.8408, + "step": 10782 + }, + { + "epoch": 0.28, + "learning_rate": 1.9798290937070917e-06, + "loss": 0.8809, + "step": 10783 + }, + { + "epoch": 0.28, + "learning_rate": 1.9798235637431453e-06, + "loss": 0.8828, + "step": 10784 + }, + { + "epoch": 0.28, + "learning_rate": 1.9798180330289937e-06, + "loss": 0.8672, + "step": 10785 + }, + { + "epoch": 0.28, + "learning_rate": 1.9798125015646402e-06, + "loss": 0.9814, + "step": 10786 + }, + { + "epoch": 0.28, + "learning_rate": 1.9798069693500896e-06, + "loss": 0.9902, + "step": 10787 + }, + { + "epoch": 0.28, + "learning_rate": 1.979801436385345e-06, + "loss": 0.8018, + "step": 10788 + }, + { + "epoch": 0.28, + "learning_rate": 1.9797959026704124e-06, + "loss": 0.9297, + "step": 10789 + }, + { + "epoch": 0.28, + "learning_rate": 1.9797903682052944e-06, + "loss": 0.8892, + "step": 10790 + }, + { + "epoch": 0.28, + "learning_rate": 1.9797848329899966e-06, + "loss": 0.832, + "step": 10791 + }, + { + "epoch": 0.28, + "learning_rate": 1.9797792970245223e-06, + "loss": 1.0205, + "step": 10792 + }, + { + "epoch": 0.28, + "learning_rate": 1.979773760308876e-06, + "loss": 1.0234, + "step": 10793 + }, + { + "epoch": 0.28, + "learning_rate": 1.9797682228430623e-06, + "loss": 0.9492, + "step": 10794 + }, + { + "epoch": 0.28, + "learning_rate": 1.9797626846270846e-06, + "loss": 0.6768, + "step": 10795 + }, + { + "epoch": 0.28, + "learning_rate": 1.9797571456609482e-06, + "loss": 0.8213, + "step": 10796 + }, + { + "epoch": 0.28, + "learning_rate": 1.9797516059446566e-06, + "loss": 0.8486, + "step": 10797 + }, + { + "epoch": 0.28, + "learning_rate": 1.9797460654782145e-06, + "loss": 0.9453, + "step": 10798 + }, + { + "epoch": 0.28, + "learning_rate": 1.979740524261625e-06, + "loss": 0.8711, + "step": 10799 + }, + { + "epoch": 0.28, + "learning_rate": 1.979734982294894e-06, + "loss": 0.9395, + "step": 10800 + }, + { + "epoch": 0.28, + "learning_rate": 1.979729439578025e-06, + "loss": 0.9902, + "step": 10801 + }, + { + "epoch": 0.28, + "learning_rate": 1.979723896111022e-06, + "loss": 0.9473, + "step": 10802 + }, + { + "epoch": 0.28, + "learning_rate": 1.9797183518938896e-06, + "loss": 0.8584, + "step": 10803 + }, + { + "epoch": 0.28, + "learning_rate": 1.979712806926632e-06, + "loss": 0.918, + "step": 10804 + }, + { + "epoch": 0.28, + "learning_rate": 1.9797072612092526e-06, + "loss": 1.0176, + "step": 10805 + }, + { + "epoch": 0.28, + "learning_rate": 1.9797017147417573e-06, + "loss": 1.0078, + "step": 10806 + }, + { + "epoch": 0.28, + "learning_rate": 1.9796961675241487e-06, + "loss": 0.9541, + "step": 10807 + }, + { + "epoch": 0.28, + "learning_rate": 1.9796906195564323e-06, + "loss": 0.8755, + "step": 10808 + }, + { + "epoch": 0.28, + "learning_rate": 1.979685070838612e-06, + "loss": 0.9434, + "step": 10809 + }, + { + "epoch": 0.28, + "learning_rate": 1.9796795213706913e-06, + "loss": 1.2549, + "step": 10810 + }, + { + "epoch": 0.28, + "learning_rate": 1.9796739711526756e-06, + "loss": 0.9775, + "step": 10811 + }, + { + "epoch": 0.28, + "learning_rate": 1.979668420184568e-06, + "loss": 0.8809, + "step": 10812 + }, + { + "epoch": 0.28, + "learning_rate": 1.979662868466374e-06, + "loss": 0.7524, + "step": 10813 + }, + { + "epoch": 0.28, + "learning_rate": 1.9796573159980968e-06, + "loss": 0.8335, + "step": 10814 + }, + { + "epoch": 0.28, + "learning_rate": 1.9796517627797413e-06, + "loss": 1.002, + "step": 10815 + }, + { + "epoch": 0.28, + "learning_rate": 1.979646208811311e-06, + "loss": 1.0312, + "step": 10816 + }, + { + "epoch": 0.28, + "learning_rate": 1.979640654092811e-06, + "loss": 0.8506, + "step": 10817 + }, + { + "epoch": 0.28, + "learning_rate": 1.979635098624245e-06, + "loss": 0.6201, + "step": 10818 + }, + { + "epoch": 0.28, + "learning_rate": 1.9796295424056177e-06, + "loss": 1.1016, + "step": 10819 + }, + { + "epoch": 0.28, + "learning_rate": 1.9796239854369328e-06, + "loss": 0.9932, + "step": 10820 + }, + { + "epoch": 0.28, + "learning_rate": 1.979618427718195e-06, + "loss": 0.9561, + "step": 10821 + }, + { + "epoch": 0.28, + "learning_rate": 1.979612869249409e-06, + "loss": 0.8652, + "step": 10822 + }, + { + "epoch": 0.28, + "learning_rate": 1.9796073100305776e-06, + "loss": 1.1582, + "step": 10823 + }, + { + "epoch": 0.28, + "learning_rate": 1.979601750061706e-06, + "loss": 0.9854, + "step": 10824 + }, + { + "epoch": 0.28, + "learning_rate": 1.979596189342799e-06, + "loss": 0.8242, + "step": 10825 + }, + { + "epoch": 0.28, + "learning_rate": 1.97959062787386e-06, + "loss": 1.041, + "step": 10826 + }, + { + "epoch": 0.28, + "learning_rate": 1.9795850656548933e-06, + "loss": 1.0684, + "step": 10827 + }, + { + "epoch": 0.28, + "learning_rate": 1.979579502685903e-06, + "loss": 0.9902, + "step": 10828 + }, + { + "epoch": 0.28, + "learning_rate": 1.9795739389668946e-06, + "loss": 0.9941, + "step": 10829 + }, + { + "epoch": 0.28, + "learning_rate": 1.979568374497871e-06, + "loss": 0.7158, + "step": 10830 + }, + { + "epoch": 0.28, + "learning_rate": 1.9795628092788366e-06, + "loss": 0.9873, + "step": 10831 + }, + { + "epoch": 0.28, + "learning_rate": 1.979557243309797e-06, + "loss": 1.0244, + "step": 10832 + }, + { + "epoch": 0.28, + "learning_rate": 1.9795516765907543e-06, + "loss": 0.9404, + "step": 10833 + }, + { + "epoch": 0.28, + "learning_rate": 1.9795461091217145e-06, + "loss": 1.0791, + "step": 10834 + }, + { + "epoch": 0.28, + "learning_rate": 1.9795405409026813e-06, + "loss": 0.8101, + "step": 10835 + }, + { + "epoch": 0.28, + "learning_rate": 1.9795349719336588e-06, + "loss": 1.0771, + "step": 10836 + }, + { + "epoch": 0.28, + "learning_rate": 1.9795294022146517e-06, + "loss": 0.8516, + "step": 10837 + }, + { + "epoch": 0.28, + "learning_rate": 1.979523831745664e-06, + "loss": 0.7349, + "step": 10838 + }, + { + "epoch": 0.28, + "learning_rate": 1.9795182605266995e-06, + "loss": 0.9006, + "step": 10839 + }, + { + "epoch": 0.28, + "learning_rate": 1.979512688557763e-06, + "loss": 1.0693, + "step": 10840 + }, + { + "epoch": 0.28, + "learning_rate": 1.9795071158388586e-06, + "loss": 0.999, + "step": 10841 + }, + { + "epoch": 0.28, + "learning_rate": 1.979501542369991e-06, + "loss": 0.916, + "step": 10842 + }, + { + "epoch": 0.28, + "learning_rate": 1.979495968151164e-06, + "loss": 0.637, + "step": 10843 + }, + { + "epoch": 0.28, + "learning_rate": 1.979490393182382e-06, + "loss": 0.728, + "step": 10844 + }, + { + "epoch": 0.28, + "learning_rate": 1.979484817463649e-06, + "loss": 0.8955, + "step": 10845 + }, + { + "epoch": 0.28, + "learning_rate": 1.9794792409949697e-06, + "loss": 1.0215, + "step": 10846 + }, + { + "epoch": 0.28, + "learning_rate": 1.979473663776348e-06, + "loss": 0.9326, + "step": 10847 + }, + { + "epoch": 0.28, + "learning_rate": 1.9794680858077887e-06, + "loss": 0.9717, + "step": 10848 + }, + { + "epoch": 0.28, + "learning_rate": 1.979462507089296e-06, + "loss": 0.8252, + "step": 10849 + }, + { + "epoch": 0.28, + "learning_rate": 1.9794569276208726e-06, + "loss": 0.9082, + "step": 10850 + }, + { + "epoch": 0.28, + "learning_rate": 1.9794513474025254e-06, + "loss": 0.9395, + "step": 10851 + }, + { + "epoch": 0.28, + "learning_rate": 1.9794457664342567e-06, + "loss": 0.9482, + "step": 10852 + }, + { + "epoch": 0.28, + "learning_rate": 1.9794401847160716e-06, + "loss": 0.9346, + "step": 10853 + }, + { + "epoch": 0.28, + "learning_rate": 1.979434602247974e-06, + "loss": 0.9258, + "step": 10854 + }, + { + "epoch": 0.28, + "learning_rate": 1.9794290190299684e-06, + "loss": 0.8965, + "step": 10855 + }, + { + "epoch": 0.28, + "learning_rate": 1.979423435062059e-06, + "loss": 0.8557, + "step": 10856 + }, + { + "epoch": 0.28, + "learning_rate": 1.9794178503442505e-06, + "loss": 0.8481, + "step": 10857 + }, + { + "epoch": 0.28, + "learning_rate": 1.9794122648765466e-06, + "loss": 0.71, + "step": 10858 + }, + { + "epoch": 0.28, + "learning_rate": 1.9794066786589518e-06, + "loss": 0.7812, + "step": 10859 + }, + { + "epoch": 0.28, + "learning_rate": 1.97940109169147e-06, + "loss": 0.7588, + "step": 10860 + }, + { + "epoch": 0.28, + "learning_rate": 1.979395503974106e-06, + "loss": 0.8003, + "step": 10861 + }, + { + "epoch": 0.28, + "learning_rate": 1.979389915506864e-06, + "loss": 0.9395, + "step": 10862 + }, + { + "epoch": 0.28, + "learning_rate": 1.979384326289748e-06, + "loss": 1.0195, + "step": 10863 + }, + { + "epoch": 0.28, + "learning_rate": 1.9793787363227628e-06, + "loss": 0.9473, + "step": 10864 + }, + { + "epoch": 0.28, + "learning_rate": 1.979373145605912e-06, + "loss": 0.8965, + "step": 10865 + }, + { + "epoch": 0.28, + "learning_rate": 1.9793675541392004e-06, + "loss": 0.7817, + "step": 10866 + }, + { + "epoch": 0.28, + "learning_rate": 1.979361961922632e-06, + "loss": 0.9238, + "step": 10867 + }, + { + "epoch": 0.28, + "learning_rate": 1.979356368956211e-06, + "loss": 0.9629, + "step": 10868 + }, + { + "epoch": 0.28, + "learning_rate": 1.979350775239942e-06, + "loss": 1.0684, + "step": 10869 + }, + { + "epoch": 0.28, + "learning_rate": 1.9793451807738296e-06, + "loss": 0.9668, + "step": 10870 + }, + { + "epoch": 0.28, + "learning_rate": 1.9793395855578773e-06, + "loss": 0.6836, + "step": 10871 + }, + { + "epoch": 0.28, + "learning_rate": 1.9793339895920894e-06, + "loss": 0.822, + "step": 10872 + }, + { + "epoch": 0.28, + "learning_rate": 1.9793283928764706e-06, + "loss": 0.5303, + "step": 10873 + }, + { + "epoch": 0.28, + "learning_rate": 1.9793227954110253e-06, + "loss": 1.0029, + "step": 10874 + }, + { + "epoch": 0.28, + "learning_rate": 1.9793171971957572e-06, + "loss": 1.0459, + "step": 10875 + }, + { + "epoch": 0.28, + "learning_rate": 1.979311598230672e-06, + "loss": 1.1064, + "step": 10876 + }, + { + "epoch": 0.28, + "learning_rate": 1.9793059985157717e-06, + "loss": 0.9033, + "step": 10877 + }, + { + "epoch": 0.28, + "learning_rate": 1.9793003980510623e-06, + "loss": 1.0029, + "step": 10878 + }, + { + "epoch": 0.28, + "learning_rate": 1.9792947968365475e-06, + "loss": 0.793, + "step": 10879 + }, + { + "epoch": 0.28, + "learning_rate": 1.979289194872232e-06, + "loss": 0.812, + "step": 10880 + }, + { + "epoch": 0.28, + "learning_rate": 1.9792835921581195e-06, + "loss": 0.7998, + "step": 10881 + }, + { + "epoch": 0.28, + "learning_rate": 1.9792779886942147e-06, + "loss": 0.7935, + "step": 10882 + }, + { + "epoch": 0.28, + "learning_rate": 1.979272384480522e-06, + "loss": 0.8096, + "step": 10883 + }, + { + "epoch": 0.28, + "learning_rate": 1.979266779517045e-06, + "loss": 1.0801, + "step": 10884 + }, + { + "epoch": 0.28, + "learning_rate": 1.979261173803789e-06, + "loss": 0.8242, + "step": 10885 + }, + { + "epoch": 0.28, + "learning_rate": 1.9792555673407572e-06, + "loss": 0.9365, + "step": 10886 + }, + { + "epoch": 0.28, + "learning_rate": 1.9792499601279545e-06, + "loss": 0.9883, + "step": 10887 + }, + { + "epoch": 0.28, + "learning_rate": 1.9792443521653853e-06, + "loss": 0.8691, + "step": 10888 + }, + { + "epoch": 0.28, + "learning_rate": 1.979238743453054e-06, + "loss": 0.9297, + "step": 10889 + }, + { + "epoch": 0.28, + "learning_rate": 1.9792331339909644e-06, + "loss": 0.75, + "step": 10890 + }, + { + "epoch": 0.28, + "learning_rate": 1.979227523779121e-06, + "loss": 0.9287, + "step": 10891 + }, + { + "epoch": 0.28, + "learning_rate": 1.9792219128175277e-06, + "loss": 1.0674, + "step": 10892 + }, + { + "epoch": 0.28, + "learning_rate": 1.9792163011061898e-06, + "loss": 0.9639, + "step": 10893 + }, + { + "epoch": 0.28, + "learning_rate": 1.9792106886451107e-06, + "loss": 0.7783, + "step": 10894 + }, + { + "epoch": 0.28, + "learning_rate": 1.979205075434295e-06, + "loss": 0.8994, + "step": 10895 + }, + { + "epoch": 0.28, + "learning_rate": 1.979199461473747e-06, + "loss": 1.3086, + "step": 10896 + }, + { + "epoch": 0.28, + "learning_rate": 1.9791938467634714e-06, + "loss": 0.8081, + "step": 10897 + }, + { + "epoch": 0.28, + "learning_rate": 1.9791882313034714e-06, + "loss": 0.8149, + "step": 10898 + }, + { + "epoch": 0.28, + "learning_rate": 1.9791826150937523e-06, + "loss": 0.9824, + "step": 10899 + }, + { + "epoch": 0.28, + "learning_rate": 1.9791769981343185e-06, + "loss": 1.002, + "step": 10900 + }, + { + "epoch": 0.28, + "learning_rate": 1.9791713804251737e-06, + "loss": 0.9131, + "step": 10901 + }, + { + "epoch": 0.28, + "learning_rate": 1.979165761966322e-06, + "loss": 0.7334, + "step": 10902 + }, + { + "epoch": 0.28, + "learning_rate": 1.9791601427577685e-06, + "loss": 0.8896, + "step": 10903 + }, + { + "epoch": 0.28, + "learning_rate": 1.979154522799517e-06, + "loss": 0.8467, + "step": 10904 + }, + { + "epoch": 0.28, + "learning_rate": 1.979148902091572e-06, + "loss": 1.0674, + "step": 10905 + }, + { + "epoch": 0.28, + "learning_rate": 1.9791432806339374e-06, + "loss": 0.7495, + "step": 10906 + }, + { + "epoch": 0.28, + "learning_rate": 1.979137658426618e-06, + "loss": 0.9453, + "step": 10907 + }, + { + "epoch": 0.28, + "learning_rate": 1.9791320354696176e-06, + "loss": 0.8916, + "step": 10908 + }, + { + "epoch": 0.28, + "learning_rate": 1.9791264117629412e-06, + "loss": 0.708, + "step": 10909 + }, + { + "epoch": 0.28, + "learning_rate": 1.979120787306593e-06, + "loss": 1.0615, + "step": 10910 + }, + { + "epoch": 0.28, + "learning_rate": 1.9791151621005767e-06, + "loss": 0.6472, + "step": 10911 + }, + { + "epoch": 0.28, + "learning_rate": 1.9791095361448965e-06, + "loss": 0.9365, + "step": 10912 + }, + { + "epoch": 0.28, + "learning_rate": 1.979103909439558e-06, + "loss": 1.0469, + "step": 10913 + }, + { + "epoch": 0.28, + "learning_rate": 1.9790982819845642e-06, + "loss": 0.8008, + "step": 10914 + }, + { + "epoch": 0.28, + "learning_rate": 1.9790926537799197e-06, + "loss": 0.8154, + "step": 10915 + }, + { + "epoch": 0.28, + "learning_rate": 1.9790870248256295e-06, + "loss": 0.8159, + "step": 10916 + }, + { + "epoch": 0.28, + "learning_rate": 1.979081395121697e-06, + "loss": 1.123, + "step": 10917 + }, + { + "epoch": 0.28, + "learning_rate": 1.979075764668127e-06, + "loss": 0.8125, + "step": 10918 + }, + { + "epoch": 0.28, + "learning_rate": 1.9790701334649235e-06, + "loss": 0.9893, + "step": 10919 + }, + { + "epoch": 0.28, + "learning_rate": 1.979064501512091e-06, + "loss": 0.8271, + "step": 10920 + }, + { + "epoch": 0.28, + "learning_rate": 1.979058868809634e-06, + "loss": 1.1162, + "step": 10921 + }, + { + "epoch": 0.28, + "learning_rate": 1.979053235357557e-06, + "loss": 0.9834, + "step": 10922 + }, + { + "epoch": 0.28, + "learning_rate": 1.9790476011558636e-06, + "loss": 0.7778, + "step": 10923 + }, + { + "epoch": 0.28, + "learning_rate": 1.9790419662045585e-06, + "loss": 0.8926, + "step": 10924 + }, + { + "epoch": 0.28, + "learning_rate": 1.9790363305036457e-06, + "loss": 0.9932, + "step": 10925 + }, + { + "epoch": 0.28, + "learning_rate": 1.97903069405313e-06, + "loss": 0.7163, + "step": 10926 + }, + { + "epoch": 0.28, + "learning_rate": 1.9790250568530154e-06, + "loss": 0.9551, + "step": 10927 + }, + { + "epoch": 0.28, + "learning_rate": 1.979019418903307e-06, + "loss": 0.9785, + "step": 10928 + }, + { + "epoch": 0.28, + "learning_rate": 1.9790137802040075e-06, + "loss": 0.9746, + "step": 10929 + }, + { + "epoch": 0.28, + "learning_rate": 1.979008140755123e-06, + "loss": 0.915, + "step": 10930 + }, + { + "epoch": 0.28, + "learning_rate": 1.9790025005566563e-06, + "loss": 1.042, + "step": 10931 + }, + { + "epoch": 0.28, + "learning_rate": 1.978996859608613e-06, + "loss": 0.8535, + "step": 10932 + }, + { + "epoch": 0.28, + "learning_rate": 1.9789912179109965e-06, + "loss": 1.0938, + "step": 10933 + }, + { + "epoch": 0.28, + "learning_rate": 1.9789855754638114e-06, + "loss": 0.9238, + "step": 10934 + }, + { + "epoch": 0.28, + "learning_rate": 1.978979932267062e-06, + "loss": 1.0361, + "step": 10935 + }, + { + "epoch": 0.28, + "learning_rate": 1.978974288320753e-06, + "loss": 0.9697, + "step": 10936 + }, + { + "epoch": 0.28, + "learning_rate": 1.978968643624888e-06, + "loss": 0.959, + "step": 10937 + }, + { + "epoch": 0.28, + "learning_rate": 1.978962998179472e-06, + "loss": 0.639, + "step": 10938 + }, + { + "epoch": 0.28, + "learning_rate": 1.978957351984509e-06, + "loss": 0.9023, + "step": 10939 + }, + { + "epoch": 0.28, + "learning_rate": 1.9789517050400033e-06, + "loss": 0.8872, + "step": 10940 + }, + { + "epoch": 0.28, + "learning_rate": 1.9789460573459595e-06, + "loss": 1.0156, + "step": 10941 + }, + { + "epoch": 0.28, + "learning_rate": 1.9789404089023813e-06, + "loss": 0.6934, + "step": 10942 + }, + { + "epoch": 0.28, + "learning_rate": 1.978934759709274e-06, + "loss": 0.7681, + "step": 10943 + }, + { + "epoch": 0.28, + "learning_rate": 1.978929109766641e-06, + "loss": 0.7148, + "step": 10944 + }, + { + "epoch": 0.28, + "learning_rate": 1.978923459074487e-06, + "loss": 0.8848, + "step": 10945 + }, + { + "epoch": 0.28, + "learning_rate": 1.9789178076328163e-06, + "loss": 0.915, + "step": 10946 + }, + { + "epoch": 0.28, + "learning_rate": 1.9789121554416336e-06, + "loss": 0.8047, + "step": 10947 + }, + { + "epoch": 0.28, + "learning_rate": 1.9789065025009424e-06, + "loss": 0.8262, + "step": 10948 + }, + { + "epoch": 0.28, + "learning_rate": 1.9789008488107477e-06, + "loss": 0.9678, + "step": 10949 + }, + { + "epoch": 0.28, + "learning_rate": 1.9788951943710533e-06, + "loss": 0.834, + "step": 10950 + }, + { + "epoch": 0.28, + "learning_rate": 1.9788895391818644e-06, + "loss": 0.7842, + "step": 10951 + }, + { + "epoch": 0.28, + "learning_rate": 1.9788838832431847e-06, + "loss": 0.8105, + "step": 10952 + }, + { + "epoch": 0.28, + "learning_rate": 1.9788782265550186e-06, + "loss": 0.8818, + "step": 10953 + }, + { + "epoch": 0.28, + "learning_rate": 1.97887256911737e-06, + "loss": 1.0449, + "step": 10954 + }, + { + "epoch": 0.28, + "learning_rate": 1.9788669109302445e-06, + "loss": 1.0508, + "step": 10955 + }, + { + "epoch": 0.28, + "learning_rate": 1.9788612519936446e-06, + "loss": 1.1582, + "step": 10956 + }, + { + "epoch": 0.28, + "learning_rate": 1.9788555923075764e-06, + "loss": 0.9561, + "step": 10957 + }, + { + "epoch": 0.28, + "learning_rate": 1.9788499318720433e-06, + "loss": 0.8125, + "step": 10958 + }, + { + "epoch": 0.28, + "learning_rate": 1.97884427068705e-06, + "loss": 0.7495, + "step": 10959 + }, + { + "epoch": 0.28, + "learning_rate": 1.9788386087526005e-06, + "loss": 0.918, + "step": 10960 + }, + { + "epoch": 0.28, + "learning_rate": 1.978832946068699e-06, + "loss": 0.7744, + "step": 10961 + }, + { + "epoch": 0.28, + "learning_rate": 1.9788272826353506e-06, + "loss": 0.8242, + "step": 10962 + }, + { + "epoch": 0.28, + "learning_rate": 1.978821618452559e-06, + "loss": 0.9629, + "step": 10963 + }, + { + "epoch": 0.28, + "learning_rate": 1.9788159535203283e-06, + "loss": 1.0049, + "step": 10964 + }, + { + "epoch": 0.28, + "learning_rate": 1.9788102878386636e-06, + "loss": 0.918, + "step": 10965 + }, + { + "epoch": 0.28, + "learning_rate": 1.9788046214075687e-06, + "loss": 1.1797, + "step": 10966 + }, + { + "epoch": 0.28, + "learning_rate": 1.9787989542270483e-06, + "loss": 0.71, + "step": 10967 + }, + { + "epoch": 0.28, + "learning_rate": 1.9787932862971066e-06, + "loss": 0.9512, + "step": 10968 + }, + { + "epoch": 0.28, + "learning_rate": 1.9787876176177478e-06, + "loss": 0.8164, + "step": 10969 + }, + { + "epoch": 0.28, + "learning_rate": 1.978781948188976e-06, + "loss": 1.0039, + "step": 10970 + }, + { + "epoch": 0.28, + "learning_rate": 1.978776278010796e-06, + "loss": 1.0225, + "step": 10971 + }, + { + "epoch": 0.28, + "learning_rate": 1.9787706070832123e-06, + "loss": 0.832, + "step": 10972 + }, + { + "epoch": 0.28, + "learning_rate": 1.978764935406229e-06, + "loss": 0.9961, + "step": 10973 + }, + { + "epoch": 0.28, + "learning_rate": 1.97875926297985e-06, + "loss": 0.877, + "step": 10974 + }, + { + "epoch": 0.28, + "learning_rate": 1.9787535898040804e-06, + "loss": 0.8652, + "step": 10975 + }, + { + "epoch": 0.28, + "learning_rate": 1.978747915878924e-06, + "loss": 0.9062, + "step": 10976 + }, + { + "epoch": 0.28, + "learning_rate": 1.9787422412043853e-06, + "loss": 0.9199, + "step": 10977 + }, + { + "epoch": 0.28, + "learning_rate": 1.9787365657804686e-06, + "loss": 0.696, + "step": 10978 + }, + { + "epoch": 0.28, + "learning_rate": 1.9787308896071786e-06, + "loss": 0.7852, + "step": 10979 + }, + { + "epoch": 0.28, + "learning_rate": 1.9787252126845193e-06, + "loss": 1.0703, + "step": 10980 + }, + { + "epoch": 0.28, + "learning_rate": 1.9787195350124946e-06, + "loss": 0.7822, + "step": 10981 + }, + { + "epoch": 0.28, + "learning_rate": 1.97871385659111e-06, + "loss": 1.2539, + "step": 10982 + }, + { + "epoch": 0.28, + "learning_rate": 1.978708177420369e-06, + "loss": 0.8721, + "step": 10983 + }, + { + "epoch": 0.28, + "learning_rate": 1.978702497500276e-06, + "loss": 0.9971, + "step": 10984 + }, + { + "epoch": 0.28, + "learning_rate": 1.9786968168308357e-06, + "loss": 1.0605, + "step": 10985 + }, + { + "epoch": 0.28, + "learning_rate": 1.9786911354120522e-06, + "loss": 0.9775, + "step": 10986 + }, + { + "epoch": 0.28, + "learning_rate": 1.9786854532439297e-06, + "loss": 0.7686, + "step": 10987 + }, + { + "epoch": 0.28, + "learning_rate": 1.9786797703264726e-06, + "loss": 1.0977, + "step": 10988 + }, + { + "epoch": 0.28, + "learning_rate": 1.9786740866596862e-06, + "loss": 0.8223, + "step": 10989 + }, + { + "epoch": 0.28, + "learning_rate": 1.9786684022435734e-06, + "loss": 0.8672, + "step": 10990 + }, + { + "epoch": 0.28, + "learning_rate": 1.978662717078139e-06, + "loss": 1.0312, + "step": 10991 + }, + { + "epoch": 0.28, + "learning_rate": 1.9786570311633883e-06, + "loss": 0.8096, + "step": 10992 + }, + { + "epoch": 0.28, + "learning_rate": 1.9786513444993246e-06, + "loss": 0.9893, + "step": 10993 + }, + { + "epoch": 0.28, + "learning_rate": 1.9786456570859526e-06, + "loss": 0.6323, + "step": 10994 + }, + { + "epoch": 0.28, + "learning_rate": 1.9786399689232762e-06, + "loss": 1.0234, + "step": 10995 + }, + { + "epoch": 0.28, + "learning_rate": 1.9786342800113005e-06, + "loss": 0.8584, + "step": 10996 + }, + { + "epoch": 0.28, + "learning_rate": 1.9786285903500297e-06, + "loss": 0.8037, + "step": 10997 + }, + { + "epoch": 0.28, + "learning_rate": 1.9786228999394677e-06, + "loss": 0.5598, + "step": 10998 + }, + { + "epoch": 0.28, + "learning_rate": 1.978617208779619e-06, + "loss": 0.7178, + "step": 10999 + }, + { + "epoch": 0.28, + "learning_rate": 1.9786115168704884e-06, + "loss": 0.9238, + "step": 11000 + }, + { + "epoch": 0.28, + "learning_rate": 1.97860582421208e-06, + "loss": 0.7578, + "step": 11001 + }, + { + "epoch": 0.28, + "learning_rate": 1.9786001308043982e-06, + "loss": 0.7539, + "step": 11002 + }, + { + "epoch": 0.28, + "learning_rate": 1.978594436647447e-06, + "loss": 0.8916, + "step": 11003 + }, + { + "epoch": 0.28, + "learning_rate": 1.978588741741231e-06, + "loss": 0.9824, + "step": 11004 + }, + { + "epoch": 0.28, + "learning_rate": 1.978583046085755e-06, + "loss": 1.125, + "step": 11005 + }, + { + "epoch": 0.28, + "learning_rate": 1.9785773496810224e-06, + "loss": 0.7593, + "step": 11006 + }, + { + "epoch": 0.28, + "learning_rate": 1.978571652527039e-06, + "loss": 0.9521, + "step": 11007 + }, + { + "epoch": 0.28, + "learning_rate": 1.978565954623807e-06, + "loss": 0.8486, + "step": 11008 + }, + { + "epoch": 0.28, + "learning_rate": 1.978560255971333e-06, + "loss": 1.0908, + "step": 11009 + }, + { + "epoch": 0.28, + "learning_rate": 1.97855455656962e-06, + "loss": 0.9316, + "step": 11010 + }, + { + "epoch": 0.28, + "learning_rate": 1.978548856418673e-06, + "loss": 0.8105, + "step": 11011 + }, + { + "epoch": 0.28, + "learning_rate": 1.978543155518496e-06, + "loss": 0.8848, + "step": 11012 + }, + { + "epoch": 0.28, + "learning_rate": 1.9785374538690935e-06, + "loss": 0.8994, + "step": 11013 + }, + { + "epoch": 0.28, + "learning_rate": 1.97853175147047e-06, + "loss": 0.7295, + "step": 11014 + }, + { + "epoch": 0.28, + "learning_rate": 1.97852604832263e-06, + "loss": 0.9849, + "step": 11015 + }, + { + "epoch": 0.28, + "learning_rate": 1.9785203444255768e-06, + "loss": 0.9404, + "step": 11016 + }, + { + "epoch": 0.28, + "learning_rate": 1.978514639779316e-06, + "loss": 0.7871, + "step": 11017 + }, + { + "epoch": 0.28, + "learning_rate": 1.978508934383852e-06, + "loss": 0.8838, + "step": 11018 + }, + { + "epoch": 0.28, + "learning_rate": 1.978503228239188e-06, + "loss": 0.8896, + "step": 11019 + }, + { + "epoch": 0.28, + "learning_rate": 1.9784975213453294e-06, + "loss": 0.8945, + "step": 11020 + }, + { + "epoch": 0.28, + "learning_rate": 1.97849181370228e-06, + "loss": 0.8418, + "step": 11021 + }, + { + "epoch": 0.28, + "learning_rate": 1.9784861053100446e-06, + "loss": 0.7764, + "step": 11022 + }, + { + "epoch": 0.28, + "learning_rate": 1.9784803961686276e-06, + "loss": 0.8013, + "step": 11023 + }, + { + "epoch": 0.28, + "learning_rate": 1.9784746862780327e-06, + "loss": 0.9941, + "step": 11024 + }, + { + "epoch": 0.28, + "learning_rate": 1.978468975638265e-06, + "loss": 1.0703, + "step": 11025 + }, + { + "epoch": 0.28, + "learning_rate": 1.9784632642493287e-06, + "loss": 0.8867, + "step": 11026 + }, + { + "epoch": 0.28, + "learning_rate": 1.9784575521112277e-06, + "loss": 0.7881, + "step": 11027 + }, + { + "epoch": 0.28, + "learning_rate": 1.978451839223967e-06, + "loss": 1.0098, + "step": 11028 + }, + { + "epoch": 0.28, + "learning_rate": 1.9784461255875507e-06, + "loss": 0.8926, + "step": 11029 + }, + { + "epoch": 0.28, + "learning_rate": 1.978440411201983e-06, + "loss": 0.9238, + "step": 11030 + }, + { + "epoch": 0.28, + "learning_rate": 1.9784346960672684e-06, + "loss": 0.9141, + "step": 11031 + }, + { + "epoch": 0.28, + "learning_rate": 1.978428980183412e-06, + "loss": 0.9243, + "step": 11032 + }, + { + "epoch": 0.28, + "learning_rate": 1.9784232635504166e-06, + "loss": 0.915, + "step": 11033 + }, + { + "epoch": 0.28, + "learning_rate": 1.978417546168288e-06, + "loss": 0.9717, + "step": 11034 + }, + { + "epoch": 0.28, + "learning_rate": 1.9784118280370303e-06, + "loss": 0.8994, + "step": 11035 + }, + { + "epoch": 0.28, + "learning_rate": 1.9784061091566473e-06, + "loss": 0.8682, + "step": 11036 + }, + { + "epoch": 0.28, + "learning_rate": 1.9784003895271438e-06, + "loss": 0.8955, + "step": 11037 + }, + { + "epoch": 0.28, + "learning_rate": 1.9783946691485243e-06, + "loss": 0.6479, + "step": 11038 + }, + { + "epoch": 0.28, + "learning_rate": 1.9783889480207927e-06, + "loss": 0.8008, + "step": 11039 + }, + { + "epoch": 0.28, + "learning_rate": 1.978383226143954e-06, + "loss": 0.8184, + "step": 11040 + }, + { + "epoch": 0.28, + "learning_rate": 1.978377503518012e-06, + "loss": 0.9814, + "step": 11041 + }, + { + "epoch": 0.28, + "learning_rate": 1.9783717801429712e-06, + "loss": 1.0127, + "step": 11042 + }, + { + "epoch": 0.28, + "learning_rate": 1.9783660560188364e-06, + "loss": 0.666, + "step": 11043 + }, + { + "epoch": 0.28, + "learning_rate": 1.9783603311456115e-06, + "loss": 1.0166, + "step": 11044 + }, + { + "epoch": 0.28, + "learning_rate": 1.9783546055233016e-06, + "loss": 0.7251, + "step": 11045 + }, + { + "epoch": 0.28, + "learning_rate": 1.97834887915191e-06, + "loss": 0.9482, + "step": 11046 + }, + { + "epoch": 0.28, + "learning_rate": 1.978343152031442e-06, + "loss": 0.9268, + "step": 11047 + }, + { + "epoch": 0.28, + "learning_rate": 1.978337424161901e-06, + "loss": 0.7124, + "step": 11048 + }, + { + "epoch": 0.28, + "learning_rate": 1.9783316955432925e-06, + "loss": 0.8848, + "step": 11049 + }, + { + "epoch": 0.28, + "learning_rate": 1.9783259661756206e-06, + "loss": 0.791, + "step": 11050 + }, + { + "epoch": 0.28, + "learning_rate": 1.978320236058889e-06, + "loss": 0.7925, + "step": 11051 + }, + { + "epoch": 0.28, + "learning_rate": 1.978314505193103e-06, + "loss": 0.792, + "step": 11052 + }, + { + "epoch": 0.28, + "learning_rate": 1.9783087735782666e-06, + "loss": 0.8818, + "step": 11053 + }, + { + "epoch": 0.28, + "learning_rate": 1.9783030412143837e-06, + "loss": 0.9385, + "step": 11054 + }, + { + "epoch": 0.28, + "learning_rate": 1.9782973081014595e-06, + "loss": 0.8896, + "step": 11055 + }, + { + "epoch": 0.28, + "learning_rate": 1.9782915742394976e-06, + "loss": 1.0117, + "step": 11056 + }, + { + "epoch": 0.28, + "learning_rate": 1.9782858396285033e-06, + "loss": 0.8564, + "step": 11057 + }, + { + "epoch": 0.28, + "learning_rate": 1.9782801042684802e-06, + "loss": 1.0596, + "step": 11058 + }, + { + "epoch": 0.28, + "learning_rate": 1.9782743681594336e-06, + "loss": 1.0205, + "step": 11059 + }, + { + "epoch": 0.28, + "learning_rate": 1.9782686313013667e-06, + "loss": 1.0166, + "step": 11060 + }, + { + "epoch": 0.28, + "learning_rate": 1.9782628936942847e-06, + "loss": 1.1738, + "step": 11061 + }, + { + "epoch": 0.28, + "learning_rate": 1.9782571553381918e-06, + "loss": 0.7129, + "step": 11062 + }, + { + "epoch": 0.28, + "learning_rate": 1.978251416233092e-06, + "loss": 1.0527, + "step": 11063 + }, + { + "epoch": 0.28, + "learning_rate": 1.9782456763789906e-06, + "loss": 0.8633, + "step": 11064 + }, + { + "epoch": 0.28, + "learning_rate": 1.978239935775891e-06, + "loss": 0.752, + "step": 11065 + }, + { + "epoch": 0.28, + "learning_rate": 1.9782341944237982e-06, + "loss": 1.0137, + "step": 11066 + }, + { + "epoch": 0.28, + "learning_rate": 1.978228452322717e-06, + "loss": 0.8574, + "step": 11067 + }, + { + "epoch": 0.28, + "learning_rate": 1.978222709472651e-06, + "loss": 0.6001, + "step": 11068 + }, + { + "epoch": 0.28, + "learning_rate": 1.9782169658736044e-06, + "loss": 0.9541, + "step": 11069 + }, + { + "epoch": 0.28, + "learning_rate": 1.978211221525582e-06, + "loss": 0.7397, + "step": 11070 + }, + { + "epoch": 0.28, + "learning_rate": 1.978205476428589e-06, + "loss": 0.917, + "step": 11071 + }, + { + "epoch": 0.28, + "learning_rate": 1.9781997305826287e-06, + "loss": 0.9316, + "step": 11072 + }, + { + "epoch": 0.28, + "learning_rate": 1.9781939839877055e-06, + "loss": 0.8584, + "step": 11073 + }, + { + "epoch": 0.28, + "learning_rate": 1.9781882366438243e-06, + "loss": 0.8154, + "step": 11074 + }, + { + "epoch": 0.28, + "learning_rate": 1.97818248855099e-06, + "loss": 1.0312, + "step": 11075 + }, + { + "epoch": 0.28, + "learning_rate": 1.9781767397092054e-06, + "loss": 0.9834, + "step": 11076 + }, + { + "epoch": 0.28, + "learning_rate": 1.9781709901184766e-06, + "loss": 1.1348, + "step": 11077 + }, + { + "epoch": 0.28, + "learning_rate": 1.9781652397788067e-06, + "loss": 0.9678, + "step": 11078 + }, + { + "epoch": 0.28, + "learning_rate": 1.978159488690201e-06, + "loss": 0.6294, + "step": 11079 + }, + { + "epoch": 0.28, + "learning_rate": 1.978153736852663e-06, + "loss": 1.0791, + "step": 11080 + }, + { + "epoch": 0.28, + "learning_rate": 1.9781479842661985e-06, + "loss": 1.0957, + "step": 11081 + }, + { + "epoch": 0.28, + "learning_rate": 1.9781422309308103e-06, + "loss": 0.9834, + "step": 11082 + }, + { + "epoch": 0.28, + "learning_rate": 1.978136476846504e-06, + "loss": 0.8184, + "step": 11083 + }, + { + "epoch": 0.28, + "learning_rate": 1.9781307220132836e-06, + "loss": 1.0479, + "step": 11084 + }, + { + "epoch": 0.28, + "learning_rate": 1.9781249664311536e-06, + "loss": 1.0957, + "step": 11085 + }, + { + "epoch": 0.28, + "learning_rate": 1.9781192101001178e-06, + "loss": 0.9443, + "step": 11086 + }, + { + "epoch": 0.28, + "learning_rate": 1.978113453020181e-06, + "loss": 0.9067, + "step": 11087 + }, + { + "epoch": 0.28, + "learning_rate": 1.9781076951913484e-06, + "loss": 0.9434, + "step": 11088 + }, + { + "epoch": 0.28, + "learning_rate": 1.9781019366136233e-06, + "loss": 0.7773, + "step": 11089 + }, + { + "epoch": 0.28, + "learning_rate": 1.9780961772870105e-06, + "loss": 0.7056, + "step": 11090 + }, + { + "epoch": 0.28, + "learning_rate": 1.9780904172115147e-06, + "loss": 0.8242, + "step": 11091 + }, + { + "epoch": 0.28, + "learning_rate": 1.9780846563871398e-06, + "loss": 0.9248, + "step": 11092 + }, + { + "epoch": 0.28, + "learning_rate": 1.9780788948138903e-06, + "loss": 0.8218, + "step": 11093 + }, + { + "epoch": 0.28, + "learning_rate": 1.9780731324917714e-06, + "loss": 0.9688, + "step": 11094 + }, + { + "epoch": 0.28, + "learning_rate": 1.9780673694207863e-06, + "loss": 0.874, + "step": 11095 + }, + { + "epoch": 0.28, + "learning_rate": 1.9780616056009404e-06, + "loss": 0.9795, + "step": 11096 + }, + { + "epoch": 0.28, + "learning_rate": 1.978055841032237e-06, + "loss": 0.7837, + "step": 11097 + }, + { + "epoch": 0.28, + "learning_rate": 1.978050075714682e-06, + "loss": 0.8633, + "step": 11098 + }, + { + "epoch": 0.28, + "learning_rate": 1.9780443096482784e-06, + "loss": 0.9648, + "step": 11099 + }, + { + "epoch": 0.28, + "learning_rate": 1.9780385428330317e-06, + "loss": 1.0205, + "step": 11100 + }, + { + "epoch": 0.28, + "learning_rate": 1.9780327752689456e-06, + "loss": 0.8242, + "step": 11101 + }, + { + "epoch": 0.28, + "learning_rate": 1.9780270069560248e-06, + "loss": 0.9619, + "step": 11102 + }, + { + "epoch": 0.28, + "learning_rate": 1.978021237894274e-06, + "loss": 0.9385, + "step": 11103 + }, + { + "epoch": 0.28, + "learning_rate": 1.9780154680836968e-06, + "loss": 0.959, + "step": 11104 + }, + { + "epoch": 0.28, + "learning_rate": 1.9780096975242984e-06, + "loss": 1.0098, + "step": 11105 + }, + { + "epoch": 0.28, + "learning_rate": 1.978003926216083e-06, + "loss": 0.9062, + "step": 11106 + }, + { + "epoch": 0.28, + "learning_rate": 1.977998154159055e-06, + "loss": 0.9932, + "step": 11107 + }, + { + "epoch": 0.28, + "learning_rate": 1.977992381353219e-06, + "loss": 1.0498, + "step": 11108 + }, + { + "epoch": 0.28, + "learning_rate": 1.9779866077985786e-06, + "loss": 0.7393, + "step": 11109 + }, + { + "epoch": 0.28, + "learning_rate": 1.9779808334951392e-06, + "loss": 0.6968, + "step": 11110 + }, + { + "epoch": 0.28, + "learning_rate": 1.9779750584429045e-06, + "loss": 0.8945, + "step": 11111 + }, + { + "epoch": 0.28, + "learning_rate": 1.9779692826418796e-06, + "loss": 1.002, + "step": 11112 + }, + { + "epoch": 0.28, + "learning_rate": 1.9779635060920686e-06, + "loss": 0.7588, + "step": 11113 + }, + { + "epoch": 0.28, + "learning_rate": 1.977957728793476e-06, + "loss": 0.8994, + "step": 11114 + }, + { + "epoch": 0.28, + "learning_rate": 1.977951950746106e-06, + "loss": 1.0566, + "step": 11115 + }, + { + "epoch": 0.28, + "learning_rate": 1.9779461719499627e-06, + "loss": 0.9473, + "step": 11116 + }, + { + "epoch": 0.28, + "learning_rate": 1.9779403924050513e-06, + "loss": 1.0117, + "step": 11117 + }, + { + "epoch": 0.28, + "learning_rate": 1.9779346121113763e-06, + "loss": 0.6704, + "step": 11118 + }, + { + "epoch": 0.28, + "learning_rate": 1.9779288310689415e-06, + "loss": 0.8994, + "step": 11119 + }, + { + "epoch": 0.29, + "learning_rate": 1.9779230492777512e-06, + "loss": 0.998, + "step": 11120 + }, + { + "epoch": 0.29, + "learning_rate": 1.9779172667378105e-06, + "loss": 0.9678, + "step": 11121 + }, + { + "epoch": 0.29, + "learning_rate": 1.9779114834491235e-06, + "loss": 0.5981, + "step": 11122 + }, + { + "epoch": 0.29, + "learning_rate": 1.977905699411695e-06, + "loss": 0.7705, + "step": 11123 + }, + { + "epoch": 0.29, + "learning_rate": 1.9778999146255284e-06, + "loss": 0.7725, + "step": 11124 + }, + { + "epoch": 0.29, + "learning_rate": 1.977894129090629e-06, + "loss": 0.8506, + "step": 11125 + }, + { + "epoch": 0.29, + "learning_rate": 1.9778883428070013e-06, + "loss": 0.9912, + "step": 11126 + }, + { + "epoch": 0.29, + "learning_rate": 1.9778825557746494e-06, + "loss": 0.7676, + "step": 11127 + }, + { + "epoch": 0.29, + "learning_rate": 1.9778767679935775e-06, + "loss": 0.7295, + "step": 11128 + }, + { + "epoch": 0.29, + "learning_rate": 1.977870979463791e-06, + "loss": 0.9912, + "step": 11129 + }, + { + "epoch": 0.29, + "learning_rate": 1.9778651901852926e-06, + "loss": 0.9463, + "step": 11130 + }, + { + "epoch": 0.29, + "learning_rate": 1.977859400158089e-06, + "loss": 0.8672, + "step": 11131 + }, + { + "epoch": 0.29, + "learning_rate": 1.9778536093821824e-06, + "loss": 0.9824, + "step": 11132 + }, + { + "epoch": 0.29, + "learning_rate": 1.9778478178575786e-06, + "loss": 0.9844, + "step": 11133 + }, + { + "epoch": 0.29, + "learning_rate": 1.977842025584282e-06, + "loss": 0.8633, + "step": 11134 + }, + { + "epoch": 0.29, + "learning_rate": 1.9778362325622965e-06, + "loss": 0.9932, + "step": 11135 + }, + { + "epoch": 0.29, + "learning_rate": 1.9778304387916264e-06, + "loss": 1.082, + "step": 11136 + }, + { + "epoch": 0.29, + "learning_rate": 1.9778246442722766e-06, + "loss": 0.9199, + "step": 11137 + }, + { + "epoch": 0.29, + "learning_rate": 1.9778188490042517e-06, + "loss": 0.8823, + "step": 11138 + }, + { + "epoch": 0.29, + "learning_rate": 1.977813052987556e-06, + "loss": 1.0088, + "step": 11139 + }, + { + "epoch": 0.29, + "learning_rate": 1.9778072562221933e-06, + "loss": 0.79, + "step": 11140 + }, + { + "epoch": 0.29, + "learning_rate": 1.977801458708169e-06, + "loss": 1.0957, + "step": 11141 + }, + { + "epoch": 0.29, + "learning_rate": 1.977795660445487e-06, + "loss": 1.042, + "step": 11142 + }, + { + "epoch": 0.29, + "learning_rate": 1.977789861434152e-06, + "loss": 0.8975, + "step": 11143 + }, + { + "epoch": 0.29, + "learning_rate": 1.977784061674168e-06, + "loss": 0.79, + "step": 11144 + }, + { + "epoch": 0.29, + "learning_rate": 1.9777782611655396e-06, + "loss": 0.9463, + "step": 11145 + }, + { + "epoch": 0.29, + "learning_rate": 1.9777724599082714e-06, + "loss": 0.9521, + "step": 11146 + }, + { + "epoch": 0.29, + "learning_rate": 1.977766657902368e-06, + "loss": 1.0908, + "step": 11147 + }, + { + "epoch": 0.29, + "learning_rate": 1.9777608551478334e-06, + "loss": 0.8779, + "step": 11148 + }, + { + "epoch": 0.29, + "learning_rate": 1.9777550516446726e-06, + "loss": 0.8379, + "step": 11149 + }, + { + "epoch": 0.29, + "learning_rate": 1.977749247392889e-06, + "loss": 0.6709, + "step": 11150 + }, + { + "epoch": 0.29, + "learning_rate": 1.9777434423924888e-06, + "loss": 0.9902, + "step": 11151 + }, + { + "epoch": 0.29, + "learning_rate": 1.9777376366434747e-06, + "loss": 0.9727, + "step": 11152 + }, + { + "epoch": 0.29, + "learning_rate": 1.977731830145852e-06, + "loss": 0.9521, + "step": 11153 + }, + { + "epoch": 0.29, + "learning_rate": 1.9777260228996247e-06, + "loss": 0.7026, + "step": 11154 + }, + { + "epoch": 0.29, + "learning_rate": 1.977720214904798e-06, + "loss": 0.7578, + "step": 11155 + }, + { + "epoch": 0.29, + "learning_rate": 1.9777144061613755e-06, + "loss": 0.8926, + "step": 11156 + }, + { + "epoch": 0.29, + "learning_rate": 1.9777085966693627e-06, + "loss": 0.958, + "step": 11157 + }, + { + "epoch": 0.29, + "learning_rate": 1.977702786428763e-06, + "loss": 0.6636, + "step": 11158 + }, + { + "epoch": 0.29, + "learning_rate": 1.9776969754395807e-06, + "loss": 1.0303, + "step": 11159 + }, + { + "epoch": 0.29, + "learning_rate": 1.9776911637018214e-06, + "loss": 0.9121, + "step": 11160 + }, + { + "epoch": 0.29, + "learning_rate": 1.9776853512154886e-06, + "loss": 1.0303, + "step": 11161 + }, + { + "epoch": 0.29, + "learning_rate": 1.977679537980587e-06, + "loss": 0.9199, + "step": 11162 + }, + { + "epoch": 0.29, + "learning_rate": 1.977673723997122e-06, + "loss": 0.7549, + "step": 11163 + }, + { + "epoch": 0.29, + "learning_rate": 1.9776679092650964e-06, + "loss": 0.7607, + "step": 11164 + }, + { + "epoch": 0.29, + "learning_rate": 1.9776620937845157e-06, + "loss": 0.875, + "step": 11165 + }, + { + "epoch": 0.29, + "learning_rate": 1.977656277555384e-06, + "loss": 0.8252, + "step": 11166 + }, + { + "epoch": 0.29, + "learning_rate": 1.9776504605777057e-06, + "loss": 1.0332, + "step": 11167 + }, + { + "epoch": 0.29, + "learning_rate": 1.9776446428514857e-06, + "loss": 0.7988, + "step": 11168 + }, + { + "epoch": 0.29, + "learning_rate": 1.977638824376728e-06, + "loss": 0.6409, + "step": 11169 + }, + { + "epoch": 0.29, + "learning_rate": 1.977633005153437e-06, + "loss": 0.9121, + "step": 11170 + }, + { + "epoch": 0.29, + "learning_rate": 1.9776271851816176e-06, + "loss": 1.0078, + "step": 11171 + }, + { + "epoch": 0.29, + "learning_rate": 1.977621364461274e-06, + "loss": 0.9424, + "step": 11172 + }, + { + "epoch": 0.29, + "learning_rate": 1.9776155429924107e-06, + "loss": 0.9512, + "step": 11173 + }, + { + "epoch": 0.29, + "learning_rate": 1.9776097207750318e-06, + "loss": 0.9023, + "step": 11174 + }, + { + "epoch": 0.29, + "learning_rate": 1.9776038978091426e-06, + "loss": 0.7568, + "step": 11175 + }, + { + "epoch": 0.29, + "learning_rate": 1.9775980740947465e-06, + "loss": 0.8955, + "step": 11176 + }, + { + "epoch": 0.29, + "learning_rate": 1.977592249631849e-06, + "loss": 0.7764, + "step": 11177 + }, + { + "epoch": 0.29, + "learning_rate": 1.977586424420454e-06, + "loss": 0.9141, + "step": 11178 + }, + { + "epoch": 0.29, + "learning_rate": 1.9775805984605658e-06, + "loss": 0.8037, + "step": 11179 + }, + { + "epoch": 0.29, + "learning_rate": 1.9775747717521894e-06, + "loss": 1.0918, + "step": 11180 + }, + { + "epoch": 0.29, + "learning_rate": 1.9775689442953285e-06, + "loss": 1.0049, + "step": 11181 + }, + { + "epoch": 0.29, + "learning_rate": 1.9775631160899883e-06, + "loss": 0.7715, + "step": 11182 + }, + { + "epoch": 0.29, + "learning_rate": 1.977557287136173e-06, + "loss": 0.7681, + "step": 11183 + }, + { + "epoch": 0.29, + "learning_rate": 1.9775514574338866e-06, + "loss": 0.7746, + "step": 11184 + }, + { + "epoch": 0.29, + "learning_rate": 1.977545626983135e-06, + "loss": 0.9375, + "step": 11185 + }, + { + "epoch": 0.29, + "learning_rate": 1.9775397957839207e-06, + "loss": 1.0205, + "step": 11186 + }, + { + "epoch": 0.29, + "learning_rate": 1.9775339638362496e-06, + "loss": 0.8623, + "step": 11187 + }, + { + "epoch": 0.29, + "learning_rate": 1.9775281311401253e-06, + "loss": 1.0811, + "step": 11188 + }, + { + "epoch": 0.29, + "learning_rate": 1.977522297695553e-06, + "loss": 0.9229, + "step": 11189 + }, + { + "epoch": 0.29, + "learning_rate": 1.977516463502537e-06, + "loss": 0.9688, + "step": 11190 + }, + { + "epoch": 0.29, + "learning_rate": 1.977510628561081e-06, + "loss": 0.8975, + "step": 11191 + }, + { + "epoch": 0.29, + "learning_rate": 1.9775047928711905e-06, + "loss": 0.9141, + "step": 11192 + }, + { + "epoch": 0.29, + "learning_rate": 1.977498956432869e-06, + "loss": 0.8569, + "step": 11193 + }, + { + "epoch": 0.29, + "learning_rate": 1.977493119246122e-06, + "loss": 1.0654, + "step": 11194 + }, + { + "epoch": 0.29, + "learning_rate": 1.9774872813109535e-06, + "loss": 0.9072, + "step": 11195 + }, + { + "epoch": 0.29, + "learning_rate": 1.977481442627368e-06, + "loss": 0.6484, + "step": 11196 + }, + { + "epoch": 0.29, + "learning_rate": 1.9774756031953692e-06, + "loss": 1.0137, + "step": 11197 + }, + { + "epoch": 0.29, + "learning_rate": 1.977469763014963e-06, + "loss": 0.8037, + "step": 11198 + }, + { + "epoch": 0.29, + "learning_rate": 1.977463922086153e-06, + "loss": 0.7891, + "step": 11199 + }, + { + "epoch": 0.29, + "learning_rate": 1.977458080408944e-06, + "loss": 0.8525, + "step": 11200 + }, + { + "epoch": 0.29, + "learning_rate": 1.9774522379833396e-06, + "loss": 0.9453, + "step": 11201 + }, + { + "epoch": 0.29, + "learning_rate": 1.9774463948093458e-06, + "loss": 0.9883, + "step": 11202 + }, + { + "epoch": 0.29, + "learning_rate": 1.9774405508869657e-06, + "loss": 0.8906, + "step": 11203 + }, + { + "epoch": 0.29, + "learning_rate": 1.977434706216204e-06, + "loss": 0.9785, + "step": 11204 + }, + { + "epoch": 0.29, + "learning_rate": 1.977428860797066e-06, + "loss": 0.9844, + "step": 11205 + }, + { + "epoch": 0.29, + "learning_rate": 1.9774230146295557e-06, + "loss": 0.8096, + "step": 11206 + }, + { + "epoch": 0.29, + "learning_rate": 1.9774171677136774e-06, + "loss": 0.9961, + "step": 11207 + }, + { + "epoch": 0.29, + "learning_rate": 1.977411320049436e-06, + "loss": 0.9038, + "step": 11208 + }, + { + "epoch": 0.29, + "learning_rate": 1.9774054716368353e-06, + "loss": 0.7363, + "step": 11209 + }, + { + "epoch": 0.29, + "learning_rate": 1.9773996224758805e-06, + "loss": 1.0791, + "step": 11210 + }, + { + "epoch": 0.29, + "learning_rate": 1.977393772566576e-06, + "loss": 0.9756, + "step": 11211 + }, + { + "epoch": 0.29, + "learning_rate": 1.9773879219089253e-06, + "loss": 0.7827, + "step": 11212 + }, + { + "epoch": 0.29, + "learning_rate": 1.9773820705029337e-06, + "loss": 0.7495, + "step": 11213 + }, + { + "epoch": 0.29, + "learning_rate": 1.977376218348606e-06, + "loss": 0.8486, + "step": 11214 + }, + { + "epoch": 0.29, + "learning_rate": 1.9773703654459458e-06, + "loss": 0.7783, + "step": 11215 + }, + { + "epoch": 0.29, + "learning_rate": 1.9773645117949587e-06, + "loss": 0.8252, + "step": 11216 + }, + { + "epoch": 0.29, + "learning_rate": 1.977358657395648e-06, + "loss": 0.8535, + "step": 11217 + }, + { + "epoch": 0.29, + "learning_rate": 1.977352802248019e-06, + "loss": 0.6978, + "step": 11218 + }, + { + "epoch": 0.29, + "learning_rate": 1.9773469463520755e-06, + "loss": 0.957, + "step": 11219 + }, + { + "epoch": 0.29, + "learning_rate": 1.977341089707823e-06, + "loss": 0.8823, + "step": 11220 + }, + { + "epoch": 0.29, + "learning_rate": 1.977335232315265e-06, + "loss": 0.8174, + "step": 11221 + }, + { + "epoch": 0.29, + "learning_rate": 1.9773293741744064e-06, + "loss": 0.9473, + "step": 11222 + }, + { + "epoch": 0.29, + "learning_rate": 1.9773235152852514e-06, + "loss": 0.9277, + "step": 11223 + }, + { + "epoch": 0.29, + "learning_rate": 1.977317655647805e-06, + "loss": 0.7871, + "step": 11224 + }, + { + "epoch": 0.29, + "learning_rate": 1.9773117952620714e-06, + "loss": 1.2305, + "step": 11225 + }, + { + "epoch": 0.29, + "learning_rate": 1.977305934128055e-06, + "loss": 0.5601, + "step": 11226 + }, + { + "epoch": 0.29, + "learning_rate": 1.9773000722457606e-06, + "loss": 0.7622, + "step": 11227 + }, + { + "epoch": 0.29, + "learning_rate": 1.977294209615192e-06, + "loss": 0.8018, + "step": 11228 + }, + { + "epoch": 0.29, + "learning_rate": 1.9772883462363544e-06, + "loss": 0.9951, + "step": 11229 + }, + { + "epoch": 0.29, + "learning_rate": 1.9772824821092523e-06, + "loss": 0.6323, + "step": 11230 + }, + { + "epoch": 0.29, + "learning_rate": 1.97727661723389e-06, + "loss": 0.9814, + "step": 11231 + }, + { + "epoch": 0.29, + "learning_rate": 1.9772707516102716e-06, + "loss": 0.7441, + "step": 11232 + }, + { + "epoch": 0.29, + "learning_rate": 1.9772648852384018e-06, + "loss": 0.8975, + "step": 11233 + }, + { + "epoch": 0.29, + "learning_rate": 1.9772590181182855e-06, + "loss": 0.8574, + "step": 11234 + }, + { + "epoch": 0.29, + "learning_rate": 1.9772531502499266e-06, + "loss": 0.6782, + "step": 11235 + }, + { + "epoch": 0.29, + "learning_rate": 1.97724728163333e-06, + "loss": 0.9893, + "step": 11236 + }, + { + "epoch": 0.29, + "learning_rate": 1.9772414122685003e-06, + "loss": 0.8574, + "step": 11237 + }, + { + "epoch": 0.29, + "learning_rate": 1.9772355421554423e-06, + "loss": 1.0645, + "step": 11238 + }, + { + "epoch": 0.29, + "learning_rate": 1.9772296712941594e-06, + "loss": 0.9316, + "step": 11239 + }, + { + "epoch": 0.29, + "learning_rate": 1.9772237996846562e-06, + "loss": 0.9482, + "step": 11240 + }, + { + "epoch": 0.29, + "learning_rate": 1.9772179273269384e-06, + "loss": 0.895, + "step": 11241 + }, + { + "epoch": 0.29, + "learning_rate": 1.9772120542210093e-06, + "loss": 0.9443, + "step": 11242 + }, + { + "epoch": 0.29, + "learning_rate": 1.977206180366874e-06, + "loss": 0.4089, + "step": 11243 + }, + { + "epoch": 0.29, + "learning_rate": 1.977200305764537e-06, + "loss": 0.6807, + "step": 11244 + }, + { + "epoch": 0.29, + "learning_rate": 1.9771944304140024e-06, + "loss": 0.959, + "step": 11245 + }, + { + "epoch": 0.29, + "learning_rate": 1.9771885543152755e-06, + "loss": 0.8848, + "step": 11246 + }, + { + "epoch": 0.29, + "learning_rate": 1.9771826774683597e-06, + "loss": 0.8936, + "step": 11247 + }, + { + "epoch": 0.29, + "learning_rate": 1.97717679987326e-06, + "loss": 0.8037, + "step": 11248 + }, + { + "epoch": 0.29, + "learning_rate": 1.9771709215299815e-06, + "loss": 0.9121, + "step": 11249 + }, + { + "epoch": 0.29, + "learning_rate": 1.977165042438528e-06, + "loss": 0.8647, + "step": 11250 + }, + { + "epoch": 0.29, + "learning_rate": 1.9771591625989037e-06, + "loss": 0.9521, + "step": 11251 + }, + { + "epoch": 0.29, + "learning_rate": 1.977153282011114e-06, + "loss": 1.0215, + "step": 11252 + }, + { + "epoch": 0.29, + "learning_rate": 1.977147400675163e-06, + "loss": 0.9385, + "step": 11253 + }, + { + "epoch": 0.29, + "learning_rate": 1.977141518591055e-06, + "loss": 0.7822, + "step": 11254 + }, + { + "epoch": 0.29, + "learning_rate": 1.9771356357587944e-06, + "loss": 0.9004, + "step": 11255 + }, + { + "epoch": 0.29, + "learning_rate": 1.9771297521783864e-06, + "loss": 1.1484, + "step": 11256 + }, + { + "epoch": 0.29, + "learning_rate": 1.977123867849835e-06, + "loss": 1.1091, + "step": 11257 + }, + { + "epoch": 0.29, + "learning_rate": 1.9771179827731445e-06, + "loss": 0.9316, + "step": 11258 + }, + { + "epoch": 0.29, + "learning_rate": 1.97711209694832e-06, + "loss": 0.9082, + "step": 11259 + }, + { + "epoch": 0.29, + "learning_rate": 1.9771062103753656e-06, + "loss": 1.04, + "step": 11260 + }, + { + "epoch": 0.29, + "learning_rate": 1.977100323054286e-06, + "loss": 0.853, + "step": 11261 + }, + { + "epoch": 0.29, + "learning_rate": 1.9770944349850854e-06, + "loss": 0.7334, + "step": 11262 + }, + { + "epoch": 0.29, + "learning_rate": 1.9770885461677687e-06, + "loss": 0.8213, + "step": 11263 + }, + { + "epoch": 0.29, + "learning_rate": 1.9770826566023402e-06, + "loss": 0.7622, + "step": 11264 + }, + { + "epoch": 0.29, + "learning_rate": 1.9770767662888042e-06, + "loss": 0.9658, + "step": 11265 + }, + { + "epoch": 0.29, + "learning_rate": 1.9770708752271658e-06, + "loss": 0.8594, + "step": 11266 + }, + { + "epoch": 0.29, + "learning_rate": 1.977064983417429e-06, + "loss": 0.834, + "step": 11267 + }, + { + "epoch": 0.29, + "learning_rate": 1.9770590908595984e-06, + "loss": 0.7637, + "step": 11268 + }, + { + "epoch": 0.29, + "learning_rate": 1.977053197553679e-06, + "loss": 0.8979, + "step": 11269 + }, + { + "epoch": 0.29, + "learning_rate": 1.977047303499674e-06, + "loss": 0.7842, + "step": 11270 + }, + { + "epoch": 0.29, + "learning_rate": 1.9770414086975894e-06, + "loss": 1.0938, + "step": 11271 + }, + { + "epoch": 0.29, + "learning_rate": 1.9770355131474293e-06, + "loss": 1.124, + "step": 11272 + }, + { + "epoch": 0.29, + "learning_rate": 1.9770296168491977e-06, + "loss": 0.9541, + "step": 11273 + }, + { + "epoch": 0.29, + "learning_rate": 1.9770237198028996e-06, + "loss": 1.1426, + "step": 11274 + }, + { + "epoch": 0.29, + "learning_rate": 1.9770178220085393e-06, + "loss": 0.7383, + "step": 11275 + }, + { + "epoch": 0.29, + "learning_rate": 1.9770119234661214e-06, + "loss": 0.8125, + "step": 11276 + }, + { + "epoch": 0.29, + "learning_rate": 1.97700602417565e-06, + "loss": 1.0244, + "step": 11277 + }, + { + "epoch": 0.29, + "learning_rate": 1.9770001241371307e-06, + "loss": 0.9199, + "step": 11278 + }, + { + "epoch": 0.29, + "learning_rate": 1.9769942233505672e-06, + "loss": 0.7959, + "step": 11279 + }, + { + "epoch": 0.29, + "learning_rate": 1.976988321815964e-06, + "loss": 0.8008, + "step": 11280 + }, + { + "epoch": 0.29, + "learning_rate": 1.9769824195333256e-06, + "loss": 0.7373, + "step": 11281 + }, + { + "epoch": 0.29, + "learning_rate": 1.9769765165026567e-06, + "loss": 1.0312, + "step": 11282 + }, + { + "epoch": 0.29, + "learning_rate": 1.976970612723962e-06, + "loss": 0.6875, + "step": 11283 + }, + { + "epoch": 0.29, + "learning_rate": 1.9769647081972458e-06, + "loss": 0.7422, + "step": 11284 + }, + { + "epoch": 0.29, + "learning_rate": 1.9769588029225126e-06, + "loss": 1.0156, + "step": 11285 + }, + { + "epoch": 0.29, + "learning_rate": 1.976952896899767e-06, + "loss": 0.7134, + "step": 11286 + }, + { + "epoch": 0.29, + "learning_rate": 1.9769469901290134e-06, + "loss": 0.8477, + "step": 11287 + }, + { + "epoch": 0.29, + "learning_rate": 1.9769410826102566e-06, + "loss": 0.9424, + "step": 11288 + }, + { + "epoch": 0.29, + "learning_rate": 1.9769351743435006e-06, + "loss": 0.7231, + "step": 11289 + }, + { + "epoch": 0.29, + "learning_rate": 1.9769292653287507e-06, + "loss": 0.6748, + "step": 11290 + }, + { + "epoch": 0.29, + "learning_rate": 1.9769233555660105e-06, + "loss": 1.0391, + "step": 11291 + }, + { + "epoch": 0.29, + "learning_rate": 1.976917445055285e-06, + "loss": 1.0264, + "step": 11292 + }, + { + "epoch": 0.29, + "learning_rate": 1.9769115337965793e-06, + "loss": 0.7861, + "step": 11293 + }, + { + "epoch": 0.29, + "learning_rate": 1.976905621789897e-06, + "loss": 1.1475, + "step": 11294 + }, + { + "epoch": 0.29, + "learning_rate": 1.9768997090352427e-06, + "loss": 0.8281, + "step": 11295 + }, + { + "epoch": 0.29, + "learning_rate": 1.976893795532622e-06, + "loss": 0.9424, + "step": 11296 + }, + { + "epoch": 0.29, + "learning_rate": 1.976887881282038e-06, + "loss": 0.9316, + "step": 11297 + }, + { + "epoch": 0.29, + "learning_rate": 1.976881966283496e-06, + "loss": 0.9443, + "step": 11298 + }, + { + "epoch": 0.29, + "learning_rate": 1.9768760505370005e-06, + "loss": 0.8584, + "step": 11299 + }, + { + "epoch": 0.29, + "learning_rate": 1.9768701340425557e-06, + "loss": 0.7727, + "step": 11300 + }, + { + "epoch": 0.29, + "learning_rate": 1.9768642168001665e-06, + "loss": 0.8691, + "step": 11301 + }, + { + "epoch": 0.29, + "learning_rate": 1.9768582988098374e-06, + "loss": 0.9619, + "step": 11302 + }, + { + "epoch": 0.29, + "learning_rate": 1.9768523800715727e-06, + "loss": 1.0449, + "step": 11303 + }, + { + "epoch": 0.29, + "learning_rate": 1.976846460585377e-06, + "loss": 1.0693, + "step": 11304 + }, + { + "epoch": 0.29, + "learning_rate": 1.9768405403512548e-06, + "loss": 1.083, + "step": 11305 + }, + { + "epoch": 0.29, + "learning_rate": 1.9768346193692113e-06, + "loss": 1.1006, + "step": 11306 + }, + { + "epoch": 0.29, + "learning_rate": 1.9768286976392495e-06, + "loss": 1.1113, + "step": 11307 + }, + { + "epoch": 0.29, + "learning_rate": 1.976822775161376e-06, + "loss": 0.9258, + "step": 11308 + }, + { + "epoch": 0.29, + "learning_rate": 1.9768168519355933e-06, + "loss": 0.8779, + "step": 11309 + }, + { + "epoch": 0.29, + "learning_rate": 1.9768109279619073e-06, + "loss": 0.8545, + "step": 11310 + }, + { + "epoch": 0.29, + "learning_rate": 1.9768050032403218e-06, + "loss": 0.8955, + "step": 11311 + }, + { + "epoch": 0.29, + "learning_rate": 1.9767990777708417e-06, + "loss": 0.7383, + "step": 11312 + }, + { + "epoch": 0.29, + "learning_rate": 1.9767931515534718e-06, + "loss": 0.7651, + "step": 11313 + }, + { + "epoch": 0.29, + "learning_rate": 1.9767872245882158e-06, + "loss": 0.9517, + "step": 11314 + }, + { + "epoch": 0.29, + "learning_rate": 1.976781296875079e-06, + "loss": 0.8564, + "step": 11315 + }, + { + "epoch": 0.29, + "learning_rate": 1.9767753684140656e-06, + "loss": 1.0479, + "step": 11316 + }, + { + "epoch": 0.29, + "learning_rate": 1.9767694392051802e-06, + "loss": 0.7622, + "step": 11317 + }, + { + "epoch": 0.29, + "learning_rate": 1.9767635092484275e-06, + "loss": 0.9033, + "step": 11318 + }, + { + "epoch": 0.29, + "learning_rate": 1.9767575785438116e-06, + "loss": 0.7617, + "step": 11319 + }, + { + "epoch": 0.29, + "learning_rate": 1.9767516470913376e-06, + "loss": 0.8735, + "step": 11320 + }, + { + "epoch": 0.29, + "learning_rate": 1.9767457148910097e-06, + "loss": 0.7563, + "step": 11321 + }, + { + "epoch": 0.29, + "learning_rate": 1.9767397819428326e-06, + "loss": 0.6709, + "step": 11322 + }, + { + "epoch": 0.29, + "learning_rate": 1.9767338482468106e-06, + "loss": 0.9082, + "step": 11323 + }, + { + "epoch": 0.29, + "learning_rate": 1.9767279138029487e-06, + "loss": 1.0625, + "step": 11324 + }, + { + "epoch": 0.29, + "learning_rate": 1.9767219786112507e-06, + "loss": 0.8662, + "step": 11325 + }, + { + "epoch": 0.29, + "learning_rate": 1.976716042671722e-06, + "loss": 0.9062, + "step": 11326 + }, + { + "epoch": 0.29, + "learning_rate": 1.9767101059843664e-06, + "loss": 0.9023, + "step": 11327 + }, + { + "epoch": 0.29, + "learning_rate": 1.976704168549189e-06, + "loss": 0.8496, + "step": 11328 + }, + { + "epoch": 0.29, + "learning_rate": 1.976698230366194e-06, + "loss": 0.917, + "step": 11329 + }, + { + "epoch": 0.29, + "learning_rate": 1.976692291435386e-06, + "loss": 0.8281, + "step": 11330 + }, + { + "epoch": 0.29, + "learning_rate": 1.9766863517567704e-06, + "loss": 0.9463, + "step": 11331 + }, + { + "epoch": 0.29, + "learning_rate": 1.9766804113303503e-06, + "loss": 0.8506, + "step": 11332 + }, + { + "epoch": 0.29, + "learning_rate": 1.9766744701561306e-06, + "loss": 1.0225, + "step": 11333 + }, + { + "epoch": 0.29, + "learning_rate": 1.9766685282341168e-06, + "loss": 1.0244, + "step": 11334 + }, + { + "epoch": 0.29, + "learning_rate": 1.976662585564312e-06, + "loss": 1.0312, + "step": 11335 + }, + { + "epoch": 0.29, + "learning_rate": 1.9766566421467227e-06, + "loss": 0.8965, + "step": 11336 + }, + { + "epoch": 0.29, + "learning_rate": 1.9766506979813515e-06, + "loss": 0.9443, + "step": 11337 + }, + { + "epoch": 0.29, + "learning_rate": 1.976644753068204e-06, + "loss": 1.0068, + "step": 11338 + }, + { + "epoch": 0.29, + "learning_rate": 1.9766388074072845e-06, + "loss": 1.0, + "step": 11339 + }, + { + "epoch": 0.29, + "learning_rate": 1.9766328609985977e-06, + "loss": 0.9141, + "step": 11340 + }, + { + "epoch": 0.29, + "learning_rate": 1.976626913842148e-06, + "loss": 0.7842, + "step": 11341 + }, + { + "epoch": 0.29, + "learning_rate": 1.97662096593794e-06, + "loss": 0.8906, + "step": 11342 + }, + { + "epoch": 0.29, + "learning_rate": 1.976615017285978e-06, + "loss": 0.8838, + "step": 11343 + }, + { + "epoch": 0.29, + "learning_rate": 1.976609067886267e-06, + "loss": 1.0459, + "step": 11344 + }, + { + "epoch": 0.29, + "learning_rate": 1.976603117738811e-06, + "loss": 0.9316, + "step": 11345 + }, + { + "epoch": 0.29, + "learning_rate": 1.976597166843615e-06, + "loss": 0.7778, + "step": 11346 + }, + { + "epoch": 0.29, + "learning_rate": 1.976591215200684e-06, + "loss": 1.0146, + "step": 11347 + }, + { + "epoch": 0.29, + "learning_rate": 1.9765852628100214e-06, + "loss": 0.8613, + "step": 11348 + }, + { + "epoch": 0.29, + "learning_rate": 1.9765793096716324e-06, + "loss": 0.8955, + "step": 11349 + }, + { + "epoch": 0.29, + "learning_rate": 1.976573355785522e-06, + "loss": 0.9561, + "step": 11350 + }, + { + "epoch": 0.29, + "learning_rate": 1.976567401151694e-06, + "loss": 0.9893, + "step": 11351 + }, + { + "epoch": 0.29, + "learning_rate": 1.9765614457701533e-06, + "loss": 0.8877, + "step": 11352 + }, + { + "epoch": 0.29, + "learning_rate": 1.976555489640904e-06, + "loss": 0.8232, + "step": 11353 + }, + { + "epoch": 0.29, + "learning_rate": 1.9765495327639515e-06, + "loss": 0.9287, + "step": 11354 + }, + { + "epoch": 0.29, + "learning_rate": 1.9765435751393e-06, + "loss": 1.0029, + "step": 11355 + }, + { + "epoch": 0.29, + "learning_rate": 1.9765376167669537e-06, + "loss": 1.2188, + "step": 11356 + }, + { + "epoch": 0.29, + "learning_rate": 1.9765316576469176e-06, + "loss": 0.8613, + "step": 11357 + }, + { + "epoch": 0.29, + "learning_rate": 1.976525697779196e-06, + "loss": 0.6992, + "step": 11358 + }, + { + "epoch": 0.29, + "learning_rate": 1.9765197371637937e-06, + "loss": 0.752, + "step": 11359 + }, + { + "epoch": 0.29, + "learning_rate": 1.9765137758007152e-06, + "loss": 0.9492, + "step": 11360 + }, + { + "epoch": 0.29, + "learning_rate": 1.976507813689965e-06, + "loss": 0.8389, + "step": 11361 + }, + { + "epoch": 0.29, + "learning_rate": 1.9765018508315477e-06, + "loss": 0.77, + "step": 11362 + }, + { + "epoch": 0.29, + "learning_rate": 1.9764958872254675e-06, + "loss": 0.8594, + "step": 11363 + }, + { + "epoch": 0.29, + "learning_rate": 1.9764899228717296e-06, + "loss": 1.0508, + "step": 11364 + }, + { + "epoch": 0.29, + "learning_rate": 1.976483957770338e-06, + "loss": 0.7266, + "step": 11365 + }, + { + "epoch": 0.29, + "learning_rate": 1.9764779919212978e-06, + "loss": 1.1133, + "step": 11366 + }, + { + "epoch": 0.29, + "learning_rate": 1.976472025324613e-06, + "loss": 1.1289, + "step": 11367 + }, + { + "epoch": 0.29, + "learning_rate": 1.9764660579802887e-06, + "loss": 0.752, + "step": 11368 + }, + { + "epoch": 0.29, + "learning_rate": 1.9764600898883296e-06, + "loss": 0.9404, + "step": 11369 + }, + { + "epoch": 0.29, + "learning_rate": 1.9764541210487395e-06, + "loss": 1.0215, + "step": 11370 + }, + { + "epoch": 0.29, + "learning_rate": 1.9764481514615234e-06, + "loss": 0.9468, + "step": 11371 + }, + { + "epoch": 0.29, + "learning_rate": 1.9764421811266855e-06, + "loss": 0.8867, + "step": 11372 + }, + { + "epoch": 0.29, + "learning_rate": 1.9764362100442313e-06, + "loss": 0.9395, + "step": 11373 + }, + { + "epoch": 0.29, + "learning_rate": 1.9764302382141643e-06, + "loss": 0.9365, + "step": 11374 + }, + { + "epoch": 0.29, + "learning_rate": 1.97642426563649e-06, + "loss": 0.7734, + "step": 11375 + }, + { + "epoch": 0.29, + "learning_rate": 1.9764182923112123e-06, + "loss": 0.7246, + "step": 11376 + }, + { + "epoch": 0.29, + "learning_rate": 1.9764123182383363e-06, + "loss": 0.9023, + "step": 11377 + }, + { + "epoch": 0.29, + "learning_rate": 1.976406343417866e-06, + "loss": 1.0352, + "step": 11378 + }, + { + "epoch": 0.29, + "learning_rate": 1.976400367849806e-06, + "loss": 0.874, + "step": 11379 + }, + { + "epoch": 0.29, + "learning_rate": 1.9763943915341618e-06, + "loss": 1.0059, + "step": 11380 + }, + { + "epoch": 0.29, + "learning_rate": 1.9763884144709367e-06, + "loss": 0.666, + "step": 11381 + }, + { + "epoch": 0.29, + "learning_rate": 1.9763824366601365e-06, + "loss": 0.7412, + "step": 11382 + }, + { + "epoch": 0.29, + "learning_rate": 1.9763764581017644e-06, + "loss": 1.0444, + "step": 11383 + }, + { + "epoch": 0.29, + "learning_rate": 1.9763704787958265e-06, + "loss": 1.1289, + "step": 11384 + }, + { + "epoch": 0.29, + "learning_rate": 1.976364498742326e-06, + "loss": 0.7964, + "step": 11385 + }, + { + "epoch": 0.29, + "learning_rate": 1.9763585179412683e-06, + "loss": 0.7363, + "step": 11386 + }, + { + "epoch": 0.29, + "learning_rate": 1.9763525363926582e-06, + "loss": 0.916, + "step": 11387 + }, + { + "epoch": 0.29, + "learning_rate": 1.9763465540964992e-06, + "loss": 0.9971, + "step": 11388 + }, + { + "epoch": 0.29, + "learning_rate": 1.9763405710527968e-06, + "loss": 0.7627, + "step": 11389 + }, + { + "epoch": 0.29, + "learning_rate": 1.9763345872615555e-06, + "loss": 1.0381, + "step": 11390 + }, + { + "epoch": 0.29, + "learning_rate": 1.97632860272278e-06, + "loss": 0.9844, + "step": 11391 + }, + { + "epoch": 0.29, + "learning_rate": 1.9763226174364738e-06, + "loss": 0.7385, + "step": 11392 + }, + { + "epoch": 0.29, + "learning_rate": 1.9763166314026425e-06, + "loss": 0.9023, + "step": 11393 + }, + { + "epoch": 0.29, + "learning_rate": 1.9763106446212907e-06, + "loss": 0.835, + "step": 11394 + }, + { + "epoch": 0.29, + "learning_rate": 1.9763046570924226e-06, + "loss": 1.0049, + "step": 11395 + }, + { + "epoch": 0.29, + "learning_rate": 1.976298668816043e-06, + "loss": 0.8867, + "step": 11396 + }, + { + "epoch": 0.29, + "learning_rate": 1.976292679792156e-06, + "loss": 0.9531, + "step": 11397 + }, + { + "epoch": 0.29, + "learning_rate": 1.976286690020767e-06, + "loss": 1.0273, + "step": 11398 + }, + { + "epoch": 0.29, + "learning_rate": 1.9762806995018797e-06, + "loss": 1.0352, + "step": 11399 + }, + { + "epoch": 0.29, + "learning_rate": 1.9762747082355e-06, + "loss": 1.0156, + "step": 11400 + }, + { + "epoch": 0.29, + "learning_rate": 1.976268716221631e-06, + "loss": 1.083, + "step": 11401 + }, + { + "epoch": 0.29, + "learning_rate": 1.976262723460278e-06, + "loss": 0.8965, + "step": 11402 + }, + { + "epoch": 0.29, + "learning_rate": 1.9762567299514455e-06, + "loss": 0.7744, + "step": 11403 + }, + { + "epoch": 0.29, + "learning_rate": 1.9762507356951385e-06, + "loss": 1.0234, + "step": 11404 + }, + { + "epoch": 0.29, + "learning_rate": 1.976244740691361e-06, + "loss": 0.8232, + "step": 11405 + }, + { + "epoch": 0.29, + "learning_rate": 1.976238744940118e-06, + "loss": 0.8984, + "step": 11406 + }, + { + "epoch": 0.29, + "learning_rate": 1.976232748441413e-06, + "loss": 1.0684, + "step": 11407 + }, + { + "epoch": 0.29, + "learning_rate": 1.9762267511952525e-06, + "loss": 0.7146, + "step": 11408 + }, + { + "epoch": 0.29, + "learning_rate": 1.9762207532016396e-06, + "loss": 0.8311, + "step": 11409 + }, + { + "epoch": 0.29, + "learning_rate": 1.9762147544605794e-06, + "loss": 1.1826, + "step": 11410 + }, + { + "epoch": 0.29, + "learning_rate": 1.976208754972076e-06, + "loss": 0.7529, + "step": 11411 + }, + { + "epoch": 0.29, + "learning_rate": 1.976202754736135e-06, + "loss": 1.0527, + "step": 11412 + }, + { + "epoch": 0.29, + "learning_rate": 1.9761967537527605e-06, + "loss": 0.8682, + "step": 11413 + }, + { + "epoch": 0.29, + "learning_rate": 1.976190752021957e-06, + "loss": 0.9482, + "step": 11414 + }, + { + "epoch": 0.29, + "learning_rate": 1.976184749543729e-06, + "loss": 0.7686, + "step": 11415 + }, + { + "epoch": 0.29, + "learning_rate": 1.976178746318081e-06, + "loss": 0.875, + "step": 11416 + }, + { + "epoch": 0.29, + "learning_rate": 1.9761727423450184e-06, + "loss": 0.8799, + "step": 11417 + }, + { + "epoch": 0.29, + "learning_rate": 1.9761667376245447e-06, + "loss": 1.0215, + "step": 11418 + }, + { + "epoch": 0.29, + "learning_rate": 1.976160732156665e-06, + "loss": 0.9746, + "step": 11419 + }, + { + "epoch": 0.29, + "learning_rate": 1.976154725941384e-06, + "loss": 0.999, + "step": 11420 + }, + { + "epoch": 0.29, + "learning_rate": 1.9761487189787067e-06, + "loss": 0.9336, + "step": 11421 + }, + { + "epoch": 0.29, + "learning_rate": 1.9761427112686366e-06, + "loss": 0.8423, + "step": 11422 + }, + { + "epoch": 0.29, + "learning_rate": 1.976136702811179e-06, + "loss": 0.9678, + "step": 11423 + }, + { + "epoch": 0.29, + "learning_rate": 1.9761306936063382e-06, + "loss": 1.0361, + "step": 11424 + }, + { + "epoch": 0.29, + "learning_rate": 1.97612468365412e-06, + "loss": 0.8604, + "step": 11425 + }, + { + "epoch": 0.29, + "learning_rate": 1.9761186729545273e-06, + "loss": 1.0068, + "step": 11426 + }, + { + "epoch": 0.29, + "learning_rate": 1.976112661507565e-06, + "loss": 0.9385, + "step": 11427 + }, + { + "epoch": 0.29, + "learning_rate": 1.9761066493132386e-06, + "loss": 0.876, + "step": 11428 + }, + { + "epoch": 0.29, + "learning_rate": 1.9761006363715525e-06, + "loss": 1.0303, + "step": 11429 + }, + { + "epoch": 0.29, + "learning_rate": 1.9760946226825106e-06, + "loss": 1.1357, + "step": 11430 + }, + { + "epoch": 0.29, + "learning_rate": 1.976088608246118e-06, + "loss": 0.8711, + "step": 11431 + }, + { + "epoch": 0.29, + "learning_rate": 1.9760825930623796e-06, + "loss": 0.6274, + "step": 11432 + }, + { + "epoch": 0.29, + "learning_rate": 1.976076577131299e-06, + "loss": 0.7412, + "step": 11433 + }, + { + "epoch": 0.29, + "learning_rate": 1.9760705604528818e-06, + "loss": 0.8232, + "step": 11434 + }, + { + "epoch": 0.29, + "learning_rate": 1.9760645430271324e-06, + "loss": 0.8936, + "step": 11435 + }, + { + "epoch": 0.29, + "learning_rate": 1.9760585248540548e-06, + "loss": 1.1602, + "step": 11436 + }, + { + "epoch": 0.29, + "learning_rate": 1.9760525059336548e-06, + "loss": 0.917, + "step": 11437 + }, + { + "epoch": 0.29, + "learning_rate": 1.976046486265936e-06, + "loss": 0.6792, + "step": 11438 + }, + { + "epoch": 0.29, + "learning_rate": 1.9760404658509026e-06, + "loss": 0.7144, + "step": 11439 + }, + { + "epoch": 0.29, + "learning_rate": 1.9760344446885605e-06, + "loss": 0.7168, + "step": 11440 + }, + { + "epoch": 0.29, + "learning_rate": 1.9760284227789135e-06, + "loss": 0.7754, + "step": 11441 + }, + { + "epoch": 0.29, + "learning_rate": 1.9760224001219666e-06, + "loss": 0.834, + "step": 11442 + }, + { + "epoch": 0.29, + "learning_rate": 1.976016376717724e-06, + "loss": 1.0166, + "step": 11443 + }, + { + "epoch": 0.29, + "learning_rate": 1.9760103525661908e-06, + "loss": 1.2617, + "step": 11444 + }, + { + "epoch": 0.29, + "learning_rate": 1.9760043276673713e-06, + "loss": 0.8994, + "step": 11445 + }, + { + "epoch": 0.29, + "learning_rate": 1.9759983020212705e-06, + "loss": 1.0693, + "step": 11446 + }, + { + "epoch": 0.29, + "learning_rate": 1.975992275627892e-06, + "loss": 1.1963, + "step": 11447 + }, + { + "epoch": 0.29, + "learning_rate": 1.975986248487241e-06, + "loss": 0.958, + "step": 11448 + }, + { + "epoch": 0.29, + "learning_rate": 1.975980220599323e-06, + "loss": 0.9189, + "step": 11449 + }, + { + "epoch": 0.29, + "learning_rate": 1.9759741919641415e-06, + "loss": 0.9629, + "step": 11450 + }, + { + "epoch": 0.29, + "learning_rate": 1.9759681625817013e-06, + "loss": 0.9346, + "step": 11451 + }, + { + "epoch": 0.29, + "learning_rate": 1.975962132452007e-06, + "loss": 0.5938, + "step": 11452 + }, + { + "epoch": 0.29, + "learning_rate": 1.9759561015750635e-06, + "loss": 0.9756, + "step": 11453 + }, + { + "epoch": 0.29, + "learning_rate": 1.9759500699508756e-06, + "loss": 1.1289, + "step": 11454 + }, + { + "epoch": 0.29, + "learning_rate": 1.975944037579447e-06, + "loss": 0.7905, + "step": 11455 + }, + { + "epoch": 0.29, + "learning_rate": 1.9759380044607836e-06, + "loss": 0.9297, + "step": 11456 + }, + { + "epoch": 0.29, + "learning_rate": 1.9759319705948887e-06, + "loss": 0.8032, + "step": 11457 + }, + { + "epoch": 0.29, + "learning_rate": 1.975925935981768e-06, + "loss": 1.0986, + "step": 11458 + }, + { + "epoch": 0.29, + "learning_rate": 1.975919900621426e-06, + "loss": 0.8848, + "step": 11459 + }, + { + "epoch": 0.29, + "learning_rate": 1.9759138645138664e-06, + "loss": 0.665, + "step": 11460 + }, + { + "epoch": 0.29, + "learning_rate": 1.9759078276590947e-06, + "loss": 0.9922, + "step": 11461 + }, + { + "epoch": 0.29, + "learning_rate": 1.975901790057115e-06, + "loss": 0.9697, + "step": 11462 + }, + { + "epoch": 0.29, + "learning_rate": 1.9758957517079323e-06, + "loss": 0.9248, + "step": 11463 + }, + { + "epoch": 0.29, + "learning_rate": 1.9758897126115514e-06, + "loss": 0.7427, + "step": 11464 + }, + { + "epoch": 0.29, + "learning_rate": 1.9758836727679765e-06, + "loss": 0.9697, + "step": 11465 + }, + { + "epoch": 0.29, + "learning_rate": 1.9758776321772118e-06, + "loss": 0.6082, + "step": 11466 + }, + { + "epoch": 0.29, + "learning_rate": 1.9758715908392628e-06, + "loss": 1.0557, + "step": 11467 + }, + { + "epoch": 0.29, + "learning_rate": 1.975865548754134e-06, + "loss": 0.9502, + "step": 11468 + }, + { + "epoch": 0.29, + "learning_rate": 1.9758595059218297e-06, + "loss": 0.9014, + "step": 11469 + }, + { + "epoch": 0.29, + "learning_rate": 1.975853462342355e-06, + "loss": 0.875, + "step": 11470 + }, + { + "epoch": 0.29, + "learning_rate": 1.9758474180157134e-06, + "loss": 1.0547, + "step": 11471 + }, + { + "epoch": 0.29, + "learning_rate": 1.975841372941911e-06, + "loss": 0.832, + "step": 11472 + }, + { + "epoch": 0.29, + "learning_rate": 1.975835327120951e-06, + "loss": 0.79, + "step": 11473 + }, + { + "epoch": 0.29, + "learning_rate": 1.9758292805528395e-06, + "loss": 0.8037, + "step": 11474 + }, + { + "epoch": 0.29, + "learning_rate": 1.97582323323758e-06, + "loss": 1.0312, + "step": 11475 + }, + { + "epoch": 0.29, + "learning_rate": 1.9758171851751776e-06, + "loss": 0.7975, + "step": 11476 + }, + { + "epoch": 0.29, + "learning_rate": 1.975811136365637e-06, + "loss": 1.0723, + "step": 11477 + }, + { + "epoch": 0.29, + "learning_rate": 1.9758050868089624e-06, + "loss": 0.8486, + "step": 11478 + }, + { + "epoch": 0.29, + "learning_rate": 1.975799036505159e-06, + "loss": 0.8584, + "step": 11479 + }, + { + "epoch": 0.29, + "learning_rate": 1.975792985454231e-06, + "loss": 0.7942, + "step": 11480 + }, + { + "epoch": 0.29, + "learning_rate": 1.975786933656183e-06, + "loss": 0.7246, + "step": 11481 + }, + { + "epoch": 0.29, + "learning_rate": 1.97578088111102e-06, + "loss": 1.0176, + "step": 11482 + }, + { + "epoch": 0.29, + "learning_rate": 1.9757748278187468e-06, + "loss": 0.8667, + "step": 11483 + }, + { + "epoch": 0.29, + "learning_rate": 1.975768773779367e-06, + "loss": 1.0898, + "step": 11484 + }, + { + "epoch": 0.29, + "learning_rate": 1.9757627189928864e-06, + "loss": 0.9189, + "step": 11485 + }, + { + "epoch": 0.29, + "learning_rate": 1.975756663459309e-06, + "loss": 1.0527, + "step": 11486 + }, + { + "epoch": 0.29, + "learning_rate": 1.9757506071786395e-06, + "loss": 0.8486, + "step": 11487 + }, + { + "epoch": 0.29, + "learning_rate": 1.975744550150883e-06, + "loss": 1.0742, + "step": 11488 + }, + { + "epoch": 0.29, + "learning_rate": 1.975738492376043e-06, + "loss": 1.1816, + "step": 11489 + }, + { + "epoch": 0.29, + "learning_rate": 1.975732433854126e-06, + "loss": 1.0879, + "step": 11490 + }, + { + "epoch": 0.29, + "learning_rate": 1.9757263745851348e-06, + "loss": 0.9482, + "step": 11491 + }, + { + "epoch": 0.29, + "learning_rate": 1.9757203145690746e-06, + "loss": 1.0088, + "step": 11492 + }, + { + "epoch": 0.29, + "learning_rate": 1.9757142538059505e-06, + "loss": 1.0264, + "step": 11493 + }, + { + "epoch": 0.29, + "learning_rate": 1.975708192295767e-06, + "loss": 0.8384, + "step": 11494 + }, + { + "epoch": 0.29, + "learning_rate": 1.9757021300385284e-06, + "loss": 0.9268, + "step": 11495 + }, + { + "epoch": 0.29, + "learning_rate": 1.9756960670342394e-06, + "loss": 0.7544, + "step": 11496 + }, + { + "epoch": 0.29, + "learning_rate": 1.975690003282905e-06, + "loss": 1.0713, + "step": 11497 + }, + { + "epoch": 0.29, + "learning_rate": 1.97568393878453e-06, + "loss": 0.9453, + "step": 11498 + }, + { + "epoch": 0.29, + "learning_rate": 1.9756778735391183e-06, + "loss": 0.9414, + "step": 11499 + }, + { + "epoch": 0.29, + "learning_rate": 1.975671807546675e-06, + "loss": 0.8081, + "step": 11500 + }, + { + "epoch": 0.29, + "learning_rate": 1.9756657408072044e-06, + "loss": 0.8271, + "step": 11501 + }, + { + "epoch": 0.29, + "learning_rate": 1.975659673320712e-06, + "loss": 1.0303, + "step": 11502 + }, + { + "epoch": 0.29, + "learning_rate": 1.975653605087201e-06, + "loss": 0.6865, + "step": 11503 + }, + { + "epoch": 0.29, + "learning_rate": 1.9756475361066777e-06, + "loss": 0.9971, + "step": 11504 + }, + { + "epoch": 0.29, + "learning_rate": 1.9756414663791456e-06, + "loss": 0.9167, + "step": 11505 + }, + { + "epoch": 0.29, + "learning_rate": 1.9756353959046095e-06, + "loss": 0.8486, + "step": 11506 + }, + { + "epoch": 0.29, + "learning_rate": 1.9756293246830743e-06, + "loss": 0.7622, + "step": 11507 + }, + { + "epoch": 0.29, + "learning_rate": 1.9756232527145445e-06, + "loss": 0.8125, + "step": 11508 + }, + { + "epoch": 0.29, + "learning_rate": 1.975617179999025e-06, + "loss": 0.7146, + "step": 11509 + }, + { + "epoch": 0.3, + "learning_rate": 1.9756111065365204e-06, + "loss": 0.7915, + "step": 11510 + }, + { + "epoch": 0.3, + "learning_rate": 1.9756050323270354e-06, + "loss": 0.7783, + "step": 11511 + }, + { + "epoch": 0.3, + "learning_rate": 1.975598957370574e-06, + "loss": 0.8013, + "step": 11512 + }, + { + "epoch": 0.3, + "learning_rate": 1.9755928816671415e-06, + "loss": 0.9033, + "step": 11513 + }, + { + "epoch": 0.3, + "learning_rate": 1.9755868052167427e-06, + "loss": 0.6582, + "step": 11514 + }, + { + "epoch": 0.3, + "learning_rate": 1.9755807280193815e-06, + "loss": 1.0459, + "step": 11515 + }, + { + "epoch": 0.3, + "learning_rate": 1.9755746500750636e-06, + "loss": 0.8237, + "step": 11516 + }, + { + "epoch": 0.3, + "learning_rate": 1.9755685713837925e-06, + "loss": 0.9297, + "step": 11517 + }, + { + "epoch": 0.3, + "learning_rate": 1.9755624919455736e-06, + "loss": 0.7891, + "step": 11518 + }, + { + "epoch": 0.3, + "learning_rate": 1.9755564117604113e-06, + "loss": 0.8447, + "step": 11519 + }, + { + "epoch": 0.3, + "learning_rate": 1.97555033082831e-06, + "loss": 0.9795, + "step": 11520 + }, + { + "epoch": 0.3, + "learning_rate": 1.975544249149275e-06, + "loss": 0.8652, + "step": 11521 + }, + { + "epoch": 0.3, + "learning_rate": 1.975538166723311e-06, + "loss": 0.832, + "step": 11522 + }, + { + "epoch": 0.3, + "learning_rate": 1.9755320835504215e-06, + "loss": 1.0635, + "step": 11523 + }, + { + "epoch": 0.3, + "learning_rate": 1.9755259996306126e-06, + "loss": 0.7441, + "step": 11524 + }, + { + "epoch": 0.3, + "learning_rate": 1.975519914963888e-06, + "loss": 0.959, + "step": 11525 + }, + { + "epoch": 0.3, + "learning_rate": 1.9755138295502526e-06, + "loss": 0.8022, + "step": 11526 + }, + { + "epoch": 0.3, + "learning_rate": 1.975507743389711e-06, + "loss": 1.0234, + "step": 11527 + }, + { + "epoch": 0.3, + "learning_rate": 1.9755016564822684e-06, + "loss": 0.8252, + "step": 11528 + }, + { + "epoch": 0.3, + "learning_rate": 1.9754955688279285e-06, + "loss": 1.1387, + "step": 11529 + }, + { + "epoch": 0.3, + "learning_rate": 1.975489480426697e-06, + "loss": 0.9033, + "step": 11530 + }, + { + "epoch": 0.3, + "learning_rate": 1.975483391278578e-06, + "loss": 0.9326, + "step": 11531 + }, + { + "epoch": 0.3, + "learning_rate": 1.975477301383576e-06, + "loss": 0.9277, + "step": 11532 + }, + { + "epoch": 0.3, + "learning_rate": 1.9754712107416963e-06, + "loss": 1.0195, + "step": 11533 + }, + { + "epoch": 0.3, + "learning_rate": 1.9754651193529427e-06, + "loss": 0.96, + "step": 11534 + }, + { + "epoch": 0.3, + "learning_rate": 1.9754590272173204e-06, + "loss": 1.0615, + "step": 11535 + }, + { + "epoch": 0.3, + "learning_rate": 1.975452934334834e-06, + "loss": 0.8013, + "step": 11536 + }, + { + "epoch": 0.3, + "learning_rate": 1.975446840705488e-06, + "loss": 0.708, + "step": 11537 + }, + { + "epoch": 0.3, + "learning_rate": 1.9754407463292874e-06, + "loss": 0.9844, + "step": 11538 + }, + { + "epoch": 0.3, + "learning_rate": 1.9754346512062366e-06, + "loss": 0.8135, + "step": 11539 + }, + { + "epoch": 0.3, + "learning_rate": 1.9754285553363404e-06, + "loss": 1.0713, + "step": 11540 + }, + { + "epoch": 0.3, + "learning_rate": 1.9754224587196037e-06, + "loss": 0.9092, + "step": 11541 + }, + { + "epoch": 0.3, + "learning_rate": 1.9754163613560305e-06, + "loss": 1.001, + "step": 11542 + }, + { + "epoch": 0.3, + "learning_rate": 1.975410263245626e-06, + "loss": 0.9541, + "step": 11543 + }, + { + "epoch": 0.3, + "learning_rate": 1.9754041643883943e-06, + "loss": 0.8047, + "step": 11544 + }, + { + "epoch": 0.3, + "learning_rate": 1.975398064784341e-06, + "loss": 0.7129, + "step": 11545 + }, + { + "epoch": 0.3, + "learning_rate": 1.97539196443347e-06, + "loss": 0.8086, + "step": 11546 + }, + { + "epoch": 0.3, + "learning_rate": 1.975385863335786e-06, + "loss": 0.7983, + "step": 11547 + }, + { + "epoch": 0.3, + "learning_rate": 1.9753797614912943e-06, + "loss": 1.0391, + "step": 11548 + }, + { + "epoch": 0.3, + "learning_rate": 1.9753736588999993e-06, + "loss": 0.957, + "step": 11549 + }, + { + "epoch": 0.3, + "learning_rate": 1.975367555561905e-06, + "loss": 0.7744, + "step": 11550 + }, + { + "epoch": 0.3, + "learning_rate": 1.975361451477017e-06, + "loss": 0.7168, + "step": 11551 + }, + { + "epoch": 0.3, + "learning_rate": 1.9753553466453393e-06, + "loss": 0.8818, + "step": 11552 + }, + { + "epoch": 0.3, + "learning_rate": 1.9753492410668772e-06, + "loss": 1.2031, + "step": 11553 + }, + { + "epoch": 0.3, + "learning_rate": 1.975343134741635e-06, + "loss": 1.0469, + "step": 11554 + }, + { + "epoch": 0.3, + "learning_rate": 1.975337027669617e-06, + "loss": 0.7178, + "step": 11555 + }, + { + "epoch": 0.3, + "learning_rate": 1.9753309198508285e-06, + "loss": 0.793, + "step": 11556 + }, + { + "epoch": 0.3, + "learning_rate": 1.975324811285274e-06, + "loss": 0.7727, + "step": 11557 + }, + { + "epoch": 0.3, + "learning_rate": 1.9753187019729583e-06, + "loss": 0.7705, + "step": 11558 + }, + { + "epoch": 0.3, + "learning_rate": 1.9753125919138854e-06, + "loss": 0.8364, + "step": 11559 + }, + { + "epoch": 0.3, + "learning_rate": 1.975306481108061e-06, + "loss": 0.8643, + "step": 11560 + }, + { + "epoch": 0.3, + "learning_rate": 1.975300369555489e-06, + "loss": 0.8279, + "step": 11561 + }, + { + "epoch": 0.3, + "learning_rate": 1.9752942572561747e-06, + "loss": 0.9404, + "step": 11562 + }, + { + "epoch": 0.3, + "learning_rate": 1.9752881442101223e-06, + "loss": 1.0732, + "step": 11563 + }, + { + "epoch": 0.3, + "learning_rate": 1.9752820304173367e-06, + "loss": 0.9395, + "step": 11564 + }, + { + "epoch": 0.3, + "learning_rate": 1.975275915877822e-06, + "loss": 0.8506, + "step": 11565 + }, + { + "epoch": 0.3, + "learning_rate": 1.9752698005915836e-06, + "loss": 1.1201, + "step": 11566 + }, + { + "epoch": 0.3, + "learning_rate": 1.9752636845586262e-06, + "loss": 1.0283, + "step": 11567 + }, + { + "epoch": 0.3, + "learning_rate": 1.975257567778954e-06, + "loss": 0.9199, + "step": 11568 + }, + { + "epoch": 0.3, + "learning_rate": 1.975251450252572e-06, + "loss": 0.9375, + "step": 11569 + }, + { + "epoch": 0.3, + "learning_rate": 1.9752453319794847e-06, + "loss": 0.9893, + "step": 11570 + }, + { + "epoch": 0.3, + "learning_rate": 1.9752392129596973e-06, + "loss": 0.8088, + "step": 11571 + }, + { + "epoch": 0.3, + "learning_rate": 1.9752330931932135e-06, + "loss": 0.9619, + "step": 11572 + }, + { + "epoch": 0.3, + "learning_rate": 1.9752269726800393e-06, + "loss": 0.9775, + "step": 11573 + }, + { + "epoch": 0.3, + "learning_rate": 1.975220851420178e-06, + "loss": 0.9717, + "step": 11574 + }, + { + "epoch": 0.3, + "learning_rate": 1.975214729413635e-06, + "loss": 0.8457, + "step": 11575 + }, + { + "epoch": 0.3, + "learning_rate": 1.9752086066604153e-06, + "loss": 0.9648, + "step": 11576 + }, + { + "epoch": 0.3, + "learning_rate": 1.975202483160523e-06, + "loss": 0.9893, + "step": 11577 + }, + { + "epoch": 0.3, + "learning_rate": 1.975196358913963e-06, + "loss": 0.9053, + "step": 11578 + }, + { + "epoch": 0.3, + "learning_rate": 1.97519023392074e-06, + "loss": 0.7979, + "step": 11579 + }, + { + "epoch": 0.3, + "learning_rate": 1.9751841081808586e-06, + "loss": 0.9243, + "step": 11580 + }, + { + "epoch": 0.3, + "learning_rate": 1.9751779816943233e-06, + "loss": 0.9834, + "step": 11581 + }, + { + "epoch": 0.3, + "learning_rate": 1.9751718544611395e-06, + "loss": 1.0938, + "step": 11582 + }, + { + "epoch": 0.3, + "learning_rate": 1.9751657264813114e-06, + "loss": 0.9736, + "step": 11583 + }, + { + "epoch": 0.3, + "learning_rate": 1.975159597754844e-06, + "loss": 0.958, + "step": 11584 + }, + { + "epoch": 0.3, + "learning_rate": 1.975153468281741e-06, + "loss": 0.8154, + "step": 11585 + }, + { + "epoch": 0.3, + "learning_rate": 1.9751473380620082e-06, + "loss": 1.0645, + "step": 11586 + }, + { + "epoch": 0.3, + "learning_rate": 1.97514120709565e-06, + "loss": 0.96, + "step": 11587 + }, + { + "epoch": 0.3, + "learning_rate": 1.975135075382671e-06, + "loss": 0.8027, + "step": 11588 + }, + { + "epoch": 0.3, + "learning_rate": 1.975128942923076e-06, + "loss": 0.8525, + "step": 11589 + }, + { + "epoch": 0.3, + "learning_rate": 1.9751228097168694e-06, + "loss": 0.9541, + "step": 11590 + }, + { + "epoch": 0.3, + "learning_rate": 1.9751166757640563e-06, + "loss": 0.7722, + "step": 11591 + }, + { + "epoch": 0.3, + "learning_rate": 1.975110541064641e-06, + "loss": 1.1426, + "step": 11592 + }, + { + "epoch": 0.3, + "learning_rate": 1.9751044056186285e-06, + "loss": 0.875, + "step": 11593 + }, + { + "epoch": 0.3, + "learning_rate": 1.9750982694260236e-06, + "loss": 0.9199, + "step": 11594 + }, + { + "epoch": 0.3, + "learning_rate": 1.9750921324868303e-06, + "loss": 0.8613, + "step": 11595 + }, + { + "epoch": 0.3, + "learning_rate": 1.975085994801054e-06, + "loss": 0.6284, + "step": 11596 + }, + { + "epoch": 0.3, + "learning_rate": 1.9750798563686996e-06, + "loss": 0.9277, + "step": 11597 + }, + { + "epoch": 0.3, + "learning_rate": 1.9750737171897707e-06, + "loss": 0.9697, + "step": 11598 + }, + { + "epoch": 0.3, + "learning_rate": 1.9750675772642734e-06, + "loss": 0.9785, + "step": 11599 + }, + { + "epoch": 0.3, + "learning_rate": 1.975061436592211e-06, + "loss": 0.9961, + "step": 11600 + }, + { + "epoch": 0.3, + "learning_rate": 1.9750552951735893e-06, + "loss": 0.5579, + "step": 11601 + }, + { + "epoch": 0.3, + "learning_rate": 1.9750491530084124e-06, + "loss": 0.9951, + "step": 11602 + }, + { + "epoch": 0.3, + "learning_rate": 1.9750430100966855e-06, + "loss": 1.0137, + "step": 11603 + }, + { + "epoch": 0.3, + "learning_rate": 1.9750368664384127e-06, + "loss": 0.9873, + "step": 11604 + }, + { + "epoch": 0.3, + "learning_rate": 1.9750307220335993e-06, + "loss": 1.043, + "step": 11605 + }, + { + "epoch": 0.3, + "learning_rate": 1.975024576882249e-06, + "loss": 0.8877, + "step": 11606 + }, + { + "epoch": 0.3, + "learning_rate": 1.975018430984368e-06, + "loss": 0.8008, + "step": 11607 + }, + { + "epoch": 0.3, + "learning_rate": 1.97501228433996e-06, + "loss": 0.9458, + "step": 11608 + }, + { + "epoch": 0.3, + "learning_rate": 1.9750061369490297e-06, + "loss": 0.6963, + "step": 11609 + }, + { + "epoch": 0.3, + "learning_rate": 1.974999988811582e-06, + "loss": 0.8398, + "step": 11610 + }, + { + "epoch": 0.3, + "learning_rate": 1.974993839927622e-06, + "loss": 0.5505, + "step": 11611 + }, + { + "epoch": 0.3, + "learning_rate": 1.974987690297154e-06, + "loss": 0.9043, + "step": 11612 + }, + { + "epoch": 0.3, + "learning_rate": 1.974981539920183e-06, + "loss": 0.6816, + "step": 11613 + }, + { + "epoch": 0.3, + "learning_rate": 1.974975388796713e-06, + "loss": 1.0049, + "step": 11614 + }, + { + "epoch": 0.3, + "learning_rate": 1.9749692369267493e-06, + "loss": 0.8418, + "step": 11615 + }, + { + "epoch": 0.3, + "learning_rate": 1.974963084310296e-06, + "loss": 0.833, + "step": 11616 + }, + { + "epoch": 0.3, + "learning_rate": 1.9749569309473593e-06, + "loss": 0.7441, + "step": 11617 + }, + { + "epoch": 0.3, + "learning_rate": 1.974950776837942e-06, + "loss": 0.7334, + "step": 11618 + }, + { + "epoch": 0.3, + "learning_rate": 1.9749446219820503e-06, + "loss": 0.7114, + "step": 11619 + }, + { + "epoch": 0.3, + "learning_rate": 1.9749384663796884e-06, + "loss": 1.041, + "step": 11620 + }, + { + "epoch": 0.3, + "learning_rate": 1.9749323100308604e-06, + "loss": 0.7979, + "step": 11621 + }, + { + "epoch": 0.3, + "learning_rate": 1.974926152935572e-06, + "loss": 1.0625, + "step": 11622 + }, + { + "epoch": 0.3, + "learning_rate": 1.9749199950938273e-06, + "loss": 0.8711, + "step": 11623 + }, + { + "epoch": 0.3, + "learning_rate": 1.9749138365056314e-06, + "loss": 0.8145, + "step": 11624 + }, + { + "epoch": 0.3, + "learning_rate": 1.974907677170988e-06, + "loss": 1.0781, + "step": 11625 + }, + { + "epoch": 0.3, + "learning_rate": 1.9749015170899035e-06, + "loss": 0.8613, + "step": 11626 + }, + { + "epoch": 0.3, + "learning_rate": 1.974895356262381e-06, + "loss": 0.7827, + "step": 11627 + }, + { + "epoch": 0.3, + "learning_rate": 1.9748891946884268e-06, + "loss": 0.9727, + "step": 11628 + }, + { + "epoch": 0.3, + "learning_rate": 1.9748830323680445e-06, + "loss": 0.9795, + "step": 11629 + }, + { + "epoch": 0.3, + "learning_rate": 1.974876869301239e-06, + "loss": 0.9297, + "step": 11630 + }, + { + "epoch": 0.3, + "learning_rate": 1.9748707054880154e-06, + "loss": 0.9395, + "step": 11631 + }, + { + "epoch": 0.3, + "learning_rate": 1.9748645409283774e-06, + "loss": 0.9941, + "step": 11632 + }, + { + "epoch": 0.3, + "learning_rate": 1.9748583756223306e-06, + "loss": 0.5496, + "step": 11633 + }, + { + "epoch": 0.3, + "learning_rate": 1.97485220956988e-06, + "loss": 1.0146, + "step": 11634 + }, + { + "epoch": 0.3, + "learning_rate": 1.9748460427710296e-06, + "loss": 0.8613, + "step": 11635 + }, + { + "epoch": 0.3, + "learning_rate": 1.9748398752257847e-06, + "loss": 0.9219, + "step": 11636 + }, + { + "epoch": 0.3, + "learning_rate": 1.9748337069341497e-06, + "loss": 0.8228, + "step": 11637 + }, + { + "epoch": 0.3, + "learning_rate": 1.974827537896129e-06, + "loss": 0.9707, + "step": 11638 + }, + { + "epoch": 0.3, + "learning_rate": 1.974821368111728e-06, + "loss": 0.5952, + "step": 11639 + }, + { + "epoch": 0.3, + "learning_rate": 1.974815197580951e-06, + "loss": 0.8828, + "step": 11640 + }, + { + "epoch": 0.3, + "learning_rate": 1.974809026303803e-06, + "loss": 1.0723, + "step": 11641 + }, + { + "epoch": 0.3, + "learning_rate": 1.974802854280288e-06, + "loss": 0.9326, + "step": 11642 + }, + { + "epoch": 0.3, + "learning_rate": 1.9747966815104117e-06, + "loss": 0.7422, + "step": 11643 + }, + { + "epoch": 0.3, + "learning_rate": 1.9747905079941783e-06, + "loss": 0.9346, + "step": 11644 + }, + { + "epoch": 0.3, + "learning_rate": 1.9747843337315925e-06, + "loss": 0.8945, + "step": 11645 + }, + { + "epoch": 0.3, + "learning_rate": 1.9747781587226596e-06, + "loss": 0.7686, + "step": 11646 + }, + { + "epoch": 0.3, + "learning_rate": 1.9747719829673836e-06, + "loss": 1.0225, + "step": 11647 + }, + { + "epoch": 0.3, + "learning_rate": 1.9747658064657694e-06, + "loss": 0.7275, + "step": 11648 + }, + { + "epoch": 0.3, + "learning_rate": 1.974759629217822e-06, + "loss": 0.6787, + "step": 11649 + }, + { + "epoch": 0.3, + "learning_rate": 1.974753451223546e-06, + "loss": 0.8945, + "step": 11650 + }, + { + "epoch": 0.3, + "learning_rate": 1.9747472724829463e-06, + "loss": 0.8281, + "step": 11651 + }, + { + "epoch": 0.3, + "learning_rate": 1.9747410929960268e-06, + "loss": 0.6997, + "step": 11652 + }, + { + "epoch": 0.3, + "learning_rate": 1.9747349127627933e-06, + "loss": 1.1699, + "step": 11653 + }, + { + "epoch": 0.3, + "learning_rate": 1.97472873178325e-06, + "loss": 0.8994, + "step": 11654 + }, + { + "epoch": 0.3, + "learning_rate": 1.974722550057402e-06, + "loss": 0.8242, + "step": 11655 + }, + { + "epoch": 0.3, + "learning_rate": 1.9747163675852533e-06, + "loss": 1.0117, + "step": 11656 + }, + { + "epoch": 0.3, + "learning_rate": 1.9747101843668093e-06, + "loss": 0.875, + "step": 11657 + }, + { + "epoch": 0.3, + "learning_rate": 1.9747040004020747e-06, + "loss": 0.998, + "step": 11658 + }, + { + "epoch": 0.3, + "learning_rate": 1.9746978156910537e-06, + "loss": 0.9727, + "step": 11659 + }, + { + "epoch": 0.3, + "learning_rate": 1.9746916302337517e-06, + "loss": 0.9736, + "step": 11660 + }, + { + "epoch": 0.3, + "learning_rate": 1.974685444030173e-06, + "loss": 0.7573, + "step": 11661 + }, + { + "epoch": 0.3, + "learning_rate": 1.974679257080323e-06, + "loss": 0.9053, + "step": 11662 + }, + { + "epoch": 0.3, + "learning_rate": 1.974673069384205e-06, + "loss": 0.8447, + "step": 11663 + }, + { + "epoch": 0.3, + "learning_rate": 1.9746668809418253e-06, + "loss": 0.7227, + "step": 11664 + }, + { + "epoch": 0.3, + "learning_rate": 1.9746606917531878e-06, + "loss": 0.8589, + "step": 11665 + }, + { + "epoch": 0.3, + "learning_rate": 1.9746545018182973e-06, + "loss": 0.7759, + "step": 11666 + }, + { + "epoch": 0.3, + "learning_rate": 1.974648311137159e-06, + "loss": 1.0879, + "step": 11667 + }, + { + "epoch": 0.3, + "learning_rate": 1.974642119709777e-06, + "loss": 1.001, + "step": 11668 + }, + { + "epoch": 0.3, + "learning_rate": 1.9746359275361563e-06, + "loss": 0.7068, + "step": 11669 + }, + { + "epoch": 0.3, + "learning_rate": 1.974629734616302e-06, + "loss": 0.8765, + "step": 11670 + }, + { + "epoch": 0.3, + "learning_rate": 1.974623540950218e-06, + "loss": 0.9141, + "step": 11671 + }, + { + "epoch": 0.3, + "learning_rate": 1.9746173465379097e-06, + "loss": 0.9365, + "step": 11672 + }, + { + "epoch": 0.3, + "learning_rate": 1.9746111513793823e-06, + "loss": 0.9521, + "step": 11673 + }, + { + "epoch": 0.3, + "learning_rate": 1.9746049554746396e-06, + "loss": 0.8086, + "step": 11674 + }, + { + "epoch": 0.3, + "learning_rate": 1.9745987588236862e-06, + "loss": 0.6948, + "step": 11675 + }, + { + "epoch": 0.3, + "learning_rate": 1.9745925614265282e-06, + "loss": 0.9619, + "step": 11676 + }, + { + "epoch": 0.3, + "learning_rate": 1.974586363283169e-06, + "loss": 0.9814, + "step": 11677 + }, + { + "epoch": 0.3, + "learning_rate": 1.974580164393614e-06, + "loss": 0.9102, + "step": 11678 + }, + { + "epoch": 0.3, + "learning_rate": 1.9745739647578676e-06, + "loss": 0.6841, + "step": 11679 + }, + { + "epoch": 0.3, + "learning_rate": 1.974567764375935e-06, + "loss": 1.0742, + "step": 11680 + }, + { + "epoch": 0.3, + "learning_rate": 1.9745615632478204e-06, + "loss": 1.1406, + "step": 11681 + }, + { + "epoch": 0.3, + "learning_rate": 1.9745553613735287e-06, + "loss": 0.8057, + "step": 11682 + }, + { + "epoch": 0.3, + "learning_rate": 1.9745491587530654e-06, + "loss": 0.8652, + "step": 11683 + }, + { + "epoch": 0.3, + "learning_rate": 1.9745429553864338e-06, + "loss": 0.8486, + "step": 11684 + }, + { + "epoch": 0.3, + "learning_rate": 1.9745367512736403e-06, + "loss": 0.8799, + "step": 11685 + }, + { + "epoch": 0.3, + "learning_rate": 1.9745305464146882e-06, + "loss": 0.9854, + "step": 11686 + }, + { + "epoch": 0.3, + "learning_rate": 1.974524340809583e-06, + "loss": 0.9775, + "step": 11687 + }, + { + "epoch": 0.3, + "learning_rate": 1.9745181344583294e-06, + "loss": 1.0518, + "step": 11688 + }, + { + "epoch": 0.3, + "learning_rate": 1.9745119273609322e-06, + "loss": 0.6113, + "step": 11689 + }, + { + "epoch": 0.3, + "learning_rate": 1.974505719517396e-06, + "loss": 0.7791, + "step": 11690 + }, + { + "epoch": 0.3, + "learning_rate": 1.974499510927725e-06, + "loss": 1.1094, + "step": 11691 + }, + { + "epoch": 0.3, + "learning_rate": 1.9744933015919253e-06, + "loss": 0.79, + "step": 11692 + }, + { + "epoch": 0.3, + "learning_rate": 1.974487091510001e-06, + "loss": 0.9443, + "step": 11693 + }, + { + "epoch": 0.3, + "learning_rate": 1.974480880681956e-06, + "loss": 1.0752, + "step": 11694 + }, + { + "epoch": 0.3, + "learning_rate": 1.974474669107796e-06, + "loss": 0.834, + "step": 11695 + }, + { + "epoch": 0.3, + "learning_rate": 1.9744684567875257e-06, + "loss": 0.7578, + "step": 11696 + }, + { + "epoch": 0.3, + "learning_rate": 1.9744622437211497e-06, + "loss": 0.9248, + "step": 11697 + }, + { + "epoch": 0.3, + "learning_rate": 1.9744560299086728e-06, + "loss": 1.0938, + "step": 11698 + }, + { + "epoch": 0.3, + "learning_rate": 1.9744498153500995e-06, + "loss": 0.9316, + "step": 11699 + }, + { + "epoch": 0.3, + "learning_rate": 1.9744436000454356e-06, + "loss": 0.6265, + "step": 11700 + }, + { + "epoch": 0.3, + "learning_rate": 1.9744373839946838e-06, + "loss": 0.8252, + "step": 11701 + }, + { + "epoch": 0.3, + "learning_rate": 1.974431167197851e-06, + "loss": 0.9082, + "step": 11702 + }, + { + "epoch": 0.3, + "learning_rate": 1.9744249496549406e-06, + "loss": 0.8662, + "step": 11703 + }, + { + "epoch": 0.3, + "learning_rate": 1.974418731365958e-06, + "loss": 1.0566, + "step": 11704 + }, + { + "epoch": 0.3, + "learning_rate": 1.974412512330908e-06, + "loss": 0.9873, + "step": 11705 + }, + { + "epoch": 0.3, + "learning_rate": 1.9744062925497947e-06, + "loss": 0.9814, + "step": 11706 + }, + { + "epoch": 0.3, + "learning_rate": 1.9744000720226238e-06, + "loss": 0.8838, + "step": 11707 + }, + { + "epoch": 0.3, + "learning_rate": 1.9743938507493993e-06, + "loss": 0.7029, + "step": 11708 + }, + { + "epoch": 0.3, + "learning_rate": 1.974387628730126e-06, + "loss": 1.0303, + "step": 11709 + }, + { + "epoch": 0.3, + "learning_rate": 1.9743814059648094e-06, + "loss": 0.4863, + "step": 11710 + }, + { + "epoch": 0.3, + "learning_rate": 1.9743751824534532e-06, + "loss": 1.002, + "step": 11711 + }, + { + "epoch": 0.3, + "learning_rate": 1.974368958196063e-06, + "loss": 0.9688, + "step": 11712 + }, + { + "epoch": 0.3, + "learning_rate": 1.9743627331926436e-06, + "loss": 1.0176, + "step": 11713 + }, + { + "epoch": 0.3, + "learning_rate": 1.974356507443199e-06, + "loss": 0.793, + "step": 11714 + }, + { + "epoch": 0.3, + "learning_rate": 1.9743502809477347e-06, + "loss": 0.9004, + "step": 11715 + }, + { + "epoch": 0.3, + "learning_rate": 1.974344053706255e-06, + "loss": 1.0215, + "step": 11716 + }, + { + "epoch": 0.3, + "learning_rate": 1.9743378257187652e-06, + "loss": 0.8052, + "step": 11717 + }, + { + "epoch": 0.3, + "learning_rate": 1.9743315969852693e-06, + "loss": 0.9785, + "step": 11718 + }, + { + "epoch": 0.3, + "learning_rate": 1.974325367505773e-06, + "loss": 0.7012, + "step": 11719 + }, + { + "epoch": 0.3, + "learning_rate": 1.97431913728028e-06, + "loss": 1.0566, + "step": 11720 + }, + { + "epoch": 0.3, + "learning_rate": 1.974312906308796e-06, + "loss": 0.7383, + "step": 11721 + }, + { + "epoch": 0.3, + "learning_rate": 1.974306674591325e-06, + "loss": 0.8438, + "step": 11722 + }, + { + "epoch": 0.3, + "learning_rate": 1.9743004421278723e-06, + "loss": 0.8574, + "step": 11723 + }, + { + "epoch": 0.3, + "learning_rate": 1.974294208918443e-06, + "loss": 0.833, + "step": 11724 + }, + { + "epoch": 0.3, + "learning_rate": 1.9742879749630414e-06, + "loss": 0.9014, + "step": 11725 + }, + { + "epoch": 0.3, + "learning_rate": 1.974281740261672e-06, + "loss": 0.8984, + "step": 11726 + }, + { + "epoch": 0.3, + "learning_rate": 1.9742755048143396e-06, + "loss": 0.8154, + "step": 11727 + }, + { + "epoch": 0.3, + "learning_rate": 1.9742692686210494e-06, + "loss": 1.0518, + "step": 11728 + }, + { + "epoch": 0.3, + "learning_rate": 1.974263031681806e-06, + "loss": 1.2412, + "step": 11729 + }, + { + "epoch": 0.3, + "learning_rate": 1.9742567939966145e-06, + "loss": 0.9834, + "step": 11730 + }, + { + "epoch": 0.3, + "learning_rate": 1.9742505555654794e-06, + "loss": 1.0469, + "step": 11731 + }, + { + "epoch": 0.3, + "learning_rate": 1.974244316388405e-06, + "loss": 0.7417, + "step": 11732 + }, + { + "epoch": 0.3, + "learning_rate": 1.9742380764653973e-06, + "loss": 0.9102, + "step": 11733 + }, + { + "epoch": 0.3, + "learning_rate": 1.9742318357964596e-06, + "loss": 0.8789, + "step": 11734 + }, + { + "epoch": 0.3, + "learning_rate": 1.9742255943815976e-06, + "loss": 0.9863, + "step": 11735 + }, + { + "epoch": 0.3, + "learning_rate": 1.9742193522208155e-06, + "loss": 0.8013, + "step": 11736 + }, + { + "epoch": 0.3, + "learning_rate": 1.9742131093141193e-06, + "loss": 0.959, + "step": 11737 + }, + { + "epoch": 0.3, + "learning_rate": 1.9742068656615123e-06, + "loss": 1.2422, + "step": 11738 + }, + { + "epoch": 0.3, + "learning_rate": 1.9742006212629996e-06, + "loss": 0.9902, + "step": 11739 + }, + { + "epoch": 0.3, + "learning_rate": 1.974194376118587e-06, + "loss": 0.9678, + "step": 11740 + }, + { + "epoch": 0.3, + "learning_rate": 1.974188130228278e-06, + "loss": 0.7495, + "step": 11741 + }, + { + "epoch": 0.3, + "learning_rate": 1.9741818835920783e-06, + "loss": 0.6851, + "step": 11742 + }, + { + "epoch": 0.3, + "learning_rate": 1.9741756362099924e-06, + "loss": 0.9697, + "step": 11743 + }, + { + "epoch": 0.3, + "learning_rate": 1.9741693880820246e-06, + "loss": 0.7119, + "step": 11744 + }, + { + "epoch": 0.3, + "learning_rate": 1.9741631392081803e-06, + "loss": 1.0234, + "step": 11745 + }, + { + "epoch": 0.3, + "learning_rate": 1.974156889588464e-06, + "loss": 0.7842, + "step": 11746 + }, + { + "epoch": 0.3, + "learning_rate": 1.974150639222881e-06, + "loss": 0.8203, + "step": 11747 + }, + { + "epoch": 0.3, + "learning_rate": 1.974144388111435e-06, + "loss": 0.8193, + "step": 11748 + }, + { + "epoch": 0.3, + "learning_rate": 1.9741381362541316e-06, + "loss": 0.7793, + "step": 11749 + }, + { + "epoch": 0.3, + "learning_rate": 1.9741318836509757e-06, + "loss": 0.9365, + "step": 11750 + }, + { + "epoch": 0.3, + "learning_rate": 1.9741256303019718e-06, + "loss": 0.9893, + "step": 11751 + }, + { + "epoch": 0.3, + "learning_rate": 1.9741193762071244e-06, + "loss": 0.7461, + "step": 11752 + }, + { + "epoch": 0.3, + "learning_rate": 1.9741131213664387e-06, + "loss": 0.7339, + "step": 11753 + }, + { + "epoch": 0.3, + "learning_rate": 1.9741068657799197e-06, + "loss": 1.1426, + "step": 11754 + }, + { + "epoch": 0.3, + "learning_rate": 1.9741006094475712e-06, + "loss": 1.042, + "step": 11755 + }, + { + "epoch": 0.3, + "learning_rate": 1.9740943523693992e-06, + "loss": 0.7451, + "step": 11756 + }, + { + "epoch": 0.3, + "learning_rate": 1.974088094545408e-06, + "loss": 0.9111, + "step": 11757 + }, + { + "epoch": 0.3, + "learning_rate": 1.974081835975602e-06, + "loss": 0.9678, + "step": 11758 + }, + { + "epoch": 0.3, + "learning_rate": 1.9740755766599863e-06, + "loss": 0.8879, + "step": 11759 + }, + { + "epoch": 0.3, + "learning_rate": 1.974069316598566e-06, + "loss": 0.9863, + "step": 11760 + }, + { + "epoch": 0.3, + "learning_rate": 1.9740630557913454e-06, + "loss": 0.79, + "step": 11761 + }, + { + "epoch": 0.3, + "learning_rate": 1.9740567942383297e-06, + "loss": 1.1592, + "step": 11762 + }, + { + "epoch": 0.3, + "learning_rate": 1.974050531939523e-06, + "loss": 0.8125, + "step": 11763 + }, + { + "epoch": 0.3, + "learning_rate": 1.974044268894931e-06, + "loss": 1.0977, + "step": 11764 + }, + { + "epoch": 0.3, + "learning_rate": 1.9740380051045584e-06, + "loss": 0.9805, + "step": 11765 + }, + { + "epoch": 0.3, + "learning_rate": 1.974031740568409e-06, + "loss": 0.7979, + "step": 11766 + }, + { + "epoch": 0.3, + "learning_rate": 1.974025475286489e-06, + "loss": 0.9736, + "step": 11767 + }, + { + "epoch": 0.3, + "learning_rate": 1.974019209258802e-06, + "loss": 1.084, + "step": 11768 + }, + { + "epoch": 0.3, + "learning_rate": 1.9740129424853535e-06, + "loss": 0.9365, + "step": 11769 + }, + { + "epoch": 0.3, + "learning_rate": 1.9740066749661477e-06, + "loss": 0.6792, + "step": 11770 + }, + { + "epoch": 0.3, + "learning_rate": 1.97400040670119e-06, + "loss": 0.9141, + "step": 11771 + }, + { + "epoch": 0.3, + "learning_rate": 1.9739941376904855e-06, + "loss": 0.8086, + "step": 11772 + }, + { + "epoch": 0.3, + "learning_rate": 1.9739878679340374e-06, + "loss": 1.1094, + "step": 11773 + }, + { + "epoch": 0.3, + "learning_rate": 1.9739815974318527e-06, + "loss": 0.7383, + "step": 11774 + }, + { + "epoch": 0.3, + "learning_rate": 1.973975326183934e-06, + "loss": 0.793, + "step": 11775 + }, + { + "epoch": 0.3, + "learning_rate": 1.973969054190288e-06, + "loss": 0.957, + "step": 11776 + }, + { + "epoch": 0.3, + "learning_rate": 1.9739627814509185e-06, + "loss": 0.9307, + "step": 11777 + }, + { + "epoch": 0.3, + "learning_rate": 1.9739565079658305e-06, + "loss": 0.7393, + "step": 11778 + }, + { + "epoch": 0.3, + "learning_rate": 1.9739502337350284e-06, + "loss": 0.7871, + "step": 11779 + }, + { + "epoch": 0.3, + "learning_rate": 1.973943958758518e-06, + "loss": 0.8154, + "step": 11780 + }, + { + "epoch": 0.3, + "learning_rate": 1.973937683036303e-06, + "loss": 0.9443, + "step": 11781 + }, + { + "epoch": 0.3, + "learning_rate": 1.973931406568389e-06, + "loss": 0.8643, + "step": 11782 + }, + { + "epoch": 0.3, + "learning_rate": 1.97392512935478e-06, + "loss": 0.6235, + "step": 11783 + }, + { + "epoch": 0.3, + "learning_rate": 1.973918851395482e-06, + "loss": 1.0674, + "step": 11784 + }, + { + "epoch": 0.3, + "learning_rate": 1.9739125726904984e-06, + "loss": 1.0137, + "step": 11785 + }, + { + "epoch": 0.3, + "learning_rate": 1.9739062932398354e-06, + "loss": 1.0342, + "step": 11786 + }, + { + "epoch": 0.3, + "learning_rate": 1.973900013043497e-06, + "loss": 0.6802, + "step": 11787 + }, + { + "epoch": 0.3, + "learning_rate": 1.9738937321014877e-06, + "loss": 1.0195, + "step": 11788 + }, + { + "epoch": 0.3, + "learning_rate": 1.973887450413813e-06, + "loss": 0.8691, + "step": 11789 + }, + { + "epoch": 0.3, + "learning_rate": 1.9738811679804773e-06, + "loss": 0.8496, + "step": 11790 + }, + { + "epoch": 0.3, + "learning_rate": 1.973874884801486e-06, + "loss": 0.8584, + "step": 11791 + }, + { + "epoch": 0.3, + "learning_rate": 1.9738686008768433e-06, + "loss": 1.0166, + "step": 11792 + }, + { + "epoch": 0.3, + "learning_rate": 1.973862316206554e-06, + "loss": 0.9883, + "step": 11793 + }, + { + "epoch": 0.3, + "learning_rate": 1.9738560307906233e-06, + "loss": 0.9478, + "step": 11794 + }, + { + "epoch": 0.3, + "learning_rate": 1.9738497446290555e-06, + "loss": 0.9199, + "step": 11795 + }, + { + "epoch": 0.3, + "learning_rate": 1.9738434577218563e-06, + "loss": 1.1553, + "step": 11796 + }, + { + "epoch": 0.3, + "learning_rate": 1.9738371700690294e-06, + "loss": 0.9941, + "step": 11797 + }, + { + "epoch": 0.3, + "learning_rate": 1.9738308816705805e-06, + "loss": 0.7529, + "step": 11798 + }, + { + "epoch": 0.3, + "learning_rate": 1.973824592526514e-06, + "loss": 1.0488, + "step": 11799 + }, + { + "epoch": 0.3, + "learning_rate": 1.9738183026368347e-06, + "loss": 0.8936, + "step": 11800 + }, + { + "epoch": 0.3, + "learning_rate": 1.973812012001548e-06, + "loss": 0.9893, + "step": 11801 + }, + { + "epoch": 0.3, + "learning_rate": 1.9738057206206575e-06, + "loss": 0.9932, + "step": 11802 + }, + { + "epoch": 0.3, + "learning_rate": 1.973799428494169e-06, + "loss": 1.0107, + "step": 11803 + }, + { + "epoch": 0.3, + "learning_rate": 1.973793135622087e-06, + "loss": 0.8652, + "step": 11804 + }, + { + "epoch": 0.3, + "learning_rate": 1.9737868420044164e-06, + "loss": 0.7969, + "step": 11805 + }, + { + "epoch": 0.3, + "learning_rate": 1.973780547641162e-06, + "loss": 0.7393, + "step": 11806 + }, + { + "epoch": 0.3, + "learning_rate": 1.9737742525323287e-06, + "loss": 0.8584, + "step": 11807 + }, + { + "epoch": 0.3, + "learning_rate": 1.973767956677921e-06, + "loss": 0.8682, + "step": 11808 + }, + { + "epoch": 0.3, + "learning_rate": 1.9737616600779443e-06, + "loss": 0.9492, + "step": 11809 + }, + { + "epoch": 0.3, + "learning_rate": 1.973755362732403e-06, + "loss": 1.0342, + "step": 11810 + }, + { + "epoch": 0.3, + "learning_rate": 1.9737490646413017e-06, + "loss": 0.7695, + "step": 11811 + }, + { + "epoch": 0.3, + "learning_rate": 1.9737427658046456e-06, + "loss": 1.1406, + "step": 11812 + }, + { + "epoch": 0.3, + "learning_rate": 1.9737364662224395e-06, + "loss": 0.8804, + "step": 11813 + }, + { + "epoch": 0.3, + "learning_rate": 1.973730165894688e-06, + "loss": 0.8252, + "step": 11814 + }, + { + "epoch": 0.3, + "learning_rate": 1.9737238648213967e-06, + "loss": 0.9697, + "step": 11815 + }, + { + "epoch": 0.3, + "learning_rate": 1.973717563002569e-06, + "loss": 0.916, + "step": 11816 + }, + { + "epoch": 0.3, + "learning_rate": 1.9737112604382113e-06, + "loss": 0.6758, + "step": 11817 + }, + { + "epoch": 0.3, + "learning_rate": 1.973704957128327e-06, + "loss": 0.585, + "step": 11818 + }, + { + "epoch": 0.3, + "learning_rate": 1.973698653072922e-06, + "loss": 0.8467, + "step": 11819 + }, + { + "epoch": 0.3, + "learning_rate": 1.9736923482720005e-06, + "loss": 0.8271, + "step": 11820 + }, + { + "epoch": 0.3, + "learning_rate": 1.973686042725568e-06, + "loss": 0.9297, + "step": 11821 + }, + { + "epoch": 0.3, + "learning_rate": 1.9736797364336284e-06, + "loss": 0.8672, + "step": 11822 + }, + { + "epoch": 0.3, + "learning_rate": 1.973673429396187e-06, + "loss": 1.0293, + "step": 11823 + }, + { + "epoch": 0.3, + "learning_rate": 1.9736671216132484e-06, + "loss": 1.1523, + "step": 11824 + }, + { + "epoch": 0.3, + "learning_rate": 1.9736608130848184e-06, + "loss": 0.7495, + "step": 11825 + }, + { + "epoch": 0.3, + "learning_rate": 1.9736545038109003e-06, + "loss": 0.9551, + "step": 11826 + }, + { + "epoch": 0.3, + "learning_rate": 1.9736481937915e-06, + "loss": 1.0078, + "step": 11827 + }, + { + "epoch": 0.3, + "learning_rate": 1.9736418830266223e-06, + "loss": 0.874, + "step": 11828 + }, + { + "epoch": 0.3, + "learning_rate": 1.9736355715162717e-06, + "loss": 1.0732, + "step": 11829 + }, + { + "epoch": 0.3, + "learning_rate": 1.973629259260453e-06, + "loss": 1.0645, + "step": 11830 + }, + { + "epoch": 0.3, + "learning_rate": 1.973622946259171e-06, + "loss": 1.0723, + "step": 11831 + }, + { + "epoch": 0.3, + "learning_rate": 1.973616632512431e-06, + "loss": 0.9561, + "step": 11832 + }, + { + "epoch": 0.3, + "learning_rate": 1.9736103180202373e-06, + "loss": 0.9268, + "step": 11833 + }, + { + "epoch": 0.3, + "learning_rate": 1.973604002782595e-06, + "loss": 0.9482, + "step": 11834 + }, + { + "epoch": 0.3, + "learning_rate": 1.973597686799509e-06, + "loss": 0.9639, + "step": 11835 + }, + { + "epoch": 0.3, + "learning_rate": 1.9735913700709838e-06, + "loss": 1.0068, + "step": 11836 + }, + { + "epoch": 0.3, + "learning_rate": 1.9735850525970244e-06, + "loss": 0.7676, + "step": 11837 + }, + { + "epoch": 0.3, + "learning_rate": 1.973578734377636e-06, + "loss": 0.8389, + "step": 11838 + }, + { + "epoch": 0.3, + "learning_rate": 1.9735724154128227e-06, + "loss": 0.9277, + "step": 11839 + }, + { + "epoch": 0.3, + "learning_rate": 1.97356609570259e-06, + "loss": 0.6328, + "step": 11840 + }, + { + "epoch": 0.3, + "learning_rate": 1.9735597752469426e-06, + "loss": 0.9678, + "step": 11841 + }, + { + "epoch": 0.3, + "learning_rate": 1.973553454045885e-06, + "loss": 0.9102, + "step": 11842 + }, + { + "epoch": 0.3, + "learning_rate": 1.9735471320994227e-06, + "loss": 1.04, + "step": 11843 + }, + { + "epoch": 0.3, + "learning_rate": 1.97354080940756e-06, + "loss": 1.0166, + "step": 11844 + }, + { + "epoch": 0.3, + "learning_rate": 1.9735344859703015e-06, + "loss": 0.9902, + "step": 11845 + }, + { + "epoch": 0.3, + "learning_rate": 1.9735281617876528e-06, + "loss": 0.79, + "step": 11846 + }, + { + "epoch": 0.3, + "learning_rate": 1.9735218368596184e-06, + "loss": 0.8052, + "step": 11847 + }, + { + "epoch": 0.3, + "learning_rate": 1.973515511186203e-06, + "loss": 0.832, + "step": 11848 + }, + { + "epoch": 0.3, + "learning_rate": 1.973509184767411e-06, + "loss": 0.9717, + "step": 11849 + }, + { + "epoch": 0.3, + "learning_rate": 1.9735028576032487e-06, + "loss": 0.8447, + "step": 11850 + }, + { + "epoch": 0.3, + "learning_rate": 1.9734965296937194e-06, + "loss": 0.6902, + "step": 11851 + }, + { + "epoch": 0.3, + "learning_rate": 1.9734902010388286e-06, + "loss": 0.9297, + "step": 11852 + }, + { + "epoch": 0.3, + "learning_rate": 1.9734838716385814e-06, + "loss": 0.7563, + "step": 11853 + }, + { + "epoch": 0.3, + "learning_rate": 1.9734775414929825e-06, + "loss": 0.9795, + "step": 11854 + }, + { + "epoch": 0.3, + "learning_rate": 1.973471210602036e-06, + "loss": 0.8779, + "step": 11855 + }, + { + "epoch": 0.3, + "learning_rate": 1.9734648789657477e-06, + "loss": 1.1826, + "step": 11856 + }, + { + "epoch": 0.3, + "learning_rate": 1.973458546584122e-06, + "loss": 0.8613, + "step": 11857 + }, + { + "epoch": 0.3, + "learning_rate": 1.973452213457164e-06, + "loss": 1.1455, + "step": 11858 + }, + { + "epoch": 0.3, + "learning_rate": 1.9734458795848785e-06, + "loss": 0.9775, + "step": 11859 + }, + { + "epoch": 0.3, + "learning_rate": 1.97343954496727e-06, + "loss": 1.2812, + "step": 11860 + }, + { + "epoch": 0.3, + "learning_rate": 1.9734332096043437e-06, + "loss": 1.1191, + "step": 11861 + }, + { + "epoch": 0.3, + "learning_rate": 1.9734268734961042e-06, + "loss": 0.9629, + "step": 11862 + }, + { + "epoch": 0.3, + "learning_rate": 1.9734205366425566e-06, + "loss": 1.0283, + "step": 11863 + }, + { + "epoch": 0.3, + "learning_rate": 1.9734141990437056e-06, + "loss": 1.0674, + "step": 11864 + }, + { + "epoch": 0.3, + "learning_rate": 1.973407860699556e-06, + "loss": 0.8677, + "step": 11865 + }, + { + "epoch": 0.3, + "learning_rate": 1.973401521610113e-06, + "loss": 0.7812, + "step": 11866 + }, + { + "epoch": 0.3, + "learning_rate": 1.9733951817753814e-06, + "loss": 0.7871, + "step": 11867 + }, + { + "epoch": 0.3, + "learning_rate": 1.9733888411953657e-06, + "loss": 1.0781, + "step": 11868 + }, + { + "epoch": 0.3, + "learning_rate": 1.9733824998700707e-06, + "loss": 0.9043, + "step": 11869 + }, + { + "epoch": 0.3, + "learning_rate": 1.9733761577995015e-06, + "loss": 0.9932, + "step": 11870 + }, + { + "epoch": 0.3, + "learning_rate": 1.973369814983663e-06, + "loss": 0.6987, + "step": 11871 + }, + { + "epoch": 0.3, + "learning_rate": 1.9733634714225604e-06, + "loss": 0.9648, + "step": 11872 + }, + { + "epoch": 0.3, + "learning_rate": 1.9733571271161977e-06, + "loss": 0.9502, + "step": 11873 + }, + { + "epoch": 0.3, + "learning_rate": 1.9733507820645803e-06, + "loss": 0.8218, + "step": 11874 + }, + { + "epoch": 0.3, + "learning_rate": 1.973344436267713e-06, + "loss": 0.9658, + "step": 11875 + }, + { + "epoch": 0.3, + "learning_rate": 1.9733380897256004e-06, + "loss": 0.7773, + "step": 11876 + }, + { + "epoch": 0.3, + "learning_rate": 1.973331742438248e-06, + "loss": 0.7725, + "step": 11877 + }, + { + "epoch": 0.3, + "learning_rate": 1.97332539440566e-06, + "loss": 0.8262, + "step": 11878 + }, + { + "epoch": 0.3, + "learning_rate": 1.9733190456278413e-06, + "loss": 0.874, + "step": 11879 + }, + { + "epoch": 0.3, + "learning_rate": 1.973312696104797e-06, + "loss": 0.7102, + "step": 11880 + }, + { + "epoch": 0.3, + "learning_rate": 1.973306345836532e-06, + "loss": 1.0557, + "step": 11881 + }, + { + "epoch": 0.3, + "learning_rate": 1.9732999948230517e-06, + "loss": 0.9277, + "step": 11882 + }, + { + "epoch": 0.3, + "learning_rate": 1.97329364306436e-06, + "loss": 0.876, + "step": 11883 + }, + { + "epoch": 0.3, + "learning_rate": 1.9732872905604615e-06, + "loss": 0.9414, + "step": 11884 + }, + { + "epoch": 0.3, + "learning_rate": 1.973280937311362e-06, + "loss": 1.0723, + "step": 11885 + }, + { + "epoch": 0.3, + "learning_rate": 1.9732745833170665e-06, + "loss": 0.9531, + "step": 11886 + }, + { + "epoch": 0.3, + "learning_rate": 1.973268228577579e-06, + "loss": 0.8135, + "step": 11887 + }, + { + "epoch": 0.3, + "learning_rate": 1.9732618730929046e-06, + "loss": 1.0977, + "step": 11888 + }, + { + "epoch": 0.3, + "learning_rate": 1.973255516863049e-06, + "loss": 0.7798, + "step": 11889 + }, + { + "epoch": 0.3, + "learning_rate": 1.9732491598880155e-06, + "loss": 1.0, + "step": 11890 + }, + { + "epoch": 0.3, + "learning_rate": 1.9732428021678104e-06, + "loss": 0.8525, + "step": 11891 + }, + { + "epoch": 0.3, + "learning_rate": 1.973236443702438e-06, + "loss": 0.9092, + "step": 11892 + }, + { + "epoch": 0.3, + "learning_rate": 1.9732300844919032e-06, + "loss": 1.0381, + "step": 11893 + }, + { + "epoch": 0.3, + "learning_rate": 1.973223724536211e-06, + "loss": 1.043, + "step": 11894 + }, + { + "epoch": 0.3, + "learning_rate": 1.973217363835366e-06, + "loss": 0.8506, + "step": 11895 + }, + { + "epoch": 0.3, + "learning_rate": 1.973211002389373e-06, + "loss": 0.8809, + "step": 11896 + }, + { + "epoch": 0.3, + "learning_rate": 1.9732046401982374e-06, + "loss": 0.9072, + "step": 11897 + }, + { + "epoch": 0.3, + "learning_rate": 1.9731982772619636e-06, + "loss": 0.9736, + "step": 11898 + }, + { + "epoch": 0.3, + "learning_rate": 1.973191913580556e-06, + "loss": 1.083, + "step": 11899 + }, + { + "epoch": 0.31, + "learning_rate": 1.973185549154021e-06, + "loss": 0.9619, + "step": 11900 + }, + { + "epoch": 0.31, + "learning_rate": 1.9731791839823625e-06, + "loss": 0.9082, + "step": 11901 + }, + { + "epoch": 0.31, + "learning_rate": 1.9731728180655852e-06, + "loss": 0.9551, + "step": 11902 + }, + { + "epoch": 0.31, + "learning_rate": 1.9731664514036946e-06, + "loss": 0.9697, + "step": 11903 + }, + { + "epoch": 0.31, + "learning_rate": 1.973160083996695e-06, + "loss": 1.1357, + "step": 11904 + }, + { + "epoch": 0.31, + "learning_rate": 1.9731537158445913e-06, + "loss": 0.9199, + "step": 11905 + }, + { + "epoch": 0.31, + "learning_rate": 1.9731473469473884e-06, + "loss": 0.7739, + "step": 11906 + }, + { + "epoch": 0.31, + "learning_rate": 1.9731409773050916e-06, + "loss": 1.0117, + "step": 11907 + }, + { + "epoch": 0.31, + "learning_rate": 1.9731346069177053e-06, + "loss": 1.0596, + "step": 11908 + }, + { + "epoch": 0.31, + "learning_rate": 1.973128235785235e-06, + "loss": 0.8306, + "step": 11909 + }, + { + "epoch": 0.31, + "learning_rate": 1.9731218639076848e-06, + "loss": 0.8906, + "step": 11910 + }, + { + "epoch": 0.31, + "learning_rate": 1.9731154912850602e-06, + "loss": 0.918, + "step": 11911 + }, + { + "epoch": 0.31, + "learning_rate": 1.9731091179173656e-06, + "loss": 0.6396, + "step": 11912 + }, + { + "epoch": 0.31, + "learning_rate": 1.973102743804606e-06, + "loss": 1.0684, + "step": 11913 + }, + { + "epoch": 0.31, + "learning_rate": 1.9730963689467865e-06, + "loss": 0.9961, + "step": 11914 + }, + { + "epoch": 0.31, + "learning_rate": 1.9730899933439117e-06, + "loss": 0.8906, + "step": 11915 + }, + { + "epoch": 0.31, + "learning_rate": 1.973083616995987e-06, + "loss": 0.7925, + "step": 11916 + }, + { + "epoch": 0.31, + "learning_rate": 1.9730772399030167e-06, + "loss": 0.6987, + "step": 11917 + }, + { + "epoch": 0.31, + "learning_rate": 1.9730708620650057e-06, + "loss": 1.0469, + "step": 11918 + }, + { + "epoch": 0.31, + "learning_rate": 1.9730644834819594e-06, + "loss": 1.0244, + "step": 11919 + }, + { + "epoch": 0.31, + "learning_rate": 1.9730581041538825e-06, + "loss": 0.7046, + "step": 11920 + }, + { + "epoch": 0.31, + "learning_rate": 1.973051724080779e-06, + "loss": 0.8057, + "step": 11921 + }, + { + "epoch": 0.31, + "learning_rate": 1.9730453432626554e-06, + "loss": 0.8359, + "step": 11922 + }, + { + "epoch": 0.31, + "learning_rate": 1.973038961699515e-06, + "loss": 0.8369, + "step": 11923 + }, + { + "epoch": 0.31, + "learning_rate": 1.973032579391364e-06, + "loss": 0.9912, + "step": 11924 + }, + { + "epoch": 0.31, + "learning_rate": 1.9730261963382064e-06, + "loss": 0.9126, + "step": 11925 + }, + { + "epoch": 0.31, + "learning_rate": 1.9730198125400473e-06, + "loss": 0.8271, + "step": 11926 + }, + { + "epoch": 0.31, + "learning_rate": 1.973013427996892e-06, + "loss": 0.9531, + "step": 11927 + }, + { + "epoch": 0.31, + "learning_rate": 1.973007042708745e-06, + "loss": 0.4449, + "step": 11928 + }, + { + "epoch": 0.31, + "learning_rate": 1.973000656675611e-06, + "loss": 0.8262, + "step": 11929 + }, + { + "epoch": 0.31, + "learning_rate": 1.9729942698974952e-06, + "loss": 0.8594, + "step": 11930 + }, + { + "epoch": 0.31, + "learning_rate": 1.9729878823744024e-06, + "loss": 0.7881, + "step": 11931 + }, + { + "epoch": 0.31, + "learning_rate": 1.9729814941063378e-06, + "loss": 0.8604, + "step": 11932 + }, + { + "epoch": 0.31, + "learning_rate": 1.972975105093306e-06, + "loss": 0.8215, + "step": 11933 + }, + { + "epoch": 0.31, + "learning_rate": 1.9729687153353117e-06, + "loss": 0.9883, + "step": 11934 + }, + { + "epoch": 0.31, + "learning_rate": 1.97296232483236e-06, + "loss": 0.7305, + "step": 11935 + }, + { + "epoch": 0.31, + "learning_rate": 1.972955933584456e-06, + "loss": 1.0273, + "step": 11936 + }, + { + "epoch": 0.31, + "learning_rate": 1.9729495415916036e-06, + "loss": 1.043, + "step": 11937 + }, + { + "epoch": 0.31, + "learning_rate": 1.9729431488538092e-06, + "loss": 0.8438, + "step": 11938 + }, + { + "epoch": 0.31, + "learning_rate": 1.972936755371077e-06, + "loss": 0.9307, + "step": 11939 + }, + { + "epoch": 0.31, + "learning_rate": 1.9729303611434117e-06, + "loss": 0.8809, + "step": 11940 + }, + { + "epoch": 0.31, + "learning_rate": 1.9729239661708183e-06, + "loss": 1.0586, + "step": 11941 + }, + { + "epoch": 0.31, + "learning_rate": 1.9729175704533017e-06, + "loss": 0.9746, + "step": 11942 + }, + { + "epoch": 0.31, + "learning_rate": 1.972911173990867e-06, + "loss": 0.853, + "step": 11943 + }, + { + "epoch": 0.31, + "learning_rate": 1.9729047767835188e-06, + "loss": 0.9902, + "step": 11944 + }, + { + "epoch": 0.31, + "learning_rate": 1.9728983788312625e-06, + "loss": 1.248, + "step": 11945 + }, + { + "epoch": 0.31, + "learning_rate": 1.972891980134102e-06, + "loss": 0.592, + "step": 11946 + }, + { + "epoch": 0.31, + "learning_rate": 1.9728855806920433e-06, + "loss": 0.8252, + "step": 11947 + }, + { + "epoch": 0.31, + "learning_rate": 1.972879180505091e-06, + "loss": 0.8193, + "step": 11948 + }, + { + "epoch": 0.31, + "learning_rate": 1.9728727795732497e-06, + "loss": 0.8867, + "step": 11949 + }, + { + "epoch": 0.31, + "learning_rate": 1.9728663778965243e-06, + "loss": 0.7637, + "step": 11950 + }, + { + "epoch": 0.31, + "learning_rate": 1.97285997547492e-06, + "loss": 0.9395, + "step": 11951 + }, + { + "epoch": 0.31, + "learning_rate": 1.9728535723084415e-06, + "loss": 1.0029, + "step": 11952 + }, + { + "epoch": 0.31, + "learning_rate": 1.9728471683970937e-06, + "loss": 1.0117, + "step": 11953 + }, + { + "epoch": 0.31, + "learning_rate": 1.9728407637408817e-06, + "loss": 0.9902, + "step": 11954 + }, + { + "epoch": 0.31, + "learning_rate": 1.97283435833981e-06, + "loss": 1.0869, + "step": 11955 + }, + { + "epoch": 0.31, + "learning_rate": 1.972827952193884e-06, + "loss": 1.1104, + "step": 11956 + }, + { + "epoch": 0.31, + "learning_rate": 1.972821545303108e-06, + "loss": 0.7969, + "step": 11957 + }, + { + "epoch": 0.31, + "learning_rate": 1.972815137667488e-06, + "loss": 0.7759, + "step": 11958 + }, + { + "epoch": 0.31, + "learning_rate": 1.972808729287027e-06, + "loss": 0.7588, + "step": 11959 + }, + { + "epoch": 0.31, + "learning_rate": 1.9728023201617324e-06, + "loss": 0.8574, + "step": 11960 + }, + { + "epoch": 0.31, + "learning_rate": 1.972795910291607e-06, + "loss": 0.9297, + "step": 11961 + }, + { + "epoch": 0.31, + "learning_rate": 1.9727894996766566e-06, + "loss": 1.0625, + "step": 11962 + }, + { + "epoch": 0.31, + "learning_rate": 1.9727830883168865e-06, + "loss": 0.9365, + "step": 11963 + }, + { + "epoch": 0.31, + "learning_rate": 1.9727766762123004e-06, + "loss": 0.7852, + "step": 11964 + }, + { + "epoch": 0.31, + "learning_rate": 1.9727702633629043e-06, + "loss": 0.9453, + "step": 11965 + }, + { + "epoch": 0.31, + "learning_rate": 1.9727638497687028e-06, + "loss": 1.0059, + "step": 11966 + }, + { + "epoch": 0.31, + "learning_rate": 1.972757435429701e-06, + "loss": 0.9111, + "step": 11967 + }, + { + "epoch": 0.31, + "learning_rate": 1.9727510203459026e-06, + "loss": 0.7705, + "step": 11968 + }, + { + "epoch": 0.31, + "learning_rate": 1.9727446045173146e-06, + "loss": 0.8271, + "step": 11969 + }, + { + "epoch": 0.31, + "learning_rate": 1.9727381879439398e-06, + "loss": 0.9775, + "step": 11970 + }, + { + "epoch": 0.31, + "learning_rate": 1.972731770625785e-06, + "loss": 0.6309, + "step": 11971 + }, + { + "epoch": 0.31, + "learning_rate": 1.9727253525628536e-06, + "loss": 0.7441, + "step": 11972 + }, + { + "epoch": 0.31, + "learning_rate": 1.972718933755151e-06, + "loss": 1.0752, + "step": 11973 + }, + { + "epoch": 0.31, + "learning_rate": 1.9727125142026828e-06, + "loss": 0.8657, + "step": 11974 + }, + { + "epoch": 0.31, + "learning_rate": 1.972706093905453e-06, + "loss": 0.7085, + "step": 11975 + }, + { + "epoch": 0.31, + "learning_rate": 1.972699672863467e-06, + "loss": 0.8506, + "step": 11976 + }, + { + "epoch": 0.31, + "learning_rate": 1.9726932510767297e-06, + "loss": 0.8896, + "step": 11977 + }, + { + "epoch": 0.31, + "learning_rate": 1.9726868285452455e-06, + "loss": 0.7402, + "step": 11978 + }, + { + "epoch": 0.31, + "learning_rate": 1.97268040526902e-06, + "loss": 0.9639, + "step": 11979 + }, + { + "epoch": 0.31, + "learning_rate": 1.972673981248058e-06, + "loss": 1.251, + "step": 11980 + }, + { + "epoch": 0.31, + "learning_rate": 1.972667556482364e-06, + "loss": 1.0859, + "step": 11981 + }, + { + "epoch": 0.31, + "learning_rate": 1.9726611309719436e-06, + "loss": 0.688, + "step": 11982 + }, + { + "epoch": 0.31, + "learning_rate": 1.9726547047168006e-06, + "loss": 0.8887, + "step": 11983 + }, + { + "epoch": 0.31, + "learning_rate": 1.972648277716941e-06, + "loss": 1.0684, + "step": 11984 + }, + { + "epoch": 0.31, + "learning_rate": 1.9726418499723693e-06, + "loss": 1.042, + "step": 11985 + }, + { + "epoch": 0.31, + "learning_rate": 1.9726354214830904e-06, + "loss": 0.9121, + "step": 11986 + }, + { + "epoch": 0.31, + "learning_rate": 1.972628992249109e-06, + "loss": 0.9268, + "step": 11987 + }, + { + "epoch": 0.31, + "learning_rate": 1.972622562270431e-06, + "loss": 0.8535, + "step": 11988 + }, + { + "epoch": 0.31, + "learning_rate": 1.97261613154706e-06, + "loss": 0.9385, + "step": 11989 + }, + { + "epoch": 0.31, + "learning_rate": 1.972609700079002e-06, + "loss": 1.1182, + "step": 11990 + }, + { + "epoch": 0.31, + "learning_rate": 1.9726032678662615e-06, + "loss": 0.8604, + "step": 11991 + }, + { + "epoch": 0.31, + "learning_rate": 1.972596834908843e-06, + "loss": 0.96, + "step": 11992 + }, + { + "epoch": 0.31, + "learning_rate": 1.972590401206752e-06, + "loss": 1.0273, + "step": 11993 + }, + { + "epoch": 0.31, + "learning_rate": 1.9725839667599936e-06, + "loss": 0.9883, + "step": 11994 + }, + { + "epoch": 0.31, + "learning_rate": 1.972577531568572e-06, + "loss": 0.8804, + "step": 11995 + }, + { + "epoch": 0.31, + "learning_rate": 1.9725710956324925e-06, + "loss": 0.6748, + "step": 11996 + }, + { + "epoch": 0.31, + "learning_rate": 1.97256465895176e-06, + "loss": 1.0068, + "step": 11997 + }, + { + "epoch": 0.31, + "learning_rate": 1.9725582215263797e-06, + "loss": 0.8281, + "step": 11998 + }, + { + "epoch": 0.31, + "learning_rate": 1.9725517833563557e-06, + "loss": 1.0498, + "step": 11999 + }, + { + "epoch": 0.31, + "learning_rate": 1.972545344441694e-06, + "loss": 0.8564, + "step": 12000 + }, + { + "epoch": 0.31, + "learning_rate": 1.972538904782399e-06, + "loss": 1.042, + "step": 12001 + }, + { + "epoch": 0.31, + "learning_rate": 1.9725324643784757e-06, + "loss": 0.9512, + "step": 12002 + }, + { + "epoch": 0.31, + "learning_rate": 1.972526023229929e-06, + "loss": 0.8662, + "step": 12003 + }, + { + "epoch": 0.31, + "learning_rate": 1.972519581336764e-06, + "loss": 1.127, + "step": 12004 + }, + { + "epoch": 0.31, + "learning_rate": 1.9725131386989853e-06, + "loss": 0.7861, + "step": 12005 + }, + { + "epoch": 0.31, + "learning_rate": 1.972506695316598e-06, + "loss": 1.1016, + "step": 12006 + }, + { + "epoch": 0.31, + "learning_rate": 1.972500251189607e-06, + "loss": 0.8643, + "step": 12007 + }, + { + "epoch": 0.31, + "learning_rate": 1.9724938063180176e-06, + "loss": 1.0518, + "step": 12008 + }, + { + "epoch": 0.31, + "learning_rate": 1.9724873607018338e-06, + "loss": 0.8374, + "step": 12009 + }, + { + "epoch": 0.31, + "learning_rate": 1.9724809143410614e-06, + "loss": 0.9053, + "step": 12010 + }, + { + "epoch": 0.31, + "learning_rate": 1.9724744672357055e-06, + "loss": 1.0107, + "step": 12011 + }, + { + "epoch": 0.31, + "learning_rate": 1.97246801938577e-06, + "loss": 0.7119, + "step": 12012 + }, + { + "epoch": 0.31, + "learning_rate": 1.972461570791261e-06, + "loss": 0.9111, + "step": 12013 + }, + { + "epoch": 0.31, + "learning_rate": 1.9724551214521825e-06, + "loss": 0.8867, + "step": 12014 + }, + { + "epoch": 0.31, + "learning_rate": 1.97244867136854e-06, + "loss": 0.873, + "step": 12015 + }, + { + "epoch": 0.31, + "learning_rate": 1.972442220540338e-06, + "loss": 0.7695, + "step": 12016 + }, + { + "epoch": 0.31, + "learning_rate": 1.972435768967582e-06, + "loss": 1.041, + "step": 12017 + }, + { + "epoch": 0.31, + "learning_rate": 1.9724293166502765e-06, + "loss": 1.1064, + "step": 12018 + }, + { + "epoch": 0.31, + "learning_rate": 1.972422863588427e-06, + "loss": 1.0947, + "step": 12019 + }, + { + "epoch": 0.31, + "learning_rate": 1.9724164097820376e-06, + "loss": 0.752, + "step": 12020 + }, + { + "epoch": 0.31, + "learning_rate": 1.9724099552311135e-06, + "loss": 1.0459, + "step": 12021 + }, + { + "epoch": 0.31, + "learning_rate": 1.97240349993566e-06, + "loss": 0.9258, + "step": 12022 + }, + { + "epoch": 0.31, + "learning_rate": 1.972397043895682e-06, + "loss": 0.7654, + "step": 12023 + }, + { + "epoch": 0.31, + "learning_rate": 1.9723905871111843e-06, + "loss": 0.8555, + "step": 12024 + }, + { + "epoch": 0.31, + "learning_rate": 1.9723841295821715e-06, + "loss": 0.9204, + "step": 12025 + }, + { + "epoch": 0.31, + "learning_rate": 1.9723776713086494e-06, + "loss": 0.6177, + "step": 12026 + }, + { + "epoch": 0.31, + "learning_rate": 1.9723712122906222e-06, + "loss": 0.9688, + "step": 12027 + }, + { + "epoch": 0.31, + "learning_rate": 1.972364752528095e-06, + "loss": 1.0254, + "step": 12028 + }, + { + "epoch": 0.31, + "learning_rate": 1.9723582920210728e-06, + "loss": 0.8555, + "step": 12029 + }, + { + "epoch": 0.31, + "learning_rate": 1.9723518307695607e-06, + "loss": 1.0244, + "step": 12030 + }, + { + "epoch": 0.31, + "learning_rate": 1.9723453687735634e-06, + "loss": 1.04, + "step": 12031 + }, + { + "epoch": 0.31, + "learning_rate": 1.972338906033086e-06, + "loss": 0.9492, + "step": 12032 + }, + { + "epoch": 0.31, + "learning_rate": 1.9723324425481335e-06, + "loss": 0.7998, + "step": 12033 + }, + { + "epoch": 0.31, + "learning_rate": 1.9723259783187107e-06, + "loss": 1.0293, + "step": 12034 + }, + { + "epoch": 0.31, + "learning_rate": 1.972319513344822e-06, + "loss": 0.8428, + "step": 12035 + }, + { + "epoch": 0.31, + "learning_rate": 1.972313047626474e-06, + "loss": 0.8662, + "step": 12036 + }, + { + "epoch": 0.31, + "learning_rate": 1.9723065811636703e-06, + "loss": 0.7783, + "step": 12037 + }, + { + "epoch": 0.31, + "learning_rate": 1.9723001139564154e-06, + "loss": 1.1758, + "step": 12038 + }, + { + "epoch": 0.31, + "learning_rate": 1.972293646004716e-06, + "loss": 0.752, + "step": 12039 + }, + { + "epoch": 0.31, + "learning_rate": 1.9722871773085755e-06, + "loss": 1.0195, + "step": 12040 + }, + { + "epoch": 0.31, + "learning_rate": 1.9722807078679997e-06, + "loss": 0.959, + "step": 12041 + }, + { + "epoch": 0.31, + "learning_rate": 1.972274237682993e-06, + "loss": 1.0693, + "step": 12042 + }, + { + "epoch": 0.31, + "learning_rate": 1.9722677667535607e-06, + "loss": 1.0029, + "step": 12043 + }, + { + "epoch": 0.31, + "learning_rate": 1.9722612950797075e-06, + "loss": 0.7959, + "step": 12044 + }, + { + "epoch": 0.31, + "learning_rate": 1.972254822661439e-06, + "loss": 0.7854, + "step": 12045 + }, + { + "epoch": 0.31, + "learning_rate": 1.9722483494987596e-06, + "loss": 0.8779, + "step": 12046 + }, + { + "epoch": 0.31, + "learning_rate": 1.972241875591674e-06, + "loss": 1.0645, + "step": 12047 + }, + { + "epoch": 0.31, + "learning_rate": 1.972235400940188e-06, + "loss": 0.834, + "step": 12048 + }, + { + "epoch": 0.31, + "learning_rate": 1.9722289255443056e-06, + "loss": 0.9736, + "step": 12049 + }, + { + "epoch": 0.31, + "learning_rate": 1.9722224494040325e-06, + "loss": 0.9258, + "step": 12050 + }, + { + "epoch": 0.31, + "learning_rate": 1.9722159725193734e-06, + "loss": 1.0449, + "step": 12051 + }, + { + "epoch": 0.31, + "learning_rate": 1.972209494890333e-06, + "loss": 0.9746, + "step": 12052 + }, + { + "epoch": 0.31, + "learning_rate": 1.9722030165169165e-06, + "loss": 1.1592, + "step": 12053 + }, + { + "epoch": 0.31, + "learning_rate": 1.972196537399129e-06, + "loss": 0.9355, + "step": 12054 + }, + { + "epoch": 0.31, + "learning_rate": 1.972190057536975e-06, + "loss": 1.0654, + "step": 12055 + }, + { + "epoch": 0.31, + "learning_rate": 1.97218357693046e-06, + "loss": 1.0059, + "step": 12056 + }, + { + "epoch": 0.31, + "learning_rate": 1.972177095579589e-06, + "loss": 0.9082, + "step": 12057 + }, + { + "epoch": 0.31, + "learning_rate": 1.9721706134843664e-06, + "loss": 0.6075, + "step": 12058 + }, + { + "epoch": 0.31, + "learning_rate": 1.9721641306447975e-06, + "loss": 1.2324, + "step": 12059 + }, + { + "epoch": 0.31, + "learning_rate": 1.972157647060887e-06, + "loss": 0.9062, + "step": 12060 + }, + { + "epoch": 0.31, + "learning_rate": 1.9721511627326407e-06, + "loss": 0.7871, + "step": 12061 + }, + { + "epoch": 0.31, + "learning_rate": 1.972144677660062e-06, + "loss": 0.9521, + "step": 12062 + }, + { + "epoch": 0.31, + "learning_rate": 1.972138191843158e-06, + "loss": 0.9893, + "step": 12063 + }, + { + "epoch": 0.31, + "learning_rate": 1.972131705281932e-06, + "loss": 1.0537, + "step": 12064 + }, + { + "epoch": 0.31, + "learning_rate": 1.972125217976389e-06, + "loss": 1.0664, + "step": 12065 + }, + { + "epoch": 0.31, + "learning_rate": 1.972118729926535e-06, + "loss": 0.9736, + "step": 12066 + }, + { + "epoch": 0.31, + "learning_rate": 1.972112241132374e-06, + "loss": 0.8027, + "step": 12067 + }, + { + "epoch": 0.31, + "learning_rate": 1.9721057515939115e-06, + "loss": 0.8906, + "step": 12068 + }, + { + "epoch": 0.31, + "learning_rate": 1.9720992613111524e-06, + "loss": 1.0029, + "step": 12069 + }, + { + "epoch": 0.31, + "learning_rate": 1.9720927702841016e-06, + "loss": 0.9111, + "step": 12070 + }, + { + "epoch": 0.31, + "learning_rate": 1.972086278512764e-06, + "loss": 0.8281, + "step": 12071 + }, + { + "epoch": 0.31, + "learning_rate": 1.9720797859971445e-06, + "loss": 0.9951, + "step": 12072 + }, + { + "epoch": 0.31, + "learning_rate": 1.9720732927372484e-06, + "loss": 0.5347, + "step": 12073 + }, + { + "epoch": 0.31, + "learning_rate": 1.9720667987330805e-06, + "loss": 1.0234, + "step": 12074 + }, + { + "epoch": 0.31, + "learning_rate": 1.9720603039846456e-06, + "loss": 0.7734, + "step": 12075 + }, + { + "epoch": 0.31, + "learning_rate": 1.972053808491949e-06, + "loss": 0.7988, + "step": 12076 + }, + { + "epoch": 0.31, + "learning_rate": 1.9720473122549955e-06, + "loss": 0.8259, + "step": 12077 + }, + { + "epoch": 0.31, + "learning_rate": 1.9720408152737897e-06, + "loss": 1.126, + "step": 12078 + }, + { + "epoch": 0.31, + "learning_rate": 1.972034317548337e-06, + "loss": 1.0449, + "step": 12079 + }, + { + "epoch": 0.31, + "learning_rate": 1.972027819078643e-06, + "loss": 0.8848, + "step": 12080 + }, + { + "epoch": 0.31, + "learning_rate": 1.9720213198647112e-06, + "loss": 0.9277, + "step": 12081 + }, + { + "epoch": 0.31, + "learning_rate": 1.9720148199065476e-06, + "loss": 1.0146, + "step": 12082 + }, + { + "epoch": 0.31, + "learning_rate": 1.972008319204157e-06, + "loss": 0.9932, + "step": 12083 + }, + { + "epoch": 0.31, + "learning_rate": 1.9720018177575444e-06, + "loss": 0.7344, + "step": 12084 + }, + { + "epoch": 0.31, + "learning_rate": 1.971995315566715e-06, + "loss": 0.9541, + "step": 12085 + }, + { + "epoch": 0.31, + "learning_rate": 1.971988812631673e-06, + "loss": 0.9668, + "step": 12086 + }, + { + "epoch": 0.31, + "learning_rate": 1.971982308952424e-06, + "loss": 1.0215, + "step": 12087 + }, + { + "epoch": 0.31, + "learning_rate": 1.9719758045289727e-06, + "loss": 0.9863, + "step": 12088 + }, + { + "epoch": 0.31, + "learning_rate": 1.9719692993613244e-06, + "loss": 0.8467, + "step": 12089 + }, + { + "epoch": 0.31, + "learning_rate": 1.971962793449484e-06, + "loss": 0.9922, + "step": 12090 + }, + { + "epoch": 0.31, + "learning_rate": 1.971956286793456e-06, + "loss": 1.0249, + "step": 12091 + }, + { + "epoch": 0.31, + "learning_rate": 1.971949779393246e-06, + "loss": 0.8516, + "step": 12092 + }, + { + "epoch": 0.31, + "learning_rate": 1.9719432712488588e-06, + "loss": 0.749, + "step": 12093 + }, + { + "epoch": 0.31, + "learning_rate": 1.9719367623602993e-06, + "loss": 0.8311, + "step": 12094 + }, + { + "epoch": 0.31, + "learning_rate": 1.9719302527275727e-06, + "loss": 0.8696, + "step": 12095 + }, + { + "epoch": 0.31, + "learning_rate": 1.9719237423506836e-06, + "loss": 0.7227, + "step": 12096 + }, + { + "epoch": 0.31, + "learning_rate": 1.9719172312296366e-06, + "loss": 0.772, + "step": 12097 + }, + { + "epoch": 0.31, + "learning_rate": 1.9719107193644378e-06, + "loss": 1.0322, + "step": 12098 + }, + { + "epoch": 0.31, + "learning_rate": 1.971904206755092e-06, + "loss": 1.0479, + "step": 12099 + }, + { + "epoch": 0.31, + "learning_rate": 1.9718976934016034e-06, + "loss": 1.0635, + "step": 12100 + }, + { + "epoch": 0.31, + "learning_rate": 1.9718911793039777e-06, + "loss": 1.1211, + "step": 12101 + }, + { + "epoch": 0.31, + "learning_rate": 1.9718846644622195e-06, + "loss": 0.9365, + "step": 12102 + }, + { + "epoch": 0.31, + "learning_rate": 1.9718781488763336e-06, + "loss": 0.7354, + "step": 12103 + }, + { + "epoch": 0.31, + "learning_rate": 1.971871632546326e-06, + "loss": 0.8789, + "step": 12104 + }, + { + "epoch": 0.31, + "learning_rate": 1.9718651154722e-06, + "loss": 1.0586, + "step": 12105 + }, + { + "epoch": 0.31, + "learning_rate": 1.971858597653962e-06, + "loss": 0.7705, + "step": 12106 + }, + { + "epoch": 0.31, + "learning_rate": 1.971852079091617e-06, + "loss": 0.8389, + "step": 12107 + }, + { + "epoch": 0.31, + "learning_rate": 1.971845559785169e-06, + "loss": 0.7593, + "step": 12108 + }, + { + "epoch": 0.31, + "learning_rate": 1.971839039734624e-06, + "loss": 0.5977, + "step": 12109 + }, + { + "epoch": 0.31, + "learning_rate": 1.971832518939986e-06, + "loss": 0.9492, + "step": 12110 + }, + { + "epoch": 0.31, + "learning_rate": 1.971825997401261e-06, + "loss": 0.9346, + "step": 12111 + }, + { + "epoch": 0.31, + "learning_rate": 1.9718194751184533e-06, + "loss": 0.9561, + "step": 12112 + }, + { + "epoch": 0.31, + "learning_rate": 1.971812952091568e-06, + "loss": 0.6294, + "step": 12113 + }, + { + "epoch": 0.31, + "learning_rate": 1.9718064283206104e-06, + "loss": 1.0879, + "step": 12114 + }, + { + "epoch": 0.31, + "learning_rate": 1.971799903805585e-06, + "loss": 0.7031, + "step": 12115 + }, + { + "epoch": 0.31, + "learning_rate": 1.9717933785464974e-06, + "loss": 0.917, + "step": 12116 + }, + { + "epoch": 0.31, + "learning_rate": 1.9717868525433526e-06, + "loss": 0.9502, + "step": 12117 + }, + { + "epoch": 0.31, + "learning_rate": 1.9717803257961546e-06, + "loss": 0.7205, + "step": 12118 + }, + { + "epoch": 0.31, + "learning_rate": 1.9717737983049094e-06, + "loss": 0.9941, + "step": 12119 + }, + { + "epoch": 0.31, + "learning_rate": 1.971767270069622e-06, + "loss": 0.9229, + "step": 12120 + }, + { + "epoch": 0.31, + "learning_rate": 1.971760741090297e-06, + "loss": 0.8379, + "step": 12121 + }, + { + "epoch": 0.31, + "learning_rate": 1.971754211366939e-06, + "loss": 0.7959, + "step": 12122 + }, + { + "epoch": 0.31, + "learning_rate": 1.9717476808995535e-06, + "loss": 1.0195, + "step": 12123 + }, + { + "epoch": 0.31, + "learning_rate": 1.971741149688146e-06, + "loss": 1.0615, + "step": 12124 + }, + { + "epoch": 0.31, + "learning_rate": 1.9717346177327206e-06, + "loss": 0.834, + "step": 12125 + }, + { + "epoch": 0.31, + "learning_rate": 1.9717280850332827e-06, + "loss": 1.1074, + "step": 12126 + }, + { + "epoch": 0.31, + "learning_rate": 1.9717215515898374e-06, + "loss": 0.9326, + "step": 12127 + }, + { + "epoch": 0.31, + "learning_rate": 1.9717150174023896e-06, + "loss": 1.0088, + "step": 12128 + }, + { + "epoch": 0.31, + "learning_rate": 1.9717084824709446e-06, + "loss": 1.1934, + "step": 12129 + }, + { + "epoch": 0.31, + "learning_rate": 1.9717019467955064e-06, + "loss": 1.0757, + "step": 12130 + }, + { + "epoch": 0.31, + "learning_rate": 1.971695410376081e-06, + "loss": 0.9102, + "step": 12131 + }, + { + "epoch": 0.31, + "learning_rate": 1.9716888732126733e-06, + "loss": 1.0127, + "step": 12132 + }, + { + "epoch": 0.31, + "learning_rate": 1.9716823353052877e-06, + "loss": 0.6724, + "step": 12133 + }, + { + "epoch": 0.31, + "learning_rate": 1.97167579665393e-06, + "loss": 1.0098, + "step": 12134 + }, + { + "epoch": 0.31, + "learning_rate": 1.971669257258605e-06, + "loss": 0.9414, + "step": 12135 + }, + { + "epoch": 0.31, + "learning_rate": 1.971662717119317e-06, + "loss": 1.1797, + "step": 12136 + }, + { + "epoch": 0.31, + "learning_rate": 1.971656176236072e-06, + "loss": 0.9497, + "step": 12137 + }, + { + "epoch": 0.31, + "learning_rate": 1.971649634608874e-06, + "loss": 1.0938, + "step": 12138 + }, + { + "epoch": 0.31, + "learning_rate": 1.971643092237729e-06, + "loss": 0.9619, + "step": 12139 + }, + { + "epoch": 0.31, + "learning_rate": 1.9716365491226417e-06, + "loss": 0.9766, + "step": 12140 + }, + { + "epoch": 0.31, + "learning_rate": 1.9716300052636168e-06, + "loss": 0.907, + "step": 12141 + }, + { + "epoch": 0.31, + "learning_rate": 1.971623460660659e-06, + "loss": 0.9053, + "step": 12142 + }, + { + "epoch": 0.31, + "learning_rate": 1.9716169153137744e-06, + "loss": 0.9707, + "step": 12143 + }, + { + "epoch": 0.31, + "learning_rate": 1.971610369222967e-06, + "loss": 0.7295, + "step": 12144 + }, + { + "epoch": 0.31, + "learning_rate": 1.9716038223882426e-06, + "loss": 0.6226, + "step": 12145 + }, + { + "epoch": 0.31, + "learning_rate": 1.9715972748096055e-06, + "loss": 0.79, + "step": 12146 + }, + { + "epoch": 0.31, + "learning_rate": 1.9715907264870612e-06, + "loss": 0.8115, + "step": 12147 + }, + { + "epoch": 0.31, + "learning_rate": 1.9715841774206145e-06, + "loss": 0.8994, + "step": 12148 + }, + { + "epoch": 0.31, + "learning_rate": 1.9715776276102705e-06, + "loss": 0.8042, + "step": 12149 + }, + { + "epoch": 0.31, + "learning_rate": 1.9715710770560345e-06, + "loss": 0.707, + "step": 12150 + }, + { + "epoch": 0.31, + "learning_rate": 1.9715645257579105e-06, + "loss": 0.7451, + "step": 12151 + }, + { + "epoch": 0.31, + "learning_rate": 1.9715579737159044e-06, + "loss": 1.0205, + "step": 12152 + }, + { + "epoch": 0.31, + "learning_rate": 1.9715514209300213e-06, + "loss": 0.7954, + "step": 12153 + }, + { + "epoch": 0.31, + "learning_rate": 1.9715448674002657e-06, + "loss": 1.0586, + "step": 12154 + }, + { + "epoch": 0.31, + "learning_rate": 1.9715383131266433e-06, + "loss": 0.8203, + "step": 12155 + }, + { + "epoch": 0.31, + "learning_rate": 1.9715317581091587e-06, + "loss": 0.7598, + "step": 12156 + }, + { + "epoch": 0.31, + "learning_rate": 1.9715252023478165e-06, + "loss": 1.0684, + "step": 12157 + }, + { + "epoch": 0.31, + "learning_rate": 1.9715186458426223e-06, + "loss": 0.8374, + "step": 12158 + }, + { + "epoch": 0.31, + "learning_rate": 1.971512088593581e-06, + "loss": 0.8828, + "step": 12159 + }, + { + "epoch": 0.31, + "learning_rate": 1.971505530600697e-06, + "loss": 0.8486, + "step": 12160 + }, + { + "epoch": 0.31, + "learning_rate": 1.971498971863977e-06, + "loss": 0.9814, + "step": 12161 + }, + { + "epoch": 0.31, + "learning_rate": 1.971492412383424e-06, + "loss": 1.0742, + "step": 12162 + }, + { + "epoch": 0.31, + "learning_rate": 1.971485852159044e-06, + "loss": 0.7622, + "step": 12163 + }, + { + "epoch": 0.31, + "learning_rate": 1.9714792911908425e-06, + "loss": 0.874, + "step": 12164 + }, + { + "epoch": 0.31, + "learning_rate": 1.9714727294788232e-06, + "loss": 0.9072, + "step": 12165 + }, + { + "epoch": 0.31, + "learning_rate": 1.9714661670229926e-06, + "loss": 0.8438, + "step": 12166 + }, + { + "epoch": 0.31, + "learning_rate": 1.9714596038233548e-06, + "loss": 0.8945, + "step": 12167 + }, + { + "epoch": 0.31, + "learning_rate": 1.971453039879915e-06, + "loss": 0.9346, + "step": 12168 + }, + { + "epoch": 0.31, + "learning_rate": 1.9714464751926784e-06, + "loss": 0.71, + "step": 12169 + }, + { + "epoch": 0.31, + "learning_rate": 1.9714399097616496e-06, + "loss": 1.1592, + "step": 12170 + }, + { + "epoch": 0.31, + "learning_rate": 1.9714333435868344e-06, + "loss": 0.9346, + "step": 12171 + }, + { + "epoch": 0.31, + "learning_rate": 1.971426776668237e-06, + "loss": 0.8369, + "step": 12172 + }, + { + "epoch": 0.31, + "learning_rate": 1.9714202090058626e-06, + "loss": 0.7871, + "step": 12173 + }, + { + "epoch": 0.31, + "learning_rate": 1.9714136405997165e-06, + "loss": 0.8281, + "step": 12174 + }, + { + "epoch": 0.31, + "learning_rate": 1.971407071449804e-06, + "loss": 0.8013, + "step": 12175 + }, + { + "epoch": 0.31, + "learning_rate": 1.9714005015561295e-06, + "loss": 0.8672, + "step": 12176 + }, + { + "epoch": 0.31, + "learning_rate": 1.9713939309186984e-06, + "loss": 0.7803, + "step": 12177 + }, + { + "epoch": 0.31, + "learning_rate": 1.9713873595375155e-06, + "loss": 1.0947, + "step": 12178 + }, + { + "epoch": 0.31, + "learning_rate": 1.971380787412586e-06, + "loss": 0.8633, + "step": 12179 + }, + { + "epoch": 0.31, + "learning_rate": 1.971374214543915e-06, + "loss": 0.8564, + "step": 12180 + }, + { + "epoch": 0.31, + "learning_rate": 1.9713676409315078e-06, + "loss": 0.7168, + "step": 12181 + }, + { + "epoch": 0.31, + "learning_rate": 1.9713610665753686e-06, + "loss": 0.7637, + "step": 12182 + }, + { + "epoch": 0.31, + "learning_rate": 1.9713544914755028e-06, + "loss": 0.9648, + "step": 12183 + }, + { + "epoch": 0.31, + "learning_rate": 1.9713479156319157e-06, + "loss": 0.8096, + "step": 12184 + }, + { + "epoch": 0.31, + "learning_rate": 1.971341339044612e-06, + "loss": 0.8262, + "step": 12185 + }, + { + "epoch": 0.31, + "learning_rate": 1.971334761713597e-06, + "loss": 0.7017, + "step": 12186 + }, + { + "epoch": 0.31, + "learning_rate": 1.971328183638876e-06, + "loss": 0.7271, + "step": 12187 + }, + { + "epoch": 0.31, + "learning_rate": 1.971321604820453e-06, + "loss": 0.9102, + "step": 12188 + }, + { + "epoch": 0.31, + "learning_rate": 1.9713150252583343e-06, + "loss": 0.9873, + "step": 12189 + }, + { + "epoch": 0.31, + "learning_rate": 1.971308444952524e-06, + "loss": 0.8955, + "step": 12190 + }, + { + "epoch": 0.31, + "learning_rate": 1.9713018639030275e-06, + "loss": 1.0469, + "step": 12191 + }, + { + "epoch": 0.31, + "learning_rate": 1.97129528210985e-06, + "loss": 0.8965, + "step": 12192 + }, + { + "epoch": 0.31, + "learning_rate": 1.9712886995729965e-06, + "loss": 0.8896, + "step": 12193 + }, + { + "epoch": 0.31, + "learning_rate": 1.9712821162924716e-06, + "loss": 0.8335, + "step": 12194 + }, + { + "epoch": 0.31, + "learning_rate": 1.971275532268281e-06, + "loss": 1.1934, + "step": 12195 + }, + { + "epoch": 0.31, + "learning_rate": 1.971268947500429e-06, + "loss": 1.043, + "step": 12196 + }, + { + "epoch": 0.31, + "learning_rate": 1.9712623619889214e-06, + "loss": 0.7119, + "step": 12197 + }, + { + "epoch": 0.31, + "learning_rate": 1.971255775733762e-06, + "loss": 0.8203, + "step": 12198 + }, + { + "epoch": 0.31, + "learning_rate": 1.9712491887349578e-06, + "loss": 0.8457, + "step": 12199 + }, + { + "epoch": 0.31, + "learning_rate": 1.9712426009925124e-06, + "loss": 0.9492, + "step": 12200 + }, + { + "epoch": 0.31, + "learning_rate": 1.971236012506431e-06, + "loss": 0.9932, + "step": 12201 + }, + { + "epoch": 0.31, + "learning_rate": 1.971229423276719e-06, + "loss": 0.8232, + "step": 12202 + }, + { + "epoch": 0.31, + "learning_rate": 1.971222833303381e-06, + "loss": 0.9072, + "step": 12203 + }, + { + "epoch": 0.31, + "learning_rate": 1.9712162425864226e-06, + "loss": 1.2363, + "step": 12204 + }, + { + "epoch": 0.31, + "learning_rate": 1.9712096511258486e-06, + "loss": 1.0635, + "step": 12205 + }, + { + "epoch": 0.31, + "learning_rate": 1.971203058921664e-06, + "loss": 0.8652, + "step": 12206 + }, + { + "epoch": 0.31, + "learning_rate": 1.9711964659738737e-06, + "loss": 1.0596, + "step": 12207 + }, + { + "epoch": 0.31, + "learning_rate": 1.971189872282483e-06, + "loss": 0.875, + "step": 12208 + }, + { + "epoch": 0.31, + "learning_rate": 1.971183277847497e-06, + "loss": 0.8284, + "step": 12209 + }, + { + "epoch": 0.31, + "learning_rate": 1.9711766826689207e-06, + "loss": 0.833, + "step": 12210 + }, + { + "epoch": 0.31, + "learning_rate": 1.971170086746759e-06, + "loss": 0.7715, + "step": 12211 + }, + { + "epoch": 0.31, + "learning_rate": 1.9711634900810168e-06, + "loss": 0.75, + "step": 12212 + }, + { + "epoch": 0.31, + "learning_rate": 1.9711568926716994e-06, + "loss": 1.0566, + "step": 12213 + }, + { + "epoch": 0.31, + "learning_rate": 1.971150294518812e-06, + "loss": 0.8469, + "step": 12214 + }, + { + "epoch": 0.31, + "learning_rate": 1.9711436956223594e-06, + "loss": 0.7222, + "step": 12215 + }, + { + "epoch": 0.31, + "learning_rate": 1.971137095982347e-06, + "loss": 0.8623, + "step": 12216 + }, + { + "epoch": 0.31, + "learning_rate": 1.9711304955987793e-06, + "loss": 0.8262, + "step": 12217 + }, + { + "epoch": 0.31, + "learning_rate": 1.9711238944716615e-06, + "loss": 0.6489, + "step": 12218 + }, + { + "epoch": 0.31, + "learning_rate": 1.971117292600999e-06, + "loss": 1.0762, + "step": 12219 + }, + { + "epoch": 0.31, + "learning_rate": 1.9711106899867965e-06, + "loss": 0.9971, + "step": 12220 + }, + { + "epoch": 0.31, + "learning_rate": 1.9711040866290595e-06, + "loss": 0.9238, + "step": 12221 + }, + { + "epoch": 0.31, + "learning_rate": 1.971097482527792e-06, + "loss": 0.9824, + "step": 12222 + }, + { + "epoch": 0.31, + "learning_rate": 1.9710908776830007e-06, + "loss": 0.8418, + "step": 12223 + }, + { + "epoch": 0.31, + "learning_rate": 1.971084272094689e-06, + "loss": 0.8716, + "step": 12224 + }, + { + "epoch": 0.31, + "learning_rate": 1.9710776657628635e-06, + "loss": 1.0293, + "step": 12225 + }, + { + "epoch": 0.31, + "learning_rate": 1.971071058687528e-06, + "loss": 1.1289, + "step": 12226 + }, + { + "epoch": 0.31, + "learning_rate": 1.9710644508686883e-06, + "loss": 0.9551, + "step": 12227 + }, + { + "epoch": 0.31, + "learning_rate": 1.971057842306349e-06, + "loss": 0.7793, + "step": 12228 + }, + { + "epoch": 0.31, + "learning_rate": 1.9710512330005155e-06, + "loss": 1.0576, + "step": 12229 + }, + { + "epoch": 0.31, + "learning_rate": 1.9710446229511927e-06, + "loss": 0.7266, + "step": 12230 + }, + { + "epoch": 0.31, + "learning_rate": 1.9710380121583855e-06, + "loss": 0.7319, + "step": 12231 + }, + { + "epoch": 0.31, + "learning_rate": 1.9710314006220994e-06, + "loss": 0.8047, + "step": 12232 + }, + { + "epoch": 0.31, + "learning_rate": 1.971024788342339e-06, + "loss": 0.96, + "step": 12233 + }, + { + "epoch": 0.31, + "learning_rate": 1.9710181753191093e-06, + "loss": 1.041, + "step": 12234 + }, + { + "epoch": 0.31, + "learning_rate": 1.9710115615524164e-06, + "loss": 1.0293, + "step": 12235 + }, + { + "epoch": 0.31, + "learning_rate": 1.971004947042264e-06, + "loss": 1.0166, + "step": 12236 + }, + { + "epoch": 0.31, + "learning_rate": 1.9709983317886582e-06, + "loss": 0.9771, + "step": 12237 + }, + { + "epoch": 0.31, + "learning_rate": 1.970991715791603e-06, + "loss": 0.9453, + "step": 12238 + }, + { + "epoch": 0.31, + "learning_rate": 1.9709850990511046e-06, + "loss": 0.8633, + "step": 12239 + }, + { + "epoch": 0.31, + "learning_rate": 1.9709784815671674e-06, + "loss": 0.8594, + "step": 12240 + }, + { + "epoch": 0.31, + "learning_rate": 1.9709718633397965e-06, + "loss": 0.7881, + "step": 12241 + }, + { + "epoch": 0.31, + "learning_rate": 1.970965244368997e-06, + "loss": 0.9658, + "step": 12242 + }, + { + "epoch": 0.31, + "learning_rate": 1.9709586246547744e-06, + "loss": 0.8115, + "step": 12243 + }, + { + "epoch": 0.31, + "learning_rate": 1.9709520041971336e-06, + "loss": 0.8447, + "step": 12244 + }, + { + "epoch": 0.31, + "learning_rate": 1.970945382996079e-06, + "loss": 0.8462, + "step": 12245 + }, + { + "epoch": 0.31, + "learning_rate": 1.9709387610516164e-06, + "loss": 0.9502, + "step": 12246 + }, + { + "epoch": 0.31, + "learning_rate": 1.9709321383637506e-06, + "loss": 1.084, + "step": 12247 + }, + { + "epoch": 0.31, + "learning_rate": 1.9709255149324868e-06, + "loss": 1.0508, + "step": 12248 + }, + { + "epoch": 0.31, + "learning_rate": 1.97091889075783e-06, + "loss": 0.8682, + "step": 12249 + }, + { + "epoch": 0.31, + "learning_rate": 1.970912265839785e-06, + "loss": 0.8599, + "step": 12250 + }, + { + "epoch": 0.31, + "learning_rate": 1.970905640178357e-06, + "loss": 0.7217, + "step": 12251 + }, + { + "epoch": 0.31, + "learning_rate": 1.9708990137735517e-06, + "loss": 0.918, + "step": 12252 + }, + { + "epoch": 0.31, + "learning_rate": 1.9708923866253735e-06, + "loss": 1.1875, + "step": 12253 + }, + { + "epoch": 0.31, + "learning_rate": 1.9708857587338273e-06, + "loss": 1.0791, + "step": 12254 + }, + { + "epoch": 0.31, + "learning_rate": 1.970879130098919e-06, + "loss": 0.8271, + "step": 12255 + }, + { + "epoch": 0.31, + "learning_rate": 1.970872500720653e-06, + "loss": 0.9766, + "step": 12256 + }, + { + "epoch": 0.31, + "learning_rate": 1.9708658705990345e-06, + "loss": 0.9297, + "step": 12257 + }, + { + "epoch": 0.31, + "learning_rate": 1.9708592397340685e-06, + "loss": 0.8887, + "step": 12258 + }, + { + "epoch": 0.31, + "learning_rate": 1.9708526081257608e-06, + "loss": 0.7148, + "step": 12259 + }, + { + "epoch": 0.31, + "learning_rate": 1.970845975774115e-06, + "loss": 0.8564, + "step": 12260 + }, + { + "epoch": 0.31, + "learning_rate": 1.9708393426791375e-06, + "loss": 0.6367, + "step": 12261 + }, + { + "epoch": 0.31, + "learning_rate": 1.970832708840833e-06, + "loss": 0.8027, + "step": 12262 + }, + { + "epoch": 0.31, + "learning_rate": 1.970826074259207e-06, + "loss": 0.7896, + "step": 12263 + }, + { + "epoch": 0.31, + "learning_rate": 1.9708194389342636e-06, + "loss": 0.8672, + "step": 12264 + }, + { + "epoch": 0.31, + "learning_rate": 1.970812802866008e-06, + "loss": 0.8506, + "step": 12265 + }, + { + "epoch": 0.31, + "learning_rate": 1.9708061660544464e-06, + "loss": 0.8809, + "step": 12266 + }, + { + "epoch": 0.31, + "learning_rate": 1.9707995284995832e-06, + "loss": 0.8867, + "step": 12267 + }, + { + "epoch": 0.31, + "learning_rate": 1.970792890201423e-06, + "loss": 0.9199, + "step": 12268 + }, + { + "epoch": 0.31, + "learning_rate": 1.9707862511599715e-06, + "loss": 0.8936, + "step": 12269 + }, + { + "epoch": 0.31, + "learning_rate": 1.9707796113752336e-06, + "loss": 1.082, + "step": 12270 + }, + { + "epoch": 0.31, + "learning_rate": 1.9707729708472145e-06, + "loss": 1.0137, + "step": 12271 + }, + { + "epoch": 0.31, + "learning_rate": 1.970766329575919e-06, + "loss": 0.8359, + "step": 12272 + }, + { + "epoch": 0.31, + "learning_rate": 1.9707596875613523e-06, + "loss": 0.9902, + "step": 12273 + }, + { + "epoch": 0.31, + "learning_rate": 1.9707530448035198e-06, + "loss": 1.1123, + "step": 12274 + }, + { + "epoch": 0.31, + "learning_rate": 1.970746401302426e-06, + "loss": 1.1592, + "step": 12275 + }, + { + "epoch": 0.31, + "learning_rate": 1.9707397570580765e-06, + "loss": 0.9287, + "step": 12276 + }, + { + "epoch": 0.31, + "learning_rate": 1.9707331120704764e-06, + "loss": 1.0068, + "step": 12277 + }, + { + "epoch": 0.31, + "learning_rate": 1.9707264663396303e-06, + "loss": 1.0605, + "step": 12278 + }, + { + "epoch": 0.31, + "learning_rate": 1.9707198198655436e-06, + "loss": 0.8894, + "step": 12279 + }, + { + "epoch": 0.31, + "learning_rate": 1.970713172648221e-06, + "loss": 0.8066, + "step": 12280 + }, + { + "epoch": 0.31, + "learning_rate": 1.9707065246876688e-06, + "loss": 1.0439, + "step": 12281 + }, + { + "epoch": 0.31, + "learning_rate": 1.9706998759838907e-06, + "loss": 0.9443, + "step": 12282 + }, + { + "epoch": 0.31, + "learning_rate": 1.9706932265368925e-06, + "loss": 0.8975, + "step": 12283 + }, + { + "epoch": 0.31, + "learning_rate": 1.970686576346679e-06, + "loss": 0.8945, + "step": 12284 + }, + { + "epoch": 0.31, + "learning_rate": 1.970679925413256e-06, + "loss": 0.7195, + "step": 12285 + }, + { + "epoch": 0.31, + "learning_rate": 1.9706732737366272e-06, + "loss": 0.8988, + "step": 12286 + }, + { + "epoch": 0.31, + "learning_rate": 1.9706666213167988e-06, + "loss": 0.8628, + "step": 12287 + }, + { + "epoch": 0.31, + "learning_rate": 1.9706599681537755e-06, + "loss": 0.8691, + "step": 12288 + }, + { + "epoch": 0.31, + "learning_rate": 1.970653314247563e-06, + "loss": 0.9165, + "step": 12289 + }, + { + "epoch": 0.31, + "learning_rate": 1.9706466595981655e-06, + "loss": 0.8721, + "step": 12290 + }, + { + "epoch": 0.32, + "learning_rate": 1.9706400042055885e-06, + "loss": 0.8525, + "step": 12291 + }, + { + "epoch": 0.32, + "learning_rate": 1.970633348069837e-06, + "loss": 0.7505, + "step": 12292 + }, + { + "epoch": 0.32, + "learning_rate": 1.9706266911909163e-06, + "loss": 1.0049, + "step": 12293 + }, + { + "epoch": 0.32, + "learning_rate": 1.9706200335688313e-06, + "loss": 1.1172, + "step": 12294 + }, + { + "epoch": 0.32, + "learning_rate": 1.9706133752035875e-06, + "loss": 0.7031, + "step": 12295 + }, + { + "epoch": 0.32, + "learning_rate": 1.970606716095189e-06, + "loss": 0.7812, + "step": 12296 + }, + { + "epoch": 0.32, + "learning_rate": 1.9706000562436423e-06, + "loss": 0.9573, + "step": 12297 + }, + { + "epoch": 0.32, + "learning_rate": 1.9705933956489514e-06, + "loss": 1.0391, + "step": 12298 + }, + { + "epoch": 0.32, + "learning_rate": 1.9705867343111217e-06, + "loss": 0.8867, + "step": 12299 + }, + { + "epoch": 0.32, + "learning_rate": 1.9705800722301583e-06, + "loss": 0.7183, + "step": 12300 + }, + { + "epoch": 0.32, + "learning_rate": 1.9705734094060666e-06, + "loss": 0.9443, + "step": 12301 + }, + { + "epoch": 0.32, + "learning_rate": 1.9705667458388512e-06, + "loss": 1.0146, + "step": 12302 + }, + { + "epoch": 0.32, + "learning_rate": 1.970560081528518e-06, + "loss": 0.7317, + "step": 12303 + }, + { + "epoch": 0.32, + "learning_rate": 1.970553416475071e-06, + "loss": 0.9648, + "step": 12304 + }, + { + "epoch": 0.32, + "learning_rate": 1.970546750678516e-06, + "loss": 0.8418, + "step": 12305 + }, + { + "epoch": 0.32, + "learning_rate": 1.970540084138858e-06, + "loss": 0.9229, + "step": 12306 + }, + { + "epoch": 0.32, + "learning_rate": 1.9705334168561027e-06, + "loss": 0.7744, + "step": 12307 + }, + { + "epoch": 0.32, + "learning_rate": 1.970526748830254e-06, + "loss": 1.125, + "step": 12308 + }, + { + "epoch": 0.32, + "learning_rate": 1.9705200800613176e-06, + "loss": 0.9648, + "step": 12309 + }, + { + "epoch": 0.32, + "learning_rate": 1.9705134105492985e-06, + "loss": 0.9062, + "step": 12310 + }, + { + "epoch": 0.32, + "learning_rate": 1.970506740294202e-06, + "loss": 0.9189, + "step": 12311 + }, + { + "epoch": 0.32, + "learning_rate": 1.970500069296033e-06, + "loss": 0.9668, + "step": 12312 + }, + { + "epoch": 0.32, + "learning_rate": 1.9704933975547974e-06, + "loss": 0.8574, + "step": 12313 + }, + { + "epoch": 0.32, + "learning_rate": 1.970486725070499e-06, + "loss": 0.835, + "step": 12314 + }, + { + "epoch": 0.32, + "learning_rate": 1.9704800518431436e-06, + "loss": 0.8564, + "step": 12315 + }, + { + "epoch": 0.32, + "learning_rate": 1.970473377872736e-06, + "loss": 0.8486, + "step": 12316 + }, + { + "epoch": 0.32, + "learning_rate": 1.9704667031592825e-06, + "loss": 0.8555, + "step": 12317 + }, + { + "epoch": 0.32, + "learning_rate": 1.970460027702786e-06, + "loss": 0.8281, + "step": 12318 + }, + { + "epoch": 0.32, + "learning_rate": 1.970453351503254e-06, + "loss": 0.7549, + "step": 12319 + }, + { + "epoch": 0.32, + "learning_rate": 1.97044667456069e-06, + "loss": 1.0068, + "step": 12320 + }, + { + "epoch": 0.32, + "learning_rate": 1.9704399968750994e-06, + "loss": 0.8164, + "step": 12321 + }, + { + "epoch": 0.32, + "learning_rate": 1.9704333184464878e-06, + "loss": 1.0156, + "step": 12322 + }, + { + "epoch": 0.32, + "learning_rate": 1.97042663927486e-06, + "loss": 0.8032, + "step": 12323 + }, + { + "epoch": 0.32, + "learning_rate": 1.970419959360221e-06, + "loss": 0.9209, + "step": 12324 + }, + { + "epoch": 0.32, + "learning_rate": 1.970413278702576e-06, + "loss": 0.8096, + "step": 12325 + }, + { + "epoch": 0.32, + "learning_rate": 1.9704065973019307e-06, + "loss": 0.9268, + "step": 12326 + }, + { + "epoch": 0.32, + "learning_rate": 1.9703999151582893e-06, + "loss": 0.6699, + "step": 12327 + }, + { + "epoch": 0.32, + "learning_rate": 1.9703932322716573e-06, + "loss": 0.7109, + "step": 12328 + }, + { + "epoch": 0.32, + "learning_rate": 1.97038654864204e-06, + "loss": 0.9834, + "step": 12329 + }, + { + "epoch": 0.32, + "learning_rate": 1.970379864269442e-06, + "loss": 0.9053, + "step": 12330 + }, + { + "epoch": 0.32, + "learning_rate": 1.970373179153869e-06, + "loss": 0.6991, + "step": 12331 + }, + { + "epoch": 0.32, + "learning_rate": 1.9703664932953258e-06, + "loss": 0.9854, + "step": 12332 + }, + { + "epoch": 0.32, + "learning_rate": 1.9703598066938177e-06, + "loss": 1.1475, + "step": 12333 + }, + { + "epoch": 0.32, + "learning_rate": 1.9703531193493495e-06, + "loss": 0.8804, + "step": 12334 + }, + { + "epoch": 0.32, + "learning_rate": 1.9703464312619267e-06, + "loss": 0.7207, + "step": 12335 + }, + { + "epoch": 0.32, + "learning_rate": 1.9703397424315544e-06, + "loss": 1.1084, + "step": 12336 + }, + { + "epoch": 0.32, + "learning_rate": 1.9703330528582375e-06, + "loss": 0.8984, + "step": 12337 + }, + { + "epoch": 0.32, + "learning_rate": 1.970326362541981e-06, + "loss": 0.9844, + "step": 12338 + }, + { + "epoch": 0.32, + "learning_rate": 1.9703196714827905e-06, + "loss": 0.8418, + "step": 12339 + }, + { + "epoch": 0.32, + "learning_rate": 1.9703129796806704e-06, + "loss": 1.0762, + "step": 12340 + }, + { + "epoch": 0.32, + "learning_rate": 1.9703062871356265e-06, + "loss": 0.8818, + "step": 12341 + }, + { + "epoch": 0.32, + "learning_rate": 1.9702995938476637e-06, + "loss": 0.7051, + "step": 12342 + }, + { + "epoch": 0.32, + "learning_rate": 1.9702928998167873e-06, + "loss": 1.0215, + "step": 12343 + }, + { + "epoch": 0.32, + "learning_rate": 1.970286205043002e-06, + "loss": 1.1895, + "step": 12344 + }, + { + "epoch": 0.32, + "learning_rate": 1.9702795095263133e-06, + "loss": 1.124, + "step": 12345 + }, + { + "epoch": 0.32, + "learning_rate": 1.970272813266726e-06, + "loss": 0.7139, + "step": 12346 + }, + { + "epoch": 0.32, + "learning_rate": 1.970266116264246e-06, + "loss": 1.0957, + "step": 12347 + }, + { + "epoch": 0.32, + "learning_rate": 1.970259418518877e-06, + "loss": 0.9141, + "step": 12348 + }, + { + "epoch": 0.32, + "learning_rate": 1.9702527200306258e-06, + "loss": 0.8452, + "step": 12349 + }, + { + "epoch": 0.32, + "learning_rate": 1.970246020799496e-06, + "loss": 0.7974, + "step": 12350 + }, + { + "epoch": 0.32, + "learning_rate": 1.970239320825494e-06, + "loss": 0.9355, + "step": 12351 + }, + { + "epoch": 0.32, + "learning_rate": 1.970232620108624e-06, + "loss": 0.8838, + "step": 12352 + }, + { + "epoch": 0.32, + "learning_rate": 1.9702259186488916e-06, + "loss": 1.0, + "step": 12353 + }, + { + "epoch": 0.32, + "learning_rate": 1.9702192164463017e-06, + "loss": 0.9355, + "step": 12354 + }, + { + "epoch": 0.32, + "learning_rate": 1.9702125135008597e-06, + "loss": 0.873, + "step": 12355 + }, + { + "epoch": 0.32, + "learning_rate": 1.9702058098125706e-06, + "loss": 0.7065, + "step": 12356 + }, + { + "epoch": 0.32, + "learning_rate": 1.9701991053814395e-06, + "loss": 0.7021, + "step": 12357 + }, + { + "epoch": 0.32, + "learning_rate": 1.9701924002074716e-06, + "loss": 0.5825, + "step": 12358 + }, + { + "epoch": 0.32, + "learning_rate": 1.970185694290672e-06, + "loss": 0.9268, + "step": 12359 + }, + { + "epoch": 0.32, + "learning_rate": 1.9701789876310454e-06, + "loss": 0.915, + "step": 12360 + }, + { + "epoch": 0.32, + "learning_rate": 1.9701722802285977e-06, + "loss": 0.8721, + "step": 12361 + }, + { + "epoch": 0.32, + "learning_rate": 1.970165572083334e-06, + "loss": 1.1406, + "step": 12362 + }, + { + "epoch": 0.32, + "learning_rate": 1.9701588631952586e-06, + "loss": 0.8398, + "step": 12363 + }, + { + "epoch": 0.32, + "learning_rate": 1.970152153564378e-06, + "loss": 0.8359, + "step": 12364 + }, + { + "epoch": 0.32, + "learning_rate": 1.9701454431906957e-06, + "loss": 0.9619, + "step": 12365 + }, + { + "epoch": 0.32, + "learning_rate": 1.9701387320742173e-06, + "loss": 0.9717, + "step": 12366 + }, + { + "epoch": 0.32, + "learning_rate": 1.970132020214949e-06, + "loss": 0.7261, + "step": 12367 + }, + { + "epoch": 0.32, + "learning_rate": 1.9701253076128952e-06, + "loss": 0.9009, + "step": 12368 + }, + { + "epoch": 0.32, + "learning_rate": 1.970118594268061e-06, + "loss": 0.8076, + "step": 12369 + }, + { + "epoch": 0.32, + "learning_rate": 1.9701118801804514e-06, + "loss": 0.8516, + "step": 12370 + }, + { + "epoch": 0.32, + "learning_rate": 1.970105165350072e-06, + "loss": 0.8125, + "step": 12371 + }, + { + "epoch": 0.32, + "learning_rate": 1.9700984497769276e-06, + "loss": 0.9785, + "step": 12372 + }, + { + "epoch": 0.32, + "learning_rate": 1.9700917334610235e-06, + "loss": 0.6285, + "step": 12373 + }, + { + "epoch": 0.32, + "learning_rate": 1.9700850164023642e-06, + "loss": 0.9326, + "step": 12374 + }, + { + "epoch": 0.32, + "learning_rate": 1.970078298600956e-06, + "loss": 1.0264, + "step": 12375 + }, + { + "epoch": 0.32, + "learning_rate": 1.970071580056803e-06, + "loss": 0.7915, + "step": 12376 + }, + { + "epoch": 0.32, + "learning_rate": 1.9700648607699114e-06, + "loss": 0.7793, + "step": 12377 + }, + { + "epoch": 0.32, + "learning_rate": 1.9700581407402854e-06, + "loss": 0.915, + "step": 12378 + }, + { + "epoch": 0.32, + "learning_rate": 1.9700514199679304e-06, + "loss": 0.9463, + "step": 12379 + }, + { + "epoch": 0.32, + "learning_rate": 1.970044698452852e-06, + "loss": 0.7705, + "step": 12380 + }, + { + "epoch": 0.32, + "learning_rate": 1.9700379761950546e-06, + "loss": 0.7122, + "step": 12381 + }, + { + "epoch": 0.32, + "learning_rate": 1.970031253194544e-06, + "loss": 0.8389, + "step": 12382 + }, + { + "epoch": 0.32, + "learning_rate": 1.970024529451325e-06, + "loss": 0.7559, + "step": 12383 + }, + { + "epoch": 0.32, + "learning_rate": 1.9700178049654024e-06, + "loss": 0.8994, + "step": 12384 + }, + { + "epoch": 0.32, + "learning_rate": 1.9700110797367825e-06, + "loss": 0.875, + "step": 12385 + }, + { + "epoch": 0.32, + "learning_rate": 1.970004353765469e-06, + "loss": 0.8857, + "step": 12386 + }, + { + "epoch": 0.32, + "learning_rate": 1.969997627051468e-06, + "loss": 0.8154, + "step": 12387 + }, + { + "epoch": 0.32, + "learning_rate": 1.9699908995947847e-06, + "loss": 1.1162, + "step": 12388 + }, + { + "epoch": 0.32, + "learning_rate": 1.969984171395424e-06, + "loss": 0.9912, + "step": 12389 + }, + { + "epoch": 0.32, + "learning_rate": 1.969977442453391e-06, + "loss": 0.916, + "step": 12390 + }, + { + "epoch": 0.32, + "learning_rate": 1.9699707127686903e-06, + "loss": 1.1074, + "step": 12391 + }, + { + "epoch": 0.32, + "learning_rate": 1.9699639823413282e-06, + "loss": 0.9922, + "step": 12392 + }, + { + "epoch": 0.32, + "learning_rate": 1.969957251171309e-06, + "loss": 1.0469, + "step": 12393 + }, + { + "epoch": 0.32, + "learning_rate": 1.969950519258638e-06, + "loss": 1.1299, + "step": 12394 + }, + { + "epoch": 0.32, + "learning_rate": 1.969943786603321e-06, + "loss": 0.9072, + "step": 12395 + }, + { + "epoch": 0.32, + "learning_rate": 1.969937053205362e-06, + "loss": 1.0703, + "step": 12396 + }, + { + "epoch": 0.32, + "learning_rate": 1.9699303190647675e-06, + "loss": 1.3232, + "step": 12397 + }, + { + "epoch": 0.32, + "learning_rate": 1.969923584181541e-06, + "loss": 0.7891, + "step": 12398 + }, + { + "epoch": 0.32, + "learning_rate": 1.9699168485556897e-06, + "loss": 0.5786, + "step": 12399 + }, + { + "epoch": 0.32, + "learning_rate": 1.9699101121872174e-06, + "loss": 0.9644, + "step": 12400 + }, + { + "epoch": 0.32, + "learning_rate": 1.9699033750761292e-06, + "loss": 0.7744, + "step": 12401 + }, + { + "epoch": 0.32, + "learning_rate": 1.969896637222431e-06, + "loss": 0.9248, + "step": 12402 + }, + { + "epoch": 0.32, + "learning_rate": 1.9698898986261267e-06, + "loss": 1.0596, + "step": 12403 + }, + { + "epoch": 0.32, + "learning_rate": 1.969883159287223e-06, + "loss": 0.812, + "step": 12404 + }, + { + "epoch": 0.32, + "learning_rate": 1.969876419205724e-06, + "loss": 0.8232, + "step": 12405 + }, + { + "epoch": 0.32, + "learning_rate": 1.9698696783816352e-06, + "loss": 0.7949, + "step": 12406 + }, + { + "epoch": 0.32, + "learning_rate": 1.9698629368149624e-06, + "loss": 0.9053, + "step": 12407 + }, + { + "epoch": 0.32, + "learning_rate": 1.9698561945057097e-06, + "loss": 0.8057, + "step": 12408 + }, + { + "epoch": 0.32, + "learning_rate": 1.9698494514538827e-06, + "loss": 0.688, + "step": 12409 + }, + { + "epoch": 0.32, + "learning_rate": 1.9698427076594865e-06, + "loss": 0.8516, + "step": 12410 + }, + { + "epoch": 0.32, + "learning_rate": 1.9698359631225266e-06, + "loss": 0.7012, + "step": 12411 + }, + { + "epoch": 0.32, + "learning_rate": 1.969829217843008e-06, + "loss": 0.9385, + "step": 12412 + }, + { + "epoch": 0.32, + "learning_rate": 1.9698224718209355e-06, + "loss": 1.0518, + "step": 12413 + }, + { + "epoch": 0.32, + "learning_rate": 1.969815725056314e-06, + "loss": 1.0356, + "step": 12414 + }, + { + "epoch": 0.32, + "learning_rate": 1.96980897754915e-06, + "loss": 0.8174, + "step": 12415 + }, + { + "epoch": 0.32, + "learning_rate": 1.9698022292994474e-06, + "loss": 0.8408, + "step": 12416 + }, + { + "epoch": 0.32, + "learning_rate": 1.969795480307212e-06, + "loss": 1.0771, + "step": 12417 + }, + { + "epoch": 0.32, + "learning_rate": 1.969788730572449e-06, + "loss": 0.834, + "step": 12418 + }, + { + "epoch": 0.32, + "learning_rate": 1.9697819800951633e-06, + "loss": 0.688, + "step": 12419 + }, + { + "epoch": 0.32, + "learning_rate": 1.9697752288753595e-06, + "loss": 0.7839, + "step": 12420 + }, + { + "epoch": 0.32, + "learning_rate": 1.969768476913044e-06, + "loss": 0.8691, + "step": 12421 + }, + { + "epoch": 0.32, + "learning_rate": 1.9697617242082213e-06, + "loss": 0.7561, + "step": 12422 + }, + { + "epoch": 0.32, + "learning_rate": 1.969754970760897e-06, + "loss": 0.9287, + "step": 12423 + }, + { + "epoch": 0.32, + "learning_rate": 1.969748216571075e-06, + "loss": 0.835, + "step": 12424 + }, + { + "epoch": 0.32, + "learning_rate": 1.9697414616387623e-06, + "loss": 0.9658, + "step": 12425 + }, + { + "epoch": 0.32, + "learning_rate": 1.9697347059639624e-06, + "loss": 0.8506, + "step": 12426 + }, + { + "epoch": 0.32, + "learning_rate": 1.969727949546682e-06, + "loss": 1.0176, + "step": 12427 + }, + { + "epoch": 0.32, + "learning_rate": 1.969721192386925e-06, + "loss": 0.8711, + "step": 12428 + }, + { + "epoch": 0.32, + "learning_rate": 1.969714434484697e-06, + "loss": 0.9307, + "step": 12429 + }, + { + "epoch": 0.32, + "learning_rate": 1.9697076758400034e-06, + "loss": 0.7114, + "step": 12430 + }, + { + "epoch": 0.32, + "learning_rate": 1.969700916452849e-06, + "loss": 0.7559, + "step": 12431 + }, + { + "epoch": 0.32, + "learning_rate": 1.9696941563232396e-06, + "loss": 0.8071, + "step": 12432 + }, + { + "epoch": 0.32, + "learning_rate": 1.96968739545118e-06, + "loss": 0.9463, + "step": 12433 + }, + { + "epoch": 0.32, + "learning_rate": 1.969680633836675e-06, + "loss": 0.7587, + "step": 12434 + }, + { + "epoch": 0.32, + "learning_rate": 1.9696738714797304e-06, + "loss": 0.9121, + "step": 12435 + }, + { + "epoch": 0.32, + "learning_rate": 1.9696671083803505e-06, + "loss": 1.123, + "step": 12436 + }, + { + "epoch": 0.32, + "learning_rate": 1.969660344538542e-06, + "loss": 0.832, + "step": 12437 + }, + { + "epoch": 0.32, + "learning_rate": 1.9696535799543086e-06, + "loss": 0.9736, + "step": 12438 + }, + { + "epoch": 0.32, + "learning_rate": 1.969646814627656e-06, + "loss": 0.5723, + "step": 12439 + }, + { + "epoch": 0.32, + "learning_rate": 1.9696400485585896e-06, + "loss": 0.8701, + "step": 12440 + }, + { + "epoch": 0.32, + "learning_rate": 1.9696332817471145e-06, + "loss": 0.9199, + "step": 12441 + }, + { + "epoch": 0.32, + "learning_rate": 1.9696265141932353e-06, + "loss": 0.7754, + "step": 12442 + }, + { + "epoch": 0.32, + "learning_rate": 1.969619745896958e-06, + "loss": 0.8477, + "step": 12443 + }, + { + "epoch": 0.32, + "learning_rate": 1.9696129768582877e-06, + "loss": 0.6147, + "step": 12444 + }, + { + "epoch": 0.32, + "learning_rate": 1.969606207077229e-06, + "loss": 0.9375, + "step": 12445 + }, + { + "epoch": 0.32, + "learning_rate": 1.9695994365537874e-06, + "loss": 1.0352, + "step": 12446 + }, + { + "epoch": 0.32, + "learning_rate": 1.969592665287968e-06, + "loss": 0.999, + "step": 12447 + }, + { + "epoch": 0.32, + "learning_rate": 1.9695858932797764e-06, + "loss": 0.7656, + "step": 12448 + }, + { + "epoch": 0.32, + "learning_rate": 1.9695791205292175e-06, + "loss": 0.833, + "step": 12449 + }, + { + "epoch": 0.32, + "learning_rate": 1.969572347036296e-06, + "loss": 0.8633, + "step": 12450 + }, + { + "epoch": 0.32, + "learning_rate": 1.9695655728010177e-06, + "loss": 0.8691, + "step": 12451 + }, + { + "epoch": 0.32, + "learning_rate": 1.9695587978233877e-06, + "loss": 0.916, + "step": 12452 + }, + { + "epoch": 0.32, + "learning_rate": 1.9695520221034113e-06, + "loss": 0.7827, + "step": 12453 + }, + { + "epoch": 0.32, + "learning_rate": 1.9695452456410935e-06, + "loss": 1.1787, + "step": 12454 + }, + { + "epoch": 0.32, + "learning_rate": 1.9695384684364394e-06, + "loss": 0.7998, + "step": 12455 + }, + { + "epoch": 0.32, + "learning_rate": 1.969531690489454e-06, + "loss": 0.6958, + "step": 12456 + }, + { + "epoch": 0.32, + "learning_rate": 1.969524911800143e-06, + "loss": 0.8418, + "step": 12457 + }, + { + "epoch": 0.32, + "learning_rate": 1.9695181323685115e-06, + "loss": 0.874, + "step": 12458 + }, + { + "epoch": 0.32, + "learning_rate": 1.9695113521945644e-06, + "loss": 0.9189, + "step": 12459 + }, + { + "epoch": 0.32, + "learning_rate": 1.9695045712783068e-06, + "loss": 0.9307, + "step": 12460 + }, + { + "epoch": 0.32, + "learning_rate": 1.9694977896197442e-06, + "loss": 0.9492, + "step": 12461 + }, + { + "epoch": 0.32, + "learning_rate": 1.969491007218882e-06, + "loss": 0.7266, + "step": 12462 + }, + { + "epoch": 0.32, + "learning_rate": 1.969484224075725e-06, + "loss": 0.7305, + "step": 12463 + }, + { + "epoch": 0.32, + "learning_rate": 1.969477440190278e-06, + "loss": 0.9404, + "step": 12464 + }, + { + "epoch": 0.32, + "learning_rate": 1.9694706555625475e-06, + "loss": 0.8691, + "step": 12465 + }, + { + "epoch": 0.32, + "learning_rate": 1.9694638701925378e-06, + "loss": 0.9248, + "step": 12466 + }, + { + "epoch": 0.32, + "learning_rate": 1.969457084080254e-06, + "loss": 0.6606, + "step": 12467 + }, + { + "epoch": 0.32, + "learning_rate": 1.9694502972257016e-06, + "loss": 0.9434, + "step": 12468 + }, + { + "epoch": 0.32, + "learning_rate": 1.9694435096288854e-06, + "loss": 0.9951, + "step": 12469 + }, + { + "epoch": 0.32, + "learning_rate": 1.969436721289811e-06, + "loss": 0.8018, + "step": 12470 + }, + { + "epoch": 0.32, + "learning_rate": 1.9694299322084835e-06, + "loss": 0.7998, + "step": 12471 + }, + { + "epoch": 0.32, + "learning_rate": 1.969423142384908e-06, + "loss": 0.7383, + "step": 12472 + }, + { + "epoch": 0.32, + "learning_rate": 1.9694163518190896e-06, + "loss": 0.877, + "step": 12473 + }, + { + "epoch": 0.32, + "learning_rate": 1.969409560511034e-06, + "loss": 0.9111, + "step": 12474 + }, + { + "epoch": 0.32, + "learning_rate": 1.969402768460746e-06, + "loss": 0.8984, + "step": 12475 + }, + { + "epoch": 0.32, + "learning_rate": 1.969395975668231e-06, + "loss": 1.1514, + "step": 12476 + }, + { + "epoch": 0.32, + "learning_rate": 1.9693891821334937e-06, + "loss": 0.9824, + "step": 12477 + }, + { + "epoch": 0.32, + "learning_rate": 1.96938238785654e-06, + "loss": 0.8516, + "step": 12478 + }, + { + "epoch": 0.32, + "learning_rate": 1.9693755928373748e-06, + "loss": 0.9585, + "step": 12479 + }, + { + "epoch": 0.32, + "learning_rate": 1.969368797076003e-06, + "loss": 0.877, + "step": 12480 + }, + { + "epoch": 0.32, + "learning_rate": 1.9693620005724303e-06, + "loss": 0.9268, + "step": 12481 + }, + { + "epoch": 0.32, + "learning_rate": 1.969355203326662e-06, + "loss": 0.8721, + "step": 12482 + }, + { + "epoch": 0.32, + "learning_rate": 1.9693484053387023e-06, + "loss": 0.8975, + "step": 12483 + }, + { + "epoch": 0.32, + "learning_rate": 1.9693416066085575e-06, + "loss": 0.7686, + "step": 12484 + }, + { + "epoch": 0.32, + "learning_rate": 1.9693348071362322e-06, + "loss": 0.8818, + "step": 12485 + }, + { + "epoch": 0.32, + "learning_rate": 1.969328006921732e-06, + "loss": 0.9531, + "step": 12486 + }, + { + "epoch": 0.32, + "learning_rate": 1.969321205965062e-06, + "loss": 0.9707, + "step": 12487 + }, + { + "epoch": 0.32, + "learning_rate": 1.969314404266227e-06, + "loss": 0.9316, + "step": 12488 + }, + { + "epoch": 0.32, + "learning_rate": 1.9693076018252327e-06, + "loss": 0.7881, + "step": 12489 + }, + { + "epoch": 0.32, + "learning_rate": 1.9693007986420845e-06, + "loss": 0.7231, + "step": 12490 + }, + { + "epoch": 0.32, + "learning_rate": 1.9692939947167868e-06, + "loss": 0.9434, + "step": 12491 + }, + { + "epoch": 0.32, + "learning_rate": 1.9692871900493454e-06, + "loss": 0.9766, + "step": 12492 + }, + { + "epoch": 0.32, + "learning_rate": 1.969280384639765e-06, + "loss": 1.1758, + "step": 12493 + }, + { + "epoch": 0.32, + "learning_rate": 1.969273578488052e-06, + "loss": 1.0762, + "step": 12494 + }, + { + "epoch": 0.32, + "learning_rate": 1.9692667715942103e-06, + "loss": 0.957, + "step": 12495 + }, + { + "epoch": 0.32, + "learning_rate": 1.9692599639582455e-06, + "loss": 1.002, + "step": 12496 + }, + { + "epoch": 0.32, + "learning_rate": 1.969253155580163e-06, + "loss": 0.54, + "step": 12497 + }, + { + "epoch": 0.32, + "learning_rate": 1.969246346459968e-06, + "loss": 1.1357, + "step": 12498 + }, + { + "epoch": 0.32, + "learning_rate": 1.9692395365976656e-06, + "loss": 0.8955, + "step": 12499 + }, + { + "epoch": 0.32, + "learning_rate": 1.9692327259932606e-06, + "loss": 0.6982, + "step": 12500 + }, + { + "epoch": 0.32, + "learning_rate": 1.9692259146467595e-06, + "loss": 1.0537, + "step": 12501 + }, + { + "epoch": 0.32, + "learning_rate": 1.969219102558166e-06, + "loss": 0.7075, + "step": 12502 + }, + { + "epoch": 0.32, + "learning_rate": 1.9692122897274867e-06, + "loss": 0.9756, + "step": 12503 + }, + { + "epoch": 0.32, + "learning_rate": 1.9692054761547255e-06, + "loss": 0.8789, + "step": 12504 + }, + { + "epoch": 0.32, + "learning_rate": 1.9691986618398885e-06, + "loss": 1.0537, + "step": 12505 + }, + { + "epoch": 0.32, + "learning_rate": 1.9691918467829807e-06, + "loss": 0.959, + "step": 12506 + }, + { + "epoch": 0.32, + "learning_rate": 1.9691850309840073e-06, + "loss": 0.8848, + "step": 12507 + }, + { + "epoch": 0.32, + "learning_rate": 1.9691782144429733e-06, + "loss": 0.8369, + "step": 12508 + }, + { + "epoch": 0.32, + "learning_rate": 1.969171397159884e-06, + "loss": 0.8867, + "step": 12509 + }, + { + "epoch": 0.32, + "learning_rate": 1.969164579134745e-06, + "loss": 0.8628, + "step": 12510 + }, + { + "epoch": 0.32, + "learning_rate": 1.969157760367561e-06, + "loss": 0.8965, + "step": 12511 + }, + { + "epoch": 0.32, + "learning_rate": 1.9691509408583375e-06, + "loss": 0.8218, + "step": 12512 + }, + { + "epoch": 0.32, + "learning_rate": 1.96914412060708e-06, + "loss": 0.873, + "step": 12513 + }, + { + "epoch": 0.32, + "learning_rate": 1.9691372996137933e-06, + "loss": 1.1299, + "step": 12514 + }, + { + "epoch": 0.32, + "learning_rate": 1.9691304778784823e-06, + "loss": 0.9141, + "step": 12515 + }, + { + "epoch": 0.32, + "learning_rate": 1.969123655401153e-06, + "loss": 0.9229, + "step": 12516 + }, + { + "epoch": 0.32, + "learning_rate": 1.96911683218181e-06, + "loss": 0.9648, + "step": 12517 + }, + { + "epoch": 0.32, + "learning_rate": 1.969110008220459e-06, + "loss": 0.7832, + "step": 12518 + }, + { + "epoch": 0.32, + "learning_rate": 1.9691031835171053e-06, + "loss": 0.9961, + "step": 12519 + }, + { + "epoch": 0.32, + "learning_rate": 1.9690963580717535e-06, + "loss": 0.876, + "step": 12520 + }, + { + "epoch": 0.32, + "learning_rate": 1.9690895318844097e-06, + "loss": 0.7627, + "step": 12521 + }, + { + "epoch": 0.32, + "learning_rate": 1.969082704955078e-06, + "loss": 0.959, + "step": 12522 + }, + { + "epoch": 0.32, + "learning_rate": 1.9690758772837645e-06, + "loss": 1.0078, + "step": 12523 + }, + { + "epoch": 0.32, + "learning_rate": 1.969069048870474e-06, + "loss": 0.8408, + "step": 12524 + }, + { + "epoch": 0.32, + "learning_rate": 1.969062219715212e-06, + "loss": 0.7822, + "step": 12525 + }, + { + "epoch": 0.32, + "learning_rate": 1.9690553898179837e-06, + "loss": 1.0078, + "step": 12526 + }, + { + "epoch": 0.32, + "learning_rate": 1.969048559178794e-06, + "loss": 0.9023, + "step": 12527 + }, + { + "epoch": 0.32, + "learning_rate": 1.9690417277976484e-06, + "loss": 0.8931, + "step": 12528 + }, + { + "epoch": 0.32, + "learning_rate": 1.9690348956745522e-06, + "loss": 1.0176, + "step": 12529 + }, + { + "epoch": 0.32, + "learning_rate": 1.9690280628095107e-06, + "loss": 0.9434, + "step": 12530 + }, + { + "epoch": 0.32, + "learning_rate": 1.969021229202529e-06, + "loss": 1.0244, + "step": 12531 + }, + { + "epoch": 0.32, + "learning_rate": 1.9690143948536123e-06, + "loss": 0.9219, + "step": 12532 + }, + { + "epoch": 0.32, + "learning_rate": 1.9690075597627656e-06, + "loss": 0.9629, + "step": 12533 + }, + { + "epoch": 0.32, + "learning_rate": 1.969000723929994e-06, + "loss": 1.0127, + "step": 12534 + }, + { + "epoch": 0.32, + "learning_rate": 1.968993887355304e-06, + "loss": 0.8774, + "step": 12535 + }, + { + "epoch": 0.32, + "learning_rate": 1.9689870500386996e-06, + "loss": 1.0195, + "step": 12536 + }, + { + "epoch": 0.32, + "learning_rate": 1.968980211980186e-06, + "loss": 1.1582, + "step": 12537 + }, + { + "epoch": 0.32, + "learning_rate": 1.968973373179769e-06, + "loss": 0.9883, + "step": 12538 + }, + { + "epoch": 0.32, + "learning_rate": 1.968966533637454e-06, + "loss": 1.0977, + "step": 12539 + }, + { + "epoch": 0.32, + "learning_rate": 1.9689596933532453e-06, + "loss": 0.9316, + "step": 12540 + }, + { + "epoch": 0.32, + "learning_rate": 1.968952852327149e-06, + "loss": 0.7031, + "step": 12541 + }, + { + "epoch": 0.32, + "learning_rate": 1.9689460105591702e-06, + "loss": 0.9326, + "step": 12542 + }, + { + "epoch": 0.32, + "learning_rate": 1.9689391680493135e-06, + "loss": 0.957, + "step": 12543 + }, + { + "epoch": 0.32, + "learning_rate": 1.968932324797585e-06, + "loss": 0.7988, + "step": 12544 + }, + { + "epoch": 0.32, + "learning_rate": 1.9689254808039897e-06, + "loss": 0.7725, + "step": 12545 + }, + { + "epoch": 0.32, + "learning_rate": 1.9689186360685328e-06, + "loss": 1.1494, + "step": 12546 + }, + { + "epoch": 0.32, + "learning_rate": 1.968911790591219e-06, + "loss": 0.9941, + "step": 12547 + }, + { + "epoch": 0.32, + "learning_rate": 1.9689049443720546e-06, + "loss": 1.0479, + "step": 12548 + }, + { + "epoch": 0.32, + "learning_rate": 1.9688980974110436e-06, + "loss": 1.1631, + "step": 12549 + }, + { + "epoch": 0.32, + "learning_rate": 1.968891249708192e-06, + "loss": 0.8818, + "step": 12550 + }, + { + "epoch": 0.32, + "learning_rate": 1.968884401263505e-06, + "loss": 0.7939, + "step": 12551 + }, + { + "epoch": 0.32, + "learning_rate": 1.968877552076988e-06, + "loss": 0.9482, + "step": 12552 + }, + { + "epoch": 0.32, + "learning_rate": 1.968870702148646e-06, + "loss": 0.8027, + "step": 12553 + }, + { + "epoch": 0.32, + "learning_rate": 1.968863851478484e-06, + "loss": 0.7832, + "step": 12554 + }, + { + "epoch": 0.32, + "learning_rate": 1.9688570000665075e-06, + "loss": 0.5684, + "step": 12555 + }, + { + "epoch": 0.32, + "learning_rate": 1.9688501479127216e-06, + "loss": 0.7842, + "step": 12556 + }, + { + "epoch": 0.32, + "learning_rate": 1.9688432950171322e-06, + "loss": 0.9268, + "step": 12557 + }, + { + "epoch": 0.32, + "learning_rate": 1.968836441379744e-06, + "loss": 0.9434, + "step": 12558 + }, + { + "epoch": 0.32, + "learning_rate": 1.968829587000562e-06, + "loss": 1.0117, + "step": 12559 + }, + { + "epoch": 0.32, + "learning_rate": 1.9688227318795913e-06, + "loss": 1.0908, + "step": 12560 + }, + { + "epoch": 0.32, + "learning_rate": 1.9688158760168383e-06, + "loss": 0.8066, + "step": 12561 + }, + { + "epoch": 0.32, + "learning_rate": 1.968809019412307e-06, + "loss": 0.999, + "step": 12562 + }, + { + "epoch": 0.32, + "learning_rate": 1.968802162066004e-06, + "loss": 0.8135, + "step": 12563 + }, + { + "epoch": 0.32, + "learning_rate": 1.9687953039779327e-06, + "loss": 0.7349, + "step": 12564 + }, + { + "epoch": 0.32, + "learning_rate": 1.9687884451481e-06, + "loss": 0.9678, + "step": 12565 + }, + { + "epoch": 0.32, + "learning_rate": 1.9687815855765102e-06, + "loss": 0.7949, + "step": 12566 + }, + { + "epoch": 0.32, + "learning_rate": 1.968774725263169e-06, + "loss": 1.0625, + "step": 12567 + }, + { + "epoch": 0.32, + "learning_rate": 1.968767864208082e-06, + "loss": 0.6665, + "step": 12568 + }, + { + "epoch": 0.32, + "learning_rate": 1.9687610024112534e-06, + "loss": 1.0068, + "step": 12569 + }, + { + "epoch": 0.32, + "learning_rate": 1.9687541398726894e-06, + "loss": 0.8262, + "step": 12570 + }, + { + "epoch": 0.32, + "learning_rate": 1.968747276592395e-06, + "loss": 0.8052, + "step": 12571 + }, + { + "epoch": 0.32, + "learning_rate": 1.968740412570375e-06, + "loss": 0.9004, + "step": 12572 + }, + { + "epoch": 0.32, + "learning_rate": 1.968733547806635e-06, + "loss": 0.7832, + "step": 12573 + }, + { + "epoch": 0.32, + "learning_rate": 1.9687266823011807e-06, + "loss": 0.9092, + "step": 12574 + }, + { + "epoch": 0.32, + "learning_rate": 1.9687198160540163e-06, + "loss": 0.7715, + "step": 12575 + }, + { + "epoch": 0.32, + "learning_rate": 1.968712949065148e-06, + "loss": 0.812, + "step": 12576 + }, + { + "epoch": 0.32, + "learning_rate": 1.968706081334581e-06, + "loss": 0.8721, + "step": 12577 + }, + { + "epoch": 0.32, + "learning_rate": 1.9686992128623198e-06, + "loss": 0.8862, + "step": 12578 + }, + { + "epoch": 0.32, + "learning_rate": 1.9686923436483704e-06, + "loss": 0.8408, + "step": 12579 + }, + { + "epoch": 0.32, + "learning_rate": 1.9686854736927374e-06, + "loss": 0.5581, + "step": 12580 + }, + { + "epoch": 0.32, + "learning_rate": 1.9686786029954276e-06, + "loss": 1.0166, + "step": 12581 + }, + { + "epoch": 0.32, + "learning_rate": 1.9686717315564443e-06, + "loss": 1.0713, + "step": 12582 + }, + { + "epoch": 0.32, + "learning_rate": 1.9686648593757934e-06, + "loss": 0.9253, + "step": 12583 + }, + { + "epoch": 0.32, + "learning_rate": 1.968657986453481e-06, + "loss": 1.0371, + "step": 12584 + }, + { + "epoch": 0.32, + "learning_rate": 1.968651112789511e-06, + "loss": 0.9707, + "step": 12585 + }, + { + "epoch": 0.32, + "learning_rate": 1.96864423838389e-06, + "loss": 0.8755, + "step": 12586 + }, + { + "epoch": 0.32, + "learning_rate": 1.9686373632366222e-06, + "loss": 0.834, + "step": 12587 + }, + { + "epoch": 0.32, + "learning_rate": 1.9686304873477136e-06, + "loss": 0.8242, + "step": 12588 + }, + { + "epoch": 0.32, + "learning_rate": 1.9686236107171692e-06, + "loss": 0.9697, + "step": 12589 + }, + { + "epoch": 0.32, + "learning_rate": 1.968616733344994e-06, + "loss": 1.0098, + "step": 12590 + }, + { + "epoch": 0.32, + "learning_rate": 1.9686098552311938e-06, + "loss": 0.958, + "step": 12591 + }, + { + "epoch": 0.32, + "learning_rate": 1.9686029763757733e-06, + "loss": 0.9531, + "step": 12592 + }, + { + "epoch": 0.32, + "learning_rate": 1.968596096778738e-06, + "loss": 1.0342, + "step": 12593 + }, + { + "epoch": 0.32, + "learning_rate": 1.9685892164400933e-06, + "loss": 0.8062, + "step": 12594 + }, + { + "epoch": 0.32, + "learning_rate": 1.9685823353598447e-06, + "loss": 0.8271, + "step": 12595 + }, + { + "epoch": 0.32, + "learning_rate": 1.9685754535379967e-06, + "loss": 0.8477, + "step": 12596 + }, + { + "epoch": 0.32, + "learning_rate": 1.9685685709745552e-06, + "loss": 0.9814, + "step": 12597 + }, + { + "epoch": 0.32, + "learning_rate": 1.9685616876695255e-06, + "loss": 0.7627, + "step": 12598 + }, + { + "epoch": 0.32, + "learning_rate": 1.9685548036229124e-06, + "loss": 1.0566, + "step": 12599 + }, + { + "epoch": 0.32, + "learning_rate": 1.968547918834721e-06, + "loss": 1.0088, + "step": 12600 + }, + { + "epoch": 0.32, + "learning_rate": 1.968541033304958e-06, + "loss": 0.8604, + "step": 12601 + }, + { + "epoch": 0.32, + "learning_rate": 1.968534147033627e-06, + "loss": 0.7959, + "step": 12602 + }, + { + "epoch": 0.32, + "learning_rate": 1.9685272600207338e-06, + "loss": 0.7656, + "step": 12603 + }, + { + "epoch": 0.32, + "learning_rate": 1.9685203722662844e-06, + "loss": 1.1494, + "step": 12604 + }, + { + "epoch": 0.32, + "learning_rate": 1.9685134837702826e-06, + "loss": 0.8848, + "step": 12605 + }, + { + "epoch": 0.32, + "learning_rate": 1.9685065945327353e-06, + "loss": 0.9863, + "step": 12606 + }, + { + "epoch": 0.32, + "learning_rate": 1.968499704553647e-06, + "loss": 0.8408, + "step": 12607 + }, + { + "epoch": 0.32, + "learning_rate": 1.9684928138330226e-06, + "loss": 1.0146, + "step": 12608 + }, + { + "epoch": 0.32, + "learning_rate": 1.968485922370868e-06, + "loss": 0.9756, + "step": 12609 + }, + { + "epoch": 0.32, + "learning_rate": 1.9684790301671885e-06, + "loss": 0.8984, + "step": 12610 + }, + { + "epoch": 0.32, + "learning_rate": 1.9684721372219886e-06, + "loss": 0.6523, + "step": 12611 + }, + { + "epoch": 0.32, + "learning_rate": 1.9684652435352745e-06, + "loss": 0.998, + "step": 12612 + }, + { + "epoch": 0.32, + "learning_rate": 1.9684583491070513e-06, + "loss": 0.8838, + "step": 12613 + }, + { + "epoch": 0.32, + "learning_rate": 1.9684514539373235e-06, + "loss": 0.8359, + "step": 12614 + }, + { + "epoch": 0.32, + "learning_rate": 1.9684445580260976e-06, + "loss": 0.6777, + "step": 12615 + }, + { + "epoch": 0.32, + "learning_rate": 1.968437661373378e-06, + "loss": 0.9395, + "step": 12616 + }, + { + "epoch": 0.32, + "learning_rate": 1.9684307639791696e-06, + "loss": 0.6689, + "step": 12617 + }, + { + "epoch": 0.32, + "learning_rate": 1.968423865843479e-06, + "loss": 0.8926, + "step": 12618 + }, + { + "epoch": 0.32, + "learning_rate": 1.9684169669663104e-06, + "loss": 0.9766, + "step": 12619 + }, + { + "epoch": 0.32, + "learning_rate": 1.9684100673476696e-06, + "loss": 1.2344, + "step": 12620 + }, + { + "epoch": 0.32, + "learning_rate": 1.968403166987562e-06, + "loss": 0.8882, + "step": 12621 + }, + { + "epoch": 0.32, + "learning_rate": 1.9683962658859926e-06, + "loss": 0.9653, + "step": 12622 + }, + { + "epoch": 0.32, + "learning_rate": 1.968389364042966e-06, + "loss": 0.9531, + "step": 12623 + }, + { + "epoch": 0.32, + "learning_rate": 1.968382461458489e-06, + "loss": 0.9756, + "step": 12624 + }, + { + "epoch": 0.32, + "learning_rate": 1.968375558132566e-06, + "loss": 0.9092, + "step": 12625 + }, + { + "epoch": 0.32, + "learning_rate": 1.9683686540652017e-06, + "loss": 0.9727, + "step": 12626 + }, + { + "epoch": 0.32, + "learning_rate": 1.9683617492564025e-06, + "loss": 0.9385, + "step": 12627 + }, + { + "epoch": 0.32, + "learning_rate": 1.9683548437061733e-06, + "loss": 0.8389, + "step": 12628 + }, + { + "epoch": 0.32, + "learning_rate": 1.9683479374145193e-06, + "loss": 0.7266, + "step": 12629 + }, + { + "epoch": 0.32, + "learning_rate": 1.968341030381446e-06, + "loss": 1.0566, + "step": 12630 + }, + { + "epoch": 0.32, + "learning_rate": 1.9683341226069577e-06, + "loss": 0.9473, + "step": 12631 + }, + { + "epoch": 0.32, + "learning_rate": 1.9683272140910612e-06, + "loss": 0.9189, + "step": 12632 + }, + { + "epoch": 0.32, + "learning_rate": 1.968320304833761e-06, + "loss": 1.0361, + "step": 12633 + }, + { + "epoch": 0.32, + "learning_rate": 1.968313394835062e-06, + "loss": 1.002, + "step": 12634 + }, + { + "epoch": 0.32, + "learning_rate": 1.9683064840949707e-06, + "loss": 0.9883, + "step": 12635 + }, + { + "epoch": 0.32, + "learning_rate": 1.968299572613491e-06, + "loss": 0.9053, + "step": 12636 + }, + { + "epoch": 0.32, + "learning_rate": 1.9682926603906295e-06, + "loss": 0.6416, + "step": 12637 + }, + { + "epoch": 0.32, + "learning_rate": 1.9682857474263904e-06, + "loss": 0.8838, + "step": 12638 + }, + { + "epoch": 0.32, + "learning_rate": 1.9682788337207793e-06, + "loss": 0.701, + "step": 12639 + }, + { + "epoch": 0.32, + "learning_rate": 1.968271919273802e-06, + "loss": 0.7666, + "step": 12640 + }, + { + "epoch": 0.32, + "learning_rate": 1.968265004085463e-06, + "loss": 0.7891, + "step": 12641 + }, + { + "epoch": 0.32, + "learning_rate": 1.9682580881557684e-06, + "loss": 1.0664, + "step": 12642 + }, + { + "epoch": 0.32, + "learning_rate": 1.968251171484723e-06, + "loss": 0.738, + "step": 12643 + }, + { + "epoch": 0.32, + "learning_rate": 1.968244254072332e-06, + "loss": 0.9629, + "step": 12644 + }, + { + "epoch": 0.32, + "learning_rate": 1.968237335918601e-06, + "loss": 0.8213, + "step": 12645 + }, + { + "epoch": 0.32, + "learning_rate": 1.9682304170235354e-06, + "loss": 0.7095, + "step": 12646 + }, + { + "epoch": 0.32, + "learning_rate": 1.96822349738714e-06, + "loss": 0.897, + "step": 12647 + }, + { + "epoch": 0.32, + "learning_rate": 1.9682165770094206e-06, + "loss": 0.8374, + "step": 12648 + }, + { + "epoch": 0.32, + "learning_rate": 1.968209655890382e-06, + "loss": 0.9756, + "step": 12649 + }, + { + "epoch": 0.32, + "learning_rate": 1.96820273403003e-06, + "loss": 0.8438, + "step": 12650 + }, + { + "epoch": 0.32, + "learning_rate": 1.9681958114283693e-06, + "loss": 0.9443, + "step": 12651 + }, + { + "epoch": 0.32, + "learning_rate": 1.9681888880854063e-06, + "loss": 0.9404, + "step": 12652 + }, + { + "epoch": 0.32, + "learning_rate": 1.968181964001145e-06, + "loss": 0.9873, + "step": 12653 + }, + { + "epoch": 0.32, + "learning_rate": 1.9681750391755915e-06, + "loss": 0.9688, + "step": 12654 + }, + { + "epoch": 0.32, + "learning_rate": 1.968168113608751e-06, + "loss": 0.918, + "step": 12655 + }, + { + "epoch": 0.32, + "learning_rate": 1.9681611873006285e-06, + "loss": 0.7568, + "step": 12656 + }, + { + "epoch": 0.32, + "learning_rate": 1.9681542602512297e-06, + "loss": 0.9062, + "step": 12657 + }, + { + "epoch": 0.32, + "learning_rate": 1.9681473324605594e-06, + "loss": 0.6234, + "step": 12658 + }, + { + "epoch": 0.32, + "learning_rate": 1.9681404039286234e-06, + "loss": 0.5459, + "step": 12659 + }, + { + "epoch": 0.32, + "learning_rate": 1.968133474655427e-06, + "loss": 0.9863, + "step": 12660 + }, + { + "epoch": 0.32, + "learning_rate": 1.9681265446409752e-06, + "loss": 0.7598, + "step": 12661 + }, + { + "epoch": 0.32, + "learning_rate": 1.9681196138852733e-06, + "loss": 0.8301, + "step": 12662 + }, + { + "epoch": 0.32, + "learning_rate": 1.968112682388327e-06, + "loss": 0.8945, + "step": 12663 + }, + { + "epoch": 0.32, + "learning_rate": 1.968105750150141e-06, + "loss": 0.9668, + "step": 12664 + }, + { + "epoch": 0.32, + "learning_rate": 1.968098817170721e-06, + "loss": 0.9443, + "step": 12665 + }, + { + "epoch": 0.32, + "learning_rate": 1.968091883450072e-06, + "loss": 0.9258, + "step": 12666 + }, + { + "epoch": 0.32, + "learning_rate": 1.9680849489882e-06, + "loss": 0.834, + "step": 12667 + }, + { + "epoch": 0.32, + "learning_rate": 1.9680780137851098e-06, + "loss": 0.8633, + "step": 12668 + }, + { + "epoch": 0.32, + "learning_rate": 1.9680710778408067e-06, + "loss": 0.7632, + "step": 12669 + }, + { + "epoch": 0.32, + "learning_rate": 1.968064141155296e-06, + "loss": 1.0479, + "step": 12670 + }, + { + "epoch": 0.32, + "learning_rate": 1.968057203728583e-06, + "loss": 0.8232, + "step": 12671 + }, + { + "epoch": 0.32, + "learning_rate": 1.9680502655606737e-06, + "loss": 1.0771, + "step": 12672 + }, + { + "epoch": 0.32, + "learning_rate": 1.968043326651572e-06, + "loss": 0.9336, + "step": 12673 + }, + { + "epoch": 0.32, + "learning_rate": 1.968036387001285e-06, + "loss": 0.9844, + "step": 12674 + }, + { + "epoch": 0.32, + "learning_rate": 1.9680294466098162e-06, + "loss": 0.9473, + "step": 12675 + }, + { + "epoch": 0.32, + "learning_rate": 1.968022505477172e-06, + "loss": 1.042, + "step": 12676 + }, + { + "epoch": 0.32, + "learning_rate": 1.9680155636033575e-06, + "loss": 0.793, + "step": 12677 + }, + { + "epoch": 0.32, + "learning_rate": 1.968008620988378e-06, + "loss": 0.9131, + "step": 12678 + }, + { + "epoch": 0.32, + "learning_rate": 1.968001677632239e-06, + "loss": 0.9756, + "step": 12679 + }, + { + "epoch": 0.32, + "learning_rate": 1.9679947335349457e-06, + "loss": 0.7002, + "step": 12680 + }, + { + "epoch": 0.33, + "learning_rate": 1.9679877886965027e-06, + "loss": 0.9463, + "step": 12681 + }, + { + "epoch": 0.33, + "learning_rate": 1.9679808431169165e-06, + "loss": 0.9766, + "step": 12682 + }, + { + "epoch": 0.33, + "learning_rate": 1.9679738967961917e-06, + "loss": 0.7119, + "step": 12683 + }, + { + "epoch": 0.33, + "learning_rate": 1.967966949734334e-06, + "loss": 0.9707, + "step": 12684 + }, + { + "epoch": 0.33, + "learning_rate": 1.9679600019313484e-06, + "loss": 1.001, + "step": 12685 + }, + { + "epoch": 0.33, + "learning_rate": 1.9679530533872405e-06, + "loss": 0.7539, + "step": 12686 + }, + { + "epoch": 0.33, + "learning_rate": 1.9679461041020147e-06, + "loss": 0.843, + "step": 12687 + }, + { + "epoch": 0.33, + "learning_rate": 1.967939154075678e-06, + "loss": 0.9912, + "step": 12688 + }, + { + "epoch": 0.33, + "learning_rate": 1.9679322033082343e-06, + "loss": 1.0352, + "step": 12689 + }, + { + "epoch": 0.33, + "learning_rate": 1.9679252517996898e-06, + "loss": 0.54, + "step": 12690 + }, + { + "epoch": 0.33, + "learning_rate": 1.967918299550049e-06, + "loss": 0.9111, + "step": 12691 + }, + { + "epoch": 0.33, + "learning_rate": 1.967911346559318e-06, + "loss": 0.8242, + "step": 12692 + }, + { + "epoch": 0.33, + "learning_rate": 1.9679043928275013e-06, + "loss": 0.7283, + "step": 12693 + }, + { + "epoch": 0.33, + "learning_rate": 1.9678974383546053e-06, + "loss": 0.9023, + "step": 12694 + }, + { + "epoch": 0.33, + "learning_rate": 1.9678904831406343e-06, + "loss": 0.8135, + "step": 12695 + }, + { + "epoch": 0.33, + "learning_rate": 1.967883527185594e-06, + "loss": 0.9141, + "step": 12696 + }, + { + "epoch": 0.33, + "learning_rate": 1.9678765704894903e-06, + "loss": 0.8838, + "step": 12697 + }, + { + "epoch": 0.33, + "learning_rate": 1.9678696130523276e-06, + "loss": 1.0391, + "step": 12698 + }, + { + "epoch": 0.33, + "learning_rate": 1.967862654874112e-06, + "loss": 0.9277, + "step": 12699 + }, + { + "epoch": 0.33, + "learning_rate": 1.967855695954848e-06, + "loss": 0.8525, + "step": 12700 + }, + { + "epoch": 0.33, + "learning_rate": 1.967848736294542e-06, + "loss": 0.8296, + "step": 12701 + }, + { + "epoch": 0.33, + "learning_rate": 1.9678417758931984e-06, + "loss": 0.9883, + "step": 12702 + }, + { + "epoch": 0.33, + "learning_rate": 1.9678348147508226e-06, + "loss": 0.8389, + "step": 12703 + }, + { + "epoch": 0.33, + "learning_rate": 1.9678278528674205e-06, + "loss": 1.0801, + "step": 12704 + }, + { + "epoch": 0.33, + "learning_rate": 1.967820890242997e-06, + "loss": 0.8691, + "step": 12705 + }, + { + "epoch": 0.33, + "learning_rate": 1.967813926877558e-06, + "loss": 0.8408, + "step": 12706 + }, + { + "epoch": 0.33, + "learning_rate": 1.9678069627711075e-06, + "loss": 0.7632, + "step": 12707 + }, + { + "epoch": 0.33, + "learning_rate": 1.9677999979236525e-06, + "loss": 1.0918, + "step": 12708 + }, + { + "epoch": 0.33, + "learning_rate": 1.967793032335197e-06, + "loss": 0.7209, + "step": 12709 + }, + { + "epoch": 0.33, + "learning_rate": 1.9677860660057472e-06, + "loss": 0.7104, + "step": 12710 + }, + { + "epoch": 0.33, + "learning_rate": 1.967779098935308e-06, + "loss": 0.8193, + "step": 12711 + }, + { + "epoch": 0.33, + "learning_rate": 1.9677721311238848e-06, + "loss": 0.7559, + "step": 12712 + }, + { + "epoch": 0.33, + "learning_rate": 1.967765162571483e-06, + "loss": 1.0947, + "step": 12713 + }, + { + "epoch": 0.33, + "learning_rate": 1.967758193278108e-06, + "loss": 0.9854, + "step": 12714 + }, + { + "epoch": 0.33, + "learning_rate": 1.967751223243765e-06, + "loss": 0.7354, + "step": 12715 + }, + { + "epoch": 0.33, + "learning_rate": 1.9677442524684594e-06, + "loss": 0.9033, + "step": 12716 + }, + { + "epoch": 0.33, + "learning_rate": 1.9677372809521963e-06, + "loss": 0.8906, + "step": 12717 + }, + { + "epoch": 0.33, + "learning_rate": 1.9677303086949813e-06, + "loss": 1.0664, + "step": 12718 + }, + { + "epoch": 0.33, + "learning_rate": 1.96772333569682e-06, + "loss": 0.9277, + "step": 12719 + }, + { + "epoch": 0.33, + "learning_rate": 1.9677163619577175e-06, + "loss": 1.1201, + "step": 12720 + }, + { + "epoch": 0.33, + "learning_rate": 1.967709387477679e-06, + "loss": 0.8486, + "step": 12721 + }, + { + "epoch": 0.33, + "learning_rate": 1.9677024122567095e-06, + "loss": 0.8818, + "step": 12722 + }, + { + "epoch": 0.33, + "learning_rate": 1.967695436294815e-06, + "loss": 0.9814, + "step": 12723 + }, + { + "epoch": 0.33, + "learning_rate": 1.9676884595920006e-06, + "loss": 1.1309, + "step": 12724 + }, + { + "epoch": 0.33, + "learning_rate": 1.9676814821482716e-06, + "loss": 0.9609, + "step": 12725 + }, + { + "epoch": 0.33, + "learning_rate": 1.9676745039636336e-06, + "loss": 0.8291, + "step": 12726 + }, + { + "epoch": 0.33, + "learning_rate": 1.9676675250380916e-06, + "loss": 0.73, + "step": 12727 + }, + { + "epoch": 0.33, + "learning_rate": 1.967660545371651e-06, + "loss": 0.9346, + "step": 12728 + }, + { + "epoch": 0.33, + "learning_rate": 1.9676535649643173e-06, + "loss": 0.8848, + "step": 12729 + }, + { + "epoch": 0.33, + "learning_rate": 1.967646583816096e-06, + "loss": 0.791, + "step": 12730 + }, + { + "epoch": 0.33, + "learning_rate": 1.967639601926992e-06, + "loss": 0.8018, + "step": 12731 + }, + { + "epoch": 0.33, + "learning_rate": 1.9676326192970107e-06, + "loss": 1.0693, + "step": 12732 + }, + { + "epoch": 0.33, + "learning_rate": 1.9676256359261576e-06, + "loss": 0.752, + "step": 12733 + }, + { + "epoch": 0.33, + "learning_rate": 1.9676186518144383e-06, + "loss": 0.8428, + "step": 12734 + }, + { + "epoch": 0.33, + "learning_rate": 1.9676116669618578e-06, + "loss": 0.8672, + "step": 12735 + }, + { + "epoch": 0.33, + "learning_rate": 1.967604681368421e-06, + "loss": 0.9873, + "step": 12736 + }, + { + "epoch": 0.33, + "learning_rate": 1.967597695034135e-06, + "loss": 0.8623, + "step": 12737 + }, + { + "epoch": 0.33, + "learning_rate": 1.967590707959003e-06, + "loss": 0.9121, + "step": 12738 + }, + { + "epoch": 0.33, + "learning_rate": 1.967583720143031e-06, + "loss": 0.9902, + "step": 12739 + }, + { + "epoch": 0.33, + "learning_rate": 1.9675767315862256e-06, + "loss": 0.7617, + "step": 12740 + }, + { + "epoch": 0.33, + "learning_rate": 1.9675697422885906e-06, + "loss": 0.793, + "step": 12741 + }, + { + "epoch": 0.33, + "learning_rate": 1.967562752250132e-06, + "loss": 0.7388, + "step": 12742 + }, + { + "epoch": 0.33, + "learning_rate": 1.967555761470855e-06, + "loss": 0.856, + "step": 12743 + }, + { + "epoch": 0.33, + "learning_rate": 1.9675487699507653e-06, + "loss": 0.9209, + "step": 12744 + }, + { + "epoch": 0.33, + "learning_rate": 1.9675417776898677e-06, + "loss": 0.9033, + "step": 12745 + }, + { + "epoch": 0.33, + "learning_rate": 1.9675347846881683e-06, + "loss": 0.8975, + "step": 12746 + }, + { + "epoch": 0.33, + "learning_rate": 1.9675277909456716e-06, + "loss": 0.7114, + "step": 12747 + }, + { + "epoch": 0.33, + "learning_rate": 1.9675207964623833e-06, + "loss": 0.9072, + "step": 12748 + }, + { + "epoch": 0.33, + "learning_rate": 1.967513801238309e-06, + "loss": 1.0088, + "step": 12749 + }, + { + "epoch": 0.33, + "learning_rate": 1.9675068052734542e-06, + "loss": 0.9795, + "step": 12750 + }, + { + "epoch": 0.33, + "learning_rate": 1.9674998085678233e-06, + "loss": 1.1504, + "step": 12751 + }, + { + "epoch": 0.33, + "learning_rate": 1.9674928111214227e-06, + "loss": 0.8975, + "step": 12752 + }, + { + "epoch": 0.33, + "learning_rate": 1.967485812934257e-06, + "loss": 0.9512, + "step": 12753 + }, + { + "epoch": 0.33, + "learning_rate": 1.9674788140063322e-06, + "loss": 0.6968, + "step": 12754 + }, + { + "epoch": 0.33, + "learning_rate": 1.9674718143376534e-06, + "loss": 0.959, + "step": 12755 + }, + { + "epoch": 0.33, + "learning_rate": 1.9674648139282257e-06, + "loss": 0.8369, + "step": 12756 + }, + { + "epoch": 0.33, + "learning_rate": 1.967457812778055e-06, + "loss": 1.0742, + "step": 12757 + }, + { + "epoch": 0.33, + "learning_rate": 1.9674508108871458e-06, + "loss": 0.8135, + "step": 12758 + }, + { + "epoch": 0.33, + "learning_rate": 1.9674438082555046e-06, + "loss": 1.0703, + "step": 12759 + }, + { + "epoch": 0.33, + "learning_rate": 1.9674368048831357e-06, + "loss": 0.6216, + "step": 12760 + }, + { + "epoch": 0.33, + "learning_rate": 1.967429800770045e-06, + "loss": 0.9609, + "step": 12761 + }, + { + "epoch": 0.33, + "learning_rate": 1.967422795916238e-06, + "loss": 0.9971, + "step": 12762 + }, + { + "epoch": 0.33, + "learning_rate": 1.9674157903217195e-06, + "loss": 0.8193, + "step": 12763 + }, + { + "epoch": 0.33, + "learning_rate": 1.967408783986496e-06, + "loss": 1.04, + "step": 12764 + }, + { + "epoch": 0.33, + "learning_rate": 1.967401776910571e-06, + "loss": 0.8496, + "step": 12765 + }, + { + "epoch": 0.33, + "learning_rate": 1.9673947690939516e-06, + "loss": 1.0645, + "step": 12766 + }, + { + "epoch": 0.33, + "learning_rate": 1.9673877605366425e-06, + "loss": 1.0176, + "step": 12767 + }, + { + "epoch": 0.33, + "learning_rate": 1.9673807512386487e-06, + "loss": 0.9502, + "step": 12768 + }, + { + "epoch": 0.33, + "learning_rate": 1.9673737411999764e-06, + "loss": 0.8877, + "step": 12769 + }, + { + "epoch": 0.33, + "learning_rate": 1.9673667304206304e-06, + "loss": 1.0459, + "step": 12770 + }, + { + "epoch": 0.33, + "learning_rate": 1.967359718900616e-06, + "loss": 0.793, + "step": 12771 + }, + { + "epoch": 0.33, + "learning_rate": 1.9673527066399387e-06, + "loss": 0.9883, + "step": 12772 + }, + { + "epoch": 0.33, + "learning_rate": 1.967345693638604e-06, + "loss": 0.8262, + "step": 12773 + }, + { + "epoch": 0.33, + "learning_rate": 1.967338679896617e-06, + "loss": 0.8447, + "step": 12774 + }, + { + "epoch": 0.33, + "learning_rate": 1.9673316654139837e-06, + "loss": 0.9443, + "step": 12775 + }, + { + "epoch": 0.33, + "learning_rate": 1.9673246501907087e-06, + "loss": 1.0459, + "step": 12776 + }, + { + "epoch": 0.33, + "learning_rate": 1.9673176342267977e-06, + "loss": 0.8633, + "step": 12777 + }, + { + "epoch": 0.33, + "learning_rate": 1.9673106175222564e-06, + "loss": 0.5034, + "step": 12778 + }, + { + "epoch": 0.33, + "learning_rate": 1.9673036000770895e-06, + "loss": 0.957, + "step": 12779 + }, + { + "epoch": 0.33, + "learning_rate": 1.9672965818913027e-06, + "loss": 0.6245, + "step": 12780 + }, + { + "epoch": 0.33, + "learning_rate": 1.9672895629649012e-06, + "loss": 0.8379, + "step": 12781 + }, + { + "epoch": 0.33, + "learning_rate": 1.967282543297891e-06, + "loss": 0.7422, + "step": 12782 + }, + { + "epoch": 0.33, + "learning_rate": 1.9672755228902767e-06, + "loss": 1.0723, + "step": 12783 + }, + { + "epoch": 0.33, + "learning_rate": 1.967268501742064e-06, + "loss": 0.707, + "step": 12784 + }, + { + "epoch": 0.33, + "learning_rate": 1.9672614798532586e-06, + "loss": 0.9062, + "step": 12785 + }, + { + "epoch": 0.33, + "learning_rate": 1.9672544572238654e-06, + "loss": 0.9043, + "step": 12786 + }, + { + "epoch": 0.33, + "learning_rate": 1.96724743385389e-06, + "loss": 1.1074, + "step": 12787 + }, + { + "epoch": 0.33, + "learning_rate": 1.967240409743338e-06, + "loss": 0.7471, + "step": 12788 + }, + { + "epoch": 0.33, + "learning_rate": 1.9672333848922136e-06, + "loss": 0.9355, + "step": 12789 + }, + { + "epoch": 0.33, + "learning_rate": 1.967226359300524e-06, + "loss": 0.8723, + "step": 12790 + }, + { + "epoch": 0.33, + "learning_rate": 1.9672193329682732e-06, + "loss": 0.9951, + "step": 12791 + }, + { + "epoch": 0.33, + "learning_rate": 1.967212305895467e-06, + "loss": 0.9678, + "step": 12792 + }, + { + "epoch": 0.33, + "learning_rate": 1.967205278082111e-06, + "loss": 0.9912, + "step": 12793 + }, + { + "epoch": 0.33, + "learning_rate": 1.96719824952821e-06, + "loss": 0.9307, + "step": 12794 + }, + { + "epoch": 0.33, + "learning_rate": 1.9671912202337704e-06, + "loss": 0.9385, + "step": 12795 + }, + { + "epoch": 0.33, + "learning_rate": 1.9671841901987965e-06, + "loss": 0.9893, + "step": 12796 + }, + { + "epoch": 0.33, + "learning_rate": 1.9671771594232944e-06, + "loss": 0.7598, + "step": 12797 + }, + { + "epoch": 0.33, + "learning_rate": 1.967170127907269e-06, + "loss": 0.8384, + "step": 12798 + }, + { + "epoch": 0.33, + "learning_rate": 1.9671630956507263e-06, + "loss": 0.7095, + "step": 12799 + }, + { + "epoch": 0.33, + "learning_rate": 1.9671560626536706e-06, + "loss": 0.9355, + "step": 12800 + }, + { + "epoch": 0.33, + "learning_rate": 1.9671490289161086e-06, + "loss": 0.9053, + "step": 12801 + }, + { + "epoch": 0.33, + "learning_rate": 1.967141994438045e-06, + "loss": 0.7764, + "step": 12802 + }, + { + "epoch": 0.33, + "learning_rate": 1.967134959219485e-06, + "loss": 0.7529, + "step": 12803 + }, + { + "epoch": 0.33, + "learning_rate": 1.967127923260434e-06, + "loss": 0.915, + "step": 12804 + }, + { + "epoch": 0.33, + "learning_rate": 1.967120886560898e-06, + "loss": 0.8457, + "step": 12805 + }, + { + "epoch": 0.33, + "learning_rate": 1.967113849120882e-06, + "loss": 0.8975, + "step": 12806 + }, + { + "epoch": 0.33, + "learning_rate": 1.9671068109403913e-06, + "loss": 0.9131, + "step": 12807 + }, + { + "epoch": 0.33, + "learning_rate": 1.9670997720194316e-06, + "loss": 1.1436, + "step": 12808 + }, + { + "epoch": 0.33, + "learning_rate": 1.967092732358008e-06, + "loss": 0.8203, + "step": 12809 + }, + { + "epoch": 0.33, + "learning_rate": 1.9670856919561258e-06, + "loss": 0.877, + "step": 12810 + }, + { + "epoch": 0.33, + "learning_rate": 1.9670786508137903e-06, + "loss": 1.3301, + "step": 12811 + }, + { + "epoch": 0.33, + "learning_rate": 1.9670716089310075e-06, + "loss": 0.8086, + "step": 12812 + }, + { + "epoch": 0.33, + "learning_rate": 1.9670645663077823e-06, + "loss": 0.8359, + "step": 12813 + }, + { + "epoch": 0.33, + "learning_rate": 1.9670575229441203e-06, + "loss": 1.0811, + "step": 12814 + }, + { + "epoch": 0.33, + "learning_rate": 1.967050478840027e-06, + "loss": 0.793, + "step": 12815 + }, + { + "epoch": 0.33, + "learning_rate": 1.9670434339955075e-06, + "loss": 0.8047, + "step": 12816 + }, + { + "epoch": 0.33, + "learning_rate": 1.967036388410567e-06, + "loss": 0.707, + "step": 12817 + }, + { + "epoch": 0.33, + "learning_rate": 1.9670293420852114e-06, + "loss": 0.7739, + "step": 12818 + }, + { + "epoch": 0.33, + "learning_rate": 1.9670222950194462e-06, + "loss": 0.9961, + "step": 12819 + }, + { + "epoch": 0.33, + "learning_rate": 1.967015247213276e-06, + "loss": 0.8423, + "step": 12820 + }, + { + "epoch": 0.33, + "learning_rate": 1.967008198666707e-06, + "loss": 0.8223, + "step": 12821 + }, + { + "epoch": 0.33, + "learning_rate": 1.967001149379744e-06, + "loss": 0.7871, + "step": 12822 + }, + { + "epoch": 0.33, + "learning_rate": 1.966994099352393e-06, + "loss": 0.999, + "step": 12823 + }, + { + "epoch": 0.33, + "learning_rate": 1.9669870485846594e-06, + "loss": 1.0713, + "step": 12824 + }, + { + "epoch": 0.33, + "learning_rate": 1.9669799970765478e-06, + "loss": 1.04, + "step": 12825 + }, + { + "epoch": 0.33, + "learning_rate": 1.9669729448280637e-06, + "loss": 1.1016, + "step": 12826 + }, + { + "epoch": 0.33, + "learning_rate": 1.9669658918392136e-06, + "loss": 0.8818, + "step": 12827 + }, + { + "epoch": 0.33, + "learning_rate": 1.966958838110002e-06, + "loss": 0.8125, + "step": 12828 + }, + { + "epoch": 0.33, + "learning_rate": 1.9669517836404345e-06, + "loss": 0.917, + "step": 12829 + }, + { + "epoch": 0.33, + "learning_rate": 1.966944728430516e-06, + "loss": 0.9189, + "step": 12830 + }, + { + "epoch": 0.33, + "learning_rate": 1.966937672480253e-06, + "loss": 1.0303, + "step": 12831 + }, + { + "epoch": 0.33, + "learning_rate": 1.96693061578965e-06, + "loss": 0.8643, + "step": 12832 + }, + { + "epoch": 0.33, + "learning_rate": 1.966923558358713e-06, + "loss": 0.8125, + "step": 12833 + }, + { + "epoch": 0.33, + "learning_rate": 1.966916500187446e-06, + "loss": 0.8018, + "step": 12834 + }, + { + "epoch": 0.33, + "learning_rate": 1.966909441275857e-06, + "loss": 1.002, + "step": 12835 + }, + { + "epoch": 0.33, + "learning_rate": 1.966902381623949e-06, + "loss": 0.8311, + "step": 12836 + }, + { + "epoch": 0.33, + "learning_rate": 1.9668953212317283e-06, + "loss": 0.8701, + "step": 12837 + }, + { + "epoch": 0.33, + "learning_rate": 1.9668882600992006e-06, + "loss": 0.5903, + "step": 12838 + }, + { + "epoch": 0.33, + "learning_rate": 1.966881198226371e-06, + "loss": 0.8105, + "step": 12839 + }, + { + "epoch": 0.33, + "learning_rate": 1.966874135613245e-06, + "loss": 0.8945, + "step": 12840 + }, + { + "epoch": 0.33, + "learning_rate": 1.966867072259828e-06, + "loss": 1.0098, + "step": 12841 + }, + { + "epoch": 0.33, + "learning_rate": 1.9668600081661247e-06, + "loss": 0.8525, + "step": 12842 + }, + { + "epoch": 0.33, + "learning_rate": 1.9668529433321418e-06, + "loss": 0.5835, + "step": 12843 + }, + { + "epoch": 0.33, + "learning_rate": 1.966845877757884e-06, + "loss": 0.8223, + "step": 12844 + }, + { + "epoch": 0.33, + "learning_rate": 1.9668388114433563e-06, + "loss": 1.0352, + "step": 12845 + }, + { + "epoch": 0.33, + "learning_rate": 1.966831744388565e-06, + "loss": 0.957, + "step": 12846 + }, + { + "epoch": 0.33, + "learning_rate": 1.966824676593515e-06, + "loss": 0.7607, + "step": 12847 + }, + { + "epoch": 0.33, + "learning_rate": 1.966817608058212e-06, + "loss": 0.7148, + "step": 12848 + }, + { + "epoch": 0.33, + "learning_rate": 1.966810538782661e-06, + "loss": 1.0225, + "step": 12849 + }, + { + "epoch": 0.33, + "learning_rate": 1.9668034687668675e-06, + "loss": 0.8545, + "step": 12850 + }, + { + "epoch": 0.33, + "learning_rate": 1.966796398010837e-06, + "loss": 0.7783, + "step": 12851 + }, + { + "epoch": 0.33, + "learning_rate": 1.966789326514575e-06, + "loss": 0.8398, + "step": 12852 + }, + { + "epoch": 0.33, + "learning_rate": 1.966782254278087e-06, + "loss": 0.9385, + "step": 12853 + }, + { + "epoch": 0.33, + "learning_rate": 1.9667751813013786e-06, + "loss": 0.9463, + "step": 12854 + }, + { + "epoch": 0.33, + "learning_rate": 1.9667681075844544e-06, + "loss": 0.9697, + "step": 12855 + }, + { + "epoch": 0.33, + "learning_rate": 1.9667610331273204e-06, + "loss": 1.0107, + "step": 12856 + }, + { + "epoch": 0.33, + "learning_rate": 1.966753957929982e-06, + "loss": 0.9731, + "step": 12857 + }, + { + "epoch": 0.33, + "learning_rate": 1.9667468819924446e-06, + "loss": 1.0713, + "step": 12858 + }, + { + "epoch": 0.33, + "learning_rate": 1.9667398053147134e-06, + "loss": 1.0869, + "step": 12859 + }, + { + "epoch": 0.33, + "learning_rate": 1.9667327278967944e-06, + "loss": 0.7471, + "step": 12860 + }, + { + "epoch": 0.33, + "learning_rate": 1.9667256497386923e-06, + "loss": 1.0771, + "step": 12861 + }, + { + "epoch": 0.33, + "learning_rate": 1.9667185708404125e-06, + "loss": 1.0205, + "step": 12862 + }, + { + "epoch": 0.33, + "learning_rate": 1.9667114912019615e-06, + "loss": 0.6924, + "step": 12863 + }, + { + "epoch": 0.33, + "learning_rate": 1.9667044108233434e-06, + "loss": 0.8003, + "step": 12864 + }, + { + "epoch": 0.33, + "learning_rate": 1.9666973297045642e-06, + "loss": 0.7876, + "step": 12865 + }, + { + "epoch": 0.33, + "learning_rate": 1.9666902478456295e-06, + "loss": 0.8184, + "step": 12866 + }, + { + "epoch": 0.33, + "learning_rate": 1.966683165246544e-06, + "loss": 0.9814, + "step": 12867 + }, + { + "epoch": 0.33, + "learning_rate": 1.9666760819073143e-06, + "loss": 0.6562, + "step": 12868 + }, + { + "epoch": 0.33, + "learning_rate": 1.966668997827945e-06, + "loss": 0.9053, + "step": 12869 + }, + { + "epoch": 0.33, + "learning_rate": 1.9666619130084415e-06, + "loss": 0.8408, + "step": 12870 + }, + { + "epoch": 0.33, + "learning_rate": 1.9666548274488096e-06, + "loss": 0.7461, + "step": 12871 + }, + { + "epoch": 0.33, + "learning_rate": 1.9666477411490547e-06, + "loss": 0.8574, + "step": 12872 + }, + { + "epoch": 0.33, + "learning_rate": 1.966640654109182e-06, + "loss": 1.1758, + "step": 12873 + }, + { + "epoch": 0.33, + "learning_rate": 1.9666335663291968e-06, + "loss": 0.8301, + "step": 12874 + }, + { + "epoch": 0.33, + "learning_rate": 1.9666264778091047e-06, + "loss": 1.0322, + "step": 12875 + }, + { + "epoch": 0.33, + "learning_rate": 1.966619388548911e-06, + "loss": 1.0625, + "step": 12876 + }, + { + "epoch": 0.33, + "learning_rate": 1.966612298548622e-06, + "loss": 0.832, + "step": 12877 + }, + { + "epoch": 0.33, + "learning_rate": 1.966605207808242e-06, + "loss": 1.0439, + "step": 12878 + }, + { + "epoch": 0.33, + "learning_rate": 1.9665981163277766e-06, + "loss": 0.9268, + "step": 12879 + }, + { + "epoch": 0.33, + "learning_rate": 1.966591024107232e-06, + "loss": 1.0264, + "step": 12880 + }, + { + "epoch": 0.33, + "learning_rate": 1.9665839311466127e-06, + "loss": 0.8525, + "step": 12881 + }, + { + "epoch": 0.33, + "learning_rate": 1.9665768374459244e-06, + "loss": 1.1865, + "step": 12882 + }, + { + "epoch": 0.33, + "learning_rate": 1.966569743005173e-06, + "loss": 0.9951, + "step": 12883 + }, + { + "epoch": 0.33, + "learning_rate": 1.9665626478243635e-06, + "loss": 0.835, + "step": 12884 + }, + { + "epoch": 0.33, + "learning_rate": 1.966555551903501e-06, + "loss": 1.0723, + "step": 12885 + }, + { + "epoch": 0.33, + "learning_rate": 1.9665484552425918e-06, + "loss": 0.8179, + "step": 12886 + }, + { + "epoch": 0.33, + "learning_rate": 1.966541357841641e-06, + "loss": 0.8965, + "step": 12887 + }, + { + "epoch": 0.33, + "learning_rate": 1.9665342597006534e-06, + "loss": 1.1055, + "step": 12888 + }, + { + "epoch": 0.33, + "learning_rate": 1.9665271608196357e-06, + "loss": 0.7405, + "step": 12889 + }, + { + "epoch": 0.33, + "learning_rate": 1.9665200611985923e-06, + "loss": 0.8311, + "step": 12890 + }, + { + "epoch": 0.33, + "learning_rate": 1.9665129608375285e-06, + "loss": 1.0264, + "step": 12891 + }, + { + "epoch": 0.33, + "learning_rate": 1.9665058597364506e-06, + "loss": 0.9238, + "step": 12892 + }, + { + "epoch": 0.33, + "learning_rate": 1.9664987578953636e-06, + "loss": 0.9082, + "step": 12893 + }, + { + "epoch": 0.33, + "learning_rate": 1.9664916553142726e-06, + "loss": 0.8325, + "step": 12894 + }, + { + "epoch": 0.33, + "learning_rate": 1.966484551993184e-06, + "loss": 0.8828, + "step": 12895 + }, + { + "epoch": 0.33, + "learning_rate": 1.966477447932102e-06, + "loss": 0.647, + "step": 12896 + }, + { + "epoch": 0.33, + "learning_rate": 1.966470343131033e-06, + "loss": 0.8301, + "step": 12897 + }, + { + "epoch": 0.33, + "learning_rate": 1.966463237589982e-06, + "loss": 0.916, + "step": 12898 + }, + { + "epoch": 0.33, + "learning_rate": 1.9664561313089544e-06, + "loss": 0.9121, + "step": 12899 + }, + { + "epoch": 0.33, + "learning_rate": 1.966449024287956e-06, + "loss": 0.7578, + "step": 12900 + }, + { + "epoch": 0.33, + "learning_rate": 1.966441916526992e-06, + "loss": 0.8887, + "step": 12901 + }, + { + "epoch": 0.33, + "learning_rate": 1.966434808026068e-06, + "loss": 0.7749, + "step": 12902 + }, + { + "epoch": 0.33, + "learning_rate": 1.9664276987851888e-06, + "loss": 1.1934, + "step": 12903 + }, + { + "epoch": 0.33, + "learning_rate": 1.9664205888043608e-06, + "loss": 0.9082, + "step": 12904 + }, + { + "epoch": 0.33, + "learning_rate": 1.966413478083589e-06, + "loss": 0.9678, + "step": 12905 + }, + { + "epoch": 0.33, + "learning_rate": 1.9664063666228783e-06, + "loss": 1.1504, + "step": 12906 + }, + { + "epoch": 0.33, + "learning_rate": 1.9663992544222353e-06, + "loss": 0.96, + "step": 12907 + }, + { + "epoch": 0.33, + "learning_rate": 1.9663921414816645e-06, + "loss": 0.8594, + "step": 12908 + }, + { + "epoch": 0.33, + "learning_rate": 1.966385027801172e-06, + "loss": 0.7559, + "step": 12909 + }, + { + "epoch": 0.33, + "learning_rate": 1.9663779133807627e-06, + "loss": 1.1572, + "step": 12910 + }, + { + "epoch": 0.33, + "learning_rate": 1.966370798220442e-06, + "loss": 0.7202, + "step": 12911 + }, + { + "epoch": 0.33, + "learning_rate": 1.966363682320216e-06, + "loss": 0.6108, + "step": 12912 + }, + { + "epoch": 0.33, + "learning_rate": 1.9663565656800898e-06, + "loss": 1.04, + "step": 12913 + }, + { + "epoch": 0.33, + "learning_rate": 1.966349448300068e-06, + "loss": 0.9951, + "step": 12914 + }, + { + "epoch": 0.33, + "learning_rate": 1.9663423301801577e-06, + "loss": 0.8232, + "step": 12915 + }, + { + "epoch": 0.33, + "learning_rate": 1.966335211320363e-06, + "loss": 0.8848, + "step": 12916 + }, + { + "epoch": 0.33, + "learning_rate": 1.9663280917206904e-06, + "loss": 0.8682, + "step": 12917 + }, + { + "epoch": 0.33, + "learning_rate": 1.966320971381145e-06, + "loss": 1.0537, + "step": 12918 + }, + { + "epoch": 0.33, + "learning_rate": 1.9663138503017315e-06, + "loss": 0.8237, + "step": 12919 + }, + { + "epoch": 0.33, + "learning_rate": 1.966306728482456e-06, + "loss": 1.041, + "step": 12920 + }, + { + "epoch": 0.33, + "learning_rate": 1.966299605923324e-06, + "loss": 1.1426, + "step": 12921 + }, + { + "epoch": 0.33, + "learning_rate": 1.9662924826243405e-06, + "loss": 1.0205, + "step": 12922 + }, + { + "epoch": 0.33, + "learning_rate": 1.9662853585855117e-06, + "loss": 0.9863, + "step": 12923 + }, + { + "epoch": 0.33, + "learning_rate": 1.9662782338068428e-06, + "loss": 0.917, + "step": 12924 + }, + { + "epoch": 0.33, + "learning_rate": 1.9662711082883384e-06, + "loss": 0.8701, + "step": 12925 + }, + { + "epoch": 0.33, + "learning_rate": 1.966263982030005e-06, + "loss": 0.9053, + "step": 12926 + }, + { + "epoch": 0.33, + "learning_rate": 1.966256855031848e-06, + "loss": 1.0615, + "step": 12927 + }, + { + "epoch": 0.33, + "learning_rate": 1.966249727293872e-06, + "loss": 0.9619, + "step": 12928 + }, + { + "epoch": 0.33, + "learning_rate": 1.9662425988160833e-06, + "loss": 0.9121, + "step": 12929 + }, + { + "epoch": 0.33, + "learning_rate": 1.966235469598487e-06, + "loss": 0.9697, + "step": 12930 + }, + { + "epoch": 0.33, + "learning_rate": 1.9662283396410886e-06, + "loss": 1.0293, + "step": 12931 + }, + { + "epoch": 0.33, + "learning_rate": 1.9662212089438935e-06, + "loss": 1.0264, + "step": 12932 + }, + { + "epoch": 0.33, + "learning_rate": 1.9662140775069078e-06, + "loss": 0.7783, + "step": 12933 + }, + { + "epoch": 0.33, + "learning_rate": 1.966206945330136e-06, + "loss": 1.0352, + "step": 12934 + }, + { + "epoch": 0.33, + "learning_rate": 1.966199812413584e-06, + "loss": 1.124, + "step": 12935 + }, + { + "epoch": 0.33, + "learning_rate": 1.966192678757257e-06, + "loss": 0.9346, + "step": 12936 + }, + { + "epoch": 0.33, + "learning_rate": 1.966185544361161e-06, + "loss": 0.7754, + "step": 12937 + }, + { + "epoch": 0.33, + "learning_rate": 1.9661784092253013e-06, + "loss": 1.043, + "step": 12938 + }, + { + "epoch": 0.33, + "learning_rate": 1.9661712733496825e-06, + "loss": 0.8301, + "step": 12939 + }, + { + "epoch": 0.33, + "learning_rate": 1.9661641367343113e-06, + "loss": 0.7925, + "step": 12940 + }, + { + "epoch": 0.33, + "learning_rate": 1.966156999379193e-06, + "loss": 0.7356, + "step": 12941 + }, + { + "epoch": 0.33, + "learning_rate": 1.966149861284332e-06, + "loss": 0.7852, + "step": 12942 + }, + { + "epoch": 0.33, + "learning_rate": 1.966142722449735e-06, + "loss": 0.9121, + "step": 12943 + }, + { + "epoch": 0.33, + "learning_rate": 1.9661355828754067e-06, + "loss": 0.7573, + "step": 12944 + }, + { + "epoch": 0.33, + "learning_rate": 1.9661284425613526e-06, + "loss": 0.8311, + "step": 12945 + }, + { + "epoch": 0.33, + "learning_rate": 1.9661213015075788e-06, + "loss": 0.9922, + "step": 12946 + }, + { + "epoch": 0.33, + "learning_rate": 1.96611415971409e-06, + "loss": 0.7751, + "step": 12947 + }, + { + "epoch": 0.33, + "learning_rate": 1.9661070171808924e-06, + "loss": 1.0518, + "step": 12948 + }, + { + "epoch": 0.33, + "learning_rate": 1.966099873907991e-06, + "loss": 0.9463, + "step": 12949 + }, + { + "epoch": 0.33, + "learning_rate": 1.966092729895391e-06, + "loss": 0.7915, + "step": 12950 + }, + { + "epoch": 0.33, + "learning_rate": 1.9660855851430984e-06, + "loss": 0.8682, + "step": 12951 + }, + { + "epoch": 0.33, + "learning_rate": 1.9660784396511184e-06, + "loss": 0.9336, + "step": 12952 + }, + { + "epoch": 0.33, + "learning_rate": 1.966071293419457e-06, + "loss": 0.7729, + "step": 12953 + }, + { + "epoch": 0.33, + "learning_rate": 1.966064146448119e-06, + "loss": 0.7227, + "step": 12954 + }, + { + "epoch": 0.33, + "learning_rate": 1.96605699873711e-06, + "loss": 0.8708, + "step": 12955 + }, + { + "epoch": 0.33, + "learning_rate": 1.9660498502864353e-06, + "loss": 0.7578, + "step": 12956 + }, + { + "epoch": 0.33, + "learning_rate": 1.966042701096101e-06, + "loss": 0.7446, + "step": 12957 + }, + { + "epoch": 0.33, + "learning_rate": 1.966035551166112e-06, + "loss": 0.8623, + "step": 12958 + }, + { + "epoch": 0.33, + "learning_rate": 1.9660284004964744e-06, + "loss": 0.7659, + "step": 12959 + }, + { + "epoch": 0.33, + "learning_rate": 1.966021249087193e-06, + "loss": 0.8262, + "step": 12960 + }, + { + "epoch": 0.33, + "learning_rate": 1.9660140969382734e-06, + "loss": 0.9971, + "step": 12961 + }, + { + "epoch": 0.33, + "learning_rate": 1.9660069440497214e-06, + "loss": 0.918, + "step": 12962 + }, + { + "epoch": 0.33, + "learning_rate": 1.9659997904215422e-06, + "loss": 0.9258, + "step": 12963 + }, + { + "epoch": 0.33, + "learning_rate": 1.9659926360537416e-06, + "loss": 0.8184, + "step": 12964 + }, + { + "epoch": 0.33, + "learning_rate": 1.965985480946325e-06, + "loss": 0.9893, + "step": 12965 + }, + { + "epoch": 0.33, + "learning_rate": 1.965978325099297e-06, + "loss": 0.9336, + "step": 12966 + }, + { + "epoch": 0.33, + "learning_rate": 1.9659711685126645e-06, + "loss": 0.6787, + "step": 12967 + }, + { + "epoch": 0.33, + "learning_rate": 1.9659640111864323e-06, + "loss": 0.8838, + "step": 12968 + }, + { + "epoch": 0.33, + "learning_rate": 1.9659568531206056e-06, + "loss": 0.6665, + "step": 12969 + }, + { + "epoch": 0.33, + "learning_rate": 1.96594969431519e-06, + "loss": 0.9883, + "step": 12970 + }, + { + "epoch": 0.33, + "learning_rate": 1.9659425347701914e-06, + "loss": 0.8467, + "step": 12971 + }, + { + "epoch": 0.33, + "learning_rate": 1.965935374485615e-06, + "loss": 0.7236, + "step": 12972 + }, + { + "epoch": 0.33, + "learning_rate": 1.965928213461466e-06, + "loss": 0.7256, + "step": 12973 + }, + { + "epoch": 0.33, + "learning_rate": 1.9659210516977505e-06, + "loss": 1.04, + "step": 12974 + }, + { + "epoch": 0.33, + "learning_rate": 1.9659138891944737e-06, + "loss": 0.8652, + "step": 12975 + }, + { + "epoch": 0.33, + "learning_rate": 1.965906725951641e-06, + "loss": 1.0684, + "step": 12976 + }, + { + "epoch": 0.33, + "learning_rate": 1.9658995619692578e-06, + "loss": 0.9551, + "step": 12977 + }, + { + "epoch": 0.33, + "learning_rate": 1.9658923972473298e-06, + "loss": 0.8408, + "step": 12978 + }, + { + "epoch": 0.33, + "learning_rate": 1.9658852317858623e-06, + "loss": 1.1289, + "step": 12979 + }, + { + "epoch": 0.33, + "learning_rate": 1.965878065584861e-06, + "loss": 0.9893, + "step": 12980 + }, + { + "epoch": 0.33, + "learning_rate": 1.9658708986443314e-06, + "loss": 0.7905, + "step": 12981 + }, + { + "epoch": 0.33, + "learning_rate": 1.965863730964279e-06, + "loss": 0.7632, + "step": 12982 + }, + { + "epoch": 0.33, + "learning_rate": 1.9658565625447085e-06, + "loss": 0.8486, + "step": 12983 + }, + { + "epoch": 0.33, + "learning_rate": 1.965849393385627e-06, + "loss": 0.8252, + "step": 12984 + }, + { + "epoch": 0.33, + "learning_rate": 1.965842223487038e-06, + "loss": 0.8652, + "step": 12985 + }, + { + "epoch": 0.33, + "learning_rate": 1.9658350528489485e-06, + "loss": 1.0693, + "step": 12986 + }, + { + "epoch": 0.33, + "learning_rate": 1.9658278814713638e-06, + "loss": 0.9121, + "step": 12987 + }, + { + "epoch": 0.33, + "learning_rate": 1.9658207093542884e-06, + "loss": 0.7603, + "step": 12988 + }, + { + "epoch": 0.33, + "learning_rate": 1.965813536497729e-06, + "loss": 0.7332, + "step": 12989 + }, + { + "epoch": 0.33, + "learning_rate": 1.9658063629016906e-06, + "loss": 1.0576, + "step": 12990 + }, + { + "epoch": 0.33, + "learning_rate": 1.9657991885661783e-06, + "loss": 0.9688, + "step": 12991 + }, + { + "epoch": 0.33, + "learning_rate": 1.9657920134911982e-06, + "loss": 0.8018, + "step": 12992 + }, + { + "epoch": 0.33, + "learning_rate": 1.9657848376767554e-06, + "loss": 0.7502, + "step": 12993 + }, + { + "epoch": 0.33, + "learning_rate": 1.965777661122856e-06, + "loss": 0.8164, + "step": 12994 + }, + { + "epoch": 0.33, + "learning_rate": 1.965770483829505e-06, + "loss": 0.6963, + "step": 12995 + }, + { + "epoch": 0.33, + "learning_rate": 1.965763305796708e-06, + "loss": 1.04, + "step": 12996 + }, + { + "epoch": 0.33, + "learning_rate": 1.9657561270244696e-06, + "loss": 0.9541, + "step": 12997 + }, + { + "epoch": 0.33, + "learning_rate": 1.965748947512797e-06, + "loss": 0.9102, + "step": 12998 + }, + { + "epoch": 0.33, + "learning_rate": 1.9657417672616943e-06, + "loss": 0.9326, + "step": 12999 + }, + { + "epoch": 0.33, + "learning_rate": 1.9657345862711683e-06, + "loss": 0.5737, + "step": 13000 + }, + { + "epoch": 0.33, + "learning_rate": 1.9657274045412227e-06, + "loss": 0.689, + "step": 13001 + }, + { + "epoch": 0.33, + "learning_rate": 1.9657202220718648e-06, + "loss": 0.6602, + "step": 13002 + }, + { + "epoch": 0.33, + "learning_rate": 1.9657130388630988e-06, + "loss": 1.0063, + "step": 13003 + }, + { + "epoch": 0.33, + "learning_rate": 1.965705854914931e-06, + "loss": 0.8545, + "step": 13004 + }, + { + "epoch": 0.33, + "learning_rate": 1.965698670227367e-06, + "loss": 0.8013, + "step": 13005 + }, + { + "epoch": 0.33, + "learning_rate": 1.9656914848004115e-06, + "loss": 1.0518, + "step": 13006 + }, + { + "epoch": 0.33, + "learning_rate": 1.9656842986340707e-06, + "loss": 0.7798, + "step": 13007 + }, + { + "epoch": 0.33, + "learning_rate": 1.9656771117283494e-06, + "loss": 0.8291, + "step": 13008 + }, + { + "epoch": 0.33, + "learning_rate": 1.965669924083254e-06, + "loss": 0.7939, + "step": 13009 + }, + { + "epoch": 0.33, + "learning_rate": 1.965662735698789e-06, + "loss": 0.9785, + "step": 13010 + }, + { + "epoch": 0.33, + "learning_rate": 1.9656555465749613e-06, + "loss": 0.8838, + "step": 13011 + }, + { + "epoch": 0.33, + "learning_rate": 1.965648356711775e-06, + "loss": 0.8418, + "step": 13012 + }, + { + "epoch": 0.33, + "learning_rate": 1.965641166109236e-06, + "loss": 0.9883, + "step": 13013 + }, + { + "epoch": 0.33, + "learning_rate": 1.96563397476735e-06, + "loss": 0.7642, + "step": 13014 + }, + { + "epoch": 0.33, + "learning_rate": 1.9656267826861228e-06, + "loss": 0.8716, + "step": 13015 + }, + { + "epoch": 0.33, + "learning_rate": 1.9656195898655593e-06, + "loss": 0.8965, + "step": 13016 + }, + { + "epoch": 0.33, + "learning_rate": 1.9656123963056653e-06, + "loss": 1.0439, + "step": 13017 + }, + { + "epoch": 0.33, + "learning_rate": 1.9656052020064462e-06, + "loss": 0.9346, + "step": 13018 + }, + { + "epoch": 0.33, + "learning_rate": 1.965598006967908e-06, + "loss": 0.9951, + "step": 13019 + }, + { + "epoch": 0.33, + "learning_rate": 1.9655908111900557e-06, + "loss": 0.8403, + "step": 13020 + }, + { + "epoch": 0.33, + "learning_rate": 1.9655836146728948e-06, + "loss": 0.5229, + "step": 13021 + }, + { + "epoch": 0.33, + "learning_rate": 1.965576417416431e-06, + "loss": 0.668, + "step": 13022 + }, + { + "epoch": 0.33, + "learning_rate": 1.9655692194206693e-06, + "loss": 0.9756, + "step": 13023 + }, + { + "epoch": 0.33, + "learning_rate": 1.965562020685616e-06, + "loss": 0.8018, + "step": 13024 + }, + { + "epoch": 0.33, + "learning_rate": 1.965554821211276e-06, + "loss": 0.9746, + "step": 13025 + }, + { + "epoch": 0.33, + "learning_rate": 1.9655476209976553e-06, + "loss": 0.9268, + "step": 13026 + }, + { + "epoch": 0.33, + "learning_rate": 1.9655404200447595e-06, + "loss": 0.8906, + "step": 13027 + }, + { + "epoch": 0.33, + "learning_rate": 1.9655332183525936e-06, + "loss": 1.1348, + "step": 13028 + }, + { + "epoch": 0.33, + "learning_rate": 1.9655260159211633e-06, + "loss": 0.9941, + "step": 13029 + }, + { + "epoch": 0.33, + "learning_rate": 1.965518812750474e-06, + "loss": 0.9189, + "step": 13030 + }, + { + "epoch": 0.33, + "learning_rate": 1.965511608840531e-06, + "loss": 0.875, + "step": 13031 + }, + { + "epoch": 0.33, + "learning_rate": 1.9655044041913405e-06, + "loss": 0.7832, + "step": 13032 + }, + { + "epoch": 0.33, + "learning_rate": 1.965497198802908e-06, + "loss": 0.8936, + "step": 13033 + }, + { + "epoch": 0.33, + "learning_rate": 1.9654899926752383e-06, + "loss": 0.9375, + "step": 13034 + }, + { + "epoch": 0.33, + "learning_rate": 1.9654827858083373e-06, + "loss": 1.0449, + "step": 13035 + }, + { + "epoch": 0.33, + "learning_rate": 1.9654755782022107e-06, + "loss": 0.7539, + "step": 13036 + }, + { + "epoch": 0.33, + "learning_rate": 1.9654683698568636e-06, + "loss": 0.7776, + "step": 13037 + }, + { + "epoch": 0.33, + "learning_rate": 1.965461160772302e-06, + "loss": 0.7988, + "step": 13038 + }, + { + "epoch": 0.33, + "learning_rate": 1.965453950948531e-06, + "loss": 0.8193, + "step": 13039 + }, + { + "epoch": 0.33, + "learning_rate": 1.9654467403855563e-06, + "loss": 0.9023, + "step": 13040 + }, + { + "epoch": 0.33, + "learning_rate": 1.9654395290833836e-06, + "loss": 0.8169, + "step": 13041 + }, + { + "epoch": 0.33, + "learning_rate": 1.965432317042018e-06, + "loss": 0.7354, + "step": 13042 + }, + { + "epoch": 0.33, + "learning_rate": 1.965425104261466e-06, + "loss": 0.833, + "step": 13043 + }, + { + "epoch": 0.33, + "learning_rate": 1.9654178907417317e-06, + "loss": 1.0225, + "step": 13044 + }, + { + "epoch": 0.33, + "learning_rate": 1.9654106764828215e-06, + "loss": 0.9951, + "step": 13045 + }, + { + "epoch": 0.33, + "learning_rate": 1.9654034614847405e-06, + "loss": 0.8135, + "step": 13046 + }, + { + "epoch": 0.33, + "learning_rate": 1.965396245747495e-06, + "loss": 1.0928, + "step": 13047 + }, + { + "epoch": 0.33, + "learning_rate": 1.9653890292710893e-06, + "loss": 0.9297, + "step": 13048 + }, + { + "epoch": 0.33, + "learning_rate": 1.9653818120555297e-06, + "loss": 0.8545, + "step": 13049 + }, + { + "epoch": 0.33, + "learning_rate": 1.965374594100822e-06, + "loss": 0.8994, + "step": 13050 + }, + { + "epoch": 0.33, + "learning_rate": 1.965367375406971e-06, + "loss": 1.1162, + "step": 13051 + }, + { + "epoch": 0.33, + "learning_rate": 1.965360155973983e-06, + "loss": 0.9453, + "step": 13052 + }, + { + "epoch": 0.33, + "learning_rate": 1.965352935801863e-06, + "loss": 0.8491, + "step": 13053 + }, + { + "epoch": 0.33, + "learning_rate": 1.9653457148906167e-06, + "loss": 0.9072, + "step": 13054 + }, + { + "epoch": 0.33, + "learning_rate": 1.9653384932402493e-06, + "loss": 0.5557, + "step": 13055 + }, + { + "epoch": 0.33, + "learning_rate": 1.965331270850767e-06, + "loss": 0.9238, + "step": 13056 + }, + { + "epoch": 0.33, + "learning_rate": 1.9653240477221745e-06, + "loss": 0.9404, + "step": 13057 + }, + { + "epoch": 0.33, + "learning_rate": 1.965316823854478e-06, + "loss": 0.7246, + "step": 13058 + }, + { + "epoch": 0.33, + "learning_rate": 1.965309599247683e-06, + "loss": 0.8047, + "step": 13059 + }, + { + "epoch": 0.33, + "learning_rate": 1.965302373901794e-06, + "loss": 0.4795, + "step": 13060 + }, + { + "epoch": 0.33, + "learning_rate": 1.9652951478168184e-06, + "loss": 0.9443, + "step": 13061 + }, + { + "epoch": 0.33, + "learning_rate": 1.96528792099276e-06, + "loss": 1.0161, + "step": 13062 + }, + { + "epoch": 0.33, + "learning_rate": 1.9652806934296255e-06, + "loss": 0.8701, + "step": 13063 + }, + { + "epoch": 0.33, + "learning_rate": 1.9652734651274194e-06, + "loss": 0.9043, + "step": 13064 + }, + { + "epoch": 0.33, + "learning_rate": 1.9652662360861483e-06, + "loss": 0.7939, + "step": 13065 + }, + { + "epoch": 0.33, + "learning_rate": 1.965259006305817e-06, + "loss": 0.9434, + "step": 13066 + }, + { + "epoch": 0.33, + "learning_rate": 1.9652517757864313e-06, + "loss": 0.8857, + "step": 13067 + }, + { + "epoch": 0.33, + "learning_rate": 1.9652445445279968e-06, + "loss": 0.7578, + "step": 13068 + }, + { + "epoch": 0.33, + "learning_rate": 1.965237312530519e-06, + "loss": 0.9854, + "step": 13069 + }, + { + "epoch": 0.33, + "learning_rate": 1.965230079794003e-06, + "loss": 0.9951, + "step": 13070 + }, + { + "epoch": 0.34, + "learning_rate": 1.9652228463184547e-06, + "loss": 0.832, + "step": 13071 + }, + { + "epoch": 0.34, + "learning_rate": 1.9652156121038803e-06, + "loss": 0.5474, + "step": 13072 + }, + { + "epoch": 0.34, + "learning_rate": 1.965208377150284e-06, + "loss": 0.8037, + "step": 13073 + }, + { + "epoch": 0.34, + "learning_rate": 1.9652011414576723e-06, + "loss": 0.7322, + "step": 13074 + }, + { + "epoch": 0.34, + "learning_rate": 1.96519390502605e-06, + "loss": 0.8662, + "step": 13075 + }, + { + "epoch": 0.34, + "learning_rate": 1.965186667855424e-06, + "loss": 0.9258, + "step": 13076 + }, + { + "epoch": 0.34, + "learning_rate": 1.9651794299457983e-06, + "loss": 0.7827, + "step": 13077 + }, + { + "epoch": 0.34, + "learning_rate": 1.9651721912971793e-06, + "loss": 1.0078, + "step": 13078 + }, + { + "epoch": 0.34, + "learning_rate": 1.965164951909572e-06, + "loss": 0.7529, + "step": 13079 + }, + { + "epoch": 0.34, + "learning_rate": 1.965157711782983e-06, + "loss": 1.0166, + "step": 13080 + }, + { + "epoch": 0.34, + "learning_rate": 1.9651504709174167e-06, + "loss": 0.6934, + "step": 13081 + }, + { + "epoch": 0.34, + "learning_rate": 1.965143229312879e-06, + "loss": 0.915, + "step": 13082 + }, + { + "epoch": 0.34, + "learning_rate": 1.9651359869693753e-06, + "loss": 0.917, + "step": 13083 + }, + { + "epoch": 0.34, + "learning_rate": 1.965128743886912e-06, + "loss": 0.7383, + "step": 13084 + }, + { + "epoch": 0.34, + "learning_rate": 1.9651215000654935e-06, + "loss": 0.8926, + "step": 13085 + }, + { + "epoch": 0.34, + "learning_rate": 1.965114255505126e-06, + "loss": 0.7295, + "step": 13086 + }, + { + "epoch": 0.34, + "learning_rate": 1.965107010205815e-06, + "loss": 0.9834, + "step": 13087 + }, + { + "epoch": 0.34, + "learning_rate": 1.9650997641675656e-06, + "loss": 0.8184, + "step": 13088 + }, + { + "epoch": 0.34, + "learning_rate": 1.9650925173903843e-06, + "loss": 0.9141, + "step": 13089 + }, + { + "epoch": 0.34, + "learning_rate": 1.9650852698742755e-06, + "loss": 0.959, + "step": 13090 + }, + { + "epoch": 0.34, + "learning_rate": 1.9650780216192453e-06, + "loss": 0.916, + "step": 13091 + }, + { + "epoch": 0.34, + "learning_rate": 1.965070772625299e-06, + "loss": 0.9971, + "step": 13092 + }, + { + "epoch": 0.34, + "learning_rate": 1.965063522892443e-06, + "loss": 1.0693, + "step": 13093 + }, + { + "epoch": 0.34, + "learning_rate": 1.965056272420682e-06, + "loss": 0.7739, + "step": 13094 + }, + { + "epoch": 0.34, + "learning_rate": 1.965049021210022e-06, + "loss": 0.8711, + "step": 13095 + }, + { + "epoch": 0.34, + "learning_rate": 1.9650417692604678e-06, + "loss": 0.8701, + "step": 13096 + }, + { + "epoch": 0.34, + "learning_rate": 1.965034516572026e-06, + "loss": 0.7974, + "step": 13097 + }, + { + "epoch": 0.34, + "learning_rate": 1.9650272631447013e-06, + "loss": 1.0186, + "step": 13098 + }, + { + "epoch": 0.34, + "learning_rate": 1.9650200089784996e-06, + "loss": 0.7202, + "step": 13099 + }, + { + "epoch": 0.34, + "learning_rate": 1.965012754073427e-06, + "loss": 0.9678, + "step": 13100 + }, + { + "epoch": 0.34, + "learning_rate": 1.965005498429488e-06, + "loss": 0.9229, + "step": 13101 + }, + { + "epoch": 0.34, + "learning_rate": 1.9649982420466885e-06, + "loss": 0.8145, + "step": 13102 + }, + { + "epoch": 0.34, + "learning_rate": 1.9649909849250347e-06, + "loss": 0.7666, + "step": 13103 + }, + { + "epoch": 0.34, + "learning_rate": 1.9649837270645314e-06, + "loss": 0.9678, + "step": 13104 + }, + { + "epoch": 0.34, + "learning_rate": 1.9649764684651846e-06, + "loss": 0.8506, + "step": 13105 + }, + { + "epoch": 0.34, + "learning_rate": 1.9649692091269993e-06, + "loss": 0.5674, + "step": 13106 + }, + { + "epoch": 0.34, + "learning_rate": 1.964961949049982e-06, + "loss": 0.9902, + "step": 13107 + }, + { + "epoch": 0.34, + "learning_rate": 1.964954688234137e-06, + "loss": 1.0371, + "step": 13108 + }, + { + "epoch": 0.34, + "learning_rate": 1.964947426679471e-06, + "loss": 0.9053, + "step": 13109 + }, + { + "epoch": 0.34, + "learning_rate": 1.964940164385989e-06, + "loss": 0.8276, + "step": 13110 + }, + { + "epoch": 0.34, + "learning_rate": 1.964932901353697e-06, + "loss": 1.083, + "step": 13111 + }, + { + "epoch": 0.34, + "learning_rate": 1.9649256375826e-06, + "loss": 0.7529, + "step": 13112 + }, + { + "epoch": 0.34, + "learning_rate": 1.964918373072704e-06, + "loss": 1.1309, + "step": 13113 + }, + { + "epoch": 0.34, + "learning_rate": 1.964911107824014e-06, + "loss": 0.8833, + "step": 13114 + }, + { + "epoch": 0.34, + "learning_rate": 1.9649038418365364e-06, + "loss": 0.9395, + "step": 13115 + }, + { + "epoch": 0.34, + "learning_rate": 1.964896575110276e-06, + "loss": 0.9629, + "step": 13116 + }, + { + "epoch": 0.34, + "learning_rate": 1.9648893076452387e-06, + "loss": 1.1055, + "step": 13117 + }, + { + "epoch": 0.34, + "learning_rate": 1.9648820394414297e-06, + "loss": 0.9219, + "step": 13118 + }, + { + "epoch": 0.34, + "learning_rate": 1.9648747704988556e-06, + "loss": 0.9561, + "step": 13119 + }, + { + "epoch": 0.34, + "learning_rate": 1.9648675008175205e-06, + "loss": 1.0547, + "step": 13120 + }, + { + "epoch": 0.34, + "learning_rate": 1.9648602303974312e-06, + "loss": 1.0068, + "step": 13121 + }, + { + "epoch": 0.34, + "learning_rate": 1.964852959238593e-06, + "loss": 0.9814, + "step": 13122 + }, + { + "epoch": 0.34, + "learning_rate": 1.9648456873410104e-06, + "loss": 0.8154, + "step": 13123 + }, + { + "epoch": 0.34, + "learning_rate": 1.9648384147046908e-06, + "loss": 0.8018, + "step": 13124 + }, + { + "epoch": 0.34, + "learning_rate": 1.9648311413296386e-06, + "loss": 0.8506, + "step": 13125 + }, + { + "epoch": 0.34, + "learning_rate": 1.964823867215859e-06, + "loss": 0.8369, + "step": 13126 + }, + { + "epoch": 0.34, + "learning_rate": 1.9648165923633584e-06, + "loss": 0.998, + "step": 13127 + }, + { + "epoch": 0.34, + "learning_rate": 1.964809316772142e-06, + "loss": 0.8535, + "step": 13128 + }, + { + "epoch": 0.34, + "learning_rate": 1.964802040442216e-06, + "loss": 0.8887, + "step": 13129 + }, + { + "epoch": 0.34, + "learning_rate": 1.9647947633735847e-06, + "loss": 0.873, + "step": 13130 + }, + { + "epoch": 0.34, + "learning_rate": 1.964787485566255e-06, + "loss": 0.9092, + "step": 13131 + }, + { + "epoch": 0.34, + "learning_rate": 1.9647802070202315e-06, + "loss": 0.96, + "step": 13132 + }, + { + "epoch": 0.34, + "learning_rate": 1.96477292773552e-06, + "loss": 0.8447, + "step": 13133 + }, + { + "epoch": 0.34, + "learning_rate": 1.9647656477121267e-06, + "loss": 0.9268, + "step": 13134 + }, + { + "epoch": 0.34, + "learning_rate": 1.964758366950057e-06, + "loss": 1.0029, + "step": 13135 + }, + { + "epoch": 0.34, + "learning_rate": 1.964751085449315e-06, + "loss": 0.7109, + "step": 13136 + }, + { + "epoch": 0.34, + "learning_rate": 1.9647438032099085e-06, + "loss": 0.9111, + "step": 13137 + }, + { + "epoch": 0.34, + "learning_rate": 1.9647365202318417e-06, + "loss": 0.8027, + "step": 13138 + }, + { + "epoch": 0.34, + "learning_rate": 1.9647292365151203e-06, + "loss": 0.8115, + "step": 13139 + }, + { + "epoch": 0.34, + "learning_rate": 1.9647219520597506e-06, + "loss": 1.0674, + "step": 13140 + }, + { + "epoch": 0.34, + "learning_rate": 1.964714666865737e-06, + "loss": 0.9648, + "step": 13141 + }, + { + "epoch": 0.34, + "learning_rate": 1.964707380933086e-06, + "loss": 0.959, + "step": 13142 + }, + { + "epoch": 0.34, + "learning_rate": 1.964700094261803e-06, + "loss": 0.9023, + "step": 13143 + }, + { + "epoch": 0.34, + "learning_rate": 1.9646928068518936e-06, + "loss": 0.9746, + "step": 13144 + }, + { + "epoch": 0.34, + "learning_rate": 1.9646855187033632e-06, + "loss": 0.9814, + "step": 13145 + }, + { + "epoch": 0.34, + "learning_rate": 1.9646782298162176e-06, + "loss": 0.8184, + "step": 13146 + }, + { + "epoch": 0.34, + "learning_rate": 1.964670940190462e-06, + "loss": 0.7446, + "step": 13147 + }, + { + "epoch": 0.34, + "learning_rate": 1.964663649826102e-06, + "loss": 0.8486, + "step": 13148 + }, + { + "epoch": 0.34, + "learning_rate": 1.964656358723144e-06, + "loss": 0.9131, + "step": 13149 + }, + { + "epoch": 0.34, + "learning_rate": 1.964649066881593e-06, + "loss": 0.8926, + "step": 13150 + }, + { + "epoch": 0.34, + "learning_rate": 1.964641774301454e-06, + "loss": 0.7383, + "step": 13151 + }, + { + "epoch": 0.34, + "learning_rate": 1.9646344809827335e-06, + "loss": 0.9307, + "step": 13152 + }, + { + "epoch": 0.34, + "learning_rate": 1.9646271869254364e-06, + "loss": 0.9463, + "step": 13153 + }, + { + "epoch": 0.34, + "learning_rate": 1.964619892129569e-06, + "loss": 0.9688, + "step": 13154 + }, + { + "epoch": 0.34, + "learning_rate": 1.964612596595136e-06, + "loss": 1.0996, + "step": 13155 + }, + { + "epoch": 0.34, + "learning_rate": 1.964605300322144e-06, + "loss": 0.8496, + "step": 13156 + }, + { + "epoch": 0.34, + "learning_rate": 1.964598003310598e-06, + "loss": 0.918, + "step": 13157 + }, + { + "epoch": 0.34, + "learning_rate": 1.964590705560503e-06, + "loss": 0.6428, + "step": 13158 + }, + { + "epoch": 0.34, + "learning_rate": 1.964583407071866e-06, + "loss": 1.1318, + "step": 13159 + }, + { + "epoch": 0.34, + "learning_rate": 1.964576107844692e-06, + "loss": 0.8076, + "step": 13160 + }, + { + "epoch": 0.34, + "learning_rate": 1.964568807878986e-06, + "loss": 0.8442, + "step": 13161 + }, + { + "epoch": 0.34, + "learning_rate": 1.964561507174754e-06, + "loss": 0.9609, + "step": 13162 + }, + { + "epoch": 0.34, + "learning_rate": 1.9645542057320016e-06, + "loss": 0.8252, + "step": 13163 + }, + { + "epoch": 0.34, + "learning_rate": 1.9645469035507345e-06, + "loss": 0.9219, + "step": 13164 + }, + { + "epoch": 0.34, + "learning_rate": 1.9645396006309583e-06, + "loss": 1.0518, + "step": 13165 + }, + { + "epoch": 0.34, + "learning_rate": 1.9645322969726783e-06, + "loss": 0.7969, + "step": 13166 + }, + { + "epoch": 0.34, + "learning_rate": 1.9645249925759003e-06, + "loss": 0.9014, + "step": 13167 + }, + { + "epoch": 0.34, + "learning_rate": 1.96451768744063e-06, + "loss": 0.9004, + "step": 13168 + }, + { + "epoch": 0.34, + "learning_rate": 1.9645103815668724e-06, + "loss": 0.9521, + "step": 13169 + }, + { + "epoch": 0.34, + "learning_rate": 1.964503074954634e-06, + "loss": 0.8438, + "step": 13170 + }, + { + "epoch": 0.34, + "learning_rate": 1.9644957676039197e-06, + "loss": 0.7275, + "step": 13171 + }, + { + "epoch": 0.34, + "learning_rate": 1.9644884595147357e-06, + "loss": 0.7805, + "step": 13172 + }, + { + "epoch": 0.34, + "learning_rate": 1.964481150687087e-06, + "loss": 0.9492, + "step": 13173 + }, + { + "epoch": 0.34, + "learning_rate": 1.9644738411209795e-06, + "loss": 1.0645, + "step": 13174 + }, + { + "epoch": 0.34, + "learning_rate": 1.9644665308164186e-06, + "loss": 0.918, + "step": 13175 + }, + { + "epoch": 0.34, + "learning_rate": 1.96445921977341e-06, + "loss": 0.8691, + "step": 13176 + }, + { + "epoch": 0.34, + "learning_rate": 1.9644519079919596e-06, + "loss": 0.6343, + "step": 13177 + }, + { + "epoch": 0.34, + "learning_rate": 1.9644445954720725e-06, + "loss": 0.7588, + "step": 13178 + }, + { + "epoch": 0.34, + "learning_rate": 1.964437282213755e-06, + "loss": 0.9985, + "step": 13179 + }, + { + "epoch": 0.34, + "learning_rate": 1.964429968217011e-06, + "loss": 0.9346, + "step": 13180 + }, + { + "epoch": 0.34, + "learning_rate": 1.9644226534818483e-06, + "loss": 0.8984, + "step": 13181 + }, + { + "epoch": 0.34, + "learning_rate": 1.9644153380082714e-06, + "loss": 0.8467, + "step": 13182 + }, + { + "epoch": 0.34, + "learning_rate": 1.964408021796286e-06, + "loss": 0.7373, + "step": 13183 + }, + { + "epoch": 0.34, + "learning_rate": 1.9644007048458973e-06, + "loss": 1.0605, + "step": 13184 + }, + { + "epoch": 0.34, + "learning_rate": 1.964393387157112e-06, + "loss": 0.9258, + "step": 13185 + }, + { + "epoch": 0.34, + "learning_rate": 1.964386068729935e-06, + "loss": 0.7725, + "step": 13186 + }, + { + "epoch": 0.34, + "learning_rate": 1.9643787495643714e-06, + "loss": 0.7432, + "step": 13187 + }, + { + "epoch": 0.34, + "learning_rate": 1.9643714296604276e-06, + "loss": 0.8364, + "step": 13188 + }, + { + "epoch": 0.34, + "learning_rate": 1.964364109018109e-06, + "loss": 0.9678, + "step": 13189 + }, + { + "epoch": 0.34, + "learning_rate": 1.964356787637421e-06, + "loss": 0.8096, + "step": 13190 + }, + { + "epoch": 0.34, + "learning_rate": 1.9643494655183695e-06, + "loss": 1.0195, + "step": 13191 + }, + { + "epoch": 0.34, + "learning_rate": 1.9643421426609595e-06, + "loss": 0.9424, + "step": 13192 + }, + { + "epoch": 0.34, + "learning_rate": 1.9643348190651976e-06, + "loss": 1.1621, + "step": 13193 + }, + { + "epoch": 0.34, + "learning_rate": 1.964327494731089e-06, + "loss": 1.0977, + "step": 13194 + }, + { + "epoch": 0.34, + "learning_rate": 1.9643201696586386e-06, + "loss": 0.7432, + "step": 13195 + }, + { + "epoch": 0.34, + "learning_rate": 1.964312843847853e-06, + "loss": 0.9805, + "step": 13196 + }, + { + "epoch": 0.34, + "learning_rate": 1.964305517298737e-06, + "loss": 1.1309, + "step": 13197 + }, + { + "epoch": 0.34, + "learning_rate": 1.964298190011297e-06, + "loss": 0.8027, + "step": 13198 + }, + { + "epoch": 0.34, + "learning_rate": 1.9642908619855383e-06, + "loss": 0.7842, + "step": 13199 + }, + { + "epoch": 0.34, + "learning_rate": 1.964283533221466e-06, + "loss": 0.8613, + "step": 13200 + }, + { + "epoch": 0.34, + "learning_rate": 1.9642762037190862e-06, + "loss": 0.9043, + "step": 13201 + }, + { + "epoch": 0.34, + "learning_rate": 1.9642688734784047e-06, + "loss": 0.8477, + "step": 13202 + }, + { + "epoch": 0.34, + "learning_rate": 1.9642615424994267e-06, + "loss": 0.8877, + "step": 13203 + }, + { + "epoch": 0.34, + "learning_rate": 1.964254210782158e-06, + "loss": 0.6704, + "step": 13204 + }, + { + "epoch": 0.34, + "learning_rate": 1.9642468783266042e-06, + "loss": 0.8994, + "step": 13205 + }, + { + "epoch": 0.34, + "learning_rate": 1.964239545132771e-06, + "loss": 0.8174, + "step": 13206 + }, + { + "epoch": 0.34, + "learning_rate": 1.964232211200664e-06, + "loss": 0.8955, + "step": 13207 + }, + { + "epoch": 0.34, + "learning_rate": 1.9642248765302886e-06, + "loss": 0.6753, + "step": 13208 + }, + { + "epoch": 0.34, + "learning_rate": 1.96421754112165e-06, + "loss": 0.9248, + "step": 13209 + }, + { + "epoch": 0.34, + "learning_rate": 1.9642102049747553e-06, + "loss": 0.7415, + "step": 13210 + }, + { + "epoch": 0.34, + "learning_rate": 1.964202868089609e-06, + "loss": 0.6934, + "step": 13211 + }, + { + "epoch": 0.34, + "learning_rate": 1.9641955304662165e-06, + "loss": 0.8945, + "step": 13212 + }, + { + "epoch": 0.34, + "learning_rate": 1.9641881921045837e-06, + "loss": 0.8535, + "step": 13213 + }, + { + "epoch": 0.34, + "learning_rate": 1.9641808530047168e-06, + "loss": 0.9785, + "step": 13214 + }, + { + "epoch": 0.34, + "learning_rate": 1.964173513166621e-06, + "loss": 0.9365, + "step": 13215 + }, + { + "epoch": 0.34, + "learning_rate": 1.9641661725903014e-06, + "loss": 1.0693, + "step": 13216 + }, + { + "epoch": 0.34, + "learning_rate": 1.9641588312757643e-06, + "loss": 0.6865, + "step": 13217 + }, + { + "epoch": 0.34, + "learning_rate": 1.964151489223015e-06, + "loss": 0.9561, + "step": 13218 + }, + { + "epoch": 0.34, + "learning_rate": 1.9641441464320595e-06, + "loss": 0.9014, + "step": 13219 + }, + { + "epoch": 0.34, + "learning_rate": 1.964136802902903e-06, + "loss": 0.9785, + "step": 13220 + }, + { + "epoch": 0.34, + "learning_rate": 1.9641294586355516e-06, + "loss": 0.8174, + "step": 13221 + }, + { + "epoch": 0.34, + "learning_rate": 1.9641221136300104e-06, + "loss": 0.7476, + "step": 13222 + }, + { + "epoch": 0.34, + "learning_rate": 1.964114767886285e-06, + "loss": 0.9092, + "step": 13223 + }, + { + "epoch": 0.34, + "learning_rate": 1.9641074214043812e-06, + "loss": 0.832, + "step": 13224 + }, + { + "epoch": 0.34, + "learning_rate": 1.964100074184305e-06, + "loss": 1.1523, + "step": 13225 + }, + { + "epoch": 0.34, + "learning_rate": 1.9640927262260617e-06, + "loss": 0.9844, + "step": 13226 + }, + { + "epoch": 0.34, + "learning_rate": 1.9640853775296567e-06, + "loss": 1.0879, + "step": 13227 + }, + { + "epoch": 0.34, + "learning_rate": 1.9640780280950963e-06, + "loss": 0.9277, + "step": 13228 + }, + { + "epoch": 0.34, + "learning_rate": 1.9640706779223852e-06, + "loss": 0.9155, + "step": 13229 + }, + { + "epoch": 0.34, + "learning_rate": 1.96406332701153e-06, + "loss": 0.895, + "step": 13230 + }, + { + "epoch": 0.34, + "learning_rate": 1.9640559753625352e-06, + "loss": 0.7778, + "step": 13231 + }, + { + "epoch": 0.34, + "learning_rate": 1.9640486229754073e-06, + "loss": 0.8052, + "step": 13232 + }, + { + "epoch": 0.34, + "learning_rate": 1.964041269850152e-06, + "loss": 0.7529, + "step": 13233 + }, + { + "epoch": 0.34, + "learning_rate": 1.9640339159867744e-06, + "loss": 0.8311, + "step": 13234 + }, + { + "epoch": 0.34, + "learning_rate": 1.9640265613852804e-06, + "loss": 0.7432, + "step": 13235 + }, + { + "epoch": 0.34, + "learning_rate": 1.9640192060456756e-06, + "loss": 1.0654, + "step": 13236 + }, + { + "epoch": 0.34, + "learning_rate": 1.9640118499679654e-06, + "loss": 0.9502, + "step": 13237 + }, + { + "epoch": 0.34, + "learning_rate": 1.964004493152156e-06, + "loss": 1.207, + "step": 13238 + }, + { + "epoch": 0.34, + "learning_rate": 1.9639971355982526e-06, + "loss": 0.9487, + "step": 13239 + }, + { + "epoch": 0.34, + "learning_rate": 1.9639897773062607e-06, + "loss": 0.9473, + "step": 13240 + }, + { + "epoch": 0.34, + "learning_rate": 1.9639824182761862e-06, + "loss": 0.9014, + "step": 13241 + }, + { + "epoch": 0.34, + "learning_rate": 1.963975058508035e-06, + "loss": 0.8125, + "step": 13242 + }, + { + "epoch": 0.34, + "learning_rate": 1.963967698001812e-06, + "loss": 0.9238, + "step": 13243 + }, + { + "epoch": 0.34, + "learning_rate": 1.963960336757524e-06, + "loss": 1.0146, + "step": 13244 + }, + { + "epoch": 0.34, + "learning_rate": 1.963952974775175e-06, + "loss": 0.8633, + "step": 13245 + }, + { + "epoch": 0.34, + "learning_rate": 1.963945612054772e-06, + "loss": 0.959, + "step": 13246 + }, + { + "epoch": 0.34, + "learning_rate": 1.96393824859632e-06, + "loss": 1.2422, + "step": 13247 + }, + { + "epoch": 0.34, + "learning_rate": 1.9639308843998247e-06, + "loss": 0.7485, + "step": 13248 + }, + { + "epoch": 0.34, + "learning_rate": 1.963923519465292e-06, + "loss": 0.9072, + "step": 13249 + }, + { + "epoch": 0.34, + "learning_rate": 1.9639161537927275e-06, + "loss": 0.8701, + "step": 13250 + }, + { + "epoch": 0.34, + "learning_rate": 1.9639087873821365e-06, + "loss": 0.9092, + "step": 13251 + }, + { + "epoch": 0.34, + "learning_rate": 1.9639014202335253e-06, + "loss": 1.0195, + "step": 13252 + }, + { + "epoch": 0.34, + "learning_rate": 1.9638940523468985e-06, + "loss": 1.0215, + "step": 13253 + }, + { + "epoch": 0.34, + "learning_rate": 1.963886683722263e-06, + "loss": 0.9395, + "step": 13254 + }, + { + "epoch": 0.34, + "learning_rate": 1.963879314359623e-06, + "loss": 0.854, + "step": 13255 + }, + { + "epoch": 0.34, + "learning_rate": 1.9638719442589852e-06, + "loss": 0.8984, + "step": 13256 + }, + { + "epoch": 0.34, + "learning_rate": 1.963864573420355e-06, + "loss": 0.4907, + "step": 13257 + }, + { + "epoch": 0.34, + "learning_rate": 1.9638572018437384e-06, + "loss": 0.7969, + "step": 13258 + }, + { + "epoch": 0.34, + "learning_rate": 1.9638498295291406e-06, + "loss": 0.7437, + "step": 13259 + }, + { + "epoch": 0.34, + "learning_rate": 1.963842456476567e-06, + "loss": 0.9082, + "step": 13260 + }, + { + "epoch": 0.34, + "learning_rate": 1.9638350826860236e-06, + "loss": 1.0205, + "step": 13261 + }, + { + "epoch": 0.34, + "learning_rate": 1.9638277081575162e-06, + "loss": 0.9639, + "step": 13262 + }, + { + "epoch": 0.34, + "learning_rate": 1.96382033289105e-06, + "loss": 0.9775, + "step": 13263 + }, + { + "epoch": 0.34, + "learning_rate": 1.963812956886631e-06, + "loss": 0.6929, + "step": 13264 + }, + { + "epoch": 0.34, + "learning_rate": 1.9638055801442646e-06, + "loss": 0.8516, + "step": 13265 + }, + { + "epoch": 0.34, + "learning_rate": 1.9637982026639567e-06, + "loss": 0.9785, + "step": 13266 + }, + { + "epoch": 0.34, + "learning_rate": 1.963790824445713e-06, + "loss": 1.1416, + "step": 13267 + }, + { + "epoch": 0.34, + "learning_rate": 1.9637834454895386e-06, + "loss": 0.6143, + "step": 13268 + }, + { + "epoch": 0.34, + "learning_rate": 1.96377606579544e-06, + "loss": 0.8994, + "step": 13269 + }, + { + "epoch": 0.34, + "learning_rate": 1.963768685363422e-06, + "loss": 0.959, + "step": 13270 + }, + { + "epoch": 0.34, + "learning_rate": 1.9637613041934907e-06, + "loss": 0.6519, + "step": 13271 + }, + { + "epoch": 0.34, + "learning_rate": 1.9637539222856518e-06, + "loss": 0.9395, + "step": 13272 + }, + { + "epoch": 0.34, + "learning_rate": 1.963746539639911e-06, + "loss": 0.9062, + "step": 13273 + }, + { + "epoch": 0.34, + "learning_rate": 1.9637391562562733e-06, + "loss": 0.9375, + "step": 13274 + }, + { + "epoch": 0.34, + "learning_rate": 1.963731772134745e-06, + "loss": 1.082, + "step": 13275 + }, + { + "epoch": 0.34, + "learning_rate": 1.963724387275332e-06, + "loss": 0.9863, + "step": 13276 + }, + { + "epoch": 0.34, + "learning_rate": 1.963717001678039e-06, + "loss": 0.7229, + "step": 13277 + }, + { + "epoch": 0.34, + "learning_rate": 1.9637096153428724e-06, + "loss": 0.915, + "step": 13278 + }, + { + "epoch": 0.34, + "learning_rate": 1.9637022282698376e-06, + "loss": 0.874, + "step": 13279 + }, + { + "epoch": 0.34, + "learning_rate": 1.9636948404589405e-06, + "loss": 1.1396, + "step": 13280 + }, + { + "epoch": 0.34, + "learning_rate": 1.9636874519101867e-06, + "loss": 0.8438, + "step": 13281 + }, + { + "epoch": 0.34, + "learning_rate": 1.9636800626235812e-06, + "loss": 0.9146, + "step": 13282 + }, + { + "epoch": 0.34, + "learning_rate": 1.963672672599131e-06, + "loss": 0.9854, + "step": 13283 + }, + { + "epoch": 0.34, + "learning_rate": 1.9636652818368403e-06, + "loss": 0.9424, + "step": 13284 + }, + { + "epoch": 0.34, + "learning_rate": 1.9636578903367154e-06, + "loss": 0.916, + "step": 13285 + }, + { + "epoch": 0.34, + "learning_rate": 1.963650498098762e-06, + "loss": 0.7432, + "step": 13286 + }, + { + "epoch": 0.34, + "learning_rate": 1.963643105122986e-06, + "loss": 0.8047, + "step": 13287 + }, + { + "epoch": 0.34, + "learning_rate": 1.963635711409393e-06, + "loss": 0.8164, + "step": 13288 + }, + { + "epoch": 0.34, + "learning_rate": 1.963628316957988e-06, + "loss": 0.7095, + "step": 13289 + }, + { + "epoch": 0.34, + "learning_rate": 1.963620921768777e-06, + "loss": 1.0742, + "step": 13290 + }, + { + "epoch": 0.34, + "learning_rate": 1.963613525841766e-06, + "loss": 0.6787, + "step": 13291 + }, + { + "epoch": 0.34, + "learning_rate": 1.9636061291769607e-06, + "loss": 1.0371, + "step": 13292 + }, + { + "epoch": 0.34, + "learning_rate": 1.963598731774366e-06, + "loss": 0.8682, + "step": 13293 + }, + { + "epoch": 0.34, + "learning_rate": 1.963591333633988e-06, + "loss": 0.8389, + "step": 13294 + }, + { + "epoch": 0.34, + "learning_rate": 1.963583934755833e-06, + "loss": 0.8262, + "step": 13295 + }, + { + "epoch": 0.34, + "learning_rate": 1.9635765351399055e-06, + "loss": 0.8506, + "step": 13296 + }, + { + "epoch": 0.34, + "learning_rate": 1.963569134786212e-06, + "loss": 0.9033, + "step": 13297 + }, + { + "epoch": 0.34, + "learning_rate": 1.963561733694758e-06, + "loss": 1.0713, + "step": 13298 + }, + { + "epoch": 0.34, + "learning_rate": 1.963554331865549e-06, + "loss": 0.8691, + "step": 13299 + }, + { + "epoch": 0.34, + "learning_rate": 1.9635469292985908e-06, + "loss": 0.9922, + "step": 13300 + }, + { + "epoch": 0.34, + "learning_rate": 1.963539525993889e-06, + "loss": 1.209, + "step": 13301 + }, + { + "epoch": 0.34, + "learning_rate": 1.963532121951449e-06, + "loss": 0.9922, + "step": 13302 + }, + { + "epoch": 0.34, + "learning_rate": 1.9635247171712774e-06, + "loss": 0.9414, + "step": 13303 + }, + { + "epoch": 0.34, + "learning_rate": 1.963517311653379e-06, + "loss": 0.7749, + "step": 13304 + }, + { + "epoch": 0.34, + "learning_rate": 1.9635099053977592e-06, + "loss": 1.1143, + "step": 13305 + }, + { + "epoch": 0.34, + "learning_rate": 1.9635024984044247e-06, + "loss": 0.7578, + "step": 13306 + }, + { + "epoch": 0.34, + "learning_rate": 1.9634950906733803e-06, + "loss": 0.7388, + "step": 13307 + }, + { + "epoch": 0.34, + "learning_rate": 1.9634876822046325e-06, + "loss": 0.7998, + "step": 13308 + }, + { + "epoch": 0.34, + "learning_rate": 1.963480272998186e-06, + "loss": 0.7651, + "step": 13309 + }, + { + "epoch": 0.34, + "learning_rate": 1.9634728630540473e-06, + "loss": 0.7334, + "step": 13310 + }, + { + "epoch": 0.34, + "learning_rate": 1.9634654523722214e-06, + "loss": 1.0439, + "step": 13311 + }, + { + "epoch": 0.34, + "learning_rate": 1.9634580409527145e-06, + "loss": 0.8442, + "step": 13312 + }, + { + "epoch": 0.34, + "learning_rate": 1.963450628795532e-06, + "loss": 0.6587, + "step": 13313 + }, + { + "epoch": 0.34, + "learning_rate": 1.9634432159006796e-06, + "loss": 0.998, + "step": 13314 + }, + { + "epoch": 0.34, + "learning_rate": 1.963435802268163e-06, + "loss": 0.8867, + "step": 13315 + }, + { + "epoch": 0.34, + "learning_rate": 1.963428387897988e-06, + "loss": 0.9561, + "step": 13316 + }, + { + "epoch": 0.34, + "learning_rate": 1.9634209727901606e-06, + "loss": 1.1445, + "step": 13317 + }, + { + "epoch": 0.34, + "learning_rate": 1.9634135569446854e-06, + "loss": 1.0, + "step": 13318 + }, + { + "epoch": 0.34, + "learning_rate": 1.963406140361569e-06, + "loss": 0.8647, + "step": 13319 + }, + { + "epoch": 0.34, + "learning_rate": 1.963398723040817e-06, + "loss": 0.9717, + "step": 13320 + }, + { + "epoch": 0.34, + "learning_rate": 1.963391304982435e-06, + "loss": 0.8721, + "step": 13321 + }, + { + "epoch": 0.34, + "learning_rate": 1.963383886186428e-06, + "loss": 0.6763, + "step": 13322 + }, + { + "epoch": 0.34, + "learning_rate": 1.9633764666528025e-06, + "loss": 1.1094, + "step": 13323 + }, + { + "epoch": 0.34, + "learning_rate": 1.963369046381564e-06, + "loss": 0.876, + "step": 13324 + }, + { + "epoch": 0.34, + "learning_rate": 1.9633616253727184e-06, + "loss": 0.9297, + "step": 13325 + }, + { + "epoch": 0.34, + "learning_rate": 1.963354203626271e-06, + "loss": 0.7186, + "step": 13326 + }, + { + "epoch": 0.34, + "learning_rate": 1.9633467811422267e-06, + "loss": 1.1621, + "step": 13327 + }, + { + "epoch": 0.34, + "learning_rate": 1.963339357920593e-06, + "loss": 0.8711, + "step": 13328 + }, + { + "epoch": 0.34, + "learning_rate": 1.9633319339613744e-06, + "loss": 0.7876, + "step": 13329 + }, + { + "epoch": 0.34, + "learning_rate": 1.963324509264577e-06, + "loss": 0.8809, + "step": 13330 + }, + { + "epoch": 0.34, + "learning_rate": 1.9633170838302064e-06, + "loss": 0.8486, + "step": 13331 + }, + { + "epoch": 0.34, + "learning_rate": 1.9633096576582675e-06, + "loss": 0.9385, + "step": 13332 + }, + { + "epoch": 0.34, + "learning_rate": 1.963302230748767e-06, + "loss": 0.8447, + "step": 13333 + }, + { + "epoch": 0.34, + "learning_rate": 1.9632948031017107e-06, + "loss": 0.5957, + "step": 13334 + }, + { + "epoch": 0.34, + "learning_rate": 1.9632873747171037e-06, + "loss": 0.9131, + "step": 13335 + }, + { + "epoch": 0.34, + "learning_rate": 1.9632799455949516e-06, + "loss": 0.7935, + "step": 13336 + }, + { + "epoch": 0.34, + "learning_rate": 1.9632725157352604e-06, + "loss": 0.6377, + "step": 13337 + }, + { + "epoch": 0.34, + "learning_rate": 1.963265085138036e-06, + "loss": 0.9512, + "step": 13338 + }, + { + "epoch": 0.34, + "learning_rate": 1.9632576538032836e-06, + "loss": 0.79, + "step": 13339 + }, + { + "epoch": 0.34, + "learning_rate": 1.963250221731009e-06, + "loss": 0.8203, + "step": 13340 + }, + { + "epoch": 0.34, + "learning_rate": 1.963242788921218e-06, + "loss": 0.8066, + "step": 13341 + }, + { + "epoch": 0.34, + "learning_rate": 1.963235355373917e-06, + "loss": 0.8691, + "step": 13342 + }, + { + "epoch": 0.34, + "learning_rate": 1.96322792108911e-06, + "loss": 1.0088, + "step": 13343 + }, + { + "epoch": 0.34, + "learning_rate": 1.9632204860668043e-06, + "loss": 0.918, + "step": 13344 + }, + { + "epoch": 0.34, + "learning_rate": 1.9632130503070048e-06, + "loss": 1.0029, + "step": 13345 + }, + { + "epoch": 0.34, + "learning_rate": 1.963205613809717e-06, + "loss": 0.8662, + "step": 13346 + }, + { + "epoch": 0.34, + "learning_rate": 1.963198176574947e-06, + "loss": 0.8154, + "step": 13347 + }, + { + "epoch": 0.34, + "learning_rate": 1.963190738602701e-06, + "loss": 0.8086, + "step": 13348 + }, + { + "epoch": 0.34, + "learning_rate": 1.963183299892984e-06, + "loss": 0.9446, + "step": 13349 + }, + { + "epoch": 0.34, + "learning_rate": 1.9631758604458013e-06, + "loss": 0.9941, + "step": 13350 + }, + { + "epoch": 0.34, + "learning_rate": 1.9631684202611596e-06, + "loss": 0.9932, + "step": 13351 + }, + { + "epoch": 0.34, + "learning_rate": 1.963160979339064e-06, + "loss": 0.9551, + "step": 13352 + }, + { + "epoch": 0.34, + "learning_rate": 1.9631535376795203e-06, + "loss": 0.8979, + "step": 13353 + }, + { + "epoch": 0.34, + "learning_rate": 1.963146095282534e-06, + "loss": 0.8447, + "step": 13354 + }, + { + "epoch": 0.34, + "learning_rate": 1.9631386521481117e-06, + "loss": 0.7734, + "step": 13355 + }, + { + "epoch": 0.34, + "learning_rate": 1.963131208276258e-06, + "loss": 1.1309, + "step": 13356 + }, + { + "epoch": 0.34, + "learning_rate": 1.963123763666979e-06, + "loss": 0.9512, + "step": 13357 + }, + { + "epoch": 0.34, + "learning_rate": 1.9631163183202805e-06, + "loss": 1.0771, + "step": 13358 + }, + { + "epoch": 0.34, + "learning_rate": 1.9631088722361683e-06, + "loss": 0.9141, + "step": 13359 + }, + { + "epoch": 0.34, + "learning_rate": 1.9631014254146475e-06, + "loss": 0.8555, + "step": 13360 + }, + { + "epoch": 0.34, + "learning_rate": 1.9630939778557243e-06, + "loss": 0.9497, + "step": 13361 + }, + { + "epoch": 0.34, + "learning_rate": 1.9630865295594043e-06, + "loss": 1.1094, + "step": 13362 + }, + { + "epoch": 0.34, + "learning_rate": 1.9630790805256934e-06, + "loss": 0.7798, + "step": 13363 + }, + { + "epoch": 0.34, + "learning_rate": 1.963071630754597e-06, + "loss": 0.6733, + "step": 13364 + }, + { + "epoch": 0.34, + "learning_rate": 1.963064180246121e-06, + "loss": 0.8193, + "step": 13365 + }, + { + "epoch": 0.34, + "learning_rate": 1.9630567290002714e-06, + "loss": 0.8496, + "step": 13366 + }, + { + "epoch": 0.34, + "learning_rate": 1.963049277017053e-06, + "loss": 0.6421, + "step": 13367 + }, + { + "epoch": 0.34, + "learning_rate": 1.9630418242964723e-06, + "loss": 0.8496, + "step": 13368 + }, + { + "epoch": 0.34, + "learning_rate": 1.9630343708385347e-06, + "loss": 0.8809, + "step": 13369 + }, + { + "epoch": 0.34, + "learning_rate": 1.9630269166432465e-06, + "loss": 0.7485, + "step": 13370 + }, + { + "epoch": 0.34, + "learning_rate": 1.963019461710612e-06, + "loss": 0.917, + "step": 13371 + }, + { + "epoch": 0.34, + "learning_rate": 1.963012006040638e-06, + "loss": 0.9219, + "step": 13372 + }, + { + "epoch": 0.34, + "learning_rate": 1.9630045496333303e-06, + "loss": 1.0146, + "step": 13373 + }, + { + "epoch": 0.34, + "learning_rate": 1.962997092488694e-06, + "loss": 1.1221, + "step": 13374 + }, + { + "epoch": 0.34, + "learning_rate": 1.962989634606735e-06, + "loss": 0.9668, + "step": 13375 + }, + { + "epoch": 0.34, + "learning_rate": 1.96298217598746e-06, + "loss": 0.8135, + "step": 13376 + }, + { + "epoch": 0.34, + "learning_rate": 1.962974716630873e-06, + "loss": 0.9912, + "step": 13377 + }, + { + "epoch": 0.34, + "learning_rate": 1.9629672565369807e-06, + "loss": 0.96, + "step": 13378 + }, + { + "epoch": 0.34, + "learning_rate": 1.9629597957057886e-06, + "loss": 0.8574, + "step": 13379 + }, + { + "epoch": 0.34, + "learning_rate": 1.9629523341373025e-06, + "loss": 0.5601, + "step": 13380 + }, + { + "epoch": 0.34, + "learning_rate": 1.962944871831528e-06, + "loss": 0.9492, + "step": 13381 + }, + { + "epoch": 0.34, + "learning_rate": 1.9629374087884713e-06, + "loss": 0.7998, + "step": 13382 + }, + { + "epoch": 0.34, + "learning_rate": 1.962929945008137e-06, + "loss": 0.8965, + "step": 13383 + }, + { + "epoch": 0.34, + "learning_rate": 1.962922480490532e-06, + "loss": 0.9219, + "step": 13384 + }, + { + "epoch": 0.34, + "learning_rate": 1.9629150152356613e-06, + "loss": 0.811, + "step": 13385 + }, + { + "epoch": 0.34, + "learning_rate": 1.9629075492435313e-06, + "loss": 0.8779, + "step": 13386 + }, + { + "epoch": 0.34, + "learning_rate": 1.962900082514147e-06, + "loss": 0.8926, + "step": 13387 + }, + { + "epoch": 0.34, + "learning_rate": 1.962892615047514e-06, + "loss": 0.6348, + "step": 13388 + }, + { + "epoch": 0.34, + "learning_rate": 1.962885146843639e-06, + "loss": 0.8398, + "step": 13389 + }, + { + "epoch": 0.34, + "learning_rate": 1.962877677902527e-06, + "loss": 0.7173, + "step": 13390 + }, + { + "epoch": 0.34, + "learning_rate": 1.9628702082241836e-06, + "loss": 1.0244, + "step": 13391 + }, + { + "epoch": 0.34, + "learning_rate": 1.962862737808615e-06, + "loss": 0.8633, + "step": 13392 + }, + { + "epoch": 0.34, + "learning_rate": 1.9628552666558263e-06, + "loss": 0.9902, + "step": 13393 + }, + { + "epoch": 0.34, + "learning_rate": 1.9628477947658237e-06, + "loss": 0.8818, + "step": 13394 + }, + { + "epoch": 0.34, + "learning_rate": 1.962840322138613e-06, + "loss": 1.0293, + "step": 13395 + }, + { + "epoch": 0.34, + "learning_rate": 1.9628328487741998e-06, + "loss": 0.8184, + "step": 13396 + }, + { + "epoch": 0.34, + "learning_rate": 1.9628253746725895e-06, + "loss": 0.9619, + "step": 13397 + }, + { + "epoch": 0.34, + "learning_rate": 1.962817899833788e-06, + "loss": 0.7764, + "step": 13398 + }, + { + "epoch": 0.34, + "learning_rate": 1.9628104242578015e-06, + "loss": 0.917, + "step": 13399 + }, + { + "epoch": 0.34, + "learning_rate": 1.962802947944635e-06, + "loss": 0.9707, + "step": 13400 + }, + { + "epoch": 0.34, + "learning_rate": 1.962795470894295e-06, + "loss": 0.8096, + "step": 13401 + }, + { + "epoch": 0.34, + "learning_rate": 1.9627879931067868e-06, + "loss": 0.8662, + "step": 13402 + }, + { + "epoch": 0.34, + "learning_rate": 1.9627805145821153e-06, + "loss": 0.9658, + "step": 13403 + }, + { + "epoch": 0.34, + "learning_rate": 1.9627730353202875e-06, + "loss": 0.917, + "step": 13404 + }, + { + "epoch": 0.34, + "learning_rate": 1.9627655553213086e-06, + "loss": 0.6838, + "step": 13405 + }, + { + "epoch": 0.34, + "learning_rate": 1.962758074585185e-06, + "loss": 0.7944, + "step": 13406 + }, + { + "epoch": 0.34, + "learning_rate": 1.962750593111921e-06, + "loss": 1.1201, + "step": 13407 + }, + { + "epoch": 0.34, + "learning_rate": 1.962743110901523e-06, + "loss": 0.8369, + "step": 13408 + }, + { + "epoch": 0.34, + "learning_rate": 1.9627356279539976e-06, + "loss": 0.9102, + "step": 13409 + }, + { + "epoch": 0.34, + "learning_rate": 1.9627281442693496e-06, + "loss": 0.7275, + "step": 13410 + }, + { + "epoch": 0.34, + "learning_rate": 1.9627206598475843e-06, + "loss": 0.7412, + "step": 13411 + }, + { + "epoch": 0.34, + "learning_rate": 1.962713174688709e-06, + "loss": 0.8289, + "step": 13412 + }, + { + "epoch": 0.34, + "learning_rate": 1.962705688792728e-06, + "loss": 0.8389, + "step": 13413 + }, + { + "epoch": 0.34, + "learning_rate": 1.962698202159648e-06, + "loss": 0.8945, + "step": 13414 + }, + { + "epoch": 0.34, + "learning_rate": 1.9626907147894735e-06, + "loss": 0.9014, + "step": 13415 + }, + { + "epoch": 0.34, + "learning_rate": 1.962683226682211e-06, + "loss": 0.9072, + "step": 13416 + }, + { + "epoch": 0.34, + "learning_rate": 1.9626757378378666e-06, + "loss": 0.9463, + "step": 13417 + }, + { + "epoch": 0.34, + "learning_rate": 1.9626682482564455e-06, + "loss": 0.8867, + "step": 13418 + }, + { + "epoch": 0.34, + "learning_rate": 1.9626607579379536e-06, + "loss": 0.9893, + "step": 13419 + }, + { + "epoch": 0.34, + "learning_rate": 1.962653266882397e-06, + "loss": 0.6162, + "step": 13420 + }, + { + "epoch": 0.34, + "learning_rate": 1.9626457750897806e-06, + "loss": 1.1484, + "step": 13421 + }, + { + "epoch": 0.34, + "learning_rate": 1.962638282560111e-06, + "loss": 0.8208, + "step": 13422 + }, + { + "epoch": 0.34, + "learning_rate": 1.962630789293393e-06, + "loss": 0.8252, + "step": 13423 + }, + { + "epoch": 0.34, + "learning_rate": 1.962623295289633e-06, + "loss": 0.9834, + "step": 13424 + }, + { + "epoch": 0.34, + "learning_rate": 1.962615800548837e-06, + "loss": 0.9746, + "step": 13425 + }, + { + "epoch": 0.34, + "learning_rate": 1.96260830507101e-06, + "loss": 0.8516, + "step": 13426 + }, + { + "epoch": 0.34, + "learning_rate": 1.962600808856158e-06, + "loss": 0.9795, + "step": 13427 + }, + { + "epoch": 0.34, + "learning_rate": 1.9625933119042873e-06, + "loss": 0.8516, + "step": 13428 + }, + { + "epoch": 0.34, + "learning_rate": 1.9625858142154027e-06, + "loss": 0.8574, + "step": 13429 + }, + { + "epoch": 0.34, + "learning_rate": 1.962578315789511e-06, + "loss": 0.8887, + "step": 13430 + }, + { + "epoch": 0.34, + "learning_rate": 1.9625708166266164e-06, + "loss": 1.0332, + "step": 13431 + }, + { + "epoch": 0.34, + "learning_rate": 1.9625633167267263e-06, + "loss": 0.9404, + "step": 13432 + }, + { + "epoch": 0.34, + "learning_rate": 1.9625558160898455e-06, + "loss": 1.0381, + "step": 13433 + }, + { + "epoch": 0.34, + "learning_rate": 1.96254831471598e-06, + "loss": 0.8735, + "step": 13434 + }, + { + "epoch": 0.34, + "learning_rate": 1.9625408126051352e-06, + "loss": 0.8203, + "step": 13435 + }, + { + "epoch": 0.34, + "learning_rate": 1.9625333097573176e-06, + "loss": 0.9492, + "step": 13436 + }, + { + "epoch": 0.34, + "learning_rate": 1.9625258061725326e-06, + "loss": 0.8359, + "step": 13437 + }, + { + "epoch": 0.34, + "learning_rate": 1.9625183018507854e-06, + "loss": 0.749, + "step": 13438 + }, + { + "epoch": 0.34, + "learning_rate": 1.9625107967920826e-06, + "loss": 0.7173, + "step": 13439 + }, + { + "epoch": 0.34, + "learning_rate": 1.962503290996429e-06, + "loss": 0.9385, + "step": 13440 + }, + { + "epoch": 0.34, + "learning_rate": 1.9624957844638312e-06, + "loss": 0.7812, + "step": 13441 + }, + { + "epoch": 0.34, + "learning_rate": 1.962488277194295e-06, + "loss": 1.166, + "step": 13442 + }, + { + "epoch": 0.34, + "learning_rate": 1.962480769187825e-06, + "loss": 0.8291, + "step": 13443 + }, + { + "epoch": 0.34, + "learning_rate": 1.9624732604444283e-06, + "loss": 0.8848, + "step": 13444 + }, + { + "epoch": 0.34, + "learning_rate": 1.96246575096411e-06, + "loss": 0.8652, + "step": 13445 + }, + { + "epoch": 0.34, + "learning_rate": 1.962458240746876e-06, + "loss": 0.8125, + "step": 13446 + }, + { + "epoch": 0.34, + "learning_rate": 1.962450729792732e-06, + "loss": 1.084, + "step": 13447 + }, + { + "epoch": 0.34, + "learning_rate": 1.9624432181016833e-06, + "loss": 0.8691, + "step": 13448 + }, + { + "epoch": 0.34, + "learning_rate": 1.9624357056737362e-06, + "loss": 0.8662, + "step": 13449 + }, + { + "epoch": 0.34, + "learning_rate": 1.962428192508897e-06, + "loss": 0.8047, + "step": 13450 + }, + { + "epoch": 0.34, + "learning_rate": 1.96242067860717e-06, + "loss": 0.9482, + "step": 13451 + }, + { + "epoch": 0.34, + "learning_rate": 1.9624131639685623e-06, + "loss": 1.0654, + "step": 13452 + }, + { + "epoch": 0.34, + "learning_rate": 1.9624056485930787e-06, + "loss": 0.9932, + "step": 13453 + }, + { + "epoch": 0.34, + "learning_rate": 1.9623981324807256e-06, + "loss": 0.8701, + "step": 13454 + }, + { + "epoch": 0.34, + "learning_rate": 1.9623906156315084e-06, + "loss": 0.8574, + "step": 13455 + }, + { + "epoch": 0.34, + "learning_rate": 1.9623830980454327e-06, + "loss": 1.0557, + "step": 13456 + }, + { + "epoch": 0.34, + "learning_rate": 1.9623755797225048e-06, + "loss": 0.918, + "step": 13457 + }, + { + "epoch": 0.34, + "learning_rate": 1.9623680606627302e-06, + "loss": 0.7041, + "step": 13458 + }, + { + "epoch": 0.34, + "learning_rate": 1.9623605408661145e-06, + "loss": 0.666, + "step": 13459 + }, + { + "epoch": 0.34, + "learning_rate": 1.9623530203326636e-06, + "loss": 1.1211, + "step": 13460 + }, + { + "epoch": 0.35, + "learning_rate": 1.9623454990623834e-06, + "loss": 0.6279, + "step": 13461 + }, + { + "epoch": 0.35, + "learning_rate": 1.9623379770552793e-06, + "loss": 1.0098, + "step": 13462 + }, + { + "epoch": 0.35, + "learning_rate": 1.9623304543113574e-06, + "loss": 1.0605, + "step": 13463 + }, + { + "epoch": 0.35, + "learning_rate": 1.962322930830623e-06, + "loss": 0.9043, + "step": 13464 + }, + { + "epoch": 0.35, + "learning_rate": 1.962315406613083e-06, + "loss": 0.8799, + "step": 13465 + }, + { + "epoch": 0.35, + "learning_rate": 1.9623078816587417e-06, + "loss": 0.7598, + "step": 13466 + }, + { + "epoch": 0.35, + "learning_rate": 1.9623003559676055e-06, + "loss": 0.6401, + "step": 13467 + }, + { + "epoch": 0.35, + "learning_rate": 1.9622928295396802e-06, + "loss": 1.0039, + "step": 13468 + }, + { + "epoch": 0.35, + "learning_rate": 1.9622853023749714e-06, + "loss": 0.8486, + "step": 13469 + }, + { + "epoch": 0.35, + "learning_rate": 1.9622777744734854e-06, + "loss": 0.874, + "step": 13470 + }, + { + "epoch": 0.35, + "learning_rate": 1.962270245835227e-06, + "loss": 0.8096, + "step": 13471 + }, + { + "epoch": 0.35, + "learning_rate": 1.962262716460203e-06, + "loss": 0.7852, + "step": 13472 + }, + { + "epoch": 0.35, + "learning_rate": 1.9622551863484186e-06, + "loss": 0.8711, + "step": 13473 + }, + { + "epoch": 0.35, + "learning_rate": 1.9622476554998797e-06, + "loss": 0.9678, + "step": 13474 + }, + { + "epoch": 0.35, + "learning_rate": 1.962240123914592e-06, + "loss": 0.8789, + "step": 13475 + }, + { + "epoch": 0.35, + "learning_rate": 1.9622325915925607e-06, + "loss": 0.8857, + "step": 13476 + }, + { + "epoch": 0.35, + "learning_rate": 1.962225058533793e-06, + "loss": 0.7725, + "step": 13477 + }, + { + "epoch": 0.35, + "learning_rate": 1.9622175247382935e-06, + "loss": 0.6416, + "step": 13478 + }, + { + "epoch": 0.35, + "learning_rate": 1.962209990206068e-06, + "loss": 0.9111, + "step": 13479 + }, + { + "epoch": 0.35, + "learning_rate": 1.9622024549371228e-06, + "loss": 0.9688, + "step": 13480 + }, + { + "epoch": 0.35, + "learning_rate": 1.9621949189314635e-06, + "loss": 0.9736, + "step": 13481 + }, + { + "epoch": 0.35, + "learning_rate": 1.9621873821890957e-06, + "loss": 0.8154, + "step": 13482 + }, + { + "epoch": 0.35, + "learning_rate": 1.962179844710025e-06, + "loss": 1.0996, + "step": 13483 + }, + { + "epoch": 0.35, + "learning_rate": 1.962172306494258e-06, + "loss": 0.9072, + "step": 13484 + }, + { + "epoch": 0.35, + "learning_rate": 1.9621647675417994e-06, + "loss": 0.7144, + "step": 13485 + }, + { + "epoch": 0.35, + "learning_rate": 1.9621572278526555e-06, + "loss": 0.8472, + "step": 13486 + }, + { + "epoch": 0.35, + "learning_rate": 1.9621496874268323e-06, + "loss": 0.6958, + "step": 13487 + }, + { + "epoch": 0.35, + "learning_rate": 1.9621421462643353e-06, + "loss": 0.9893, + "step": 13488 + }, + { + "epoch": 0.35, + "learning_rate": 1.9621346043651703e-06, + "loss": 1.1025, + "step": 13489 + }, + { + "epoch": 0.35, + "learning_rate": 1.9621270617293433e-06, + "loss": 0.8682, + "step": 13490 + }, + { + "epoch": 0.35, + "learning_rate": 1.9621195183568593e-06, + "loss": 0.8896, + "step": 13491 + }, + { + "epoch": 0.35, + "learning_rate": 1.9621119742477252e-06, + "loss": 0.6711, + "step": 13492 + }, + { + "epoch": 0.35, + "learning_rate": 1.9621044294019456e-06, + "loss": 0.8066, + "step": 13493 + }, + { + "epoch": 0.35, + "learning_rate": 1.9620968838195273e-06, + "loss": 0.918, + "step": 13494 + }, + { + "epoch": 0.35, + "learning_rate": 1.9620893375004753e-06, + "loss": 0.8672, + "step": 13495 + }, + { + "epoch": 0.35, + "learning_rate": 1.962081790444796e-06, + "loss": 0.8682, + "step": 13496 + }, + { + "epoch": 0.35, + "learning_rate": 1.962074242652495e-06, + "loss": 0.8965, + "step": 13497 + }, + { + "epoch": 0.35, + "learning_rate": 1.9620666941235778e-06, + "loss": 0.7543, + "step": 13498 + }, + { + "epoch": 0.35, + "learning_rate": 1.9620591448580506e-06, + "loss": 0.957, + "step": 13499 + }, + { + "epoch": 0.35, + "learning_rate": 1.962051594855919e-06, + "loss": 0.8799, + "step": 13500 + }, + { + "epoch": 0.35, + "learning_rate": 1.962044044117188e-06, + "loss": 0.7432, + "step": 13501 + }, + { + "epoch": 0.35, + "learning_rate": 1.962036492641865e-06, + "loss": 1.2236, + "step": 13502 + }, + { + "epoch": 0.35, + "learning_rate": 1.9620289404299543e-06, + "loss": 0.998, + "step": 13503 + }, + { + "epoch": 0.35, + "learning_rate": 1.9620213874814626e-06, + "loss": 0.9951, + "step": 13504 + }, + { + "epoch": 0.35, + "learning_rate": 1.9620138337963953e-06, + "loss": 0.8408, + "step": 13505 + }, + { + "epoch": 0.35, + "learning_rate": 1.962006279374758e-06, + "loss": 0.8223, + "step": 13506 + }, + { + "epoch": 0.35, + "learning_rate": 1.961998724216557e-06, + "loss": 0.8682, + "step": 13507 + }, + { + "epoch": 0.35, + "learning_rate": 1.9619911683217977e-06, + "loss": 0.7495, + "step": 13508 + }, + { + "epoch": 0.35, + "learning_rate": 1.9619836116904864e-06, + "loss": 0.8887, + "step": 13509 + }, + { + "epoch": 0.35, + "learning_rate": 1.961976054322628e-06, + "loss": 0.999, + "step": 13510 + }, + { + "epoch": 0.35, + "learning_rate": 1.961968496218229e-06, + "loss": 1.0137, + "step": 13511 + }, + { + "epoch": 0.35, + "learning_rate": 1.9619609373772944e-06, + "loss": 0.7275, + "step": 13512 + }, + { + "epoch": 0.35, + "learning_rate": 1.961953377799831e-06, + "loss": 0.7695, + "step": 13513 + }, + { + "epoch": 0.35, + "learning_rate": 1.9619458174858444e-06, + "loss": 0.5688, + "step": 13514 + }, + { + "epoch": 0.35, + "learning_rate": 1.96193825643534e-06, + "loss": 1.0205, + "step": 13515 + }, + { + "epoch": 0.35, + "learning_rate": 1.9619306946483232e-06, + "loss": 1.0654, + "step": 13516 + }, + { + "epoch": 0.35, + "learning_rate": 1.961923132124801e-06, + "loss": 0.7798, + "step": 13517 + }, + { + "epoch": 0.35, + "learning_rate": 1.961915568864778e-06, + "loss": 0.9521, + "step": 13518 + }, + { + "epoch": 0.35, + "learning_rate": 1.9619080048682605e-06, + "loss": 0.9072, + "step": 13519 + }, + { + "epoch": 0.35, + "learning_rate": 1.9619004401352543e-06, + "loss": 0.8291, + "step": 13520 + }, + { + "epoch": 0.35, + "learning_rate": 1.9618928746657654e-06, + "loss": 0.6948, + "step": 13521 + }, + { + "epoch": 0.35, + "learning_rate": 1.961885308459799e-06, + "loss": 0.9004, + "step": 13522 + }, + { + "epoch": 0.35, + "learning_rate": 1.9618777415173616e-06, + "loss": 0.7407, + "step": 13523 + }, + { + "epoch": 0.35, + "learning_rate": 1.9618701738384583e-06, + "loss": 0.9248, + "step": 13524 + }, + { + "epoch": 0.35, + "learning_rate": 1.9618626054230955e-06, + "loss": 0.8838, + "step": 13525 + }, + { + "epoch": 0.35, + "learning_rate": 1.9618550362712786e-06, + "loss": 1.0186, + "step": 13526 + }, + { + "epoch": 0.35, + "learning_rate": 1.9618474663830135e-06, + "loss": 0.7705, + "step": 13527 + }, + { + "epoch": 0.35, + "learning_rate": 1.961839895758306e-06, + "loss": 0.9209, + "step": 13528 + }, + { + "epoch": 0.35, + "learning_rate": 1.9618323243971623e-06, + "loss": 0.9707, + "step": 13529 + }, + { + "epoch": 0.35, + "learning_rate": 1.9618247522995875e-06, + "loss": 0.9326, + "step": 13530 + }, + { + "epoch": 0.35, + "learning_rate": 1.9618171794655875e-06, + "loss": 1.0781, + "step": 13531 + }, + { + "epoch": 0.35, + "learning_rate": 1.9618096058951686e-06, + "loss": 1.0439, + "step": 13532 + }, + { + "epoch": 0.35, + "learning_rate": 1.9618020315883362e-06, + "loss": 0.8193, + "step": 13533 + }, + { + "epoch": 0.35, + "learning_rate": 1.9617944565450964e-06, + "loss": 0.7607, + "step": 13534 + }, + { + "epoch": 0.35, + "learning_rate": 1.9617868807654546e-06, + "loss": 1.0244, + "step": 13535 + }, + { + "epoch": 0.35, + "learning_rate": 1.9617793042494172e-06, + "loss": 0.9502, + "step": 13536 + }, + { + "epoch": 0.35, + "learning_rate": 1.961771726996989e-06, + "loss": 0.7412, + "step": 13537 + }, + { + "epoch": 0.35, + "learning_rate": 1.9617641490081767e-06, + "loss": 0.7395, + "step": 13538 + }, + { + "epoch": 0.35, + "learning_rate": 1.961756570282986e-06, + "loss": 0.7756, + "step": 13539 + }, + { + "epoch": 0.35, + "learning_rate": 1.9617489908214223e-06, + "loss": 1.0156, + "step": 13540 + }, + { + "epoch": 0.35, + "learning_rate": 1.9617414106234915e-06, + "loss": 0.9395, + "step": 13541 + }, + { + "epoch": 0.35, + "learning_rate": 1.9617338296892e-06, + "loss": 0.9482, + "step": 13542 + }, + { + "epoch": 0.35, + "learning_rate": 1.9617262480185527e-06, + "loss": 0.9297, + "step": 13543 + }, + { + "epoch": 0.35, + "learning_rate": 1.9617186656115557e-06, + "loss": 0.7773, + "step": 13544 + }, + { + "epoch": 0.35, + "learning_rate": 1.9617110824682152e-06, + "loss": 0.9727, + "step": 13545 + }, + { + "epoch": 0.35, + "learning_rate": 1.9617034985885367e-06, + "loss": 0.7578, + "step": 13546 + }, + { + "epoch": 0.35, + "learning_rate": 1.961695913972526e-06, + "loss": 0.9844, + "step": 13547 + }, + { + "epoch": 0.35, + "learning_rate": 1.9616883286201893e-06, + "loss": 0.874, + "step": 13548 + }, + { + "epoch": 0.35, + "learning_rate": 1.9616807425315314e-06, + "loss": 1.0127, + "step": 13549 + }, + { + "epoch": 0.35, + "learning_rate": 1.9616731557065597e-06, + "loss": 0.918, + "step": 13550 + }, + { + "epoch": 0.35, + "learning_rate": 1.9616655681452783e-06, + "loss": 0.9214, + "step": 13551 + }, + { + "epoch": 0.35, + "learning_rate": 1.9616579798476944e-06, + "loss": 0.8257, + "step": 13552 + }, + { + "epoch": 0.35, + "learning_rate": 1.9616503908138123e-06, + "loss": 0.9404, + "step": 13553 + }, + { + "epoch": 0.35, + "learning_rate": 1.9616428010436397e-06, + "loss": 0.998, + "step": 13554 + }, + { + "epoch": 0.35, + "learning_rate": 1.9616352105371807e-06, + "loss": 0.6592, + "step": 13555 + }, + { + "epoch": 0.35, + "learning_rate": 1.961627619294442e-06, + "loss": 1.0283, + "step": 13556 + }, + { + "epoch": 0.35, + "learning_rate": 1.96162002731543e-06, + "loss": 0.9326, + "step": 13557 + }, + { + "epoch": 0.35, + "learning_rate": 1.9616124346001487e-06, + "loss": 0.9082, + "step": 13558 + }, + { + "epoch": 0.35, + "learning_rate": 1.9616048411486057e-06, + "loss": 0.9111, + "step": 13559 + }, + { + "epoch": 0.35, + "learning_rate": 1.961597246960806e-06, + "loss": 0.9053, + "step": 13560 + }, + { + "epoch": 0.35, + "learning_rate": 1.961589652036755e-06, + "loss": 0.7529, + "step": 13561 + }, + { + "epoch": 0.35, + "learning_rate": 1.9615820563764593e-06, + "loss": 0.9912, + "step": 13562 + }, + { + "epoch": 0.35, + "learning_rate": 1.9615744599799246e-06, + "loss": 0.9814, + "step": 13563 + }, + { + "epoch": 0.35, + "learning_rate": 1.961566862847156e-06, + "loss": 1.0938, + "step": 13564 + }, + { + "epoch": 0.35, + "learning_rate": 1.9615592649781605e-06, + "loss": 1.124, + "step": 13565 + }, + { + "epoch": 0.35, + "learning_rate": 1.961551666372943e-06, + "loss": 0.9404, + "step": 13566 + }, + { + "epoch": 0.35, + "learning_rate": 1.96154406703151e-06, + "loss": 0.8145, + "step": 13567 + }, + { + "epoch": 0.35, + "learning_rate": 1.9615364669538664e-06, + "loss": 0.9951, + "step": 13568 + }, + { + "epoch": 0.35, + "learning_rate": 1.961528866140019e-06, + "loss": 0.7407, + "step": 13569 + }, + { + "epoch": 0.35, + "learning_rate": 1.9615212645899727e-06, + "loss": 0.9902, + "step": 13570 + }, + { + "epoch": 0.35, + "learning_rate": 1.961513662303734e-06, + "loss": 1.04, + "step": 13571 + }, + { + "epoch": 0.35, + "learning_rate": 1.9615060592813084e-06, + "loss": 0.7183, + "step": 13572 + }, + { + "epoch": 0.35, + "learning_rate": 1.9614984555227017e-06, + "loss": 0.9746, + "step": 13573 + }, + { + "epoch": 0.35, + "learning_rate": 1.96149085102792e-06, + "loss": 0.9258, + "step": 13574 + }, + { + "epoch": 0.35, + "learning_rate": 1.9614832457969694e-06, + "loss": 0.9268, + "step": 13575 + }, + { + "epoch": 0.35, + "learning_rate": 1.9614756398298547e-06, + "loss": 0.8496, + "step": 13576 + }, + { + "epoch": 0.35, + "learning_rate": 1.9614680331265825e-06, + "loss": 0.7734, + "step": 13577 + }, + { + "epoch": 0.35, + "learning_rate": 1.9614604256871585e-06, + "loss": 0.8218, + "step": 13578 + }, + { + "epoch": 0.35, + "learning_rate": 1.9614528175115885e-06, + "loss": 0.9688, + "step": 13579 + }, + { + "epoch": 0.35, + "learning_rate": 1.961445208599878e-06, + "loss": 0.9951, + "step": 13580 + }, + { + "epoch": 0.35, + "learning_rate": 1.9614375989520335e-06, + "loss": 0.8467, + "step": 13581 + }, + { + "epoch": 0.35, + "learning_rate": 1.96142998856806e-06, + "loss": 0.9834, + "step": 13582 + }, + { + "epoch": 0.35, + "learning_rate": 1.961422377447964e-06, + "loss": 0.8359, + "step": 13583 + }, + { + "epoch": 0.35, + "learning_rate": 1.9614147655917513e-06, + "loss": 0.9297, + "step": 13584 + }, + { + "epoch": 0.35, + "learning_rate": 1.961407152999427e-06, + "loss": 1.0303, + "step": 13585 + }, + { + "epoch": 0.35, + "learning_rate": 1.961399539670998e-06, + "loss": 0.7236, + "step": 13586 + }, + { + "epoch": 0.35, + "learning_rate": 1.9613919256064695e-06, + "loss": 0.8838, + "step": 13587 + }, + { + "epoch": 0.35, + "learning_rate": 1.961384310805847e-06, + "loss": 0.7715, + "step": 13588 + }, + { + "epoch": 0.35, + "learning_rate": 1.961376695269137e-06, + "loss": 1.0625, + "step": 13589 + }, + { + "epoch": 0.35, + "learning_rate": 1.961369078996345e-06, + "loss": 0.9453, + "step": 13590 + }, + { + "epoch": 0.35, + "learning_rate": 1.961361461987477e-06, + "loss": 0.8555, + "step": 13591 + }, + { + "epoch": 0.35, + "learning_rate": 1.961353844242539e-06, + "loss": 0.8447, + "step": 13592 + }, + { + "epoch": 0.35, + "learning_rate": 1.961346225761536e-06, + "loss": 1.0195, + "step": 13593 + }, + { + "epoch": 0.35, + "learning_rate": 1.9613386065444747e-06, + "loss": 1.0762, + "step": 13594 + }, + { + "epoch": 0.35, + "learning_rate": 1.9613309865913604e-06, + "loss": 0.9014, + "step": 13595 + }, + { + "epoch": 0.35, + "learning_rate": 1.9613233659021995e-06, + "loss": 1.1543, + "step": 13596 + }, + { + "epoch": 0.35, + "learning_rate": 1.9613157444769974e-06, + "loss": 1.0, + "step": 13597 + }, + { + "epoch": 0.35, + "learning_rate": 1.96130812231576e-06, + "loss": 1.083, + "step": 13598 + }, + { + "epoch": 0.35, + "learning_rate": 1.961300499418493e-06, + "loss": 0.8877, + "step": 13599 + }, + { + "epoch": 0.35, + "learning_rate": 1.9612928757852028e-06, + "loss": 0.7822, + "step": 13600 + }, + { + "epoch": 0.35, + "learning_rate": 1.9612852514158946e-06, + "loss": 1.1025, + "step": 13601 + }, + { + "epoch": 0.35, + "learning_rate": 1.9612776263105745e-06, + "loss": 0.9014, + "step": 13602 + }, + { + "epoch": 0.35, + "learning_rate": 1.9612700004692484e-06, + "loss": 1.2051, + "step": 13603 + }, + { + "epoch": 0.35, + "learning_rate": 1.961262373891922e-06, + "loss": 1.0244, + "step": 13604 + }, + { + "epoch": 0.35, + "learning_rate": 1.961254746578601e-06, + "loss": 0.9893, + "step": 13605 + }, + { + "epoch": 0.35, + "learning_rate": 1.961247118529292e-06, + "loss": 0.9902, + "step": 13606 + }, + { + "epoch": 0.35, + "learning_rate": 1.961239489744e-06, + "loss": 0.9775, + "step": 13607 + }, + { + "epoch": 0.35, + "learning_rate": 1.9612318602227306e-06, + "loss": 0.7627, + "step": 13608 + }, + { + "epoch": 0.35, + "learning_rate": 1.9612242299654906e-06, + "loss": 0.8398, + "step": 13609 + }, + { + "epoch": 0.35, + "learning_rate": 1.9612165989722856e-06, + "loss": 0.9453, + "step": 13610 + }, + { + "epoch": 0.35, + "learning_rate": 1.9612089672431213e-06, + "loss": 1.125, + "step": 13611 + }, + { + "epoch": 0.35, + "learning_rate": 1.961201334778003e-06, + "loss": 0.9229, + "step": 13612 + }, + { + "epoch": 0.35, + "learning_rate": 1.961193701576937e-06, + "loss": 0.9531, + "step": 13613 + }, + { + "epoch": 0.35, + "learning_rate": 1.9611860676399295e-06, + "loss": 0.8691, + "step": 13614 + }, + { + "epoch": 0.35, + "learning_rate": 1.961178432966986e-06, + "loss": 0.7915, + "step": 13615 + }, + { + "epoch": 0.35, + "learning_rate": 1.9611707975581123e-06, + "loss": 0.9795, + "step": 13616 + }, + { + "epoch": 0.35, + "learning_rate": 1.9611631614133144e-06, + "loss": 0.709, + "step": 13617 + }, + { + "epoch": 0.35, + "learning_rate": 1.961155524532598e-06, + "loss": 0.7988, + "step": 13618 + }, + { + "epoch": 0.35, + "learning_rate": 1.961147886915969e-06, + "loss": 1.0127, + "step": 13619 + }, + { + "epoch": 0.35, + "learning_rate": 1.9611402485634337e-06, + "loss": 0.6426, + "step": 13620 + }, + { + "epoch": 0.35, + "learning_rate": 1.9611326094749968e-06, + "loss": 0.8535, + "step": 13621 + }, + { + "epoch": 0.35, + "learning_rate": 1.9611249696506653e-06, + "loss": 0.8711, + "step": 13622 + }, + { + "epoch": 0.35, + "learning_rate": 1.9611173290904443e-06, + "loss": 0.8389, + "step": 13623 + }, + { + "epoch": 0.35, + "learning_rate": 1.96110968779434e-06, + "loss": 0.6367, + "step": 13624 + }, + { + "epoch": 0.35, + "learning_rate": 1.9611020457623587e-06, + "loss": 0.5769, + "step": 13625 + }, + { + "epoch": 0.35, + "learning_rate": 1.961094402994505e-06, + "loss": 0.6895, + "step": 13626 + }, + { + "epoch": 0.35, + "learning_rate": 1.9610867594907862e-06, + "loss": 0.8818, + "step": 13627 + }, + { + "epoch": 0.35, + "learning_rate": 1.961079115251207e-06, + "loss": 0.873, + "step": 13628 + }, + { + "epoch": 0.35, + "learning_rate": 1.961071470275774e-06, + "loss": 0.9727, + "step": 13629 + }, + { + "epoch": 0.35, + "learning_rate": 1.9610638245644926e-06, + "loss": 0.9287, + "step": 13630 + }, + { + "epoch": 0.35, + "learning_rate": 1.961056178117369e-06, + "loss": 0.8096, + "step": 13631 + }, + { + "epoch": 0.35, + "learning_rate": 1.9610485309344086e-06, + "loss": 0.8955, + "step": 13632 + }, + { + "epoch": 0.35, + "learning_rate": 1.9610408830156177e-06, + "loss": 0.9243, + "step": 13633 + }, + { + "epoch": 0.35, + "learning_rate": 1.961033234361002e-06, + "loss": 1.1406, + "step": 13634 + }, + { + "epoch": 0.35, + "learning_rate": 1.961025584970567e-06, + "loss": 0.7974, + "step": 13635 + }, + { + "epoch": 0.35, + "learning_rate": 1.9610179348443195e-06, + "loss": 1.041, + "step": 13636 + }, + { + "epoch": 0.35, + "learning_rate": 1.9610102839822644e-06, + "loss": 1.0596, + "step": 13637 + }, + { + "epoch": 0.35, + "learning_rate": 1.961002632384408e-06, + "loss": 0.8848, + "step": 13638 + }, + { + "epoch": 0.35, + "learning_rate": 1.960994980050756e-06, + "loss": 1.1914, + "step": 13639 + }, + { + "epoch": 0.35, + "learning_rate": 1.9609873269813143e-06, + "loss": 0.707, + "step": 13640 + }, + { + "epoch": 0.35, + "learning_rate": 1.9609796731760886e-06, + "loss": 1.0303, + "step": 13641 + }, + { + "epoch": 0.35, + "learning_rate": 1.9609720186350853e-06, + "loss": 0.7241, + "step": 13642 + }, + { + "epoch": 0.35, + "learning_rate": 1.96096436335831e-06, + "loss": 0.9883, + "step": 13643 + }, + { + "epoch": 0.35, + "learning_rate": 1.9609567073457683e-06, + "loss": 1.1582, + "step": 13644 + }, + { + "epoch": 0.35, + "learning_rate": 1.960949050597466e-06, + "loss": 0.8828, + "step": 13645 + }, + { + "epoch": 0.35, + "learning_rate": 1.9609413931134095e-06, + "loss": 0.8164, + "step": 13646 + }, + { + "epoch": 0.35, + "learning_rate": 1.9609337348936044e-06, + "loss": 0.877, + "step": 13647 + }, + { + "epoch": 0.35, + "learning_rate": 1.9609260759380564e-06, + "loss": 0.8408, + "step": 13648 + }, + { + "epoch": 0.35, + "learning_rate": 1.9609184162467712e-06, + "loss": 0.7529, + "step": 13649 + }, + { + "epoch": 0.35, + "learning_rate": 1.9609107558197554e-06, + "loss": 1.0127, + "step": 13650 + }, + { + "epoch": 0.35, + "learning_rate": 1.9609030946570144e-06, + "loss": 0.8442, + "step": 13651 + }, + { + "epoch": 0.35, + "learning_rate": 1.9608954327585537e-06, + "loss": 0.7554, + "step": 13652 + }, + { + "epoch": 0.35, + "learning_rate": 1.9608877701243796e-06, + "loss": 1.0215, + "step": 13653 + }, + { + "epoch": 0.35, + "learning_rate": 1.9608801067544986e-06, + "loss": 1.0059, + "step": 13654 + }, + { + "epoch": 0.35, + "learning_rate": 1.9608724426489152e-06, + "loss": 0.8574, + "step": 13655 + }, + { + "epoch": 0.35, + "learning_rate": 1.9608647778076363e-06, + "loss": 0.8442, + "step": 13656 + }, + { + "epoch": 0.35, + "learning_rate": 1.960857112230667e-06, + "loss": 0.9834, + "step": 13657 + }, + { + "epoch": 0.35, + "learning_rate": 1.960849445918014e-06, + "loss": 0.9814, + "step": 13658 + }, + { + "epoch": 0.35, + "learning_rate": 1.9608417788696827e-06, + "loss": 0.8809, + "step": 13659 + }, + { + "epoch": 0.35, + "learning_rate": 1.960834111085679e-06, + "loss": 0.9009, + "step": 13660 + }, + { + "epoch": 0.35, + "learning_rate": 1.9608264425660085e-06, + "loss": 0.9062, + "step": 13661 + }, + { + "epoch": 0.35, + "learning_rate": 1.960818773310678e-06, + "loss": 0.9287, + "step": 13662 + }, + { + "epoch": 0.35, + "learning_rate": 1.9608111033196923e-06, + "loss": 0.8486, + "step": 13663 + }, + { + "epoch": 0.35, + "learning_rate": 1.9608034325930574e-06, + "loss": 0.731, + "step": 13664 + }, + { + "epoch": 0.35, + "learning_rate": 1.9607957611307803e-06, + "loss": 0.9092, + "step": 13665 + }, + { + "epoch": 0.35, + "learning_rate": 1.9607880889328653e-06, + "loss": 0.8145, + "step": 13666 + }, + { + "epoch": 0.35, + "learning_rate": 1.9607804159993194e-06, + "loss": 0.9648, + "step": 13667 + }, + { + "epoch": 0.35, + "learning_rate": 1.9607727423301484e-06, + "loss": 0.9863, + "step": 13668 + }, + { + "epoch": 0.35, + "learning_rate": 1.9607650679253576e-06, + "loss": 0.9307, + "step": 13669 + }, + { + "epoch": 0.35, + "learning_rate": 1.960757392784953e-06, + "loss": 0.8916, + "step": 13670 + }, + { + "epoch": 0.35, + "learning_rate": 1.960749716908941e-06, + "loss": 0.7764, + "step": 13671 + }, + { + "epoch": 0.35, + "learning_rate": 1.9607420402973265e-06, + "loss": 0.6411, + "step": 13672 + }, + { + "epoch": 0.35, + "learning_rate": 1.9607343629501165e-06, + "loss": 0.8379, + "step": 13673 + }, + { + "epoch": 0.35, + "learning_rate": 1.9607266848673164e-06, + "loss": 0.7837, + "step": 13674 + }, + { + "epoch": 0.35, + "learning_rate": 1.960719006048932e-06, + "loss": 0.9541, + "step": 13675 + }, + { + "epoch": 0.35, + "learning_rate": 1.960711326494969e-06, + "loss": 0.6724, + "step": 13676 + }, + { + "epoch": 0.35, + "learning_rate": 1.9607036462054335e-06, + "loss": 0.8296, + "step": 13677 + }, + { + "epoch": 0.35, + "learning_rate": 1.960695965180332e-06, + "loss": 0.7871, + "step": 13678 + }, + { + "epoch": 0.35, + "learning_rate": 1.9606882834196693e-06, + "loss": 0.8994, + "step": 13679 + }, + { + "epoch": 0.35, + "learning_rate": 1.960680600923452e-06, + "loss": 0.8145, + "step": 13680 + }, + { + "epoch": 0.35, + "learning_rate": 1.960672917691685e-06, + "loss": 0.8662, + "step": 13681 + }, + { + "epoch": 0.35, + "learning_rate": 1.9606652337243755e-06, + "loss": 0.9395, + "step": 13682 + }, + { + "epoch": 0.35, + "learning_rate": 1.960657549021529e-06, + "loss": 0.8018, + "step": 13683 + }, + { + "epoch": 0.35, + "learning_rate": 1.960649863583151e-06, + "loss": 0.959, + "step": 13684 + }, + { + "epoch": 0.35, + "learning_rate": 1.9606421774092473e-06, + "loss": 0.7344, + "step": 13685 + }, + { + "epoch": 0.35, + "learning_rate": 1.9606344904998243e-06, + "loss": 0.6802, + "step": 13686 + }, + { + "epoch": 0.35, + "learning_rate": 1.9606268028548874e-06, + "loss": 1.0234, + "step": 13687 + }, + { + "epoch": 0.35, + "learning_rate": 1.960619114474443e-06, + "loss": 0.8267, + "step": 13688 + }, + { + "epoch": 0.35, + "learning_rate": 1.9606114253584967e-06, + "loss": 0.8525, + "step": 13689 + }, + { + "epoch": 0.35, + "learning_rate": 1.9606037355070547e-06, + "loss": 0.9072, + "step": 13690 + }, + { + "epoch": 0.35, + "learning_rate": 1.960596044920122e-06, + "loss": 1.0977, + "step": 13691 + }, + { + "epoch": 0.35, + "learning_rate": 1.9605883535977053e-06, + "loss": 0.6934, + "step": 13692 + }, + { + "epoch": 0.35, + "learning_rate": 1.9605806615398102e-06, + "loss": 0.9346, + "step": 13693 + }, + { + "epoch": 0.35, + "learning_rate": 1.960572968746443e-06, + "loss": 0.8906, + "step": 13694 + }, + { + "epoch": 0.35, + "learning_rate": 1.960565275217609e-06, + "loss": 1.0127, + "step": 13695 + }, + { + "epoch": 0.35, + "learning_rate": 1.960557580953314e-06, + "loss": 1.0439, + "step": 13696 + }, + { + "epoch": 0.35, + "learning_rate": 1.960549885953565e-06, + "loss": 0.9121, + "step": 13697 + }, + { + "epoch": 0.35, + "learning_rate": 1.9605421902183664e-06, + "loss": 0.7959, + "step": 13698 + }, + { + "epoch": 0.35, + "learning_rate": 1.960534493747725e-06, + "loss": 0.6616, + "step": 13699 + }, + { + "epoch": 0.35, + "learning_rate": 1.9605267965416466e-06, + "loss": 0.8345, + "step": 13700 + }, + { + "epoch": 0.35, + "learning_rate": 1.960519098600137e-06, + "loss": 1.124, + "step": 13701 + }, + { + "epoch": 0.35, + "learning_rate": 1.960511399923202e-06, + "loss": 0.9268, + "step": 13702 + }, + { + "epoch": 0.35, + "learning_rate": 1.9605037005108477e-06, + "loss": 0.7529, + "step": 13703 + }, + { + "epoch": 0.35, + "learning_rate": 1.96049600036308e-06, + "loss": 0.9277, + "step": 13704 + }, + { + "epoch": 0.35, + "learning_rate": 1.9604882994799044e-06, + "loss": 0.9668, + "step": 13705 + }, + { + "epoch": 0.35, + "learning_rate": 1.9604805978613274e-06, + "loss": 0.9785, + "step": 13706 + }, + { + "epoch": 0.35, + "learning_rate": 1.9604728955073543e-06, + "loss": 0.8506, + "step": 13707 + }, + { + "epoch": 0.35, + "learning_rate": 1.9604651924179913e-06, + "loss": 0.6016, + "step": 13708 + }, + { + "epoch": 0.35, + "learning_rate": 1.960457488593244e-06, + "loss": 0.7788, + "step": 13709 + }, + { + "epoch": 0.35, + "learning_rate": 1.9604497840331195e-06, + "loss": 0.6895, + "step": 13710 + }, + { + "epoch": 0.35, + "learning_rate": 1.9604420787376216e-06, + "loss": 1.042, + "step": 13711 + }, + { + "epoch": 0.35, + "learning_rate": 1.960434372706758e-06, + "loss": 0.9023, + "step": 13712 + }, + { + "epoch": 0.35, + "learning_rate": 1.960426665940534e-06, + "loss": 0.8477, + "step": 13713 + }, + { + "epoch": 0.35, + "learning_rate": 1.9604189584389556e-06, + "loss": 0.8066, + "step": 13714 + }, + { + "epoch": 0.35, + "learning_rate": 1.960411250202028e-06, + "loss": 0.9062, + "step": 13715 + }, + { + "epoch": 0.35, + "learning_rate": 1.960403541229758e-06, + "loss": 0.9561, + "step": 13716 + }, + { + "epoch": 0.35, + "learning_rate": 1.960395831522151e-06, + "loss": 0.998, + "step": 13717 + }, + { + "epoch": 0.35, + "learning_rate": 1.960388121079213e-06, + "loss": 1.1309, + "step": 13718 + }, + { + "epoch": 0.35, + "learning_rate": 1.9603804099009503e-06, + "loss": 0.9277, + "step": 13719 + }, + { + "epoch": 0.35, + "learning_rate": 1.9603726979873684e-06, + "loss": 1.1289, + "step": 13720 + }, + { + "epoch": 0.35, + "learning_rate": 1.9603649853384734e-06, + "loss": 1.0049, + "step": 13721 + }, + { + "epoch": 0.35, + "learning_rate": 1.9603572719542707e-06, + "loss": 0.6719, + "step": 13722 + }, + { + "epoch": 0.35, + "learning_rate": 1.9603495578347673e-06, + "loss": 0.8647, + "step": 13723 + }, + { + "epoch": 0.35, + "learning_rate": 1.9603418429799676e-06, + "loss": 1.0605, + "step": 13724 + }, + { + "epoch": 0.35, + "learning_rate": 1.9603341273898786e-06, + "loss": 0.918, + "step": 13725 + }, + { + "epoch": 0.35, + "learning_rate": 1.960326411064506e-06, + "loss": 0.9868, + "step": 13726 + }, + { + "epoch": 0.35, + "learning_rate": 1.9603186940038556e-06, + "loss": 0.8623, + "step": 13727 + }, + { + "epoch": 0.35, + "learning_rate": 1.960310976207933e-06, + "loss": 0.9141, + "step": 13728 + }, + { + "epoch": 0.35, + "learning_rate": 1.960303257676745e-06, + "loss": 0.627, + "step": 13729 + }, + { + "epoch": 0.35, + "learning_rate": 1.9602955384102966e-06, + "loss": 0.9531, + "step": 13730 + }, + { + "epoch": 0.35, + "learning_rate": 1.960287818408594e-06, + "loss": 0.918, + "step": 13731 + }, + { + "epoch": 0.35, + "learning_rate": 1.9602800976716436e-06, + "loss": 0.9717, + "step": 13732 + }, + { + "epoch": 0.35, + "learning_rate": 1.9602723761994503e-06, + "loss": 0.8467, + "step": 13733 + }, + { + "epoch": 0.35, + "learning_rate": 1.960264653992021e-06, + "loss": 0.6885, + "step": 13734 + }, + { + "epoch": 0.35, + "learning_rate": 1.960256931049361e-06, + "loss": 0.7534, + "step": 13735 + }, + { + "epoch": 0.35, + "learning_rate": 1.960249207371477e-06, + "loss": 0.8809, + "step": 13736 + }, + { + "epoch": 0.35, + "learning_rate": 1.9602414829583735e-06, + "loss": 0.9121, + "step": 13737 + }, + { + "epoch": 0.35, + "learning_rate": 1.9602337578100577e-06, + "loss": 0.8633, + "step": 13738 + }, + { + "epoch": 0.35, + "learning_rate": 1.960226031926535e-06, + "loss": 0.7759, + "step": 13739 + }, + { + "epoch": 0.35, + "learning_rate": 1.9602183053078115e-06, + "loss": 0.7, + "step": 13740 + }, + { + "epoch": 0.35, + "learning_rate": 1.9602105779538925e-06, + "loss": 0.6655, + "step": 13741 + }, + { + "epoch": 0.35, + "learning_rate": 1.960202849864785e-06, + "loss": 0.7451, + "step": 13742 + }, + { + "epoch": 0.35, + "learning_rate": 1.960195121040494e-06, + "loss": 0.9395, + "step": 13743 + }, + { + "epoch": 0.35, + "learning_rate": 1.960187391481026e-06, + "loss": 0.8672, + "step": 13744 + }, + { + "epoch": 0.35, + "learning_rate": 1.9601796611863867e-06, + "loss": 0.9111, + "step": 13745 + }, + { + "epoch": 0.35, + "learning_rate": 1.9601719301565816e-06, + "loss": 0.7715, + "step": 13746 + }, + { + "epoch": 0.35, + "learning_rate": 1.9601641983916175e-06, + "loss": 1.083, + "step": 13747 + }, + { + "epoch": 0.35, + "learning_rate": 1.9601564658914995e-06, + "loss": 0.7773, + "step": 13748 + }, + { + "epoch": 0.35, + "learning_rate": 1.9601487326562335e-06, + "loss": 0.7158, + "step": 13749 + }, + { + "epoch": 0.35, + "learning_rate": 1.9601409986858264e-06, + "loss": 0.6836, + "step": 13750 + }, + { + "epoch": 0.35, + "learning_rate": 1.9601332639802832e-06, + "loss": 0.8154, + "step": 13751 + }, + { + "epoch": 0.35, + "learning_rate": 1.96012552853961e-06, + "loss": 0.8848, + "step": 13752 + }, + { + "epoch": 0.35, + "learning_rate": 1.960117792363813e-06, + "loss": 0.9326, + "step": 13753 + }, + { + "epoch": 0.35, + "learning_rate": 1.960110055452898e-06, + "loss": 0.8652, + "step": 13754 + }, + { + "epoch": 0.35, + "learning_rate": 1.9601023178068704e-06, + "loss": 0.915, + "step": 13755 + }, + { + "epoch": 0.35, + "learning_rate": 1.9600945794257374e-06, + "loss": 0.9902, + "step": 13756 + }, + { + "epoch": 0.35, + "learning_rate": 1.9600868403095035e-06, + "loss": 1.0557, + "step": 13757 + }, + { + "epoch": 0.35, + "learning_rate": 1.9600791004581755e-06, + "loss": 0.8672, + "step": 13758 + }, + { + "epoch": 0.35, + "learning_rate": 1.960071359871759e-06, + "loss": 0.9688, + "step": 13759 + }, + { + "epoch": 0.35, + "learning_rate": 1.96006361855026e-06, + "loss": 1.002, + "step": 13760 + }, + { + "epoch": 0.35, + "learning_rate": 1.960055876493685e-06, + "loss": 1.082, + "step": 13761 + }, + { + "epoch": 0.35, + "learning_rate": 1.9600481337020386e-06, + "loss": 0.9951, + "step": 13762 + }, + { + "epoch": 0.35, + "learning_rate": 1.960040390175328e-06, + "loss": 0.6831, + "step": 13763 + }, + { + "epoch": 0.35, + "learning_rate": 1.960032645913558e-06, + "loss": 0.6016, + "step": 13764 + }, + { + "epoch": 0.35, + "learning_rate": 1.9600249009167357e-06, + "loss": 0.6465, + "step": 13765 + }, + { + "epoch": 0.35, + "learning_rate": 1.9600171551848657e-06, + "loss": 0.7819, + "step": 13766 + }, + { + "epoch": 0.35, + "learning_rate": 1.960009408717956e-06, + "loss": 0.8428, + "step": 13767 + }, + { + "epoch": 0.35, + "learning_rate": 1.96000166151601e-06, + "loss": 0.918, + "step": 13768 + }, + { + "epoch": 0.35, + "learning_rate": 1.9599939135790357e-06, + "loss": 0.7969, + "step": 13769 + }, + { + "epoch": 0.35, + "learning_rate": 1.9599861649070377e-06, + "loss": 0.9424, + "step": 13770 + }, + { + "epoch": 0.35, + "learning_rate": 1.9599784155000226e-06, + "loss": 0.8291, + "step": 13771 + }, + { + "epoch": 0.35, + "learning_rate": 1.959970665357996e-06, + "loss": 0.9395, + "step": 13772 + }, + { + "epoch": 0.35, + "learning_rate": 1.9599629144809646e-06, + "loss": 1.0439, + "step": 13773 + }, + { + "epoch": 0.35, + "learning_rate": 1.959955162868933e-06, + "loss": 1.1465, + "step": 13774 + }, + { + "epoch": 0.35, + "learning_rate": 1.9599474105219086e-06, + "loss": 0.8057, + "step": 13775 + }, + { + "epoch": 0.35, + "learning_rate": 1.9599396574398962e-06, + "loss": 0.832, + "step": 13776 + }, + { + "epoch": 0.35, + "learning_rate": 1.959931903622902e-06, + "loss": 1.1562, + "step": 13777 + }, + { + "epoch": 0.35, + "learning_rate": 1.959924149070932e-06, + "loss": 0.8008, + "step": 13778 + }, + { + "epoch": 0.35, + "learning_rate": 1.9599163937839927e-06, + "loss": 1.0195, + "step": 13779 + }, + { + "epoch": 0.35, + "learning_rate": 1.959908637762089e-06, + "loss": 1.1787, + "step": 13780 + }, + { + "epoch": 0.35, + "learning_rate": 1.959900881005228e-06, + "loss": 0.8965, + "step": 13781 + }, + { + "epoch": 0.35, + "learning_rate": 1.9598931235134144e-06, + "loss": 0.7617, + "step": 13782 + }, + { + "epoch": 0.35, + "learning_rate": 1.9598853652866552e-06, + "loss": 0.7666, + "step": 13783 + }, + { + "epoch": 0.35, + "learning_rate": 1.959877606324956e-06, + "loss": 1.2031, + "step": 13784 + }, + { + "epoch": 0.35, + "learning_rate": 1.9598698466283224e-06, + "loss": 1.0449, + "step": 13785 + }, + { + "epoch": 0.35, + "learning_rate": 1.9598620861967606e-06, + "loss": 0.8115, + "step": 13786 + }, + { + "epoch": 0.35, + "learning_rate": 1.9598543250302766e-06, + "loss": 1.0537, + "step": 13787 + }, + { + "epoch": 0.35, + "learning_rate": 1.9598465631288764e-06, + "loss": 0.9814, + "step": 13788 + }, + { + "epoch": 0.35, + "learning_rate": 1.9598388004925657e-06, + "loss": 0.9062, + "step": 13789 + }, + { + "epoch": 0.35, + "learning_rate": 1.9598310371213507e-06, + "loss": 0.8418, + "step": 13790 + }, + { + "epoch": 0.35, + "learning_rate": 1.9598232730152367e-06, + "loss": 0.8623, + "step": 13791 + }, + { + "epoch": 0.35, + "learning_rate": 1.959815508174231e-06, + "loss": 0.9082, + "step": 13792 + }, + { + "epoch": 0.35, + "learning_rate": 1.959807742598338e-06, + "loss": 1.1201, + "step": 13793 + }, + { + "epoch": 0.35, + "learning_rate": 1.9597999762875645e-06, + "loss": 0.8438, + "step": 13794 + }, + { + "epoch": 0.35, + "learning_rate": 1.9597922092419163e-06, + "loss": 0.9854, + "step": 13795 + }, + { + "epoch": 0.35, + "learning_rate": 1.9597844414613997e-06, + "loss": 0.8984, + "step": 13796 + }, + { + "epoch": 0.35, + "learning_rate": 1.9597766729460197e-06, + "loss": 0.4937, + "step": 13797 + }, + { + "epoch": 0.35, + "learning_rate": 1.959768903695783e-06, + "loss": 0.916, + "step": 13798 + }, + { + "epoch": 0.35, + "learning_rate": 1.9597611337106956e-06, + "loss": 0.7285, + "step": 13799 + }, + { + "epoch": 0.35, + "learning_rate": 1.9597533629907633e-06, + "loss": 0.8516, + "step": 13800 + }, + { + "epoch": 0.35, + "learning_rate": 1.959745591535992e-06, + "loss": 0.9683, + "step": 13801 + }, + { + "epoch": 0.35, + "learning_rate": 1.959737819346387e-06, + "loss": 0.8389, + "step": 13802 + }, + { + "epoch": 0.35, + "learning_rate": 1.9597300464219554e-06, + "loss": 0.8074, + "step": 13803 + }, + { + "epoch": 0.35, + "learning_rate": 1.9597222727627027e-06, + "loss": 0.6816, + "step": 13804 + }, + { + "epoch": 0.35, + "learning_rate": 1.9597144983686346e-06, + "loss": 0.7695, + "step": 13805 + }, + { + "epoch": 0.35, + "learning_rate": 1.9597067232397573e-06, + "loss": 0.6978, + "step": 13806 + }, + { + "epoch": 0.35, + "learning_rate": 1.9596989473760764e-06, + "loss": 0.9023, + "step": 13807 + }, + { + "epoch": 0.35, + "learning_rate": 1.9596911707775987e-06, + "loss": 0.9912, + "step": 13808 + }, + { + "epoch": 0.35, + "learning_rate": 1.959683393444329e-06, + "loss": 1.1367, + "step": 13809 + }, + { + "epoch": 0.35, + "learning_rate": 1.9596756153762747e-06, + "loss": 0.665, + "step": 13810 + }, + { + "epoch": 0.35, + "learning_rate": 1.9596678365734403e-06, + "loss": 1.0068, + "step": 13811 + }, + { + "epoch": 0.35, + "learning_rate": 1.9596600570358324e-06, + "loss": 0.8994, + "step": 13812 + }, + { + "epoch": 0.35, + "learning_rate": 1.9596522767634568e-06, + "loss": 0.71, + "step": 13813 + }, + { + "epoch": 0.35, + "learning_rate": 1.95964449575632e-06, + "loss": 0.7754, + "step": 13814 + }, + { + "epoch": 0.35, + "learning_rate": 1.9596367140144273e-06, + "loss": 0.915, + "step": 13815 + }, + { + "epoch": 0.35, + "learning_rate": 1.9596289315377845e-06, + "loss": 0.7861, + "step": 13816 + }, + { + "epoch": 0.35, + "learning_rate": 1.9596211483263985e-06, + "loss": 0.876, + "step": 13817 + }, + { + "epoch": 0.35, + "learning_rate": 1.959613364380274e-06, + "loss": 0.6665, + "step": 13818 + }, + { + "epoch": 0.35, + "learning_rate": 1.9596055796994187e-06, + "loss": 1.0117, + "step": 13819 + }, + { + "epoch": 0.35, + "learning_rate": 1.959597794283837e-06, + "loss": 1.1328, + "step": 13820 + }, + { + "epoch": 0.35, + "learning_rate": 1.9595900081335356e-06, + "loss": 0.8379, + "step": 13821 + }, + { + "epoch": 0.35, + "learning_rate": 1.95958222124852e-06, + "loss": 0.958, + "step": 13822 + }, + { + "epoch": 0.35, + "learning_rate": 1.9595744336287963e-06, + "loss": 0.9307, + "step": 13823 + }, + { + "epoch": 0.35, + "learning_rate": 1.9595666452743708e-06, + "loss": 1.2324, + "step": 13824 + }, + { + "epoch": 0.35, + "learning_rate": 1.959558856185249e-06, + "loss": 0.8701, + "step": 13825 + }, + { + "epoch": 0.35, + "learning_rate": 1.9595510663614374e-06, + "loss": 0.7192, + "step": 13826 + }, + { + "epoch": 0.35, + "learning_rate": 1.959543275802942e-06, + "loss": 0.9102, + "step": 13827 + }, + { + "epoch": 0.35, + "learning_rate": 1.959535484509768e-06, + "loss": 0.8779, + "step": 13828 + }, + { + "epoch": 0.35, + "learning_rate": 1.9595276924819216e-06, + "loss": 0.9346, + "step": 13829 + }, + { + "epoch": 0.35, + "learning_rate": 1.959519899719409e-06, + "loss": 0.8936, + "step": 13830 + }, + { + "epoch": 0.35, + "learning_rate": 1.9595121062222366e-06, + "loss": 0.8345, + "step": 13831 + }, + { + "epoch": 0.35, + "learning_rate": 1.95950431199041e-06, + "loss": 0.771, + "step": 13832 + }, + { + "epoch": 0.35, + "learning_rate": 1.959496517023934e-06, + "loss": 0.9609, + "step": 13833 + }, + { + "epoch": 0.35, + "learning_rate": 1.9594887213228166e-06, + "loss": 0.7471, + "step": 13834 + }, + { + "epoch": 0.35, + "learning_rate": 1.9594809248870623e-06, + "loss": 0.8584, + "step": 13835 + }, + { + "epoch": 0.35, + "learning_rate": 1.959473127716678e-06, + "loss": 0.9238, + "step": 13836 + }, + { + "epoch": 0.35, + "learning_rate": 1.9594653298116693e-06, + "loss": 0.8184, + "step": 13837 + }, + { + "epoch": 0.35, + "learning_rate": 1.959457531172042e-06, + "loss": 0.8672, + "step": 13838 + }, + { + "epoch": 0.35, + "learning_rate": 1.9594497317978016e-06, + "loss": 1.0391, + "step": 13839 + }, + { + "epoch": 0.35, + "learning_rate": 1.9594419316889554e-06, + "loss": 1.1914, + "step": 13840 + }, + { + "epoch": 0.35, + "learning_rate": 1.959434130845508e-06, + "loss": 0.8877, + "step": 13841 + }, + { + "epoch": 0.35, + "learning_rate": 1.9594263292674667e-06, + "loss": 0.9629, + "step": 13842 + }, + { + "epoch": 0.35, + "learning_rate": 1.9594185269548364e-06, + "loss": 1.0352, + "step": 13843 + }, + { + "epoch": 0.35, + "learning_rate": 1.959410723907623e-06, + "loss": 0.5269, + "step": 13844 + }, + { + "epoch": 0.35, + "learning_rate": 1.9594029201258338e-06, + "loss": 1.123, + "step": 13845 + }, + { + "epoch": 0.35, + "learning_rate": 1.9593951156094732e-06, + "loss": 0.9004, + "step": 13846 + }, + { + "epoch": 0.35, + "learning_rate": 1.9593873103585484e-06, + "loss": 0.9976, + "step": 13847 + }, + { + "epoch": 0.35, + "learning_rate": 1.9593795043730647e-06, + "loss": 0.9346, + "step": 13848 + }, + { + "epoch": 0.35, + "learning_rate": 1.959371697653028e-06, + "loss": 0.9355, + "step": 13849 + }, + { + "epoch": 0.35, + "learning_rate": 1.9593638901984445e-06, + "loss": 0.7612, + "step": 13850 + }, + { + "epoch": 0.36, + "learning_rate": 1.9593560820093203e-06, + "loss": 0.8975, + "step": 13851 + }, + { + "epoch": 0.36, + "learning_rate": 1.9593482730856614e-06, + "loss": 0.8496, + "step": 13852 + }, + { + "epoch": 0.36, + "learning_rate": 1.9593404634274733e-06, + "loss": 0.7382, + "step": 13853 + }, + { + "epoch": 0.36, + "learning_rate": 1.959332653034763e-06, + "loss": 0.8887, + "step": 13854 + }, + { + "epoch": 0.36, + "learning_rate": 1.959324841907535e-06, + "loss": 0.7725, + "step": 13855 + }, + { + "epoch": 0.36, + "learning_rate": 1.9593170300457963e-06, + "loss": 1.0381, + "step": 13856 + }, + { + "epoch": 0.36, + "learning_rate": 1.9593092174495533e-06, + "loss": 0.957, + "step": 13857 + }, + { + "epoch": 0.36, + "learning_rate": 1.9593014041188104e-06, + "loss": 0.7656, + "step": 13858 + }, + { + "epoch": 0.36, + "learning_rate": 1.959293590053575e-06, + "loss": 0.79, + "step": 13859 + }, + { + "epoch": 0.36, + "learning_rate": 1.9592857752538526e-06, + "loss": 0.9521, + "step": 13860 + }, + { + "epoch": 0.36, + "learning_rate": 1.959277959719649e-06, + "loss": 0.7637, + "step": 13861 + }, + { + "epoch": 0.36, + "learning_rate": 1.9592701434509708e-06, + "loss": 0.8411, + "step": 13862 + }, + { + "epoch": 0.36, + "learning_rate": 1.9592623264478233e-06, + "loss": 0.8223, + "step": 13863 + }, + { + "epoch": 0.36, + "learning_rate": 1.9592545087102127e-06, + "loss": 0.9453, + "step": 13864 + }, + { + "epoch": 0.36, + "learning_rate": 1.959246690238145e-06, + "loss": 0.9814, + "step": 13865 + }, + { + "epoch": 0.36, + "learning_rate": 1.9592388710316264e-06, + "loss": 0.6138, + "step": 13866 + }, + { + "epoch": 0.36, + "learning_rate": 1.9592310510906625e-06, + "loss": 0.9551, + "step": 13867 + }, + { + "epoch": 0.36, + "learning_rate": 1.959223230415259e-06, + "loss": 0.7119, + "step": 13868 + }, + { + "epoch": 0.36, + "learning_rate": 1.9592154090054237e-06, + "loss": 0.9756, + "step": 13869 + }, + { + "epoch": 0.36, + "learning_rate": 1.95920758686116e-06, + "loss": 0.6836, + "step": 13870 + }, + { + "epoch": 0.36, + "learning_rate": 1.959199763982476e-06, + "loss": 0.9165, + "step": 13871 + }, + { + "epoch": 0.36, + "learning_rate": 1.9591919403693765e-06, + "loss": 0.7842, + "step": 13872 + }, + { + "epoch": 0.36, + "learning_rate": 1.9591841160218676e-06, + "loss": 0.6294, + "step": 13873 + }, + { + "epoch": 0.36, + "learning_rate": 1.959176290939956e-06, + "loss": 0.7451, + "step": 13874 + }, + { + "epoch": 0.36, + "learning_rate": 1.959168465123647e-06, + "loss": 0.8564, + "step": 13875 + }, + { + "epoch": 0.36, + "learning_rate": 1.9591606385729466e-06, + "loss": 0.9365, + "step": 13876 + }, + { + "epoch": 0.36, + "learning_rate": 1.9591528112878614e-06, + "loss": 0.9297, + "step": 13877 + }, + { + "epoch": 0.36, + "learning_rate": 1.9591449832683966e-06, + "loss": 0.9277, + "step": 13878 + }, + { + "epoch": 0.36, + "learning_rate": 1.959137154514559e-06, + "loss": 0.8433, + "step": 13879 + }, + { + "epoch": 0.36, + "learning_rate": 1.959129325026354e-06, + "loss": 0.9863, + "step": 13880 + }, + { + "epoch": 0.36, + "learning_rate": 1.959121494803788e-06, + "loss": 0.9922, + "step": 13881 + }, + { + "epoch": 0.36, + "learning_rate": 1.9591136638468662e-06, + "loss": 0.8623, + "step": 13882 + }, + { + "epoch": 0.36, + "learning_rate": 1.9591058321555957e-06, + "loss": 0.8867, + "step": 13883 + }, + { + "epoch": 0.36, + "learning_rate": 1.9590979997299815e-06, + "loss": 0.9883, + "step": 13884 + }, + { + "epoch": 0.36, + "learning_rate": 1.9590901665700304e-06, + "loss": 0.8633, + "step": 13885 + }, + { + "epoch": 0.36, + "learning_rate": 1.959082332675748e-06, + "loss": 0.8789, + "step": 13886 + }, + { + "epoch": 0.36, + "learning_rate": 1.9590744980471404e-06, + "loss": 0.957, + "step": 13887 + }, + { + "epoch": 0.36, + "learning_rate": 1.9590666626842133e-06, + "loss": 0.96, + "step": 13888 + }, + { + "epoch": 0.36, + "learning_rate": 1.959058826586973e-06, + "loss": 0.6309, + "step": 13889 + }, + { + "epoch": 0.36, + "learning_rate": 1.959050989755426e-06, + "loss": 1.0625, + "step": 13890 + }, + { + "epoch": 0.36, + "learning_rate": 1.959043152189577e-06, + "loss": 1.1113, + "step": 13891 + }, + { + "epoch": 0.36, + "learning_rate": 1.959035313889433e-06, + "loss": 0.8184, + "step": 13892 + }, + { + "epoch": 0.36, + "learning_rate": 1.9590274748550003e-06, + "loss": 0.708, + "step": 13893 + }, + { + "epoch": 0.36, + "learning_rate": 1.959019635086284e-06, + "loss": 0.7344, + "step": 13894 + }, + { + "epoch": 0.36, + "learning_rate": 1.95901179458329e-06, + "loss": 0.9521, + "step": 13895 + }, + { + "epoch": 0.36, + "learning_rate": 1.9590039533460253e-06, + "loss": 0.8799, + "step": 13896 + }, + { + "epoch": 0.36, + "learning_rate": 1.9589961113744955e-06, + "loss": 0.9717, + "step": 13897 + }, + { + "epoch": 0.36, + "learning_rate": 1.958988268668706e-06, + "loss": 0.8828, + "step": 13898 + }, + { + "epoch": 0.36, + "learning_rate": 1.9589804252286636e-06, + "loss": 1.0312, + "step": 13899 + }, + { + "epoch": 0.36, + "learning_rate": 1.9589725810543738e-06, + "loss": 1.1504, + "step": 13900 + }, + { + "epoch": 0.36, + "learning_rate": 1.9589647361458428e-06, + "loss": 0.9111, + "step": 13901 + }, + { + "epoch": 0.36, + "learning_rate": 1.9589568905030765e-06, + "loss": 0.7568, + "step": 13902 + }, + { + "epoch": 0.36, + "learning_rate": 1.9589490441260813e-06, + "loss": 0.8799, + "step": 13903 + }, + { + "epoch": 0.36, + "learning_rate": 1.9589411970148627e-06, + "loss": 0.8721, + "step": 13904 + }, + { + "epoch": 0.36, + "learning_rate": 1.958933349169427e-06, + "loss": 1.1797, + "step": 13905 + }, + { + "epoch": 0.36, + "learning_rate": 1.9589255005897803e-06, + "loss": 0.7651, + "step": 13906 + }, + { + "epoch": 0.36, + "learning_rate": 1.9589176512759284e-06, + "loss": 1.04, + "step": 13907 + }, + { + "epoch": 0.36, + "learning_rate": 1.958909801227877e-06, + "loss": 0.7803, + "step": 13908 + }, + { + "epoch": 0.36, + "learning_rate": 1.9589019504456326e-06, + "loss": 0.9248, + "step": 13909 + }, + { + "epoch": 0.36, + "learning_rate": 1.958894098929201e-06, + "loss": 1.1035, + "step": 13910 + }, + { + "epoch": 0.36, + "learning_rate": 1.9588862466785885e-06, + "loss": 0.9209, + "step": 13911 + }, + { + "epoch": 0.36, + "learning_rate": 1.9588783936938007e-06, + "loss": 0.9189, + "step": 13912 + }, + { + "epoch": 0.36, + "learning_rate": 1.958870539974844e-06, + "loss": 0.9424, + "step": 13913 + }, + { + "epoch": 0.36, + "learning_rate": 1.958862685521724e-06, + "loss": 0.7524, + "step": 13914 + }, + { + "epoch": 0.36, + "learning_rate": 1.9588548303344474e-06, + "loss": 0.9795, + "step": 13915 + }, + { + "epoch": 0.36, + "learning_rate": 1.9588469744130193e-06, + "loss": 1.0381, + "step": 13916 + }, + { + "epoch": 0.36, + "learning_rate": 1.958839117757446e-06, + "loss": 0.8818, + "step": 13917 + }, + { + "epoch": 0.36, + "learning_rate": 1.958831260367734e-06, + "loss": 1.1152, + "step": 13918 + }, + { + "epoch": 0.36, + "learning_rate": 1.958823402243889e-06, + "loss": 0.8794, + "step": 13919 + }, + { + "epoch": 0.36, + "learning_rate": 1.958815543385917e-06, + "loss": 0.8281, + "step": 13920 + }, + { + "epoch": 0.36, + "learning_rate": 1.958807683793824e-06, + "loss": 0.8799, + "step": 13921 + }, + { + "epoch": 0.36, + "learning_rate": 1.9587998234676156e-06, + "loss": 0.7896, + "step": 13922 + }, + { + "epoch": 0.36, + "learning_rate": 1.958791962407299e-06, + "loss": 0.7422, + "step": 13923 + }, + { + "epoch": 0.36, + "learning_rate": 1.958784100612879e-06, + "loss": 0.9414, + "step": 13924 + }, + { + "epoch": 0.36, + "learning_rate": 1.958776238084362e-06, + "loss": 0.8818, + "step": 13925 + }, + { + "epoch": 0.36, + "learning_rate": 1.9587683748217546e-06, + "loss": 0.8223, + "step": 13926 + }, + { + "epoch": 0.36, + "learning_rate": 1.958760510825062e-06, + "loss": 0.8525, + "step": 13927 + }, + { + "epoch": 0.36, + "learning_rate": 1.958752646094291e-06, + "loss": 0.8311, + "step": 13928 + }, + { + "epoch": 0.36, + "learning_rate": 1.9587447806294465e-06, + "loss": 0.9912, + "step": 13929 + }, + { + "epoch": 0.36, + "learning_rate": 1.9587369144305357e-06, + "loss": 0.998, + "step": 13930 + }, + { + "epoch": 0.36, + "learning_rate": 1.958729047497564e-06, + "loss": 1.1558, + "step": 13931 + }, + { + "epoch": 0.36, + "learning_rate": 1.9587211798305377e-06, + "loss": 0.9668, + "step": 13932 + }, + { + "epoch": 0.36, + "learning_rate": 1.9587133114294623e-06, + "loss": 0.9844, + "step": 13933 + }, + { + "epoch": 0.36, + "learning_rate": 1.9587054422943444e-06, + "loss": 0.9648, + "step": 13934 + }, + { + "epoch": 0.36, + "learning_rate": 1.95869757242519e-06, + "loss": 0.7881, + "step": 13935 + }, + { + "epoch": 0.36, + "learning_rate": 1.9586897018220046e-06, + "loss": 0.6758, + "step": 13936 + }, + { + "epoch": 0.36, + "learning_rate": 1.9586818304847946e-06, + "loss": 0.9551, + "step": 13937 + }, + { + "epoch": 0.36, + "learning_rate": 1.958673958413566e-06, + "loss": 0.9766, + "step": 13938 + }, + { + "epoch": 0.36, + "learning_rate": 1.958666085608325e-06, + "loss": 0.7725, + "step": 13939 + }, + { + "epoch": 0.36, + "learning_rate": 1.9586582120690777e-06, + "loss": 0.9834, + "step": 13940 + }, + { + "epoch": 0.36, + "learning_rate": 1.95865033779583e-06, + "loss": 1.21, + "step": 13941 + }, + { + "epoch": 0.36, + "learning_rate": 1.958642462788587e-06, + "loss": 1.1436, + "step": 13942 + }, + { + "epoch": 0.36, + "learning_rate": 1.9586345870473563e-06, + "loss": 0.9492, + "step": 13943 + }, + { + "epoch": 0.36, + "learning_rate": 1.9586267105721427e-06, + "loss": 1.0068, + "step": 13944 + }, + { + "epoch": 0.36, + "learning_rate": 1.958618833362953e-06, + "loss": 0.9512, + "step": 13945 + }, + { + "epoch": 0.36, + "learning_rate": 1.9586109554197927e-06, + "loss": 0.9688, + "step": 13946 + }, + { + "epoch": 0.36, + "learning_rate": 1.9586030767426682e-06, + "loss": 0.8701, + "step": 13947 + }, + { + "epoch": 0.36, + "learning_rate": 1.9585951973315855e-06, + "loss": 0.8252, + "step": 13948 + }, + { + "epoch": 0.36, + "learning_rate": 1.9585873171865503e-06, + "loss": 0.8203, + "step": 13949 + }, + { + "epoch": 0.36, + "learning_rate": 1.9585794363075692e-06, + "loss": 0.958, + "step": 13950 + }, + { + "epoch": 0.36, + "learning_rate": 1.9585715546946476e-06, + "loss": 0.9219, + "step": 13951 + }, + { + "epoch": 0.36, + "learning_rate": 1.958563672347792e-06, + "loss": 0.9756, + "step": 13952 + }, + { + "epoch": 0.36, + "learning_rate": 1.9585557892670083e-06, + "loss": 1.0586, + "step": 13953 + }, + { + "epoch": 0.36, + "learning_rate": 1.958547905452302e-06, + "loss": 1.0586, + "step": 13954 + }, + { + "epoch": 0.36, + "learning_rate": 1.9585400209036803e-06, + "loss": 0.9062, + "step": 13955 + }, + { + "epoch": 0.36, + "learning_rate": 1.9585321356211485e-06, + "loss": 1.1533, + "step": 13956 + }, + { + "epoch": 0.36, + "learning_rate": 1.9585242496047126e-06, + "loss": 0.896, + "step": 13957 + }, + { + "epoch": 0.36, + "learning_rate": 1.9585163628543787e-06, + "loss": 0.6743, + "step": 13958 + }, + { + "epoch": 0.36, + "learning_rate": 1.958508475370153e-06, + "loss": 0.6572, + "step": 13959 + }, + { + "epoch": 0.36, + "learning_rate": 1.9585005871520412e-06, + "loss": 0.8623, + "step": 13960 + }, + { + "epoch": 0.36, + "learning_rate": 1.9584926982000497e-06, + "loss": 0.8691, + "step": 13961 + }, + { + "epoch": 0.36, + "learning_rate": 1.9584848085141845e-06, + "loss": 0.8252, + "step": 13962 + }, + { + "epoch": 0.36, + "learning_rate": 1.9584769180944513e-06, + "loss": 0.8374, + "step": 13963 + }, + { + "epoch": 0.36, + "learning_rate": 1.9584690269408567e-06, + "loss": 0.833, + "step": 13964 + }, + { + "epoch": 0.36, + "learning_rate": 1.9584611350534064e-06, + "loss": 0.5725, + "step": 13965 + }, + { + "epoch": 0.36, + "learning_rate": 1.958453242432106e-06, + "loss": 0.6519, + "step": 13966 + }, + { + "epoch": 0.36, + "learning_rate": 1.9584453490769625e-06, + "loss": 0.9736, + "step": 13967 + }, + { + "epoch": 0.36, + "learning_rate": 1.9584374549879816e-06, + "loss": 0.8047, + "step": 13968 + }, + { + "epoch": 0.36, + "learning_rate": 1.958429560165169e-06, + "loss": 0.9932, + "step": 13969 + }, + { + "epoch": 0.36, + "learning_rate": 1.958421664608531e-06, + "loss": 1.0078, + "step": 13970 + }, + { + "epoch": 0.36, + "learning_rate": 1.9584137683180733e-06, + "loss": 0.8799, + "step": 13971 + }, + { + "epoch": 0.36, + "learning_rate": 1.9584058712938027e-06, + "loss": 0.8706, + "step": 13972 + }, + { + "epoch": 0.36, + "learning_rate": 1.9583979735357245e-06, + "loss": 0.8945, + "step": 13973 + }, + { + "epoch": 0.36, + "learning_rate": 1.9583900750438452e-06, + "loss": 0.9014, + "step": 13974 + }, + { + "epoch": 0.36, + "learning_rate": 1.9583821758181707e-06, + "loss": 0.7852, + "step": 13975 + }, + { + "epoch": 0.36, + "learning_rate": 1.958374275858707e-06, + "loss": 0.7251, + "step": 13976 + }, + { + "epoch": 0.36, + "learning_rate": 1.95836637516546e-06, + "loss": 0.7842, + "step": 13977 + }, + { + "epoch": 0.36, + "learning_rate": 1.958358473738436e-06, + "loss": 0.7002, + "step": 13978 + }, + { + "epoch": 0.36, + "learning_rate": 1.958350571577641e-06, + "loss": 0.9407, + "step": 13979 + }, + { + "epoch": 0.36, + "learning_rate": 1.9583426686830814e-06, + "loss": 0.9639, + "step": 13980 + }, + { + "epoch": 0.36, + "learning_rate": 1.9583347650547625e-06, + "loss": 1.0674, + "step": 13981 + }, + { + "epoch": 0.36, + "learning_rate": 1.958326860692691e-06, + "loss": 0.8965, + "step": 13982 + }, + { + "epoch": 0.36, + "learning_rate": 1.9583189555968726e-06, + "loss": 0.8379, + "step": 13983 + }, + { + "epoch": 0.36, + "learning_rate": 1.958311049767313e-06, + "loss": 1.0195, + "step": 13984 + }, + { + "epoch": 0.36, + "learning_rate": 1.958303143204019e-06, + "loss": 0.8569, + "step": 13985 + }, + { + "epoch": 0.36, + "learning_rate": 1.9582952359069967e-06, + "loss": 0.833, + "step": 13986 + }, + { + "epoch": 0.36, + "learning_rate": 1.958287327876251e-06, + "loss": 0.6816, + "step": 13987 + }, + { + "epoch": 0.36, + "learning_rate": 1.9582794191117897e-06, + "loss": 0.7156, + "step": 13988 + }, + { + "epoch": 0.36, + "learning_rate": 1.958271509613617e-06, + "loss": 0.9189, + "step": 13989 + }, + { + "epoch": 0.36, + "learning_rate": 1.9582635993817405e-06, + "loss": 0.9619, + "step": 13990 + }, + { + "epoch": 0.36, + "learning_rate": 1.9582556884161656e-06, + "loss": 0.7622, + "step": 13991 + }, + { + "epoch": 0.36, + "learning_rate": 1.958247776716898e-06, + "loss": 1.0654, + "step": 13992 + }, + { + "epoch": 0.36, + "learning_rate": 1.9582398642839444e-06, + "loss": 0.7246, + "step": 13993 + }, + { + "epoch": 0.36, + "learning_rate": 1.958231951117311e-06, + "loss": 0.9238, + "step": 13994 + }, + { + "epoch": 0.36, + "learning_rate": 1.9582240372170026e-06, + "loss": 0.7598, + "step": 13995 + }, + { + "epoch": 0.36, + "learning_rate": 1.9582161225830263e-06, + "loss": 1.0244, + "step": 13996 + }, + { + "epoch": 0.36, + "learning_rate": 1.9582082072153886e-06, + "loss": 0.8301, + "step": 13997 + }, + { + "epoch": 0.36, + "learning_rate": 1.9582002911140945e-06, + "loss": 0.9043, + "step": 13998 + }, + { + "epoch": 0.36, + "learning_rate": 1.9581923742791505e-06, + "loss": 0.7119, + "step": 13999 + }, + { + "epoch": 0.36, + "learning_rate": 1.958184456710563e-06, + "loss": 0.7344, + "step": 14000 + }, + { + "epoch": 0.36, + "learning_rate": 1.958176538408337e-06, + "loss": 0.8574, + "step": 14001 + }, + { + "epoch": 0.36, + "learning_rate": 1.9581686193724797e-06, + "loss": 0.4805, + "step": 14002 + }, + { + "epoch": 0.36, + "learning_rate": 1.958160699602997e-06, + "loss": 1.0078, + "step": 14003 + }, + { + "epoch": 0.36, + "learning_rate": 1.9581527790998945e-06, + "loss": 0.9795, + "step": 14004 + }, + { + "epoch": 0.36, + "learning_rate": 1.958144857863178e-06, + "loss": 0.9277, + "step": 14005 + }, + { + "epoch": 0.36, + "learning_rate": 1.9581369358928547e-06, + "loss": 0.7671, + "step": 14006 + }, + { + "epoch": 0.36, + "learning_rate": 1.95812901318893e-06, + "loss": 0.9199, + "step": 14007 + }, + { + "epoch": 0.36, + "learning_rate": 1.9581210897514094e-06, + "loss": 0.8335, + "step": 14008 + }, + { + "epoch": 0.36, + "learning_rate": 1.9581131655803e-06, + "loss": 0.835, + "step": 14009 + }, + { + "epoch": 0.36, + "learning_rate": 1.9581052406756073e-06, + "loss": 0.7573, + "step": 14010 + }, + { + "epoch": 0.36, + "learning_rate": 1.9580973150373373e-06, + "loss": 0.9385, + "step": 14011 + }, + { + "epoch": 0.36, + "learning_rate": 1.9580893886654964e-06, + "loss": 0.9189, + "step": 14012 + }, + { + "epoch": 0.36, + "learning_rate": 1.9580814615600907e-06, + "loss": 0.916, + "step": 14013 + }, + { + "epoch": 0.36, + "learning_rate": 1.9580735337211257e-06, + "loss": 0.7671, + "step": 14014 + }, + { + "epoch": 0.36, + "learning_rate": 1.958065605148608e-06, + "loss": 0.5688, + "step": 14015 + }, + { + "epoch": 0.36, + "learning_rate": 1.958057675842544e-06, + "loss": 0.8096, + "step": 14016 + }, + { + "epoch": 0.36, + "learning_rate": 1.9580497458029386e-06, + "loss": 0.7793, + "step": 14017 + }, + { + "epoch": 0.36, + "learning_rate": 1.958041815029799e-06, + "loss": 0.8232, + "step": 14018 + }, + { + "epoch": 0.36, + "learning_rate": 1.9580338835231304e-06, + "loss": 0.8896, + "step": 14019 + }, + { + "epoch": 0.36, + "learning_rate": 1.9580259512829394e-06, + "loss": 0.9131, + "step": 14020 + }, + { + "epoch": 0.36, + "learning_rate": 1.9580180183092323e-06, + "loss": 0.9531, + "step": 14021 + }, + { + "epoch": 0.36, + "learning_rate": 1.9580100846020146e-06, + "loss": 1.1016, + "step": 14022 + }, + { + "epoch": 0.36, + "learning_rate": 1.9580021501612925e-06, + "loss": 0.7764, + "step": 14023 + }, + { + "epoch": 0.36, + "learning_rate": 1.9579942149870726e-06, + "loss": 0.752, + "step": 14024 + }, + { + "epoch": 0.36, + "learning_rate": 1.9579862790793602e-06, + "loss": 0.9053, + "step": 14025 + }, + { + "epoch": 0.36, + "learning_rate": 1.9579783424381622e-06, + "loss": 0.708, + "step": 14026 + }, + { + "epoch": 0.36, + "learning_rate": 1.957970405063484e-06, + "loss": 1.0195, + "step": 14027 + }, + { + "epoch": 0.36, + "learning_rate": 1.9579624669553318e-06, + "loss": 0.9863, + "step": 14028 + }, + { + "epoch": 0.36, + "learning_rate": 1.957954528113712e-06, + "loss": 0.5334, + "step": 14029 + }, + { + "epoch": 0.36, + "learning_rate": 1.9579465885386303e-06, + "loss": 1.0488, + "step": 14030 + }, + { + "epoch": 0.36, + "learning_rate": 1.957938648230093e-06, + "loss": 0.8428, + "step": 14031 + }, + { + "epoch": 0.36, + "learning_rate": 1.957930707188106e-06, + "loss": 0.9385, + "step": 14032 + }, + { + "epoch": 0.36, + "learning_rate": 1.957922765412676e-06, + "loss": 0.8625, + "step": 14033 + }, + { + "epoch": 0.36, + "learning_rate": 1.957914822903808e-06, + "loss": 0.9668, + "step": 14034 + }, + { + "epoch": 0.36, + "learning_rate": 1.957906879661509e-06, + "loss": 0.9482, + "step": 14035 + }, + { + "epoch": 0.36, + "learning_rate": 1.9578989356857845e-06, + "loss": 0.8916, + "step": 14036 + }, + { + "epoch": 0.36, + "learning_rate": 1.957890990976641e-06, + "loss": 1.1172, + "step": 14037 + }, + { + "epoch": 0.36, + "learning_rate": 1.957883045534084e-06, + "loss": 0.8447, + "step": 14038 + }, + { + "epoch": 0.36, + "learning_rate": 1.9578750993581204e-06, + "loss": 0.6487, + "step": 14039 + }, + { + "epoch": 0.36, + "learning_rate": 1.957867152448756e-06, + "loss": 0.8184, + "step": 14040 + }, + { + "epoch": 0.36, + "learning_rate": 1.9578592048059965e-06, + "loss": 0.8545, + "step": 14041 + }, + { + "epoch": 0.36, + "learning_rate": 1.957851256429848e-06, + "loss": 0.7061, + "step": 14042 + }, + { + "epoch": 0.36, + "learning_rate": 1.9578433073203176e-06, + "loss": 0.9248, + "step": 14043 + }, + { + "epoch": 0.36, + "learning_rate": 1.95783535747741e-06, + "loss": 0.8936, + "step": 14044 + }, + { + "epoch": 0.36, + "learning_rate": 1.9578274069011323e-06, + "loss": 0.7686, + "step": 14045 + }, + { + "epoch": 0.36, + "learning_rate": 1.95781945559149e-06, + "loss": 1.127, + "step": 14046 + }, + { + "epoch": 0.36, + "learning_rate": 1.9578115035484894e-06, + "loss": 0.9355, + "step": 14047 + }, + { + "epoch": 0.36, + "learning_rate": 1.9578035507721367e-06, + "loss": 0.7671, + "step": 14048 + }, + { + "epoch": 0.36, + "learning_rate": 1.9577955972624376e-06, + "loss": 0.9326, + "step": 14049 + }, + { + "epoch": 0.36, + "learning_rate": 1.9577876430193986e-06, + "loss": 0.77, + "step": 14050 + }, + { + "epoch": 0.36, + "learning_rate": 1.9577796880430256e-06, + "loss": 0.8013, + "step": 14051 + }, + { + "epoch": 0.36, + "learning_rate": 1.957771732333325e-06, + "loss": 0.9648, + "step": 14052 + }, + { + "epoch": 0.36, + "learning_rate": 1.957763775890302e-06, + "loss": 1.0205, + "step": 14053 + }, + { + "epoch": 0.36, + "learning_rate": 1.957755818713964e-06, + "loss": 0.8613, + "step": 14054 + }, + { + "epoch": 0.36, + "learning_rate": 1.957747860804316e-06, + "loss": 0.9077, + "step": 14055 + }, + { + "epoch": 0.36, + "learning_rate": 1.957739902161365e-06, + "loss": 0.8076, + "step": 14056 + }, + { + "epoch": 0.36, + "learning_rate": 1.957731942785116e-06, + "loss": 0.9551, + "step": 14057 + }, + { + "epoch": 0.36, + "learning_rate": 1.9577239826755756e-06, + "loss": 0.7021, + "step": 14058 + }, + { + "epoch": 0.36, + "learning_rate": 1.9577160218327506e-06, + "loss": 0.7607, + "step": 14059 + }, + { + "epoch": 0.36, + "learning_rate": 1.957708060256646e-06, + "loss": 0.8384, + "step": 14060 + }, + { + "epoch": 0.36, + "learning_rate": 1.9577000979472684e-06, + "loss": 1.0391, + "step": 14061 + }, + { + "epoch": 0.36, + "learning_rate": 1.957692134904624e-06, + "loss": 0.9297, + "step": 14062 + }, + { + "epoch": 0.36, + "learning_rate": 1.9576841711287187e-06, + "loss": 1.0625, + "step": 14063 + }, + { + "epoch": 0.36, + "learning_rate": 1.957676206619559e-06, + "loss": 0.761, + "step": 14064 + }, + { + "epoch": 0.36, + "learning_rate": 1.9576682413771505e-06, + "loss": 0.8555, + "step": 14065 + }, + { + "epoch": 0.36, + "learning_rate": 1.9576602754014995e-06, + "loss": 0.918, + "step": 14066 + }, + { + "epoch": 0.36, + "learning_rate": 1.9576523086926118e-06, + "loss": 1.0176, + "step": 14067 + }, + { + "epoch": 0.36, + "learning_rate": 1.957644341250494e-06, + "loss": 0.8867, + "step": 14068 + }, + { + "epoch": 0.36, + "learning_rate": 1.9576363730751515e-06, + "loss": 0.7632, + "step": 14069 + }, + { + "epoch": 0.36, + "learning_rate": 1.9576284041665913e-06, + "loss": 0.709, + "step": 14070 + }, + { + "epoch": 0.36, + "learning_rate": 1.957620434524819e-06, + "loss": 0.8398, + "step": 14071 + }, + { + "epoch": 0.36, + "learning_rate": 1.957612464149841e-06, + "loss": 0.9805, + "step": 14072 + }, + { + "epoch": 0.36, + "learning_rate": 1.957604493041663e-06, + "loss": 0.9404, + "step": 14073 + }, + { + "epoch": 0.36, + "learning_rate": 1.9575965212002908e-06, + "loss": 0.8267, + "step": 14074 + }, + { + "epoch": 0.36, + "learning_rate": 1.9575885486257313e-06, + "loss": 1.1465, + "step": 14075 + }, + { + "epoch": 0.36, + "learning_rate": 1.95758057531799e-06, + "loss": 0.9565, + "step": 14076 + }, + { + "epoch": 0.36, + "learning_rate": 1.957572601277074e-06, + "loss": 0.9287, + "step": 14077 + }, + { + "epoch": 0.36, + "learning_rate": 1.957564626502988e-06, + "loss": 0.8779, + "step": 14078 + }, + { + "epoch": 0.36, + "learning_rate": 1.957556650995739e-06, + "loss": 0.8887, + "step": 14079 + }, + { + "epoch": 0.36, + "learning_rate": 1.9575486747553332e-06, + "loss": 0.7363, + "step": 14080 + }, + { + "epoch": 0.36, + "learning_rate": 1.9575406977817767e-06, + "loss": 0.7988, + "step": 14081 + }, + { + "epoch": 0.36, + "learning_rate": 1.9575327200750746e-06, + "loss": 0.6392, + "step": 14082 + }, + { + "epoch": 0.36, + "learning_rate": 1.957524741635234e-06, + "loss": 1.1758, + "step": 14083 + }, + { + "epoch": 0.36, + "learning_rate": 1.9575167624622605e-06, + "loss": 0.8955, + "step": 14084 + }, + { + "epoch": 0.36, + "learning_rate": 1.9575087825561608e-06, + "loss": 0.9199, + "step": 14085 + }, + { + "epoch": 0.36, + "learning_rate": 1.9575008019169404e-06, + "loss": 0.918, + "step": 14086 + }, + { + "epoch": 0.36, + "learning_rate": 1.957492820544606e-06, + "loss": 0.9697, + "step": 14087 + }, + { + "epoch": 0.36, + "learning_rate": 1.957484838439163e-06, + "loss": 0.8369, + "step": 14088 + }, + { + "epoch": 0.36, + "learning_rate": 1.957476855600618e-06, + "loss": 0.9248, + "step": 14089 + }, + { + "epoch": 0.36, + "learning_rate": 1.957468872028977e-06, + "loss": 0.9072, + "step": 14090 + }, + { + "epoch": 0.36, + "learning_rate": 1.957460887724246e-06, + "loss": 0.9502, + "step": 14091 + }, + { + "epoch": 0.36, + "learning_rate": 1.957452902686431e-06, + "loss": 0.8428, + "step": 14092 + }, + { + "epoch": 0.36, + "learning_rate": 1.9574449169155393e-06, + "loss": 1.0225, + "step": 14093 + }, + { + "epoch": 0.36, + "learning_rate": 1.957436930411575e-06, + "loss": 1.0898, + "step": 14094 + }, + { + "epoch": 0.36, + "learning_rate": 1.9574289431745457e-06, + "loss": 0.9106, + "step": 14095 + }, + { + "epoch": 0.36, + "learning_rate": 1.9574209552044572e-06, + "loss": 1.0039, + "step": 14096 + }, + { + "epoch": 0.36, + "learning_rate": 1.9574129665013155e-06, + "loss": 0.877, + "step": 14097 + }, + { + "epoch": 0.36, + "learning_rate": 1.9574049770651265e-06, + "loss": 1.0488, + "step": 14098 + }, + { + "epoch": 0.36, + "learning_rate": 1.9573969868958965e-06, + "loss": 0.6309, + "step": 14099 + }, + { + "epoch": 0.36, + "learning_rate": 1.957388995993632e-06, + "loss": 0.9092, + "step": 14100 + }, + { + "epoch": 0.36, + "learning_rate": 1.9573810043583384e-06, + "loss": 0.9229, + "step": 14101 + }, + { + "epoch": 0.36, + "learning_rate": 1.9573730119900224e-06, + "loss": 0.8711, + "step": 14102 + }, + { + "epoch": 0.36, + "learning_rate": 1.95736501888869e-06, + "loss": 1.0762, + "step": 14103 + }, + { + "epoch": 0.36, + "learning_rate": 1.957357025054347e-06, + "loss": 0.916, + "step": 14104 + }, + { + "epoch": 0.36, + "learning_rate": 1.9573490304869995e-06, + "loss": 0.8262, + "step": 14105 + }, + { + "epoch": 0.36, + "learning_rate": 1.9573410351866545e-06, + "loss": 0.9102, + "step": 14106 + }, + { + "epoch": 0.36, + "learning_rate": 1.9573330391533168e-06, + "loss": 0.7803, + "step": 14107 + }, + { + "epoch": 0.36, + "learning_rate": 1.957325042386994e-06, + "loss": 0.8496, + "step": 14108 + }, + { + "epoch": 0.36, + "learning_rate": 1.957317044887691e-06, + "loss": 0.9404, + "step": 14109 + }, + { + "epoch": 0.36, + "learning_rate": 1.957309046655414e-06, + "loss": 0.875, + "step": 14110 + }, + { + "epoch": 0.36, + "learning_rate": 1.95730104769017e-06, + "loss": 0.8926, + "step": 14111 + }, + { + "epoch": 0.36, + "learning_rate": 1.9572930479919647e-06, + "loss": 0.8535, + "step": 14112 + }, + { + "epoch": 0.36, + "learning_rate": 1.9572850475608035e-06, + "loss": 0.832, + "step": 14113 + }, + { + "epoch": 0.36, + "learning_rate": 1.9572770463966933e-06, + "loss": 0.5476, + "step": 14114 + }, + { + "epoch": 0.36, + "learning_rate": 1.9572690444996404e-06, + "loss": 0.9219, + "step": 14115 + }, + { + "epoch": 0.36, + "learning_rate": 1.9572610418696507e-06, + "loss": 0.5986, + "step": 14116 + }, + { + "epoch": 0.36, + "learning_rate": 1.9572530385067302e-06, + "loss": 0.8096, + "step": 14117 + }, + { + "epoch": 0.36, + "learning_rate": 1.957245034410885e-06, + "loss": 0.8955, + "step": 14118 + }, + { + "epoch": 0.36, + "learning_rate": 1.957237029582121e-06, + "loss": 0.6021, + "step": 14119 + }, + { + "epoch": 0.36, + "learning_rate": 1.957229024020445e-06, + "loss": 0.8877, + "step": 14120 + }, + { + "epoch": 0.36, + "learning_rate": 1.9572210177258627e-06, + "loss": 1.0098, + "step": 14121 + }, + { + "epoch": 0.36, + "learning_rate": 1.95721301069838e-06, + "loss": 0.8999, + "step": 14122 + }, + { + "epoch": 0.36, + "learning_rate": 1.9572050029380037e-06, + "loss": 0.709, + "step": 14123 + }, + { + "epoch": 0.36, + "learning_rate": 1.957196994444739e-06, + "loss": 0.6538, + "step": 14124 + }, + { + "epoch": 0.36, + "learning_rate": 1.957188985218593e-06, + "loss": 1.0527, + "step": 14125 + }, + { + "epoch": 0.36, + "learning_rate": 1.9571809752595713e-06, + "loss": 0.8965, + "step": 14126 + }, + { + "epoch": 0.36, + "learning_rate": 1.95717296456768e-06, + "loss": 0.8525, + "step": 14127 + }, + { + "epoch": 0.36, + "learning_rate": 1.9571649531429257e-06, + "loss": 0.9688, + "step": 14128 + }, + { + "epoch": 0.36, + "learning_rate": 1.9571569409853138e-06, + "loss": 0.9775, + "step": 14129 + }, + { + "epoch": 0.36, + "learning_rate": 1.957148928094851e-06, + "loss": 0.9561, + "step": 14130 + }, + { + "epoch": 0.36, + "learning_rate": 1.9571409144715435e-06, + "loss": 0.8022, + "step": 14131 + }, + { + "epoch": 0.36, + "learning_rate": 1.957132900115397e-06, + "loss": 1.1396, + "step": 14132 + }, + { + "epoch": 0.36, + "learning_rate": 1.9571248850264184e-06, + "loss": 0.8042, + "step": 14133 + }, + { + "epoch": 0.36, + "learning_rate": 1.957116869204612e-06, + "loss": 0.9072, + "step": 14134 + }, + { + "epoch": 0.36, + "learning_rate": 1.957108852649986e-06, + "loss": 0.8721, + "step": 14135 + }, + { + "epoch": 0.36, + "learning_rate": 1.9571008353625462e-06, + "loss": 0.96, + "step": 14136 + }, + { + "epoch": 0.36, + "learning_rate": 1.957092817342298e-06, + "loss": 0.7969, + "step": 14137 + }, + { + "epoch": 0.36, + "learning_rate": 1.9570847985892478e-06, + "loss": 0.9092, + "step": 14138 + }, + { + "epoch": 0.36, + "learning_rate": 1.9570767791034016e-06, + "loss": 0.8887, + "step": 14139 + }, + { + "epoch": 0.36, + "learning_rate": 1.9570687588847655e-06, + "loss": 0.833, + "step": 14140 + }, + { + "epoch": 0.36, + "learning_rate": 1.9570607379333465e-06, + "loss": 0.8564, + "step": 14141 + }, + { + "epoch": 0.36, + "learning_rate": 1.9570527162491495e-06, + "loss": 0.8135, + "step": 14142 + }, + { + "epoch": 0.36, + "learning_rate": 1.957044693832182e-06, + "loss": 0.9111, + "step": 14143 + }, + { + "epoch": 0.36, + "learning_rate": 1.9570366706824484e-06, + "loss": 1.0098, + "step": 14144 + }, + { + "epoch": 0.36, + "learning_rate": 1.9570286467999566e-06, + "loss": 0.9287, + "step": 14145 + }, + { + "epoch": 0.36, + "learning_rate": 1.9570206221847118e-06, + "loss": 0.7449, + "step": 14146 + }, + { + "epoch": 0.36, + "learning_rate": 1.95701259683672e-06, + "loss": 1.1621, + "step": 14147 + }, + { + "epoch": 0.36, + "learning_rate": 1.957004570755988e-06, + "loss": 1.0586, + "step": 14148 + }, + { + "epoch": 0.36, + "learning_rate": 1.9569965439425214e-06, + "loss": 0.8662, + "step": 14149 + }, + { + "epoch": 0.36, + "learning_rate": 1.9569885163963266e-06, + "loss": 0.5864, + "step": 14150 + }, + { + "epoch": 0.36, + "learning_rate": 1.95698048811741e-06, + "loss": 0.9326, + "step": 14151 + }, + { + "epoch": 0.36, + "learning_rate": 1.956972459105777e-06, + "loss": 0.6548, + "step": 14152 + }, + { + "epoch": 0.36, + "learning_rate": 1.956964429361434e-06, + "loss": 0.9189, + "step": 14153 + }, + { + "epoch": 0.36, + "learning_rate": 1.9569563988843876e-06, + "loss": 0.748, + "step": 14154 + }, + { + "epoch": 0.36, + "learning_rate": 1.956948367674644e-06, + "loss": 0.9492, + "step": 14155 + }, + { + "epoch": 0.36, + "learning_rate": 1.956940335732209e-06, + "loss": 0.772, + "step": 14156 + }, + { + "epoch": 0.36, + "learning_rate": 1.956932303057088e-06, + "loss": 0.8643, + "step": 14157 + }, + { + "epoch": 0.36, + "learning_rate": 1.956924269649289e-06, + "loss": 0.7998, + "step": 14158 + }, + { + "epoch": 0.36, + "learning_rate": 1.9569162355088165e-06, + "loss": 0.748, + "step": 14159 + }, + { + "epoch": 0.36, + "learning_rate": 1.9569082006356774e-06, + "loss": 0.8887, + "step": 14160 + }, + { + "epoch": 0.36, + "learning_rate": 1.9569001650298777e-06, + "loss": 1.0039, + "step": 14161 + }, + { + "epoch": 0.36, + "learning_rate": 1.9568921286914233e-06, + "loss": 0.999, + "step": 14162 + }, + { + "epoch": 0.36, + "learning_rate": 1.956884091620321e-06, + "loss": 0.9902, + "step": 14163 + }, + { + "epoch": 0.36, + "learning_rate": 1.9568760538165763e-06, + "loss": 0.7368, + "step": 14164 + }, + { + "epoch": 0.36, + "learning_rate": 1.956868015280196e-06, + "loss": 1.1533, + "step": 14165 + }, + { + "epoch": 0.36, + "learning_rate": 1.9568599760111854e-06, + "loss": 0.8242, + "step": 14166 + }, + { + "epoch": 0.36, + "learning_rate": 1.956851936009551e-06, + "loss": 0.8828, + "step": 14167 + }, + { + "epoch": 0.36, + "learning_rate": 1.9568438952752994e-06, + "loss": 0.9277, + "step": 14168 + }, + { + "epoch": 0.36, + "learning_rate": 1.956835853808436e-06, + "loss": 0.8896, + "step": 14169 + }, + { + "epoch": 0.36, + "learning_rate": 1.956827811608968e-06, + "loss": 0.9551, + "step": 14170 + }, + { + "epoch": 0.36, + "learning_rate": 1.9568197686769006e-06, + "loss": 0.9619, + "step": 14171 + }, + { + "epoch": 0.36, + "learning_rate": 1.95681172501224e-06, + "loss": 0.8496, + "step": 14172 + }, + { + "epoch": 0.36, + "learning_rate": 1.956803680614993e-06, + "loss": 0.9375, + "step": 14173 + }, + { + "epoch": 0.36, + "learning_rate": 1.9567956354851656e-06, + "loss": 0.9043, + "step": 14174 + }, + { + "epoch": 0.36, + "learning_rate": 1.956787589622764e-06, + "loss": 0.8257, + "step": 14175 + }, + { + "epoch": 0.36, + "learning_rate": 1.9567795430277933e-06, + "loss": 0.7627, + "step": 14176 + }, + { + "epoch": 0.36, + "learning_rate": 1.956771495700261e-06, + "loss": 0.5884, + "step": 14177 + }, + { + "epoch": 0.36, + "learning_rate": 1.9567634476401724e-06, + "loss": 0.8223, + "step": 14178 + }, + { + "epoch": 0.36, + "learning_rate": 1.9567553988475346e-06, + "loss": 0.7148, + "step": 14179 + }, + { + "epoch": 0.36, + "learning_rate": 1.9567473493223527e-06, + "loss": 0.7832, + "step": 14180 + }, + { + "epoch": 0.36, + "learning_rate": 1.9567392990646335e-06, + "loss": 1.0439, + "step": 14181 + }, + { + "epoch": 0.36, + "learning_rate": 1.956731248074383e-06, + "loss": 0.8257, + "step": 14182 + }, + { + "epoch": 0.36, + "learning_rate": 1.9567231963516077e-06, + "loss": 1.0439, + "step": 14183 + }, + { + "epoch": 0.36, + "learning_rate": 1.956715143896313e-06, + "loss": 0.9678, + "step": 14184 + }, + { + "epoch": 0.36, + "learning_rate": 1.9567070907085057e-06, + "loss": 0.9922, + "step": 14185 + }, + { + "epoch": 0.36, + "learning_rate": 1.956699036788192e-06, + "loss": 0.9668, + "step": 14186 + }, + { + "epoch": 0.36, + "learning_rate": 1.9566909821353774e-06, + "loss": 1.0547, + "step": 14187 + }, + { + "epoch": 0.36, + "learning_rate": 1.9566829267500684e-06, + "loss": 0.7656, + "step": 14188 + }, + { + "epoch": 0.36, + "learning_rate": 1.9566748706322715e-06, + "loss": 0.8984, + "step": 14189 + }, + { + "epoch": 0.36, + "learning_rate": 1.9566668137819927e-06, + "loss": 0.7126, + "step": 14190 + }, + { + "epoch": 0.36, + "learning_rate": 1.9566587561992384e-06, + "loss": 0.6553, + "step": 14191 + }, + { + "epoch": 0.36, + "learning_rate": 1.956650697884014e-06, + "loss": 0.9688, + "step": 14192 + }, + { + "epoch": 0.36, + "learning_rate": 1.9566426388363264e-06, + "loss": 0.8779, + "step": 14193 + }, + { + "epoch": 0.36, + "learning_rate": 1.9566345790561814e-06, + "loss": 0.8232, + "step": 14194 + }, + { + "epoch": 0.36, + "learning_rate": 1.9566265185435854e-06, + "loss": 0.8506, + "step": 14195 + }, + { + "epoch": 0.36, + "learning_rate": 1.9566184572985444e-06, + "loss": 0.9204, + "step": 14196 + }, + { + "epoch": 0.36, + "learning_rate": 1.9566103953210646e-06, + "loss": 0.9785, + "step": 14197 + }, + { + "epoch": 0.36, + "learning_rate": 1.956602332611152e-06, + "loss": 0.9043, + "step": 14198 + }, + { + "epoch": 0.36, + "learning_rate": 1.956594269168813e-06, + "loss": 0.9282, + "step": 14199 + }, + { + "epoch": 0.36, + "learning_rate": 1.956586204994054e-06, + "loss": 0.9033, + "step": 14200 + }, + { + "epoch": 0.36, + "learning_rate": 1.9565781400868814e-06, + "loss": 0.8174, + "step": 14201 + }, + { + "epoch": 0.36, + "learning_rate": 1.9565700744473004e-06, + "loss": 0.8525, + "step": 14202 + }, + { + "epoch": 0.36, + "learning_rate": 1.9565620080753176e-06, + "loss": 0.9404, + "step": 14203 + }, + { + "epoch": 0.36, + "learning_rate": 1.9565539409709393e-06, + "loss": 0.8281, + "step": 14204 + }, + { + "epoch": 0.36, + "learning_rate": 1.956545873134172e-06, + "loss": 0.835, + "step": 14205 + }, + { + "epoch": 0.36, + "learning_rate": 1.9565378045650207e-06, + "loss": 0.8779, + "step": 14206 + }, + { + "epoch": 0.36, + "learning_rate": 1.9565297352634927e-06, + "loss": 0.9111, + "step": 14207 + }, + { + "epoch": 0.36, + "learning_rate": 1.9565216652295946e-06, + "loss": 0.5991, + "step": 14208 + }, + { + "epoch": 0.36, + "learning_rate": 1.956513594463331e-06, + "loss": 0.748, + "step": 14209 + }, + { + "epoch": 0.36, + "learning_rate": 1.9565055229647093e-06, + "loss": 1.0239, + "step": 14210 + }, + { + "epoch": 0.36, + "learning_rate": 1.956497450733735e-06, + "loss": 1.0166, + "step": 14211 + }, + { + "epoch": 0.36, + "learning_rate": 1.9564893777704147e-06, + "loss": 0.9658, + "step": 14212 + }, + { + "epoch": 0.36, + "learning_rate": 1.9564813040747547e-06, + "loss": 0.8408, + "step": 14213 + }, + { + "epoch": 0.36, + "learning_rate": 1.956473229646761e-06, + "loss": 0.8428, + "step": 14214 + }, + { + "epoch": 0.36, + "learning_rate": 1.9564651544864394e-06, + "loss": 0.7939, + "step": 14215 + }, + { + "epoch": 0.36, + "learning_rate": 1.9564570785937965e-06, + "loss": 0.8301, + "step": 14216 + }, + { + "epoch": 0.36, + "learning_rate": 1.9564490019688386e-06, + "loss": 1.2012, + "step": 14217 + }, + { + "epoch": 0.36, + "learning_rate": 1.956440924611571e-06, + "loss": 0.9248, + "step": 14218 + }, + { + "epoch": 0.36, + "learning_rate": 1.9564328465220014e-06, + "loss": 0.9893, + "step": 14219 + }, + { + "epoch": 0.36, + "learning_rate": 1.9564247677001347e-06, + "loss": 0.833, + "step": 14220 + }, + { + "epoch": 0.36, + "learning_rate": 1.9564166881459777e-06, + "loss": 0.7607, + "step": 14221 + }, + { + "epoch": 0.36, + "learning_rate": 1.956408607859536e-06, + "loss": 0.9111, + "step": 14222 + }, + { + "epoch": 0.36, + "learning_rate": 1.9564005268408166e-06, + "loss": 0.9062, + "step": 14223 + }, + { + "epoch": 0.36, + "learning_rate": 1.9563924450898253e-06, + "loss": 0.9238, + "step": 14224 + }, + { + "epoch": 0.36, + "learning_rate": 1.956384362606568e-06, + "loss": 0.9414, + "step": 14225 + }, + { + "epoch": 0.36, + "learning_rate": 1.9563762793910514e-06, + "loss": 0.8691, + "step": 14226 + }, + { + "epoch": 0.36, + "learning_rate": 1.956368195443282e-06, + "loss": 1.0928, + "step": 14227 + }, + { + "epoch": 0.36, + "learning_rate": 1.9563601107632647e-06, + "loss": 1.0312, + "step": 14228 + }, + { + "epoch": 0.36, + "learning_rate": 1.9563520253510066e-06, + "loss": 0.8721, + "step": 14229 + }, + { + "epoch": 0.36, + "learning_rate": 1.956343939206514e-06, + "loss": 0.5947, + "step": 14230 + }, + { + "epoch": 0.36, + "learning_rate": 1.9563358523297925e-06, + "loss": 0.6338, + "step": 14231 + }, + { + "epoch": 0.36, + "learning_rate": 1.956327764720849e-06, + "loss": 0.9092, + "step": 14232 + }, + { + "epoch": 0.36, + "learning_rate": 1.956319676379689e-06, + "loss": 0.9062, + "step": 14233 + }, + { + "epoch": 0.36, + "learning_rate": 1.9563115873063185e-06, + "loss": 0.8682, + "step": 14234 + }, + { + "epoch": 0.36, + "learning_rate": 1.956303497500745e-06, + "loss": 0.8506, + "step": 14235 + }, + { + "epoch": 0.36, + "learning_rate": 1.9562954069629734e-06, + "loss": 1.0576, + "step": 14236 + }, + { + "epoch": 0.36, + "learning_rate": 1.9562873156930107e-06, + "loss": 0.9839, + "step": 14237 + }, + { + "epoch": 0.36, + "learning_rate": 1.9562792236908624e-06, + "loss": 0.7385, + "step": 14238 + }, + { + "epoch": 0.36, + "learning_rate": 1.9562711309565356e-06, + "loss": 0.7295, + "step": 14239 + }, + { + "epoch": 0.36, + "learning_rate": 1.9562630374900355e-06, + "loss": 0.8965, + "step": 14240 + }, + { + "epoch": 0.37, + "learning_rate": 1.9562549432913687e-06, + "loss": 0.9922, + "step": 14241 + }, + { + "epoch": 0.37, + "learning_rate": 1.956246848360542e-06, + "loss": 0.7656, + "step": 14242 + }, + { + "epoch": 0.37, + "learning_rate": 1.9562387526975604e-06, + "loss": 1.0293, + "step": 14243 + }, + { + "epoch": 0.37, + "learning_rate": 1.9562306563024312e-06, + "loss": 0.9717, + "step": 14244 + }, + { + "epoch": 0.37, + "learning_rate": 1.9562225591751603e-06, + "loss": 0.9902, + "step": 14245 + }, + { + "epoch": 0.37, + "learning_rate": 1.9562144613157534e-06, + "loss": 1.0225, + "step": 14246 + }, + { + "epoch": 0.37, + "learning_rate": 1.956206362724217e-06, + "loss": 0.8906, + "step": 14247 + }, + { + "epoch": 0.37, + "learning_rate": 1.956198263400558e-06, + "loss": 0.9473, + "step": 14248 + }, + { + "epoch": 0.37, + "learning_rate": 1.956190163344781e-06, + "loss": 0.8916, + "step": 14249 + }, + { + "epoch": 0.37, + "learning_rate": 1.956182062556894e-06, + "loss": 0.9639, + "step": 14250 + }, + { + "epoch": 0.37, + "learning_rate": 1.9561739610369017e-06, + "loss": 0.9141, + "step": 14251 + }, + { + "epoch": 0.37, + "learning_rate": 1.9561658587848112e-06, + "loss": 0.8496, + "step": 14252 + }, + { + "epoch": 0.37, + "learning_rate": 1.956157755800629e-06, + "loss": 0.8301, + "step": 14253 + }, + { + "epoch": 0.37, + "learning_rate": 1.95614965208436e-06, + "loss": 0.9111, + "step": 14254 + }, + { + "epoch": 0.37, + "learning_rate": 1.9561415476360115e-06, + "loss": 0.9346, + "step": 14255 + }, + { + "epoch": 0.37, + "learning_rate": 1.956133442455589e-06, + "loss": 0.8037, + "step": 14256 + }, + { + "epoch": 0.37, + "learning_rate": 1.9561253365431e-06, + "loss": 0.9746, + "step": 14257 + }, + { + "epoch": 0.37, + "learning_rate": 1.956117229898549e-06, + "loss": 0.9609, + "step": 14258 + }, + { + "epoch": 0.37, + "learning_rate": 1.9561091225219435e-06, + "loss": 0.8633, + "step": 14259 + }, + { + "epoch": 0.37, + "learning_rate": 1.956101014413289e-06, + "loss": 0.6567, + "step": 14260 + }, + { + "epoch": 0.37, + "learning_rate": 1.9560929055725915e-06, + "loss": 0.79, + "step": 14261 + }, + { + "epoch": 0.37, + "learning_rate": 1.9560847959998582e-06, + "loss": 1.0996, + "step": 14262 + }, + { + "epoch": 0.37, + "learning_rate": 1.9560766856950945e-06, + "loss": 0.7998, + "step": 14263 + }, + { + "epoch": 0.37, + "learning_rate": 1.9560685746583067e-06, + "loss": 1.0273, + "step": 14264 + }, + { + "epoch": 0.37, + "learning_rate": 1.9560604628895016e-06, + "loss": 1.0664, + "step": 14265 + }, + { + "epoch": 0.37, + "learning_rate": 1.9560523503886843e-06, + "loss": 1.0518, + "step": 14266 + }, + { + "epoch": 0.37, + "learning_rate": 1.9560442371558624e-06, + "loss": 1.2109, + "step": 14267 + }, + { + "epoch": 0.37, + "learning_rate": 1.956036123191041e-06, + "loss": 0.8906, + "step": 14268 + }, + { + "epoch": 0.37, + "learning_rate": 1.9560280084942267e-06, + "loss": 0.8291, + "step": 14269 + }, + { + "epoch": 0.37, + "learning_rate": 1.9560198930654257e-06, + "loss": 1.0078, + "step": 14270 + }, + { + "epoch": 0.37, + "learning_rate": 1.9560117769046443e-06, + "loss": 1.0977, + "step": 14271 + }, + { + "epoch": 0.37, + "learning_rate": 1.9560036600118887e-06, + "loss": 0.8096, + "step": 14272 + }, + { + "epoch": 0.37, + "learning_rate": 1.955995542387165e-06, + "loss": 1.0498, + "step": 14273 + }, + { + "epoch": 0.37, + "learning_rate": 1.9559874240304793e-06, + "loss": 1.1191, + "step": 14274 + }, + { + "epoch": 0.37, + "learning_rate": 1.9559793049418383e-06, + "loss": 0.8223, + "step": 14275 + }, + { + "epoch": 0.37, + "learning_rate": 1.9559711851212477e-06, + "loss": 1.0518, + "step": 14276 + }, + { + "epoch": 0.37, + "learning_rate": 1.955963064568714e-06, + "loss": 0.8066, + "step": 14277 + }, + { + "epoch": 0.37, + "learning_rate": 1.9559549432842432e-06, + "loss": 1.1152, + "step": 14278 + }, + { + "epoch": 0.37, + "learning_rate": 1.9559468212678417e-06, + "loss": 1.2012, + "step": 14279 + }, + { + "epoch": 0.37, + "learning_rate": 1.955938698519516e-06, + "loss": 0.8359, + "step": 14280 + }, + { + "epoch": 0.37, + "learning_rate": 1.9559305750392717e-06, + "loss": 1.0146, + "step": 14281 + }, + { + "epoch": 0.37, + "learning_rate": 1.955922450827115e-06, + "loss": 0.8643, + "step": 14282 + }, + { + "epoch": 0.37, + "learning_rate": 1.955914325883053e-06, + "loss": 0.8125, + "step": 14283 + }, + { + "epoch": 0.37, + "learning_rate": 1.955906200207091e-06, + "loss": 0.7188, + "step": 14284 + }, + { + "epoch": 0.37, + "learning_rate": 1.955898073799236e-06, + "loss": 1.0225, + "step": 14285 + }, + { + "epoch": 0.37, + "learning_rate": 1.9558899466594934e-06, + "loss": 0.9795, + "step": 14286 + }, + { + "epoch": 0.37, + "learning_rate": 1.95588181878787e-06, + "loss": 0.8965, + "step": 14287 + }, + { + "epoch": 0.37, + "learning_rate": 1.955873690184372e-06, + "loss": 0.7666, + "step": 14288 + }, + { + "epoch": 0.37, + "learning_rate": 1.955865560849005e-06, + "loss": 0.5674, + "step": 14289 + }, + { + "epoch": 0.37, + "learning_rate": 1.955857430781776e-06, + "loss": 0.9609, + "step": 14290 + }, + { + "epoch": 0.37, + "learning_rate": 1.955849299982691e-06, + "loss": 0.9111, + "step": 14291 + }, + { + "epoch": 0.37, + "learning_rate": 1.9558411684517555e-06, + "loss": 0.8975, + "step": 14292 + }, + { + "epoch": 0.37, + "learning_rate": 1.955833036188977e-06, + "loss": 0.6123, + "step": 14293 + }, + { + "epoch": 0.37, + "learning_rate": 1.955824903194361e-06, + "loss": 1.1064, + "step": 14294 + }, + { + "epoch": 0.37, + "learning_rate": 1.955816769467914e-06, + "loss": 1.0312, + "step": 14295 + }, + { + "epoch": 0.37, + "learning_rate": 1.9558086350096414e-06, + "loss": 0.9004, + "step": 14296 + }, + { + "epoch": 0.37, + "learning_rate": 1.9558004998195507e-06, + "loss": 0.7832, + "step": 14297 + }, + { + "epoch": 0.37, + "learning_rate": 1.9557923638976473e-06, + "loss": 0.9287, + "step": 14298 + }, + { + "epoch": 0.37, + "learning_rate": 1.9557842272439375e-06, + "loss": 0.9863, + "step": 14299 + }, + { + "epoch": 0.37, + "learning_rate": 1.955776089858428e-06, + "loss": 0.8843, + "step": 14300 + }, + { + "epoch": 0.37, + "learning_rate": 1.9557679517411245e-06, + "loss": 0.8789, + "step": 14301 + }, + { + "epoch": 0.37, + "learning_rate": 1.955759812892033e-06, + "loss": 0.7363, + "step": 14302 + }, + { + "epoch": 0.37, + "learning_rate": 1.955751673311161e-06, + "loss": 0.8877, + "step": 14303 + }, + { + "epoch": 0.37, + "learning_rate": 1.955743532998513e-06, + "loss": 0.7822, + "step": 14304 + }, + { + "epoch": 0.37, + "learning_rate": 1.955735391954097e-06, + "loss": 0.8804, + "step": 14305 + }, + { + "epoch": 0.37, + "learning_rate": 1.9557272501779177e-06, + "loss": 0.874, + "step": 14306 + }, + { + "epoch": 0.37, + "learning_rate": 1.9557191076699824e-06, + "loss": 0.9736, + "step": 14307 + }, + { + "epoch": 0.37, + "learning_rate": 1.9557109644302967e-06, + "loss": 0.8291, + "step": 14308 + }, + { + "epoch": 0.37, + "learning_rate": 1.9557028204588672e-06, + "loss": 1.2051, + "step": 14309 + }, + { + "epoch": 0.37, + "learning_rate": 1.9556946757557e-06, + "loss": 0.9658, + "step": 14310 + }, + { + "epoch": 0.37, + "learning_rate": 1.9556865303208013e-06, + "loss": 0.8418, + "step": 14311 + }, + { + "epoch": 0.37, + "learning_rate": 1.9556783841541775e-06, + "loss": 0.7126, + "step": 14312 + }, + { + "epoch": 0.37, + "learning_rate": 1.955670237255834e-06, + "loss": 0.9492, + "step": 14313 + }, + { + "epoch": 0.37, + "learning_rate": 1.9556620896257784e-06, + "loss": 0.9736, + "step": 14314 + }, + { + "epoch": 0.37, + "learning_rate": 1.9556539412640162e-06, + "loss": 0.9141, + "step": 14315 + }, + { + "epoch": 0.37, + "learning_rate": 1.955645792170554e-06, + "loss": 0.8857, + "step": 14316 + }, + { + "epoch": 0.37, + "learning_rate": 1.955637642345397e-06, + "loss": 1.0244, + "step": 14317 + }, + { + "epoch": 0.37, + "learning_rate": 1.955629491788553e-06, + "loss": 0.6914, + "step": 14318 + }, + { + "epoch": 0.37, + "learning_rate": 1.955621340500027e-06, + "loss": 0.9043, + "step": 14319 + }, + { + "epoch": 0.37, + "learning_rate": 1.955613188479826e-06, + "loss": 0.9268, + "step": 14320 + }, + { + "epoch": 0.37, + "learning_rate": 1.9556050357279555e-06, + "loss": 1.0908, + "step": 14321 + }, + { + "epoch": 0.37, + "learning_rate": 1.9555968822444222e-06, + "loss": 1.0508, + "step": 14322 + }, + { + "epoch": 0.37, + "learning_rate": 1.9555887280292325e-06, + "loss": 0.7529, + "step": 14323 + }, + { + "epoch": 0.37, + "learning_rate": 1.9555805730823923e-06, + "loss": 0.7192, + "step": 14324 + }, + { + "epoch": 0.37, + "learning_rate": 1.9555724174039083e-06, + "loss": 0.9082, + "step": 14325 + }, + { + "epoch": 0.37, + "learning_rate": 1.955564260993786e-06, + "loss": 0.917, + "step": 14326 + }, + { + "epoch": 0.37, + "learning_rate": 1.955556103852032e-06, + "loss": 0.8389, + "step": 14327 + }, + { + "epoch": 0.37, + "learning_rate": 1.9555479459786533e-06, + "loss": 0.9639, + "step": 14328 + }, + { + "epoch": 0.37, + "learning_rate": 1.955539787373655e-06, + "loss": 0.771, + "step": 14329 + }, + { + "epoch": 0.37, + "learning_rate": 1.955531628037044e-06, + "loss": 1.042, + "step": 14330 + }, + { + "epoch": 0.37, + "learning_rate": 1.955523467968826e-06, + "loss": 1.0176, + "step": 14331 + }, + { + "epoch": 0.37, + "learning_rate": 1.955515307169008e-06, + "loss": 0.7451, + "step": 14332 + }, + { + "epoch": 0.37, + "learning_rate": 1.955507145637596e-06, + "loss": 0.7715, + "step": 14333 + }, + { + "epoch": 0.37, + "learning_rate": 1.955498983374596e-06, + "loss": 0.9932, + "step": 14334 + }, + { + "epoch": 0.37, + "learning_rate": 1.955490820380014e-06, + "loss": 0.7725, + "step": 14335 + }, + { + "epoch": 0.37, + "learning_rate": 1.955482656653857e-06, + "loss": 0.813, + "step": 14336 + }, + { + "epoch": 0.37, + "learning_rate": 1.9554744921961304e-06, + "loss": 0.8457, + "step": 14337 + }, + { + "epoch": 0.37, + "learning_rate": 1.9554663270068416e-06, + "loss": 0.9756, + "step": 14338 + }, + { + "epoch": 0.37, + "learning_rate": 1.9554581610859958e-06, + "loss": 1.0576, + "step": 14339 + }, + { + "epoch": 0.37, + "learning_rate": 1.9554499944336e-06, + "loss": 0.8506, + "step": 14340 + }, + { + "epoch": 0.37, + "learning_rate": 1.955441827049659e-06, + "loss": 0.6606, + "step": 14341 + }, + { + "epoch": 0.37, + "learning_rate": 1.955433658934181e-06, + "loss": 0.8542, + "step": 14342 + }, + { + "epoch": 0.37, + "learning_rate": 1.9554254900871714e-06, + "loss": 0.958, + "step": 14343 + }, + { + "epoch": 0.37, + "learning_rate": 1.955417320508636e-06, + "loss": 0.8428, + "step": 14344 + }, + { + "epoch": 0.37, + "learning_rate": 1.9554091501985817e-06, + "loss": 1.0918, + "step": 14345 + }, + { + "epoch": 0.37, + "learning_rate": 1.955400979157015e-06, + "loss": 1.0273, + "step": 14346 + }, + { + "epoch": 0.37, + "learning_rate": 1.955392807383941e-06, + "loss": 0.8242, + "step": 14347 + }, + { + "epoch": 0.37, + "learning_rate": 1.955384634879367e-06, + "loss": 1.0137, + "step": 14348 + }, + { + "epoch": 0.37, + "learning_rate": 1.9553764616432987e-06, + "loss": 0.8779, + "step": 14349 + }, + { + "epoch": 0.37, + "learning_rate": 1.9553682876757428e-06, + "loss": 0.6497, + "step": 14350 + }, + { + "epoch": 0.37, + "learning_rate": 1.9553601129767053e-06, + "loss": 0.5366, + "step": 14351 + }, + { + "epoch": 0.37, + "learning_rate": 1.9553519375461922e-06, + "loss": 0.9058, + "step": 14352 + }, + { + "epoch": 0.37, + "learning_rate": 1.9553437613842107e-06, + "loss": 0.96, + "step": 14353 + }, + { + "epoch": 0.37, + "learning_rate": 1.955335584490766e-06, + "loss": 0.5698, + "step": 14354 + }, + { + "epoch": 0.37, + "learning_rate": 1.955327406865865e-06, + "loss": 0.8027, + "step": 14355 + }, + { + "epoch": 0.37, + "learning_rate": 1.955319228509513e-06, + "loss": 0.8242, + "step": 14356 + }, + { + "epoch": 0.37, + "learning_rate": 1.9553110494217177e-06, + "loss": 0.9707, + "step": 14357 + }, + { + "epoch": 0.37, + "learning_rate": 1.9553028696024847e-06, + "loss": 1.125, + "step": 14358 + }, + { + "epoch": 0.37, + "learning_rate": 1.9552946890518196e-06, + "loss": 0.8203, + "step": 14359 + }, + { + "epoch": 0.37, + "learning_rate": 1.9552865077697298e-06, + "loss": 0.8662, + "step": 14360 + }, + { + "epoch": 0.37, + "learning_rate": 1.955278325756221e-06, + "loss": 0.7529, + "step": 14361 + }, + { + "epoch": 0.37, + "learning_rate": 1.9552701430112994e-06, + "loss": 1.2188, + "step": 14362 + }, + { + "epoch": 0.37, + "learning_rate": 1.9552619595349715e-06, + "loss": 0.8232, + "step": 14363 + }, + { + "epoch": 0.37, + "learning_rate": 1.955253775327243e-06, + "loss": 0.7241, + "step": 14364 + }, + { + "epoch": 0.37, + "learning_rate": 1.955245590388121e-06, + "loss": 0.7676, + "step": 14365 + }, + { + "epoch": 0.37, + "learning_rate": 1.9552374047176115e-06, + "loss": 0.8555, + "step": 14366 + }, + { + "epoch": 0.37, + "learning_rate": 1.9552292183157203e-06, + "loss": 0.8091, + "step": 14367 + }, + { + "epoch": 0.37, + "learning_rate": 1.9552210311824544e-06, + "loss": 0.7744, + "step": 14368 + }, + { + "epoch": 0.37, + "learning_rate": 1.9552128433178195e-06, + "loss": 0.8369, + "step": 14369 + }, + { + "epoch": 0.37, + "learning_rate": 1.9552046547218217e-06, + "loss": 0.9834, + "step": 14370 + }, + { + "epoch": 0.37, + "learning_rate": 1.955196465394468e-06, + "loss": 0.8496, + "step": 14371 + }, + { + "epoch": 0.37, + "learning_rate": 1.955188275335764e-06, + "loss": 0.7114, + "step": 14372 + }, + { + "epoch": 0.37, + "learning_rate": 1.9551800845457168e-06, + "loss": 0.9912, + "step": 14373 + }, + { + "epoch": 0.37, + "learning_rate": 1.955171893024332e-06, + "loss": 0.7871, + "step": 14374 + }, + { + "epoch": 0.37, + "learning_rate": 1.9551637007716156e-06, + "loss": 0.835, + "step": 14375 + }, + { + "epoch": 0.37, + "learning_rate": 1.955155507787574e-06, + "loss": 0.7983, + "step": 14376 + }, + { + "epoch": 0.37, + "learning_rate": 1.9551473140722147e-06, + "loss": 1.1182, + "step": 14377 + }, + { + "epoch": 0.37, + "learning_rate": 1.955139119625542e-06, + "loss": 0.9448, + "step": 14378 + }, + { + "epoch": 0.37, + "learning_rate": 1.9551309244475642e-06, + "loss": 0.9219, + "step": 14379 + }, + { + "epoch": 0.37, + "learning_rate": 1.955122728538286e-06, + "loss": 1.0879, + "step": 14380 + }, + { + "epoch": 0.37, + "learning_rate": 1.9551145318977143e-06, + "loss": 1.0195, + "step": 14381 + }, + { + "epoch": 0.37, + "learning_rate": 1.9551063345258554e-06, + "loss": 1.0381, + "step": 14382 + }, + { + "epoch": 0.37, + "learning_rate": 1.9550981364227153e-06, + "loss": 0.8159, + "step": 14383 + }, + { + "epoch": 0.37, + "learning_rate": 1.9550899375883008e-06, + "loss": 0.8711, + "step": 14384 + }, + { + "epoch": 0.37, + "learning_rate": 1.9550817380226176e-06, + "loss": 0.7769, + "step": 14385 + }, + { + "epoch": 0.37, + "learning_rate": 1.9550735377256724e-06, + "loss": 0.8691, + "step": 14386 + }, + { + "epoch": 0.37, + "learning_rate": 1.9550653366974712e-06, + "loss": 0.7559, + "step": 14387 + }, + { + "epoch": 0.37, + "learning_rate": 1.9550571349380202e-06, + "loss": 0.6904, + "step": 14388 + }, + { + "epoch": 0.37, + "learning_rate": 1.955048932447326e-06, + "loss": 0.9346, + "step": 14389 + }, + { + "epoch": 0.37, + "learning_rate": 1.955040729225395e-06, + "loss": 1.0654, + "step": 14390 + }, + { + "epoch": 0.37, + "learning_rate": 1.9550325252722335e-06, + "loss": 0.8701, + "step": 14391 + }, + { + "epoch": 0.37, + "learning_rate": 1.955024320587847e-06, + "loss": 0.8496, + "step": 14392 + }, + { + "epoch": 0.37, + "learning_rate": 1.955016115172242e-06, + "loss": 0.9531, + "step": 14393 + }, + { + "epoch": 0.37, + "learning_rate": 1.9550079090254255e-06, + "loss": 0.8203, + "step": 14394 + }, + { + "epoch": 0.37, + "learning_rate": 1.954999702147403e-06, + "loss": 0.7827, + "step": 14395 + }, + { + "epoch": 0.37, + "learning_rate": 1.9549914945381816e-06, + "loss": 0.9365, + "step": 14396 + }, + { + "epoch": 0.37, + "learning_rate": 1.954983286197767e-06, + "loss": 1.0488, + "step": 14397 + }, + { + "epoch": 0.37, + "learning_rate": 1.9549750771261656e-06, + "loss": 0.9766, + "step": 14398 + }, + { + "epoch": 0.37, + "learning_rate": 1.9549668673233833e-06, + "loss": 0.8965, + "step": 14399 + }, + { + "epoch": 0.37, + "learning_rate": 1.9549586567894274e-06, + "loss": 0.665, + "step": 14400 + }, + { + "epoch": 0.37, + "learning_rate": 1.9549504455243033e-06, + "loss": 0.8887, + "step": 14401 + }, + { + "epoch": 0.37, + "learning_rate": 1.954942233528018e-06, + "loss": 1.1357, + "step": 14402 + }, + { + "epoch": 0.37, + "learning_rate": 1.9549340208005764e-06, + "loss": 0.8477, + "step": 14403 + }, + { + "epoch": 0.37, + "learning_rate": 1.9549258073419864e-06, + "loss": 0.7959, + "step": 14404 + }, + { + "epoch": 0.37, + "learning_rate": 1.954917593152253e-06, + "loss": 0.875, + "step": 14405 + }, + { + "epoch": 0.37, + "learning_rate": 1.9549093782313836e-06, + "loss": 1.1475, + "step": 14406 + }, + { + "epoch": 0.37, + "learning_rate": 1.954901162579384e-06, + "loss": 0.8516, + "step": 14407 + }, + { + "epoch": 0.37, + "learning_rate": 1.9548929461962602e-06, + "loss": 0.9268, + "step": 14408 + }, + { + "epoch": 0.37, + "learning_rate": 1.9548847290820196e-06, + "loss": 1.1777, + "step": 14409 + }, + { + "epoch": 0.37, + "learning_rate": 1.9548765112366667e-06, + "loss": 0.627, + "step": 14410 + }, + { + "epoch": 0.37, + "learning_rate": 1.954868292660209e-06, + "loss": 1.0273, + "step": 14411 + }, + { + "epoch": 0.37, + "learning_rate": 1.954860073352653e-06, + "loss": 0.9033, + "step": 14412 + }, + { + "epoch": 0.37, + "learning_rate": 1.9548518533140043e-06, + "loss": 1.1758, + "step": 14413 + }, + { + "epoch": 0.37, + "learning_rate": 1.9548436325442693e-06, + "loss": 0.9248, + "step": 14414 + }, + { + "epoch": 0.37, + "learning_rate": 1.954835411043454e-06, + "loss": 0.7185, + "step": 14415 + }, + { + "epoch": 0.37, + "learning_rate": 1.9548271888115663e-06, + "loss": 0.8652, + "step": 14416 + }, + { + "epoch": 0.37, + "learning_rate": 1.9548189658486105e-06, + "loss": 0.8193, + "step": 14417 + }, + { + "epoch": 0.37, + "learning_rate": 1.954810742154594e-06, + "loss": 0.7275, + "step": 14418 + }, + { + "epoch": 0.37, + "learning_rate": 1.954802517729523e-06, + "loss": 0.9141, + "step": 14419 + }, + { + "epoch": 0.37, + "learning_rate": 1.9547942925734027e-06, + "loss": 1.0273, + "step": 14420 + }, + { + "epoch": 0.37, + "learning_rate": 1.954786066686241e-06, + "loss": 0.6997, + "step": 14421 + }, + { + "epoch": 0.37, + "learning_rate": 1.9547778400680434e-06, + "loss": 0.8115, + "step": 14422 + }, + { + "epoch": 0.37, + "learning_rate": 1.9547696127188165e-06, + "loss": 0.8799, + "step": 14423 + }, + { + "epoch": 0.37, + "learning_rate": 1.9547613846385663e-06, + "loss": 1.0605, + "step": 14424 + }, + { + "epoch": 0.37, + "learning_rate": 1.954753155827299e-06, + "loss": 0.9102, + "step": 14425 + }, + { + "epoch": 0.37, + "learning_rate": 1.9547449262850213e-06, + "loss": 0.7666, + "step": 14426 + }, + { + "epoch": 0.37, + "learning_rate": 1.9547366960117397e-06, + "loss": 0.9775, + "step": 14427 + }, + { + "epoch": 0.37, + "learning_rate": 1.9547284650074593e-06, + "loss": 0.8281, + "step": 14428 + }, + { + "epoch": 0.37, + "learning_rate": 1.954720233272188e-06, + "loss": 0.6035, + "step": 14429 + }, + { + "epoch": 0.37, + "learning_rate": 1.9547120008059307e-06, + "loss": 0.9824, + "step": 14430 + }, + { + "epoch": 0.37, + "learning_rate": 1.9547037676086947e-06, + "loss": 1.0811, + "step": 14431 + }, + { + "epoch": 0.37, + "learning_rate": 1.9546955336804854e-06, + "loss": 1.1816, + "step": 14432 + }, + { + "epoch": 0.37, + "learning_rate": 1.95468729902131e-06, + "loss": 0.8345, + "step": 14433 + }, + { + "epoch": 0.37, + "learning_rate": 1.9546790636311747e-06, + "loss": 0.9177, + "step": 14434 + }, + { + "epoch": 0.37, + "learning_rate": 1.954670827510085e-06, + "loss": 1.0225, + "step": 14435 + }, + { + "epoch": 0.37, + "learning_rate": 1.954662590658048e-06, + "loss": 0.8525, + "step": 14436 + }, + { + "epoch": 0.37, + "learning_rate": 1.95465435307507e-06, + "loss": 0.748, + "step": 14437 + }, + { + "epoch": 0.37, + "learning_rate": 1.954646114761157e-06, + "loss": 0.8779, + "step": 14438 + }, + { + "epoch": 0.37, + "learning_rate": 1.954637875716315e-06, + "loss": 0.9912, + "step": 14439 + }, + { + "epoch": 0.37, + "learning_rate": 1.954629635940551e-06, + "loss": 1.0215, + "step": 14440 + }, + { + "epoch": 0.37, + "learning_rate": 1.9546213954338707e-06, + "loss": 0.6445, + "step": 14441 + }, + { + "epoch": 0.37, + "learning_rate": 1.954613154196281e-06, + "loss": 0.9727, + "step": 14442 + }, + { + "epoch": 0.37, + "learning_rate": 1.954604912227788e-06, + "loss": 0.7471, + "step": 14443 + }, + { + "epoch": 0.37, + "learning_rate": 1.9545966695283973e-06, + "loss": 0.9404, + "step": 14444 + }, + { + "epoch": 0.37, + "learning_rate": 1.954588426098116e-06, + "loss": 0.7568, + "step": 14445 + }, + { + "epoch": 0.37, + "learning_rate": 1.954580181936951e-06, + "loss": 1.0713, + "step": 14446 + }, + { + "epoch": 0.37, + "learning_rate": 1.9545719370449068e-06, + "loss": 0.9893, + "step": 14447 + }, + { + "epoch": 0.37, + "learning_rate": 1.9545636914219914e-06, + "loss": 0.6655, + "step": 14448 + }, + { + "epoch": 0.37, + "learning_rate": 1.9545554450682102e-06, + "loss": 0.7947, + "step": 14449 + }, + { + "epoch": 0.37, + "learning_rate": 1.95454719798357e-06, + "loss": 1.0723, + "step": 14450 + }, + { + "epoch": 0.37, + "learning_rate": 1.954538950168077e-06, + "loss": 0.6992, + "step": 14451 + }, + { + "epoch": 0.37, + "learning_rate": 1.954530701621737e-06, + "loss": 0.8584, + "step": 14452 + }, + { + "epoch": 0.37, + "learning_rate": 1.954522452344557e-06, + "loss": 0.8838, + "step": 14453 + }, + { + "epoch": 0.37, + "learning_rate": 1.954514202336543e-06, + "loss": 0.6987, + "step": 14454 + }, + { + "epoch": 0.37, + "learning_rate": 1.9545059515977014e-06, + "loss": 0.9482, + "step": 14455 + }, + { + "epoch": 0.37, + "learning_rate": 1.954497700128038e-06, + "loss": 0.9902, + "step": 14456 + }, + { + "epoch": 0.37, + "learning_rate": 1.9544894479275604e-06, + "loss": 1.0117, + "step": 14457 + }, + { + "epoch": 0.37, + "learning_rate": 1.9544811949962736e-06, + "loss": 0.9248, + "step": 14458 + }, + { + "epoch": 0.37, + "learning_rate": 1.9544729413341847e-06, + "loss": 0.6807, + "step": 14459 + }, + { + "epoch": 0.37, + "learning_rate": 1.9544646869412993e-06, + "loss": 0.7695, + "step": 14460 + }, + { + "epoch": 0.37, + "learning_rate": 1.954456431817625e-06, + "loss": 0.7764, + "step": 14461 + }, + { + "epoch": 0.37, + "learning_rate": 1.954448175963167e-06, + "loss": 0.7505, + "step": 14462 + }, + { + "epoch": 0.37, + "learning_rate": 1.9544399193779312e-06, + "loss": 0.8984, + "step": 14463 + }, + { + "epoch": 0.37, + "learning_rate": 1.954431662061925e-06, + "loss": 0.8789, + "step": 14464 + }, + { + "epoch": 0.37, + "learning_rate": 1.9544234040151548e-06, + "loss": 0.8584, + "step": 14465 + }, + { + "epoch": 0.37, + "learning_rate": 1.9544151452376263e-06, + "loss": 0.752, + "step": 14466 + }, + { + "epoch": 0.37, + "learning_rate": 1.954406885729346e-06, + "loss": 0.6335, + "step": 14467 + }, + { + "epoch": 0.37, + "learning_rate": 1.95439862549032e-06, + "loss": 0.7612, + "step": 14468 + }, + { + "epoch": 0.37, + "learning_rate": 1.954390364520555e-06, + "loss": 0.835, + "step": 14469 + }, + { + "epoch": 0.37, + "learning_rate": 1.9543821028200574e-06, + "loss": 0.7104, + "step": 14470 + }, + { + "epoch": 0.37, + "learning_rate": 1.954373840388833e-06, + "loss": 0.8828, + "step": 14471 + }, + { + "epoch": 0.37, + "learning_rate": 1.9543655772268886e-06, + "loss": 0.835, + "step": 14472 + }, + { + "epoch": 0.37, + "learning_rate": 1.9543573133342302e-06, + "loss": 0.9336, + "step": 14473 + }, + { + "epoch": 0.37, + "learning_rate": 1.9543490487108645e-06, + "loss": 0.9531, + "step": 14474 + }, + { + "epoch": 0.37, + "learning_rate": 1.9543407833567977e-06, + "loss": 0.7827, + "step": 14475 + }, + { + "epoch": 0.37, + "learning_rate": 1.954332517272036e-06, + "loss": 0.751, + "step": 14476 + }, + { + "epoch": 0.37, + "learning_rate": 1.9543242504565852e-06, + "loss": 0.7568, + "step": 14477 + }, + { + "epoch": 0.37, + "learning_rate": 1.9543159829104527e-06, + "loss": 1.0947, + "step": 14478 + }, + { + "epoch": 0.37, + "learning_rate": 1.954307714633644e-06, + "loss": 0.9258, + "step": 14479 + }, + { + "epoch": 0.37, + "learning_rate": 1.9542994456261662e-06, + "loss": 0.7832, + "step": 14480 + }, + { + "epoch": 0.37, + "learning_rate": 1.954291175888025e-06, + "loss": 1.0, + "step": 14481 + }, + { + "epoch": 0.37, + "learning_rate": 1.9542829054192273e-06, + "loss": 0.9014, + "step": 14482 + }, + { + "epoch": 0.37, + "learning_rate": 1.9542746342197785e-06, + "loss": 0.7715, + "step": 14483 + }, + { + "epoch": 0.37, + "learning_rate": 1.954266362289686e-06, + "loss": 0.9922, + "step": 14484 + }, + { + "epoch": 0.37, + "learning_rate": 1.954258089628955e-06, + "loss": 0.6709, + "step": 14485 + }, + { + "epoch": 0.37, + "learning_rate": 1.954249816237593e-06, + "loss": 0.918, + "step": 14486 + }, + { + "epoch": 0.37, + "learning_rate": 1.954241542115605e-06, + "loss": 0.7173, + "step": 14487 + }, + { + "epoch": 0.37, + "learning_rate": 1.954233267262999e-06, + "loss": 0.708, + "step": 14488 + }, + { + "epoch": 0.37, + "learning_rate": 1.9542249916797803e-06, + "loss": 0.8911, + "step": 14489 + }, + { + "epoch": 0.37, + "learning_rate": 1.954216715365955e-06, + "loss": 0.6816, + "step": 14490 + }, + { + "epoch": 0.37, + "learning_rate": 1.95420843832153e-06, + "loss": 0.957, + "step": 14491 + }, + { + "epoch": 0.37, + "learning_rate": 1.9542001605465116e-06, + "loss": 0.7969, + "step": 14492 + }, + { + "epoch": 0.37, + "learning_rate": 1.954191882040906e-06, + "loss": 0.8848, + "step": 14493 + }, + { + "epoch": 0.37, + "learning_rate": 1.9541836028047197e-06, + "loss": 0.9795, + "step": 14494 + }, + { + "epoch": 0.37, + "learning_rate": 1.9541753228379586e-06, + "loss": 1.0898, + "step": 14495 + }, + { + "epoch": 0.37, + "learning_rate": 1.9541670421406294e-06, + "loss": 0.9521, + "step": 14496 + }, + { + "epoch": 0.37, + "learning_rate": 1.9541587607127386e-06, + "loss": 0.8506, + "step": 14497 + }, + { + "epoch": 0.37, + "learning_rate": 1.9541504785542924e-06, + "loss": 0.9258, + "step": 14498 + }, + { + "epoch": 0.37, + "learning_rate": 1.9541421956652964e-06, + "loss": 0.9346, + "step": 14499 + }, + { + "epoch": 0.37, + "learning_rate": 1.9541339120457582e-06, + "loss": 0.9395, + "step": 14500 + }, + { + "epoch": 0.37, + "learning_rate": 1.9541256276956834e-06, + "loss": 0.7554, + "step": 14501 + }, + { + "epoch": 0.37, + "learning_rate": 1.954117342615078e-06, + "loss": 1.0537, + "step": 14502 + }, + { + "epoch": 0.37, + "learning_rate": 1.9541090568039493e-06, + "loss": 0.7256, + "step": 14503 + }, + { + "epoch": 0.37, + "learning_rate": 1.9541007702623033e-06, + "loss": 0.9824, + "step": 14504 + }, + { + "epoch": 0.37, + "learning_rate": 1.954092482990146e-06, + "loss": 0.8408, + "step": 14505 + }, + { + "epoch": 0.37, + "learning_rate": 1.954084194987484e-06, + "loss": 0.9795, + "step": 14506 + }, + { + "epoch": 0.37, + "learning_rate": 1.9540759062543235e-06, + "loss": 1.1113, + "step": 14507 + }, + { + "epoch": 0.37, + "learning_rate": 1.9540676167906713e-06, + "loss": 1.0049, + "step": 14508 + }, + { + "epoch": 0.37, + "learning_rate": 1.954059326596533e-06, + "loss": 0.8027, + "step": 14509 + }, + { + "epoch": 0.37, + "learning_rate": 1.9540510356719152e-06, + "loss": 1.0322, + "step": 14510 + }, + { + "epoch": 0.37, + "learning_rate": 1.954042744016825e-06, + "loss": 0.9541, + "step": 14511 + }, + { + "epoch": 0.37, + "learning_rate": 1.9540344516312674e-06, + "loss": 0.7871, + "step": 14512 + }, + { + "epoch": 0.37, + "learning_rate": 1.95402615851525e-06, + "loss": 0.8525, + "step": 14513 + }, + { + "epoch": 0.37, + "learning_rate": 1.9540178646687785e-06, + "loss": 0.792, + "step": 14514 + }, + { + "epoch": 0.37, + "learning_rate": 1.9540095700918595e-06, + "loss": 0.7656, + "step": 14515 + }, + { + "epoch": 0.37, + "learning_rate": 1.954001274784499e-06, + "loss": 0.7764, + "step": 14516 + }, + { + "epoch": 0.37, + "learning_rate": 1.9539929787467036e-06, + "loss": 0.9775, + "step": 14517 + }, + { + "epoch": 0.37, + "learning_rate": 1.95398468197848e-06, + "loss": 0.8857, + "step": 14518 + }, + { + "epoch": 0.37, + "learning_rate": 1.9539763844798337e-06, + "loss": 0.9209, + "step": 14519 + }, + { + "epoch": 0.37, + "learning_rate": 1.953968086250772e-06, + "loss": 0.8955, + "step": 14520 + }, + { + "epoch": 0.37, + "learning_rate": 1.9539597872913003e-06, + "loss": 1.084, + "step": 14521 + }, + { + "epoch": 0.37, + "learning_rate": 1.9539514876014257e-06, + "loss": 0.8418, + "step": 14522 + }, + { + "epoch": 0.37, + "learning_rate": 1.9539431871811546e-06, + "loss": 0.9639, + "step": 14523 + }, + { + "epoch": 0.37, + "learning_rate": 1.9539348860304925e-06, + "loss": 0.8096, + "step": 14524 + }, + { + "epoch": 0.37, + "learning_rate": 1.953926584149447e-06, + "loss": 0.7778, + "step": 14525 + }, + { + "epoch": 0.37, + "learning_rate": 1.9539182815380232e-06, + "loss": 0.7881, + "step": 14526 + }, + { + "epoch": 0.37, + "learning_rate": 1.9539099781962283e-06, + "loss": 0.9863, + "step": 14527 + }, + { + "epoch": 0.37, + "learning_rate": 1.9539016741240687e-06, + "loss": 0.9199, + "step": 14528 + }, + { + "epoch": 0.37, + "learning_rate": 1.95389336932155e-06, + "loss": 0.8828, + "step": 14529 + }, + { + "epoch": 0.37, + "learning_rate": 1.953885063788679e-06, + "loss": 0.7876, + "step": 14530 + }, + { + "epoch": 0.37, + "learning_rate": 1.9538767575254623e-06, + "loss": 0.9521, + "step": 14531 + }, + { + "epoch": 0.37, + "learning_rate": 1.953868450531906e-06, + "loss": 1.0488, + "step": 14532 + }, + { + "epoch": 0.37, + "learning_rate": 1.953860142808016e-06, + "loss": 1.0664, + "step": 14533 + }, + { + "epoch": 0.37, + "learning_rate": 1.9538518343537998e-06, + "loss": 0.7295, + "step": 14534 + }, + { + "epoch": 0.37, + "learning_rate": 1.9538435251692627e-06, + "loss": 1.0195, + "step": 14535 + }, + { + "epoch": 0.37, + "learning_rate": 1.9538352152544116e-06, + "loss": 0.8984, + "step": 14536 + }, + { + "epoch": 0.37, + "learning_rate": 1.953826904609253e-06, + "loss": 0.8691, + "step": 14537 + }, + { + "epoch": 0.37, + "learning_rate": 1.9538185932337928e-06, + "loss": 1.0977, + "step": 14538 + }, + { + "epoch": 0.37, + "learning_rate": 1.9538102811280372e-06, + "loss": 0.8174, + "step": 14539 + }, + { + "epoch": 0.37, + "learning_rate": 1.953801968291993e-06, + "loss": 0.916, + "step": 14540 + }, + { + "epoch": 0.37, + "learning_rate": 1.953793654725667e-06, + "loss": 1.0215, + "step": 14541 + }, + { + "epoch": 0.37, + "learning_rate": 1.9537853404290646e-06, + "loss": 0.9443, + "step": 14542 + }, + { + "epoch": 0.37, + "learning_rate": 1.953777025402193e-06, + "loss": 0.8262, + "step": 14543 + }, + { + "epoch": 0.37, + "learning_rate": 1.953768709645058e-06, + "loss": 0.7871, + "step": 14544 + }, + { + "epoch": 0.37, + "learning_rate": 1.9537603931576663e-06, + "loss": 0.7676, + "step": 14545 + }, + { + "epoch": 0.37, + "learning_rate": 1.9537520759400238e-06, + "loss": 0.9883, + "step": 14546 + }, + { + "epoch": 0.37, + "learning_rate": 1.9537437579921376e-06, + "loss": 0.7734, + "step": 14547 + }, + { + "epoch": 0.37, + "learning_rate": 1.9537354393140133e-06, + "loss": 1.0713, + "step": 14548 + }, + { + "epoch": 0.37, + "learning_rate": 1.9537271199056576e-06, + "loss": 1.0107, + "step": 14549 + }, + { + "epoch": 0.37, + "learning_rate": 1.9537187997670774e-06, + "loss": 0.9229, + "step": 14550 + }, + { + "epoch": 0.37, + "learning_rate": 1.9537104788982777e-06, + "loss": 0.8525, + "step": 14551 + }, + { + "epoch": 0.37, + "learning_rate": 1.9537021572992666e-06, + "loss": 1.0752, + "step": 14552 + }, + { + "epoch": 0.37, + "learning_rate": 1.953693834970049e-06, + "loss": 1.0723, + "step": 14553 + }, + { + "epoch": 0.37, + "learning_rate": 1.953685511910632e-06, + "loss": 1.1221, + "step": 14554 + }, + { + "epoch": 0.37, + "learning_rate": 1.9536771881210222e-06, + "loss": 0.9775, + "step": 14555 + }, + { + "epoch": 0.37, + "learning_rate": 1.9536688636012255e-06, + "loss": 0.9229, + "step": 14556 + }, + { + "epoch": 0.37, + "learning_rate": 1.9536605383512483e-06, + "loss": 0.9707, + "step": 14557 + }, + { + "epoch": 0.37, + "learning_rate": 1.953652212371097e-06, + "loss": 0.9561, + "step": 14558 + }, + { + "epoch": 0.37, + "learning_rate": 1.9536438856607785e-06, + "loss": 0.7974, + "step": 14559 + }, + { + "epoch": 0.37, + "learning_rate": 1.9536355582202983e-06, + "loss": 0.6421, + "step": 14560 + }, + { + "epoch": 0.37, + "learning_rate": 1.9536272300496634e-06, + "loss": 0.8662, + "step": 14561 + }, + { + "epoch": 0.37, + "learning_rate": 1.9536189011488797e-06, + "loss": 1.0029, + "step": 14562 + }, + { + "epoch": 0.37, + "learning_rate": 1.953610571517954e-06, + "loss": 0.9658, + "step": 14563 + }, + { + "epoch": 0.37, + "learning_rate": 1.9536022411568927e-06, + "loss": 0.8115, + "step": 14564 + }, + { + "epoch": 0.37, + "learning_rate": 1.9535939100657013e-06, + "loss": 0.8545, + "step": 14565 + }, + { + "epoch": 0.37, + "learning_rate": 1.953585578244388e-06, + "loss": 0.8633, + "step": 14566 + }, + { + "epoch": 0.37, + "learning_rate": 1.9535772456929574e-06, + "loss": 1.0059, + "step": 14567 + }, + { + "epoch": 0.37, + "learning_rate": 1.9535689124114167e-06, + "loss": 1.0078, + "step": 14568 + }, + { + "epoch": 0.37, + "learning_rate": 1.9535605783997718e-06, + "loss": 0.7871, + "step": 14569 + }, + { + "epoch": 0.37, + "learning_rate": 1.9535522436580297e-06, + "loss": 1.0107, + "step": 14570 + }, + { + "epoch": 0.37, + "learning_rate": 1.9535439081861965e-06, + "loss": 0.7949, + "step": 14571 + }, + { + "epoch": 0.37, + "learning_rate": 1.953535571984279e-06, + "loss": 0.875, + "step": 14572 + }, + { + "epoch": 0.37, + "learning_rate": 1.9535272350522825e-06, + "loss": 0.7822, + "step": 14573 + }, + { + "epoch": 0.37, + "learning_rate": 1.9535188973902144e-06, + "loss": 0.877, + "step": 14574 + }, + { + "epoch": 0.37, + "learning_rate": 1.9535105589980805e-06, + "loss": 0.5229, + "step": 14575 + }, + { + "epoch": 0.37, + "learning_rate": 1.9535022198758877e-06, + "loss": 0.6836, + "step": 14576 + }, + { + "epoch": 0.37, + "learning_rate": 1.953493880023642e-06, + "loss": 0.7515, + "step": 14577 + }, + { + "epoch": 0.37, + "learning_rate": 1.9534855394413492e-06, + "loss": 0.9629, + "step": 14578 + }, + { + "epoch": 0.37, + "learning_rate": 1.9534771981290176e-06, + "loss": 0.9023, + "step": 14579 + }, + { + "epoch": 0.37, + "learning_rate": 1.9534688560866516e-06, + "loss": 0.7585, + "step": 14580 + }, + { + "epoch": 0.37, + "learning_rate": 1.9534605133142584e-06, + "loss": 0.7891, + "step": 14581 + }, + { + "epoch": 0.37, + "learning_rate": 1.9534521698118443e-06, + "loss": 0.9336, + "step": 14582 + }, + { + "epoch": 0.37, + "learning_rate": 1.9534438255794157e-06, + "loss": 0.8584, + "step": 14583 + }, + { + "epoch": 0.37, + "learning_rate": 1.9534354806169794e-06, + "loss": 0.8438, + "step": 14584 + }, + { + "epoch": 0.37, + "learning_rate": 1.953427134924541e-06, + "loss": 0.5938, + "step": 14585 + }, + { + "epoch": 0.37, + "learning_rate": 1.9534187885021073e-06, + "loss": 1.0234, + "step": 14586 + }, + { + "epoch": 0.37, + "learning_rate": 1.9534104413496847e-06, + "loss": 0.9648, + "step": 14587 + }, + { + "epoch": 0.37, + "learning_rate": 1.9534020934672794e-06, + "loss": 0.9268, + "step": 14588 + }, + { + "epoch": 0.37, + "learning_rate": 1.9533937448548985e-06, + "loss": 0.7153, + "step": 14589 + }, + { + "epoch": 0.37, + "learning_rate": 1.953385395512547e-06, + "loss": 0.686, + "step": 14590 + }, + { + "epoch": 0.37, + "learning_rate": 1.953377045440233e-06, + "loss": 1.1748, + "step": 14591 + }, + { + "epoch": 0.37, + "learning_rate": 1.9533686946379614e-06, + "loss": 1.1523, + "step": 14592 + }, + { + "epoch": 0.37, + "learning_rate": 1.95336034310574e-06, + "loss": 0.8013, + "step": 14593 + }, + { + "epoch": 0.37, + "learning_rate": 1.9533519908435736e-06, + "loss": 0.9375, + "step": 14594 + }, + { + "epoch": 0.37, + "learning_rate": 1.9533436378514695e-06, + "loss": 0.916, + "step": 14595 + }, + { + "epoch": 0.37, + "learning_rate": 1.9533352841294348e-06, + "loss": 0.8721, + "step": 14596 + }, + { + "epoch": 0.37, + "learning_rate": 1.953326929677474e-06, + "loss": 0.6052, + "step": 14597 + }, + { + "epoch": 0.37, + "learning_rate": 1.9533185744955954e-06, + "loss": 0.9248, + "step": 14598 + }, + { + "epoch": 0.37, + "learning_rate": 1.9533102185838043e-06, + "loss": 0.8787, + "step": 14599 + }, + { + "epoch": 0.37, + "learning_rate": 1.9533018619421076e-06, + "loss": 0.9209, + "step": 14600 + }, + { + "epoch": 0.37, + "learning_rate": 1.953293504570511e-06, + "loss": 0.833, + "step": 14601 + }, + { + "epoch": 0.37, + "learning_rate": 1.953285146469022e-06, + "loss": 0.8564, + "step": 14602 + }, + { + "epoch": 0.37, + "learning_rate": 1.953276787637646e-06, + "loss": 0.834, + "step": 14603 + }, + { + "epoch": 0.37, + "learning_rate": 1.9532684280763903e-06, + "loss": 0.9551, + "step": 14604 + }, + { + "epoch": 0.37, + "learning_rate": 1.95326006778526e-06, + "loss": 0.769, + "step": 14605 + }, + { + "epoch": 0.37, + "learning_rate": 1.953251706764263e-06, + "loss": 0.8682, + "step": 14606 + }, + { + "epoch": 0.37, + "learning_rate": 1.953243345013405e-06, + "loss": 0.873, + "step": 14607 + }, + { + "epoch": 0.37, + "learning_rate": 1.953234982532692e-06, + "loss": 0.8994, + "step": 14608 + }, + { + "epoch": 0.37, + "learning_rate": 1.9532266193221308e-06, + "loss": 0.9102, + "step": 14609 + }, + { + "epoch": 0.37, + "learning_rate": 1.953218255381728e-06, + "loss": 0.8818, + "step": 14610 + }, + { + "epoch": 0.37, + "learning_rate": 1.95320989071149e-06, + "loss": 0.7803, + "step": 14611 + }, + { + "epoch": 0.37, + "learning_rate": 1.953201525311423e-06, + "loss": 0.9482, + "step": 14612 + }, + { + "epoch": 0.37, + "learning_rate": 1.9531931591815328e-06, + "loss": 1.0801, + "step": 14613 + }, + { + "epoch": 0.37, + "learning_rate": 1.953184792321827e-06, + "loss": 0.8633, + "step": 14614 + }, + { + "epoch": 0.37, + "learning_rate": 1.9531764247323115e-06, + "loss": 0.915, + "step": 14615 + }, + { + "epoch": 0.37, + "learning_rate": 1.953168056412992e-06, + "loss": 0.8711, + "step": 14616 + }, + { + "epoch": 0.37, + "learning_rate": 1.9531596873638762e-06, + "loss": 0.7539, + "step": 14617 + }, + { + "epoch": 0.37, + "learning_rate": 1.9531513175849695e-06, + "loss": 0.8477, + "step": 14618 + }, + { + "epoch": 0.37, + "learning_rate": 1.9531429470762787e-06, + "loss": 1.0518, + "step": 14619 + }, + { + "epoch": 0.37, + "learning_rate": 1.95313457583781e-06, + "loss": 0.9302, + "step": 14620 + }, + { + "epoch": 0.37, + "learning_rate": 1.9531262038695707e-06, + "loss": 0.8457, + "step": 14621 + }, + { + "epoch": 0.37, + "learning_rate": 1.953117831171566e-06, + "loss": 0.8325, + "step": 14622 + }, + { + "epoch": 0.37, + "learning_rate": 1.953109457743803e-06, + "loss": 0.8408, + "step": 14623 + }, + { + "epoch": 0.37, + "learning_rate": 1.953101083586287e-06, + "loss": 0.9077, + "step": 14624 + }, + { + "epoch": 0.37, + "learning_rate": 1.9530927086990264e-06, + "loss": 0.7532, + "step": 14625 + }, + { + "epoch": 0.37, + "learning_rate": 1.9530843330820265e-06, + "loss": 0.8037, + "step": 14626 + }, + { + "epoch": 0.37, + "learning_rate": 1.9530759567352932e-06, + "loss": 0.5752, + "step": 14627 + }, + { + "epoch": 0.37, + "learning_rate": 1.953067579658834e-06, + "loss": 0.76, + "step": 14628 + }, + { + "epoch": 0.37, + "learning_rate": 1.9530592018526544e-06, + "loss": 1.0117, + "step": 14629 + }, + { + "epoch": 0.37, + "learning_rate": 1.953050823316761e-06, + "loss": 0.6641, + "step": 14630 + }, + { + "epoch": 0.38, + "learning_rate": 1.953042444051161e-06, + "loss": 1.0098, + "step": 14631 + }, + { + "epoch": 0.38, + "learning_rate": 1.95303406405586e-06, + "loss": 0.7395, + "step": 14632 + }, + { + "epoch": 0.38, + "learning_rate": 1.9530256833308645e-06, + "loss": 0.9111, + "step": 14633 + }, + { + "epoch": 0.38, + "learning_rate": 1.9530173018761808e-06, + "loss": 1.0957, + "step": 14634 + }, + { + "epoch": 0.38, + "learning_rate": 1.953008919691816e-06, + "loss": 0.9629, + "step": 14635 + }, + { + "epoch": 0.38, + "learning_rate": 1.953000536777776e-06, + "loss": 0.9551, + "step": 14636 + }, + { + "epoch": 0.38, + "learning_rate": 1.952992153134067e-06, + "loss": 0.8398, + "step": 14637 + }, + { + "epoch": 0.38, + "learning_rate": 1.9529837687606963e-06, + "loss": 0.9287, + "step": 14638 + }, + { + "epoch": 0.38, + "learning_rate": 1.9529753836576694e-06, + "loss": 1.0889, + "step": 14639 + }, + { + "epoch": 0.38, + "learning_rate": 1.9529669978249934e-06, + "loss": 0.9072, + "step": 14640 + }, + { + "epoch": 0.38, + "learning_rate": 1.952958611262674e-06, + "loss": 0.873, + "step": 14641 + }, + { + "epoch": 0.38, + "learning_rate": 1.952950223970718e-06, + "loss": 0.9863, + "step": 14642 + }, + { + "epoch": 0.38, + "learning_rate": 1.952941835949132e-06, + "loss": 0.7153, + "step": 14643 + }, + { + "epoch": 0.38, + "learning_rate": 1.9529334471979222e-06, + "loss": 0.834, + "step": 14644 + }, + { + "epoch": 0.38, + "learning_rate": 1.952925057717095e-06, + "loss": 0.9277, + "step": 14645 + }, + { + "epoch": 0.38, + "learning_rate": 1.952916667506657e-06, + "loss": 0.9209, + "step": 14646 + }, + { + "epoch": 0.38, + "learning_rate": 1.9529082765666146e-06, + "loss": 0.9434, + "step": 14647 + }, + { + "epoch": 0.38, + "learning_rate": 1.9528998848969744e-06, + "loss": 0.6096, + "step": 14648 + }, + { + "epoch": 0.38, + "learning_rate": 1.952891492497742e-06, + "loss": 0.998, + "step": 14649 + }, + { + "epoch": 0.38, + "learning_rate": 1.9528830993689245e-06, + "loss": 0.665, + "step": 14650 + }, + { + "epoch": 0.38, + "learning_rate": 1.9528747055105284e-06, + "loss": 0.7725, + "step": 14651 + }, + { + "epoch": 0.38, + "learning_rate": 1.95286631092256e-06, + "loss": 0.8193, + "step": 14652 + }, + { + "epoch": 0.38, + "learning_rate": 1.9528579156050253e-06, + "loss": 0.874, + "step": 14653 + }, + { + "epoch": 0.38, + "learning_rate": 1.9528495195579316e-06, + "loss": 0.8906, + "step": 14654 + }, + { + "epoch": 0.38, + "learning_rate": 1.9528411227812846e-06, + "loss": 0.7988, + "step": 14655 + }, + { + "epoch": 0.38, + "learning_rate": 1.952832725275091e-06, + "loss": 0.8223, + "step": 14656 + }, + { + "epoch": 0.38, + "learning_rate": 1.9528243270393574e-06, + "loss": 1.0674, + "step": 14657 + }, + { + "epoch": 0.38, + "learning_rate": 1.9528159280740895e-06, + "loss": 0.7593, + "step": 14658 + }, + { + "epoch": 0.38, + "learning_rate": 1.952807528379295e-06, + "loss": 0.9844, + "step": 14659 + }, + { + "epoch": 0.38, + "learning_rate": 1.952799127954979e-06, + "loss": 0.8418, + "step": 14660 + }, + { + "epoch": 0.38, + "learning_rate": 1.9527907268011485e-06, + "loss": 0.8545, + "step": 14661 + }, + { + "epoch": 0.38, + "learning_rate": 1.95278232491781e-06, + "loss": 0.8066, + "step": 14662 + }, + { + "epoch": 0.38, + "learning_rate": 1.95277392230497e-06, + "loss": 0.8379, + "step": 14663 + }, + { + "epoch": 0.38, + "learning_rate": 1.952765518962635e-06, + "loss": 0.7432, + "step": 14664 + }, + { + "epoch": 0.38, + "learning_rate": 1.9527571148908112e-06, + "loss": 1.0254, + "step": 14665 + }, + { + "epoch": 0.38, + "learning_rate": 1.952748710089505e-06, + "loss": 1.1367, + "step": 14666 + }, + { + "epoch": 0.38, + "learning_rate": 1.952740304558723e-06, + "loss": 1.0166, + "step": 14667 + }, + { + "epoch": 0.38, + "learning_rate": 1.9527318982984714e-06, + "loss": 1.1436, + "step": 14668 + }, + { + "epoch": 0.38, + "learning_rate": 1.9527234913087568e-06, + "loss": 1.1729, + "step": 14669 + }, + { + "epoch": 0.38, + "learning_rate": 1.9527150835895855e-06, + "loss": 0.9453, + "step": 14670 + }, + { + "epoch": 0.38, + "learning_rate": 1.9527066751409646e-06, + "loss": 1.0752, + "step": 14671 + }, + { + "epoch": 0.38, + "learning_rate": 1.9526982659628993e-06, + "loss": 0.9551, + "step": 14672 + }, + { + "epoch": 0.38, + "learning_rate": 1.9526898560553972e-06, + "loss": 0.9805, + "step": 14673 + }, + { + "epoch": 0.38, + "learning_rate": 1.9526814454184642e-06, + "loss": 0.8828, + "step": 14674 + }, + { + "epoch": 0.38, + "learning_rate": 1.9526730340521067e-06, + "loss": 0.9355, + "step": 14675 + }, + { + "epoch": 0.38, + "learning_rate": 1.9526646219563314e-06, + "loss": 1.1162, + "step": 14676 + }, + { + "epoch": 0.38, + "learning_rate": 1.9526562091311447e-06, + "loss": 0.9697, + "step": 14677 + }, + { + "epoch": 0.38, + "learning_rate": 1.9526477955765525e-06, + "loss": 0.9297, + "step": 14678 + }, + { + "epoch": 0.38, + "learning_rate": 1.952639381292562e-06, + "loss": 0.7864, + "step": 14679 + }, + { + "epoch": 0.38, + "learning_rate": 1.952630966279179e-06, + "loss": 0.9941, + "step": 14680 + }, + { + "epoch": 0.38, + "learning_rate": 1.9526225505364107e-06, + "loss": 0.7202, + "step": 14681 + }, + { + "epoch": 0.38, + "learning_rate": 1.952614134064263e-06, + "loss": 0.856, + "step": 14682 + }, + { + "epoch": 0.38, + "learning_rate": 1.9526057168627426e-06, + "loss": 0.9785, + "step": 14683 + }, + { + "epoch": 0.38, + "learning_rate": 1.952597298931856e-06, + "loss": 0.8311, + "step": 14684 + }, + { + "epoch": 0.38, + "learning_rate": 1.9525888802716092e-06, + "loss": 0.8984, + "step": 14685 + }, + { + "epoch": 0.38, + "learning_rate": 1.9525804608820086e-06, + "loss": 0.834, + "step": 14686 + }, + { + "epoch": 0.38, + "learning_rate": 1.9525720407630614e-06, + "loss": 0.821, + "step": 14687 + }, + { + "epoch": 0.38, + "learning_rate": 1.952563619914773e-06, + "loss": 1.0322, + "step": 14688 + }, + { + "epoch": 0.38, + "learning_rate": 1.952555198337151e-06, + "loss": 1.0137, + "step": 14689 + }, + { + "epoch": 0.38, + "learning_rate": 1.952546776030201e-06, + "loss": 0.7893, + "step": 14690 + }, + { + "epoch": 0.38, + "learning_rate": 1.9525383529939298e-06, + "loss": 0.7959, + "step": 14691 + }, + { + "epoch": 0.38, + "learning_rate": 1.9525299292283435e-06, + "loss": 1.0381, + "step": 14692 + }, + { + "epoch": 0.38, + "learning_rate": 1.9525215047334492e-06, + "loss": 0.6711, + "step": 14693 + }, + { + "epoch": 0.38, + "learning_rate": 1.952513079509253e-06, + "loss": 0.8242, + "step": 14694 + }, + { + "epoch": 0.38, + "learning_rate": 1.9525046535557614e-06, + "loss": 0.8848, + "step": 14695 + }, + { + "epoch": 0.38, + "learning_rate": 1.9524962268729805e-06, + "loss": 0.9424, + "step": 14696 + }, + { + "epoch": 0.38, + "learning_rate": 1.952487799460917e-06, + "loss": 0.8662, + "step": 14697 + }, + { + "epoch": 0.38, + "learning_rate": 1.9524793713195777e-06, + "loss": 0.7368, + "step": 14698 + }, + { + "epoch": 0.38, + "learning_rate": 1.9524709424489683e-06, + "loss": 1.0107, + "step": 14699 + }, + { + "epoch": 0.38, + "learning_rate": 1.9524625128490962e-06, + "loss": 0.9004, + "step": 14700 + }, + { + "epoch": 0.38, + "learning_rate": 1.9524540825199673e-06, + "loss": 0.7053, + "step": 14701 + }, + { + "epoch": 0.38, + "learning_rate": 1.952445651461588e-06, + "loss": 0.9121, + "step": 14702 + }, + { + "epoch": 0.38, + "learning_rate": 1.9524372196739644e-06, + "loss": 0.709, + "step": 14703 + }, + { + "epoch": 0.38, + "learning_rate": 1.952428787157104e-06, + "loss": 0.8125, + "step": 14704 + }, + { + "epoch": 0.38, + "learning_rate": 1.9524203539110125e-06, + "loss": 0.833, + "step": 14705 + }, + { + "epoch": 0.38, + "learning_rate": 1.9524119199356964e-06, + "loss": 0.7949, + "step": 14706 + }, + { + "epoch": 0.38, + "learning_rate": 1.9524034852311625e-06, + "loss": 0.9697, + "step": 14707 + }, + { + "epoch": 0.38, + "learning_rate": 1.952395049797417e-06, + "loss": 0.9209, + "step": 14708 + }, + { + "epoch": 0.38, + "learning_rate": 1.9523866136344664e-06, + "loss": 0.832, + "step": 14709 + }, + { + "epoch": 0.38, + "learning_rate": 1.952378176742317e-06, + "loss": 0.8457, + "step": 14710 + }, + { + "epoch": 0.38, + "learning_rate": 1.9523697391209755e-06, + "loss": 1.0225, + "step": 14711 + }, + { + "epoch": 0.38, + "learning_rate": 1.9523613007704484e-06, + "loss": 1.1191, + "step": 14712 + }, + { + "epoch": 0.38, + "learning_rate": 1.952352861690742e-06, + "loss": 0.9268, + "step": 14713 + }, + { + "epoch": 0.38, + "learning_rate": 1.9523444218818625e-06, + "loss": 0.7979, + "step": 14714 + }, + { + "epoch": 0.38, + "learning_rate": 1.952335981343817e-06, + "loss": 1.04, + "step": 14715 + }, + { + "epoch": 0.38, + "learning_rate": 1.952327540076612e-06, + "loss": 0.9814, + "step": 14716 + }, + { + "epoch": 0.38, + "learning_rate": 1.9523190980802525e-06, + "loss": 0.7432, + "step": 14717 + }, + { + "epoch": 0.38, + "learning_rate": 1.952310655354747e-06, + "loss": 0.665, + "step": 14718 + }, + { + "epoch": 0.38, + "learning_rate": 1.9523022119001004e-06, + "loss": 0.8975, + "step": 14719 + }, + { + "epoch": 0.38, + "learning_rate": 1.9522937677163204e-06, + "loss": 0.9707, + "step": 14720 + }, + { + "epoch": 0.38, + "learning_rate": 1.9522853228034123e-06, + "loss": 0.5, + "step": 14721 + }, + { + "epoch": 0.38, + "learning_rate": 1.9522768771613833e-06, + "loss": 0.8643, + "step": 14722 + }, + { + "epoch": 0.38, + "learning_rate": 1.9522684307902398e-06, + "loss": 0.7581, + "step": 14723 + }, + { + "epoch": 0.38, + "learning_rate": 1.952259983689988e-06, + "loss": 0.9209, + "step": 14724 + }, + { + "epoch": 0.38, + "learning_rate": 1.952251535860635e-06, + "loss": 1.0703, + "step": 14725 + }, + { + "epoch": 0.38, + "learning_rate": 1.952243087302186e-06, + "loss": 0.877, + "step": 14726 + }, + { + "epoch": 0.38, + "learning_rate": 1.952234638014649e-06, + "loss": 0.8662, + "step": 14727 + }, + { + "epoch": 0.38, + "learning_rate": 1.9522261879980292e-06, + "loss": 0.9434, + "step": 14728 + }, + { + "epoch": 0.38, + "learning_rate": 1.9522177372523336e-06, + "loss": 0.8174, + "step": 14729 + }, + { + "epoch": 0.38, + "learning_rate": 1.952209285777569e-06, + "loss": 1.0859, + "step": 14730 + }, + { + "epoch": 0.38, + "learning_rate": 1.9522008335737412e-06, + "loss": 0.9893, + "step": 14731 + }, + { + "epoch": 0.38, + "learning_rate": 1.9521923806408575e-06, + "loss": 0.8457, + "step": 14732 + }, + { + "epoch": 0.38, + "learning_rate": 1.9521839269789232e-06, + "loss": 0.8232, + "step": 14733 + }, + { + "epoch": 0.38, + "learning_rate": 1.952175472587946e-06, + "loss": 1.1807, + "step": 14734 + }, + { + "epoch": 0.38, + "learning_rate": 1.9521670174679317e-06, + "loss": 1.0039, + "step": 14735 + }, + { + "epoch": 0.38, + "learning_rate": 1.952158561618887e-06, + "loss": 0.8223, + "step": 14736 + }, + { + "epoch": 0.38, + "learning_rate": 1.952150105040818e-06, + "loss": 0.9385, + "step": 14737 + }, + { + "epoch": 0.38, + "learning_rate": 1.952141647733731e-06, + "loss": 0.8901, + "step": 14738 + }, + { + "epoch": 0.38, + "learning_rate": 1.952133189697634e-06, + "loss": 1.0342, + "step": 14739 + }, + { + "epoch": 0.38, + "learning_rate": 1.9521247309325317e-06, + "loss": 0.8789, + "step": 14740 + }, + { + "epoch": 0.38, + "learning_rate": 1.952116271438431e-06, + "loss": 0.9229, + "step": 14741 + }, + { + "epoch": 0.38, + "learning_rate": 1.9521078112153395e-06, + "loss": 0.8105, + "step": 14742 + }, + { + "epoch": 0.38, + "learning_rate": 1.9520993502632624e-06, + "loss": 0.8901, + "step": 14743 + }, + { + "epoch": 0.38, + "learning_rate": 1.9520908885822063e-06, + "loss": 0.5857, + "step": 14744 + }, + { + "epoch": 0.38, + "learning_rate": 1.9520824261721784e-06, + "loss": 0.792, + "step": 14745 + }, + { + "epoch": 0.38, + "learning_rate": 1.9520739630331846e-06, + "loss": 0.9209, + "step": 14746 + }, + { + "epoch": 0.38, + "learning_rate": 1.952065499165232e-06, + "loss": 0.8027, + "step": 14747 + }, + { + "epoch": 0.38, + "learning_rate": 1.9520570345683258e-06, + "loss": 0.7686, + "step": 14748 + }, + { + "epoch": 0.38, + "learning_rate": 1.9520485692424738e-06, + "loss": 0.7422, + "step": 14749 + }, + { + "epoch": 0.38, + "learning_rate": 1.952040103187682e-06, + "loss": 0.6636, + "step": 14750 + }, + { + "epoch": 0.38, + "learning_rate": 1.952031636403957e-06, + "loss": 0.7358, + "step": 14751 + }, + { + "epoch": 0.38, + "learning_rate": 1.9520231688913043e-06, + "loss": 0.9609, + "step": 14752 + }, + { + "epoch": 0.38, + "learning_rate": 1.952014700649732e-06, + "loss": 0.8301, + "step": 14753 + }, + { + "epoch": 0.38, + "learning_rate": 1.952006231679246e-06, + "loss": 0.8726, + "step": 14754 + }, + { + "epoch": 0.38, + "learning_rate": 1.951997761979852e-06, + "loss": 0.8906, + "step": 14755 + }, + { + "epoch": 0.38, + "learning_rate": 1.9519892915515577e-06, + "loss": 0.5164, + "step": 14756 + }, + { + "epoch": 0.38, + "learning_rate": 1.951980820394369e-06, + "loss": 0.8164, + "step": 14757 + }, + { + "epoch": 0.38, + "learning_rate": 1.9519723485082915e-06, + "loss": 0.8389, + "step": 14758 + }, + { + "epoch": 0.38, + "learning_rate": 1.951963875893333e-06, + "loss": 1.001, + "step": 14759 + }, + { + "epoch": 0.38, + "learning_rate": 1.9519554025495e-06, + "loss": 0.6865, + "step": 14760 + }, + { + "epoch": 0.38, + "learning_rate": 1.9519469284767977e-06, + "loss": 0.9414, + "step": 14761 + }, + { + "epoch": 0.38, + "learning_rate": 1.951938453675234e-06, + "loss": 0.7153, + "step": 14762 + }, + { + "epoch": 0.38, + "learning_rate": 1.9519299781448143e-06, + "loss": 0.8037, + "step": 14763 + }, + { + "epoch": 0.38, + "learning_rate": 1.951921501885546e-06, + "loss": 0.8809, + "step": 14764 + }, + { + "epoch": 0.38, + "learning_rate": 1.9519130248974353e-06, + "loss": 1.0215, + "step": 14765 + }, + { + "epoch": 0.38, + "learning_rate": 1.9519045471804883e-06, + "loss": 0.6323, + "step": 14766 + }, + { + "epoch": 0.38, + "learning_rate": 1.9518960687347118e-06, + "loss": 0.9326, + "step": 14767 + }, + { + "epoch": 0.38, + "learning_rate": 1.951887589560112e-06, + "loss": 0.792, + "step": 14768 + }, + { + "epoch": 0.38, + "learning_rate": 1.951879109656696e-06, + "loss": 1.0996, + "step": 14769 + }, + { + "epoch": 0.38, + "learning_rate": 1.95187062902447e-06, + "loss": 0.9785, + "step": 14770 + }, + { + "epoch": 0.38, + "learning_rate": 1.95186214766344e-06, + "loss": 0.9453, + "step": 14771 + }, + { + "epoch": 0.38, + "learning_rate": 1.951853665573613e-06, + "loss": 0.875, + "step": 14772 + }, + { + "epoch": 0.38, + "learning_rate": 1.951845182754996e-06, + "loss": 0.7202, + "step": 14773 + }, + { + "epoch": 0.38, + "learning_rate": 1.951836699207594e-06, + "loss": 0.8701, + "step": 14774 + }, + { + "epoch": 0.38, + "learning_rate": 1.951828214931415e-06, + "loss": 0.9082, + "step": 14775 + }, + { + "epoch": 0.38, + "learning_rate": 1.9518197299264647e-06, + "loss": 0.9141, + "step": 14776 + }, + { + "epoch": 0.38, + "learning_rate": 1.95181124419275e-06, + "loss": 0.9902, + "step": 14777 + }, + { + "epoch": 0.38, + "learning_rate": 1.9518027577302773e-06, + "loss": 0.7681, + "step": 14778 + }, + { + "epoch": 0.38, + "learning_rate": 1.951794270539053e-06, + "loss": 0.9019, + "step": 14779 + }, + { + "epoch": 0.38, + "learning_rate": 1.9517857826190832e-06, + "loss": 1.0205, + "step": 14780 + }, + { + "epoch": 0.38, + "learning_rate": 1.951777293970375e-06, + "loss": 0.7881, + "step": 14781 + }, + { + "epoch": 0.38, + "learning_rate": 1.951768804592935e-06, + "loss": 0.9238, + "step": 14782 + }, + { + "epoch": 0.38, + "learning_rate": 1.9517603144867686e-06, + "loss": 0.9775, + "step": 14783 + }, + { + "epoch": 0.38, + "learning_rate": 1.9517518236518837e-06, + "loss": 0.7222, + "step": 14784 + }, + { + "epoch": 0.38, + "learning_rate": 1.951743332088286e-06, + "loss": 0.9072, + "step": 14785 + }, + { + "epoch": 0.38, + "learning_rate": 1.9517348397959824e-06, + "loss": 0.8418, + "step": 14786 + }, + { + "epoch": 0.38, + "learning_rate": 1.9517263467749788e-06, + "loss": 0.8965, + "step": 14787 + }, + { + "epoch": 0.38, + "learning_rate": 1.9517178530252824e-06, + "loss": 0.9551, + "step": 14788 + }, + { + "epoch": 0.38, + "learning_rate": 1.9517093585468993e-06, + "loss": 0.9678, + "step": 14789 + }, + { + "epoch": 0.38, + "learning_rate": 1.951700863339836e-06, + "loss": 0.8428, + "step": 14790 + }, + { + "epoch": 0.38, + "learning_rate": 1.9516923674040993e-06, + "loss": 1.0508, + "step": 14791 + }, + { + "epoch": 0.38, + "learning_rate": 1.9516838707396953e-06, + "loss": 1.0459, + "step": 14792 + }, + { + "epoch": 0.38, + "learning_rate": 1.951675373346631e-06, + "loss": 0.9932, + "step": 14793 + }, + { + "epoch": 0.38, + "learning_rate": 1.9516668752249128e-06, + "loss": 0.8828, + "step": 14794 + }, + { + "epoch": 0.38, + "learning_rate": 1.9516583763745466e-06, + "loss": 1.0459, + "step": 14795 + }, + { + "epoch": 0.38, + "learning_rate": 1.9516498767955394e-06, + "loss": 0.7529, + "step": 14796 + }, + { + "epoch": 0.38, + "learning_rate": 1.9516413764878976e-06, + "loss": 0.8496, + "step": 14797 + }, + { + "epoch": 0.38, + "learning_rate": 1.951632875451628e-06, + "loss": 1.0498, + "step": 14798 + }, + { + "epoch": 0.38, + "learning_rate": 1.951624373686737e-06, + "loss": 0.7871, + "step": 14799 + }, + { + "epoch": 0.38, + "learning_rate": 1.9516158711932304e-06, + "loss": 0.7949, + "step": 14800 + }, + { + "epoch": 0.38, + "learning_rate": 1.951607367971116e-06, + "loss": 0.9619, + "step": 14801 + }, + { + "epoch": 0.38, + "learning_rate": 1.951598864020399e-06, + "loss": 1.1123, + "step": 14802 + }, + { + "epoch": 0.38, + "learning_rate": 1.9515903593410866e-06, + "loss": 0.9648, + "step": 14803 + }, + { + "epoch": 0.38, + "learning_rate": 1.9515818539331853e-06, + "loss": 0.9912, + "step": 14804 + }, + { + "epoch": 0.38, + "learning_rate": 1.9515733477967015e-06, + "loss": 1.0244, + "step": 14805 + }, + { + "epoch": 0.38, + "learning_rate": 1.951564840931642e-06, + "loss": 0.9312, + "step": 14806 + }, + { + "epoch": 0.38, + "learning_rate": 1.9515563333380127e-06, + "loss": 1.0938, + "step": 14807 + }, + { + "epoch": 0.38, + "learning_rate": 1.9515478250158205e-06, + "loss": 0.9277, + "step": 14808 + }, + { + "epoch": 0.38, + "learning_rate": 1.9515393159650724e-06, + "loss": 1.0, + "step": 14809 + }, + { + "epoch": 0.38, + "learning_rate": 1.9515308061857734e-06, + "loss": 0.7227, + "step": 14810 + }, + { + "epoch": 0.38, + "learning_rate": 1.9515222956779317e-06, + "loss": 0.6064, + "step": 14811 + }, + { + "epoch": 0.38, + "learning_rate": 1.951513784441553e-06, + "loss": 0.8223, + "step": 14812 + }, + { + "epoch": 0.38, + "learning_rate": 1.9515052724766444e-06, + "loss": 0.7153, + "step": 14813 + }, + { + "epoch": 0.38, + "learning_rate": 1.9514967597832116e-06, + "loss": 0.9102, + "step": 14814 + }, + { + "epoch": 0.38, + "learning_rate": 1.951488246361261e-06, + "loss": 0.647, + "step": 14815 + }, + { + "epoch": 0.38, + "learning_rate": 1.9514797322108003e-06, + "loss": 0.9629, + "step": 14816 + }, + { + "epoch": 0.38, + "learning_rate": 1.951471217331835e-06, + "loss": 0.9834, + "step": 14817 + }, + { + "epoch": 0.38, + "learning_rate": 1.951462701724372e-06, + "loss": 0.7793, + "step": 14818 + }, + { + "epoch": 0.38, + "learning_rate": 1.9514541853884176e-06, + "loss": 0.7998, + "step": 14819 + }, + { + "epoch": 0.38, + "learning_rate": 1.951445668323979e-06, + "loss": 0.7891, + "step": 14820 + }, + { + "epoch": 0.38, + "learning_rate": 1.9514371505310616e-06, + "loss": 0.9492, + "step": 14821 + }, + { + "epoch": 0.38, + "learning_rate": 1.951428632009673e-06, + "loss": 1.0, + "step": 14822 + }, + { + "epoch": 0.38, + "learning_rate": 1.951420112759819e-06, + "loss": 0.7642, + "step": 14823 + }, + { + "epoch": 0.38, + "learning_rate": 1.951411592781506e-06, + "loss": 0.9346, + "step": 14824 + }, + { + "epoch": 0.38, + "learning_rate": 1.951403072074741e-06, + "loss": 1.1318, + "step": 14825 + }, + { + "epoch": 0.38, + "learning_rate": 1.951394550639531e-06, + "loss": 1.0186, + "step": 14826 + }, + { + "epoch": 0.38, + "learning_rate": 1.9513860284758815e-06, + "loss": 0.8477, + "step": 14827 + }, + { + "epoch": 0.38, + "learning_rate": 1.9513775055837993e-06, + "loss": 1.04, + "step": 14828 + }, + { + "epoch": 0.38, + "learning_rate": 1.9513689819632917e-06, + "loss": 0.7764, + "step": 14829 + }, + { + "epoch": 0.38, + "learning_rate": 1.951360457614364e-06, + "loss": 0.8467, + "step": 14830 + }, + { + "epoch": 0.38, + "learning_rate": 1.9513519325370237e-06, + "loss": 0.7661, + "step": 14831 + }, + { + "epoch": 0.38, + "learning_rate": 1.951343406731277e-06, + "loss": 0.9346, + "step": 14832 + }, + { + "epoch": 0.38, + "learning_rate": 1.95133488019713e-06, + "loss": 0.9404, + "step": 14833 + }, + { + "epoch": 0.38, + "learning_rate": 1.95132635293459e-06, + "loss": 1.0391, + "step": 14834 + }, + { + "epoch": 0.38, + "learning_rate": 1.9513178249436634e-06, + "loss": 0.6942, + "step": 14835 + }, + { + "epoch": 0.38, + "learning_rate": 1.951309296224356e-06, + "loss": 0.8413, + "step": 14836 + }, + { + "epoch": 0.38, + "learning_rate": 1.951300766776675e-06, + "loss": 0.835, + "step": 14837 + }, + { + "epoch": 0.38, + "learning_rate": 1.9512922366006265e-06, + "loss": 0.7529, + "step": 14838 + }, + { + "epoch": 0.38, + "learning_rate": 1.951283705696218e-06, + "loss": 0.8643, + "step": 14839 + }, + { + "epoch": 0.38, + "learning_rate": 1.9512751740634544e-06, + "loss": 0.7148, + "step": 14840 + }, + { + "epoch": 0.38, + "learning_rate": 1.9512666417023435e-06, + "loss": 0.7979, + "step": 14841 + }, + { + "epoch": 0.38, + "learning_rate": 1.951258108612892e-06, + "loss": 0.9102, + "step": 14842 + }, + { + "epoch": 0.38, + "learning_rate": 1.951249574795105e-06, + "loss": 0.999, + "step": 14843 + }, + { + "epoch": 0.38, + "learning_rate": 1.9512410402489903e-06, + "loss": 0.9355, + "step": 14844 + }, + { + "epoch": 0.38, + "learning_rate": 1.951232504974554e-06, + "loss": 0.7096, + "step": 14845 + }, + { + "epoch": 0.38, + "learning_rate": 1.951223968971803e-06, + "loss": 0.8291, + "step": 14846 + }, + { + "epoch": 0.38, + "learning_rate": 1.9512154322407434e-06, + "loss": 1.043, + "step": 14847 + }, + { + "epoch": 0.38, + "learning_rate": 1.951206894781382e-06, + "loss": 1.0605, + "step": 14848 + }, + { + "epoch": 0.38, + "learning_rate": 1.951198356593725e-06, + "loss": 0.8154, + "step": 14849 + }, + { + "epoch": 0.38, + "learning_rate": 1.951189817677779e-06, + "loss": 0.7202, + "step": 14850 + }, + { + "epoch": 0.38, + "learning_rate": 1.951181278033551e-06, + "loss": 0.9512, + "step": 14851 + }, + { + "epoch": 0.38, + "learning_rate": 1.9511727376610475e-06, + "loss": 0.9102, + "step": 14852 + }, + { + "epoch": 0.38, + "learning_rate": 1.951164196560274e-06, + "loss": 0.9297, + "step": 14853 + }, + { + "epoch": 0.38, + "learning_rate": 1.9511556547312384e-06, + "loss": 0.9883, + "step": 14854 + }, + { + "epoch": 0.38, + "learning_rate": 1.9511471121739467e-06, + "loss": 1.0127, + "step": 14855 + }, + { + "epoch": 0.38, + "learning_rate": 1.951138568888405e-06, + "loss": 0.5039, + "step": 14856 + }, + { + "epoch": 0.38, + "learning_rate": 1.9511300248746207e-06, + "loss": 0.8369, + "step": 14857 + }, + { + "epoch": 0.38, + "learning_rate": 1.9511214801325994e-06, + "loss": 1.0898, + "step": 14858 + }, + { + "epoch": 0.38, + "learning_rate": 1.9511129346623484e-06, + "loss": 0.7891, + "step": 14859 + }, + { + "epoch": 0.38, + "learning_rate": 1.951104388463874e-06, + "loss": 1.1074, + "step": 14860 + }, + { + "epoch": 0.38, + "learning_rate": 1.9510958415371823e-06, + "loss": 0.8721, + "step": 14861 + }, + { + "epoch": 0.38, + "learning_rate": 1.9510872938822803e-06, + "loss": 0.7822, + "step": 14862 + }, + { + "epoch": 0.38, + "learning_rate": 1.951078745499175e-06, + "loss": 1.0723, + "step": 14863 + }, + { + "epoch": 0.38, + "learning_rate": 1.951070196387872e-06, + "loss": 0.8818, + "step": 14864 + }, + { + "epoch": 0.38, + "learning_rate": 1.9510616465483783e-06, + "loss": 0.7783, + "step": 14865 + }, + { + "epoch": 0.38, + "learning_rate": 1.9510530959807007e-06, + "loss": 1.0938, + "step": 14866 + }, + { + "epoch": 0.38, + "learning_rate": 1.9510445446848455e-06, + "loss": 1.002, + "step": 14867 + }, + { + "epoch": 0.38, + "learning_rate": 1.951035992660819e-06, + "loss": 0.9258, + "step": 14868 + }, + { + "epoch": 0.38, + "learning_rate": 1.951027439908628e-06, + "loss": 0.8535, + "step": 14869 + }, + { + "epoch": 0.38, + "learning_rate": 1.951018886428279e-06, + "loss": 0.9111, + "step": 14870 + }, + { + "epoch": 0.38, + "learning_rate": 1.951010332219778e-06, + "loss": 0.9326, + "step": 14871 + }, + { + "epoch": 0.38, + "learning_rate": 1.9510017772831335e-06, + "loss": 1.04, + "step": 14872 + }, + { + "epoch": 0.38, + "learning_rate": 1.9509932216183496e-06, + "loss": 0.9941, + "step": 14873 + }, + { + "epoch": 0.38, + "learning_rate": 1.9509846652254342e-06, + "loss": 0.8701, + "step": 14874 + }, + { + "epoch": 0.38, + "learning_rate": 1.9509761081043936e-06, + "loss": 0.9043, + "step": 14875 + }, + { + "epoch": 0.38, + "learning_rate": 1.950967550255234e-06, + "loss": 0.9844, + "step": 14876 + }, + { + "epoch": 0.38, + "learning_rate": 1.950958991677963e-06, + "loss": 0.833, + "step": 14877 + }, + { + "epoch": 0.38, + "learning_rate": 1.950950432372586e-06, + "loss": 0.9072, + "step": 14878 + }, + { + "epoch": 0.38, + "learning_rate": 1.95094187233911e-06, + "loss": 1.0713, + "step": 14879 + }, + { + "epoch": 0.38, + "learning_rate": 1.9509333115775414e-06, + "loss": 0.9326, + "step": 14880 + }, + { + "epoch": 0.38, + "learning_rate": 1.950924750087887e-06, + "loss": 1.1201, + "step": 14881 + }, + { + "epoch": 0.38, + "learning_rate": 1.9509161878701533e-06, + "loss": 0.8672, + "step": 14882 + }, + { + "epoch": 0.38, + "learning_rate": 1.9509076249243467e-06, + "loss": 0.7246, + "step": 14883 + }, + { + "epoch": 0.38, + "learning_rate": 1.9508990612504737e-06, + "loss": 1.0107, + "step": 14884 + }, + { + "epoch": 0.38, + "learning_rate": 1.950890496848541e-06, + "loss": 0.8438, + "step": 14885 + }, + { + "epoch": 0.38, + "learning_rate": 1.950881931718556e-06, + "loss": 1.0332, + "step": 14886 + }, + { + "epoch": 0.38, + "learning_rate": 1.9508733658605237e-06, + "loss": 0.9854, + "step": 14887 + }, + { + "epoch": 0.38, + "learning_rate": 1.9508647992744515e-06, + "loss": 0.7495, + "step": 14888 + }, + { + "epoch": 0.38, + "learning_rate": 1.9508562319603456e-06, + "loss": 0.9805, + "step": 14889 + }, + { + "epoch": 0.38, + "learning_rate": 1.950847663918213e-06, + "loss": 1.1348, + "step": 14890 + }, + { + "epoch": 0.38, + "learning_rate": 1.95083909514806e-06, + "loss": 1.0352, + "step": 14891 + }, + { + "epoch": 0.38, + "learning_rate": 1.9508305256498938e-06, + "loss": 1.1123, + "step": 14892 + }, + { + "epoch": 0.38, + "learning_rate": 1.95082195542372e-06, + "loss": 0.8086, + "step": 14893 + }, + { + "epoch": 0.38, + "learning_rate": 1.950813384469545e-06, + "loss": 0.957, + "step": 14894 + }, + { + "epoch": 0.38, + "learning_rate": 1.9508048127873765e-06, + "loss": 0.998, + "step": 14895 + }, + { + "epoch": 0.38, + "learning_rate": 1.9507962403772206e-06, + "loss": 0.8604, + "step": 14896 + }, + { + "epoch": 0.38, + "learning_rate": 1.9507876672390834e-06, + "loss": 0.668, + "step": 14897 + }, + { + "epoch": 0.38, + "learning_rate": 1.950779093372972e-06, + "loss": 0.9404, + "step": 14898 + }, + { + "epoch": 0.38, + "learning_rate": 1.9507705187788926e-06, + "loss": 0.7058, + "step": 14899 + }, + { + "epoch": 0.38, + "learning_rate": 1.950761943456852e-06, + "loss": 0.916, + "step": 14900 + }, + { + "epoch": 0.38, + "learning_rate": 1.9507533674068566e-06, + "loss": 0.916, + "step": 14901 + }, + { + "epoch": 0.38, + "learning_rate": 1.9507447906289134e-06, + "loss": 0.9707, + "step": 14902 + }, + { + "epoch": 0.38, + "learning_rate": 1.950736213123028e-06, + "loss": 0.9092, + "step": 14903 + }, + { + "epoch": 0.38, + "learning_rate": 1.9507276348892083e-06, + "loss": 1.0098, + "step": 14904 + }, + { + "epoch": 0.38, + "learning_rate": 1.9507190559274596e-06, + "loss": 0.6934, + "step": 14905 + }, + { + "epoch": 0.38, + "learning_rate": 1.9507104762377894e-06, + "loss": 0.9697, + "step": 14906 + }, + { + "epoch": 0.38, + "learning_rate": 1.9507018958202036e-06, + "loss": 0.9365, + "step": 14907 + }, + { + "epoch": 0.38, + "learning_rate": 1.9506933146747095e-06, + "loss": 0.9932, + "step": 14908 + }, + { + "epoch": 0.38, + "learning_rate": 1.9506847328013126e-06, + "loss": 0.792, + "step": 14909 + }, + { + "epoch": 0.38, + "learning_rate": 1.950676150200021e-06, + "loss": 1.0039, + "step": 14910 + }, + { + "epoch": 0.38, + "learning_rate": 1.9506675668708398e-06, + "loss": 0.7622, + "step": 14911 + }, + { + "epoch": 0.38, + "learning_rate": 1.950658982813776e-06, + "loss": 0.7446, + "step": 14912 + }, + { + "epoch": 0.38, + "learning_rate": 1.950650398028837e-06, + "loss": 0.854, + "step": 14913 + }, + { + "epoch": 0.38, + "learning_rate": 1.950641812516028e-06, + "loss": 1.0361, + "step": 14914 + }, + { + "epoch": 0.38, + "learning_rate": 1.9506332262753565e-06, + "loss": 0.9287, + "step": 14915 + }, + { + "epoch": 0.38, + "learning_rate": 1.950624639306829e-06, + "loss": 0.7578, + "step": 14916 + }, + { + "epoch": 0.38, + "learning_rate": 1.950616051610452e-06, + "loss": 0.6323, + "step": 14917 + }, + { + "epoch": 0.38, + "learning_rate": 1.9506074631862317e-06, + "loss": 0.9277, + "step": 14918 + }, + { + "epoch": 0.38, + "learning_rate": 1.950598874034175e-06, + "loss": 1.0391, + "step": 14919 + }, + { + "epoch": 0.38, + "learning_rate": 1.9505902841542887e-06, + "loss": 0.8462, + "step": 14920 + }, + { + "epoch": 0.38, + "learning_rate": 1.950581693546579e-06, + "loss": 0.7578, + "step": 14921 + }, + { + "epoch": 0.38, + "learning_rate": 1.9505731022110523e-06, + "loss": 0.8525, + "step": 14922 + }, + { + "epoch": 0.38, + "learning_rate": 1.950564510147716e-06, + "loss": 0.9971, + "step": 14923 + }, + { + "epoch": 0.38, + "learning_rate": 1.950555917356576e-06, + "loss": 0.7471, + "step": 14924 + }, + { + "epoch": 0.38, + "learning_rate": 1.950547323837639e-06, + "loss": 0.9346, + "step": 14925 + }, + { + "epoch": 0.38, + "learning_rate": 1.9505387295909113e-06, + "loss": 0.9111, + "step": 14926 + }, + { + "epoch": 0.38, + "learning_rate": 1.9505301346164003e-06, + "loss": 1.168, + "step": 14927 + }, + { + "epoch": 0.38, + "learning_rate": 1.950521538914112e-06, + "loss": 0.7529, + "step": 14928 + }, + { + "epoch": 0.38, + "learning_rate": 1.9505129424840526e-06, + "loss": 0.9746, + "step": 14929 + }, + { + "epoch": 0.38, + "learning_rate": 1.95050434532623e-06, + "loss": 0.75, + "step": 14930 + }, + { + "epoch": 0.38, + "learning_rate": 1.950495747440649e-06, + "loss": 0.9414, + "step": 14931 + }, + { + "epoch": 0.38, + "learning_rate": 1.9504871488273176e-06, + "loss": 1.0391, + "step": 14932 + }, + { + "epoch": 0.38, + "learning_rate": 1.950478549486242e-06, + "loss": 0.8262, + "step": 14933 + }, + { + "epoch": 0.38, + "learning_rate": 1.950469949417429e-06, + "loss": 0.8516, + "step": 14934 + }, + { + "epoch": 0.38, + "learning_rate": 1.950461348620884e-06, + "loss": 0.8613, + "step": 14935 + }, + { + "epoch": 0.38, + "learning_rate": 1.9504527470966147e-06, + "loss": 0.813, + "step": 14936 + }, + { + "epoch": 0.38, + "learning_rate": 1.9504441448446274e-06, + "loss": 0.9863, + "step": 14937 + }, + { + "epoch": 0.38, + "learning_rate": 1.950435541864929e-06, + "loss": 0.8389, + "step": 14938 + }, + { + "epoch": 0.38, + "learning_rate": 1.9504269381575258e-06, + "loss": 0.8081, + "step": 14939 + }, + { + "epoch": 0.38, + "learning_rate": 1.950418333722424e-06, + "loss": 0.7905, + "step": 14940 + }, + { + "epoch": 0.38, + "learning_rate": 1.950409728559631e-06, + "loss": 0.8086, + "step": 14941 + }, + { + "epoch": 0.38, + "learning_rate": 1.9504011226691527e-06, + "loss": 0.873, + "step": 14942 + }, + { + "epoch": 0.38, + "learning_rate": 1.9503925160509964e-06, + "loss": 1.0518, + "step": 14943 + }, + { + "epoch": 0.38, + "learning_rate": 1.9503839087051677e-06, + "loss": 0.9043, + "step": 14944 + }, + { + "epoch": 0.38, + "learning_rate": 1.950375300631674e-06, + "loss": 0.9844, + "step": 14945 + }, + { + "epoch": 0.38, + "learning_rate": 1.9503666918305217e-06, + "loss": 0.6616, + "step": 14946 + }, + { + "epoch": 0.38, + "learning_rate": 1.9503580823017176e-06, + "loss": 0.7207, + "step": 14947 + }, + { + "epoch": 0.38, + "learning_rate": 1.9503494720452672e-06, + "loss": 0.8428, + "step": 14948 + }, + { + "epoch": 0.38, + "learning_rate": 1.9503408610611783e-06, + "loss": 0.7021, + "step": 14949 + }, + { + "epoch": 0.38, + "learning_rate": 1.9503322493494576e-06, + "loss": 1.0117, + "step": 14950 + }, + { + "epoch": 0.38, + "learning_rate": 1.9503236369101106e-06, + "loss": 0.7461, + "step": 14951 + }, + { + "epoch": 0.38, + "learning_rate": 1.9503150237431445e-06, + "loss": 1.1777, + "step": 14952 + }, + { + "epoch": 0.38, + "learning_rate": 1.950306409848566e-06, + "loss": 0.8135, + "step": 14953 + }, + { + "epoch": 0.38, + "learning_rate": 1.9502977952263818e-06, + "loss": 0.8525, + "step": 14954 + }, + { + "epoch": 0.38, + "learning_rate": 1.9502891798765982e-06, + "loss": 1.0781, + "step": 14955 + }, + { + "epoch": 0.38, + "learning_rate": 1.950280563799222e-06, + "loss": 0.8242, + "step": 14956 + }, + { + "epoch": 0.38, + "learning_rate": 1.950271946994259e-06, + "loss": 0.8447, + "step": 14957 + }, + { + "epoch": 0.38, + "learning_rate": 1.950263329461717e-06, + "loss": 0.7969, + "step": 14958 + }, + { + "epoch": 0.38, + "learning_rate": 1.950254711201602e-06, + "loss": 1.1465, + "step": 14959 + }, + { + "epoch": 0.38, + "learning_rate": 1.9502460922139206e-06, + "loss": 1.001, + "step": 14960 + }, + { + "epoch": 0.38, + "learning_rate": 1.9502374724986796e-06, + "loss": 1.0371, + "step": 14961 + }, + { + "epoch": 0.38, + "learning_rate": 1.950228852055885e-06, + "loss": 0.8096, + "step": 14962 + }, + { + "epoch": 0.38, + "learning_rate": 1.950220230885544e-06, + "loss": 0.8936, + "step": 14963 + }, + { + "epoch": 0.38, + "learning_rate": 1.950211608987664e-06, + "loss": 0.6895, + "step": 14964 + }, + { + "epoch": 0.38, + "learning_rate": 1.9502029863622497e-06, + "loss": 0.6921, + "step": 14965 + }, + { + "epoch": 0.38, + "learning_rate": 1.950194363009309e-06, + "loss": 0.9307, + "step": 14966 + }, + { + "epoch": 0.38, + "learning_rate": 1.9501857389288476e-06, + "loss": 0.8906, + "step": 14967 + }, + { + "epoch": 0.38, + "learning_rate": 1.950177114120873e-06, + "loss": 0.8232, + "step": 14968 + }, + { + "epoch": 0.38, + "learning_rate": 1.9501684885853917e-06, + "loss": 0.7705, + "step": 14969 + }, + { + "epoch": 0.38, + "learning_rate": 1.9501598623224102e-06, + "loss": 0.8774, + "step": 14970 + }, + { + "epoch": 0.38, + "learning_rate": 1.9501512353319346e-06, + "loss": 0.665, + "step": 14971 + }, + { + "epoch": 0.38, + "learning_rate": 1.950142607613972e-06, + "loss": 1.0752, + "step": 14972 + }, + { + "epoch": 0.38, + "learning_rate": 1.950133979168529e-06, + "loss": 0.8125, + "step": 14973 + }, + { + "epoch": 0.38, + "learning_rate": 1.9501253499956124e-06, + "loss": 1.0879, + "step": 14974 + }, + { + "epoch": 0.38, + "learning_rate": 1.950116720095228e-06, + "loss": 0.8892, + "step": 14975 + }, + { + "epoch": 0.38, + "learning_rate": 1.950108089467383e-06, + "loss": 0.9531, + "step": 14976 + }, + { + "epoch": 0.38, + "learning_rate": 1.950099458112084e-06, + "loss": 0.7651, + "step": 14977 + }, + { + "epoch": 0.38, + "learning_rate": 1.9500908260293376e-06, + "loss": 1.1084, + "step": 14978 + }, + { + "epoch": 0.38, + "learning_rate": 1.95008219321915e-06, + "loss": 0.9209, + "step": 14979 + }, + { + "epoch": 0.38, + "learning_rate": 1.9500735596815287e-06, + "loss": 0.8896, + "step": 14980 + }, + { + "epoch": 0.38, + "learning_rate": 1.9500649254164792e-06, + "loss": 0.5532, + "step": 14981 + }, + { + "epoch": 0.38, + "learning_rate": 1.950056290424009e-06, + "loss": 0.7515, + "step": 14982 + }, + { + "epoch": 0.38, + "learning_rate": 1.9500476547041243e-06, + "loss": 0.792, + "step": 14983 + }, + { + "epoch": 0.38, + "learning_rate": 1.9500390182568317e-06, + "loss": 0.8574, + "step": 14984 + }, + { + "epoch": 0.38, + "learning_rate": 1.950030381082138e-06, + "loss": 0.9902, + "step": 14985 + }, + { + "epoch": 0.38, + "learning_rate": 1.9500217431800497e-06, + "loss": 0.7969, + "step": 14986 + }, + { + "epoch": 0.38, + "learning_rate": 1.9500131045505736e-06, + "loss": 1.1299, + "step": 14987 + }, + { + "epoch": 0.38, + "learning_rate": 1.9500044651937164e-06, + "loss": 0.8223, + "step": 14988 + }, + { + "epoch": 0.38, + "learning_rate": 1.949995825109484e-06, + "loss": 0.8398, + "step": 14989 + }, + { + "epoch": 0.38, + "learning_rate": 1.9499871842978833e-06, + "loss": 0.9766, + "step": 14990 + }, + { + "epoch": 0.38, + "learning_rate": 1.9499785427589215e-06, + "loss": 0.8975, + "step": 14991 + }, + { + "epoch": 0.38, + "learning_rate": 1.9499699004926048e-06, + "loss": 0.7871, + "step": 14992 + }, + { + "epoch": 0.38, + "learning_rate": 1.9499612574989396e-06, + "loss": 0.8857, + "step": 14993 + }, + { + "epoch": 0.38, + "learning_rate": 1.9499526137779328e-06, + "loss": 0.6968, + "step": 14994 + }, + { + "epoch": 0.38, + "learning_rate": 1.949943969329591e-06, + "loss": 0.9951, + "step": 14995 + }, + { + "epoch": 0.38, + "learning_rate": 1.949935324153921e-06, + "loss": 0.9111, + "step": 14996 + }, + { + "epoch": 0.38, + "learning_rate": 1.9499266782509286e-06, + "loss": 0.9482, + "step": 14997 + }, + { + "epoch": 0.38, + "learning_rate": 1.949918031620622e-06, + "loss": 0.7896, + "step": 14998 + }, + { + "epoch": 0.38, + "learning_rate": 1.949909384263006e-06, + "loss": 1.0625, + "step": 14999 + }, + { + "epoch": 0.38, + "learning_rate": 1.949900736178088e-06, + "loss": 0.6641, + "step": 15000 + }, + { + "epoch": 0.38, + "learning_rate": 1.9498920873658754e-06, + "loss": 0.7715, + "step": 15001 + }, + { + "epoch": 0.38, + "learning_rate": 1.9498834378263735e-06, + "loss": 0.9194, + "step": 15002 + }, + { + "epoch": 0.38, + "learning_rate": 1.9498747875595896e-06, + "loss": 0.959, + "step": 15003 + }, + { + "epoch": 0.38, + "learning_rate": 1.9498661365655306e-06, + "loss": 0.8848, + "step": 15004 + }, + { + "epoch": 0.38, + "learning_rate": 1.9498574848442027e-06, + "loss": 0.876, + "step": 15005 + }, + { + "epoch": 0.38, + "learning_rate": 1.9498488323956123e-06, + "loss": 0.8379, + "step": 15006 + }, + { + "epoch": 0.38, + "learning_rate": 1.9498401792197666e-06, + "loss": 0.9629, + "step": 15007 + }, + { + "epoch": 0.38, + "learning_rate": 1.949831525316672e-06, + "loss": 0.8789, + "step": 15008 + }, + { + "epoch": 0.38, + "learning_rate": 1.949822870686335e-06, + "loss": 0.96, + "step": 15009 + }, + { + "epoch": 0.38, + "learning_rate": 1.949814215328762e-06, + "loss": 1.0303, + "step": 15010 + }, + { + "epoch": 0.38, + "learning_rate": 1.9498055592439598e-06, + "loss": 1.0127, + "step": 15011 + }, + { + "epoch": 0.38, + "learning_rate": 1.949796902431936e-06, + "loss": 1.04, + "step": 15012 + }, + { + "epoch": 0.38, + "learning_rate": 1.9497882448926957e-06, + "loss": 0.7842, + "step": 15013 + }, + { + "epoch": 0.38, + "learning_rate": 1.9497795866262464e-06, + "loss": 1.0, + "step": 15014 + }, + { + "epoch": 0.38, + "learning_rate": 1.9497709276325947e-06, + "loss": 0.6388, + "step": 15015 + }, + { + "epoch": 0.38, + "learning_rate": 1.9497622679117467e-06, + "loss": 1.0127, + "step": 15016 + }, + { + "epoch": 0.38, + "learning_rate": 1.9497536074637098e-06, + "loss": 0.7578, + "step": 15017 + }, + { + "epoch": 0.38, + "learning_rate": 1.94974494628849e-06, + "loss": 0.834, + "step": 15018 + }, + { + "epoch": 0.38, + "learning_rate": 1.949736284386094e-06, + "loss": 1.0869, + "step": 15019 + }, + { + "epoch": 0.38, + "learning_rate": 1.949727621756529e-06, + "loss": 1.0049, + "step": 15020 + }, + { + "epoch": 0.38, + "learning_rate": 1.949718958399801e-06, + "loss": 0.9844, + "step": 15021 + }, + { + "epoch": 0.39, + "learning_rate": 1.949710294315917e-06, + "loss": 0.8174, + "step": 15022 + }, + { + "epoch": 0.39, + "learning_rate": 1.9497016295048833e-06, + "loss": 1.0859, + "step": 15023 + }, + { + "epoch": 0.39, + "learning_rate": 1.949692963966707e-06, + "loss": 0.9297, + "step": 15024 + }, + { + "epoch": 0.39, + "learning_rate": 1.949684297701394e-06, + "loss": 0.9717, + "step": 15025 + }, + { + "epoch": 0.39, + "learning_rate": 1.949675630708952e-06, + "loss": 0.9932, + "step": 15026 + }, + { + "epoch": 0.39, + "learning_rate": 1.9496669629893865e-06, + "loss": 0.7422, + "step": 15027 + }, + { + "epoch": 0.39, + "learning_rate": 1.9496582945427053e-06, + "loss": 0.8008, + "step": 15028 + }, + { + "epoch": 0.39, + "learning_rate": 1.949649625368914e-06, + "loss": 0.6816, + "step": 15029 + }, + { + "epoch": 0.39, + "learning_rate": 1.949640955468019e-06, + "loss": 1.1562, + "step": 15030 + }, + { + "epoch": 0.39, + "learning_rate": 1.9496322848400286e-06, + "loss": 0.665, + "step": 15031 + }, + { + "epoch": 0.39, + "learning_rate": 1.9496236134849483e-06, + "loss": 0.96, + "step": 15032 + }, + { + "epoch": 0.39, + "learning_rate": 1.9496149414027843e-06, + "loss": 0.752, + "step": 15033 + }, + { + "epoch": 0.39, + "learning_rate": 1.9496062685935446e-06, + "loss": 0.7603, + "step": 15034 + }, + { + "epoch": 0.39, + "learning_rate": 1.9495975950572342e-06, + "loss": 1.0352, + "step": 15035 + }, + { + "epoch": 0.39, + "learning_rate": 1.9495889207938613e-06, + "loss": 0.9043, + "step": 15036 + }, + { + "epoch": 0.39, + "learning_rate": 1.9495802458034312e-06, + "loss": 1.1465, + "step": 15037 + }, + { + "epoch": 0.39, + "learning_rate": 1.9495715700859518e-06, + "loss": 0.9727, + "step": 15038 + }, + { + "epoch": 0.39, + "learning_rate": 1.9495628936414287e-06, + "loss": 0.8008, + "step": 15039 + }, + { + "epoch": 0.39, + "learning_rate": 1.949554216469869e-06, + "loss": 0.8799, + "step": 15040 + }, + { + "epoch": 0.39, + "learning_rate": 1.949545538571279e-06, + "loss": 1.0703, + "step": 15041 + }, + { + "epoch": 0.39, + "learning_rate": 1.9495368599456662e-06, + "loss": 0.8887, + "step": 15042 + }, + { + "epoch": 0.39, + "learning_rate": 1.9495281805930364e-06, + "loss": 0.8223, + "step": 15043 + }, + { + "epoch": 0.39, + "learning_rate": 1.949519500513397e-06, + "loss": 0.8574, + "step": 15044 + }, + { + "epoch": 0.39, + "learning_rate": 1.9495108197067534e-06, + "loss": 1.1406, + "step": 15045 + }, + { + "epoch": 0.39, + "learning_rate": 1.9495021381731137e-06, + "loss": 0.9316, + "step": 15046 + }, + { + "epoch": 0.39, + "learning_rate": 1.9494934559124834e-06, + "loss": 0.9688, + "step": 15047 + }, + { + "epoch": 0.39, + "learning_rate": 1.9494847729248697e-06, + "loss": 0.9404, + "step": 15048 + }, + { + "epoch": 0.39, + "learning_rate": 1.9494760892102794e-06, + "loss": 0.957, + "step": 15049 + }, + { + "epoch": 0.39, + "learning_rate": 1.949467404768719e-06, + "loss": 0.7949, + "step": 15050 + }, + { + "epoch": 0.39, + "learning_rate": 1.9494587196001944e-06, + "loss": 0.8506, + "step": 15051 + }, + { + "epoch": 0.39, + "learning_rate": 1.9494500337047137e-06, + "loss": 0.7251, + "step": 15052 + }, + { + "epoch": 0.39, + "learning_rate": 1.9494413470822826e-06, + "loss": 0.9297, + "step": 15053 + }, + { + "epoch": 0.39, + "learning_rate": 1.9494326597329075e-06, + "loss": 0.9932, + "step": 15054 + }, + { + "epoch": 0.39, + "learning_rate": 1.9494239716565955e-06, + "loss": 0.8994, + "step": 15055 + }, + { + "epoch": 0.39, + "learning_rate": 1.9494152828533536e-06, + "loss": 0.8779, + "step": 15056 + }, + { + "epoch": 0.39, + "learning_rate": 1.949406593323188e-06, + "loss": 0.6516, + "step": 15057 + }, + { + "epoch": 0.39, + "learning_rate": 1.949397903066105e-06, + "loss": 0.9395, + "step": 15058 + }, + { + "epoch": 0.39, + "learning_rate": 1.9493892120821124e-06, + "loss": 0.7803, + "step": 15059 + }, + { + "epoch": 0.39, + "learning_rate": 1.9493805203712156e-06, + "loss": 0.9971, + "step": 15060 + }, + { + "epoch": 0.39, + "learning_rate": 1.9493718279334217e-06, + "loss": 0.9111, + "step": 15061 + }, + { + "epoch": 0.39, + "learning_rate": 1.9493631347687377e-06, + "loss": 0.8701, + "step": 15062 + }, + { + "epoch": 0.39, + "learning_rate": 1.94935444087717e-06, + "loss": 1.1641, + "step": 15063 + }, + { + "epoch": 0.39, + "learning_rate": 1.9493457462587256e-06, + "loss": 0.834, + "step": 15064 + }, + { + "epoch": 0.39, + "learning_rate": 1.9493370509134103e-06, + "loss": 0.9121, + "step": 15065 + }, + { + "epoch": 0.39, + "learning_rate": 1.9493283548412315e-06, + "loss": 0.9409, + "step": 15066 + }, + { + "epoch": 0.39, + "learning_rate": 1.9493196580421954e-06, + "loss": 0.833, + "step": 15067 + }, + { + "epoch": 0.39, + "learning_rate": 1.949310960516309e-06, + "loss": 0.8857, + "step": 15068 + }, + { + "epoch": 0.39, + "learning_rate": 1.949302262263579e-06, + "loss": 0.957, + "step": 15069 + }, + { + "epoch": 0.39, + "learning_rate": 1.9492935632840116e-06, + "loss": 0.9355, + "step": 15070 + }, + { + "epoch": 0.39, + "learning_rate": 1.949284863577614e-06, + "loss": 0.7227, + "step": 15071 + }, + { + "epoch": 0.39, + "learning_rate": 1.9492761631443926e-06, + "loss": 0.9551, + "step": 15072 + }, + { + "epoch": 0.39, + "learning_rate": 1.9492674619843545e-06, + "loss": 0.8242, + "step": 15073 + }, + { + "epoch": 0.39, + "learning_rate": 1.9492587600975054e-06, + "loss": 0.8606, + "step": 15074 + }, + { + "epoch": 0.39, + "learning_rate": 1.9492500574838524e-06, + "loss": 0.7559, + "step": 15075 + }, + { + "epoch": 0.39, + "learning_rate": 1.949241354143403e-06, + "loss": 0.6704, + "step": 15076 + }, + { + "epoch": 0.39, + "learning_rate": 1.9492326500761626e-06, + "loss": 1.0264, + "step": 15077 + }, + { + "epoch": 0.39, + "learning_rate": 1.949223945282138e-06, + "loss": 0.8643, + "step": 15078 + }, + { + "epoch": 0.39, + "learning_rate": 1.949215239761337e-06, + "loss": 0.8291, + "step": 15079 + }, + { + "epoch": 0.39, + "learning_rate": 1.9492065335137655e-06, + "loss": 0.8052, + "step": 15080 + }, + { + "epoch": 0.39, + "learning_rate": 1.94919782653943e-06, + "loss": 0.9727, + "step": 15081 + }, + { + "epoch": 0.39, + "learning_rate": 1.9491891188383373e-06, + "loss": 0.9473, + "step": 15082 + }, + { + "epoch": 0.39, + "learning_rate": 1.949180410410494e-06, + "loss": 1.0566, + "step": 15083 + }, + { + "epoch": 0.39, + "learning_rate": 1.9491717012559073e-06, + "loss": 0.731, + "step": 15084 + }, + { + "epoch": 0.39, + "learning_rate": 1.949162991374583e-06, + "loss": 0.7068, + "step": 15085 + }, + { + "epoch": 0.39, + "learning_rate": 1.9491542807665285e-06, + "loss": 0.8555, + "step": 15086 + }, + { + "epoch": 0.39, + "learning_rate": 1.9491455694317506e-06, + "loss": 1.0195, + "step": 15087 + }, + { + "epoch": 0.39, + "learning_rate": 1.949136857370255e-06, + "loss": 1.0439, + "step": 15088 + }, + { + "epoch": 0.39, + "learning_rate": 1.9491281445820494e-06, + "loss": 0.8008, + "step": 15089 + }, + { + "epoch": 0.39, + "learning_rate": 1.9491194310671396e-06, + "loss": 0.7739, + "step": 15090 + }, + { + "epoch": 0.39, + "learning_rate": 1.9491107168255327e-06, + "loss": 0.7041, + "step": 15091 + }, + { + "epoch": 0.39, + "learning_rate": 1.9491020018572355e-06, + "loss": 0.9131, + "step": 15092 + }, + { + "epoch": 0.39, + "learning_rate": 1.9490932861622548e-06, + "loss": 1.0664, + "step": 15093 + }, + { + "epoch": 0.39, + "learning_rate": 1.949084569740597e-06, + "loss": 0.8086, + "step": 15094 + }, + { + "epoch": 0.39, + "learning_rate": 1.9490758525922685e-06, + "loss": 0.833, + "step": 15095 + }, + { + "epoch": 0.39, + "learning_rate": 1.949067134717276e-06, + "loss": 1.1113, + "step": 15096 + }, + { + "epoch": 0.39, + "learning_rate": 1.949058416115627e-06, + "loss": 0.7432, + "step": 15097 + }, + { + "epoch": 0.39, + "learning_rate": 1.9490496967873275e-06, + "loss": 0.9277, + "step": 15098 + }, + { + "epoch": 0.39, + "learning_rate": 1.949040976732384e-06, + "loss": 0.9102, + "step": 15099 + }, + { + "epoch": 0.39, + "learning_rate": 1.9490322559508035e-06, + "loss": 0.9512, + "step": 15100 + }, + { + "epoch": 0.39, + "learning_rate": 1.949023534442593e-06, + "loss": 0.9932, + "step": 15101 + }, + { + "epoch": 0.39, + "learning_rate": 1.9490148122077584e-06, + "loss": 0.834, + "step": 15102 + }, + { + "epoch": 0.39, + "learning_rate": 1.949006089246307e-06, + "loss": 0.998, + "step": 15103 + }, + { + "epoch": 0.39, + "learning_rate": 1.948997365558245e-06, + "loss": 0.7744, + "step": 15104 + }, + { + "epoch": 0.39, + "learning_rate": 1.94898864114358e-06, + "loss": 0.8975, + "step": 15105 + }, + { + "epoch": 0.39, + "learning_rate": 1.9489799160023174e-06, + "loss": 0.731, + "step": 15106 + }, + { + "epoch": 0.39, + "learning_rate": 1.948971190134465e-06, + "loss": 0.9805, + "step": 15107 + }, + { + "epoch": 0.39, + "learning_rate": 1.9489624635400286e-06, + "loss": 1.043, + "step": 15108 + }, + { + "epoch": 0.39, + "learning_rate": 1.9489537362190154e-06, + "loss": 0.9941, + "step": 15109 + }, + { + "epoch": 0.39, + "learning_rate": 1.948945008171432e-06, + "loss": 0.8662, + "step": 15110 + }, + { + "epoch": 0.39, + "learning_rate": 1.948936279397285e-06, + "loss": 0.8994, + "step": 15111 + }, + { + "epoch": 0.39, + "learning_rate": 1.9489275498965814e-06, + "loss": 0.5786, + "step": 15112 + }, + { + "epoch": 0.39, + "learning_rate": 1.9489188196693274e-06, + "loss": 0.7783, + "step": 15113 + }, + { + "epoch": 0.39, + "learning_rate": 1.9489100887155297e-06, + "loss": 0.9814, + "step": 15114 + }, + { + "epoch": 0.39, + "learning_rate": 1.9489013570351953e-06, + "loss": 0.9238, + "step": 15115 + }, + { + "epoch": 0.39, + "learning_rate": 1.9488926246283308e-06, + "loss": 1.002, + "step": 15116 + }, + { + "epoch": 0.39, + "learning_rate": 1.9488838914949427e-06, + "loss": 1.0039, + "step": 15117 + }, + { + "epoch": 0.39, + "learning_rate": 1.948875157635038e-06, + "loss": 0.8066, + "step": 15118 + }, + { + "epoch": 0.39, + "learning_rate": 1.9488664230486235e-06, + "loss": 0.8621, + "step": 15119 + }, + { + "epoch": 0.39, + "learning_rate": 1.948857687735705e-06, + "loss": 1.1016, + "step": 15120 + }, + { + "epoch": 0.39, + "learning_rate": 1.94884895169629e-06, + "loss": 0.8721, + "step": 15121 + }, + { + "epoch": 0.39, + "learning_rate": 1.9488402149303855e-06, + "loss": 0.9863, + "step": 15122 + }, + { + "epoch": 0.39, + "learning_rate": 1.948831477437997e-06, + "loss": 0.793, + "step": 15123 + }, + { + "epoch": 0.39, + "learning_rate": 1.948822739219132e-06, + "loss": 0.9375, + "step": 15124 + }, + { + "epoch": 0.39, + "learning_rate": 1.9488140002737973e-06, + "loss": 0.6099, + "step": 15125 + }, + { + "epoch": 0.39, + "learning_rate": 1.948805260601999e-06, + "loss": 1.041, + "step": 15126 + }, + { + "epoch": 0.39, + "learning_rate": 1.948796520203745e-06, + "loss": 0.9062, + "step": 15127 + }, + { + "epoch": 0.39, + "learning_rate": 1.94878777907904e-06, + "loss": 1.0107, + "step": 15128 + }, + { + "epoch": 0.39, + "learning_rate": 1.9487790372278925e-06, + "loss": 0.6575, + "step": 15129 + }, + { + "epoch": 0.39, + "learning_rate": 1.948770294650308e-06, + "loss": 0.7402, + "step": 15130 + }, + { + "epoch": 0.39, + "learning_rate": 1.9487615513462944e-06, + "loss": 0.9307, + "step": 15131 + }, + { + "epoch": 0.39, + "learning_rate": 1.9487528073158576e-06, + "loss": 0.6731, + "step": 15132 + }, + { + "epoch": 0.39, + "learning_rate": 1.948744062559004e-06, + "loss": 0.7405, + "step": 15133 + }, + { + "epoch": 0.39, + "learning_rate": 1.9487353170757406e-06, + "loss": 1.0537, + "step": 15134 + }, + { + "epoch": 0.39, + "learning_rate": 1.9487265708660744e-06, + "loss": 1.0332, + "step": 15135 + }, + { + "epoch": 0.39, + "learning_rate": 1.948717823930012e-06, + "loss": 0.9238, + "step": 15136 + }, + { + "epoch": 0.39, + "learning_rate": 1.9487090762675603e-06, + "loss": 0.959, + "step": 15137 + }, + { + "epoch": 0.39, + "learning_rate": 1.948700327878725e-06, + "loss": 0.6528, + "step": 15138 + }, + { + "epoch": 0.39, + "learning_rate": 1.948691578763514e-06, + "loss": 0.7705, + "step": 15139 + }, + { + "epoch": 0.39, + "learning_rate": 1.948682828921933e-06, + "loss": 1.1992, + "step": 15140 + }, + { + "epoch": 0.39, + "learning_rate": 1.9486740783539893e-06, + "loss": 0.8164, + "step": 15141 + }, + { + "epoch": 0.39, + "learning_rate": 1.94866532705969e-06, + "loss": 0.7725, + "step": 15142 + }, + { + "epoch": 0.39, + "learning_rate": 1.948656575039041e-06, + "loss": 0.9355, + "step": 15143 + }, + { + "epoch": 0.39, + "learning_rate": 1.948647822292049e-06, + "loss": 0.8145, + "step": 15144 + }, + { + "epoch": 0.39, + "learning_rate": 1.9486390688187214e-06, + "loss": 0.8252, + "step": 15145 + }, + { + "epoch": 0.39, + "learning_rate": 1.948630314619064e-06, + "loss": 0.8652, + "step": 15146 + }, + { + "epoch": 0.39, + "learning_rate": 1.9486215596930845e-06, + "loss": 0.8032, + "step": 15147 + }, + { + "epoch": 0.39, + "learning_rate": 1.9486128040407886e-06, + "loss": 0.7983, + "step": 15148 + }, + { + "epoch": 0.39, + "learning_rate": 1.9486040476621835e-06, + "loss": 0.8324, + "step": 15149 + }, + { + "epoch": 0.39, + "learning_rate": 1.9485952905572765e-06, + "loss": 0.9443, + "step": 15150 + }, + { + "epoch": 0.39, + "learning_rate": 1.948586532726073e-06, + "loss": 0.8994, + "step": 15151 + }, + { + "epoch": 0.39, + "learning_rate": 1.948577774168581e-06, + "loss": 0.9434, + "step": 15152 + }, + { + "epoch": 0.39, + "learning_rate": 1.9485690148848063e-06, + "loss": 0.877, + "step": 15153 + }, + { + "epoch": 0.39, + "learning_rate": 1.948560254874756e-06, + "loss": 0.9336, + "step": 15154 + }, + { + "epoch": 0.39, + "learning_rate": 1.948551494138437e-06, + "loss": 0.7676, + "step": 15155 + }, + { + "epoch": 0.39, + "learning_rate": 1.9485427326758553e-06, + "loss": 0.8828, + "step": 15156 + }, + { + "epoch": 0.39, + "learning_rate": 1.948533970487018e-06, + "loss": 0.6597, + "step": 15157 + }, + { + "epoch": 0.39, + "learning_rate": 1.948525207571932e-06, + "loss": 0.8828, + "step": 15158 + }, + { + "epoch": 0.39, + "learning_rate": 1.948516443930604e-06, + "loss": 0.7397, + "step": 15159 + }, + { + "epoch": 0.39, + "learning_rate": 1.9485076795630402e-06, + "loss": 0.9746, + "step": 15160 + }, + { + "epoch": 0.39, + "learning_rate": 1.948498914469248e-06, + "loss": 1.1885, + "step": 15161 + }, + { + "epoch": 0.39, + "learning_rate": 1.9484901486492337e-06, + "loss": 0.8066, + "step": 15162 + }, + { + "epoch": 0.39, + "learning_rate": 1.9484813821030044e-06, + "loss": 1.0527, + "step": 15163 + }, + { + "epoch": 0.39, + "learning_rate": 1.9484726148305662e-06, + "loss": 1.1641, + "step": 15164 + }, + { + "epoch": 0.39, + "learning_rate": 1.948463846831926e-06, + "loss": 1.084, + "step": 15165 + }, + { + "epoch": 0.39, + "learning_rate": 1.948455078107091e-06, + "loss": 0.8359, + "step": 15166 + }, + { + "epoch": 0.39, + "learning_rate": 1.9484463086560674e-06, + "loss": 0.999, + "step": 15167 + }, + { + "epoch": 0.39, + "learning_rate": 1.948437538478862e-06, + "loss": 0.7568, + "step": 15168 + }, + { + "epoch": 0.39, + "learning_rate": 1.948428767575482e-06, + "loss": 0.8965, + "step": 15169 + }, + { + "epoch": 0.39, + "learning_rate": 1.948419995945933e-06, + "loss": 1.1582, + "step": 15170 + }, + { + "epoch": 0.39, + "learning_rate": 1.948411223590223e-06, + "loss": 0.7036, + "step": 15171 + }, + { + "epoch": 0.39, + "learning_rate": 1.948402450508358e-06, + "loss": 0.9863, + "step": 15172 + }, + { + "epoch": 0.39, + "learning_rate": 1.948393676700345e-06, + "loss": 0.8691, + "step": 15173 + }, + { + "epoch": 0.39, + "learning_rate": 1.94838490216619e-06, + "loss": 0.7544, + "step": 15174 + }, + { + "epoch": 0.39, + "learning_rate": 1.9483761269059007e-06, + "loss": 0.8584, + "step": 15175 + }, + { + "epoch": 0.39, + "learning_rate": 1.9483673509194833e-06, + "loss": 1.0557, + "step": 15176 + }, + { + "epoch": 0.39, + "learning_rate": 1.9483585742069447e-06, + "loss": 0.9834, + "step": 15177 + }, + { + "epoch": 0.39, + "learning_rate": 1.9483497967682918e-06, + "loss": 0.8203, + "step": 15178 + }, + { + "epoch": 0.39, + "learning_rate": 1.9483410186035304e-06, + "loss": 0.8086, + "step": 15179 + }, + { + "epoch": 0.39, + "learning_rate": 1.9483322397126683e-06, + "loss": 0.7236, + "step": 15180 + }, + { + "epoch": 0.39, + "learning_rate": 1.9483234600957118e-06, + "loss": 0.9043, + "step": 15181 + }, + { + "epoch": 0.39, + "learning_rate": 1.9483146797526676e-06, + "loss": 0.8389, + "step": 15182 + }, + { + "epoch": 0.39, + "learning_rate": 1.9483058986835425e-06, + "loss": 0.9141, + "step": 15183 + }, + { + "epoch": 0.39, + "learning_rate": 1.948297116888343e-06, + "loss": 0.8242, + "step": 15184 + }, + { + "epoch": 0.39, + "learning_rate": 1.9482883343670764e-06, + "loss": 0.9326, + "step": 15185 + }, + { + "epoch": 0.39, + "learning_rate": 1.9482795511197485e-06, + "loss": 0.918, + "step": 15186 + }, + { + "epoch": 0.39, + "learning_rate": 1.948270767146367e-06, + "loss": 0.8887, + "step": 15187 + }, + { + "epoch": 0.39, + "learning_rate": 1.9482619824469378e-06, + "loss": 0.7798, + "step": 15188 + }, + { + "epoch": 0.39, + "learning_rate": 1.9482531970214685e-06, + "loss": 0.6792, + "step": 15189 + }, + { + "epoch": 0.39, + "learning_rate": 1.948244410869965e-06, + "loss": 0.8525, + "step": 15190 + }, + { + "epoch": 0.39, + "learning_rate": 1.948235623992434e-06, + "loss": 1.083, + "step": 15191 + }, + { + "epoch": 0.39, + "learning_rate": 1.9482268363888836e-06, + "loss": 1.0234, + "step": 15192 + }, + { + "epoch": 0.39, + "learning_rate": 1.9482180480593186e-06, + "loss": 1.0264, + "step": 15193 + }, + { + "epoch": 0.39, + "learning_rate": 1.948209259003747e-06, + "loss": 0.9575, + "step": 15194 + }, + { + "epoch": 0.39, + "learning_rate": 1.9482004692221748e-06, + "loss": 0.915, + "step": 15195 + }, + { + "epoch": 0.39, + "learning_rate": 1.9481916787146094e-06, + "loss": 0.9082, + "step": 15196 + }, + { + "epoch": 0.39, + "learning_rate": 1.9481828874810577e-06, + "loss": 0.77, + "step": 15197 + }, + { + "epoch": 0.39, + "learning_rate": 1.948174095521525e-06, + "loss": 0.9883, + "step": 15198 + }, + { + "epoch": 0.39, + "learning_rate": 1.9481653028360198e-06, + "loss": 0.957, + "step": 15199 + }, + { + "epoch": 0.39, + "learning_rate": 1.9481565094245472e-06, + "loss": 0.9111, + "step": 15200 + }, + { + "epoch": 0.39, + "learning_rate": 1.9481477152871154e-06, + "loss": 0.8867, + "step": 15201 + }, + { + "epoch": 0.39, + "learning_rate": 1.9481389204237305e-06, + "loss": 0.9287, + "step": 15202 + }, + { + "epoch": 0.39, + "learning_rate": 1.948130124834399e-06, + "loss": 0.7271, + "step": 15203 + }, + { + "epoch": 0.39, + "learning_rate": 1.948121328519128e-06, + "loss": 0.792, + "step": 15204 + }, + { + "epoch": 0.39, + "learning_rate": 1.9481125314779242e-06, + "loss": 0.8555, + "step": 15205 + }, + { + "epoch": 0.39, + "learning_rate": 1.948103733710794e-06, + "loss": 1.0518, + "step": 15206 + }, + { + "epoch": 0.39, + "learning_rate": 1.948094935217744e-06, + "loss": 0.9053, + "step": 15207 + }, + { + "epoch": 0.39, + "learning_rate": 1.948086135998782e-06, + "loss": 0.7646, + "step": 15208 + }, + { + "epoch": 0.39, + "learning_rate": 1.948077336053914e-06, + "loss": 0.636, + "step": 15209 + }, + { + "epoch": 0.39, + "learning_rate": 1.9480685353831464e-06, + "loss": 1.0479, + "step": 15210 + }, + { + "epoch": 0.39, + "learning_rate": 1.9480597339864863e-06, + "loss": 0.5646, + "step": 15211 + }, + { + "epoch": 0.39, + "learning_rate": 1.948050931863941e-06, + "loss": 0.8662, + "step": 15212 + }, + { + "epoch": 0.39, + "learning_rate": 1.948042129015516e-06, + "loss": 0.7456, + "step": 15213 + }, + { + "epoch": 0.39, + "learning_rate": 1.948033325441219e-06, + "loss": 0.8047, + "step": 15214 + }, + { + "epoch": 0.39, + "learning_rate": 1.9480245211410565e-06, + "loss": 0.6025, + "step": 15215 + }, + { + "epoch": 0.39, + "learning_rate": 1.9480157161150356e-06, + "loss": 0.8203, + "step": 15216 + }, + { + "epoch": 0.39, + "learning_rate": 1.948006910363162e-06, + "loss": 0.833, + "step": 15217 + }, + { + "epoch": 0.39, + "learning_rate": 1.9479981038854436e-06, + "loss": 0.668, + "step": 15218 + }, + { + "epoch": 0.39, + "learning_rate": 1.9479892966818865e-06, + "loss": 0.7578, + "step": 15219 + }, + { + "epoch": 0.39, + "learning_rate": 1.9479804887524975e-06, + "loss": 0.5891, + "step": 15220 + }, + { + "epoch": 0.39, + "learning_rate": 1.947971680097283e-06, + "loss": 0.9697, + "step": 15221 + }, + { + "epoch": 0.39, + "learning_rate": 1.947962870716251e-06, + "loss": 0.6172, + "step": 15222 + }, + { + "epoch": 0.39, + "learning_rate": 1.9479540606094068e-06, + "loss": 0.7588, + "step": 15223 + }, + { + "epoch": 0.39, + "learning_rate": 1.947945249776758e-06, + "loss": 0.771, + "step": 15224 + }, + { + "epoch": 0.39, + "learning_rate": 1.947936438218311e-06, + "loss": 0.6958, + "step": 15225 + }, + { + "epoch": 0.39, + "learning_rate": 1.947927625934073e-06, + "loss": 0.6865, + "step": 15226 + }, + { + "epoch": 0.39, + "learning_rate": 1.9479188129240503e-06, + "loss": 0.9336, + "step": 15227 + }, + { + "epoch": 0.39, + "learning_rate": 1.9479099991882497e-06, + "loss": 0.7871, + "step": 15228 + }, + { + "epoch": 0.39, + "learning_rate": 1.9479011847266777e-06, + "loss": 0.8047, + "step": 15229 + }, + { + "epoch": 0.39, + "learning_rate": 1.9478923695393416e-06, + "loss": 1.0996, + "step": 15230 + }, + { + "epoch": 0.39, + "learning_rate": 1.947883553626248e-06, + "loss": 0.7734, + "step": 15231 + }, + { + "epoch": 0.39, + "learning_rate": 1.947874736987403e-06, + "loss": 0.9102, + "step": 15232 + }, + { + "epoch": 0.39, + "learning_rate": 1.9478659196228146e-06, + "loss": 0.9106, + "step": 15233 + }, + { + "epoch": 0.39, + "learning_rate": 1.9478571015324887e-06, + "loss": 0.9766, + "step": 15234 + }, + { + "epoch": 0.39, + "learning_rate": 1.947848282716432e-06, + "loss": 0.9209, + "step": 15235 + }, + { + "epoch": 0.39, + "learning_rate": 1.9478394631746513e-06, + "loss": 0.9453, + "step": 15236 + }, + { + "epoch": 0.39, + "learning_rate": 1.947830642907154e-06, + "loss": 1.0303, + "step": 15237 + }, + { + "epoch": 0.39, + "learning_rate": 1.947821821913946e-06, + "loss": 1.0635, + "step": 15238 + }, + { + "epoch": 0.39, + "learning_rate": 1.947813000195035e-06, + "loss": 0.7134, + "step": 15239 + }, + { + "epoch": 0.39, + "learning_rate": 1.9478041777504263e-06, + "loss": 0.9717, + "step": 15240 + }, + { + "epoch": 0.39, + "learning_rate": 1.947795354580128e-06, + "loss": 0.7051, + "step": 15241 + }, + { + "epoch": 0.39, + "learning_rate": 1.9477865306841462e-06, + "loss": 0.958, + "step": 15242 + }, + { + "epoch": 0.39, + "learning_rate": 1.9477777060624878e-06, + "loss": 1.0254, + "step": 15243 + }, + { + "epoch": 0.39, + "learning_rate": 1.9477688807151596e-06, + "loss": 0.9062, + "step": 15244 + }, + { + "epoch": 0.39, + "learning_rate": 1.9477600546421682e-06, + "loss": 0.6465, + "step": 15245 + }, + { + "epoch": 0.39, + "learning_rate": 1.947751227843521e-06, + "loss": 1.2373, + "step": 15246 + }, + { + "epoch": 0.39, + "learning_rate": 1.947742400319224e-06, + "loss": 0.9512, + "step": 15247 + }, + { + "epoch": 0.39, + "learning_rate": 1.947733572069284e-06, + "loss": 0.7734, + "step": 15248 + }, + { + "epoch": 0.39, + "learning_rate": 1.947724743093708e-06, + "loss": 0.8113, + "step": 15249 + }, + { + "epoch": 0.39, + "learning_rate": 1.9477159133925032e-06, + "loss": 0.8418, + "step": 15250 + }, + { + "epoch": 0.39, + "learning_rate": 1.947707082965676e-06, + "loss": 0.8418, + "step": 15251 + }, + { + "epoch": 0.39, + "learning_rate": 1.9476982518132326e-06, + "loss": 0.8215, + "step": 15252 + }, + { + "epoch": 0.39, + "learning_rate": 1.94768941993518e-06, + "loss": 0.6362, + "step": 15253 + }, + { + "epoch": 0.39, + "learning_rate": 1.9476805873315257e-06, + "loss": 0.9248, + "step": 15254 + }, + { + "epoch": 0.39, + "learning_rate": 1.947671754002276e-06, + "loss": 0.7959, + "step": 15255 + }, + { + "epoch": 0.39, + "learning_rate": 1.947662919947437e-06, + "loss": 0.7656, + "step": 15256 + }, + { + "epoch": 0.39, + "learning_rate": 1.9476540851670165e-06, + "loss": 0.8789, + "step": 15257 + }, + { + "epoch": 0.39, + "learning_rate": 1.947645249661021e-06, + "loss": 0.9971, + "step": 15258 + }, + { + "epoch": 0.39, + "learning_rate": 1.9476364134294568e-06, + "loss": 0.7402, + "step": 15259 + }, + { + "epoch": 0.39, + "learning_rate": 1.9476275764723313e-06, + "loss": 0.9089, + "step": 15260 + }, + { + "epoch": 0.39, + "learning_rate": 1.9476187387896505e-06, + "loss": 0.9346, + "step": 15261 + }, + { + "epoch": 0.39, + "learning_rate": 1.947609900381422e-06, + "loss": 1.1113, + "step": 15262 + }, + { + "epoch": 0.39, + "learning_rate": 1.947601061247652e-06, + "loss": 1.0674, + "step": 15263 + }, + { + "epoch": 0.39, + "learning_rate": 1.9475922213883475e-06, + "loss": 0.9199, + "step": 15264 + }, + { + "epoch": 0.39, + "learning_rate": 1.947583380803515e-06, + "loss": 0.9014, + "step": 15265 + }, + { + "epoch": 0.39, + "learning_rate": 1.947574539493162e-06, + "loss": 0.8799, + "step": 15266 + }, + { + "epoch": 0.39, + "learning_rate": 1.9475656974572942e-06, + "loss": 0.8262, + "step": 15267 + }, + { + "epoch": 0.39, + "learning_rate": 1.947556854695919e-06, + "loss": 0.4395, + "step": 15268 + }, + { + "epoch": 0.39, + "learning_rate": 1.9475480112090433e-06, + "loss": 0.8535, + "step": 15269 + }, + { + "epoch": 0.39, + "learning_rate": 1.9475391669966736e-06, + "loss": 0.6367, + "step": 15270 + }, + { + "epoch": 0.39, + "learning_rate": 1.9475303220588164e-06, + "loss": 0.7363, + "step": 15271 + }, + { + "epoch": 0.39, + "learning_rate": 1.9475214763954792e-06, + "loss": 0.8682, + "step": 15272 + }, + { + "epoch": 0.39, + "learning_rate": 1.947512630006668e-06, + "loss": 0.8252, + "step": 15273 + }, + { + "epoch": 0.39, + "learning_rate": 1.9475037828923902e-06, + "loss": 0.9766, + "step": 15274 + }, + { + "epoch": 0.39, + "learning_rate": 1.9474949350526523e-06, + "loss": 1.0195, + "step": 15275 + }, + { + "epoch": 0.39, + "learning_rate": 1.9474860864874612e-06, + "loss": 1.0889, + "step": 15276 + }, + { + "epoch": 0.39, + "learning_rate": 1.9474772371968237e-06, + "loss": 0.7812, + "step": 15277 + }, + { + "epoch": 0.39, + "learning_rate": 1.947468387180746e-06, + "loss": 0.7632, + "step": 15278 + }, + { + "epoch": 0.39, + "learning_rate": 1.9474595364392355e-06, + "loss": 0.9746, + "step": 15279 + }, + { + "epoch": 0.39, + "learning_rate": 1.9474506849722988e-06, + "loss": 0.9404, + "step": 15280 + }, + { + "epoch": 0.39, + "learning_rate": 1.9474418327799428e-06, + "loss": 0.9873, + "step": 15281 + }, + { + "epoch": 0.39, + "learning_rate": 1.947432979862174e-06, + "loss": 0.9785, + "step": 15282 + }, + { + "epoch": 0.39, + "learning_rate": 1.9474241262189994e-06, + "loss": 0.8325, + "step": 15283 + }, + { + "epoch": 0.39, + "learning_rate": 1.947415271850426e-06, + "loss": 1.2422, + "step": 15284 + }, + { + "epoch": 0.39, + "learning_rate": 1.9474064167564595e-06, + "loss": 0.8052, + "step": 15285 + }, + { + "epoch": 0.39, + "learning_rate": 1.9473975609371084e-06, + "loss": 0.9395, + "step": 15286 + }, + { + "epoch": 0.39, + "learning_rate": 1.9473887043923777e-06, + "loss": 0.7393, + "step": 15287 + }, + { + "epoch": 0.39, + "learning_rate": 1.9473798471222756e-06, + "loss": 0.9014, + "step": 15288 + }, + { + "epoch": 0.39, + "learning_rate": 1.9473709891268083e-06, + "loss": 0.8174, + "step": 15289 + }, + { + "epoch": 0.39, + "learning_rate": 1.9473621304059823e-06, + "loss": 0.7212, + "step": 15290 + }, + { + "epoch": 0.39, + "learning_rate": 1.9473532709598047e-06, + "loss": 0.792, + "step": 15291 + }, + { + "epoch": 0.39, + "learning_rate": 1.9473444107882827e-06, + "loss": 0.8262, + "step": 15292 + }, + { + "epoch": 0.39, + "learning_rate": 1.947335549891422e-06, + "loss": 0.9199, + "step": 15293 + }, + { + "epoch": 0.39, + "learning_rate": 1.9473266882692305e-06, + "loss": 0.9736, + "step": 15294 + }, + { + "epoch": 0.39, + "learning_rate": 1.9473178259217143e-06, + "loss": 0.7554, + "step": 15295 + }, + { + "epoch": 0.39, + "learning_rate": 1.9473089628488804e-06, + "loss": 0.7949, + "step": 15296 + }, + { + "epoch": 0.39, + "learning_rate": 1.9473000990507356e-06, + "loss": 0.7256, + "step": 15297 + }, + { + "epoch": 0.39, + "learning_rate": 1.947291234527287e-06, + "loss": 1.0098, + "step": 15298 + }, + { + "epoch": 0.39, + "learning_rate": 1.947282369278541e-06, + "loss": 0.9609, + "step": 15299 + }, + { + "epoch": 0.39, + "learning_rate": 1.947273503304504e-06, + "loss": 0.8018, + "step": 15300 + }, + { + "epoch": 0.39, + "learning_rate": 1.9472646366051835e-06, + "loss": 0.9434, + "step": 15301 + }, + { + "epoch": 0.39, + "learning_rate": 1.947255769180586e-06, + "loss": 0.9072, + "step": 15302 + }, + { + "epoch": 0.39, + "learning_rate": 1.947246901030718e-06, + "loss": 0.9561, + "step": 15303 + }, + { + "epoch": 0.39, + "learning_rate": 1.9472380321555873e-06, + "loss": 0.7139, + "step": 15304 + }, + { + "epoch": 0.39, + "learning_rate": 1.9472291625551995e-06, + "loss": 0.6367, + "step": 15305 + }, + { + "epoch": 0.39, + "learning_rate": 1.947220292229562e-06, + "loss": 0.8311, + "step": 15306 + }, + { + "epoch": 0.39, + "learning_rate": 1.9472114211786816e-06, + "loss": 0.7368, + "step": 15307 + }, + { + "epoch": 0.39, + "learning_rate": 1.9472025494025647e-06, + "loss": 0.8359, + "step": 15308 + }, + { + "epoch": 0.39, + "learning_rate": 1.9471936769012186e-06, + "loss": 0.8164, + "step": 15309 + }, + { + "epoch": 0.39, + "learning_rate": 1.9471848036746497e-06, + "loss": 0.7393, + "step": 15310 + }, + { + "epoch": 0.39, + "learning_rate": 1.947175929722865e-06, + "loss": 0.9766, + "step": 15311 + }, + { + "epoch": 0.39, + "learning_rate": 1.9471670550458713e-06, + "loss": 0.7329, + "step": 15312 + }, + { + "epoch": 0.39, + "learning_rate": 1.9471581796436754e-06, + "loss": 0.9717, + "step": 15313 + }, + { + "epoch": 0.39, + "learning_rate": 1.9471493035162837e-06, + "loss": 0.8042, + "step": 15314 + }, + { + "epoch": 0.39, + "learning_rate": 1.9471404266637035e-06, + "loss": 0.7202, + "step": 15315 + }, + { + "epoch": 0.39, + "learning_rate": 1.9471315490859416e-06, + "loss": 0.9863, + "step": 15316 + }, + { + "epoch": 0.39, + "learning_rate": 1.9471226707830043e-06, + "loss": 0.8477, + "step": 15317 + }, + { + "epoch": 0.39, + "learning_rate": 1.947113791754899e-06, + "loss": 0.7087, + "step": 15318 + }, + { + "epoch": 0.39, + "learning_rate": 1.9471049120016322e-06, + "loss": 0.9346, + "step": 15319 + }, + { + "epoch": 0.39, + "learning_rate": 1.9470960315232106e-06, + "loss": 0.876, + "step": 15320 + }, + { + "epoch": 0.39, + "learning_rate": 1.947087150319641e-06, + "loss": 0.9688, + "step": 15321 + }, + { + "epoch": 0.39, + "learning_rate": 1.947078268390931e-06, + "loss": 0.8535, + "step": 15322 + }, + { + "epoch": 0.39, + "learning_rate": 1.947069385737086e-06, + "loss": 0.7881, + "step": 15323 + }, + { + "epoch": 0.39, + "learning_rate": 1.9470605023581137e-06, + "loss": 0.6729, + "step": 15324 + }, + { + "epoch": 0.39, + "learning_rate": 1.947051618254021e-06, + "loss": 0.7822, + "step": 15325 + }, + { + "epoch": 0.39, + "learning_rate": 1.9470427334248138e-06, + "loss": 1.0996, + "step": 15326 + }, + { + "epoch": 0.39, + "learning_rate": 1.9470338478705002e-06, + "loss": 0.7212, + "step": 15327 + }, + { + "epoch": 0.39, + "learning_rate": 1.947024961591086e-06, + "loss": 1.0645, + "step": 15328 + }, + { + "epoch": 0.39, + "learning_rate": 1.947016074586578e-06, + "loss": 0.7808, + "step": 15329 + }, + { + "epoch": 0.39, + "learning_rate": 1.947007186856984e-06, + "loss": 0.873, + "step": 15330 + }, + { + "epoch": 0.39, + "learning_rate": 1.94699829840231e-06, + "loss": 0.9336, + "step": 15331 + }, + { + "epoch": 0.39, + "learning_rate": 1.9469894092225623e-06, + "loss": 0.8359, + "step": 15332 + }, + { + "epoch": 0.39, + "learning_rate": 1.946980519317749e-06, + "loss": 0.8799, + "step": 15333 + }, + { + "epoch": 0.39, + "learning_rate": 1.946971628687876e-06, + "loss": 0.8525, + "step": 15334 + }, + { + "epoch": 0.39, + "learning_rate": 1.946962737332951e-06, + "loss": 0.9736, + "step": 15335 + }, + { + "epoch": 0.39, + "learning_rate": 1.9469538452529794e-06, + "loss": 0.9736, + "step": 15336 + }, + { + "epoch": 0.39, + "learning_rate": 1.946944952447969e-06, + "loss": 0.6934, + "step": 15337 + }, + { + "epoch": 0.39, + "learning_rate": 1.9469360589179263e-06, + "loss": 1.0762, + "step": 15338 + }, + { + "epoch": 0.39, + "learning_rate": 1.9469271646628586e-06, + "loss": 0.8799, + "step": 15339 + }, + { + "epoch": 0.39, + "learning_rate": 1.9469182696827717e-06, + "loss": 0.9922, + "step": 15340 + }, + { + "epoch": 0.39, + "learning_rate": 1.9469093739776733e-06, + "loss": 0.8105, + "step": 15341 + }, + { + "epoch": 0.39, + "learning_rate": 1.9469004775475703e-06, + "loss": 0.8477, + "step": 15342 + }, + { + "epoch": 0.39, + "learning_rate": 1.946891580392469e-06, + "loss": 0.8018, + "step": 15343 + }, + { + "epoch": 0.39, + "learning_rate": 1.9468826825123758e-06, + "loss": 1.0713, + "step": 15344 + }, + { + "epoch": 0.39, + "learning_rate": 1.9468737839072983e-06, + "loss": 0.8926, + "step": 15345 + }, + { + "epoch": 0.39, + "learning_rate": 1.9468648845772433e-06, + "loss": 0.7812, + "step": 15346 + }, + { + "epoch": 0.39, + "learning_rate": 1.9468559845222174e-06, + "loss": 0.9795, + "step": 15347 + }, + { + "epoch": 0.39, + "learning_rate": 1.9468470837422274e-06, + "loss": 1.0918, + "step": 15348 + }, + { + "epoch": 0.39, + "learning_rate": 1.9468381822372797e-06, + "loss": 0.9131, + "step": 15349 + }, + { + "epoch": 0.39, + "learning_rate": 1.9468292800073824e-06, + "loss": 0.7461, + "step": 15350 + }, + { + "epoch": 0.39, + "learning_rate": 1.9468203770525405e-06, + "loss": 0.7373, + "step": 15351 + }, + { + "epoch": 0.39, + "learning_rate": 1.9468114733727624e-06, + "loss": 0.6304, + "step": 15352 + }, + { + "epoch": 0.39, + "learning_rate": 1.946802568968054e-06, + "loss": 1.0469, + "step": 15353 + }, + { + "epoch": 0.39, + "learning_rate": 1.946793663838423e-06, + "loss": 0.6978, + "step": 15354 + }, + { + "epoch": 0.39, + "learning_rate": 1.9467847579838747e-06, + "loss": 0.9883, + "step": 15355 + }, + { + "epoch": 0.39, + "learning_rate": 1.946775851404417e-06, + "loss": 0.8105, + "step": 15356 + }, + { + "epoch": 0.39, + "learning_rate": 1.9467669441000576e-06, + "loss": 0.8223, + "step": 15357 + }, + { + "epoch": 0.39, + "learning_rate": 1.9467580360708013e-06, + "loss": 0.8672, + "step": 15358 + }, + { + "epoch": 0.39, + "learning_rate": 1.946749127316656e-06, + "loss": 0.8149, + "step": 15359 + }, + { + "epoch": 0.39, + "learning_rate": 1.9467402178376288e-06, + "loss": 0.9365, + "step": 15360 + }, + { + "epoch": 0.39, + "learning_rate": 1.9467313076337256e-06, + "loss": 0.5806, + "step": 15361 + }, + { + "epoch": 0.39, + "learning_rate": 1.946722396704954e-06, + "loss": 0.6924, + "step": 15362 + }, + { + "epoch": 0.39, + "learning_rate": 1.946713485051321e-06, + "loss": 0.9727, + "step": 15363 + }, + { + "epoch": 0.39, + "learning_rate": 1.9467045726728326e-06, + "loss": 0.9136, + "step": 15364 + }, + { + "epoch": 0.39, + "learning_rate": 1.946695659569496e-06, + "loss": 1.1055, + "step": 15365 + }, + { + "epoch": 0.39, + "learning_rate": 1.9466867457413186e-06, + "loss": 0.9629, + "step": 15366 + }, + { + "epoch": 0.39, + "learning_rate": 1.946677831188306e-06, + "loss": 0.8374, + "step": 15367 + }, + { + "epoch": 0.39, + "learning_rate": 1.946668915910466e-06, + "loss": 0.8408, + "step": 15368 + }, + { + "epoch": 0.39, + "learning_rate": 1.9466599999078052e-06, + "loss": 0.8643, + "step": 15369 + }, + { + "epoch": 0.39, + "learning_rate": 1.9466510831803304e-06, + "loss": 0.9678, + "step": 15370 + }, + { + "epoch": 0.39, + "learning_rate": 1.946642165728048e-06, + "loss": 0.9746, + "step": 15371 + }, + { + "epoch": 0.39, + "learning_rate": 1.946633247550966e-06, + "loss": 0.9844, + "step": 15372 + }, + { + "epoch": 0.39, + "learning_rate": 1.9466243286490897e-06, + "loss": 0.8726, + "step": 15373 + }, + { + "epoch": 0.39, + "learning_rate": 1.946615409022427e-06, + "loss": 0.9263, + "step": 15374 + }, + { + "epoch": 0.39, + "learning_rate": 1.9466064886709847e-06, + "loss": 1.041, + "step": 15375 + }, + { + "epoch": 0.39, + "learning_rate": 1.9465975675947686e-06, + "loss": 0.6592, + "step": 15376 + }, + { + "epoch": 0.39, + "learning_rate": 1.9465886457937867e-06, + "loss": 0.8164, + "step": 15377 + }, + { + "epoch": 0.39, + "learning_rate": 1.9465797232680452e-06, + "loss": 0.7266, + "step": 15378 + }, + { + "epoch": 0.39, + "learning_rate": 1.9465708000175515e-06, + "loss": 0.8291, + "step": 15379 + }, + { + "epoch": 0.39, + "learning_rate": 1.9465618760423117e-06, + "loss": 0.8877, + "step": 15380 + }, + { + "epoch": 0.39, + "learning_rate": 1.9465529513423333e-06, + "loss": 0.7766, + "step": 15381 + }, + { + "epoch": 0.39, + "learning_rate": 1.946544025917623e-06, + "loss": 0.9414, + "step": 15382 + }, + { + "epoch": 0.39, + "learning_rate": 1.9465350997681867e-06, + "loss": 1.0518, + "step": 15383 + }, + { + "epoch": 0.39, + "learning_rate": 1.9465261728940327e-06, + "loss": 0.9775, + "step": 15384 + }, + { + "epoch": 0.39, + "learning_rate": 1.946517245295167e-06, + "loss": 0.8623, + "step": 15385 + }, + { + "epoch": 0.39, + "learning_rate": 1.946508316971596e-06, + "loss": 0.9062, + "step": 15386 + }, + { + "epoch": 0.39, + "learning_rate": 1.9464993879233277e-06, + "loss": 0.8086, + "step": 15387 + }, + { + "epoch": 0.39, + "learning_rate": 1.946490458150368e-06, + "loss": 0.876, + "step": 15388 + }, + { + "epoch": 0.39, + "learning_rate": 1.9464815276527244e-06, + "loss": 0.8984, + "step": 15389 + }, + { + "epoch": 0.39, + "learning_rate": 1.9464725964304037e-06, + "loss": 0.8125, + "step": 15390 + }, + { + "epoch": 0.39, + "learning_rate": 1.9464636644834117e-06, + "loss": 0.8945, + "step": 15391 + }, + { + "epoch": 0.39, + "learning_rate": 1.9464547318117567e-06, + "loss": 0.7053, + "step": 15392 + }, + { + "epoch": 0.39, + "learning_rate": 1.9464457984154443e-06, + "loss": 0.5552, + "step": 15393 + }, + { + "epoch": 0.39, + "learning_rate": 1.946436864294482e-06, + "loss": 0.8975, + "step": 15394 + }, + { + "epoch": 0.39, + "learning_rate": 1.9464279294488763e-06, + "loss": 0.9756, + "step": 15395 + }, + { + "epoch": 0.39, + "learning_rate": 1.9464189938786348e-06, + "loss": 0.9629, + "step": 15396 + }, + { + "epoch": 0.39, + "learning_rate": 1.9464100575837633e-06, + "loss": 1.0918, + "step": 15397 + }, + { + "epoch": 0.39, + "learning_rate": 1.9464011205642696e-06, + "loss": 0.7812, + "step": 15398 + }, + { + "epoch": 0.39, + "learning_rate": 1.94639218282016e-06, + "loss": 0.9404, + "step": 15399 + }, + { + "epoch": 0.39, + "learning_rate": 1.9463832443514406e-06, + "loss": 0.7891, + "step": 15400 + }, + { + "epoch": 0.39, + "learning_rate": 1.94637430515812e-06, + "loss": 0.8633, + "step": 15401 + }, + { + "epoch": 0.39, + "learning_rate": 1.946365365240204e-06, + "loss": 0.9795, + "step": 15402 + }, + { + "epoch": 0.39, + "learning_rate": 1.946356424597699e-06, + "loss": 1.0762, + "step": 15403 + }, + { + "epoch": 0.39, + "learning_rate": 1.9463474832306126e-06, + "loss": 1.168, + "step": 15404 + }, + { + "epoch": 0.39, + "learning_rate": 1.9463385411389518e-06, + "loss": 0.7524, + "step": 15405 + }, + { + "epoch": 0.39, + "learning_rate": 1.946329598322723e-06, + "loss": 0.8794, + "step": 15406 + }, + { + "epoch": 0.39, + "learning_rate": 1.946320654781933e-06, + "loss": 0.8125, + "step": 15407 + }, + { + "epoch": 0.39, + "learning_rate": 1.9463117105165887e-06, + "loss": 0.646, + "step": 15408 + }, + { + "epoch": 0.39, + "learning_rate": 1.9463027655266975e-06, + "loss": 0.9121, + "step": 15409 + }, + { + "epoch": 0.39, + "learning_rate": 1.9462938198122652e-06, + "loss": 0.7637, + "step": 15410 + }, + { + "epoch": 0.39, + "learning_rate": 1.9462848733732993e-06, + "loss": 0.5579, + "step": 15411 + }, + { + "epoch": 0.4, + "learning_rate": 1.946275926209807e-06, + "loss": 0.8721, + "step": 15412 + }, + { + "epoch": 0.4, + "learning_rate": 1.9462669783217943e-06, + "loss": 0.8706, + "step": 15413 + }, + { + "epoch": 0.4, + "learning_rate": 1.946258029709269e-06, + "loss": 0.8457, + "step": 15414 + }, + { + "epoch": 0.4, + "learning_rate": 1.946249080372237e-06, + "loss": 0.8857, + "step": 15415 + }, + { + "epoch": 0.4, + "learning_rate": 1.946240130310706e-06, + "loss": 0.9814, + "step": 15416 + }, + { + "epoch": 0.4, + "learning_rate": 1.9462311795246817e-06, + "loss": 0.6885, + "step": 15417 + }, + { + "epoch": 0.4, + "learning_rate": 1.946222228014172e-06, + "loss": 0.6357, + "step": 15418 + }, + { + "epoch": 0.4, + "learning_rate": 1.9462132757791836e-06, + "loss": 0.8076, + "step": 15419 + }, + { + "epoch": 0.4, + "learning_rate": 1.9462043228197232e-06, + "loss": 0.7837, + "step": 15420 + }, + { + "epoch": 0.4, + "learning_rate": 1.9461953691357977e-06, + "loss": 0.875, + "step": 15421 + }, + { + "epoch": 0.4, + "learning_rate": 1.9461864147274143e-06, + "loss": 0.8105, + "step": 15422 + }, + { + "epoch": 0.4, + "learning_rate": 1.9461774595945788e-06, + "loss": 1.1113, + "step": 15423 + }, + { + "epoch": 0.4, + "learning_rate": 1.946168503737299e-06, + "loss": 0.9346, + "step": 15424 + }, + { + "epoch": 0.4, + "learning_rate": 1.9461595471555813e-06, + "loss": 0.8252, + "step": 15425 + }, + { + "epoch": 0.4, + "learning_rate": 1.946150589849433e-06, + "loss": 0.9111, + "step": 15426 + }, + { + "epoch": 0.4, + "learning_rate": 1.9461416318188604e-06, + "loss": 0.834, + "step": 15427 + }, + { + "epoch": 0.4, + "learning_rate": 1.9461326730638707e-06, + "loss": 0.7588, + "step": 15428 + }, + { + "epoch": 0.4, + "learning_rate": 1.946123713584471e-06, + "loss": 0.5347, + "step": 15429 + }, + { + "epoch": 0.4, + "learning_rate": 1.9461147533806675e-06, + "loss": 0.5898, + "step": 15430 + }, + { + "epoch": 0.4, + "learning_rate": 1.9461057924524678e-06, + "loss": 0.7627, + "step": 15431 + }, + { + "epoch": 0.4, + "learning_rate": 1.9460968307998782e-06, + "loss": 1.0605, + "step": 15432 + }, + { + "epoch": 0.4, + "learning_rate": 1.9460878684229057e-06, + "loss": 0.9082, + "step": 15433 + }, + { + "epoch": 0.4, + "learning_rate": 1.9460789053215578e-06, + "loss": 0.8584, + "step": 15434 + }, + { + "epoch": 0.4, + "learning_rate": 1.94606994149584e-06, + "loss": 0.752, + "step": 15435 + }, + { + "epoch": 0.4, + "learning_rate": 1.9460609769457603e-06, + "loss": 0.7383, + "step": 15436 + }, + { + "epoch": 0.4, + "learning_rate": 1.9460520116713253e-06, + "loss": 1.0879, + "step": 15437 + }, + { + "epoch": 0.4, + "learning_rate": 1.9460430456725415e-06, + "loss": 0.8633, + "step": 15438 + }, + { + "epoch": 0.4, + "learning_rate": 1.946034078949416e-06, + "loss": 0.8965, + "step": 15439 + }, + { + "epoch": 0.4, + "learning_rate": 1.946025111501956e-06, + "loss": 0.7461, + "step": 15440 + }, + { + "epoch": 0.4, + "learning_rate": 1.9460161433301682e-06, + "loss": 0.8037, + "step": 15441 + }, + { + "epoch": 0.4, + "learning_rate": 1.946007174434059e-06, + "loss": 1.0107, + "step": 15442 + }, + { + "epoch": 0.4, + "learning_rate": 1.945998204813636e-06, + "loss": 1.002, + "step": 15443 + }, + { + "epoch": 0.4, + "learning_rate": 1.9459892344689054e-06, + "loss": 0.7998, + "step": 15444 + }, + { + "epoch": 0.4, + "learning_rate": 1.9459802633998743e-06, + "loss": 0.9707, + "step": 15445 + }, + { + "epoch": 0.4, + "learning_rate": 1.9459712916065495e-06, + "loss": 0.8232, + "step": 15446 + }, + { + "epoch": 0.4, + "learning_rate": 1.945962319088938e-06, + "loss": 0.9229, + "step": 15447 + }, + { + "epoch": 0.4, + "learning_rate": 1.945953345847047e-06, + "loss": 1.1006, + "step": 15448 + }, + { + "epoch": 0.4, + "learning_rate": 1.945944371880883e-06, + "loss": 0.7773, + "step": 15449 + }, + { + "epoch": 0.4, + "learning_rate": 1.9459353971904522e-06, + "loss": 0.6992, + "step": 15450 + }, + { + "epoch": 0.4, + "learning_rate": 1.9459264217757626e-06, + "loss": 0.8423, + "step": 15451 + }, + { + "epoch": 0.4, + "learning_rate": 1.945917445636821e-06, + "loss": 0.8066, + "step": 15452 + }, + { + "epoch": 0.4, + "learning_rate": 1.9459084687736334e-06, + "loss": 1.0498, + "step": 15453 + }, + { + "epoch": 0.4, + "learning_rate": 1.9458994911862073e-06, + "loss": 1.0215, + "step": 15454 + }, + { + "epoch": 0.4, + "learning_rate": 1.94589051287455e-06, + "loss": 0.8408, + "step": 15455 + }, + { + "epoch": 0.4, + "learning_rate": 1.945881533838667e-06, + "loss": 1.002, + "step": 15456 + }, + { + "epoch": 0.4, + "learning_rate": 1.9458725540785666e-06, + "loss": 0.9902, + "step": 15457 + }, + { + "epoch": 0.4, + "learning_rate": 1.9458635735942544e-06, + "loss": 1.0273, + "step": 15458 + }, + { + "epoch": 0.4, + "learning_rate": 1.9458545923857387e-06, + "loss": 0.7871, + "step": 15459 + }, + { + "epoch": 0.4, + "learning_rate": 1.945845610453025e-06, + "loss": 0.9209, + "step": 15460 + }, + { + "epoch": 0.4, + "learning_rate": 1.9458366277961212e-06, + "loss": 1.0029, + "step": 15461 + }, + { + "epoch": 0.4, + "learning_rate": 1.945827644415034e-06, + "loss": 0.8994, + "step": 15462 + }, + { + "epoch": 0.4, + "learning_rate": 1.9458186603097697e-06, + "loss": 0.9229, + "step": 15463 + }, + { + "epoch": 0.4, + "learning_rate": 1.9458096754803356e-06, + "loss": 0.8105, + "step": 15464 + }, + { + "epoch": 0.4, + "learning_rate": 1.9458006899267387e-06, + "loss": 1.0703, + "step": 15465 + }, + { + "epoch": 0.4, + "learning_rate": 1.9457917036489854e-06, + "loss": 0.7358, + "step": 15466 + }, + { + "epoch": 0.4, + "learning_rate": 1.945782716647083e-06, + "loss": 0.8857, + "step": 15467 + }, + { + "epoch": 0.4, + "learning_rate": 1.9457737289210383e-06, + "loss": 0.9932, + "step": 15468 + }, + { + "epoch": 0.4, + "learning_rate": 1.945764740470858e-06, + "loss": 0.7898, + "step": 15469 + }, + { + "epoch": 0.4, + "learning_rate": 1.945755751296549e-06, + "loss": 0.7793, + "step": 15470 + }, + { + "epoch": 0.4, + "learning_rate": 1.9457467613981186e-06, + "loss": 0.5791, + "step": 15471 + }, + { + "epoch": 0.4, + "learning_rate": 1.9457377707755733e-06, + "loss": 0.9307, + "step": 15472 + }, + { + "epoch": 0.4, + "learning_rate": 1.9457287794289203e-06, + "loss": 0.6963, + "step": 15473 + }, + { + "epoch": 0.4, + "learning_rate": 1.945719787358166e-06, + "loss": 0.896, + "step": 15474 + }, + { + "epoch": 0.4, + "learning_rate": 1.945710794563318e-06, + "loss": 0.8379, + "step": 15475 + }, + { + "epoch": 0.4, + "learning_rate": 1.945701801044382e-06, + "loss": 0.9395, + "step": 15476 + }, + { + "epoch": 0.4, + "learning_rate": 1.945692806801366e-06, + "loss": 0.9731, + "step": 15477 + }, + { + "epoch": 0.4, + "learning_rate": 1.9456838118342763e-06, + "loss": 0.8057, + "step": 15478 + }, + { + "epoch": 0.4, + "learning_rate": 1.94567481614312e-06, + "loss": 0.624, + "step": 15479 + }, + { + "epoch": 0.4, + "learning_rate": 1.9456658197279046e-06, + "loss": 0.6934, + "step": 15480 + }, + { + "epoch": 0.4, + "learning_rate": 1.945656822588636e-06, + "loss": 0.9082, + "step": 15481 + }, + { + "epoch": 0.4, + "learning_rate": 1.945647824725321e-06, + "loss": 0.769, + "step": 15482 + }, + { + "epoch": 0.4, + "learning_rate": 1.9456388261379673e-06, + "loss": 0.8999, + "step": 15483 + }, + { + "epoch": 0.4, + "learning_rate": 1.945629826826582e-06, + "loss": 0.8682, + "step": 15484 + }, + { + "epoch": 0.4, + "learning_rate": 1.9456208267911703e-06, + "loss": 0.582, + "step": 15485 + }, + { + "epoch": 0.4, + "learning_rate": 1.945611826031741e-06, + "loss": 0.834, + "step": 15486 + }, + { + "epoch": 0.4, + "learning_rate": 1.9456028245483e-06, + "loss": 0.8184, + "step": 15487 + }, + { + "epoch": 0.4, + "learning_rate": 1.945593822340854e-06, + "loss": 0.7554, + "step": 15488 + }, + { + "epoch": 0.4, + "learning_rate": 1.9455848194094106e-06, + "loss": 0.9346, + "step": 15489 + }, + { + "epoch": 0.4, + "learning_rate": 1.9455758157539767e-06, + "loss": 1.0176, + "step": 15490 + }, + { + "epoch": 0.4, + "learning_rate": 1.9455668113745584e-06, + "loss": 0.9004, + "step": 15491 + }, + { + "epoch": 0.4, + "learning_rate": 1.9455578062711633e-06, + "loss": 0.7734, + "step": 15492 + }, + { + "epoch": 0.4, + "learning_rate": 1.945548800443798e-06, + "loss": 0.8975, + "step": 15493 + }, + { + "epoch": 0.4, + "learning_rate": 1.9455397938924696e-06, + "loss": 0.9375, + "step": 15494 + }, + { + "epoch": 0.4, + "learning_rate": 1.945530786617185e-06, + "loss": 0.8721, + "step": 15495 + }, + { + "epoch": 0.4, + "learning_rate": 1.9455217786179506e-06, + "loss": 1.1074, + "step": 15496 + }, + { + "epoch": 0.4, + "learning_rate": 1.9455127698947737e-06, + "loss": 0.9111, + "step": 15497 + }, + { + "epoch": 0.4, + "learning_rate": 1.945503760447661e-06, + "loss": 0.9375, + "step": 15498 + }, + { + "epoch": 0.4, + "learning_rate": 1.94549475027662e-06, + "loss": 0.9043, + "step": 15499 + }, + { + "epoch": 0.4, + "learning_rate": 1.945485739381657e-06, + "loss": 0.7769, + "step": 15500 + }, + { + "epoch": 0.4, + "learning_rate": 1.945476727762779e-06, + "loss": 0.9233, + "step": 15501 + }, + { + "epoch": 0.4, + "learning_rate": 1.945467715419993e-06, + "loss": 1.0146, + "step": 15502 + }, + { + "epoch": 0.4, + "learning_rate": 1.9454587023533057e-06, + "loss": 0.8271, + "step": 15503 + }, + { + "epoch": 0.4, + "learning_rate": 1.945449688562724e-06, + "loss": 0.9395, + "step": 15504 + }, + { + "epoch": 0.4, + "learning_rate": 1.945440674048255e-06, + "loss": 0.7815, + "step": 15505 + }, + { + "epoch": 0.4, + "learning_rate": 1.9454316588099057e-06, + "loss": 0.8223, + "step": 15506 + }, + { + "epoch": 0.4, + "learning_rate": 1.945422642847683e-06, + "loss": 0.8467, + "step": 15507 + }, + { + "epoch": 0.4, + "learning_rate": 1.9454136261615933e-06, + "loss": 1.0479, + "step": 15508 + }, + { + "epoch": 0.4, + "learning_rate": 1.945404608751644e-06, + "loss": 0.9268, + "step": 15509 + }, + { + "epoch": 0.4, + "learning_rate": 1.9453955906178423e-06, + "loss": 0.8223, + "step": 15510 + }, + { + "epoch": 0.4, + "learning_rate": 1.945386571760194e-06, + "loss": 0.9551, + "step": 15511 + }, + { + "epoch": 0.4, + "learning_rate": 1.945377552178707e-06, + "loss": 1.0439, + "step": 15512 + }, + { + "epoch": 0.4, + "learning_rate": 1.945368531873388e-06, + "loss": 0.9092, + "step": 15513 + }, + { + "epoch": 0.4, + "learning_rate": 1.945359510844243e-06, + "loss": 0.8667, + "step": 15514 + }, + { + "epoch": 0.4, + "learning_rate": 1.945350489091281e-06, + "loss": 0.7786, + "step": 15515 + }, + { + "epoch": 0.4, + "learning_rate": 1.9453414666145064e-06, + "loss": 0.9893, + "step": 15516 + }, + { + "epoch": 0.4, + "learning_rate": 1.945332443413928e-06, + "loss": 0.9473, + "step": 15517 + }, + { + "epoch": 0.4, + "learning_rate": 1.9453234194895518e-06, + "loss": 0.8164, + "step": 15518 + }, + { + "epoch": 0.4, + "learning_rate": 1.9453143948413847e-06, + "loss": 0.7979, + "step": 15519 + }, + { + "epoch": 0.4, + "learning_rate": 1.9453053694694343e-06, + "loss": 1.1133, + "step": 15520 + }, + { + "epoch": 0.4, + "learning_rate": 1.9452963433737065e-06, + "loss": 0.7046, + "step": 15521 + }, + { + "epoch": 0.4, + "learning_rate": 1.9452873165542094e-06, + "loss": 0.7944, + "step": 15522 + }, + { + "epoch": 0.4, + "learning_rate": 1.945278289010949e-06, + "loss": 1.1455, + "step": 15523 + }, + { + "epoch": 0.4, + "learning_rate": 1.9452692607439322e-06, + "loss": 0.7554, + "step": 15524 + }, + { + "epoch": 0.4, + "learning_rate": 1.9452602317531665e-06, + "loss": 0.7207, + "step": 15525 + }, + { + "epoch": 0.4, + "learning_rate": 1.9452512020386586e-06, + "loss": 0.9912, + "step": 15526 + }, + { + "epoch": 0.4, + "learning_rate": 1.945242171600415e-06, + "loss": 0.635, + "step": 15527 + }, + { + "epoch": 0.4, + "learning_rate": 1.945233140438443e-06, + "loss": 0.8477, + "step": 15528 + }, + { + "epoch": 0.4, + "learning_rate": 1.9452241085527494e-06, + "loss": 0.7271, + "step": 15529 + }, + { + "epoch": 0.4, + "learning_rate": 1.9452150759433416e-06, + "loss": 0.835, + "step": 15530 + }, + { + "epoch": 0.4, + "learning_rate": 1.9452060426102255e-06, + "loss": 0.9453, + "step": 15531 + }, + { + "epoch": 0.4, + "learning_rate": 1.9451970085534087e-06, + "loss": 1.0703, + "step": 15532 + }, + { + "epoch": 0.4, + "learning_rate": 1.9451879737728984e-06, + "loss": 0.7192, + "step": 15533 + }, + { + "epoch": 0.4, + "learning_rate": 1.945178938268701e-06, + "loss": 0.7305, + "step": 15534 + }, + { + "epoch": 0.4, + "learning_rate": 1.945169902040823e-06, + "loss": 0.8867, + "step": 15535 + }, + { + "epoch": 0.4, + "learning_rate": 1.9451608650892725e-06, + "loss": 0.7563, + "step": 15536 + }, + { + "epoch": 0.4, + "learning_rate": 1.945151827414056e-06, + "loss": 0.8984, + "step": 15537 + }, + { + "epoch": 0.4, + "learning_rate": 1.9451427890151796e-06, + "loss": 0.8267, + "step": 15538 + }, + { + "epoch": 0.4, + "learning_rate": 1.945133749892651e-06, + "loss": 1.0854, + "step": 15539 + }, + { + "epoch": 0.4, + "learning_rate": 1.945124710046477e-06, + "loss": 0.8887, + "step": 15540 + }, + { + "epoch": 0.4, + "learning_rate": 1.945115669476664e-06, + "loss": 0.9277, + "step": 15541 + }, + { + "epoch": 0.4, + "learning_rate": 1.94510662818322e-06, + "loss": 0.9473, + "step": 15542 + }, + { + "epoch": 0.4, + "learning_rate": 1.945097586166151e-06, + "loss": 0.9121, + "step": 15543 + }, + { + "epoch": 0.4, + "learning_rate": 1.9450885434254645e-06, + "loss": 0.9443, + "step": 15544 + }, + { + "epoch": 0.4, + "learning_rate": 1.9450794999611673e-06, + "loss": 0.6836, + "step": 15545 + }, + { + "epoch": 0.4, + "learning_rate": 1.945070455773266e-06, + "loss": 0.8203, + "step": 15546 + }, + { + "epoch": 0.4, + "learning_rate": 1.9450614108617677e-06, + "loss": 0.7598, + "step": 15547 + }, + { + "epoch": 0.4, + "learning_rate": 1.945052365226679e-06, + "loss": 1.0254, + "step": 15548 + }, + { + "epoch": 0.4, + "learning_rate": 1.9450433188680074e-06, + "loss": 0.7637, + "step": 15549 + }, + { + "epoch": 0.4, + "learning_rate": 1.9450342717857598e-06, + "loss": 1.2168, + "step": 15550 + }, + { + "epoch": 0.4, + "learning_rate": 1.9450252239799427e-06, + "loss": 0.75, + "step": 15551 + }, + { + "epoch": 0.4, + "learning_rate": 1.945016175450563e-06, + "loss": 0.9336, + "step": 15552 + }, + { + "epoch": 0.4, + "learning_rate": 1.9450071261976283e-06, + "loss": 0.9414, + "step": 15553 + }, + { + "epoch": 0.4, + "learning_rate": 1.944998076221145e-06, + "loss": 0.9736, + "step": 15554 + }, + { + "epoch": 0.4, + "learning_rate": 1.94498902552112e-06, + "loss": 0.9414, + "step": 15555 + }, + { + "epoch": 0.4, + "learning_rate": 1.9449799740975604e-06, + "loss": 0.917, + "step": 15556 + }, + { + "epoch": 0.4, + "learning_rate": 1.944970921950473e-06, + "loss": 1.0303, + "step": 15557 + }, + { + "epoch": 0.4, + "learning_rate": 1.9449618690798647e-06, + "loss": 0.9302, + "step": 15558 + }, + { + "epoch": 0.4, + "learning_rate": 1.944952815485743e-06, + "loss": 0.8438, + "step": 15559 + }, + { + "epoch": 0.4, + "learning_rate": 1.944943761168114e-06, + "loss": 0.8975, + "step": 15560 + }, + { + "epoch": 0.4, + "learning_rate": 1.944934706126985e-06, + "loss": 0.9727, + "step": 15561 + }, + { + "epoch": 0.4, + "learning_rate": 1.944925650362363e-06, + "loss": 0.7446, + "step": 15562 + }, + { + "epoch": 0.4, + "learning_rate": 1.944916593874255e-06, + "loss": 0.9375, + "step": 15563 + }, + { + "epoch": 0.4, + "learning_rate": 1.9449075366626678e-06, + "loss": 1.1777, + "step": 15564 + }, + { + "epoch": 0.4, + "learning_rate": 1.9448984787276085e-06, + "loss": 0.7188, + "step": 15565 + }, + { + "epoch": 0.4, + "learning_rate": 1.9448894200690835e-06, + "loss": 0.9365, + "step": 15566 + }, + { + "epoch": 0.4, + "learning_rate": 1.9448803606871005e-06, + "loss": 0.6409, + "step": 15567 + }, + { + "epoch": 0.4, + "learning_rate": 1.944871300581666e-06, + "loss": 1.0112, + "step": 15568 + }, + { + "epoch": 0.4, + "learning_rate": 1.9448622397527867e-06, + "loss": 0.813, + "step": 15569 + }, + { + "epoch": 0.4, + "learning_rate": 1.94485317820047e-06, + "loss": 1.0107, + "step": 15570 + }, + { + "epoch": 0.4, + "learning_rate": 1.944844115924723e-06, + "loss": 0.8716, + "step": 15571 + }, + { + "epoch": 0.4, + "learning_rate": 1.9448350529255517e-06, + "loss": 0.7354, + "step": 15572 + }, + { + "epoch": 0.4, + "learning_rate": 1.9448259892029636e-06, + "loss": 1.0762, + "step": 15573 + }, + { + "epoch": 0.4, + "learning_rate": 1.9448169247569662e-06, + "loss": 0.7896, + "step": 15574 + }, + { + "epoch": 0.4, + "learning_rate": 1.944807859587566e-06, + "loss": 0.9863, + "step": 15575 + }, + { + "epoch": 0.4, + "learning_rate": 1.944798793694769e-06, + "loss": 1.1055, + "step": 15576 + }, + { + "epoch": 0.4, + "learning_rate": 1.944789727078584e-06, + "loss": 0.9141, + "step": 15577 + }, + { + "epoch": 0.4, + "learning_rate": 1.9447806597390166e-06, + "loss": 0.874, + "step": 15578 + }, + { + "epoch": 0.4, + "learning_rate": 1.944771591676074e-06, + "loss": 0.6313, + "step": 15579 + }, + { + "epoch": 0.4, + "learning_rate": 1.9447625228897634e-06, + "loss": 0.9316, + "step": 15580 + }, + { + "epoch": 0.4, + "learning_rate": 1.9447534533800912e-06, + "loss": 0.8691, + "step": 15581 + }, + { + "epoch": 0.4, + "learning_rate": 1.944744383147065e-06, + "loss": 1.082, + "step": 15582 + }, + { + "epoch": 0.4, + "learning_rate": 1.9447353121906917e-06, + "loss": 0.9199, + "step": 15583 + }, + { + "epoch": 0.4, + "learning_rate": 1.9447262405109774e-06, + "loss": 0.8037, + "step": 15584 + }, + { + "epoch": 0.4, + "learning_rate": 1.94471716810793e-06, + "loss": 0.8564, + "step": 15585 + }, + { + "epoch": 0.4, + "learning_rate": 1.9447080949815563e-06, + "loss": 0.8042, + "step": 15586 + }, + { + "epoch": 0.4, + "learning_rate": 1.9446990211318626e-06, + "loss": 0.6787, + "step": 15587 + }, + { + "epoch": 0.4, + "learning_rate": 1.9446899465588566e-06, + "loss": 0.7529, + "step": 15588 + }, + { + "epoch": 0.4, + "learning_rate": 1.944680871262545e-06, + "loss": 0.9746, + "step": 15589 + }, + { + "epoch": 0.4, + "learning_rate": 1.9446717952429346e-06, + "loss": 1.0723, + "step": 15590 + }, + { + "epoch": 0.4, + "learning_rate": 1.944662718500032e-06, + "loss": 0.8223, + "step": 15591 + }, + { + "epoch": 0.4, + "learning_rate": 1.9446536410338454e-06, + "loss": 0.9824, + "step": 15592 + }, + { + "epoch": 0.4, + "learning_rate": 1.9446445628443805e-06, + "loss": 0.8066, + "step": 15593 + }, + { + "epoch": 0.4, + "learning_rate": 1.944635483931645e-06, + "loss": 0.9619, + "step": 15594 + }, + { + "epoch": 0.4, + "learning_rate": 1.9446264042956455e-06, + "loss": 1.0195, + "step": 15595 + }, + { + "epoch": 0.4, + "learning_rate": 1.9446173239363884e-06, + "loss": 0.9248, + "step": 15596 + }, + { + "epoch": 0.4, + "learning_rate": 1.9446082428538817e-06, + "loss": 0.7744, + "step": 15597 + }, + { + "epoch": 0.4, + "learning_rate": 1.944599161048132e-06, + "loss": 1.0742, + "step": 15598 + }, + { + "epoch": 0.4, + "learning_rate": 1.944590078519146e-06, + "loss": 1.0654, + "step": 15599 + }, + { + "epoch": 0.4, + "learning_rate": 1.9445809952669308e-06, + "loss": 0.7529, + "step": 15600 + }, + { + "epoch": 0.4, + "learning_rate": 1.944571911291493e-06, + "loss": 0.8198, + "step": 15601 + }, + { + "epoch": 0.4, + "learning_rate": 1.9445628265928405e-06, + "loss": 1.1104, + "step": 15602 + }, + { + "epoch": 0.4, + "learning_rate": 1.9445537411709797e-06, + "loss": 0.8984, + "step": 15603 + }, + { + "epoch": 0.4, + "learning_rate": 1.944544655025917e-06, + "loss": 0.8389, + "step": 15604 + }, + { + "epoch": 0.4, + "learning_rate": 1.9445355681576604e-06, + "loss": 0.9893, + "step": 15605 + }, + { + "epoch": 0.4, + "learning_rate": 1.9445264805662162e-06, + "loss": 0.728, + "step": 15606 + }, + { + "epoch": 0.4, + "learning_rate": 1.9445173922515914e-06, + "loss": 0.9482, + "step": 15607 + }, + { + "epoch": 0.4, + "learning_rate": 1.944508303213793e-06, + "loss": 1.1494, + "step": 15608 + }, + { + "epoch": 0.4, + "learning_rate": 1.9444992134528282e-06, + "loss": 0.6475, + "step": 15609 + }, + { + "epoch": 0.4, + "learning_rate": 1.944490122968704e-06, + "loss": 0.6953, + "step": 15610 + }, + { + "epoch": 0.4, + "learning_rate": 1.944481031761427e-06, + "loss": 0.8213, + "step": 15611 + }, + { + "epoch": 0.4, + "learning_rate": 1.944471939831004e-06, + "loss": 1.085, + "step": 15612 + }, + { + "epoch": 0.4, + "learning_rate": 1.944462847177442e-06, + "loss": 0.9062, + "step": 15613 + }, + { + "epoch": 0.4, + "learning_rate": 1.944453753800749e-06, + "loss": 0.8252, + "step": 15614 + }, + { + "epoch": 0.4, + "learning_rate": 1.9444446597009306e-06, + "loss": 0.7773, + "step": 15615 + }, + { + "epoch": 0.4, + "learning_rate": 1.9444355648779948e-06, + "loss": 0.7178, + "step": 15616 + }, + { + "epoch": 0.4, + "learning_rate": 1.9444264693319477e-06, + "loss": 0.7988, + "step": 15617 + }, + { + "epoch": 0.4, + "learning_rate": 1.944417373062797e-06, + "loss": 0.6338, + "step": 15618 + }, + { + "epoch": 0.4, + "learning_rate": 1.9444082760705493e-06, + "loss": 0.9922, + "step": 15619 + }, + { + "epoch": 0.4, + "learning_rate": 1.9443991783552115e-06, + "loss": 0.9434, + "step": 15620 + }, + { + "epoch": 0.4, + "learning_rate": 1.944390079916791e-06, + "loss": 0.9395, + "step": 15621 + }, + { + "epoch": 0.4, + "learning_rate": 1.944380980755294e-06, + "loss": 1.0, + "step": 15622 + }, + { + "epoch": 0.4, + "learning_rate": 1.9443718808707283e-06, + "loss": 1.0352, + "step": 15623 + }, + { + "epoch": 0.4, + "learning_rate": 1.9443627802631e-06, + "loss": 0.9971, + "step": 15624 + }, + { + "epoch": 0.4, + "learning_rate": 1.9443536789324167e-06, + "loss": 1.1025, + "step": 15625 + }, + { + "epoch": 0.4, + "learning_rate": 1.9443445768786854e-06, + "loss": 0.832, + "step": 15626 + }, + { + "epoch": 0.4, + "learning_rate": 1.9443354741019128e-06, + "loss": 0.627, + "step": 15627 + }, + { + "epoch": 0.4, + "learning_rate": 1.9443263706021056e-06, + "loss": 0.6809, + "step": 15628 + }, + { + "epoch": 0.4, + "learning_rate": 1.9443172663792716e-06, + "loss": 0.8237, + "step": 15629 + }, + { + "epoch": 0.4, + "learning_rate": 1.944308161433417e-06, + "loss": 0.8828, + "step": 15630 + }, + { + "epoch": 0.4, + "learning_rate": 1.9442990557645495e-06, + "loss": 0.918, + "step": 15631 + }, + { + "epoch": 0.4, + "learning_rate": 1.944289949372675e-06, + "loss": 0.7671, + "step": 15632 + }, + { + "epoch": 0.4, + "learning_rate": 1.9442808422578016e-06, + "loss": 0.9424, + "step": 15633 + }, + { + "epoch": 0.4, + "learning_rate": 1.9442717344199356e-06, + "loss": 0.8066, + "step": 15634 + }, + { + "epoch": 0.4, + "learning_rate": 1.944262625859084e-06, + "loss": 1.0293, + "step": 15635 + }, + { + "epoch": 0.4, + "learning_rate": 1.944253516575254e-06, + "loss": 1.0293, + "step": 15636 + }, + { + "epoch": 0.4, + "learning_rate": 1.944244406568453e-06, + "loss": 0.8193, + "step": 15637 + }, + { + "epoch": 0.4, + "learning_rate": 1.944235295838687e-06, + "loss": 1.2891, + "step": 15638 + }, + { + "epoch": 0.4, + "learning_rate": 1.9442261843859633e-06, + "loss": 1.0586, + "step": 15639 + }, + { + "epoch": 0.4, + "learning_rate": 1.944217072210289e-06, + "loss": 0.8789, + "step": 15640 + }, + { + "epoch": 0.4, + "learning_rate": 1.9442079593116714e-06, + "loss": 0.8657, + "step": 15641 + }, + { + "epoch": 0.4, + "learning_rate": 1.9441988456901174e-06, + "loss": 1.0181, + "step": 15642 + }, + { + "epoch": 0.4, + "learning_rate": 1.9441897313456336e-06, + "loss": 0.8135, + "step": 15643 + }, + { + "epoch": 0.4, + "learning_rate": 1.944180616278227e-06, + "loss": 0.6782, + "step": 15644 + }, + { + "epoch": 0.4, + "learning_rate": 1.944171500487905e-06, + "loss": 0.5464, + "step": 15645 + }, + { + "epoch": 0.4, + "learning_rate": 1.9441623839746736e-06, + "loss": 0.8232, + "step": 15646 + }, + { + "epoch": 0.4, + "learning_rate": 1.9441532667385408e-06, + "loss": 0.8594, + "step": 15647 + }, + { + "epoch": 0.4, + "learning_rate": 1.9441441487795136e-06, + "loss": 1.0186, + "step": 15648 + }, + { + "epoch": 0.4, + "learning_rate": 1.944135030097598e-06, + "loss": 0.6798, + "step": 15649 + }, + { + "epoch": 0.4, + "learning_rate": 1.944125910692802e-06, + "loss": 0.9375, + "step": 15650 + }, + { + "epoch": 0.4, + "learning_rate": 1.9441167905651326e-06, + "loss": 0.8926, + "step": 15651 + }, + { + "epoch": 0.4, + "learning_rate": 1.944107669714596e-06, + "loss": 1.0273, + "step": 15652 + }, + { + "epoch": 0.4, + "learning_rate": 1.9440985481411995e-06, + "loss": 1.0762, + "step": 15653 + }, + { + "epoch": 0.4, + "learning_rate": 1.9440894258449503e-06, + "loss": 1.0537, + "step": 15654 + }, + { + "epoch": 0.4, + "learning_rate": 1.944080302825855e-06, + "loss": 0.9648, + "step": 15655 + }, + { + "epoch": 0.4, + "learning_rate": 1.944071179083921e-06, + "loss": 0.9766, + "step": 15656 + }, + { + "epoch": 0.4, + "learning_rate": 1.944062054619155e-06, + "loss": 0.7568, + "step": 15657 + }, + { + "epoch": 0.4, + "learning_rate": 1.9440529294315645e-06, + "loss": 0.7715, + "step": 15658 + }, + { + "epoch": 0.4, + "learning_rate": 1.9440438035211554e-06, + "loss": 0.9131, + "step": 15659 + }, + { + "epoch": 0.4, + "learning_rate": 1.944034676887936e-06, + "loss": 0.873, + "step": 15660 + }, + { + "epoch": 0.4, + "learning_rate": 1.9440255495319123e-06, + "loss": 0.7188, + "step": 15661 + }, + { + "epoch": 0.4, + "learning_rate": 1.944016421453092e-06, + "loss": 0.8792, + "step": 15662 + }, + { + "epoch": 0.4, + "learning_rate": 1.944007292651481e-06, + "loss": 1.0039, + "step": 15663 + }, + { + "epoch": 0.4, + "learning_rate": 1.9439981631270877e-06, + "loss": 0.8359, + "step": 15664 + }, + { + "epoch": 0.4, + "learning_rate": 1.943989032879918e-06, + "loss": 0.8662, + "step": 15665 + }, + { + "epoch": 0.4, + "learning_rate": 1.9439799019099795e-06, + "loss": 0.7275, + "step": 15666 + }, + { + "epoch": 0.4, + "learning_rate": 1.943970770217279e-06, + "loss": 0.9971, + "step": 15667 + }, + { + "epoch": 0.4, + "learning_rate": 1.943961637801824e-06, + "loss": 0.8916, + "step": 15668 + }, + { + "epoch": 0.4, + "learning_rate": 1.9439525046636203e-06, + "loss": 1.0527, + "step": 15669 + }, + { + "epoch": 0.4, + "learning_rate": 1.9439433708026757e-06, + "loss": 0.7026, + "step": 15670 + }, + { + "epoch": 0.4, + "learning_rate": 1.9439342362189972e-06, + "loss": 0.7725, + "step": 15671 + }, + { + "epoch": 0.4, + "learning_rate": 1.9439251009125913e-06, + "loss": 0.918, + "step": 15672 + }, + { + "epoch": 0.4, + "learning_rate": 1.9439159648834656e-06, + "loss": 0.9272, + "step": 15673 + }, + { + "epoch": 0.4, + "learning_rate": 1.943906828131627e-06, + "loss": 1.0605, + "step": 15674 + }, + { + "epoch": 0.4, + "learning_rate": 1.9438976906570824e-06, + "loss": 0.9004, + "step": 15675 + }, + { + "epoch": 0.4, + "learning_rate": 1.9438885524598386e-06, + "loss": 0.7461, + "step": 15676 + }, + { + "epoch": 0.4, + "learning_rate": 1.9438794135399025e-06, + "loss": 1.0127, + "step": 15677 + }, + { + "epoch": 0.4, + "learning_rate": 1.9438702738972817e-06, + "loss": 1.0586, + "step": 15678 + }, + { + "epoch": 0.4, + "learning_rate": 1.9438611335319825e-06, + "loss": 0.7065, + "step": 15679 + }, + { + "epoch": 0.4, + "learning_rate": 1.943851992444012e-06, + "loss": 1.1084, + "step": 15680 + }, + { + "epoch": 0.4, + "learning_rate": 1.9438428506333783e-06, + "loss": 0.8193, + "step": 15681 + }, + { + "epoch": 0.4, + "learning_rate": 1.943833708100087e-06, + "loss": 1.1104, + "step": 15682 + }, + { + "epoch": 0.4, + "learning_rate": 1.9438245648441455e-06, + "loss": 0.8789, + "step": 15683 + }, + { + "epoch": 0.4, + "learning_rate": 1.9438154208655613e-06, + "loss": 0.9619, + "step": 15684 + }, + { + "epoch": 0.4, + "learning_rate": 1.9438062761643407e-06, + "loss": 1.0459, + "step": 15685 + }, + { + "epoch": 0.4, + "learning_rate": 1.9437971307404913e-06, + "loss": 0.77, + "step": 15686 + }, + { + "epoch": 0.4, + "learning_rate": 1.9437879845940195e-06, + "loss": 0.9346, + "step": 15687 + }, + { + "epoch": 0.4, + "learning_rate": 1.943778837724933e-06, + "loss": 0.8457, + "step": 15688 + }, + { + "epoch": 0.4, + "learning_rate": 1.943769690133238e-06, + "loss": 0.8828, + "step": 15689 + }, + { + "epoch": 0.4, + "learning_rate": 1.943760541818942e-06, + "loss": 0.8467, + "step": 15690 + }, + { + "epoch": 0.4, + "learning_rate": 1.943751392782052e-06, + "loss": 0.7925, + "step": 15691 + }, + { + "epoch": 0.4, + "learning_rate": 1.9437422430225757e-06, + "loss": 0.9639, + "step": 15692 + }, + { + "epoch": 0.4, + "learning_rate": 1.9437330925405187e-06, + "loss": 0.9131, + "step": 15693 + }, + { + "epoch": 0.4, + "learning_rate": 1.9437239413358884e-06, + "loss": 0.7598, + "step": 15694 + }, + { + "epoch": 0.4, + "learning_rate": 1.943714789408693e-06, + "loss": 1.2236, + "step": 15695 + }, + { + "epoch": 0.4, + "learning_rate": 1.9437056367589375e-06, + "loss": 1.0303, + "step": 15696 + }, + { + "epoch": 0.4, + "learning_rate": 1.943696483386631e-06, + "loss": 0.8867, + "step": 15697 + }, + { + "epoch": 0.4, + "learning_rate": 1.943687329291779e-06, + "loss": 0.8223, + "step": 15698 + }, + { + "epoch": 0.4, + "learning_rate": 1.9436781744743888e-06, + "loss": 0.9922, + "step": 15699 + }, + { + "epoch": 0.4, + "learning_rate": 1.9436690189344677e-06, + "loss": 1.0244, + "step": 15700 + }, + { + "epoch": 0.4, + "learning_rate": 1.943659862672023e-06, + "loss": 1.0137, + "step": 15701 + }, + { + "epoch": 0.4, + "learning_rate": 1.9436507056870605e-06, + "loss": 0.9912, + "step": 15702 + }, + { + "epoch": 0.4, + "learning_rate": 1.9436415479795885e-06, + "loss": 1.0, + "step": 15703 + }, + { + "epoch": 0.4, + "learning_rate": 1.943632389549614e-06, + "loss": 0.8711, + "step": 15704 + }, + { + "epoch": 0.4, + "learning_rate": 1.9436232303971434e-06, + "loss": 0.6914, + "step": 15705 + }, + { + "epoch": 0.4, + "learning_rate": 1.9436140705221834e-06, + "loss": 1.0127, + "step": 15706 + }, + { + "epoch": 0.4, + "learning_rate": 1.9436049099247417e-06, + "loss": 0.9678, + "step": 15707 + }, + { + "epoch": 0.4, + "learning_rate": 1.9435957486048253e-06, + "loss": 0.9106, + "step": 15708 + }, + { + "epoch": 0.4, + "learning_rate": 1.943586586562441e-06, + "loss": 0.9131, + "step": 15709 + }, + { + "epoch": 0.4, + "learning_rate": 1.9435774237975957e-06, + "loss": 0.6873, + "step": 15710 + }, + { + "epoch": 0.4, + "learning_rate": 1.9435682603102965e-06, + "loss": 0.6729, + "step": 15711 + }, + { + "epoch": 0.4, + "learning_rate": 1.9435590961005506e-06, + "loss": 0.8574, + "step": 15712 + }, + { + "epoch": 0.4, + "learning_rate": 1.943549931168365e-06, + "loss": 0.8672, + "step": 15713 + }, + { + "epoch": 0.4, + "learning_rate": 1.9435407655137463e-06, + "loss": 0.8623, + "step": 15714 + }, + { + "epoch": 0.4, + "learning_rate": 1.943531599136702e-06, + "loss": 0.9434, + "step": 15715 + }, + { + "epoch": 0.4, + "learning_rate": 1.943522432037239e-06, + "loss": 0.8345, + "step": 15716 + }, + { + "epoch": 0.4, + "learning_rate": 1.943513264215364e-06, + "loss": 0.8223, + "step": 15717 + }, + { + "epoch": 0.4, + "learning_rate": 1.9435040956710845e-06, + "loss": 0.8447, + "step": 15718 + }, + { + "epoch": 0.4, + "learning_rate": 1.9434949264044075e-06, + "loss": 1.0137, + "step": 15719 + }, + { + "epoch": 0.4, + "learning_rate": 1.9434857564153393e-06, + "loss": 0.9131, + "step": 15720 + }, + { + "epoch": 0.4, + "learning_rate": 1.943476585703888e-06, + "loss": 0.8369, + "step": 15721 + }, + { + "epoch": 0.4, + "learning_rate": 1.94346741427006e-06, + "loss": 0.9258, + "step": 15722 + }, + { + "epoch": 0.4, + "learning_rate": 1.943458242113862e-06, + "loss": 0.9326, + "step": 15723 + }, + { + "epoch": 0.4, + "learning_rate": 1.9434490692353014e-06, + "loss": 0.8589, + "step": 15724 + }, + { + "epoch": 0.4, + "learning_rate": 1.943439895634385e-06, + "loss": 0.9102, + "step": 15725 + }, + { + "epoch": 0.4, + "learning_rate": 1.9434307213111205e-06, + "loss": 1.0879, + "step": 15726 + }, + { + "epoch": 0.4, + "learning_rate": 1.9434215462655147e-06, + "loss": 0.7686, + "step": 15727 + }, + { + "epoch": 0.4, + "learning_rate": 1.9434123704975743e-06, + "loss": 0.9678, + "step": 15728 + }, + { + "epoch": 0.4, + "learning_rate": 1.943403194007306e-06, + "loss": 0.9639, + "step": 15729 + }, + { + "epoch": 0.4, + "learning_rate": 1.9433940167947174e-06, + "loss": 0.8027, + "step": 15730 + }, + { + "epoch": 0.4, + "learning_rate": 1.9433848388598157e-06, + "loss": 0.7129, + "step": 15731 + }, + { + "epoch": 0.4, + "learning_rate": 1.943375660202608e-06, + "loss": 1.0898, + "step": 15732 + }, + { + "epoch": 0.4, + "learning_rate": 1.9433664808231e-06, + "loss": 0.8076, + "step": 15733 + }, + { + "epoch": 0.4, + "learning_rate": 1.9433573007213e-06, + "loss": 0.8828, + "step": 15734 + }, + { + "epoch": 0.4, + "learning_rate": 1.9433481198972144e-06, + "loss": 0.8203, + "step": 15735 + }, + { + "epoch": 0.4, + "learning_rate": 1.943338938350851e-06, + "loss": 1.001, + "step": 15736 + }, + { + "epoch": 0.4, + "learning_rate": 1.943329756082216e-06, + "loss": 1.0078, + "step": 15737 + }, + { + "epoch": 0.4, + "learning_rate": 1.943320573091317e-06, + "loss": 0.8301, + "step": 15738 + }, + { + "epoch": 0.4, + "learning_rate": 1.9433113893781606e-06, + "loss": 0.9854, + "step": 15739 + }, + { + "epoch": 0.4, + "learning_rate": 1.9433022049427545e-06, + "loss": 0.9014, + "step": 15740 + }, + { + "epoch": 0.4, + "learning_rate": 1.9432930197851045e-06, + "loss": 0.8516, + "step": 15741 + }, + { + "epoch": 0.4, + "learning_rate": 1.9432838339052192e-06, + "loss": 0.8315, + "step": 15742 + }, + { + "epoch": 0.4, + "learning_rate": 1.9432746473031045e-06, + "loss": 1.0273, + "step": 15743 + }, + { + "epoch": 0.4, + "learning_rate": 1.943265459978768e-06, + "loss": 0.9561, + "step": 15744 + }, + { + "epoch": 0.4, + "learning_rate": 1.943256271932216e-06, + "loss": 0.8179, + "step": 15745 + }, + { + "epoch": 0.4, + "learning_rate": 1.9432470831634563e-06, + "loss": 1.0996, + "step": 15746 + }, + { + "epoch": 0.4, + "learning_rate": 1.943237893672496e-06, + "loss": 0.8623, + "step": 15747 + }, + { + "epoch": 0.4, + "learning_rate": 1.9432287034593412e-06, + "loss": 1.0469, + "step": 15748 + }, + { + "epoch": 0.4, + "learning_rate": 1.943219512524e-06, + "loss": 1.041, + "step": 15749 + }, + { + "epoch": 0.4, + "learning_rate": 1.943210320866479e-06, + "loss": 0.8672, + "step": 15750 + }, + { + "epoch": 0.4, + "learning_rate": 1.9432011284867853e-06, + "loss": 0.8765, + "step": 15751 + }, + { + "epoch": 0.4, + "learning_rate": 1.9431919353849256e-06, + "loss": 0.7246, + "step": 15752 + }, + { + "epoch": 0.4, + "learning_rate": 1.943182741560907e-06, + "loss": 0.9375, + "step": 15753 + }, + { + "epoch": 0.4, + "learning_rate": 1.9431735470147373e-06, + "loss": 1.2764, + "step": 15754 + }, + { + "epoch": 0.4, + "learning_rate": 1.9431643517464226e-06, + "loss": 0.8994, + "step": 15755 + }, + { + "epoch": 0.4, + "learning_rate": 1.9431551557559705e-06, + "loss": 0.9863, + "step": 15756 + }, + { + "epoch": 0.4, + "learning_rate": 1.943145959043388e-06, + "loss": 0.9531, + "step": 15757 + }, + { + "epoch": 0.4, + "learning_rate": 1.9431367616086816e-06, + "loss": 1.0088, + "step": 15758 + }, + { + "epoch": 0.4, + "learning_rate": 1.943127563451859e-06, + "loss": 0.9092, + "step": 15759 + }, + { + "epoch": 0.4, + "learning_rate": 1.943118364572927e-06, + "loss": 0.7861, + "step": 15760 + }, + { + "epoch": 0.4, + "learning_rate": 1.9431091649718927e-06, + "loss": 1.0029, + "step": 15761 + }, + { + "epoch": 0.4, + "learning_rate": 1.943099964648763e-06, + "loss": 0.8008, + "step": 15762 + }, + { + "epoch": 0.4, + "learning_rate": 1.9430907636035446e-06, + "loss": 0.8579, + "step": 15763 + }, + { + "epoch": 0.4, + "learning_rate": 1.9430815618362456e-06, + "loss": 0.7593, + "step": 15764 + }, + { + "epoch": 0.4, + "learning_rate": 1.943072359346872e-06, + "loss": 0.959, + "step": 15765 + }, + { + "epoch": 0.4, + "learning_rate": 1.9430631561354315e-06, + "loss": 1.0254, + "step": 15766 + }, + { + "epoch": 0.4, + "learning_rate": 1.943053952201931e-06, + "loss": 0.9209, + "step": 15767 + }, + { + "epoch": 0.4, + "learning_rate": 1.943044747546377e-06, + "loss": 0.7715, + "step": 15768 + }, + { + "epoch": 0.4, + "learning_rate": 1.9430355421687775e-06, + "loss": 0.8262, + "step": 15769 + }, + { + "epoch": 0.4, + "learning_rate": 1.9430263360691387e-06, + "loss": 0.8887, + "step": 15770 + }, + { + "epoch": 0.4, + "learning_rate": 1.943017129247468e-06, + "loss": 0.8418, + "step": 15771 + }, + { + "epoch": 0.4, + "learning_rate": 1.9430079217037727e-06, + "loss": 0.9746, + "step": 15772 + }, + { + "epoch": 0.4, + "learning_rate": 1.9429987134380594e-06, + "loss": 0.6787, + "step": 15773 + }, + { + "epoch": 0.4, + "learning_rate": 1.9429895044503356e-06, + "loss": 0.915, + "step": 15774 + }, + { + "epoch": 0.4, + "learning_rate": 1.9429802947406077e-06, + "loss": 0.6875, + "step": 15775 + }, + { + "epoch": 0.4, + "learning_rate": 1.9429710843088833e-06, + "loss": 0.8372, + "step": 15776 + }, + { + "epoch": 0.4, + "learning_rate": 1.942961873155169e-06, + "loss": 0.79, + "step": 15777 + }, + { + "epoch": 0.4, + "learning_rate": 1.942952661279473e-06, + "loss": 0.9399, + "step": 15778 + }, + { + "epoch": 0.4, + "learning_rate": 1.9429434486818007e-06, + "loss": 1.1074, + "step": 15779 + }, + { + "epoch": 0.4, + "learning_rate": 1.9429342353621606e-06, + "loss": 1.0137, + "step": 15780 + }, + { + "epoch": 0.4, + "learning_rate": 1.9429250213205584e-06, + "loss": 0.7744, + "step": 15781 + }, + { + "epoch": 0.4, + "learning_rate": 1.9429158065570025e-06, + "loss": 0.7559, + "step": 15782 + }, + { + "epoch": 0.4, + "learning_rate": 1.942906591071499e-06, + "loss": 1.0449, + "step": 15783 + }, + { + "epoch": 0.4, + "learning_rate": 1.9428973748640554e-06, + "loss": 0.6694, + "step": 15784 + }, + { + "epoch": 0.4, + "learning_rate": 1.9428881579346786e-06, + "loss": 0.7764, + "step": 15785 + }, + { + "epoch": 0.4, + "learning_rate": 1.9428789402833756e-06, + "loss": 0.8311, + "step": 15786 + }, + { + "epoch": 0.4, + "learning_rate": 1.9428697219101537e-06, + "loss": 1.1172, + "step": 15787 + }, + { + "epoch": 0.4, + "learning_rate": 1.94286050281502e-06, + "loss": 1.0322, + "step": 15788 + }, + { + "epoch": 0.4, + "learning_rate": 1.9428512829979807e-06, + "loss": 1.0225, + "step": 15789 + }, + { + "epoch": 0.4, + "learning_rate": 1.9428420624590437e-06, + "loss": 1.0342, + "step": 15790 + }, + { + "epoch": 0.4, + "learning_rate": 1.9428328411982166e-06, + "loss": 1.0273, + "step": 15791 + }, + { + "epoch": 0.4, + "learning_rate": 1.942823619215505e-06, + "loss": 0.9434, + "step": 15792 + }, + { + "epoch": 0.4, + "learning_rate": 1.942814396510917e-06, + "loss": 0.96, + "step": 15793 + }, + { + "epoch": 0.4, + "learning_rate": 1.9428051730844596e-06, + "loss": 1.0254, + "step": 15794 + }, + { + "epoch": 0.4, + "learning_rate": 1.942795948936139e-06, + "loss": 0.7549, + "step": 15795 + }, + { + "epoch": 0.4, + "learning_rate": 1.9427867240659635e-06, + "loss": 0.5181, + "step": 15796 + }, + { + "epoch": 0.4, + "learning_rate": 1.9427774984739392e-06, + "loss": 1.0654, + "step": 15797 + }, + { + "epoch": 0.4, + "learning_rate": 1.9427682721600735e-06, + "loss": 0.9775, + "step": 15798 + }, + { + "epoch": 0.4, + "learning_rate": 1.9427590451243735e-06, + "loss": 0.9961, + "step": 15799 + }, + { + "epoch": 0.4, + "learning_rate": 1.942749817366847e-06, + "loss": 0.6433, + "step": 15800 + }, + { + "epoch": 0.4, + "learning_rate": 1.9427405888874994e-06, + "loss": 0.8296, + "step": 15801 + }, + { + "epoch": 0.41, + "learning_rate": 1.942731359686339e-06, + "loss": 0.8074, + "step": 15802 + }, + { + "epoch": 0.41, + "learning_rate": 1.942722129763372e-06, + "loss": 1.0371, + "step": 15803 + }, + { + "epoch": 0.41, + "learning_rate": 1.942712899118607e-06, + "loss": 0.7964, + "step": 15804 + }, + { + "epoch": 0.41, + "learning_rate": 1.9427036677520495e-06, + "loss": 0.9141, + "step": 15805 + }, + { + "epoch": 0.41, + "learning_rate": 1.9426944356637074e-06, + "loss": 1.1602, + "step": 15806 + }, + { + "epoch": 0.41, + "learning_rate": 1.9426852028535872e-06, + "loss": 0.479, + "step": 15807 + }, + { + "epoch": 0.41, + "learning_rate": 1.9426759693216964e-06, + "loss": 0.9961, + "step": 15808 + }, + { + "epoch": 0.41, + "learning_rate": 1.942666735068042e-06, + "loss": 0.8857, + "step": 15809 + }, + { + "epoch": 0.41, + "learning_rate": 1.9426575000926307e-06, + "loss": 1.2109, + "step": 15810 + }, + { + "epoch": 0.41, + "learning_rate": 1.9426482643954704e-06, + "loss": 0.9316, + "step": 15811 + }, + { + "epoch": 0.41, + "learning_rate": 1.9426390279765676e-06, + "loss": 0.835, + "step": 15812 + }, + { + "epoch": 0.41, + "learning_rate": 1.9426297908359293e-06, + "loss": 1.043, + "step": 15813 + }, + { + "epoch": 0.41, + "learning_rate": 1.9426205529735626e-06, + "loss": 0.9482, + "step": 15814 + }, + { + "epoch": 0.41, + "learning_rate": 1.942611314389475e-06, + "loss": 0.9131, + "step": 15815 + }, + { + "epoch": 0.41, + "learning_rate": 1.9426020750836727e-06, + "loss": 0.8711, + "step": 15816 + }, + { + "epoch": 0.41, + "learning_rate": 1.942592835056164e-06, + "loss": 0.6587, + "step": 15817 + }, + { + "epoch": 0.41, + "learning_rate": 1.9425835943069552e-06, + "loss": 0.9209, + "step": 15818 + }, + { + "epoch": 0.41, + "learning_rate": 1.9425743528360533e-06, + "loss": 0.7646, + "step": 15819 + }, + { + "epoch": 0.41, + "learning_rate": 1.9425651106434656e-06, + "loss": 1.0137, + "step": 15820 + }, + { + "epoch": 0.41, + "learning_rate": 1.942555867729199e-06, + "loss": 1.0566, + "step": 15821 + }, + { + "epoch": 0.41, + "learning_rate": 1.9425466240932606e-06, + "loss": 0.7783, + "step": 15822 + }, + { + "epoch": 0.41, + "learning_rate": 1.942537379735658e-06, + "loss": 0.8506, + "step": 15823 + }, + { + "epoch": 0.41, + "learning_rate": 1.942528134656398e-06, + "loss": 0.9824, + "step": 15824 + }, + { + "epoch": 0.41, + "learning_rate": 1.9425188888554867e-06, + "loss": 0.8408, + "step": 15825 + }, + { + "epoch": 0.41, + "learning_rate": 1.9425096423329327e-06, + "loss": 0.7744, + "step": 15826 + }, + { + "epoch": 0.41, + "learning_rate": 1.9425003950887423e-06, + "loss": 0.7642, + "step": 15827 + }, + { + "epoch": 0.41, + "learning_rate": 1.9424911471229225e-06, + "loss": 0.9038, + "step": 15828 + }, + { + "epoch": 0.41, + "learning_rate": 1.942481898435481e-06, + "loss": 1.0098, + "step": 15829 + }, + { + "epoch": 0.41, + "learning_rate": 1.942472649026424e-06, + "loss": 0.9805, + "step": 15830 + }, + { + "epoch": 0.41, + "learning_rate": 1.942463398895759e-06, + "loss": 1.0244, + "step": 15831 + }, + { + "epoch": 0.41, + "learning_rate": 1.9424541480434936e-06, + "loss": 0.8545, + "step": 15832 + }, + { + "epoch": 0.41, + "learning_rate": 1.942444896469634e-06, + "loss": 0.8164, + "step": 15833 + }, + { + "epoch": 0.41, + "learning_rate": 1.9424356441741876e-06, + "loss": 0.79, + "step": 15834 + }, + { + "epoch": 0.41, + "learning_rate": 1.942426391157162e-06, + "loss": 1.0205, + "step": 15835 + }, + { + "epoch": 0.41, + "learning_rate": 1.9424171374185635e-06, + "loss": 0.9072, + "step": 15836 + }, + { + "epoch": 0.41, + "learning_rate": 1.9424078829583994e-06, + "loss": 1.0029, + "step": 15837 + }, + { + "epoch": 0.41, + "learning_rate": 1.942398627776677e-06, + "loss": 0.8906, + "step": 15838 + }, + { + "epoch": 0.41, + "learning_rate": 1.9423893718734035e-06, + "loss": 1.0479, + "step": 15839 + }, + { + "epoch": 0.41, + "learning_rate": 1.9423801152485857e-06, + "loss": 0.9346, + "step": 15840 + }, + { + "epoch": 0.41, + "learning_rate": 1.942370857902231e-06, + "loss": 0.8062, + "step": 15841 + }, + { + "epoch": 0.41, + "learning_rate": 1.942361599834346e-06, + "loss": 0.9346, + "step": 15842 + }, + { + "epoch": 0.41, + "learning_rate": 1.942352341044938e-06, + "loss": 0.7378, + "step": 15843 + }, + { + "epoch": 0.41, + "learning_rate": 1.9423430815340144e-06, + "loss": 0.8633, + "step": 15844 + }, + { + "epoch": 0.41, + "learning_rate": 1.942333821301582e-06, + "loss": 0.8535, + "step": 15845 + }, + { + "epoch": 0.41, + "learning_rate": 1.9423245603476475e-06, + "loss": 0.9531, + "step": 15846 + }, + { + "epoch": 0.41, + "learning_rate": 1.9423152986722187e-06, + "loss": 0.9932, + "step": 15847 + }, + { + "epoch": 0.41, + "learning_rate": 1.9423060362753025e-06, + "loss": 0.9443, + "step": 15848 + }, + { + "epoch": 0.41, + "learning_rate": 1.9422967731569057e-06, + "loss": 0.9316, + "step": 15849 + }, + { + "epoch": 0.41, + "learning_rate": 1.942287509317036e-06, + "loss": 0.7705, + "step": 15850 + }, + { + "epoch": 0.41, + "learning_rate": 1.9422782447556994e-06, + "loss": 0.9185, + "step": 15851 + }, + { + "epoch": 0.41, + "learning_rate": 1.9422689794729043e-06, + "loss": 0.9395, + "step": 15852 + }, + { + "epoch": 0.41, + "learning_rate": 1.942259713468657e-06, + "loss": 0.874, + "step": 15853 + }, + { + "epoch": 0.41, + "learning_rate": 1.9422504467429644e-06, + "loss": 0.7092, + "step": 15854 + }, + { + "epoch": 0.41, + "learning_rate": 1.9422411792958345e-06, + "loss": 0.998, + "step": 15855 + }, + { + "epoch": 0.41, + "learning_rate": 1.9422319111272735e-06, + "loss": 0.957, + "step": 15856 + }, + { + "epoch": 0.41, + "learning_rate": 1.942222642237289e-06, + "loss": 0.7422, + "step": 15857 + }, + { + "epoch": 0.41, + "learning_rate": 1.942213372625888e-06, + "loss": 1.0225, + "step": 15858 + }, + { + "epoch": 0.41, + "learning_rate": 1.9422041022930773e-06, + "loss": 1.002, + "step": 15859 + }, + { + "epoch": 0.41, + "learning_rate": 1.9421948312388644e-06, + "loss": 1.1025, + "step": 15860 + }, + { + "epoch": 0.41, + "learning_rate": 1.9421855594632563e-06, + "loss": 0.8408, + "step": 15861 + }, + { + "epoch": 0.41, + "learning_rate": 1.94217628696626e-06, + "loss": 0.9355, + "step": 15862 + }, + { + "epoch": 0.41, + "learning_rate": 1.9421670137478825e-06, + "loss": 0.6538, + "step": 15863 + }, + { + "epoch": 0.41, + "learning_rate": 1.942157739808131e-06, + "loss": 1.0576, + "step": 15864 + }, + { + "epoch": 0.41, + "learning_rate": 1.942148465147013e-06, + "loss": 0.8398, + "step": 15865 + }, + { + "epoch": 0.41, + "learning_rate": 1.942139189764535e-06, + "loss": 0.8447, + "step": 15866 + }, + { + "epoch": 0.41, + "learning_rate": 1.9421299136607043e-06, + "loss": 0.8677, + "step": 15867 + }, + { + "epoch": 0.41, + "learning_rate": 1.9421206368355284e-06, + "loss": 0.6885, + "step": 15868 + }, + { + "epoch": 0.41, + "learning_rate": 1.942111359289014e-06, + "loss": 0.9844, + "step": 15869 + }, + { + "epoch": 0.41, + "learning_rate": 1.9421020810211676e-06, + "loss": 1.1738, + "step": 15870 + }, + { + "epoch": 0.41, + "learning_rate": 1.9420928020319975e-06, + "loss": 0.9268, + "step": 15871 + }, + { + "epoch": 0.41, + "learning_rate": 1.94208352232151e-06, + "loss": 0.8867, + "step": 15872 + }, + { + "epoch": 0.41, + "learning_rate": 1.942074241889713e-06, + "loss": 0.8999, + "step": 15873 + }, + { + "epoch": 0.41, + "learning_rate": 1.9420649607366124e-06, + "loss": 1.0186, + "step": 15874 + }, + { + "epoch": 0.41, + "learning_rate": 1.9420556788622164e-06, + "loss": 0.9688, + "step": 15875 + }, + { + "epoch": 0.41, + "learning_rate": 1.9420463962665316e-06, + "loss": 0.9893, + "step": 15876 + }, + { + "epoch": 0.41, + "learning_rate": 1.9420371129495647e-06, + "loss": 0.7832, + "step": 15877 + }, + { + "epoch": 0.41, + "learning_rate": 1.942027828911324e-06, + "loss": 1.0195, + "step": 15878 + }, + { + "epoch": 0.41, + "learning_rate": 1.9420185441518155e-06, + "loss": 0.8672, + "step": 15879 + }, + { + "epoch": 0.41, + "learning_rate": 1.9420092586710467e-06, + "loss": 0.9932, + "step": 15880 + }, + { + "epoch": 0.41, + "learning_rate": 1.941999972469025e-06, + "loss": 0.6602, + "step": 15881 + }, + { + "epoch": 0.41, + "learning_rate": 1.941990685545757e-06, + "loss": 0.7383, + "step": 15882 + }, + { + "epoch": 0.41, + "learning_rate": 1.9419813979012502e-06, + "loss": 0.6841, + "step": 15883 + }, + { + "epoch": 0.41, + "learning_rate": 1.9419721095355113e-06, + "loss": 0.8887, + "step": 15884 + }, + { + "epoch": 0.41, + "learning_rate": 1.9419628204485484e-06, + "loss": 1.0098, + "step": 15885 + }, + { + "epoch": 0.41, + "learning_rate": 1.941953530640367e-06, + "loss": 0.8418, + "step": 15886 + }, + { + "epoch": 0.41, + "learning_rate": 1.9419442401109757e-06, + "loss": 0.9365, + "step": 15887 + }, + { + "epoch": 0.41, + "learning_rate": 1.9419349488603806e-06, + "loss": 0.791, + "step": 15888 + }, + { + "epoch": 0.41, + "learning_rate": 1.9419256568885895e-06, + "loss": 0.6582, + "step": 15889 + }, + { + "epoch": 0.41, + "learning_rate": 1.941916364195609e-06, + "loss": 0.8691, + "step": 15890 + }, + { + "epoch": 0.41, + "learning_rate": 1.9419070707814468e-06, + "loss": 1.0146, + "step": 15891 + }, + { + "epoch": 0.41, + "learning_rate": 1.9418977766461095e-06, + "loss": 0.7944, + "step": 15892 + }, + { + "epoch": 0.41, + "learning_rate": 1.941888481789604e-06, + "loss": 1.0752, + "step": 15893 + }, + { + "epoch": 0.41, + "learning_rate": 1.9418791862119383e-06, + "loss": 0.7793, + "step": 15894 + }, + { + "epoch": 0.41, + "learning_rate": 1.941869889913119e-06, + "loss": 0.8574, + "step": 15895 + }, + { + "epoch": 0.41, + "learning_rate": 1.941860592893153e-06, + "loss": 1.0527, + "step": 15896 + }, + { + "epoch": 0.41, + "learning_rate": 1.9418512951520475e-06, + "loss": 0.5747, + "step": 15897 + }, + { + "epoch": 0.41, + "learning_rate": 1.9418419966898097e-06, + "loss": 0.8926, + "step": 15898 + }, + { + "epoch": 0.41, + "learning_rate": 1.9418326975064475e-06, + "loss": 0.9863, + "step": 15899 + }, + { + "epoch": 0.41, + "learning_rate": 1.9418233976019667e-06, + "loss": 0.8701, + "step": 15900 + }, + { + "epoch": 0.41, + "learning_rate": 1.9418140969763754e-06, + "loss": 0.9336, + "step": 15901 + }, + { + "epoch": 0.41, + "learning_rate": 1.94180479562968e-06, + "loss": 0.9365, + "step": 15902 + }, + { + "epoch": 0.41, + "learning_rate": 1.941795493561888e-06, + "loss": 0.9199, + "step": 15903 + }, + { + "epoch": 0.41, + "learning_rate": 1.941786190773007e-06, + "loss": 0.9619, + "step": 15904 + }, + { + "epoch": 0.41, + "learning_rate": 1.941776887263043e-06, + "loss": 0.8745, + "step": 15905 + }, + { + "epoch": 0.41, + "learning_rate": 1.941767583032004e-06, + "loss": 0.6875, + "step": 15906 + }, + { + "epoch": 0.41, + "learning_rate": 1.941758278079897e-06, + "loss": 0.8604, + "step": 15907 + }, + { + "epoch": 0.41, + "learning_rate": 1.941748972406729e-06, + "loss": 0.9141, + "step": 15908 + }, + { + "epoch": 0.41, + "learning_rate": 1.941739666012507e-06, + "loss": 0.8765, + "step": 15909 + }, + { + "epoch": 0.41, + "learning_rate": 1.941730358897238e-06, + "loss": 0.7559, + "step": 15910 + }, + { + "epoch": 0.41, + "learning_rate": 1.9417210510609294e-06, + "loss": 1.2432, + "step": 15911 + }, + { + "epoch": 0.41, + "learning_rate": 1.9417117425035886e-06, + "loss": 0.9268, + "step": 15912 + }, + { + "epoch": 0.41, + "learning_rate": 1.9417024332252225e-06, + "loss": 0.7402, + "step": 15913 + }, + { + "epoch": 0.41, + "learning_rate": 1.9416931232258377e-06, + "loss": 1.0859, + "step": 15914 + }, + { + "epoch": 0.41, + "learning_rate": 1.941683812505442e-06, + "loss": 0.8438, + "step": 15915 + }, + { + "epoch": 0.41, + "learning_rate": 1.9416745010640426e-06, + "loss": 0.9678, + "step": 15916 + }, + { + "epoch": 0.41, + "learning_rate": 1.9416651889016457e-06, + "loss": 0.8408, + "step": 15917 + }, + { + "epoch": 0.41, + "learning_rate": 1.9416558760182595e-06, + "loss": 1.0801, + "step": 15918 + }, + { + "epoch": 0.41, + "learning_rate": 1.9416465624138907e-06, + "loss": 0.9844, + "step": 15919 + }, + { + "epoch": 0.41, + "learning_rate": 1.941637248088546e-06, + "loss": 0.9072, + "step": 15920 + }, + { + "epoch": 0.41, + "learning_rate": 1.9416279330422337e-06, + "loss": 0.7446, + "step": 15921 + }, + { + "epoch": 0.41, + "learning_rate": 1.9416186172749594e-06, + "loss": 0.8447, + "step": 15922 + }, + { + "epoch": 0.41, + "learning_rate": 1.9416093007867314e-06, + "loss": 0.918, + "step": 15923 + }, + { + "epoch": 0.41, + "learning_rate": 1.941599983577557e-06, + "loss": 0.7695, + "step": 15924 + }, + { + "epoch": 0.41, + "learning_rate": 1.941590665647442e-06, + "loss": 0.8767, + "step": 15925 + }, + { + "epoch": 0.41, + "learning_rate": 1.9415813469963946e-06, + "loss": 0.9053, + "step": 15926 + }, + { + "epoch": 0.41, + "learning_rate": 1.9415720276244217e-06, + "loss": 0.9102, + "step": 15927 + }, + { + "epoch": 0.41, + "learning_rate": 1.9415627075315302e-06, + "loss": 0.8462, + "step": 15928 + }, + { + "epoch": 0.41, + "learning_rate": 1.9415533867177273e-06, + "loss": 0.8403, + "step": 15929 + }, + { + "epoch": 0.41, + "learning_rate": 1.9415440651830206e-06, + "loss": 0.7432, + "step": 15930 + }, + { + "epoch": 0.41, + "learning_rate": 1.941534742927417e-06, + "loss": 0.8311, + "step": 15931 + }, + { + "epoch": 0.41, + "learning_rate": 1.941525419950923e-06, + "loss": 0.7993, + "step": 15932 + }, + { + "epoch": 0.41, + "learning_rate": 1.941516096253547e-06, + "loss": 1.0088, + "step": 15933 + }, + { + "epoch": 0.41, + "learning_rate": 1.9415067718352953e-06, + "loss": 0.8364, + "step": 15934 + }, + { + "epoch": 0.41, + "learning_rate": 1.9414974466961745e-06, + "loss": 0.7275, + "step": 15935 + }, + { + "epoch": 0.41, + "learning_rate": 1.9414881208361927e-06, + "loss": 0.9268, + "step": 15936 + }, + { + "epoch": 0.41, + "learning_rate": 1.941478794255357e-06, + "loss": 0.9043, + "step": 15937 + }, + { + "epoch": 0.41, + "learning_rate": 1.941469466953674e-06, + "loss": 1.0176, + "step": 15938 + }, + { + "epoch": 0.41, + "learning_rate": 1.9414601389311514e-06, + "loss": 0.7666, + "step": 15939 + }, + { + "epoch": 0.41, + "learning_rate": 1.9414508101877957e-06, + "loss": 0.9326, + "step": 15940 + }, + { + "epoch": 0.41, + "learning_rate": 1.9414414807236146e-06, + "loss": 1.043, + "step": 15941 + }, + { + "epoch": 0.41, + "learning_rate": 1.9414321505386152e-06, + "loss": 0.7437, + "step": 15942 + }, + { + "epoch": 0.41, + "learning_rate": 1.9414228196328044e-06, + "loss": 0.8555, + "step": 15943 + }, + { + "epoch": 0.41, + "learning_rate": 1.9414134880061892e-06, + "loss": 0.7119, + "step": 15944 + }, + { + "epoch": 0.41, + "learning_rate": 1.9414041556587774e-06, + "loss": 0.8857, + "step": 15945 + }, + { + "epoch": 0.41, + "learning_rate": 1.9413948225905753e-06, + "loss": 0.7412, + "step": 15946 + }, + { + "epoch": 0.41, + "learning_rate": 1.9413854888015905e-06, + "loss": 0.814, + "step": 15947 + }, + { + "epoch": 0.41, + "learning_rate": 1.9413761542918302e-06, + "loss": 0.8691, + "step": 15948 + }, + { + "epoch": 0.41, + "learning_rate": 1.9413668190613017e-06, + "loss": 0.7754, + "step": 15949 + }, + { + "epoch": 0.41, + "learning_rate": 1.941357483110012e-06, + "loss": 0.7749, + "step": 15950 + }, + { + "epoch": 0.41, + "learning_rate": 1.9413481464379676e-06, + "loss": 0.8477, + "step": 15951 + }, + { + "epoch": 0.41, + "learning_rate": 1.9413388090451765e-06, + "loss": 0.8223, + "step": 15952 + }, + { + "epoch": 0.41, + "learning_rate": 1.9413294709316455e-06, + "loss": 0.8057, + "step": 15953 + }, + { + "epoch": 0.41, + "learning_rate": 1.941320132097382e-06, + "loss": 0.8477, + "step": 15954 + }, + { + "epoch": 0.41, + "learning_rate": 1.941310792542393e-06, + "loss": 0.8525, + "step": 15955 + }, + { + "epoch": 0.41, + "learning_rate": 1.9413014522666855e-06, + "loss": 0.6921, + "step": 15956 + }, + { + "epoch": 0.41, + "learning_rate": 1.9412921112702664e-06, + "loss": 0.6348, + "step": 15957 + }, + { + "epoch": 0.41, + "learning_rate": 1.9412827695531434e-06, + "loss": 1.1006, + "step": 15958 + }, + { + "epoch": 0.41, + "learning_rate": 1.9412734271153238e-06, + "loss": 1.0205, + "step": 15959 + }, + { + "epoch": 0.41, + "learning_rate": 1.941264083956814e-06, + "loss": 0.9092, + "step": 15960 + }, + { + "epoch": 0.41, + "learning_rate": 1.941254740077622e-06, + "loss": 0.7095, + "step": 15961 + }, + { + "epoch": 0.41, + "learning_rate": 1.9412453954777543e-06, + "loss": 0.8555, + "step": 15962 + }, + { + "epoch": 0.41, + "learning_rate": 1.941236050157218e-06, + "loss": 0.7358, + "step": 15963 + }, + { + "epoch": 0.41, + "learning_rate": 1.941226704116021e-06, + "loss": 1.082, + "step": 15964 + }, + { + "epoch": 0.41, + "learning_rate": 1.94121735735417e-06, + "loss": 0.6201, + "step": 15965 + }, + { + "epoch": 0.41, + "learning_rate": 1.9412080098716717e-06, + "loss": 0.873, + "step": 15966 + }, + { + "epoch": 0.41, + "learning_rate": 1.941198661668534e-06, + "loss": 0.9258, + "step": 15967 + }, + { + "epoch": 0.41, + "learning_rate": 1.941189312744764e-06, + "loss": 0.9834, + "step": 15968 + }, + { + "epoch": 0.41, + "learning_rate": 1.941179963100368e-06, + "loss": 0.8467, + "step": 15969 + }, + { + "epoch": 0.41, + "learning_rate": 1.941170612735354e-06, + "loss": 0.9736, + "step": 15970 + }, + { + "epoch": 0.41, + "learning_rate": 1.9411612616497295e-06, + "loss": 0.6465, + "step": 15971 + }, + { + "epoch": 0.41, + "learning_rate": 1.9411519098435005e-06, + "loss": 0.9385, + "step": 15972 + }, + { + "epoch": 0.41, + "learning_rate": 1.9411425573166747e-06, + "loss": 0.8203, + "step": 15973 + }, + { + "epoch": 0.41, + "learning_rate": 1.9411332040692594e-06, + "loss": 1.001, + "step": 15974 + }, + { + "epoch": 0.41, + "learning_rate": 1.9411238501012618e-06, + "loss": 0.6553, + "step": 15975 + }, + { + "epoch": 0.41, + "learning_rate": 1.9411144954126894e-06, + "loss": 0.8867, + "step": 15976 + }, + { + "epoch": 0.41, + "learning_rate": 1.941105140003548e-06, + "loss": 0.7239, + "step": 15977 + }, + { + "epoch": 0.41, + "learning_rate": 1.9410957838738466e-06, + "loss": 0.8101, + "step": 15978 + }, + { + "epoch": 0.41, + "learning_rate": 1.9410864270235906e-06, + "loss": 1.0049, + "step": 15979 + }, + { + "epoch": 0.41, + "learning_rate": 1.9410770694527883e-06, + "loss": 0.9004, + "step": 15980 + }, + { + "epoch": 0.41, + "learning_rate": 1.941067711161447e-06, + "loss": 0.7715, + "step": 15981 + }, + { + "epoch": 0.41, + "learning_rate": 1.941058352149573e-06, + "loss": 1.0332, + "step": 15982 + }, + { + "epoch": 0.41, + "learning_rate": 1.9410489924171734e-06, + "loss": 0.8516, + "step": 15983 + }, + { + "epoch": 0.41, + "learning_rate": 1.941039631964257e-06, + "loss": 0.9111, + "step": 15984 + }, + { + "epoch": 0.41, + "learning_rate": 1.941030270790829e-06, + "loss": 0.8394, + "step": 15985 + }, + { + "epoch": 0.41, + "learning_rate": 1.9410209088968975e-06, + "loss": 0.5701, + "step": 15986 + }, + { + "epoch": 0.41, + "learning_rate": 1.9410115462824697e-06, + "loss": 0.9204, + "step": 15987 + }, + { + "epoch": 0.41, + "learning_rate": 1.9410021829475527e-06, + "loss": 0.791, + "step": 15988 + }, + { + "epoch": 0.41, + "learning_rate": 1.9409928188921533e-06, + "loss": 1.0283, + "step": 15989 + }, + { + "epoch": 0.41, + "learning_rate": 1.9409834541162795e-06, + "loss": 0.8682, + "step": 15990 + }, + { + "epoch": 0.41, + "learning_rate": 1.9409740886199372e-06, + "loss": 0.7988, + "step": 15991 + }, + { + "epoch": 0.41, + "learning_rate": 1.9409647224031346e-06, + "loss": 0.8604, + "step": 15992 + }, + { + "epoch": 0.41, + "learning_rate": 1.9409553554658788e-06, + "loss": 0.7778, + "step": 15993 + }, + { + "epoch": 0.41, + "learning_rate": 1.9409459878081766e-06, + "loss": 0.8867, + "step": 15994 + }, + { + "epoch": 0.41, + "learning_rate": 1.9409366194300355e-06, + "loss": 0.8281, + "step": 15995 + }, + { + "epoch": 0.41, + "learning_rate": 1.940927250331462e-06, + "loss": 0.9492, + "step": 15996 + }, + { + "epoch": 0.41, + "learning_rate": 1.9409178805124642e-06, + "loss": 0.6938, + "step": 15997 + }, + { + "epoch": 0.41, + "learning_rate": 1.9409085099730488e-06, + "loss": 1.0127, + "step": 15998 + }, + { + "epoch": 0.41, + "learning_rate": 1.940899138713223e-06, + "loss": 0.667, + "step": 15999 + }, + { + "epoch": 0.41, + "learning_rate": 1.9408897667329938e-06, + "loss": 0.9248, + "step": 16000 + }, + { + "epoch": 0.41, + "learning_rate": 1.9408803940323687e-06, + "loss": 0.8945, + "step": 16001 + }, + { + "epoch": 0.41, + "learning_rate": 1.940871020611355e-06, + "loss": 0.7178, + "step": 16002 + }, + { + "epoch": 0.41, + "learning_rate": 1.940861646469959e-06, + "loss": 0.8789, + "step": 16003 + }, + { + "epoch": 0.41, + "learning_rate": 1.9408522716081892e-06, + "loss": 0.7471, + "step": 16004 + }, + { + "epoch": 0.41, + "learning_rate": 1.940842896026052e-06, + "loss": 0.8623, + "step": 16005 + }, + { + "epoch": 0.41, + "learning_rate": 1.9408335197235544e-06, + "loss": 0.9746, + "step": 16006 + }, + { + "epoch": 0.41, + "learning_rate": 1.9408241427007036e-06, + "loss": 0.7969, + "step": 16007 + }, + { + "epoch": 0.41, + "learning_rate": 1.9408147649575075e-06, + "loss": 0.9385, + "step": 16008 + }, + { + "epoch": 0.41, + "learning_rate": 1.9408053864939722e-06, + "loss": 1.1387, + "step": 16009 + }, + { + "epoch": 0.41, + "learning_rate": 1.940796007310106e-06, + "loss": 0.8618, + "step": 16010 + }, + { + "epoch": 0.41, + "learning_rate": 1.9407866274059155e-06, + "loss": 0.9961, + "step": 16011 + }, + { + "epoch": 0.41, + "learning_rate": 1.9407772467814078e-06, + "loss": 0.8838, + "step": 16012 + }, + { + "epoch": 0.41, + "learning_rate": 1.9407678654365903e-06, + "loss": 0.8896, + "step": 16013 + }, + { + "epoch": 0.41, + "learning_rate": 1.94075848337147e-06, + "loss": 0.7031, + "step": 16014 + }, + { + "epoch": 0.41, + "learning_rate": 1.940749100586054e-06, + "loss": 0.7949, + "step": 16015 + }, + { + "epoch": 0.41, + "learning_rate": 1.9407397170803503e-06, + "loss": 0.9316, + "step": 16016 + }, + { + "epoch": 0.41, + "learning_rate": 1.940730332854365e-06, + "loss": 0.8711, + "step": 16017 + }, + { + "epoch": 0.41, + "learning_rate": 1.940720947908106e-06, + "loss": 0.6396, + "step": 16018 + }, + { + "epoch": 0.41, + "learning_rate": 1.94071156224158e-06, + "loss": 0.9912, + "step": 16019 + }, + { + "epoch": 0.41, + "learning_rate": 1.940702175854794e-06, + "loss": 1.0635, + "step": 16020 + }, + { + "epoch": 0.41, + "learning_rate": 1.940692788747756e-06, + "loss": 0.8984, + "step": 16021 + }, + { + "epoch": 0.41, + "learning_rate": 1.940683400920473e-06, + "loss": 0.7559, + "step": 16022 + }, + { + "epoch": 0.41, + "learning_rate": 1.940674012372952e-06, + "loss": 0.9717, + "step": 16023 + }, + { + "epoch": 0.41, + "learning_rate": 1.9406646231052e-06, + "loss": 0.8066, + "step": 16024 + }, + { + "epoch": 0.41, + "learning_rate": 1.9406552331172243e-06, + "loss": 0.6724, + "step": 16025 + }, + { + "epoch": 0.41, + "learning_rate": 1.9406458424090324e-06, + "loss": 0.9727, + "step": 16026 + }, + { + "epoch": 0.41, + "learning_rate": 1.9406364509806308e-06, + "loss": 0.8408, + "step": 16027 + }, + { + "epoch": 0.41, + "learning_rate": 1.940627058832027e-06, + "loss": 0.8027, + "step": 16028 + }, + { + "epoch": 0.41, + "learning_rate": 1.940617665963229e-06, + "loss": 0.5767, + "step": 16029 + }, + { + "epoch": 0.41, + "learning_rate": 1.940608272374243e-06, + "loss": 0.959, + "step": 16030 + }, + { + "epoch": 0.41, + "learning_rate": 1.9405988780650763e-06, + "loss": 0.876, + "step": 16031 + }, + { + "epoch": 0.41, + "learning_rate": 1.9405894830357365e-06, + "loss": 0.7454, + "step": 16032 + }, + { + "epoch": 0.41, + "learning_rate": 1.94058008728623e-06, + "loss": 0.9565, + "step": 16033 + }, + { + "epoch": 0.41, + "learning_rate": 1.9405706908165655e-06, + "loss": 0.9141, + "step": 16034 + }, + { + "epoch": 0.41, + "learning_rate": 1.9405612936267487e-06, + "loss": 0.8418, + "step": 16035 + }, + { + "epoch": 0.41, + "learning_rate": 1.940551895716788e-06, + "loss": 0.9785, + "step": 16036 + }, + { + "epoch": 0.41, + "learning_rate": 1.9405424970866894e-06, + "loss": 0.6899, + "step": 16037 + }, + { + "epoch": 0.41, + "learning_rate": 1.9405330977364604e-06, + "loss": 0.7812, + "step": 16038 + }, + { + "epoch": 0.41, + "learning_rate": 1.9405236976661086e-06, + "loss": 0.6511, + "step": 16039 + }, + { + "epoch": 0.41, + "learning_rate": 1.9405142968756416e-06, + "loss": 0.8428, + "step": 16040 + }, + { + "epoch": 0.41, + "learning_rate": 1.9405048953650657e-06, + "loss": 0.959, + "step": 16041 + }, + { + "epoch": 0.41, + "learning_rate": 1.940495493134388e-06, + "loss": 0.8613, + "step": 16042 + }, + { + "epoch": 0.41, + "learning_rate": 1.940486090183617e-06, + "loss": 1.0166, + "step": 16043 + }, + { + "epoch": 0.41, + "learning_rate": 1.9404766865127584e-06, + "loss": 0.7598, + "step": 16044 + }, + { + "epoch": 0.41, + "learning_rate": 1.9404672821218203e-06, + "loss": 0.7666, + "step": 16045 + }, + { + "epoch": 0.41, + "learning_rate": 1.9404578770108097e-06, + "loss": 0.7749, + "step": 16046 + }, + { + "epoch": 0.41, + "learning_rate": 1.940448471179734e-06, + "loss": 0.8994, + "step": 16047 + }, + { + "epoch": 0.41, + "learning_rate": 1.940439064628599e-06, + "loss": 0.9346, + "step": 16048 + }, + { + "epoch": 0.41, + "learning_rate": 1.940429657357414e-06, + "loss": 0.7847, + "step": 16049 + }, + { + "epoch": 0.41, + "learning_rate": 1.9404202493661852e-06, + "loss": 0.7871, + "step": 16050 + }, + { + "epoch": 0.41, + "learning_rate": 1.94041084065492e-06, + "loss": 0.8281, + "step": 16051 + }, + { + "epoch": 0.41, + "learning_rate": 1.940401431223625e-06, + "loss": 1.1279, + "step": 16052 + }, + { + "epoch": 0.41, + "learning_rate": 1.9403920210723085e-06, + "loss": 0.9258, + "step": 16053 + }, + { + "epoch": 0.41, + "learning_rate": 1.9403826102009763e-06, + "loss": 1.0078, + "step": 16054 + }, + { + "epoch": 0.41, + "learning_rate": 1.9403731986096368e-06, + "loss": 0.8491, + "step": 16055 + }, + { + "epoch": 0.41, + "learning_rate": 1.940363786298297e-06, + "loss": 0.8867, + "step": 16056 + }, + { + "epoch": 0.41, + "learning_rate": 1.9403543732669637e-06, + "loss": 1.0566, + "step": 16057 + }, + { + "epoch": 0.41, + "learning_rate": 1.9403449595156436e-06, + "loss": 1.167, + "step": 16058 + }, + { + "epoch": 0.41, + "learning_rate": 1.9403355450443455e-06, + "loss": 0.7607, + "step": 16059 + }, + { + "epoch": 0.41, + "learning_rate": 1.9403261298530754e-06, + "loss": 0.6968, + "step": 16060 + }, + { + "epoch": 0.41, + "learning_rate": 1.9403167139418408e-06, + "loss": 0.8799, + "step": 16061 + }, + { + "epoch": 0.41, + "learning_rate": 1.9403072973106493e-06, + "loss": 0.939, + "step": 16062 + }, + { + "epoch": 0.41, + "learning_rate": 1.940297879959507e-06, + "loss": 0.8447, + "step": 16063 + }, + { + "epoch": 0.41, + "learning_rate": 1.940288461888422e-06, + "loss": 1.0381, + "step": 16064 + }, + { + "epoch": 0.41, + "learning_rate": 1.940279043097402e-06, + "loss": 0.7891, + "step": 16065 + }, + { + "epoch": 0.41, + "learning_rate": 1.9402696235864533e-06, + "loss": 0.8066, + "step": 16066 + }, + { + "epoch": 0.41, + "learning_rate": 1.940260203355583e-06, + "loss": 0.9258, + "step": 16067 + }, + { + "epoch": 0.41, + "learning_rate": 1.9402507824047994e-06, + "loss": 0.8301, + "step": 16068 + }, + { + "epoch": 0.41, + "learning_rate": 1.9402413607341084e-06, + "loss": 1.1016, + "step": 16069 + }, + { + "epoch": 0.41, + "learning_rate": 1.940231938343518e-06, + "loss": 0.8584, + "step": 16070 + }, + { + "epoch": 0.41, + "learning_rate": 1.940222515233035e-06, + "loss": 0.7275, + "step": 16071 + }, + { + "epoch": 0.41, + "learning_rate": 1.9402130914026674e-06, + "loss": 0.8516, + "step": 16072 + }, + { + "epoch": 0.41, + "learning_rate": 1.9402036668524214e-06, + "loss": 0.8096, + "step": 16073 + }, + { + "epoch": 0.41, + "learning_rate": 1.940194241582305e-06, + "loss": 0.9688, + "step": 16074 + }, + { + "epoch": 0.41, + "learning_rate": 1.9401848155923252e-06, + "loss": 0.9648, + "step": 16075 + }, + { + "epoch": 0.41, + "learning_rate": 1.9401753888824886e-06, + "loss": 1.0215, + "step": 16076 + }, + { + "epoch": 0.41, + "learning_rate": 1.9401659614528032e-06, + "loss": 0.6963, + "step": 16077 + }, + { + "epoch": 0.41, + "learning_rate": 1.9401565333032758e-06, + "loss": 0.7368, + "step": 16078 + }, + { + "epoch": 0.41, + "learning_rate": 1.940147104433914e-06, + "loss": 0.833, + "step": 16079 + }, + { + "epoch": 0.41, + "learning_rate": 1.9401376748447247e-06, + "loss": 0.9004, + "step": 16080 + }, + { + "epoch": 0.41, + "learning_rate": 1.940128244535715e-06, + "loss": 0.6582, + "step": 16081 + }, + { + "epoch": 0.41, + "learning_rate": 1.9401188135068927e-06, + "loss": 0.6382, + "step": 16082 + }, + { + "epoch": 0.41, + "learning_rate": 1.9401093817582646e-06, + "loss": 0.7256, + "step": 16083 + }, + { + "epoch": 0.41, + "learning_rate": 1.9400999492898377e-06, + "loss": 0.7998, + "step": 16084 + }, + { + "epoch": 0.41, + "learning_rate": 1.94009051610162e-06, + "loss": 0.8086, + "step": 16085 + }, + { + "epoch": 0.41, + "learning_rate": 1.940081082193618e-06, + "loss": 0.7749, + "step": 16086 + }, + { + "epoch": 0.41, + "learning_rate": 1.9400716475658388e-06, + "loss": 0.8809, + "step": 16087 + }, + { + "epoch": 0.41, + "learning_rate": 1.94006221221829e-06, + "loss": 0.8975, + "step": 16088 + }, + { + "epoch": 0.41, + "learning_rate": 1.9400527761509795e-06, + "loss": 0.9805, + "step": 16089 + }, + { + "epoch": 0.41, + "learning_rate": 1.940043339363913e-06, + "loss": 0.8669, + "step": 16090 + }, + { + "epoch": 0.41, + "learning_rate": 1.9400339018570988e-06, + "loss": 0.8271, + "step": 16091 + }, + { + "epoch": 0.41, + "learning_rate": 1.940024463630544e-06, + "loss": 0.9805, + "step": 16092 + }, + { + "epoch": 0.41, + "learning_rate": 1.9400150246842556e-06, + "loss": 0.6475, + "step": 16093 + }, + { + "epoch": 0.41, + "learning_rate": 1.940005585018241e-06, + "loss": 0.9355, + "step": 16094 + }, + { + "epoch": 0.41, + "learning_rate": 1.939996144632507e-06, + "loss": 0.8428, + "step": 16095 + }, + { + "epoch": 0.41, + "learning_rate": 1.939986703527062e-06, + "loss": 0.9668, + "step": 16096 + }, + { + "epoch": 0.41, + "learning_rate": 1.9399772617019113e-06, + "loss": 0.9424, + "step": 16097 + }, + { + "epoch": 0.41, + "learning_rate": 1.939967819157064e-06, + "loss": 0.8037, + "step": 16098 + }, + { + "epoch": 0.41, + "learning_rate": 1.939958375892526e-06, + "loss": 1.0498, + "step": 16099 + }, + { + "epoch": 0.41, + "learning_rate": 1.9399489319083056e-06, + "loss": 0.9912, + "step": 16100 + }, + { + "epoch": 0.41, + "learning_rate": 1.9399394872044094e-06, + "loss": 0.9907, + "step": 16101 + }, + { + "epoch": 0.41, + "learning_rate": 1.939930041780845e-06, + "loss": 0.9341, + "step": 16102 + }, + { + "epoch": 0.41, + "learning_rate": 1.939920595637619e-06, + "loss": 0.9883, + "step": 16103 + }, + { + "epoch": 0.41, + "learning_rate": 1.939911148774739e-06, + "loss": 0.8462, + "step": 16104 + }, + { + "epoch": 0.41, + "learning_rate": 1.9399017011922125e-06, + "loss": 0.8047, + "step": 16105 + }, + { + "epoch": 0.41, + "learning_rate": 1.9398922528900462e-06, + "loss": 0.9678, + "step": 16106 + }, + { + "epoch": 0.41, + "learning_rate": 1.9398828038682476e-06, + "loss": 0.9902, + "step": 16107 + }, + { + "epoch": 0.41, + "learning_rate": 1.939873354126824e-06, + "loss": 1.1211, + "step": 16108 + }, + { + "epoch": 0.41, + "learning_rate": 1.939863903665783e-06, + "loss": 0.834, + "step": 16109 + }, + { + "epoch": 0.41, + "learning_rate": 1.939854452485131e-06, + "loss": 0.9434, + "step": 16110 + }, + { + "epoch": 0.41, + "learning_rate": 1.939845000584876e-06, + "loss": 0.9814, + "step": 16111 + }, + { + "epoch": 0.41, + "learning_rate": 1.939835547965025e-06, + "loss": 0.9502, + "step": 16112 + }, + { + "epoch": 0.41, + "learning_rate": 1.9398260946255847e-06, + "loss": 0.7705, + "step": 16113 + }, + { + "epoch": 0.41, + "learning_rate": 1.939816640566563e-06, + "loss": 0.7773, + "step": 16114 + }, + { + "epoch": 0.41, + "learning_rate": 1.9398071857879665e-06, + "loss": 0.915, + "step": 16115 + }, + { + "epoch": 0.41, + "learning_rate": 1.939797730289803e-06, + "loss": 0.9521, + "step": 16116 + }, + { + "epoch": 0.41, + "learning_rate": 1.93978827407208e-06, + "loss": 0.7598, + "step": 16117 + }, + { + "epoch": 0.41, + "learning_rate": 1.939778817134804e-06, + "loss": 0.8193, + "step": 16118 + }, + { + "epoch": 0.41, + "learning_rate": 1.9397693594779828e-06, + "loss": 1.0156, + "step": 16119 + }, + { + "epoch": 0.41, + "learning_rate": 1.9397599011016234e-06, + "loss": 0.8711, + "step": 16120 + }, + { + "epoch": 0.41, + "learning_rate": 1.9397504420057328e-06, + "loss": 0.8164, + "step": 16121 + }, + { + "epoch": 0.41, + "learning_rate": 1.9397409821903186e-06, + "loss": 0.6506, + "step": 16122 + }, + { + "epoch": 0.41, + "learning_rate": 1.9397315216553876e-06, + "loss": 0.709, + "step": 16123 + }, + { + "epoch": 0.41, + "learning_rate": 1.939722060400948e-06, + "loss": 0.8623, + "step": 16124 + }, + { + "epoch": 0.41, + "learning_rate": 1.9397125984270062e-06, + "loss": 1.0518, + "step": 16125 + }, + { + "epoch": 0.41, + "learning_rate": 1.93970313573357e-06, + "loss": 0.9268, + "step": 16126 + }, + { + "epoch": 0.41, + "learning_rate": 1.9396936723206458e-06, + "loss": 0.8311, + "step": 16127 + }, + { + "epoch": 0.41, + "learning_rate": 1.9396842081882414e-06, + "loss": 0.6217, + "step": 16128 + }, + { + "epoch": 0.41, + "learning_rate": 1.939674743336364e-06, + "loss": 1.082, + "step": 16129 + }, + { + "epoch": 0.41, + "learning_rate": 1.9396652777650215e-06, + "loss": 1.0273, + "step": 16130 + }, + { + "epoch": 0.41, + "learning_rate": 1.9396558114742196e-06, + "loss": 1.002, + "step": 16131 + }, + { + "epoch": 0.41, + "learning_rate": 1.939646344463967e-06, + "loss": 1.1289, + "step": 16132 + }, + { + "epoch": 0.41, + "learning_rate": 1.93963687673427e-06, + "loss": 0.8643, + "step": 16133 + }, + { + "epoch": 0.41, + "learning_rate": 1.9396274082851366e-06, + "loss": 0.8779, + "step": 16134 + }, + { + "epoch": 0.41, + "learning_rate": 1.9396179391165737e-06, + "loss": 1.041, + "step": 16135 + }, + { + "epoch": 0.41, + "learning_rate": 1.9396084692285885e-06, + "loss": 0.8564, + "step": 16136 + }, + { + "epoch": 0.41, + "learning_rate": 1.939598998621188e-06, + "loss": 1.0273, + "step": 16137 + }, + { + "epoch": 0.41, + "learning_rate": 1.93958952729438e-06, + "loss": 0.9316, + "step": 16138 + }, + { + "epoch": 0.41, + "learning_rate": 1.9395800552481715e-06, + "loss": 1.0762, + "step": 16139 + }, + { + "epoch": 0.41, + "learning_rate": 1.9395705824825697e-06, + "loss": 0.8662, + "step": 16140 + }, + { + "epoch": 0.41, + "learning_rate": 1.9395611089975824e-06, + "loss": 0.7734, + "step": 16141 + }, + { + "epoch": 0.41, + "learning_rate": 1.939551634793216e-06, + "loss": 0.8135, + "step": 16142 + }, + { + "epoch": 0.41, + "learning_rate": 1.939542159869478e-06, + "loss": 0.9824, + "step": 16143 + }, + { + "epoch": 0.41, + "learning_rate": 1.9395326842263757e-06, + "loss": 0.9629, + "step": 16144 + }, + { + "epoch": 0.41, + "learning_rate": 1.9395232078639167e-06, + "loss": 0.5957, + "step": 16145 + }, + { + "epoch": 0.41, + "learning_rate": 1.9395137307821073e-06, + "loss": 0.958, + "step": 16146 + }, + { + "epoch": 0.41, + "learning_rate": 1.939504252980956e-06, + "loss": 0.7803, + "step": 16147 + }, + { + "epoch": 0.41, + "learning_rate": 1.9394947744604697e-06, + "loss": 0.8447, + "step": 16148 + }, + { + "epoch": 0.41, + "learning_rate": 1.9394852952206554e-06, + "loss": 0.7744, + "step": 16149 + }, + { + "epoch": 0.41, + "learning_rate": 1.93947581526152e-06, + "loss": 1.1143, + "step": 16150 + }, + { + "epoch": 0.41, + "learning_rate": 1.939466334583071e-06, + "loss": 0.9238, + "step": 16151 + }, + { + "epoch": 0.41, + "learning_rate": 1.9394568531853167e-06, + "loss": 0.6982, + "step": 16152 + }, + { + "epoch": 0.41, + "learning_rate": 1.939447371068263e-06, + "loss": 0.751, + "step": 16153 + }, + { + "epoch": 0.41, + "learning_rate": 1.9394378882319174e-06, + "loss": 0.7041, + "step": 16154 + }, + { + "epoch": 0.41, + "learning_rate": 1.9394284046762878e-06, + "loss": 0.8594, + "step": 16155 + }, + { + "epoch": 0.41, + "learning_rate": 1.9394189204013806e-06, + "loss": 0.7983, + "step": 16156 + }, + { + "epoch": 0.41, + "learning_rate": 1.939409435407204e-06, + "loss": 0.8896, + "step": 16157 + }, + { + "epoch": 0.41, + "learning_rate": 1.9393999496937646e-06, + "loss": 0.7983, + "step": 16158 + }, + { + "epoch": 0.41, + "learning_rate": 1.9393904632610698e-06, + "loss": 1.0566, + "step": 16159 + }, + { + "epoch": 0.41, + "learning_rate": 1.939380976109127e-06, + "loss": 0.9214, + "step": 16160 + }, + { + "epoch": 0.41, + "learning_rate": 1.9393714882379433e-06, + "loss": 1.0518, + "step": 16161 + }, + { + "epoch": 0.41, + "learning_rate": 1.9393619996475265e-06, + "loss": 0.9424, + "step": 16162 + }, + { + "epoch": 0.41, + "learning_rate": 1.939352510337883e-06, + "loss": 0.9629, + "step": 16163 + }, + { + "epoch": 0.41, + "learning_rate": 1.93934302030902e-06, + "loss": 0.9688, + "step": 16164 + }, + { + "epoch": 0.41, + "learning_rate": 1.939333529560946e-06, + "loss": 0.9922, + "step": 16165 + }, + { + "epoch": 0.41, + "learning_rate": 1.9393240380936674e-06, + "loss": 0.7039, + "step": 16166 + }, + { + "epoch": 0.41, + "learning_rate": 1.9393145459071913e-06, + "loss": 0.9502, + "step": 16167 + }, + { + "epoch": 0.41, + "learning_rate": 1.9393050530015253e-06, + "loss": 0.9775, + "step": 16168 + }, + { + "epoch": 0.41, + "learning_rate": 1.9392955593766767e-06, + "loss": 0.8335, + "step": 16169 + }, + { + "epoch": 0.41, + "learning_rate": 1.9392860650326527e-06, + "loss": 0.8428, + "step": 16170 + }, + { + "epoch": 0.41, + "learning_rate": 1.9392765699694604e-06, + "loss": 0.7979, + "step": 16171 + }, + { + "epoch": 0.41, + "learning_rate": 1.9392670741871075e-06, + "loss": 0.9248, + "step": 16172 + }, + { + "epoch": 0.41, + "learning_rate": 1.9392575776856007e-06, + "loss": 1.1045, + "step": 16173 + }, + { + "epoch": 0.41, + "learning_rate": 1.9392480804649477e-06, + "loss": 0.9209, + "step": 16174 + }, + { + "epoch": 0.41, + "learning_rate": 1.9392385825251558e-06, + "loss": 0.9424, + "step": 16175 + }, + { + "epoch": 0.41, + "learning_rate": 1.939229083866232e-06, + "loss": 0.8369, + "step": 16176 + }, + { + "epoch": 0.41, + "learning_rate": 1.9392195844881835e-06, + "loss": 0.9111, + "step": 16177 + }, + { + "epoch": 0.41, + "learning_rate": 1.9392100843910177e-06, + "loss": 0.9746, + "step": 16178 + }, + { + "epoch": 0.41, + "learning_rate": 1.9392005835747425e-06, + "loss": 0.9629, + "step": 16179 + }, + { + "epoch": 0.41, + "learning_rate": 1.9391910820393638e-06, + "loss": 0.7764, + "step": 16180 + }, + { + "epoch": 0.41, + "learning_rate": 1.93918157978489e-06, + "loss": 0.626, + "step": 16181 + }, + { + "epoch": 0.41, + "learning_rate": 1.939172076811328e-06, + "loss": 1.0127, + "step": 16182 + }, + { + "epoch": 0.41, + "learning_rate": 1.9391625731186855e-06, + "loss": 0.9727, + "step": 16183 + }, + { + "epoch": 0.41, + "learning_rate": 1.939153068706969e-06, + "loss": 0.9424, + "step": 16184 + }, + { + "epoch": 0.41, + "learning_rate": 1.939143563576186e-06, + "loss": 0.9326, + "step": 16185 + }, + { + "epoch": 0.41, + "learning_rate": 1.9391340577263447e-06, + "loss": 0.9736, + "step": 16186 + }, + { + "epoch": 0.41, + "learning_rate": 1.939124551157451e-06, + "loss": 1.0088, + "step": 16187 + }, + { + "epoch": 0.41, + "learning_rate": 1.939115043869513e-06, + "loss": 0.9629, + "step": 16188 + }, + { + "epoch": 0.41, + "learning_rate": 1.939105535862538e-06, + "loss": 0.8926, + "step": 16189 + }, + { + "epoch": 0.41, + "learning_rate": 1.9390960271365327e-06, + "loss": 0.7881, + "step": 16190 + }, + { + "epoch": 0.41, + "learning_rate": 1.939086517691505e-06, + "loss": 1.0293, + "step": 16191 + }, + { + "epoch": 0.42, + "learning_rate": 1.9390770075274617e-06, + "loss": 0.8477, + "step": 16192 + }, + { + "epoch": 0.42, + "learning_rate": 1.9390674966444104e-06, + "loss": 1.0215, + "step": 16193 + }, + { + "epoch": 0.42, + "learning_rate": 1.939057985042358e-06, + "loss": 0.8506, + "step": 16194 + }, + { + "epoch": 0.42, + "learning_rate": 1.939048472721313e-06, + "loss": 0.6309, + "step": 16195 + }, + { + "epoch": 0.42, + "learning_rate": 1.9390389596812813e-06, + "loss": 0.9678, + "step": 16196 + }, + { + "epoch": 0.42, + "learning_rate": 1.93902944592227e-06, + "loss": 0.9971, + "step": 16197 + }, + { + "epoch": 0.42, + "learning_rate": 1.939019931444288e-06, + "loss": 0.8672, + "step": 16198 + }, + { + "epoch": 0.42, + "learning_rate": 1.939010416247341e-06, + "loss": 0.7041, + "step": 16199 + }, + { + "epoch": 0.42, + "learning_rate": 1.9390009003314375e-06, + "loss": 0.96, + "step": 16200 + }, + { + "epoch": 0.42, + "learning_rate": 1.9389913836965836e-06, + "loss": 1.0322, + "step": 16201 + }, + { + "epoch": 0.42, + "learning_rate": 1.938981866342787e-06, + "loss": 1.2598, + "step": 16202 + }, + { + "epoch": 0.42, + "learning_rate": 1.9389723482700558e-06, + "loss": 1.1055, + "step": 16203 + }, + { + "epoch": 0.42, + "learning_rate": 1.9389628294783963e-06, + "loss": 0.6641, + "step": 16204 + }, + { + "epoch": 0.42, + "learning_rate": 1.9389533099678164e-06, + "loss": 0.7363, + "step": 16205 + }, + { + "epoch": 0.42, + "learning_rate": 1.9389437897383227e-06, + "loss": 0.8721, + "step": 16206 + }, + { + "epoch": 0.42, + "learning_rate": 1.9389342687899234e-06, + "loss": 0.7832, + "step": 16207 + }, + { + "epoch": 0.42, + "learning_rate": 1.938924747122625e-06, + "loss": 0.9209, + "step": 16208 + }, + { + "epoch": 0.42, + "learning_rate": 1.938915224736435e-06, + "loss": 0.7065, + "step": 16209 + }, + { + "epoch": 0.42, + "learning_rate": 1.938905701631361e-06, + "loss": 0.8691, + "step": 16210 + }, + { + "epoch": 0.42, + "learning_rate": 1.9388961778074098e-06, + "loss": 0.9092, + "step": 16211 + }, + { + "epoch": 0.42, + "learning_rate": 1.9388866532645893e-06, + "loss": 0.8491, + "step": 16212 + }, + { + "epoch": 0.42, + "learning_rate": 1.9388771280029064e-06, + "loss": 0.9111, + "step": 16213 + }, + { + "epoch": 0.42, + "learning_rate": 1.9388676020223686e-06, + "loss": 0.7959, + "step": 16214 + }, + { + "epoch": 0.42, + "learning_rate": 1.938858075322983e-06, + "loss": 0.8779, + "step": 16215 + }, + { + "epoch": 0.42, + "learning_rate": 1.938848547904756e-06, + "loss": 0.8994, + "step": 16216 + }, + { + "epoch": 0.42, + "learning_rate": 1.938839019767697e-06, + "loss": 0.9492, + "step": 16217 + }, + { + "epoch": 0.42, + "learning_rate": 1.9388294909118115e-06, + "loss": 0.9365, + "step": 16218 + }, + { + "epoch": 0.42, + "learning_rate": 1.938819961337108e-06, + "loss": 1.2539, + "step": 16219 + }, + { + "epoch": 0.42, + "learning_rate": 1.9388104310435928e-06, + "loss": 0.8896, + "step": 16220 + }, + { + "epoch": 0.42, + "learning_rate": 1.9388009000312736e-06, + "loss": 0.7383, + "step": 16221 + }, + { + "epoch": 0.42, + "learning_rate": 1.938791368300158e-06, + "loss": 0.7891, + "step": 16222 + }, + { + "epoch": 0.42, + "learning_rate": 1.9387818358502528e-06, + "loss": 0.8701, + "step": 16223 + }, + { + "epoch": 0.42, + "learning_rate": 1.9387723026815656e-06, + "loss": 0.7666, + "step": 16224 + }, + { + "epoch": 0.42, + "learning_rate": 1.9387627687941036e-06, + "loss": 0.5518, + "step": 16225 + }, + { + "epoch": 0.42, + "learning_rate": 1.938753234187874e-06, + "loss": 1.0078, + "step": 16226 + }, + { + "epoch": 0.42, + "learning_rate": 1.9387436988628844e-06, + "loss": 0.7971, + "step": 16227 + }, + { + "epoch": 0.42, + "learning_rate": 1.9387341628191416e-06, + "loss": 0.8535, + "step": 16228 + }, + { + "epoch": 0.42, + "learning_rate": 1.9387246260566537e-06, + "loss": 0.8564, + "step": 16229 + }, + { + "epoch": 0.42, + "learning_rate": 1.938715088575427e-06, + "loss": 1.0996, + "step": 16230 + }, + { + "epoch": 0.42, + "learning_rate": 1.9387055503754696e-06, + "loss": 0.9229, + "step": 16231 + }, + { + "epoch": 0.42, + "learning_rate": 1.9386960114567886e-06, + "loss": 0.8379, + "step": 16232 + }, + { + "epoch": 0.42, + "learning_rate": 1.938686471819391e-06, + "loss": 0.8281, + "step": 16233 + }, + { + "epoch": 0.42, + "learning_rate": 1.9386769314632847e-06, + "loss": 0.8789, + "step": 16234 + }, + { + "epoch": 0.42, + "learning_rate": 1.9386673903884762e-06, + "loss": 0.6362, + "step": 16235 + }, + { + "epoch": 0.42, + "learning_rate": 1.9386578485949735e-06, + "loss": 0.9609, + "step": 16236 + }, + { + "epoch": 0.42, + "learning_rate": 1.9386483060827836e-06, + "loss": 0.8965, + "step": 16237 + }, + { + "epoch": 0.42, + "learning_rate": 1.9386387628519137e-06, + "loss": 0.7354, + "step": 16238 + }, + { + "epoch": 0.42, + "learning_rate": 1.9386292189023716e-06, + "loss": 0.791, + "step": 16239 + }, + { + "epoch": 0.42, + "learning_rate": 1.938619674234164e-06, + "loss": 0.9248, + "step": 16240 + }, + { + "epoch": 0.42, + "learning_rate": 1.9386101288472983e-06, + "loss": 1.0518, + "step": 16241 + }, + { + "epoch": 0.42, + "learning_rate": 1.9386005827417825e-06, + "loss": 1.0527, + "step": 16242 + }, + { + "epoch": 0.42, + "learning_rate": 1.938591035917623e-06, + "loss": 0.9258, + "step": 16243 + }, + { + "epoch": 0.42, + "learning_rate": 1.9385814883748275e-06, + "loss": 1.0596, + "step": 16244 + }, + { + "epoch": 0.42, + "learning_rate": 1.9385719401134035e-06, + "loss": 0.7979, + "step": 16245 + }, + { + "epoch": 0.42, + "learning_rate": 1.938562391133358e-06, + "loss": 0.9038, + "step": 16246 + }, + { + "epoch": 0.42, + "learning_rate": 1.9385528414346985e-06, + "loss": 0.5918, + "step": 16247 + }, + { + "epoch": 0.42, + "learning_rate": 1.938543291017432e-06, + "loss": 0.8662, + "step": 16248 + }, + { + "epoch": 0.42, + "learning_rate": 1.9385337398815663e-06, + "loss": 0.7078, + "step": 16249 + }, + { + "epoch": 0.42, + "learning_rate": 1.9385241880271087e-06, + "loss": 0.9561, + "step": 16250 + }, + { + "epoch": 0.42, + "learning_rate": 1.938514635454066e-06, + "loss": 0.7456, + "step": 16251 + }, + { + "epoch": 0.42, + "learning_rate": 1.938505082162446e-06, + "loss": 0.7188, + "step": 16252 + }, + { + "epoch": 0.42, + "learning_rate": 1.938495528152255e-06, + "loss": 1.0332, + "step": 16253 + }, + { + "epoch": 0.42, + "learning_rate": 1.938485973423502e-06, + "loss": 0.8013, + "step": 16254 + }, + { + "epoch": 0.42, + "learning_rate": 1.9384764179761932e-06, + "loss": 0.9355, + "step": 16255 + }, + { + "epoch": 0.42, + "learning_rate": 1.9384668618103362e-06, + "loss": 0.4963, + "step": 16256 + }, + { + "epoch": 0.42, + "learning_rate": 1.938457304925938e-06, + "loss": 0.8853, + "step": 16257 + }, + { + "epoch": 0.42, + "learning_rate": 1.9384477473230067e-06, + "loss": 0.7139, + "step": 16258 + }, + { + "epoch": 0.42, + "learning_rate": 1.9384381890015487e-06, + "loss": 0.9805, + "step": 16259 + }, + { + "epoch": 0.42, + "learning_rate": 1.938428629961572e-06, + "loss": 0.8584, + "step": 16260 + }, + { + "epoch": 0.42, + "learning_rate": 1.9384190702030836e-06, + "loss": 0.7246, + "step": 16261 + }, + { + "epoch": 0.42, + "learning_rate": 1.9384095097260906e-06, + "loss": 0.8486, + "step": 16262 + }, + { + "epoch": 0.42, + "learning_rate": 1.938399948530601e-06, + "loss": 0.7969, + "step": 16263 + }, + { + "epoch": 0.42, + "learning_rate": 1.9383903866166214e-06, + "loss": 0.8105, + "step": 16264 + }, + { + "epoch": 0.42, + "learning_rate": 1.9383808239841595e-06, + "loss": 1.0781, + "step": 16265 + }, + { + "epoch": 0.42, + "learning_rate": 1.9383712606332226e-06, + "loss": 0.9727, + "step": 16266 + }, + { + "epoch": 0.42, + "learning_rate": 1.938361696563818e-06, + "loss": 0.9219, + "step": 16267 + }, + { + "epoch": 0.42, + "learning_rate": 1.938352131775953e-06, + "loss": 0.7642, + "step": 16268 + }, + { + "epoch": 0.42, + "learning_rate": 1.9383425662696345e-06, + "loss": 0.6172, + "step": 16269 + }, + { + "epoch": 0.42, + "learning_rate": 1.9383330000448707e-06, + "loss": 1.0244, + "step": 16270 + }, + { + "epoch": 0.42, + "learning_rate": 1.9383234331016684e-06, + "loss": 0.8877, + "step": 16271 + }, + { + "epoch": 0.42, + "learning_rate": 1.9383138654400352e-06, + "loss": 0.7549, + "step": 16272 + }, + { + "epoch": 0.42, + "learning_rate": 1.938304297059978e-06, + "loss": 1.0107, + "step": 16273 + }, + { + "epoch": 0.42, + "learning_rate": 1.938294727961504e-06, + "loss": 0.9307, + "step": 16274 + }, + { + "epoch": 0.42, + "learning_rate": 1.9382851581446214e-06, + "loss": 0.7065, + "step": 16275 + }, + { + "epoch": 0.42, + "learning_rate": 1.9382755876093367e-06, + "loss": 0.7327, + "step": 16276 + }, + { + "epoch": 0.42, + "learning_rate": 1.938266016355658e-06, + "loss": 1.0459, + "step": 16277 + }, + { + "epoch": 0.42, + "learning_rate": 1.9382564443835913e-06, + "loss": 0.9297, + "step": 16278 + }, + { + "epoch": 0.42, + "learning_rate": 1.9382468716931455e-06, + "loss": 1.0977, + "step": 16279 + }, + { + "epoch": 0.42, + "learning_rate": 1.938237298284327e-06, + "loss": 0.7852, + "step": 16280 + }, + { + "epoch": 0.42, + "learning_rate": 1.938227724157143e-06, + "loss": 0.9277, + "step": 16281 + }, + { + "epoch": 0.42, + "learning_rate": 1.938218149311602e-06, + "loss": 0.9072, + "step": 16282 + }, + { + "epoch": 0.42, + "learning_rate": 1.9382085737477094e-06, + "loss": 1.0801, + "step": 16283 + }, + { + "epoch": 0.42, + "learning_rate": 1.9381989974654742e-06, + "loss": 1.0674, + "step": 16284 + }, + { + "epoch": 0.42, + "learning_rate": 1.938189420464903e-06, + "loss": 0.7109, + "step": 16285 + }, + { + "epoch": 0.42, + "learning_rate": 1.938179842746004e-06, + "loss": 0.8359, + "step": 16286 + }, + { + "epoch": 0.42, + "learning_rate": 1.9381702643087834e-06, + "loss": 1.2227, + "step": 16287 + }, + { + "epoch": 0.42, + "learning_rate": 1.9381606851532485e-06, + "loss": 0.9307, + "step": 16288 + }, + { + "epoch": 0.42, + "learning_rate": 1.9381511052794077e-06, + "loss": 0.8936, + "step": 16289 + }, + { + "epoch": 0.42, + "learning_rate": 1.9381415246872673e-06, + "loss": 0.7271, + "step": 16290 + }, + { + "epoch": 0.42, + "learning_rate": 1.9381319433768357e-06, + "loss": 0.9961, + "step": 16291 + }, + { + "epoch": 0.42, + "learning_rate": 1.938122361348119e-06, + "loss": 0.7822, + "step": 16292 + }, + { + "epoch": 0.42, + "learning_rate": 1.938112778601125e-06, + "loss": 0.8945, + "step": 16293 + }, + { + "epoch": 0.42, + "learning_rate": 1.938103195135862e-06, + "loss": 0.833, + "step": 16294 + }, + { + "epoch": 0.42, + "learning_rate": 1.9380936109523357e-06, + "loss": 1.0117, + "step": 16295 + }, + { + "epoch": 0.42, + "learning_rate": 1.9380840260505547e-06, + "loss": 0.8408, + "step": 16296 + }, + { + "epoch": 0.42, + "learning_rate": 1.938074440430526e-06, + "loss": 1.001, + "step": 16297 + }, + { + "epoch": 0.42, + "learning_rate": 1.938064854092256e-06, + "loss": 0.9971, + "step": 16298 + }, + { + "epoch": 0.42, + "learning_rate": 1.938055267035754e-06, + "loss": 0.8872, + "step": 16299 + }, + { + "epoch": 0.42, + "learning_rate": 1.9380456792610256e-06, + "loss": 0.9482, + "step": 16300 + }, + { + "epoch": 0.42, + "learning_rate": 1.938036090768079e-06, + "loss": 0.7734, + "step": 16301 + }, + { + "epoch": 0.42, + "learning_rate": 1.938026501556921e-06, + "loss": 0.9033, + "step": 16302 + }, + { + "epoch": 0.42, + "learning_rate": 1.9380169116275595e-06, + "loss": 0.9062, + "step": 16303 + }, + { + "epoch": 0.42, + "learning_rate": 1.9380073209800012e-06, + "loss": 0.8809, + "step": 16304 + }, + { + "epoch": 0.42, + "learning_rate": 1.9379977296142544e-06, + "loss": 0.8047, + "step": 16305 + }, + { + "epoch": 0.42, + "learning_rate": 1.9379881375303256e-06, + "loss": 0.4932, + "step": 16306 + }, + { + "epoch": 0.42, + "learning_rate": 1.937978544728222e-06, + "loss": 0.8438, + "step": 16307 + }, + { + "epoch": 0.42, + "learning_rate": 1.937968951207952e-06, + "loss": 0.8813, + "step": 16308 + }, + { + "epoch": 0.42, + "learning_rate": 1.9379593569695222e-06, + "loss": 0.7427, + "step": 16309 + }, + { + "epoch": 0.42, + "learning_rate": 1.93794976201294e-06, + "loss": 0.873, + "step": 16310 + }, + { + "epoch": 0.42, + "learning_rate": 1.9379401663382125e-06, + "loss": 0.8857, + "step": 16311 + }, + { + "epoch": 0.42, + "learning_rate": 1.9379305699453476e-06, + "loss": 0.9922, + "step": 16312 + }, + { + "epoch": 0.42, + "learning_rate": 1.9379209728343524e-06, + "loss": 0.9473, + "step": 16313 + }, + { + "epoch": 0.42, + "learning_rate": 1.9379113750052342e-06, + "loss": 0.918, + "step": 16314 + }, + { + "epoch": 0.42, + "learning_rate": 1.9379017764580002e-06, + "loss": 1.0127, + "step": 16315 + }, + { + "epoch": 0.42, + "learning_rate": 1.937892177192658e-06, + "loss": 1.0918, + "step": 16316 + }, + { + "epoch": 0.42, + "learning_rate": 1.937882577209215e-06, + "loss": 0.6914, + "step": 16317 + }, + { + "epoch": 0.42, + "learning_rate": 1.937872976507679e-06, + "loss": 0.9219, + "step": 16318 + }, + { + "epoch": 0.42, + "learning_rate": 1.9378633750880558e-06, + "loss": 0.9385, + "step": 16319 + }, + { + "epoch": 0.42, + "learning_rate": 1.937853772950354e-06, + "loss": 0.7764, + "step": 16320 + }, + { + "epoch": 0.42, + "learning_rate": 1.937844170094581e-06, + "loss": 0.8286, + "step": 16321 + }, + { + "epoch": 0.42, + "learning_rate": 1.9378345665207437e-06, + "loss": 0.8086, + "step": 16322 + }, + { + "epoch": 0.42, + "learning_rate": 1.9378249622288493e-06, + "loss": 0.9023, + "step": 16323 + }, + { + "epoch": 0.42, + "learning_rate": 1.937815357218906e-06, + "loss": 0.9248, + "step": 16324 + }, + { + "epoch": 0.42, + "learning_rate": 1.93780575149092e-06, + "loss": 0.9316, + "step": 16325 + }, + { + "epoch": 0.42, + "learning_rate": 1.9377961450448997e-06, + "loss": 0.6943, + "step": 16326 + }, + { + "epoch": 0.42, + "learning_rate": 1.937786537880852e-06, + "loss": 0.8252, + "step": 16327 + }, + { + "epoch": 0.42, + "learning_rate": 1.937776929998784e-06, + "loss": 0.8975, + "step": 16328 + }, + { + "epoch": 0.42, + "learning_rate": 1.9377673213987037e-06, + "loss": 0.8877, + "step": 16329 + }, + { + "epoch": 0.42, + "learning_rate": 1.937757712080618e-06, + "loss": 0.9414, + "step": 16330 + }, + { + "epoch": 0.42, + "learning_rate": 1.937748102044534e-06, + "loss": 0.8066, + "step": 16331 + }, + { + "epoch": 0.42, + "learning_rate": 1.93773849129046e-06, + "loss": 0.917, + "step": 16332 + }, + { + "epoch": 0.42, + "learning_rate": 1.937728879818402e-06, + "loss": 0.9688, + "step": 16333 + }, + { + "epoch": 0.42, + "learning_rate": 1.9377192676283686e-06, + "loss": 0.7866, + "step": 16334 + }, + { + "epoch": 0.42, + "learning_rate": 1.9377096547203665e-06, + "loss": 0.9512, + "step": 16335 + }, + { + "epoch": 0.42, + "learning_rate": 1.9377000410944032e-06, + "loss": 1.0742, + "step": 16336 + }, + { + "epoch": 0.42, + "learning_rate": 1.937690426750486e-06, + "loss": 0.9736, + "step": 16337 + }, + { + "epoch": 0.42, + "learning_rate": 1.9376808116886226e-06, + "loss": 0.543, + "step": 16338 + }, + { + "epoch": 0.42, + "learning_rate": 1.93767119590882e-06, + "loss": 0.8428, + "step": 16339 + }, + { + "epoch": 0.42, + "learning_rate": 1.9376615794110856e-06, + "loss": 0.8369, + "step": 16340 + }, + { + "epoch": 0.42, + "learning_rate": 1.937651962195427e-06, + "loss": 0.8369, + "step": 16341 + }, + { + "epoch": 0.42, + "learning_rate": 1.9376423442618515e-06, + "loss": 0.855, + "step": 16342 + }, + { + "epoch": 0.42, + "learning_rate": 1.9376327256103663e-06, + "loss": 0.709, + "step": 16343 + }, + { + "epoch": 0.42, + "learning_rate": 1.937623106240979e-06, + "loss": 0.8467, + "step": 16344 + }, + { + "epoch": 0.42, + "learning_rate": 1.9376134861536966e-06, + "loss": 1.0439, + "step": 16345 + }, + { + "epoch": 0.42, + "learning_rate": 1.9376038653485263e-06, + "loss": 0.9551, + "step": 16346 + }, + { + "epoch": 0.42, + "learning_rate": 1.9375942438254762e-06, + "loss": 1.0254, + "step": 16347 + }, + { + "epoch": 0.42, + "learning_rate": 1.9375846215845534e-06, + "loss": 0.9004, + "step": 16348 + }, + { + "epoch": 0.42, + "learning_rate": 1.937574998625765e-06, + "loss": 0.874, + "step": 16349 + }, + { + "epoch": 0.42, + "learning_rate": 1.9375653749491185e-06, + "loss": 0.874, + "step": 16350 + }, + { + "epoch": 0.42, + "learning_rate": 1.9375557505546216e-06, + "loss": 0.5724, + "step": 16351 + }, + { + "epoch": 0.42, + "learning_rate": 1.9375461254422812e-06, + "loss": 0.8584, + "step": 16352 + }, + { + "epoch": 0.42, + "learning_rate": 1.9375364996121046e-06, + "loss": 0.9053, + "step": 16353 + }, + { + "epoch": 0.42, + "learning_rate": 1.9375268730640997e-06, + "loss": 0.7891, + "step": 16354 + }, + { + "epoch": 0.42, + "learning_rate": 1.9375172457982733e-06, + "loss": 0.8408, + "step": 16355 + }, + { + "epoch": 0.42, + "learning_rate": 1.9375076178146336e-06, + "loss": 1.3535, + "step": 16356 + }, + { + "epoch": 0.42, + "learning_rate": 1.9374979891131868e-06, + "loss": 0.8872, + "step": 16357 + }, + { + "epoch": 0.42, + "learning_rate": 1.9374883596939414e-06, + "loss": 0.9697, + "step": 16358 + }, + { + "epoch": 0.42, + "learning_rate": 1.937478729556904e-06, + "loss": 1.0674, + "step": 16359 + }, + { + "epoch": 0.42, + "learning_rate": 1.937469098702082e-06, + "loss": 0.8516, + "step": 16360 + }, + { + "epoch": 0.42, + "learning_rate": 1.9374594671294835e-06, + "loss": 0.9521, + "step": 16361 + }, + { + "epoch": 0.42, + "learning_rate": 1.937449834839115e-06, + "loss": 0.9092, + "step": 16362 + }, + { + "epoch": 0.42, + "learning_rate": 1.937440201830985e-06, + "loss": 1.0449, + "step": 16363 + }, + { + "epoch": 0.42, + "learning_rate": 1.9374305681050992e-06, + "loss": 0.7446, + "step": 16364 + }, + { + "epoch": 0.42, + "learning_rate": 1.937420933661466e-06, + "loss": 1.0947, + "step": 16365 + }, + { + "epoch": 0.42, + "learning_rate": 1.9374112985000933e-06, + "loss": 0.7822, + "step": 16366 + }, + { + "epoch": 0.42, + "learning_rate": 1.9374016626209876e-06, + "loss": 0.9541, + "step": 16367 + }, + { + "epoch": 0.42, + "learning_rate": 1.9373920260241565e-06, + "loss": 0.8633, + "step": 16368 + }, + { + "epoch": 0.42, + "learning_rate": 1.9373823887096073e-06, + "loss": 0.7285, + "step": 16369 + }, + { + "epoch": 0.42, + "learning_rate": 1.937372750677348e-06, + "loss": 0.8652, + "step": 16370 + }, + { + "epoch": 0.42, + "learning_rate": 1.937363111927385e-06, + "loss": 0.7041, + "step": 16371 + }, + { + "epoch": 0.42, + "learning_rate": 1.9373534724597264e-06, + "loss": 0.8584, + "step": 16372 + }, + { + "epoch": 0.42, + "learning_rate": 1.937343832274379e-06, + "loss": 0.9004, + "step": 16373 + }, + { + "epoch": 0.42, + "learning_rate": 1.9373341913713512e-06, + "loss": 0.792, + "step": 16374 + }, + { + "epoch": 0.42, + "learning_rate": 1.937324549750649e-06, + "loss": 1.0029, + "step": 16375 + }, + { + "epoch": 0.42, + "learning_rate": 1.937314907412281e-06, + "loss": 0.7939, + "step": 16376 + }, + { + "epoch": 0.42, + "learning_rate": 1.937305264356254e-06, + "loss": 0.8076, + "step": 16377 + }, + { + "epoch": 0.42, + "learning_rate": 1.937295620582575e-06, + "loss": 0.7949, + "step": 16378 + }, + { + "epoch": 0.42, + "learning_rate": 1.937285976091252e-06, + "loss": 0.9609, + "step": 16379 + }, + { + "epoch": 0.42, + "learning_rate": 1.9372763308822928e-06, + "loss": 0.9375, + "step": 16380 + }, + { + "epoch": 0.42, + "learning_rate": 1.937266684955704e-06, + "loss": 0.9609, + "step": 16381 + }, + { + "epoch": 0.42, + "learning_rate": 1.937257038311493e-06, + "loss": 0.9844, + "step": 16382 + }, + { + "epoch": 0.42, + "learning_rate": 1.937247390949667e-06, + "loss": 0.9443, + "step": 16383 + }, + { + "epoch": 0.42, + "learning_rate": 1.937237742870234e-06, + "loss": 0.6528, + "step": 16384 + }, + { + "epoch": 0.42, + "learning_rate": 1.9372280940732013e-06, + "loss": 0.8223, + "step": 16385 + }, + { + "epoch": 0.42, + "learning_rate": 1.9372184445585766e-06, + "loss": 0.6265, + "step": 16386 + }, + { + "epoch": 0.42, + "learning_rate": 1.9372087943263662e-06, + "loss": 0.8867, + "step": 16387 + }, + { + "epoch": 0.42, + "learning_rate": 1.9371991433765784e-06, + "loss": 1.0742, + "step": 16388 + }, + { + "epoch": 0.42, + "learning_rate": 1.93718949170922e-06, + "loss": 1.0146, + "step": 16389 + }, + { + "epoch": 0.42, + "learning_rate": 1.937179839324299e-06, + "loss": 0.7471, + "step": 16390 + }, + { + "epoch": 0.42, + "learning_rate": 1.937170186221822e-06, + "loss": 0.7603, + "step": 16391 + }, + { + "epoch": 0.42, + "learning_rate": 1.9371605324017975e-06, + "loss": 0.959, + "step": 16392 + }, + { + "epoch": 0.42, + "learning_rate": 1.9371508778642322e-06, + "loss": 0.8438, + "step": 16393 + }, + { + "epoch": 0.42, + "learning_rate": 1.9371412226091335e-06, + "loss": 0.8818, + "step": 16394 + }, + { + "epoch": 0.42, + "learning_rate": 1.937131566636509e-06, + "loss": 1.2051, + "step": 16395 + }, + { + "epoch": 0.42, + "learning_rate": 1.9371219099463656e-06, + "loss": 1.0674, + "step": 16396 + }, + { + "epoch": 0.42, + "learning_rate": 1.9371122525387113e-06, + "loss": 0.8477, + "step": 16397 + }, + { + "epoch": 0.42, + "learning_rate": 1.9371025944135528e-06, + "loss": 0.9883, + "step": 16398 + }, + { + "epoch": 0.42, + "learning_rate": 1.9370929355708985e-06, + "loss": 0.9668, + "step": 16399 + }, + { + "epoch": 0.42, + "learning_rate": 1.937083276010755e-06, + "loss": 0.6943, + "step": 16400 + }, + { + "epoch": 0.42, + "learning_rate": 1.9370736157331296e-06, + "loss": 1.0137, + "step": 16401 + }, + { + "epoch": 0.42, + "learning_rate": 1.9370639547380303e-06, + "loss": 0.8032, + "step": 16402 + }, + { + "epoch": 0.42, + "learning_rate": 1.937054293025464e-06, + "loss": 1.0381, + "step": 16403 + }, + { + "epoch": 0.42, + "learning_rate": 1.937044630595439e-06, + "loss": 0.9902, + "step": 16404 + }, + { + "epoch": 0.42, + "learning_rate": 1.937034967447961e-06, + "loss": 1.0859, + "step": 16405 + }, + { + "epoch": 0.42, + "learning_rate": 1.9370253035830393e-06, + "loss": 1.0586, + "step": 16406 + }, + { + "epoch": 0.42, + "learning_rate": 1.93701563900068e-06, + "loss": 0.9326, + "step": 16407 + }, + { + "epoch": 0.42, + "learning_rate": 1.937005973700891e-06, + "loss": 0.917, + "step": 16408 + }, + { + "epoch": 0.42, + "learning_rate": 1.9369963076836798e-06, + "loss": 0.9111, + "step": 16409 + }, + { + "epoch": 0.42, + "learning_rate": 1.9369866409490535e-06, + "loss": 0.9248, + "step": 16410 + }, + { + "epoch": 0.42, + "learning_rate": 1.9369769734970195e-06, + "loss": 0.8047, + "step": 16411 + }, + { + "epoch": 0.42, + "learning_rate": 1.936967305327585e-06, + "loss": 0.9014, + "step": 16412 + }, + { + "epoch": 0.42, + "learning_rate": 1.936957636440758e-06, + "loss": 0.9565, + "step": 16413 + }, + { + "epoch": 0.42, + "learning_rate": 1.936947966836546e-06, + "loss": 0.8826, + "step": 16414 + }, + { + "epoch": 0.42, + "learning_rate": 1.936938296514956e-06, + "loss": 0.8105, + "step": 16415 + }, + { + "epoch": 0.42, + "learning_rate": 1.936928625475995e-06, + "loss": 0.9473, + "step": 16416 + }, + { + "epoch": 0.42, + "learning_rate": 1.9369189537196706e-06, + "loss": 0.7529, + "step": 16417 + }, + { + "epoch": 0.42, + "learning_rate": 1.936909281245991e-06, + "loss": 0.9678, + "step": 16418 + }, + { + "epoch": 0.42, + "learning_rate": 1.9368996080549626e-06, + "loss": 1.0078, + "step": 16419 + }, + { + "epoch": 0.42, + "learning_rate": 1.9368899341465936e-06, + "loss": 0.6216, + "step": 16420 + }, + { + "epoch": 0.42, + "learning_rate": 1.936880259520891e-06, + "loss": 0.8506, + "step": 16421 + }, + { + "epoch": 0.42, + "learning_rate": 1.936870584177862e-06, + "loss": 0.9131, + "step": 16422 + }, + { + "epoch": 0.42, + "learning_rate": 1.9368609081175145e-06, + "loss": 0.8926, + "step": 16423 + }, + { + "epoch": 0.42, + "learning_rate": 1.936851231339856e-06, + "loss": 0.9062, + "step": 16424 + }, + { + "epoch": 0.42, + "learning_rate": 1.936841553844893e-06, + "loss": 0.833, + "step": 16425 + }, + { + "epoch": 0.42, + "learning_rate": 1.936831875632634e-06, + "loss": 0.877, + "step": 16426 + }, + { + "epoch": 0.42, + "learning_rate": 1.9368221967030855e-06, + "loss": 0.9307, + "step": 16427 + }, + { + "epoch": 0.42, + "learning_rate": 1.9368125170562555e-06, + "loss": 0.8438, + "step": 16428 + }, + { + "epoch": 0.42, + "learning_rate": 1.9368028366921512e-06, + "loss": 0.8623, + "step": 16429 + }, + { + "epoch": 0.42, + "learning_rate": 1.93679315561078e-06, + "loss": 1.0645, + "step": 16430 + }, + { + "epoch": 0.42, + "learning_rate": 1.9367834738121495e-06, + "loss": 0.7607, + "step": 16431 + }, + { + "epoch": 0.42, + "learning_rate": 1.936773791296267e-06, + "loss": 0.772, + "step": 16432 + }, + { + "epoch": 0.42, + "learning_rate": 1.93676410806314e-06, + "loss": 0.9062, + "step": 16433 + }, + { + "epoch": 0.42, + "learning_rate": 1.9367544241127753e-06, + "loss": 1.0889, + "step": 16434 + }, + { + "epoch": 0.42, + "learning_rate": 1.936744739445181e-06, + "loss": 0.6614, + "step": 16435 + }, + { + "epoch": 0.42, + "learning_rate": 1.9367350540603646e-06, + "loss": 1.0059, + "step": 16436 + }, + { + "epoch": 0.42, + "learning_rate": 1.936725367958333e-06, + "loss": 0.8516, + "step": 16437 + }, + { + "epoch": 0.42, + "learning_rate": 1.936715681139094e-06, + "loss": 0.689, + "step": 16438 + }, + { + "epoch": 0.42, + "learning_rate": 1.9367059936026547e-06, + "loss": 0.7466, + "step": 16439 + }, + { + "epoch": 0.42, + "learning_rate": 1.9366963053490225e-06, + "loss": 0.7026, + "step": 16440 + }, + { + "epoch": 0.42, + "learning_rate": 1.936686616378205e-06, + "loss": 0.9014, + "step": 16441 + }, + { + "epoch": 0.42, + "learning_rate": 1.9366769266902103e-06, + "loss": 0.7166, + "step": 16442 + }, + { + "epoch": 0.42, + "learning_rate": 1.9366672362850446e-06, + "loss": 0.8594, + "step": 16443 + }, + { + "epoch": 0.42, + "learning_rate": 1.936657545162716e-06, + "loss": 0.7812, + "step": 16444 + }, + { + "epoch": 0.42, + "learning_rate": 1.9366478533232317e-06, + "loss": 0.7522, + "step": 16445 + }, + { + "epoch": 0.42, + "learning_rate": 1.9366381607665993e-06, + "loss": 1.0508, + "step": 16446 + }, + { + "epoch": 0.42, + "learning_rate": 1.9366284674928265e-06, + "loss": 0.6899, + "step": 16447 + }, + { + "epoch": 0.42, + "learning_rate": 1.93661877350192e-06, + "loss": 0.7905, + "step": 16448 + }, + { + "epoch": 0.42, + "learning_rate": 1.9366090787938875e-06, + "loss": 1.0215, + "step": 16449 + }, + { + "epoch": 0.42, + "learning_rate": 1.9365993833687365e-06, + "loss": 0.9336, + "step": 16450 + }, + { + "epoch": 0.42, + "learning_rate": 1.9365896872264744e-06, + "loss": 0.8623, + "step": 16451 + }, + { + "epoch": 0.42, + "learning_rate": 1.9365799903671086e-06, + "loss": 0.5508, + "step": 16452 + }, + { + "epoch": 0.42, + "learning_rate": 1.936570292790647e-06, + "loss": 0.6494, + "step": 16453 + }, + { + "epoch": 0.42, + "learning_rate": 1.936560594497096e-06, + "loss": 1.0215, + "step": 16454 + }, + { + "epoch": 0.42, + "learning_rate": 1.936550895486464e-06, + "loss": 0.7808, + "step": 16455 + }, + { + "epoch": 0.42, + "learning_rate": 1.9365411957587578e-06, + "loss": 1.0625, + "step": 16456 + }, + { + "epoch": 0.42, + "learning_rate": 1.9365314953139854e-06, + "loss": 0.7656, + "step": 16457 + }, + { + "epoch": 0.42, + "learning_rate": 1.9365217941521535e-06, + "loss": 0.9258, + "step": 16458 + }, + { + "epoch": 0.42, + "learning_rate": 1.9365120922732704e-06, + "loss": 0.9062, + "step": 16459 + }, + { + "epoch": 0.42, + "learning_rate": 1.9365023896773423e-06, + "loss": 1.1445, + "step": 16460 + }, + { + "epoch": 0.42, + "learning_rate": 1.936492686364378e-06, + "loss": 0.9873, + "step": 16461 + }, + { + "epoch": 0.42, + "learning_rate": 1.9364829823343844e-06, + "loss": 0.8953, + "step": 16462 + }, + { + "epoch": 0.42, + "learning_rate": 1.9364732775873686e-06, + "loss": 0.8447, + "step": 16463 + }, + { + "epoch": 0.42, + "learning_rate": 1.936463572123338e-06, + "loss": 0.7354, + "step": 16464 + }, + { + "epoch": 0.42, + "learning_rate": 1.9364538659423007e-06, + "loss": 1.0283, + "step": 16465 + }, + { + "epoch": 0.42, + "learning_rate": 1.936444159044264e-06, + "loss": 0.9268, + "step": 16466 + }, + { + "epoch": 0.42, + "learning_rate": 1.9364344514292343e-06, + "loss": 1.001, + "step": 16467 + }, + { + "epoch": 0.42, + "learning_rate": 1.93642474309722e-06, + "loss": 0.855, + "step": 16468 + }, + { + "epoch": 0.42, + "learning_rate": 1.9364150340482287e-06, + "loss": 0.9287, + "step": 16469 + }, + { + "epoch": 0.42, + "learning_rate": 1.9364053242822674e-06, + "loss": 0.9707, + "step": 16470 + }, + { + "epoch": 0.42, + "learning_rate": 1.936395613799343e-06, + "loss": 0.8564, + "step": 16471 + }, + { + "epoch": 0.42, + "learning_rate": 1.9363859025994644e-06, + "loss": 0.7812, + "step": 16472 + }, + { + "epoch": 0.42, + "learning_rate": 1.936376190682638e-06, + "loss": 0.9541, + "step": 16473 + }, + { + "epoch": 0.42, + "learning_rate": 1.9363664780488708e-06, + "loss": 1.0176, + "step": 16474 + }, + { + "epoch": 0.42, + "learning_rate": 1.9363567646981712e-06, + "loss": 1.0654, + "step": 16475 + }, + { + "epoch": 0.42, + "learning_rate": 1.9363470506305464e-06, + "loss": 0.6038, + "step": 16476 + }, + { + "epoch": 0.42, + "learning_rate": 1.936337335846004e-06, + "loss": 0.9775, + "step": 16477 + }, + { + "epoch": 0.42, + "learning_rate": 1.9363276203445504e-06, + "loss": 0.7283, + "step": 16478 + }, + { + "epoch": 0.42, + "learning_rate": 1.936317904126194e-06, + "loss": 1.041, + "step": 16479 + }, + { + "epoch": 0.42, + "learning_rate": 1.9363081871909426e-06, + "loss": 0.8672, + "step": 16480 + }, + { + "epoch": 0.42, + "learning_rate": 1.9362984695388026e-06, + "loss": 0.4771, + "step": 16481 + }, + { + "epoch": 0.42, + "learning_rate": 1.936288751169782e-06, + "loss": 0.6973, + "step": 16482 + }, + { + "epoch": 0.42, + "learning_rate": 1.936279032083888e-06, + "loss": 0.7026, + "step": 16483 + }, + { + "epoch": 0.42, + "learning_rate": 1.9362693122811286e-06, + "loss": 0.9727, + "step": 16484 + }, + { + "epoch": 0.42, + "learning_rate": 1.9362595917615106e-06, + "loss": 0.833, + "step": 16485 + }, + { + "epoch": 0.42, + "learning_rate": 1.9362498705250415e-06, + "loss": 0.7842, + "step": 16486 + }, + { + "epoch": 0.42, + "learning_rate": 1.936240148571729e-06, + "loss": 1.0107, + "step": 16487 + }, + { + "epoch": 0.42, + "learning_rate": 1.9362304259015805e-06, + "loss": 0.8877, + "step": 16488 + }, + { + "epoch": 0.42, + "learning_rate": 1.936220702514604e-06, + "loss": 0.6582, + "step": 16489 + }, + { + "epoch": 0.42, + "learning_rate": 1.9362109784108055e-06, + "loss": 0.9805, + "step": 16490 + }, + { + "epoch": 0.42, + "learning_rate": 1.936201253590194e-06, + "loss": 1.0225, + "step": 16491 + }, + { + "epoch": 0.42, + "learning_rate": 1.9361915280527756e-06, + "loss": 0.8818, + "step": 16492 + }, + { + "epoch": 0.42, + "learning_rate": 1.9361818017985587e-06, + "loss": 0.9951, + "step": 16493 + }, + { + "epoch": 0.42, + "learning_rate": 1.9361720748275502e-06, + "loss": 0.9487, + "step": 16494 + }, + { + "epoch": 0.42, + "learning_rate": 1.936162347139758e-06, + "loss": 0.998, + "step": 16495 + }, + { + "epoch": 0.42, + "learning_rate": 1.9361526187351895e-06, + "loss": 0.7607, + "step": 16496 + }, + { + "epoch": 0.42, + "learning_rate": 1.9361428896138516e-06, + "loss": 0.8945, + "step": 16497 + }, + { + "epoch": 0.42, + "learning_rate": 1.9361331597757523e-06, + "loss": 0.8408, + "step": 16498 + }, + { + "epoch": 0.42, + "learning_rate": 1.936123429220899e-06, + "loss": 0.7988, + "step": 16499 + }, + { + "epoch": 0.42, + "learning_rate": 1.9361136979492995e-06, + "loss": 0.625, + "step": 16500 + }, + { + "epoch": 0.42, + "learning_rate": 1.93610396596096e-06, + "loss": 1.0742, + "step": 16501 + }, + { + "epoch": 0.42, + "learning_rate": 1.9360942332558888e-06, + "loss": 0.9414, + "step": 16502 + }, + { + "epoch": 0.42, + "learning_rate": 1.936084499834094e-06, + "loss": 0.9404, + "step": 16503 + }, + { + "epoch": 0.42, + "learning_rate": 1.9360747656955816e-06, + "loss": 0.8428, + "step": 16504 + }, + { + "epoch": 0.42, + "learning_rate": 1.93606503084036e-06, + "loss": 0.9048, + "step": 16505 + }, + { + "epoch": 0.42, + "learning_rate": 1.9360552952684363e-06, + "loss": 0.5779, + "step": 16506 + }, + { + "epoch": 0.42, + "learning_rate": 1.9360455589798186e-06, + "loss": 1.0225, + "step": 16507 + }, + { + "epoch": 0.42, + "learning_rate": 1.936035821974513e-06, + "loss": 1.0059, + "step": 16508 + }, + { + "epoch": 0.42, + "learning_rate": 1.936026084252529e-06, + "loss": 0.9785, + "step": 16509 + }, + { + "epoch": 0.42, + "learning_rate": 1.9360163458138717e-06, + "loss": 0.6973, + "step": 16510 + }, + { + "epoch": 0.42, + "learning_rate": 1.93600660665855e-06, + "loss": 1.043, + "step": 16511 + }, + { + "epoch": 0.42, + "learning_rate": 1.9359968667865718e-06, + "loss": 0.6514, + "step": 16512 + }, + { + "epoch": 0.42, + "learning_rate": 1.9359871261979434e-06, + "loss": 0.9688, + "step": 16513 + }, + { + "epoch": 0.42, + "learning_rate": 1.9359773848926727e-06, + "loss": 0.8076, + "step": 16514 + }, + { + "epoch": 0.42, + "learning_rate": 1.935967642870767e-06, + "loss": 0.9961, + "step": 16515 + }, + { + "epoch": 0.42, + "learning_rate": 1.935957900132234e-06, + "loss": 0.7422, + "step": 16516 + }, + { + "epoch": 0.42, + "learning_rate": 1.935948156677081e-06, + "loss": 0.9678, + "step": 16517 + }, + { + "epoch": 0.42, + "learning_rate": 1.9359384125053157e-06, + "loss": 1.1016, + "step": 16518 + }, + { + "epoch": 0.42, + "learning_rate": 1.9359286676169452e-06, + "loss": 0.7578, + "step": 16519 + }, + { + "epoch": 0.42, + "learning_rate": 1.9359189220119773e-06, + "loss": 0.9609, + "step": 16520 + }, + { + "epoch": 0.42, + "learning_rate": 1.935909175690419e-06, + "loss": 1.0068, + "step": 16521 + }, + { + "epoch": 0.42, + "learning_rate": 1.9358994286522785e-06, + "loss": 1.0703, + "step": 16522 + }, + { + "epoch": 0.42, + "learning_rate": 1.9358896808975625e-06, + "loss": 0.9951, + "step": 16523 + }, + { + "epoch": 0.42, + "learning_rate": 1.9358799324262795e-06, + "loss": 0.708, + "step": 16524 + }, + { + "epoch": 0.42, + "learning_rate": 1.9358701832384354e-06, + "loss": 0.7051, + "step": 16525 + }, + { + "epoch": 0.42, + "learning_rate": 1.935860433334039e-06, + "loss": 0.9463, + "step": 16526 + }, + { + "epoch": 0.42, + "learning_rate": 1.9358506827130976e-06, + "loss": 0.6235, + "step": 16527 + }, + { + "epoch": 0.42, + "learning_rate": 1.9358409313756177e-06, + "loss": 0.6914, + "step": 16528 + }, + { + "epoch": 0.42, + "learning_rate": 1.9358311793216077e-06, + "loss": 0.7695, + "step": 16529 + }, + { + "epoch": 0.42, + "learning_rate": 1.9358214265510747e-06, + "loss": 0.8701, + "step": 16530 + }, + { + "epoch": 0.42, + "learning_rate": 1.9358116730640264e-06, + "loss": 0.8193, + "step": 16531 + }, + { + "epoch": 0.42, + "learning_rate": 1.93580191886047e-06, + "loss": 0.8994, + "step": 16532 + }, + { + "epoch": 0.42, + "learning_rate": 1.9357921639404135e-06, + "loss": 1.0352, + "step": 16533 + }, + { + "epoch": 0.42, + "learning_rate": 1.935782408303863e-06, + "loss": 0.9639, + "step": 16534 + }, + { + "epoch": 0.42, + "learning_rate": 1.935772651950828e-06, + "loss": 1.0996, + "step": 16535 + }, + { + "epoch": 0.42, + "learning_rate": 1.9357628948813145e-06, + "loss": 0.8291, + "step": 16536 + }, + { + "epoch": 0.42, + "learning_rate": 1.9357531370953305e-06, + "loss": 0.7441, + "step": 16537 + }, + { + "epoch": 0.42, + "learning_rate": 1.9357433785928832e-06, + "loss": 0.9351, + "step": 16538 + }, + { + "epoch": 0.42, + "learning_rate": 1.9357336193739803e-06, + "loss": 0.8301, + "step": 16539 + }, + { + "epoch": 0.42, + "learning_rate": 1.935723859438629e-06, + "loss": 1.0156, + "step": 16540 + }, + { + "epoch": 0.42, + "learning_rate": 1.9357140987868373e-06, + "loss": 1.0518, + "step": 16541 + }, + { + "epoch": 0.42, + "learning_rate": 1.935704337418612e-06, + "loss": 0.9854, + "step": 16542 + }, + { + "epoch": 0.42, + "learning_rate": 1.9356945753339612e-06, + "loss": 0.7656, + "step": 16543 + }, + { + "epoch": 0.42, + "learning_rate": 1.9356848125328916e-06, + "loss": 0.8379, + "step": 16544 + }, + { + "epoch": 0.42, + "learning_rate": 1.9356750490154117e-06, + "loss": 0.8457, + "step": 16545 + }, + { + "epoch": 0.42, + "learning_rate": 1.9356652847815283e-06, + "loss": 0.9902, + "step": 16546 + }, + { + "epoch": 0.42, + "learning_rate": 1.935655519831249e-06, + "loss": 0.9023, + "step": 16547 + }, + { + "epoch": 0.42, + "learning_rate": 1.9356457541645814e-06, + "loss": 0.9072, + "step": 16548 + }, + { + "epoch": 0.42, + "learning_rate": 1.9356359877815327e-06, + "loss": 0.9463, + "step": 16549 + }, + { + "epoch": 0.42, + "learning_rate": 1.9356262206821105e-06, + "loss": 0.7178, + "step": 16550 + }, + { + "epoch": 0.42, + "learning_rate": 1.9356164528663225e-06, + "loss": 0.7656, + "step": 16551 + }, + { + "epoch": 0.42, + "learning_rate": 1.935606684334176e-06, + "loss": 0.8018, + "step": 16552 + }, + { + "epoch": 0.42, + "learning_rate": 1.9355969150856783e-06, + "loss": 0.8818, + "step": 16553 + }, + { + "epoch": 0.42, + "learning_rate": 1.935587145120837e-06, + "loss": 0.957, + "step": 16554 + }, + { + "epoch": 0.42, + "learning_rate": 1.93557737443966e-06, + "loss": 0.6724, + "step": 16555 + }, + { + "epoch": 0.42, + "learning_rate": 1.9355676030421543e-06, + "loss": 0.9883, + "step": 16556 + }, + { + "epoch": 0.42, + "learning_rate": 1.9355578309283272e-06, + "loss": 0.6719, + "step": 16557 + }, + { + "epoch": 0.42, + "learning_rate": 1.9355480580981868e-06, + "loss": 0.6857, + "step": 16558 + }, + { + "epoch": 0.42, + "learning_rate": 1.9355382845517402e-06, + "loss": 0.8174, + "step": 16559 + }, + { + "epoch": 0.42, + "learning_rate": 1.9355285102889947e-06, + "loss": 0.917, + "step": 16560 + }, + { + "epoch": 0.42, + "learning_rate": 1.9355187353099584e-06, + "loss": 1.0342, + "step": 16561 + }, + { + "epoch": 0.42, + "learning_rate": 1.9355089596146384e-06, + "loss": 0.9463, + "step": 16562 + }, + { + "epoch": 0.42, + "learning_rate": 1.935499183203042e-06, + "loss": 1.0166, + "step": 16563 + }, + { + "epoch": 0.42, + "learning_rate": 1.935489406075177e-06, + "loss": 0.8369, + "step": 16564 + }, + { + "epoch": 0.42, + "learning_rate": 1.9354796282310504e-06, + "loss": 1.0371, + "step": 16565 + }, + { + "epoch": 0.42, + "learning_rate": 1.9354698496706707e-06, + "loss": 0.8877, + "step": 16566 + }, + { + "epoch": 0.42, + "learning_rate": 1.9354600703940445e-06, + "loss": 0.7339, + "step": 16567 + }, + { + "epoch": 0.42, + "learning_rate": 1.935450290401179e-06, + "loss": 0.8701, + "step": 16568 + }, + { + "epoch": 0.42, + "learning_rate": 1.9354405096920835e-06, + "loss": 0.731, + "step": 16569 + }, + { + "epoch": 0.42, + "learning_rate": 1.935430728266763e-06, + "loss": 0.8501, + "step": 16570 + }, + { + "epoch": 0.42, + "learning_rate": 1.9354209461252267e-06, + "loss": 0.7695, + "step": 16571 + }, + { + "epoch": 0.42, + "learning_rate": 1.9354111632674817e-06, + "loss": 0.8242, + "step": 16572 + }, + { + "epoch": 0.42, + "learning_rate": 1.9354013796935355e-06, + "loss": 0.7939, + "step": 16573 + }, + { + "epoch": 0.42, + "learning_rate": 1.935391595403395e-06, + "loss": 0.7573, + "step": 16574 + }, + { + "epoch": 0.42, + "learning_rate": 1.9353818103970683e-06, + "loss": 0.874, + "step": 16575 + }, + { + "epoch": 0.42, + "learning_rate": 1.935372024674563e-06, + "loss": 0.8408, + "step": 16576 + }, + { + "epoch": 0.42, + "learning_rate": 1.935362238235886e-06, + "loss": 0.8218, + "step": 16577 + }, + { + "epoch": 0.42, + "learning_rate": 1.935352451081045e-06, + "loss": 1.1855, + "step": 16578 + }, + { + "epoch": 0.42, + "learning_rate": 1.9353426632100483e-06, + "loss": 0.8848, + "step": 16579 + }, + { + "epoch": 0.42, + "learning_rate": 1.9353328746229025e-06, + "loss": 0.9668, + "step": 16580 + }, + { + "epoch": 0.42, + "learning_rate": 1.9353230853196153e-06, + "loss": 0.9185, + "step": 16581 + }, + { + "epoch": 0.43, + "learning_rate": 1.935313295300194e-06, + "loss": 0.9375, + "step": 16582 + }, + { + "epoch": 0.43, + "learning_rate": 1.9353035045646465e-06, + "loss": 0.9092, + "step": 16583 + }, + { + "epoch": 0.43, + "learning_rate": 1.9352937131129797e-06, + "loss": 0.8418, + "step": 16584 + }, + { + "epoch": 0.43, + "learning_rate": 1.935283920945202e-06, + "loss": 0.8301, + "step": 16585 + }, + { + "epoch": 0.43, + "learning_rate": 1.93527412806132e-06, + "loss": 0.958, + "step": 16586 + }, + { + "epoch": 0.43, + "learning_rate": 1.9352643344613423e-06, + "loss": 0.7646, + "step": 16587 + }, + { + "epoch": 0.43, + "learning_rate": 1.9352545401452752e-06, + "loss": 1.083, + "step": 16588 + }, + { + "epoch": 0.43, + "learning_rate": 1.935244745113127e-06, + "loss": 0.8018, + "step": 16589 + }, + { + "epoch": 0.43, + "learning_rate": 1.935234949364905e-06, + "loss": 0.8271, + "step": 16590 + }, + { + "epoch": 0.43, + "learning_rate": 1.9352251529006157e-06, + "loss": 0.7031, + "step": 16591 + }, + { + "epoch": 0.43, + "learning_rate": 1.935215355720268e-06, + "loss": 0.5654, + "step": 16592 + }, + { + "epoch": 0.43, + "learning_rate": 1.9352055578238694e-06, + "loss": 0.6812, + "step": 16593 + }, + { + "epoch": 0.43, + "learning_rate": 1.9351957592114263e-06, + "loss": 0.8037, + "step": 16594 + }, + { + "epoch": 0.43, + "learning_rate": 1.935185959882947e-06, + "loss": 0.9395, + "step": 16595 + }, + { + "epoch": 0.43, + "learning_rate": 1.935176159838439e-06, + "loss": 0.9219, + "step": 16596 + }, + { + "epoch": 0.43, + "learning_rate": 1.9351663590779094e-06, + "loss": 0.6602, + "step": 16597 + }, + { + "epoch": 0.43, + "learning_rate": 1.935156557601366e-06, + "loss": 1.0957, + "step": 16598 + }, + { + "epoch": 0.43, + "learning_rate": 1.935146755408816e-06, + "loss": 0.7827, + "step": 16599 + }, + { + "epoch": 0.43, + "learning_rate": 1.9351369525002675e-06, + "loss": 1.0215, + "step": 16600 + }, + { + "epoch": 0.43, + "learning_rate": 1.9351271488757276e-06, + "loss": 1.0059, + "step": 16601 + }, + { + "epoch": 0.43, + "learning_rate": 1.9351173445352034e-06, + "loss": 1.0049, + "step": 16602 + }, + { + "epoch": 0.43, + "learning_rate": 1.9351075394787035e-06, + "loss": 0.8496, + "step": 16603 + }, + { + "epoch": 0.43, + "learning_rate": 1.935097733706234e-06, + "loss": 0.9912, + "step": 16604 + }, + { + "epoch": 0.43, + "learning_rate": 1.9350879272178038e-06, + "loss": 0.5889, + "step": 16605 + }, + { + "epoch": 0.43, + "learning_rate": 1.9350781200134193e-06, + "loss": 0.8486, + "step": 16606 + }, + { + "epoch": 0.43, + "learning_rate": 1.9350683120930886e-06, + "loss": 0.5991, + "step": 16607 + }, + { + "epoch": 0.43, + "learning_rate": 1.9350585034568195e-06, + "loss": 1.0703, + "step": 16608 + }, + { + "epoch": 0.43, + "learning_rate": 1.9350486941046187e-06, + "loss": 0.8604, + "step": 16609 + }, + { + "epoch": 0.43, + "learning_rate": 1.935038884036494e-06, + "loss": 1.0078, + "step": 16610 + }, + { + "epoch": 0.43, + "learning_rate": 1.9350290732524535e-06, + "loss": 0.8223, + "step": 16611 + }, + { + "epoch": 0.43, + "learning_rate": 1.935019261752504e-06, + "loss": 0.9023, + "step": 16612 + }, + { + "epoch": 0.43, + "learning_rate": 1.935009449536653e-06, + "loss": 1.0361, + "step": 16613 + }, + { + "epoch": 0.43, + "learning_rate": 1.9349996366049086e-06, + "loss": 0.8867, + "step": 16614 + }, + { + "epoch": 0.43, + "learning_rate": 1.934989822957278e-06, + "loss": 1.0771, + "step": 16615 + }, + { + "epoch": 0.43, + "learning_rate": 1.9349800085937684e-06, + "loss": 1.0488, + "step": 16616 + }, + { + "epoch": 0.43, + "learning_rate": 1.9349701935143877e-06, + "loss": 0.8096, + "step": 16617 + }, + { + "epoch": 0.43, + "learning_rate": 1.934960377719143e-06, + "loss": 1.0664, + "step": 16618 + }, + { + "epoch": 0.43, + "learning_rate": 1.934950561208043e-06, + "loss": 0.5962, + "step": 16619 + }, + { + "epoch": 0.43, + "learning_rate": 1.9349407439810937e-06, + "loss": 0.8955, + "step": 16620 + }, + { + "epoch": 0.43, + "learning_rate": 1.9349309260383033e-06, + "loss": 0.6782, + "step": 16621 + }, + { + "epoch": 0.43, + "learning_rate": 1.9349211073796795e-06, + "loss": 0.8926, + "step": 16622 + }, + { + "epoch": 0.43, + "learning_rate": 1.9349112880052293e-06, + "loss": 1.0303, + "step": 16623 + }, + { + "epoch": 0.43, + "learning_rate": 1.9349014679149606e-06, + "loss": 1.0918, + "step": 16624 + }, + { + "epoch": 0.43, + "learning_rate": 1.9348916471088808e-06, + "loss": 0.8369, + "step": 16625 + }, + { + "epoch": 0.43, + "learning_rate": 1.9348818255869976e-06, + "loss": 1.0371, + "step": 16626 + }, + { + "epoch": 0.43, + "learning_rate": 1.9348720033493186e-06, + "loss": 0.7842, + "step": 16627 + }, + { + "epoch": 0.43, + "learning_rate": 1.9348621803958506e-06, + "loss": 0.9688, + "step": 16628 + }, + { + "epoch": 0.43, + "learning_rate": 1.9348523567266017e-06, + "loss": 0.8584, + "step": 16629 + }, + { + "epoch": 0.43, + "learning_rate": 1.9348425323415794e-06, + "loss": 0.9766, + "step": 16630 + }, + { + "epoch": 0.43, + "learning_rate": 1.9348327072407914e-06, + "loss": 0.7969, + "step": 16631 + }, + { + "epoch": 0.43, + "learning_rate": 1.9348228814242445e-06, + "loss": 0.6121, + "step": 16632 + }, + { + "epoch": 0.43, + "learning_rate": 1.934813054891947e-06, + "loss": 0.8599, + "step": 16633 + }, + { + "epoch": 0.43, + "learning_rate": 1.9348032276439064e-06, + "loss": 0.7969, + "step": 16634 + }, + { + "epoch": 0.43, + "learning_rate": 1.9347933996801297e-06, + "loss": 0.9023, + "step": 16635 + }, + { + "epoch": 0.43, + "learning_rate": 1.9347835710006246e-06, + "loss": 0.979, + "step": 16636 + }, + { + "epoch": 0.43, + "learning_rate": 1.934773741605399e-06, + "loss": 1.083, + "step": 16637 + }, + { + "epoch": 0.43, + "learning_rate": 1.9347639114944594e-06, + "loss": 1.0244, + "step": 16638 + }, + { + "epoch": 0.43, + "learning_rate": 1.9347540806678147e-06, + "loss": 0.9004, + "step": 16639 + }, + { + "epoch": 0.43, + "learning_rate": 1.9347442491254716e-06, + "loss": 0.7734, + "step": 16640 + }, + { + "epoch": 0.43, + "learning_rate": 1.934734416867438e-06, + "loss": 0.9473, + "step": 16641 + }, + { + "epoch": 0.43, + "learning_rate": 1.9347245838937208e-06, + "loss": 0.8604, + "step": 16642 + }, + { + "epoch": 0.43, + "learning_rate": 1.9347147502043283e-06, + "loss": 1.1182, + "step": 16643 + }, + { + "epoch": 0.43, + "learning_rate": 1.934704915799268e-06, + "loss": 0.8418, + "step": 16644 + }, + { + "epoch": 0.43, + "learning_rate": 1.9346950806785465e-06, + "loss": 1.0498, + "step": 16645 + }, + { + "epoch": 0.43, + "learning_rate": 1.9346852448421724e-06, + "loss": 0.8188, + "step": 16646 + }, + { + "epoch": 0.43, + "learning_rate": 1.9346754082901524e-06, + "loss": 1.0283, + "step": 16647 + }, + { + "epoch": 0.43, + "learning_rate": 1.9346655710224947e-06, + "loss": 0.9434, + "step": 16648 + }, + { + "epoch": 0.43, + "learning_rate": 1.9346557330392067e-06, + "loss": 0.8115, + "step": 16649 + }, + { + "epoch": 0.43, + "learning_rate": 1.9346458943402954e-06, + "loss": 0.9263, + "step": 16650 + }, + { + "epoch": 0.43, + "learning_rate": 1.934636054925769e-06, + "loss": 1.1309, + "step": 16651 + }, + { + "epoch": 0.43, + "learning_rate": 1.9346262147956347e-06, + "loss": 1.0342, + "step": 16652 + }, + { + "epoch": 0.43, + "learning_rate": 1.9346163739498997e-06, + "loss": 0.7534, + "step": 16653 + }, + { + "epoch": 0.43, + "learning_rate": 1.934606532388572e-06, + "loss": 0.9512, + "step": 16654 + }, + { + "epoch": 0.43, + "learning_rate": 1.9345966901116594e-06, + "loss": 1.0039, + "step": 16655 + }, + { + "epoch": 0.43, + "learning_rate": 1.934586847119169e-06, + "loss": 0.9863, + "step": 16656 + }, + { + "epoch": 0.43, + "learning_rate": 1.9345770034111085e-06, + "loss": 0.9229, + "step": 16657 + }, + { + "epoch": 0.43, + "learning_rate": 1.934567158987485e-06, + "loss": 0.7798, + "step": 16658 + }, + { + "epoch": 0.43, + "learning_rate": 1.934557313848307e-06, + "loss": 0.7656, + "step": 16659 + }, + { + "epoch": 0.43, + "learning_rate": 1.934547467993581e-06, + "loss": 0.8623, + "step": 16660 + }, + { + "epoch": 0.43, + "learning_rate": 1.934537621423315e-06, + "loss": 0.8867, + "step": 16661 + }, + { + "epoch": 0.43, + "learning_rate": 1.9345277741375167e-06, + "loss": 0.9678, + "step": 16662 + }, + { + "epoch": 0.43, + "learning_rate": 1.934517926136193e-06, + "loss": 0.7412, + "step": 16663 + }, + { + "epoch": 0.43, + "learning_rate": 1.9345080774193523e-06, + "loss": 0.7896, + "step": 16664 + }, + { + "epoch": 0.43, + "learning_rate": 1.9344982279870016e-06, + "loss": 1.0264, + "step": 16665 + }, + { + "epoch": 0.43, + "learning_rate": 1.9344883778391487e-06, + "loss": 1.0938, + "step": 16666 + }, + { + "epoch": 0.43, + "learning_rate": 1.934478526975801e-06, + "loss": 0.959, + "step": 16667 + }, + { + "epoch": 0.43, + "learning_rate": 1.934468675396966e-06, + "loss": 0.9209, + "step": 16668 + }, + { + "epoch": 0.43, + "learning_rate": 1.934458823102651e-06, + "loss": 0.7969, + "step": 16669 + }, + { + "epoch": 0.43, + "learning_rate": 1.9344489700928645e-06, + "loss": 0.9062, + "step": 16670 + }, + { + "epoch": 0.43, + "learning_rate": 1.9344391163676132e-06, + "loss": 1.0, + "step": 16671 + }, + { + "epoch": 0.43, + "learning_rate": 1.9344292619269046e-06, + "loss": 0.7837, + "step": 16672 + }, + { + "epoch": 0.43, + "learning_rate": 1.9344194067707466e-06, + "loss": 1.0381, + "step": 16673 + }, + { + "epoch": 0.43, + "learning_rate": 1.9344095508991464e-06, + "loss": 0.9375, + "step": 16674 + }, + { + "epoch": 0.43, + "learning_rate": 1.9343996943121117e-06, + "loss": 0.7979, + "step": 16675 + }, + { + "epoch": 0.43, + "learning_rate": 1.9343898370096506e-06, + "loss": 0.874, + "step": 16676 + }, + { + "epoch": 0.43, + "learning_rate": 1.93437997899177e-06, + "loss": 0.6763, + "step": 16677 + }, + { + "epoch": 0.43, + "learning_rate": 1.9343701202584777e-06, + "loss": 0.8081, + "step": 16678 + }, + { + "epoch": 0.43, + "learning_rate": 1.9343602608097808e-06, + "loss": 0.7754, + "step": 16679 + }, + { + "epoch": 0.43, + "learning_rate": 1.9343504006456874e-06, + "loss": 0.8096, + "step": 16680 + }, + { + "epoch": 0.43, + "learning_rate": 1.9343405397662053e-06, + "loss": 0.8032, + "step": 16681 + }, + { + "epoch": 0.43, + "learning_rate": 1.9343306781713407e-06, + "loss": 0.8398, + "step": 16682 + }, + { + "epoch": 0.43, + "learning_rate": 1.9343208158611027e-06, + "loss": 0.9648, + "step": 16683 + }, + { + "epoch": 0.43, + "learning_rate": 1.9343109528354982e-06, + "loss": 0.7969, + "step": 16684 + }, + { + "epoch": 0.43, + "learning_rate": 1.9343010890945347e-06, + "loss": 0.8672, + "step": 16685 + }, + { + "epoch": 0.43, + "learning_rate": 1.9342912246382196e-06, + "loss": 0.7881, + "step": 16686 + }, + { + "epoch": 0.43, + "learning_rate": 1.9342813594665607e-06, + "loss": 0.9844, + "step": 16687 + }, + { + "epoch": 0.43, + "learning_rate": 1.934271493579566e-06, + "loss": 0.9248, + "step": 16688 + }, + { + "epoch": 0.43, + "learning_rate": 1.934261626977242e-06, + "loss": 0.9941, + "step": 16689 + }, + { + "epoch": 0.43, + "learning_rate": 1.934251759659597e-06, + "loss": 0.8369, + "step": 16690 + }, + { + "epoch": 0.43, + "learning_rate": 1.9342418916266384e-06, + "loss": 0.8975, + "step": 16691 + }, + { + "epoch": 0.43, + "learning_rate": 1.934232022878374e-06, + "loss": 0.7949, + "step": 16692 + }, + { + "epoch": 0.43, + "learning_rate": 1.9342221534148105e-06, + "loss": 0.7939, + "step": 16693 + }, + { + "epoch": 0.43, + "learning_rate": 1.934212283235957e-06, + "loss": 0.9512, + "step": 16694 + }, + { + "epoch": 0.43, + "learning_rate": 1.934202412341819e-06, + "loss": 0.9561, + "step": 16695 + }, + { + "epoch": 0.43, + "learning_rate": 1.934192540732406e-06, + "loss": 0.8496, + "step": 16696 + }, + { + "epoch": 0.43, + "learning_rate": 1.9341826684077247e-06, + "loss": 1.0391, + "step": 16697 + }, + { + "epoch": 0.43, + "learning_rate": 1.934172795367782e-06, + "loss": 0.958, + "step": 16698 + }, + { + "epoch": 0.43, + "learning_rate": 1.9341629216125866e-06, + "loss": 0.9561, + "step": 16699 + }, + { + "epoch": 0.43, + "learning_rate": 1.9341530471421458e-06, + "loss": 0.9893, + "step": 16700 + }, + { + "epoch": 0.43, + "learning_rate": 1.9341431719564665e-06, + "loss": 0.918, + "step": 16701 + }, + { + "epoch": 0.43, + "learning_rate": 1.934133296055557e-06, + "loss": 0.9434, + "step": 16702 + }, + { + "epoch": 0.43, + "learning_rate": 1.9341234194394244e-06, + "loss": 0.606, + "step": 16703 + }, + { + "epoch": 0.43, + "learning_rate": 1.9341135421080768e-06, + "loss": 0.8691, + "step": 16704 + }, + { + "epoch": 0.43, + "learning_rate": 1.9341036640615213e-06, + "loss": 0.8965, + "step": 16705 + }, + { + "epoch": 0.43, + "learning_rate": 1.9340937852997654e-06, + "loss": 0.8887, + "step": 16706 + }, + { + "epoch": 0.43, + "learning_rate": 1.934083905822817e-06, + "loss": 0.9648, + "step": 16707 + }, + { + "epoch": 0.43, + "learning_rate": 1.9340740256306837e-06, + "loss": 0.811, + "step": 16708 + }, + { + "epoch": 0.43, + "learning_rate": 1.9340641447233723e-06, + "loss": 0.8916, + "step": 16709 + }, + { + "epoch": 0.43, + "learning_rate": 1.9340542631008914e-06, + "loss": 0.7686, + "step": 16710 + }, + { + "epoch": 0.43, + "learning_rate": 1.934044380763248e-06, + "loss": 0.7722, + "step": 16711 + }, + { + "epoch": 0.43, + "learning_rate": 1.9340344977104494e-06, + "loss": 1.0273, + "step": 16712 + }, + { + "epoch": 0.43, + "learning_rate": 1.934024613942504e-06, + "loss": 1.001, + "step": 16713 + }, + { + "epoch": 0.43, + "learning_rate": 1.934014729459419e-06, + "loss": 1.0967, + "step": 16714 + }, + { + "epoch": 0.43, + "learning_rate": 1.934004844261201e-06, + "loss": 0.8164, + "step": 16715 + }, + { + "epoch": 0.43, + "learning_rate": 1.9339949583478592e-06, + "loss": 0.7412, + "step": 16716 + }, + { + "epoch": 0.43, + "learning_rate": 1.9339850717194005e-06, + "loss": 1.0371, + "step": 16717 + }, + { + "epoch": 0.43, + "learning_rate": 1.933975184375832e-06, + "loss": 0.8591, + "step": 16718 + }, + { + "epoch": 0.43, + "learning_rate": 1.9339652963171617e-06, + "loss": 0.7979, + "step": 16719 + }, + { + "epoch": 0.43, + "learning_rate": 1.933955407543397e-06, + "loss": 0.9912, + "step": 16720 + }, + { + "epoch": 0.43, + "learning_rate": 1.933945518054546e-06, + "loss": 1.0176, + "step": 16721 + }, + { + "epoch": 0.43, + "learning_rate": 1.933935627850616e-06, + "loss": 0.8896, + "step": 16722 + }, + { + "epoch": 0.43, + "learning_rate": 1.933925736931614e-06, + "loss": 0.8916, + "step": 16723 + }, + { + "epoch": 0.43, + "learning_rate": 1.933915845297548e-06, + "loss": 0.668, + "step": 16724 + }, + { + "epoch": 0.43, + "learning_rate": 1.9339059529484256e-06, + "loss": 0.5071, + "step": 16725 + }, + { + "epoch": 0.43, + "learning_rate": 1.933896059884254e-06, + "loss": 0.8672, + "step": 16726 + }, + { + "epoch": 0.43, + "learning_rate": 1.9338861661050416e-06, + "loss": 1.0977, + "step": 16727 + }, + { + "epoch": 0.43, + "learning_rate": 1.9338762716107957e-06, + "loss": 0.7861, + "step": 16728 + }, + { + "epoch": 0.43, + "learning_rate": 1.933866376401523e-06, + "loss": 1.1006, + "step": 16729 + }, + { + "epoch": 0.43, + "learning_rate": 1.9338564804772327e-06, + "loss": 0.8174, + "step": 16730 + }, + { + "epoch": 0.43, + "learning_rate": 1.933846583837931e-06, + "loss": 0.8848, + "step": 16731 + }, + { + "epoch": 0.43, + "learning_rate": 1.9338366864836256e-06, + "loss": 1.0127, + "step": 16732 + }, + { + "epoch": 0.43, + "learning_rate": 1.9338267884143247e-06, + "loss": 1.0371, + "step": 16733 + }, + { + "epoch": 0.43, + "learning_rate": 1.9338168896300356e-06, + "loss": 1.0566, + "step": 16734 + }, + { + "epoch": 0.43, + "learning_rate": 1.9338069901307655e-06, + "loss": 0.6345, + "step": 16735 + }, + { + "epoch": 0.43, + "learning_rate": 1.9337970899165226e-06, + "loss": 0.9883, + "step": 16736 + }, + { + "epoch": 0.43, + "learning_rate": 1.9337871889873144e-06, + "loss": 0.873, + "step": 16737 + }, + { + "epoch": 0.43, + "learning_rate": 1.9337772873431478e-06, + "loss": 1.0, + "step": 16738 + }, + { + "epoch": 0.43, + "learning_rate": 1.933767384984031e-06, + "loss": 0.9287, + "step": 16739 + }, + { + "epoch": 0.43, + "learning_rate": 1.933757481909972e-06, + "loss": 0.7241, + "step": 16740 + }, + { + "epoch": 0.43, + "learning_rate": 1.9337475781209773e-06, + "loss": 0.8818, + "step": 16741 + }, + { + "epoch": 0.43, + "learning_rate": 1.9337376736170546e-06, + "loss": 0.8125, + "step": 16742 + }, + { + "epoch": 0.43, + "learning_rate": 1.933727768398213e-06, + "loss": 1.04, + "step": 16743 + }, + { + "epoch": 0.43, + "learning_rate": 1.9337178624644582e-06, + "loss": 0.9023, + "step": 16744 + }, + { + "epoch": 0.43, + "learning_rate": 1.9337079558157986e-06, + "loss": 0.8027, + "step": 16745 + }, + { + "epoch": 0.43, + "learning_rate": 1.933698048452242e-06, + "loss": 0.9795, + "step": 16746 + }, + { + "epoch": 0.43, + "learning_rate": 1.9336881403737956e-06, + "loss": 0.7725, + "step": 16747 + }, + { + "epoch": 0.43, + "learning_rate": 1.933678231580467e-06, + "loss": 0.8169, + "step": 16748 + }, + { + "epoch": 0.43, + "learning_rate": 1.933668322072264e-06, + "loss": 0.8926, + "step": 16749 + }, + { + "epoch": 0.43, + "learning_rate": 1.9336584118491944e-06, + "loss": 0.9131, + "step": 16750 + }, + { + "epoch": 0.43, + "learning_rate": 1.933648500911265e-06, + "loss": 0.8516, + "step": 16751 + }, + { + "epoch": 0.43, + "learning_rate": 1.9336385892584845e-06, + "loss": 0.79, + "step": 16752 + }, + { + "epoch": 0.43, + "learning_rate": 1.9336286768908595e-06, + "loss": 0.8052, + "step": 16753 + }, + { + "epoch": 0.43, + "learning_rate": 1.9336187638083976e-06, + "loss": 1.0439, + "step": 16754 + }, + { + "epoch": 0.43, + "learning_rate": 1.9336088500111073e-06, + "loss": 0.7739, + "step": 16755 + }, + { + "epoch": 0.43, + "learning_rate": 1.9335989354989956e-06, + "loss": 0.9414, + "step": 16756 + }, + { + "epoch": 0.43, + "learning_rate": 1.9335890202720695e-06, + "loss": 0.8926, + "step": 16757 + }, + { + "epoch": 0.43, + "learning_rate": 1.9335791043303378e-06, + "loss": 0.8457, + "step": 16758 + }, + { + "epoch": 0.43, + "learning_rate": 1.9335691876738072e-06, + "loss": 0.8701, + "step": 16759 + }, + { + "epoch": 0.43, + "learning_rate": 1.933559270302486e-06, + "loss": 0.8159, + "step": 16760 + }, + { + "epoch": 0.43, + "learning_rate": 1.933549352216381e-06, + "loss": 0.7393, + "step": 16761 + }, + { + "epoch": 0.43, + "learning_rate": 1.9335394334155006e-06, + "loss": 0.7266, + "step": 16762 + }, + { + "epoch": 0.43, + "learning_rate": 1.9335295138998514e-06, + "loss": 0.7705, + "step": 16763 + }, + { + "epoch": 0.43, + "learning_rate": 1.933519593669442e-06, + "loss": 1.0137, + "step": 16764 + }, + { + "epoch": 0.43, + "learning_rate": 1.9335096727242794e-06, + "loss": 1.0049, + "step": 16765 + }, + { + "epoch": 0.43, + "learning_rate": 1.9334997510643714e-06, + "loss": 0.7734, + "step": 16766 + }, + { + "epoch": 0.43, + "learning_rate": 1.9334898286897255e-06, + "loss": 0.9668, + "step": 16767 + }, + { + "epoch": 0.43, + "learning_rate": 1.9334799056003495e-06, + "loss": 0.6597, + "step": 16768 + }, + { + "epoch": 0.43, + "learning_rate": 1.933469981796251e-06, + "loss": 0.793, + "step": 16769 + }, + { + "epoch": 0.43, + "learning_rate": 1.9334600572774372e-06, + "loss": 0.8174, + "step": 16770 + }, + { + "epoch": 0.43, + "learning_rate": 1.933450132043916e-06, + "loss": 0.8818, + "step": 16771 + }, + { + "epoch": 0.43, + "learning_rate": 1.933440206095695e-06, + "loss": 1.0225, + "step": 16772 + }, + { + "epoch": 0.43, + "learning_rate": 1.9334302794327816e-06, + "loss": 0.7686, + "step": 16773 + }, + { + "epoch": 0.43, + "learning_rate": 1.933420352055184e-06, + "loss": 0.9805, + "step": 16774 + }, + { + "epoch": 0.43, + "learning_rate": 1.933410423962909e-06, + "loss": 0.9629, + "step": 16775 + }, + { + "epoch": 0.43, + "learning_rate": 1.9334004951559644e-06, + "loss": 1.0713, + "step": 16776 + }, + { + "epoch": 0.43, + "learning_rate": 1.933390565634358e-06, + "loss": 0.9307, + "step": 16777 + }, + { + "epoch": 0.43, + "learning_rate": 1.9333806353980976e-06, + "loss": 1.125, + "step": 16778 + }, + { + "epoch": 0.43, + "learning_rate": 1.9333707044471906e-06, + "loss": 0.7988, + "step": 16779 + }, + { + "epoch": 0.43, + "learning_rate": 1.9333607727816445e-06, + "loss": 0.7773, + "step": 16780 + }, + { + "epoch": 0.43, + "learning_rate": 1.933350840401467e-06, + "loss": 0.8496, + "step": 16781 + }, + { + "epoch": 0.43, + "learning_rate": 1.9333409073066653e-06, + "loss": 0.9688, + "step": 16782 + }, + { + "epoch": 0.43, + "learning_rate": 1.933330973497248e-06, + "loss": 0.9092, + "step": 16783 + }, + { + "epoch": 0.43, + "learning_rate": 1.933321038973222e-06, + "loss": 0.8652, + "step": 16784 + }, + { + "epoch": 0.43, + "learning_rate": 1.9333111037345947e-06, + "loss": 1.0088, + "step": 16785 + }, + { + "epoch": 0.43, + "learning_rate": 1.933301167781374e-06, + "loss": 0.8975, + "step": 16786 + }, + { + "epoch": 0.43, + "learning_rate": 1.9332912311135675e-06, + "loss": 0.8721, + "step": 16787 + }, + { + "epoch": 0.43, + "learning_rate": 1.933281293731183e-06, + "loss": 1.0254, + "step": 16788 + }, + { + "epoch": 0.43, + "learning_rate": 1.933271355634228e-06, + "loss": 0.7539, + "step": 16789 + }, + { + "epoch": 0.43, + "learning_rate": 1.9332614168227095e-06, + "loss": 1.0195, + "step": 16790 + }, + { + "epoch": 0.43, + "learning_rate": 1.9332514772966363e-06, + "loss": 0.9287, + "step": 16791 + }, + { + "epoch": 0.43, + "learning_rate": 1.933241537056015e-06, + "loss": 0.9766, + "step": 16792 + }, + { + "epoch": 0.43, + "learning_rate": 1.9332315961008535e-06, + "loss": 0.6392, + "step": 16793 + }, + { + "epoch": 0.43, + "learning_rate": 1.93322165443116e-06, + "loss": 0.9365, + "step": 16794 + }, + { + "epoch": 0.43, + "learning_rate": 1.933211712046941e-06, + "loss": 0.8096, + "step": 16795 + }, + { + "epoch": 0.43, + "learning_rate": 1.933201768948205e-06, + "loss": 0.9541, + "step": 16796 + }, + { + "epoch": 0.43, + "learning_rate": 1.9331918251349593e-06, + "loss": 0.7488, + "step": 16797 + }, + { + "epoch": 0.43, + "learning_rate": 1.933181880607211e-06, + "loss": 1.0156, + "step": 16798 + }, + { + "epoch": 0.43, + "learning_rate": 1.933171935364969e-06, + "loss": 0.8818, + "step": 16799 + }, + { + "epoch": 0.43, + "learning_rate": 1.93316198940824e-06, + "loss": 0.8252, + "step": 16800 + }, + { + "epoch": 0.43, + "learning_rate": 1.933152042737031e-06, + "loss": 1.0869, + "step": 16801 + }, + { + "epoch": 0.43, + "learning_rate": 1.9331420953513515e-06, + "loss": 0.9814, + "step": 16802 + }, + { + "epoch": 0.43, + "learning_rate": 1.9331321472512075e-06, + "loss": 0.915, + "step": 16803 + }, + { + "epoch": 0.43, + "learning_rate": 1.933122198436607e-06, + "loss": 0.8447, + "step": 16804 + }, + { + "epoch": 0.43, + "learning_rate": 1.933112248907558e-06, + "loss": 0.8984, + "step": 16805 + }, + { + "epoch": 0.43, + "learning_rate": 1.9331022986640677e-06, + "loss": 1.0244, + "step": 16806 + }, + { + "epoch": 0.43, + "learning_rate": 1.933092347706144e-06, + "loss": 0.7778, + "step": 16807 + }, + { + "epoch": 0.43, + "learning_rate": 1.9330823960337943e-06, + "loss": 0.4589, + "step": 16808 + }, + { + "epoch": 0.43, + "learning_rate": 1.9330724436470263e-06, + "loss": 0.8887, + "step": 16809 + }, + { + "epoch": 0.43, + "learning_rate": 1.9330624905458478e-06, + "loss": 0.7627, + "step": 16810 + }, + { + "epoch": 0.43, + "learning_rate": 1.933052536730266e-06, + "loss": 0.9941, + "step": 16811 + }, + { + "epoch": 0.43, + "learning_rate": 1.933042582200289e-06, + "loss": 1.0283, + "step": 16812 + }, + { + "epoch": 0.43, + "learning_rate": 1.933032626955924e-06, + "loss": 0.8931, + "step": 16813 + }, + { + "epoch": 0.43, + "learning_rate": 1.9330226709971787e-06, + "loss": 1.1104, + "step": 16814 + }, + { + "epoch": 0.43, + "learning_rate": 1.9330127143240614e-06, + "loss": 0.6362, + "step": 16815 + }, + { + "epoch": 0.43, + "learning_rate": 1.933002756936579e-06, + "loss": 0.7676, + "step": 16816 + }, + { + "epoch": 0.43, + "learning_rate": 1.9329927988347386e-06, + "loss": 0.916, + "step": 16817 + }, + { + "epoch": 0.43, + "learning_rate": 1.932982840018549e-06, + "loss": 1.0859, + "step": 16818 + }, + { + "epoch": 0.43, + "learning_rate": 1.9329728804880174e-06, + "loss": 0.7324, + "step": 16819 + }, + { + "epoch": 0.43, + "learning_rate": 1.9329629202431515e-06, + "loss": 0.8135, + "step": 16820 + }, + { + "epoch": 0.43, + "learning_rate": 1.9329529592839586e-06, + "loss": 0.8701, + "step": 16821 + }, + { + "epoch": 0.43, + "learning_rate": 1.9329429976104467e-06, + "loss": 0.853, + "step": 16822 + }, + { + "epoch": 0.43, + "learning_rate": 1.932933035222623e-06, + "loss": 0.9092, + "step": 16823 + }, + { + "epoch": 0.43, + "learning_rate": 1.9329230721204955e-06, + "loss": 0.8535, + "step": 16824 + }, + { + "epoch": 0.43, + "learning_rate": 1.9329131083040716e-06, + "loss": 1.0098, + "step": 16825 + }, + { + "epoch": 0.43, + "learning_rate": 1.932903143773359e-06, + "loss": 0.7993, + "step": 16826 + }, + { + "epoch": 0.43, + "learning_rate": 1.9328931785283654e-06, + "loss": 0.8555, + "step": 16827 + }, + { + "epoch": 0.43, + "learning_rate": 1.9328832125690984e-06, + "loss": 0.9512, + "step": 16828 + }, + { + "epoch": 0.43, + "learning_rate": 1.932873245895566e-06, + "loss": 0.9541, + "step": 16829 + }, + { + "epoch": 0.43, + "learning_rate": 1.932863278507775e-06, + "loss": 0.9424, + "step": 16830 + }, + { + "epoch": 0.43, + "learning_rate": 1.932853310405733e-06, + "loss": 0.9404, + "step": 16831 + }, + { + "epoch": 0.43, + "learning_rate": 1.9328433415894493e-06, + "loss": 1.0859, + "step": 16832 + }, + { + "epoch": 0.43, + "learning_rate": 1.9328333720589292e-06, + "loss": 0.8867, + "step": 16833 + }, + { + "epoch": 0.43, + "learning_rate": 1.932823401814182e-06, + "loss": 0.9893, + "step": 16834 + }, + { + "epoch": 0.43, + "learning_rate": 1.932813430855215e-06, + "loss": 1.0176, + "step": 16835 + }, + { + "epoch": 0.43, + "learning_rate": 1.9328034591820357e-06, + "loss": 0.7114, + "step": 16836 + }, + { + "epoch": 0.43, + "learning_rate": 1.9327934867946514e-06, + "loss": 0.9639, + "step": 16837 + }, + { + "epoch": 0.43, + "learning_rate": 1.93278351369307e-06, + "loss": 0.7275, + "step": 16838 + }, + { + "epoch": 0.43, + "learning_rate": 1.9327735398772993e-06, + "loss": 0.9092, + "step": 16839 + }, + { + "epoch": 0.43, + "learning_rate": 1.932763565347347e-06, + "loss": 0.8936, + "step": 16840 + }, + { + "epoch": 0.43, + "learning_rate": 1.93275359010322e-06, + "loss": 0.9248, + "step": 16841 + }, + { + "epoch": 0.43, + "learning_rate": 1.9327436141449267e-06, + "loss": 0.8433, + "step": 16842 + }, + { + "epoch": 0.43, + "learning_rate": 1.9327336374724746e-06, + "loss": 0.8711, + "step": 16843 + }, + { + "epoch": 0.43, + "learning_rate": 1.932723660085871e-06, + "loss": 0.7786, + "step": 16844 + }, + { + "epoch": 0.43, + "learning_rate": 1.932713681985124e-06, + "loss": 0.751, + "step": 16845 + }, + { + "epoch": 0.43, + "learning_rate": 1.932703703170241e-06, + "loss": 0.7148, + "step": 16846 + }, + { + "epoch": 0.43, + "learning_rate": 1.9326937236412297e-06, + "loss": 1.0098, + "step": 16847 + }, + { + "epoch": 0.43, + "learning_rate": 1.9326837433980976e-06, + "loss": 0.9658, + "step": 16848 + }, + { + "epoch": 0.43, + "learning_rate": 1.9326737624408523e-06, + "loss": 0.7959, + "step": 16849 + }, + { + "epoch": 0.43, + "learning_rate": 1.932663780769502e-06, + "loss": 0.7754, + "step": 16850 + }, + { + "epoch": 0.43, + "learning_rate": 1.9326537983840537e-06, + "loss": 0.8994, + "step": 16851 + }, + { + "epoch": 0.43, + "learning_rate": 1.932643815284515e-06, + "loss": 0.9473, + "step": 16852 + }, + { + "epoch": 0.43, + "learning_rate": 1.932633831470894e-06, + "loss": 0.8213, + "step": 16853 + }, + { + "epoch": 0.43, + "learning_rate": 1.9326238469431985e-06, + "loss": 0.8115, + "step": 16854 + }, + { + "epoch": 0.43, + "learning_rate": 1.9326138617014353e-06, + "loss": 1.0918, + "step": 16855 + }, + { + "epoch": 0.43, + "learning_rate": 1.9326038757456127e-06, + "loss": 0.7129, + "step": 16856 + }, + { + "epoch": 0.43, + "learning_rate": 1.9325938890757384e-06, + "loss": 0.6763, + "step": 16857 + }, + { + "epoch": 0.43, + "learning_rate": 1.9325839016918195e-06, + "loss": 1.0137, + "step": 16858 + }, + { + "epoch": 0.43, + "learning_rate": 1.9325739135938646e-06, + "loss": 0.6396, + "step": 16859 + }, + { + "epoch": 0.43, + "learning_rate": 1.9325639247818804e-06, + "loss": 0.7236, + "step": 16860 + }, + { + "epoch": 0.43, + "learning_rate": 1.9325539352558745e-06, + "loss": 1.0732, + "step": 16861 + }, + { + "epoch": 0.43, + "learning_rate": 1.9325439450158554e-06, + "loss": 0.8535, + "step": 16862 + }, + { + "epoch": 0.43, + "learning_rate": 1.9325339540618303e-06, + "loss": 0.9248, + "step": 16863 + }, + { + "epoch": 0.43, + "learning_rate": 1.9325239623938064e-06, + "loss": 0.9092, + "step": 16864 + }, + { + "epoch": 0.43, + "learning_rate": 1.932513970011792e-06, + "loss": 1.0752, + "step": 16865 + }, + { + "epoch": 0.43, + "learning_rate": 1.932503976915795e-06, + "loss": 0.8047, + "step": 16866 + }, + { + "epoch": 0.43, + "learning_rate": 1.932493983105822e-06, + "loss": 0.6582, + "step": 16867 + }, + { + "epoch": 0.43, + "learning_rate": 1.9324839885818812e-06, + "loss": 0.5222, + "step": 16868 + }, + { + "epoch": 0.43, + "learning_rate": 1.9324739933439806e-06, + "loss": 0.9238, + "step": 16869 + }, + { + "epoch": 0.43, + "learning_rate": 1.9324639973921274e-06, + "loss": 0.7861, + "step": 16870 + }, + { + "epoch": 0.43, + "learning_rate": 1.9324540007263296e-06, + "loss": 0.9854, + "step": 16871 + }, + { + "epoch": 0.43, + "learning_rate": 1.9324440033465944e-06, + "loss": 0.7539, + "step": 16872 + }, + { + "epoch": 0.43, + "learning_rate": 1.9324340052529295e-06, + "loss": 1.0029, + "step": 16873 + }, + { + "epoch": 0.43, + "learning_rate": 1.9324240064453428e-06, + "loss": 0.728, + "step": 16874 + }, + { + "epoch": 0.43, + "learning_rate": 1.9324140069238424e-06, + "loss": 0.9258, + "step": 16875 + }, + { + "epoch": 0.43, + "learning_rate": 1.932404006688435e-06, + "loss": 0.8721, + "step": 16876 + }, + { + "epoch": 0.43, + "learning_rate": 1.932394005739129e-06, + "loss": 0.6309, + "step": 16877 + }, + { + "epoch": 0.43, + "learning_rate": 1.9323840040759318e-06, + "loss": 0.9248, + "step": 16878 + }, + { + "epoch": 0.43, + "learning_rate": 1.932374001698851e-06, + "loss": 0.8623, + "step": 16879 + }, + { + "epoch": 0.43, + "learning_rate": 1.9323639986078943e-06, + "loss": 0.8799, + "step": 16880 + }, + { + "epoch": 0.43, + "learning_rate": 1.932353994803069e-06, + "loss": 0.8115, + "step": 16881 + }, + { + "epoch": 0.43, + "learning_rate": 1.9323439902843835e-06, + "loss": 1.0352, + "step": 16882 + }, + { + "epoch": 0.43, + "learning_rate": 1.9323339850518452e-06, + "loss": 0.8887, + "step": 16883 + }, + { + "epoch": 0.43, + "learning_rate": 1.9323239791054615e-06, + "loss": 1.0586, + "step": 16884 + }, + { + "epoch": 0.43, + "learning_rate": 1.93231397244524e-06, + "loss": 0.896, + "step": 16885 + }, + { + "epoch": 0.43, + "learning_rate": 1.932303965071189e-06, + "loss": 0.957, + "step": 16886 + }, + { + "epoch": 0.43, + "learning_rate": 1.9322939569833153e-06, + "loss": 0.8799, + "step": 16887 + }, + { + "epoch": 0.43, + "learning_rate": 1.932283948181627e-06, + "loss": 0.8682, + "step": 16888 + }, + { + "epoch": 0.43, + "learning_rate": 1.932273938666132e-06, + "loss": 0.8345, + "step": 16889 + }, + { + "epoch": 0.43, + "learning_rate": 1.9322639284368375e-06, + "loss": 0.9844, + "step": 16890 + }, + { + "epoch": 0.43, + "learning_rate": 1.9322539174937513e-06, + "loss": 1.042, + "step": 16891 + }, + { + "epoch": 0.43, + "learning_rate": 1.9322439058368815e-06, + "loss": 0.8071, + "step": 16892 + }, + { + "epoch": 0.43, + "learning_rate": 1.932233893466235e-06, + "loss": 0.8296, + "step": 16893 + }, + { + "epoch": 0.43, + "learning_rate": 1.93222388038182e-06, + "loss": 1.0576, + "step": 16894 + }, + { + "epoch": 0.43, + "learning_rate": 1.9322138665836443e-06, + "loss": 0.5908, + "step": 16895 + }, + { + "epoch": 0.43, + "learning_rate": 1.9322038520717148e-06, + "loss": 0.8628, + "step": 16896 + }, + { + "epoch": 0.43, + "learning_rate": 1.93219383684604e-06, + "loss": 0.8584, + "step": 16897 + }, + { + "epoch": 0.43, + "learning_rate": 1.9321838209066273e-06, + "loss": 0.7998, + "step": 16898 + }, + { + "epoch": 0.43, + "learning_rate": 1.9321738042534845e-06, + "loss": 0.9697, + "step": 16899 + }, + { + "epoch": 0.43, + "learning_rate": 1.9321637868866186e-06, + "loss": 0.9639, + "step": 16900 + }, + { + "epoch": 0.43, + "learning_rate": 1.9321537688060377e-06, + "loss": 0.8457, + "step": 16901 + }, + { + "epoch": 0.43, + "learning_rate": 1.93214375001175e-06, + "loss": 0.8848, + "step": 16902 + }, + { + "epoch": 0.43, + "learning_rate": 1.9321337305037625e-06, + "loss": 1.0186, + "step": 16903 + }, + { + "epoch": 0.43, + "learning_rate": 1.932123710282083e-06, + "loss": 0.9023, + "step": 16904 + }, + { + "epoch": 0.43, + "learning_rate": 1.9321136893467195e-06, + "loss": 0.9092, + "step": 16905 + }, + { + "epoch": 0.43, + "learning_rate": 1.932103667697679e-06, + "loss": 0.9941, + "step": 16906 + }, + { + "epoch": 0.43, + "learning_rate": 1.93209364533497e-06, + "loss": 1.0273, + "step": 16907 + }, + { + "epoch": 0.43, + "learning_rate": 1.9320836222585994e-06, + "loss": 0.8672, + "step": 16908 + }, + { + "epoch": 0.43, + "learning_rate": 1.9320735984685755e-06, + "loss": 0.7969, + "step": 16909 + }, + { + "epoch": 0.43, + "learning_rate": 1.932063573964905e-06, + "loss": 0.9912, + "step": 16910 + }, + { + "epoch": 0.43, + "learning_rate": 1.9320535487475974e-06, + "loss": 0.9229, + "step": 16911 + }, + { + "epoch": 0.43, + "learning_rate": 1.9320435228166583e-06, + "loss": 0.6309, + "step": 16912 + }, + { + "epoch": 0.43, + "learning_rate": 1.9320334961720966e-06, + "loss": 0.9238, + "step": 16913 + }, + { + "epoch": 0.43, + "learning_rate": 1.93202346881392e-06, + "loss": 0.6692, + "step": 16914 + }, + { + "epoch": 0.43, + "learning_rate": 1.932013440742136e-06, + "loss": 0.9355, + "step": 16915 + }, + { + "epoch": 0.43, + "learning_rate": 1.9320034119567517e-06, + "loss": 0.9834, + "step": 16916 + }, + { + "epoch": 0.43, + "learning_rate": 1.9319933824577754e-06, + "loss": 1.1289, + "step": 16917 + }, + { + "epoch": 0.43, + "learning_rate": 1.9319833522452144e-06, + "loss": 1.0781, + "step": 16918 + }, + { + "epoch": 0.43, + "learning_rate": 1.9319733213190773e-06, + "loss": 0.8486, + "step": 16919 + }, + { + "epoch": 0.43, + "learning_rate": 1.9319632896793704e-06, + "loss": 0.9854, + "step": 16920 + }, + { + "epoch": 0.43, + "learning_rate": 1.9319532573261022e-06, + "loss": 0.7588, + "step": 16921 + }, + { + "epoch": 0.43, + "learning_rate": 1.9319432242592804e-06, + "loss": 0.8623, + "step": 16922 + }, + { + "epoch": 0.43, + "learning_rate": 1.9319331904789124e-06, + "loss": 0.8896, + "step": 16923 + }, + { + "epoch": 0.43, + "learning_rate": 1.931923155985006e-06, + "loss": 0.6887, + "step": 16924 + }, + { + "epoch": 0.43, + "learning_rate": 1.931913120777569e-06, + "loss": 0.9121, + "step": 16925 + }, + { + "epoch": 0.43, + "learning_rate": 1.931903084856609e-06, + "loss": 0.8027, + "step": 16926 + }, + { + "epoch": 0.43, + "learning_rate": 1.9318930482221334e-06, + "loss": 0.6973, + "step": 16927 + }, + { + "epoch": 0.43, + "learning_rate": 1.9318830108741504e-06, + "loss": 1.1602, + "step": 16928 + }, + { + "epoch": 0.43, + "learning_rate": 1.9318729728126674e-06, + "loss": 0.5845, + "step": 16929 + }, + { + "epoch": 0.43, + "learning_rate": 1.9318629340376922e-06, + "loss": 1.1162, + "step": 16930 + }, + { + "epoch": 0.43, + "learning_rate": 1.931852894549232e-06, + "loss": 1.0459, + "step": 16931 + }, + { + "epoch": 0.43, + "learning_rate": 1.931842854347295e-06, + "loss": 0.9551, + "step": 16932 + }, + { + "epoch": 0.43, + "learning_rate": 1.931832813431889e-06, + "loss": 0.9404, + "step": 16933 + }, + { + "epoch": 0.43, + "learning_rate": 1.9318227718030215e-06, + "loss": 0.8906, + "step": 16934 + }, + { + "epoch": 0.43, + "learning_rate": 1.9318127294607e-06, + "loss": 0.748, + "step": 16935 + }, + { + "epoch": 0.43, + "learning_rate": 1.9318026864049327e-06, + "loss": 0.7979, + "step": 16936 + }, + { + "epoch": 0.43, + "learning_rate": 1.9317926426357267e-06, + "loss": 1.0098, + "step": 16937 + }, + { + "epoch": 0.43, + "learning_rate": 1.9317825981530894e-06, + "loss": 0.9492, + "step": 16938 + }, + { + "epoch": 0.43, + "learning_rate": 1.9317725529570293e-06, + "loss": 0.9604, + "step": 16939 + }, + { + "epoch": 0.43, + "learning_rate": 1.931762507047554e-06, + "loss": 0.8081, + "step": 16940 + }, + { + "epoch": 0.43, + "learning_rate": 1.931752460424671e-06, + "loss": 0.8726, + "step": 16941 + }, + { + "epoch": 0.43, + "learning_rate": 1.931742413088388e-06, + "loss": 0.8975, + "step": 16942 + }, + { + "epoch": 0.43, + "learning_rate": 1.9317323650387124e-06, + "loss": 0.8643, + "step": 16943 + }, + { + "epoch": 0.43, + "learning_rate": 1.9317223162756526e-06, + "loss": 0.7998, + "step": 16944 + }, + { + "epoch": 0.43, + "learning_rate": 1.9317122667992157e-06, + "loss": 0.9941, + "step": 16945 + }, + { + "epoch": 0.43, + "learning_rate": 1.9317022166094094e-06, + "loss": 0.875, + "step": 16946 + }, + { + "epoch": 0.43, + "learning_rate": 1.9316921657062416e-06, + "loss": 0.7656, + "step": 16947 + }, + { + "epoch": 0.43, + "learning_rate": 1.93168211408972e-06, + "loss": 1.0215, + "step": 16948 + }, + { + "epoch": 0.43, + "learning_rate": 1.931672061759852e-06, + "loss": 0.8779, + "step": 16949 + }, + { + "epoch": 0.43, + "learning_rate": 1.9316620087166457e-06, + "loss": 0.9385, + "step": 16950 + }, + { + "epoch": 0.43, + "learning_rate": 1.931651954960109e-06, + "loss": 0.9727, + "step": 16951 + }, + { + "epoch": 0.43, + "learning_rate": 1.931641900490249e-06, + "loss": 0.8135, + "step": 16952 + }, + { + "epoch": 0.43, + "learning_rate": 1.9316318453070737e-06, + "loss": 0.8115, + "step": 16953 + }, + { + "epoch": 0.43, + "learning_rate": 1.9316217894105903e-06, + "loss": 0.8057, + "step": 16954 + }, + { + "epoch": 0.43, + "learning_rate": 1.9316117328008075e-06, + "loss": 1.0371, + "step": 16955 + }, + { + "epoch": 0.43, + "learning_rate": 1.931601675477732e-06, + "loss": 0.9385, + "step": 16956 + }, + { + "epoch": 0.43, + "learning_rate": 1.931591617441372e-06, + "loss": 0.6235, + "step": 16957 + }, + { + "epoch": 0.43, + "learning_rate": 1.9315815586917355e-06, + "loss": 0.894, + "step": 16958 + }, + { + "epoch": 0.43, + "learning_rate": 1.9315714992288292e-06, + "loss": 0.9043, + "step": 16959 + }, + { + "epoch": 0.43, + "learning_rate": 1.931561439052662e-06, + "loss": 0.96, + "step": 16960 + }, + { + "epoch": 0.43, + "learning_rate": 1.931551378163241e-06, + "loss": 1.0381, + "step": 16961 + }, + { + "epoch": 0.43, + "learning_rate": 1.9315413165605736e-06, + "loss": 0.877, + "step": 16962 + }, + { + "epoch": 0.43, + "learning_rate": 1.931531254244668e-06, + "loss": 0.8301, + "step": 16963 + }, + { + "epoch": 0.43, + "learning_rate": 1.9315211912155317e-06, + "loss": 1.1504, + "step": 16964 + }, + { + "epoch": 0.43, + "learning_rate": 1.931511127473173e-06, + "loss": 0.9609, + "step": 16965 + }, + { + "epoch": 0.43, + "learning_rate": 1.9315010630175986e-06, + "loss": 0.6978, + "step": 16966 + }, + { + "epoch": 0.43, + "learning_rate": 1.9314909978488167e-06, + "loss": 1.0273, + "step": 16967 + }, + { + "epoch": 0.43, + "learning_rate": 1.9314809319668348e-06, + "loss": 1.1406, + "step": 16968 + }, + { + "epoch": 0.43, + "learning_rate": 1.931470865371661e-06, + "loss": 0.9277, + "step": 16969 + }, + { + "epoch": 0.43, + "learning_rate": 1.9314607980633025e-06, + "loss": 0.6992, + "step": 16970 + }, + { + "epoch": 0.43, + "learning_rate": 1.931450730041768e-06, + "loss": 0.9658, + "step": 16971 + }, + { + "epoch": 0.44, + "learning_rate": 1.9314406613070637e-06, + "loss": 0.8506, + "step": 16972 + }, + { + "epoch": 0.44, + "learning_rate": 1.9314305918591984e-06, + "loss": 0.8955, + "step": 16973 + }, + { + "epoch": 0.44, + "learning_rate": 1.9314205216981792e-06, + "loss": 0.9336, + "step": 16974 + }, + { + "epoch": 0.44, + "learning_rate": 1.9314104508240147e-06, + "loss": 1.082, + "step": 16975 + }, + { + "epoch": 0.44, + "learning_rate": 1.931400379236712e-06, + "loss": 0.9414, + "step": 16976 + }, + { + "epoch": 0.44, + "learning_rate": 1.9313903069362785e-06, + "loss": 0.7764, + "step": 16977 + }, + { + "epoch": 0.44, + "learning_rate": 1.9313802339227226e-06, + "loss": 0.7744, + "step": 16978 + }, + { + "epoch": 0.44, + "learning_rate": 1.9313701601960517e-06, + "loss": 0.6758, + "step": 16979 + }, + { + "epoch": 0.44, + "learning_rate": 1.931360085756273e-06, + "loss": 1.0762, + "step": 16980 + }, + { + "epoch": 0.44, + "learning_rate": 1.9313500106033953e-06, + "loss": 0.9375, + "step": 16981 + }, + { + "epoch": 0.44, + "learning_rate": 1.9313399347374255e-06, + "loss": 0.8135, + "step": 16982 + }, + { + "epoch": 0.44, + "learning_rate": 1.9313298581583716e-06, + "loss": 0.9072, + "step": 16983 + }, + { + "epoch": 0.44, + "learning_rate": 1.9313197808662413e-06, + "loss": 0.7412, + "step": 16984 + }, + { + "epoch": 0.44, + "learning_rate": 1.931309702861042e-06, + "loss": 1.0791, + "step": 16985 + }, + { + "epoch": 0.44, + "learning_rate": 1.9312996241427818e-06, + "loss": 0.8433, + "step": 16986 + }, + { + "epoch": 0.44, + "learning_rate": 1.9312895447114685e-06, + "loss": 0.9375, + "step": 16987 + }, + { + "epoch": 0.44, + "learning_rate": 1.931279464567109e-06, + "loss": 0.7368, + "step": 16988 + }, + { + "epoch": 0.44, + "learning_rate": 1.9312693837097124e-06, + "loss": 0.9102, + "step": 16989 + }, + { + "epoch": 0.44, + "learning_rate": 1.9312593021392853e-06, + "loss": 1.1357, + "step": 16990 + }, + { + "epoch": 0.44, + "learning_rate": 1.9312492198558355e-06, + "loss": 0.6958, + "step": 16991 + }, + { + "epoch": 0.44, + "learning_rate": 1.9312391368593716e-06, + "loss": 0.8027, + "step": 16992 + }, + { + "epoch": 0.44, + "learning_rate": 1.9312290531499e-06, + "loss": 1.0059, + "step": 16993 + }, + { + "epoch": 0.44, + "learning_rate": 1.93121896872743e-06, + "loss": 0.6221, + "step": 16994 + }, + { + "epoch": 0.44, + "learning_rate": 1.9312088835919676e-06, + "loss": 1.1162, + "step": 16995 + }, + { + "epoch": 0.44, + "learning_rate": 1.931198797743522e-06, + "loss": 0.8721, + "step": 16996 + }, + { + "epoch": 0.44, + "learning_rate": 1.9311887111821e-06, + "loss": 1.0762, + "step": 16997 + }, + { + "epoch": 0.44, + "learning_rate": 1.9311786239077096e-06, + "loss": 0.749, + "step": 16998 + }, + { + "epoch": 0.44, + "learning_rate": 1.9311685359203586e-06, + "loss": 1.1719, + "step": 16999 + }, + { + "epoch": 0.44, + "learning_rate": 1.9311584472200545e-06, + "loss": 1.0654, + "step": 17000 + }, + { + "epoch": 0.44, + "learning_rate": 1.9311483578068057e-06, + "loss": 0.8389, + "step": 17001 + }, + { + "epoch": 0.44, + "learning_rate": 1.931138267680619e-06, + "loss": 0.8965, + "step": 17002 + }, + { + "epoch": 0.44, + "learning_rate": 1.931128176841503e-06, + "loss": 0.9355, + "step": 17003 + }, + { + "epoch": 0.44, + "learning_rate": 1.9311180852894645e-06, + "loss": 0.8994, + "step": 17004 + }, + { + "epoch": 0.44, + "learning_rate": 1.9311079930245116e-06, + "loss": 0.8047, + "step": 17005 + }, + { + "epoch": 0.44, + "learning_rate": 1.9310979000466525e-06, + "loss": 0.9326, + "step": 17006 + }, + { + "epoch": 0.44, + "learning_rate": 1.931087806355894e-06, + "loss": 0.8643, + "step": 17007 + }, + { + "epoch": 0.44, + "learning_rate": 1.931077711952245e-06, + "loss": 1.001, + "step": 17008 + }, + { + "epoch": 0.44, + "learning_rate": 1.9310676168357122e-06, + "loss": 0.877, + "step": 17009 + }, + { + "epoch": 0.44, + "learning_rate": 1.931057521006304e-06, + "loss": 0.9004, + "step": 17010 + }, + { + "epoch": 0.44, + "learning_rate": 1.931047424464028e-06, + "loss": 1.1299, + "step": 17011 + }, + { + "epoch": 0.44, + "learning_rate": 1.9310373272088912e-06, + "loss": 0.7422, + "step": 17012 + }, + { + "epoch": 0.44, + "learning_rate": 1.9310272292409023e-06, + "loss": 0.7871, + "step": 17013 + }, + { + "epoch": 0.44, + "learning_rate": 1.9310171305600687e-06, + "loss": 1.1357, + "step": 17014 + }, + { + "epoch": 0.44, + "learning_rate": 1.9310070311663984e-06, + "loss": 0.7959, + "step": 17015 + }, + { + "epoch": 0.44, + "learning_rate": 1.930996931059898e-06, + "loss": 0.9443, + "step": 17016 + }, + { + "epoch": 0.44, + "learning_rate": 1.930986830240577e-06, + "loss": 0.7207, + "step": 17017 + }, + { + "epoch": 0.44, + "learning_rate": 1.930976728708442e-06, + "loss": 0.9062, + "step": 17018 + }, + { + "epoch": 0.44, + "learning_rate": 1.9309666264635003e-06, + "loss": 0.772, + "step": 17019 + }, + { + "epoch": 0.44, + "learning_rate": 1.9309565235057606e-06, + "loss": 0.8477, + "step": 17020 + }, + { + "epoch": 0.44, + "learning_rate": 1.9309464198352303e-06, + "loss": 0.8521, + "step": 17021 + }, + { + "epoch": 0.44, + "learning_rate": 1.930936315451917e-06, + "loss": 1.0352, + "step": 17022 + }, + { + "epoch": 0.44, + "learning_rate": 1.930926210355829e-06, + "loss": 0.877, + "step": 17023 + }, + { + "epoch": 0.44, + "learning_rate": 1.930916104546973e-06, + "loss": 0.8164, + "step": 17024 + }, + { + "epoch": 0.44, + "learning_rate": 1.930905998025358e-06, + "loss": 0.8076, + "step": 17025 + }, + { + "epoch": 0.44, + "learning_rate": 1.930895890790991e-06, + "loss": 1.123, + "step": 17026 + }, + { + "epoch": 0.44, + "learning_rate": 1.9308857828438793e-06, + "loss": 0.8262, + "step": 17027 + }, + { + "epoch": 0.44, + "learning_rate": 1.930875674184031e-06, + "loss": 0.7061, + "step": 17028 + }, + { + "epoch": 0.44, + "learning_rate": 1.9308655648114546e-06, + "loss": 0.8877, + "step": 17029 + }, + { + "epoch": 0.44, + "learning_rate": 1.930855454726157e-06, + "loss": 0.4663, + "step": 17030 + }, + { + "epoch": 0.44, + "learning_rate": 1.9308453439281466e-06, + "loss": 0.8965, + "step": 17031 + }, + { + "epoch": 0.44, + "learning_rate": 1.9308352324174302e-06, + "loss": 0.9106, + "step": 17032 + }, + { + "epoch": 0.44, + "learning_rate": 1.930825120194016e-06, + "loss": 0.9727, + "step": 17033 + }, + { + "epoch": 0.44, + "learning_rate": 1.9308150072579123e-06, + "loss": 0.8203, + "step": 17034 + }, + { + "epoch": 0.44, + "learning_rate": 1.930804893609126e-06, + "loss": 0.9014, + "step": 17035 + }, + { + "epoch": 0.44, + "learning_rate": 1.9307947792476653e-06, + "loss": 0.8857, + "step": 17036 + }, + { + "epoch": 0.44, + "learning_rate": 1.930784664173538e-06, + "loss": 0.8228, + "step": 17037 + }, + { + "epoch": 0.44, + "learning_rate": 1.9307745483867516e-06, + "loss": 0.9717, + "step": 17038 + }, + { + "epoch": 0.44, + "learning_rate": 1.9307644318873136e-06, + "loss": 0.6655, + "step": 17039 + }, + { + "epoch": 0.44, + "learning_rate": 1.9307543146752325e-06, + "loss": 1.0527, + "step": 17040 + }, + { + "epoch": 0.44, + "learning_rate": 1.930744196750515e-06, + "loss": 0.8931, + "step": 17041 + }, + { + "epoch": 0.44, + "learning_rate": 1.93073407811317e-06, + "loss": 1.0156, + "step": 17042 + }, + { + "epoch": 0.44, + "learning_rate": 1.9307239587632045e-06, + "loss": 0.8711, + "step": 17043 + }, + { + "epoch": 0.44, + "learning_rate": 1.9307138387006267e-06, + "loss": 0.8545, + "step": 17044 + }, + { + "epoch": 0.44, + "learning_rate": 1.930703717925444e-06, + "loss": 0.689, + "step": 17045 + }, + { + "epoch": 0.44, + "learning_rate": 1.930693596437664e-06, + "loss": 1.0098, + "step": 17046 + }, + { + "epoch": 0.44, + "learning_rate": 1.9306834742372954e-06, + "loss": 0.7808, + "step": 17047 + }, + { + "epoch": 0.44, + "learning_rate": 1.9306733513243446e-06, + "loss": 1.0234, + "step": 17048 + }, + { + "epoch": 0.44, + "learning_rate": 1.93066322769882e-06, + "loss": 0.8066, + "step": 17049 + }, + { + "epoch": 0.44, + "learning_rate": 1.9306531033607295e-06, + "loss": 0.8467, + "step": 17050 + }, + { + "epoch": 0.44, + "learning_rate": 1.930642978310081e-06, + "loss": 0.7642, + "step": 17051 + }, + { + "epoch": 0.44, + "learning_rate": 1.9306328525468817e-06, + "loss": 0.8857, + "step": 17052 + }, + { + "epoch": 0.44, + "learning_rate": 1.9306227260711396e-06, + "loss": 1.0547, + "step": 17053 + }, + { + "epoch": 0.44, + "learning_rate": 1.9306125988828624e-06, + "loss": 0.8965, + "step": 17054 + }, + { + "epoch": 0.44, + "learning_rate": 1.930602470982058e-06, + "loss": 0.8091, + "step": 17055 + }, + { + "epoch": 0.44, + "learning_rate": 1.9305923423687344e-06, + "loss": 0.8809, + "step": 17056 + }, + { + "epoch": 0.44, + "learning_rate": 1.9305822130428988e-06, + "loss": 0.8848, + "step": 17057 + }, + { + "epoch": 0.44, + "learning_rate": 1.930572083004559e-06, + "loss": 0.7427, + "step": 17058 + }, + { + "epoch": 0.44, + "learning_rate": 1.930561952253723e-06, + "loss": 0.9814, + "step": 17059 + }, + { + "epoch": 0.44, + "learning_rate": 1.9305518207903985e-06, + "loss": 0.7959, + "step": 17060 + }, + { + "epoch": 0.44, + "learning_rate": 1.9305416886145936e-06, + "loss": 0.8623, + "step": 17061 + }, + { + "epoch": 0.44, + "learning_rate": 1.9305315557263153e-06, + "loss": 1.0127, + "step": 17062 + }, + { + "epoch": 0.44, + "learning_rate": 1.9305214221255718e-06, + "loss": 0.7251, + "step": 17063 + }, + { + "epoch": 0.44, + "learning_rate": 1.930511287812371e-06, + "loss": 1.0225, + "step": 17064 + }, + { + "epoch": 0.44, + "learning_rate": 1.9305011527867207e-06, + "loss": 0.71, + "step": 17065 + }, + { + "epoch": 0.44, + "learning_rate": 1.930491017048628e-06, + "loss": 0.9473, + "step": 17066 + }, + { + "epoch": 0.44, + "learning_rate": 1.9304808805981015e-06, + "loss": 1.0205, + "step": 17067 + }, + { + "epoch": 0.44, + "learning_rate": 1.930470743435148e-06, + "loss": 0.9619, + "step": 17068 + }, + { + "epoch": 0.44, + "learning_rate": 1.9304606055597767e-06, + "loss": 1.1094, + "step": 17069 + }, + { + "epoch": 0.44, + "learning_rate": 1.9304504669719937e-06, + "loss": 0.8643, + "step": 17070 + }, + { + "epoch": 0.44, + "learning_rate": 1.930440327671808e-06, + "loss": 0.7844, + "step": 17071 + }, + { + "epoch": 0.44, + "learning_rate": 1.9304301876592272e-06, + "loss": 1.0283, + "step": 17072 + }, + { + "epoch": 0.44, + "learning_rate": 1.930420046934258e-06, + "loss": 0.635, + "step": 17073 + }, + { + "epoch": 0.44, + "learning_rate": 1.9304099054969093e-06, + "loss": 0.9326, + "step": 17074 + }, + { + "epoch": 0.44, + "learning_rate": 1.9303997633471885e-06, + "loss": 0.8672, + "step": 17075 + }, + { + "epoch": 0.44, + "learning_rate": 1.9303896204851036e-06, + "loss": 0.9453, + "step": 17076 + }, + { + "epoch": 0.44, + "learning_rate": 1.930379476910662e-06, + "loss": 0.8867, + "step": 17077 + }, + { + "epoch": 0.44, + "learning_rate": 1.930369332623872e-06, + "loss": 0.9395, + "step": 17078 + }, + { + "epoch": 0.44, + "learning_rate": 1.9303591876247402e-06, + "loss": 0.9268, + "step": 17079 + }, + { + "epoch": 0.44, + "learning_rate": 1.9303490419132755e-06, + "loss": 0.8291, + "step": 17080 + }, + { + "epoch": 0.44, + "learning_rate": 1.9303388954894857e-06, + "loss": 0.9326, + "step": 17081 + }, + { + "epoch": 0.44, + "learning_rate": 1.9303287483533776e-06, + "loss": 1.0186, + "step": 17082 + }, + { + "epoch": 0.44, + "learning_rate": 1.93031860050496e-06, + "loss": 0.9551, + "step": 17083 + }, + { + "epoch": 0.44, + "learning_rate": 1.93030845194424e-06, + "loss": 1.0146, + "step": 17084 + }, + { + "epoch": 0.44, + "learning_rate": 1.9302983026712257e-06, + "loss": 1.0889, + "step": 17085 + }, + { + "epoch": 0.44, + "learning_rate": 1.9302881526859245e-06, + "loss": 0.8174, + "step": 17086 + }, + { + "epoch": 0.44, + "learning_rate": 1.930278001988345e-06, + "loss": 0.8535, + "step": 17087 + }, + { + "epoch": 0.44, + "learning_rate": 1.930267850578494e-06, + "loss": 0.9668, + "step": 17088 + }, + { + "epoch": 0.44, + "learning_rate": 1.9302576984563793e-06, + "loss": 0.9189, + "step": 17089 + }, + { + "epoch": 0.44, + "learning_rate": 1.93024754562201e-06, + "loss": 1.04, + "step": 17090 + }, + { + "epoch": 0.44, + "learning_rate": 1.930237392075392e-06, + "loss": 0.9443, + "step": 17091 + }, + { + "epoch": 0.44, + "learning_rate": 1.9302272378165344e-06, + "loss": 0.708, + "step": 17092 + }, + { + "epoch": 0.44, + "learning_rate": 1.930217082845445e-06, + "loss": 0.96, + "step": 17093 + }, + { + "epoch": 0.44, + "learning_rate": 1.9302069271621306e-06, + "loss": 0.75, + "step": 17094 + }, + { + "epoch": 0.44, + "learning_rate": 1.9301967707665992e-06, + "loss": 0.834, + "step": 17095 + }, + { + "epoch": 0.44, + "learning_rate": 1.9301866136588597e-06, + "loss": 1.0449, + "step": 17096 + }, + { + "epoch": 0.44, + "learning_rate": 1.930176455838919e-06, + "loss": 0.6401, + "step": 17097 + }, + { + "epoch": 0.44, + "learning_rate": 1.930166297306784e-06, + "loss": 0.7295, + "step": 17098 + }, + { + "epoch": 0.44, + "learning_rate": 1.9301561380624645e-06, + "loss": 0.9121, + "step": 17099 + }, + { + "epoch": 0.44, + "learning_rate": 1.930145978105967e-06, + "loss": 0.833, + "step": 17100 + }, + { + "epoch": 0.44, + "learning_rate": 1.930135817437299e-06, + "loss": 0.8174, + "step": 17101 + }, + { + "epoch": 0.44, + "learning_rate": 1.9301256560564694e-06, + "loss": 0.9717, + "step": 17102 + }, + { + "epoch": 0.44, + "learning_rate": 1.930115493963485e-06, + "loss": 0.9941, + "step": 17103 + }, + { + "epoch": 0.44, + "learning_rate": 1.930105331158354e-06, + "loss": 0.917, + "step": 17104 + }, + { + "epoch": 0.44, + "learning_rate": 1.930095167641084e-06, + "loss": 0.8496, + "step": 17105 + }, + { + "epoch": 0.44, + "learning_rate": 1.9300850034116833e-06, + "loss": 1.0684, + "step": 17106 + }, + { + "epoch": 0.44, + "learning_rate": 1.9300748384701587e-06, + "loss": 0.9023, + "step": 17107 + }, + { + "epoch": 0.44, + "learning_rate": 1.930064672816519e-06, + "loss": 0.8896, + "step": 17108 + }, + { + "epoch": 0.44, + "learning_rate": 1.9300545064507718e-06, + "loss": 0.7646, + "step": 17109 + }, + { + "epoch": 0.44, + "learning_rate": 1.9300443393729238e-06, + "loss": 0.7236, + "step": 17110 + }, + { + "epoch": 0.44, + "learning_rate": 1.930034171582984e-06, + "loss": 0.8037, + "step": 17111 + }, + { + "epoch": 0.44, + "learning_rate": 1.93002400308096e-06, + "loss": 0.5022, + "step": 17112 + }, + { + "epoch": 0.44, + "learning_rate": 1.9300138338668593e-06, + "loss": 0.7695, + "step": 17113 + }, + { + "epoch": 0.44, + "learning_rate": 1.9300036639406894e-06, + "loss": 1.0049, + "step": 17114 + }, + { + "epoch": 0.44, + "learning_rate": 1.929993493302459e-06, + "loss": 1.0439, + "step": 17115 + }, + { + "epoch": 0.44, + "learning_rate": 1.9299833219521753e-06, + "loss": 0.749, + "step": 17116 + }, + { + "epoch": 0.44, + "learning_rate": 1.929973149889846e-06, + "loss": 0.8867, + "step": 17117 + }, + { + "epoch": 0.44, + "learning_rate": 1.929962977115479e-06, + "loss": 0.9502, + "step": 17118 + }, + { + "epoch": 0.44, + "learning_rate": 1.9299528036290818e-06, + "loss": 0.9375, + "step": 17119 + }, + { + "epoch": 0.44, + "learning_rate": 1.9299426294306628e-06, + "loss": 0.5723, + "step": 17120 + }, + { + "epoch": 0.44, + "learning_rate": 1.9299324545202296e-06, + "loss": 0.9512, + "step": 17121 + }, + { + "epoch": 0.44, + "learning_rate": 1.9299222788977898e-06, + "loss": 0.9502, + "step": 17122 + }, + { + "epoch": 0.44, + "learning_rate": 1.929912102563351e-06, + "loss": 0.9033, + "step": 17123 + }, + { + "epoch": 0.44, + "learning_rate": 1.9299019255169214e-06, + "loss": 0.7441, + "step": 17124 + }, + { + "epoch": 0.44, + "learning_rate": 1.929891747758509e-06, + "loss": 0.9072, + "step": 17125 + }, + { + "epoch": 0.44, + "learning_rate": 1.929881569288121e-06, + "loss": 1.0771, + "step": 17126 + }, + { + "epoch": 0.44, + "learning_rate": 1.9298713901057653e-06, + "loss": 1.0225, + "step": 17127 + }, + { + "epoch": 0.44, + "learning_rate": 1.92986121021145e-06, + "loss": 0.8271, + "step": 17128 + }, + { + "epoch": 0.44, + "learning_rate": 1.9298510296051822e-06, + "loss": 0.8594, + "step": 17129 + }, + { + "epoch": 0.44, + "learning_rate": 1.929840848286971e-06, + "loss": 0.8945, + "step": 17130 + }, + { + "epoch": 0.44, + "learning_rate": 1.929830666256823e-06, + "loss": 0.8301, + "step": 17131 + }, + { + "epoch": 0.44, + "learning_rate": 1.9298204835147466e-06, + "loss": 0.9092, + "step": 17132 + }, + { + "epoch": 0.44, + "learning_rate": 1.9298103000607494e-06, + "loss": 0.8579, + "step": 17133 + }, + { + "epoch": 0.44, + "learning_rate": 1.9298001158948393e-06, + "loss": 0.8213, + "step": 17134 + }, + { + "epoch": 0.44, + "learning_rate": 1.929789931017024e-06, + "loss": 0.8721, + "step": 17135 + }, + { + "epoch": 0.44, + "learning_rate": 1.929779745427311e-06, + "loss": 0.8213, + "step": 17136 + }, + { + "epoch": 0.44, + "learning_rate": 1.9297695591257085e-06, + "loss": 0.9082, + "step": 17137 + }, + { + "epoch": 0.44, + "learning_rate": 1.9297593721122244e-06, + "loss": 0.603, + "step": 17138 + }, + { + "epoch": 0.44, + "learning_rate": 1.929749184386866e-06, + "loss": 0.8682, + "step": 17139 + }, + { + "epoch": 0.44, + "learning_rate": 1.9297389959496417e-06, + "loss": 0.8174, + "step": 17140 + }, + { + "epoch": 0.44, + "learning_rate": 1.929728806800559e-06, + "loss": 0.7939, + "step": 17141 + }, + { + "epoch": 0.44, + "learning_rate": 1.929718616939625e-06, + "loss": 0.8721, + "step": 17142 + }, + { + "epoch": 0.44, + "learning_rate": 1.929708426366849e-06, + "loss": 0.9326, + "step": 17143 + }, + { + "epoch": 0.44, + "learning_rate": 1.9296982350822376e-06, + "loss": 0.9746, + "step": 17144 + }, + { + "epoch": 0.44, + "learning_rate": 1.929688043085799e-06, + "loss": 0.7764, + "step": 17145 + }, + { + "epoch": 0.44, + "learning_rate": 1.9296778503775415e-06, + "loss": 1.1104, + "step": 17146 + }, + { + "epoch": 0.44, + "learning_rate": 1.929667656957472e-06, + "loss": 1.0303, + "step": 17147 + }, + { + "epoch": 0.44, + "learning_rate": 1.9296574628255988e-06, + "loss": 0.8213, + "step": 17148 + }, + { + "epoch": 0.44, + "learning_rate": 1.92964726798193e-06, + "loss": 0.6948, + "step": 17149 + }, + { + "epoch": 0.44, + "learning_rate": 1.9296370724264725e-06, + "loss": 0.9072, + "step": 17150 + }, + { + "epoch": 0.44, + "learning_rate": 1.9296268761592348e-06, + "loss": 1.1182, + "step": 17151 + }, + { + "epoch": 0.44, + "learning_rate": 1.9296166791802246e-06, + "loss": 0.9277, + "step": 17152 + }, + { + "epoch": 0.44, + "learning_rate": 1.9296064814894498e-06, + "loss": 0.9355, + "step": 17153 + }, + { + "epoch": 0.44, + "learning_rate": 1.9295962830869177e-06, + "loss": 0.9233, + "step": 17154 + }, + { + "epoch": 0.44, + "learning_rate": 1.9295860839726366e-06, + "loss": 1.0039, + "step": 17155 + }, + { + "epoch": 0.44, + "learning_rate": 1.9295758841466145e-06, + "loss": 0.7549, + "step": 17156 + }, + { + "epoch": 0.44, + "learning_rate": 1.9295656836088586e-06, + "loss": 0.9795, + "step": 17157 + }, + { + "epoch": 0.44, + "learning_rate": 1.929555482359377e-06, + "loss": 0.835, + "step": 17158 + }, + { + "epoch": 0.44, + "learning_rate": 1.9295452803981777e-06, + "loss": 0.8779, + "step": 17159 + }, + { + "epoch": 0.44, + "learning_rate": 1.9295350777252677e-06, + "loss": 0.9316, + "step": 17160 + }, + { + "epoch": 0.44, + "learning_rate": 1.929524874340656e-06, + "loss": 0.6655, + "step": 17161 + }, + { + "epoch": 0.44, + "learning_rate": 1.92951467024435e-06, + "loss": 0.7358, + "step": 17162 + }, + { + "epoch": 0.44, + "learning_rate": 1.929504465436357e-06, + "loss": 0.9629, + "step": 17163 + }, + { + "epoch": 0.44, + "learning_rate": 1.9294942599166853e-06, + "loss": 0.7866, + "step": 17164 + }, + { + "epoch": 0.44, + "learning_rate": 1.9294840536853424e-06, + "loss": 0.9766, + "step": 17165 + }, + { + "epoch": 0.44, + "learning_rate": 1.9294738467423364e-06, + "loss": 0.9229, + "step": 17166 + }, + { + "epoch": 0.44, + "learning_rate": 1.9294636390876754e-06, + "loss": 0.7656, + "step": 17167 + }, + { + "epoch": 0.44, + "learning_rate": 1.929453430721366e-06, + "loss": 0.7822, + "step": 17168 + }, + { + "epoch": 0.44, + "learning_rate": 1.9294432216434177e-06, + "loss": 0.749, + "step": 17169 + }, + { + "epoch": 0.44, + "learning_rate": 1.929433011853837e-06, + "loss": 0.7366, + "step": 17170 + }, + { + "epoch": 0.44, + "learning_rate": 1.9294228013526322e-06, + "loss": 0.999, + "step": 17171 + }, + { + "epoch": 0.44, + "learning_rate": 1.929412590139811e-06, + "loss": 0.8984, + "step": 17172 + }, + { + "epoch": 0.44, + "learning_rate": 1.9294023782153815e-06, + "loss": 0.834, + "step": 17173 + }, + { + "epoch": 0.44, + "learning_rate": 1.9293921655793514e-06, + "loss": 0.7378, + "step": 17174 + }, + { + "epoch": 0.44, + "learning_rate": 1.9293819522317286e-06, + "loss": 0.7656, + "step": 17175 + }, + { + "epoch": 0.44, + "learning_rate": 1.9293717381725206e-06, + "loss": 0.9062, + "step": 17176 + }, + { + "epoch": 0.44, + "learning_rate": 1.9293615234017354e-06, + "loss": 0.7676, + "step": 17177 + }, + { + "epoch": 0.44, + "learning_rate": 1.9293513079193808e-06, + "loss": 0.7148, + "step": 17178 + }, + { + "epoch": 0.44, + "learning_rate": 1.9293410917254646e-06, + "loss": 0.9824, + "step": 17179 + }, + { + "epoch": 0.44, + "learning_rate": 1.9293308748199943e-06, + "loss": 0.8574, + "step": 17180 + }, + { + "epoch": 0.44, + "learning_rate": 1.9293206572029785e-06, + "loss": 0.8335, + "step": 17181 + }, + { + "epoch": 0.44, + "learning_rate": 1.9293104388744246e-06, + "loss": 1.0127, + "step": 17182 + }, + { + "epoch": 0.44, + "learning_rate": 1.9293002198343405e-06, + "loss": 1.0039, + "step": 17183 + }, + { + "epoch": 0.44, + "learning_rate": 1.9292900000827336e-06, + "loss": 0.71, + "step": 17184 + }, + { + "epoch": 0.44, + "learning_rate": 1.9292797796196126e-06, + "loss": 1.0195, + "step": 17185 + }, + { + "epoch": 0.44, + "learning_rate": 1.9292695584449843e-06, + "loss": 0.8154, + "step": 17186 + }, + { + "epoch": 0.44, + "learning_rate": 1.9292593365588573e-06, + "loss": 0.6489, + "step": 17187 + }, + { + "epoch": 0.44, + "learning_rate": 1.929249113961239e-06, + "loss": 0.8633, + "step": 17188 + }, + { + "epoch": 0.44, + "learning_rate": 1.9292388906521374e-06, + "loss": 0.8853, + "step": 17189 + }, + { + "epoch": 0.44, + "learning_rate": 1.9292286666315606e-06, + "loss": 0.8398, + "step": 17190 + }, + { + "epoch": 0.44, + "learning_rate": 1.9292184418995155e-06, + "loss": 0.8281, + "step": 17191 + }, + { + "epoch": 0.44, + "learning_rate": 1.9292082164560115e-06, + "loss": 0.8506, + "step": 17192 + }, + { + "epoch": 0.44, + "learning_rate": 1.9291979903010548e-06, + "loss": 0.9307, + "step": 17193 + }, + { + "epoch": 0.44, + "learning_rate": 1.929187763434654e-06, + "loss": 0.9844, + "step": 17194 + }, + { + "epoch": 0.44, + "learning_rate": 1.929177535856817e-06, + "loss": 0.7324, + "step": 17195 + }, + { + "epoch": 0.44, + "learning_rate": 1.9291673075675512e-06, + "loss": 0.626, + "step": 17196 + }, + { + "epoch": 0.44, + "learning_rate": 1.929157078566865e-06, + "loss": 0.6699, + "step": 17197 + }, + { + "epoch": 0.44, + "learning_rate": 1.929146848854766e-06, + "loss": 0.686, + "step": 17198 + }, + { + "epoch": 0.44, + "learning_rate": 1.9291366184312617e-06, + "loss": 0.9609, + "step": 17199 + }, + { + "epoch": 0.44, + "learning_rate": 1.9291263872963607e-06, + "loss": 0.8242, + "step": 17200 + }, + { + "epoch": 0.44, + "learning_rate": 1.92911615545007e-06, + "loss": 0.9619, + "step": 17201 + }, + { + "epoch": 0.44, + "learning_rate": 1.929105922892398e-06, + "loss": 0.9639, + "step": 17202 + }, + { + "epoch": 0.44, + "learning_rate": 1.929095689623352e-06, + "loss": 0.7842, + "step": 17203 + }, + { + "epoch": 0.44, + "learning_rate": 1.9290854556429405e-06, + "loss": 0.8389, + "step": 17204 + }, + { + "epoch": 0.44, + "learning_rate": 1.9290752209511703e-06, + "loss": 0.8564, + "step": 17205 + }, + { + "epoch": 0.44, + "learning_rate": 1.9290649855480505e-06, + "loss": 0.9541, + "step": 17206 + }, + { + "epoch": 0.44, + "learning_rate": 1.929054749433588e-06, + "loss": 0.9141, + "step": 17207 + }, + { + "epoch": 0.44, + "learning_rate": 1.9290445126077916e-06, + "loss": 0.749, + "step": 17208 + }, + { + "epoch": 0.44, + "learning_rate": 1.929034275070668e-06, + "loss": 1.1035, + "step": 17209 + }, + { + "epoch": 0.44, + "learning_rate": 1.929024036822226e-06, + "loss": 0.8633, + "step": 17210 + }, + { + "epoch": 0.44, + "learning_rate": 1.9290137978624727e-06, + "loss": 0.8604, + "step": 17211 + }, + { + "epoch": 0.44, + "learning_rate": 1.9290035581914164e-06, + "loss": 0.8799, + "step": 17212 + }, + { + "epoch": 0.44, + "learning_rate": 1.9289933178090646e-06, + "loss": 0.7109, + "step": 17213 + }, + { + "epoch": 0.44, + "learning_rate": 1.9289830767154257e-06, + "loss": 1.0645, + "step": 17214 + }, + { + "epoch": 0.44, + "learning_rate": 1.9289728349105066e-06, + "loss": 0.7734, + "step": 17215 + }, + { + "epoch": 0.44, + "learning_rate": 1.928962592394316e-06, + "loss": 1.0469, + "step": 17216 + }, + { + "epoch": 0.44, + "learning_rate": 1.9289523491668616e-06, + "loss": 0.875, + "step": 17217 + }, + { + "epoch": 0.44, + "learning_rate": 1.9289421052281513e-06, + "loss": 0.8477, + "step": 17218 + }, + { + "epoch": 0.44, + "learning_rate": 1.928931860578192e-06, + "loss": 0.8408, + "step": 17219 + }, + { + "epoch": 0.44, + "learning_rate": 1.9289216152169933e-06, + "loss": 0.7876, + "step": 17220 + }, + { + "epoch": 0.44, + "learning_rate": 1.9289113691445613e-06, + "loss": 0.959, + "step": 17221 + }, + { + "epoch": 0.44, + "learning_rate": 1.9289011223609046e-06, + "loss": 1.1064, + "step": 17222 + }, + { + "epoch": 0.44, + "learning_rate": 1.928890874866031e-06, + "loss": 0.7715, + "step": 17223 + }, + { + "epoch": 0.44, + "learning_rate": 1.9288806266599485e-06, + "loss": 0.4993, + "step": 17224 + }, + { + "epoch": 0.44, + "learning_rate": 1.928870377742665e-06, + "loss": 0.9873, + "step": 17225 + }, + { + "epoch": 0.44, + "learning_rate": 1.928860128114188e-06, + "loss": 0.7759, + "step": 17226 + }, + { + "epoch": 0.44, + "learning_rate": 1.9288498777745253e-06, + "loss": 0.5688, + "step": 17227 + }, + { + "epoch": 0.44, + "learning_rate": 1.9288396267236855e-06, + "loss": 0.9287, + "step": 17228 + }, + { + "epoch": 0.44, + "learning_rate": 1.9288293749616756e-06, + "loss": 1.0371, + "step": 17229 + }, + { + "epoch": 0.44, + "learning_rate": 1.9288191224885036e-06, + "loss": 1.0254, + "step": 17230 + }, + { + "epoch": 0.44, + "learning_rate": 1.928808869304178e-06, + "loss": 1.0977, + "step": 17231 + }, + { + "epoch": 0.44, + "learning_rate": 1.928798615408706e-06, + "loss": 0.6235, + "step": 17232 + }, + { + "epoch": 0.44, + "learning_rate": 1.928788360802095e-06, + "loss": 0.8691, + "step": 17233 + }, + { + "epoch": 0.44, + "learning_rate": 1.928778105484354e-06, + "loss": 0.9912, + "step": 17234 + }, + { + "epoch": 0.44, + "learning_rate": 1.92876784945549e-06, + "loss": 0.957, + "step": 17235 + }, + { + "epoch": 0.44, + "learning_rate": 1.928757592715511e-06, + "loss": 0.9805, + "step": 17236 + }, + { + "epoch": 0.44, + "learning_rate": 1.928747335264426e-06, + "loss": 0.873, + "step": 17237 + }, + { + "epoch": 0.44, + "learning_rate": 1.9287370771022407e-06, + "loss": 0.668, + "step": 17238 + }, + { + "epoch": 0.44, + "learning_rate": 1.9287268182289652e-06, + "loss": 0.8213, + "step": 17239 + }, + { + "epoch": 0.44, + "learning_rate": 1.9287165586446056e-06, + "loss": 0.8516, + "step": 17240 + }, + { + "epoch": 0.44, + "learning_rate": 1.9287062983491707e-06, + "loss": 0.7429, + "step": 17241 + }, + { + "epoch": 0.44, + "learning_rate": 1.928696037342668e-06, + "loss": 0.8101, + "step": 17242 + }, + { + "epoch": 0.44, + "learning_rate": 1.9286857756251053e-06, + "loss": 0.7139, + "step": 17243 + }, + { + "epoch": 0.44, + "learning_rate": 1.9286755131964907e-06, + "loss": 0.9688, + "step": 17244 + }, + { + "epoch": 0.44, + "learning_rate": 1.928665250056832e-06, + "loss": 0.8379, + "step": 17245 + }, + { + "epoch": 0.44, + "learning_rate": 1.928654986206137e-06, + "loss": 0.9629, + "step": 17246 + }, + { + "epoch": 0.44, + "learning_rate": 1.9286447216444133e-06, + "loss": 0.8506, + "step": 17247 + }, + { + "epoch": 0.44, + "learning_rate": 1.9286344563716693e-06, + "loss": 0.8008, + "step": 17248 + }, + { + "epoch": 0.44, + "learning_rate": 1.9286241903879126e-06, + "loss": 0.7725, + "step": 17249 + }, + { + "epoch": 0.44, + "learning_rate": 1.928613923693151e-06, + "loss": 0.875, + "step": 17250 + }, + { + "epoch": 0.44, + "learning_rate": 1.9286036562873925e-06, + "loss": 0.9473, + "step": 17251 + }, + { + "epoch": 0.44, + "learning_rate": 1.928593388170645e-06, + "loss": 0.9209, + "step": 17252 + }, + { + "epoch": 0.44, + "learning_rate": 1.928583119342916e-06, + "loss": 0.6387, + "step": 17253 + }, + { + "epoch": 0.44, + "learning_rate": 1.928572849804214e-06, + "loss": 0.8594, + "step": 17254 + }, + { + "epoch": 0.44, + "learning_rate": 1.928562579554546e-06, + "loss": 0.8281, + "step": 17255 + }, + { + "epoch": 0.44, + "learning_rate": 1.9285523085939203e-06, + "loss": 0.813, + "step": 17256 + }, + { + "epoch": 0.44, + "learning_rate": 1.9285420369223455e-06, + "loss": 1.0049, + "step": 17257 + }, + { + "epoch": 0.44, + "learning_rate": 1.928531764539828e-06, + "loss": 0.8262, + "step": 17258 + }, + { + "epoch": 0.44, + "learning_rate": 1.9285214914463766e-06, + "loss": 0.7114, + "step": 17259 + }, + { + "epoch": 0.44, + "learning_rate": 1.928511217641999e-06, + "loss": 0.9565, + "step": 17260 + }, + { + "epoch": 0.44, + "learning_rate": 1.9285009431267034e-06, + "loss": 1.0908, + "step": 17261 + }, + { + "epoch": 0.44, + "learning_rate": 1.9284906679004968e-06, + "loss": 0.9268, + "step": 17262 + }, + { + "epoch": 0.44, + "learning_rate": 1.9284803919633877e-06, + "loss": 1.0703, + "step": 17263 + }, + { + "epoch": 0.44, + "learning_rate": 1.928470115315384e-06, + "loss": 0.9619, + "step": 17264 + }, + { + "epoch": 0.44, + "learning_rate": 1.9284598379564935e-06, + "loss": 0.9043, + "step": 17265 + }, + { + "epoch": 0.44, + "learning_rate": 1.928449559886724e-06, + "loss": 1.0225, + "step": 17266 + }, + { + "epoch": 0.44, + "learning_rate": 1.9284392811060834e-06, + "loss": 0.8315, + "step": 17267 + }, + { + "epoch": 0.44, + "learning_rate": 1.9284290016145793e-06, + "loss": 0.877, + "step": 17268 + }, + { + "epoch": 0.44, + "learning_rate": 1.9284187214122197e-06, + "loss": 0.9658, + "step": 17269 + }, + { + "epoch": 0.44, + "learning_rate": 1.9284084404990127e-06, + "loss": 0.8584, + "step": 17270 + }, + { + "epoch": 0.44, + "learning_rate": 1.9283981588749663e-06, + "loss": 1.0537, + "step": 17271 + }, + { + "epoch": 0.44, + "learning_rate": 1.9283878765400882e-06, + "loss": 0.9453, + "step": 17272 + }, + { + "epoch": 0.44, + "learning_rate": 1.928377593494386e-06, + "loss": 0.7153, + "step": 17273 + }, + { + "epoch": 0.44, + "learning_rate": 1.9283673097378673e-06, + "loss": 0.8711, + "step": 17274 + }, + { + "epoch": 0.44, + "learning_rate": 1.928357025270541e-06, + "loss": 0.9971, + "step": 17275 + }, + { + "epoch": 0.44, + "learning_rate": 1.9283467400924142e-06, + "loss": 0.8271, + "step": 17276 + }, + { + "epoch": 0.44, + "learning_rate": 1.928336454203495e-06, + "loss": 0.9458, + "step": 17277 + }, + { + "epoch": 0.44, + "learning_rate": 1.9283261676037913e-06, + "loss": 0.8232, + "step": 17278 + }, + { + "epoch": 0.44, + "learning_rate": 1.9283158802933112e-06, + "loss": 0.667, + "step": 17279 + }, + { + "epoch": 0.44, + "learning_rate": 1.928305592272062e-06, + "loss": 0.8418, + "step": 17280 + }, + { + "epoch": 0.44, + "learning_rate": 1.928295303540052e-06, + "loss": 0.9385, + "step": 17281 + }, + { + "epoch": 0.44, + "learning_rate": 1.928285014097289e-06, + "loss": 0.6704, + "step": 17282 + }, + { + "epoch": 0.44, + "learning_rate": 1.9282747239437803e-06, + "loss": 1.2158, + "step": 17283 + }, + { + "epoch": 0.44, + "learning_rate": 1.928264433079535e-06, + "loss": 0.8799, + "step": 17284 + }, + { + "epoch": 0.44, + "learning_rate": 1.92825414150456e-06, + "loss": 0.7402, + "step": 17285 + }, + { + "epoch": 0.44, + "learning_rate": 1.9282438492188637e-06, + "loss": 0.875, + "step": 17286 + }, + { + "epoch": 0.44, + "learning_rate": 1.9282335562224535e-06, + "loss": 0.6475, + "step": 17287 + }, + { + "epoch": 0.44, + "learning_rate": 1.9282232625153377e-06, + "loss": 0.9619, + "step": 17288 + }, + { + "epoch": 0.44, + "learning_rate": 1.928212968097524e-06, + "loss": 0.9277, + "step": 17289 + }, + { + "epoch": 0.44, + "learning_rate": 1.9282026729690205e-06, + "loss": 0.8125, + "step": 17290 + }, + { + "epoch": 0.44, + "learning_rate": 1.9281923771298347e-06, + "loss": 1.0215, + "step": 17291 + }, + { + "epoch": 0.44, + "learning_rate": 1.9281820805799747e-06, + "loss": 0.7891, + "step": 17292 + }, + { + "epoch": 0.44, + "learning_rate": 1.9281717833194486e-06, + "loss": 0.8042, + "step": 17293 + }, + { + "epoch": 0.44, + "learning_rate": 1.9281614853482635e-06, + "loss": 0.9302, + "step": 17294 + }, + { + "epoch": 0.44, + "learning_rate": 1.9281511866664283e-06, + "loss": 0.9473, + "step": 17295 + }, + { + "epoch": 0.44, + "learning_rate": 1.9281408872739504e-06, + "loss": 0.9297, + "step": 17296 + }, + { + "epoch": 0.44, + "learning_rate": 1.928130587170837e-06, + "loss": 0.9365, + "step": 17297 + }, + { + "epoch": 0.44, + "learning_rate": 1.9281202863570976e-06, + "loss": 0.7278, + "step": 17298 + }, + { + "epoch": 0.44, + "learning_rate": 1.928109984832739e-06, + "loss": 0.9082, + "step": 17299 + }, + { + "epoch": 0.44, + "learning_rate": 1.928099682597769e-06, + "loss": 0.8408, + "step": 17300 + }, + { + "epoch": 0.44, + "learning_rate": 1.928089379652196e-06, + "loss": 0.5466, + "step": 17301 + }, + { + "epoch": 0.44, + "learning_rate": 1.928079075996027e-06, + "loss": 0.8242, + "step": 17302 + }, + { + "epoch": 0.44, + "learning_rate": 1.928068771629271e-06, + "loss": 0.9053, + "step": 17303 + }, + { + "epoch": 0.44, + "learning_rate": 1.9280584665519357e-06, + "loss": 0.7129, + "step": 17304 + }, + { + "epoch": 0.44, + "learning_rate": 1.928048160764028e-06, + "loss": 0.9414, + "step": 17305 + }, + { + "epoch": 0.44, + "learning_rate": 1.928037854265557e-06, + "loss": 0.9756, + "step": 17306 + }, + { + "epoch": 0.44, + "learning_rate": 1.9280275470565302e-06, + "loss": 1.0684, + "step": 17307 + }, + { + "epoch": 0.44, + "learning_rate": 1.928017239136955e-06, + "loss": 0.8652, + "step": 17308 + }, + { + "epoch": 0.44, + "learning_rate": 1.92800693050684e-06, + "loss": 1.1523, + "step": 17309 + }, + { + "epoch": 0.44, + "learning_rate": 1.9279966211661924e-06, + "loss": 0.916, + "step": 17310 + }, + { + "epoch": 0.44, + "learning_rate": 1.9279863111150207e-06, + "loss": 0.7305, + "step": 17311 + }, + { + "epoch": 0.44, + "learning_rate": 1.9279760003533324e-06, + "loss": 0.7236, + "step": 17312 + }, + { + "epoch": 0.44, + "learning_rate": 1.927965688881136e-06, + "loss": 0.8203, + "step": 17313 + }, + { + "epoch": 0.44, + "learning_rate": 1.9279553766984383e-06, + "loss": 0.8975, + "step": 17314 + }, + { + "epoch": 0.44, + "learning_rate": 1.9279450638052483e-06, + "loss": 1.0801, + "step": 17315 + }, + { + "epoch": 0.44, + "learning_rate": 1.9279347502015734e-06, + "loss": 0.9922, + "step": 17316 + }, + { + "epoch": 0.44, + "learning_rate": 1.927924435887421e-06, + "loss": 1.2061, + "step": 17317 + }, + { + "epoch": 0.44, + "learning_rate": 1.9279141208628002e-06, + "loss": 0.8652, + "step": 17318 + }, + { + "epoch": 0.44, + "learning_rate": 1.9279038051277177e-06, + "loss": 0.9648, + "step": 17319 + }, + { + "epoch": 0.44, + "learning_rate": 1.9278934886821824e-06, + "loss": 0.793, + "step": 17320 + }, + { + "epoch": 0.44, + "learning_rate": 1.9278831715262017e-06, + "loss": 0.9414, + "step": 17321 + }, + { + "epoch": 0.44, + "learning_rate": 1.927872853659783e-06, + "loss": 1.1816, + "step": 17322 + }, + { + "epoch": 0.44, + "learning_rate": 1.927862535082935e-06, + "loss": 0.8984, + "step": 17323 + }, + { + "epoch": 0.44, + "learning_rate": 1.9278522157956653e-06, + "loss": 0.9189, + "step": 17324 + }, + { + "epoch": 0.44, + "learning_rate": 1.927841895797982e-06, + "loss": 1.0068, + "step": 17325 + }, + { + "epoch": 0.44, + "learning_rate": 1.927831575089893e-06, + "loss": 0.8257, + "step": 17326 + }, + { + "epoch": 0.44, + "learning_rate": 1.9278212536714052e-06, + "loss": 0.6934, + "step": 17327 + }, + { + "epoch": 0.44, + "learning_rate": 1.9278109315425284e-06, + "loss": 1.0469, + "step": 17328 + }, + { + "epoch": 0.44, + "learning_rate": 1.9278006087032687e-06, + "loss": 0.9561, + "step": 17329 + }, + { + "epoch": 0.44, + "learning_rate": 1.9277902851536346e-06, + "loss": 0.7773, + "step": 17330 + }, + { + "epoch": 0.44, + "learning_rate": 1.9277799608936347e-06, + "loss": 0.916, + "step": 17331 + }, + { + "epoch": 0.44, + "learning_rate": 1.927769635923276e-06, + "loss": 0.9082, + "step": 17332 + }, + { + "epoch": 0.44, + "learning_rate": 1.927759310242567e-06, + "loss": 0.7424, + "step": 17333 + }, + { + "epoch": 0.44, + "learning_rate": 1.927748983851515e-06, + "loss": 0.9863, + "step": 17334 + }, + { + "epoch": 0.44, + "learning_rate": 1.9277386567501284e-06, + "loss": 0.9971, + "step": 17335 + }, + { + "epoch": 0.44, + "learning_rate": 1.927728328938415e-06, + "loss": 0.7686, + "step": 17336 + }, + { + "epoch": 0.44, + "learning_rate": 1.927718000416383e-06, + "loss": 1.1221, + "step": 17337 + }, + { + "epoch": 0.44, + "learning_rate": 1.9277076711840397e-06, + "loss": 0.7632, + "step": 17338 + }, + { + "epoch": 0.44, + "learning_rate": 1.927697341241393e-06, + "loss": 0.9922, + "step": 17339 + }, + { + "epoch": 0.44, + "learning_rate": 1.927687010588452e-06, + "loss": 0.8569, + "step": 17340 + }, + { + "epoch": 0.44, + "learning_rate": 1.9276766792252227e-06, + "loss": 0.6296, + "step": 17341 + }, + { + "epoch": 0.44, + "learning_rate": 1.9276663471517144e-06, + "loss": 0.8081, + "step": 17342 + }, + { + "epoch": 0.44, + "learning_rate": 1.9276560143679347e-06, + "loss": 0.9023, + "step": 17343 + }, + { + "epoch": 0.44, + "learning_rate": 1.9276456808738916e-06, + "loss": 0.8652, + "step": 17344 + }, + { + "epoch": 0.44, + "learning_rate": 1.9276353466695923e-06, + "loss": 0.8857, + "step": 17345 + }, + { + "epoch": 0.44, + "learning_rate": 1.9276250117550458e-06, + "loss": 0.916, + "step": 17346 + }, + { + "epoch": 0.44, + "learning_rate": 1.9276146761302595e-06, + "loss": 0.7988, + "step": 17347 + }, + { + "epoch": 0.44, + "learning_rate": 1.9276043397952413e-06, + "loss": 1.126, + "step": 17348 + }, + { + "epoch": 0.44, + "learning_rate": 1.9275940027499986e-06, + "loss": 1.0518, + "step": 17349 + }, + { + "epoch": 0.44, + "learning_rate": 1.92758366499454e-06, + "loss": 0.9141, + "step": 17350 + }, + { + "epoch": 0.44, + "learning_rate": 1.927573326528874e-06, + "loss": 0.8398, + "step": 17351 + }, + { + "epoch": 0.44, + "learning_rate": 1.927562987353007e-06, + "loss": 0.687, + "step": 17352 + }, + { + "epoch": 0.44, + "learning_rate": 1.9275526474669475e-06, + "loss": 0.7695, + "step": 17353 + }, + { + "epoch": 0.44, + "learning_rate": 1.927542306870704e-06, + "loss": 0.873, + "step": 17354 + }, + { + "epoch": 0.44, + "learning_rate": 1.927531965564284e-06, + "loss": 0.9541, + "step": 17355 + }, + { + "epoch": 0.44, + "learning_rate": 1.9275216235476953e-06, + "loss": 0.8857, + "step": 17356 + }, + { + "epoch": 0.44, + "learning_rate": 1.927511280820946e-06, + "loss": 0.9307, + "step": 17357 + }, + { + "epoch": 0.44, + "learning_rate": 1.927500937384044e-06, + "loss": 0.7703, + "step": 17358 + }, + { + "epoch": 0.44, + "learning_rate": 1.927490593236997e-06, + "loss": 0.8633, + "step": 17359 + }, + { + "epoch": 0.44, + "learning_rate": 1.927480248379813e-06, + "loss": 0.7305, + "step": 17360 + }, + { + "epoch": 0.44, + "learning_rate": 1.9274699028125003e-06, + "loss": 0.7646, + "step": 17361 + }, + { + "epoch": 0.44, + "learning_rate": 1.9274595565350665e-06, + "loss": 0.8037, + "step": 17362 + }, + { + "epoch": 0.45, + "learning_rate": 1.9274492095475196e-06, + "loss": 0.8936, + "step": 17363 + }, + { + "epoch": 0.45, + "learning_rate": 1.9274388618498673e-06, + "loss": 0.8359, + "step": 17364 + }, + { + "epoch": 0.45, + "learning_rate": 1.927428513442118e-06, + "loss": 0.6323, + "step": 17365 + }, + { + "epoch": 0.45, + "learning_rate": 1.927418164324279e-06, + "loss": 1.1875, + "step": 17366 + }, + { + "epoch": 0.45, + "learning_rate": 1.927407814496359e-06, + "loss": 0.8994, + "step": 17367 + }, + { + "epoch": 0.45, + "learning_rate": 1.927397463958365e-06, + "loss": 0.6221, + "step": 17368 + }, + { + "epoch": 0.45, + "learning_rate": 1.9273871127103055e-06, + "loss": 1.0635, + "step": 17369 + }, + { + "epoch": 0.45, + "learning_rate": 1.9273767607521885e-06, + "loss": 1.123, + "step": 17370 + }, + { + "epoch": 0.45, + "learning_rate": 1.927366408084022e-06, + "loss": 0.8252, + "step": 17371 + }, + { + "epoch": 0.45, + "learning_rate": 1.927356054705813e-06, + "loss": 0.8535, + "step": 17372 + }, + { + "epoch": 0.45, + "learning_rate": 1.9273457006175704e-06, + "loss": 0.6111, + "step": 17373 + }, + { + "epoch": 0.45, + "learning_rate": 1.927335345819302e-06, + "loss": 0.9268, + "step": 17374 + }, + { + "epoch": 0.45, + "learning_rate": 1.9273249903110152e-06, + "loss": 0.7969, + "step": 17375 + }, + { + "epoch": 0.45, + "learning_rate": 1.927314634092719e-06, + "loss": 0.5889, + "step": 17376 + }, + { + "epoch": 0.45, + "learning_rate": 1.92730427716442e-06, + "loss": 0.5977, + "step": 17377 + }, + { + "epoch": 0.45, + "learning_rate": 1.9272939195261267e-06, + "loss": 0.9336, + "step": 17378 + }, + { + "epoch": 0.45, + "learning_rate": 1.927283561177848e-06, + "loss": 1.0439, + "step": 17379 + }, + { + "epoch": 0.45, + "learning_rate": 1.9272732021195898e-06, + "loss": 0.8174, + "step": 17380 + }, + { + "epoch": 0.45, + "learning_rate": 1.927262842351362e-06, + "loss": 0.9229, + "step": 17381 + }, + { + "epoch": 0.45, + "learning_rate": 1.927252481873171e-06, + "loss": 0.959, + "step": 17382 + }, + { + "epoch": 0.45, + "learning_rate": 1.9272421206850255e-06, + "loss": 0.9014, + "step": 17383 + }, + { + "epoch": 0.45, + "learning_rate": 1.9272317587869336e-06, + "loss": 0.9648, + "step": 17384 + }, + { + "epoch": 0.45, + "learning_rate": 1.927221396178903e-06, + "loss": 0.999, + "step": 17385 + }, + { + "epoch": 0.45, + "learning_rate": 1.927211032860942e-06, + "loss": 0.9795, + "step": 17386 + }, + { + "epoch": 0.45, + "learning_rate": 1.927200668833057e-06, + "loss": 0.9473, + "step": 17387 + }, + { + "epoch": 0.45, + "learning_rate": 1.927190304095258e-06, + "loss": 0.9922, + "step": 17388 + }, + { + "epoch": 0.45, + "learning_rate": 1.927179938647552e-06, + "loss": 0.8652, + "step": 17389 + }, + { + "epoch": 0.45, + "learning_rate": 1.9271695724899464e-06, + "loss": 0.9326, + "step": 17390 + }, + { + "epoch": 0.45, + "learning_rate": 1.9271592056224503e-06, + "loss": 0.7485, + "step": 17391 + }, + { + "epoch": 0.45, + "learning_rate": 1.9271488380450703e-06, + "loss": 0.7236, + "step": 17392 + }, + { + "epoch": 0.45, + "learning_rate": 1.9271384697578156e-06, + "loss": 0.9629, + "step": 17393 + }, + { + "epoch": 0.45, + "learning_rate": 1.9271281007606936e-06, + "loss": 1.0312, + "step": 17394 + }, + { + "epoch": 0.45, + "learning_rate": 1.9271177310537123e-06, + "loss": 0.7749, + "step": 17395 + }, + { + "epoch": 0.45, + "learning_rate": 1.927107360636879e-06, + "loss": 0.9717, + "step": 17396 + }, + { + "epoch": 0.45, + "learning_rate": 1.927096989510203e-06, + "loss": 0.6982, + "step": 17397 + }, + { + "epoch": 0.45, + "learning_rate": 1.9270866176736912e-06, + "loss": 0.8721, + "step": 17398 + }, + { + "epoch": 0.45, + "learning_rate": 1.9270762451273517e-06, + "loss": 0.8047, + "step": 17399 + }, + { + "epoch": 0.45, + "learning_rate": 1.9270658718711926e-06, + "loss": 1.2021, + "step": 17400 + }, + { + "epoch": 0.45, + "learning_rate": 1.9270554979052215e-06, + "loss": 0.958, + "step": 17401 + }, + { + "epoch": 0.45, + "learning_rate": 1.927045123229447e-06, + "loss": 0.9541, + "step": 17402 + }, + { + "epoch": 0.45, + "learning_rate": 1.9270347478438768e-06, + "loss": 0.821, + "step": 17403 + }, + { + "epoch": 0.45, + "learning_rate": 1.9270243717485183e-06, + "loss": 0.8496, + "step": 17404 + }, + { + "epoch": 0.45, + "learning_rate": 1.92701399494338e-06, + "loss": 0.8965, + "step": 17405 + }, + { + "epoch": 0.45, + "learning_rate": 1.9270036174284697e-06, + "loss": 0.8955, + "step": 17406 + }, + { + "epoch": 0.45, + "learning_rate": 1.9269932392037954e-06, + "loss": 0.9883, + "step": 17407 + }, + { + "epoch": 0.45, + "learning_rate": 1.9269828602693654e-06, + "loss": 0.9453, + "step": 17408 + }, + { + "epoch": 0.45, + "learning_rate": 1.9269724806251866e-06, + "loss": 0.8237, + "step": 17409 + }, + { + "epoch": 0.45, + "learning_rate": 1.926962100271268e-06, + "loss": 0.9033, + "step": 17410 + }, + { + "epoch": 0.45, + "learning_rate": 1.926951719207617e-06, + "loss": 0.8467, + "step": 17411 + }, + { + "epoch": 0.45, + "learning_rate": 1.9269413374342417e-06, + "loss": 0.8281, + "step": 17412 + }, + { + "epoch": 0.45, + "learning_rate": 1.9269309549511502e-06, + "loss": 0.7471, + "step": 17413 + }, + { + "epoch": 0.45, + "learning_rate": 1.9269205717583498e-06, + "loss": 0.8379, + "step": 17414 + }, + { + "epoch": 0.45, + "learning_rate": 1.9269101878558492e-06, + "loss": 0.9302, + "step": 17415 + }, + { + "epoch": 0.45, + "learning_rate": 1.926899803243656e-06, + "loss": 0.6943, + "step": 17416 + }, + { + "epoch": 0.45, + "learning_rate": 1.9268894179217787e-06, + "loss": 0.9595, + "step": 17417 + }, + { + "epoch": 0.45, + "learning_rate": 1.9268790318902244e-06, + "loss": 0.9307, + "step": 17418 + }, + { + "epoch": 0.45, + "learning_rate": 1.9268686451490014e-06, + "loss": 0.8115, + "step": 17419 + }, + { + "epoch": 0.45, + "learning_rate": 1.926858257698118e-06, + "loss": 1.0283, + "step": 17420 + }, + { + "epoch": 0.45, + "learning_rate": 1.926847869537582e-06, + "loss": 1.1543, + "step": 17421 + }, + { + "epoch": 0.45, + "learning_rate": 1.926837480667401e-06, + "loss": 0.7842, + "step": 17422 + }, + { + "epoch": 0.45, + "learning_rate": 1.9268270910875824e-06, + "loss": 0.8701, + "step": 17423 + }, + { + "epoch": 0.45, + "learning_rate": 1.9268167007981358e-06, + "loss": 0.8706, + "step": 17424 + }, + { + "epoch": 0.45, + "learning_rate": 1.9268063097990683e-06, + "loss": 0.9346, + "step": 17425 + }, + { + "epoch": 0.45, + "learning_rate": 1.9267959180903875e-06, + "loss": 1.0957, + "step": 17426 + }, + { + "epoch": 0.45, + "learning_rate": 1.9267855256721014e-06, + "loss": 0.9219, + "step": 17427 + }, + { + "epoch": 0.45, + "learning_rate": 1.9267751325442186e-06, + "loss": 0.8237, + "step": 17428 + }, + { + "epoch": 0.45, + "learning_rate": 1.9267647387067466e-06, + "loss": 0.7334, + "step": 17429 + }, + { + "epoch": 0.45, + "learning_rate": 1.926754344159694e-06, + "loss": 0.9199, + "step": 17430 + }, + { + "epoch": 0.45, + "learning_rate": 1.9267439489030674e-06, + "loss": 0.8457, + "step": 17431 + }, + { + "epoch": 0.45, + "learning_rate": 1.926733552936876e-06, + "loss": 0.8838, + "step": 17432 + }, + { + "epoch": 0.45, + "learning_rate": 1.926723156261127e-06, + "loss": 1.1074, + "step": 17433 + }, + { + "epoch": 0.45, + "learning_rate": 1.926712758875829e-06, + "loss": 0.8574, + "step": 17434 + }, + { + "epoch": 0.45, + "learning_rate": 1.9267023607809896e-06, + "loss": 1.0186, + "step": 17435 + }, + { + "epoch": 0.45, + "learning_rate": 1.9266919619766168e-06, + "loss": 0.9121, + "step": 17436 + }, + { + "epoch": 0.45, + "learning_rate": 1.926681562462719e-06, + "loss": 1.1318, + "step": 17437 + }, + { + "epoch": 0.45, + "learning_rate": 1.9266711622393032e-06, + "loss": 0.8286, + "step": 17438 + }, + { + "epoch": 0.45, + "learning_rate": 1.9266607613063777e-06, + "loss": 0.8789, + "step": 17439 + }, + { + "epoch": 0.45, + "learning_rate": 1.926650359663951e-06, + "loss": 0.7979, + "step": 17440 + }, + { + "epoch": 0.45, + "learning_rate": 1.9266399573120307e-06, + "loss": 0.8506, + "step": 17441 + }, + { + "epoch": 0.45, + "learning_rate": 1.926629554250625e-06, + "loss": 0.9795, + "step": 17442 + }, + { + "epoch": 0.45, + "learning_rate": 1.926619150479741e-06, + "loss": 0.7939, + "step": 17443 + }, + { + "epoch": 0.45, + "learning_rate": 1.9266087459993877e-06, + "loss": 0.8613, + "step": 17444 + }, + { + "epoch": 0.45, + "learning_rate": 1.926598340809573e-06, + "loss": 0.6875, + "step": 17445 + }, + { + "epoch": 0.45, + "learning_rate": 1.926587934910304e-06, + "loss": 0.8408, + "step": 17446 + }, + { + "epoch": 0.45, + "learning_rate": 1.92657752830159e-06, + "loss": 0.9355, + "step": 17447 + }, + { + "epoch": 0.45, + "learning_rate": 1.926567120983438e-06, + "loss": 0.9541, + "step": 17448 + }, + { + "epoch": 0.45, + "learning_rate": 1.9265567129558555e-06, + "loss": 0.958, + "step": 17449 + }, + { + "epoch": 0.45, + "learning_rate": 1.9265463042188517e-06, + "loss": 0.7168, + "step": 17450 + }, + { + "epoch": 0.45, + "learning_rate": 1.9265358947724336e-06, + "loss": 1.1436, + "step": 17451 + }, + { + "epoch": 0.45, + "learning_rate": 1.9265254846166097e-06, + "loss": 0.8154, + "step": 17452 + }, + { + "epoch": 0.45, + "learning_rate": 1.926515073751388e-06, + "loss": 1.0859, + "step": 17453 + }, + { + "epoch": 0.45, + "learning_rate": 1.926504662176776e-06, + "loss": 0.9062, + "step": 17454 + }, + { + "epoch": 0.45, + "learning_rate": 1.9264942498927824e-06, + "loss": 0.9639, + "step": 17455 + }, + { + "epoch": 0.45, + "learning_rate": 1.9264838368994147e-06, + "loss": 0.9678, + "step": 17456 + }, + { + "epoch": 0.45, + "learning_rate": 1.926473423196681e-06, + "loss": 1.0098, + "step": 17457 + }, + { + "epoch": 0.45, + "learning_rate": 1.9264630087845886e-06, + "loss": 0.9014, + "step": 17458 + }, + { + "epoch": 0.45, + "learning_rate": 1.9264525936631467e-06, + "loss": 0.9141, + "step": 17459 + }, + { + "epoch": 0.45, + "learning_rate": 1.9264421778323622e-06, + "loss": 0.8662, + "step": 17460 + }, + { + "epoch": 0.45, + "learning_rate": 1.926431761292244e-06, + "loss": 0.8525, + "step": 17461 + }, + { + "epoch": 0.45, + "learning_rate": 1.926421344042799e-06, + "loss": 0.6724, + "step": 17462 + }, + { + "epoch": 0.45, + "learning_rate": 1.926410926084036e-06, + "loss": 0.9658, + "step": 17463 + }, + { + "epoch": 0.45, + "learning_rate": 1.926400507415963e-06, + "loss": 0.9922, + "step": 17464 + }, + { + "epoch": 0.45, + "learning_rate": 1.9263900880385878e-06, + "loss": 0.8359, + "step": 17465 + }, + { + "epoch": 0.45, + "learning_rate": 1.926379667951918e-06, + "loss": 0.8369, + "step": 17466 + }, + { + "epoch": 0.45, + "learning_rate": 1.926369247155962e-06, + "loss": 0.8452, + "step": 17467 + }, + { + "epoch": 0.45, + "learning_rate": 1.926358825650728e-06, + "loss": 1.0254, + "step": 17468 + }, + { + "epoch": 0.45, + "learning_rate": 1.926348403436223e-06, + "loss": 1.125, + "step": 17469 + }, + { + "epoch": 0.45, + "learning_rate": 1.926337980512456e-06, + "loss": 0.8882, + "step": 17470 + }, + { + "epoch": 0.45, + "learning_rate": 1.9263275568794346e-06, + "loss": 0.8379, + "step": 17471 + }, + { + "epoch": 0.45, + "learning_rate": 1.9263171325371667e-06, + "loss": 0.7891, + "step": 17472 + }, + { + "epoch": 0.45, + "learning_rate": 1.9263067074856603e-06, + "loss": 0.8623, + "step": 17473 + }, + { + "epoch": 0.45, + "learning_rate": 1.9262962817249235e-06, + "loss": 1.0898, + "step": 17474 + }, + { + "epoch": 0.45, + "learning_rate": 1.9262858552549642e-06, + "loss": 0.998, + "step": 17475 + }, + { + "epoch": 0.45, + "learning_rate": 1.9262754280757903e-06, + "loss": 0.7954, + "step": 17476 + }, + { + "epoch": 0.45, + "learning_rate": 1.9262650001874105e-06, + "loss": 0.9561, + "step": 17477 + }, + { + "epoch": 0.45, + "learning_rate": 1.9262545715898315e-06, + "loss": 0.9961, + "step": 17478 + }, + { + "epoch": 0.45, + "learning_rate": 1.926244142283062e-06, + "loss": 1.0625, + "step": 17479 + }, + { + "epoch": 0.45, + "learning_rate": 1.9262337122671103e-06, + "loss": 1.0391, + "step": 17480 + }, + { + "epoch": 0.45, + "learning_rate": 1.9262232815419837e-06, + "loss": 0.8159, + "step": 17481 + }, + { + "epoch": 0.45, + "learning_rate": 1.926212850107691e-06, + "loss": 0.5723, + "step": 17482 + }, + { + "epoch": 0.45, + "learning_rate": 1.9262024179642395e-06, + "loss": 0.9482, + "step": 17483 + }, + { + "epoch": 0.45, + "learning_rate": 1.926191985111637e-06, + "loss": 0.5923, + "step": 17484 + }, + { + "epoch": 0.45, + "learning_rate": 1.926181551549892e-06, + "loss": 0.8848, + "step": 17485 + }, + { + "epoch": 0.45, + "learning_rate": 1.9261711172790127e-06, + "loss": 0.8682, + "step": 17486 + }, + { + "epoch": 0.45, + "learning_rate": 1.926160682299007e-06, + "loss": 0.5776, + "step": 17487 + }, + { + "epoch": 0.45, + "learning_rate": 1.926150246609882e-06, + "loss": 0.8242, + "step": 17488 + }, + { + "epoch": 0.45, + "learning_rate": 1.9261398102116467e-06, + "loss": 0.9058, + "step": 17489 + }, + { + "epoch": 0.45, + "learning_rate": 1.9261293731043085e-06, + "loss": 0.96, + "step": 17490 + }, + { + "epoch": 0.45, + "learning_rate": 1.926118935287876e-06, + "loss": 0.8096, + "step": 17491 + }, + { + "epoch": 0.45, + "learning_rate": 1.9261084967623567e-06, + "loss": 0.9531, + "step": 17492 + }, + { + "epoch": 0.45, + "learning_rate": 1.9260980575277584e-06, + "loss": 0.9014, + "step": 17493 + }, + { + "epoch": 0.45, + "learning_rate": 1.9260876175840893e-06, + "loss": 0.9355, + "step": 17494 + }, + { + "epoch": 0.45, + "learning_rate": 1.9260771769313583e-06, + "loss": 0.7842, + "step": 17495 + }, + { + "epoch": 0.45, + "learning_rate": 1.926066735569572e-06, + "loss": 0.9199, + "step": 17496 + }, + { + "epoch": 0.45, + "learning_rate": 1.926056293498739e-06, + "loss": 0.8418, + "step": 17497 + }, + { + "epoch": 0.45, + "learning_rate": 1.926045850718867e-06, + "loss": 1.0186, + "step": 17498 + }, + { + "epoch": 0.45, + "learning_rate": 1.926035407229965e-06, + "loss": 0.8291, + "step": 17499 + }, + { + "epoch": 0.45, + "learning_rate": 1.9260249630320398e-06, + "loss": 0.8213, + "step": 17500 + }, + { + "epoch": 0.45, + "learning_rate": 1.9260145181250998e-06, + "loss": 0.9141, + "step": 17501 + }, + { + "epoch": 0.45, + "learning_rate": 1.9260040725091534e-06, + "loss": 0.9502, + "step": 17502 + }, + { + "epoch": 0.45, + "learning_rate": 1.925993626184208e-06, + "loss": 0.7783, + "step": 17503 + }, + { + "epoch": 0.45, + "learning_rate": 1.925983179150272e-06, + "loss": 1.0176, + "step": 17504 + }, + { + "epoch": 0.45, + "learning_rate": 1.925972731407353e-06, + "loss": 0.75, + "step": 17505 + }, + { + "epoch": 0.45, + "learning_rate": 1.9259622829554596e-06, + "loss": 0.9893, + "step": 17506 + }, + { + "epoch": 0.45, + "learning_rate": 1.9259518337945994e-06, + "loss": 0.6455, + "step": 17507 + }, + { + "epoch": 0.45, + "learning_rate": 1.9259413839247803e-06, + "loss": 0.8584, + "step": 17508 + }, + { + "epoch": 0.45, + "learning_rate": 1.9259309333460103e-06, + "loss": 0.8906, + "step": 17509 + }, + { + "epoch": 0.45, + "learning_rate": 1.925920482058298e-06, + "loss": 1.127, + "step": 17510 + }, + { + "epoch": 0.45, + "learning_rate": 1.9259100300616507e-06, + "loss": 0.6641, + "step": 17511 + }, + { + "epoch": 0.45, + "learning_rate": 1.9258995773560767e-06, + "loss": 0.833, + "step": 17512 + }, + { + "epoch": 0.45, + "learning_rate": 1.925889123941584e-06, + "loss": 0.9971, + "step": 17513 + }, + { + "epoch": 0.45, + "learning_rate": 1.9258786698181805e-06, + "loss": 1.0859, + "step": 17514 + }, + { + "epoch": 0.45, + "learning_rate": 1.925868214985874e-06, + "loss": 0.8149, + "step": 17515 + }, + { + "epoch": 0.45, + "learning_rate": 1.9258577594446735e-06, + "loss": 0.7324, + "step": 17516 + }, + { + "epoch": 0.45, + "learning_rate": 1.925847303194586e-06, + "loss": 1.1777, + "step": 17517 + }, + { + "epoch": 0.45, + "learning_rate": 1.9258368462356195e-06, + "loss": 0.9121, + "step": 17518 + }, + { + "epoch": 0.45, + "learning_rate": 1.9258263885677825e-06, + "loss": 1.0811, + "step": 17519 + }, + { + "epoch": 0.45, + "learning_rate": 1.925815930191083e-06, + "loss": 0.915, + "step": 17520 + }, + { + "epoch": 0.45, + "learning_rate": 1.9258054711055283e-06, + "loss": 0.6503, + "step": 17521 + }, + { + "epoch": 0.45, + "learning_rate": 1.925795011311127e-06, + "loss": 0.8594, + "step": 17522 + }, + { + "epoch": 0.45, + "learning_rate": 1.9257845508078872e-06, + "loss": 0.9404, + "step": 17523 + }, + { + "epoch": 0.45, + "learning_rate": 1.925774089595817e-06, + "loss": 0.689, + "step": 17524 + }, + { + "epoch": 0.45, + "learning_rate": 1.925763627674924e-06, + "loss": 0.8906, + "step": 17525 + }, + { + "epoch": 0.45, + "learning_rate": 1.9257531650452164e-06, + "loss": 0.8545, + "step": 17526 + }, + { + "epoch": 0.45, + "learning_rate": 1.925742701706702e-06, + "loss": 1.0137, + "step": 17527 + }, + { + "epoch": 0.45, + "learning_rate": 1.925732237659389e-06, + "loss": 0.9004, + "step": 17528 + }, + { + "epoch": 0.45, + "learning_rate": 1.9257217729032855e-06, + "loss": 0.832, + "step": 17529 + }, + { + "epoch": 0.45, + "learning_rate": 1.9257113074383994e-06, + "loss": 1.1055, + "step": 17530 + }, + { + "epoch": 0.45, + "learning_rate": 1.9257008412647385e-06, + "loss": 0.7822, + "step": 17531 + }, + { + "epoch": 0.45, + "learning_rate": 1.9256903743823114e-06, + "loss": 0.8145, + "step": 17532 + }, + { + "epoch": 0.45, + "learning_rate": 1.925679906791125e-06, + "loss": 0.8418, + "step": 17533 + }, + { + "epoch": 0.45, + "learning_rate": 1.925669438491189e-06, + "loss": 0.9668, + "step": 17534 + }, + { + "epoch": 0.45, + "learning_rate": 1.92565896948251e-06, + "loss": 0.9453, + "step": 17535 + }, + { + "epoch": 0.45, + "learning_rate": 1.925648499765096e-06, + "loss": 0.9756, + "step": 17536 + }, + { + "epoch": 0.45, + "learning_rate": 1.9256380293389564e-06, + "loss": 1.0352, + "step": 17537 + }, + { + "epoch": 0.45, + "learning_rate": 1.925627558204098e-06, + "loss": 0.9316, + "step": 17538 + }, + { + "epoch": 0.45, + "learning_rate": 1.925617086360529e-06, + "loss": 0.8838, + "step": 17539 + }, + { + "epoch": 0.45, + "learning_rate": 1.925606613808258e-06, + "loss": 0.8604, + "step": 17540 + }, + { + "epoch": 0.45, + "learning_rate": 1.925596140547292e-06, + "loss": 1.0664, + "step": 17541 + }, + { + "epoch": 0.45, + "learning_rate": 1.92558566657764e-06, + "loss": 1.0879, + "step": 17542 + }, + { + "epoch": 0.45, + "learning_rate": 1.9255751918993094e-06, + "loss": 0.6094, + "step": 17543 + }, + { + "epoch": 0.45, + "learning_rate": 1.9255647165123086e-06, + "loss": 0.9062, + "step": 17544 + }, + { + "epoch": 0.45, + "learning_rate": 1.925554240416645e-06, + "loss": 0.8428, + "step": 17545 + }, + { + "epoch": 0.45, + "learning_rate": 1.925543763612328e-06, + "loss": 1.04, + "step": 17546 + }, + { + "epoch": 0.45, + "learning_rate": 1.925533286099364e-06, + "loss": 1.0117, + "step": 17547 + }, + { + "epoch": 0.45, + "learning_rate": 1.9255228078777615e-06, + "loss": 0.8535, + "step": 17548 + }, + { + "epoch": 0.45, + "learning_rate": 1.9255123289475295e-06, + "loss": 0.793, + "step": 17549 + }, + { + "epoch": 0.45, + "learning_rate": 1.9255018493086743e-06, + "loss": 0.7549, + "step": 17550 + }, + { + "epoch": 0.45, + "learning_rate": 1.9254913689612054e-06, + "loss": 0.998, + "step": 17551 + }, + { + "epoch": 0.45, + "learning_rate": 1.9254808879051304e-06, + "loss": 0.8088, + "step": 17552 + }, + { + "epoch": 0.45, + "learning_rate": 1.9254704061404576e-06, + "loss": 1.0361, + "step": 17553 + }, + { + "epoch": 0.45, + "learning_rate": 1.9254599236671943e-06, + "loss": 0.916, + "step": 17554 + }, + { + "epoch": 0.45, + "learning_rate": 1.9254494404853486e-06, + "loss": 0.7676, + "step": 17555 + }, + { + "epoch": 0.45, + "learning_rate": 1.9254389565949294e-06, + "loss": 0.8301, + "step": 17556 + }, + { + "epoch": 0.45, + "learning_rate": 1.9254284719959433e-06, + "loss": 0.9375, + "step": 17557 + }, + { + "epoch": 0.45, + "learning_rate": 1.9254179866884e-06, + "loss": 0.9902, + "step": 17558 + }, + { + "epoch": 0.45, + "learning_rate": 1.9254075006723065e-06, + "loss": 0.8271, + "step": 17559 + }, + { + "epoch": 0.45, + "learning_rate": 1.925397013947671e-06, + "loss": 0.7075, + "step": 17560 + }, + { + "epoch": 0.45, + "learning_rate": 1.9253865265145012e-06, + "loss": 0.8135, + "step": 17561 + }, + { + "epoch": 0.45, + "learning_rate": 1.925376038372806e-06, + "loss": 0.8604, + "step": 17562 + }, + { + "epoch": 0.45, + "learning_rate": 1.9253655495225923e-06, + "loss": 0.6406, + "step": 17563 + }, + { + "epoch": 0.45, + "learning_rate": 1.9253550599638692e-06, + "loss": 0.9697, + "step": 17564 + }, + { + "epoch": 0.45, + "learning_rate": 1.925344569696644e-06, + "loss": 0.9717, + "step": 17565 + }, + { + "epoch": 0.45, + "learning_rate": 1.925334078720925e-06, + "loss": 0.9541, + "step": 17566 + }, + { + "epoch": 0.45, + "learning_rate": 1.9253235870367207e-06, + "loss": 0.8447, + "step": 17567 + }, + { + "epoch": 0.45, + "learning_rate": 1.9253130946440384e-06, + "loss": 0.8467, + "step": 17568 + }, + { + "epoch": 0.45, + "learning_rate": 1.9253026015428867e-06, + "loss": 0.877, + "step": 17569 + }, + { + "epoch": 0.45, + "learning_rate": 1.925292107733273e-06, + "loss": 0.6162, + "step": 17570 + }, + { + "epoch": 0.45, + "learning_rate": 1.9252816132152058e-06, + "loss": 1.0244, + "step": 17571 + }, + { + "epoch": 0.45, + "learning_rate": 1.925271117988693e-06, + "loss": 0.834, + "step": 17572 + }, + { + "epoch": 0.45, + "learning_rate": 1.9252606220537427e-06, + "loss": 0.7178, + "step": 17573 + }, + { + "epoch": 0.45, + "learning_rate": 1.9252501254103627e-06, + "loss": 1.0195, + "step": 17574 + }, + { + "epoch": 0.45, + "learning_rate": 1.9252396280585613e-06, + "loss": 0.7617, + "step": 17575 + }, + { + "epoch": 0.45, + "learning_rate": 1.9252291299983464e-06, + "loss": 0.9375, + "step": 17576 + }, + { + "epoch": 0.45, + "learning_rate": 1.925218631229726e-06, + "loss": 0.8198, + "step": 17577 + }, + { + "epoch": 0.45, + "learning_rate": 1.925208131752709e-06, + "loss": 1.0215, + "step": 17578 + }, + { + "epoch": 0.45, + "learning_rate": 1.925197631567302e-06, + "loss": 0.6733, + "step": 17579 + }, + { + "epoch": 0.45, + "learning_rate": 1.9251871306735135e-06, + "loss": 0.499, + "step": 17580 + }, + { + "epoch": 0.45, + "learning_rate": 1.9251766290713524e-06, + "loss": 0.7075, + "step": 17581 + }, + { + "epoch": 0.45, + "learning_rate": 1.9251661267608257e-06, + "loss": 0.8179, + "step": 17582 + }, + { + "epoch": 0.45, + "learning_rate": 1.925155623741942e-06, + "loss": 0.7056, + "step": 17583 + }, + { + "epoch": 0.45, + "learning_rate": 1.925145120014709e-06, + "loss": 0.9316, + "step": 17584 + }, + { + "epoch": 0.45, + "learning_rate": 1.925134615579135e-06, + "loss": 0.7954, + "step": 17585 + }, + { + "epoch": 0.45, + "learning_rate": 1.925124110435228e-06, + "loss": 0.9873, + "step": 17586 + }, + { + "epoch": 0.45, + "learning_rate": 1.925113604582996e-06, + "loss": 0.9639, + "step": 17587 + }, + { + "epoch": 0.45, + "learning_rate": 1.925103098022447e-06, + "loss": 0.8525, + "step": 17588 + }, + { + "epoch": 0.45, + "learning_rate": 1.925092590753589e-06, + "loss": 0.8516, + "step": 17589 + }, + { + "epoch": 0.45, + "learning_rate": 1.9250820827764302e-06, + "loss": 0.8384, + "step": 17590 + }, + { + "epoch": 0.45, + "learning_rate": 1.9250715740909785e-06, + "loss": 1.0146, + "step": 17591 + }, + { + "epoch": 0.45, + "learning_rate": 1.9250610646972426e-06, + "loss": 0.7783, + "step": 17592 + }, + { + "epoch": 0.45, + "learning_rate": 1.9250505545952295e-06, + "loss": 0.9795, + "step": 17593 + }, + { + "epoch": 0.45, + "learning_rate": 1.925040043784948e-06, + "loss": 0.7332, + "step": 17594 + }, + { + "epoch": 0.45, + "learning_rate": 1.9250295322664056e-06, + "loss": 0.9863, + "step": 17595 + }, + { + "epoch": 0.45, + "learning_rate": 1.9250190200396104e-06, + "loss": 1.001, + "step": 17596 + }, + { + "epoch": 0.45, + "learning_rate": 1.925008507104571e-06, + "loss": 0.8281, + "step": 17597 + }, + { + "epoch": 0.45, + "learning_rate": 1.924997993461295e-06, + "loss": 0.751, + "step": 17598 + }, + { + "epoch": 0.45, + "learning_rate": 1.9249874791097905e-06, + "loss": 0.6821, + "step": 17599 + }, + { + "epoch": 0.45, + "learning_rate": 1.924976964050066e-06, + "loss": 0.8701, + "step": 17600 + }, + { + "epoch": 0.45, + "learning_rate": 1.924966448282129e-06, + "loss": 0.7134, + "step": 17601 + }, + { + "epoch": 0.45, + "learning_rate": 1.9249559318059875e-06, + "loss": 0.9863, + "step": 17602 + }, + { + "epoch": 0.45, + "learning_rate": 1.92494541462165e-06, + "loss": 0.9492, + "step": 17603 + }, + { + "epoch": 0.45, + "learning_rate": 1.924934896729124e-06, + "loss": 0.8774, + "step": 17604 + }, + { + "epoch": 0.45, + "learning_rate": 1.9249243781284188e-06, + "loss": 0.9629, + "step": 17605 + }, + { + "epoch": 0.45, + "learning_rate": 1.9249138588195404e-06, + "loss": 0.9414, + "step": 17606 + }, + { + "epoch": 0.45, + "learning_rate": 1.9249033388024985e-06, + "loss": 0.6062, + "step": 17607 + }, + { + "epoch": 0.45, + "learning_rate": 1.9248928180773006e-06, + "loss": 0.6953, + "step": 17608 + }, + { + "epoch": 0.45, + "learning_rate": 1.924882296643955e-06, + "loss": 0.9248, + "step": 17609 + }, + { + "epoch": 0.45, + "learning_rate": 1.924871774502469e-06, + "loss": 1.1074, + "step": 17610 + }, + { + "epoch": 0.45, + "learning_rate": 1.9248612516528516e-06, + "loss": 0.9219, + "step": 17611 + }, + { + "epoch": 0.45, + "learning_rate": 1.9248507280951103e-06, + "loss": 0.8281, + "step": 17612 + }, + { + "epoch": 0.45, + "learning_rate": 1.9248402038292533e-06, + "loss": 0.6689, + "step": 17613 + }, + { + "epoch": 0.45, + "learning_rate": 1.924829678855289e-06, + "loss": 0.7861, + "step": 17614 + }, + { + "epoch": 0.45, + "learning_rate": 1.924819153173225e-06, + "loss": 0.9199, + "step": 17615 + }, + { + "epoch": 0.45, + "learning_rate": 1.9248086267830696e-06, + "loss": 0.8252, + "step": 17616 + }, + { + "epoch": 0.45, + "learning_rate": 1.9247980996848305e-06, + "loss": 0.8994, + "step": 17617 + }, + { + "epoch": 0.45, + "learning_rate": 1.9247875718785164e-06, + "loss": 0.9062, + "step": 17618 + }, + { + "epoch": 0.45, + "learning_rate": 1.9247770433641344e-06, + "loss": 0.8833, + "step": 17619 + }, + { + "epoch": 0.45, + "learning_rate": 1.9247665141416934e-06, + "loss": 0.9004, + "step": 17620 + }, + { + "epoch": 0.45, + "learning_rate": 1.9247559842112015e-06, + "loss": 0.8936, + "step": 17621 + }, + { + "epoch": 0.45, + "learning_rate": 1.9247454535726663e-06, + "loss": 1.0049, + "step": 17622 + }, + { + "epoch": 0.45, + "learning_rate": 1.9247349222260958e-06, + "loss": 1.0469, + "step": 17623 + }, + { + "epoch": 0.45, + "learning_rate": 1.9247243901714985e-06, + "loss": 1.0312, + "step": 17624 + }, + { + "epoch": 0.45, + "learning_rate": 1.924713857408882e-06, + "loss": 0.9541, + "step": 17625 + }, + { + "epoch": 0.45, + "learning_rate": 1.924703323938255e-06, + "loss": 0.9971, + "step": 17626 + }, + { + "epoch": 0.45, + "learning_rate": 1.924692789759625e-06, + "loss": 0.9062, + "step": 17627 + }, + { + "epoch": 0.45, + "learning_rate": 1.924682254873e-06, + "loss": 0.8037, + "step": 17628 + }, + { + "epoch": 0.45, + "learning_rate": 1.924671719278389e-06, + "loss": 0.9619, + "step": 17629 + }, + { + "epoch": 0.45, + "learning_rate": 1.924661182975799e-06, + "loss": 0.7881, + "step": 17630 + }, + { + "epoch": 0.45, + "learning_rate": 1.924650645965238e-06, + "loss": 0.8623, + "step": 17631 + }, + { + "epoch": 0.45, + "learning_rate": 1.9246401082467153e-06, + "loss": 0.9004, + "step": 17632 + }, + { + "epoch": 0.45, + "learning_rate": 1.9246295698202377e-06, + "loss": 0.7297, + "step": 17633 + }, + { + "epoch": 0.45, + "learning_rate": 1.9246190306858137e-06, + "loss": 0.5986, + "step": 17634 + }, + { + "epoch": 0.45, + "learning_rate": 1.9246084908434515e-06, + "loss": 1.0986, + "step": 17635 + }, + { + "epoch": 0.45, + "learning_rate": 1.924597950293159e-06, + "loss": 0.8428, + "step": 17636 + }, + { + "epoch": 0.45, + "learning_rate": 1.924587409034945e-06, + "loss": 0.6895, + "step": 17637 + }, + { + "epoch": 0.45, + "learning_rate": 1.924576867068816e-06, + "loss": 0.9189, + "step": 17638 + }, + { + "epoch": 0.45, + "learning_rate": 1.9245663243947817e-06, + "loss": 0.7451, + "step": 17639 + }, + { + "epoch": 0.45, + "learning_rate": 1.9245557810128492e-06, + "loss": 0.79, + "step": 17640 + }, + { + "epoch": 0.45, + "learning_rate": 1.924545236923027e-06, + "loss": 0.7119, + "step": 17641 + }, + { + "epoch": 0.45, + "learning_rate": 1.9245346921253228e-06, + "loss": 0.8931, + "step": 17642 + }, + { + "epoch": 0.45, + "learning_rate": 1.924524146619745e-06, + "loss": 1.0254, + "step": 17643 + }, + { + "epoch": 0.45, + "learning_rate": 1.9245136004063015e-06, + "loss": 0.7949, + "step": 17644 + }, + { + "epoch": 0.45, + "learning_rate": 1.924503053485001e-06, + "loss": 1.0488, + "step": 17645 + }, + { + "epoch": 0.45, + "learning_rate": 1.9244925058558503e-06, + "loss": 1.1836, + "step": 17646 + }, + { + "epoch": 0.45, + "learning_rate": 1.9244819575188585e-06, + "loss": 0.8438, + "step": 17647 + }, + { + "epoch": 0.45, + "learning_rate": 1.924471408474033e-06, + "loss": 1.0137, + "step": 17648 + }, + { + "epoch": 0.45, + "learning_rate": 1.924460858721383e-06, + "loss": 0.915, + "step": 17649 + }, + { + "epoch": 0.45, + "learning_rate": 1.924450308260915e-06, + "loss": 1.127, + "step": 17650 + }, + { + "epoch": 0.45, + "learning_rate": 1.9244397570926386e-06, + "loss": 0.8071, + "step": 17651 + }, + { + "epoch": 0.45, + "learning_rate": 1.924429205216561e-06, + "loss": 0.917, + "step": 17652 + }, + { + "epoch": 0.45, + "learning_rate": 1.92441865263269e-06, + "loss": 0.7197, + "step": 17653 + }, + { + "epoch": 0.45, + "learning_rate": 1.924408099341035e-06, + "loss": 0.9482, + "step": 17654 + }, + { + "epoch": 0.45, + "learning_rate": 1.9243975453416025e-06, + "loss": 0.9941, + "step": 17655 + }, + { + "epoch": 0.45, + "learning_rate": 1.9243869906344016e-06, + "loss": 0.9873, + "step": 17656 + }, + { + "epoch": 0.45, + "learning_rate": 1.92437643521944e-06, + "loss": 0.8354, + "step": 17657 + }, + { + "epoch": 0.45, + "learning_rate": 1.924365879096726e-06, + "loss": 0.8984, + "step": 17658 + }, + { + "epoch": 0.45, + "learning_rate": 1.924355322266267e-06, + "loss": 0.7446, + "step": 17659 + }, + { + "epoch": 0.45, + "learning_rate": 1.9243447647280724e-06, + "loss": 0.7876, + "step": 17660 + }, + { + "epoch": 0.45, + "learning_rate": 1.924334206482149e-06, + "loss": 0.8027, + "step": 17661 + }, + { + "epoch": 0.45, + "learning_rate": 1.9243236475285056e-06, + "loss": 0.9668, + "step": 17662 + }, + { + "epoch": 0.45, + "learning_rate": 1.92431308786715e-06, + "loss": 0.7949, + "step": 17663 + }, + { + "epoch": 0.45, + "learning_rate": 1.924302527498091e-06, + "loss": 0.8164, + "step": 17664 + }, + { + "epoch": 0.45, + "learning_rate": 1.924291966421335e-06, + "loss": 1.0557, + "step": 17665 + }, + { + "epoch": 0.45, + "learning_rate": 1.924281404636892e-06, + "loss": 0.5422, + "step": 17666 + }, + { + "epoch": 0.45, + "learning_rate": 1.9242708421447688e-06, + "loss": 0.9434, + "step": 17667 + }, + { + "epoch": 0.45, + "learning_rate": 1.9242602789449737e-06, + "loss": 0.7939, + "step": 17668 + }, + { + "epoch": 0.45, + "learning_rate": 1.9242497150375153e-06, + "loss": 0.7773, + "step": 17669 + }, + { + "epoch": 0.45, + "learning_rate": 1.9242391504224014e-06, + "loss": 0.9629, + "step": 17670 + }, + { + "epoch": 0.45, + "learning_rate": 1.92422858509964e-06, + "loss": 1.0723, + "step": 17671 + }, + { + "epoch": 0.45, + "learning_rate": 1.9242180190692394e-06, + "loss": 0.7261, + "step": 17672 + }, + { + "epoch": 0.45, + "learning_rate": 1.9242074523312073e-06, + "loss": 0.9746, + "step": 17673 + }, + { + "epoch": 0.45, + "learning_rate": 1.9241968848855525e-06, + "loss": 0.8828, + "step": 17674 + }, + { + "epoch": 0.45, + "learning_rate": 1.924186316732282e-06, + "loss": 0.7178, + "step": 17675 + }, + { + "epoch": 0.45, + "learning_rate": 1.924175747871405e-06, + "loss": 0.7227, + "step": 17676 + }, + { + "epoch": 0.45, + "learning_rate": 1.9241651783029293e-06, + "loss": 1.0332, + "step": 17677 + }, + { + "epoch": 0.45, + "learning_rate": 1.9241546080268626e-06, + "loss": 1.0088, + "step": 17678 + }, + { + "epoch": 0.45, + "learning_rate": 1.924144037043213e-06, + "loss": 0.7251, + "step": 17679 + }, + { + "epoch": 0.45, + "learning_rate": 1.9241334653519893e-06, + "loss": 0.957, + "step": 17680 + }, + { + "epoch": 0.45, + "learning_rate": 1.9241228929531983e-06, + "loss": 0.6973, + "step": 17681 + }, + { + "epoch": 0.45, + "learning_rate": 1.92411231984685e-06, + "loss": 0.6899, + "step": 17682 + }, + { + "epoch": 0.45, + "learning_rate": 1.92410174603295e-06, + "loss": 0.8477, + "step": 17683 + }, + { + "epoch": 0.45, + "learning_rate": 1.924091171511509e-06, + "loss": 0.9082, + "step": 17684 + }, + { + "epoch": 0.45, + "learning_rate": 1.924080596282533e-06, + "loss": 0.8936, + "step": 17685 + }, + { + "epoch": 0.45, + "learning_rate": 1.924070020346032e-06, + "loss": 0.7759, + "step": 17686 + }, + { + "epoch": 0.45, + "learning_rate": 1.9240594437020123e-06, + "loss": 0.8364, + "step": 17687 + }, + { + "epoch": 0.45, + "learning_rate": 1.924048866350483e-06, + "loss": 1.0234, + "step": 17688 + }, + { + "epoch": 0.45, + "learning_rate": 1.924038288291452e-06, + "loss": 0.834, + "step": 17689 + }, + { + "epoch": 0.45, + "learning_rate": 1.924027709524927e-06, + "loss": 0.7129, + "step": 17690 + }, + { + "epoch": 0.45, + "learning_rate": 1.9240171300509166e-06, + "loss": 0.8584, + "step": 17691 + }, + { + "epoch": 0.45, + "learning_rate": 1.924006549869429e-06, + "loss": 1.082, + "step": 17692 + }, + { + "epoch": 0.45, + "learning_rate": 1.923995968980472e-06, + "loss": 0.9102, + "step": 17693 + }, + { + "epoch": 0.45, + "learning_rate": 1.923985387384054e-06, + "loss": 0.9199, + "step": 17694 + }, + { + "epoch": 0.45, + "learning_rate": 1.9239748050801824e-06, + "loss": 0.7842, + "step": 17695 + }, + { + "epoch": 0.45, + "learning_rate": 1.923964222068866e-06, + "loss": 1.1025, + "step": 17696 + }, + { + "epoch": 0.45, + "learning_rate": 1.923953638350113e-06, + "loss": 0.8809, + "step": 17697 + }, + { + "epoch": 0.45, + "learning_rate": 1.9239430539239305e-06, + "loss": 0.79, + "step": 17698 + }, + { + "epoch": 0.45, + "learning_rate": 1.923932468790328e-06, + "loss": 0.8799, + "step": 17699 + }, + { + "epoch": 0.45, + "learning_rate": 1.923921882949312e-06, + "loss": 0.9551, + "step": 17700 + }, + { + "epoch": 0.45, + "learning_rate": 1.9239112964008925e-06, + "loss": 0.9336, + "step": 17701 + }, + { + "epoch": 0.45, + "learning_rate": 1.9239007091450762e-06, + "loss": 0.8389, + "step": 17702 + }, + { + "epoch": 0.45, + "learning_rate": 1.9238901211818715e-06, + "loss": 0.8887, + "step": 17703 + }, + { + "epoch": 0.45, + "learning_rate": 1.9238795325112867e-06, + "loss": 0.6611, + "step": 17704 + }, + { + "epoch": 0.45, + "learning_rate": 1.9238689431333298e-06, + "loss": 0.9443, + "step": 17705 + }, + { + "epoch": 0.45, + "learning_rate": 1.923858353048009e-06, + "loss": 0.8298, + "step": 17706 + }, + { + "epoch": 0.45, + "learning_rate": 1.923847762255332e-06, + "loss": 0.9326, + "step": 17707 + }, + { + "epoch": 0.45, + "learning_rate": 1.923837170755308e-06, + "loss": 0.9395, + "step": 17708 + }, + { + "epoch": 0.45, + "learning_rate": 1.9238265785479437e-06, + "loss": 0.8516, + "step": 17709 + }, + { + "epoch": 0.45, + "learning_rate": 1.923815985633248e-06, + "loss": 0.8984, + "step": 17710 + }, + { + "epoch": 0.45, + "learning_rate": 1.923805392011229e-06, + "loss": 0.9336, + "step": 17711 + }, + { + "epoch": 0.45, + "learning_rate": 1.9237947976818947e-06, + "loss": 0.7393, + "step": 17712 + }, + { + "epoch": 0.45, + "learning_rate": 1.923784202645253e-06, + "loss": 0.9932, + "step": 17713 + }, + { + "epoch": 0.45, + "learning_rate": 1.9237736069013124e-06, + "loss": 0.9336, + "step": 17714 + }, + { + "epoch": 0.45, + "learning_rate": 1.9237630104500807e-06, + "loss": 1.0449, + "step": 17715 + }, + { + "epoch": 0.45, + "learning_rate": 1.9237524132915663e-06, + "loss": 0.8394, + "step": 17716 + }, + { + "epoch": 0.45, + "learning_rate": 1.923741815425777e-06, + "loss": 0.8613, + "step": 17717 + }, + { + "epoch": 0.45, + "learning_rate": 1.9237312168527212e-06, + "loss": 0.686, + "step": 17718 + }, + { + "epoch": 0.45, + "learning_rate": 1.9237206175724067e-06, + "loss": 0.8964, + "step": 17719 + }, + { + "epoch": 0.45, + "learning_rate": 1.9237100175848416e-06, + "loss": 0.958, + "step": 17720 + }, + { + "epoch": 0.45, + "learning_rate": 1.9236994168900346e-06, + "loss": 0.9727, + "step": 17721 + }, + { + "epoch": 0.45, + "learning_rate": 1.923688815487993e-06, + "loss": 0.8696, + "step": 17722 + }, + { + "epoch": 0.45, + "learning_rate": 1.923678213378726e-06, + "loss": 0.5708, + "step": 17723 + }, + { + "epoch": 0.45, + "learning_rate": 1.923667610562241e-06, + "loss": 0.9463, + "step": 17724 + }, + { + "epoch": 0.45, + "learning_rate": 1.923657007038546e-06, + "loss": 0.7698, + "step": 17725 + }, + { + "epoch": 0.45, + "learning_rate": 1.923646402807649e-06, + "loss": 0.9131, + "step": 17726 + }, + { + "epoch": 0.45, + "learning_rate": 1.9236357978695588e-06, + "loss": 0.9199, + "step": 17727 + }, + { + "epoch": 0.45, + "learning_rate": 1.923625192224283e-06, + "loss": 0.79, + "step": 17728 + }, + { + "epoch": 0.45, + "learning_rate": 1.92361458587183e-06, + "loss": 0.9302, + "step": 17729 + }, + { + "epoch": 0.45, + "learning_rate": 1.9236039788122075e-06, + "loss": 1.0088, + "step": 17730 + }, + { + "epoch": 0.45, + "learning_rate": 1.923593371045424e-06, + "loss": 0.8535, + "step": 17731 + }, + { + "epoch": 0.45, + "learning_rate": 1.9235827625714872e-06, + "loss": 0.7158, + "step": 17732 + }, + { + "epoch": 0.45, + "learning_rate": 1.923572153390406e-06, + "loss": 0.7861, + "step": 17733 + }, + { + "epoch": 0.45, + "learning_rate": 1.923561543502188e-06, + "loss": 0.8545, + "step": 17734 + }, + { + "epoch": 0.45, + "learning_rate": 1.9235509329068415e-06, + "loss": 0.9131, + "step": 17735 + }, + { + "epoch": 0.45, + "learning_rate": 1.9235403216043744e-06, + "loss": 0.7969, + "step": 17736 + }, + { + "epoch": 0.45, + "learning_rate": 1.923529709594795e-06, + "loss": 0.8691, + "step": 17737 + }, + { + "epoch": 0.45, + "learning_rate": 1.923519096878111e-06, + "loss": 0.8916, + "step": 17738 + }, + { + "epoch": 0.45, + "learning_rate": 1.9235084834543314e-06, + "loss": 0.6855, + "step": 17739 + }, + { + "epoch": 0.45, + "learning_rate": 1.9234978693234638e-06, + "loss": 0.9248, + "step": 17740 + }, + { + "epoch": 0.45, + "learning_rate": 1.923487254485516e-06, + "loss": 0.7871, + "step": 17741 + }, + { + "epoch": 0.45, + "learning_rate": 1.9234766389404963e-06, + "loss": 0.9727, + "step": 17742 + }, + { + "epoch": 0.45, + "learning_rate": 1.923466022688414e-06, + "loss": 0.8643, + "step": 17743 + }, + { + "epoch": 0.45, + "learning_rate": 1.9234554057292753e-06, + "loss": 0.8252, + "step": 17744 + }, + { + "epoch": 0.45, + "learning_rate": 1.9234447880630895e-06, + "loss": 0.875, + "step": 17745 + }, + { + "epoch": 0.45, + "learning_rate": 1.923434169689864e-06, + "loss": 0.9639, + "step": 17746 + }, + { + "epoch": 0.45, + "learning_rate": 1.923423550609608e-06, + "loss": 0.7656, + "step": 17747 + }, + { + "epoch": 0.45, + "learning_rate": 1.9234129308223294e-06, + "loss": 0.8018, + "step": 17748 + }, + { + "epoch": 0.45, + "learning_rate": 1.9234023103280353e-06, + "loss": 0.9385, + "step": 17749 + }, + { + "epoch": 0.45, + "learning_rate": 1.9233916891267347e-06, + "loss": 0.8174, + "step": 17750 + }, + { + "epoch": 0.45, + "learning_rate": 1.9233810672184355e-06, + "loss": 0.7285, + "step": 17751 + }, + { + "epoch": 0.45, + "learning_rate": 1.923370444603146e-06, + "loss": 1.0752, + "step": 17752 + }, + { + "epoch": 0.46, + "learning_rate": 1.9233598212808743e-06, + "loss": 0.5693, + "step": 17753 + }, + { + "epoch": 0.46, + "learning_rate": 1.9233491972516284e-06, + "loss": 0.8916, + "step": 17754 + }, + { + "epoch": 0.46, + "learning_rate": 1.923338572515416e-06, + "loss": 0.918, + "step": 17755 + }, + { + "epoch": 0.46, + "learning_rate": 1.9233279470722465e-06, + "loss": 0.8652, + "step": 17756 + }, + { + "epoch": 0.46, + "learning_rate": 1.9233173209221267e-06, + "loss": 0.8584, + "step": 17757 + }, + { + "epoch": 0.46, + "learning_rate": 1.9233066940650655e-06, + "loss": 0.8496, + "step": 17758 + }, + { + "epoch": 0.46, + "learning_rate": 1.9232960665010706e-06, + "loss": 0.9912, + "step": 17759 + }, + { + "epoch": 0.46, + "learning_rate": 1.9232854382301505e-06, + "loss": 0.9668, + "step": 17760 + }, + { + "epoch": 0.46, + "learning_rate": 1.923274809252313e-06, + "loss": 0.9854, + "step": 17761 + }, + { + "epoch": 0.46, + "learning_rate": 1.9232641795675668e-06, + "loss": 0.7837, + "step": 17762 + }, + { + "epoch": 0.46, + "learning_rate": 1.9232535491759197e-06, + "loss": 0.9136, + "step": 17763 + }, + { + "epoch": 0.46, + "learning_rate": 1.9232429180773795e-06, + "loss": 0.8203, + "step": 17764 + }, + { + "epoch": 0.46, + "learning_rate": 1.9232322862719544e-06, + "loss": 0.9092, + "step": 17765 + }, + { + "epoch": 0.46, + "learning_rate": 1.9232216537596536e-06, + "loss": 0.9248, + "step": 17766 + }, + { + "epoch": 0.46, + "learning_rate": 1.9232110205404835e-06, + "loss": 0.8037, + "step": 17767 + }, + { + "epoch": 0.46, + "learning_rate": 1.923200386614454e-06, + "loss": 0.7695, + "step": 17768 + }, + { + "epoch": 0.46, + "learning_rate": 1.923189751981572e-06, + "loss": 1.0049, + "step": 17769 + }, + { + "epoch": 0.46, + "learning_rate": 1.923179116641846e-06, + "loss": 0.7212, + "step": 17770 + }, + { + "epoch": 0.46, + "learning_rate": 1.9231684805952842e-06, + "loss": 0.9292, + "step": 17771 + }, + { + "epoch": 0.46, + "learning_rate": 1.923157843841895e-06, + "loss": 0.9312, + "step": 17772 + }, + { + "epoch": 0.46, + "learning_rate": 1.9231472063816864e-06, + "loss": 1.0293, + "step": 17773 + }, + { + "epoch": 0.46, + "learning_rate": 1.923136568214666e-06, + "loss": 0.7754, + "step": 17774 + }, + { + "epoch": 0.46, + "learning_rate": 1.9231259293408425e-06, + "loss": 1.0098, + "step": 17775 + }, + { + "epoch": 0.46, + "learning_rate": 1.923115289760224e-06, + "loss": 0.9482, + "step": 17776 + }, + { + "epoch": 0.46, + "learning_rate": 1.9231046494728185e-06, + "loss": 1.0264, + "step": 17777 + }, + { + "epoch": 0.46, + "learning_rate": 1.9230940084786343e-06, + "loss": 1.0088, + "step": 17778 + }, + { + "epoch": 0.46, + "learning_rate": 1.9230833667776794e-06, + "loss": 0.8027, + "step": 17779 + }, + { + "epoch": 0.46, + "learning_rate": 1.923072724369962e-06, + "loss": 0.7998, + "step": 17780 + }, + { + "epoch": 0.46, + "learning_rate": 1.9230620812554904e-06, + "loss": 0.668, + "step": 17781 + }, + { + "epoch": 0.46, + "learning_rate": 1.9230514374342727e-06, + "loss": 0.9355, + "step": 17782 + }, + { + "epoch": 0.46, + "learning_rate": 1.923040792906317e-06, + "loss": 0.9297, + "step": 17783 + }, + { + "epoch": 0.46, + "learning_rate": 1.923030147671631e-06, + "loss": 0.9062, + "step": 17784 + }, + { + "epoch": 0.46, + "learning_rate": 1.9230195017302233e-06, + "loss": 0.8389, + "step": 17785 + }, + { + "epoch": 0.46, + "learning_rate": 1.923008855082102e-06, + "loss": 0.9326, + "step": 17786 + }, + { + "epoch": 0.46, + "learning_rate": 1.9229982077272756e-06, + "loss": 0.9727, + "step": 17787 + }, + { + "epoch": 0.46, + "learning_rate": 1.9229875596657513e-06, + "loss": 0.8242, + "step": 17788 + }, + { + "epoch": 0.46, + "learning_rate": 1.9229769108975385e-06, + "loss": 0.917, + "step": 17789 + }, + { + "epoch": 0.46, + "learning_rate": 1.9229662614226444e-06, + "loss": 0.8613, + "step": 17790 + }, + { + "epoch": 0.46, + "learning_rate": 1.9229556112410775e-06, + "loss": 0.999, + "step": 17791 + }, + { + "epoch": 0.46, + "learning_rate": 1.9229449603528463e-06, + "loss": 0.8711, + "step": 17792 + }, + { + "epoch": 0.46, + "learning_rate": 1.9229343087579583e-06, + "loss": 0.8276, + "step": 17793 + }, + { + "epoch": 0.46, + "learning_rate": 1.9229236564564217e-06, + "loss": 0.6455, + "step": 17794 + }, + { + "epoch": 0.46, + "learning_rate": 1.9229130034482453e-06, + "loss": 0.5942, + "step": 17795 + }, + { + "epoch": 0.46, + "learning_rate": 1.9229023497334363e-06, + "loss": 0.9453, + "step": 17796 + }, + { + "epoch": 0.46, + "learning_rate": 1.922891695312004e-06, + "loss": 0.9189, + "step": 17797 + }, + { + "epoch": 0.46, + "learning_rate": 1.9228810401839557e-06, + "loss": 0.9258, + "step": 17798 + }, + { + "epoch": 0.46, + "learning_rate": 1.9228703843493e-06, + "loss": 0.7012, + "step": 17799 + }, + { + "epoch": 0.46, + "learning_rate": 1.922859727808045e-06, + "loss": 1.1055, + "step": 17800 + }, + { + "epoch": 0.46, + "learning_rate": 1.922849070560198e-06, + "loss": 0.8975, + "step": 17801 + }, + { + "epoch": 0.46, + "learning_rate": 1.9228384126057684e-06, + "loss": 0.813, + "step": 17802 + }, + { + "epoch": 0.46, + "learning_rate": 1.922827753944764e-06, + "loss": 0.7598, + "step": 17803 + }, + { + "epoch": 0.46, + "learning_rate": 1.9228170945771924e-06, + "loss": 1.0078, + "step": 17804 + }, + { + "epoch": 0.46, + "learning_rate": 1.9228064345030625e-06, + "loss": 1.0459, + "step": 17805 + }, + { + "epoch": 0.46, + "learning_rate": 1.922795773722382e-06, + "loss": 0.6577, + "step": 17806 + }, + { + "epoch": 0.46, + "learning_rate": 1.9227851122351595e-06, + "loss": 1.0068, + "step": 17807 + }, + { + "epoch": 0.46, + "learning_rate": 1.922774450041403e-06, + "loss": 0.7637, + "step": 17808 + }, + { + "epoch": 0.46, + "learning_rate": 1.92276378714112e-06, + "loss": 0.9229, + "step": 17809 + }, + { + "epoch": 0.46, + "learning_rate": 1.9227531235343193e-06, + "loss": 0.7461, + "step": 17810 + }, + { + "epoch": 0.46, + "learning_rate": 1.922742459221009e-06, + "loss": 0.9609, + "step": 17811 + }, + { + "epoch": 0.46, + "learning_rate": 1.922731794201197e-06, + "loss": 1.0889, + "step": 17812 + }, + { + "epoch": 0.46, + "learning_rate": 1.9227211284748922e-06, + "loss": 0.6934, + "step": 17813 + }, + { + "epoch": 0.46, + "learning_rate": 1.922710462042102e-06, + "loss": 0.9971, + "step": 17814 + }, + { + "epoch": 0.46, + "learning_rate": 1.9226997949028348e-06, + "loss": 0.7412, + "step": 17815 + }, + { + "epoch": 0.46, + "learning_rate": 1.922689127057099e-06, + "loss": 0.5884, + "step": 17816 + }, + { + "epoch": 0.46, + "learning_rate": 1.922678458504902e-06, + "loss": 1.1123, + "step": 17817 + }, + { + "epoch": 0.46, + "learning_rate": 1.9226677892462534e-06, + "loss": 0.7178, + "step": 17818 + }, + { + "epoch": 0.46, + "learning_rate": 1.92265711928116e-06, + "loss": 0.8604, + "step": 17819 + }, + { + "epoch": 0.46, + "learning_rate": 1.9226464486096307e-06, + "loss": 0.6394, + "step": 17820 + }, + { + "epoch": 0.46, + "learning_rate": 1.922635777231673e-06, + "loss": 0.9512, + "step": 17821 + }, + { + "epoch": 0.46, + "learning_rate": 1.9226251051472956e-06, + "loss": 1.1592, + "step": 17822 + }, + { + "epoch": 0.46, + "learning_rate": 1.922614432356507e-06, + "loss": 0.9663, + "step": 17823 + }, + { + "epoch": 0.46, + "learning_rate": 1.922603758859315e-06, + "loss": 1.0156, + "step": 17824 + }, + { + "epoch": 0.46, + "learning_rate": 1.922593084655727e-06, + "loss": 0.6768, + "step": 17825 + }, + { + "epoch": 0.46, + "learning_rate": 1.9225824097457524e-06, + "loss": 0.8057, + "step": 17826 + }, + { + "epoch": 0.46, + "learning_rate": 1.922571734129399e-06, + "loss": 0.8633, + "step": 17827 + }, + { + "epoch": 0.46, + "learning_rate": 1.9225610578066745e-06, + "loss": 1.041, + "step": 17828 + }, + { + "epoch": 0.46, + "learning_rate": 1.9225503807775873e-06, + "loss": 0.7227, + "step": 17829 + }, + { + "epoch": 0.46, + "learning_rate": 1.922539703042146e-06, + "loss": 1.0713, + "step": 17830 + }, + { + "epoch": 0.46, + "learning_rate": 1.9225290246003584e-06, + "loss": 0.9883, + "step": 17831 + }, + { + "epoch": 0.46, + "learning_rate": 1.9225183454522328e-06, + "loss": 0.9287, + "step": 17832 + }, + { + "epoch": 0.46, + "learning_rate": 1.9225076655977774e-06, + "loss": 0.917, + "step": 17833 + }, + { + "epoch": 0.46, + "learning_rate": 1.9224969850370003e-06, + "loss": 0.8418, + "step": 17834 + }, + { + "epoch": 0.46, + "learning_rate": 1.922486303769909e-06, + "loss": 0.8623, + "step": 17835 + }, + { + "epoch": 0.46, + "learning_rate": 1.922475621796513e-06, + "loss": 0.9395, + "step": 17836 + }, + { + "epoch": 0.46, + "learning_rate": 1.92246493911682e-06, + "loss": 0.7476, + "step": 17837 + }, + { + "epoch": 0.46, + "learning_rate": 1.922454255730838e-06, + "loss": 0.7148, + "step": 17838 + }, + { + "epoch": 0.46, + "learning_rate": 1.9224435716385745e-06, + "loss": 0.9131, + "step": 17839 + }, + { + "epoch": 0.46, + "learning_rate": 1.922432886840039e-06, + "loss": 0.8428, + "step": 17840 + }, + { + "epoch": 0.46, + "learning_rate": 1.922422201335239e-06, + "loss": 0.8682, + "step": 17841 + }, + { + "epoch": 0.46, + "learning_rate": 1.9224115151241826e-06, + "loss": 0.9141, + "step": 17842 + }, + { + "epoch": 0.46, + "learning_rate": 1.922400828206878e-06, + "loss": 0.7334, + "step": 17843 + }, + { + "epoch": 0.46, + "learning_rate": 1.9223901405833336e-06, + "loss": 0.5674, + "step": 17844 + }, + { + "epoch": 0.46, + "learning_rate": 1.9223794522535576e-06, + "loss": 0.8926, + "step": 17845 + }, + { + "epoch": 0.46, + "learning_rate": 1.922368763217558e-06, + "loss": 0.8359, + "step": 17846 + }, + { + "epoch": 0.46, + "learning_rate": 1.922358073475343e-06, + "loss": 0.804, + "step": 17847 + }, + { + "epoch": 0.46, + "learning_rate": 1.9223473830269207e-06, + "loss": 0.8457, + "step": 17848 + }, + { + "epoch": 0.46, + "learning_rate": 1.9223366918722995e-06, + "loss": 0.894, + "step": 17849 + }, + { + "epoch": 0.46, + "learning_rate": 1.922326000011488e-06, + "loss": 0.4868, + "step": 17850 + }, + { + "epoch": 0.46, + "learning_rate": 1.922315307444493e-06, + "loss": 0.9277, + "step": 17851 + }, + { + "epoch": 0.46, + "learning_rate": 1.9223046141713245e-06, + "loss": 0.8381, + "step": 17852 + }, + { + "epoch": 0.46, + "learning_rate": 1.922293920191989e-06, + "loss": 0.8291, + "step": 17853 + }, + { + "epoch": 0.46, + "learning_rate": 1.922283225506496e-06, + "loss": 0.7998, + "step": 17854 + }, + { + "epoch": 0.46, + "learning_rate": 1.922272530114853e-06, + "loss": 0.4839, + "step": 17855 + }, + { + "epoch": 0.46, + "learning_rate": 1.922261834017068e-06, + "loss": 0.6177, + "step": 17856 + }, + { + "epoch": 0.46, + "learning_rate": 1.92225113721315e-06, + "loss": 0.8164, + "step": 17857 + }, + { + "epoch": 0.46, + "learning_rate": 1.922240439703106e-06, + "loss": 0.9302, + "step": 17858 + }, + { + "epoch": 0.46, + "learning_rate": 1.922229741486946e-06, + "loss": 0.9531, + "step": 17859 + }, + { + "epoch": 0.46, + "learning_rate": 1.922219042564676e-06, + "loss": 0.8076, + "step": 17860 + }, + { + "epoch": 0.46, + "learning_rate": 1.922208342936306e-06, + "loss": 0.7603, + "step": 17861 + }, + { + "epoch": 0.46, + "learning_rate": 1.922197642601843e-06, + "loss": 0.7583, + "step": 17862 + }, + { + "epoch": 0.46, + "learning_rate": 1.922186941561296e-06, + "loss": 0.9961, + "step": 17863 + }, + { + "epoch": 0.46, + "learning_rate": 1.9221762398146728e-06, + "loss": 0.6353, + "step": 17864 + }, + { + "epoch": 0.46, + "learning_rate": 1.9221655373619815e-06, + "loss": 0.7529, + "step": 17865 + }, + { + "epoch": 0.46, + "learning_rate": 1.9221548342032306e-06, + "loss": 0.874, + "step": 17866 + }, + { + "epoch": 0.46, + "learning_rate": 1.922144130338428e-06, + "loss": 1.0264, + "step": 17867 + }, + { + "epoch": 0.46, + "learning_rate": 1.922133425767582e-06, + "loss": 0.873, + "step": 17868 + }, + { + "epoch": 0.46, + "learning_rate": 1.922122720490701e-06, + "loss": 0.9092, + "step": 17869 + }, + { + "epoch": 0.46, + "learning_rate": 1.9221120145077932e-06, + "loss": 0.7852, + "step": 17870 + }, + { + "epoch": 0.46, + "learning_rate": 1.9221013078188665e-06, + "loss": 0.9854, + "step": 17871 + }, + { + "epoch": 0.46, + "learning_rate": 1.922090600423929e-06, + "loss": 0.9375, + "step": 17872 + }, + { + "epoch": 0.46, + "learning_rate": 1.9220798923229894e-06, + "loss": 0.6914, + "step": 17873 + }, + { + "epoch": 0.46, + "learning_rate": 1.9220691835160556e-06, + "loss": 0.7988, + "step": 17874 + }, + { + "epoch": 0.46, + "learning_rate": 1.9220584740031354e-06, + "loss": 0.8716, + "step": 17875 + }, + { + "epoch": 0.46, + "learning_rate": 1.922047763784238e-06, + "loss": 0.6807, + "step": 17876 + }, + { + "epoch": 0.46, + "learning_rate": 1.922037052859371e-06, + "loss": 0.8428, + "step": 17877 + }, + { + "epoch": 0.46, + "learning_rate": 1.9220263412285423e-06, + "loss": 0.8789, + "step": 17878 + }, + { + "epoch": 0.46, + "learning_rate": 1.9220156288917604e-06, + "loss": 0.5867, + "step": 17879 + }, + { + "epoch": 0.46, + "learning_rate": 1.9220049158490338e-06, + "loss": 1.2812, + "step": 17880 + }, + { + "epoch": 0.46, + "learning_rate": 1.9219942021003704e-06, + "loss": 0.7129, + "step": 17881 + }, + { + "epoch": 0.46, + "learning_rate": 1.9219834876457782e-06, + "loss": 0.835, + "step": 17882 + }, + { + "epoch": 0.46, + "learning_rate": 1.9219727724852655e-06, + "loss": 0.8784, + "step": 17883 + }, + { + "epoch": 0.46, + "learning_rate": 1.9219620566188414e-06, + "loss": 0.9946, + "step": 17884 + }, + { + "epoch": 0.46, + "learning_rate": 1.9219513400465128e-06, + "loss": 0.832, + "step": 17885 + }, + { + "epoch": 0.46, + "learning_rate": 1.9219406227682885e-06, + "loss": 0.8672, + "step": 17886 + }, + { + "epoch": 0.46, + "learning_rate": 1.9219299047841766e-06, + "loss": 1.0283, + "step": 17887 + }, + { + "epoch": 0.46, + "learning_rate": 1.9219191860941855e-06, + "loss": 1.0391, + "step": 17888 + }, + { + "epoch": 0.46, + "learning_rate": 1.9219084666983234e-06, + "loss": 0.7241, + "step": 17889 + }, + { + "epoch": 0.46, + "learning_rate": 1.9218977465965978e-06, + "loss": 0.6748, + "step": 17890 + }, + { + "epoch": 0.46, + "learning_rate": 1.921887025789018e-06, + "loss": 0.8057, + "step": 17891 + }, + { + "epoch": 0.46, + "learning_rate": 1.9218763042755913e-06, + "loss": 0.8784, + "step": 17892 + }, + { + "epoch": 0.46, + "learning_rate": 1.921865582056327e-06, + "loss": 0.9736, + "step": 17893 + }, + { + "epoch": 0.46, + "learning_rate": 1.921854859131232e-06, + "loss": 0.7461, + "step": 17894 + }, + { + "epoch": 0.46, + "learning_rate": 1.9218441355003153e-06, + "loss": 0.9473, + "step": 17895 + }, + { + "epoch": 0.46, + "learning_rate": 1.9218334111635847e-06, + "loss": 0.8496, + "step": 17896 + }, + { + "epoch": 0.46, + "learning_rate": 1.921822686121049e-06, + "loss": 0.7612, + "step": 17897 + }, + { + "epoch": 0.46, + "learning_rate": 1.9218119603727162e-06, + "loss": 1.0234, + "step": 17898 + }, + { + "epoch": 0.46, + "learning_rate": 1.921801233918594e-06, + "loss": 0.7891, + "step": 17899 + }, + { + "epoch": 0.46, + "learning_rate": 1.921790506758691e-06, + "loss": 0.7344, + "step": 17900 + }, + { + "epoch": 0.46, + "learning_rate": 1.9217797788930155e-06, + "loss": 0.8232, + "step": 17901 + }, + { + "epoch": 0.46, + "learning_rate": 1.9217690503215753e-06, + "loss": 0.8193, + "step": 17902 + }, + { + "epoch": 0.46, + "learning_rate": 1.9217583210443793e-06, + "loss": 0.9199, + "step": 17903 + }, + { + "epoch": 0.46, + "learning_rate": 1.9217475910614354e-06, + "loss": 0.9092, + "step": 17904 + }, + { + "epoch": 0.46, + "learning_rate": 1.9217368603727517e-06, + "loss": 0.7812, + "step": 17905 + }, + { + "epoch": 0.46, + "learning_rate": 1.9217261289783363e-06, + "loss": 0.9688, + "step": 17906 + }, + { + "epoch": 0.46, + "learning_rate": 1.9217153968781975e-06, + "loss": 1.0146, + "step": 17907 + }, + { + "epoch": 0.46, + "learning_rate": 1.921704664072344e-06, + "loss": 0.9336, + "step": 17908 + }, + { + "epoch": 0.46, + "learning_rate": 1.921693930560783e-06, + "loss": 0.9316, + "step": 17909 + }, + { + "epoch": 0.46, + "learning_rate": 1.921683196343524e-06, + "loss": 0.6094, + "step": 17910 + }, + { + "epoch": 0.46, + "learning_rate": 1.921672461420574e-06, + "loss": 0.6768, + "step": 17911 + }, + { + "epoch": 0.46, + "learning_rate": 1.9216617257919425e-06, + "loss": 1.0186, + "step": 17912 + }, + { + "epoch": 0.46, + "learning_rate": 1.9216509894576364e-06, + "loss": 0.7778, + "step": 17913 + }, + { + "epoch": 0.46, + "learning_rate": 1.9216402524176646e-06, + "loss": 0.9268, + "step": 17914 + }, + { + "epoch": 0.46, + "learning_rate": 1.9216295146720356e-06, + "loss": 0.7803, + "step": 17915 + }, + { + "epoch": 0.46, + "learning_rate": 1.9216187762207566e-06, + "loss": 0.7578, + "step": 17916 + }, + { + "epoch": 0.46, + "learning_rate": 1.921608037063837e-06, + "loss": 0.8315, + "step": 17917 + }, + { + "epoch": 0.46, + "learning_rate": 1.921597297201284e-06, + "loss": 0.9023, + "step": 17918 + }, + { + "epoch": 0.46, + "learning_rate": 1.921586556633107e-06, + "loss": 0.8799, + "step": 17919 + }, + { + "epoch": 0.46, + "learning_rate": 1.921575815359313e-06, + "loss": 0.9307, + "step": 17920 + }, + { + "epoch": 0.46, + "learning_rate": 1.921565073379911e-06, + "loss": 0.7178, + "step": 17921 + }, + { + "epoch": 0.46, + "learning_rate": 1.9215543306949093e-06, + "loss": 0.7329, + "step": 17922 + }, + { + "epoch": 0.46, + "learning_rate": 1.921543587304315e-06, + "loss": 0.9219, + "step": 17923 + }, + { + "epoch": 0.46, + "learning_rate": 1.921532843208138e-06, + "loss": 0.7529, + "step": 17924 + }, + { + "epoch": 0.46, + "learning_rate": 1.9215220984063853e-06, + "loss": 1.1182, + "step": 17925 + }, + { + "epoch": 0.46, + "learning_rate": 1.9215113528990656e-06, + "loss": 1.0303, + "step": 17926 + }, + { + "epoch": 0.46, + "learning_rate": 1.921500606686187e-06, + "loss": 0.9229, + "step": 17927 + }, + { + "epoch": 0.46, + "learning_rate": 1.9214898597677578e-06, + "loss": 1.0068, + "step": 17928 + }, + { + "epoch": 0.46, + "learning_rate": 1.9214791121437857e-06, + "loss": 1.1543, + "step": 17929 + }, + { + "epoch": 0.46, + "learning_rate": 1.9214683638142797e-06, + "loss": 0.7188, + "step": 17930 + }, + { + "epoch": 0.46, + "learning_rate": 1.921457614779248e-06, + "loss": 0.9385, + "step": 17931 + }, + { + "epoch": 0.46, + "learning_rate": 1.9214468650386984e-06, + "loss": 0.7773, + "step": 17932 + }, + { + "epoch": 0.46, + "learning_rate": 1.9214361145926396e-06, + "loss": 0.8721, + "step": 17933 + }, + { + "epoch": 0.46, + "learning_rate": 1.921425363441079e-06, + "loss": 1.0264, + "step": 17934 + }, + { + "epoch": 0.46, + "learning_rate": 1.921414611584026e-06, + "loss": 0.9775, + "step": 17935 + }, + { + "epoch": 0.46, + "learning_rate": 1.9214038590214876e-06, + "loss": 0.8486, + "step": 17936 + }, + { + "epoch": 0.46, + "learning_rate": 1.921393105753473e-06, + "loss": 0.96, + "step": 17937 + }, + { + "epoch": 0.46, + "learning_rate": 1.92138235177999e-06, + "loss": 1.0889, + "step": 17938 + }, + { + "epoch": 0.46, + "learning_rate": 1.9213715971010465e-06, + "loss": 0.896, + "step": 17939 + }, + { + "epoch": 0.46, + "learning_rate": 1.9213608417166518e-06, + "loss": 0.9111, + "step": 17940 + }, + { + "epoch": 0.46, + "learning_rate": 1.921350085626813e-06, + "loss": 0.8076, + "step": 17941 + }, + { + "epoch": 0.46, + "learning_rate": 1.921339328831539e-06, + "loss": 0.6953, + "step": 17942 + }, + { + "epoch": 0.46, + "learning_rate": 1.9213285713308376e-06, + "loss": 0.9531, + "step": 17943 + }, + { + "epoch": 0.46, + "learning_rate": 1.921317813124718e-06, + "loss": 0.7686, + "step": 17944 + }, + { + "epoch": 0.46, + "learning_rate": 1.921307054213187e-06, + "loss": 0.8135, + "step": 17945 + }, + { + "epoch": 0.46, + "learning_rate": 1.921296294596253e-06, + "loss": 1.0635, + "step": 17946 + }, + { + "epoch": 0.46, + "learning_rate": 1.921285534273926e-06, + "loss": 0.707, + "step": 17947 + }, + { + "epoch": 0.46, + "learning_rate": 1.9212747732462126e-06, + "loss": 0.7666, + "step": 17948 + }, + { + "epoch": 0.46, + "learning_rate": 1.9212640115131213e-06, + "loss": 0.8721, + "step": 17949 + }, + { + "epoch": 0.46, + "learning_rate": 1.9212532490746607e-06, + "loss": 0.8267, + "step": 17950 + }, + { + "epoch": 0.46, + "learning_rate": 1.9212424859308386e-06, + "loss": 0.9121, + "step": 17951 + }, + { + "epoch": 0.46, + "learning_rate": 1.9212317220816637e-06, + "loss": 0.7871, + "step": 17952 + }, + { + "epoch": 0.46, + "learning_rate": 1.921220957527144e-06, + "loss": 0.7812, + "step": 17953 + }, + { + "epoch": 0.46, + "learning_rate": 1.921210192267288e-06, + "loss": 1.0391, + "step": 17954 + }, + { + "epoch": 0.46, + "learning_rate": 1.9211994263021034e-06, + "loss": 1.0596, + "step": 17955 + }, + { + "epoch": 0.46, + "learning_rate": 1.9211886596315986e-06, + "loss": 0.9922, + "step": 17956 + }, + { + "epoch": 0.46, + "learning_rate": 1.9211778922557825e-06, + "loss": 1.1035, + "step": 17957 + }, + { + "epoch": 0.46, + "learning_rate": 1.9211671241746625e-06, + "loss": 0.9482, + "step": 17958 + }, + { + "epoch": 0.46, + "learning_rate": 1.921156355388247e-06, + "loss": 0.7764, + "step": 17959 + }, + { + "epoch": 0.46, + "learning_rate": 1.921145585896545e-06, + "loss": 0.9512, + "step": 17960 + }, + { + "epoch": 0.46, + "learning_rate": 1.9211348156995636e-06, + "loss": 0.8555, + "step": 17961 + }, + { + "epoch": 0.46, + "learning_rate": 1.921124044797312e-06, + "loss": 0.917, + "step": 17962 + }, + { + "epoch": 0.46, + "learning_rate": 1.921113273189798e-06, + "loss": 1.0039, + "step": 17963 + }, + { + "epoch": 0.46, + "learning_rate": 1.9211025008770296e-06, + "loss": 0.9365, + "step": 17964 + }, + { + "epoch": 0.46, + "learning_rate": 1.921091727859016e-06, + "loss": 1.04, + "step": 17965 + }, + { + "epoch": 0.46, + "learning_rate": 1.9210809541357644e-06, + "loss": 0.6895, + "step": 17966 + }, + { + "epoch": 0.46, + "learning_rate": 1.9210701797072836e-06, + "loss": 0.9336, + "step": 17967 + }, + { + "epoch": 0.46, + "learning_rate": 1.9210594045735817e-06, + "loss": 0.9414, + "step": 17968 + }, + { + "epoch": 0.46, + "learning_rate": 1.921048628734667e-06, + "loss": 0.6982, + "step": 17969 + }, + { + "epoch": 0.46, + "learning_rate": 1.9210378521905477e-06, + "loss": 0.8975, + "step": 17970 + }, + { + "epoch": 0.46, + "learning_rate": 1.921027074941232e-06, + "loss": 0.9062, + "step": 17971 + }, + { + "epoch": 0.46, + "learning_rate": 1.9210162969867283e-06, + "loss": 0.9941, + "step": 17972 + }, + { + "epoch": 0.46, + "learning_rate": 1.9210055183270447e-06, + "loss": 0.8828, + "step": 17973 + }, + { + "epoch": 0.46, + "learning_rate": 1.9209947389621893e-06, + "loss": 0.9824, + "step": 17974 + }, + { + "epoch": 0.46, + "learning_rate": 1.920983958892171e-06, + "loss": 1.0752, + "step": 17975 + }, + { + "epoch": 0.46, + "learning_rate": 1.9209731781169975e-06, + "loss": 0.9727, + "step": 17976 + }, + { + "epoch": 0.46, + "learning_rate": 1.920962396636677e-06, + "loss": 0.9805, + "step": 17977 + }, + { + "epoch": 0.46, + "learning_rate": 1.9209516144512178e-06, + "loss": 0.918, + "step": 17978 + }, + { + "epoch": 0.46, + "learning_rate": 1.9209408315606288e-06, + "loss": 1.0508, + "step": 17979 + }, + { + "epoch": 0.46, + "learning_rate": 1.9209300479649174e-06, + "loss": 0.9424, + "step": 17980 + }, + { + "epoch": 0.46, + "learning_rate": 1.9209192636640923e-06, + "loss": 0.8354, + "step": 17981 + }, + { + "epoch": 0.46, + "learning_rate": 1.9209084786581617e-06, + "loss": 1.168, + "step": 17982 + }, + { + "epoch": 0.46, + "learning_rate": 1.920897692947134e-06, + "loss": 0.9453, + "step": 17983 + }, + { + "epoch": 0.46, + "learning_rate": 1.920886906531017e-06, + "loss": 0.9307, + "step": 17984 + }, + { + "epoch": 0.46, + "learning_rate": 1.9208761194098195e-06, + "loss": 0.9746, + "step": 17985 + }, + { + "epoch": 0.46, + "learning_rate": 1.920865331583549e-06, + "loss": 0.9443, + "step": 17986 + }, + { + "epoch": 0.46, + "learning_rate": 1.9208545430522146e-06, + "loss": 0.8438, + "step": 17987 + }, + { + "epoch": 0.46, + "learning_rate": 1.9208437538158245e-06, + "loss": 0.6436, + "step": 17988 + }, + { + "epoch": 0.46, + "learning_rate": 1.9208329638743863e-06, + "loss": 0.8501, + "step": 17989 + }, + { + "epoch": 0.46, + "learning_rate": 1.9208221732279088e-06, + "loss": 0.7871, + "step": 17990 + }, + { + "epoch": 0.46, + "learning_rate": 1.9208113818764e-06, + "loss": 0.7715, + "step": 17991 + }, + { + "epoch": 0.46, + "learning_rate": 1.920800589819868e-06, + "loss": 0.877, + "step": 17992 + }, + { + "epoch": 0.46, + "learning_rate": 1.9207897970583216e-06, + "loss": 0.6084, + "step": 17993 + }, + { + "epoch": 0.46, + "learning_rate": 1.9207790035917686e-06, + "loss": 0.9912, + "step": 17994 + }, + { + "epoch": 0.46, + "learning_rate": 1.920768209420218e-06, + "loss": 0.8799, + "step": 17995 + }, + { + "epoch": 0.46, + "learning_rate": 1.920757414543677e-06, + "loss": 1.0625, + "step": 17996 + }, + { + "epoch": 0.46, + "learning_rate": 1.9207466189621545e-06, + "loss": 0.918, + "step": 17997 + }, + { + "epoch": 0.46, + "learning_rate": 1.920735822675659e-06, + "loss": 0.8604, + "step": 17998 + }, + { + "epoch": 0.46, + "learning_rate": 1.920725025684198e-06, + "loss": 1.0801, + "step": 17999 + }, + { + "epoch": 0.46, + "learning_rate": 1.9207142279877803e-06, + "loss": 0.8091, + "step": 18000 + }, + { + "epoch": 0.46, + "learning_rate": 1.9207034295864138e-06, + "loss": 0.9189, + "step": 18001 + }, + { + "epoch": 0.46, + "learning_rate": 1.9206926304801074e-06, + "loss": 1.0498, + "step": 18002 + }, + { + "epoch": 0.46, + "learning_rate": 1.920681830668869e-06, + "loss": 0.957, + "step": 18003 + }, + { + "epoch": 0.46, + "learning_rate": 1.9206710301527067e-06, + "loss": 0.9541, + "step": 18004 + }, + { + "epoch": 0.46, + "learning_rate": 1.920660228931629e-06, + "loss": 0.957, + "step": 18005 + }, + { + "epoch": 0.46, + "learning_rate": 1.9206494270056443e-06, + "loss": 0.8755, + "step": 18006 + }, + { + "epoch": 0.46, + "learning_rate": 1.92063862437476e-06, + "loss": 0.8989, + "step": 18007 + }, + { + "epoch": 0.46, + "learning_rate": 1.920627821038986e-06, + "loss": 0.791, + "step": 18008 + }, + { + "epoch": 0.46, + "learning_rate": 1.9206170169983285e-06, + "loss": 0.8965, + "step": 18009 + }, + { + "epoch": 0.46, + "learning_rate": 1.920606212252798e-06, + "loss": 0.8052, + "step": 18010 + }, + { + "epoch": 0.46, + "learning_rate": 1.9205954068024006e-06, + "loss": 0.9561, + "step": 18011 + }, + { + "epoch": 0.46, + "learning_rate": 1.9205846006471466e-06, + "loss": 0.8145, + "step": 18012 + }, + { + "epoch": 0.46, + "learning_rate": 1.9205737937870427e-06, + "loss": 0.8086, + "step": 18013 + }, + { + "epoch": 0.46, + "learning_rate": 1.9205629862220976e-06, + "loss": 1.0625, + "step": 18014 + }, + { + "epoch": 0.46, + "learning_rate": 1.9205521779523203e-06, + "loss": 0.8167, + "step": 18015 + }, + { + "epoch": 0.46, + "learning_rate": 1.920541368977718e-06, + "loss": 0.9424, + "step": 18016 + }, + { + "epoch": 0.46, + "learning_rate": 1.9205305592982997e-06, + "loss": 0.8125, + "step": 18017 + }, + { + "epoch": 0.46, + "learning_rate": 1.920519748914074e-06, + "loss": 1.1064, + "step": 18018 + }, + { + "epoch": 0.46, + "learning_rate": 1.920508937825048e-06, + "loss": 1.0264, + "step": 18019 + }, + { + "epoch": 0.46, + "learning_rate": 1.920498126031231e-06, + "loss": 0.9482, + "step": 18020 + }, + { + "epoch": 0.46, + "learning_rate": 1.9204873135326305e-06, + "loss": 0.8828, + "step": 18021 + }, + { + "epoch": 0.46, + "learning_rate": 1.9204765003292556e-06, + "loss": 0.6924, + "step": 18022 + }, + { + "epoch": 0.46, + "learning_rate": 1.9204656864211138e-06, + "loss": 0.8149, + "step": 18023 + }, + { + "epoch": 0.46, + "learning_rate": 1.9204548718082142e-06, + "loss": 0.8389, + "step": 18024 + }, + { + "epoch": 0.46, + "learning_rate": 1.9204440564905642e-06, + "loss": 0.9204, + "step": 18025 + }, + { + "epoch": 0.46, + "learning_rate": 1.920433240468173e-06, + "loss": 0.8403, + "step": 18026 + }, + { + "epoch": 0.46, + "learning_rate": 1.920422423741048e-06, + "loss": 0.6968, + "step": 18027 + }, + { + "epoch": 0.46, + "learning_rate": 1.9204116063091978e-06, + "loss": 0.8701, + "step": 18028 + }, + { + "epoch": 0.46, + "learning_rate": 1.920400788172631e-06, + "loss": 0.7432, + "step": 18029 + }, + { + "epoch": 0.46, + "learning_rate": 1.9203899693313557e-06, + "loss": 0.7373, + "step": 18030 + }, + { + "epoch": 0.46, + "learning_rate": 1.9203791497853795e-06, + "loss": 0.8232, + "step": 18031 + }, + { + "epoch": 0.46, + "learning_rate": 1.920368329534712e-06, + "loss": 1.0059, + "step": 18032 + }, + { + "epoch": 0.46, + "learning_rate": 1.9203575085793607e-06, + "loss": 0.8667, + "step": 18033 + }, + { + "epoch": 0.46, + "learning_rate": 1.9203466869193338e-06, + "loss": 0.9941, + "step": 18034 + }, + { + "epoch": 0.46, + "learning_rate": 1.92033586455464e-06, + "loss": 0.8628, + "step": 18035 + }, + { + "epoch": 0.46, + "learning_rate": 1.920325041485287e-06, + "loss": 0.8604, + "step": 18036 + }, + { + "epoch": 0.46, + "learning_rate": 1.9203142177112835e-06, + "loss": 0.8555, + "step": 18037 + }, + { + "epoch": 0.46, + "learning_rate": 1.9203033932326376e-06, + "loss": 0.8936, + "step": 18038 + }, + { + "epoch": 0.46, + "learning_rate": 1.920292568049358e-06, + "loss": 1.0781, + "step": 18039 + }, + { + "epoch": 0.46, + "learning_rate": 1.9202817421614526e-06, + "loss": 0.6851, + "step": 18040 + }, + { + "epoch": 0.46, + "learning_rate": 1.9202709155689297e-06, + "loss": 0.9004, + "step": 18041 + }, + { + "epoch": 0.46, + "learning_rate": 1.920260088271798e-06, + "loss": 0.7998, + "step": 18042 + }, + { + "epoch": 0.46, + "learning_rate": 1.9202492602700653e-06, + "loss": 0.6418, + "step": 18043 + }, + { + "epoch": 0.46, + "learning_rate": 1.92023843156374e-06, + "loss": 1.0059, + "step": 18044 + }, + { + "epoch": 0.46, + "learning_rate": 1.9202276021528304e-06, + "loss": 0.9004, + "step": 18045 + }, + { + "epoch": 0.46, + "learning_rate": 1.920216772037345e-06, + "loss": 0.8545, + "step": 18046 + }, + { + "epoch": 0.46, + "learning_rate": 1.9202059412172916e-06, + "loss": 0.8008, + "step": 18047 + }, + { + "epoch": 0.46, + "learning_rate": 1.9201951096926788e-06, + "loss": 0.9258, + "step": 18048 + }, + { + "epoch": 0.46, + "learning_rate": 1.9201842774635154e-06, + "loss": 0.9922, + "step": 18049 + }, + { + "epoch": 0.46, + "learning_rate": 1.920173444529809e-06, + "loss": 0.9492, + "step": 18050 + }, + { + "epoch": 0.46, + "learning_rate": 1.9201626108915678e-06, + "loss": 0.8604, + "step": 18051 + }, + { + "epoch": 0.46, + "learning_rate": 1.920151776548801e-06, + "loss": 0.7856, + "step": 18052 + }, + { + "epoch": 0.46, + "learning_rate": 1.9201409415015157e-06, + "loss": 0.7314, + "step": 18053 + }, + { + "epoch": 0.46, + "learning_rate": 1.920130105749721e-06, + "loss": 1.1504, + "step": 18054 + }, + { + "epoch": 0.46, + "learning_rate": 1.9201192692934253e-06, + "loss": 0.9648, + "step": 18055 + }, + { + "epoch": 0.46, + "learning_rate": 1.920108432132636e-06, + "loss": 1.0, + "step": 18056 + }, + { + "epoch": 0.46, + "learning_rate": 1.9200975942673626e-06, + "loss": 1.0254, + "step": 18057 + }, + { + "epoch": 0.46, + "learning_rate": 1.9200867556976125e-06, + "loss": 0.7715, + "step": 18058 + }, + { + "epoch": 0.46, + "learning_rate": 1.920075916423394e-06, + "loss": 0.9912, + "step": 18059 + }, + { + "epoch": 0.46, + "learning_rate": 1.920065076444716e-06, + "loss": 0.8345, + "step": 18060 + }, + { + "epoch": 0.46, + "learning_rate": 1.9200542357615865e-06, + "loss": 0.998, + "step": 18061 + }, + { + "epoch": 0.46, + "learning_rate": 1.9200433943740137e-06, + "loss": 0.7622, + "step": 18062 + }, + { + "epoch": 0.46, + "learning_rate": 1.920032552282006e-06, + "loss": 1.0889, + "step": 18063 + }, + { + "epoch": 0.46, + "learning_rate": 1.9200217094855715e-06, + "loss": 0.9834, + "step": 18064 + }, + { + "epoch": 0.46, + "learning_rate": 1.9200108659847187e-06, + "loss": 0.7939, + "step": 18065 + }, + { + "epoch": 0.46, + "learning_rate": 1.9200000217794565e-06, + "loss": 0.8271, + "step": 18066 + }, + { + "epoch": 0.46, + "learning_rate": 1.919989176869792e-06, + "loss": 0.8965, + "step": 18067 + }, + { + "epoch": 0.46, + "learning_rate": 1.9199783312557338e-06, + "loss": 0.7998, + "step": 18068 + }, + { + "epoch": 0.46, + "learning_rate": 1.9199674849372907e-06, + "loss": 0.77, + "step": 18069 + }, + { + "epoch": 0.46, + "learning_rate": 1.9199566379144716e-06, + "loss": 0.8633, + "step": 18070 + }, + { + "epoch": 0.46, + "learning_rate": 1.9199457901872827e-06, + "loss": 0.751, + "step": 18071 + }, + { + "epoch": 0.46, + "learning_rate": 1.9199349417557347e-06, + "loss": 0.9814, + "step": 18072 + }, + { + "epoch": 0.46, + "learning_rate": 1.9199240926198343e-06, + "loss": 1.0352, + "step": 18073 + }, + { + "epoch": 0.46, + "learning_rate": 1.9199132427795905e-06, + "loss": 0.8232, + "step": 18074 + }, + { + "epoch": 0.46, + "learning_rate": 1.9199023922350112e-06, + "loss": 0.7676, + "step": 18075 + }, + { + "epoch": 0.46, + "learning_rate": 1.919891540986105e-06, + "loss": 0.9458, + "step": 18076 + }, + { + "epoch": 0.46, + "learning_rate": 1.9198806890328803e-06, + "loss": 0.8086, + "step": 18077 + }, + { + "epoch": 0.46, + "learning_rate": 1.919869836375345e-06, + "loss": 0.7266, + "step": 18078 + }, + { + "epoch": 0.46, + "learning_rate": 1.919858983013508e-06, + "loss": 0.7803, + "step": 18079 + }, + { + "epoch": 0.46, + "learning_rate": 1.919848128947377e-06, + "loss": 0.9336, + "step": 18080 + }, + { + "epoch": 0.46, + "learning_rate": 1.919837274176961e-06, + "loss": 0.8052, + "step": 18081 + }, + { + "epoch": 0.46, + "learning_rate": 1.9198264187022675e-06, + "loss": 0.8896, + "step": 18082 + }, + { + "epoch": 0.46, + "learning_rate": 1.9198155625233056e-06, + "loss": 0.9385, + "step": 18083 + }, + { + "epoch": 0.46, + "learning_rate": 1.9198047056400827e-06, + "loss": 0.4043, + "step": 18084 + }, + { + "epoch": 0.46, + "learning_rate": 1.919793848052608e-06, + "loss": 0.9785, + "step": 18085 + }, + { + "epoch": 0.46, + "learning_rate": 1.919782989760889e-06, + "loss": 0.8672, + "step": 18086 + }, + { + "epoch": 0.46, + "learning_rate": 1.919772130764935e-06, + "loss": 0.9609, + "step": 18087 + }, + { + "epoch": 0.46, + "learning_rate": 1.9197612710647536e-06, + "loss": 0.8154, + "step": 18088 + }, + { + "epoch": 0.46, + "learning_rate": 1.919750410660353e-06, + "loss": 0.7236, + "step": 18089 + }, + { + "epoch": 0.46, + "learning_rate": 1.9197395495517422e-06, + "loss": 0.9736, + "step": 18090 + }, + { + "epoch": 0.46, + "learning_rate": 1.9197286877389287e-06, + "loss": 1.0605, + "step": 18091 + }, + { + "epoch": 0.46, + "learning_rate": 1.9197178252219216e-06, + "loss": 0.9023, + "step": 18092 + }, + { + "epoch": 0.46, + "learning_rate": 1.9197069620007285e-06, + "loss": 0.8926, + "step": 18093 + }, + { + "epoch": 0.46, + "learning_rate": 1.9196960980753585e-06, + "loss": 1.0498, + "step": 18094 + }, + { + "epoch": 0.46, + "learning_rate": 1.919685233445819e-06, + "loss": 0.9795, + "step": 18095 + }, + { + "epoch": 0.46, + "learning_rate": 1.9196743681121194e-06, + "loss": 0.835, + "step": 18096 + }, + { + "epoch": 0.46, + "learning_rate": 1.919663502074267e-06, + "loss": 0.7163, + "step": 18097 + }, + { + "epoch": 0.46, + "learning_rate": 1.9196526353322705e-06, + "loss": 0.8447, + "step": 18098 + }, + { + "epoch": 0.46, + "learning_rate": 1.9196417678861386e-06, + "loss": 0.7607, + "step": 18099 + }, + { + "epoch": 0.46, + "learning_rate": 1.9196308997358787e-06, + "loss": 0.9038, + "step": 18100 + }, + { + "epoch": 0.46, + "learning_rate": 1.9196200308815007e-06, + "loss": 0.748, + "step": 18101 + }, + { + "epoch": 0.46, + "learning_rate": 1.919609161323011e-06, + "loss": 0.8188, + "step": 18102 + }, + { + "epoch": 0.46, + "learning_rate": 1.9195982910604193e-06, + "loss": 0.7031, + "step": 18103 + }, + { + "epoch": 0.46, + "learning_rate": 1.919587420093733e-06, + "loss": 1.1514, + "step": 18104 + }, + { + "epoch": 0.46, + "learning_rate": 1.9195765484229615e-06, + "loss": 0.9282, + "step": 18105 + }, + { + "epoch": 0.46, + "learning_rate": 1.919565676048112e-06, + "loss": 1.0361, + "step": 18106 + }, + { + "epoch": 0.46, + "learning_rate": 1.919554802969194e-06, + "loss": 0.8818, + "step": 18107 + }, + { + "epoch": 0.46, + "learning_rate": 1.9195439291862147e-06, + "loss": 0.6851, + "step": 18108 + }, + { + "epoch": 0.46, + "learning_rate": 1.9195330546991828e-06, + "loss": 0.8242, + "step": 18109 + }, + { + "epoch": 0.46, + "learning_rate": 1.9195221795081068e-06, + "loss": 0.9336, + "step": 18110 + }, + { + "epoch": 0.46, + "learning_rate": 1.9195113036129952e-06, + "loss": 1.0312, + "step": 18111 + }, + { + "epoch": 0.46, + "learning_rate": 1.919500427013856e-06, + "loss": 0.8721, + "step": 18112 + }, + { + "epoch": 0.46, + "learning_rate": 1.919489549710697e-06, + "loss": 0.8877, + "step": 18113 + }, + { + "epoch": 0.46, + "learning_rate": 1.919478671703528e-06, + "loss": 0.8887, + "step": 18114 + }, + { + "epoch": 0.46, + "learning_rate": 1.9194677929923563e-06, + "loss": 0.9502, + "step": 18115 + }, + { + "epoch": 0.46, + "learning_rate": 1.91945691357719e-06, + "loss": 1.0898, + "step": 18116 + }, + { + "epoch": 0.46, + "learning_rate": 1.9194460334580384e-06, + "loss": 1.125, + "step": 18117 + }, + { + "epoch": 0.46, + "learning_rate": 1.9194351526349086e-06, + "loss": 0.6616, + "step": 18118 + }, + { + "epoch": 0.46, + "learning_rate": 1.9194242711078098e-06, + "loss": 0.6797, + "step": 18119 + }, + { + "epoch": 0.46, + "learning_rate": 1.9194133888767503e-06, + "loss": 0.7881, + "step": 18120 + }, + { + "epoch": 0.46, + "learning_rate": 1.919402505941738e-06, + "loss": 0.7861, + "step": 18121 + }, + { + "epoch": 0.46, + "learning_rate": 1.9193916223027813e-06, + "loss": 0.7588, + "step": 18122 + }, + { + "epoch": 0.46, + "learning_rate": 1.919380737959889e-06, + "loss": 0.6318, + "step": 18123 + }, + { + "epoch": 0.46, + "learning_rate": 1.9193698529130694e-06, + "loss": 0.7764, + "step": 18124 + }, + { + "epoch": 0.46, + "learning_rate": 1.91935896716233e-06, + "loss": 0.8623, + "step": 18125 + }, + { + "epoch": 0.46, + "learning_rate": 1.9193480807076803e-06, + "loss": 0.7891, + "step": 18126 + }, + { + "epoch": 0.46, + "learning_rate": 1.9193371935491278e-06, + "loss": 0.8447, + "step": 18127 + }, + { + "epoch": 0.46, + "learning_rate": 1.919326305686681e-06, + "loss": 0.8281, + "step": 18128 + }, + { + "epoch": 0.46, + "learning_rate": 1.9193154171203485e-06, + "loss": 0.9473, + "step": 18129 + }, + { + "epoch": 0.46, + "learning_rate": 1.919304527850138e-06, + "loss": 0.8945, + "step": 18130 + }, + { + "epoch": 0.46, + "learning_rate": 1.9192936378760587e-06, + "loss": 0.8037, + "step": 18131 + }, + { + "epoch": 0.46, + "learning_rate": 1.9192827471981187e-06, + "loss": 0.7783, + "step": 18132 + }, + { + "epoch": 0.46, + "learning_rate": 1.919271855816326e-06, + "loss": 0.832, + "step": 18133 + }, + { + "epoch": 0.46, + "learning_rate": 1.919260963730689e-06, + "loss": 0.7368, + "step": 18134 + }, + { + "epoch": 0.46, + "learning_rate": 1.919250070941216e-06, + "loss": 1.042, + "step": 18135 + }, + { + "epoch": 0.46, + "learning_rate": 1.9192391774479156e-06, + "loss": 0.791, + "step": 18136 + }, + { + "epoch": 0.46, + "learning_rate": 1.9192282832507963e-06, + "loss": 0.6897, + "step": 18137 + }, + { + "epoch": 0.46, + "learning_rate": 1.919217388349866e-06, + "loss": 1.0176, + "step": 18138 + }, + { + "epoch": 0.46, + "learning_rate": 1.9192064927451332e-06, + "loss": 0.8208, + "step": 18139 + }, + { + "epoch": 0.46, + "learning_rate": 1.919195596436606e-06, + "loss": 0.918, + "step": 18140 + }, + { + "epoch": 0.46, + "learning_rate": 1.9191846994242935e-06, + "loss": 0.9482, + "step": 18141 + }, + { + "epoch": 0.46, + "learning_rate": 1.919173801708203e-06, + "loss": 0.8218, + "step": 18142 + }, + { + "epoch": 0.47, + "learning_rate": 1.9191629032883436e-06, + "loss": 0.9453, + "step": 18143 + }, + { + "epoch": 0.47, + "learning_rate": 1.9191520041647235e-06, + "loss": 0.8311, + "step": 18144 + }, + { + "epoch": 0.47, + "learning_rate": 1.919141104337351e-06, + "loss": 0.834, + "step": 18145 + }, + { + "epoch": 0.47, + "learning_rate": 1.9191302038062343e-06, + "loss": 0.8672, + "step": 18146 + }, + { + "epoch": 0.47, + "learning_rate": 1.919119302571382e-06, + "loss": 0.9219, + "step": 18147 + }, + { + "epoch": 0.47, + "learning_rate": 1.9191084006328026e-06, + "loss": 0.7891, + "step": 18148 + }, + { + "epoch": 0.47, + "learning_rate": 1.9190974979905035e-06, + "loss": 0.7021, + "step": 18149 + }, + { + "epoch": 0.47, + "learning_rate": 1.919086594644494e-06, + "loss": 0.7549, + "step": 18150 + }, + { + "epoch": 0.47, + "learning_rate": 1.9190756905947824e-06, + "loss": 0.9395, + "step": 18151 + }, + { + "epoch": 0.47, + "learning_rate": 1.9190647858413765e-06, + "loss": 0.8975, + "step": 18152 + }, + { + "epoch": 0.47, + "learning_rate": 1.9190538803842853e-06, + "loss": 1.0527, + "step": 18153 + }, + { + "epoch": 0.47, + "learning_rate": 1.9190429742235163e-06, + "loss": 0.4824, + "step": 18154 + }, + { + "epoch": 0.47, + "learning_rate": 1.9190320673590786e-06, + "loss": 0.9023, + "step": 18155 + }, + { + "epoch": 0.47, + "learning_rate": 1.91902115979098e-06, + "loss": 0.9893, + "step": 18156 + }, + { + "epoch": 0.47, + "learning_rate": 1.9190102515192297e-06, + "loss": 1.0586, + "step": 18157 + }, + { + "epoch": 0.47, + "learning_rate": 1.9189993425438355e-06, + "loss": 0.5879, + "step": 18158 + }, + { + "epoch": 0.47, + "learning_rate": 1.9189884328648055e-06, + "loss": 0.9062, + "step": 18159 + }, + { + "epoch": 0.47, + "learning_rate": 1.9189775224821483e-06, + "loss": 0.7522, + "step": 18160 + }, + { + "epoch": 0.47, + "learning_rate": 1.918966611395872e-06, + "loss": 1.0088, + "step": 18161 + }, + { + "epoch": 0.47, + "learning_rate": 1.9189556996059857e-06, + "loss": 0.7607, + "step": 18162 + }, + { + "epoch": 0.47, + "learning_rate": 1.918944787112497e-06, + "loss": 0.7812, + "step": 18163 + }, + { + "epoch": 0.47, + "learning_rate": 1.9189338739154147e-06, + "loss": 1.0391, + "step": 18164 + }, + { + "epoch": 0.47, + "learning_rate": 1.918922960014747e-06, + "loss": 1.0859, + "step": 18165 + }, + { + "epoch": 0.47, + "learning_rate": 1.918912045410502e-06, + "loss": 0.9688, + "step": 18166 + }, + { + "epoch": 0.47, + "learning_rate": 1.9189011301026884e-06, + "loss": 0.9014, + "step": 18167 + }, + { + "epoch": 0.47, + "learning_rate": 1.9188902140913146e-06, + "loss": 0.832, + "step": 18168 + }, + { + "epoch": 0.47, + "learning_rate": 1.918879297376389e-06, + "loss": 0.6787, + "step": 18169 + }, + { + "epoch": 0.47, + "learning_rate": 1.9188683799579194e-06, + "loss": 0.9648, + "step": 18170 + }, + { + "epoch": 0.47, + "learning_rate": 1.9188574618359145e-06, + "loss": 0.9229, + "step": 18171 + }, + { + "epoch": 0.47, + "learning_rate": 1.918846543010383e-06, + "loss": 0.8262, + "step": 18172 + }, + { + "epoch": 0.47, + "learning_rate": 1.9188356234813327e-06, + "loss": 0.8457, + "step": 18173 + }, + { + "epoch": 0.47, + "learning_rate": 1.9188247032487724e-06, + "loss": 0.9258, + "step": 18174 + }, + { + "epoch": 0.47, + "learning_rate": 1.91881378231271e-06, + "loss": 1.0322, + "step": 18175 + }, + { + "epoch": 0.47, + "learning_rate": 1.9188028606731544e-06, + "loss": 0.9023, + "step": 18176 + }, + { + "epoch": 0.47, + "learning_rate": 1.9187919383301137e-06, + "loss": 0.7905, + "step": 18177 + }, + { + "epoch": 0.47, + "learning_rate": 1.918781015283596e-06, + "loss": 1.0752, + "step": 18178 + }, + { + "epoch": 0.47, + "learning_rate": 1.91877009153361e-06, + "loss": 0.7725, + "step": 18179 + }, + { + "epoch": 0.47, + "learning_rate": 1.918759167080164e-06, + "loss": 0.8281, + "step": 18180 + }, + { + "epoch": 0.47, + "learning_rate": 1.9187482419232667e-06, + "loss": 0.9053, + "step": 18181 + }, + { + "epoch": 0.47, + "learning_rate": 1.918737316062926e-06, + "loss": 0.8877, + "step": 18182 + }, + { + "epoch": 0.47, + "learning_rate": 1.91872638949915e-06, + "loss": 0.9473, + "step": 18183 + }, + { + "epoch": 0.47, + "learning_rate": 1.9187154622319476e-06, + "loss": 0.748, + "step": 18184 + }, + { + "epoch": 0.47, + "learning_rate": 1.918704534261327e-06, + "loss": 0.8975, + "step": 18185 + }, + { + "epoch": 0.47, + "learning_rate": 1.918693605587297e-06, + "loss": 0.8555, + "step": 18186 + }, + { + "epoch": 0.47, + "learning_rate": 1.918682676209865e-06, + "loss": 0.8643, + "step": 18187 + }, + { + "epoch": 0.47, + "learning_rate": 1.91867174612904e-06, + "loss": 0.7354, + "step": 18188 + }, + { + "epoch": 0.47, + "learning_rate": 1.9186608153448303e-06, + "loss": 0.9561, + "step": 18189 + }, + { + "epoch": 0.47, + "learning_rate": 1.9186498838572443e-06, + "loss": 0.9951, + "step": 18190 + }, + { + "epoch": 0.47, + "learning_rate": 1.9186389516662906e-06, + "loss": 0.791, + "step": 18191 + }, + { + "epoch": 0.47, + "learning_rate": 1.9186280187719773e-06, + "loss": 0.8477, + "step": 18192 + }, + { + "epoch": 0.47, + "learning_rate": 1.9186170851743124e-06, + "loss": 1.0078, + "step": 18193 + }, + { + "epoch": 0.47, + "learning_rate": 1.9186061508733047e-06, + "loss": 0.8887, + "step": 18194 + }, + { + "epoch": 0.47, + "learning_rate": 1.9185952158689625e-06, + "loss": 1.0752, + "step": 18195 + }, + { + "epoch": 0.47, + "learning_rate": 1.9185842801612944e-06, + "loss": 0.8555, + "step": 18196 + }, + { + "epoch": 0.47, + "learning_rate": 1.9185733437503083e-06, + "loss": 0.6528, + "step": 18197 + }, + { + "epoch": 0.47, + "learning_rate": 1.9185624066360133e-06, + "loss": 1.0703, + "step": 18198 + }, + { + "epoch": 0.47, + "learning_rate": 1.9185514688184166e-06, + "loss": 0.6582, + "step": 18199 + }, + { + "epoch": 0.47, + "learning_rate": 1.9185405302975277e-06, + "loss": 1.127, + "step": 18200 + }, + { + "epoch": 0.47, + "learning_rate": 1.9185295910733545e-06, + "loss": 0.707, + "step": 18201 + }, + { + "epoch": 0.47, + "learning_rate": 1.9185186511459056e-06, + "loss": 0.8916, + "step": 18202 + }, + { + "epoch": 0.47, + "learning_rate": 1.918507710515189e-06, + "loss": 0.9395, + "step": 18203 + }, + { + "epoch": 0.47, + "learning_rate": 1.9184967691812133e-06, + "loss": 0.957, + "step": 18204 + }, + { + "epoch": 0.47, + "learning_rate": 1.918485827143987e-06, + "loss": 0.895, + "step": 18205 + }, + { + "epoch": 0.47, + "learning_rate": 1.9184748844035183e-06, + "loss": 0.8906, + "step": 18206 + }, + { + "epoch": 0.47, + "learning_rate": 1.9184639409598154e-06, + "loss": 0.7041, + "step": 18207 + }, + { + "epoch": 0.47, + "learning_rate": 1.918452996812887e-06, + "loss": 0.9873, + "step": 18208 + }, + { + "epoch": 0.47, + "learning_rate": 1.9184420519627413e-06, + "loss": 0.8545, + "step": 18209 + }, + { + "epoch": 0.47, + "learning_rate": 1.918431106409387e-06, + "loss": 0.8887, + "step": 18210 + }, + { + "epoch": 0.47, + "learning_rate": 1.918420160152832e-06, + "loss": 0.7197, + "step": 18211 + }, + { + "epoch": 0.47, + "learning_rate": 1.918409213193085e-06, + "loss": 0.7139, + "step": 18212 + }, + { + "epoch": 0.47, + "learning_rate": 1.918398265530154e-06, + "loss": 0.9209, + "step": 18213 + }, + { + "epoch": 0.47, + "learning_rate": 1.918387317164048e-06, + "loss": 0.9512, + "step": 18214 + }, + { + "epoch": 0.47, + "learning_rate": 1.918376368094775e-06, + "loss": 0.813, + "step": 18215 + }, + { + "epoch": 0.47, + "learning_rate": 1.9183654183223433e-06, + "loss": 0.9395, + "step": 18216 + }, + { + "epoch": 0.47, + "learning_rate": 1.9183544678467617e-06, + "loss": 0.915, + "step": 18217 + }, + { + "epoch": 0.47, + "learning_rate": 1.918343516668038e-06, + "loss": 0.8438, + "step": 18218 + }, + { + "epoch": 0.47, + "learning_rate": 1.918332564786181e-06, + "loss": 0.8008, + "step": 18219 + }, + { + "epoch": 0.47, + "learning_rate": 1.9183216122011995e-06, + "loss": 0.8877, + "step": 18220 + }, + { + "epoch": 0.47, + "learning_rate": 1.918310658913101e-06, + "loss": 0.8018, + "step": 18221 + }, + { + "epoch": 0.47, + "learning_rate": 1.918299704921894e-06, + "loss": 0.8457, + "step": 18222 + }, + { + "epoch": 0.47, + "learning_rate": 1.918288750227587e-06, + "loss": 0.7559, + "step": 18223 + }, + { + "epoch": 0.47, + "learning_rate": 1.9182777948301893e-06, + "loss": 0.9258, + "step": 18224 + }, + { + "epoch": 0.47, + "learning_rate": 1.918266838729708e-06, + "loss": 0.8047, + "step": 18225 + }, + { + "epoch": 0.47, + "learning_rate": 1.918255881926152e-06, + "loss": 0.9141, + "step": 18226 + }, + { + "epoch": 0.47, + "learning_rate": 1.91824492441953e-06, + "loss": 0.8594, + "step": 18227 + }, + { + "epoch": 0.47, + "learning_rate": 1.9182339662098497e-06, + "loss": 0.9932, + "step": 18228 + }, + { + "epoch": 0.47, + "learning_rate": 1.91822300729712e-06, + "loss": 1.0078, + "step": 18229 + }, + { + "epoch": 0.47, + "learning_rate": 1.918212047681349e-06, + "loss": 0.8721, + "step": 18230 + }, + { + "epoch": 0.47, + "learning_rate": 1.9182010873625453e-06, + "loss": 0.7783, + "step": 18231 + }, + { + "epoch": 0.47, + "learning_rate": 1.918190126340718e-06, + "loss": 0.9238, + "step": 18232 + }, + { + "epoch": 0.47, + "learning_rate": 1.9181791646158738e-06, + "loss": 1.0703, + "step": 18233 + }, + { + "epoch": 0.47, + "learning_rate": 1.9181682021880224e-06, + "loss": 0.9102, + "step": 18234 + }, + { + "epoch": 0.47, + "learning_rate": 1.9181572390571715e-06, + "loss": 0.9448, + "step": 18235 + }, + { + "epoch": 0.47, + "learning_rate": 1.9181462752233306e-06, + "loss": 0.8643, + "step": 18236 + }, + { + "epoch": 0.47, + "learning_rate": 1.9181353106865065e-06, + "loss": 0.7012, + "step": 18237 + }, + { + "epoch": 0.47, + "learning_rate": 1.9181243454467087e-06, + "loss": 0.8809, + "step": 18238 + }, + { + "epoch": 0.47, + "learning_rate": 1.9181133795039455e-06, + "loss": 0.7749, + "step": 18239 + }, + { + "epoch": 0.47, + "learning_rate": 1.918102412858225e-06, + "loss": 0.8975, + "step": 18240 + }, + { + "epoch": 0.47, + "learning_rate": 1.9180914455095552e-06, + "loss": 0.8857, + "step": 18241 + }, + { + "epoch": 0.47, + "learning_rate": 1.918080477457946e-06, + "loss": 0.9453, + "step": 18242 + }, + { + "epoch": 0.47, + "learning_rate": 1.918069508703404e-06, + "loss": 0.9902, + "step": 18243 + }, + { + "epoch": 0.47, + "learning_rate": 1.9180585392459385e-06, + "loss": 1.0195, + "step": 18244 + }, + { + "epoch": 0.47, + "learning_rate": 1.9180475690855577e-06, + "loss": 0.7627, + "step": 18245 + }, + { + "epoch": 0.47, + "learning_rate": 1.9180365982222704e-06, + "loss": 0.5989, + "step": 18246 + }, + { + "epoch": 0.47, + "learning_rate": 1.9180256266560847e-06, + "loss": 1.0635, + "step": 18247 + }, + { + "epoch": 0.47, + "learning_rate": 1.9180146543870086e-06, + "loss": 0.8486, + "step": 18248 + }, + { + "epoch": 0.47, + "learning_rate": 1.9180036814150514e-06, + "loss": 0.7759, + "step": 18249 + }, + { + "epoch": 0.47, + "learning_rate": 1.917992707740221e-06, + "loss": 0.6924, + "step": 18250 + }, + { + "epoch": 0.47, + "learning_rate": 1.9179817333625252e-06, + "loss": 0.8198, + "step": 18251 + }, + { + "epoch": 0.47, + "learning_rate": 1.9179707582819736e-06, + "loss": 0.832, + "step": 18252 + }, + { + "epoch": 0.47, + "learning_rate": 1.9179597824985734e-06, + "loss": 0.7046, + "step": 18253 + }, + { + "epoch": 0.47, + "learning_rate": 1.917948806012334e-06, + "loss": 0.8818, + "step": 18254 + }, + { + "epoch": 0.47, + "learning_rate": 1.9179378288232634e-06, + "loss": 0.8875, + "step": 18255 + }, + { + "epoch": 0.47, + "learning_rate": 1.91792685093137e-06, + "loss": 0.7412, + "step": 18256 + }, + { + "epoch": 0.47, + "learning_rate": 1.917915872336662e-06, + "loss": 0.9194, + "step": 18257 + }, + { + "epoch": 0.47, + "learning_rate": 1.9179048930391483e-06, + "loss": 0.9668, + "step": 18258 + }, + { + "epoch": 0.47, + "learning_rate": 1.917893913038837e-06, + "loss": 0.7241, + "step": 18259 + }, + { + "epoch": 0.47, + "learning_rate": 1.9178829323357366e-06, + "loss": 0.8408, + "step": 18260 + }, + { + "epoch": 0.47, + "learning_rate": 1.9178719509298554e-06, + "loss": 0.9531, + "step": 18261 + }, + { + "epoch": 0.47, + "learning_rate": 1.9178609688212016e-06, + "loss": 0.9082, + "step": 18262 + }, + { + "epoch": 0.47, + "learning_rate": 1.917849986009784e-06, + "loss": 0.6118, + "step": 18263 + }, + { + "epoch": 0.47, + "learning_rate": 1.917839002495611e-06, + "loss": 0.7261, + "step": 18264 + }, + { + "epoch": 0.47, + "learning_rate": 1.9178280182786906e-06, + "loss": 0.8516, + "step": 18265 + }, + { + "epoch": 0.47, + "learning_rate": 1.917817033359032e-06, + "loss": 1.0205, + "step": 18266 + }, + { + "epoch": 0.47, + "learning_rate": 1.9178060477366426e-06, + "loss": 1.0137, + "step": 18267 + }, + { + "epoch": 0.47, + "learning_rate": 1.9177950614115317e-06, + "loss": 0.8281, + "step": 18268 + }, + { + "epoch": 0.47, + "learning_rate": 1.917784074383707e-06, + "loss": 1.0088, + "step": 18269 + }, + { + "epoch": 0.47, + "learning_rate": 1.9177730866531773e-06, + "loss": 0.7236, + "step": 18270 + }, + { + "epoch": 0.47, + "learning_rate": 1.9177620982199508e-06, + "loss": 0.9336, + "step": 18271 + }, + { + "epoch": 0.47, + "learning_rate": 1.9177511090840363e-06, + "loss": 0.9209, + "step": 18272 + }, + { + "epoch": 0.47, + "learning_rate": 1.917740119245442e-06, + "loss": 0.7881, + "step": 18273 + }, + { + "epoch": 0.47, + "learning_rate": 1.9177291287041763e-06, + "loss": 0.5996, + "step": 18274 + }, + { + "epoch": 0.47, + "learning_rate": 1.9177181374602475e-06, + "loss": 0.9824, + "step": 18275 + }, + { + "epoch": 0.47, + "learning_rate": 1.9177071455136643e-06, + "loss": 0.8223, + "step": 18276 + }, + { + "epoch": 0.47, + "learning_rate": 1.9176961528644347e-06, + "loss": 0.7891, + "step": 18277 + }, + { + "epoch": 0.47, + "learning_rate": 1.9176851595125675e-06, + "loss": 0.8389, + "step": 18278 + }, + { + "epoch": 0.47, + "learning_rate": 1.9176741654580704e-06, + "loss": 0.8105, + "step": 18279 + }, + { + "epoch": 0.47, + "learning_rate": 1.917663170700953e-06, + "loss": 1.0615, + "step": 18280 + }, + { + "epoch": 0.47, + "learning_rate": 1.9176521752412233e-06, + "loss": 0.8994, + "step": 18281 + }, + { + "epoch": 0.47, + "learning_rate": 1.9176411790788893e-06, + "loss": 0.6304, + "step": 18282 + }, + { + "epoch": 0.47, + "learning_rate": 1.9176301822139593e-06, + "loss": 0.918, + "step": 18283 + }, + { + "epoch": 0.47, + "learning_rate": 1.9176191846464426e-06, + "loss": 1.0049, + "step": 18284 + }, + { + "epoch": 0.47, + "learning_rate": 1.917608186376347e-06, + "loss": 0.832, + "step": 18285 + }, + { + "epoch": 0.47, + "learning_rate": 1.9175971874036804e-06, + "loss": 1.0684, + "step": 18286 + }, + { + "epoch": 0.47, + "learning_rate": 1.917586187728452e-06, + "loss": 0.8428, + "step": 18287 + }, + { + "epoch": 0.47, + "learning_rate": 1.9175751873506703e-06, + "loss": 1.1221, + "step": 18288 + }, + { + "epoch": 0.47, + "learning_rate": 1.9175641862703437e-06, + "loss": 0.9453, + "step": 18289 + }, + { + "epoch": 0.47, + "learning_rate": 1.9175531844874802e-06, + "loss": 0.9834, + "step": 18290 + }, + { + "epoch": 0.47, + "learning_rate": 1.917542182002088e-06, + "loss": 0.8271, + "step": 18291 + }, + { + "epoch": 0.47, + "learning_rate": 1.9175311788141766e-06, + "loss": 0.7607, + "step": 18292 + }, + { + "epoch": 0.47, + "learning_rate": 1.9175201749237534e-06, + "loss": 1.1338, + "step": 18293 + }, + { + "epoch": 0.47, + "learning_rate": 1.9175091703308272e-06, + "loss": 0.8271, + "step": 18294 + }, + { + "epoch": 0.47, + "learning_rate": 1.9174981650354067e-06, + "loss": 0.6045, + "step": 18295 + }, + { + "epoch": 0.47, + "learning_rate": 1.9174871590375e-06, + "loss": 0.96, + "step": 18296 + }, + { + "epoch": 0.47, + "learning_rate": 1.917476152337115e-06, + "loss": 0.7715, + "step": 18297 + }, + { + "epoch": 0.47, + "learning_rate": 1.9174651449342613e-06, + "loss": 1.0791, + "step": 18298 + }, + { + "epoch": 0.47, + "learning_rate": 1.9174541368289466e-06, + "loss": 0.9277, + "step": 18299 + }, + { + "epoch": 0.47, + "learning_rate": 1.917443128021179e-06, + "loss": 0.915, + "step": 18300 + }, + { + "epoch": 0.47, + "learning_rate": 1.917432118510968e-06, + "loss": 0.9189, + "step": 18301 + }, + { + "epoch": 0.47, + "learning_rate": 1.9174211082983207e-06, + "loss": 0.9443, + "step": 18302 + }, + { + "epoch": 0.47, + "learning_rate": 1.917410097383247e-06, + "loss": 0.8896, + "step": 18303 + }, + { + "epoch": 0.47, + "learning_rate": 1.9173990857657546e-06, + "loss": 0.9722, + "step": 18304 + }, + { + "epoch": 0.47, + "learning_rate": 1.9173880734458513e-06, + "loss": 0.8701, + "step": 18305 + }, + { + "epoch": 0.47, + "learning_rate": 1.9173770604235464e-06, + "loss": 0.7178, + "step": 18306 + }, + { + "epoch": 0.47, + "learning_rate": 1.9173660466988483e-06, + "loss": 0.8496, + "step": 18307 + }, + { + "epoch": 0.47, + "learning_rate": 1.917355032271765e-06, + "loss": 0.6343, + "step": 18308 + }, + { + "epoch": 0.47, + "learning_rate": 1.9173440171423047e-06, + "loss": 0.7979, + "step": 18309 + }, + { + "epoch": 0.47, + "learning_rate": 1.9173330013104765e-06, + "loss": 0.8418, + "step": 18310 + }, + { + "epoch": 0.47, + "learning_rate": 1.917321984776289e-06, + "loss": 0.8027, + "step": 18311 + }, + { + "epoch": 0.47, + "learning_rate": 1.91731096753975e-06, + "loss": 0.999, + "step": 18312 + }, + { + "epoch": 0.47, + "learning_rate": 1.917299949600868e-06, + "loss": 1.0898, + "step": 18313 + }, + { + "epoch": 0.47, + "learning_rate": 1.917288930959652e-06, + "loss": 0.8311, + "step": 18314 + }, + { + "epoch": 0.47, + "learning_rate": 1.91727791161611e-06, + "loss": 0.7666, + "step": 18315 + }, + { + "epoch": 0.47, + "learning_rate": 1.9172668915702502e-06, + "loss": 0.8877, + "step": 18316 + }, + { + "epoch": 0.47, + "learning_rate": 1.9172558708220815e-06, + "loss": 1.0215, + "step": 18317 + }, + { + "epoch": 0.47, + "learning_rate": 1.917244849371612e-06, + "loss": 0.9414, + "step": 18318 + }, + { + "epoch": 0.47, + "learning_rate": 1.9172338272188505e-06, + "loss": 0.8413, + "step": 18319 + }, + { + "epoch": 0.47, + "learning_rate": 1.917222804363805e-06, + "loss": 0.8623, + "step": 18320 + }, + { + "epoch": 0.47, + "learning_rate": 1.917211780806484e-06, + "loss": 1.0068, + "step": 18321 + }, + { + "epoch": 0.47, + "learning_rate": 1.917200756546897e-06, + "loss": 0.748, + "step": 18322 + }, + { + "epoch": 0.47, + "learning_rate": 1.917189731585051e-06, + "loss": 0.8574, + "step": 18323 + }, + { + "epoch": 0.47, + "learning_rate": 1.917178705920955e-06, + "loss": 0.833, + "step": 18324 + }, + { + "epoch": 0.47, + "learning_rate": 1.917167679554617e-06, + "loss": 1.0381, + "step": 18325 + }, + { + "epoch": 0.47, + "learning_rate": 1.9171566524860465e-06, + "loss": 0.6084, + "step": 18326 + }, + { + "epoch": 0.47, + "learning_rate": 1.917145624715251e-06, + "loss": 0.8613, + "step": 18327 + }, + { + "epoch": 0.47, + "learning_rate": 1.9171345962422395e-06, + "loss": 0.7539, + "step": 18328 + }, + { + "epoch": 0.47, + "learning_rate": 1.9171235670670197e-06, + "loss": 0.8018, + "step": 18329 + }, + { + "epoch": 0.47, + "learning_rate": 1.917112537189601e-06, + "loss": 0.7998, + "step": 18330 + }, + { + "epoch": 0.47, + "learning_rate": 1.917101506609991e-06, + "loss": 0.7056, + "step": 18331 + }, + { + "epoch": 0.47, + "learning_rate": 1.9170904753281995e-06, + "loss": 1.1045, + "step": 18332 + }, + { + "epoch": 0.47, + "learning_rate": 1.917079443344233e-06, + "loss": 0.9004, + "step": 18333 + }, + { + "epoch": 0.47, + "learning_rate": 1.9170684106581016e-06, + "loss": 0.873, + "step": 18334 + }, + { + "epoch": 0.47, + "learning_rate": 1.9170573772698127e-06, + "loss": 0.8779, + "step": 18335 + }, + { + "epoch": 0.47, + "learning_rate": 1.917046343179375e-06, + "loss": 0.7969, + "step": 18336 + }, + { + "epoch": 0.47, + "learning_rate": 1.917035308386798e-06, + "loss": 0.6304, + "step": 18337 + }, + { + "epoch": 0.47, + "learning_rate": 1.917024272892088e-06, + "loss": 1.0537, + "step": 18338 + }, + { + "epoch": 0.47, + "learning_rate": 1.917013236695255e-06, + "loss": 0.8828, + "step": 18339 + }, + { + "epoch": 0.47, + "learning_rate": 1.9170021997963076e-06, + "loss": 0.7715, + "step": 18340 + }, + { + "epoch": 0.47, + "learning_rate": 1.9169911621952533e-06, + "loss": 0.8291, + "step": 18341 + }, + { + "epoch": 0.47, + "learning_rate": 1.9169801238921015e-06, + "loss": 0.9688, + "step": 18342 + }, + { + "epoch": 0.47, + "learning_rate": 1.91696908488686e-06, + "loss": 0.9834, + "step": 18343 + }, + { + "epoch": 0.47, + "learning_rate": 1.9169580451795373e-06, + "loss": 0.6355, + "step": 18344 + }, + { + "epoch": 0.47, + "learning_rate": 1.916947004770142e-06, + "loss": 0.9521, + "step": 18345 + }, + { + "epoch": 0.47, + "learning_rate": 1.9169359636586824e-06, + "loss": 0.7444, + "step": 18346 + }, + { + "epoch": 0.47, + "learning_rate": 1.9169249218451677e-06, + "loss": 0.7544, + "step": 18347 + }, + { + "epoch": 0.47, + "learning_rate": 1.916913879329605e-06, + "loss": 0.9014, + "step": 18348 + }, + { + "epoch": 0.47, + "learning_rate": 1.916902836112004e-06, + "loss": 0.793, + "step": 18349 + }, + { + "epoch": 0.47, + "learning_rate": 1.9168917921923727e-06, + "loss": 0.8613, + "step": 18350 + }, + { + "epoch": 0.47, + "learning_rate": 1.9168807475707193e-06, + "loss": 0.8936, + "step": 18351 + }, + { + "epoch": 0.47, + "learning_rate": 1.916869702247052e-06, + "loss": 0.7529, + "step": 18352 + }, + { + "epoch": 0.47, + "learning_rate": 1.9168586562213807e-06, + "loss": 1.0586, + "step": 18353 + }, + { + "epoch": 0.47, + "learning_rate": 1.9168476094937124e-06, + "loss": 0.6865, + "step": 18354 + }, + { + "epoch": 0.47, + "learning_rate": 1.916836562064056e-06, + "loss": 0.8066, + "step": 18355 + }, + { + "epoch": 0.47, + "learning_rate": 1.91682551393242e-06, + "loss": 0.8818, + "step": 18356 + }, + { + "epoch": 0.47, + "learning_rate": 1.916814465098813e-06, + "loss": 0.8955, + "step": 18357 + }, + { + "epoch": 0.47, + "learning_rate": 1.9168034155632433e-06, + "loss": 0.9648, + "step": 18358 + }, + { + "epoch": 0.47, + "learning_rate": 1.916792365325719e-06, + "loss": 1.0938, + "step": 18359 + }, + { + "epoch": 0.47, + "learning_rate": 1.9167813143862493e-06, + "loss": 0.8975, + "step": 18360 + }, + { + "epoch": 0.47, + "learning_rate": 1.916770262744842e-06, + "loss": 0.7256, + "step": 18361 + }, + { + "epoch": 0.47, + "learning_rate": 1.916759210401507e-06, + "loss": 0.8848, + "step": 18362 + }, + { + "epoch": 0.47, + "learning_rate": 1.91674815735625e-06, + "loss": 0.8252, + "step": 18363 + }, + { + "epoch": 0.47, + "learning_rate": 1.916737103609082e-06, + "loss": 0.7397, + "step": 18364 + }, + { + "epoch": 0.47, + "learning_rate": 1.9167260491600106e-06, + "loss": 0.4846, + "step": 18365 + }, + { + "epoch": 0.47, + "learning_rate": 1.916714994009044e-06, + "loss": 0.8184, + "step": 18366 + }, + { + "epoch": 0.47, + "learning_rate": 1.916703938156191e-06, + "loss": 0.7773, + "step": 18367 + }, + { + "epoch": 0.47, + "learning_rate": 1.9166928816014596e-06, + "loss": 0.8887, + "step": 18368 + }, + { + "epoch": 0.47, + "learning_rate": 1.9166818243448592e-06, + "loss": 0.7031, + "step": 18369 + }, + { + "epoch": 0.47, + "learning_rate": 1.916670766386397e-06, + "loss": 0.8242, + "step": 18370 + }, + { + "epoch": 0.47, + "learning_rate": 1.916659707726083e-06, + "loss": 0.7512, + "step": 18371 + }, + { + "epoch": 0.47, + "learning_rate": 1.9166486483639238e-06, + "loss": 1.1182, + "step": 18372 + }, + { + "epoch": 0.47, + "learning_rate": 1.9166375882999293e-06, + "loss": 0.6543, + "step": 18373 + }, + { + "epoch": 0.47, + "learning_rate": 1.9166265275341074e-06, + "loss": 1.0303, + "step": 18374 + }, + { + "epoch": 0.47, + "learning_rate": 1.916615466066467e-06, + "loss": 0.9922, + "step": 18375 + }, + { + "epoch": 0.47, + "learning_rate": 1.9166044038970163e-06, + "loss": 0.8862, + "step": 18376 + }, + { + "epoch": 0.47, + "learning_rate": 1.9165933410257637e-06, + "loss": 0.5947, + "step": 18377 + }, + { + "epoch": 0.47, + "learning_rate": 1.9165822774527175e-06, + "loss": 0.8623, + "step": 18378 + }, + { + "epoch": 0.47, + "learning_rate": 1.9165712131778867e-06, + "loss": 0.7822, + "step": 18379 + }, + { + "epoch": 0.47, + "learning_rate": 1.9165601482012794e-06, + "loss": 0.7744, + "step": 18380 + }, + { + "epoch": 0.47, + "learning_rate": 1.916549082522904e-06, + "loss": 0.9883, + "step": 18381 + }, + { + "epoch": 0.47, + "learning_rate": 1.916538016142769e-06, + "loss": 0.7925, + "step": 18382 + }, + { + "epoch": 0.47, + "learning_rate": 1.9165269490608835e-06, + "loss": 0.7545, + "step": 18383 + }, + { + "epoch": 0.47, + "learning_rate": 1.916515881277255e-06, + "loss": 0.877, + "step": 18384 + }, + { + "epoch": 0.47, + "learning_rate": 1.9165048127918927e-06, + "loss": 1.0137, + "step": 18385 + }, + { + "epoch": 0.47, + "learning_rate": 1.916493743604805e-06, + "loss": 0.877, + "step": 18386 + }, + { + "epoch": 0.47, + "learning_rate": 1.9164826737159994e-06, + "loss": 0.7773, + "step": 18387 + }, + { + "epoch": 0.47, + "learning_rate": 1.9164716031254856e-06, + "loss": 1.0703, + "step": 18388 + }, + { + "epoch": 0.47, + "learning_rate": 1.916460531833272e-06, + "loss": 0.7209, + "step": 18389 + }, + { + "epoch": 0.47, + "learning_rate": 1.916449459839366e-06, + "loss": 0.6943, + "step": 18390 + }, + { + "epoch": 0.47, + "learning_rate": 1.916438387143777e-06, + "loss": 0.9951, + "step": 18391 + }, + { + "epoch": 0.47, + "learning_rate": 1.9164273137465137e-06, + "loss": 1.043, + "step": 18392 + }, + { + "epoch": 0.47, + "learning_rate": 1.916416239647584e-06, + "loss": 0.8071, + "step": 18393 + }, + { + "epoch": 0.47, + "learning_rate": 1.916405164846996e-06, + "loss": 0.6309, + "step": 18394 + }, + { + "epoch": 0.47, + "learning_rate": 1.9163940893447594e-06, + "loss": 0.9268, + "step": 18395 + }, + { + "epoch": 0.47, + "learning_rate": 1.9163830131408816e-06, + "loss": 0.9033, + "step": 18396 + }, + { + "epoch": 0.47, + "learning_rate": 1.9163719362353716e-06, + "loss": 0.8584, + "step": 18397 + }, + { + "epoch": 0.47, + "learning_rate": 1.9163608586282376e-06, + "loss": 0.9082, + "step": 18398 + }, + { + "epoch": 0.47, + "learning_rate": 1.9163497803194885e-06, + "loss": 0.9648, + "step": 18399 + }, + { + "epoch": 0.47, + "learning_rate": 1.916338701309132e-06, + "loss": 0.9775, + "step": 18400 + }, + { + "epoch": 0.47, + "learning_rate": 1.9163276215971776e-06, + "loss": 0.7578, + "step": 18401 + }, + { + "epoch": 0.47, + "learning_rate": 1.916316541183633e-06, + "loss": 0.8623, + "step": 18402 + }, + { + "epoch": 0.47, + "learning_rate": 1.9163054600685073e-06, + "loss": 0.7085, + "step": 18403 + }, + { + "epoch": 0.47, + "learning_rate": 1.916294378251808e-06, + "loss": 0.7866, + "step": 18404 + }, + { + "epoch": 0.47, + "learning_rate": 1.9162832957335448e-06, + "loss": 1.0146, + "step": 18405 + }, + { + "epoch": 0.47, + "learning_rate": 1.9162722125137252e-06, + "loss": 1.0166, + "step": 18406 + }, + { + "epoch": 0.47, + "learning_rate": 1.9162611285923583e-06, + "loss": 0.6899, + "step": 18407 + }, + { + "epoch": 0.47, + "learning_rate": 1.916250043969453e-06, + "loss": 0.8418, + "step": 18408 + }, + { + "epoch": 0.47, + "learning_rate": 1.916238958645016e-06, + "loss": 1.0195, + "step": 18409 + }, + { + "epoch": 0.47, + "learning_rate": 1.9162278726190577e-06, + "loss": 0.8291, + "step": 18410 + }, + { + "epoch": 0.47, + "learning_rate": 1.916216785891586e-06, + "loss": 0.8564, + "step": 18411 + }, + { + "epoch": 0.47, + "learning_rate": 1.9162056984626084e-06, + "loss": 0.8252, + "step": 18412 + }, + { + "epoch": 0.47, + "learning_rate": 1.916194610332135e-06, + "loss": 0.8262, + "step": 18413 + }, + { + "epoch": 0.47, + "learning_rate": 1.916183521500173e-06, + "loss": 0.8545, + "step": 18414 + }, + { + "epoch": 0.47, + "learning_rate": 1.9161724319667314e-06, + "loss": 0.8105, + "step": 18415 + }, + { + "epoch": 0.47, + "learning_rate": 1.9161613417318193e-06, + "loss": 0.9561, + "step": 18416 + }, + { + "epoch": 0.47, + "learning_rate": 1.9161502507954445e-06, + "loss": 0.8223, + "step": 18417 + }, + { + "epoch": 0.47, + "learning_rate": 1.916139159157615e-06, + "loss": 0.856, + "step": 18418 + }, + { + "epoch": 0.47, + "learning_rate": 1.9161280668183403e-06, + "loss": 0.7061, + "step": 18419 + }, + { + "epoch": 0.47, + "learning_rate": 1.9161169737776286e-06, + "loss": 1.084, + "step": 18420 + }, + { + "epoch": 0.47, + "learning_rate": 1.9161058800354876e-06, + "loss": 0.7622, + "step": 18421 + }, + { + "epoch": 0.47, + "learning_rate": 1.9160947855919267e-06, + "loss": 0.9111, + "step": 18422 + }, + { + "epoch": 0.47, + "learning_rate": 1.916083690446955e-06, + "loss": 0.8145, + "step": 18423 + }, + { + "epoch": 0.47, + "learning_rate": 1.916072594600579e-06, + "loss": 0.8896, + "step": 18424 + }, + { + "epoch": 0.47, + "learning_rate": 1.9160614980528087e-06, + "loss": 0.7217, + "step": 18425 + }, + { + "epoch": 0.47, + "learning_rate": 1.9160504008036524e-06, + "loss": 1.0117, + "step": 18426 + }, + { + "epoch": 0.47, + "learning_rate": 1.9160393028531185e-06, + "loss": 1.0254, + "step": 18427 + }, + { + "epoch": 0.47, + "learning_rate": 1.9160282042012154e-06, + "loss": 0.7686, + "step": 18428 + }, + { + "epoch": 0.47, + "learning_rate": 1.9160171048479513e-06, + "loss": 0.9766, + "step": 18429 + }, + { + "epoch": 0.47, + "learning_rate": 1.9160060047933354e-06, + "loss": 1.0918, + "step": 18430 + }, + { + "epoch": 0.47, + "learning_rate": 1.9159949040373754e-06, + "loss": 0.7432, + "step": 18431 + }, + { + "epoch": 0.47, + "learning_rate": 1.91598380258008e-06, + "loss": 0.8545, + "step": 18432 + }, + { + "epoch": 0.47, + "learning_rate": 1.915972700421459e-06, + "loss": 0.772, + "step": 18433 + }, + { + "epoch": 0.47, + "learning_rate": 1.915961597561519e-06, + "loss": 1.0703, + "step": 18434 + }, + { + "epoch": 0.47, + "learning_rate": 1.9159504940002695e-06, + "loss": 0.9146, + "step": 18435 + }, + { + "epoch": 0.47, + "learning_rate": 1.915939389737719e-06, + "loss": 1.041, + "step": 18436 + }, + { + "epoch": 0.47, + "learning_rate": 1.9159282847738754e-06, + "loss": 0.71, + "step": 18437 + }, + { + "epoch": 0.47, + "learning_rate": 1.915917179108748e-06, + "loss": 0.7832, + "step": 18438 + }, + { + "epoch": 0.47, + "learning_rate": 1.915906072742345e-06, + "loss": 0.8535, + "step": 18439 + }, + { + "epoch": 0.47, + "learning_rate": 1.9158949656746744e-06, + "loss": 0.8882, + "step": 18440 + }, + { + "epoch": 0.47, + "learning_rate": 1.9158838579057454e-06, + "loss": 0.6997, + "step": 18441 + }, + { + "epoch": 0.47, + "learning_rate": 1.9158727494355662e-06, + "loss": 0.9854, + "step": 18442 + }, + { + "epoch": 0.47, + "learning_rate": 1.9158616402641454e-06, + "loss": 1.0645, + "step": 18443 + }, + { + "epoch": 0.47, + "learning_rate": 1.915850530391492e-06, + "loss": 0.9189, + "step": 18444 + }, + { + "epoch": 0.47, + "learning_rate": 1.9158394198176133e-06, + "loss": 0.9033, + "step": 18445 + }, + { + "epoch": 0.47, + "learning_rate": 1.9158283085425184e-06, + "loss": 1.1152, + "step": 18446 + }, + { + "epoch": 0.47, + "learning_rate": 1.915817196566216e-06, + "loss": 0.918, + "step": 18447 + }, + { + "epoch": 0.47, + "learning_rate": 1.9158060838887143e-06, + "loss": 0.8799, + "step": 18448 + }, + { + "epoch": 0.47, + "learning_rate": 1.9157949705100224e-06, + "loss": 0.9922, + "step": 18449 + }, + { + "epoch": 0.47, + "learning_rate": 1.915783856430148e-06, + "loss": 0.5969, + "step": 18450 + }, + { + "epoch": 0.47, + "learning_rate": 1.9157727416491005e-06, + "loss": 0.9512, + "step": 18451 + }, + { + "epoch": 0.47, + "learning_rate": 1.915761626166888e-06, + "loss": 1.0742, + "step": 18452 + }, + { + "epoch": 0.47, + "learning_rate": 1.915750509983518e-06, + "loss": 0.8584, + "step": 18453 + }, + { + "epoch": 0.47, + "learning_rate": 1.9157393930990006e-06, + "loss": 0.9141, + "step": 18454 + }, + { + "epoch": 0.47, + "learning_rate": 1.915728275513344e-06, + "loss": 0.9697, + "step": 18455 + }, + { + "epoch": 0.47, + "learning_rate": 1.9157171572265555e-06, + "loss": 0.7827, + "step": 18456 + }, + { + "epoch": 0.47, + "learning_rate": 1.915706038238645e-06, + "loss": 0.7109, + "step": 18457 + }, + { + "epoch": 0.47, + "learning_rate": 1.9156949185496203e-06, + "loss": 0.875, + "step": 18458 + }, + { + "epoch": 0.47, + "learning_rate": 1.9156837981594904e-06, + "loss": 0.9885, + "step": 18459 + }, + { + "epoch": 0.47, + "learning_rate": 1.9156726770682633e-06, + "loss": 0.8301, + "step": 18460 + }, + { + "epoch": 0.47, + "learning_rate": 1.915661555275948e-06, + "loss": 0.7314, + "step": 18461 + }, + { + "epoch": 0.47, + "learning_rate": 1.9156504327825525e-06, + "loss": 0.9521, + "step": 18462 + }, + { + "epoch": 0.47, + "learning_rate": 1.9156393095880858e-06, + "loss": 0.8457, + "step": 18463 + }, + { + "epoch": 0.47, + "learning_rate": 1.9156281856925557e-06, + "loss": 0.6265, + "step": 18464 + }, + { + "epoch": 0.47, + "learning_rate": 1.9156170610959712e-06, + "loss": 0.791, + "step": 18465 + }, + { + "epoch": 0.47, + "learning_rate": 1.9156059357983412e-06, + "loss": 0.8087, + "step": 18466 + }, + { + "epoch": 0.47, + "learning_rate": 1.915594809799674e-06, + "loss": 1.0029, + "step": 18467 + }, + { + "epoch": 0.47, + "learning_rate": 1.9155836830999775e-06, + "loss": 0.8433, + "step": 18468 + }, + { + "epoch": 0.47, + "learning_rate": 1.915572555699261e-06, + "loss": 0.9463, + "step": 18469 + }, + { + "epoch": 0.47, + "learning_rate": 1.915561427597533e-06, + "loss": 1.002, + "step": 18470 + }, + { + "epoch": 0.47, + "learning_rate": 1.915550298794801e-06, + "loss": 0.8965, + "step": 18471 + }, + { + "epoch": 0.47, + "learning_rate": 1.915539169291074e-06, + "loss": 0.9961, + "step": 18472 + }, + { + "epoch": 0.47, + "learning_rate": 1.9155280390863617e-06, + "loss": 0.9678, + "step": 18473 + }, + { + "epoch": 0.47, + "learning_rate": 1.9155169081806713e-06, + "loss": 0.7725, + "step": 18474 + }, + { + "epoch": 0.47, + "learning_rate": 1.9155057765740113e-06, + "loss": 0.873, + "step": 18475 + }, + { + "epoch": 0.47, + "learning_rate": 1.915494644266391e-06, + "loss": 0.7384, + "step": 18476 + }, + { + "epoch": 0.47, + "learning_rate": 1.9154835112578188e-06, + "loss": 0.7969, + "step": 18477 + }, + { + "epoch": 0.47, + "learning_rate": 1.9154723775483024e-06, + "loss": 0.8486, + "step": 18478 + }, + { + "epoch": 0.47, + "learning_rate": 1.915461243137851e-06, + "loss": 0.8047, + "step": 18479 + }, + { + "epoch": 0.47, + "learning_rate": 1.915450108026473e-06, + "loss": 0.9404, + "step": 18480 + }, + { + "epoch": 0.47, + "learning_rate": 1.9154389722141776e-06, + "loss": 0.8789, + "step": 18481 + }, + { + "epoch": 0.47, + "learning_rate": 1.915427835700972e-06, + "loss": 0.9082, + "step": 18482 + }, + { + "epoch": 0.47, + "learning_rate": 1.9154166984868658e-06, + "loss": 0.9814, + "step": 18483 + }, + { + "epoch": 0.47, + "learning_rate": 1.915405560571867e-06, + "loss": 1.041, + "step": 18484 + }, + { + "epoch": 0.47, + "learning_rate": 1.915394421955984e-06, + "loss": 0.623, + "step": 18485 + }, + { + "epoch": 0.47, + "learning_rate": 1.915383282639226e-06, + "loss": 0.9775, + "step": 18486 + }, + { + "epoch": 0.47, + "learning_rate": 1.915372142621601e-06, + "loss": 1.0361, + "step": 18487 + }, + { + "epoch": 0.47, + "learning_rate": 1.9153610019031173e-06, + "loss": 0.8555, + "step": 18488 + }, + { + "epoch": 0.47, + "learning_rate": 1.9153498604837843e-06, + "loss": 0.8535, + "step": 18489 + }, + { + "epoch": 0.47, + "learning_rate": 1.9153387183636094e-06, + "loss": 0.9277, + "step": 18490 + }, + { + "epoch": 0.47, + "learning_rate": 1.915327575542602e-06, + "loss": 0.7509, + "step": 18491 + }, + { + "epoch": 0.47, + "learning_rate": 1.9153164320207705e-06, + "loss": 1.1562, + "step": 18492 + }, + { + "epoch": 0.47, + "learning_rate": 1.915305287798123e-06, + "loss": 0.8711, + "step": 18493 + }, + { + "epoch": 0.47, + "learning_rate": 1.9152941428746685e-06, + "loss": 1.1064, + "step": 18494 + }, + { + "epoch": 0.47, + "learning_rate": 1.9152829972504153e-06, + "loss": 0.8057, + "step": 18495 + }, + { + "epoch": 0.47, + "learning_rate": 1.9152718509253723e-06, + "loss": 1.0684, + "step": 18496 + }, + { + "epoch": 0.47, + "learning_rate": 1.9152607038995473e-06, + "loss": 1.0449, + "step": 18497 + }, + { + "epoch": 0.47, + "learning_rate": 1.9152495561729494e-06, + "loss": 0.6912, + "step": 18498 + }, + { + "epoch": 0.47, + "learning_rate": 1.915238407745587e-06, + "loss": 0.8643, + "step": 18499 + }, + { + "epoch": 0.47, + "learning_rate": 1.915227258617469e-06, + "loss": 0.8027, + "step": 18500 + }, + { + "epoch": 0.47, + "learning_rate": 1.9152161087886032e-06, + "loss": 0.6064, + "step": 18501 + }, + { + "epoch": 0.47, + "learning_rate": 1.9152049582589984e-06, + "loss": 0.7278, + "step": 18502 + }, + { + "epoch": 0.47, + "learning_rate": 1.9151938070286636e-06, + "loss": 0.9258, + "step": 18503 + }, + { + "epoch": 0.47, + "learning_rate": 1.9151826550976068e-06, + "loss": 0.7715, + "step": 18504 + }, + { + "epoch": 0.47, + "learning_rate": 1.9151715024658364e-06, + "loss": 0.9922, + "step": 18505 + }, + { + "epoch": 0.47, + "learning_rate": 1.915160349133362e-06, + "loss": 0.7764, + "step": 18506 + }, + { + "epoch": 0.47, + "learning_rate": 1.915149195100191e-06, + "loss": 0.9902, + "step": 18507 + }, + { + "epoch": 0.47, + "learning_rate": 1.915138040366332e-06, + "loss": 0.9414, + "step": 18508 + }, + { + "epoch": 0.47, + "learning_rate": 1.9151268849317945e-06, + "loss": 0.8896, + "step": 18509 + }, + { + "epoch": 0.47, + "learning_rate": 1.915115728796586e-06, + "loss": 0.7656, + "step": 18510 + }, + { + "epoch": 0.47, + "learning_rate": 1.9151045719607156e-06, + "loss": 0.9033, + "step": 18511 + }, + { + "epoch": 0.47, + "learning_rate": 1.9150934144241917e-06, + "loss": 0.9229, + "step": 18512 + }, + { + "epoch": 0.47, + "learning_rate": 1.915082256187023e-06, + "loss": 0.7285, + "step": 18513 + }, + { + "epoch": 0.47, + "learning_rate": 1.9150710972492176e-06, + "loss": 0.8389, + "step": 18514 + }, + { + "epoch": 0.47, + "learning_rate": 1.9150599376107844e-06, + "loss": 1.0049, + "step": 18515 + }, + { + "epoch": 0.47, + "learning_rate": 1.915048777271732e-06, + "loss": 0.6914, + "step": 18516 + }, + { + "epoch": 0.47, + "learning_rate": 1.9150376162320688e-06, + "loss": 1.0254, + "step": 18517 + }, + { + "epoch": 0.47, + "learning_rate": 1.9150264544918033e-06, + "loss": 0.8604, + "step": 18518 + }, + { + "epoch": 0.47, + "learning_rate": 1.9150152920509442e-06, + "loss": 0.6895, + "step": 18519 + }, + { + "epoch": 0.47, + "learning_rate": 1.9150041289095e-06, + "loss": 0.9092, + "step": 18520 + }, + { + "epoch": 0.47, + "learning_rate": 1.9149929650674794e-06, + "loss": 1.082, + "step": 18521 + }, + { + "epoch": 0.47, + "learning_rate": 1.91498180052489e-06, + "loss": 0.8447, + "step": 18522 + }, + { + "epoch": 0.47, + "learning_rate": 1.914970635281742e-06, + "loss": 0.8994, + "step": 18523 + }, + { + "epoch": 0.47, + "learning_rate": 1.9149594693380425e-06, + "loss": 0.9082, + "step": 18524 + }, + { + "epoch": 0.47, + "learning_rate": 1.914948302693801e-06, + "loss": 0.8447, + "step": 18525 + }, + { + "epoch": 0.47, + "learning_rate": 1.9149371353490252e-06, + "loss": 1.207, + "step": 18526 + }, + { + "epoch": 0.47, + "learning_rate": 1.9149259673037244e-06, + "loss": 0.8975, + "step": 18527 + }, + { + "epoch": 0.47, + "learning_rate": 1.914914798557907e-06, + "loss": 0.9033, + "step": 18528 + }, + { + "epoch": 0.47, + "learning_rate": 1.914903629111581e-06, + "loss": 0.875, + "step": 18529 + }, + { + "epoch": 0.47, + "learning_rate": 1.9148924589647553e-06, + "loss": 1.0234, + "step": 18530 + }, + { + "epoch": 0.47, + "learning_rate": 1.914881288117439e-06, + "loss": 0.7871, + "step": 18531 + }, + { + "epoch": 0.47, + "learning_rate": 1.9148701165696403e-06, + "loss": 0.9736, + "step": 18532 + }, + { + "epoch": 0.48, + "learning_rate": 1.914858944321367e-06, + "loss": 0.8066, + "step": 18533 + }, + { + "epoch": 0.48, + "learning_rate": 1.9148477713726285e-06, + "loss": 0.916, + "step": 18534 + }, + { + "epoch": 0.48, + "learning_rate": 1.914836597723433e-06, + "loss": 0.8789, + "step": 18535 + }, + { + "epoch": 0.48, + "learning_rate": 1.9148254233737896e-06, + "loss": 0.9932, + "step": 18536 + }, + { + "epoch": 0.48, + "learning_rate": 1.9148142483237062e-06, + "loss": 0.8706, + "step": 18537 + }, + { + "epoch": 0.48, + "learning_rate": 1.9148030725731914e-06, + "loss": 0.6719, + "step": 18538 + }, + { + "epoch": 0.48, + "learning_rate": 1.914791896122254e-06, + "loss": 0.9873, + "step": 18539 + }, + { + "epoch": 0.48, + "learning_rate": 1.914780718970903e-06, + "loss": 0.9219, + "step": 18540 + }, + { + "epoch": 0.48, + "learning_rate": 1.914769541119146e-06, + "loss": 1.0244, + "step": 18541 + }, + { + "epoch": 0.48, + "learning_rate": 1.9147583625669922e-06, + "loss": 0.8994, + "step": 18542 + }, + { + "epoch": 0.48, + "learning_rate": 1.9147471833144498e-06, + "loss": 0.7495, + "step": 18543 + }, + { + "epoch": 0.48, + "learning_rate": 1.9147360033615275e-06, + "loss": 1.0391, + "step": 18544 + }, + { + "epoch": 0.48, + "learning_rate": 1.914724822708234e-06, + "loss": 0.7695, + "step": 18545 + }, + { + "epoch": 0.48, + "learning_rate": 1.914713641354578e-06, + "loss": 0.8564, + "step": 18546 + }, + { + "epoch": 0.48, + "learning_rate": 1.9147024593005677e-06, + "loss": 1.1162, + "step": 18547 + }, + { + "epoch": 0.48, + "learning_rate": 1.9146912765462115e-06, + "loss": 0.6855, + "step": 18548 + }, + { + "epoch": 0.48, + "learning_rate": 1.9146800930915187e-06, + "loss": 1.0352, + "step": 18549 + }, + { + "epoch": 0.48, + "learning_rate": 1.9146689089364973e-06, + "loss": 1.0146, + "step": 18550 + }, + { + "epoch": 0.48, + "learning_rate": 1.914657724081156e-06, + "loss": 0.9531, + "step": 18551 + }, + { + "epoch": 0.48, + "learning_rate": 1.914646538525503e-06, + "loss": 0.9512, + "step": 18552 + }, + { + "epoch": 0.48, + "learning_rate": 1.9146353522695472e-06, + "loss": 0.8047, + "step": 18553 + }, + { + "epoch": 0.48, + "learning_rate": 1.9146241653132973e-06, + "loss": 0.8857, + "step": 18554 + }, + { + "epoch": 0.48, + "learning_rate": 1.914612977656762e-06, + "loss": 0.9863, + "step": 18555 + }, + { + "epoch": 0.48, + "learning_rate": 1.9146017892999495e-06, + "loss": 0.7979, + "step": 18556 + }, + { + "epoch": 0.48, + "learning_rate": 1.914590600242868e-06, + "loss": 0.5752, + "step": 18557 + }, + { + "epoch": 0.48, + "learning_rate": 1.9145794104855272e-06, + "loss": 1.0088, + "step": 18558 + }, + { + "epoch": 0.48, + "learning_rate": 1.9145682200279345e-06, + "loss": 0.8232, + "step": 18559 + }, + { + "epoch": 0.48, + "learning_rate": 1.9145570288700996e-06, + "loss": 0.8198, + "step": 18560 + }, + { + "epoch": 0.48, + "learning_rate": 1.9145458370120298e-06, + "loss": 0.7754, + "step": 18561 + }, + { + "epoch": 0.48, + "learning_rate": 1.9145346444537343e-06, + "loss": 0.8975, + "step": 18562 + }, + { + "epoch": 0.48, + "learning_rate": 1.914523451195222e-06, + "loss": 0.9717, + "step": 18563 + }, + { + "epoch": 0.48, + "learning_rate": 1.9145122572365013e-06, + "loss": 0.7749, + "step": 18564 + }, + { + "epoch": 0.48, + "learning_rate": 1.9145010625775798e-06, + "loss": 1.1016, + "step": 18565 + }, + { + "epoch": 0.48, + "learning_rate": 1.914489867218468e-06, + "loss": 0.9209, + "step": 18566 + }, + { + "epoch": 0.48, + "learning_rate": 1.9144786711591726e-06, + "loss": 0.8975, + "step": 18567 + }, + { + "epoch": 0.48, + "learning_rate": 1.914467474399703e-06, + "loss": 0.832, + "step": 18568 + }, + { + "epoch": 0.48, + "learning_rate": 1.9144562769400675e-06, + "loss": 0.8486, + "step": 18569 + }, + { + "epoch": 0.48, + "learning_rate": 1.9144450787802754e-06, + "loss": 0.9272, + "step": 18570 + }, + { + "epoch": 0.48, + "learning_rate": 1.9144338799203348e-06, + "loss": 0.7231, + "step": 18571 + }, + { + "epoch": 0.48, + "learning_rate": 1.914422680360254e-06, + "loss": 0.7842, + "step": 18572 + }, + { + "epoch": 0.48, + "learning_rate": 1.9144114801000413e-06, + "loss": 0.7939, + "step": 18573 + }, + { + "epoch": 0.48, + "learning_rate": 1.9144002791397063e-06, + "loss": 0.9834, + "step": 18574 + }, + { + "epoch": 0.48, + "learning_rate": 1.914389077479257e-06, + "loss": 0.7974, + "step": 18575 + }, + { + "epoch": 0.48, + "learning_rate": 1.9143778751187025e-06, + "loss": 0.8904, + "step": 18576 + }, + { + "epoch": 0.48, + "learning_rate": 1.91436667205805e-06, + "loss": 0.7754, + "step": 18577 + }, + { + "epoch": 0.48, + "learning_rate": 1.9143554682973095e-06, + "loss": 1.0195, + "step": 18578 + }, + { + "epoch": 0.48, + "learning_rate": 1.914344263836489e-06, + "loss": 0.7041, + "step": 18579 + }, + { + "epoch": 0.48, + "learning_rate": 1.914333058675597e-06, + "loss": 0.9932, + "step": 18580 + }, + { + "epoch": 0.48, + "learning_rate": 1.9143218528146425e-06, + "loss": 0.7227, + "step": 18581 + }, + { + "epoch": 0.48, + "learning_rate": 1.9143106462536338e-06, + "loss": 0.7415, + "step": 18582 + }, + { + "epoch": 0.48, + "learning_rate": 1.914299438992579e-06, + "loss": 0.8887, + "step": 18583 + }, + { + "epoch": 0.48, + "learning_rate": 1.914288231031488e-06, + "loss": 0.8979, + "step": 18584 + }, + { + "epoch": 0.48, + "learning_rate": 1.9142770223703676e-06, + "loss": 0.9492, + "step": 18585 + }, + { + "epoch": 0.48, + "learning_rate": 1.9142658130092276e-06, + "loss": 0.7427, + "step": 18586 + }, + { + "epoch": 0.48, + "learning_rate": 1.9142546029480762e-06, + "loss": 0.6846, + "step": 18587 + }, + { + "epoch": 0.48, + "learning_rate": 1.914243392186923e-06, + "loss": 0.959, + "step": 18588 + }, + { + "epoch": 0.48, + "learning_rate": 1.9142321807257748e-06, + "loss": 0.9902, + "step": 18589 + }, + { + "epoch": 0.48, + "learning_rate": 1.914220968564641e-06, + "loss": 0.7, + "step": 18590 + }, + { + "epoch": 0.48, + "learning_rate": 1.9142097557035305e-06, + "loss": 0.6807, + "step": 18591 + }, + { + "epoch": 0.48, + "learning_rate": 1.9141985421424517e-06, + "loss": 0.7812, + "step": 18592 + }, + { + "epoch": 0.48, + "learning_rate": 1.9141873278814133e-06, + "loss": 0.7598, + "step": 18593 + }, + { + "epoch": 0.48, + "learning_rate": 1.914176112920423e-06, + "loss": 0.8145, + "step": 18594 + }, + { + "epoch": 0.48, + "learning_rate": 1.9141648972594905e-06, + "loss": 0.7495, + "step": 18595 + }, + { + "epoch": 0.48, + "learning_rate": 1.9141536808986244e-06, + "loss": 1.001, + "step": 18596 + }, + { + "epoch": 0.48, + "learning_rate": 1.914142463837832e-06, + "loss": 0.9111, + "step": 18597 + }, + { + "epoch": 0.48, + "learning_rate": 1.9141312460771233e-06, + "loss": 0.9189, + "step": 18598 + }, + { + "epoch": 0.48, + "learning_rate": 1.9141200276165065e-06, + "loss": 0.7695, + "step": 18599 + }, + { + "epoch": 0.48, + "learning_rate": 1.91410880845599e-06, + "loss": 0.8743, + "step": 18600 + }, + { + "epoch": 0.48, + "learning_rate": 1.914097588595582e-06, + "loss": 0.8838, + "step": 18601 + }, + { + "epoch": 0.48, + "learning_rate": 1.9140863680352917e-06, + "loss": 0.7871, + "step": 18602 + }, + { + "epoch": 0.48, + "learning_rate": 1.9140751467751273e-06, + "loss": 0.9043, + "step": 18603 + }, + { + "epoch": 0.48, + "learning_rate": 1.9140639248150977e-06, + "loss": 0.875, + "step": 18604 + }, + { + "epoch": 0.48, + "learning_rate": 1.9140527021552113e-06, + "loss": 0.8574, + "step": 18605 + }, + { + "epoch": 0.48, + "learning_rate": 1.914041478795477e-06, + "loss": 0.7837, + "step": 18606 + }, + { + "epoch": 0.48, + "learning_rate": 1.914030254735903e-06, + "loss": 0.8257, + "step": 18607 + }, + { + "epoch": 0.48, + "learning_rate": 1.9140190299764982e-06, + "loss": 0.8848, + "step": 18608 + }, + { + "epoch": 0.48, + "learning_rate": 1.9140078045172713e-06, + "loss": 0.8652, + "step": 18609 + }, + { + "epoch": 0.48, + "learning_rate": 1.9139965783582304e-06, + "loss": 0.9902, + "step": 18610 + }, + { + "epoch": 0.48, + "learning_rate": 1.9139853514993845e-06, + "loss": 0.9131, + "step": 18611 + }, + { + "epoch": 0.48, + "learning_rate": 1.9139741239407415e-06, + "loss": 0.6648, + "step": 18612 + }, + { + "epoch": 0.48, + "learning_rate": 1.913962895682311e-06, + "loss": 0.8496, + "step": 18613 + }, + { + "epoch": 0.48, + "learning_rate": 1.913951666724101e-06, + "loss": 0.7676, + "step": 18614 + }, + { + "epoch": 0.48, + "learning_rate": 1.9139404370661203e-06, + "loss": 0.7749, + "step": 18615 + }, + { + "epoch": 0.48, + "learning_rate": 1.9139292067083773e-06, + "loss": 0.7656, + "step": 18616 + }, + { + "epoch": 0.48, + "learning_rate": 1.913917975650881e-06, + "loss": 0.9136, + "step": 18617 + }, + { + "epoch": 0.48, + "learning_rate": 1.9139067438936397e-06, + "loss": 0.8237, + "step": 18618 + }, + { + "epoch": 0.48, + "learning_rate": 1.913895511436662e-06, + "loss": 0.793, + "step": 18619 + }, + { + "epoch": 0.48, + "learning_rate": 1.913884278279956e-06, + "loss": 0.8984, + "step": 18620 + }, + { + "epoch": 0.48, + "learning_rate": 1.9138730444235318e-06, + "loss": 0.7861, + "step": 18621 + }, + { + "epoch": 0.48, + "learning_rate": 1.913861809867396e-06, + "loss": 0.8564, + "step": 18622 + }, + { + "epoch": 0.48, + "learning_rate": 1.9138505746115587e-06, + "loss": 0.7432, + "step": 18623 + }, + { + "epoch": 0.48, + "learning_rate": 1.9138393386560283e-06, + "loss": 0.8535, + "step": 18624 + }, + { + "epoch": 0.48, + "learning_rate": 1.9138281020008126e-06, + "loss": 0.6357, + "step": 18625 + }, + { + "epoch": 0.48, + "learning_rate": 1.913816864645921e-06, + "loss": 0.8447, + "step": 18626 + }, + { + "epoch": 0.48, + "learning_rate": 1.913805626591362e-06, + "loss": 1.0283, + "step": 18627 + }, + { + "epoch": 0.48, + "learning_rate": 1.9137943878371437e-06, + "loss": 0.5125, + "step": 18628 + }, + { + "epoch": 0.48, + "learning_rate": 1.9137831483832757e-06, + "loss": 0.8936, + "step": 18629 + }, + { + "epoch": 0.48, + "learning_rate": 1.9137719082297653e-06, + "loss": 1.0381, + "step": 18630 + }, + { + "epoch": 0.48, + "learning_rate": 1.913760667376622e-06, + "loss": 0.8711, + "step": 18631 + }, + { + "epoch": 0.48, + "learning_rate": 1.9137494258238543e-06, + "loss": 0.9609, + "step": 18632 + }, + { + "epoch": 0.48, + "learning_rate": 1.9137381835714704e-06, + "loss": 0.9023, + "step": 18633 + }, + { + "epoch": 0.48, + "learning_rate": 1.9137269406194795e-06, + "loss": 0.6729, + "step": 18634 + }, + { + "epoch": 0.48, + "learning_rate": 1.91371569696789e-06, + "loss": 0.7881, + "step": 18635 + }, + { + "epoch": 0.48, + "learning_rate": 1.91370445261671e-06, + "loss": 0.7783, + "step": 18636 + }, + { + "epoch": 0.48, + "learning_rate": 1.9136932075659485e-06, + "loss": 0.8281, + "step": 18637 + }, + { + "epoch": 0.48, + "learning_rate": 1.9136819618156145e-06, + "loss": 0.9277, + "step": 18638 + }, + { + "epoch": 0.48, + "learning_rate": 1.913670715365716e-06, + "loss": 0.9814, + "step": 18639 + }, + { + "epoch": 0.48, + "learning_rate": 1.913659468216262e-06, + "loss": 0.6953, + "step": 18640 + }, + { + "epoch": 0.48, + "learning_rate": 1.9136482203672606e-06, + "loss": 0.7012, + "step": 18641 + }, + { + "epoch": 0.48, + "learning_rate": 1.913636971818721e-06, + "loss": 0.9189, + "step": 18642 + }, + { + "epoch": 0.48, + "learning_rate": 1.9136257225706513e-06, + "loss": 0.8896, + "step": 18643 + }, + { + "epoch": 0.48, + "learning_rate": 1.913614472623061e-06, + "loss": 0.8086, + "step": 18644 + }, + { + "epoch": 0.48, + "learning_rate": 1.9136032219759576e-06, + "loss": 1.0244, + "step": 18645 + }, + { + "epoch": 0.48, + "learning_rate": 1.9135919706293502e-06, + "loss": 0.8672, + "step": 18646 + }, + { + "epoch": 0.48, + "learning_rate": 1.913580718583248e-06, + "loss": 0.8477, + "step": 18647 + }, + { + "epoch": 0.48, + "learning_rate": 1.9135694658376583e-06, + "loss": 0.8135, + "step": 18648 + }, + { + "epoch": 0.48, + "learning_rate": 1.913558212392591e-06, + "loss": 1.0752, + "step": 18649 + }, + { + "epoch": 0.48, + "learning_rate": 1.9135469582480543e-06, + "loss": 0.834, + "step": 18650 + }, + { + "epoch": 0.48, + "learning_rate": 1.9135357034040563e-06, + "loss": 0.8809, + "step": 18651 + }, + { + "epoch": 0.48, + "learning_rate": 1.913524447860606e-06, + "loss": 0.8496, + "step": 18652 + }, + { + "epoch": 0.48, + "learning_rate": 1.9135131916177124e-06, + "loss": 0.7046, + "step": 18653 + }, + { + "epoch": 0.48, + "learning_rate": 1.9135019346753834e-06, + "loss": 0.7627, + "step": 18654 + }, + { + "epoch": 0.48, + "learning_rate": 1.913490677033628e-06, + "loss": 0.7395, + "step": 18655 + }, + { + "epoch": 0.48, + "learning_rate": 1.913479418692455e-06, + "loss": 0.8076, + "step": 18656 + }, + { + "epoch": 0.48, + "learning_rate": 1.9134681596518725e-06, + "loss": 0.791, + "step": 18657 + }, + { + "epoch": 0.48, + "learning_rate": 1.91345689991189e-06, + "loss": 0.7627, + "step": 18658 + }, + { + "epoch": 0.48, + "learning_rate": 1.913445639472515e-06, + "loss": 0.7864, + "step": 18659 + }, + { + "epoch": 0.48, + "learning_rate": 1.9134343783337566e-06, + "loss": 0.7646, + "step": 18660 + }, + { + "epoch": 0.48, + "learning_rate": 1.913423116495624e-06, + "loss": 1.126, + "step": 18661 + }, + { + "epoch": 0.48, + "learning_rate": 1.913411853958125e-06, + "loss": 0.9014, + "step": 18662 + }, + { + "epoch": 0.48, + "learning_rate": 1.913400590721269e-06, + "loss": 0.9336, + "step": 18663 + }, + { + "epoch": 0.48, + "learning_rate": 1.913389326785064e-06, + "loss": 0.7666, + "step": 18664 + }, + { + "epoch": 0.48, + "learning_rate": 1.9133780621495183e-06, + "loss": 0.9248, + "step": 18665 + }, + { + "epoch": 0.48, + "learning_rate": 1.913366796814641e-06, + "loss": 0.7397, + "step": 18666 + }, + { + "epoch": 0.48, + "learning_rate": 1.9133555307804413e-06, + "loss": 0.8691, + "step": 18667 + }, + { + "epoch": 0.48, + "learning_rate": 1.913344264046927e-06, + "loss": 0.9404, + "step": 18668 + }, + { + "epoch": 0.48, + "learning_rate": 1.913332996614107e-06, + "loss": 1.0146, + "step": 18669 + }, + { + "epoch": 0.48, + "learning_rate": 1.91332172848199e-06, + "loss": 0.8506, + "step": 18670 + }, + { + "epoch": 0.48, + "learning_rate": 1.9133104596505843e-06, + "loss": 0.7466, + "step": 18671 + }, + { + "epoch": 0.48, + "learning_rate": 1.913299190119899e-06, + "loss": 1.0088, + "step": 18672 + }, + { + "epoch": 0.48, + "learning_rate": 1.9132879198899427e-06, + "loss": 0.8994, + "step": 18673 + }, + { + "epoch": 0.48, + "learning_rate": 1.9132766489607234e-06, + "loss": 0.8438, + "step": 18674 + }, + { + "epoch": 0.48, + "learning_rate": 1.9132653773322504e-06, + "loss": 1.0957, + "step": 18675 + }, + { + "epoch": 0.48, + "learning_rate": 1.913254105004532e-06, + "loss": 1.0566, + "step": 18676 + }, + { + "epoch": 0.48, + "learning_rate": 1.913242831977577e-06, + "loss": 0.8738, + "step": 18677 + }, + { + "epoch": 0.48, + "learning_rate": 1.913231558251394e-06, + "loss": 0.665, + "step": 18678 + }, + { + "epoch": 0.48, + "learning_rate": 1.9132202838259915e-06, + "loss": 0.7197, + "step": 18679 + }, + { + "epoch": 0.48, + "learning_rate": 1.9132090087013782e-06, + "loss": 0.7546, + "step": 18680 + }, + { + "epoch": 0.48, + "learning_rate": 1.913197732877563e-06, + "loss": 0.7471, + "step": 18681 + }, + { + "epoch": 0.48, + "learning_rate": 1.9131864563545538e-06, + "loss": 1.1338, + "step": 18682 + }, + { + "epoch": 0.48, + "learning_rate": 1.91317517913236e-06, + "loss": 0.79, + "step": 18683 + }, + { + "epoch": 0.48, + "learning_rate": 1.91316390121099e-06, + "loss": 0.999, + "step": 18684 + }, + { + "epoch": 0.48, + "learning_rate": 1.9131526225904523e-06, + "loss": 0.7129, + "step": 18685 + }, + { + "epoch": 0.48, + "learning_rate": 1.913141343270756e-06, + "loss": 0.9863, + "step": 18686 + }, + { + "epoch": 0.48, + "learning_rate": 1.9131300632519087e-06, + "loss": 0.8389, + "step": 18687 + }, + { + "epoch": 0.48, + "learning_rate": 1.91311878253392e-06, + "loss": 0.668, + "step": 18688 + }, + { + "epoch": 0.48, + "learning_rate": 1.913107501116798e-06, + "loss": 0.7104, + "step": 18689 + }, + { + "epoch": 0.48, + "learning_rate": 1.913096219000552e-06, + "loss": 0.8135, + "step": 18690 + }, + { + "epoch": 0.48, + "learning_rate": 1.91308493618519e-06, + "loss": 0.9902, + "step": 18691 + }, + { + "epoch": 0.48, + "learning_rate": 1.913073652670721e-06, + "loss": 0.8857, + "step": 18692 + }, + { + "epoch": 0.48, + "learning_rate": 1.9130623684571532e-06, + "loss": 1.0986, + "step": 18693 + }, + { + "epoch": 0.48, + "learning_rate": 1.913051083544496e-06, + "loss": 0.998, + "step": 18694 + }, + { + "epoch": 0.48, + "learning_rate": 1.913039797932757e-06, + "loss": 0.7339, + "step": 18695 + }, + { + "epoch": 0.48, + "learning_rate": 1.9130285116219457e-06, + "loss": 0.9756, + "step": 18696 + }, + { + "epoch": 0.48, + "learning_rate": 1.9130172246120706e-06, + "loss": 1.0439, + "step": 18697 + }, + { + "epoch": 0.48, + "learning_rate": 1.91300593690314e-06, + "loss": 0.6514, + "step": 18698 + }, + { + "epoch": 0.48, + "learning_rate": 1.9129946484951625e-06, + "loss": 0.8496, + "step": 18699 + }, + { + "epoch": 0.48, + "learning_rate": 1.912983359388148e-06, + "loss": 0.8237, + "step": 18700 + }, + { + "epoch": 0.48, + "learning_rate": 1.912972069582103e-06, + "loss": 0.8955, + "step": 18701 + }, + { + "epoch": 0.48, + "learning_rate": 1.9129607790770375e-06, + "loss": 1.0093, + "step": 18702 + }, + { + "epoch": 0.48, + "learning_rate": 1.9129494878729598e-06, + "loss": 0.9248, + "step": 18703 + }, + { + "epoch": 0.48, + "learning_rate": 1.912938195969879e-06, + "loss": 1.0205, + "step": 18704 + }, + { + "epoch": 0.48, + "learning_rate": 1.9129269033678035e-06, + "loss": 0.9131, + "step": 18705 + }, + { + "epoch": 0.48, + "learning_rate": 1.9129156100667416e-06, + "loss": 1.0381, + "step": 18706 + }, + { + "epoch": 0.48, + "learning_rate": 1.912904316066702e-06, + "loss": 0.8838, + "step": 18707 + }, + { + "epoch": 0.48, + "learning_rate": 1.912893021367694e-06, + "loss": 0.8516, + "step": 18708 + }, + { + "epoch": 0.48, + "learning_rate": 1.9128817259697257e-06, + "loss": 0.8701, + "step": 18709 + }, + { + "epoch": 0.48, + "learning_rate": 1.9128704298728057e-06, + "loss": 0.875, + "step": 18710 + }, + { + "epoch": 0.48, + "learning_rate": 1.9128591330769426e-06, + "loss": 0.9062, + "step": 18711 + }, + { + "epoch": 0.48, + "learning_rate": 1.9128478355821455e-06, + "loss": 0.8271, + "step": 18712 + }, + { + "epoch": 0.48, + "learning_rate": 1.9128365373884226e-06, + "loss": 1.0703, + "step": 18713 + }, + { + "epoch": 0.48, + "learning_rate": 1.9128252384957828e-06, + "loss": 0.5413, + "step": 18714 + }, + { + "epoch": 0.48, + "learning_rate": 1.912813938904235e-06, + "loss": 1.0029, + "step": 18715 + }, + { + "epoch": 0.48, + "learning_rate": 1.9128026386137874e-06, + "loss": 0.8467, + "step": 18716 + }, + { + "epoch": 0.48, + "learning_rate": 1.9127913376244483e-06, + "loss": 0.7163, + "step": 18717 + }, + { + "epoch": 0.48, + "learning_rate": 1.9127800359362274e-06, + "loss": 0.915, + "step": 18718 + }, + { + "epoch": 0.48, + "learning_rate": 1.912768733549133e-06, + "loss": 0.7114, + "step": 18719 + }, + { + "epoch": 0.48, + "learning_rate": 1.9127574304631725e-06, + "loss": 0.8516, + "step": 18720 + }, + { + "epoch": 0.48, + "learning_rate": 1.9127461266783562e-06, + "loss": 0.7788, + "step": 18721 + }, + { + "epoch": 0.48, + "learning_rate": 1.9127348221946925e-06, + "loss": 0.8379, + "step": 18722 + }, + { + "epoch": 0.48, + "learning_rate": 1.9127235170121896e-06, + "loss": 1.0762, + "step": 18723 + }, + { + "epoch": 0.48, + "learning_rate": 1.912712211130856e-06, + "loss": 0.7607, + "step": 18724 + }, + { + "epoch": 0.48, + "learning_rate": 1.912700904550701e-06, + "loss": 0.8584, + "step": 18725 + }, + { + "epoch": 0.48, + "learning_rate": 1.912689597271732e-06, + "loss": 0.9453, + "step": 18726 + }, + { + "epoch": 0.48, + "learning_rate": 1.9126782892939596e-06, + "loss": 1.0312, + "step": 18727 + }, + { + "epoch": 0.48, + "learning_rate": 1.912666980617391e-06, + "loss": 0.8018, + "step": 18728 + }, + { + "epoch": 0.48, + "learning_rate": 1.912655671242035e-06, + "loss": 0.9707, + "step": 18729 + }, + { + "epoch": 0.48, + "learning_rate": 1.912644361167901e-06, + "loss": 0.7178, + "step": 18730 + }, + { + "epoch": 0.48, + "learning_rate": 1.912633050394997e-06, + "loss": 1.0156, + "step": 18731 + }, + { + "epoch": 0.48, + "learning_rate": 1.9126217389233315e-06, + "loss": 1.0029, + "step": 18732 + }, + { + "epoch": 0.48, + "learning_rate": 1.9126104267529136e-06, + "loss": 0.8115, + "step": 18733 + }, + { + "epoch": 0.48, + "learning_rate": 1.9125991138837524e-06, + "loss": 0.8867, + "step": 18734 + }, + { + "epoch": 0.48, + "learning_rate": 1.9125878003158555e-06, + "loss": 1.0439, + "step": 18735 + }, + { + "epoch": 0.48, + "learning_rate": 1.9125764860492323e-06, + "loss": 1.0547, + "step": 18736 + }, + { + "epoch": 0.48, + "learning_rate": 1.912565171083891e-06, + "loss": 0.957, + "step": 18737 + }, + { + "epoch": 0.48, + "learning_rate": 1.9125538554198405e-06, + "loss": 0.9844, + "step": 18738 + }, + { + "epoch": 0.48, + "learning_rate": 1.9125425390570898e-06, + "loss": 1.3428, + "step": 18739 + }, + { + "epoch": 0.48, + "learning_rate": 1.912531221995647e-06, + "loss": 0.9883, + "step": 18740 + }, + { + "epoch": 0.48, + "learning_rate": 1.912519904235521e-06, + "loss": 0.8223, + "step": 18741 + }, + { + "epoch": 0.48, + "learning_rate": 1.9125085857767208e-06, + "loss": 0.7373, + "step": 18742 + }, + { + "epoch": 0.48, + "learning_rate": 1.9124972666192543e-06, + "loss": 0.9092, + "step": 18743 + }, + { + "epoch": 0.48, + "learning_rate": 1.912485946763131e-06, + "loss": 0.7686, + "step": 18744 + }, + { + "epoch": 0.48, + "learning_rate": 1.912474626208359e-06, + "loss": 0.9746, + "step": 18745 + }, + { + "epoch": 0.48, + "learning_rate": 1.912463304954947e-06, + "loss": 0.8916, + "step": 18746 + }, + { + "epoch": 0.48, + "learning_rate": 1.912451983002904e-06, + "loss": 0.7417, + "step": 18747 + }, + { + "epoch": 0.48, + "learning_rate": 1.9124406603522384e-06, + "loss": 0.7856, + "step": 18748 + }, + { + "epoch": 0.48, + "learning_rate": 1.912429337002959e-06, + "loss": 0.7988, + "step": 18749 + }, + { + "epoch": 0.48, + "learning_rate": 1.912418012955074e-06, + "loss": 0.8496, + "step": 18750 + }, + { + "epoch": 0.48, + "learning_rate": 1.912406688208593e-06, + "loss": 0.7546, + "step": 18751 + }, + { + "epoch": 0.48, + "learning_rate": 1.912395362763524e-06, + "loss": 0.8789, + "step": 18752 + }, + { + "epoch": 0.48, + "learning_rate": 1.912384036619876e-06, + "loss": 0.9736, + "step": 18753 + }, + { + "epoch": 0.48, + "learning_rate": 1.912372709777657e-06, + "loss": 0.9551, + "step": 18754 + }, + { + "epoch": 0.48, + "learning_rate": 1.9123613822368766e-06, + "loss": 0.7705, + "step": 18755 + }, + { + "epoch": 0.48, + "learning_rate": 1.9123500539975427e-06, + "loss": 1.1191, + "step": 18756 + }, + { + "epoch": 0.48, + "learning_rate": 1.9123387250596642e-06, + "loss": 0.5759, + "step": 18757 + }, + { + "epoch": 0.48, + "learning_rate": 1.9123273954232503e-06, + "loss": 0.9072, + "step": 18758 + }, + { + "epoch": 0.48, + "learning_rate": 1.912316065088309e-06, + "loss": 0.8232, + "step": 18759 + }, + { + "epoch": 0.48, + "learning_rate": 1.9123047340548495e-06, + "loss": 1.1133, + "step": 18760 + }, + { + "epoch": 0.48, + "learning_rate": 1.9122934023228804e-06, + "loss": 1.0049, + "step": 18761 + }, + { + "epoch": 0.48, + "learning_rate": 1.9122820698924097e-06, + "loss": 0.9058, + "step": 18762 + }, + { + "epoch": 0.48, + "learning_rate": 1.912270736763447e-06, + "loss": 0.8516, + "step": 18763 + }, + { + "epoch": 0.48, + "learning_rate": 1.912259402936e-06, + "loss": 0.7358, + "step": 18764 + }, + { + "epoch": 0.48, + "learning_rate": 1.9122480684100783e-06, + "loss": 0.918, + "step": 18765 + }, + { + "epoch": 0.48, + "learning_rate": 1.91223673318569e-06, + "loss": 0.8389, + "step": 18766 + }, + { + "epoch": 0.48, + "learning_rate": 1.9122253972628443e-06, + "loss": 0.8081, + "step": 18767 + }, + { + "epoch": 0.48, + "learning_rate": 1.9122140606415494e-06, + "loss": 0.7456, + "step": 18768 + }, + { + "epoch": 0.48, + "learning_rate": 1.912202723321814e-06, + "loss": 0.9414, + "step": 18769 + }, + { + "epoch": 0.48, + "learning_rate": 1.912191385303647e-06, + "loss": 0.5496, + "step": 18770 + }, + { + "epoch": 0.48, + "learning_rate": 1.912180046587057e-06, + "loss": 1.1289, + "step": 18771 + }, + { + "epoch": 0.48, + "learning_rate": 1.912168707172053e-06, + "loss": 0.8789, + "step": 18772 + }, + { + "epoch": 0.48, + "learning_rate": 1.9121573670586428e-06, + "loss": 0.9727, + "step": 18773 + }, + { + "epoch": 0.48, + "learning_rate": 1.912146026246836e-06, + "loss": 0.8604, + "step": 18774 + }, + { + "epoch": 0.48, + "learning_rate": 1.9121346847366407e-06, + "loss": 0.9111, + "step": 18775 + }, + { + "epoch": 0.48, + "learning_rate": 1.9121233425280662e-06, + "loss": 0.9648, + "step": 18776 + }, + { + "epoch": 0.48, + "learning_rate": 1.9121119996211202e-06, + "loss": 0.6445, + "step": 18777 + }, + { + "epoch": 0.48, + "learning_rate": 1.9121006560158125e-06, + "loss": 0.8794, + "step": 18778 + }, + { + "epoch": 0.48, + "learning_rate": 1.912089311712151e-06, + "loss": 0.9561, + "step": 18779 + }, + { + "epoch": 0.48, + "learning_rate": 1.912077966710145e-06, + "loss": 0.9268, + "step": 18780 + }, + { + "epoch": 0.48, + "learning_rate": 1.9120666210098025e-06, + "loss": 0.8262, + "step": 18781 + }, + { + "epoch": 0.48, + "learning_rate": 1.9120552746111326e-06, + "loss": 0.877, + "step": 18782 + }, + { + "epoch": 0.48, + "learning_rate": 1.912043927514144e-06, + "loss": 0.7747, + "step": 18783 + }, + { + "epoch": 0.48, + "learning_rate": 1.9120325797188453e-06, + "loss": 0.8906, + "step": 18784 + }, + { + "epoch": 0.48, + "learning_rate": 1.9120212312252452e-06, + "loss": 0.9443, + "step": 18785 + }, + { + "epoch": 0.48, + "learning_rate": 1.912009882033352e-06, + "loss": 0.9272, + "step": 18786 + }, + { + "epoch": 0.48, + "learning_rate": 1.9119985321431755e-06, + "loss": 0.793, + "step": 18787 + }, + { + "epoch": 0.48, + "learning_rate": 1.911987181554723e-06, + "loss": 1.1172, + "step": 18788 + }, + { + "epoch": 0.48, + "learning_rate": 1.911975830268004e-06, + "loss": 0.7695, + "step": 18789 + }, + { + "epoch": 0.48, + "learning_rate": 1.911964478283027e-06, + "loss": 0.8145, + "step": 18790 + }, + { + "epoch": 0.48, + "learning_rate": 1.911953125599801e-06, + "loss": 1.0713, + "step": 18791 + }, + { + "epoch": 0.48, + "learning_rate": 1.9119417722183344e-06, + "loss": 0.5718, + "step": 18792 + }, + { + "epoch": 0.48, + "learning_rate": 1.9119304181386354e-06, + "loss": 0.8096, + "step": 18793 + }, + { + "epoch": 0.48, + "learning_rate": 1.911919063360714e-06, + "loss": 0.8774, + "step": 18794 + }, + { + "epoch": 0.48, + "learning_rate": 1.9119077078845776e-06, + "loss": 0.7681, + "step": 18795 + }, + { + "epoch": 0.48, + "learning_rate": 1.9118963517102357e-06, + "loss": 1.0273, + "step": 18796 + }, + { + "epoch": 0.48, + "learning_rate": 1.9118849948376964e-06, + "loss": 0.8535, + "step": 18797 + }, + { + "epoch": 0.48, + "learning_rate": 1.911873637266969e-06, + "loss": 1.0234, + "step": 18798 + }, + { + "epoch": 0.48, + "learning_rate": 1.9118622789980615e-06, + "loss": 1.0557, + "step": 18799 + }, + { + "epoch": 0.48, + "learning_rate": 1.9118509200309833e-06, + "loss": 0.9375, + "step": 18800 + }, + { + "epoch": 0.48, + "learning_rate": 1.911839560365742e-06, + "loss": 0.9307, + "step": 18801 + }, + { + "epoch": 0.48, + "learning_rate": 1.9118282000023483e-06, + "loss": 0.8008, + "step": 18802 + }, + { + "epoch": 0.48, + "learning_rate": 1.9118168389408088e-06, + "loss": 0.8057, + "step": 18803 + }, + { + "epoch": 0.48, + "learning_rate": 1.9118054771811333e-06, + "loss": 0.5098, + "step": 18804 + }, + { + "epoch": 0.48, + "learning_rate": 1.9117941147233307e-06, + "loss": 0.7627, + "step": 18805 + }, + { + "epoch": 0.48, + "learning_rate": 1.9117827515674086e-06, + "loss": 1.0361, + "step": 18806 + }, + { + "epoch": 0.48, + "learning_rate": 1.9117713877133768e-06, + "loss": 0.917, + "step": 18807 + }, + { + "epoch": 0.48, + "learning_rate": 1.9117600231612433e-06, + "loss": 0.9111, + "step": 18808 + }, + { + "epoch": 0.48, + "learning_rate": 1.9117486579110174e-06, + "loss": 0.7056, + "step": 18809 + }, + { + "epoch": 0.48, + "learning_rate": 1.9117372919627073e-06, + "loss": 0.9551, + "step": 18810 + }, + { + "epoch": 0.48, + "learning_rate": 1.9117259253163217e-06, + "loss": 0.9336, + "step": 18811 + }, + { + "epoch": 0.48, + "learning_rate": 1.91171455797187e-06, + "loss": 0.7031, + "step": 18812 + }, + { + "epoch": 0.48, + "learning_rate": 1.9117031899293598e-06, + "loss": 0.8386, + "step": 18813 + }, + { + "epoch": 0.48, + "learning_rate": 1.911691821188801e-06, + "loss": 0.8325, + "step": 18814 + }, + { + "epoch": 0.48, + "learning_rate": 1.911680451750201e-06, + "loss": 1.0732, + "step": 18815 + }, + { + "epoch": 0.48, + "learning_rate": 1.9116690816135693e-06, + "loss": 1.041, + "step": 18816 + }, + { + "epoch": 0.48, + "learning_rate": 1.911657710778915e-06, + "loss": 0.749, + "step": 18817 + }, + { + "epoch": 0.48, + "learning_rate": 1.9116463392462457e-06, + "loss": 0.8298, + "step": 18818 + }, + { + "epoch": 0.48, + "learning_rate": 1.9116349670155714e-06, + "loss": 0.7749, + "step": 18819 + }, + { + "epoch": 0.48, + "learning_rate": 1.9116235940868995e-06, + "loss": 0.7607, + "step": 18820 + }, + { + "epoch": 0.48, + "learning_rate": 1.91161222046024e-06, + "loss": 0.7573, + "step": 18821 + }, + { + "epoch": 0.48, + "learning_rate": 1.9116008461356e-06, + "loss": 0.9014, + "step": 18822 + }, + { + "epoch": 0.48, + "learning_rate": 1.91158947111299e-06, + "loss": 1.001, + "step": 18823 + }, + { + "epoch": 0.48, + "learning_rate": 1.9115780953924175e-06, + "loss": 0.9072, + "step": 18824 + }, + { + "epoch": 0.48, + "learning_rate": 1.9115667189738916e-06, + "loss": 0.9102, + "step": 18825 + }, + { + "epoch": 0.48, + "learning_rate": 1.911555341857421e-06, + "loss": 0.7891, + "step": 18826 + }, + { + "epoch": 0.48, + "learning_rate": 1.9115439640430145e-06, + "loss": 0.9365, + "step": 18827 + }, + { + "epoch": 0.48, + "learning_rate": 1.9115325855306807e-06, + "loss": 1.1006, + "step": 18828 + }, + { + "epoch": 0.48, + "learning_rate": 1.911521206320428e-06, + "loss": 0.916, + "step": 18829 + }, + { + "epoch": 0.48, + "learning_rate": 1.911509826412266e-06, + "loss": 0.9575, + "step": 18830 + }, + { + "epoch": 0.48, + "learning_rate": 1.911498445806202e-06, + "loss": 0.9932, + "step": 18831 + }, + { + "epoch": 0.48, + "learning_rate": 1.9114870645022464e-06, + "loss": 0.8877, + "step": 18832 + }, + { + "epoch": 0.48, + "learning_rate": 1.9114756825004067e-06, + "loss": 0.918, + "step": 18833 + }, + { + "epoch": 0.48, + "learning_rate": 1.911464299800692e-06, + "loss": 0.8291, + "step": 18834 + }, + { + "epoch": 0.48, + "learning_rate": 1.9114529164031107e-06, + "loss": 0.8564, + "step": 18835 + }, + { + "epoch": 0.48, + "learning_rate": 1.911441532307672e-06, + "loss": 0.7432, + "step": 18836 + }, + { + "epoch": 0.48, + "learning_rate": 1.9114301475143847e-06, + "loss": 0.9639, + "step": 18837 + }, + { + "epoch": 0.48, + "learning_rate": 1.911418762023257e-06, + "loss": 0.8867, + "step": 18838 + }, + { + "epoch": 0.48, + "learning_rate": 1.911407375834298e-06, + "loss": 0.834, + "step": 18839 + }, + { + "epoch": 0.48, + "learning_rate": 1.911395988947516e-06, + "loss": 0.8555, + "step": 18840 + }, + { + "epoch": 0.48, + "learning_rate": 1.91138460136292e-06, + "loss": 0.8242, + "step": 18841 + }, + { + "epoch": 0.48, + "learning_rate": 1.911373213080519e-06, + "loss": 1.0586, + "step": 18842 + }, + { + "epoch": 0.48, + "learning_rate": 1.9113618241003213e-06, + "loss": 0.8223, + "step": 18843 + }, + { + "epoch": 0.48, + "learning_rate": 1.9113504344223357e-06, + "loss": 0.9395, + "step": 18844 + }, + { + "epoch": 0.48, + "learning_rate": 1.9113390440465716e-06, + "loss": 0.8342, + "step": 18845 + }, + { + "epoch": 0.48, + "learning_rate": 1.9113276529730365e-06, + "loss": 0.8857, + "step": 18846 + }, + { + "epoch": 0.48, + "learning_rate": 1.9113162612017394e-06, + "loss": 0.9277, + "step": 18847 + }, + { + "epoch": 0.48, + "learning_rate": 1.91130486873269e-06, + "loss": 0.6919, + "step": 18848 + }, + { + "epoch": 0.48, + "learning_rate": 1.911293475565896e-06, + "loss": 0.7686, + "step": 18849 + }, + { + "epoch": 0.48, + "learning_rate": 1.911282081701367e-06, + "loss": 0.9395, + "step": 18850 + }, + { + "epoch": 0.48, + "learning_rate": 1.9112706871391106e-06, + "loss": 0.8633, + "step": 18851 + }, + { + "epoch": 0.48, + "learning_rate": 1.911259291879136e-06, + "loss": 0.9033, + "step": 18852 + }, + { + "epoch": 0.48, + "learning_rate": 1.9112478959214526e-06, + "loss": 0.9531, + "step": 18853 + }, + { + "epoch": 0.48, + "learning_rate": 1.9112364992660687e-06, + "loss": 0.6416, + "step": 18854 + }, + { + "epoch": 0.48, + "learning_rate": 1.911225101912992e-06, + "loss": 0.9668, + "step": 18855 + }, + { + "epoch": 0.48, + "learning_rate": 1.911213703862233e-06, + "loss": 0.9297, + "step": 18856 + }, + { + "epoch": 0.48, + "learning_rate": 1.9112023051137995e-06, + "loss": 0.7705, + "step": 18857 + }, + { + "epoch": 0.48, + "learning_rate": 1.9111909056677e-06, + "loss": 0.8413, + "step": 18858 + }, + { + "epoch": 0.48, + "learning_rate": 1.9111795055239438e-06, + "loss": 0.8711, + "step": 18859 + }, + { + "epoch": 0.48, + "learning_rate": 1.911168104682539e-06, + "loss": 0.9141, + "step": 18860 + }, + { + "epoch": 0.48, + "learning_rate": 1.9111567031434948e-06, + "loss": 0.8164, + "step": 18861 + }, + { + "epoch": 0.48, + "learning_rate": 1.9111453009068197e-06, + "loss": 1.0781, + "step": 18862 + }, + { + "epoch": 0.48, + "learning_rate": 1.911133897972523e-06, + "loss": 0.918, + "step": 18863 + }, + { + "epoch": 0.48, + "learning_rate": 1.9111224943406126e-06, + "loss": 0.7939, + "step": 18864 + }, + { + "epoch": 0.48, + "learning_rate": 1.9111110900110974e-06, + "loss": 1.0547, + "step": 18865 + }, + { + "epoch": 0.48, + "learning_rate": 1.9110996849839867e-06, + "loss": 1.0264, + "step": 18866 + }, + { + "epoch": 0.48, + "learning_rate": 1.911088279259289e-06, + "loss": 0.8594, + "step": 18867 + }, + { + "epoch": 0.48, + "learning_rate": 1.9110768728370123e-06, + "loss": 0.7861, + "step": 18868 + }, + { + "epoch": 0.48, + "learning_rate": 1.9110654657171665e-06, + "loss": 0.9336, + "step": 18869 + }, + { + "epoch": 0.48, + "learning_rate": 1.91105405789976e-06, + "loss": 0.9473, + "step": 18870 + }, + { + "epoch": 0.48, + "learning_rate": 1.9110426493848003e-06, + "loss": 0.9189, + "step": 18871 + }, + { + "epoch": 0.48, + "learning_rate": 1.9110312401722978e-06, + "loss": 1.0234, + "step": 18872 + }, + { + "epoch": 0.48, + "learning_rate": 1.91101983026226e-06, + "loss": 1.0791, + "step": 18873 + }, + { + "epoch": 0.48, + "learning_rate": 1.911008419654697e-06, + "loss": 0.9053, + "step": 18874 + }, + { + "epoch": 0.48, + "learning_rate": 1.9109970083496164e-06, + "loss": 0.9229, + "step": 18875 + }, + { + "epoch": 0.48, + "learning_rate": 1.9109855963470275e-06, + "loss": 0.8223, + "step": 18876 + }, + { + "epoch": 0.48, + "learning_rate": 1.9109741836469384e-06, + "loss": 0.7705, + "step": 18877 + }, + { + "epoch": 0.48, + "learning_rate": 1.9109627702493583e-06, + "loss": 0.6611, + "step": 18878 + }, + { + "epoch": 0.48, + "learning_rate": 1.910951356154296e-06, + "loss": 0.6152, + "step": 18879 + }, + { + "epoch": 0.48, + "learning_rate": 1.9109399413617603e-06, + "loss": 0.8491, + "step": 18880 + }, + { + "epoch": 0.48, + "learning_rate": 1.9109285258717598e-06, + "loss": 0.999, + "step": 18881 + }, + { + "epoch": 0.48, + "learning_rate": 1.910917109684303e-06, + "loss": 0.8662, + "step": 18882 + }, + { + "epoch": 0.48, + "learning_rate": 1.910905692799399e-06, + "loss": 0.9033, + "step": 18883 + }, + { + "epoch": 0.48, + "learning_rate": 1.9108942752170563e-06, + "loss": 0.834, + "step": 18884 + }, + { + "epoch": 0.48, + "learning_rate": 1.9108828569372837e-06, + "loss": 0.9609, + "step": 18885 + }, + { + "epoch": 0.48, + "learning_rate": 1.91087143796009e-06, + "loss": 0.9131, + "step": 18886 + }, + { + "epoch": 0.48, + "learning_rate": 1.910860018285484e-06, + "loss": 0.9111, + "step": 18887 + }, + { + "epoch": 0.48, + "learning_rate": 1.910848597913474e-06, + "loss": 0.7954, + "step": 18888 + }, + { + "epoch": 0.48, + "learning_rate": 1.9108371768440698e-06, + "loss": 0.8018, + "step": 18889 + }, + { + "epoch": 0.48, + "learning_rate": 1.910825755077279e-06, + "loss": 0.9082, + "step": 18890 + }, + { + "epoch": 0.48, + "learning_rate": 1.910814332613111e-06, + "loss": 0.8584, + "step": 18891 + }, + { + "epoch": 0.48, + "learning_rate": 1.9108029094515743e-06, + "loss": 0.8643, + "step": 18892 + }, + { + "epoch": 0.48, + "learning_rate": 1.9107914855926778e-06, + "loss": 0.863, + "step": 18893 + }, + { + "epoch": 0.48, + "learning_rate": 1.9107800610364296e-06, + "loss": 0.8296, + "step": 18894 + }, + { + "epoch": 0.48, + "learning_rate": 1.9107686357828395e-06, + "loss": 0.7471, + "step": 18895 + }, + { + "epoch": 0.48, + "learning_rate": 1.9107572098319156e-06, + "loss": 0.7612, + "step": 18896 + }, + { + "epoch": 0.48, + "learning_rate": 1.9107457831836667e-06, + "loss": 0.7012, + "step": 18897 + }, + { + "epoch": 0.48, + "learning_rate": 1.910734355838102e-06, + "loss": 0.8174, + "step": 18898 + }, + { + "epoch": 0.48, + "learning_rate": 1.9107229277952293e-06, + "loss": 0.8525, + "step": 18899 + }, + { + "epoch": 0.48, + "learning_rate": 1.910711499055058e-06, + "loss": 0.7773, + "step": 18900 + }, + { + "epoch": 0.48, + "learning_rate": 1.910700069617597e-06, + "loss": 0.8755, + "step": 18901 + }, + { + "epoch": 0.48, + "learning_rate": 1.910688639482855e-06, + "loss": 0.9238, + "step": 18902 + }, + { + "epoch": 0.48, + "learning_rate": 1.9106772086508403e-06, + "loss": 0.9307, + "step": 18903 + }, + { + "epoch": 0.48, + "learning_rate": 1.9106657771215624e-06, + "loss": 0.7627, + "step": 18904 + }, + { + "epoch": 0.48, + "learning_rate": 1.910654344895029e-06, + "loss": 0.8831, + "step": 18905 + }, + { + "epoch": 0.48, + "learning_rate": 1.9106429119712498e-06, + "loss": 0.9766, + "step": 18906 + }, + { + "epoch": 0.48, + "learning_rate": 1.910631478350233e-06, + "loss": 0.9238, + "step": 18907 + }, + { + "epoch": 0.48, + "learning_rate": 1.9106200440319876e-06, + "loss": 0.8252, + "step": 18908 + }, + { + "epoch": 0.48, + "learning_rate": 1.9106086090165224e-06, + "loss": 0.916, + "step": 18909 + }, + { + "epoch": 0.48, + "learning_rate": 1.910597173303846e-06, + "loss": 0.7441, + "step": 18910 + }, + { + "epoch": 0.48, + "learning_rate": 1.910585736893967e-06, + "loss": 0.7578, + "step": 18911 + }, + { + "epoch": 0.48, + "learning_rate": 1.9105742997868945e-06, + "loss": 0.582, + "step": 18912 + }, + { + "epoch": 0.48, + "learning_rate": 1.9105628619826372e-06, + "loss": 1.0342, + "step": 18913 + }, + { + "epoch": 0.48, + "learning_rate": 1.9105514234812037e-06, + "loss": 1.0234, + "step": 18914 + }, + { + "epoch": 0.48, + "learning_rate": 1.910539984282603e-06, + "loss": 1.1836, + "step": 18915 + }, + { + "epoch": 0.48, + "learning_rate": 1.9105285443868437e-06, + "loss": 1.0732, + "step": 18916 + }, + { + "epoch": 0.48, + "learning_rate": 1.9105171037939346e-06, + "loss": 1.0557, + "step": 18917 + }, + { + "epoch": 0.48, + "learning_rate": 1.9105056625038844e-06, + "loss": 0.7793, + "step": 18918 + }, + { + "epoch": 0.48, + "learning_rate": 1.9104942205167015e-06, + "loss": 0.8369, + "step": 18919 + }, + { + "epoch": 0.48, + "learning_rate": 1.9104827778323952e-06, + "loss": 0.9844, + "step": 18920 + }, + { + "epoch": 0.48, + "learning_rate": 1.9104713344509745e-06, + "loss": 1.0293, + "step": 18921 + }, + { + "epoch": 0.48, + "learning_rate": 1.9104598903724473e-06, + "loss": 0.8066, + "step": 18922 + }, + { + "epoch": 0.49, + "learning_rate": 1.910448445596823e-06, + "loss": 1.0068, + "step": 18923 + }, + { + "epoch": 0.49, + "learning_rate": 1.91043700012411e-06, + "loss": 0.9214, + "step": 18924 + }, + { + "epoch": 0.49, + "learning_rate": 1.910425553954318e-06, + "loss": 0.5898, + "step": 18925 + }, + { + "epoch": 0.49, + "learning_rate": 1.910414107087454e-06, + "loss": 0.9375, + "step": 18926 + }, + { + "epoch": 0.49, + "learning_rate": 1.9104026595235286e-06, + "loss": 0.9639, + "step": 18927 + }, + { + "epoch": 0.49, + "learning_rate": 1.9103912112625492e-06, + "loss": 0.6084, + "step": 18928 + }, + { + "epoch": 0.49, + "learning_rate": 1.9103797623045253e-06, + "loss": 0.9365, + "step": 18929 + }, + { + "epoch": 0.49, + "learning_rate": 1.9103683126494657e-06, + "loss": 0.8877, + "step": 18930 + }, + { + "epoch": 0.49, + "learning_rate": 1.9103568622973784e-06, + "loss": 0.7109, + "step": 18931 + }, + { + "epoch": 0.49, + "learning_rate": 1.9103454112482732e-06, + "loss": 0.666, + "step": 18932 + }, + { + "epoch": 0.49, + "learning_rate": 1.910333959502158e-06, + "loss": 0.8096, + "step": 18933 + }, + { + "epoch": 0.49, + "learning_rate": 1.9103225070590426e-06, + "loss": 0.8379, + "step": 18934 + }, + { + "epoch": 0.49, + "learning_rate": 1.9103110539189345e-06, + "loss": 0.7578, + "step": 18935 + }, + { + "epoch": 0.49, + "learning_rate": 1.9102996000818433e-06, + "loss": 0.8301, + "step": 18936 + }, + { + "epoch": 0.49, + "learning_rate": 1.9102881455477773e-06, + "loss": 0.7485, + "step": 18937 + }, + { + "epoch": 0.49, + "learning_rate": 1.910276690316746e-06, + "loss": 0.8789, + "step": 18938 + }, + { + "epoch": 0.49, + "learning_rate": 1.9102652343887572e-06, + "loss": 0.9326, + "step": 18939 + }, + { + "epoch": 0.49, + "learning_rate": 1.9102537777638205e-06, + "loss": 1.0068, + "step": 18940 + }, + { + "epoch": 0.49, + "learning_rate": 1.9102423204419442e-06, + "loss": 1.0615, + "step": 18941 + }, + { + "epoch": 0.49, + "learning_rate": 1.9102308624231373e-06, + "loss": 0.7554, + "step": 18942 + }, + { + "epoch": 0.49, + "learning_rate": 1.9102194037074086e-06, + "loss": 0.7153, + "step": 18943 + }, + { + "epoch": 0.49, + "learning_rate": 1.9102079442947666e-06, + "loss": 0.8188, + "step": 18944 + }, + { + "epoch": 0.49, + "learning_rate": 1.9101964841852197e-06, + "loss": 0.8516, + "step": 18945 + }, + { + "epoch": 0.49, + "learning_rate": 1.910185023378778e-06, + "loss": 0.6978, + "step": 18946 + }, + { + "epoch": 0.49, + "learning_rate": 1.9101735618754493e-06, + "loss": 0.8682, + "step": 18947 + }, + { + "epoch": 0.49, + "learning_rate": 1.910162099675242e-06, + "loss": 0.9834, + "step": 18948 + }, + { + "epoch": 0.49, + "learning_rate": 1.9101506367781662e-06, + "loss": 0.7412, + "step": 18949 + }, + { + "epoch": 0.49, + "learning_rate": 1.9101391731842295e-06, + "loss": 0.7363, + "step": 18950 + }, + { + "epoch": 0.49, + "learning_rate": 1.9101277088934413e-06, + "loss": 0.9023, + "step": 18951 + }, + { + "epoch": 0.49, + "learning_rate": 1.91011624390581e-06, + "loss": 0.873, + "step": 18952 + }, + { + "epoch": 0.49, + "learning_rate": 1.9101047782213444e-06, + "loss": 0.9541, + "step": 18953 + }, + { + "epoch": 0.49, + "learning_rate": 1.910093311840054e-06, + "loss": 0.7651, + "step": 18954 + }, + { + "epoch": 0.49, + "learning_rate": 1.9100818447619463e-06, + "loss": 0.7061, + "step": 18955 + }, + { + "epoch": 0.49, + "learning_rate": 1.910070376987031e-06, + "loss": 0.9092, + "step": 18956 + }, + { + "epoch": 0.49, + "learning_rate": 1.910058908515317e-06, + "loss": 0.6379, + "step": 18957 + }, + { + "epoch": 0.49, + "learning_rate": 1.9100474393468123e-06, + "loss": 0.7197, + "step": 18958 + }, + { + "epoch": 0.49, + "learning_rate": 1.9100359694815262e-06, + "loss": 0.8945, + "step": 18959 + }, + { + "epoch": 0.49, + "learning_rate": 1.9100244989194675e-06, + "loss": 0.8018, + "step": 18960 + }, + { + "epoch": 0.49, + "learning_rate": 1.910013027660645e-06, + "loss": 0.958, + "step": 18961 + }, + { + "epoch": 0.49, + "learning_rate": 1.910001555705067e-06, + "loss": 0.8154, + "step": 18962 + }, + { + "epoch": 0.49, + "learning_rate": 1.909990083052743e-06, + "loss": 0.8701, + "step": 18963 + }, + { + "epoch": 0.49, + "learning_rate": 1.9099786097036812e-06, + "loss": 0.7734, + "step": 18964 + }, + { + "epoch": 0.49, + "learning_rate": 1.909967135657891e-06, + "loss": 1.0186, + "step": 18965 + }, + { + "epoch": 0.49, + "learning_rate": 1.9099556609153805e-06, + "loss": 0.9482, + "step": 18966 + }, + { + "epoch": 0.49, + "learning_rate": 1.909944185476159e-06, + "loss": 0.79, + "step": 18967 + }, + { + "epoch": 0.49, + "learning_rate": 1.909932709340235e-06, + "loss": 1.1006, + "step": 18968 + }, + { + "epoch": 0.49, + "learning_rate": 1.909921232507617e-06, + "loss": 0.8184, + "step": 18969 + }, + { + "epoch": 0.49, + "learning_rate": 1.9099097549783143e-06, + "loss": 0.8184, + "step": 18970 + }, + { + "epoch": 0.49, + "learning_rate": 1.9098982767523357e-06, + "loss": 0.9551, + "step": 18971 + }, + { + "epoch": 0.49, + "learning_rate": 1.90988679782969e-06, + "loss": 0.5981, + "step": 18972 + }, + { + "epoch": 0.49, + "learning_rate": 1.9098753182103854e-06, + "loss": 0.7539, + "step": 18973 + }, + { + "epoch": 0.49, + "learning_rate": 1.9098638378944318e-06, + "loss": 0.6606, + "step": 18974 + }, + { + "epoch": 0.49, + "learning_rate": 1.9098523568818364e-06, + "loss": 0.7139, + "step": 18975 + }, + { + "epoch": 0.49, + "learning_rate": 1.9098408751726093e-06, + "loss": 1.0352, + "step": 18976 + }, + { + "epoch": 0.49, + "learning_rate": 1.909829392766759e-06, + "loss": 0.9658, + "step": 18977 + }, + { + "epoch": 0.49, + "learning_rate": 1.909817909664294e-06, + "loss": 0.8691, + "step": 18978 + }, + { + "epoch": 0.49, + "learning_rate": 1.9098064258652236e-06, + "loss": 0.7505, + "step": 18979 + }, + { + "epoch": 0.49, + "learning_rate": 1.909794941369556e-06, + "loss": 1.0, + "step": 18980 + }, + { + "epoch": 0.49, + "learning_rate": 1.9097834561772997e-06, + "loss": 0.9727, + "step": 18981 + }, + { + "epoch": 0.49, + "learning_rate": 1.9097719702884648e-06, + "loss": 1.0352, + "step": 18982 + }, + { + "epoch": 0.49, + "learning_rate": 1.909760483703059e-06, + "loss": 0.5967, + "step": 18983 + }, + { + "epoch": 0.49, + "learning_rate": 1.909748996421092e-06, + "loss": 0.6865, + "step": 18984 + }, + { + "epoch": 0.49, + "learning_rate": 1.909737508442571e-06, + "loss": 0.8809, + "step": 18985 + }, + { + "epoch": 0.49, + "learning_rate": 1.909726019767507e-06, + "loss": 0.6765, + "step": 18986 + }, + { + "epoch": 0.49, + "learning_rate": 1.9097145303959067e-06, + "loss": 0.8291, + "step": 18987 + }, + { + "epoch": 0.49, + "learning_rate": 1.90970304032778e-06, + "loss": 0.9756, + "step": 18988 + }, + { + "epoch": 0.49, + "learning_rate": 1.9096915495631357e-06, + "loss": 0.7417, + "step": 18989 + }, + { + "epoch": 0.49, + "learning_rate": 1.909680058101982e-06, + "loss": 0.8438, + "step": 18990 + }, + { + "epoch": 0.49, + "learning_rate": 1.9096685659443286e-06, + "loss": 0.8877, + "step": 18991 + }, + { + "epoch": 0.49, + "learning_rate": 1.9096570730901837e-06, + "loss": 0.7832, + "step": 18992 + }, + { + "epoch": 0.49, + "learning_rate": 1.909645579539556e-06, + "loss": 1.0156, + "step": 18993 + }, + { + "epoch": 0.49, + "learning_rate": 1.909634085292455e-06, + "loss": 0.7305, + "step": 18994 + }, + { + "epoch": 0.49, + "learning_rate": 1.9096225903488885e-06, + "loss": 0.8945, + "step": 18995 + }, + { + "epoch": 0.49, + "learning_rate": 1.909611094708866e-06, + "loss": 0.6953, + "step": 18996 + }, + { + "epoch": 0.49, + "learning_rate": 1.909599598372396e-06, + "loss": 0.624, + "step": 18997 + }, + { + "epoch": 0.49, + "learning_rate": 1.9095881013394872e-06, + "loss": 0.9453, + "step": 18998 + }, + { + "epoch": 0.49, + "learning_rate": 1.909576603610149e-06, + "loss": 1.0283, + "step": 18999 + }, + { + "epoch": 0.49, + "learning_rate": 1.9095651051843896e-06, + "loss": 0.8208, + "step": 19000 + }, + { + "epoch": 0.49, + "learning_rate": 1.9095536060622183e-06, + "loss": 0.96, + "step": 19001 + }, + { + "epoch": 0.49, + "learning_rate": 1.9095421062436437e-06, + "loss": 0.9697, + "step": 19002 + }, + { + "epoch": 0.49, + "learning_rate": 1.909530605728674e-06, + "loss": 0.917, + "step": 19003 + }, + { + "epoch": 0.49, + "learning_rate": 1.909519104517319e-06, + "loss": 0.7065, + "step": 19004 + }, + { + "epoch": 0.49, + "learning_rate": 1.9095076026095867e-06, + "loss": 0.9336, + "step": 19005 + }, + { + "epoch": 0.49, + "learning_rate": 1.9094961000054866e-06, + "loss": 1.0146, + "step": 19006 + }, + { + "epoch": 0.49, + "learning_rate": 1.909484596705027e-06, + "loss": 0.8516, + "step": 19007 + }, + { + "epoch": 0.49, + "learning_rate": 1.909473092708217e-06, + "loss": 0.9307, + "step": 19008 + }, + { + "epoch": 0.49, + "learning_rate": 1.909461588015065e-06, + "loss": 1.0415, + "step": 19009 + }, + { + "epoch": 0.49, + "learning_rate": 1.90945008262558e-06, + "loss": 0.9707, + "step": 19010 + }, + { + "epoch": 0.49, + "learning_rate": 1.909438576539771e-06, + "loss": 0.6504, + "step": 19011 + }, + { + "epoch": 0.49, + "learning_rate": 1.909427069757647e-06, + "loss": 0.5615, + "step": 19012 + }, + { + "epoch": 0.49, + "learning_rate": 1.909415562279216e-06, + "loss": 0.6519, + "step": 19013 + }, + { + "epoch": 0.49, + "learning_rate": 1.909404054104488e-06, + "loss": 1.1152, + "step": 19014 + }, + { + "epoch": 0.49, + "learning_rate": 1.909392545233471e-06, + "loss": 0.7817, + "step": 19015 + }, + { + "epoch": 0.49, + "learning_rate": 1.9093810356661734e-06, + "loss": 0.9785, + "step": 19016 + }, + { + "epoch": 0.49, + "learning_rate": 1.9093695254026047e-06, + "loss": 0.9463, + "step": 19017 + }, + { + "epoch": 0.49, + "learning_rate": 1.9093580144427736e-06, + "loss": 0.5476, + "step": 19018 + }, + { + "epoch": 0.49, + "learning_rate": 1.909346502786689e-06, + "loss": 0.8438, + "step": 19019 + }, + { + "epoch": 0.49, + "learning_rate": 1.9093349904343595e-06, + "loss": 0.8506, + "step": 19020 + }, + { + "epoch": 0.49, + "learning_rate": 1.9093234773857943e-06, + "loss": 0.8564, + "step": 19021 + }, + { + "epoch": 0.49, + "learning_rate": 1.909311963641002e-06, + "loss": 0.9023, + "step": 19022 + }, + { + "epoch": 0.49, + "learning_rate": 1.9093004491999907e-06, + "loss": 0.6699, + "step": 19023 + }, + { + "epoch": 0.49, + "learning_rate": 1.90928893406277e-06, + "loss": 0.9971, + "step": 19024 + }, + { + "epoch": 0.49, + "learning_rate": 1.909277418229349e-06, + "loss": 0.7578, + "step": 19025 + }, + { + "epoch": 0.49, + "learning_rate": 1.909265901699736e-06, + "loss": 0.9434, + "step": 19026 + }, + { + "epoch": 0.49, + "learning_rate": 1.9092543844739397e-06, + "loss": 0.8232, + "step": 19027 + }, + { + "epoch": 0.49, + "learning_rate": 1.909242866551969e-06, + "loss": 0.876, + "step": 19028 + }, + { + "epoch": 0.49, + "learning_rate": 1.9092313479338333e-06, + "loss": 0.8438, + "step": 19029 + }, + { + "epoch": 0.49, + "learning_rate": 1.909219828619541e-06, + "loss": 0.875, + "step": 19030 + }, + { + "epoch": 0.49, + "learning_rate": 1.9092083086091005e-06, + "loss": 0.9102, + "step": 19031 + }, + { + "epoch": 0.49, + "learning_rate": 1.909196787902521e-06, + "loss": 0.8169, + "step": 19032 + }, + { + "epoch": 0.49, + "learning_rate": 1.9091852664998113e-06, + "loss": 0.7197, + "step": 19033 + }, + { + "epoch": 0.49, + "learning_rate": 1.9091737444009807e-06, + "loss": 0.7241, + "step": 19034 + }, + { + "epoch": 0.49, + "learning_rate": 1.909162221606037e-06, + "loss": 0.8467, + "step": 19035 + }, + { + "epoch": 0.49, + "learning_rate": 1.90915069811499e-06, + "loss": 0.8247, + "step": 19036 + }, + { + "epoch": 0.49, + "learning_rate": 1.9091391739278477e-06, + "loss": 1.0205, + "step": 19037 + }, + { + "epoch": 0.49, + "learning_rate": 1.90912764904462e-06, + "loss": 0.9297, + "step": 19038 + }, + { + "epoch": 0.49, + "learning_rate": 1.9091161234653144e-06, + "loss": 0.999, + "step": 19039 + }, + { + "epoch": 0.49, + "learning_rate": 1.9091045971899405e-06, + "loss": 0.6704, + "step": 19040 + }, + { + "epoch": 0.49, + "learning_rate": 1.909093070218507e-06, + "loss": 0.6658, + "step": 19041 + }, + { + "epoch": 0.49, + "learning_rate": 1.909081542551023e-06, + "loss": 0.8213, + "step": 19042 + }, + { + "epoch": 0.49, + "learning_rate": 1.909070014187497e-06, + "loss": 0.8008, + "step": 19043 + }, + { + "epoch": 0.49, + "learning_rate": 1.909058485127938e-06, + "loss": 1.1797, + "step": 19044 + }, + { + "epoch": 0.49, + "learning_rate": 1.9090469553723544e-06, + "loss": 0.8467, + "step": 19045 + }, + { + "epoch": 0.49, + "learning_rate": 1.9090354249207558e-06, + "loss": 0.793, + "step": 19046 + }, + { + "epoch": 0.49, + "learning_rate": 1.90902389377315e-06, + "loss": 0.7646, + "step": 19047 + }, + { + "epoch": 0.49, + "learning_rate": 1.9090123619295468e-06, + "loss": 0.9424, + "step": 19048 + }, + { + "epoch": 0.49, + "learning_rate": 1.9090008293899547e-06, + "loss": 0.9863, + "step": 19049 + }, + { + "epoch": 0.49, + "learning_rate": 1.9089892961543823e-06, + "loss": 0.916, + "step": 19050 + }, + { + "epoch": 0.49, + "learning_rate": 1.9089777622228386e-06, + "loss": 0.7183, + "step": 19051 + }, + { + "epoch": 0.49, + "learning_rate": 1.9089662275953323e-06, + "loss": 0.9316, + "step": 19052 + }, + { + "epoch": 0.49, + "learning_rate": 1.9089546922718724e-06, + "loss": 1.0205, + "step": 19053 + }, + { + "epoch": 0.49, + "learning_rate": 1.908943156252468e-06, + "loss": 0.9893, + "step": 19054 + }, + { + "epoch": 0.49, + "learning_rate": 1.9089316195371274e-06, + "loss": 0.7266, + "step": 19055 + }, + { + "epoch": 0.49, + "learning_rate": 1.9089200821258596e-06, + "loss": 0.7456, + "step": 19056 + }, + { + "epoch": 0.49, + "learning_rate": 1.9089085440186734e-06, + "loss": 0.8389, + "step": 19057 + }, + { + "epoch": 0.49, + "learning_rate": 1.9088970052155776e-06, + "loss": 0.8828, + "step": 19058 + }, + { + "epoch": 0.49, + "learning_rate": 1.9088854657165816e-06, + "loss": 0.9014, + "step": 19059 + }, + { + "epoch": 0.49, + "learning_rate": 1.9088739255216933e-06, + "loss": 0.6753, + "step": 19060 + }, + { + "epoch": 0.49, + "learning_rate": 1.9088623846309226e-06, + "loss": 0.9131, + "step": 19061 + }, + { + "epoch": 0.49, + "learning_rate": 1.9088508430442775e-06, + "loss": 0.5737, + "step": 19062 + }, + { + "epoch": 0.49, + "learning_rate": 1.908839300761767e-06, + "loss": 0.8887, + "step": 19063 + }, + { + "epoch": 0.49, + "learning_rate": 1.9088277577834e-06, + "loss": 1.0283, + "step": 19064 + }, + { + "epoch": 0.49, + "learning_rate": 1.9088162141091855e-06, + "loss": 0.9473, + "step": 19065 + }, + { + "epoch": 0.49, + "learning_rate": 1.908804669739132e-06, + "loss": 0.8604, + "step": 19066 + }, + { + "epoch": 0.49, + "learning_rate": 1.9087931246732488e-06, + "loss": 0.7219, + "step": 19067 + }, + { + "epoch": 0.49, + "learning_rate": 1.9087815789115444e-06, + "loss": 0.9248, + "step": 19068 + }, + { + "epoch": 0.49, + "learning_rate": 1.908770032454028e-06, + "loss": 1.0869, + "step": 19069 + }, + { + "epoch": 0.49, + "learning_rate": 1.9087584853007076e-06, + "loss": 0.7002, + "step": 19070 + }, + { + "epoch": 0.49, + "learning_rate": 1.908746937451593e-06, + "loss": 0.8389, + "step": 19071 + }, + { + "epoch": 0.49, + "learning_rate": 1.9087353889066925e-06, + "loss": 0.8369, + "step": 19072 + }, + { + "epoch": 0.49, + "learning_rate": 1.9087238396660155e-06, + "loss": 0.8691, + "step": 19073 + }, + { + "epoch": 0.49, + "learning_rate": 1.90871228972957e-06, + "loss": 0.7314, + "step": 19074 + }, + { + "epoch": 0.49, + "learning_rate": 1.9087007390973655e-06, + "loss": 0.9814, + "step": 19075 + }, + { + "epoch": 0.49, + "learning_rate": 1.9086891877694103e-06, + "loss": 0.6797, + "step": 19076 + }, + { + "epoch": 0.49, + "learning_rate": 1.908677635745714e-06, + "loss": 0.9326, + "step": 19077 + }, + { + "epoch": 0.49, + "learning_rate": 1.908666083026285e-06, + "loss": 0.9531, + "step": 19078 + }, + { + "epoch": 0.49, + "learning_rate": 1.908654529611132e-06, + "loss": 0.9927, + "step": 19079 + }, + { + "epoch": 0.49, + "learning_rate": 1.908642975500264e-06, + "loss": 0.8672, + "step": 19080 + }, + { + "epoch": 0.49, + "learning_rate": 1.9086314206936898e-06, + "loss": 1.041, + "step": 19081 + }, + { + "epoch": 0.49, + "learning_rate": 1.908619865191418e-06, + "loss": 0.6426, + "step": 19082 + }, + { + "epoch": 0.49, + "learning_rate": 1.9086083089934586e-06, + "loss": 0.7861, + "step": 19083 + }, + { + "epoch": 0.49, + "learning_rate": 1.908596752099819e-06, + "loss": 0.9629, + "step": 19084 + }, + { + "epoch": 0.49, + "learning_rate": 1.9085851945105086e-06, + "loss": 0.918, + "step": 19085 + }, + { + "epoch": 0.49, + "learning_rate": 1.908573636225537e-06, + "loss": 1.0469, + "step": 19086 + }, + { + "epoch": 0.49, + "learning_rate": 1.9085620772449113e-06, + "loss": 0.8818, + "step": 19087 + }, + { + "epoch": 0.49, + "learning_rate": 1.908550517568642e-06, + "loss": 1.1279, + "step": 19088 + }, + { + "epoch": 0.49, + "learning_rate": 1.908538957196737e-06, + "loss": 0.8711, + "step": 19089 + }, + { + "epoch": 0.49, + "learning_rate": 1.908527396129206e-06, + "loss": 0.8838, + "step": 19090 + }, + { + "epoch": 0.49, + "learning_rate": 1.908515834366057e-06, + "loss": 0.8965, + "step": 19091 + }, + { + "epoch": 0.49, + "learning_rate": 1.9085042719072993e-06, + "loss": 0.7944, + "step": 19092 + }, + { + "epoch": 0.49, + "learning_rate": 1.9084927087529414e-06, + "loss": 0.5669, + "step": 19093 + }, + { + "epoch": 0.49, + "learning_rate": 1.908481144902993e-06, + "loss": 0.832, + "step": 19094 + }, + { + "epoch": 0.49, + "learning_rate": 1.9084695803574617e-06, + "loss": 0.999, + "step": 19095 + }, + { + "epoch": 0.49, + "learning_rate": 1.908458015116357e-06, + "loss": 0.9639, + "step": 19096 + }, + { + "epoch": 0.49, + "learning_rate": 1.9084464491796884e-06, + "loss": 0.8394, + "step": 19097 + }, + { + "epoch": 0.49, + "learning_rate": 1.9084348825474636e-06, + "loss": 0.8545, + "step": 19098 + }, + { + "epoch": 0.49, + "learning_rate": 1.9084233152196926e-06, + "loss": 0.8584, + "step": 19099 + }, + { + "epoch": 0.49, + "learning_rate": 1.908411747196383e-06, + "loss": 0.8406, + "step": 19100 + }, + { + "epoch": 0.49, + "learning_rate": 1.9084001784775447e-06, + "loss": 0.9854, + "step": 19101 + }, + { + "epoch": 0.49, + "learning_rate": 1.9083886090631856e-06, + "loss": 0.959, + "step": 19102 + }, + { + "epoch": 0.49, + "learning_rate": 1.908377038953316e-06, + "loss": 0.9072, + "step": 19103 + }, + { + "epoch": 0.49, + "learning_rate": 1.908365468147943e-06, + "loss": 0.9971, + "step": 19104 + }, + { + "epoch": 0.49, + "learning_rate": 1.9083538966470767e-06, + "loss": 0.9219, + "step": 19105 + }, + { + "epoch": 0.49, + "learning_rate": 1.9083423244507255e-06, + "loss": 0.8867, + "step": 19106 + }, + { + "epoch": 0.49, + "learning_rate": 1.9083307515588985e-06, + "loss": 0.8652, + "step": 19107 + }, + { + "epoch": 0.49, + "learning_rate": 1.9083191779716044e-06, + "loss": 0.8516, + "step": 19108 + }, + { + "epoch": 0.49, + "learning_rate": 1.908307603688852e-06, + "loss": 0.7354, + "step": 19109 + }, + { + "epoch": 0.49, + "learning_rate": 1.90829602871065e-06, + "loss": 0.8779, + "step": 19110 + }, + { + "epoch": 0.49, + "learning_rate": 1.908284453037008e-06, + "loss": 0.8564, + "step": 19111 + }, + { + "epoch": 0.49, + "learning_rate": 1.908272876667934e-06, + "loss": 0.8652, + "step": 19112 + }, + { + "epoch": 0.49, + "learning_rate": 1.908261299603437e-06, + "loss": 0.9072, + "step": 19113 + }, + { + "epoch": 0.49, + "learning_rate": 1.9082497218435267e-06, + "loss": 0.9385, + "step": 19114 + }, + { + "epoch": 0.49, + "learning_rate": 1.908238143388211e-06, + "loss": 0.8789, + "step": 19115 + }, + { + "epoch": 0.49, + "learning_rate": 1.908226564237499e-06, + "loss": 0.8848, + "step": 19116 + }, + { + "epoch": 0.49, + "learning_rate": 1.9082149843914e-06, + "loss": 0.7754, + "step": 19117 + }, + { + "epoch": 0.49, + "learning_rate": 1.9082034038499226e-06, + "loss": 1.1348, + "step": 19118 + }, + { + "epoch": 0.49, + "learning_rate": 1.9081918226130752e-06, + "loss": 1.0439, + "step": 19119 + }, + { + "epoch": 0.49, + "learning_rate": 1.9081802406808672e-06, + "loss": 0.9092, + "step": 19120 + }, + { + "epoch": 0.49, + "learning_rate": 1.908168658053308e-06, + "loss": 0.9141, + "step": 19121 + }, + { + "epoch": 0.49, + "learning_rate": 1.9081570747304047e-06, + "loss": 1.0645, + "step": 19122 + }, + { + "epoch": 0.49, + "learning_rate": 1.908145490712168e-06, + "loss": 0.8564, + "step": 19123 + }, + { + "epoch": 0.49, + "learning_rate": 1.9081339059986057e-06, + "loss": 0.9326, + "step": 19124 + }, + { + "epoch": 0.49, + "learning_rate": 1.9081223205897273e-06, + "loss": 0.8467, + "step": 19125 + }, + { + "epoch": 0.49, + "learning_rate": 1.9081107344855415e-06, + "loss": 0.8721, + "step": 19126 + }, + { + "epoch": 0.49, + "learning_rate": 1.9080991476860564e-06, + "loss": 0.5618, + "step": 19127 + }, + { + "epoch": 0.49, + "learning_rate": 1.9080875601912822e-06, + "loss": 0.5938, + "step": 19128 + }, + { + "epoch": 0.49, + "learning_rate": 1.908075972001227e-06, + "loss": 0.9248, + "step": 19129 + }, + { + "epoch": 0.49, + "learning_rate": 1.9080643831158996e-06, + "loss": 0.8608, + "step": 19130 + }, + { + "epoch": 0.49, + "learning_rate": 1.9080527935353093e-06, + "loss": 0.958, + "step": 19131 + }, + { + "epoch": 0.49, + "learning_rate": 1.9080412032594647e-06, + "loss": 0.8428, + "step": 19132 + }, + { + "epoch": 0.49, + "learning_rate": 1.9080296122883745e-06, + "loss": 0.6025, + "step": 19133 + }, + { + "epoch": 0.49, + "learning_rate": 1.9080180206220478e-06, + "loss": 0.7876, + "step": 19134 + }, + { + "epoch": 0.49, + "learning_rate": 1.9080064282604933e-06, + "loss": 0.7627, + "step": 19135 + }, + { + "epoch": 0.49, + "learning_rate": 1.907994835203721e-06, + "loss": 0.7939, + "step": 19136 + }, + { + "epoch": 0.49, + "learning_rate": 1.9079832414517378e-06, + "loss": 0.8359, + "step": 19137 + }, + { + "epoch": 0.49, + "learning_rate": 1.9079716470045536e-06, + "loss": 0.9658, + "step": 19138 + }, + { + "epoch": 0.49, + "learning_rate": 1.9079600518621777e-06, + "loss": 0.6279, + "step": 19139 + }, + { + "epoch": 0.49, + "learning_rate": 1.907948456024618e-06, + "loss": 0.7427, + "step": 19140 + }, + { + "epoch": 0.49, + "learning_rate": 1.9079368594918847e-06, + "loss": 1.0049, + "step": 19141 + }, + { + "epoch": 0.49, + "learning_rate": 1.9079252622639854e-06, + "loss": 0.9424, + "step": 19142 + }, + { + "epoch": 0.49, + "learning_rate": 1.9079136643409295e-06, + "loss": 0.9072, + "step": 19143 + }, + { + "epoch": 0.49, + "learning_rate": 1.907902065722726e-06, + "loss": 0.8564, + "step": 19144 + }, + { + "epoch": 0.49, + "learning_rate": 1.9078904664093832e-06, + "loss": 0.8701, + "step": 19145 + }, + { + "epoch": 0.49, + "learning_rate": 1.9078788664009106e-06, + "loss": 0.9639, + "step": 19146 + }, + { + "epoch": 0.49, + "learning_rate": 1.907867265697317e-06, + "loss": 0.917, + "step": 19147 + }, + { + "epoch": 0.49, + "learning_rate": 1.9078556642986114e-06, + "loss": 0.8213, + "step": 19148 + }, + { + "epoch": 0.49, + "learning_rate": 1.9078440622048025e-06, + "loss": 0.7246, + "step": 19149 + }, + { + "epoch": 0.49, + "learning_rate": 1.9078324594158986e-06, + "loss": 0.8232, + "step": 19150 + }, + { + "epoch": 0.49, + "learning_rate": 1.9078208559319096e-06, + "loss": 1.1035, + "step": 19151 + }, + { + "epoch": 0.49, + "learning_rate": 1.9078092517528437e-06, + "loss": 0.7334, + "step": 19152 + }, + { + "epoch": 0.49, + "learning_rate": 1.90779764687871e-06, + "loss": 0.8572, + "step": 19153 + }, + { + "epoch": 0.49, + "learning_rate": 1.9077860413095175e-06, + "loss": 0.8828, + "step": 19154 + }, + { + "epoch": 0.49, + "learning_rate": 1.907774435045275e-06, + "loss": 0.666, + "step": 19155 + }, + { + "epoch": 0.49, + "learning_rate": 1.9077628280859912e-06, + "loss": 0.8174, + "step": 19156 + }, + { + "epoch": 0.49, + "learning_rate": 1.9077512204316754e-06, + "loss": 0.8096, + "step": 19157 + }, + { + "epoch": 0.49, + "learning_rate": 1.9077396120823355e-06, + "loss": 1.0215, + "step": 19158 + }, + { + "epoch": 0.49, + "learning_rate": 1.907728003037982e-06, + "loss": 0.9653, + "step": 19159 + }, + { + "epoch": 0.49, + "learning_rate": 1.9077163932986228e-06, + "loss": 0.5488, + "step": 19160 + }, + { + "epoch": 0.49, + "learning_rate": 1.9077047828642664e-06, + "loss": 0.8721, + "step": 19161 + }, + { + "epoch": 0.49, + "learning_rate": 1.907693171734922e-06, + "loss": 0.9434, + "step": 19162 + }, + { + "epoch": 0.49, + "learning_rate": 1.9076815599105995e-06, + "loss": 0.9258, + "step": 19163 + }, + { + "epoch": 0.49, + "learning_rate": 1.9076699473913067e-06, + "loss": 0.9814, + "step": 19164 + }, + { + "epoch": 0.49, + "learning_rate": 1.9076583341770526e-06, + "loss": 0.7434, + "step": 19165 + }, + { + "epoch": 0.49, + "learning_rate": 1.9076467202678465e-06, + "loss": 0.9102, + "step": 19166 + }, + { + "epoch": 0.49, + "learning_rate": 1.9076351056636964e-06, + "loss": 0.7935, + "step": 19167 + }, + { + "epoch": 0.49, + "learning_rate": 1.9076234903646126e-06, + "loss": 0.9131, + "step": 19168 + }, + { + "epoch": 0.49, + "learning_rate": 1.9076118743706026e-06, + "loss": 0.6802, + "step": 19169 + }, + { + "epoch": 0.49, + "learning_rate": 1.907600257681676e-06, + "loss": 0.832, + "step": 19170 + }, + { + "epoch": 0.49, + "learning_rate": 1.9075886402978422e-06, + "loss": 0.9346, + "step": 19171 + }, + { + "epoch": 0.49, + "learning_rate": 1.907577022219109e-06, + "loss": 0.7646, + "step": 19172 + }, + { + "epoch": 0.49, + "learning_rate": 1.907565403445486e-06, + "loss": 0.6392, + "step": 19173 + }, + { + "epoch": 0.49, + "learning_rate": 1.907553783976982e-06, + "loss": 0.7061, + "step": 19174 + }, + { + "epoch": 0.49, + "learning_rate": 1.9075421638136057e-06, + "loss": 0.73, + "step": 19175 + }, + { + "epoch": 0.49, + "learning_rate": 1.907530542955366e-06, + "loss": 0.8462, + "step": 19176 + }, + { + "epoch": 0.49, + "learning_rate": 1.907518921402272e-06, + "loss": 0.8574, + "step": 19177 + }, + { + "epoch": 0.49, + "learning_rate": 1.9075072991543322e-06, + "loss": 0.7319, + "step": 19178 + }, + { + "epoch": 0.49, + "learning_rate": 1.9074956762115557e-06, + "loss": 0.9854, + "step": 19179 + }, + { + "epoch": 0.49, + "learning_rate": 1.907484052573952e-06, + "loss": 0.7065, + "step": 19180 + }, + { + "epoch": 0.49, + "learning_rate": 1.9074724282415296e-06, + "loss": 0.6934, + "step": 19181 + }, + { + "epoch": 0.49, + "learning_rate": 1.9074608032142965e-06, + "loss": 0.8535, + "step": 19182 + }, + { + "epoch": 0.49, + "learning_rate": 1.907449177492263e-06, + "loss": 0.7734, + "step": 19183 + }, + { + "epoch": 0.49, + "learning_rate": 1.9074375510754373e-06, + "loss": 0.6445, + "step": 19184 + }, + { + "epoch": 0.49, + "learning_rate": 1.9074259239638285e-06, + "loss": 0.9683, + "step": 19185 + }, + { + "epoch": 0.49, + "learning_rate": 1.907414296157445e-06, + "loss": 0.6155, + "step": 19186 + }, + { + "epoch": 0.49, + "learning_rate": 1.9074026676562966e-06, + "loss": 0.7612, + "step": 19187 + }, + { + "epoch": 0.49, + "learning_rate": 1.9073910384603912e-06, + "loss": 0.9639, + "step": 19188 + }, + { + "epoch": 0.49, + "learning_rate": 1.9073794085697385e-06, + "loss": 1.0752, + "step": 19189 + }, + { + "epoch": 0.49, + "learning_rate": 1.907367777984347e-06, + "loss": 0.9375, + "step": 19190 + }, + { + "epoch": 0.49, + "learning_rate": 1.9073561467042263e-06, + "loss": 0.9922, + "step": 19191 + }, + { + "epoch": 0.49, + "learning_rate": 1.907344514729384e-06, + "loss": 0.9199, + "step": 19192 + }, + { + "epoch": 0.49, + "learning_rate": 1.9073328820598297e-06, + "loss": 0.9961, + "step": 19193 + }, + { + "epoch": 0.49, + "learning_rate": 1.9073212486955726e-06, + "loss": 0.8936, + "step": 19194 + }, + { + "epoch": 0.49, + "learning_rate": 1.9073096146366211e-06, + "loss": 0.7656, + "step": 19195 + }, + { + "epoch": 0.49, + "learning_rate": 1.9072979798829847e-06, + "loss": 1.0508, + "step": 19196 + }, + { + "epoch": 0.49, + "learning_rate": 1.9072863444346718e-06, + "loss": 0.9302, + "step": 19197 + }, + { + "epoch": 0.49, + "learning_rate": 1.9072747082916916e-06, + "loss": 0.7549, + "step": 19198 + }, + { + "epoch": 0.49, + "learning_rate": 1.9072630714540526e-06, + "loss": 0.9863, + "step": 19199 + }, + { + "epoch": 0.49, + "learning_rate": 1.907251433921764e-06, + "loss": 0.918, + "step": 19200 + }, + { + "epoch": 0.49, + "learning_rate": 1.9072397956948349e-06, + "loss": 0.8506, + "step": 19201 + }, + { + "epoch": 0.49, + "learning_rate": 1.9072281567732737e-06, + "loss": 0.8164, + "step": 19202 + }, + { + "epoch": 0.49, + "learning_rate": 1.90721651715709e-06, + "loss": 0.5186, + "step": 19203 + }, + { + "epoch": 0.49, + "learning_rate": 1.907204876846292e-06, + "loss": 1.0117, + "step": 19204 + }, + { + "epoch": 0.49, + "learning_rate": 1.9071932358408893e-06, + "loss": 0.9062, + "step": 19205 + }, + { + "epoch": 0.49, + "learning_rate": 1.9071815941408902e-06, + "loss": 0.8809, + "step": 19206 + }, + { + "epoch": 0.49, + "learning_rate": 1.907169951746304e-06, + "loss": 0.6943, + "step": 19207 + }, + { + "epoch": 0.49, + "learning_rate": 1.9071583086571393e-06, + "loss": 1.002, + "step": 19208 + }, + { + "epoch": 0.49, + "learning_rate": 1.907146664873405e-06, + "loss": 0.8335, + "step": 19209 + }, + { + "epoch": 0.49, + "learning_rate": 1.9071350203951107e-06, + "loss": 0.8926, + "step": 19210 + }, + { + "epoch": 0.49, + "learning_rate": 1.9071233752222647e-06, + "loss": 0.6572, + "step": 19211 + }, + { + "epoch": 0.49, + "learning_rate": 1.907111729354876e-06, + "loss": 0.6885, + "step": 19212 + }, + { + "epoch": 0.49, + "learning_rate": 1.9071000827929535e-06, + "loss": 0.8721, + "step": 19213 + }, + { + "epoch": 0.49, + "learning_rate": 1.9070884355365062e-06, + "loss": 0.6587, + "step": 19214 + }, + { + "epoch": 0.49, + "learning_rate": 1.907076787585543e-06, + "loss": 0.9023, + "step": 19215 + }, + { + "epoch": 0.49, + "learning_rate": 1.9070651389400728e-06, + "loss": 0.8301, + "step": 19216 + }, + { + "epoch": 0.49, + "learning_rate": 1.9070534896001045e-06, + "loss": 0.6978, + "step": 19217 + }, + { + "epoch": 0.49, + "learning_rate": 1.907041839565647e-06, + "loss": 0.999, + "step": 19218 + }, + { + "epoch": 0.49, + "learning_rate": 1.9070301888367095e-06, + "loss": 0.7236, + "step": 19219 + }, + { + "epoch": 0.49, + "learning_rate": 1.9070185374133005e-06, + "loss": 0.8652, + "step": 19220 + }, + { + "epoch": 0.49, + "learning_rate": 1.9070068852954292e-06, + "loss": 0.7319, + "step": 19221 + }, + { + "epoch": 0.49, + "learning_rate": 1.9069952324831044e-06, + "loss": 0.8857, + "step": 19222 + }, + { + "epoch": 0.49, + "learning_rate": 1.9069835789763351e-06, + "loss": 0.9219, + "step": 19223 + }, + { + "epoch": 0.49, + "learning_rate": 1.9069719247751301e-06, + "loss": 0.9014, + "step": 19224 + }, + { + "epoch": 0.49, + "learning_rate": 1.9069602698794983e-06, + "loss": 0.916, + "step": 19225 + }, + { + "epoch": 0.49, + "learning_rate": 1.9069486142894488e-06, + "loss": 0.9492, + "step": 19226 + }, + { + "epoch": 0.49, + "learning_rate": 1.9069369580049909e-06, + "loss": 0.9062, + "step": 19227 + }, + { + "epoch": 0.49, + "learning_rate": 1.9069253010261325e-06, + "loss": 0.8193, + "step": 19228 + }, + { + "epoch": 0.49, + "learning_rate": 1.9069136433528832e-06, + "loss": 0.791, + "step": 19229 + }, + { + "epoch": 0.49, + "learning_rate": 1.906901984985252e-06, + "loss": 0.79, + "step": 19230 + }, + { + "epoch": 0.49, + "learning_rate": 1.9068903259232473e-06, + "loss": 0.981, + "step": 19231 + }, + { + "epoch": 0.49, + "learning_rate": 1.9068786661668788e-06, + "loss": 0.8682, + "step": 19232 + }, + { + "epoch": 0.49, + "learning_rate": 1.9068670057161547e-06, + "loss": 0.7008, + "step": 19233 + }, + { + "epoch": 0.49, + "learning_rate": 1.9068553445710843e-06, + "loss": 0.8848, + "step": 19234 + }, + { + "epoch": 0.49, + "learning_rate": 1.9068436827316768e-06, + "loss": 0.7646, + "step": 19235 + }, + { + "epoch": 0.49, + "learning_rate": 1.9068320201979404e-06, + "loss": 1.0469, + "step": 19236 + }, + { + "epoch": 0.49, + "learning_rate": 1.9068203569698843e-06, + "loss": 0.7715, + "step": 19237 + }, + { + "epoch": 0.49, + "learning_rate": 1.9068086930475181e-06, + "loss": 0.6606, + "step": 19238 + }, + { + "epoch": 0.49, + "learning_rate": 1.9067970284308496e-06, + "loss": 0.9805, + "step": 19239 + }, + { + "epoch": 0.49, + "learning_rate": 1.9067853631198887e-06, + "loss": 0.9814, + "step": 19240 + }, + { + "epoch": 0.49, + "learning_rate": 1.9067736971146439e-06, + "loss": 0.9248, + "step": 19241 + }, + { + "epoch": 0.49, + "learning_rate": 1.906762030415124e-06, + "loss": 0.9678, + "step": 19242 + }, + { + "epoch": 0.49, + "learning_rate": 1.9067503630213384e-06, + "loss": 0.9629, + "step": 19243 + }, + { + "epoch": 0.49, + "learning_rate": 1.9067386949332955e-06, + "loss": 0.7695, + "step": 19244 + }, + { + "epoch": 0.49, + "learning_rate": 1.9067270261510045e-06, + "loss": 0.8857, + "step": 19245 + }, + { + "epoch": 0.49, + "learning_rate": 1.9067153566744742e-06, + "loss": 0.8896, + "step": 19246 + }, + { + "epoch": 0.49, + "learning_rate": 1.9067036865037137e-06, + "loss": 1.0635, + "step": 19247 + }, + { + "epoch": 0.49, + "learning_rate": 1.9066920156387321e-06, + "loss": 0.7319, + "step": 19248 + }, + { + "epoch": 0.49, + "learning_rate": 1.9066803440795378e-06, + "loss": 0.9697, + "step": 19249 + }, + { + "epoch": 0.49, + "learning_rate": 1.9066686718261403e-06, + "loss": 1.1133, + "step": 19250 + }, + { + "epoch": 0.49, + "learning_rate": 1.906656998878548e-06, + "loss": 0.8594, + "step": 19251 + }, + { + "epoch": 0.49, + "learning_rate": 1.9066453252367706e-06, + "loss": 0.875, + "step": 19252 + }, + { + "epoch": 0.49, + "learning_rate": 1.9066336509008161e-06, + "loss": 1.0635, + "step": 19253 + }, + { + "epoch": 0.49, + "learning_rate": 1.9066219758706943e-06, + "loss": 0.7249, + "step": 19254 + }, + { + "epoch": 0.49, + "learning_rate": 1.9066103001464134e-06, + "loss": 1.0459, + "step": 19255 + }, + { + "epoch": 0.49, + "learning_rate": 1.9065986237279828e-06, + "loss": 0.7944, + "step": 19256 + }, + { + "epoch": 0.49, + "learning_rate": 1.9065869466154111e-06, + "loss": 0.8408, + "step": 19257 + }, + { + "epoch": 0.49, + "learning_rate": 1.9065752688087078e-06, + "loss": 0.6777, + "step": 19258 + }, + { + "epoch": 0.49, + "learning_rate": 1.9065635903078814e-06, + "loss": 0.9268, + "step": 19259 + }, + { + "epoch": 0.49, + "learning_rate": 1.9065519111129409e-06, + "loss": 0.5706, + "step": 19260 + }, + { + "epoch": 0.49, + "learning_rate": 1.9065402312238954e-06, + "loss": 0.6423, + "step": 19261 + }, + { + "epoch": 0.49, + "learning_rate": 1.9065285506407536e-06, + "loss": 1.1104, + "step": 19262 + }, + { + "epoch": 0.49, + "learning_rate": 1.9065168693635247e-06, + "loss": 0.8682, + "step": 19263 + }, + { + "epoch": 0.49, + "learning_rate": 1.9065051873922173e-06, + "loss": 0.6914, + "step": 19264 + }, + { + "epoch": 0.49, + "learning_rate": 1.906493504726841e-06, + "loss": 0.9785, + "step": 19265 + }, + { + "epoch": 0.49, + "learning_rate": 1.9064818213674038e-06, + "loss": 1.0049, + "step": 19266 + }, + { + "epoch": 0.49, + "learning_rate": 1.9064701373139154e-06, + "loss": 0.8398, + "step": 19267 + }, + { + "epoch": 0.49, + "learning_rate": 1.9064584525663844e-06, + "loss": 0.96, + "step": 19268 + }, + { + "epoch": 0.49, + "learning_rate": 1.9064467671248198e-06, + "loss": 0.6514, + "step": 19269 + }, + { + "epoch": 0.49, + "learning_rate": 1.906435080989231e-06, + "loss": 1.1357, + "step": 19270 + }, + { + "epoch": 0.49, + "learning_rate": 1.906423394159626e-06, + "loss": 1.0156, + "step": 19271 + }, + { + "epoch": 0.49, + "learning_rate": 1.9064117066360146e-06, + "loss": 0.8613, + "step": 19272 + }, + { + "epoch": 0.49, + "learning_rate": 1.9064000184184052e-06, + "loss": 1.0205, + "step": 19273 + }, + { + "epoch": 0.49, + "learning_rate": 1.9063883295068073e-06, + "loss": 0.7671, + "step": 19274 + }, + { + "epoch": 0.49, + "learning_rate": 1.9063766399012292e-06, + "loss": 0.9736, + "step": 19275 + }, + { + "epoch": 0.49, + "learning_rate": 1.9063649496016802e-06, + "loss": 0.7466, + "step": 19276 + }, + { + "epoch": 0.49, + "learning_rate": 1.9063532586081696e-06, + "loss": 1.0117, + "step": 19277 + }, + { + "epoch": 0.49, + "learning_rate": 1.9063415669207056e-06, + "loss": 0.5664, + "step": 19278 + }, + { + "epoch": 0.49, + "learning_rate": 1.9063298745392976e-06, + "loss": 0.6865, + "step": 19279 + }, + { + "epoch": 0.49, + "learning_rate": 1.906318181463955e-06, + "loss": 0.9502, + "step": 19280 + }, + { + "epoch": 0.49, + "learning_rate": 1.9063064876946858e-06, + "loss": 0.7378, + "step": 19281 + }, + { + "epoch": 0.49, + "learning_rate": 1.9062947932314993e-06, + "loss": 1.2812, + "step": 19282 + }, + { + "epoch": 0.49, + "learning_rate": 1.9062830980744046e-06, + "loss": 0.9287, + "step": 19283 + }, + { + "epoch": 0.49, + "learning_rate": 1.9062714022234107e-06, + "loss": 0.877, + "step": 19284 + }, + { + "epoch": 0.49, + "learning_rate": 1.9062597056785267e-06, + "loss": 0.959, + "step": 19285 + }, + { + "epoch": 0.49, + "learning_rate": 1.9062480084397608e-06, + "loss": 0.9668, + "step": 19286 + }, + { + "epoch": 0.49, + "learning_rate": 1.9062363105071227e-06, + "loss": 0.8379, + "step": 19287 + }, + { + "epoch": 0.49, + "learning_rate": 1.906224611880621e-06, + "loss": 0.8677, + "step": 19288 + }, + { + "epoch": 0.49, + "learning_rate": 1.906212912560265e-06, + "loss": 0.9365, + "step": 19289 + }, + { + "epoch": 0.49, + "learning_rate": 1.9062012125460635e-06, + "loss": 0.9736, + "step": 19290 + }, + { + "epoch": 0.49, + "learning_rate": 1.9061895118380252e-06, + "loss": 1.0771, + "step": 19291 + }, + { + "epoch": 0.49, + "learning_rate": 1.9061778104361595e-06, + "loss": 1.2012, + "step": 19292 + }, + { + "epoch": 0.49, + "learning_rate": 1.9061661083404748e-06, + "loss": 0.7017, + "step": 19293 + }, + { + "epoch": 0.49, + "learning_rate": 1.9061544055509807e-06, + "loss": 0.8857, + "step": 19294 + }, + { + "epoch": 0.49, + "learning_rate": 1.9061427020676855e-06, + "loss": 0.8135, + "step": 19295 + }, + { + "epoch": 0.49, + "learning_rate": 1.9061309978905986e-06, + "loss": 0.7913, + "step": 19296 + }, + { + "epoch": 0.49, + "learning_rate": 1.906119293019729e-06, + "loss": 0.8677, + "step": 19297 + }, + { + "epoch": 0.49, + "learning_rate": 1.9061075874550853e-06, + "loss": 0.9668, + "step": 19298 + }, + { + "epoch": 0.49, + "learning_rate": 1.906095881196677e-06, + "loss": 1.0557, + "step": 19299 + }, + { + "epoch": 0.49, + "learning_rate": 1.9060841742445124e-06, + "loss": 1.0127, + "step": 19300 + }, + { + "epoch": 0.49, + "learning_rate": 1.906072466598601e-06, + "loss": 0.7363, + "step": 19301 + }, + { + "epoch": 0.49, + "learning_rate": 1.9060607582589515e-06, + "loss": 0.9014, + "step": 19302 + }, + { + "epoch": 0.49, + "learning_rate": 1.9060490492255731e-06, + "loss": 0.8525, + "step": 19303 + }, + { + "epoch": 0.49, + "learning_rate": 1.9060373394984745e-06, + "loss": 0.5879, + "step": 19304 + }, + { + "epoch": 0.49, + "learning_rate": 1.9060256290776646e-06, + "loss": 0.8896, + "step": 19305 + }, + { + "epoch": 0.49, + "learning_rate": 1.906013917963153e-06, + "loss": 0.7754, + "step": 19306 + }, + { + "epoch": 0.49, + "learning_rate": 1.9060022061549477e-06, + "loss": 0.7373, + "step": 19307 + }, + { + "epoch": 0.49, + "learning_rate": 1.9059904936530584e-06, + "loss": 0.6445, + "step": 19308 + }, + { + "epoch": 0.49, + "learning_rate": 1.9059787804574939e-06, + "loss": 1.0361, + "step": 19309 + }, + { + "epoch": 0.49, + "learning_rate": 1.905967066568263e-06, + "loss": 0.9189, + "step": 19310 + }, + { + "epoch": 0.49, + "learning_rate": 1.9059553519853748e-06, + "loss": 0.8057, + "step": 19311 + }, + { + "epoch": 0.49, + "learning_rate": 1.9059436367088382e-06, + "loss": 1.0391, + "step": 19312 + }, + { + "epoch": 0.5, + "learning_rate": 1.9059319207386623e-06, + "loss": 0.8184, + "step": 19313 + }, + { + "epoch": 0.5, + "learning_rate": 1.9059202040748562e-06, + "loss": 1.1543, + "step": 19314 + }, + { + "epoch": 0.5, + "learning_rate": 1.9059084867174281e-06, + "loss": 0.7529, + "step": 19315 + }, + { + "epoch": 0.5, + "learning_rate": 1.9058967686663879e-06, + "loss": 0.9717, + "step": 19316 + }, + { + "epoch": 0.5, + "learning_rate": 1.9058850499217441e-06, + "loss": 0.8274, + "step": 19317 + }, + { + "epoch": 0.5, + "learning_rate": 1.9058733304835057e-06, + "loss": 0.9443, + "step": 19318 + }, + { + "epoch": 0.5, + "learning_rate": 1.9058616103516818e-06, + "loss": 0.8193, + "step": 19319 + }, + { + "epoch": 0.5, + "learning_rate": 1.9058498895262813e-06, + "loss": 0.916, + "step": 19320 + }, + { + "epoch": 0.5, + "learning_rate": 1.9058381680073135e-06, + "loss": 1.0117, + "step": 19321 + }, + { + "epoch": 0.5, + "learning_rate": 1.9058264457947866e-06, + "loss": 0.8135, + "step": 19322 + }, + { + "epoch": 0.5, + "learning_rate": 1.9058147228887104e-06, + "loss": 0.585, + "step": 19323 + }, + { + "epoch": 0.5, + "learning_rate": 1.9058029992890932e-06, + "loss": 1.124, + "step": 19324 + }, + { + "epoch": 0.5, + "learning_rate": 1.9057912749959447e-06, + "loss": 0.7998, + "step": 19325 + }, + { + "epoch": 0.5, + "learning_rate": 1.905779550009273e-06, + "loss": 1.0547, + "step": 19326 + }, + { + "epoch": 0.5, + "learning_rate": 1.905767824329088e-06, + "loss": 0.7217, + "step": 19327 + }, + { + "epoch": 0.5, + "learning_rate": 1.905756097955398e-06, + "loss": 1.0059, + "step": 19328 + }, + { + "epoch": 0.5, + "learning_rate": 1.905744370888212e-06, + "loss": 0.8325, + "step": 19329 + }, + { + "epoch": 0.5, + "learning_rate": 1.9057326431275396e-06, + "loss": 1.0469, + "step": 19330 + }, + { + "epoch": 0.5, + "learning_rate": 1.905720914673389e-06, + "loss": 0.8809, + "step": 19331 + }, + { + "epoch": 0.5, + "learning_rate": 1.9057091855257696e-06, + "loss": 0.8921, + "step": 19332 + }, + { + "epoch": 0.5, + "learning_rate": 1.9056974556846906e-06, + "loss": 0.8638, + "step": 19333 + }, + { + "epoch": 0.5, + "learning_rate": 1.9056857251501603e-06, + "loss": 1.0078, + "step": 19334 + }, + { + "epoch": 0.5, + "learning_rate": 1.9056739939221887e-06, + "loss": 1.0283, + "step": 19335 + }, + { + "epoch": 0.5, + "learning_rate": 1.9056622620007836e-06, + "loss": 0.7715, + "step": 19336 + }, + { + "epoch": 0.5, + "learning_rate": 1.9056505293859546e-06, + "loss": 0.7822, + "step": 19337 + }, + { + "epoch": 0.5, + "learning_rate": 1.905638796077711e-06, + "loss": 0.7939, + "step": 19338 + }, + { + "epoch": 0.5, + "learning_rate": 1.9056270620760612e-06, + "loss": 0.7617, + "step": 19339 + }, + { + "epoch": 0.5, + "learning_rate": 1.9056153273810143e-06, + "loss": 0.6411, + "step": 19340 + }, + { + "epoch": 0.5, + "learning_rate": 1.9056035919925793e-06, + "loss": 0.958, + "step": 19341 + }, + { + "epoch": 0.5, + "learning_rate": 1.9055918559107656e-06, + "loss": 1.0537, + "step": 19342 + }, + { + "epoch": 0.5, + "learning_rate": 1.9055801191355814e-06, + "loss": 1.0605, + "step": 19343 + }, + { + "epoch": 0.5, + "learning_rate": 1.9055683816670365e-06, + "loss": 0.8262, + "step": 19344 + }, + { + "epoch": 0.5, + "learning_rate": 1.9055566435051395e-06, + "loss": 0.75, + "step": 19345 + }, + { + "epoch": 0.5, + "learning_rate": 1.9055449046498992e-06, + "loss": 1.0039, + "step": 19346 + }, + { + "epoch": 0.5, + "learning_rate": 1.9055331651013252e-06, + "loss": 0.9014, + "step": 19347 + }, + { + "epoch": 0.5, + "learning_rate": 1.905521424859426e-06, + "loss": 0.7402, + "step": 19348 + }, + { + "epoch": 0.5, + "learning_rate": 1.9055096839242104e-06, + "loss": 0.7939, + "step": 19349 + }, + { + "epoch": 0.5, + "learning_rate": 1.9054979422956875e-06, + "loss": 1.1572, + "step": 19350 + }, + { + "epoch": 0.5, + "learning_rate": 1.905486199973867e-06, + "loss": 0.9863, + "step": 19351 + }, + { + "epoch": 0.5, + "learning_rate": 1.9054744569587573e-06, + "loss": 0.6938, + "step": 19352 + }, + { + "epoch": 0.5, + "learning_rate": 1.905462713250367e-06, + "loss": 0.8682, + "step": 19353 + }, + { + "epoch": 0.5, + "learning_rate": 1.9054509688487059e-06, + "loss": 0.6558, + "step": 19354 + }, + { + "epoch": 0.5, + "learning_rate": 1.9054392237537825e-06, + "loss": 0.7793, + "step": 19355 + }, + { + "epoch": 0.5, + "learning_rate": 1.9054274779656062e-06, + "loss": 1.0449, + "step": 19356 + }, + { + "epoch": 0.5, + "learning_rate": 1.9054157314841852e-06, + "loss": 0.8867, + "step": 19357 + }, + { + "epoch": 0.5, + "learning_rate": 1.9054039843095296e-06, + "loss": 1.0303, + "step": 19358 + }, + { + "epoch": 0.5, + "learning_rate": 1.9053922364416472e-06, + "loss": 0.8984, + "step": 19359 + }, + { + "epoch": 0.5, + "learning_rate": 1.905380487880548e-06, + "loss": 0.9932, + "step": 19360 + }, + { + "epoch": 0.5, + "learning_rate": 1.9053687386262406e-06, + "loss": 0.9424, + "step": 19361 + }, + { + "epoch": 0.5, + "learning_rate": 1.9053569886787337e-06, + "loss": 0.9688, + "step": 19362 + }, + { + "epoch": 0.5, + "learning_rate": 1.9053452380380368e-06, + "loss": 1.084, + "step": 19363 + }, + { + "epoch": 0.5, + "learning_rate": 1.9053334867041583e-06, + "loss": 1.1182, + "step": 19364 + }, + { + "epoch": 0.5, + "learning_rate": 1.9053217346771082e-06, + "loss": 0.8838, + "step": 19365 + }, + { + "epoch": 0.5, + "learning_rate": 1.9053099819568945e-06, + "loss": 0.959, + "step": 19366 + }, + { + "epoch": 0.5, + "learning_rate": 1.9052982285435266e-06, + "loss": 0.9126, + "step": 19367 + }, + { + "epoch": 0.5, + "learning_rate": 1.9052864744370134e-06, + "loss": 1.04, + "step": 19368 + }, + { + "epoch": 0.5, + "learning_rate": 1.9052747196373642e-06, + "loss": 0.7891, + "step": 19369 + }, + { + "epoch": 0.5, + "learning_rate": 1.9052629641445876e-06, + "loss": 0.8867, + "step": 19370 + }, + { + "epoch": 0.5, + "learning_rate": 1.9052512079586932e-06, + "loss": 0.812, + "step": 19371 + }, + { + "epoch": 0.5, + "learning_rate": 1.905239451079689e-06, + "loss": 0.749, + "step": 19372 + }, + { + "epoch": 0.5, + "learning_rate": 1.9052276935075847e-06, + "loss": 1.0654, + "step": 19373 + }, + { + "epoch": 0.5, + "learning_rate": 1.9052159352423894e-06, + "loss": 0.9805, + "step": 19374 + }, + { + "epoch": 0.5, + "learning_rate": 1.9052041762841115e-06, + "loss": 0.9146, + "step": 19375 + }, + { + "epoch": 0.5, + "learning_rate": 1.9051924166327607e-06, + "loss": 0.8516, + "step": 19376 + }, + { + "epoch": 0.5, + "learning_rate": 1.9051806562883456e-06, + "loss": 0.9414, + "step": 19377 + }, + { + "epoch": 0.5, + "learning_rate": 1.9051688952508754e-06, + "loss": 1.0078, + "step": 19378 + }, + { + "epoch": 0.5, + "learning_rate": 1.9051571335203588e-06, + "loss": 0.8145, + "step": 19379 + }, + { + "epoch": 0.5, + "learning_rate": 1.9051453710968052e-06, + "loss": 0.6458, + "step": 19380 + }, + { + "epoch": 0.5, + "learning_rate": 1.9051336079802234e-06, + "loss": 0.9043, + "step": 19381 + }, + { + "epoch": 0.5, + "learning_rate": 1.9051218441706223e-06, + "loss": 0.8237, + "step": 19382 + }, + { + "epoch": 0.5, + "learning_rate": 1.905110079668011e-06, + "loss": 0.7871, + "step": 19383 + }, + { + "epoch": 0.5, + "learning_rate": 1.9050983144723987e-06, + "loss": 0.918, + "step": 19384 + }, + { + "epoch": 0.5, + "learning_rate": 1.905086548583794e-06, + "loss": 0.8662, + "step": 19385 + }, + { + "epoch": 0.5, + "learning_rate": 1.9050747820022063e-06, + "loss": 0.8555, + "step": 19386 + }, + { + "epoch": 0.5, + "learning_rate": 1.9050630147276446e-06, + "loss": 0.8818, + "step": 19387 + }, + { + "epoch": 0.5, + "learning_rate": 1.9050512467601174e-06, + "loss": 1.0117, + "step": 19388 + }, + { + "epoch": 0.5, + "learning_rate": 1.9050394780996344e-06, + "loss": 0.7549, + "step": 19389 + }, + { + "epoch": 0.5, + "learning_rate": 1.9050277087462042e-06, + "loss": 1.1318, + "step": 19390 + }, + { + "epoch": 0.5, + "learning_rate": 1.9050159386998358e-06, + "loss": 0.7656, + "step": 19391 + }, + { + "epoch": 0.5, + "learning_rate": 1.9050041679605383e-06, + "loss": 0.8193, + "step": 19392 + }, + { + "epoch": 0.5, + "learning_rate": 1.9049923965283208e-06, + "loss": 0.7969, + "step": 19393 + }, + { + "epoch": 0.5, + "learning_rate": 1.9049806244031923e-06, + "loss": 0.8252, + "step": 19394 + }, + { + "epoch": 0.5, + "learning_rate": 1.9049688515851617e-06, + "loss": 0.7939, + "step": 19395 + }, + { + "epoch": 0.5, + "learning_rate": 1.904957078074238e-06, + "loss": 0.8643, + "step": 19396 + }, + { + "epoch": 0.5, + "learning_rate": 1.9049453038704302e-06, + "loss": 0.9043, + "step": 19397 + }, + { + "epoch": 0.5, + "learning_rate": 1.9049335289737476e-06, + "loss": 0.8057, + "step": 19398 + }, + { + "epoch": 0.5, + "learning_rate": 1.9049217533841989e-06, + "loss": 0.959, + "step": 19399 + }, + { + "epoch": 0.5, + "learning_rate": 1.904909977101793e-06, + "loss": 0.8877, + "step": 19400 + }, + { + "epoch": 0.5, + "learning_rate": 1.9048982001265395e-06, + "loss": 0.8896, + "step": 19401 + }, + { + "epoch": 0.5, + "learning_rate": 1.9048864224584469e-06, + "loss": 0.8037, + "step": 19402 + }, + { + "epoch": 0.5, + "learning_rate": 1.9048746440975245e-06, + "loss": 0.7642, + "step": 19403 + }, + { + "epoch": 0.5, + "learning_rate": 1.904862865043781e-06, + "loss": 0.7241, + "step": 19404 + }, + { + "epoch": 0.5, + "learning_rate": 1.9048510852972256e-06, + "loss": 0.8359, + "step": 19405 + }, + { + "epoch": 0.5, + "learning_rate": 1.9048393048578676e-06, + "loss": 1.0957, + "step": 19406 + }, + { + "epoch": 0.5, + "learning_rate": 1.9048275237257155e-06, + "loss": 0.9502, + "step": 19407 + }, + { + "epoch": 0.5, + "learning_rate": 1.9048157419007787e-06, + "loss": 0.7432, + "step": 19408 + }, + { + "epoch": 0.5, + "learning_rate": 1.904803959383066e-06, + "loss": 0.8506, + "step": 19409 + }, + { + "epoch": 0.5, + "learning_rate": 1.9047921761725867e-06, + "loss": 0.7783, + "step": 19410 + }, + { + "epoch": 0.5, + "learning_rate": 1.9047803922693495e-06, + "loss": 0.9854, + "step": 19411 + }, + { + "epoch": 0.5, + "learning_rate": 1.9047686076733634e-06, + "loss": 0.9023, + "step": 19412 + }, + { + "epoch": 0.5, + "learning_rate": 1.9047568223846377e-06, + "loss": 1.0684, + "step": 19413 + }, + { + "epoch": 0.5, + "learning_rate": 1.9047450364031814e-06, + "loss": 0.8672, + "step": 19414 + }, + { + "epoch": 0.5, + "learning_rate": 1.9047332497290033e-06, + "loss": 0.9668, + "step": 19415 + }, + { + "epoch": 0.5, + "learning_rate": 1.9047214623621126e-06, + "loss": 0.7114, + "step": 19416 + }, + { + "epoch": 0.5, + "learning_rate": 1.9047096743025181e-06, + "loss": 0.729, + "step": 19417 + }, + { + "epoch": 0.5, + "learning_rate": 1.9046978855502294e-06, + "loss": 0.8135, + "step": 19418 + }, + { + "epoch": 0.5, + "learning_rate": 1.904686096105255e-06, + "loss": 0.8643, + "step": 19419 + }, + { + "epoch": 0.5, + "learning_rate": 1.9046743059676039e-06, + "loss": 0.748, + "step": 19420 + }, + { + "epoch": 0.5, + "learning_rate": 1.9046625151372852e-06, + "loss": 0.8643, + "step": 19421 + }, + { + "epoch": 0.5, + "learning_rate": 1.9046507236143081e-06, + "loss": 1.0186, + "step": 19422 + }, + { + "epoch": 0.5, + "learning_rate": 1.9046389313986817e-06, + "loss": 0.8721, + "step": 19423 + }, + { + "epoch": 0.5, + "learning_rate": 1.9046271384904146e-06, + "loss": 0.7588, + "step": 19424 + }, + { + "epoch": 0.5, + "learning_rate": 1.9046153448895166e-06, + "loss": 0.6716, + "step": 19425 + }, + { + "epoch": 0.5, + "learning_rate": 1.9046035505959956e-06, + "loss": 0.8164, + "step": 19426 + }, + { + "epoch": 0.5, + "learning_rate": 1.9045917556098616e-06, + "loss": 0.915, + "step": 19427 + }, + { + "epoch": 0.5, + "learning_rate": 1.9045799599311234e-06, + "loss": 0.8115, + "step": 19428 + }, + { + "epoch": 0.5, + "learning_rate": 1.9045681635597896e-06, + "loss": 1.04, + "step": 19429 + }, + { + "epoch": 0.5, + "learning_rate": 1.9045563664958699e-06, + "loss": 0.7725, + "step": 19430 + }, + { + "epoch": 0.5, + "learning_rate": 1.9045445687393726e-06, + "loss": 0.9307, + "step": 19431 + }, + { + "epoch": 0.5, + "learning_rate": 1.9045327702903074e-06, + "loss": 1.0098, + "step": 19432 + }, + { + "epoch": 0.5, + "learning_rate": 1.904520971148683e-06, + "loss": 0.9668, + "step": 19433 + }, + { + "epoch": 0.5, + "learning_rate": 1.9045091713145083e-06, + "loss": 0.8506, + "step": 19434 + }, + { + "epoch": 0.5, + "learning_rate": 1.9044973707877927e-06, + "loss": 0.7939, + "step": 19435 + }, + { + "epoch": 0.5, + "learning_rate": 1.9044855695685448e-06, + "loss": 0.8896, + "step": 19436 + }, + { + "epoch": 0.5, + "learning_rate": 1.9044737676567743e-06, + "loss": 0.9365, + "step": 19437 + }, + { + "epoch": 0.5, + "learning_rate": 1.9044619650524895e-06, + "loss": 0.9385, + "step": 19438 + }, + { + "epoch": 0.5, + "learning_rate": 1.9044501617557e-06, + "loss": 0.8462, + "step": 19439 + }, + { + "epoch": 0.5, + "learning_rate": 1.9044383577664145e-06, + "loss": 1.0605, + "step": 19440 + }, + { + "epoch": 0.5, + "learning_rate": 1.9044265530846419e-06, + "loss": 1.1279, + "step": 19441 + }, + { + "epoch": 0.5, + "learning_rate": 1.9044147477103919e-06, + "loss": 0.7949, + "step": 19442 + }, + { + "epoch": 0.5, + "learning_rate": 1.904402941643673e-06, + "loss": 0.8379, + "step": 19443 + }, + { + "epoch": 0.5, + "learning_rate": 1.9043911348844942e-06, + "loss": 0.6538, + "step": 19444 + }, + { + "epoch": 0.5, + "learning_rate": 1.9043793274328645e-06, + "loss": 0.959, + "step": 19445 + }, + { + "epoch": 0.5, + "learning_rate": 1.9043675192887933e-06, + "loss": 0.8232, + "step": 19446 + }, + { + "epoch": 0.5, + "learning_rate": 1.9043557104522895e-06, + "loss": 0.8496, + "step": 19447 + }, + { + "epoch": 0.5, + "learning_rate": 1.9043439009233624e-06, + "loss": 0.8047, + "step": 19448 + }, + { + "epoch": 0.5, + "learning_rate": 1.9043320907020206e-06, + "loss": 0.7998, + "step": 19449 + }, + { + "epoch": 0.5, + "learning_rate": 1.9043202797882731e-06, + "loss": 0.8164, + "step": 19450 + }, + { + "epoch": 0.5, + "learning_rate": 1.9043084681821294e-06, + "loss": 0.877, + "step": 19451 + }, + { + "epoch": 0.5, + "learning_rate": 1.904296655883598e-06, + "loss": 0.8701, + "step": 19452 + }, + { + "epoch": 0.5, + "learning_rate": 1.9042848428926884e-06, + "loss": 0.9248, + "step": 19453 + }, + { + "epoch": 0.5, + "learning_rate": 1.9042730292094094e-06, + "loss": 0.8486, + "step": 19454 + }, + { + "epoch": 0.5, + "learning_rate": 1.9042612148337701e-06, + "loss": 0.9248, + "step": 19455 + }, + { + "epoch": 0.5, + "learning_rate": 1.90424939976578e-06, + "loss": 0.8286, + "step": 19456 + }, + { + "epoch": 0.5, + "learning_rate": 1.9042375840054471e-06, + "loss": 1.0615, + "step": 19457 + }, + { + "epoch": 0.5, + "learning_rate": 1.9042257675527814e-06, + "loss": 1.04, + "step": 19458 + }, + { + "epoch": 0.5, + "learning_rate": 1.9042139504077914e-06, + "loss": 0.8604, + "step": 19459 + }, + { + "epoch": 0.5, + "learning_rate": 1.9042021325704867e-06, + "loss": 0.8828, + "step": 19460 + }, + { + "epoch": 0.5, + "learning_rate": 1.9041903140408756e-06, + "loss": 0.9961, + "step": 19461 + }, + { + "epoch": 0.5, + "learning_rate": 1.9041784948189678e-06, + "loss": 1.0947, + "step": 19462 + }, + { + "epoch": 0.5, + "learning_rate": 1.904166674904772e-06, + "loss": 0.6515, + "step": 19463 + }, + { + "epoch": 0.5, + "learning_rate": 1.9041548542982975e-06, + "loss": 1.0566, + "step": 19464 + }, + { + "epoch": 0.5, + "learning_rate": 1.9041430329995532e-06, + "loss": 0.8281, + "step": 19465 + }, + { + "epoch": 0.5, + "learning_rate": 1.904131211008548e-06, + "loss": 0.7354, + "step": 19466 + }, + { + "epoch": 0.5, + "learning_rate": 1.904119388325291e-06, + "loss": 0.8135, + "step": 19467 + }, + { + "epoch": 0.5, + "learning_rate": 1.9041075649497916e-06, + "loss": 0.833, + "step": 19468 + }, + { + "epoch": 0.5, + "learning_rate": 1.9040957408820585e-06, + "loss": 0.6465, + "step": 19469 + }, + { + "epoch": 0.5, + "learning_rate": 1.9040839161221009e-06, + "loss": 0.7185, + "step": 19470 + }, + { + "epoch": 0.5, + "learning_rate": 1.904072090669928e-06, + "loss": 1.04, + "step": 19471 + }, + { + "epoch": 0.5, + "learning_rate": 1.9040602645255483e-06, + "loss": 0.9326, + "step": 19472 + }, + { + "epoch": 0.5, + "learning_rate": 1.9040484376889715e-06, + "loss": 1.0615, + "step": 19473 + }, + { + "epoch": 0.5, + "learning_rate": 1.9040366101602063e-06, + "loss": 0.8242, + "step": 19474 + }, + { + "epoch": 0.5, + "learning_rate": 1.9040247819392618e-06, + "loss": 0.9443, + "step": 19475 + }, + { + "epoch": 0.5, + "learning_rate": 1.904012953026147e-06, + "loss": 0.9619, + "step": 19476 + }, + { + "epoch": 0.5, + "learning_rate": 1.9040011234208712e-06, + "loss": 0.7832, + "step": 19477 + }, + { + "epoch": 0.5, + "learning_rate": 1.9039892931234433e-06, + "loss": 0.9395, + "step": 19478 + }, + { + "epoch": 0.5, + "learning_rate": 1.9039774621338722e-06, + "loss": 0.623, + "step": 19479 + }, + { + "epoch": 0.5, + "learning_rate": 1.903965630452167e-06, + "loss": 0.9028, + "step": 19480 + }, + { + "epoch": 0.5, + "learning_rate": 1.9039537980783376e-06, + "loss": 0.8921, + "step": 19481 + }, + { + "epoch": 0.5, + "learning_rate": 1.9039419650123918e-06, + "loss": 0.8105, + "step": 19482 + }, + { + "epoch": 0.5, + "learning_rate": 1.9039301312543392e-06, + "loss": 0.8887, + "step": 19483 + }, + { + "epoch": 0.5, + "learning_rate": 1.903918296804189e-06, + "loss": 0.9189, + "step": 19484 + }, + { + "epoch": 0.5, + "learning_rate": 1.90390646166195e-06, + "loss": 0.8496, + "step": 19485 + }, + { + "epoch": 0.5, + "learning_rate": 1.9038946258276316e-06, + "loss": 0.6211, + "step": 19486 + }, + { + "epoch": 0.5, + "learning_rate": 1.9038827893012424e-06, + "loss": 0.5706, + "step": 19487 + }, + { + "epoch": 0.5, + "learning_rate": 1.9038709520827917e-06, + "loss": 1.0625, + "step": 19488 + }, + { + "epoch": 0.5, + "learning_rate": 1.9038591141722886e-06, + "loss": 0.9512, + "step": 19489 + }, + { + "epoch": 0.5, + "learning_rate": 1.9038472755697423e-06, + "loss": 0.7988, + "step": 19490 + }, + { + "epoch": 0.5, + "learning_rate": 1.9038354362751617e-06, + "loss": 0.7939, + "step": 19491 + }, + { + "epoch": 0.5, + "learning_rate": 1.9038235962885559e-06, + "loss": 1.0513, + "step": 19492 + }, + { + "epoch": 0.5, + "learning_rate": 1.9038117556099339e-06, + "loss": 0.8574, + "step": 19493 + }, + { + "epoch": 0.5, + "learning_rate": 1.9037999142393044e-06, + "loss": 0.9629, + "step": 19494 + }, + { + "epoch": 0.5, + "learning_rate": 1.9037880721766773e-06, + "loss": 0.7666, + "step": 19495 + }, + { + "epoch": 0.5, + "learning_rate": 1.903776229422061e-06, + "loss": 0.6855, + "step": 19496 + }, + { + "epoch": 0.5, + "learning_rate": 1.9037643859754651e-06, + "loss": 0.792, + "step": 19497 + }, + { + "epoch": 0.5, + "learning_rate": 1.903752541836898e-06, + "loss": 0.6787, + "step": 19498 + }, + { + "epoch": 0.5, + "learning_rate": 1.9037406970063695e-06, + "loss": 0.8848, + "step": 19499 + }, + { + "epoch": 0.5, + "learning_rate": 1.903728851483888e-06, + "loss": 0.8643, + "step": 19500 + }, + { + "epoch": 0.5, + "learning_rate": 1.9037170052694628e-06, + "loss": 0.8652, + "step": 19501 + }, + { + "epoch": 0.5, + "learning_rate": 1.9037051583631035e-06, + "loss": 0.8257, + "step": 19502 + }, + { + "epoch": 0.5, + "learning_rate": 1.9036933107648184e-06, + "loss": 0.9756, + "step": 19503 + }, + { + "epoch": 0.5, + "learning_rate": 1.9036814624746169e-06, + "loss": 1.1123, + "step": 19504 + }, + { + "epoch": 0.5, + "learning_rate": 1.903669613492508e-06, + "loss": 0.7036, + "step": 19505 + }, + { + "epoch": 0.5, + "learning_rate": 1.9036577638185007e-06, + "loss": 0.958, + "step": 19506 + }, + { + "epoch": 0.5, + "learning_rate": 1.9036459134526045e-06, + "loss": 0.916, + "step": 19507 + }, + { + "epoch": 0.5, + "learning_rate": 1.903634062394828e-06, + "loss": 0.9043, + "step": 19508 + }, + { + "epoch": 0.5, + "learning_rate": 1.9036222106451807e-06, + "loss": 0.9082, + "step": 19509 + }, + { + "epoch": 0.5, + "learning_rate": 1.9036103582036711e-06, + "loss": 1.0879, + "step": 19510 + }, + { + "epoch": 0.5, + "learning_rate": 1.9035985050703087e-06, + "loss": 0.9893, + "step": 19511 + }, + { + "epoch": 0.5, + "learning_rate": 1.9035866512451028e-06, + "loss": 0.8662, + "step": 19512 + }, + { + "epoch": 0.5, + "learning_rate": 1.9035747967280618e-06, + "loss": 1.1162, + "step": 19513 + }, + { + "epoch": 0.5, + "learning_rate": 1.9035629415191952e-06, + "loss": 0.8638, + "step": 19514 + }, + { + "epoch": 0.5, + "learning_rate": 1.903551085618512e-06, + "loss": 0.9766, + "step": 19515 + }, + { + "epoch": 0.5, + "learning_rate": 1.9035392290260212e-06, + "loss": 0.7402, + "step": 19516 + }, + { + "epoch": 0.5, + "learning_rate": 1.9035273717417319e-06, + "loss": 0.7788, + "step": 19517 + }, + { + "epoch": 0.5, + "learning_rate": 1.9035155137656535e-06, + "loss": 0.7261, + "step": 19518 + }, + { + "epoch": 0.5, + "learning_rate": 1.9035036550977947e-06, + "loss": 0.8691, + "step": 19519 + }, + { + "epoch": 0.5, + "learning_rate": 1.903491795738165e-06, + "loss": 0.9746, + "step": 19520 + }, + { + "epoch": 0.5, + "learning_rate": 1.9034799356867726e-06, + "loss": 0.8887, + "step": 19521 + }, + { + "epoch": 0.5, + "learning_rate": 1.9034680749436274e-06, + "loss": 0.9912, + "step": 19522 + }, + { + "epoch": 0.5, + "learning_rate": 1.9034562135087385e-06, + "loss": 1.0684, + "step": 19523 + }, + { + "epoch": 0.5, + "learning_rate": 1.9034443513821143e-06, + "loss": 0.751, + "step": 19524 + }, + { + "epoch": 0.5, + "learning_rate": 1.9034324885637646e-06, + "loss": 0.9199, + "step": 19525 + }, + { + "epoch": 0.5, + "learning_rate": 1.9034206250536979e-06, + "loss": 0.8906, + "step": 19526 + }, + { + "epoch": 0.5, + "learning_rate": 1.9034087608519238e-06, + "loss": 0.9678, + "step": 19527 + }, + { + "epoch": 0.5, + "learning_rate": 1.903396895958451e-06, + "loss": 0.7217, + "step": 19528 + }, + { + "epoch": 0.5, + "learning_rate": 1.9033850303732889e-06, + "loss": 0.5991, + "step": 19529 + }, + { + "epoch": 0.5, + "learning_rate": 1.9033731640964463e-06, + "loss": 0.8584, + "step": 19530 + }, + { + "epoch": 0.5, + "learning_rate": 1.9033612971279322e-06, + "loss": 1.248, + "step": 19531 + }, + { + "epoch": 0.5, + "learning_rate": 1.9033494294677563e-06, + "loss": 0.7061, + "step": 19532 + }, + { + "epoch": 0.5, + "learning_rate": 1.903337561115927e-06, + "loss": 0.792, + "step": 19533 + }, + { + "epoch": 0.5, + "learning_rate": 1.903325692072454e-06, + "loss": 0.9355, + "step": 19534 + }, + { + "epoch": 0.5, + "learning_rate": 1.903313822337346e-06, + "loss": 1.0244, + "step": 19535 + }, + { + "epoch": 0.5, + "learning_rate": 1.903301951910612e-06, + "loss": 0.7202, + "step": 19536 + }, + { + "epoch": 0.5, + "learning_rate": 1.903290080792261e-06, + "loss": 1.0625, + "step": 19537 + }, + { + "epoch": 0.5, + "learning_rate": 1.9032782089823026e-06, + "loss": 0.8555, + "step": 19538 + }, + { + "epoch": 0.5, + "learning_rate": 1.9032663364807453e-06, + "loss": 0.8398, + "step": 19539 + }, + { + "epoch": 0.5, + "learning_rate": 1.903254463287599e-06, + "loss": 0.7246, + "step": 19540 + }, + { + "epoch": 0.5, + "learning_rate": 1.9032425894028718e-06, + "loss": 0.7969, + "step": 19541 + }, + { + "epoch": 0.5, + "learning_rate": 1.9032307148265736e-06, + "loss": 0.9092, + "step": 19542 + }, + { + "epoch": 0.5, + "learning_rate": 1.903218839558713e-06, + "loss": 0.7166, + "step": 19543 + }, + { + "epoch": 0.5, + "learning_rate": 1.9032069635992993e-06, + "loss": 1.0049, + "step": 19544 + }, + { + "epoch": 0.5, + "learning_rate": 1.9031950869483417e-06, + "loss": 0.9209, + "step": 19545 + }, + { + "epoch": 0.5, + "learning_rate": 1.903183209605849e-06, + "loss": 0.917, + "step": 19546 + }, + { + "epoch": 0.5, + "learning_rate": 1.9031713315718308e-06, + "loss": 0.8325, + "step": 19547 + }, + { + "epoch": 0.5, + "learning_rate": 1.9031594528462955e-06, + "loss": 0.8354, + "step": 19548 + }, + { + "epoch": 0.5, + "learning_rate": 1.9031475734292525e-06, + "loss": 0.8457, + "step": 19549 + }, + { + "epoch": 0.5, + "learning_rate": 1.903135693320711e-06, + "loss": 0.9062, + "step": 19550 + }, + { + "epoch": 0.5, + "learning_rate": 1.9031238125206799e-06, + "loss": 1.127, + "step": 19551 + }, + { + "epoch": 0.5, + "learning_rate": 1.9031119310291689e-06, + "loss": 0.9111, + "step": 19552 + }, + { + "epoch": 0.5, + "learning_rate": 1.903100048846186e-06, + "loss": 0.7202, + "step": 19553 + }, + { + "epoch": 0.5, + "learning_rate": 1.9030881659717412e-06, + "loss": 0.645, + "step": 19554 + }, + { + "epoch": 0.5, + "learning_rate": 1.9030762824058435e-06, + "loss": 0.8369, + "step": 19555 + }, + { + "epoch": 0.5, + "learning_rate": 1.9030643981485015e-06, + "loss": 0.8159, + "step": 19556 + }, + { + "epoch": 0.5, + "learning_rate": 1.9030525131997247e-06, + "loss": 0.8711, + "step": 19557 + }, + { + "epoch": 0.5, + "learning_rate": 1.9030406275595224e-06, + "loss": 0.8621, + "step": 19558 + }, + { + "epoch": 0.5, + "learning_rate": 1.903028741227903e-06, + "loss": 0.7725, + "step": 19559 + }, + { + "epoch": 0.5, + "learning_rate": 1.903016854204876e-06, + "loss": 1.0, + "step": 19560 + }, + { + "epoch": 0.5, + "learning_rate": 1.9030049664904508e-06, + "loss": 0.8618, + "step": 19561 + }, + { + "epoch": 0.5, + "learning_rate": 1.902993078084636e-06, + "loss": 0.6665, + "step": 19562 + }, + { + "epoch": 0.5, + "learning_rate": 1.9029811889874411e-06, + "loss": 1.1064, + "step": 19563 + }, + { + "epoch": 0.5, + "learning_rate": 1.902969299198875e-06, + "loss": 1.0195, + "step": 19564 + }, + { + "epoch": 0.5, + "learning_rate": 1.9029574087189469e-06, + "loss": 0.7344, + "step": 19565 + }, + { + "epoch": 0.5, + "learning_rate": 1.902945517547666e-06, + "loss": 0.7571, + "step": 19566 + }, + { + "epoch": 0.5, + "learning_rate": 1.9029336256850406e-06, + "loss": 0.7686, + "step": 19567 + }, + { + "epoch": 0.5, + "learning_rate": 1.9029217331310807e-06, + "loss": 0.6494, + "step": 19568 + }, + { + "epoch": 0.5, + "learning_rate": 1.9029098398857955e-06, + "loss": 0.9268, + "step": 19569 + }, + { + "epoch": 0.5, + "learning_rate": 1.9028979459491935e-06, + "loss": 0.9736, + "step": 19570 + }, + { + "epoch": 0.5, + "learning_rate": 1.9028860513212842e-06, + "loss": 1.0273, + "step": 19571 + }, + { + "epoch": 0.5, + "learning_rate": 1.9028741560020762e-06, + "loss": 0.9824, + "step": 19572 + }, + { + "epoch": 0.5, + "learning_rate": 1.9028622599915791e-06, + "loss": 0.8354, + "step": 19573 + }, + { + "epoch": 0.5, + "learning_rate": 1.902850363289802e-06, + "loss": 0.876, + "step": 19574 + }, + { + "epoch": 0.5, + "learning_rate": 1.902838465896754e-06, + "loss": 1.0811, + "step": 19575 + }, + { + "epoch": 0.5, + "learning_rate": 1.9028265678124439e-06, + "loss": 0.8506, + "step": 19576 + }, + { + "epoch": 0.5, + "learning_rate": 1.902814669036881e-06, + "loss": 0.7559, + "step": 19577 + }, + { + "epoch": 0.5, + "learning_rate": 1.9028027695700746e-06, + "loss": 1.0723, + "step": 19578 + }, + { + "epoch": 0.5, + "learning_rate": 1.9027908694120335e-06, + "loss": 0.8115, + "step": 19579 + }, + { + "epoch": 0.5, + "learning_rate": 1.9027789685627672e-06, + "loss": 0.8086, + "step": 19580 + }, + { + "epoch": 0.5, + "learning_rate": 1.9027670670222843e-06, + "loss": 0.9785, + "step": 19581 + }, + { + "epoch": 0.5, + "learning_rate": 1.902755164790594e-06, + "loss": 0.918, + "step": 19582 + }, + { + "epoch": 0.5, + "learning_rate": 1.9027432618677058e-06, + "loss": 0.6802, + "step": 19583 + }, + { + "epoch": 0.5, + "learning_rate": 1.9027313582536286e-06, + "loss": 0.8506, + "step": 19584 + }, + { + "epoch": 0.5, + "learning_rate": 1.9027194539483715e-06, + "loss": 0.8633, + "step": 19585 + }, + { + "epoch": 0.5, + "learning_rate": 1.9027075489519438e-06, + "loss": 0.9463, + "step": 19586 + }, + { + "epoch": 0.5, + "learning_rate": 1.902695643264354e-06, + "loss": 0.6621, + "step": 19587 + }, + { + "epoch": 0.5, + "learning_rate": 1.9026837368856122e-06, + "loss": 0.8066, + "step": 19588 + }, + { + "epoch": 0.5, + "learning_rate": 1.9026718298157264e-06, + "loss": 0.8506, + "step": 19589 + }, + { + "epoch": 0.5, + "learning_rate": 1.9026599220547066e-06, + "loss": 0.834, + "step": 19590 + }, + { + "epoch": 0.5, + "learning_rate": 1.9026480136025615e-06, + "loss": 0.7461, + "step": 19591 + }, + { + "epoch": 0.5, + "learning_rate": 1.9026361044593005e-06, + "loss": 0.7705, + "step": 19592 + }, + { + "epoch": 0.5, + "learning_rate": 1.9026241946249323e-06, + "loss": 0.8975, + "step": 19593 + }, + { + "epoch": 0.5, + "learning_rate": 1.9026122840994665e-06, + "loss": 0.7617, + "step": 19594 + }, + { + "epoch": 0.5, + "learning_rate": 1.9026003728829117e-06, + "loss": 0.9902, + "step": 19595 + }, + { + "epoch": 0.5, + "learning_rate": 1.9025884609752776e-06, + "loss": 0.9482, + "step": 19596 + }, + { + "epoch": 0.5, + "learning_rate": 1.9025765483765727e-06, + "loss": 0.958, + "step": 19597 + }, + { + "epoch": 0.5, + "learning_rate": 1.9025646350868066e-06, + "loss": 1.0967, + "step": 19598 + }, + { + "epoch": 0.5, + "learning_rate": 1.902552721105988e-06, + "loss": 0.8721, + "step": 19599 + }, + { + "epoch": 0.5, + "learning_rate": 1.9025408064341268e-06, + "loss": 0.7822, + "step": 19600 + }, + { + "epoch": 0.5, + "learning_rate": 1.9025288910712313e-06, + "loss": 1.043, + "step": 19601 + }, + { + "epoch": 0.5, + "learning_rate": 1.902516975017311e-06, + "loss": 0.8379, + "step": 19602 + }, + { + "epoch": 0.5, + "learning_rate": 1.902505058272375e-06, + "loss": 0.8281, + "step": 19603 + }, + { + "epoch": 0.5, + "learning_rate": 1.9024931408364324e-06, + "loss": 1.0, + "step": 19604 + }, + { + "epoch": 0.5, + "learning_rate": 1.9024812227094922e-06, + "loss": 0.7642, + "step": 19605 + }, + { + "epoch": 0.5, + "learning_rate": 1.9024693038915635e-06, + "loss": 0.8457, + "step": 19606 + }, + { + "epoch": 0.5, + "learning_rate": 1.9024573843826556e-06, + "loss": 0.9854, + "step": 19607 + }, + { + "epoch": 0.5, + "learning_rate": 1.9024454641827776e-06, + "loss": 0.958, + "step": 19608 + }, + { + "epoch": 0.5, + "learning_rate": 1.9024335432919388e-06, + "loss": 1.0898, + "step": 19609 + }, + { + "epoch": 0.5, + "learning_rate": 1.9024216217101481e-06, + "loss": 0.75, + "step": 19610 + }, + { + "epoch": 0.5, + "learning_rate": 1.9024096994374145e-06, + "loss": 1.0713, + "step": 19611 + }, + { + "epoch": 0.5, + "learning_rate": 1.9023977764737474e-06, + "loss": 0.9023, + "step": 19612 + }, + { + "epoch": 0.5, + "learning_rate": 1.9023858528191557e-06, + "loss": 0.8564, + "step": 19613 + }, + { + "epoch": 0.5, + "learning_rate": 1.9023739284736486e-06, + "loss": 0.9053, + "step": 19614 + }, + { + "epoch": 0.5, + "learning_rate": 1.9023620034372353e-06, + "loss": 0.7607, + "step": 19615 + }, + { + "epoch": 0.5, + "learning_rate": 1.902350077709925e-06, + "loss": 1.002, + "step": 19616 + }, + { + "epoch": 0.5, + "learning_rate": 1.9023381512917268e-06, + "loss": 0.7197, + "step": 19617 + }, + { + "epoch": 0.5, + "learning_rate": 1.9023262241826496e-06, + "loss": 0.7227, + "step": 19618 + }, + { + "epoch": 0.5, + "learning_rate": 1.9023142963827028e-06, + "loss": 1.0479, + "step": 19619 + }, + { + "epoch": 0.5, + "learning_rate": 1.9023023678918954e-06, + "loss": 0.7656, + "step": 19620 + }, + { + "epoch": 0.5, + "learning_rate": 1.9022904387102367e-06, + "loss": 0.6504, + "step": 19621 + }, + { + "epoch": 0.5, + "learning_rate": 1.9022785088377356e-06, + "loss": 0.9546, + "step": 19622 + }, + { + "epoch": 0.5, + "learning_rate": 1.9022665782744013e-06, + "loss": 1.0117, + "step": 19623 + }, + { + "epoch": 0.5, + "learning_rate": 1.902254647020243e-06, + "loss": 0.9814, + "step": 19624 + }, + { + "epoch": 0.5, + "learning_rate": 1.9022427150752697e-06, + "loss": 0.7441, + "step": 19625 + }, + { + "epoch": 0.5, + "learning_rate": 1.9022307824394907e-06, + "loss": 0.752, + "step": 19626 + }, + { + "epoch": 0.5, + "learning_rate": 1.9022188491129153e-06, + "loss": 1.1211, + "step": 19627 + }, + { + "epoch": 0.5, + "learning_rate": 1.9022069150955523e-06, + "loss": 0.9951, + "step": 19628 + }, + { + "epoch": 0.5, + "learning_rate": 1.9021949803874106e-06, + "loss": 0.8848, + "step": 19629 + }, + { + "epoch": 0.5, + "learning_rate": 1.9021830449884998e-06, + "loss": 0.8623, + "step": 19630 + }, + { + "epoch": 0.5, + "learning_rate": 1.9021711088988292e-06, + "loss": 0.96, + "step": 19631 + }, + { + "epoch": 0.5, + "learning_rate": 1.9021591721184077e-06, + "loss": 1.0469, + "step": 19632 + }, + { + "epoch": 0.5, + "learning_rate": 1.9021472346472441e-06, + "loss": 0.9229, + "step": 19633 + }, + { + "epoch": 0.5, + "learning_rate": 1.902135296485348e-06, + "loss": 0.9395, + "step": 19634 + }, + { + "epoch": 0.5, + "learning_rate": 1.9021233576327282e-06, + "loss": 0.6885, + "step": 19635 + }, + { + "epoch": 0.5, + "learning_rate": 1.9021114180893943e-06, + "loss": 0.7764, + "step": 19636 + }, + { + "epoch": 0.5, + "learning_rate": 1.9020994778553551e-06, + "loss": 0.9834, + "step": 19637 + }, + { + "epoch": 0.5, + "learning_rate": 1.9020875369306197e-06, + "loss": 0.918, + "step": 19638 + }, + { + "epoch": 0.5, + "learning_rate": 1.9020755953151975e-06, + "loss": 1.167, + "step": 19639 + }, + { + "epoch": 0.5, + "learning_rate": 1.9020636530090975e-06, + "loss": 1.042, + "step": 19640 + }, + { + "epoch": 0.5, + "learning_rate": 1.9020517100123287e-06, + "loss": 0.9312, + "step": 19641 + }, + { + "epoch": 0.5, + "learning_rate": 1.9020397663249007e-06, + "loss": 1.0674, + "step": 19642 + }, + { + "epoch": 0.5, + "learning_rate": 1.902027821946822e-06, + "loss": 0.6543, + "step": 19643 + }, + { + "epoch": 0.5, + "learning_rate": 1.902015876878102e-06, + "loss": 0.7314, + "step": 19644 + }, + { + "epoch": 0.5, + "learning_rate": 1.9020039311187501e-06, + "loss": 0.7412, + "step": 19645 + }, + { + "epoch": 0.5, + "learning_rate": 1.9019919846687752e-06, + "loss": 0.9243, + "step": 19646 + }, + { + "epoch": 0.5, + "learning_rate": 1.9019800375281867e-06, + "loss": 1.0693, + "step": 19647 + }, + { + "epoch": 0.5, + "learning_rate": 1.9019680896969935e-06, + "loss": 0.6919, + "step": 19648 + }, + { + "epoch": 0.5, + "learning_rate": 1.9019561411752045e-06, + "loss": 0.666, + "step": 19649 + }, + { + "epoch": 0.5, + "learning_rate": 1.9019441919628294e-06, + "loss": 0.8652, + "step": 19650 + }, + { + "epoch": 0.5, + "learning_rate": 1.901932242059877e-06, + "loss": 0.8335, + "step": 19651 + }, + { + "epoch": 0.5, + "learning_rate": 1.9019202914663566e-06, + "loss": 1.0127, + "step": 19652 + }, + { + "epoch": 0.5, + "learning_rate": 1.9019083401822774e-06, + "loss": 0.665, + "step": 19653 + }, + { + "epoch": 0.5, + "learning_rate": 1.9018963882076484e-06, + "loss": 0.8994, + "step": 19654 + }, + { + "epoch": 0.5, + "learning_rate": 1.9018844355424788e-06, + "loss": 0.9521, + "step": 19655 + }, + { + "epoch": 0.5, + "learning_rate": 1.9018724821867776e-06, + "loss": 0.9785, + "step": 19656 + }, + { + "epoch": 0.5, + "learning_rate": 1.9018605281405544e-06, + "loss": 0.9297, + "step": 19657 + }, + { + "epoch": 0.5, + "learning_rate": 1.901848573403818e-06, + "loss": 0.957, + "step": 19658 + }, + { + "epoch": 0.5, + "learning_rate": 1.9018366179765772e-06, + "loss": 0.7139, + "step": 19659 + }, + { + "epoch": 0.5, + "learning_rate": 1.901824661858842e-06, + "loss": 0.9824, + "step": 19660 + }, + { + "epoch": 0.5, + "learning_rate": 1.901812705050621e-06, + "loss": 0.9541, + "step": 19661 + }, + { + "epoch": 0.5, + "learning_rate": 1.9018007475519235e-06, + "loss": 1.0059, + "step": 19662 + }, + { + "epoch": 0.5, + "learning_rate": 1.9017887893627588e-06, + "loss": 1.0264, + "step": 19663 + }, + { + "epoch": 0.5, + "learning_rate": 1.9017768304831357e-06, + "loss": 0.7031, + "step": 19664 + }, + { + "epoch": 0.5, + "learning_rate": 1.9017648709130634e-06, + "loss": 0.9658, + "step": 19665 + }, + { + "epoch": 0.5, + "learning_rate": 1.9017529106525517e-06, + "loss": 0.7822, + "step": 19666 + }, + { + "epoch": 0.5, + "learning_rate": 1.9017409497016085e-06, + "loss": 1.0674, + "step": 19667 + }, + { + "epoch": 0.5, + "learning_rate": 1.9017289880602444e-06, + "loss": 0.8945, + "step": 19668 + }, + { + "epoch": 0.5, + "learning_rate": 1.9017170257284676e-06, + "loss": 0.9141, + "step": 19669 + }, + { + "epoch": 0.5, + "learning_rate": 1.9017050627062877e-06, + "loss": 0.7949, + "step": 19670 + }, + { + "epoch": 0.5, + "learning_rate": 1.9016930989937135e-06, + "loss": 0.9033, + "step": 19671 + }, + { + "epoch": 0.5, + "learning_rate": 1.9016811345907543e-06, + "loss": 0.8247, + "step": 19672 + }, + { + "epoch": 0.5, + "learning_rate": 1.9016691694974197e-06, + "loss": 0.9619, + "step": 19673 + }, + { + "epoch": 0.5, + "learning_rate": 1.901657203713718e-06, + "loss": 0.9062, + "step": 19674 + }, + { + "epoch": 0.5, + "learning_rate": 1.901645237239659e-06, + "loss": 1.0586, + "step": 19675 + }, + { + "epoch": 0.5, + "learning_rate": 1.9016332700752518e-06, + "loss": 0.6936, + "step": 19676 + }, + { + "epoch": 0.5, + "learning_rate": 1.9016213022205055e-06, + "loss": 0.958, + "step": 19677 + }, + { + "epoch": 0.5, + "learning_rate": 1.9016093336754292e-06, + "loss": 0.8828, + "step": 19678 + }, + { + "epoch": 0.5, + "learning_rate": 1.9015973644400318e-06, + "loss": 0.8457, + "step": 19679 + }, + { + "epoch": 0.5, + "learning_rate": 1.9015853945143232e-06, + "loss": 0.7563, + "step": 19680 + }, + { + "epoch": 0.5, + "learning_rate": 1.9015734238983119e-06, + "loss": 0.7524, + "step": 19681 + }, + { + "epoch": 0.5, + "learning_rate": 1.9015614525920073e-06, + "loss": 0.8545, + "step": 19682 + }, + { + "epoch": 0.5, + "learning_rate": 1.9015494805954183e-06, + "loss": 0.6509, + "step": 19683 + }, + { + "epoch": 0.5, + "learning_rate": 1.9015375079085546e-06, + "loss": 0.876, + "step": 19684 + }, + { + "epoch": 0.5, + "learning_rate": 1.901525534531425e-06, + "loss": 0.9766, + "step": 19685 + }, + { + "epoch": 0.5, + "learning_rate": 1.901513560464039e-06, + "loss": 0.8326, + "step": 19686 + }, + { + "epoch": 0.5, + "learning_rate": 1.9015015857064052e-06, + "loss": 0.6709, + "step": 19687 + }, + { + "epoch": 0.5, + "learning_rate": 1.9014896102585332e-06, + "loss": 0.6846, + "step": 19688 + }, + { + "epoch": 0.5, + "learning_rate": 1.9014776341204319e-06, + "loss": 0.729, + "step": 19689 + }, + { + "epoch": 0.5, + "learning_rate": 1.901465657292111e-06, + "loss": 0.7009, + "step": 19690 + }, + { + "epoch": 0.5, + "learning_rate": 1.901453679773579e-06, + "loss": 0.9678, + "step": 19691 + }, + { + "epoch": 0.5, + "learning_rate": 1.9014417015648455e-06, + "loss": 0.8403, + "step": 19692 + }, + { + "epoch": 0.5, + "learning_rate": 1.9014297226659192e-06, + "loss": 0.9141, + "step": 19693 + }, + { + "epoch": 0.5, + "learning_rate": 1.9014177430768102e-06, + "loss": 0.9111, + "step": 19694 + }, + { + "epoch": 0.5, + "learning_rate": 1.9014057627975267e-06, + "loss": 0.8281, + "step": 19695 + }, + { + "epoch": 0.5, + "learning_rate": 1.9013937818280784e-06, + "loss": 0.6279, + "step": 19696 + }, + { + "epoch": 0.5, + "learning_rate": 1.9013818001684742e-06, + "loss": 0.8281, + "step": 19697 + }, + { + "epoch": 0.5, + "learning_rate": 1.9013698178187234e-06, + "loss": 0.9272, + "step": 19698 + }, + { + "epoch": 0.5, + "learning_rate": 1.9013578347788352e-06, + "loss": 0.8887, + "step": 19699 + }, + { + "epoch": 0.5, + "learning_rate": 1.9013458510488188e-06, + "loss": 1.0498, + "step": 19700 + }, + { + "epoch": 0.5, + "learning_rate": 1.9013338666286832e-06, + "loss": 1.0898, + "step": 19701 + }, + { + "epoch": 0.5, + "learning_rate": 1.901321881518438e-06, + "loss": 0.7559, + "step": 19702 + }, + { + "epoch": 0.5, + "learning_rate": 1.901309895718092e-06, + "loss": 0.9893, + "step": 19703 + }, + { + "epoch": 0.51, + "learning_rate": 1.9012979092276541e-06, + "loss": 0.9033, + "step": 19704 + }, + { + "epoch": 0.51, + "learning_rate": 1.9012859220471343e-06, + "loss": 0.6655, + "step": 19705 + }, + { + "epoch": 0.51, + "learning_rate": 1.9012739341765412e-06, + "loss": 0.689, + "step": 19706 + }, + { + "epoch": 0.51, + "learning_rate": 1.9012619456158836e-06, + "loss": 0.8135, + "step": 19707 + }, + { + "epoch": 0.51, + "learning_rate": 1.9012499563651718e-06, + "loss": 0.8105, + "step": 19708 + }, + { + "epoch": 0.51, + "learning_rate": 1.901237966424414e-06, + "loss": 0.8438, + "step": 19709 + }, + { + "epoch": 0.51, + "learning_rate": 1.9012259757936197e-06, + "loss": 0.7505, + "step": 19710 + }, + { + "epoch": 0.51, + "learning_rate": 1.9012139844727986e-06, + "loss": 0.7891, + "step": 19711 + }, + { + "epoch": 0.51, + "learning_rate": 1.901201992461959e-06, + "loss": 0.8994, + "step": 19712 + }, + { + "epoch": 0.51, + "learning_rate": 1.9011899997611103e-06, + "loss": 0.9922, + "step": 19713 + }, + { + "epoch": 0.51, + "learning_rate": 1.9011780063702622e-06, + "loss": 0.9229, + "step": 19714 + }, + { + "epoch": 0.51, + "learning_rate": 1.9011660122894234e-06, + "loss": 0.9766, + "step": 19715 + }, + { + "epoch": 0.51, + "learning_rate": 1.9011540175186032e-06, + "loss": 0.9834, + "step": 19716 + }, + { + "epoch": 0.51, + "learning_rate": 1.9011420220578107e-06, + "loss": 0.9814, + "step": 19717 + }, + { + "epoch": 0.51, + "learning_rate": 1.9011300259070553e-06, + "loss": 0.8154, + "step": 19718 + }, + { + "epoch": 0.51, + "learning_rate": 1.9011180290663461e-06, + "loss": 1.0098, + "step": 19719 + }, + { + "epoch": 0.51, + "learning_rate": 1.9011060315356923e-06, + "loss": 0.8984, + "step": 19720 + }, + { + "epoch": 0.51, + "learning_rate": 1.9010940333151032e-06, + "loss": 1.0605, + "step": 19721 + }, + { + "epoch": 0.51, + "learning_rate": 1.9010820344045876e-06, + "loss": 1.0127, + "step": 19722 + }, + { + "epoch": 0.51, + "learning_rate": 1.901070034804155e-06, + "loss": 0.8564, + "step": 19723 + }, + { + "epoch": 0.51, + "learning_rate": 1.9010580345138143e-06, + "loss": 0.917, + "step": 19724 + }, + { + "epoch": 0.51, + "learning_rate": 1.901046033533575e-06, + "loss": 0.751, + "step": 19725 + }, + { + "epoch": 0.51, + "learning_rate": 1.901034031863446e-06, + "loss": 0.9395, + "step": 19726 + }, + { + "epoch": 0.51, + "learning_rate": 1.901022029503437e-06, + "loss": 1.1064, + "step": 19727 + }, + { + "epoch": 0.51, + "learning_rate": 1.901010026453557e-06, + "loss": 0.7085, + "step": 19728 + }, + { + "epoch": 0.51, + "learning_rate": 1.9009980227138147e-06, + "loss": 0.813, + "step": 19729 + }, + { + "epoch": 0.51, + "learning_rate": 1.90098601828422e-06, + "loss": 0.9448, + "step": 19730 + }, + { + "epoch": 0.51, + "learning_rate": 1.9009740131647813e-06, + "loss": 0.9233, + "step": 19731 + }, + { + "epoch": 0.51, + "learning_rate": 1.9009620073555084e-06, + "loss": 0.8555, + "step": 19732 + }, + { + "epoch": 0.51, + "learning_rate": 1.9009500008564104e-06, + "loss": 0.9062, + "step": 19733 + }, + { + "epoch": 0.51, + "learning_rate": 1.9009379936674962e-06, + "loss": 0.8784, + "step": 19734 + }, + { + "epoch": 0.51, + "learning_rate": 1.9009259857887753e-06, + "loss": 0.7026, + "step": 19735 + }, + { + "epoch": 0.51, + "learning_rate": 1.9009139772202572e-06, + "loss": 1.0039, + "step": 19736 + }, + { + "epoch": 0.51, + "learning_rate": 1.9009019679619502e-06, + "loss": 0.8604, + "step": 19737 + }, + { + "epoch": 0.51, + "learning_rate": 1.900889958013864e-06, + "loss": 0.9521, + "step": 19738 + }, + { + "epoch": 0.51, + "learning_rate": 1.9008779473760081e-06, + "loss": 0.8525, + "step": 19739 + }, + { + "epoch": 0.51, + "learning_rate": 1.9008659360483912e-06, + "loss": 0.8096, + "step": 19740 + }, + { + "epoch": 0.51, + "learning_rate": 1.9008539240310226e-06, + "loss": 0.9443, + "step": 19741 + }, + { + "epoch": 0.51, + "learning_rate": 1.9008419113239115e-06, + "loss": 0.8301, + "step": 19742 + }, + { + "epoch": 0.51, + "learning_rate": 1.9008298979270676e-06, + "loss": 0.8848, + "step": 19743 + }, + { + "epoch": 0.51, + "learning_rate": 1.9008178838404994e-06, + "loss": 1.0625, + "step": 19744 + }, + { + "epoch": 0.51, + "learning_rate": 1.9008058690642162e-06, + "loss": 0.8408, + "step": 19745 + }, + { + "epoch": 0.51, + "learning_rate": 1.9007938535982275e-06, + "loss": 0.6865, + "step": 19746 + }, + { + "epoch": 0.51, + "learning_rate": 1.9007818374425425e-06, + "loss": 0.8296, + "step": 19747 + }, + { + "epoch": 0.51, + "learning_rate": 1.90076982059717e-06, + "loss": 0.958, + "step": 19748 + }, + { + "epoch": 0.51, + "learning_rate": 1.90075780306212e-06, + "loss": 0.9297, + "step": 19749 + }, + { + "epoch": 0.51, + "learning_rate": 1.9007457848374004e-06, + "loss": 0.8359, + "step": 19750 + }, + { + "epoch": 0.51, + "learning_rate": 1.9007337659230216e-06, + "loss": 0.874, + "step": 19751 + }, + { + "epoch": 0.51, + "learning_rate": 1.9007217463189922e-06, + "loss": 0.8486, + "step": 19752 + }, + { + "epoch": 0.51, + "learning_rate": 1.900709726025322e-06, + "loss": 1.1445, + "step": 19753 + }, + { + "epoch": 0.51, + "learning_rate": 1.9006977050420195e-06, + "loss": 0.833, + "step": 19754 + }, + { + "epoch": 0.51, + "learning_rate": 1.9006856833690939e-06, + "loss": 0.7256, + "step": 19755 + }, + { + "epoch": 0.51, + "learning_rate": 1.9006736610065551e-06, + "loss": 1.1074, + "step": 19756 + }, + { + "epoch": 0.51, + "learning_rate": 1.9006616379544119e-06, + "loss": 0.7324, + "step": 19757 + }, + { + "epoch": 0.51, + "learning_rate": 1.900649614212673e-06, + "loss": 0.7705, + "step": 19758 + }, + { + "epoch": 0.51, + "learning_rate": 1.9006375897813487e-06, + "loss": 0.8955, + "step": 19759 + }, + { + "epoch": 0.51, + "learning_rate": 1.9006255646604473e-06, + "loss": 1.084, + "step": 19760 + }, + { + "epoch": 0.51, + "learning_rate": 1.9006135388499781e-06, + "loss": 0.9902, + "step": 19761 + }, + { + "epoch": 0.51, + "learning_rate": 1.900601512349951e-06, + "loss": 0.8838, + "step": 19762 + }, + { + "epoch": 0.51, + "learning_rate": 1.9005894851603746e-06, + "loss": 0.8091, + "step": 19763 + }, + { + "epoch": 0.51, + "learning_rate": 1.900577457281258e-06, + "loss": 0.9395, + "step": 19764 + }, + { + "epoch": 0.51, + "learning_rate": 1.900565428712611e-06, + "loss": 0.8936, + "step": 19765 + }, + { + "epoch": 0.51, + "learning_rate": 1.9005533994544422e-06, + "loss": 1.0068, + "step": 19766 + }, + { + "epoch": 0.51, + "learning_rate": 1.900541369506761e-06, + "loss": 0.9668, + "step": 19767 + }, + { + "epoch": 0.51, + "learning_rate": 1.900529338869577e-06, + "loss": 1.1406, + "step": 19768 + }, + { + "epoch": 0.51, + "learning_rate": 1.9005173075428988e-06, + "loss": 0.7744, + "step": 19769 + }, + { + "epoch": 0.51, + "learning_rate": 1.9005052755267361e-06, + "loss": 0.9355, + "step": 19770 + }, + { + "epoch": 0.51, + "learning_rate": 1.9004932428210978e-06, + "loss": 0.8467, + "step": 19771 + }, + { + "epoch": 0.51, + "learning_rate": 1.9004812094259934e-06, + "loss": 0.9102, + "step": 19772 + }, + { + "epoch": 0.51, + "learning_rate": 1.9004691753414317e-06, + "loss": 1.0947, + "step": 19773 + }, + { + "epoch": 0.51, + "learning_rate": 1.9004571405674223e-06, + "loss": 0.7256, + "step": 19774 + }, + { + "epoch": 0.51, + "learning_rate": 1.9004451051039742e-06, + "loss": 0.6963, + "step": 19775 + }, + { + "epoch": 0.51, + "learning_rate": 1.9004330689510968e-06, + "loss": 0.8223, + "step": 19776 + }, + { + "epoch": 0.51, + "learning_rate": 1.9004210321087992e-06, + "loss": 0.7456, + "step": 19777 + }, + { + "epoch": 0.51, + "learning_rate": 1.9004089945770904e-06, + "loss": 0.8857, + "step": 19778 + }, + { + "epoch": 0.51, + "learning_rate": 1.90039695635598e-06, + "loss": 0.96, + "step": 19779 + }, + { + "epoch": 0.51, + "learning_rate": 1.9003849174454771e-06, + "loss": 0.8555, + "step": 19780 + }, + { + "epoch": 0.51, + "learning_rate": 1.9003728778455907e-06, + "loss": 0.8906, + "step": 19781 + }, + { + "epoch": 0.51, + "learning_rate": 1.9003608375563306e-06, + "loss": 0.8779, + "step": 19782 + }, + { + "epoch": 0.51, + "learning_rate": 1.9003487965777053e-06, + "loss": 0.7559, + "step": 19783 + }, + { + "epoch": 0.51, + "learning_rate": 1.9003367549097241e-06, + "loss": 0.8071, + "step": 19784 + }, + { + "epoch": 0.51, + "learning_rate": 1.9003247125523969e-06, + "loss": 0.7319, + "step": 19785 + }, + { + "epoch": 0.51, + "learning_rate": 1.9003126695057322e-06, + "loss": 1.0225, + "step": 19786 + }, + { + "epoch": 0.51, + "learning_rate": 1.9003006257697394e-06, + "loss": 0.9434, + "step": 19787 + }, + { + "epoch": 0.51, + "learning_rate": 1.9002885813444278e-06, + "loss": 0.5122, + "step": 19788 + }, + { + "epoch": 0.51, + "learning_rate": 1.900276536229807e-06, + "loss": 0.6187, + "step": 19789 + }, + { + "epoch": 0.51, + "learning_rate": 1.9002644904258856e-06, + "loss": 0.959, + "step": 19790 + }, + { + "epoch": 0.51, + "learning_rate": 1.900252443932673e-06, + "loss": 1.083, + "step": 19791 + }, + { + "epoch": 0.51, + "learning_rate": 1.9002403967501786e-06, + "loss": 0.7556, + "step": 19792 + }, + { + "epoch": 0.51, + "learning_rate": 1.9002283488784117e-06, + "loss": 0.8887, + "step": 19793 + }, + { + "epoch": 0.51, + "learning_rate": 1.900216300317381e-06, + "loss": 0.7729, + "step": 19794 + }, + { + "epoch": 0.51, + "learning_rate": 1.9002042510670963e-06, + "loss": 0.9541, + "step": 19795 + }, + { + "epoch": 0.51, + "learning_rate": 1.9001922011275664e-06, + "loss": 0.9443, + "step": 19796 + }, + { + "epoch": 0.51, + "learning_rate": 1.9001801504988008e-06, + "loss": 0.9834, + "step": 19797 + }, + { + "epoch": 0.51, + "learning_rate": 1.9001680991808088e-06, + "loss": 0.7705, + "step": 19798 + }, + { + "epoch": 0.51, + "learning_rate": 1.9001560471735993e-06, + "loss": 0.7988, + "step": 19799 + }, + { + "epoch": 0.51, + "learning_rate": 1.9001439944771817e-06, + "loss": 1.083, + "step": 19800 + }, + { + "epoch": 0.51, + "learning_rate": 1.9001319410915655e-06, + "loss": 0.9717, + "step": 19801 + }, + { + "epoch": 0.51, + "learning_rate": 1.9001198870167595e-06, + "loss": 0.7744, + "step": 19802 + }, + { + "epoch": 0.51, + "learning_rate": 1.9001078322527731e-06, + "loss": 0.8994, + "step": 19803 + }, + { + "epoch": 0.51, + "learning_rate": 1.9000957767996156e-06, + "loss": 0.9971, + "step": 19804 + }, + { + "epoch": 0.51, + "learning_rate": 1.900083720657296e-06, + "loss": 0.6011, + "step": 19805 + }, + { + "epoch": 0.51, + "learning_rate": 1.9000716638258237e-06, + "loss": 0.8203, + "step": 19806 + }, + { + "epoch": 0.51, + "learning_rate": 1.9000596063052078e-06, + "loss": 0.7744, + "step": 19807 + }, + { + "epoch": 0.51, + "learning_rate": 1.9000475480954576e-06, + "loss": 0.9756, + "step": 19808 + }, + { + "epoch": 0.51, + "learning_rate": 1.9000354891965827e-06, + "loss": 0.8027, + "step": 19809 + }, + { + "epoch": 0.51, + "learning_rate": 1.9000234296085917e-06, + "loss": 0.8281, + "step": 19810 + }, + { + "epoch": 0.51, + "learning_rate": 1.9000113693314945e-06, + "loss": 1.0088, + "step": 19811 + }, + { + "epoch": 0.51, + "learning_rate": 1.8999993083653e-06, + "loss": 0.8799, + "step": 19812 + }, + { + "epoch": 0.51, + "learning_rate": 1.899987246710017e-06, + "loss": 0.9746, + "step": 19813 + }, + { + "epoch": 0.51, + "learning_rate": 1.8999751843656554e-06, + "loss": 0.6807, + "step": 19814 + }, + { + "epoch": 0.51, + "learning_rate": 1.8999631213322243e-06, + "loss": 1.0205, + "step": 19815 + }, + { + "epoch": 0.51, + "learning_rate": 1.8999510576097327e-06, + "loss": 1.0713, + "step": 19816 + }, + { + "epoch": 0.51, + "learning_rate": 1.8999389931981897e-06, + "loss": 0.9014, + "step": 19817 + }, + { + "epoch": 0.51, + "learning_rate": 1.8999269280976052e-06, + "loss": 0.8926, + "step": 19818 + }, + { + "epoch": 0.51, + "learning_rate": 1.8999148623079875e-06, + "loss": 0.8506, + "step": 19819 + }, + { + "epoch": 0.51, + "learning_rate": 1.8999027958293468e-06, + "loss": 0.9492, + "step": 19820 + }, + { + "epoch": 0.51, + "learning_rate": 1.8998907286616918e-06, + "loss": 0.7583, + "step": 19821 + }, + { + "epoch": 0.51, + "learning_rate": 1.8998786608050319e-06, + "loss": 0.8643, + "step": 19822 + }, + { + "epoch": 0.51, + "learning_rate": 1.8998665922593765e-06, + "loss": 0.7891, + "step": 19823 + }, + { + "epoch": 0.51, + "learning_rate": 1.8998545230247341e-06, + "loss": 0.7734, + "step": 19824 + }, + { + "epoch": 0.51, + "learning_rate": 1.8998424531011147e-06, + "loss": 0.7329, + "step": 19825 + }, + { + "epoch": 0.51, + "learning_rate": 1.8998303824885276e-06, + "loss": 0.9482, + "step": 19826 + }, + { + "epoch": 0.51, + "learning_rate": 1.8998183111869813e-06, + "loss": 0.7275, + "step": 19827 + }, + { + "epoch": 0.51, + "learning_rate": 1.8998062391964857e-06, + "loss": 0.8271, + "step": 19828 + }, + { + "epoch": 0.51, + "learning_rate": 1.8997941665170499e-06, + "loss": 0.8252, + "step": 19829 + }, + { + "epoch": 0.51, + "learning_rate": 1.899782093148683e-06, + "loss": 0.7383, + "step": 19830 + }, + { + "epoch": 0.51, + "learning_rate": 1.8997700190913944e-06, + "loss": 0.8877, + "step": 19831 + }, + { + "epoch": 0.51, + "learning_rate": 1.8997579443451932e-06, + "loss": 0.8105, + "step": 19832 + }, + { + "epoch": 0.51, + "learning_rate": 1.8997458689100886e-06, + "loss": 0.8379, + "step": 19833 + }, + { + "epoch": 0.51, + "learning_rate": 1.8997337927860902e-06, + "loss": 0.6055, + "step": 19834 + }, + { + "epoch": 0.51, + "learning_rate": 1.8997217159732069e-06, + "loss": 0.9736, + "step": 19835 + }, + { + "epoch": 0.51, + "learning_rate": 1.899709638471448e-06, + "loss": 0.5518, + "step": 19836 + }, + { + "epoch": 0.51, + "learning_rate": 1.8996975602808228e-06, + "loss": 0.8408, + "step": 19837 + }, + { + "epoch": 0.51, + "learning_rate": 1.8996854814013405e-06, + "loss": 0.8301, + "step": 19838 + }, + { + "epoch": 0.51, + "learning_rate": 1.8996734018330107e-06, + "loss": 1.1445, + "step": 19839 + }, + { + "epoch": 0.51, + "learning_rate": 1.899661321575842e-06, + "loss": 0.8232, + "step": 19840 + }, + { + "epoch": 0.51, + "learning_rate": 1.899649240629844e-06, + "loss": 0.9453, + "step": 19841 + }, + { + "epoch": 0.51, + "learning_rate": 1.8996371589950262e-06, + "loss": 1.0146, + "step": 19842 + }, + { + "epoch": 0.51, + "learning_rate": 1.8996250766713974e-06, + "loss": 0.8564, + "step": 19843 + }, + { + "epoch": 0.51, + "learning_rate": 1.899612993658967e-06, + "loss": 0.7793, + "step": 19844 + }, + { + "epoch": 0.51, + "learning_rate": 1.8996009099577446e-06, + "loss": 0.7861, + "step": 19845 + }, + { + "epoch": 0.51, + "learning_rate": 1.899588825567739e-06, + "loss": 1.0117, + "step": 19846 + }, + { + "epoch": 0.51, + "learning_rate": 1.8995767404889596e-06, + "loss": 0.9766, + "step": 19847 + }, + { + "epoch": 0.51, + "learning_rate": 1.8995646547214155e-06, + "loss": 0.7881, + "step": 19848 + }, + { + "epoch": 0.51, + "learning_rate": 1.8995525682651161e-06, + "loss": 0.7812, + "step": 19849 + }, + { + "epoch": 0.51, + "learning_rate": 1.899540481120071e-06, + "loss": 0.9697, + "step": 19850 + }, + { + "epoch": 0.51, + "learning_rate": 1.8995283932862886e-06, + "loss": 0.8652, + "step": 19851 + }, + { + "epoch": 0.51, + "learning_rate": 1.8995163047637792e-06, + "loss": 0.8184, + "step": 19852 + }, + { + "epoch": 0.51, + "learning_rate": 1.899504215552551e-06, + "loss": 0.9277, + "step": 19853 + }, + { + "epoch": 0.51, + "learning_rate": 1.8994921256526142e-06, + "loss": 0.8428, + "step": 19854 + }, + { + "epoch": 0.51, + "learning_rate": 1.8994800350639775e-06, + "loss": 0.8379, + "step": 19855 + }, + { + "epoch": 0.51, + "learning_rate": 1.8994679437866504e-06, + "loss": 0.8008, + "step": 19856 + }, + { + "epoch": 0.51, + "learning_rate": 1.8994558518206418e-06, + "loss": 0.7822, + "step": 19857 + }, + { + "epoch": 0.51, + "learning_rate": 1.8994437591659613e-06, + "loss": 0.7646, + "step": 19858 + }, + { + "epoch": 0.51, + "learning_rate": 1.8994316658226182e-06, + "loss": 0.8525, + "step": 19859 + }, + { + "epoch": 0.51, + "learning_rate": 1.8994195717906215e-06, + "loss": 0.8828, + "step": 19860 + }, + { + "epoch": 0.51, + "learning_rate": 1.899407477069981e-06, + "loss": 0.8516, + "step": 19861 + }, + { + "epoch": 0.51, + "learning_rate": 1.8993953816607048e-06, + "loss": 0.9873, + "step": 19862 + }, + { + "epoch": 0.51, + "learning_rate": 1.8993832855628034e-06, + "loss": 0.9355, + "step": 19863 + }, + { + "epoch": 0.51, + "learning_rate": 1.8993711887762856e-06, + "loss": 0.9814, + "step": 19864 + }, + { + "epoch": 0.51, + "learning_rate": 1.8993590913011604e-06, + "loss": 1.1123, + "step": 19865 + }, + { + "epoch": 0.51, + "learning_rate": 1.8993469931374375e-06, + "loss": 0.6426, + "step": 19866 + }, + { + "epoch": 0.51, + "learning_rate": 1.899334894285126e-06, + "loss": 0.7759, + "step": 19867 + }, + { + "epoch": 0.51, + "learning_rate": 1.899322794744235e-06, + "loss": 0.8457, + "step": 19868 + }, + { + "epoch": 0.51, + "learning_rate": 1.899310694514774e-06, + "loss": 0.9736, + "step": 19869 + }, + { + "epoch": 0.51, + "learning_rate": 1.899298593596752e-06, + "loss": 1.0049, + "step": 19870 + }, + { + "epoch": 0.51, + "learning_rate": 1.8992864919901783e-06, + "loss": 0.7983, + "step": 19871 + }, + { + "epoch": 0.51, + "learning_rate": 1.8992743896950625e-06, + "loss": 0.9268, + "step": 19872 + }, + { + "epoch": 0.51, + "learning_rate": 1.8992622867114136e-06, + "loss": 0.8965, + "step": 19873 + }, + { + "epoch": 0.51, + "learning_rate": 1.899250183039241e-06, + "loss": 0.8936, + "step": 19874 + }, + { + "epoch": 0.51, + "learning_rate": 1.8992380786785539e-06, + "loss": 0.7397, + "step": 19875 + }, + { + "epoch": 0.51, + "learning_rate": 1.8992259736293614e-06, + "loss": 0.9248, + "step": 19876 + }, + { + "epoch": 0.51, + "learning_rate": 1.8992138678916726e-06, + "loss": 0.873, + "step": 19877 + }, + { + "epoch": 0.51, + "learning_rate": 1.8992017614654979e-06, + "loss": 0.8521, + "step": 19878 + }, + { + "epoch": 0.51, + "learning_rate": 1.8991896543508452e-06, + "loss": 0.8467, + "step": 19879 + }, + { + "epoch": 0.51, + "learning_rate": 1.8991775465477241e-06, + "loss": 0.6895, + "step": 19880 + }, + { + "epoch": 0.51, + "learning_rate": 1.8991654380561447e-06, + "loss": 0.8467, + "step": 19881 + }, + { + "epoch": 0.51, + "learning_rate": 1.8991533288761155e-06, + "loss": 0.8125, + "step": 19882 + }, + { + "epoch": 0.51, + "learning_rate": 1.8991412190076458e-06, + "loss": 0.5681, + "step": 19883 + }, + { + "epoch": 0.51, + "learning_rate": 1.899129108450745e-06, + "loss": 0.8711, + "step": 19884 + }, + { + "epoch": 0.51, + "learning_rate": 1.8991169972054223e-06, + "loss": 0.8994, + "step": 19885 + }, + { + "epoch": 0.51, + "learning_rate": 1.8991048852716873e-06, + "loss": 0.918, + "step": 19886 + }, + { + "epoch": 0.51, + "learning_rate": 1.8990927726495491e-06, + "loss": 0.7832, + "step": 19887 + }, + { + "epoch": 0.51, + "learning_rate": 1.8990806593390167e-06, + "loss": 0.6689, + "step": 19888 + }, + { + "epoch": 0.51, + "learning_rate": 1.8990685453400995e-06, + "loss": 0.6709, + "step": 19889 + }, + { + "epoch": 0.51, + "learning_rate": 1.899056430652807e-06, + "loss": 0.9912, + "step": 19890 + }, + { + "epoch": 0.51, + "learning_rate": 1.8990443152771482e-06, + "loss": 0.8047, + "step": 19891 + }, + { + "epoch": 0.51, + "learning_rate": 1.8990321992131327e-06, + "loss": 0.751, + "step": 19892 + }, + { + "epoch": 0.51, + "learning_rate": 1.8990200824607696e-06, + "loss": 0.665, + "step": 19893 + }, + { + "epoch": 0.51, + "learning_rate": 1.8990079650200678e-06, + "loss": 0.7578, + "step": 19894 + }, + { + "epoch": 0.51, + "learning_rate": 1.8989958468910375e-06, + "loss": 1.0244, + "step": 19895 + }, + { + "epoch": 0.51, + "learning_rate": 1.898983728073687e-06, + "loss": 0.7427, + "step": 19896 + }, + { + "epoch": 0.51, + "learning_rate": 1.898971608568026e-06, + "loss": 0.9229, + "step": 19897 + }, + { + "epoch": 0.51, + "learning_rate": 1.898959488374064e-06, + "loss": 0.8535, + "step": 19898 + }, + { + "epoch": 0.51, + "learning_rate": 1.89894736749181e-06, + "loss": 0.9893, + "step": 19899 + }, + { + "epoch": 0.51, + "learning_rate": 1.8989352459212733e-06, + "loss": 0.8037, + "step": 19900 + }, + { + "epoch": 0.51, + "learning_rate": 1.8989231236624633e-06, + "loss": 1.0527, + "step": 19901 + }, + { + "epoch": 0.51, + "learning_rate": 1.898911000715389e-06, + "loss": 0.9531, + "step": 19902 + }, + { + "epoch": 0.51, + "learning_rate": 1.89889887708006e-06, + "loss": 1.0176, + "step": 19903 + }, + { + "epoch": 0.51, + "learning_rate": 1.8988867527564853e-06, + "loss": 0.9141, + "step": 19904 + }, + { + "epoch": 0.51, + "learning_rate": 1.8988746277446746e-06, + "loss": 0.7354, + "step": 19905 + }, + { + "epoch": 0.51, + "learning_rate": 1.8988625020446368e-06, + "loss": 0.6763, + "step": 19906 + }, + { + "epoch": 0.51, + "learning_rate": 1.8988503756563813e-06, + "loss": 0.834, + "step": 19907 + }, + { + "epoch": 0.51, + "learning_rate": 1.8988382485799175e-06, + "loss": 0.8018, + "step": 19908 + }, + { + "epoch": 0.51, + "learning_rate": 1.8988261208152542e-06, + "loss": 1.0625, + "step": 19909 + }, + { + "epoch": 0.51, + "learning_rate": 1.8988139923624016e-06, + "loss": 0.832, + "step": 19910 + }, + { + "epoch": 0.51, + "learning_rate": 1.8988018632213683e-06, + "loss": 0.8652, + "step": 19911 + }, + { + "epoch": 0.51, + "learning_rate": 1.8987897333921636e-06, + "loss": 0.8865, + "step": 19912 + }, + { + "epoch": 0.51, + "learning_rate": 1.898777602874797e-06, + "loss": 0.8477, + "step": 19913 + }, + { + "epoch": 0.51, + "learning_rate": 1.8987654716692775e-06, + "loss": 0.9775, + "step": 19914 + }, + { + "epoch": 0.51, + "learning_rate": 1.898753339775615e-06, + "loss": 0.7153, + "step": 19915 + }, + { + "epoch": 0.51, + "learning_rate": 1.8987412071938183e-06, + "loss": 0.6531, + "step": 19916 + }, + { + "epoch": 0.51, + "learning_rate": 1.8987290739238966e-06, + "loss": 0.823, + "step": 19917 + }, + { + "epoch": 0.51, + "learning_rate": 1.8987169399658595e-06, + "loss": 0.8555, + "step": 19918 + }, + { + "epoch": 0.51, + "learning_rate": 1.898704805319716e-06, + "loss": 1.0811, + "step": 19919 + }, + { + "epoch": 0.51, + "learning_rate": 1.8986926699854757e-06, + "loss": 0.8613, + "step": 19920 + }, + { + "epoch": 0.51, + "learning_rate": 1.8986805339631478e-06, + "loss": 0.6919, + "step": 19921 + }, + { + "epoch": 0.51, + "learning_rate": 1.8986683972527415e-06, + "loss": 0.9199, + "step": 19922 + }, + { + "epoch": 0.51, + "learning_rate": 1.898656259854266e-06, + "loss": 0.791, + "step": 19923 + }, + { + "epoch": 0.51, + "learning_rate": 1.898644121767731e-06, + "loss": 0.8955, + "step": 19924 + }, + { + "epoch": 0.51, + "learning_rate": 1.898631982993145e-06, + "loss": 0.9189, + "step": 19925 + }, + { + "epoch": 0.51, + "learning_rate": 1.8986198435305183e-06, + "loss": 1.0938, + "step": 19926 + }, + { + "epoch": 0.51, + "learning_rate": 1.8986077033798596e-06, + "loss": 0.8799, + "step": 19927 + }, + { + "epoch": 0.51, + "learning_rate": 1.8985955625411782e-06, + "loss": 0.7744, + "step": 19928 + }, + { + "epoch": 0.51, + "learning_rate": 1.8985834210144836e-06, + "loss": 0.8262, + "step": 19929 + }, + { + "epoch": 0.51, + "learning_rate": 1.898571278799785e-06, + "loss": 0.8613, + "step": 19930 + }, + { + "epoch": 0.51, + "learning_rate": 1.8985591358970913e-06, + "loss": 0.8447, + "step": 19931 + }, + { + "epoch": 0.51, + "learning_rate": 1.8985469923064126e-06, + "loss": 0.8184, + "step": 19932 + }, + { + "epoch": 0.51, + "learning_rate": 1.8985348480277578e-06, + "loss": 0.8887, + "step": 19933 + }, + { + "epoch": 0.51, + "learning_rate": 1.898522703061136e-06, + "loss": 0.8408, + "step": 19934 + }, + { + "epoch": 0.51, + "learning_rate": 1.8985105574065567e-06, + "loss": 1.0234, + "step": 19935 + }, + { + "epoch": 0.51, + "learning_rate": 1.8984984110640295e-06, + "loss": 0.7588, + "step": 19936 + }, + { + "epoch": 0.51, + "learning_rate": 1.898486264033563e-06, + "loss": 0.9688, + "step": 19937 + }, + { + "epoch": 0.51, + "learning_rate": 1.898474116315167e-06, + "loss": 0.7534, + "step": 19938 + }, + { + "epoch": 0.51, + "learning_rate": 1.8984619679088508e-06, + "loss": 0.7725, + "step": 19939 + }, + { + "epoch": 0.51, + "learning_rate": 1.8984498188146233e-06, + "loss": 0.916, + "step": 19940 + }, + { + "epoch": 0.51, + "learning_rate": 1.8984376690324944e-06, + "loss": 0.7188, + "step": 19941 + }, + { + "epoch": 0.51, + "learning_rate": 1.898425518562473e-06, + "loss": 0.8447, + "step": 19942 + }, + { + "epoch": 0.51, + "learning_rate": 1.8984133674045683e-06, + "loss": 0.7773, + "step": 19943 + }, + { + "epoch": 0.51, + "learning_rate": 1.8984012155587901e-06, + "loss": 0.7656, + "step": 19944 + }, + { + "epoch": 0.51, + "learning_rate": 1.898389063025147e-06, + "loss": 0.6611, + "step": 19945 + }, + { + "epoch": 0.51, + "learning_rate": 1.898376909803649e-06, + "loss": 0.7339, + "step": 19946 + }, + { + "epoch": 0.51, + "learning_rate": 1.898364755894305e-06, + "loss": 0.7026, + "step": 19947 + }, + { + "epoch": 0.51, + "learning_rate": 1.8983526012971246e-06, + "loss": 0.8447, + "step": 19948 + }, + { + "epoch": 0.51, + "learning_rate": 1.8983404460121167e-06, + "loss": 0.8984, + "step": 19949 + }, + { + "epoch": 0.51, + "learning_rate": 1.898328290039291e-06, + "loss": 0.6226, + "step": 19950 + }, + { + "epoch": 0.51, + "learning_rate": 1.8983161333786564e-06, + "loss": 0.6196, + "step": 19951 + }, + { + "epoch": 0.51, + "learning_rate": 1.8983039760302227e-06, + "loss": 0.8809, + "step": 19952 + }, + { + "epoch": 0.51, + "learning_rate": 1.8982918179939986e-06, + "loss": 0.832, + "step": 19953 + }, + { + "epoch": 0.51, + "learning_rate": 1.8982796592699942e-06, + "loss": 0.7349, + "step": 19954 + }, + { + "epoch": 0.51, + "learning_rate": 1.898267499858218e-06, + "loss": 0.8486, + "step": 19955 + }, + { + "epoch": 0.51, + "learning_rate": 1.89825533975868e-06, + "loss": 0.9951, + "step": 19956 + }, + { + "epoch": 0.51, + "learning_rate": 1.898243178971389e-06, + "loss": 0.8662, + "step": 19957 + }, + { + "epoch": 0.51, + "learning_rate": 1.8982310174963546e-06, + "loss": 1.0605, + "step": 19958 + }, + { + "epoch": 0.51, + "learning_rate": 1.898218855333586e-06, + "loss": 0.8125, + "step": 19959 + }, + { + "epoch": 0.51, + "learning_rate": 1.8982066924830921e-06, + "loss": 0.8545, + "step": 19960 + }, + { + "epoch": 0.51, + "learning_rate": 1.898194528944883e-06, + "loss": 0.709, + "step": 19961 + }, + { + "epoch": 0.51, + "learning_rate": 1.8981823647189676e-06, + "loss": 0.7036, + "step": 19962 + }, + { + "epoch": 0.51, + "learning_rate": 1.8981701998053556e-06, + "loss": 0.9121, + "step": 19963 + }, + { + "epoch": 0.51, + "learning_rate": 1.8981580342040554e-06, + "loss": 0.8271, + "step": 19964 + }, + { + "epoch": 0.51, + "learning_rate": 1.8981458679150776e-06, + "loss": 0.9902, + "step": 19965 + }, + { + "epoch": 0.51, + "learning_rate": 1.89813370093843e-06, + "loss": 0.9873, + "step": 19966 + }, + { + "epoch": 0.51, + "learning_rate": 1.8981215332741231e-06, + "loss": 0.8496, + "step": 19967 + }, + { + "epoch": 0.51, + "learning_rate": 1.898109364922166e-06, + "loss": 1.0869, + "step": 19968 + }, + { + "epoch": 0.51, + "learning_rate": 1.8980971958825679e-06, + "loss": 0.7637, + "step": 19969 + }, + { + "epoch": 0.51, + "learning_rate": 1.8980850261553378e-06, + "loss": 0.9346, + "step": 19970 + }, + { + "epoch": 0.51, + "learning_rate": 1.8980728557404853e-06, + "loss": 0.7275, + "step": 19971 + }, + { + "epoch": 0.51, + "learning_rate": 1.8980606846380195e-06, + "loss": 1.1094, + "step": 19972 + }, + { + "epoch": 0.51, + "learning_rate": 1.8980485128479504e-06, + "loss": 0.6514, + "step": 19973 + }, + { + "epoch": 0.51, + "learning_rate": 1.8980363403702868e-06, + "loss": 0.7949, + "step": 19974 + }, + { + "epoch": 0.51, + "learning_rate": 1.8980241672050376e-06, + "loss": 0.9551, + "step": 19975 + }, + { + "epoch": 0.51, + "learning_rate": 1.898011993352213e-06, + "loss": 0.7461, + "step": 19976 + }, + { + "epoch": 0.51, + "learning_rate": 1.8979998188118218e-06, + "loss": 1.2812, + "step": 19977 + }, + { + "epoch": 0.51, + "learning_rate": 1.8979876435838738e-06, + "loss": 1.0479, + "step": 19978 + }, + { + "epoch": 0.51, + "learning_rate": 1.8979754676683775e-06, + "loss": 0.9922, + "step": 19979 + }, + { + "epoch": 0.51, + "learning_rate": 1.8979632910653427e-06, + "loss": 0.9268, + "step": 19980 + }, + { + "epoch": 0.51, + "learning_rate": 1.8979511137747788e-06, + "loss": 0.7837, + "step": 19981 + }, + { + "epoch": 0.51, + "learning_rate": 1.8979389357966948e-06, + "loss": 1.0332, + "step": 19982 + }, + { + "epoch": 0.51, + "learning_rate": 1.8979267571311004e-06, + "loss": 0.7559, + "step": 19983 + }, + { + "epoch": 0.51, + "learning_rate": 1.897914577778005e-06, + "loss": 0.916, + "step": 19984 + }, + { + "epoch": 0.51, + "learning_rate": 1.8979023977374173e-06, + "loss": 0.999, + "step": 19985 + }, + { + "epoch": 0.51, + "learning_rate": 1.8978902170093473e-06, + "loss": 0.8105, + "step": 19986 + }, + { + "epoch": 0.51, + "learning_rate": 1.8978780355938039e-06, + "loss": 0.8105, + "step": 19987 + }, + { + "epoch": 0.51, + "learning_rate": 1.8978658534907967e-06, + "loss": 0.835, + "step": 19988 + }, + { + "epoch": 0.51, + "learning_rate": 1.8978536707003348e-06, + "loss": 0.8926, + "step": 19989 + }, + { + "epoch": 0.51, + "learning_rate": 1.8978414872224278e-06, + "loss": 0.8921, + "step": 19990 + }, + { + "epoch": 0.51, + "learning_rate": 1.8978293030570847e-06, + "loss": 1.1992, + "step": 19991 + }, + { + "epoch": 0.51, + "learning_rate": 1.897817118204315e-06, + "loss": 0.7827, + "step": 19992 + }, + { + "epoch": 0.51, + "learning_rate": 1.8978049326641278e-06, + "loss": 0.9873, + "step": 19993 + }, + { + "epoch": 0.51, + "learning_rate": 1.897792746436533e-06, + "loss": 0.8467, + "step": 19994 + }, + { + "epoch": 0.51, + "learning_rate": 1.8977805595215395e-06, + "loss": 0.8555, + "step": 19995 + }, + { + "epoch": 0.51, + "learning_rate": 1.8977683719191567e-06, + "loss": 0.5861, + "step": 19996 + }, + { + "epoch": 0.51, + "learning_rate": 1.897756183629394e-06, + "loss": 0.6868, + "step": 19997 + }, + { + "epoch": 0.51, + "learning_rate": 1.8977439946522605e-06, + "loss": 0.9434, + "step": 19998 + }, + { + "epoch": 0.51, + "learning_rate": 1.8977318049877658e-06, + "loss": 0.9844, + "step": 19999 + }, + { + "epoch": 0.51, + "learning_rate": 1.897719614635919e-06, + "loss": 0.8027, + "step": 20000 + }, + { + "epoch": 0.51, + "learning_rate": 1.8977074235967296e-06, + "loss": 0.8154, + "step": 20001 + }, + { + "epoch": 0.51, + "learning_rate": 1.8976952318702072e-06, + "loss": 0.6533, + "step": 20002 + }, + { + "epoch": 0.51, + "learning_rate": 1.8976830394563606e-06, + "loss": 0.605, + "step": 20003 + }, + { + "epoch": 0.51, + "learning_rate": 1.8976708463551994e-06, + "loss": 0.7998, + "step": 20004 + }, + { + "epoch": 0.51, + "learning_rate": 1.8976586525667328e-06, + "loss": 0.9082, + "step": 20005 + }, + { + "epoch": 0.51, + "learning_rate": 1.8976464580909703e-06, + "loss": 0.9551, + "step": 20006 + }, + { + "epoch": 0.51, + "learning_rate": 1.8976342629279212e-06, + "loss": 0.9365, + "step": 20007 + }, + { + "epoch": 0.51, + "learning_rate": 1.897622067077595e-06, + "loss": 0.8857, + "step": 20008 + }, + { + "epoch": 0.51, + "learning_rate": 1.8976098705400005e-06, + "loss": 0.9668, + "step": 20009 + }, + { + "epoch": 0.51, + "learning_rate": 1.8975976733151477e-06, + "loss": 0.6353, + "step": 20010 + }, + { + "epoch": 0.51, + "learning_rate": 1.8975854754030456e-06, + "loss": 0.999, + "step": 20011 + }, + { + "epoch": 0.51, + "learning_rate": 1.8975732768037033e-06, + "loss": 0.9863, + "step": 20012 + }, + { + "epoch": 0.51, + "learning_rate": 1.8975610775171308e-06, + "loss": 0.8193, + "step": 20013 + }, + { + "epoch": 0.51, + "learning_rate": 1.8975488775433367e-06, + "loss": 0.8691, + "step": 20014 + }, + { + "epoch": 0.51, + "learning_rate": 1.8975366768823308e-06, + "loss": 0.7695, + "step": 20015 + }, + { + "epoch": 0.51, + "learning_rate": 1.8975244755341225e-06, + "loss": 0.917, + "step": 20016 + }, + { + "epoch": 0.51, + "learning_rate": 1.8975122734987207e-06, + "loss": 0.6836, + "step": 20017 + }, + { + "epoch": 0.51, + "learning_rate": 1.8975000707761355e-06, + "loss": 0.8076, + "step": 20018 + }, + { + "epoch": 0.51, + "learning_rate": 1.8974878673663754e-06, + "loss": 0.7068, + "step": 20019 + }, + { + "epoch": 0.51, + "learning_rate": 1.89747566326945e-06, + "loss": 0.9436, + "step": 20020 + }, + { + "epoch": 0.51, + "learning_rate": 1.897463458485369e-06, + "loss": 0.9131, + "step": 20021 + }, + { + "epoch": 0.51, + "learning_rate": 1.8974512530141414e-06, + "loss": 0.8389, + "step": 20022 + }, + { + "epoch": 0.51, + "learning_rate": 1.8974390468557769e-06, + "loss": 0.6782, + "step": 20023 + }, + { + "epoch": 0.51, + "learning_rate": 1.8974268400102842e-06, + "loss": 0.7725, + "step": 20024 + }, + { + "epoch": 0.51, + "learning_rate": 1.8974146324776732e-06, + "loss": 0.8896, + "step": 20025 + }, + { + "epoch": 0.51, + "learning_rate": 1.897402424257953e-06, + "loss": 0.6895, + "step": 20026 + }, + { + "epoch": 0.51, + "learning_rate": 1.897390215351133e-06, + "loss": 0.8789, + "step": 20027 + }, + { + "epoch": 0.51, + "learning_rate": 1.8973780057572229e-06, + "loss": 0.874, + "step": 20028 + }, + { + "epoch": 0.51, + "learning_rate": 1.8973657954762313e-06, + "loss": 0.8896, + "step": 20029 + }, + { + "epoch": 0.51, + "learning_rate": 1.8973535845081683e-06, + "loss": 0.6989, + "step": 20030 + }, + { + "epoch": 0.51, + "learning_rate": 1.8973413728530426e-06, + "loss": 0.8555, + "step": 20031 + }, + { + "epoch": 0.51, + "learning_rate": 1.8973291605108641e-06, + "loss": 0.751, + "step": 20032 + }, + { + "epoch": 0.51, + "learning_rate": 1.897316947481642e-06, + "loss": 1.0449, + "step": 20033 + }, + { + "epoch": 0.51, + "learning_rate": 1.8973047337653853e-06, + "loss": 0.876, + "step": 20034 + }, + { + "epoch": 0.51, + "learning_rate": 1.8972925193621037e-06, + "loss": 0.8301, + "step": 20035 + }, + { + "epoch": 0.51, + "learning_rate": 1.8972803042718067e-06, + "loss": 0.9463, + "step": 20036 + }, + { + "epoch": 0.51, + "learning_rate": 1.8972680884945032e-06, + "loss": 0.9883, + "step": 20037 + }, + { + "epoch": 0.51, + "learning_rate": 1.897255872030203e-06, + "loss": 0.9863, + "step": 20038 + }, + { + "epoch": 0.51, + "learning_rate": 1.897243654878915e-06, + "loss": 0.7764, + "step": 20039 + }, + { + "epoch": 0.51, + "learning_rate": 1.897231437040649e-06, + "loss": 1.0479, + "step": 20040 + }, + { + "epoch": 0.51, + "learning_rate": 1.897219218515414e-06, + "loss": 1.0176, + "step": 20041 + }, + { + "epoch": 0.51, + "learning_rate": 1.8972069993032193e-06, + "loss": 0.7524, + "step": 20042 + }, + { + "epoch": 0.51, + "learning_rate": 1.8971947794040748e-06, + "loss": 0.6997, + "step": 20043 + }, + { + "epoch": 0.51, + "learning_rate": 1.8971825588179895e-06, + "loss": 0.9697, + "step": 20044 + }, + { + "epoch": 0.51, + "learning_rate": 1.8971703375449726e-06, + "loss": 0.8896, + "step": 20045 + }, + { + "epoch": 0.51, + "learning_rate": 1.8971581155850336e-06, + "loss": 0.8574, + "step": 20046 + }, + { + "epoch": 0.51, + "learning_rate": 1.897145892938182e-06, + "loss": 0.7617, + "step": 20047 + }, + { + "epoch": 0.51, + "learning_rate": 1.8971336696044271e-06, + "loss": 0.843, + "step": 20048 + }, + { + "epoch": 0.51, + "learning_rate": 1.897121445583778e-06, + "loss": 0.959, + "step": 20049 + }, + { + "epoch": 0.51, + "learning_rate": 1.8971092208762446e-06, + "loss": 0.9287, + "step": 20050 + }, + { + "epoch": 0.51, + "learning_rate": 1.8970969954818353e-06, + "loss": 0.8271, + "step": 20051 + }, + { + "epoch": 0.51, + "learning_rate": 1.8970847694005607e-06, + "loss": 0.8325, + "step": 20052 + }, + { + "epoch": 0.51, + "learning_rate": 1.8970725426324293e-06, + "loss": 0.7544, + "step": 20053 + }, + { + "epoch": 0.51, + "learning_rate": 1.8970603151774506e-06, + "loss": 0.7891, + "step": 20054 + }, + { + "epoch": 0.51, + "learning_rate": 1.8970480870356345e-06, + "loss": 0.8682, + "step": 20055 + }, + { + "epoch": 0.51, + "learning_rate": 1.8970358582069895e-06, + "loss": 0.8584, + "step": 20056 + }, + { + "epoch": 0.51, + "learning_rate": 1.8970236286915253e-06, + "loss": 0.7705, + "step": 20057 + }, + { + "epoch": 0.51, + "learning_rate": 1.8970113984892518e-06, + "loss": 0.7861, + "step": 20058 + }, + { + "epoch": 0.51, + "learning_rate": 1.8969991676001775e-06, + "loss": 0.8408, + "step": 20059 + }, + { + "epoch": 0.51, + "learning_rate": 1.8969869360243122e-06, + "loss": 0.6069, + "step": 20060 + }, + { + "epoch": 0.51, + "learning_rate": 1.8969747037616654e-06, + "loss": 1.165, + "step": 20061 + }, + { + "epoch": 0.51, + "learning_rate": 1.8969624708122464e-06, + "loss": 0.8291, + "step": 20062 + }, + { + "epoch": 0.51, + "learning_rate": 1.8969502371760645e-06, + "loss": 0.8389, + "step": 20063 + }, + { + "epoch": 0.51, + "learning_rate": 1.896938002853129e-06, + "loss": 0.8975, + "step": 20064 + }, + { + "epoch": 0.51, + "learning_rate": 1.8969257678434491e-06, + "loss": 1.0566, + "step": 20065 + }, + { + "epoch": 0.51, + "learning_rate": 1.8969135321470347e-06, + "loss": 1.0889, + "step": 20066 + }, + { + "epoch": 0.51, + "learning_rate": 1.8969012957638945e-06, + "loss": 0.7451, + "step": 20067 + }, + { + "epoch": 0.51, + "learning_rate": 1.8968890586940386e-06, + "loss": 0.707, + "step": 20068 + }, + { + "epoch": 0.51, + "learning_rate": 1.8968768209374757e-06, + "loss": 1.0703, + "step": 20069 + }, + { + "epoch": 0.51, + "learning_rate": 1.8968645824942156e-06, + "loss": 0.9087, + "step": 20070 + }, + { + "epoch": 0.51, + "learning_rate": 1.8968523433642676e-06, + "loss": 0.874, + "step": 20071 + }, + { + "epoch": 0.51, + "learning_rate": 1.8968401035476408e-06, + "loss": 1.1104, + "step": 20072 + }, + { + "epoch": 0.51, + "learning_rate": 1.8968278630443449e-06, + "loss": 0.6699, + "step": 20073 + }, + { + "epoch": 0.51, + "learning_rate": 1.896815621854389e-06, + "loss": 0.9561, + "step": 20074 + }, + { + "epoch": 0.51, + "learning_rate": 1.8968033799777827e-06, + "loss": 1.1758, + "step": 20075 + }, + { + "epoch": 0.51, + "learning_rate": 1.896791137414535e-06, + "loss": 0.8525, + "step": 20076 + }, + { + "epoch": 0.51, + "learning_rate": 1.896778894164656e-06, + "loss": 0.9805, + "step": 20077 + }, + { + "epoch": 0.51, + "learning_rate": 1.8967666502281548e-06, + "loss": 0.7178, + "step": 20078 + }, + { + "epoch": 0.51, + "learning_rate": 1.8967544056050402e-06, + "loss": 0.8462, + "step": 20079 + }, + { + "epoch": 0.51, + "learning_rate": 1.8967421602953219e-06, + "loss": 0.7153, + "step": 20080 + }, + { + "epoch": 0.51, + "learning_rate": 1.8967299142990097e-06, + "loss": 0.8623, + "step": 20081 + }, + { + "epoch": 0.51, + "learning_rate": 1.8967176676161123e-06, + "loss": 1.1016, + "step": 20082 + }, + { + "epoch": 0.51, + "learning_rate": 1.8967054202466396e-06, + "loss": 1.0195, + "step": 20083 + }, + { + "epoch": 0.51, + "learning_rate": 1.8966931721906008e-06, + "loss": 0.873, + "step": 20084 + }, + { + "epoch": 0.51, + "learning_rate": 1.8966809234480054e-06, + "loss": 0.9014, + "step": 20085 + }, + { + "epoch": 0.51, + "learning_rate": 1.8966686740188624e-06, + "loss": 0.6331, + "step": 20086 + }, + { + "epoch": 0.51, + "learning_rate": 1.8966564239031815e-06, + "loss": 0.9512, + "step": 20087 + }, + { + "epoch": 0.51, + "learning_rate": 1.896644173100972e-06, + "loss": 0.8877, + "step": 20088 + }, + { + "epoch": 0.51, + "learning_rate": 1.8966319216122435e-06, + "loss": 0.9971, + "step": 20089 + }, + { + "epoch": 0.51, + "learning_rate": 1.896619669437005e-06, + "loss": 0.8301, + "step": 20090 + }, + { + "epoch": 0.51, + "learning_rate": 1.896607416575266e-06, + "loss": 0.9844, + "step": 20091 + }, + { + "epoch": 0.51, + "learning_rate": 1.896595163027036e-06, + "loss": 0.9736, + "step": 20092 + }, + { + "epoch": 0.51, + "learning_rate": 1.8965829087923242e-06, + "loss": 1.0, + "step": 20093 + }, + { + "epoch": 0.52, + "learning_rate": 1.89657065387114e-06, + "loss": 0.772, + "step": 20094 + }, + { + "epoch": 0.52, + "learning_rate": 1.8965583982634932e-06, + "loss": 0.8994, + "step": 20095 + }, + { + "epoch": 0.52, + "learning_rate": 1.8965461419693927e-06, + "loss": 0.8545, + "step": 20096 + }, + { + "epoch": 0.52, + "learning_rate": 1.8965338849888481e-06, + "loss": 0.8906, + "step": 20097 + }, + { + "epoch": 0.52, + "learning_rate": 1.8965216273218685e-06, + "loss": 1.0498, + "step": 20098 + }, + { + "epoch": 0.52, + "learning_rate": 1.8965093689684637e-06, + "loss": 0.9326, + "step": 20099 + }, + { + "epoch": 0.52, + "learning_rate": 1.896497109928643e-06, + "loss": 0.7324, + "step": 20100 + }, + { + "epoch": 0.52, + "learning_rate": 1.8964848502024155e-06, + "loss": 0.8516, + "step": 20101 + }, + { + "epoch": 0.52, + "learning_rate": 1.8964725897897908e-06, + "loss": 0.7061, + "step": 20102 + }, + { + "epoch": 0.52, + "learning_rate": 1.8964603286907783e-06, + "loss": 0.9346, + "step": 20103 + }, + { + "epoch": 0.52, + "learning_rate": 1.8964480669053872e-06, + "loss": 0.8652, + "step": 20104 + }, + { + "epoch": 0.52, + "learning_rate": 1.8964358044336275e-06, + "loss": 0.7993, + "step": 20105 + }, + { + "epoch": 0.52, + "learning_rate": 1.8964235412755078e-06, + "loss": 0.9912, + "step": 20106 + }, + { + "epoch": 0.52, + "learning_rate": 1.8964112774310376e-06, + "loss": 0.9717, + "step": 20107 + }, + { + "epoch": 0.52, + "learning_rate": 1.8963990129002268e-06, + "loss": 0.833, + "step": 20108 + }, + { + "epoch": 0.52, + "learning_rate": 1.8963867476830843e-06, + "loss": 0.5178, + "step": 20109 + }, + { + "epoch": 0.52, + "learning_rate": 1.89637448177962e-06, + "loss": 0.8643, + "step": 20110 + }, + { + "epoch": 0.52, + "learning_rate": 1.8963622151898425e-06, + "loss": 0.9854, + "step": 20111 + }, + { + "epoch": 0.52, + "learning_rate": 1.8963499479137622e-06, + "loss": 0.8416, + "step": 20112 + }, + { + "epoch": 0.52, + "learning_rate": 1.8963376799513878e-06, + "loss": 0.8389, + "step": 20113 + }, + { + "epoch": 0.52, + "learning_rate": 1.8963254113027286e-06, + "loss": 0.6963, + "step": 20114 + }, + { + "epoch": 0.52, + "learning_rate": 1.8963131419677945e-06, + "loss": 0.9736, + "step": 20115 + }, + { + "epoch": 0.52, + "learning_rate": 1.8963008719465945e-06, + "loss": 1.001, + "step": 20116 + }, + { + "epoch": 0.52, + "learning_rate": 1.8962886012391382e-06, + "loss": 0.96, + "step": 20117 + }, + { + "epoch": 0.52, + "learning_rate": 1.896276329845435e-06, + "loss": 0.793, + "step": 20118 + }, + { + "epoch": 0.52, + "learning_rate": 1.896264057765494e-06, + "loss": 1.0107, + "step": 20119 + }, + { + "epoch": 0.52, + "learning_rate": 1.896251784999325e-06, + "loss": 0.856, + "step": 20120 + }, + { + "epoch": 0.52, + "learning_rate": 1.8962395115469372e-06, + "loss": 0.9131, + "step": 20121 + }, + { + "epoch": 0.52, + "learning_rate": 1.89622723740834e-06, + "loss": 0.6365, + "step": 20122 + }, + { + "epoch": 0.52, + "learning_rate": 1.8962149625835426e-06, + "loss": 0.6987, + "step": 20123 + }, + { + "epoch": 0.52, + "learning_rate": 1.896202687072555e-06, + "loss": 0.8223, + "step": 20124 + }, + { + "epoch": 0.52, + "learning_rate": 1.896190410875386e-06, + "loss": 0.6948, + "step": 20125 + }, + { + "epoch": 0.52, + "learning_rate": 1.8961781339920453e-06, + "loss": 0.7305, + "step": 20126 + }, + { + "epoch": 0.52, + "learning_rate": 1.896165856422542e-06, + "loss": 0.8857, + "step": 20127 + }, + { + "epoch": 0.52, + "learning_rate": 1.8961535781668857e-06, + "loss": 0.8545, + "step": 20128 + }, + { + "epoch": 0.52, + "learning_rate": 1.8961412992250862e-06, + "loss": 0.7744, + "step": 20129 + }, + { + "epoch": 0.52, + "learning_rate": 1.8961290195971524e-06, + "loss": 0.7686, + "step": 20130 + }, + { + "epoch": 0.52, + "learning_rate": 1.8961167392830934e-06, + "loss": 0.9736, + "step": 20131 + }, + { + "epoch": 0.52, + "learning_rate": 1.8961044582829196e-06, + "loss": 0.8145, + "step": 20132 + }, + { + "epoch": 0.52, + "learning_rate": 1.8960921765966394e-06, + "loss": 0.9912, + "step": 20133 + }, + { + "epoch": 0.52, + "learning_rate": 1.8960798942242628e-06, + "loss": 0.6943, + "step": 20134 + }, + { + "epoch": 0.52, + "learning_rate": 1.8960676111657992e-06, + "loss": 1.1729, + "step": 20135 + }, + { + "epoch": 0.52, + "learning_rate": 1.8960553274212574e-06, + "loss": 0.9834, + "step": 20136 + }, + { + "epoch": 0.52, + "learning_rate": 1.8960430429906476e-06, + "loss": 0.9336, + "step": 20137 + }, + { + "epoch": 0.52, + "learning_rate": 1.8960307578739788e-06, + "loss": 0.7827, + "step": 20138 + }, + { + "epoch": 0.52, + "learning_rate": 1.89601847207126e-06, + "loss": 0.9648, + "step": 20139 + }, + { + "epoch": 0.52, + "learning_rate": 1.8960061855825016e-06, + "loss": 0.8066, + "step": 20140 + }, + { + "epoch": 0.52, + "learning_rate": 1.8959938984077121e-06, + "loss": 0.8271, + "step": 20141 + }, + { + "epoch": 0.52, + "learning_rate": 1.8959816105469016e-06, + "loss": 0.8457, + "step": 20142 + }, + { + "epoch": 0.52, + "learning_rate": 1.895969322000079e-06, + "loss": 0.9541, + "step": 20143 + }, + { + "epoch": 0.52, + "learning_rate": 1.8959570327672538e-06, + "loss": 0.9854, + "step": 20144 + }, + { + "epoch": 0.52, + "learning_rate": 1.8959447428484357e-06, + "loss": 0.9209, + "step": 20145 + }, + { + "epoch": 0.52, + "learning_rate": 1.8959324522436337e-06, + "loss": 0.9365, + "step": 20146 + }, + { + "epoch": 0.52, + "learning_rate": 1.8959201609528576e-06, + "loss": 0.7178, + "step": 20147 + }, + { + "epoch": 0.52, + "learning_rate": 1.8959078689761166e-06, + "loss": 0.9053, + "step": 20148 + }, + { + "epoch": 0.52, + "learning_rate": 1.8958955763134202e-06, + "loss": 0.6382, + "step": 20149 + }, + { + "epoch": 0.52, + "learning_rate": 1.8958832829647776e-06, + "loss": 0.9707, + "step": 20150 + }, + { + "epoch": 0.52, + "learning_rate": 1.8958709889301984e-06, + "loss": 1.0264, + "step": 20151 + }, + { + "epoch": 0.52, + "learning_rate": 1.895858694209692e-06, + "loss": 0.9902, + "step": 20152 + }, + { + "epoch": 0.52, + "learning_rate": 1.895846398803268e-06, + "loss": 0.9102, + "step": 20153 + }, + { + "epoch": 0.52, + "learning_rate": 1.895834102710935e-06, + "loss": 0.9053, + "step": 20154 + }, + { + "epoch": 0.52, + "learning_rate": 1.8958218059327035e-06, + "loss": 0.7617, + "step": 20155 + }, + { + "epoch": 0.52, + "learning_rate": 1.8958095084685823e-06, + "loss": 0.9102, + "step": 20156 + }, + { + "epoch": 0.52, + "learning_rate": 1.8957972103185811e-06, + "loss": 1.0195, + "step": 20157 + }, + { + "epoch": 0.52, + "learning_rate": 1.8957849114827092e-06, + "loss": 0.8262, + "step": 20158 + }, + { + "epoch": 0.52, + "learning_rate": 1.8957726119609756e-06, + "loss": 0.9639, + "step": 20159 + }, + { + "epoch": 0.52, + "learning_rate": 1.8957603117533903e-06, + "loss": 0.6511, + "step": 20160 + }, + { + "epoch": 0.52, + "learning_rate": 1.8957480108599627e-06, + "loss": 0.7217, + "step": 20161 + }, + { + "epoch": 0.52, + "learning_rate": 1.8957357092807018e-06, + "loss": 1.1113, + "step": 20162 + }, + { + "epoch": 0.52, + "learning_rate": 1.8957234070156174e-06, + "loss": 0.8096, + "step": 20163 + }, + { + "epoch": 0.52, + "learning_rate": 1.8957111040647188e-06, + "loss": 0.8477, + "step": 20164 + }, + { + "epoch": 0.52, + "learning_rate": 1.8956988004280153e-06, + "loss": 0.8896, + "step": 20165 + }, + { + "epoch": 0.52, + "learning_rate": 1.8956864961055164e-06, + "loss": 0.8809, + "step": 20166 + }, + { + "epoch": 0.52, + "learning_rate": 1.8956741910972313e-06, + "loss": 0.8271, + "step": 20167 + }, + { + "epoch": 0.52, + "learning_rate": 1.8956618854031701e-06, + "loss": 0.915, + "step": 20168 + }, + { + "epoch": 0.52, + "learning_rate": 1.8956495790233415e-06, + "loss": 0.8672, + "step": 20169 + }, + { + "epoch": 0.52, + "learning_rate": 1.8956372719577553e-06, + "loss": 0.8984, + "step": 20170 + }, + { + "epoch": 0.52, + "learning_rate": 1.8956249642064211e-06, + "loss": 0.9678, + "step": 20171 + }, + { + "epoch": 0.52, + "learning_rate": 1.8956126557693475e-06, + "loss": 0.7847, + "step": 20172 + }, + { + "epoch": 0.52, + "learning_rate": 1.8956003466465446e-06, + "loss": 0.875, + "step": 20173 + }, + { + "epoch": 0.52, + "learning_rate": 1.895588036838022e-06, + "loss": 0.6167, + "step": 20174 + }, + { + "epoch": 0.52, + "learning_rate": 1.8955757263437886e-06, + "loss": 0.8857, + "step": 20175 + }, + { + "epoch": 0.52, + "learning_rate": 1.8955634151638541e-06, + "loss": 0.9658, + "step": 20176 + }, + { + "epoch": 0.52, + "learning_rate": 1.8955511032982279e-06, + "loss": 0.6895, + "step": 20177 + }, + { + "epoch": 0.52, + "learning_rate": 1.8955387907469194e-06, + "loss": 1.0791, + "step": 20178 + }, + { + "epoch": 0.52, + "learning_rate": 1.895526477509938e-06, + "loss": 0.6855, + "step": 20179 + }, + { + "epoch": 0.52, + "learning_rate": 1.8955141635872932e-06, + "loss": 0.8691, + "step": 20180 + }, + { + "epoch": 0.52, + "learning_rate": 1.8955018489789941e-06, + "loss": 0.6688, + "step": 20181 + }, + { + "epoch": 0.52, + "learning_rate": 1.8954895336850507e-06, + "loss": 1.0527, + "step": 20182 + }, + { + "epoch": 0.52, + "learning_rate": 1.8954772177054723e-06, + "loss": 0.7251, + "step": 20183 + }, + { + "epoch": 0.52, + "learning_rate": 1.8954649010402677e-06, + "loss": 0.7473, + "step": 20184 + }, + { + "epoch": 0.52, + "learning_rate": 1.895452583689447e-06, + "loss": 0.7646, + "step": 20185 + }, + { + "epoch": 0.52, + "learning_rate": 1.8954402656530198e-06, + "loss": 0.8584, + "step": 20186 + }, + { + "epoch": 0.52, + "learning_rate": 1.8954279469309947e-06, + "loss": 0.7471, + "step": 20187 + }, + { + "epoch": 0.52, + "learning_rate": 1.8954156275233816e-06, + "loss": 0.9531, + "step": 20188 + }, + { + "epoch": 0.52, + "learning_rate": 1.89540330743019e-06, + "loss": 0.606, + "step": 20189 + }, + { + "epoch": 0.52, + "learning_rate": 1.8953909866514295e-06, + "loss": 0.8691, + "step": 20190 + }, + { + "epoch": 0.52, + "learning_rate": 1.895378665187109e-06, + "loss": 0.6387, + "step": 20191 + }, + { + "epoch": 0.52, + "learning_rate": 1.8953663430372386e-06, + "loss": 0.8398, + "step": 20192 + }, + { + "epoch": 0.52, + "learning_rate": 1.895354020201827e-06, + "loss": 0.8867, + "step": 20193 + }, + { + "epoch": 0.52, + "learning_rate": 1.8953416966808842e-06, + "loss": 0.7227, + "step": 20194 + }, + { + "epoch": 0.52, + "learning_rate": 1.8953293724744193e-06, + "loss": 0.7305, + "step": 20195 + }, + { + "epoch": 0.52, + "learning_rate": 1.8953170475824419e-06, + "loss": 1.0215, + "step": 20196 + }, + { + "epoch": 0.52, + "learning_rate": 1.8953047220049614e-06, + "loss": 0.7432, + "step": 20197 + }, + { + "epoch": 0.52, + "learning_rate": 1.895292395741987e-06, + "loss": 0.6797, + "step": 20198 + }, + { + "epoch": 0.52, + "learning_rate": 1.8952800687935286e-06, + "loss": 0.7812, + "step": 20199 + }, + { + "epoch": 0.52, + "learning_rate": 1.8952677411595957e-06, + "loss": 1.0938, + "step": 20200 + }, + { + "epoch": 0.52, + "learning_rate": 1.895255412840197e-06, + "loss": 1.0254, + "step": 20201 + }, + { + "epoch": 0.52, + "learning_rate": 1.8952430838353428e-06, + "loss": 0.6963, + "step": 20202 + }, + { + "epoch": 0.52, + "learning_rate": 1.895230754145042e-06, + "loss": 0.792, + "step": 20203 + }, + { + "epoch": 0.52, + "learning_rate": 1.8952184237693038e-06, + "loss": 0.7959, + "step": 20204 + }, + { + "epoch": 0.52, + "learning_rate": 1.8952060927081383e-06, + "loss": 1.0117, + "step": 20205 + }, + { + "epoch": 0.52, + "learning_rate": 1.8951937609615549e-06, + "loss": 0.748, + "step": 20206 + }, + { + "epoch": 0.52, + "learning_rate": 1.8951814285295625e-06, + "loss": 0.8389, + "step": 20207 + }, + { + "epoch": 0.52, + "learning_rate": 1.895169095412171e-06, + "loss": 0.8579, + "step": 20208 + }, + { + "epoch": 0.52, + "learning_rate": 1.8951567616093896e-06, + "loss": 0.5725, + "step": 20209 + }, + { + "epoch": 0.52, + "learning_rate": 1.8951444271212278e-06, + "loss": 1.1738, + "step": 20210 + }, + { + "epoch": 0.52, + "learning_rate": 1.8951320919476949e-06, + "loss": 0.8945, + "step": 20211 + }, + { + "epoch": 0.52, + "learning_rate": 1.8951197560888008e-06, + "loss": 0.8076, + "step": 20212 + }, + { + "epoch": 0.52, + "learning_rate": 1.8951074195445547e-06, + "loss": 0.8164, + "step": 20213 + }, + { + "epoch": 0.52, + "learning_rate": 1.8950950823149658e-06, + "loss": 0.7229, + "step": 20214 + }, + { + "epoch": 0.52, + "learning_rate": 1.8950827444000439e-06, + "loss": 0.8853, + "step": 20215 + }, + { + "epoch": 0.52, + "learning_rate": 1.8950704057997981e-06, + "loss": 0.7622, + "step": 20216 + }, + { + "epoch": 0.52, + "learning_rate": 1.8950580665142382e-06, + "loss": 0.686, + "step": 20217 + }, + { + "epoch": 0.52, + "learning_rate": 1.8950457265433735e-06, + "loss": 0.8325, + "step": 20218 + }, + { + "epoch": 0.52, + "learning_rate": 1.8950333858872134e-06, + "loss": 0.9893, + "step": 20219 + }, + { + "epoch": 0.52, + "learning_rate": 1.8950210445457674e-06, + "loss": 0.6885, + "step": 20220 + }, + { + "epoch": 0.52, + "learning_rate": 1.895008702519045e-06, + "loss": 0.9824, + "step": 20221 + }, + { + "epoch": 0.52, + "learning_rate": 1.8949963598070556e-06, + "loss": 0.7559, + "step": 20222 + }, + { + "epoch": 0.52, + "learning_rate": 1.8949840164098086e-06, + "loss": 0.9131, + "step": 20223 + }, + { + "epoch": 0.52, + "learning_rate": 1.8949716723273134e-06, + "loss": 1.0078, + "step": 20224 + }, + { + "epoch": 0.52, + "learning_rate": 1.8949593275595796e-06, + "loss": 0.8799, + "step": 20225 + }, + { + "epoch": 0.52, + "learning_rate": 1.8949469821066167e-06, + "loss": 0.8022, + "step": 20226 + }, + { + "epoch": 0.52, + "learning_rate": 1.894934635968434e-06, + "loss": 0.8096, + "step": 20227 + }, + { + "epoch": 0.52, + "learning_rate": 1.894922289145041e-06, + "loss": 0.8467, + "step": 20228 + }, + { + "epoch": 0.52, + "learning_rate": 1.8949099416364472e-06, + "loss": 1.0117, + "step": 20229 + }, + { + "epoch": 0.52, + "learning_rate": 1.8948975934426619e-06, + "loss": 0.9727, + "step": 20230 + }, + { + "epoch": 0.52, + "learning_rate": 1.8948852445636944e-06, + "loss": 0.9082, + "step": 20231 + }, + { + "epoch": 0.52, + "learning_rate": 1.8948728949995548e-06, + "loss": 0.4658, + "step": 20232 + }, + { + "epoch": 0.52, + "learning_rate": 1.8948605447502519e-06, + "loss": 0.7393, + "step": 20233 + }, + { + "epoch": 0.52, + "learning_rate": 1.894848193815796e-06, + "loss": 0.957, + "step": 20234 + }, + { + "epoch": 0.52, + "learning_rate": 1.8948358421961953e-06, + "loss": 0.6929, + "step": 20235 + }, + { + "epoch": 0.52, + "learning_rate": 1.8948234898914603e-06, + "loss": 1.0703, + "step": 20236 + }, + { + "epoch": 0.52, + "learning_rate": 1.8948111369016e-06, + "loss": 0.9058, + "step": 20237 + }, + { + "epoch": 0.52, + "learning_rate": 1.8947987832266239e-06, + "loss": 0.8267, + "step": 20238 + }, + { + "epoch": 0.52, + "learning_rate": 1.8947864288665415e-06, + "loss": 0.8071, + "step": 20239 + }, + { + "epoch": 0.52, + "learning_rate": 1.8947740738213625e-06, + "loss": 0.7646, + "step": 20240 + }, + { + "epoch": 0.52, + "learning_rate": 1.894761718091096e-06, + "loss": 0.8877, + "step": 20241 + }, + { + "epoch": 0.52, + "learning_rate": 1.8947493616757515e-06, + "loss": 0.7402, + "step": 20242 + }, + { + "epoch": 0.52, + "learning_rate": 1.8947370045753389e-06, + "loss": 0.7993, + "step": 20243 + }, + { + "epoch": 0.52, + "learning_rate": 1.894724646789867e-06, + "loss": 0.9658, + "step": 20244 + }, + { + "epoch": 0.52, + "learning_rate": 1.8947122883193455e-06, + "loss": 0.7046, + "step": 20245 + }, + { + "epoch": 0.52, + "learning_rate": 1.894699929163784e-06, + "loss": 0.915, + "step": 20246 + }, + { + "epoch": 0.52, + "learning_rate": 1.8946875693231924e-06, + "loss": 0.959, + "step": 20247 + }, + { + "epoch": 0.52, + "learning_rate": 1.894675208797579e-06, + "loss": 0.7695, + "step": 20248 + }, + { + "epoch": 0.52, + "learning_rate": 1.894662847586954e-06, + "loss": 0.9688, + "step": 20249 + }, + { + "epoch": 0.52, + "learning_rate": 1.894650485691327e-06, + "loss": 0.918, + "step": 20250 + }, + { + "epoch": 0.52, + "learning_rate": 1.8946381231107074e-06, + "loss": 0.9023, + "step": 20251 + }, + { + "epoch": 0.52, + "learning_rate": 1.8946257598451042e-06, + "loss": 0.7153, + "step": 20252 + }, + { + "epoch": 0.52, + "learning_rate": 1.8946133958945274e-06, + "loss": 0.7939, + "step": 20253 + }, + { + "epoch": 0.52, + "learning_rate": 1.8946010312589861e-06, + "loss": 1.1436, + "step": 20254 + }, + { + "epoch": 0.52, + "learning_rate": 1.8945886659384902e-06, + "loss": 0.9434, + "step": 20255 + }, + { + "epoch": 0.52, + "learning_rate": 1.8945762999330489e-06, + "loss": 0.8369, + "step": 20256 + }, + { + "epoch": 0.52, + "learning_rate": 1.8945639332426713e-06, + "loss": 1.0312, + "step": 20257 + }, + { + "epoch": 0.52, + "learning_rate": 1.8945515658673674e-06, + "loss": 0.7734, + "step": 20258 + }, + { + "epoch": 0.52, + "learning_rate": 1.8945391978071466e-06, + "loss": 0.8682, + "step": 20259 + }, + { + "epoch": 0.52, + "learning_rate": 1.8945268290620183e-06, + "loss": 0.7275, + "step": 20260 + }, + { + "epoch": 0.52, + "learning_rate": 1.8945144596319917e-06, + "loss": 0.842, + "step": 20261 + }, + { + "epoch": 0.52, + "learning_rate": 1.8945020895170769e-06, + "loss": 0.8301, + "step": 20262 + }, + { + "epoch": 0.52, + "learning_rate": 1.8944897187172825e-06, + "loss": 0.9463, + "step": 20263 + }, + { + "epoch": 0.52, + "learning_rate": 1.8944773472326187e-06, + "loss": 1.0732, + "step": 20264 + }, + { + "epoch": 0.52, + "learning_rate": 1.8944649750630948e-06, + "loss": 0.792, + "step": 20265 + }, + { + "epoch": 0.52, + "learning_rate": 1.89445260220872e-06, + "loss": 0.8965, + "step": 20266 + }, + { + "epoch": 0.52, + "learning_rate": 1.894440228669504e-06, + "loss": 0.6323, + "step": 20267 + }, + { + "epoch": 0.52, + "learning_rate": 1.8944278544454564e-06, + "loss": 0.7603, + "step": 20268 + }, + { + "epoch": 0.52, + "learning_rate": 1.8944154795365862e-06, + "loss": 0.6909, + "step": 20269 + }, + { + "epoch": 0.52, + "learning_rate": 1.8944031039429037e-06, + "loss": 0.8516, + "step": 20270 + }, + { + "epoch": 0.52, + "learning_rate": 1.8943907276644175e-06, + "loss": 0.9346, + "step": 20271 + }, + { + "epoch": 0.52, + "learning_rate": 1.8943783507011375e-06, + "loss": 1.0449, + "step": 20272 + }, + { + "epoch": 0.52, + "learning_rate": 1.8943659730530731e-06, + "loss": 0.6333, + "step": 20273 + }, + { + "epoch": 0.52, + "learning_rate": 1.894353594720234e-06, + "loss": 0.9961, + "step": 20274 + }, + { + "epoch": 0.52, + "learning_rate": 1.8943412157026292e-06, + "loss": 0.8555, + "step": 20275 + }, + { + "epoch": 0.52, + "learning_rate": 1.8943288360002687e-06, + "loss": 0.8105, + "step": 20276 + }, + { + "epoch": 0.52, + "learning_rate": 1.8943164556131617e-06, + "loss": 0.8389, + "step": 20277 + }, + { + "epoch": 0.52, + "learning_rate": 1.8943040745413176e-06, + "loss": 0.832, + "step": 20278 + }, + { + "epoch": 0.52, + "learning_rate": 1.894291692784746e-06, + "loss": 0.832, + "step": 20279 + }, + { + "epoch": 0.52, + "learning_rate": 1.8942793103434563e-06, + "loss": 1.0244, + "step": 20280 + }, + { + "epoch": 0.52, + "learning_rate": 1.8942669272174583e-06, + "loss": 0.7744, + "step": 20281 + }, + { + "epoch": 0.52, + "learning_rate": 1.8942545434067609e-06, + "loss": 1.1143, + "step": 20282 + }, + { + "epoch": 0.52, + "learning_rate": 1.8942421589113743e-06, + "loss": 0.9736, + "step": 20283 + }, + { + "epoch": 0.52, + "learning_rate": 1.8942297737313072e-06, + "loss": 0.9258, + "step": 20284 + }, + { + "epoch": 0.52, + "learning_rate": 1.8942173878665696e-06, + "loss": 0.8989, + "step": 20285 + }, + { + "epoch": 0.52, + "learning_rate": 1.8942050013171711e-06, + "loss": 0.749, + "step": 20286 + }, + { + "epoch": 0.52, + "learning_rate": 1.8941926140831205e-06, + "loss": 0.729, + "step": 20287 + }, + { + "epoch": 0.52, + "learning_rate": 1.8941802261644284e-06, + "loss": 0.9199, + "step": 20288 + }, + { + "epoch": 0.52, + "learning_rate": 1.894167837561103e-06, + "loss": 0.8477, + "step": 20289 + }, + { + "epoch": 0.52, + "learning_rate": 1.8941554482731548e-06, + "loss": 0.6738, + "step": 20290 + }, + { + "epoch": 0.52, + "learning_rate": 1.8941430583005926e-06, + "loss": 0.7339, + "step": 20291 + }, + { + "epoch": 0.52, + "learning_rate": 1.8941306676434263e-06, + "loss": 0.8157, + "step": 20292 + }, + { + "epoch": 0.52, + "learning_rate": 1.8941182763016653e-06, + "loss": 0.9219, + "step": 20293 + }, + { + "epoch": 0.52, + "learning_rate": 1.8941058842753191e-06, + "loss": 0.8916, + "step": 20294 + }, + { + "epoch": 0.52, + "learning_rate": 1.894093491564397e-06, + "loss": 0.7676, + "step": 20295 + }, + { + "epoch": 0.52, + "learning_rate": 1.8940810981689086e-06, + "loss": 0.9736, + "step": 20296 + }, + { + "epoch": 0.52, + "learning_rate": 1.8940687040888635e-06, + "loss": 1.0898, + "step": 20297 + }, + { + "epoch": 0.52, + "learning_rate": 1.894056309324271e-06, + "loss": 0.8491, + "step": 20298 + }, + { + "epoch": 0.52, + "learning_rate": 1.8940439138751408e-06, + "loss": 0.7695, + "step": 20299 + }, + { + "epoch": 0.52, + "learning_rate": 1.8940315177414823e-06, + "loss": 0.6924, + "step": 20300 + }, + { + "epoch": 0.52, + "learning_rate": 1.8940191209233048e-06, + "loss": 0.8457, + "step": 20301 + }, + { + "epoch": 0.52, + "learning_rate": 1.894006723420618e-06, + "loss": 1.0225, + "step": 20302 + }, + { + "epoch": 0.52, + "learning_rate": 1.8939943252334317e-06, + "loss": 0.8506, + "step": 20303 + }, + { + "epoch": 0.52, + "learning_rate": 1.893981926361755e-06, + "loss": 0.793, + "step": 20304 + }, + { + "epoch": 0.52, + "learning_rate": 1.8939695268055971e-06, + "loss": 0.8701, + "step": 20305 + }, + { + "epoch": 0.52, + "learning_rate": 1.8939571265649681e-06, + "loss": 0.6436, + "step": 20306 + }, + { + "epoch": 0.52, + "learning_rate": 1.8939447256398768e-06, + "loss": 0.877, + "step": 20307 + }, + { + "epoch": 0.52, + "learning_rate": 1.8939323240303334e-06, + "loss": 0.8799, + "step": 20308 + }, + { + "epoch": 0.52, + "learning_rate": 1.8939199217363475e-06, + "loss": 0.8799, + "step": 20309 + }, + { + "epoch": 0.52, + "learning_rate": 1.8939075187579276e-06, + "loss": 0.9795, + "step": 20310 + }, + { + "epoch": 0.52, + "learning_rate": 1.893895115095084e-06, + "loss": 1.0752, + "step": 20311 + }, + { + "epoch": 0.52, + "learning_rate": 1.8938827107478263e-06, + "loss": 0.8867, + "step": 20312 + }, + { + "epoch": 0.52, + "learning_rate": 1.8938703057161635e-06, + "loss": 0.9873, + "step": 20313 + }, + { + "epoch": 0.52, + "learning_rate": 1.8938579000001056e-06, + "loss": 0.9629, + "step": 20314 + }, + { + "epoch": 0.52, + "learning_rate": 1.8938454935996616e-06, + "loss": 1.0137, + "step": 20315 + }, + { + "epoch": 0.52, + "learning_rate": 1.8938330865148412e-06, + "loss": 0.9414, + "step": 20316 + }, + { + "epoch": 0.52, + "learning_rate": 1.8938206787456537e-06, + "loss": 0.917, + "step": 20317 + }, + { + "epoch": 0.52, + "learning_rate": 1.893808270292109e-06, + "loss": 0.9883, + "step": 20318 + }, + { + "epoch": 0.52, + "learning_rate": 1.8937958611542164e-06, + "loss": 0.9971, + "step": 20319 + }, + { + "epoch": 0.52, + "learning_rate": 1.8937834513319854e-06, + "loss": 1.0029, + "step": 20320 + }, + { + "epoch": 0.52, + "learning_rate": 1.8937710408254255e-06, + "loss": 0.5774, + "step": 20321 + }, + { + "epoch": 0.52, + "learning_rate": 1.8937586296345462e-06, + "loss": 0.8486, + "step": 20322 + }, + { + "epoch": 0.52, + "learning_rate": 1.8937462177593568e-06, + "loss": 1.248, + "step": 20323 + }, + { + "epoch": 0.52, + "learning_rate": 1.8937338051998675e-06, + "loss": 0.8701, + "step": 20324 + }, + { + "epoch": 0.52, + "learning_rate": 1.893721391956087e-06, + "loss": 1.1572, + "step": 20325 + }, + { + "epoch": 0.52, + "learning_rate": 1.893708978028025e-06, + "loss": 0.8125, + "step": 20326 + }, + { + "epoch": 0.52, + "learning_rate": 1.8936965634156917e-06, + "loss": 0.7163, + "step": 20327 + }, + { + "epoch": 0.52, + "learning_rate": 1.8936841481190954e-06, + "loss": 0.9121, + "step": 20328 + }, + { + "epoch": 0.52, + "learning_rate": 1.8936717321382465e-06, + "loss": 1.084, + "step": 20329 + }, + { + "epoch": 0.52, + "learning_rate": 1.8936593154731542e-06, + "loss": 0.686, + "step": 20330 + }, + { + "epoch": 0.52, + "learning_rate": 1.893646898123828e-06, + "loss": 0.834, + "step": 20331 + }, + { + "epoch": 0.52, + "learning_rate": 1.8936344800902777e-06, + "loss": 0.8535, + "step": 20332 + }, + { + "epoch": 0.52, + "learning_rate": 1.8936220613725124e-06, + "loss": 0.7881, + "step": 20333 + }, + { + "epoch": 0.52, + "learning_rate": 1.8936096419705417e-06, + "loss": 0.6045, + "step": 20334 + }, + { + "epoch": 0.52, + "learning_rate": 1.8935972218843754e-06, + "loss": 0.9795, + "step": 20335 + }, + { + "epoch": 0.52, + "learning_rate": 1.8935848011140227e-06, + "loss": 0.8965, + "step": 20336 + }, + { + "epoch": 0.52, + "learning_rate": 1.8935723796594931e-06, + "loss": 0.812, + "step": 20337 + }, + { + "epoch": 0.52, + "learning_rate": 1.8935599575207962e-06, + "loss": 0.7939, + "step": 20338 + }, + { + "epoch": 0.52, + "learning_rate": 1.8935475346979416e-06, + "loss": 0.959, + "step": 20339 + }, + { + "epoch": 0.52, + "learning_rate": 1.893535111190939e-06, + "loss": 0.7456, + "step": 20340 + }, + { + "epoch": 0.52, + "learning_rate": 1.8935226869997973e-06, + "loss": 0.9707, + "step": 20341 + }, + { + "epoch": 0.52, + "learning_rate": 1.8935102621245265e-06, + "loss": 1.1318, + "step": 20342 + }, + { + "epoch": 0.52, + "learning_rate": 1.8934978365651359e-06, + "loss": 0.8506, + "step": 20343 + }, + { + "epoch": 0.52, + "learning_rate": 1.8934854103216353e-06, + "loss": 0.8193, + "step": 20344 + }, + { + "epoch": 0.52, + "learning_rate": 1.8934729833940337e-06, + "loss": 0.7188, + "step": 20345 + }, + { + "epoch": 0.52, + "learning_rate": 1.8934605557823411e-06, + "loss": 1.0215, + "step": 20346 + }, + { + "epoch": 0.52, + "learning_rate": 1.8934481274865668e-06, + "loss": 0.9062, + "step": 20347 + }, + { + "epoch": 0.52, + "learning_rate": 1.8934356985067204e-06, + "loss": 0.9346, + "step": 20348 + }, + { + "epoch": 0.52, + "learning_rate": 1.8934232688428114e-06, + "loss": 1.0039, + "step": 20349 + }, + { + "epoch": 0.52, + "learning_rate": 1.893410838494849e-06, + "loss": 0.6313, + "step": 20350 + }, + { + "epoch": 0.52, + "learning_rate": 1.8933984074628434e-06, + "loss": 0.917, + "step": 20351 + }, + { + "epoch": 0.52, + "learning_rate": 1.8933859757468033e-06, + "loss": 0.9229, + "step": 20352 + }, + { + "epoch": 0.52, + "learning_rate": 1.893373543346739e-06, + "loss": 0.9492, + "step": 20353 + }, + { + "epoch": 0.52, + "learning_rate": 1.8933611102626595e-06, + "loss": 0.6069, + "step": 20354 + }, + { + "epoch": 0.52, + "learning_rate": 1.8933486764945746e-06, + "loss": 0.7773, + "step": 20355 + }, + { + "epoch": 0.52, + "learning_rate": 1.8933362420424934e-06, + "loss": 0.6558, + "step": 20356 + }, + { + "epoch": 0.52, + "learning_rate": 1.8933238069064262e-06, + "loss": 1.0557, + "step": 20357 + }, + { + "epoch": 0.52, + "learning_rate": 1.8933113710863815e-06, + "loss": 0.9111, + "step": 20358 + }, + { + "epoch": 0.52, + "learning_rate": 1.8932989345823698e-06, + "loss": 0.8516, + "step": 20359 + }, + { + "epoch": 0.52, + "learning_rate": 1.8932864973944e-06, + "loss": 0.832, + "step": 20360 + }, + { + "epoch": 0.52, + "learning_rate": 1.8932740595224814e-06, + "loss": 1.0264, + "step": 20361 + }, + { + "epoch": 0.52, + "learning_rate": 1.8932616209666245e-06, + "loss": 0.7485, + "step": 20362 + }, + { + "epoch": 0.52, + "learning_rate": 1.893249181726838e-06, + "loss": 1.0146, + "step": 20363 + }, + { + "epoch": 0.52, + "learning_rate": 1.8932367418031318e-06, + "loss": 0.8132, + "step": 20364 + }, + { + "epoch": 0.52, + "learning_rate": 1.8932243011955152e-06, + "loss": 1.0127, + "step": 20365 + }, + { + "epoch": 0.52, + "learning_rate": 1.8932118599039979e-06, + "loss": 0.7288, + "step": 20366 + }, + { + "epoch": 0.52, + "learning_rate": 1.8931994179285893e-06, + "loss": 0.8076, + "step": 20367 + }, + { + "epoch": 0.52, + "learning_rate": 1.893186975269299e-06, + "loss": 0.7334, + "step": 20368 + }, + { + "epoch": 0.52, + "learning_rate": 1.8931745319261365e-06, + "loss": 0.8076, + "step": 20369 + }, + { + "epoch": 0.52, + "learning_rate": 1.8931620878991112e-06, + "loss": 1.1562, + "step": 20370 + }, + { + "epoch": 0.52, + "learning_rate": 1.893149643188233e-06, + "loss": 0.8633, + "step": 20371 + }, + { + "epoch": 0.52, + "learning_rate": 1.8931371977935111e-06, + "loss": 0.7827, + "step": 20372 + }, + { + "epoch": 0.52, + "learning_rate": 1.893124751714955e-06, + "loss": 0.646, + "step": 20373 + }, + { + "epoch": 0.52, + "learning_rate": 1.8931123049525746e-06, + "loss": 0.9229, + "step": 20374 + }, + { + "epoch": 0.52, + "learning_rate": 1.893099857506379e-06, + "loss": 0.9775, + "step": 20375 + }, + { + "epoch": 0.52, + "learning_rate": 1.8930874093763777e-06, + "loss": 0.9844, + "step": 20376 + }, + { + "epoch": 0.52, + "learning_rate": 1.8930749605625806e-06, + "loss": 1.0488, + "step": 20377 + }, + { + "epoch": 0.52, + "learning_rate": 1.893062511064997e-06, + "loss": 0.7754, + "step": 20378 + }, + { + "epoch": 0.52, + "learning_rate": 1.8930500608836369e-06, + "loss": 0.7002, + "step": 20379 + }, + { + "epoch": 0.52, + "learning_rate": 1.8930376100185091e-06, + "loss": 1.0684, + "step": 20380 + }, + { + "epoch": 0.52, + "learning_rate": 1.8930251584696234e-06, + "loss": 0.7959, + "step": 20381 + }, + { + "epoch": 0.52, + "learning_rate": 1.8930127062369897e-06, + "loss": 0.8887, + "step": 20382 + }, + { + "epoch": 0.52, + "learning_rate": 1.8930002533206169e-06, + "loss": 0.7881, + "step": 20383 + }, + { + "epoch": 0.52, + "learning_rate": 1.892987799720515e-06, + "loss": 0.8838, + "step": 20384 + }, + { + "epoch": 0.52, + "learning_rate": 1.8929753454366933e-06, + "loss": 0.8994, + "step": 20385 + }, + { + "epoch": 0.52, + "learning_rate": 1.8929628904691618e-06, + "loss": 0.6499, + "step": 20386 + }, + { + "epoch": 0.52, + "learning_rate": 1.8929504348179292e-06, + "loss": 0.8132, + "step": 20387 + }, + { + "epoch": 0.52, + "learning_rate": 1.8929379784830057e-06, + "loss": 0.8242, + "step": 20388 + }, + { + "epoch": 0.52, + "learning_rate": 1.892925521464401e-06, + "loss": 0.8135, + "step": 20389 + }, + { + "epoch": 0.52, + "learning_rate": 1.8929130637621236e-06, + "loss": 0.752, + "step": 20390 + }, + { + "epoch": 0.52, + "learning_rate": 1.8929006053761842e-06, + "loss": 1.1318, + "step": 20391 + }, + { + "epoch": 0.52, + "learning_rate": 1.8928881463065917e-06, + "loss": 0.6074, + "step": 20392 + }, + { + "epoch": 0.52, + "learning_rate": 1.8928756865533558e-06, + "loss": 0.9512, + "step": 20393 + }, + { + "epoch": 0.52, + "learning_rate": 1.892863226116486e-06, + "loss": 0.8916, + "step": 20394 + }, + { + "epoch": 0.52, + "learning_rate": 1.8928507649959922e-06, + "loss": 0.8965, + "step": 20395 + }, + { + "epoch": 0.52, + "learning_rate": 1.8928383031918833e-06, + "loss": 0.748, + "step": 20396 + }, + { + "epoch": 0.52, + "learning_rate": 1.8928258407041692e-06, + "loss": 0.9146, + "step": 20397 + }, + { + "epoch": 0.52, + "learning_rate": 1.8928133775328596e-06, + "loss": 1.0605, + "step": 20398 + }, + { + "epoch": 0.52, + "learning_rate": 1.8928009136779636e-06, + "loss": 0.6804, + "step": 20399 + }, + { + "epoch": 0.52, + "learning_rate": 1.8927884491394911e-06, + "loss": 0.835, + "step": 20400 + }, + { + "epoch": 0.52, + "learning_rate": 1.8927759839174518e-06, + "loss": 0.9824, + "step": 20401 + }, + { + "epoch": 0.52, + "learning_rate": 1.8927635180118546e-06, + "loss": 0.8506, + "step": 20402 + }, + { + "epoch": 0.52, + "learning_rate": 1.8927510514227096e-06, + "loss": 0.8604, + "step": 20403 + }, + { + "epoch": 0.52, + "learning_rate": 1.8927385841500261e-06, + "loss": 1.1318, + "step": 20404 + }, + { + "epoch": 0.52, + "learning_rate": 1.8927261161938138e-06, + "loss": 0.8164, + "step": 20405 + }, + { + "epoch": 0.52, + "learning_rate": 1.892713647554082e-06, + "loss": 0.7637, + "step": 20406 + }, + { + "epoch": 0.52, + "learning_rate": 1.8927011782308403e-06, + "loss": 0.9746, + "step": 20407 + }, + { + "epoch": 0.52, + "learning_rate": 1.8926887082240987e-06, + "loss": 0.689, + "step": 20408 + }, + { + "epoch": 0.52, + "learning_rate": 1.8926762375338664e-06, + "loss": 0.8809, + "step": 20409 + }, + { + "epoch": 0.52, + "learning_rate": 1.8926637661601527e-06, + "loss": 0.9678, + "step": 20410 + }, + { + "epoch": 0.52, + "learning_rate": 1.8926512941029675e-06, + "loss": 0.6665, + "step": 20411 + }, + { + "epoch": 0.52, + "learning_rate": 1.8926388213623202e-06, + "loss": 0.8916, + "step": 20412 + }, + { + "epoch": 0.52, + "learning_rate": 1.8926263479382208e-06, + "loss": 1.083, + "step": 20413 + }, + { + "epoch": 0.52, + "learning_rate": 1.892613873830678e-06, + "loss": 0.8945, + "step": 20414 + }, + { + "epoch": 0.52, + "learning_rate": 1.892601399039702e-06, + "loss": 0.7275, + "step": 20415 + }, + { + "epoch": 0.52, + "learning_rate": 1.8925889235653018e-06, + "loss": 0.7505, + "step": 20416 + }, + { + "epoch": 0.52, + "learning_rate": 1.8925764474074878e-06, + "loss": 0.8975, + "step": 20417 + }, + { + "epoch": 0.52, + "learning_rate": 1.8925639705662687e-06, + "loss": 0.7075, + "step": 20418 + }, + { + "epoch": 0.52, + "learning_rate": 1.8925514930416545e-06, + "loss": 0.9102, + "step": 20419 + }, + { + "epoch": 0.52, + "learning_rate": 1.8925390148336549e-06, + "loss": 0.9062, + "step": 20420 + }, + { + "epoch": 0.52, + "learning_rate": 1.892526535942279e-06, + "loss": 0.9824, + "step": 20421 + }, + { + "epoch": 0.52, + "learning_rate": 1.8925140563675365e-06, + "loss": 0.8984, + "step": 20422 + }, + { + "epoch": 0.52, + "learning_rate": 1.8925015761094372e-06, + "loss": 0.9287, + "step": 20423 + }, + { + "epoch": 0.52, + "learning_rate": 1.8924890951679902e-06, + "loss": 1.0029, + "step": 20424 + }, + { + "epoch": 0.52, + "learning_rate": 1.8924766135432057e-06, + "loss": 0.8213, + "step": 20425 + }, + { + "epoch": 0.52, + "learning_rate": 1.8924641312350926e-06, + "loss": 0.7041, + "step": 20426 + }, + { + "epoch": 0.52, + "learning_rate": 1.8924516482436607e-06, + "loss": 0.9229, + "step": 20427 + }, + { + "epoch": 0.52, + "learning_rate": 1.89243916456892e-06, + "loss": 0.7549, + "step": 20428 + }, + { + "epoch": 0.52, + "learning_rate": 1.8924266802108795e-06, + "loss": 0.916, + "step": 20429 + }, + { + "epoch": 0.52, + "learning_rate": 1.892414195169549e-06, + "loss": 0.8252, + "step": 20430 + }, + { + "epoch": 0.52, + "learning_rate": 1.8924017094449378e-06, + "loss": 0.8125, + "step": 20431 + }, + { + "epoch": 0.52, + "learning_rate": 1.8923892230370554e-06, + "loss": 0.9883, + "step": 20432 + }, + { + "epoch": 0.52, + "learning_rate": 1.8923767359459123e-06, + "loss": 0.8057, + "step": 20433 + }, + { + "epoch": 0.52, + "learning_rate": 1.8923642481715168e-06, + "loss": 0.8809, + "step": 20434 + }, + { + "epoch": 0.52, + "learning_rate": 1.8923517597138793e-06, + "loss": 1.0029, + "step": 20435 + }, + { + "epoch": 0.52, + "learning_rate": 1.8923392705730091e-06, + "loss": 0.8682, + "step": 20436 + }, + { + "epoch": 0.52, + "learning_rate": 1.8923267807489154e-06, + "loss": 0.9922, + "step": 20437 + }, + { + "epoch": 0.52, + "learning_rate": 1.8923142902416083e-06, + "loss": 0.9072, + "step": 20438 + }, + { + "epoch": 0.52, + "learning_rate": 1.8923017990510974e-06, + "loss": 0.8413, + "step": 20439 + }, + { + "epoch": 0.52, + "learning_rate": 1.8922893071773917e-06, + "loss": 0.7559, + "step": 20440 + }, + { + "epoch": 0.52, + "learning_rate": 1.8922768146205014e-06, + "loss": 0.6235, + "step": 20441 + }, + { + "epoch": 0.52, + "learning_rate": 1.8922643213804357e-06, + "loss": 0.7842, + "step": 20442 + }, + { + "epoch": 0.52, + "learning_rate": 1.8922518274572042e-06, + "loss": 0.9424, + "step": 20443 + }, + { + "epoch": 0.52, + "learning_rate": 1.8922393328508167e-06, + "loss": 0.9717, + "step": 20444 + }, + { + "epoch": 0.52, + "learning_rate": 1.892226837561282e-06, + "loss": 0.9404, + "step": 20445 + }, + { + "epoch": 0.52, + "learning_rate": 1.8922143415886107e-06, + "loss": 0.9648, + "step": 20446 + }, + { + "epoch": 0.52, + "learning_rate": 1.8922018449328117e-06, + "loss": 0.9209, + "step": 20447 + }, + { + "epoch": 0.52, + "learning_rate": 1.892189347593895e-06, + "loss": 0.8516, + "step": 20448 + }, + { + "epoch": 0.52, + "learning_rate": 1.8921768495718697e-06, + "loss": 0.8018, + "step": 20449 + }, + { + "epoch": 0.52, + "learning_rate": 1.892164350866746e-06, + "loss": 0.9385, + "step": 20450 + }, + { + "epoch": 0.52, + "learning_rate": 1.8921518514785325e-06, + "loss": 0.8916, + "step": 20451 + }, + { + "epoch": 0.52, + "learning_rate": 1.8921393514072399e-06, + "loss": 0.73, + "step": 20452 + }, + { + "epoch": 0.52, + "learning_rate": 1.892126850652877e-06, + "loss": 0.8589, + "step": 20453 + }, + { + "epoch": 0.52, + "learning_rate": 1.8921143492154533e-06, + "loss": 1.0352, + "step": 20454 + }, + { + "epoch": 0.52, + "learning_rate": 1.8921018470949792e-06, + "loss": 0.9551, + "step": 20455 + }, + { + "epoch": 0.52, + "learning_rate": 1.8920893442914633e-06, + "loss": 1.002, + "step": 20456 + }, + { + "epoch": 0.52, + "learning_rate": 1.8920768408049156e-06, + "loss": 0.7627, + "step": 20457 + }, + { + "epoch": 0.52, + "learning_rate": 1.8920643366353461e-06, + "loss": 1.0283, + "step": 20458 + }, + { + "epoch": 0.52, + "learning_rate": 1.8920518317827638e-06, + "loss": 0.7734, + "step": 20459 + }, + { + "epoch": 0.52, + "learning_rate": 1.8920393262471782e-06, + "loss": 1.0254, + "step": 20460 + }, + { + "epoch": 0.52, + "learning_rate": 1.8920268200285992e-06, + "loss": 0.9375, + "step": 20461 + }, + { + "epoch": 0.52, + "learning_rate": 1.8920143131270363e-06, + "loss": 0.8613, + "step": 20462 + }, + { + "epoch": 0.52, + "learning_rate": 1.8920018055424993e-06, + "loss": 0.8008, + "step": 20463 + }, + { + "epoch": 0.52, + "learning_rate": 1.8919892972749972e-06, + "loss": 0.9307, + "step": 20464 + }, + { + "epoch": 0.52, + "learning_rate": 1.89197678832454e-06, + "loss": 0.9951, + "step": 20465 + }, + { + "epoch": 0.52, + "learning_rate": 1.8919642786911374e-06, + "loss": 1.0703, + "step": 20466 + }, + { + "epoch": 0.52, + "learning_rate": 1.8919517683747985e-06, + "loss": 0.793, + "step": 20467 + }, + { + "epoch": 0.52, + "learning_rate": 1.8919392573755332e-06, + "loss": 0.9165, + "step": 20468 + }, + { + "epoch": 0.52, + "learning_rate": 1.891926745693351e-06, + "loss": 0.8965, + "step": 20469 + }, + { + "epoch": 0.52, + "learning_rate": 1.8919142333282614e-06, + "loss": 0.7783, + "step": 20470 + }, + { + "epoch": 0.52, + "learning_rate": 1.8919017202802742e-06, + "loss": 0.8848, + "step": 20471 + }, + { + "epoch": 0.52, + "learning_rate": 1.8918892065493992e-06, + "loss": 0.877, + "step": 20472 + }, + { + "epoch": 0.52, + "learning_rate": 1.8918766921356451e-06, + "loss": 0.8496, + "step": 20473 + }, + { + "epoch": 0.52, + "learning_rate": 1.8918641770390224e-06, + "loss": 0.7954, + "step": 20474 + }, + { + "epoch": 0.52, + "learning_rate": 1.8918516612595404e-06, + "loss": 0.7974, + "step": 20475 + }, + { + "epoch": 0.52, + "learning_rate": 1.891839144797208e-06, + "loss": 0.6758, + "step": 20476 + }, + { + "epoch": 0.52, + "learning_rate": 1.8918266276520358e-06, + "loss": 0.8418, + "step": 20477 + }, + { + "epoch": 0.52, + "learning_rate": 1.891814109824033e-06, + "loss": 0.9756, + "step": 20478 + }, + { + "epoch": 0.52, + "learning_rate": 1.891801591313209e-06, + "loss": 0.9385, + "step": 20479 + }, + { + "epoch": 0.52, + "learning_rate": 1.8917890721195735e-06, + "loss": 0.6494, + "step": 20480 + }, + { + "epoch": 0.52, + "learning_rate": 1.891776552243136e-06, + "loss": 0.6934, + "step": 20481 + }, + { + "epoch": 0.52, + "learning_rate": 1.8917640316839068e-06, + "loss": 0.8379, + "step": 20482 + }, + { + "epoch": 0.52, + "learning_rate": 1.8917515104418942e-06, + "loss": 0.7603, + "step": 20483 + }, + { + "epoch": 0.53, + "learning_rate": 1.891738988517109e-06, + "loss": 0.7085, + "step": 20484 + }, + { + "epoch": 0.53, + "learning_rate": 1.89172646590956e-06, + "loss": 0.9141, + "step": 20485 + }, + { + "epoch": 0.53, + "learning_rate": 1.8917139426192569e-06, + "loss": 0.9521, + "step": 20486 + }, + { + "epoch": 0.53, + "learning_rate": 1.8917014186462094e-06, + "loss": 1.0254, + "step": 20487 + }, + { + "epoch": 0.53, + "learning_rate": 1.8916888939904277e-06, + "loss": 1.0146, + "step": 20488 + }, + { + "epoch": 0.53, + "learning_rate": 1.8916763686519205e-06, + "loss": 0.4692, + "step": 20489 + }, + { + "epoch": 0.53, + "learning_rate": 1.8916638426306975e-06, + "loss": 0.9272, + "step": 20490 + }, + { + "epoch": 0.53, + "learning_rate": 1.8916513159267685e-06, + "loss": 0.7969, + "step": 20491 + }, + { + "epoch": 0.53, + "learning_rate": 1.8916387885401433e-06, + "loss": 0.8799, + "step": 20492 + }, + { + "epoch": 0.53, + "learning_rate": 1.891626260470831e-06, + "loss": 0.8711, + "step": 20493 + }, + { + "epoch": 0.53, + "learning_rate": 1.8916137317188419e-06, + "loss": 0.8066, + "step": 20494 + }, + { + "epoch": 0.53, + "learning_rate": 1.8916012022841848e-06, + "loss": 0.7036, + "step": 20495 + }, + { + "epoch": 0.53, + "learning_rate": 1.8915886721668697e-06, + "loss": 0.9873, + "step": 20496 + }, + { + "epoch": 0.53, + "learning_rate": 1.8915761413669063e-06, + "loss": 0.8096, + "step": 20497 + }, + { + "epoch": 0.53, + "learning_rate": 1.891563609884304e-06, + "loss": 0.6763, + "step": 20498 + }, + { + "epoch": 0.53, + "learning_rate": 1.8915510777190722e-06, + "loss": 0.9131, + "step": 20499 + }, + { + "epoch": 0.53, + "learning_rate": 1.8915385448712211e-06, + "loss": 0.9277, + "step": 20500 + }, + { + "epoch": 0.53, + "learning_rate": 1.8915260113407597e-06, + "loss": 0.8037, + "step": 20501 + }, + { + "epoch": 0.53, + "learning_rate": 1.891513477127698e-06, + "loss": 0.8682, + "step": 20502 + }, + { + "epoch": 0.53, + "learning_rate": 1.8915009422320454e-06, + "loss": 0.7529, + "step": 20503 + }, + { + "epoch": 0.53, + "learning_rate": 1.8914884066538113e-06, + "loss": 0.8701, + "step": 20504 + }, + { + "epoch": 0.53, + "learning_rate": 1.8914758703930059e-06, + "loss": 0.7627, + "step": 20505 + }, + { + "epoch": 0.53, + "learning_rate": 1.891463333449638e-06, + "loss": 0.8086, + "step": 20506 + }, + { + "epoch": 0.53, + "learning_rate": 1.8914507958237179e-06, + "loss": 0.8779, + "step": 20507 + }, + { + "epoch": 0.53, + "learning_rate": 1.8914382575152548e-06, + "loss": 0.8281, + "step": 20508 + }, + { + "epoch": 0.53, + "learning_rate": 1.8914257185242585e-06, + "loss": 0.7334, + "step": 20509 + }, + { + "epoch": 0.53, + "learning_rate": 1.8914131788507382e-06, + "loss": 0.9922, + "step": 20510 + }, + { + "epoch": 0.53, + "learning_rate": 1.891400638494704e-06, + "loss": 0.7666, + "step": 20511 + }, + { + "epoch": 0.53, + "learning_rate": 1.8913880974561655e-06, + "loss": 0.7266, + "step": 20512 + }, + { + "epoch": 0.53, + "learning_rate": 1.891375555735132e-06, + "loss": 0.7935, + "step": 20513 + }, + { + "epoch": 0.53, + "learning_rate": 1.8913630133316132e-06, + "loss": 0.6172, + "step": 20514 + }, + { + "epoch": 0.53, + "learning_rate": 1.891350470245619e-06, + "loss": 0.7764, + "step": 20515 + }, + { + "epoch": 0.53, + "learning_rate": 1.8913379264771584e-06, + "loss": 0.8604, + "step": 20516 + }, + { + "epoch": 0.53, + "learning_rate": 1.8913253820262415e-06, + "loss": 1.0059, + "step": 20517 + }, + { + "epoch": 0.53, + "learning_rate": 1.8913128368928775e-06, + "loss": 0.959, + "step": 20518 + }, + { + "epoch": 0.53, + "learning_rate": 1.8913002910770763e-06, + "loss": 1.0811, + "step": 20519 + }, + { + "epoch": 0.53, + "learning_rate": 1.8912877445788475e-06, + "loss": 0.8818, + "step": 20520 + }, + { + "epoch": 0.53, + "learning_rate": 1.891275197398201e-06, + "loss": 0.7725, + "step": 20521 + }, + { + "epoch": 0.53, + "learning_rate": 1.8912626495351456e-06, + "loss": 0.9297, + "step": 20522 + }, + { + "epoch": 0.53, + "learning_rate": 1.8912501009896915e-06, + "loss": 0.8857, + "step": 20523 + }, + { + "epoch": 0.53, + "learning_rate": 1.8912375517618485e-06, + "loss": 0.8047, + "step": 20524 + }, + { + "epoch": 0.53, + "learning_rate": 1.8912250018516253e-06, + "loss": 1.0527, + "step": 20525 + }, + { + "epoch": 0.53, + "learning_rate": 1.8912124512590326e-06, + "loss": 0.9229, + "step": 20526 + }, + { + "epoch": 0.53, + "learning_rate": 1.8911998999840792e-06, + "loss": 0.873, + "step": 20527 + }, + { + "epoch": 0.53, + "learning_rate": 1.8911873480267752e-06, + "loss": 0.668, + "step": 20528 + }, + { + "epoch": 0.53, + "learning_rate": 1.8911747953871298e-06, + "loss": 0.9551, + "step": 20529 + }, + { + "epoch": 0.53, + "learning_rate": 1.8911622420651532e-06, + "loss": 0.8594, + "step": 20530 + }, + { + "epoch": 0.53, + "learning_rate": 1.8911496880608545e-06, + "loss": 0.9697, + "step": 20531 + }, + { + "epoch": 0.53, + "learning_rate": 1.8911371333742432e-06, + "loss": 0.958, + "step": 20532 + }, + { + "epoch": 0.53, + "learning_rate": 1.8911245780053293e-06, + "loss": 1.0117, + "step": 20533 + }, + { + "epoch": 0.53, + "learning_rate": 1.8911120219541226e-06, + "loss": 0.7812, + "step": 20534 + }, + { + "epoch": 0.53, + "learning_rate": 1.8910994652206318e-06, + "loss": 0.8574, + "step": 20535 + }, + { + "epoch": 0.53, + "learning_rate": 1.8910869078048677e-06, + "loss": 0.5759, + "step": 20536 + }, + { + "epoch": 0.53, + "learning_rate": 1.891074349706839e-06, + "loss": 0.8818, + "step": 20537 + }, + { + "epoch": 0.53, + "learning_rate": 1.8910617909265559e-06, + "loss": 0.9424, + "step": 20538 + }, + { + "epoch": 0.53, + "learning_rate": 1.8910492314640277e-06, + "loss": 1.0264, + "step": 20539 + }, + { + "epoch": 0.53, + "learning_rate": 1.8910366713192638e-06, + "loss": 0.8477, + "step": 20540 + }, + { + "epoch": 0.53, + "learning_rate": 1.8910241104922741e-06, + "loss": 0.7612, + "step": 20541 + }, + { + "epoch": 0.53, + "learning_rate": 1.8910115489830685e-06, + "loss": 0.9766, + "step": 20542 + }, + { + "epoch": 0.53, + "learning_rate": 1.890998986791656e-06, + "loss": 0.7939, + "step": 20543 + }, + { + "epoch": 0.53, + "learning_rate": 1.8909864239180469e-06, + "loss": 0.8271, + "step": 20544 + }, + { + "epoch": 0.53, + "learning_rate": 1.8909738603622502e-06, + "loss": 1.1289, + "step": 20545 + }, + { + "epoch": 0.53, + "learning_rate": 1.890961296124276e-06, + "loss": 1.0078, + "step": 20546 + }, + { + "epoch": 0.53, + "learning_rate": 1.8909487312041335e-06, + "loss": 0.8184, + "step": 20547 + }, + { + "epoch": 0.53, + "learning_rate": 1.8909361656018326e-06, + "loss": 0.9526, + "step": 20548 + }, + { + "epoch": 0.53, + "learning_rate": 1.8909235993173832e-06, + "loss": 0.9385, + "step": 20549 + }, + { + "epoch": 0.53, + "learning_rate": 1.890911032350794e-06, + "loss": 0.8262, + "step": 20550 + }, + { + "epoch": 0.53, + "learning_rate": 1.8908984647020754e-06, + "loss": 0.7524, + "step": 20551 + }, + { + "epoch": 0.53, + "learning_rate": 1.8908858963712368e-06, + "loss": 0.7075, + "step": 20552 + }, + { + "epoch": 0.53, + "learning_rate": 1.890873327358288e-06, + "loss": 0.7249, + "step": 20553 + }, + { + "epoch": 0.53, + "learning_rate": 1.8908607576632383e-06, + "loss": 0.8008, + "step": 20554 + }, + { + "epoch": 0.53, + "learning_rate": 1.8908481872860972e-06, + "loss": 0.8555, + "step": 20555 + }, + { + "epoch": 0.53, + "learning_rate": 1.890835616226875e-06, + "loss": 0.8701, + "step": 20556 + }, + { + "epoch": 0.53, + "learning_rate": 1.890823044485581e-06, + "loss": 0.7224, + "step": 20557 + }, + { + "epoch": 0.53, + "learning_rate": 1.8908104720622244e-06, + "loss": 0.9229, + "step": 20558 + }, + { + "epoch": 0.53, + "learning_rate": 1.8907978989568156e-06, + "loss": 0.8252, + "step": 20559 + }, + { + "epoch": 0.53, + "learning_rate": 1.8907853251693636e-06, + "loss": 0.7661, + "step": 20560 + }, + { + "epoch": 0.53, + "learning_rate": 1.8907727506998781e-06, + "loss": 0.9502, + "step": 20561 + }, + { + "epoch": 0.53, + "learning_rate": 1.890760175548369e-06, + "loss": 1.0684, + "step": 20562 + }, + { + "epoch": 0.53, + "learning_rate": 1.8907475997148456e-06, + "loss": 0.9189, + "step": 20563 + }, + { + "epoch": 0.53, + "learning_rate": 1.890735023199318e-06, + "loss": 0.7754, + "step": 20564 + }, + { + "epoch": 0.53, + "learning_rate": 1.8907224460017954e-06, + "loss": 0.9014, + "step": 20565 + }, + { + "epoch": 0.53, + "learning_rate": 1.8907098681222876e-06, + "loss": 0.8291, + "step": 20566 + }, + { + "epoch": 0.53, + "learning_rate": 1.8906972895608042e-06, + "loss": 0.8125, + "step": 20567 + }, + { + "epoch": 0.53, + "learning_rate": 1.8906847103173548e-06, + "loss": 0.6978, + "step": 20568 + }, + { + "epoch": 0.53, + "learning_rate": 1.8906721303919493e-06, + "loss": 1.0898, + "step": 20569 + }, + { + "epoch": 0.53, + "learning_rate": 1.8906595497845967e-06, + "loss": 0.7046, + "step": 20570 + }, + { + "epoch": 0.53, + "learning_rate": 1.8906469684953075e-06, + "loss": 0.9814, + "step": 20571 + }, + { + "epoch": 0.53, + "learning_rate": 1.8906343865240908e-06, + "loss": 1.0107, + "step": 20572 + }, + { + "epoch": 0.53, + "learning_rate": 1.8906218038709559e-06, + "loss": 1.1104, + "step": 20573 + }, + { + "epoch": 0.53, + "learning_rate": 1.8906092205359132e-06, + "loss": 0.9395, + "step": 20574 + }, + { + "epoch": 0.53, + "learning_rate": 1.8905966365189718e-06, + "loss": 0.8096, + "step": 20575 + }, + { + "epoch": 0.53, + "learning_rate": 1.8905840518201416e-06, + "loss": 0.9102, + "step": 20576 + }, + { + "epoch": 0.53, + "learning_rate": 1.890571466439432e-06, + "loss": 0.8428, + "step": 20577 + }, + { + "epoch": 0.53, + "learning_rate": 1.890558880376853e-06, + "loss": 1.0098, + "step": 20578 + }, + { + "epoch": 0.53, + "learning_rate": 1.890546293632414e-06, + "loss": 0.7959, + "step": 20579 + }, + { + "epoch": 0.53, + "learning_rate": 1.8905337062061244e-06, + "loss": 0.9053, + "step": 20580 + }, + { + "epoch": 0.53, + "learning_rate": 1.8905211180979944e-06, + "loss": 0.9785, + "step": 20581 + }, + { + "epoch": 0.53, + "learning_rate": 1.890508529308033e-06, + "loss": 0.957, + "step": 20582 + }, + { + "epoch": 0.53, + "learning_rate": 1.8904959398362506e-06, + "loss": 0.6851, + "step": 20583 + }, + { + "epoch": 0.53, + "learning_rate": 1.890483349682656e-06, + "loss": 0.9258, + "step": 20584 + }, + { + "epoch": 0.53, + "learning_rate": 1.8904707588472593e-06, + "loss": 0.9365, + "step": 20585 + }, + { + "epoch": 0.53, + "learning_rate": 1.8904581673300704e-06, + "loss": 0.9639, + "step": 20586 + }, + { + "epoch": 0.53, + "learning_rate": 1.8904455751310982e-06, + "loss": 0.8306, + "step": 20587 + }, + { + "epoch": 0.53, + "learning_rate": 1.890432982250353e-06, + "loss": 0.9058, + "step": 20588 + }, + { + "epoch": 0.53, + "learning_rate": 1.8904203886878443e-06, + "loss": 1.0225, + "step": 20589 + }, + { + "epoch": 0.53, + "learning_rate": 1.8904077944435812e-06, + "loss": 0.9531, + "step": 20590 + }, + { + "epoch": 0.53, + "learning_rate": 1.8903951995175742e-06, + "loss": 0.6475, + "step": 20591 + }, + { + "epoch": 0.53, + "learning_rate": 1.8903826039098324e-06, + "loss": 0.6904, + "step": 20592 + }, + { + "epoch": 0.53, + "learning_rate": 1.890370007620366e-06, + "loss": 0.8867, + "step": 20593 + }, + { + "epoch": 0.53, + "learning_rate": 1.8903574106491836e-06, + "loss": 0.9766, + "step": 20594 + }, + { + "epoch": 0.53, + "learning_rate": 1.8903448129962957e-06, + "loss": 0.9336, + "step": 20595 + }, + { + "epoch": 0.53, + "learning_rate": 1.8903322146617118e-06, + "loss": 0.8467, + "step": 20596 + }, + { + "epoch": 0.53, + "learning_rate": 1.8903196156454415e-06, + "loss": 1.0703, + "step": 20597 + }, + { + "epoch": 0.53, + "learning_rate": 1.8903070159474943e-06, + "loss": 0.9443, + "step": 20598 + }, + { + "epoch": 0.53, + "learning_rate": 1.89029441556788e-06, + "loss": 0.9893, + "step": 20599 + }, + { + "epoch": 0.53, + "learning_rate": 1.890281814506608e-06, + "loss": 0.8232, + "step": 20600 + }, + { + "epoch": 0.53, + "learning_rate": 1.8902692127636883e-06, + "loss": 0.7246, + "step": 20601 + }, + { + "epoch": 0.53, + "learning_rate": 1.8902566103391305e-06, + "loss": 0.9951, + "step": 20602 + }, + { + "epoch": 0.53, + "learning_rate": 1.890244007232944e-06, + "loss": 0.8594, + "step": 20603 + }, + { + "epoch": 0.53, + "learning_rate": 1.8902314034451387e-06, + "loss": 0.521, + "step": 20604 + }, + { + "epoch": 0.53, + "learning_rate": 1.890218798975724e-06, + "loss": 0.9775, + "step": 20605 + }, + { + "epoch": 0.53, + "learning_rate": 1.89020619382471e-06, + "loss": 0.7139, + "step": 20606 + }, + { + "epoch": 0.53, + "learning_rate": 1.8901935879921058e-06, + "loss": 0.8745, + "step": 20607 + }, + { + "epoch": 0.53, + "learning_rate": 1.8901809814779215e-06, + "loss": 0.7573, + "step": 20608 + }, + { + "epoch": 0.53, + "learning_rate": 1.8901683742821663e-06, + "loss": 0.9072, + "step": 20609 + }, + { + "epoch": 0.53, + "learning_rate": 1.8901557664048502e-06, + "loss": 0.688, + "step": 20610 + }, + { + "epoch": 0.53, + "learning_rate": 1.8901431578459827e-06, + "loss": 0.814, + "step": 20611 + }, + { + "epoch": 0.53, + "learning_rate": 1.890130548605574e-06, + "loss": 0.5884, + "step": 20612 + }, + { + "epoch": 0.53, + "learning_rate": 1.8901179386836326e-06, + "loss": 0.9512, + "step": 20613 + }, + { + "epoch": 0.53, + "learning_rate": 1.890105328080169e-06, + "loss": 0.8486, + "step": 20614 + }, + { + "epoch": 0.53, + "learning_rate": 1.890092716795193e-06, + "loss": 0.792, + "step": 20615 + }, + { + "epoch": 0.53, + "learning_rate": 1.8900801048287137e-06, + "loss": 0.7002, + "step": 20616 + }, + { + "epoch": 0.53, + "learning_rate": 1.8900674921807409e-06, + "loss": 0.9375, + "step": 20617 + }, + { + "epoch": 0.53, + "learning_rate": 1.8900548788512845e-06, + "loss": 0.7466, + "step": 20618 + }, + { + "epoch": 0.53, + "learning_rate": 1.8900422648403538e-06, + "loss": 0.8271, + "step": 20619 + }, + { + "epoch": 0.53, + "learning_rate": 1.890029650147959e-06, + "loss": 0.7744, + "step": 20620 + }, + { + "epoch": 0.53, + "learning_rate": 1.8900170347741092e-06, + "loss": 0.8799, + "step": 20621 + }, + { + "epoch": 0.53, + "learning_rate": 1.8900044187188142e-06, + "loss": 0.6836, + "step": 20622 + }, + { + "epoch": 0.53, + "learning_rate": 1.889991801982084e-06, + "loss": 0.8613, + "step": 20623 + }, + { + "epoch": 0.53, + "learning_rate": 1.8899791845639276e-06, + "loss": 0.9736, + "step": 20624 + }, + { + "epoch": 0.53, + "learning_rate": 1.8899665664643555e-06, + "loss": 0.7808, + "step": 20625 + }, + { + "epoch": 0.53, + "learning_rate": 1.889953947683377e-06, + "loss": 1.0254, + "step": 20626 + }, + { + "epoch": 0.53, + "learning_rate": 1.8899413282210014e-06, + "loss": 0.9258, + "step": 20627 + }, + { + "epoch": 0.53, + "learning_rate": 1.8899287080772385e-06, + "loss": 0.7354, + "step": 20628 + }, + { + "epoch": 0.53, + "learning_rate": 1.8899160872520983e-06, + "loss": 0.7227, + "step": 20629 + }, + { + "epoch": 0.53, + "learning_rate": 1.88990346574559e-06, + "loss": 0.7959, + "step": 20630 + }, + { + "epoch": 0.53, + "learning_rate": 1.8898908435577238e-06, + "loss": 1.0405, + "step": 20631 + }, + { + "epoch": 0.53, + "learning_rate": 1.8898782206885091e-06, + "loss": 0.627, + "step": 20632 + }, + { + "epoch": 0.53, + "learning_rate": 1.8898655971379558e-06, + "loss": 0.9932, + "step": 20633 + }, + { + "epoch": 0.53, + "learning_rate": 1.8898529729060728e-06, + "loss": 0.6885, + "step": 20634 + }, + { + "epoch": 0.53, + "learning_rate": 1.8898403479928707e-06, + "loss": 0.8799, + "step": 20635 + }, + { + "epoch": 0.53, + "learning_rate": 1.8898277223983588e-06, + "loss": 0.9434, + "step": 20636 + }, + { + "epoch": 0.53, + "learning_rate": 1.8898150961225462e-06, + "loss": 0.8799, + "step": 20637 + }, + { + "epoch": 0.53, + "learning_rate": 1.8898024691654438e-06, + "loss": 0.7305, + "step": 20638 + }, + { + "epoch": 0.53, + "learning_rate": 1.8897898415270599e-06, + "loss": 0.8691, + "step": 20639 + }, + { + "epoch": 0.53, + "learning_rate": 1.8897772132074053e-06, + "loss": 0.605, + "step": 20640 + }, + { + "epoch": 0.53, + "learning_rate": 1.889764584206489e-06, + "loss": 0.7773, + "step": 20641 + }, + { + "epoch": 0.53, + "learning_rate": 1.8897519545243207e-06, + "loss": 1.0371, + "step": 20642 + }, + { + "epoch": 0.53, + "learning_rate": 1.8897393241609107e-06, + "loss": 0.8672, + "step": 20643 + }, + { + "epoch": 0.53, + "learning_rate": 1.8897266931162678e-06, + "loss": 0.9062, + "step": 20644 + }, + { + "epoch": 0.53, + "learning_rate": 1.8897140613904025e-06, + "loss": 0.8896, + "step": 20645 + }, + { + "epoch": 0.53, + "learning_rate": 1.8897014289833237e-06, + "loss": 0.594, + "step": 20646 + }, + { + "epoch": 0.53, + "learning_rate": 1.8896887958950415e-06, + "loss": 0.9375, + "step": 20647 + }, + { + "epoch": 0.53, + "learning_rate": 1.8896761621255657e-06, + "loss": 0.8813, + "step": 20648 + }, + { + "epoch": 0.53, + "learning_rate": 1.8896635276749055e-06, + "loss": 0.9297, + "step": 20649 + }, + { + "epoch": 0.53, + "learning_rate": 1.889650892543071e-06, + "loss": 0.75, + "step": 20650 + }, + { + "epoch": 0.53, + "learning_rate": 1.8896382567300714e-06, + "loss": 0.8799, + "step": 20651 + }, + { + "epoch": 0.53, + "learning_rate": 1.8896256202359174e-06, + "loss": 0.7959, + "step": 20652 + }, + { + "epoch": 0.53, + "learning_rate": 1.8896129830606173e-06, + "loss": 0.6172, + "step": 20653 + }, + { + "epoch": 0.53, + "learning_rate": 1.8896003452041817e-06, + "loss": 0.7036, + "step": 20654 + }, + { + "epoch": 0.53, + "learning_rate": 1.88958770666662e-06, + "loss": 0.6692, + "step": 20655 + }, + { + "epoch": 0.53, + "learning_rate": 1.8895750674479421e-06, + "loss": 0.8506, + "step": 20656 + }, + { + "epoch": 0.53, + "learning_rate": 1.889562427548157e-06, + "loss": 0.8667, + "step": 20657 + }, + { + "epoch": 0.53, + "learning_rate": 1.8895497869672753e-06, + "loss": 0.6235, + "step": 20658 + }, + { + "epoch": 0.53, + "learning_rate": 1.8895371457053057e-06, + "loss": 1.1338, + "step": 20659 + }, + { + "epoch": 0.53, + "learning_rate": 1.8895245037622588e-06, + "loss": 0.8809, + "step": 20660 + }, + { + "epoch": 0.53, + "learning_rate": 1.8895118611381439e-06, + "loss": 0.4785, + "step": 20661 + }, + { + "epoch": 0.53, + "learning_rate": 1.8894992178329708e-06, + "loss": 1.0625, + "step": 20662 + }, + { + "epoch": 0.53, + "learning_rate": 1.889486573846749e-06, + "loss": 0.4858, + "step": 20663 + }, + { + "epoch": 0.53, + "learning_rate": 1.8894739291794878e-06, + "loss": 0.8281, + "step": 20664 + }, + { + "epoch": 0.53, + "learning_rate": 1.8894612838311978e-06, + "loss": 0.7134, + "step": 20665 + }, + { + "epoch": 0.53, + "learning_rate": 1.889448637801888e-06, + "loss": 0.6733, + "step": 20666 + }, + { + "epoch": 0.53, + "learning_rate": 1.889435991091568e-06, + "loss": 0.8213, + "step": 20667 + }, + { + "epoch": 0.53, + "learning_rate": 1.8894233437002482e-06, + "loss": 0.6479, + "step": 20668 + }, + { + "epoch": 0.53, + "learning_rate": 1.8894106956279377e-06, + "loss": 0.8701, + "step": 20669 + }, + { + "epoch": 0.53, + "learning_rate": 1.8893980468746462e-06, + "loss": 0.875, + "step": 20670 + }, + { + "epoch": 0.53, + "learning_rate": 1.8893853974403838e-06, + "loss": 0.7949, + "step": 20671 + }, + { + "epoch": 0.53, + "learning_rate": 1.8893727473251596e-06, + "loss": 1.0381, + "step": 20672 + }, + { + "epoch": 0.53, + "learning_rate": 1.8893600965289837e-06, + "loss": 1.0645, + "step": 20673 + }, + { + "epoch": 0.53, + "learning_rate": 1.8893474450518658e-06, + "loss": 0.9033, + "step": 20674 + }, + { + "epoch": 0.53, + "learning_rate": 1.8893347928938153e-06, + "loss": 0.8525, + "step": 20675 + }, + { + "epoch": 0.53, + "learning_rate": 1.889322140054842e-06, + "loss": 0.9609, + "step": 20676 + }, + { + "epoch": 0.53, + "learning_rate": 1.8893094865349557e-06, + "loss": 0.9961, + "step": 20677 + }, + { + "epoch": 0.53, + "learning_rate": 1.8892968323341657e-06, + "loss": 0.874, + "step": 20678 + }, + { + "epoch": 0.53, + "learning_rate": 1.8892841774524824e-06, + "loss": 0.9131, + "step": 20679 + }, + { + "epoch": 0.53, + "learning_rate": 1.889271521889915e-06, + "loss": 1.1064, + "step": 20680 + }, + { + "epoch": 0.53, + "learning_rate": 1.8892588656464734e-06, + "loss": 0.6509, + "step": 20681 + }, + { + "epoch": 0.53, + "learning_rate": 1.889246208722167e-06, + "loss": 0.9893, + "step": 20682 + }, + { + "epoch": 0.53, + "learning_rate": 1.8892335511170058e-06, + "loss": 0.7959, + "step": 20683 + }, + { + "epoch": 0.53, + "learning_rate": 1.889220892830999e-06, + "loss": 0.835, + "step": 20684 + }, + { + "epoch": 0.53, + "learning_rate": 1.8892082338641574e-06, + "loss": 1.0527, + "step": 20685 + }, + { + "epoch": 0.53, + "learning_rate": 1.8891955742164894e-06, + "loss": 0.7959, + "step": 20686 + }, + { + "epoch": 0.53, + "learning_rate": 1.8891829138880054e-06, + "loss": 0.79, + "step": 20687 + }, + { + "epoch": 0.53, + "learning_rate": 1.8891702528787149e-06, + "loss": 0.9648, + "step": 20688 + }, + { + "epoch": 0.53, + "learning_rate": 1.8891575911886273e-06, + "loss": 1.04, + "step": 20689 + }, + { + "epoch": 0.53, + "learning_rate": 1.8891449288177531e-06, + "loss": 0.9453, + "step": 20690 + }, + { + "epoch": 0.53, + "learning_rate": 1.8891322657661012e-06, + "loss": 0.9404, + "step": 20691 + }, + { + "epoch": 0.53, + "learning_rate": 1.8891196020336816e-06, + "loss": 0.8516, + "step": 20692 + }, + { + "epoch": 0.53, + "learning_rate": 1.8891069376205043e-06, + "loss": 0.8716, + "step": 20693 + }, + { + "epoch": 0.53, + "learning_rate": 1.8890942725265784e-06, + "loss": 0.8252, + "step": 20694 + }, + { + "epoch": 0.53, + "learning_rate": 1.889081606751914e-06, + "loss": 0.8228, + "step": 20695 + }, + { + "epoch": 0.53, + "learning_rate": 1.8890689402965209e-06, + "loss": 0.9727, + "step": 20696 + }, + { + "epoch": 0.53, + "learning_rate": 1.889056273160408e-06, + "loss": 0.9756, + "step": 20697 + }, + { + "epoch": 0.53, + "learning_rate": 1.8890436053435863e-06, + "loss": 0.8428, + "step": 20698 + }, + { + "epoch": 0.53, + "learning_rate": 1.8890309368460644e-06, + "loss": 0.8857, + "step": 20699 + }, + { + "epoch": 0.53, + "learning_rate": 1.8890182676678524e-06, + "loss": 0.9385, + "step": 20700 + }, + { + "epoch": 0.53, + "learning_rate": 1.88900559780896e-06, + "loss": 1.084, + "step": 20701 + }, + { + "epoch": 0.53, + "learning_rate": 1.8889929272693972e-06, + "loss": 0.6943, + "step": 20702 + }, + { + "epoch": 0.53, + "learning_rate": 1.888980256049173e-06, + "loss": 0.8115, + "step": 20703 + }, + { + "epoch": 0.53, + "learning_rate": 1.8889675841482977e-06, + "loss": 0.7305, + "step": 20704 + }, + { + "epoch": 0.53, + "learning_rate": 1.8889549115667807e-06, + "loss": 0.8496, + "step": 20705 + }, + { + "epoch": 0.53, + "learning_rate": 1.8889422383046317e-06, + "loss": 1.0195, + "step": 20706 + }, + { + "epoch": 0.53, + "learning_rate": 1.8889295643618609e-06, + "loss": 0.9189, + "step": 20707 + }, + { + "epoch": 0.53, + "learning_rate": 1.888916889738477e-06, + "loss": 0.8574, + "step": 20708 + }, + { + "epoch": 0.53, + "learning_rate": 1.888904214434491e-06, + "loss": 0.7896, + "step": 20709 + }, + { + "epoch": 0.53, + "learning_rate": 1.8888915384499113e-06, + "loss": 0.8423, + "step": 20710 + }, + { + "epoch": 0.53, + "learning_rate": 1.8888788617847484e-06, + "loss": 0.9521, + "step": 20711 + }, + { + "epoch": 0.53, + "learning_rate": 1.888866184439012e-06, + "loss": 0.8877, + "step": 20712 + }, + { + "epoch": 0.53, + "learning_rate": 1.8888535064127119e-06, + "loss": 0.832, + "step": 20713 + }, + { + "epoch": 0.53, + "learning_rate": 1.888840827705857e-06, + "loss": 0.8926, + "step": 20714 + }, + { + "epoch": 0.53, + "learning_rate": 1.8888281483184576e-06, + "loss": 0.9443, + "step": 20715 + }, + { + "epoch": 0.53, + "learning_rate": 1.8888154682505238e-06, + "loss": 0.8633, + "step": 20716 + }, + { + "epoch": 0.53, + "learning_rate": 1.8888027875020645e-06, + "loss": 0.822, + "step": 20717 + }, + { + "epoch": 0.53, + "learning_rate": 1.8887901060730898e-06, + "loss": 1.0078, + "step": 20718 + }, + { + "epoch": 0.53, + "learning_rate": 1.8887774239636092e-06, + "loss": 0.8711, + "step": 20719 + }, + { + "epoch": 0.53, + "learning_rate": 1.888764741173633e-06, + "loss": 0.9727, + "step": 20720 + }, + { + "epoch": 0.53, + "learning_rate": 1.8887520577031704e-06, + "loss": 0.9121, + "step": 20721 + }, + { + "epoch": 0.53, + "learning_rate": 1.888739373552231e-06, + "loss": 0.8403, + "step": 20722 + }, + { + "epoch": 0.53, + "learning_rate": 1.8887266887208249e-06, + "loss": 0.9785, + "step": 20723 + }, + { + "epoch": 0.53, + "learning_rate": 1.8887140032089614e-06, + "loss": 0.959, + "step": 20724 + }, + { + "epoch": 0.53, + "learning_rate": 1.8887013170166508e-06, + "loss": 1.1475, + "step": 20725 + }, + { + "epoch": 0.53, + "learning_rate": 1.8886886301439023e-06, + "loss": 0.7412, + "step": 20726 + }, + { + "epoch": 0.53, + "learning_rate": 1.8886759425907256e-06, + "loss": 1.0068, + "step": 20727 + }, + { + "epoch": 0.53, + "learning_rate": 1.888663254357131e-06, + "loss": 0.8955, + "step": 20728 + }, + { + "epoch": 0.53, + "learning_rate": 1.8886505654431276e-06, + "loss": 0.7101, + "step": 20729 + }, + { + "epoch": 0.53, + "learning_rate": 1.8886378758487252e-06, + "loss": 0.8877, + "step": 20730 + }, + { + "epoch": 0.53, + "learning_rate": 1.8886251855739336e-06, + "loss": 0.6079, + "step": 20731 + }, + { + "epoch": 0.53, + "learning_rate": 1.8886124946187629e-06, + "loss": 0.9092, + "step": 20732 + }, + { + "epoch": 0.53, + "learning_rate": 1.8885998029832222e-06, + "loss": 0.9424, + "step": 20733 + }, + { + "epoch": 0.53, + "learning_rate": 1.8885871106673216e-06, + "loss": 0.9785, + "step": 20734 + }, + { + "epoch": 0.53, + "learning_rate": 1.8885744176710708e-06, + "loss": 0.9854, + "step": 20735 + }, + { + "epoch": 0.53, + "learning_rate": 1.8885617239944793e-06, + "loss": 0.9678, + "step": 20736 + }, + { + "epoch": 0.53, + "learning_rate": 1.8885490296375571e-06, + "loss": 0.8984, + "step": 20737 + }, + { + "epoch": 0.53, + "learning_rate": 1.8885363346003133e-06, + "loss": 0.6499, + "step": 20738 + }, + { + "epoch": 0.53, + "learning_rate": 1.8885236388827587e-06, + "loss": 0.7158, + "step": 20739 + }, + { + "epoch": 0.53, + "learning_rate": 1.888510942484902e-06, + "loss": 0.8452, + "step": 20740 + }, + { + "epoch": 0.53, + "learning_rate": 1.8884982454067534e-06, + "loss": 0.8237, + "step": 20741 + }, + { + "epoch": 0.53, + "learning_rate": 1.8884855476483226e-06, + "loss": 1.1162, + "step": 20742 + }, + { + "epoch": 0.53, + "learning_rate": 1.8884728492096191e-06, + "loss": 0.998, + "step": 20743 + }, + { + "epoch": 0.53, + "learning_rate": 1.888460150090653e-06, + "loss": 0.9697, + "step": 20744 + }, + { + "epoch": 0.53, + "learning_rate": 1.8884474502914337e-06, + "loss": 0.9043, + "step": 20745 + }, + { + "epoch": 0.53, + "learning_rate": 1.8884347498119712e-06, + "loss": 1.0244, + "step": 20746 + }, + { + "epoch": 0.53, + "learning_rate": 1.8884220486522748e-06, + "loss": 0.8594, + "step": 20747 + }, + { + "epoch": 0.53, + "learning_rate": 1.888409346812355e-06, + "loss": 0.8867, + "step": 20748 + }, + { + "epoch": 0.53, + "learning_rate": 1.8883966442922205e-06, + "loss": 0.7334, + "step": 20749 + }, + { + "epoch": 0.53, + "learning_rate": 1.8883839410918818e-06, + "loss": 0.8232, + "step": 20750 + }, + { + "epoch": 0.53, + "learning_rate": 1.888371237211348e-06, + "loss": 0.6279, + "step": 20751 + }, + { + "epoch": 0.53, + "learning_rate": 1.8883585326506294e-06, + "loss": 0.7246, + "step": 20752 + }, + { + "epoch": 0.53, + "learning_rate": 1.888345827409736e-06, + "loss": 0.8428, + "step": 20753 + }, + { + "epoch": 0.53, + "learning_rate": 1.8883331214886764e-06, + "loss": 1.0576, + "step": 20754 + }, + { + "epoch": 0.53, + "learning_rate": 1.8883204148874613e-06, + "loss": 0.9102, + "step": 20755 + }, + { + "epoch": 0.53, + "learning_rate": 1.8883077076061e-06, + "loss": 0.7744, + "step": 20756 + }, + { + "epoch": 0.53, + "learning_rate": 1.8882949996446022e-06, + "loss": 0.6914, + "step": 20757 + }, + { + "epoch": 0.53, + "learning_rate": 1.8882822910029778e-06, + "loss": 0.7539, + "step": 20758 + }, + { + "epoch": 0.53, + "learning_rate": 1.8882695816812367e-06, + "loss": 0.9307, + "step": 20759 + }, + { + "epoch": 0.53, + "learning_rate": 1.8882568716793883e-06, + "loss": 0.8682, + "step": 20760 + }, + { + "epoch": 0.53, + "learning_rate": 1.8882441609974426e-06, + "loss": 0.8105, + "step": 20761 + }, + { + "epoch": 0.53, + "learning_rate": 1.888231449635409e-06, + "loss": 0.7563, + "step": 20762 + }, + { + "epoch": 0.53, + "learning_rate": 1.8882187375932977e-06, + "loss": 0.5674, + "step": 20763 + }, + { + "epoch": 0.53, + "learning_rate": 1.8882060248711177e-06, + "loss": 0.7832, + "step": 20764 + }, + { + "epoch": 0.53, + "learning_rate": 1.8881933114688795e-06, + "loss": 0.8486, + "step": 20765 + }, + { + "epoch": 0.53, + "learning_rate": 1.8881805973865926e-06, + "loss": 0.7026, + "step": 20766 + }, + { + "epoch": 0.53, + "learning_rate": 1.8881678826242664e-06, + "loss": 0.7117, + "step": 20767 + }, + { + "epoch": 0.53, + "learning_rate": 1.8881551671819112e-06, + "loss": 0.7461, + "step": 20768 + }, + { + "epoch": 0.53, + "learning_rate": 1.8881424510595362e-06, + "loss": 0.8701, + "step": 20769 + }, + { + "epoch": 0.53, + "learning_rate": 1.8881297342571512e-06, + "loss": 0.9795, + "step": 20770 + }, + { + "epoch": 0.53, + "learning_rate": 1.8881170167747663e-06, + "loss": 0.7715, + "step": 20771 + }, + { + "epoch": 0.53, + "learning_rate": 1.888104298612391e-06, + "loss": 0.8379, + "step": 20772 + }, + { + "epoch": 0.53, + "learning_rate": 1.8880915797700351e-06, + "loss": 0.9248, + "step": 20773 + }, + { + "epoch": 0.53, + "learning_rate": 1.8880788602477082e-06, + "loss": 1.0547, + "step": 20774 + }, + { + "epoch": 0.53, + "learning_rate": 1.8880661400454204e-06, + "loss": 1.0127, + "step": 20775 + }, + { + "epoch": 0.53, + "learning_rate": 1.8880534191631812e-06, + "loss": 0.8228, + "step": 20776 + }, + { + "epoch": 0.53, + "learning_rate": 1.888040697601e-06, + "loss": 0.749, + "step": 20777 + }, + { + "epoch": 0.53, + "learning_rate": 1.8880279753588871e-06, + "loss": 0.8857, + "step": 20778 + }, + { + "epoch": 0.53, + "learning_rate": 1.888015252436852e-06, + "loss": 0.9258, + "step": 20779 + }, + { + "epoch": 0.53, + "learning_rate": 1.8880025288349043e-06, + "loss": 0.8555, + "step": 20780 + }, + { + "epoch": 0.53, + "learning_rate": 1.8879898045530541e-06, + "loss": 0.9346, + "step": 20781 + }, + { + "epoch": 0.53, + "learning_rate": 1.8879770795913109e-06, + "loss": 1.0801, + "step": 20782 + }, + { + "epoch": 0.53, + "learning_rate": 1.8879643539496844e-06, + "loss": 0.876, + "step": 20783 + }, + { + "epoch": 0.53, + "learning_rate": 1.8879516276281846e-06, + "loss": 0.8535, + "step": 20784 + }, + { + "epoch": 0.53, + "learning_rate": 1.8879389006268207e-06, + "loss": 0.7334, + "step": 20785 + }, + { + "epoch": 0.53, + "learning_rate": 1.887926172945603e-06, + "loss": 0.7646, + "step": 20786 + }, + { + "epoch": 0.53, + "learning_rate": 1.8879134445845413e-06, + "loss": 0.708, + "step": 20787 + }, + { + "epoch": 0.53, + "learning_rate": 1.887900715543645e-06, + "loss": 0.6958, + "step": 20788 + }, + { + "epoch": 0.53, + "learning_rate": 1.8878879858229237e-06, + "loss": 0.8125, + "step": 20789 + }, + { + "epoch": 0.53, + "learning_rate": 1.8878752554223875e-06, + "loss": 1.1426, + "step": 20790 + }, + { + "epoch": 0.53, + "learning_rate": 1.887862524342046e-06, + "loss": 0.9355, + "step": 20791 + }, + { + "epoch": 0.53, + "learning_rate": 1.887849792581909e-06, + "loss": 0.8887, + "step": 20792 + }, + { + "epoch": 0.53, + "learning_rate": 1.8878370601419866e-06, + "loss": 0.6104, + "step": 20793 + }, + { + "epoch": 0.53, + "learning_rate": 1.8878243270222878e-06, + "loss": 0.8994, + "step": 20794 + }, + { + "epoch": 0.53, + "learning_rate": 1.887811593222823e-06, + "loss": 0.8315, + "step": 20795 + }, + { + "epoch": 0.53, + "learning_rate": 1.8877988587436014e-06, + "loss": 0.5879, + "step": 20796 + }, + { + "epoch": 0.53, + "learning_rate": 1.887786123584633e-06, + "loss": 0.9678, + "step": 20797 + }, + { + "epoch": 0.53, + "learning_rate": 1.8877733877459278e-06, + "loss": 0.9604, + "step": 20798 + }, + { + "epoch": 0.53, + "learning_rate": 1.8877606512274955e-06, + "loss": 0.7473, + "step": 20799 + }, + { + "epoch": 0.53, + "learning_rate": 1.8877479140293454e-06, + "loss": 1.0176, + "step": 20800 + }, + { + "epoch": 0.53, + "learning_rate": 1.8877351761514875e-06, + "loss": 0.8623, + "step": 20801 + }, + { + "epoch": 0.53, + "learning_rate": 1.8877224375939318e-06, + "loss": 1.1006, + "step": 20802 + }, + { + "epoch": 0.53, + "learning_rate": 1.8877096983566877e-06, + "loss": 0.8208, + "step": 20803 + }, + { + "epoch": 0.53, + "learning_rate": 1.8876969584397652e-06, + "loss": 0.7671, + "step": 20804 + }, + { + "epoch": 0.53, + "learning_rate": 1.8876842178431738e-06, + "loss": 1.0713, + "step": 20805 + }, + { + "epoch": 0.53, + "learning_rate": 1.8876714765669236e-06, + "loss": 0.9717, + "step": 20806 + }, + { + "epoch": 0.53, + "learning_rate": 1.887658734611024e-06, + "loss": 0.5967, + "step": 20807 + }, + { + "epoch": 0.53, + "learning_rate": 1.8876459919754853e-06, + "loss": 1.0049, + "step": 20808 + }, + { + "epoch": 0.53, + "learning_rate": 1.8876332486603164e-06, + "loss": 0.7153, + "step": 20809 + }, + { + "epoch": 0.53, + "learning_rate": 1.8876205046655277e-06, + "loss": 0.8628, + "step": 20810 + }, + { + "epoch": 0.53, + "learning_rate": 1.887607759991129e-06, + "loss": 0.9062, + "step": 20811 + }, + { + "epoch": 0.53, + "learning_rate": 1.8875950146371296e-06, + "loss": 0.8125, + "step": 20812 + }, + { + "epoch": 0.53, + "learning_rate": 1.8875822686035393e-06, + "loss": 1.1094, + "step": 20813 + }, + { + "epoch": 0.53, + "learning_rate": 1.8875695218903687e-06, + "loss": 0.9893, + "step": 20814 + }, + { + "epoch": 0.53, + "learning_rate": 1.8875567744976264e-06, + "loss": 0.7197, + "step": 20815 + }, + { + "epoch": 0.53, + "learning_rate": 1.887544026425323e-06, + "loss": 1.1982, + "step": 20816 + }, + { + "epoch": 0.53, + "learning_rate": 1.8875312776734678e-06, + "loss": 0.9961, + "step": 20817 + }, + { + "epoch": 0.53, + "learning_rate": 1.8875185282420706e-06, + "loss": 0.9736, + "step": 20818 + }, + { + "epoch": 0.53, + "learning_rate": 1.8875057781311416e-06, + "loss": 1.001, + "step": 20819 + }, + { + "epoch": 0.53, + "learning_rate": 1.88749302734069e-06, + "loss": 0.6958, + "step": 20820 + }, + { + "epoch": 0.53, + "learning_rate": 1.8874802758707258e-06, + "loss": 0.833, + "step": 20821 + }, + { + "epoch": 0.53, + "learning_rate": 1.8874675237212587e-06, + "loss": 1.0625, + "step": 20822 + }, + { + "epoch": 0.53, + "learning_rate": 1.8874547708922988e-06, + "loss": 0.9385, + "step": 20823 + }, + { + "epoch": 0.53, + "learning_rate": 1.8874420173838552e-06, + "loss": 0.8516, + "step": 20824 + }, + { + "epoch": 0.53, + "learning_rate": 1.8874292631959383e-06, + "loss": 0.5698, + "step": 20825 + }, + { + "epoch": 0.53, + "learning_rate": 1.8874165083285578e-06, + "loss": 0.7705, + "step": 20826 + }, + { + "epoch": 0.53, + "learning_rate": 1.887403752781723e-06, + "loss": 0.9512, + "step": 20827 + }, + { + "epoch": 0.53, + "learning_rate": 1.887390996555444e-06, + "loss": 0.9902, + "step": 20828 + }, + { + "epoch": 0.53, + "learning_rate": 1.8873782396497305e-06, + "loss": 0.8828, + "step": 20829 + }, + { + "epoch": 0.53, + "learning_rate": 1.8873654820645923e-06, + "loss": 0.8975, + "step": 20830 + }, + { + "epoch": 0.53, + "learning_rate": 1.8873527238000392e-06, + "loss": 0.9863, + "step": 20831 + }, + { + "epoch": 0.53, + "learning_rate": 1.8873399648560808e-06, + "loss": 0.8896, + "step": 20832 + }, + { + "epoch": 0.53, + "learning_rate": 1.8873272052327272e-06, + "loss": 0.8652, + "step": 20833 + }, + { + "epoch": 0.53, + "learning_rate": 1.8873144449299878e-06, + "loss": 0.9629, + "step": 20834 + }, + { + "epoch": 0.53, + "learning_rate": 1.8873016839478724e-06, + "loss": 0.8809, + "step": 20835 + }, + { + "epoch": 0.53, + "learning_rate": 1.8872889222863911e-06, + "loss": 0.8379, + "step": 20836 + }, + { + "epoch": 0.53, + "learning_rate": 1.8872761599455536e-06, + "loss": 0.6436, + "step": 20837 + }, + { + "epoch": 0.53, + "learning_rate": 1.8872633969253692e-06, + "loss": 0.7651, + "step": 20838 + }, + { + "epoch": 0.53, + "learning_rate": 1.8872506332258485e-06, + "loss": 0.7939, + "step": 20839 + }, + { + "epoch": 0.53, + "learning_rate": 1.8872378688470004e-06, + "loss": 0.8477, + "step": 20840 + }, + { + "epoch": 0.53, + "learning_rate": 1.8872251037888352e-06, + "loss": 0.6851, + "step": 20841 + }, + { + "epoch": 0.53, + "learning_rate": 1.8872123380513624e-06, + "loss": 1.0781, + "step": 20842 + }, + { + "epoch": 0.53, + "learning_rate": 1.887199571634592e-06, + "loss": 0.9277, + "step": 20843 + }, + { + "epoch": 0.53, + "learning_rate": 1.8871868045385335e-06, + "loss": 1.0449, + "step": 20844 + }, + { + "epoch": 0.53, + "learning_rate": 1.8871740367631972e-06, + "loss": 0.8457, + "step": 20845 + }, + { + "epoch": 0.53, + "learning_rate": 1.8871612683085923e-06, + "loss": 0.7395, + "step": 20846 + }, + { + "epoch": 0.53, + "learning_rate": 1.8871484991747289e-06, + "loss": 0.7156, + "step": 20847 + }, + { + "epoch": 0.53, + "learning_rate": 1.8871357293616166e-06, + "loss": 0.8271, + "step": 20848 + }, + { + "epoch": 0.53, + "learning_rate": 1.8871229588692654e-06, + "loss": 0.9766, + "step": 20849 + }, + { + "epoch": 0.53, + "learning_rate": 1.8871101876976846e-06, + "loss": 1.0391, + "step": 20850 + }, + { + "epoch": 0.53, + "learning_rate": 1.8870974158468847e-06, + "loss": 0.873, + "step": 20851 + }, + { + "epoch": 0.53, + "learning_rate": 1.887084643316875e-06, + "loss": 1.0391, + "step": 20852 + }, + { + "epoch": 0.53, + "learning_rate": 1.8870718701076654e-06, + "loss": 0.8672, + "step": 20853 + }, + { + "epoch": 0.53, + "learning_rate": 1.8870590962192657e-06, + "loss": 0.7539, + "step": 20854 + }, + { + "epoch": 0.53, + "learning_rate": 1.8870463216516854e-06, + "loss": 0.8535, + "step": 20855 + }, + { + "epoch": 0.53, + "learning_rate": 1.8870335464049347e-06, + "loss": 0.9141, + "step": 20856 + }, + { + "epoch": 0.53, + "learning_rate": 1.8870207704790232e-06, + "loss": 0.9092, + "step": 20857 + }, + { + "epoch": 0.53, + "learning_rate": 1.8870079938739605e-06, + "loss": 1.0459, + "step": 20858 + }, + { + "epoch": 0.53, + "learning_rate": 1.886995216589757e-06, + "loss": 0.6069, + "step": 20859 + }, + { + "epoch": 0.53, + "learning_rate": 1.8869824386264214e-06, + "loss": 0.9707, + "step": 20860 + }, + { + "epoch": 0.53, + "learning_rate": 1.8869696599839648e-06, + "loss": 0.7627, + "step": 20861 + }, + { + "epoch": 0.53, + "learning_rate": 1.8869568806623958e-06, + "loss": 0.999, + "step": 20862 + }, + { + "epoch": 0.53, + "learning_rate": 1.886944100661725e-06, + "loss": 0.7314, + "step": 20863 + }, + { + "epoch": 0.53, + "learning_rate": 1.8869313199819618e-06, + "loss": 0.9502, + "step": 20864 + }, + { + "epoch": 0.53, + "learning_rate": 1.8869185386231162e-06, + "loss": 1.0547, + "step": 20865 + }, + { + "epoch": 0.53, + "learning_rate": 1.8869057565851975e-06, + "loss": 0.8374, + "step": 20866 + }, + { + "epoch": 0.53, + "learning_rate": 1.8868929738682163e-06, + "loss": 0.8779, + "step": 20867 + }, + { + "epoch": 0.53, + "learning_rate": 1.8868801904721817e-06, + "loss": 0.8525, + "step": 20868 + }, + { + "epoch": 0.53, + "learning_rate": 1.8868674063971035e-06, + "loss": 0.9761, + "step": 20869 + }, + { + "epoch": 0.53, + "learning_rate": 1.8868546216429922e-06, + "loss": 0.8994, + "step": 20870 + }, + { + "epoch": 0.53, + "learning_rate": 1.8868418362098567e-06, + "loss": 0.9102, + "step": 20871 + }, + { + "epoch": 0.53, + "learning_rate": 1.8868290500977074e-06, + "loss": 0.8252, + "step": 20872 + }, + { + "epoch": 0.53, + "learning_rate": 1.8868162633065536e-06, + "loss": 0.8101, + "step": 20873 + }, + { + "epoch": 0.54, + "learning_rate": 1.8868034758364055e-06, + "loss": 0.834, + "step": 20874 + }, + { + "epoch": 0.54, + "learning_rate": 1.8867906876872729e-06, + "loss": 1.0625, + "step": 20875 + }, + { + "epoch": 0.54, + "learning_rate": 1.8867778988591652e-06, + "loss": 0.7192, + "step": 20876 + }, + { + "epoch": 0.54, + "learning_rate": 1.8867651093520926e-06, + "loss": 0.8521, + "step": 20877 + }, + { + "epoch": 0.54, + "learning_rate": 1.8867523191660646e-06, + "loss": 0.752, + "step": 20878 + }, + { + "epoch": 0.54, + "learning_rate": 1.8867395283010913e-06, + "loss": 0.8291, + "step": 20879 + }, + { + "epoch": 0.54, + "learning_rate": 1.886726736757182e-06, + "loss": 0.876, + "step": 20880 + }, + { + "epoch": 0.54, + "learning_rate": 1.8867139445343474e-06, + "loss": 0.749, + "step": 20881 + }, + { + "epoch": 0.54, + "learning_rate": 1.8867011516325963e-06, + "loss": 0.9424, + "step": 20882 + }, + { + "epoch": 0.54, + "learning_rate": 1.886688358051939e-06, + "loss": 1.0254, + "step": 20883 + }, + { + "epoch": 0.54, + "learning_rate": 1.886675563792385e-06, + "loss": 0.8799, + "step": 20884 + }, + { + "epoch": 0.54, + "learning_rate": 1.8866627688539446e-06, + "loss": 0.5381, + "step": 20885 + }, + { + "epoch": 0.54, + "learning_rate": 1.886649973236627e-06, + "loss": 0.9297, + "step": 20886 + }, + { + "epoch": 0.54, + "learning_rate": 1.8866371769404425e-06, + "loss": 0.9019, + "step": 20887 + }, + { + "epoch": 0.54, + "learning_rate": 1.8866243799654006e-06, + "loss": 0.7104, + "step": 20888 + }, + { + "epoch": 0.54, + "learning_rate": 1.8866115823115111e-06, + "loss": 0.5493, + "step": 20889 + }, + { + "epoch": 0.54, + "learning_rate": 1.8865987839787843e-06, + "loss": 0.6924, + "step": 20890 + }, + { + "epoch": 0.54, + "learning_rate": 1.8865859849672289e-06, + "loss": 1.1152, + "step": 20891 + }, + { + "epoch": 0.54, + "learning_rate": 1.8865731852768558e-06, + "loss": 0.8994, + "step": 20892 + }, + { + "epoch": 0.54, + "learning_rate": 1.8865603849076743e-06, + "loss": 0.9072, + "step": 20893 + }, + { + "epoch": 0.54, + "learning_rate": 1.8865475838596942e-06, + "loss": 0.8682, + "step": 20894 + }, + { + "epoch": 0.54, + "learning_rate": 1.8865347821329255e-06, + "loss": 0.9854, + "step": 20895 + }, + { + "epoch": 0.54, + "learning_rate": 1.886521979727378e-06, + "loss": 0.9375, + "step": 20896 + }, + { + "epoch": 0.54, + "learning_rate": 1.8865091766430612e-06, + "loss": 0.7891, + "step": 20897 + }, + { + "epoch": 0.54, + "learning_rate": 1.886496372879985e-06, + "loss": 0.9434, + "step": 20898 + }, + { + "epoch": 0.54, + "learning_rate": 1.8864835684381595e-06, + "loss": 1.0557, + "step": 20899 + }, + { + "epoch": 0.54, + "learning_rate": 1.886470763317594e-06, + "loss": 0.8408, + "step": 20900 + }, + { + "epoch": 0.54, + "learning_rate": 1.8864579575182987e-06, + "loss": 1.0117, + "step": 20901 + }, + { + "epoch": 0.54, + "learning_rate": 1.8864451510402835e-06, + "loss": 0.8965, + "step": 20902 + }, + { + "epoch": 0.54, + "learning_rate": 1.886432343883558e-06, + "loss": 0.8857, + "step": 20903 + }, + { + "epoch": 0.54, + "learning_rate": 1.8864195360481318e-06, + "loss": 0.8066, + "step": 20904 + }, + { + "epoch": 0.54, + "learning_rate": 1.886406727534015e-06, + "loss": 0.793, + "step": 20905 + }, + { + "epoch": 0.54, + "learning_rate": 1.8863939183412175e-06, + "loss": 0.731, + "step": 20906 + }, + { + "epoch": 0.54, + "learning_rate": 1.8863811084697487e-06, + "loss": 0.9326, + "step": 20907 + }, + { + "epoch": 0.54, + "learning_rate": 1.8863682979196187e-06, + "loss": 0.7109, + "step": 20908 + }, + { + "epoch": 0.54, + "learning_rate": 1.8863554866908373e-06, + "loss": 0.8135, + "step": 20909 + }, + { + "epoch": 0.54, + "learning_rate": 1.8863426747834143e-06, + "loss": 0.9072, + "step": 20910 + }, + { + "epoch": 0.54, + "learning_rate": 1.8863298621973595e-06, + "loss": 0.7339, + "step": 20911 + }, + { + "epoch": 0.54, + "learning_rate": 1.8863170489326824e-06, + "loss": 0.9316, + "step": 20912 + }, + { + "epoch": 0.54, + "learning_rate": 1.8863042349893933e-06, + "loss": 0.9111, + "step": 20913 + }, + { + "epoch": 0.54, + "learning_rate": 1.886291420367502e-06, + "loss": 0.6521, + "step": 20914 + }, + { + "epoch": 0.54, + "learning_rate": 1.8862786050670177e-06, + "loss": 0.874, + "step": 20915 + }, + { + "epoch": 0.54, + "learning_rate": 1.8862657890879508e-06, + "loss": 1.0205, + "step": 20916 + }, + { + "epoch": 0.54, + "learning_rate": 1.886252972430311e-06, + "loss": 0.8506, + "step": 20917 + }, + { + "epoch": 0.54, + "learning_rate": 1.886240155094108e-06, + "loss": 0.7695, + "step": 20918 + }, + { + "epoch": 0.54, + "learning_rate": 1.8862273370793517e-06, + "loss": 0.7549, + "step": 20919 + }, + { + "epoch": 0.54, + "learning_rate": 1.8862145183860518e-06, + "loss": 0.8057, + "step": 20920 + }, + { + "epoch": 0.54, + "learning_rate": 1.8862016990142183e-06, + "loss": 0.7361, + "step": 20921 + }, + { + "epoch": 0.54, + "learning_rate": 1.886188878963861e-06, + "loss": 0.8662, + "step": 20922 + }, + { + "epoch": 0.54, + "learning_rate": 1.8861760582349892e-06, + "loss": 1.0508, + "step": 20923 + }, + { + "epoch": 0.54, + "learning_rate": 1.8861632368276135e-06, + "loss": 0.8721, + "step": 20924 + }, + { + "epoch": 0.54, + "learning_rate": 1.8861504147417433e-06, + "loss": 0.7222, + "step": 20925 + }, + { + "epoch": 0.54, + "learning_rate": 1.8861375919773885e-06, + "loss": 0.7041, + "step": 20926 + }, + { + "epoch": 0.54, + "learning_rate": 1.8861247685345588e-06, + "loss": 0.7861, + "step": 20927 + }, + { + "epoch": 0.54, + "learning_rate": 1.8861119444132641e-06, + "loss": 0.9609, + "step": 20928 + }, + { + "epoch": 0.54, + "learning_rate": 1.8860991196135143e-06, + "loss": 0.9248, + "step": 20929 + }, + { + "epoch": 0.54, + "learning_rate": 1.886086294135319e-06, + "loss": 1.0195, + "step": 20930 + }, + { + "epoch": 0.54, + "learning_rate": 1.8860734679786884e-06, + "loss": 0.821, + "step": 20931 + }, + { + "epoch": 0.54, + "learning_rate": 1.8860606411436319e-06, + "loss": 0.9814, + "step": 20932 + }, + { + "epoch": 0.54, + "learning_rate": 1.8860478136301596e-06, + "loss": 0.8984, + "step": 20933 + }, + { + "epoch": 0.54, + "learning_rate": 1.886034985438281e-06, + "loss": 0.9092, + "step": 20934 + }, + { + "epoch": 0.54, + "learning_rate": 1.8860221565680065e-06, + "loss": 1.0605, + "step": 20935 + }, + { + "epoch": 0.54, + "learning_rate": 1.8860093270193453e-06, + "loss": 0.9316, + "step": 20936 + }, + { + "epoch": 0.54, + "learning_rate": 1.8859964967923079e-06, + "loss": 0.8975, + "step": 20937 + }, + { + "epoch": 0.54, + "learning_rate": 1.8859836658869032e-06, + "loss": 0.8779, + "step": 20938 + }, + { + "epoch": 0.54, + "learning_rate": 1.885970834303142e-06, + "loss": 0.8711, + "step": 20939 + }, + { + "epoch": 0.54, + "learning_rate": 1.8859580020410336e-06, + "loss": 0.9902, + "step": 20940 + }, + { + "epoch": 0.54, + "learning_rate": 1.8859451691005876e-06, + "loss": 0.7231, + "step": 20941 + }, + { + "epoch": 0.54, + "learning_rate": 1.8859323354818145e-06, + "loss": 0.7969, + "step": 20942 + }, + { + "epoch": 0.54, + "learning_rate": 1.8859195011847234e-06, + "loss": 1.0596, + "step": 20943 + }, + { + "epoch": 0.54, + "learning_rate": 1.8859066662093246e-06, + "loss": 0.6553, + "step": 20944 + }, + { + "epoch": 0.54, + "learning_rate": 1.8858938305556279e-06, + "loss": 0.6865, + "step": 20945 + }, + { + "epoch": 0.54, + "learning_rate": 1.8858809942236429e-06, + "loss": 0.7466, + "step": 20946 + }, + { + "epoch": 0.54, + "learning_rate": 1.8858681572133795e-06, + "loss": 0.8486, + "step": 20947 + }, + { + "epoch": 0.54, + "learning_rate": 1.8858553195248477e-06, + "loss": 0.9502, + "step": 20948 + }, + { + "epoch": 0.54, + "learning_rate": 1.885842481158057e-06, + "loss": 0.7354, + "step": 20949 + }, + { + "epoch": 0.54, + "learning_rate": 1.8858296421130179e-06, + "loss": 0.8994, + "step": 20950 + }, + { + "epoch": 0.54, + "learning_rate": 1.8858168023897395e-06, + "loss": 0.8911, + "step": 20951 + }, + { + "epoch": 0.54, + "learning_rate": 1.8858039619882317e-06, + "loss": 1.0059, + "step": 20952 + }, + { + "epoch": 0.54, + "learning_rate": 1.885791120908505e-06, + "loss": 0.9932, + "step": 20953 + }, + { + "epoch": 0.54, + "learning_rate": 1.8857782791505685e-06, + "loss": 0.6992, + "step": 20954 + }, + { + "epoch": 0.54, + "learning_rate": 1.8857654367144323e-06, + "loss": 0.834, + "step": 20955 + }, + { + "epoch": 0.54, + "learning_rate": 1.8857525936001064e-06, + "loss": 0.8926, + "step": 20956 + }, + { + "epoch": 0.54, + "learning_rate": 1.8857397498076003e-06, + "loss": 0.9795, + "step": 20957 + }, + { + "epoch": 0.54, + "learning_rate": 1.885726905336924e-06, + "loss": 0.9648, + "step": 20958 + }, + { + "epoch": 0.54, + "learning_rate": 1.8857140601880875e-06, + "loss": 0.8716, + "step": 20959 + }, + { + "epoch": 0.54, + "learning_rate": 1.8857012143611003e-06, + "loss": 0.9121, + "step": 20960 + }, + { + "epoch": 0.54, + "learning_rate": 1.8856883678559724e-06, + "loss": 0.835, + "step": 20961 + }, + { + "epoch": 0.54, + "learning_rate": 1.8856755206727137e-06, + "loss": 0.7031, + "step": 20962 + }, + { + "epoch": 0.54, + "learning_rate": 1.8856626728113338e-06, + "loss": 0.7812, + "step": 20963 + }, + { + "epoch": 0.54, + "learning_rate": 1.885649824271843e-06, + "loss": 0.8354, + "step": 20964 + }, + { + "epoch": 0.54, + "learning_rate": 1.8856369750542507e-06, + "loss": 0.8647, + "step": 20965 + }, + { + "epoch": 0.54, + "learning_rate": 1.8856241251585668e-06, + "loss": 0.7339, + "step": 20966 + }, + { + "epoch": 0.54, + "learning_rate": 1.8856112745848013e-06, + "loss": 1.0273, + "step": 20967 + }, + { + "epoch": 0.54, + "learning_rate": 1.885598423332964e-06, + "loss": 0.7178, + "step": 20968 + }, + { + "epoch": 0.54, + "learning_rate": 1.885585571403065e-06, + "loss": 0.9648, + "step": 20969 + }, + { + "epoch": 0.54, + "learning_rate": 1.8855727187951134e-06, + "loss": 0.9473, + "step": 20970 + }, + { + "epoch": 0.54, + "learning_rate": 1.8855598655091195e-06, + "loss": 0.9619, + "step": 20971 + }, + { + "epoch": 0.54, + "learning_rate": 1.8855470115450936e-06, + "loss": 1.0039, + "step": 20972 + }, + { + "epoch": 0.54, + "learning_rate": 1.8855341569030445e-06, + "loss": 0.6333, + "step": 20973 + }, + { + "epoch": 0.54, + "learning_rate": 1.885521301582983e-06, + "loss": 0.6953, + "step": 20974 + }, + { + "epoch": 0.54, + "learning_rate": 1.8855084455849184e-06, + "loss": 0.9697, + "step": 20975 + }, + { + "epoch": 0.54, + "learning_rate": 1.885495588908861e-06, + "loss": 0.9834, + "step": 20976 + }, + { + "epoch": 0.54, + "learning_rate": 1.8854827315548198e-06, + "loss": 0.9941, + "step": 20977 + }, + { + "epoch": 0.54, + "learning_rate": 1.8854698735228055e-06, + "loss": 0.9658, + "step": 20978 + }, + { + "epoch": 0.54, + "learning_rate": 1.8854570148128276e-06, + "loss": 0.8379, + "step": 20979 + }, + { + "epoch": 0.54, + "learning_rate": 1.885444155424896e-06, + "loss": 0.7451, + "step": 20980 + }, + { + "epoch": 0.54, + "learning_rate": 1.8854312953590203e-06, + "loss": 0.7695, + "step": 20981 + }, + { + "epoch": 0.54, + "learning_rate": 1.885418434615211e-06, + "loss": 0.7461, + "step": 20982 + }, + { + "epoch": 0.54, + "learning_rate": 1.8854055731934773e-06, + "loss": 0.646, + "step": 20983 + }, + { + "epoch": 0.54, + "learning_rate": 1.8853927110938293e-06, + "loss": 0.9634, + "step": 20984 + }, + { + "epoch": 0.54, + "learning_rate": 1.8853798483162765e-06, + "loss": 0.9121, + "step": 20985 + }, + { + "epoch": 0.54, + "learning_rate": 1.8853669848608295e-06, + "loss": 0.8389, + "step": 20986 + }, + { + "epoch": 0.54, + "learning_rate": 1.8853541207274977e-06, + "loss": 0.8047, + "step": 20987 + }, + { + "epoch": 0.54, + "learning_rate": 1.8853412559162906e-06, + "loss": 0.8818, + "step": 20988 + }, + { + "epoch": 0.54, + "learning_rate": 1.885328390427219e-06, + "loss": 1.0039, + "step": 20989 + }, + { + "epoch": 0.54, + "learning_rate": 1.8853155242602915e-06, + "loss": 0.9629, + "step": 20990 + }, + { + "epoch": 0.54, + "learning_rate": 1.8853026574155186e-06, + "loss": 0.5752, + "step": 20991 + }, + { + "epoch": 0.54, + "learning_rate": 1.8852897898929107e-06, + "loss": 0.9053, + "step": 20992 + }, + { + "epoch": 0.54, + "learning_rate": 1.8852769216924768e-06, + "loss": 1.2109, + "step": 20993 + }, + { + "epoch": 0.54, + "learning_rate": 1.885264052814227e-06, + "loss": 0.9307, + "step": 20994 + }, + { + "epoch": 0.54, + "learning_rate": 1.8852511832581714e-06, + "loss": 1.0078, + "step": 20995 + }, + { + "epoch": 0.54, + "learning_rate": 1.8852383130243197e-06, + "loss": 0.8494, + "step": 20996 + }, + { + "epoch": 0.54, + "learning_rate": 1.8852254421126816e-06, + "loss": 0.6162, + "step": 20997 + }, + { + "epoch": 0.54, + "learning_rate": 1.8852125705232671e-06, + "loss": 0.9805, + "step": 20998 + }, + { + "epoch": 0.54, + "learning_rate": 1.885199698256086e-06, + "loss": 0.7529, + "step": 20999 + }, + { + "epoch": 0.54, + "learning_rate": 1.8851868253111482e-06, + "loss": 0.707, + "step": 21000 + }, + { + "epoch": 0.54, + "learning_rate": 1.885173951688464e-06, + "loss": 0.811, + "step": 21001 + }, + { + "epoch": 0.54, + "learning_rate": 1.8851610773880422e-06, + "loss": 0.8701, + "step": 21002 + }, + { + "epoch": 0.54, + "learning_rate": 1.8851482024098935e-06, + "loss": 0.8428, + "step": 21003 + }, + { + "epoch": 0.54, + "learning_rate": 1.8851353267540272e-06, + "loss": 0.7598, + "step": 21004 + }, + { + "epoch": 0.54, + "learning_rate": 1.8851224504204541e-06, + "loss": 0.8232, + "step": 21005 + }, + { + "epoch": 0.54, + "learning_rate": 1.885109573409183e-06, + "loss": 0.9072, + "step": 21006 + }, + { + "epoch": 0.54, + "learning_rate": 1.8850966957202244e-06, + "loss": 0.5154, + "step": 21007 + }, + { + "epoch": 0.54, + "learning_rate": 1.885083817353588e-06, + "loss": 0.8423, + "step": 21008 + }, + { + "epoch": 0.54, + "learning_rate": 1.8850709383092833e-06, + "loss": 0.9116, + "step": 21009 + }, + { + "epoch": 0.54, + "learning_rate": 1.8850580585873206e-06, + "loss": 0.8267, + "step": 21010 + }, + { + "epoch": 0.54, + "learning_rate": 1.8850451781877096e-06, + "loss": 0.8984, + "step": 21011 + }, + { + "epoch": 0.54, + "learning_rate": 1.8850322971104604e-06, + "loss": 1.0732, + "step": 21012 + }, + { + "epoch": 0.54, + "learning_rate": 1.8850194153555827e-06, + "loss": 0.8545, + "step": 21013 + }, + { + "epoch": 0.54, + "learning_rate": 1.8850065329230863e-06, + "loss": 0.79, + "step": 21014 + }, + { + "epoch": 0.54, + "learning_rate": 1.8849936498129808e-06, + "loss": 0.639, + "step": 21015 + }, + { + "epoch": 0.54, + "learning_rate": 1.8849807660252766e-06, + "loss": 0.8677, + "step": 21016 + }, + { + "epoch": 0.54, + "learning_rate": 1.8849678815599834e-06, + "loss": 0.6743, + "step": 21017 + }, + { + "epoch": 0.54, + "learning_rate": 1.884954996417111e-06, + "loss": 0.8779, + "step": 21018 + }, + { + "epoch": 0.54, + "learning_rate": 1.8849421105966689e-06, + "loss": 0.832, + "step": 21019 + }, + { + "epoch": 0.54, + "learning_rate": 1.8849292240986676e-06, + "loss": 0.9395, + "step": 21020 + }, + { + "epoch": 0.54, + "learning_rate": 1.8849163369231165e-06, + "loss": 0.9902, + "step": 21021 + }, + { + "epoch": 0.54, + "learning_rate": 1.884903449070026e-06, + "loss": 1.0234, + "step": 21022 + }, + { + "epoch": 0.54, + "learning_rate": 1.8848905605394052e-06, + "loss": 1.0732, + "step": 21023 + }, + { + "epoch": 0.54, + "learning_rate": 1.8848776713312646e-06, + "loss": 0.7969, + "step": 21024 + }, + { + "epoch": 0.54, + "learning_rate": 1.8848647814456139e-06, + "loss": 0.9258, + "step": 21025 + }, + { + "epoch": 0.54, + "learning_rate": 1.8848518908824626e-06, + "loss": 0.8838, + "step": 21026 + }, + { + "epoch": 0.54, + "learning_rate": 1.8848389996418213e-06, + "loss": 0.8394, + "step": 21027 + }, + { + "epoch": 0.54, + "learning_rate": 1.8848261077236993e-06, + "loss": 0.8623, + "step": 21028 + }, + { + "epoch": 0.54, + "learning_rate": 1.8848132151281067e-06, + "loss": 0.8896, + "step": 21029 + }, + { + "epoch": 0.54, + "learning_rate": 1.8848003218550532e-06, + "loss": 0.8027, + "step": 21030 + }, + { + "epoch": 0.54, + "learning_rate": 1.8847874279045488e-06, + "loss": 0.7314, + "step": 21031 + }, + { + "epoch": 0.54, + "learning_rate": 1.8847745332766035e-06, + "loss": 0.8301, + "step": 21032 + }, + { + "epoch": 0.54, + "learning_rate": 1.8847616379712268e-06, + "loss": 1.0654, + "step": 21033 + }, + { + "epoch": 0.54, + "learning_rate": 1.884748741988429e-06, + "loss": 1.0508, + "step": 21034 + }, + { + "epoch": 0.54, + "learning_rate": 1.8847358453282194e-06, + "loss": 0.7295, + "step": 21035 + }, + { + "epoch": 0.54, + "learning_rate": 1.8847229479906087e-06, + "loss": 0.9854, + "step": 21036 + }, + { + "epoch": 0.54, + "learning_rate": 1.8847100499756058e-06, + "loss": 0.7236, + "step": 21037 + }, + { + "epoch": 0.54, + "learning_rate": 1.8846971512832214e-06, + "loss": 0.752, + "step": 21038 + }, + { + "epoch": 0.54, + "learning_rate": 1.8846842519134654e-06, + "loss": 0.7656, + "step": 21039 + }, + { + "epoch": 0.54, + "learning_rate": 1.884671351866347e-06, + "loss": 0.8447, + "step": 21040 + }, + { + "epoch": 0.54, + "learning_rate": 1.8846584511418764e-06, + "loss": 1.0801, + "step": 21041 + }, + { + "epoch": 0.54, + "learning_rate": 1.8846455497400636e-06, + "loss": 1.2051, + "step": 21042 + }, + { + "epoch": 0.54, + "learning_rate": 1.8846326476609185e-06, + "loss": 0.9849, + "step": 21043 + }, + { + "epoch": 0.54, + "learning_rate": 1.8846197449044505e-06, + "loss": 0.9785, + "step": 21044 + }, + { + "epoch": 0.54, + "learning_rate": 1.8846068414706702e-06, + "loss": 0.9131, + "step": 21045 + }, + { + "epoch": 0.54, + "learning_rate": 1.884593937359587e-06, + "loss": 0.7949, + "step": 21046 + }, + { + "epoch": 0.54, + "learning_rate": 1.8845810325712108e-06, + "loss": 0.8076, + "step": 21047 + }, + { + "epoch": 0.54, + "learning_rate": 1.8845681271055516e-06, + "loss": 0.7598, + "step": 21048 + }, + { + "epoch": 0.54, + "learning_rate": 1.8845552209626192e-06, + "loss": 0.7979, + "step": 21049 + }, + { + "epoch": 0.54, + "learning_rate": 1.8845423141424236e-06, + "loss": 0.7935, + "step": 21050 + }, + { + "epoch": 0.54, + "learning_rate": 1.8845294066449746e-06, + "loss": 1.0078, + "step": 21051 + }, + { + "epoch": 0.54, + "learning_rate": 1.884516498470282e-06, + "loss": 0.8643, + "step": 21052 + }, + { + "epoch": 0.54, + "learning_rate": 1.8845035896183562e-06, + "loss": 0.7637, + "step": 21053 + }, + { + "epoch": 0.54, + "learning_rate": 1.8844906800892063e-06, + "loss": 0.9092, + "step": 21054 + }, + { + "epoch": 0.54, + "learning_rate": 1.8844777698828426e-06, + "loss": 0.8779, + "step": 21055 + }, + { + "epoch": 0.54, + "learning_rate": 1.8844648589992752e-06, + "loss": 0.9912, + "step": 21056 + }, + { + "epoch": 0.54, + "learning_rate": 1.8844519474385134e-06, + "loss": 0.6749, + "step": 21057 + }, + { + "epoch": 0.54, + "learning_rate": 1.8844390352005676e-06, + "loss": 0.8037, + "step": 21058 + }, + { + "epoch": 0.54, + "learning_rate": 1.8844261222854474e-06, + "loss": 0.8818, + "step": 21059 + }, + { + "epoch": 0.54, + "learning_rate": 1.884413208693163e-06, + "loss": 0.7979, + "step": 21060 + }, + { + "epoch": 0.54, + "learning_rate": 1.884400294423724e-06, + "loss": 0.8359, + "step": 21061 + }, + { + "epoch": 0.54, + "learning_rate": 1.8843873794771402e-06, + "loss": 1.0127, + "step": 21062 + }, + { + "epoch": 0.54, + "learning_rate": 1.8843744638534216e-06, + "loss": 0.7314, + "step": 21063 + }, + { + "epoch": 0.54, + "learning_rate": 1.8843615475525783e-06, + "loss": 0.7178, + "step": 21064 + }, + { + "epoch": 0.54, + "learning_rate": 1.8843486305746199e-06, + "loss": 0.9307, + "step": 21065 + }, + { + "epoch": 0.54, + "learning_rate": 1.8843357129195566e-06, + "loss": 0.9927, + "step": 21066 + }, + { + "epoch": 0.54, + "learning_rate": 1.884322794587398e-06, + "loss": 0.9941, + "step": 21067 + }, + { + "epoch": 0.54, + "learning_rate": 1.8843098755781538e-06, + "loss": 0.9766, + "step": 21068 + }, + { + "epoch": 0.54, + "learning_rate": 1.8842969558918346e-06, + "loss": 0.752, + "step": 21069 + }, + { + "epoch": 0.54, + "learning_rate": 1.88428403552845e-06, + "loss": 0.9131, + "step": 21070 + }, + { + "epoch": 0.54, + "learning_rate": 1.8842711144880093e-06, + "loss": 0.9287, + "step": 21071 + }, + { + "epoch": 0.54, + "learning_rate": 1.8842581927705233e-06, + "loss": 0.9102, + "step": 21072 + }, + { + "epoch": 0.54, + "learning_rate": 1.8842452703760013e-06, + "loss": 0.8438, + "step": 21073 + }, + { + "epoch": 0.54, + "learning_rate": 1.8842323473044533e-06, + "loss": 0.8467, + "step": 21074 + }, + { + "epoch": 0.54, + "learning_rate": 1.8842194235558892e-06, + "loss": 0.918, + "step": 21075 + }, + { + "epoch": 0.54, + "learning_rate": 1.884206499130319e-06, + "loss": 1.0273, + "step": 21076 + }, + { + "epoch": 0.54, + "learning_rate": 1.8841935740277525e-06, + "loss": 0.9189, + "step": 21077 + }, + { + "epoch": 0.54, + "learning_rate": 1.8841806482481997e-06, + "loss": 0.7627, + "step": 21078 + }, + { + "epoch": 0.54, + "learning_rate": 1.8841677217916705e-06, + "loss": 0.7686, + "step": 21079 + }, + { + "epoch": 0.54, + "learning_rate": 1.884154794658175e-06, + "loss": 1.0596, + "step": 21080 + }, + { + "epoch": 0.54, + "learning_rate": 1.884141866847722e-06, + "loss": 0.915, + "step": 21081 + }, + { + "epoch": 0.54, + "learning_rate": 1.884128938360323e-06, + "loss": 1.0566, + "step": 21082 + }, + { + "epoch": 0.54, + "learning_rate": 1.8841160091959867e-06, + "loss": 0.8633, + "step": 21083 + }, + { + "epoch": 0.54, + "learning_rate": 1.8841030793547238e-06, + "loss": 0.8538, + "step": 21084 + }, + { + "epoch": 0.54, + "learning_rate": 1.8840901488365434e-06, + "loss": 0.7842, + "step": 21085 + }, + { + "epoch": 0.54, + "learning_rate": 1.884077217641456e-06, + "loss": 0.9971, + "step": 21086 + }, + { + "epoch": 0.54, + "learning_rate": 1.8840642857694714e-06, + "loss": 0.7026, + "step": 21087 + }, + { + "epoch": 0.54, + "learning_rate": 1.8840513532205993e-06, + "loss": 0.8174, + "step": 21088 + }, + { + "epoch": 0.54, + "learning_rate": 1.8840384199948497e-06, + "loss": 0.876, + "step": 21089 + }, + { + "epoch": 0.54, + "learning_rate": 1.8840254860922328e-06, + "loss": 0.8394, + "step": 21090 + }, + { + "epoch": 0.54, + "learning_rate": 1.8840125515127582e-06, + "loss": 0.9209, + "step": 21091 + }, + { + "epoch": 0.54, + "learning_rate": 1.8839996162564356e-06, + "loss": 0.8555, + "step": 21092 + }, + { + "epoch": 0.54, + "learning_rate": 1.883986680323275e-06, + "loss": 0.7397, + "step": 21093 + }, + { + "epoch": 0.54, + "learning_rate": 1.883973743713287e-06, + "loss": 0.9023, + "step": 21094 + }, + { + "epoch": 0.54, + "learning_rate": 1.8839608064264807e-06, + "loss": 1.1543, + "step": 21095 + }, + { + "epoch": 0.54, + "learning_rate": 1.883947868462866e-06, + "loss": 0.915, + "step": 21096 + }, + { + "epoch": 0.54, + "learning_rate": 1.8839349298224534e-06, + "loss": 0.8193, + "step": 21097 + }, + { + "epoch": 0.54, + "learning_rate": 1.8839219905052524e-06, + "loss": 0.7959, + "step": 21098 + }, + { + "epoch": 0.54, + "learning_rate": 1.883909050511273e-06, + "loss": 0.7815, + "step": 21099 + }, + { + "epoch": 0.54, + "learning_rate": 1.8838961098405246e-06, + "loss": 0.7979, + "step": 21100 + }, + { + "epoch": 0.54, + "learning_rate": 1.883883168493018e-06, + "loss": 0.8965, + "step": 21101 + }, + { + "epoch": 0.54, + "learning_rate": 1.8838702264687627e-06, + "loss": 1.1367, + "step": 21102 + }, + { + "epoch": 0.54, + "learning_rate": 1.8838572837677687e-06, + "loss": 0.9658, + "step": 21103 + }, + { + "epoch": 0.54, + "learning_rate": 1.8838443403900457e-06, + "loss": 0.9531, + "step": 21104 + }, + { + "epoch": 0.54, + "learning_rate": 1.8838313963356036e-06, + "loss": 0.9434, + "step": 21105 + }, + { + "epoch": 0.54, + "learning_rate": 1.8838184516044526e-06, + "loss": 0.8818, + "step": 21106 + }, + { + "epoch": 0.54, + "learning_rate": 1.8838055061966024e-06, + "loss": 1.0, + "step": 21107 + }, + { + "epoch": 0.54, + "learning_rate": 1.883792560112063e-06, + "loss": 0.7998, + "step": 21108 + }, + { + "epoch": 0.54, + "learning_rate": 1.8837796133508444e-06, + "loss": 0.9238, + "step": 21109 + }, + { + "epoch": 0.54, + "learning_rate": 1.8837666659129562e-06, + "loss": 0.7949, + "step": 21110 + }, + { + "epoch": 0.54, + "learning_rate": 1.8837537177984086e-06, + "loss": 0.5693, + "step": 21111 + }, + { + "epoch": 0.54, + "learning_rate": 1.8837407690072113e-06, + "loss": 1.1689, + "step": 21112 + }, + { + "epoch": 0.54, + "learning_rate": 1.8837278195393744e-06, + "loss": 0.8662, + "step": 21113 + }, + { + "epoch": 0.54, + "learning_rate": 1.8837148693949078e-06, + "loss": 0.8623, + "step": 21114 + }, + { + "epoch": 0.54, + "learning_rate": 1.8837019185738212e-06, + "loss": 0.9971, + "step": 21115 + }, + { + "epoch": 0.54, + "learning_rate": 1.8836889670761247e-06, + "loss": 0.7468, + "step": 21116 + }, + { + "epoch": 0.54, + "learning_rate": 1.8836760149018284e-06, + "loss": 0.8843, + "step": 21117 + }, + { + "epoch": 0.54, + "learning_rate": 1.883663062050942e-06, + "loss": 0.8877, + "step": 21118 + }, + { + "epoch": 0.54, + "learning_rate": 1.8836501085234752e-06, + "loss": 0.9521, + "step": 21119 + }, + { + "epoch": 0.54, + "learning_rate": 1.8836371543194383e-06, + "loss": 1.0156, + "step": 21120 + }, + { + "epoch": 0.54, + "learning_rate": 1.8836241994388408e-06, + "loss": 0.636, + "step": 21121 + }, + { + "epoch": 0.54, + "learning_rate": 1.8836112438816932e-06, + "loss": 0.915, + "step": 21122 + }, + { + "epoch": 0.54, + "learning_rate": 1.883598287648005e-06, + "loss": 1.0479, + "step": 21123 + }, + { + "epoch": 0.54, + "learning_rate": 1.883585330737786e-06, + "loss": 0.959, + "step": 21124 + }, + { + "epoch": 0.54, + "learning_rate": 1.8835723731510466e-06, + "loss": 0.7803, + "step": 21125 + }, + { + "epoch": 0.54, + "learning_rate": 1.8835594148877964e-06, + "loss": 0.7927, + "step": 21126 + }, + { + "epoch": 0.54, + "learning_rate": 1.8835464559480453e-06, + "loss": 0.8447, + "step": 21127 + }, + { + "epoch": 0.54, + "learning_rate": 1.8835334963318036e-06, + "loss": 0.9121, + "step": 21128 + }, + { + "epoch": 0.54, + "learning_rate": 1.8835205360390806e-06, + "loss": 0.9932, + "step": 21129 + }, + { + "epoch": 0.54, + "learning_rate": 1.8835075750698867e-06, + "loss": 0.8633, + "step": 21130 + }, + { + "epoch": 0.54, + "learning_rate": 1.8834946134242315e-06, + "loss": 0.76, + "step": 21131 + }, + { + "epoch": 0.54, + "learning_rate": 1.8834816511021254e-06, + "loss": 0.876, + "step": 21132 + }, + { + "epoch": 0.54, + "learning_rate": 1.8834686881035777e-06, + "loss": 1.04, + "step": 21133 + }, + { + "epoch": 0.54, + "learning_rate": 1.8834557244285988e-06, + "loss": 0.7852, + "step": 21134 + }, + { + "epoch": 0.54, + "learning_rate": 1.8834427600771987e-06, + "loss": 1.0117, + "step": 21135 + }, + { + "epoch": 0.54, + "learning_rate": 1.8834297950493867e-06, + "loss": 0.9258, + "step": 21136 + }, + { + "epoch": 0.54, + "learning_rate": 1.8834168293451733e-06, + "loss": 0.8862, + "step": 21137 + }, + { + "epoch": 0.54, + "learning_rate": 1.8834038629645686e-06, + "loss": 0.7856, + "step": 21138 + }, + { + "epoch": 0.54, + "learning_rate": 1.8833908959075818e-06, + "loss": 0.8267, + "step": 21139 + }, + { + "epoch": 0.54, + "learning_rate": 1.883377928174223e-06, + "loss": 0.7354, + "step": 21140 + }, + { + "epoch": 0.54, + "learning_rate": 1.8833649597645028e-06, + "loss": 1.1777, + "step": 21141 + }, + { + "epoch": 0.54, + "learning_rate": 1.8833519906784306e-06, + "loss": 0.6221, + "step": 21142 + }, + { + "epoch": 0.54, + "learning_rate": 1.883339020916016e-06, + "loss": 0.9082, + "step": 21143 + }, + { + "epoch": 0.54, + "learning_rate": 1.8833260504772697e-06, + "loss": 0.7354, + "step": 21144 + }, + { + "epoch": 0.54, + "learning_rate": 1.8833130793622012e-06, + "loss": 0.8174, + "step": 21145 + }, + { + "epoch": 0.54, + "learning_rate": 1.8833001075708203e-06, + "loss": 0.7417, + "step": 21146 + }, + { + "epoch": 0.54, + "learning_rate": 1.8832871351031373e-06, + "loss": 0.9922, + "step": 21147 + }, + { + "epoch": 0.54, + "learning_rate": 1.8832741619591621e-06, + "loss": 0.9707, + "step": 21148 + }, + { + "epoch": 0.54, + "learning_rate": 1.8832611881389042e-06, + "loss": 0.8604, + "step": 21149 + }, + { + "epoch": 0.54, + "learning_rate": 1.883248213642374e-06, + "loss": 0.7148, + "step": 21150 + }, + { + "epoch": 0.54, + "learning_rate": 1.883235238469581e-06, + "loss": 0.9443, + "step": 21151 + }, + { + "epoch": 0.54, + "learning_rate": 1.8832222626205358e-06, + "loss": 0.7656, + "step": 21152 + }, + { + "epoch": 0.54, + "learning_rate": 1.8832092860952478e-06, + "loss": 0.9131, + "step": 21153 + }, + { + "epoch": 0.54, + "learning_rate": 1.8831963088937269e-06, + "loss": 0.8398, + "step": 21154 + }, + { + "epoch": 0.54, + "learning_rate": 1.8831833310159833e-06, + "loss": 0.8652, + "step": 21155 + }, + { + "epoch": 0.54, + "learning_rate": 1.8831703524620267e-06, + "loss": 0.7002, + "step": 21156 + }, + { + "epoch": 0.54, + "learning_rate": 1.8831573732318673e-06, + "loss": 0.9932, + "step": 21157 + }, + { + "epoch": 0.54, + "learning_rate": 1.883144393325515e-06, + "loss": 1.0244, + "step": 21158 + }, + { + "epoch": 0.54, + "learning_rate": 1.8831314127429794e-06, + "loss": 0.6333, + "step": 21159 + }, + { + "epoch": 0.54, + "learning_rate": 1.8831184314842708e-06, + "loss": 0.9214, + "step": 21160 + }, + { + "epoch": 0.54, + "learning_rate": 1.883105449549399e-06, + "loss": 0.8398, + "step": 21161 + }, + { + "epoch": 0.54, + "learning_rate": 1.883092466938374e-06, + "loss": 1.001, + "step": 21162 + }, + { + "epoch": 0.54, + "learning_rate": 1.8830794836512055e-06, + "loss": 0.9951, + "step": 21163 + }, + { + "epoch": 0.54, + "learning_rate": 1.883066499687904e-06, + "loss": 0.8315, + "step": 21164 + }, + { + "epoch": 0.54, + "learning_rate": 1.8830535150484787e-06, + "loss": 0.9131, + "step": 21165 + }, + { + "epoch": 0.54, + "learning_rate": 1.8830405297329403e-06, + "loss": 0.9883, + "step": 21166 + }, + { + "epoch": 0.54, + "learning_rate": 1.8830275437412983e-06, + "loss": 0.8174, + "step": 21167 + }, + { + "epoch": 0.54, + "learning_rate": 1.8830145570735625e-06, + "loss": 0.9629, + "step": 21168 + }, + { + "epoch": 0.54, + "learning_rate": 1.8830015697297435e-06, + "loss": 0.8877, + "step": 21169 + }, + { + "epoch": 0.54, + "learning_rate": 1.8829885817098502e-06, + "loss": 0.7832, + "step": 21170 + }, + { + "epoch": 0.54, + "learning_rate": 1.8829755930138936e-06, + "loss": 0.8887, + "step": 21171 + }, + { + "epoch": 0.54, + "learning_rate": 1.882962603641883e-06, + "loss": 0.6777, + "step": 21172 + }, + { + "epoch": 0.54, + "learning_rate": 1.8829496135938286e-06, + "loss": 0.9717, + "step": 21173 + }, + { + "epoch": 0.54, + "learning_rate": 1.88293662286974e-06, + "loss": 0.874, + "step": 21174 + }, + { + "epoch": 0.54, + "learning_rate": 1.882923631469628e-06, + "loss": 0.915, + "step": 21175 + }, + { + "epoch": 0.54, + "learning_rate": 1.8829106393935014e-06, + "loss": 0.8799, + "step": 21176 + }, + { + "epoch": 0.54, + "learning_rate": 1.8828976466413712e-06, + "loss": 0.8906, + "step": 21177 + }, + { + "epoch": 0.54, + "learning_rate": 1.8828846532132464e-06, + "loss": 0.9678, + "step": 21178 + }, + { + "epoch": 0.54, + "learning_rate": 1.8828716591091377e-06, + "loss": 1.0889, + "step": 21179 + }, + { + "epoch": 0.54, + "learning_rate": 1.8828586643290547e-06, + "loss": 0.9092, + "step": 21180 + }, + { + "epoch": 0.54, + "learning_rate": 1.8828456688730075e-06, + "loss": 0.8906, + "step": 21181 + }, + { + "epoch": 0.54, + "learning_rate": 1.8828326727410057e-06, + "loss": 0.8418, + "step": 21182 + }, + { + "epoch": 0.54, + "learning_rate": 1.8828196759330596e-06, + "loss": 0.8037, + "step": 21183 + }, + { + "epoch": 0.54, + "learning_rate": 1.8828066784491793e-06, + "loss": 0.54, + "step": 21184 + }, + { + "epoch": 0.54, + "learning_rate": 1.8827936802893746e-06, + "loss": 0.8574, + "step": 21185 + }, + { + "epoch": 0.54, + "learning_rate": 1.882780681453655e-06, + "loss": 0.9678, + "step": 21186 + }, + { + "epoch": 0.54, + "learning_rate": 1.882767681942031e-06, + "loss": 1.0215, + "step": 21187 + }, + { + "epoch": 0.54, + "learning_rate": 1.8827546817545124e-06, + "loss": 1.0332, + "step": 21188 + }, + { + "epoch": 0.54, + "learning_rate": 1.882741680891109e-06, + "loss": 1.1895, + "step": 21189 + }, + { + "epoch": 0.54, + "learning_rate": 1.8827286793518312e-06, + "loss": 0.9512, + "step": 21190 + }, + { + "epoch": 0.54, + "learning_rate": 1.8827156771366882e-06, + "loss": 0.8838, + "step": 21191 + }, + { + "epoch": 0.54, + "learning_rate": 1.8827026742456907e-06, + "loss": 0.8721, + "step": 21192 + }, + { + "epoch": 0.54, + "learning_rate": 1.8826896706788482e-06, + "loss": 0.8081, + "step": 21193 + }, + { + "epoch": 0.54, + "learning_rate": 1.882676666436171e-06, + "loss": 1.1143, + "step": 21194 + }, + { + "epoch": 0.54, + "learning_rate": 1.8826636615176686e-06, + "loss": 1.0342, + "step": 21195 + }, + { + "epoch": 0.54, + "learning_rate": 1.8826506559233515e-06, + "loss": 0.7495, + "step": 21196 + }, + { + "epoch": 0.54, + "learning_rate": 1.8826376496532293e-06, + "loss": 0.6631, + "step": 21197 + }, + { + "epoch": 0.54, + "learning_rate": 1.882624642707312e-06, + "loss": 0.9023, + "step": 21198 + }, + { + "epoch": 0.54, + "learning_rate": 1.8826116350856094e-06, + "loss": 0.7153, + "step": 21199 + }, + { + "epoch": 0.54, + "learning_rate": 1.8825986267881318e-06, + "loss": 0.8184, + "step": 21200 + }, + { + "epoch": 0.54, + "learning_rate": 1.8825856178148891e-06, + "loss": 0.7197, + "step": 21201 + }, + { + "epoch": 0.54, + "learning_rate": 1.8825726081658911e-06, + "loss": 0.7654, + "step": 21202 + }, + { + "epoch": 0.54, + "learning_rate": 1.8825595978411476e-06, + "loss": 0.9053, + "step": 21203 + }, + { + "epoch": 0.54, + "learning_rate": 1.8825465868406694e-06, + "loss": 0.9375, + "step": 21204 + }, + { + "epoch": 0.54, + "learning_rate": 1.8825335751644653e-06, + "loss": 0.7271, + "step": 21205 + }, + { + "epoch": 0.54, + "learning_rate": 1.8825205628125462e-06, + "loss": 0.8633, + "step": 21206 + }, + { + "epoch": 0.54, + "learning_rate": 1.8825075497849214e-06, + "loss": 0.6221, + "step": 21207 + }, + { + "epoch": 0.54, + "learning_rate": 1.882494536081601e-06, + "loss": 0.9824, + "step": 21208 + }, + { + "epoch": 0.54, + "learning_rate": 1.8824815217025956e-06, + "loss": 1.0039, + "step": 21209 + }, + { + "epoch": 0.54, + "learning_rate": 1.8824685066479144e-06, + "loss": 1.0137, + "step": 21210 + }, + { + "epoch": 0.54, + "learning_rate": 1.8824554909175676e-06, + "loss": 0.8857, + "step": 21211 + }, + { + "epoch": 0.54, + "learning_rate": 1.8824424745115652e-06, + "loss": 0.7197, + "step": 21212 + }, + { + "epoch": 0.54, + "learning_rate": 1.8824294574299175e-06, + "loss": 0.916, + "step": 21213 + }, + { + "epoch": 0.54, + "learning_rate": 1.882416439672634e-06, + "loss": 0.9736, + "step": 21214 + }, + { + "epoch": 0.54, + "learning_rate": 1.8824034212397245e-06, + "loss": 0.7915, + "step": 21215 + }, + { + "epoch": 0.54, + "learning_rate": 1.8823904021311996e-06, + "loss": 0.8779, + "step": 21216 + }, + { + "epoch": 0.54, + "learning_rate": 1.8823773823470689e-06, + "loss": 0.7332, + "step": 21217 + }, + { + "epoch": 0.54, + "learning_rate": 1.8823643618873422e-06, + "loss": 0.8516, + "step": 21218 + }, + { + "epoch": 0.54, + "learning_rate": 1.88235134075203e-06, + "loss": 0.918, + "step": 21219 + }, + { + "epoch": 0.54, + "learning_rate": 1.8823383189411417e-06, + "loss": 0.7891, + "step": 21220 + }, + { + "epoch": 0.54, + "learning_rate": 1.8823252964546875e-06, + "loss": 1.0625, + "step": 21221 + }, + { + "epoch": 0.54, + "learning_rate": 1.8823122732926775e-06, + "loss": 0.7461, + "step": 21222 + }, + { + "epoch": 0.54, + "learning_rate": 1.8822992494551215e-06, + "loss": 0.7715, + "step": 21223 + }, + { + "epoch": 0.54, + "learning_rate": 1.8822862249420296e-06, + "loss": 0.7295, + "step": 21224 + }, + { + "epoch": 0.54, + "learning_rate": 1.8822731997534115e-06, + "loss": 1.0518, + "step": 21225 + }, + { + "epoch": 0.54, + "learning_rate": 1.8822601738892777e-06, + "loss": 0.8721, + "step": 21226 + }, + { + "epoch": 0.54, + "learning_rate": 1.8822471473496378e-06, + "loss": 0.8906, + "step": 21227 + }, + { + "epoch": 0.54, + "learning_rate": 1.8822341201345015e-06, + "loss": 0.957, + "step": 21228 + }, + { + "epoch": 0.54, + "learning_rate": 1.8822210922438794e-06, + "loss": 1.0156, + "step": 21229 + }, + { + "epoch": 0.54, + "learning_rate": 1.882208063677781e-06, + "loss": 0.7754, + "step": 21230 + }, + { + "epoch": 0.54, + "learning_rate": 1.8821950344362168e-06, + "loss": 0.79, + "step": 21231 + }, + { + "epoch": 0.54, + "learning_rate": 1.8821820045191964e-06, + "loss": 0.9668, + "step": 21232 + }, + { + "epoch": 0.54, + "learning_rate": 1.8821689739267294e-06, + "loss": 0.8369, + "step": 21233 + }, + { + "epoch": 0.54, + "learning_rate": 1.8821559426588265e-06, + "loss": 1.0752, + "step": 21234 + }, + { + "epoch": 0.54, + "learning_rate": 1.8821429107154972e-06, + "loss": 0.9844, + "step": 21235 + }, + { + "epoch": 0.54, + "learning_rate": 1.8821298780967516e-06, + "loss": 0.9678, + "step": 21236 + }, + { + "epoch": 0.54, + "learning_rate": 1.8821168448025998e-06, + "loss": 0.9893, + "step": 21237 + }, + { + "epoch": 0.54, + "learning_rate": 1.8821038108330516e-06, + "loss": 0.6631, + "step": 21238 + }, + { + "epoch": 0.54, + "learning_rate": 1.882090776188117e-06, + "loss": 0.7195, + "step": 21239 + }, + { + "epoch": 0.54, + "learning_rate": 1.8820777408678063e-06, + "loss": 0.8799, + "step": 21240 + }, + { + "epoch": 0.54, + "learning_rate": 1.8820647048721293e-06, + "loss": 0.708, + "step": 21241 + }, + { + "epoch": 0.54, + "learning_rate": 1.8820516682010953e-06, + "loss": 0.7676, + "step": 21242 + }, + { + "epoch": 0.54, + "learning_rate": 1.8820386308547156e-06, + "loss": 1.0459, + "step": 21243 + }, + { + "epoch": 0.54, + "learning_rate": 1.8820255928329991e-06, + "loss": 0.8633, + "step": 21244 + }, + { + "epoch": 0.54, + "learning_rate": 1.8820125541359564e-06, + "loss": 0.71, + "step": 21245 + }, + { + "epoch": 0.54, + "learning_rate": 1.881999514763597e-06, + "loss": 1.041, + "step": 21246 + }, + { + "epoch": 0.54, + "learning_rate": 1.8819864747159313e-06, + "loss": 0.7725, + "step": 21247 + }, + { + "epoch": 0.54, + "learning_rate": 1.8819734339929691e-06, + "loss": 0.8613, + "step": 21248 + }, + { + "epoch": 0.54, + "learning_rate": 1.8819603925947205e-06, + "loss": 0.8301, + "step": 21249 + }, + { + "epoch": 0.54, + "learning_rate": 1.8819473505211952e-06, + "loss": 0.7129, + "step": 21250 + }, + { + "epoch": 0.54, + "learning_rate": 1.8819343077724032e-06, + "loss": 0.9287, + "step": 21251 + }, + { + "epoch": 0.54, + "learning_rate": 1.8819212643483548e-06, + "loss": 0.8062, + "step": 21252 + }, + { + "epoch": 0.54, + "learning_rate": 1.88190822024906e-06, + "loss": 0.8728, + "step": 21253 + }, + { + "epoch": 0.54, + "learning_rate": 1.8818951754745287e-06, + "loss": 0.9238, + "step": 21254 + }, + { + "epoch": 0.54, + "learning_rate": 1.8818821300247705e-06, + "loss": 0.7461, + "step": 21255 + }, + { + "epoch": 0.54, + "learning_rate": 1.881869083899796e-06, + "loss": 0.8564, + "step": 21256 + }, + { + "epoch": 0.54, + "learning_rate": 1.8818560370996147e-06, + "loss": 0.9033, + "step": 21257 + }, + { + "epoch": 0.54, + "learning_rate": 1.8818429896242367e-06, + "loss": 0.8066, + "step": 21258 + }, + { + "epoch": 0.54, + "learning_rate": 1.881829941473672e-06, + "loss": 0.7114, + "step": 21259 + }, + { + "epoch": 0.54, + "learning_rate": 1.881816892647931e-06, + "loss": 0.5854, + "step": 21260 + }, + { + "epoch": 0.54, + "learning_rate": 1.8818038431470233e-06, + "loss": 1.0107, + "step": 21261 + }, + { + "epoch": 0.54, + "learning_rate": 1.8817907929709587e-06, + "loss": 0.7344, + "step": 21262 + }, + { + "epoch": 0.54, + "learning_rate": 1.8817777421197477e-06, + "loss": 0.7275, + "step": 21263 + }, + { + "epoch": 0.55, + "learning_rate": 1.8817646905933997e-06, + "loss": 0.8994, + "step": 21264 + }, + { + "epoch": 0.55, + "learning_rate": 1.8817516383919254e-06, + "loss": 0.8545, + "step": 21265 + }, + { + "epoch": 0.55, + "learning_rate": 1.8817385855153342e-06, + "loss": 0.9424, + "step": 21266 + }, + { + "epoch": 0.55, + "learning_rate": 1.8817255319636364e-06, + "loss": 0.7998, + "step": 21267 + }, + { + "epoch": 0.55, + "learning_rate": 1.8817124777368418e-06, + "loss": 0.9648, + "step": 21268 + }, + { + "epoch": 0.55, + "learning_rate": 1.8816994228349605e-06, + "loss": 0.9688, + "step": 21269 + }, + { + "epoch": 0.55, + "learning_rate": 1.8816863672580025e-06, + "loss": 1.291, + "step": 21270 + }, + { + "epoch": 0.55, + "learning_rate": 1.881673311005978e-06, + "loss": 0.7075, + "step": 21271 + }, + { + "epoch": 0.55, + "learning_rate": 1.8816602540788966e-06, + "loss": 0.9258, + "step": 21272 + }, + { + "epoch": 0.55, + "learning_rate": 1.8816471964767684e-06, + "loss": 0.8896, + "step": 21273 + }, + { + "epoch": 0.55, + "learning_rate": 1.8816341381996036e-06, + "loss": 0.9502, + "step": 21274 + }, + { + "epoch": 0.55, + "learning_rate": 1.881621079247412e-06, + "loss": 0.9492, + "step": 21275 + }, + { + "epoch": 0.55, + "learning_rate": 1.881608019620204e-06, + "loss": 1.0664, + "step": 21276 + }, + { + "epoch": 0.55, + "learning_rate": 1.8815949593179888e-06, + "loss": 0.9248, + "step": 21277 + }, + { + "epoch": 0.55, + "learning_rate": 1.881581898340777e-06, + "loss": 0.8059, + "step": 21278 + }, + { + "epoch": 0.55, + "learning_rate": 1.8815688366885786e-06, + "loss": 0.8496, + "step": 21279 + }, + { + "epoch": 0.55, + "learning_rate": 1.8815557743614035e-06, + "loss": 0.8105, + "step": 21280 + }, + { + "epoch": 0.55, + "learning_rate": 1.8815427113592618e-06, + "loss": 0.7021, + "step": 21281 + }, + { + "epoch": 0.55, + "learning_rate": 1.8815296476821628e-06, + "loss": 0.7588, + "step": 21282 + }, + { + "epoch": 0.55, + "learning_rate": 1.8815165833301178e-06, + "loss": 0.6934, + "step": 21283 + }, + { + "epoch": 0.55, + "learning_rate": 1.881503518303136e-06, + "loss": 0.749, + "step": 21284 + }, + { + "epoch": 0.55, + "learning_rate": 1.881490452601227e-06, + "loss": 0.8242, + "step": 21285 + }, + { + "epoch": 0.55, + "learning_rate": 1.8814773862244015e-06, + "loss": 0.7192, + "step": 21286 + }, + { + "epoch": 0.55, + "learning_rate": 1.8814643191726693e-06, + "loss": 0.8735, + "step": 21287 + }, + { + "epoch": 0.55, + "learning_rate": 1.8814512514460405e-06, + "loss": 1.0781, + "step": 21288 + }, + { + "epoch": 0.55, + "learning_rate": 1.881438183044525e-06, + "loss": 0.7952, + "step": 21289 + }, + { + "epoch": 0.55, + "learning_rate": 1.8814251139681327e-06, + "loss": 0.9058, + "step": 21290 + }, + { + "epoch": 0.55, + "learning_rate": 1.8814120442168736e-06, + "loss": 0.8643, + "step": 21291 + }, + { + "epoch": 0.55, + "learning_rate": 1.8813989737907583e-06, + "loss": 1.0264, + "step": 21292 + }, + { + "epoch": 0.55, + "learning_rate": 1.881385902689796e-06, + "loss": 0.855, + "step": 21293 + }, + { + "epoch": 0.55, + "learning_rate": 1.881372830913997e-06, + "loss": 0.8154, + "step": 21294 + }, + { + "epoch": 0.55, + "learning_rate": 1.8813597584633715e-06, + "loss": 0.6113, + "step": 21295 + }, + { + "epoch": 0.55, + "learning_rate": 1.8813466853379294e-06, + "loss": 0.9414, + "step": 21296 + }, + { + "epoch": 0.55, + "learning_rate": 1.8813336115376806e-06, + "loss": 0.8511, + "step": 21297 + }, + { + "epoch": 0.55, + "learning_rate": 1.881320537062635e-06, + "loss": 0.9844, + "step": 21298 + }, + { + "epoch": 0.55, + "learning_rate": 1.881307461912803e-06, + "loss": 0.8271, + "step": 21299 + }, + { + "epoch": 0.55, + "learning_rate": 1.8812943860881942e-06, + "loss": 0.7499, + "step": 21300 + }, + { + "epoch": 0.55, + "learning_rate": 1.8812813095888191e-06, + "loss": 0.8428, + "step": 21301 + }, + { + "epoch": 0.55, + "learning_rate": 1.8812682324146873e-06, + "loss": 1.0186, + "step": 21302 + }, + { + "epoch": 0.55, + "learning_rate": 1.881255154565809e-06, + "loss": 0.6311, + "step": 21303 + }, + { + "epoch": 0.55, + "learning_rate": 1.8812420760421941e-06, + "loss": 0.7451, + "step": 21304 + }, + { + "epoch": 0.55, + "learning_rate": 1.8812289968438524e-06, + "loss": 0.752, + "step": 21305 + }, + { + "epoch": 0.55, + "learning_rate": 1.8812159169707944e-06, + "loss": 0.7549, + "step": 21306 + }, + { + "epoch": 0.55, + "learning_rate": 1.8812028364230299e-06, + "loss": 0.9658, + "step": 21307 + }, + { + "epoch": 0.55, + "learning_rate": 1.8811897552005688e-06, + "loss": 0.8291, + "step": 21308 + }, + { + "epoch": 0.55, + "learning_rate": 1.8811766733034212e-06, + "loss": 0.6006, + "step": 21309 + }, + { + "epoch": 0.55, + "learning_rate": 1.8811635907315975e-06, + "loss": 0.8105, + "step": 21310 + }, + { + "epoch": 0.55, + "learning_rate": 1.881150507485107e-06, + "loss": 0.9375, + "step": 21311 + }, + { + "epoch": 0.55, + "learning_rate": 1.8811374235639602e-06, + "loss": 0.8169, + "step": 21312 + }, + { + "epoch": 0.55, + "learning_rate": 1.881124338968167e-06, + "loss": 1.0898, + "step": 21313 + }, + { + "epoch": 0.55, + "learning_rate": 1.8811112536977376e-06, + "loss": 0.7861, + "step": 21314 + }, + { + "epoch": 0.55, + "learning_rate": 1.8810981677526816e-06, + "loss": 0.959, + "step": 21315 + }, + { + "epoch": 0.55, + "learning_rate": 1.8810850811330092e-06, + "loss": 0.9736, + "step": 21316 + }, + { + "epoch": 0.55, + "learning_rate": 1.8810719938387306e-06, + "loss": 0.8281, + "step": 21317 + }, + { + "epoch": 0.55, + "learning_rate": 1.8810589058698554e-06, + "loss": 0.8926, + "step": 21318 + }, + { + "epoch": 0.55, + "learning_rate": 1.8810458172263943e-06, + "loss": 0.8545, + "step": 21319 + }, + { + "epoch": 0.55, + "learning_rate": 1.8810327279083568e-06, + "loss": 0.6904, + "step": 21320 + }, + { + "epoch": 0.55, + "learning_rate": 1.8810196379157528e-06, + "loss": 0.7324, + "step": 21321 + }, + { + "epoch": 0.55, + "learning_rate": 1.8810065472485927e-06, + "loss": 0.8677, + "step": 21322 + }, + { + "epoch": 0.55, + "learning_rate": 1.8809934559068866e-06, + "loss": 0.8608, + "step": 21323 + }, + { + "epoch": 0.55, + "learning_rate": 1.8809803638906442e-06, + "loss": 0.9404, + "step": 21324 + }, + { + "epoch": 0.55, + "learning_rate": 1.8809672711998757e-06, + "loss": 0.8896, + "step": 21325 + }, + { + "epoch": 0.55, + "learning_rate": 1.880954177834591e-06, + "loss": 1.0156, + "step": 21326 + }, + { + "epoch": 0.55, + "learning_rate": 1.8809410837948001e-06, + "loss": 1.001, + "step": 21327 + }, + { + "epoch": 0.55, + "learning_rate": 1.8809279890805133e-06, + "loss": 0.9424, + "step": 21328 + }, + { + "epoch": 0.55, + "learning_rate": 1.8809148936917402e-06, + "loss": 0.9746, + "step": 21329 + }, + { + "epoch": 0.55, + "learning_rate": 1.8809017976284914e-06, + "loss": 1.1758, + "step": 21330 + }, + { + "epoch": 0.55, + "learning_rate": 1.8808887008907766e-06, + "loss": 0.9336, + "step": 21331 + }, + { + "epoch": 0.55, + "learning_rate": 1.8808756034786054e-06, + "loss": 0.8496, + "step": 21332 + }, + { + "epoch": 0.55, + "learning_rate": 1.8808625053919887e-06, + "loss": 1.1094, + "step": 21333 + }, + { + "epoch": 0.55, + "learning_rate": 1.8808494066309357e-06, + "loss": 0.6802, + "step": 21334 + }, + { + "epoch": 0.55, + "learning_rate": 1.880836307195457e-06, + "loss": 0.8701, + "step": 21335 + }, + { + "epoch": 0.55, + "learning_rate": 1.8808232070855625e-06, + "loss": 0.998, + "step": 21336 + }, + { + "epoch": 0.55, + "learning_rate": 1.8808101063012622e-06, + "loss": 1.0059, + "step": 21337 + }, + { + "epoch": 0.55, + "learning_rate": 1.8807970048425661e-06, + "loss": 0.8135, + "step": 21338 + }, + { + "epoch": 0.55, + "learning_rate": 1.880783902709484e-06, + "loss": 0.7734, + "step": 21339 + }, + { + "epoch": 0.55, + "learning_rate": 1.8807707999020263e-06, + "loss": 1.001, + "step": 21340 + }, + { + "epoch": 0.55, + "learning_rate": 1.880757696420203e-06, + "loss": 0.793, + "step": 21341 + }, + { + "epoch": 0.55, + "learning_rate": 1.880744592264024e-06, + "loss": 0.7891, + "step": 21342 + }, + { + "epoch": 0.55, + "learning_rate": 1.8807314874334992e-06, + "loss": 0.5264, + "step": 21343 + }, + { + "epoch": 0.55, + "learning_rate": 1.880718381928639e-06, + "loss": 0.998, + "step": 21344 + }, + { + "epoch": 0.55, + "learning_rate": 1.880705275749453e-06, + "loss": 1.1162, + "step": 21345 + }, + { + "epoch": 0.55, + "learning_rate": 1.8806921688959517e-06, + "loss": 0.9297, + "step": 21346 + }, + { + "epoch": 0.55, + "learning_rate": 1.8806790613681449e-06, + "loss": 1.0127, + "step": 21347 + }, + { + "epoch": 0.55, + "learning_rate": 1.8806659531660425e-06, + "loss": 0.8242, + "step": 21348 + }, + { + "epoch": 0.55, + "learning_rate": 1.8806528442896544e-06, + "loss": 0.9546, + "step": 21349 + }, + { + "epoch": 0.55, + "learning_rate": 1.8806397347389913e-06, + "loss": 0.8506, + "step": 21350 + }, + { + "epoch": 0.55, + "learning_rate": 1.8806266245140629e-06, + "loss": 0.8506, + "step": 21351 + }, + { + "epoch": 0.55, + "learning_rate": 1.880613513614879e-06, + "loss": 0.8809, + "step": 21352 + }, + { + "epoch": 0.55, + "learning_rate": 1.88060040204145e-06, + "loss": 1.0859, + "step": 21353 + }, + { + "epoch": 0.55, + "learning_rate": 1.8805872897937855e-06, + "loss": 0.8359, + "step": 21354 + }, + { + "epoch": 0.55, + "learning_rate": 1.880574176871896e-06, + "loss": 0.7192, + "step": 21355 + }, + { + "epoch": 0.55, + "learning_rate": 1.8805610632757913e-06, + "loss": 0.6909, + "step": 21356 + }, + { + "epoch": 0.55, + "learning_rate": 1.8805479490054816e-06, + "loss": 0.7988, + "step": 21357 + }, + { + "epoch": 0.55, + "learning_rate": 1.8805348340609766e-06, + "loss": 1.0713, + "step": 21358 + }, + { + "epoch": 0.55, + "learning_rate": 1.8805217184422868e-06, + "loss": 0.8564, + "step": 21359 + }, + { + "epoch": 0.55, + "learning_rate": 1.8805086021494216e-06, + "loss": 0.9004, + "step": 21360 + }, + { + "epoch": 0.55, + "learning_rate": 1.8804954851823919e-06, + "loss": 0.8369, + "step": 21361 + }, + { + "epoch": 0.55, + "learning_rate": 1.8804823675412072e-06, + "loss": 0.7988, + "step": 21362 + }, + { + "epoch": 0.55, + "learning_rate": 1.8804692492258776e-06, + "loss": 0.5842, + "step": 21363 + }, + { + "epoch": 0.55, + "learning_rate": 1.880456130236413e-06, + "loss": 0.8389, + "step": 21364 + }, + { + "epoch": 0.55, + "learning_rate": 1.880443010572824e-06, + "loss": 0.7324, + "step": 21365 + }, + { + "epoch": 0.55, + "learning_rate": 1.8804298902351199e-06, + "loss": 0.7881, + "step": 21366 + }, + { + "epoch": 0.55, + "learning_rate": 1.8804167692233113e-06, + "loss": 0.8672, + "step": 21367 + }, + { + "epoch": 0.55, + "learning_rate": 1.880403647537408e-06, + "loss": 0.8711, + "step": 21368 + }, + { + "epoch": 0.55, + "learning_rate": 1.88039052517742e-06, + "loss": 0.9824, + "step": 21369 + }, + { + "epoch": 0.55, + "learning_rate": 1.8803774021433576e-06, + "loss": 1.0771, + "step": 21370 + }, + { + "epoch": 0.55, + "learning_rate": 1.8803642784352308e-06, + "loss": 0.8682, + "step": 21371 + }, + { + "epoch": 0.55, + "learning_rate": 1.8803511540530495e-06, + "loss": 0.6193, + "step": 21372 + }, + { + "epoch": 0.55, + "learning_rate": 1.8803380289968236e-06, + "loss": 0.8193, + "step": 21373 + }, + { + "epoch": 0.55, + "learning_rate": 1.8803249032665636e-06, + "loss": 0.8848, + "step": 21374 + }, + { + "epoch": 0.55, + "learning_rate": 1.880311776862279e-06, + "loss": 0.4575, + "step": 21375 + }, + { + "epoch": 0.55, + "learning_rate": 1.8802986497839805e-06, + "loss": 0.7949, + "step": 21376 + }, + { + "epoch": 0.55, + "learning_rate": 1.8802855220316776e-06, + "loss": 0.791, + "step": 21377 + }, + { + "epoch": 0.55, + "learning_rate": 1.8802723936053805e-06, + "loss": 0.686, + "step": 21378 + }, + { + "epoch": 0.55, + "learning_rate": 1.8802592645050994e-06, + "loss": 0.9033, + "step": 21379 + }, + { + "epoch": 0.55, + "learning_rate": 1.8802461347308442e-06, + "loss": 0.5811, + "step": 21380 + }, + { + "epoch": 0.55, + "learning_rate": 1.8802330042826251e-06, + "loss": 1.0059, + "step": 21381 + }, + { + "epoch": 0.55, + "learning_rate": 1.8802198731604522e-06, + "loss": 0.7803, + "step": 21382 + }, + { + "epoch": 0.55, + "learning_rate": 1.880206741364335e-06, + "loss": 1.0781, + "step": 21383 + }, + { + "epoch": 0.55, + "learning_rate": 1.8801936088942842e-06, + "loss": 0.918, + "step": 21384 + }, + { + "epoch": 0.55, + "learning_rate": 1.8801804757503096e-06, + "loss": 0.8477, + "step": 21385 + }, + { + "epoch": 0.55, + "learning_rate": 1.8801673419324215e-06, + "loss": 0.791, + "step": 21386 + }, + { + "epoch": 0.55, + "learning_rate": 1.8801542074406295e-06, + "loss": 0.8496, + "step": 21387 + }, + { + "epoch": 0.55, + "learning_rate": 1.880141072274944e-06, + "loss": 0.8975, + "step": 21388 + }, + { + "epoch": 0.55, + "learning_rate": 1.8801279364353748e-06, + "loss": 0.8037, + "step": 21389 + }, + { + "epoch": 0.55, + "learning_rate": 1.8801147999219323e-06, + "loss": 0.8867, + "step": 21390 + }, + { + "epoch": 0.55, + "learning_rate": 1.8801016627346263e-06, + "loss": 0.7461, + "step": 21391 + }, + { + "epoch": 0.55, + "learning_rate": 1.8800885248734668e-06, + "loss": 0.7891, + "step": 21392 + }, + { + "epoch": 0.55, + "learning_rate": 1.8800753863384643e-06, + "loss": 0.8872, + "step": 21393 + }, + { + "epoch": 0.55, + "learning_rate": 1.8800622471296282e-06, + "loss": 0.875, + "step": 21394 + }, + { + "epoch": 0.55, + "learning_rate": 1.8800491072469691e-06, + "loss": 0.9258, + "step": 21395 + }, + { + "epoch": 0.55, + "learning_rate": 1.8800359666904968e-06, + "loss": 0.9355, + "step": 21396 + }, + { + "epoch": 0.55, + "learning_rate": 1.8800228254602213e-06, + "loss": 0.834, + "step": 21397 + }, + { + "epoch": 0.55, + "learning_rate": 1.880009683556153e-06, + "loss": 0.5356, + "step": 21398 + }, + { + "epoch": 0.55, + "learning_rate": 1.8799965409783016e-06, + "loss": 1.1377, + "step": 21399 + }, + { + "epoch": 0.55, + "learning_rate": 1.8799833977266774e-06, + "loss": 0.8245, + "step": 21400 + }, + { + "epoch": 0.55, + "learning_rate": 1.8799702538012902e-06, + "loss": 1.0557, + "step": 21401 + }, + { + "epoch": 0.55, + "learning_rate": 1.8799571092021505e-06, + "loss": 0.6626, + "step": 21402 + }, + { + "epoch": 0.55, + "learning_rate": 1.8799439639292681e-06, + "loss": 0.9844, + "step": 21403 + }, + { + "epoch": 0.55, + "learning_rate": 1.879930817982653e-06, + "loss": 0.5867, + "step": 21404 + }, + { + "epoch": 0.55, + "learning_rate": 1.879917671362315e-06, + "loss": 0.6943, + "step": 21405 + }, + { + "epoch": 0.55, + "learning_rate": 1.879904524068265e-06, + "loss": 0.813, + "step": 21406 + }, + { + "epoch": 0.55, + "learning_rate": 1.8798913761005122e-06, + "loss": 0.7407, + "step": 21407 + }, + { + "epoch": 0.55, + "learning_rate": 1.8798782274590672e-06, + "loss": 0.7725, + "step": 21408 + }, + { + "epoch": 0.55, + "learning_rate": 1.8798650781439399e-06, + "loss": 0.6289, + "step": 21409 + }, + { + "epoch": 0.55, + "learning_rate": 1.8798519281551403e-06, + "loss": 0.7217, + "step": 21410 + }, + { + "epoch": 0.55, + "learning_rate": 1.8798387774926786e-06, + "loss": 0.9385, + "step": 21411 + }, + { + "epoch": 0.55, + "learning_rate": 1.879825626156565e-06, + "loss": 1.0762, + "step": 21412 + }, + { + "epoch": 0.55, + "learning_rate": 1.8798124741468092e-06, + "loss": 0.8569, + "step": 21413 + }, + { + "epoch": 0.55, + "learning_rate": 1.8797993214634212e-06, + "loss": 0.7627, + "step": 21414 + }, + { + "epoch": 0.55, + "learning_rate": 1.8797861681064115e-06, + "loss": 0.8789, + "step": 21415 + }, + { + "epoch": 0.55, + "learning_rate": 1.8797730140757899e-06, + "loss": 0.9854, + "step": 21416 + }, + { + "epoch": 0.55, + "learning_rate": 1.8797598593715666e-06, + "loss": 0.6821, + "step": 21417 + }, + { + "epoch": 0.55, + "learning_rate": 1.879746703993752e-06, + "loss": 0.8674, + "step": 21418 + }, + { + "epoch": 0.55, + "learning_rate": 1.8797335479423553e-06, + "loss": 0.9248, + "step": 21419 + }, + { + "epoch": 0.55, + "learning_rate": 1.8797203912173871e-06, + "loss": 0.5591, + "step": 21420 + }, + { + "epoch": 0.55, + "learning_rate": 1.8797072338188577e-06, + "loss": 0.7734, + "step": 21421 + }, + { + "epoch": 0.55, + "learning_rate": 1.879694075746777e-06, + "loss": 0.9648, + "step": 21422 + }, + { + "epoch": 0.55, + "learning_rate": 1.879680917001155e-06, + "loss": 0.9634, + "step": 21423 + }, + { + "epoch": 0.55, + "learning_rate": 1.8796677575820014e-06, + "loss": 0.7656, + "step": 21424 + }, + { + "epoch": 0.55, + "learning_rate": 1.8796545974893268e-06, + "loss": 0.8936, + "step": 21425 + }, + { + "epoch": 0.55, + "learning_rate": 1.879641436723141e-06, + "loss": 0.835, + "step": 21426 + }, + { + "epoch": 0.55, + "learning_rate": 1.8796282752834544e-06, + "loss": 0.6777, + "step": 21427 + }, + { + "epoch": 0.55, + "learning_rate": 1.879615113170277e-06, + "loss": 1.0039, + "step": 21428 + }, + { + "epoch": 0.55, + "learning_rate": 1.8796019503836185e-06, + "loss": 0.7095, + "step": 21429 + }, + { + "epoch": 0.55, + "learning_rate": 1.8795887869234895e-06, + "loss": 0.689, + "step": 21430 + }, + { + "epoch": 0.55, + "learning_rate": 1.8795756227898996e-06, + "loss": 0.7251, + "step": 21431 + }, + { + "epoch": 0.55, + "learning_rate": 1.879562457982859e-06, + "loss": 0.9092, + "step": 21432 + }, + { + "epoch": 0.55, + "learning_rate": 1.8795492925023783e-06, + "loss": 0.75, + "step": 21433 + }, + { + "epoch": 0.55, + "learning_rate": 1.8795361263484665e-06, + "loss": 0.7646, + "step": 21434 + }, + { + "epoch": 0.55, + "learning_rate": 1.8795229595211346e-06, + "loss": 0.8682, + "step": 21435 + }, + { + "epoch": 0.55, + "learning_rate": 1.8795097920203926e-06, + "loss": 0.8774, + "step": 21436 + }, + { + "epoch": 0.55, + "learning_rate": 1.8794966238462502e-06, + "loss": 0.9775, + "step": 21437 + }, + { + "epoch": 0.55, + "learning_rate": 1.8794834549987178e-06, + "loss": 0.8594, + "step": 21438 + }, + { + "epoch": 0.55, + "learning_rate": 1.8794702854778052e-06, + "loss": 1.0537, + "step": 21439 + }, + { + "epoch": 0.55, + "learning_rate": 1.879457115283523e-06, + "loss": 0.8235, + "step": 21440 + }, + { + "epoch": 0.55, + "learning_rate": 1.8794439444158808e-06, + "loss": 1.0303, + "step": 21441 + }, + { + "epoch": 0.55, + "learning_rate": 1.8794307728748887e-06, + "loss": 0.8398, + "step": 21442 + }, + { + "epoch": 0.55, + "learning_rate": 1.8794176006605566e-06, + "loss": 1.1494, + "step": 21443 + }, + { + "epoch": 0.55, + "learning_rate": 1.8794044277728954e-06, + "loss": 0.874, + "step": 21444 + }, + { + "epoch": 0.55, + "learning_rate": 1.879391254211914e-06, + "loss": 0.7822, + "step": 21445 + }, + { + "epoch": 0.55, + "learning_rate": 1.879378079977624e-06, + "loss": 0.438, + "step": 21446 + }, + { + "epoch": 0.55, + "learning_rate": 1.8793649050700342e-06, + "loss": 1.1133, + "step": 21447 + }, + { + "epoch": 0.55, + "learning_rate": 1.879351729489155e-06, + "loss": 0.8042, + "step": 21448 + }, + { + "epoch": 0.55, + "learning_rate": 1.8793385532349967e-06, + "loss": 0.8579, + "step": 21449 + }, + { + "epoch": 0.55, + "learning_rate": 1.8793253763075694e-06, + "loss": 0.9844, + "step": 21450 + }, + { + "epoch": 0.55, + "learning_rate": 1.879312198706883e-06, + "loss": 0.9521, + "step": 21451 + }, + { + "epoch": 0.55, + "learning_rate": 1.8792990204329478e-06, + "loss": 0.73, + "step": 21452 + }, + { + "epoch": 0.55, + "learning_rate": 1.8792858414857738e-06, + "loss": 0.8652, + "step": 21453 + }, + { + "epoch": 0.55, + "learning_rate": 1.879272661865371e-06, + "loss": 1.0205, + "step": 21454 + }, + { + "epoch": 0.55, + "learning_rate": 1.8792594815717494e-06, + "loss": 0.8525, + "step": 21455 + }, + { + "epoch": 0.55, + "learning_rate": 1.8792463006049193e-06, + "loss": 0.8645, + "step": 21456 + }, + { + "epoch": 0.55, + "learning_rate": 1.8792331189648908e-06, + "loss": 0.8359, + "step": 21457 + }, + { + "epoch": 0.55, + "learning_rate": 1.879219936651674e-06, + "loss": 0.6123, + "step": 21458 + }, + { + "epoch": 0.55, + "learning_rate": 1.879206753665279e-06, + "loss": 0.9639, + "step": 21459 + }, + { + "epoch": 0.55, + "learning_rate": 1.8791935700057155e-06, + "loss": 0.9932, + "step": 21460 + }, + { + "epoch": 0.55, + "learning_rate": 1.8791803856729942e-06, + "loss": 0.5791, + "step": 21461 + }, + { + "epoch": 0.55, + "learning_rate": 1.8791672006671248e-06, + "loss": 0.7979, + "step": 21462 + }, + { + "epoch": 0.55, + "learning_rate": 1.8791540149881175e-06, + "loss": 0.8643, + "step": 21463 + }, + { + "epoch": 0.55, + "learning_rate": 1.8791408286359824e-06, + "loss": 0.9678, + "step": 21464 + }, + { + "epoch": 0.55, + "learning_rate": 1.8791276416107293e-06, + "loss": 0.7998, + "step": 21465 + }, + { + "epoch": 0.55, + "learning_rate": 1.879114453912369e-06, + "loss": 0.8164, + "step": 21466 + }, + { + "epoch": 0.55, + "learning_rate": 1.8791012655409112e-06, + "loss": 0.7817, + "step": 21467 + }, + { + "epoch": 0.55, + "learning_rate": 1.8790880764963656e-06, + "loss": 0.9619, + "step": 21468 + }, + { + "epoch": 0.55, + "learning_rate": 1.879074886778743e-06, + "loss": 0.8965, + "step": 21469 + }, + { + "epoch": 0.55, + "learning_rate": 1.879061696388053e-06, + "loss": 0.8955, + "step": 21470 + }, + { + "epoch": 0.55, + "learning_rate": 1.8790485053243058e-06, + "loss": 0.6982, + "step": 21471 + }, + { + "epoch": 0.55, + "learning_rate": 1.8790353135875118e-06, + "loss": 1.1104, + "step": 21472 + }, + { + "epoch": 0.55, + "learning_rate": 1.879022121177681e-06, + "loss": 0.6553, + "step": 21473 + }, + { + "epoch": 0.55, + "learning_rate": 1.8790089280948233e-06, + "loss": 0.9512, + "step": 21474 + }, + { + "epoch": 0.55, + "learning_rate": 1.8789957343389488e-06, + "loss": 0.9336, + "step": 21475 + }, + { + "epoch": 0.55, + "learning_rate": 1.8789825399100677e-06, + "loss": 0.9307, + "step": 21476 + }, + { + "epoch": 0.55, + "learning_rate": 1.87896934480819e-06, + "loss": 0.6567, + "step": 21477 + }, + { + "epoch": 0.55, + "learning_rate": 1.8789561490333259e-06, + "loss": 0.8276, + "step": 21478 + }, + { + "epoch": 0.55, + "learning_rate": 1.8789429525854853e-06, + "loss": 0.8105, + "step": 21479 + }, + { + "epoch": 0.55, + "learning_rate": 1.878929755464679e-06, + "loss": 0.9375, + "step": 21480 + }, + { + "epoch": 0.55, + "learning_rate": 1.8789165576709163e-06, + "loss": 1.0205, + "step": 21481 + }, + { + "epoch": 0.55, + "learning_rate": 1.8789033592042077e-06, + "loss": 0.6372, + "step": 21482 + }, + { + "epoch": 0.55, + "learning_rate": 1.878890160064563e-06, + "loss": 0.9277, + "step": 21483 + }, + { + "epoch": 0.55, + "learning_rate": 1.8788769602519927e-06, + "loss": 0.8145, + "step": 21484 + }, + { + "epoch": 0.55, + "learning_rate": 1.8788637597665069e-06, + "loss": 0.8643, + "step": 21485 + }, + { + "epoch": 0.55, + "learning_rate": 1.8788505586081152e-06, + "loss": 0.9663, + "step": 21486 + }, + { + "epoch": 0.55, + "learning_rate": 1.878837356776828e-06, + "loss": 0.9019, + "step": 21487 + }, + { + "epoch": 0.55, + "learning_rate": 1.8788241542726557e-06, + "loss": 0.6646, + "step": 21488 + }, + { + "epoch": 0.55, + "learning_rate": 1.8788109510956081e-06, + "loss": 1.0518, + "step": 21489 + }, + { + "epoch": 0.55, + "learning_rate": 1.8787977472456956e-06, + "loss": 0.8062, + "step": 21490 + }, + { + "epoch": 0.55, + "learning_rate": 1.8787845427229273e-06, + "loss": 0.7441, + "step": 21491 + }, + { + "epoch": 0.55, + "learning_rate": 1.8787713375273149e-06, + "loss": 0.832, + "step": 21492 + }, + { + "epoch": 0.55, + "learning_rate": 1.8787581316588673e-06, + "loss": 0.7427, + "step": 21493 + }, + { + "epoch": 0.55, + "learning_rate": 1.878744925117595e-06, + "loss": 0.9131, + "step": 21494 + }, + { + "epoch": 0.55, + "learning_rate": 1.8787317179035083e-06, + "loss": 0.9258, + "step": 21495 + }, + { + "epoch": 0.55, + "learning_rate": 1.878718510016617e-06, + "loss": 1.1328, + "step": 21496 + }, + { + "epoch": 0.55, + "learning_rate": 1.8787053014569315e-06, + "loss": 1.002, + "step": 21497 + }, + { + "epoch": 0.55, + "learning_rate": 1.8786920922244614e-06, + "loss": 0.8994, + "step": 21498 + }, + { + "epoch": 0.55, + "learning_rate": 1.8786788823192174e-06, + "loss": 0.7729, + "step": 21499 + }, + { + "epoch": 0.55, + "learning_rate": 1.8786656717412095e-06, + "loss": 1.1328, + "step": 21500 + }, + { + "epoch": 0.55, + "learning_rate": 1.8786524604904478e-06, + "loss": 0.9932, + "step": 21501 + }, + { + "epoch": 0.55, + "learning_rate": 1.8786392485669418e-06, + "loss": 0.8225, + "step": 21502 + }, + { + "epoch": 0.55, + "learning_rate": 1.8786260359707025e-06, + "loss": 0.8486, + "step": 21503 + }, + { + "epoch": 0.55, + "learning_rate": 1.8786128227017395e-06, + "loss": 0.6436, + "step": 21504 + }, + { + "epoch": 0.55, + "learning_rate": 1.8785996087600632e-06, + "loss": 0.8457, + "step": 21505 + }, + { + "epoch": 0.55, + "learning_rate": 1.8785863941456834e-06, + "loss": 0.9971, + "step": 21506 + }, + { + "epoch": 0.55, + "learning_rate": 1.8785731788586104e-06, + "loss": 0.8096, + "step": 21507 + }, + { + "epoch": 0.55, + "learning_rate": 1.8785599628988543e-06, + "loss": 0.9922, + "step": 21508 + }, + { + "epoch": 0.55, + "learning_rate": 1.8785467462664256e-06, + "loss": 0.7295, + "step": 21509 + }, + { + "epoch": 0.55, + "learning_rate": 1.8785335289613339e-06, + "loss": 0.6871, + "step": 21510 + }, + { + "epoch": 0.55, + "learning_rate": 1.8785203109835891e-06, + "loss": 0.7505, + "step": 21511 + }, + { + "epoch": 0.55, + "learning_rate": 1.878507092333202e-06, + "loss": 0.5776, + "step": 21512 + }, + { + "epoch": 0.55, + "learning_rate": 1.8784938730101824e-06, + "loss": 0.8281, + "step": 21513 + }, + { + "epoch": 0.55, + "learning_rate": 1.8784806530145403e-06, + "loss": 0.8926, + "step": 21514 + }, + { + "epoch": 0.55, + "learning_rate": 1.8784674323462862e-06, + "loss": 0.7246, + "step": 21515 + }, + { + "epoch": 0.55, + "learning_rate": 1.8784542110054298e-06, + "loss": 0.9766, + "step": 21516 + }, + { + "epoch": 0.55, + "learning_rate": 1.8784409889919814e-06, + "loss": 0.8589, + "step": 21517 + }, + { + "epoch": 0.55, + "learning_rate": 1.8784277663059513e-06, + "loss": 0.9043, + "step": 21518 + }, + { + "epoch": 0.55, + "learning_rate": 1.8784145429473493e-06, + "loss": 0.7734, + "step": 21519 + }, + { + "epoch": 0.55, + "learning_rate": 1.8784013189161856e-06, + "loss": 0.7822, + "step": 21520 + }, + { + "epoch": 0.55, + "learning_rate": 1.8783880942124705e-06, + "loss": 0.8232, + "step": 21521 + }, + { + "epoch": 0.55, + "learning_rate": 1.878374868836214e-06, + "loss": 0.9131, + "step": 21522 + }, + { + "epoch": 0.55, + "learning_rate": 1.8783616427874263e-06, + "loss": 0.9268, + "step": 21523 + }, + { + "epoch": 0.55, + "learning_rate": 1.8783484160661174e-06, + "loss": 0.6699, + "step": 21524 + }, + { + "epoch": 0.55, + "learning_rate": 1.8783351886722975e-06, + "loss": 0.7969, + "step": 21525 + }, + { + "epoch": 0.55, + "learning_rate": 1.878321960605977e-06, + "loss": 1.0283, + "step": 21526 + }, + { + "epoch": 0.55, + "learning_rate": 1.8783087318671655e-06, + "loss": 0.998, + "step": 21527 + }, + { + "epoch": 0.55, + "learning_rate": 1.8782955024558736e-06, + "loss": 0.792, + "step": 21528 + }, + { + "epoch": 0.55, + "learning_rate": 1.878282272372111e-06, + "loss": 0.8535, + "step": 21529 + }, + { + "epoch": 0.55, + "learning_rate": 1.878269041615888e-06, + "loss": 0.5858, + "step": 21530 + }, + { + "epoch": 0.55, + "learning_rate": 1.8782558101872151e-06, + "loss": 0.5835, + "step": 21531 + }, + { + "epoch": 0.55, + "learning_rate": 1.8782425780861017e-06, + "loss": 0.7378, + "step": 21532 + }, + { + "epoch": 0.55, + "learning_rate": 1.8782293453125587e-06, + "loss": 0.8418, + "step": 21533 + }, + { + "epoch": 0.55, + "learning_rate": 1.8782161118665956e-06, + "loss": 0.8027, + "step": 21534 + }, + { + "epoch": 0.55, + "learning_rate": 1.8782028777482228e-06, + "loss": 0.791, + "step": 21535 + }, + { + "epoch": 0.55, + "learning_rate": 1.8781896429574507e-06, + "loss": 0.8271, + "step": 21536 + }, + { + "epoch": 0.55, + "learning_rate": 1.8781764074942892e-06, + "loss": 0.8799, + "step": 21537 + }, + { + "epoch": 0.55, + "learning_rate": 1.878163171358748e-06, + "loss": 0.9814, + "step": 21538 + }, + { + "epoch": 0.55, + "learning_rate": 1.878149934550838e-06, + "loss": 0.7822, + "step": 21539 + }, + { + "epoch": 0.55, + "learning_rate": 1.8781366970705687e-06, + "loss": 0.9004, + "step": 21540 + }, + { + "epoch": 0.55, + "learning_rate": 1.8781234589179506e-06, + "loss": 0.8477, + "step": 21541 + }, + { + "epoch": 0.55, + "learning_rate": 1.878110220092994e-06, + "loss": 0.9434, + "step": 21542 + }, + { + "epoch": 0.55, + "learning_rate": 1.8780969805957084e-06, + "loss": 0.731, + "step": 21543 + }, + { + "epoch": 0.55, + "learning_rate": 1.8780837404261045e-06, + "loss": 0.8506, + "step": 21544 + }, + { + "epoch": 0.55, + "learning_rate": 1.8780704995841924e-06, + "loss": 0.9766, + "step": 21545 + }, + { + "epoch": 0.55, + "learning_rate": 1.8780572580699819e-06, + "loss": 0.8867, + "step": 21546 + }, + { + "epoch": 0.55, + "learning_rate": 1.8780440158834835e-06, + "loss": 0.8501, + "step": 21547 + }, + { + "epoch": 0.55, + "learning_rate": 1.8780307730247069e-06, + "loss": 0.8926, + "step": 21548 + }, + { + "epoch": 0.55, + "learning_rate": 1.8780175294936627e-06, + "loss": 0.8301, + "step": 21549 + }, + { + "epoch": 0.55, + "learning_rate": 1.8780042852903608e-06, + "loss": 0.9902, + "step": 21550 + }, + { + "epoch": 0.55, + "learning_rate": 1.8779910404148115e-06, + "loss": 0.8145, + "step": 21551 + }, + { + "epoch": 0.55, + "learning_rate": 1.8779777948670246e-06, + "loss": 0.8438, + "step": 21552 + }, + { + "epoch": 0.55, + "learning_rate": 1.8779645486470106e-06, + "loss": 0.8169, + "step": 21553 + }, + { + "epoch": 0.55, + "learning_rate": 1.8779513017547797e-06, + "loss": 0.877, + "step": 21554 + }, + { + "epoch": 0.55, + "learning_rate": 1.8779380541903417e-06, + "loss": 0.6377, + "step": 21555 + }, + { + "epoch": 0.55, + "learning_rate": 1.8779248059537067e-06, + "loss": 1.0098, + "step": 21556 + }, + { + "epoch": 0.55, + "learning_rate": 1.877911557044885e-06, + "loss": 0.8086, + "step": 21557 + }, + { + "epoch": 0.55, + "learning_rate": 1.8778983074638873e-06, + "loss": 0.8379, + "step": 21558 + }, + { + "epoch": 0.55, + "learning_rate": 1.8778850572107227e-06, + "loss": 1.0615, + "step": 21559 + }, + { + "epoch": 0.55, + "learning_rate": 1.8778718062854023e-06, + "loss": 1.0752, + "step": 21560 + }, + { + "epoch": 0.55, + "learning_rate": 1.8778585546879357e-06, + "loss": 0.6113, + "step": 21561 + }, + { + "epoch": 0.55, + "learning_rate": 1.877845302418333e-06, + "loss": 1.0605, + "step": 21562 + }, + { + "epoch": 0.55, + "learning_rate": 1.8778320494766046e-06, + "loss": 1.0146, + "step": 21563 + }, + { + "epoch": 0.55, + "learning_rate": 1.8778187958627606e-06, + "loss": 0.7148, + "step": 21564 + }, + { + "epoch": 0.55, + "learning_rate": 1.8778055415768114e-06, + "loss": 0.8525, + "step": 21565 + }, + { + "epoch": 0.55, + "learning_rate": 1.8777922866187663e-06, + "loss": 1.0117, + "step": 21566 + }, + { + "epoch": 0.55, + "learning_rate": 1.8777790309886363e-06, + "loss": 0.814, + "step": 21567 + }, + { + "epoch": 0.55, + "learning_rate": 1.877765774686431e-06, + "loss": 0.6577, + "step": 21568 + }, + { + "epoch": 0.55, + "learning_rate": 1.8777525177121612e-06, + "loss": 0.8462, + "step": 21569 + }, + { + "epoch": 0.55, + "learning_rate": 1.8777392600658364e-06, + "loss": 0.7549, + "step": 21570 + }, + { + "epoch": 0.55, + "learning_rate": 1.8777260017474672e-06, + "loss": 0.7959, + "step": 21571 + }, + { + "epoch": 0.55, + "learning_rate": 1.8777127427570635e-06, + "loss": 1.1377, + "step": 21572 + }, + { + "epoch": 0.55, + "learning_rate": 1.8776994830946356e-06, + "loss": 0.6826, + "step": 21573 + }, + { + "epoch": 0.55, + "learning_rate": 1.8776862227601933e-06, + "loss": 0.9092, + "step": 21574 + }, + { + "epoch": 0.55, + "learning_rate": 1.8776729617537472e-06, + "loss": 1.0176, + "step": 21575 + }, + { + "epoch": 0.55, + "learning_rate": 1.8776597000753071e-06, + "loss": 0.8115, + "step": 21576 + }, + { + "epoch": 0.55, + "learning_rate": 1.8776464377248832e-06, + "loss": 0.7939, + "step": 21577 + }, + { + "epoch": 0.55, + "learning_rate": 1.8776331747024862e-06, + "loss": 0.8579, + "step": 21578 + }, + { + "epoch": 0.55, + "learning_rate": 1.877619911008126e-06, + "loss": 0.8047, + "step": 21579 + }, + { + "epoch": 0.55, + "learning_rate": 1.8776066466418121e-06, + "loss": 0.5913, + "step": 21580 + }, + { + "epoch": 0.55, + "learning_rate": 1.8775933816035553e-06, + "loss": 0.75, + "step": 21581 + }, + { + "epoch": 0.55, + "learning_rate": 1.8775801158933654e-06, + "loss": 0.8306, + "step": 21582 + }, + { + "epoch": 0.55, + "learning_rate": 1.8775668495112532e-06, + "loss": 0.8955, + "step": 21583 + }, + { + "epoch": 0.55, + "learning_rate": 1.877553582457228e-06, + "loss": 0.8799, + "step": 21584 + }, + { + "epoch": 0.55, + "learning_rate": 1.8775403147313004e-06, + "loss": 0.9658, + "step": 21585 + }, + { + "epoch": 0.55, + "learning_rate": 1.8775270463334808e-06, + "loss": 1.0303, + "step": 21586 + }, + { + "epoch": 0.55, + "learning_rate": 1.8775137772637791e-06, + "loss": 0.9385, + "step": 21587 + }, + { + "epoch": 0.55, + "learning_rate": 1.877500507522205e-06, + "loss": 0.8457, + "step": 21588 + }, + { + "epoch": 0.55, + "learning_rate": 1.8774872371087696e-06, + "loss": 0.7109, + "step": 21589 + }, + { + "epoch": 0.55, + "learning_rate": 1.8774739660234821e-06, + "loss": 1.0469, + "step": 21590 + }, + { + "epoch": 0.55, + "learning_rate": 1.8774606942663537e-06, + "loss": 0.9463, + "step": 21591 + }, + { + "epoch": 0.55, + "learning_rate": 1.8774474218373935e-06, + "loss": 0.8223, + "step": 21592 + }, + { + "epoch": 0.55, + "learning_rate": 1.8774341487366125e-06, + "loss": 0.9082, + "step": 21593 + }, + { + "epoch": 0.55, + "learning_rate": 1.8774208749640204e-06, + "loss": 0.7109, + "step": 21594 + }, + { + "epoch": 0.55, + "learning_rate": 1.8774076005196275e-06, + "loss": 0.8818, + "step": 21595 + }, + { + "epoch": 0.55, + "learning_rate": 1.877394325403444e-06, + "loss": 0.9688, + "step": 21596 + }, + { + "epoch": 0.55, + "learning_rate": 1.8773810496154797e-06, + "loss": 0.9814, + "step": 21597 + }, + { + "epoch": 0.55, + "learning_rate": 1.8773677731557453e-06, + "loss": 0.959, + "step": 21598 + }, + { + "epoch": 0.55, + "learning_rate": 1.8773544960242509e-06, + "loss": 1.0332, + "step": 21599 + }, + { + "epoch": 0.55, + "learning_rate": 1.8773412182210062e-06, + "loss": 0.645, + "step": 21600 + }, + { + "epoch": 0.55, + "learning_rate": 1.8773279397460218e-06, + "loss": 0.6868, + "step": 21601 + }, + { + "epoch": 0.55, + "learning_rate": 1.8773146605993078e-06, + "loss": 0.7573, + "step": 21602 + }, + { + "epoch": 0.55, + "learning_rate": 1.877301380780874e-06, + "loss": 0.6492, + "step": 21603 + }, + { + "epoch": 0.55, + "learning_rate": 1.8772881002907312e-06, + "loss": 0.9775, + "step": 21604 + }, + { + "epoch": 0.55, + "learning_rate": 1.8772748191288894e-06, + "loss": 1.1836, + "step": 21605 + }, + { + "epoch": 0.55, + "learning_rate": 1.8772615372953582e-06, + "loss": 0.9463, + "step": 21606 + }, + { + "epoch": 0.55, + "learning_rate": 1.8772482547901483e-06, + "loss": 0.9204, + "step": 21607 + }, + { + "epoch": 0.55, + "learning_rate": 1.8772349716132698e-06, + "loss": 1.0615, + "step": 21608 + }, + { + "epoch": 0.55, + "learning_rate": 1.877221687764733e-06, + "loss": 0.7446, + "step": 21609 + }, + { + "epoch": 0.55, + "learning_rate": 1.8772084032445474e-06, + "loss": 1.0576, + "step": 21610 + }, + { + "epoch": 0.55, + "learning_rate": 1.877195118052724e-06, + "loss": 0.7539, + "step": 21611 + }, + { + "epoch": 0.55, + "learning_rate": 1.8771818321892726e-06, + "loss": 0.9385, + "step": 21612 + }, + { + "epoch": 0.55, + "learning_rate": 1.8771685456542037e-06, + "loss": 0.9648, + "step": 21613 + }, + { + "epoch": 0.55, + "learning_rate": 1.8771552584475266e-06, + "loss": 0.8745, + "step": 21614 + }, + { + "epoch": 0.55, + "learning_rate": 1.8771419705692523e-06, + "loss": 1.209, + "step": 21615 + }, + { + "epoch": 0.55, + "learning_rate": 1.877128682019391e-06, + "loss": 0.918, + "step": 21616 + }, + { + "epoch": 0.55, + "learning_rate": 1.8771153927979522e-06, + "loss": 1.0605, + "step": 21617 + }, + { + "epoch": 0.55, + "learning_rate": 1.8771021029049465e-06, + "loss": 1.0557, + "step": 21618 + }, + { + "epoch": 0.55, + "learning_rate": 1.8770888123403843e-06, + "loss": 0.8125, + "step": 21619 + }, + { + "epoch": 0.55, + "learning_rate": 1.8770755211042755e-06, + "loss": 0.9102, + "step": 21620 + }, + { + "epoch": 0.55, + "learning_rate": 1.8770622291966301e-06, + "loss": 0.7568, + "step": 21621 + }, + { + "epoch": 0.55, + "learning_rate": 1.8770489366174587e-06, + "loss": 0.9248, + "step": 21622 + }, + { + "epoch": 0.55, + "learning_rate": 1.8770356433667712e-06, + "loss": 0.6138, + "step": 21623 + }, + { + "epoch": 0.55, + "learning_rate": 1.8770223494445776e-06, + "loss": 0.9648, + "step": 21624 + }, + { + "epoch": 0.55, + "learning_rate": 1.8770090548508886e-06, + "loss": 0.9512, + "step": 21625 + }, + { + "epoch": 0.55, + "learning_rate": 1.8769957595857137e-06, + "loss": 1.0186, + "step": 21626 + }, + { + "epoch": 0.55, + "learning_rate": 1.8769824636490638e-06, + "loss": 0.8672, + "step": 21627 + }, + { + "epoch": 0.55, + "learning_rate": 1.8769691670409488e-06, + "loss": 1.041, + "step": 21628 + }, + { + "epoch": 0.55, + "learning_rate": 1.8769558697613787e-06, + "loss": 0.8379, + "step": 21629 + }, + { + "epoch": 0.55, + "learning_rate": 1.876942571810364e-06, + "loss": 0.9668, + "step": 21630 + }, + { + "epoch": 0.55, + "learning_rate": 1.8769292731879144e-06, + "loss": 0.8398, + "step": 21631 + }, + { + "epoch": 0.55, + "learning_rate": 1.8769159738940407e-06, + "loss": 0.8877, + "step": 21632 + }, + { + "epoch": 0.55, + "learning_rate": 1.8769026739287526e-06, + "loss": 0.7036, + "step": 21633 + }, + { + "epoch": 0.55, + "learning_rate": 1.8768893732920604e-06, + "loss": 0.751, + "step": 21634 + }, + { + "epoch": 0.55, + "learning_rate": 1.8768760719839746e-06, + "loss": 0.9248, + "step": 21635 + }, + { + "epoch": 0.55, + "learning_rate": 1.8768627700045045e-06, + "loss": 0.7134, + "step": 21636 + }, + { + "epoch": 0.55, + "learning_rate": 1.8768494673536614e-06, + "loss": 1.0068, + "step": 21637 + }, + { + "epoch": 0.55, + "learning_rate": 1.8768361640314549e-06, + "loss": 1.042, + "step": 21638 + }, + { + "epoch": 0.55, + "learning_rate": 1.8768228600378953e-06, + "loss": 0.835, + "step": 21639 + }, + { + "epoch": 0.55, + "learning_rate": 1.8768095553729927e-06, + "loss": 0.7949, + "step": 21640 + }, + { + "epoch": 0.55, + "learning_rate": 1.8767962500367571e-06, + "loss": 0.8472, + "step": 21641 + }, + { + "epoch": 0.55, + "learning_rate": 1.876782944029199e-06, + "loss": 0.9199, + "step": 21642 + }, + { + "epoch": 0.55, + "learning_rate": 1.8767696373503289e-06, + "loss": 0.6956, + "step": 21643 + }, + { + "epoch": 0.55, + "learning_rate": 1.8767563300001562e-06, + "loss": 0.8369, + "step": 21644 + }, + { + "epoch": 0.55, + "learning_rate": 1.8767430219786918e-06, + "loss": 0.8809, + "step": 21645 + }, + { + "epoch": 0.55, + "learning_rate": 1.8767297132859455e-06, + "loss": 0.8184, + "step": 21646 + }, + { + "epoch": 0.55, + "learning_rate": 1.8767164039219275e-06, + "loss": 0.7427, + "step": 21647 + }, + { + "epoch": 0.55, + "learning_rate": 1.8767030938866477e-06, + "loss": 0.9551, + "step": 21648 + }, + { + "epoch": 0.55, + "learning_rate": 1.8766897831801172e-06, + "loss": 1.0088, + "step": 21649 + }, + { + "epoch": 0.55, + "learning_rate": 1.8766764718023452e-06, + "loss": 0.8333, + "step": 21650 + }, + { + "epoch": 0.55, + "learning_rate": 1.8766631597533429e-06, + "loss": 0.9014, + "step": 21651 + }, + { + "epoch": 0.55, + "learning_rate": 1.8766498470331197e-06, + "loss": 0.9395, + "step": 21652 + }, + { + "epoch": 0.55, + "learning_rate": 1.876636533641686e-06, + "loss": 0.624, + "step": 21653 + }, + { + "epoch": 0.56, + "learning_rate": 1.8766232195790516e-06, + "loss": 0.9619, + "step": 21654 + }, + { + "epoch": 0.56, + "learning_rate": 1.8766099048452278e-06, + "loss": 0.9453, + "step": 21655 + }, + { + "epoch": 0.56, + "learning_rate": 1.8765965894402235e-06, + "loss": 0.9043, + "step": 21656 + }, + { + "epoch": 0.56, + "learning_rate": 1.87658327336405e-06, + "loss": 0.8086, + "step": 21657 + }, + { + "epoch": 0.56, + "learning_rate": 1.8765699566167169e-06, + "loss": 0.5215, + "step": 21658 + }, + { + "epoch": 0.56, + "learning_rate": 1.8765566391982342e-06, + "loss": 0.8574, + "step": 21659 + }, + { + "epoch": 0.56, + "learning_rate": 1.8765433211086124e-06, + "loss": 1.1191, + "step": 21660 + }, + { + "epoch": 0.56, + "learning_rate": 1.8765300023478618e-06, + "loss": 0.8232, + "step": 21661 + }, + { + "epoch": 0.56, + "learning_rate": 1.8765166829159926e-06, + "loss": 1.0342, + "step": 21662 + }, + { + "epoch": 0.56, + "learning_rate": 1.8765033628130147e-06, + "loss": 0.9912, + "step": 21663 + }, + { + "epoch": 0.56, + "learning_rate": 1.8764900420389388e-06, + "loss": 0.7598, + "step": 21664 + }, + { + "epoch": 0.56, + "learning_rate": 1.8764767205937743e-06, + "loss": 0.9121, + "step": 21665 + }, + { + "epoch": 0.56, + "learning_rate": 1.8764633984775321e-06, + "loss": 0.7979, + "step": 21666 + }, + { + "epoch": 0.56, + "learning_rate": 1.8764500756902222e-06, + "loss": 0.7559, + "step": 21667 + }, + { + "epoch": 0.56, + "learning_rate": 1.876436752231855e-06, + "loss": 0.6274, + "step": 21668 + }, + { + "epoch": 0.56, + "learning_rate": 1.87642342810244e-06, + "loss": 0.8135, + "step": 21669 + }, + { + "epoch": 0.56, + "learning_rate": 1.876410103301988e-06, + "loss": 0.7661, + "step": 21670 + }, + { + "epoch": 0.56, + "learning_rate": 1.8763967778305095e-06, + "loss": 0.8428, + "step": 21671 + }, + { + "epoch": 0.56, + "learning_rate": 1.8763834516880139e-06, + "loss": 0.9521, + "step": 21672 + }, + { + "epoch": 0.56, + "learning_rate": 1.8763701248745122e-06, + "loss": 0.9199, + "step": 21673 + }, + { + "epoch": 0.56, + "learning_rate": 1.8763567973900136e-06, + "loss": 1.0752, + "step": 21674 + }, + { + "epoch": 0.56, + "learning_rate": 1.8763434692345292e-06, + "loss": 0.8896, + "step": 21675 + }, + { + "epoch": 0.56, + "learning_rate": 1.876330140408069e-06, + "loss": 0.7637, + "step": 21676 + }, + { + "epoch": 0.56, + "learning_rate": 1.876316810910643e-06, + "loss": 0.9678, + "step": 21677 + }, + { + "epoch": 0.56, + "learning_rate": 1.8763034807422616e-06, + "loss": 0.9736, + "step": 21678 + }, + { + "epoch": 0.56, + "learning_rate": 1.8762901499029345e-06, + "loss": 0.9961, + "step": 21679 + }, + { + "epoch": 0.56, + "learning_rate": 1.8762768183926727e-06, + "loss": 0.8877, + "step": 21680 + }, + { + "epoch": 0.56, + "learning_rate": 1.876263486211486e-06, + "loss": 0.6826, + "step": 21681 + }, + { + "epoch": 0.56, + "learning_rate": 1.8762501533593847e-06, + "loss": 0.8418, + "step": 21682 + }, + { + "epoch": 0.56, + "learning_rate": 1.8762368198363787e-06, + "loss": 1.0303, + "step": 21683 + }, + { + "epoch": 0.56, + "learning_rate": 1.8762234856424786e-06, + "loss": 0.8652, + "step": 21684 + }, + { + "epoch": 0.56, + "learning_rate": 1.8762101507776945e-06, + "loss": 0.8564, + "step": 21685 + }, + { + "epoch": 0.56, + "learning_rate": 1.8761968152420366e-06, + "loss": 0.7959, + "step": 21686 + }, + { + "epoch": 0.56, + "learning_rate": 1.8761834790355149e-06, + "loss": 0.7959, + "step": 21687 + }, + { + "epoch": 0.56, + "learning_rate": 1.87617014215814e-06, + "loss": 0.8223, + "step": 21688 + }, + { + "epoch": 0.56, + "learning_rate": 1.876156804609922e-06, + "loss": 1.0059, + "step": 21689 + }, + { + "epoch": 0.56, + "learning_rate": 1.8761434663908708e-06, + "loss": 0.8184, + "step": 21690 + }, + { + "epoch": 0.56, + "learning_rate": 1.876130127500997e-06, + "loss": 0.7988, + "step": 21691 + }, + { + "epoch": 0.56, + "learning_rate": 1.8761167879403103e-06, + "loss": 0.8252, + "step": 21692 + }, + { + "epoch": 0.56, + "learning_rate": 1.8761034477088216e-06, + "loss": 0.8682, + "step": 21693 + }, + { + "epoch": 0.56, + "learning_rate": 1.876090106806541e-06, + "loss": 0.7639, + "step": 21694 + }, + { + "epoch": 0.56, + "learning_rate": 1.876076765233478e-06, + "loss": 0.8359, + "step": 21695 + }, + { + "epoch": 0.56, + "learning_rate": 1.8760634229896434e-06, + "loss": 0.6909, + "step": 21696 + }, + { + "epoch": 0.56, + "learning_rate": 1.8760500800750476e-06, + "loss": 0.9463, + "step": 21697 + }, + { + "epoch": 0.56, + "learning_rate": 1.8760367364897002e-06, + "loss": 0.9424, + "step": 21698 + }, + { + "epoch": 0.56, + "learning_rate": 1.8760233922336117e-06, + "loss": 0.9795, + "step": 21699 + }, + { + "epoch": 0.56, + "learning_rate": 1.8760100473067928e-06, + "loss": 0.7959, + "step": 21700 + }, + { + "epoch": 0.56, + "learning_rate": 1.875996701709253e-06, + "loss": 1.1387, + "step": 21701 + }, + { + "epoch": 0.56, + "learning_rate": 1.875983355441003e-06, + "loss": 0.8311, + "step": 21702 + }, + { + "epoch": 0.56, + "learning_rate": 1.8759700085020525e-06, + "loss": 0.8491, + "step": 21703 + }, + { + "epoch": 0.56, + "learning_rate": 1.8759566608924121e-06, + "loss": 0.833, + "step": 21704 + }, + { + "epoch": 0.56, + "learning_rate": 1.8759433126120924e-06, + "loss": 0.6279, + "step": 21705 + }, + { + "epoch": 0.56, + "learning_rate": 1.8759299636611025e-06, + "loss": 0.7222, + "step": 21706 + }, + { + "epoch": 0.56, + "learning_rate": 1.875916614039454e-06, + "loss": 0.8877, + "step": 21707 + }, + { + "epoch": 0.56, + "learning_rate": 1.8759032637471559e-06, + "loss": 0.9854, + "step": 21708 + }, + { + "epoch": 0.56, + "learning_rate": 1.8758899127842193e-06, + "loss": 0.8867, + "step": 21709 + }, + { + "epoch": 0.56, + "learning_rate": 1.8758765611506538e-06, + "loss": 0.8496, + "step": 21710 + }, + { + "epoch": 0.56, + "learning_rate": 1.8758632088464702e-06, + "loss": 0.7158, + "step": 21711 + }, + { + "epoch": 0.56, + "learning_rate": 1.875849855871678e-06, + "loss": 0.6504, + "step": 21712 + }, + { + "epoch": 0.56, + "learning_rate": 1.875836502226288e-06, + "loss": 1.0166, + "step": 21713 + }, + { + "epoch": 0.56, + "learning_rate": 1.8758231479103102e-06, + "loss": 0.7002, + "step": 21714 + }, + { + "epoch": 0.56, + "learning_rate": 1.8758097929237551e-06, + "loss": 0.7446, + "step": 21715 + }, + { + "epoch": 0.56, + "learning_rate": 1.8757964372666326e-06, + "loss": 0.7471, + "step": 21716 + }, + { + "epoch": 0.56, + "learning_rate": 1.8757830809389529e-06, + "loss": 0.7871, + "step": 21717 + }, + { + "epoch": 0.56, + "learning_rate": 1.875769723940727e-06, + "loss": 0.7334, + "step": 21718 + }, + { + "epoch": 0.56, + "learning_rate": 1.8757563662719639e-06, + "loss": 0.9102, + "step": 21719 + }, + { + "epoch": 0.56, + "learning_rate": 1.8757430079326743e-06, + "loss": 0.9209, + "step": 21720 + }, + { + "epoch": 0.56, + "learning_rate": 1.875729648922869e-06, + "loss": 0.8564, + "step": 21721 + }, + { + "epoch": 0.56, + "learning_rate": 1.8757162892425574e-06, + "loss": 0.7959, + "step": 21722 + }, + { + "epoch": 0.56, + "learning_rate": 1.87570292889175e-06, + "loss": 0.7959, + "step": 21723 + }, + { + "epoch": 0.56, + "learning_rate": 1.8756895678704577e-06, + "loss": 0.79, + "step": 21724 + }, + { + "epoch": 0.56, + "learning_rate": 1.8756762061786896e-06, + "loss": 0.7646, + "step": 21725 + }, + { + "epoch": 0.56, + "learning_rate": 1.8756628438164568e-06, + "loss": 0.9121, + "step": 21726 + }, + { + "epoch": 0.56, + "learning_rate": 1.8756494807837693e-06, + "loss": 0.9272, + "step": 21727 + }, + { + "epoch": 0.56, + "learning_rate": 1.8756361170806372e-06, + "loss": 0.8252, + "step": 21728 + }, + { + "epoch": 0.56, + "learning_rate": 1.8756227527070705e-06, + "loss": 0.9863, + "step": 21729 + }, + { + "epoch": 0.56, + "learning_rate": 1.87560938766308e-06, + "loss": 0.9756, + "step": 21730 + }, + { + "epoch": 0.56, + "learning_rate": 1.8755960219486756e-06, + "loss": 0.7808, + "step": 21731 + }, + { + "epoch": 0.56, + "learning_rate": 1.8755826555638677e-06, + "loss": 0.7935, + "step": 21732 + }, + { + "epoch": 0.56, + "learning_rate": 1.875569288508666e-06, + "loss": 0.9531, + "step": 21733 + }, + { + "epoch": 0.56, + "learning_rate": 1.8755559207830816e-06, + "loss": 0.8379, + "step": 21734 + }, + { + "epoch": 0.56, + "learning_rate": 1.875542552387124e-06, + "loss": 0.9028, + "step": 21735 + }, + { + "epoch": 0.56, + "learning_rate": 1.875529183320804e-06, + "loss": 0.7847, + "step": 21736 + }, + { + "epoch": 0.56, + "learning_rate": 1.8755158135841315e-06, + "loss": 0.9043, + "step": 21737 + }, + { + "epoch": 0.56, + "learning_rate": 1.8755024431771167e-06, + "loss": 0.9248, + "step": 21738 + }, + { + "epoch": 0.56, + "learning_rate": 1.8754890720997697e-06, + "loss": 0.9082, + "step": 21739 + }, + { + "epoch": 0.56, + "learning_rate": 1.8754757003521012e-06, + "loss": 1.042, + "step": 21740 + }, + { + "epoch": 0.56, + "learning_rate": 1.8754623279341214e-06, + "loss": 0.8164, + "step": 21741 + }, + { + "epoch": 0.56, + "learning_rate": 1.87544895484584e-06, + "loss": 0.6768, + "step": 21742 + }, + { + "epoch": 0.56, + "learning_rate": 1.875435581087268e-06, + "loss": 0.9033, + "step": 21743 + }, + { + "epoch": 0.56, + "learning_rate": 1.8754222066584152e-06, + "loss": 0.9668, + "step": 21744 + }, + { + "epoch": 0.56, + "learning_rate": 1.8754088315592912e-06, + "loss": 0.9521, + "step": 21745 + }, + { + "epoch": 0.56, + "learning_rate": 1.8753954557899076e-06, + "loss": 0.897, + "step": 21746 + }, + { + "epoch": 0.56, + "learning_rate": 1.875382079350274e-06, + "loss": 0.6782, + "step": 21747 + }, + { + "epoch": 0.56, + "learning_rate": 1.8753687022404e-06, + "loss": 1.0049, + "step": 21748 + }, + { + "epoch": 0.56, + "learning_rate": 1.8753553244602968e-06, + "loss": 0.6343, + "step": 21749 + }, + { + "epoch": 0.56, + "learning_rate": 1.8753419460099744e-06, + "loss": 0.9561, + "step": 21750 + }, + { + "epoch": 0.56, + "learning_rate": 1.8753285668894428e-06, + "loss": 1.0439, + "step": 21751 + }, + { + "epoch": 0.56, + "learning_rate": 1.8753151870987124e-06, + "loss": 0.9238, + "step": 21752 + }, + { + "epoch": 0.56, + "learning_rate": 1.8753018066377932e-06, + "loss": 0.7559, + "step": 21753 + }, + { + "epoch": 0.56, + "learning_rate": 1.8752884255066959e-06, + "loss": 0.8516, + "step": 21754 + }, + { + "epoch": 0.56, + "learning_rate": 1.87527504370543e-06, + "loss": 0.707, + "step": 21755 + }, + { + "epoch": 0.56, + "learning_rate": 1.8752616612340068e-06, + "loss": 0.7368, + "step": 21756 + }, + { + "epoch": 0.56, + "learning_rate": 1.875248278092436e-06, + "loss": 0.6753, + "step": 21757 + }, + { + "epoch": 0.56, + "learning_rate": 1.8752348942807275e-06, + "loss": 0.5911, + "step": 21758 + }, + { + "epoch": 0.56, + "learning_rate": 1.875221509798892e-06, + "loss": 0.9795, + "step": 21759 + }, + { + "epoch": 0.56, + "learning_rate": 1.87520812464694e-06, + "loss": 0.9658, + "step": 21760 + }, + { + "epoch": 0.56, + "learning_rate": 1.8751947388248807e-06, + "loss": 0.7905, + "step": 21761 + }, + { + "epoch": 0.56, + "learning_rate": 1.8751813523327255e-06, + "loss": 0.8203, + "step": 21762 + }, + { + "epoch": 0.56, + "learning_rate": 1.8751679651704842e-06, + "loss": 0.5347, + "step": 21763 + }, + { + "epoch": 0.56, + "learning_rate": 1.875154577338167e-06, + "loss": 0.688, + "step": 21764 + }, + { + "epoch": 0.56, + "learning_rate": 1.8751411888357839e-06, + "loss": 0.8584, + "step": 21765 + }, + { + "epoch": 0.56, + "learning_rate": 1.8751277996633456e-06, + "loss": 0.7324, + "step": 21766 + }, + { + "epoch": 0.56, + "learning_rate": 1.8751144098208625e-06, + "loss": 0.9941, + "step": 21767 + }, + { + "epoch": 0.56, + "learning_rate": 1.8751010193083442e-06, + "loss": 0.874, + "step": 21768 + }, + { + "epoch": 0.56, + "learning_rate": 1.8750876281258012e-06, + "loss": 1.0684, + "step": 21769 + }, + { + "epoch": 0.56, + "learning_rate": 1.8750742362732441e-06, + "loss": 0.8022, + "step": 21770 + }, + { + "epoch": 0.56, + "learning_rate": 1.8750608437506827e-06, + "loss": 0.9463, + "step": 21771 + }, + { + "epoch": 0.56, + "learning_rate": 1.8750474505581276e-06, + "loss": 0.8555, + "step": 21772 + }, + { + "epoch": 0.56, + "learning_rate": 1.8750340566955889e-06, + "loss": 0.9023, + "step": 21773 + }, + { + "epoch": 0.56, + "learning_rate": 1.8750206621630765e-06, + "loss": 0.8955, + "step": 21774 + }, + { + "epoch": 0.56, + "learning_rate": 1.8750072669606014e-06, + "loss": 0.7666, + "step": 21775 + }, + { + "epoch": 0.56, + "learning_rate": 1.8749938710881733e-06, + "loss": 0.7463, + "step": 21776 + }, + { + "epoch": 0.56, + "learning_rate": 1.8749804745458028e-06, + "loss": 0.9541, + "step": 21777 + }, + { + "epoch": 0.56, + "learning_rate": 1.8749670773334997e-06, + "loss": 0.9268, + "step": 21778 + }, + { + "epoch": 0.56, + "learning_rate": 1.8749536794512749e-06, + "loss": 0.7129, + "step": 21779 + }, + { + "epoch": 0.56, + "learning_rate": 1.8749402808991382e-06, + "loss": 1.0439, + "step": 21780 + }, + { + "epoch": 0.56, + "learning_rate": 1.8749268816770995e-06, + "loss": 0.8643, + "step": 21781 + }, + { + "epoch": 0.56, + "learning_rate": 1.8749134817851702e-06, + "loss": 0.7402, + "step": 21782 + }, + { + "epoch": 0.56, + "learning_rate": 1.8749000812233592e-06, + "loss": 0.8203, + "step": 21783 + }, + { + "epoch": 0.56, + "learning_rate": 1.8748866799916781e-06, + "loss": 0.9102, + "step": 21784 + }, + { + "epoch": 0.56, + "learning_rate": 1.8748732780901363e-06, + "loss": 0.7747, + "step": 21785 + }, + { + "epoch": 0.56, + "learning_rate": 1.874859875518744e-06, + "loss": 0.8713, + "step": 21786 + }, + { + "epoch": 0.56, + "learning_rate": 1.874846472277512e-06, + "loss": 0.8906, + "step": 21787 + }, + { + "epoch": 0.56, + "learning_rate": 1.8748330683664499e-06, + "loss": 0.9756, + "step": 21788 + }, + { + "epoch": 0.56, + "learning_rate": 1.8748196637855687e-06, + "loss": 0.9414, + "step": 21789 + }, + { + "epoch": 0.56, + "learning_rate": 1.8748062585348783e-06, + "loss": 0.8955, + "step": 21790 + }, + { + "epoch": 0.56, + "learning_rate": 1.8747928526143887e-06, + "loss": 0.7876, + "step": 21791 + }, + { + "epoch": 0.56, + "learning_rate": 1.8747794460241106e-06, + "loss": 0.8652, + "step": 21792 + }, + { + "epoch": 0.56, + "learning_rate": 1.8747660387640543e-06, + "loss": 0.8193, + "step": 21793 + }, + { + "epoch": 0.56, + "learning_rate": 1.8747526308342296e-06, + "loss": 0.6855, + "step": 21794 + }, + { + "epoch": 0.56, + "learning_rate": 1.8747392222346472e-06, + "loss": 0.9785, + "step": 21795 + }, + { + "epoch": 0.56, + "learning_rate": 1.8747258129653171e-06, + "loss": 1.0693, + "step": 21796 + }, + { + "epoch": 0.56, + "learning_rate": 1.8747124030262498e-06, + "loss": 0.8535, + "step": 21797 + }, + { + "epoch": 0.56, + "learning_rate": 1.8746989924174553e-06, + "loss": 0.6416, + "step": 21798 + }, + { + "epoch": 0.56, + "learning_rate": 1.874685581138944e-06, + "loss": 0.9736, + "step": 21799 + }, + { + "epoch": 0.56, + "learning_rate": 1.8746721691907262e-06, + "loss": 0.7104, + "step": 21800 + }, + { + "epoch": 0.56, + "learning_rate": 1.874658756572812e-06, + "loss": 0.7036, + "step": 21801 + }, + { + "epoch": 0.56, + "learning_rate": 1.8746453432852122e-06, + "loss": 1.0107, + "step": 21802 + }, + { + "epoch": 0.56, + "learning_rate": 1.8746319293279363e-06, + "loss": 0.8096, + "step": 21803 + }, + { + "epoch": 0.56, + "learning_rate": 1.874618514700995e-06, + "loss": 0.9297, + "step": 21804 + }, + { + "epoch": 0.56, + "learning_rate": 1.8746050994043987e-06, + "loss": 0.8535, + "step": 21805 + }, + { + "epoch": 0.56, + "learning_rate": 1.8745916834381572e-06, + "loss": 0.6509, + "step": 21806 + }, + { + "epoch": 0.56, + "learning_rate": 1.8745782668022812e-06, + "loss": 0.8589, + "step": 21807 + }, + { + "epoch": 0.56, + "learning_rate": 1.8745648494967809e-06, + "loss": 0.9404, + "step": 21808 + }, + { + "epoch": 0.56, + "learning_rate": 1.8745514315216665e-06, + "loss": 0.7031, + "step": 21809 + }, + { + "epoch": 0.56, + "learning_rate": 1.8745380128769483e-06, + "loss": 0.8643, + "step": 21810 + }, + { + "epoch": 0.56, + "learning_rate": 1.8745245935626363e-06, + "loss": 0.7468, + "step": 21811 + }, + { + "epoch": 0.56, + "learning_rate": 1.8745111735787416e-06, + "loss": 0.9185, + "step": 21812 + }, + { + "epoch": 0.56, + "learning_rate": 1.8744977529252735e-06, + "loss": 1.001, + "step": 21813 + }, + { + "epoch": 0.56, + "learning_rate": 1.8744843316022428e-06, + "loss": 0.9277, + "step": 21814 + }, + { + "epoch": 0.56, + "learning_rate": 1.8744709096096596e-06, + "loss": 0.9521, + "step": 21815 + }, + { + "epoch": 0.56, + "learning_rate": 1.8744574869475342e-06, + "loss": 0.7705, + "step": 21816 + }, + { + "epoch": 0.56, + "learning_rate": 1.8744440636158769e-06, + "loss": 0.8892, + "step": 21817 + }, + { + "epoch": 0.56, + "learning_rate": 1.8744306396146978e-06, + "loss": 0.8281, + "step": 21818 + }, + { + "epoch": 0.56, + "learning_rate": 1.8744172149440076e-06, + "loss": 0.9395, + "step": 21819 + }, + { + "epoch": 0.56, + "learning_rate": 1.8744037896038164e-06, + "loss": 0.7339, + "step": 21820 + }, + { + "epoch": 0.56, + "learning_rate": 1.8743903635941344e-06, + "loss": 0.9414, + "step": 21821 + }, + { + "epoch": 0.56, + "learning_rate": 1.874376936914972e-06, + "loss": 0.8257, + "step": 21822 + }, + { + "epoch": 0.56, + "learning_rate": 1.874363509566339e-06, + "loss": 0.8672, + "step": 21823 + }, + { + "epoch": 0.56, + "learning_rate": 1.8743500815482464e-06, + "loss": 0.8174, + "step": 21824 + }, + { + "epoch": 0.56, + "learning_rate": 1.874336652860704e-06, + "loss": 1.0908, + "step": 21825 + }, + { + "epoch": 0.56, + "learning_rate": 1.8743232235037225e-06, + "loss": 0.7246, + "step": 21826 + }, + { + "epoch": 0.56, + "learning_rate": 1.8743097934773116e-06, + "loss": 0.8906, + "step": 21827 + }, + { + "epoch": 0.56, + "learning_rate": 1.874296362781482e-06, + "loss": 0.7573, + "step": 21828 + }, + { + "epoch": 0.56, + "learning_rate": 1.874282931416244e-06, + "loss": 0.9746, + "step": 21829 + }, + { + "epoch": 0.56, + "learning_rate": 1.8742694993816074e-06, + "loss": 0.8701, + "step": 21830 + }, + { + "epoch": 0.56, + "learning_rate": 1.8742560666775832e-06, + "loss": 1.0352, + "step": 21831 + }, + { + "epoch": 0.56, + "learning_rate": 1.8742426333041811e-06, + "loss": 1.0654, + "step": 21832 + }, + { + "epoch": 0.56, + "learning_rate": 1.8742291992614119e-06, + "loss": 0.8428, + "step": 21833 + }, + { + "epoch": 0.56, + "learning_rate": 1.8742157645492854e-06, + "loss": 0.7871, + "step": 21834 + }, + { + "epoch": 0.56, + "learning_rate": 1.874202329167812e-06, + "loss": 0.6426, + "step": 21835 + }, + { + "epoch": 0.56, + "learning_rate": 1.8741888931170022e-06, + "loss": 0.9688, + "step": 21836 + }, + { + "epoch": 0.56, + "learning_rate": 1.8741754563968662e-06, + "loss": 0.7607, + "step": 21837 + }, + { + "epoch": 0.56, + "learning_rate": 1.874162019007414e-06, + "loss": 0.7798, + "step": 21838 + }, + { + "epoch": 0.56, + "learning_rate": 1.8741485809486566e-06, + "loss": 0.9727, + "step": 21839 + }, + { + "epoch": 0.56, + "learning_rate": 1.8741351422206036e-06, + "loss": 0.7705, + "step": 21840 + }, + { + "epoch": 0.56, + "learning_rate": 1.8741217028232653e-06, + "loss": 1.1035, + "step": 21841 + }, + { + "epoch": 0.56, + "learning_rate": 1.8741082627566525e-06, + "loss": 0.7744, + "step": 21842 + }, + { + "epoch": 0.56, + "learning_rate": 1.8740948220207748e-06, + "loss": 1.1445, + "step": 21843 + }, + { + "epoch": 0.56, + "learning_rate": 1.8740813806156432e-06, + "loss": 0.853, + "step": 21844 + }, + { + "epoch": 0.56, + "learning_rate": 1.8740679385412677e-06, + "loss": 0.8228, + "step": 21845 + }, + { + "epoch": 0.56, + "learning_rate": 1.8740544957976585e-06, + "loss": 0.8154, + "step": 21846 + }, + { + "epoch": 0.56, + "learning_rate": 1.874041052384826e-06, + "loss": 1.0098, + "step": 21847 + }, + { + "epoch": 0.56, + "learning_rate": 1.8740276083027804e-06, + "loss": 0.8877, + "step": 21848 + }, + { + "epoch": 0.56, + "learning_rate": 1.8740141635515322e-06, + "loss": 0.9023, + "step": 21849 + }, + { + "epoch": 0.56, + "learning_rate": 1.8740007181310913e-06, + "loss": 0.8203, + "step": 21850 + }, + { + "epoch": 0.56, + "learning_rate": 1.8739872720414684e-06, + "loss": 1.001, + "step": 21851 + }, + { + "epoch": 0.56, + "learning_rate": 1.8739738252826735e-06, + "loss": 0.9277, + "step": 21852 + }, + { + "epoch": 0.56, + "learning_rate": 1.8739603778547171e-06, + "loss": 0.7656, + "step": 21853 + }, + { + "epoch": 0.56, + "learning_rate": 1.8739469297576096e-06, + "loss": 0.7334, + "step": 21854 + }, + { + "epoch": 0.56, + "learning_rate": 1.8739334809913609e-06, + "loss": 0.7251, + "step": 21855 + }, + { + "epoch": 0.56, + "learning_rate": 1.8739200315559813e-06, + "loss": 1.0234, + "step": 21856 + }, + { + "epoch": 0.56, + "learning_rate": 1.873906581451482e-06, + "loss": 1.0459, + "step": 21857 + }, + { + "epoch": 0.56, + "learning_rate": 1.873893130677872e-06, + "loss": 0.8848, + "step": 21858 + }, + { + "epoch": 0.56, + "learning_rate": 1.8738796792351622e-06, + "loss": 0.8008, + "step": 21859 + }, + { + "epoch": 0.56, + "learning_rate": 1.873866227123363e-06, + "loss": 0.8652, + "step": 21860 + }, + { + "epoch": 0.56, + "learning_rate": 1.873852774342485e-06, + "loss": 0.8477, + "step": 21861 + }, + { + "epoch": 0.56, + "learning_rate": 1.873839320892538e-06, + "loss": 0.8481, + "step": 21862 + }, + { + "epoch": 0.56, + "learning_rate": 1.873825866773532e-06, + "loss": 1.0488, + "step": 21863 + }, + { + "epoch": 0.56, + "learning_rate": 1.8738124119854781e-06, + "loss": 0.8184, + "step": 21864 + }, + { + "epoch": 0.56, + "learning_rate": 1.8737989565283861e-06, + "loss": 1.0703, + "step": 21865 + }, + { + "epoch": 0.56, + "learning_rate": 1.8737855004022664e-06, + "loss": 1.0859, + "step": 21866 + }, + { + "epoch": 0.56, + "learning_rate": 1.8737720436071294e-06, + "loss": 0.9346, + "step": 21867 + }, + { + "epoch": 0.56, + "learning_rate": 1.8737585861429852e-06, + "loss": 1.0479, + "step": 21868 + }, + { + "epoch": 0.56, + "learning_rate": 1.8737451280098444e-06, + "loss": 0.6582, + "step": 21869 + }, + { + "epoch": 0.56, + "learning_rate": 1.873731669207717e-06, + "loss": 0.8135, + "step": 21870 + }, + { + "epoch": 0.56, + "learning_rate": 1.8737182097366133e-06, + "loss": 0.9102, + "step": 21871 + }, + { + "epoch": 0.56, + "learning_rate": 1.8737047495965438e-06, + "loss": 0.9336, + "step": 21872 + }, + { + "epoch": 0.56, + "learning_rate": 1.8736912887875188e-06, + "loss": 0.9053, + "step": 21873 + }, + { + "epoch": 0.56, + "learning_rate": 1.873677827309549e-06, + "loss": 0.9395, + "step": 21874 + }, + { + "epoch": 0.56, + "learning_rate": 1.8736643651626436e-06, + "loss": 0.8398, + "step": 21875 + }, + { + "epoch": 0.56, + "learning_rate": 1.8736509023468138e-06, + "loss": 1.0361, + "step": 21876 + }, + { + "epoch": 0.56, + "learning_rate": 1.8736374388620697e-06, + "loss": 0.8145, + "step": 21877 + }, + { + "epoch": 0.56, + "learning_rate": 1.8736239747084218e-06, + "loss": 0.7725, + "step": 21878 + }, + { + "epoch": 0.56, + "learning_rate": 1.8736105098858798e-06, + "loss": 0.9502, + "step": 21879 + }, + { + "epoch": 0.56, + "learning_rate": 1.8735970443944544e-06, + "loss": 0.865, + "step": 21880 + }, + { + "epoch": 0.56, + "learning_rate": 1.8735835782341562e-06, + "loss": 0.7324, + "step": 21881 + }, + { + "epoch": 0.56, + "learning_rate": 1.8735701114049953e-06, + "loss": 0.7397, + "step": 21882 + }, + { + "epoch": 0.56, + "learning_rate": 1.8735566439069816e-06, + "loss": 0.7925, + "step": 21883 + }, + { + "epoch": 0.56, + "learning_rate": 1.873543175740126e-06, + "loss": 0.8584, + "step": 21884 + }, + { + "epoch": 0.56, + "learning_rate": 1.8735297069044384e-06, + "loss": 0.853, + "step": 21885 + }, + { + "epoch": 0.56, + "learning_rate": 1.8735162373999294e-06, + "loss": 0.876, + "step": 21886 + }, + { + "epoch": 0.56, + "learning_rate": 1.873502767226609e-06, + "loss": 0.665, + "step": 21887 + }, + { + "epoch": 0.56, + "learning_rate": 1.8734892963844878e-06, + "loss": 1.0098, + "step": 21888 + }, + { + "epoch": 0.56, + "learning_rate": 1.8734758248735761e-06, + "loss": 0.7856, + "step": 21889 + }, + { + "epoch": 0.56, + "learning_rate": 1.8734623526938838e-06, + "loss": 0.9043, + "step": 21890 + }, + { + "epoch": 0.56, + "learning_rate": 1.8734488798454218e-06, + "loss": 0.6648, + "step": 21891 + }, + { + "epoch": 0.56, + "learning_rate": 1.8734354063282e-06, + "loss": 0.9844, + "step": 21892 + }, + { + "epoch": 0.56, + "learning_rate": 1.8734219321422292e-06, + "loss": 0.7812, + "step": 21893 + }, + { + "epoch": 0.56, + "learning_rate": 1.873408457287519e-06, + "loss": 0.8154, + "step": 21894 + }, + { + "epoch": 0.56, + "learning_rate": 1.8733949817640803e-06, + "loss": 0.9248, + "step": 21895 + }, + { + "epoch": 0.56, + "learning_rate": 1.873381505571923e-06, + "loss": 0.9863, + "step": 21896 + }, + { + "epoch": 0.56, + "learning_rate": 1.873368028711058e-06, + "loss": 0.8252, + "step": 21897 + }, + { + "epoch": 0.56, + "learning_rate": 1.8733545511814951e-06, + "loss": 0.9941, + "step": 21898 + }, + { + "epoch": 0.56, + "learning_rate": 1.873341072983245e-06, + "loss": 0.7036, + "step": 21899 + }, + { + "epoch": 0.56, + "learning_rate": 1.8733275941163176e-06, + "loss": 0.6963, + "step": 21900 + }, + { + "epoch": 0.56, + "learning_rate": 1.8733141145807231e-06, + "loss": 0.7026, + "step": 21901 + }, + { + "epoch": 0.56, + "learning_rate": 1.8733006343764726e-06, + "loss": 0.6218, + "step": 21902 + }, + { + "epoch": 0.56, + "learning_rate": 1.873287153503576e-06, + "loss": 0.6689, + "step": 21903 + }, + { + "epoch": 0.56, + "learning_rate": 1.8732736719620433e-06, + "loss": 0.8091, + "step": 21904 + }, + { + "epoch": 0.56, + "learning_rate": 1.873260189751885e-06, + "loss": 0.5986, + "step": 21905 + }, + { + "epoch": 0.56, + "learning_rate": 1.873246706873112e-06, + "loss": 0.9902, + "step": 21906 + }, + { + "epoch": 0.56, + "learning_rate": 1.8732332233257338e-06, + "loss": 0.7305, + "step": 21907 + }, + { + "epoch": 0.56, + "learning_rate": 1.8732197391097611e-06, + "loss": 0.8721, + "step": 21908 + }, + { + "epoch": 0.56, + "learning_rate": 1.873206254225204e-06, + "loss": 0.8857, + "step": 21909 + }, + { + "epoch": 0.56, + "learning_rate": 1.8731927686720734e-06, + "loss": 0.7979, + "step": 21910 + }, + { + "epoch": 0.56, + "learning_rate": 1.873179282450379e-06, + "loss": 0.8916, + "step": 21911 + }, + { + "epoch": 0.56, + "learning_rate": 1.8731657955601315e-06, + "loss": 0.9048, + "step": 21912 + }, + { + "epoch": 0.56, + "learning_rate": 1.873152308001341e-06, + "loss": 0.7129, + "step": 21913 + }, + { + "epoch": 0.56, + "learning_rate": 1.873138819774018e-06, + "loss": 0.6841, + "step": 21914 + }, + { + "epoch": 0.56, + "learning_rate": 1.8731253308781727e-06, + "loss": 0.7896, + "step": 21915 + }, + { + "epoch": 0.56, + "learning_rate": 1.8731118413138155e-06, + "loss": 0.9531, + "step": 21916 + }, + { + "epoch": 0.56, + "learning_rate": 1.8730983510809568e-06, + "loss": 1.1533, + "step": 21917 + }, + { + "epoch": 0.56, + "learning_rate": 1.873084860179607e-06, + "loss": 0.9199, + "step": 21918 + }, + { + "epoch": 0.56, + "learning_rate": 1.8730713686097759e-06, + "loss": 0.8164, + "step": 21919 + }, + { + "epoch": 0.56, + "learning_rate": 1.8730578763714743e-06, + "loss": 0.8213, + "step": 21920 + }, + { + "epoch": 0.56, + "learning_rate": 1.8730443834647124e-06, + "loss": 0.9521, + "step": 21921 + }, + { + "epoch": 0.56, + "learning_rate": 1.8730308898895007e-06, + "loss": 0.8301, + "step": 21922 + }, + { + "epoch": 0.56, + "learning_rate": 1.8730173956458493e-06, + "loss": 0.9717, + "step": 21923 + }, + { + "epoch": 0.56, + "learning_rate": 1.8730039007337688e-06, + "loss": 0.8389, + "step": 21924 + }, + { + "epoch": 0.56, + "learning_rate": 1.8729904051532693e-06, + "loss": 0.8447, + "step": 21925 + }, + { + "epoch": 0.56, + "learning_rate": 1.872976908904361e-06, + "loss": 0.918, + "step": 21926 + }, + { + "epoch": 0.56, + "learning_rate": 1.8729634119870545e-06, + "loss": 0.8062, + "step": 21927 + }, + { + "epoch": 0.56, + "learning_rate": 1.8729499144013601e-06, + "loss": 0.9365, + "step": 21928 + }, + { + "epoch": 0.56, + "learning_rate": 1.8729364161472879e-06, + "loss": 0.8613, + "step": 21929 + }, + { + "epoch": 0.56, + "learning_rate": 1.8729229172248486e-06, + "loss": 0.9189, + "step": 21930 + }, + { + "epoch": 0.56, + "learning_rate": 1.8729094176340523e-06, + "loss": 0.8682, + "step": 21931 + }, + { + "epoch": 0.56, + "learning_rate": 1.8728959173749095e-06, + "loss": 0.8867, + "step": 21932 + }, + { + "epoch": 0.56, + "learning_rate": 1.8728824164474304e-06, + "loss": 0.7217, + "step": 21933 + }, + { + "epoch": 0.56, + "learning_rate": 1.8728689148516256e-06, + "loss": 0.7026, + "step": 21934 + }, + { + "epoch": 0.56, + "learning_rate": 1.8728554125875047e-06, + "loss": 0.7588, + "step": 21935 + }, + { + "epoch": 0.56, + "learning_rate": 1.8728419096550787e-06, + "loss": 0.8149, + "step": 21936 + }, + { + "epoch": 0.56, + "learning_rate": 1.8728284060543577e-06, + "loss": 1.0078, + "step": 21937 + }, + { + "epoch": 0.56, + "learning_rate": 1.8728149017853525e-06, + "loss": 0.7783, + "step": 21938 + }, + { + "epoch": 0.56, + "learning_rate": 1.872801396848073e-06, + "loss": 0.7637, + "step": 21939 + }, + { + "epoch": 0.56, + "learning_rate": 1.8727878912425291e-06, + "loss": 1.0117, + "step": 21940 + }, + { + "epoch": 0.56, + "learning_rate": 1.8727743849687322e-06, + "loss": 1.0352, + "step": 21941 + }, + { + "epoch": 0.56, + "learning_rate": 1.872760878026692e-06, + "loss": 0.5376, + "step": 21942 + }, + { + "epoch": 0.56, + "learning_rate": 1.8727473704164187e-06, + "loss": 0.9297, + "step": 21943 + }, + { + "epoch": 0.56, + "learning_rate": 1.872733862137923e-06, + "loss": 0.959, + "step": 21944 + }, + { + "epoch": 0.56, + "learning_rate": 1.872720353191215e-06, + "loss": 0.8818, + "step": 21945 + }, + { + "epoch": 0.56, + "learning_rate": 1.8727068435763056e-06, + "loss": 1.0898, + "step": 21946 + }, + { + "epoch": 0.56, + "learning_rate": 1.8726933332932042e-06, + "loss": 0.9082, + "step": 21947 + }, + { + "epoch": 0.56, + "learning_rate": 1.8726798223419217e-06, + "loss": 0.9922, + "step": 21948 + }, + { + "epoch": 0.56, + "learning_rate": 1.8726663107224688e-06, + "loss": 0.7046, + "step": 21949 + }, + { + "epoch": 0.56, + "learning_rate": 1.872652798434855e-06, + "loss": 0.8535, + "step": 21950 + }, + { + "epoch": 0.56, + "learning_rate": 1.8726392854790911e-06, + "loss": 0.9531, + "step": 21951 + }, + { + "epoch": 0.56, + "learning_rate": 1.8726257718551874e-06, + "loss": 0.686, + "step": 21952 + }, + { + "epoch": 0.56, + "learning_rate": 1.8726122575631545e-06, + "loss": 0.8086, + "step": 21953 + }, + { + "epoch": 0.56, + "learning_rate": 1.8725987426030023e-06, + "loss": 0.9136, + "step": 21954 + }, + { + "epoch": 0.56, + "learning_rate": 1.8725852269747414e-06, + "loss": 0.7715, + "step": 21955 + }, + { + "epoch": 0.56, + "learning_rate": 1.8725717106783823e-06, + "loss": 0.8711, + "step": 21956 + }, + { + "epoch": 0.56, + "learning_rate": 1.872558193713935e-06, + "loss": 0.8623, + "step": 21957 + }, + { + "epoch": 0.56, + "learning_rate": 1.8725446760814102e-06, + "loss": 1.0107, + "step": 21958 + }, + { + "epoch": 0.56, + "learning_rate": 1.8725311577808177e-06, + "loss": 0.7178, + "step": 21959 + }, + { + "epoch": 0.56, + "learning_rate": 1.8725176388121685e-06, + "loss": 0.9463, + "step": 21960 + }, + { + "epoch": 0.56, + "learning_rate": 1.8725041191754727e-06, + "loss": 0.7515, + "step": 21961 + }, + { + "epoch": 0.56, + "learning_rate": 1.8724905988707404e-06, + "loss": 0.9155, + "step": 21962 + }, + { + "epoch": 0.56, + "learning_rate": 1.8724770778979824e-06, + "loss": 0.9316, + "step": 21963 + }, + { + "epoch": 0.56, + "learning_rate": 1.8724635562572086e-06, + "loss": 1.0107, + "step": 21964 + }, + { + "epoch": 0.56, + "learning_rate": 1.8724500339484298e-06, + "loss": 0.8066, + "step": 21965 + }, + { + "epoch": 0.56, + "learning_rate": 1.872436510971656e-06, + "loss": 0.7227, + "step": 21966 + }, + { + "epoch": 0.56, + "learning_rate": 1.8724229873268977e-06, + "loss": 0.8105, + "step": 21967 + }, + { + "epoch": 0.56, + "learning_rate": 1.8724094630141651e-06, + "loss": 0.8438, + "step": 21968 + }, + { + "epoch": 0.56, + "learning_rate": 1.8723959380334688e-06, + "loss": 0.9834, + "step": 21969 + }, + { + "epoch": 0.56, + "learning_rate": 1.8723824123848191e-06, + "loss": 0.8174, + "step": 21970 + }, + { + "epoch": 0.56, + "learning_rate": 1.872368886068226e-06, + "loss": 0.6421, + "step": 21971 + }, + { + "epoch": 0.56, + "learning_rate": 1.8723553590837006e-06, + "loss": 0.8633, + "step": 21972 + }, + { + "epoch": 0.56, + "learning_rate": 1.8723418314312527e-06, + "loss": 0.9385, + "step": 21973 + }, + { + "epoch": 0.56, + "learning_rate": 1.8723283031108928e-06, + "loss": 1.0205, + "step": 21974 + }, + { + "epoch": 0.56, + "learning_rate": 1.8723147741226308e-06, + "loss": 0.7114, + "step": 21975 + }, + { + "epoch": 0.56, + "learning_rate": 1.872301244466478e-06, + "loss": 0.9854, + "step": 21976 + }, + { + "epoch": 0.56, + "learning_rate": 1.8722877141424438e-06, + "loss": 0.9746, + "step": 21977 + }, + { + "epoch": 0.56, + "learning_rate": 1.8722741831505395e-06, + "loss": 0.8306, + "step": 21978 + }, + { + "epoch": 0.56, + "learning_rate": 1.8722606514907746e-06, + "loss": 0.7222, + "step": 21979 + }, + { + "epoch": 0.56, + "learning_rate": 1.87224711916316e-06, + "loss": 0.8906, + "step": 21980 + }, + { + "epoch": 0.56, + "learning_rate": 1.8722335861677059e-06, + "loss": 0.7104, + "step": 21981 + }, + { + "epoch": 0.56, + "learning_rate": 1.8722200525044225e-06, + "loss": 0.7979, + "step": 21982 + }, + { + "epoch": 0.56, + "learning_rate": 1.8722065181733205e-06, + "loss": 0.8916, + "step": 21983 + }, + { + "epoch": 0.56, + "learning_rate": 1.87219298317441e-06, + "loss": 0.8643, + "step": 21984 + }, + { + "epoch": 0.56, + "learning_rate": 1.872179447507701e-06, + "loss": 0.8916, + "step": 21985 + }, + { + "epoch": 0.56, + "learning_rate": 1.8721659111732048e-06, + "loss": 0.8066, + "step": 21986 + }, + { + "epoch": 0.56, + "learning_rate": 1.8721523741709313e-06, + "loss": 0.8643, + "step": 21987 + }, + { + "epoch": 0.56, + "learning_rate": 1.8721388365008907e-06, + "loss": 0.8623, + "step": 21988 + }, + { + "epoch": 0.56, + "learning_rate": 1.8721252981630936e-06, + "loss": 0.8916, + "step": 21989 + }, + { + "epoch": 0.56, + "learning_rate": 1.8721117591575499e-06, + "loss": 0.9102, + "step": 21990 + }, + { + "epoch": 0.56, + "learning_rate": 1.8720982194842708e-06, + "loss": 1.0254, + "step": 21991 + }, + { + "epoch": 0.56, + "learning_rate": 1.8720846791432661e-06, + "loss": 0.6924, + "step": 21992 + }, + { + "epoch": 0.56, + "learning_rate": 1.872071138134546e-06, + "loss": 0.9307, + "step": 21993 + }, + { + "epoch": 0.56, + "learning_rate": 1.8720575964581213e-06, + "loss": 0.7432, + "step": 21994 + }, + { + "epoch": 0.56, + "learning_rate": 1.872044054114002e-06, + "loss": 0.8452, + "step": 21995 + }, + { + "epoch": 0.56, + "learning_rate": 1.8720305111021988e-06, + "loss": 0.9365, + "step": 21996 + }, + { + "epoch": 0.56, + "learning_rate": 1.8720169674227222e-06, + "loss": 0.6768, + "step": 21997 + }, + { + "epoch": 0.56, + "learning_rate": 1.8720034230755819e-06, + "loss": 0.9512, + "step": 21998 + }, + { + "epoch": 0.56, + "learning_rate": 1.8719898780607888e-06, + "loss": 0.7295, + "step": 21999 + }, + { + "epoch": 0.56, + "learning_rate": 1.8719763323783533e-06, + "loss": 0.918, + "step": 22000 + }, + { + "epoch": 0.56, + "learning_rate": 1.8719627860282853e-06, + "loss": 0.7349, + "step": 22001 + }, + { + "epoch": 0.56, + "learning_rate": 1.8719492390105958e-06, + "loss": 0.7168, + "step": 22002 + }, + { + "epoch": 0.56, + "learning_rate": 1.8719356913252947e-06, + "loss": 0.8135, + "step": 22003 + }, + { + "epoch": 0.56, + "learning_rate": 1.8719221429723926e-06, + "loss": 1.0957, + "step": 22004 + }, + { + "epoch": 0.56, + "learning_rate": 1.8719085939518998e-06, + "loss": 0.8223, + "step": 22005 + }, + { + "epoch": 0.56, + "learning_rate": 1.8718950442638267e-06, + "loss": 0.8721, + "step": 22006 + }, + { + "epoch": 0.56, + "learning_rate": 1.8718814939081838e-06, + "loss": 0.7334, + "step": 22007 + }, + { + "epoch": 0.56, + "learning_rate": 1.871867942884981e-06, + "loss": 1.1416, + "step": 22008 + }, + { + "epoch": 0.56, + "learning_rate": 1.8718543911942292e-06, + "loss": 0.9043, + "step": 22009 + }, + { + "epoch": 0.56, + "learning_rate": 1.8718408388359386e-06, + "loss": 0.8086, + "step": 22010 + }, + { + "epoch": 0.56, + "learning_rate": 1.8718272858101197e-06, + "loss": 0.916, + "step": 22011 + }, + { + "epoch": 0.56, + "learning_rate": 1.8718137321167822e-06, + "loss": 0.7222, + "step": 22012 + }, + { + "epoch": 0.56, + "learning_rate": 1.8718001777559374e-06, + "loss": 0.9092, + "step": 22013 + }, + { + "epoch": 0.56, + "learning_rate": 1.8717866227275954e-06, + "loss": 1.001, + "step": 22014 + }, + { + "epoch": 0.56, + "learning_rate": 1.8717730670317661e-06, + "loss": 0.8887, + "step": 22015 + }, + { + "epoch": 0.56, + "learning_rate": 1.8717595106684607e-06, + "loss": 0.9512, + "step": 22016 + }, + { + "epoch": 0.56, + "learning_rate": 1.8717459536376887e-06, + "loss": 0.8945, + "step": 22017 + }, + { + "epoch": 0.56, + "learning_rate": 1.871732395939461e-06, + "loss": 0.9131, + "step": 22018 + }, + { + "epoch": 0.56, + "learning_rate": 1.871718837573788e-06, + "loss": 0.9004, + "step": 22019 + }, + { + "epoch": 0.56, + "learning_rate": 1.87170527854068e-06, + "loss": 0.9697, + "step": 22020 + }, + { + "epoch": 0.56, + "learning_rate": 1.8716917188401472e-06, + "loss": 0.7529, + "step": 22021 + }, + { + "epoch": 0.56, + "learning_rate": 1.8716781584722003e-06, + "loss": 0.8564, + "step": 22022 + }, + { + "epoch": 0.56, + "learning_rate": 1.8716645974368496e-06, + "loss": 1.0176, + "step": 22023 + }, + { + "epoch": 0.56, + "learning_rate": 1.8716510357341054e-06, + "loss": 0.9297, + "step": 22024 + }, + { + "epoch": 0.56, + "learning_rate": 1.8716374733639778e-06, + "loss": 0.9336, + "step": 22025 + }, + { + "epoch": 0.56, + "learning_rate": 1.8716239103264775e-06, + "loss": 0.8994, + "step": 22026 + }, + { + "epoch": 0.56, + "learning_rate": 1.8716103466216149e-06, + "loss": 0.8623, + "step": 22027 + }, + { + "epoch": 0.56, + "learning_rate": 1.8715967822494006e-06, + "loss": 0.9473, + "step": 22028 + }, + { + "epoch": 0.56, + "learning_rate": 1.8715832172098444e-06, + "loss": 0.812, + "step": 22029 + }, + { + "epoch": 0.56, + "learning_rate": 1.8715696515029569e-06, + "loss": 1.1758, + "step": 22030 + }, + { + "epoch": 0.56, + "learning_rate": 1.8715560851287488e-06, + "loss": 0.8369, + "step": 22031 + }, + { + "epoch": 0.56, + "learning_rate": 1.8715425180872305e-06, + "loss": 0.8486, + "step": 22032 + }, + { + "epoch": 0.56, + "learning_rate": 1.871528950378412e-06, + "loss": 0.9531, + "step": 22033 + }, + { + "epoch": 0.56, + "learning_rate": 1.8715153820023038e-06, + "loss": 0.7598, + "step": 22034 + }, + { + "epoch": 0.56, + "learning_rate": 1.8715018129589163e-06, + "loss": 0.9414, + "step": 22035 + }, + { + "epoch": 0.56, + "learning_rate": 1.8714882432482599e-06, + "loss": 1.0293, + "step": 22036 + }, + { + "epoch": 0.56, + "learning_rate": 1.8714746728703452e-06, + "loss": 0.5029, + "step": 22037 + }, + { + "epoch": 0.56, + "learning_rate": 1.8714611018251823e-06, + "loss": 0.8906, + "step": 22038 + }, + { + "epoch": 0.56, + "learning_rate": 1.8714475301127816e-06, + "loss": 1.002, + "step": 22039 + }, + { + "epoch": 0.56, + "learning_rate": 1.8714339577331536e-06, + "loss": 1.0703, + "step": 22040 + }, + { + "epoch": 0.56, + "learning_rate": 1.8714203846863091e-06, + "loss": 0.4277, + "step": 22041 + }, + { + "epoch": 0.56, + "learning_rate": 1.8714068109722576e-06, + "loss": 0.7593, + "step": 22042 + }, + { + "epoch": 0.56, + "learning_rate": 1.8713932365910103e-06, + "loss": 1.1074, + "step": 22043 + }, + { + "epoch": 0.56, + "learning_rate": 1.8713796615425771e-06, + "loss": 1.0469, + "step": 22044 + }, + { + "epoch": 0.57, + "learning_rate": 1.8713660858269687e-06, + "loss": 0.9258, + "step": 22045 + }, + { + "epoch": 0.57, + "learning_rate": 1.871352509444195e-06, + "loss": 1.0449, + "step": 22046 + }, + { + "epoch": 0.57, + "learning_rate": 1.8713389323942671e-06, + "loss": 0.832, + "step": 22047 + }, + { + "epoch": 0.57, + "learning_rate": 1.871325354677195e-06, + "loss": 0.7603, + "step": 22048 + }, + { + "epoch": 0.57, + "learning_rate": 1.871311776292989e-06, + "loss": 0.8867, + "step": 22049 + }, + { + "epoch": 0.57, + "learning_rate": 1.8712981972416597e-06, + "loss": 0.801, + "step": 22050 + }, + { + "epoch": 0.57, + "learning_rate": 1.8712846175232175e-06, + "loss": 0.6467, + "step": 22051 + }, + { + "epoch": 0.57, + "learning_rate": 1.8712710371376728e-06, + "loss": 0.9678, + "step": 22052 + }, + { + "epoch": 0.57, + "learning_rate": 1.8712574560850358e-06, + "loss": 0.8604, + "step": 22053 + }, + { + "epoch": 0.57, + "learning_rate": 1.8712438743653171e-06, + "loss": 0.8887, + "step": 22054 + }, + { + "epoch": 0.57, + "learning_rate": 1.8712302919785268e-06, + "loss": 1.0322, + "step": 22055 + }, + { + "epoch": 0.57, + "learning_rate": 1.8712167089246758e-06, + "loss": 0.7305, + "step": 22056 + }, + { + "epoch": 0.57, + "learning_rate": 1.871203125203774e-06, + "loss": 0.9746, + "step": 22057 + }, + { + "epoch": 0.57, + "learning_rate": 1.8711895408158322e-06, + "loss": 0.9097, + "step": 22058 + }, + { + "epoch": 0.57, + "learning_rate": 1.8711759557608606e-06, + "loss": 0.8862, + "step": 22059 + }, + { + "epoch": 0.57, + "learning_rate": 1.8711623700388698e-06, + "loss": 0.9014, + "step": 22060 + }, + { + "epoch": 0.57, + "learning_rate": 1.8711487836498695e-06, + "loss": 0.8369, + "step": 22061 + }, + { + "epoch": 0.57, + "learning_rate": 1.871135196593871e-06, + "loss": 0.9951, + "step": 22062 + }, + { + "epoch": 0.57, + "learning_rate": 1.8711216088708843e-06, + "loss": 0.687, + "step": 22063 + }, + { + "epoch": 0.57, + "learning_rate": 1.87110802048092e-06, + "loss": 1.1035, + "step": 22064 + }, + { + "epoch": 0.57, + "learning_rate": 1.8710944314239883e-06, + "loss": 0.9561, + "step": 22065 + }, + { + "epoch": 0.57, + "learning_rate": 1.8710808417000994e-06, + "loss": 0.6362, + "step": 22066 + }, + { + "epoch": 0.57, + "learning_rate": 1.871067251309264e-06, + "loss": 1.0127, + "step": 22067 + }, + { + "epoch": 0.57, + "learning_rate": 1.8710536602514926e-06, + "loss": 0.7266, + "step": 22068 + }, + { + "epoch": 0.57, + "learning_rate": 1.8710400685267955e-06, + "loss": 0.9541, + "step": 22069 + }, + { + "epoch": 0.57, + "learning_rate": 1.871026476135183e-06, + "loss": 0.7617, + "step": 22070 + }, + { + "epoch": 0.57, + "learning_rate": 1.8710128830766654e-06, + "loss": 0.876, + "step": 22071 + }, + { + "epoch": 0.57, + "learning_rate": 1.8709992893512534e-06, + "loss": 0.8779, + "step": 22072 + }, + { + "epoch": 0.57, + "learning_rate": 1.8709856949589575e-06, + "loss": 1.0625, + "step": 22073 + }, + { + "epoch": 0.57, + "learning_rate": 1.8709720998997875e-06, + "loss": 0.9219, + "step": 22074 + }, + { + "epoch": 0.57, + "learning_rate": 1.8709585041737546e-06, + "loss": 0.8672, + "step": 22075 + }, + { + "epoch": 0.57, + "learning_rate": 1.8709449077808688e-06, + "loss": 0.7842, + "step": 22076 + }, + { + "epoch": 0.57, + "learning_rate": 1.8709313107211404e-06, + "loss": 0.9648, + "step": 22077 + }, + { + "epoch": 0.57, + "learning_rate": 1.8709177129945798e-06, + "loss": 0.8457, + "step": 22078 + }, + { + "epoch": 0.57, + "learning_rate": 1.8709041146011978e-06, + "loss": 0.8174, + "step": 22079 + }, + { + "epoch": 0.57, + "learning_rate": 1.8708905155410041e-06, + "loss": 0.7178, + "step": 22080 + }, + { + "epoch": 0.57, + "learning_rate": 1.8708769158140103e-06, + "loss": 0.7578, + "step": 22081 + }, + { + "epoch": 0.57, + "learning_rate": 1.8708633154202255e-06, + "loss": 0.8271, + "step": 22082 + }, + { + "epoch": 0.57, + "learning_rate": 1.870849714359661e-06, + "loss": 0.958, + "step": 22083 + }, + { + "epoch": 0.57, + "learning_rate": 1.870836112632327e-06, + "loss": 0.7837, + "step": 22084 + }, + { + "epoch": 0.57, + "learning_rate": 1.8708225102382336e-06, + "loss": 0.8662, + "step": 22085 + }, + { + "epoch": 0.57, + "learning_rate": 1.8708089071773915e-06, + "loss": 0.7705, + "step": 22086 + }, + { + "epoch": 0.57, + "learning_rate": 1.870795303449811e-06, + "loss": 0.9795, + "step": 22087 + }, + { + "epoch": 0.57, + "learning_rate": 1.8707816990555028e-06, + "loss": 0.7676, + "step": 22088 + }, + { + "epoch": 0.57, + "learning_rate": 1.870768093994477e-06, + "loss": 0.8203, + "step": 22089 + }, + { + "epoch": 0.57, + "learning_rate": 1.870754488266744e-06, + "loss": 0.7705, + "step": 22090 + }, + { + "epoch": 0.57, + "learning_rate": 1.8707408818723142e-06, + "loss": 0.5649, + "step": 22091 + }, + { + "epoch": 0.57, + "learning_rate": 1.8707272748111984e-06, + "loss": 0.8105, + "step": 22092 + }, + { + "epoch": 0.57, + "learning_rate": 1.8707136670834068e-06, + "loss": 0.6445, + "step": 22093 + }, + { + "epoch": 0.57, + "learning_rate": 1.8707000586889496e-06, + "loss": 0.9785, + "step": 22094 + }, + { + "epoch": 0.57, + "learning_rate": 1.8706864496278376e-06, + "loss": 0.9648, + "step": 22095 + }, + { + "epoch": 0.57, + "learning_rate": 1.870672839900081e-06, + "loss": 0.4937, + "step": 22096 + }, + { + "epoch": 0.57, + "learning_rate": 1.8706592295056898e-06, + "loss": 0.9648, + "step": 22097 + }, + { + "epoch": 0.57, + "learning_rate": 1.8706456184446756e-06, + "loss": 0.8506, + "step": 22098 + }, + { + "epoch": 0.57, + "learning_rate": 1.8706320067170473e-06, + "loss": 0.792, + "step": 22099 + }, + { + "epoch": 0.57, + "learning_rate": 1.8706183943228167e-06, + "loss": 1.0508, + "step": 22100 + }, + { + "epoch": 0.57, + "learning_rate": 1.8706047812619934e-06, + "loss": 0.7983, + "step": 22101 + }, + { + "epoch": 0.57, + "learning_rate": 1.870591167534588e-06, + "loss": 0.8364, + "step": 22102 + }, + { + "epoch": 0.57, + "learning_rate": 1.870577553140611e-06, + "loss": 0.9121, + "step": 22103 + }, + { + "epoch": 0.57, + "learning_rate": 1.8705639380800728e-06, + "loss": 0.8633, + "step": 22104 + }, + { + "epoch": 0.57, + "learning_rate": 1.870550322352984e-06, + "loss": 0.9531, + "step": 22105 + }, + { + "epoch": 0.57, + "learning_rate": 1.8705367059593546e-06, + "loss": 1.1504, + "step": 22106 + }, + { + "epoch": 0.57, + "learning_rate": 1.8705230888991954e-06, + "loss": 0.8506, + "step": 22107 + }, + { + "epoch": 0.57, + "learning_rate": 1.8705094711725168e-06, + "loss": 0.9951, + "step": 22108 + }, + { + "epoch": 0.57, + "learning_rate": 1.8704958527793289e-06, + "loss": 0.8975, + "step": 22109 + }, + { + "epoch": 0.57, + "learning_rate": 1.8704822337196427e-06, + "loss": 0.6763, + "step": 22110 + }, + { + "epoch": 0.57, + "learning_rate": 1.8704686139934677e-06, + "loss": 0.6992, + "step": 22111 + }, + { + "epoch": 0.57, + "learning_rate": 1.8704549936008153e-06, + "loss": 0.8613, + "step": 22112 + }, + { + "epoch": 0.57, + "learning_rate": 1.8704413725416956e-06, + "loss": 0.834, + "step": 22113 + }, + { + "epoch": 0.57, + "learning_rate": 1.8704277508161188e-06, + "loss": 1.0703, + "step": 22114 + }, + { + "epoch": 0.57, + "learning_rate": 1.8704141284240955e-06, + "loss": 1.3975, + "step": 22115 + }, + { + "epoch": 0.57, + "learning_rate": 1.8704005053656361e-06, + "loss": 0.9287, + "step": 22116 + }, + { + "epoch": 0.57, + "learning_rate": 1.8703868816407513e-06, + "loss": 0.9141, + "step": 22117 + }, + { + "epoch": 0.57, + "learning_rate": 1.870373257249451e-06, + "loss": 0.8389, + "step": 22118 + }, + { + "epoch": 0.57, + "learning_rate": 1.870359632191746e-06, + "loss": 0.6875, + "step": 22119 + }, + { + "epoch": 0.57, + "learning_rate": 1.8703460064676468e-06, + "loss": 0.7388, + "step": 22120 + }, + { + "epoch": 0.57, + "learning_rate": 1.8703323800771633e-06, + "loss": 0.8848, + "step": 22121 + }, + { + "epoch": 0.57, + "learning_rate": 1.8703187530203066e-06, + "loss": 0.8086, + "step": 22122 + }, + { + "epoch": 0.57, + "learning_rate": 1.870305125297087e-06, + "loss": 0.916, + "step": 22123 + }, + { + "epoch": 0.57, + "learning_rate": 1.8702914969075145e-06, + "loss": 0.748, + "step": 22124 + }, + { + "epoch": 0.57, + "learning_rate": 1.8702778678516e-06, + "loss": 1.0303, + "step": 22125 + }, + { + "epoch": 0.57, + "learning_rate": 1.8702642381293536e-06, + "loss": 1.0557, + "step": 22126 + }, + { + "epoch": 0.57, + "learning_rate": 1.870250607740786e-06, + "loss": 0.7402, + "step": 22127 + }, + { + "epoch": 0.57, + "learning_rate": 1.8702369766859074e-06, + "loss": 0.8062, + "step": 22128 + }, + { + "epoch": 0.57, + "learning_rate": 1.8702233449647285e-06, + "loss": 0.8394, + "step": 22129 + }, + { + "epoch": 0.57, + "learning_rate": 1.8702097125772595e-06, + "loss": 0.6333, + "step": 22130 + }, + { + "epoch": 0.57, + "learning_rate": 1.8701960795235112e-06, + "loss": 0.8267, + "step": 22131 + }, + { + "epoch": 0.57, + "learning_rate": 1.8701824458034934e-06, + "loss": 0.8218, + "step": 22132 + }, + { + "epoch": 0.57, + "learning_rate": 1.870168811417217e-06, + "loss": 0.7402, + "step": 22133 + }, + { + "epoch": 0.57, + "learning_rate": 1.8701551763646925e-06, + "loss": 0.8721, + "step": 22134 + }, + { + "epoch": 0.57, + "learning_rate": 1.87014154064593e-06, + "loss": 0.8164, + "step": 22135 + }, + { + "epoch": 0.57, + "learning_rate": 1.8701279042609405e-06, + "loss": 0.8301, + "step": 22136 + }, + { + "epoch": 0.57, + "learning_rate": 1.8701142672097337e-06, + "loss": 0.9375, + "step": 22137 + }, + { + "epoch": 0.57, + "learning_rate": 1.8701006294923205e-06, + "loss": 0.7888, + "step": 22138 + }, + { + "epoch": 0.57, + "learning_rate": 1.8700869911087114e-06, + "loss": 0.4663, + "step": 22139 + }, + { + "epoch": 0.57, + "learning_rate": 1.8700733520589164e-06, + "loss": 0.8584, + "step": 22140 + }, + { + "epoch": 0.57, + "learning_rate": 1.8700597123429468e-06, + "loss": 0.957, + "step": 22141 + }, + { + "epoch": 0.57, + "learning_rate": 1.8700460719608117e-06, + "loss": 0.9258, + "step": 22142 + }, + { + "epoch": 0.57, + "learning_rate": 1.870032430912523e-06, + "loss": 0.8955, + "step": 22143 + }, + { + "epoch": 0.57, + "learning_rate": 1.8700187891980903e-06, + "loss": 0.9062, + "step": 22144 + }, + { + "epoch": 0.57, + "learning_rate": 1.870005146817524e-06, + "loss": 0.7949, + "step": 22145 + }, + { + "epoch": 0.57, + "learning_rate": 1.869991503770835e-06, + "loss": 0.9121, + "step": 22146 + }, + { + "epoch": 0.57, + "learning_rate": 1.8699778600580332e-06, + "loss": 0.8223, + "step": 22147 + }, + { + "epoch": 0.57, + "learning_rate": 1.8699642156791296e-06, + "loss": 0.9756, + "step": 22148 + }, + { + "epoch": 0.57, + "learning_rate": 1.8699505706341343e-06, + "loss": 1.1455, + "step": 22149 + }, + { + "epoch": 0.57, + "learning_rate": 1.8699369249230582e-06, + "loss": 0.8823, + "step": 22150 + }, + { + "epoch": 0.57, + "learning_rate": 1.8699232785459109e-06, + "loss": 0.8525, + "step": 22151 + }, + { + "epoch": 0.57, + "learning_rate": 1.8699096315027037e-06, + "loss": 0.916, + "step": 22152 + }, + { + "epoch": 0.57, + "learning_rate": 1.8698959837934465e-06, + "loss": 1.084, + "step": 22153 + }, + { + "epoch": 0.57, + "learning_rate": 1.8698823354181502e-06, + "loss": 0.877, + "step": 22154 + }, + { + "epoch": 0.57, + "learning_rate": 1.8698686863768244e-06, + "loss": 0.8721, + "step": 22155 + }, + { + "epoch": 0.57, + "learning_rate": 1.8698550366694805e-06, + "loss": 0.7842, + "step": 22156 + }, + { + "epoch": 0.57, + "learning_rate": 1.869841386296129e-06, + "loss": 0.709, + "step": 22157 + }, + { + "epoch": 0.57, + "learning_rate": 1.8698277352567793e-06, + "loss": 1.0615, + "step": 22158 + }, + { + "epoch": 0.57, + "learning_rate": 1.8698140835514428e-06, + "loss": 0.7578, + "step": 22159 + }, + { + "epoch": 0.57, + "learning_rate": 1.8698004311801297e-06, + "loss": 0.9551, + "step": 22160 + }, + { + "epoch": 0.57, + "learning_rate": 1.8697867781428504e-06, + "loss": 0.6816, + "step": 22161 + }, + { + "epoch": 0.57, + "learning_rate": 1.8697731244396154e-06, + "loss": 0.9521, + "step": 22162 + }, + { + "epoch": 0.57, + "learning_rate": 1.8697594700704346e-06, + "loss": 0.9863, + "step": 22163 + }, + { + "epoch": 0.57, + "learning_rate": 1.8697458150353195e-06, + "loss": 0.8574, + "step": 22164 + }, + { + "epoch": 0.57, + "learning_rate": 1.8697321593342798e-06, + "loss": 0.9854, + "step": 22165 + }, + { + "epoch": 0.57, + "learning_rate": 1.8697185029673265e-06, + "loss": 0.8252, + "step": 22166 + }, + { + "epoch": 0.57, + "learning_rate": 1.8697048459344696e-06, + "loss": 1.0146, + "step": 22167 + }, + { + "epoch": 0.57, + "learning_rate": 1.8696911882357194e-06, + "loss": 0.8525, + "step": 22168 + }, + { + "epoch": 0.57, + "learning_rate": 1.8696775298710868e-06, + "loss": 0.8652, + "step": 22169 + }, + { + "epoch": 0.57, + "learning_rate": 1.8696638708405822e-06, + "loss": 0.834, + "step": 22170 + }, + { + "epoch": 0.57, + "learning_rate": 1.8696502111442158e-06, + "loss": 1.0049, + "step": 22171 + }, + { + "epoch": 0.57, + "learning_rate": 1.8696365507819985e-06, + "loss": 0.9863, + "step": 22172 + }, + { + "epoch": 0.57, + "learning_rate": 1.8696228897539404e-06, + "loss": 0.7861, + "step": 22173 + }, + { + "epoch": 0.57, + "learning_rate": 1.8696092280600518e-06, + "loss": 1.082, + "step": 22174 + }, + { + "epoch": 0.57, + "learning_rate": 1.8695955657003435e-06, + "loss": 0.8867, + "step": 22175 + }, + { + "epoch": 0.57, + "learning_rate": 1.8695819026748261e-06, + "loss": 0.9004, + "step": 22176 + }, + { + "epoch": 0.57, + "learning_rate": 1.8695682389835095e-06, + "loss": 1.0156, + "step": 22177 + }, + { + "epoch": 0.57, + "learning_rate": 1.8695545746264046e-06, + "loss": 0.8447, + "step": 22178 + }, + { + "epoch": 0.57, + "learning_rate": 1.8695409096035215e-06, + "loss": 0.8188, + "step": 22179 + }, + { + "epoch": 0.57, + "learning_rate": 1.8695272439148715e-06, + "loss": 1.0205, + "step": 22180 + }, + { + "epoch": 0.57, + "learning_rate": 1.869513577560464e-06, + "loss": 0.8887, + "step": 22181 + }, + { + "epoch": 0.57, + "learning_rate": 1.86949991054031e-06, + "loss": 0.853, + "step": 22182 + }, + { + "epoch": 0.57, + "learning_rate": 1.86948624285442e-06, + "loss": 0.7422, + "step": 22183 + }, + { + "epoch": 0.57, + "learning_rate": 1.8694725745028044e-06, + "loss": 0.79, + "step": 22184 + }, + { + "epoch": 0.57, + "learning_rate": 1.8694589054854735e-06, + "loss": 0.605, + "step": 22185 + }, + { + "epoch": 0.57, + "learning_rate": 1.8694452358024379e-06, + "loss": 0.7756, + "step": 22186 + }, + { + "epoch": 0.57, + "learning_rate": 1.8694315654537082e-06, + "loss": 1.0908, + "step": 22187 + }, + { + "epoch": 0.57, + "learning_rate": 1.8694178944392947e-06, + "loss": 0.6997, + "step": 22188 + }, + { + "epoch": 0.57, + "learning_rate": 1.8694042227592078e-06, + "loss": 0.918, + "step": 22189 + }, + { + "epoch": 0.57, + "learning_rate": 1.869390550413458e-06, + "loss": 1.0176, + "step": 22190 + }, + { + "epoch": 0.57, + "learning_rate": 1.869376877402056e-06, + "loss": 1.0771, + "step": 22191 + }, + { + "epoch": 0.57, + "learning_rate": 1.869363203725012e-06, + "loss": 0.8291, + "step": 22192 + }, + { + "epoch": 0.57, + "learning_rate": 1.8693495293823367e-06, + "loss": 0.8535, + "step": 22193 + }, + { + "epoch": 0.57, + "learning_rate": 1.8693358543740403e-06, + "loss": 0.7896, + "step": 22194 + }, + { + "epoch": 0.57, + "learning_rate": 1.8693221787001333e-06, + "loss": 0.7046, + "step": 22195 + }, + { + "epoch": 0.57, + "learning_rate": 1.8693085023606266e-06, + "loss": 1.209, + "step": 22196 + }, + { + "epoch": 0.57, + "learning_rate": 1.86929482535553e-06, + "loss": 0.7656, + "step": 22197 + }, + { + "epoch": 0.57, + "learning_rate": 1.8692811476848547e-06, + "loss": 0.8467, + "step": 22198 + }, + { + "epoch": 0.57, + "learning_rate": 1.8692674693486105e-06, + "loss": 0.8594, + "step": 22199 + }, + { + "epoch": 0.57, + "learning_rate": 1.8692537903468085e-06, + "loss": 0.7354, + "step": 22200 + }, + { + "epoch": 0.57, + "learning_rate": 1.8692401106794583e-06, + "loss": 1.0645, + "step": 22201 + }, + { + "epoch": 0.57, + "learning_rate": 1.8692264303465716e-06, + "loss": 0.792, + "step": 22202 + }, + { + "epoch": 0.57, + "learning_rate": 1.8692127493481574e-06, + "loss": 0.957, + "step": 22203 + }, + { + "epoch": 0.57, + "learning_rate": 1.8691990676842274e-06, + "loss": 0.8291, + "step": 22204 + }, + { + "epoch": 0.57, + "learning_rate": 1.8691853853547919e-06, + "loss": 0.959, + "step": 22205 + }, + { + "epoch": 0.57, + "learning_rate": 1.8691717023598606e-06, + "loss": 0.8677, + "step": 22206 + }, + { + "epoch": 0.57, + "learning_rate": 1.8691580186994447e-06, + "loss": 0.707, + "step": 22207 + }, + { + "epoch": 0.57, + "learning_rate": 1.8691443343735546e-06, + "loss": 0.7495, + "step": 22208 + }, + { + "epoch": 0.57, + "learning_rate": 1.8691306493822005e-06, + "loss": 0.8384, + "step": 22209 + }, + { + "epoch": 0.57, + "learning_rate": 1.8691169637253931e-06, + "loss": 0.8369, + "step": 22210 + }, + { + "epoch": 0.57, + "learning_rate": 1.869103277403143e-06, + "loss": 0.7026, + "step": 22211 + }, + { + "epoch": 0.57, + "learning_rate": 1.8690895904154603e-06, + "loss": 1.0254, + "step": 22212 + }, + { + "epoch": 0.57, + "learning_rate": 1.8690759027623556e-06, + "loss": 1.0137, + "step": 22213 + }, + { + "epoch": 0.57, + "learning_rate": 1.8690622144438393e-06, + "loss": 0.9258, + "step": 22214 + }, + { + "epoch": 0.57, + "learning_rate": 1.8690485254599221e-06, + "loss": 0.8086, + "step": 22215 + }, + { + "epoch": 0.57, + "learning_rate": 1.8690348358106144e-06, + "loss": 1.002, + "step": 22216 + }, + { + "epoch": 0.57, + "learning_rate": 1.8690211454959267e-06, + "loss": 0.9805, + "step": 22217 + }, + { + "epoch": 0.57, + "learning_rate": 1.86900745451587e-06, + "loss": 0.9814, + "step": 22218 + }, + { + "epoch": 0.57, + "learning_rate": 1.8689937628704535e-06, + "loss": 0.707, + "step": 22219 + }, + { + "epoch": 0.57, + "learning_rate": 1.8689800705596888e-06, + "loss": 0.6347, + "step": 22220 + }, + { + "epoch": 0.57, + "learning_rate": 1.868966377583586e-06, + "loss": 0.8252, + "step": 22221 + }, + { + "epoch": 0.57, + "learning_rate": 1.8689526839421554e-06, + "loss": 0.7168, + "step": 22222 + }, + { + "epoch": 0.57, + "learning_rate": 1.868938989635408e-06, + "loss": 0.9141, + "step": 22223 + }, + { + "epoch": 0.57, + "learning_rate": 1.8689252946633537e-06, + "loss": 0.7876, + "step": 22224 + }, + { + "epoch": 0.57, + "learning_rate": 1.8689115990260035e-06, + "loss": 0.9502, + "step": 22225 + }, + { + "epoch": 0.57, + "learning_rate": 1.8688979027233676e-06, + "loss": 1.0801, + "step": 22226 + }, + { + "epoch": 0.57, + "learning_rate": 1.8688842057554562e-06, + "loss": 0.9053, + "step": 22227 + }, + { + "epoch": 0.57, + "learning_rate": 1.8688705081222804e-06, + "loss": 0.7822, + "step": 22228 + }, + { + "epoch": 0.57, + "learning_rate": 1.8688568098238504e-06, + "loss": 1.0898, + "step": 22229 + }, + { + "epoch": 0.57, + "learning_rate": 1.8688431108601765e-06, + "loss": 0.8838, + "step": 22230 + }, + { + "epoch": 0.57, + "learning_rate": 1.8688294112312697e-06, + "loss": 0.9697, + "step": 22231 + }, + { + "epoch": 0.57, + "learning_rate": 1.86881571093714e-06, + "loss": 0.9365, + "step": 22232 + }, + { + "epoch": 0.57, + "learning_rate": 1.868802009977798e-06, + "loss": 0.8447, + "step": 22233 + }, + { + "epoch": 0.57, + "learning_rate": 1.8687883083532544e-06, + "loss": 0.9004, + "step": 22234 + }, + { + "epoch": 0.57, + "learning_rate": 1.8687746060635194e-06, + "loss": 0.8379, + "step": 22235 + }, + { + "epoch": 0.57, + "learning_rate": 1.8687609031086038e-06, + "loss": 1.0518, + "step": 22236 + }, + { + "epoch": 0.57, + "learning_rate": 1.8687471994885176e-06, + "loss": 0.8467, + "step": 22237 + }, + { + "epoch": 0.57, + "learning_rate": 1.8687334952032719e-06, + "loss": 0.9463, + "step": 22238 + }, + { + "epoch": 0.57, + "learning_rate": 1.8687197902528768e-06, + "loss": 0.8007, + "step": 22239 + }, + { + "epoch": 0.57, + "learning_rate": 1.8687060846373428e-06, + "loss": 0.7715, + "step": 22240 + }, + { + "epoch": 0.57, + "learning_rate": 1.8686923783566808e-06, + "loss": 0.9619, + "step": 22241 + }, + { + "epoch": 0.57, + "learning_rate": 1.8686786714109006e-06, + "loss": 0.8252, + "step": 22242 + }, + { + "epoch": 0.57, + "learning_rate": 1.8686649638000134e-06, + "loss": 0.7122, + "step": 22243 + }, + { + "epoch": 0.57, + "learning_rate": 1.8686512555240293e-06, + "loss": 0.9326, + "step": 22244 + }, + { + "epoch": 0.57, + "learning_rate": 1.8686375465829588e-06, + "loss": 0.769, + "step": 22245 + }, + { + "epoch": 0.57, + "learning_rate": 1.8686238369768126e-06, + "loss": 0.8853, + "step": 22246 + }, + { + "epoch": 0.57, + "learning_rate": 1.868610126705601e-06, + "loss": 0.4326, + "step": 22247 + }, + { + "epoch": 0.57, + "learning_rate": 1.8685964157693346e-06, + "loss": 0.8311, + "step": 22248 + }, + { + "epoch": 0.57, + "learning_rate": 1.8685827041680237e-06, + "loss": 1.0361, + "step": 22249 + }, + { + "epoch": 0.57, + "learning_rate": 1.8685689919016791e-06, + "loss": 0.9814, + "step": 22250 + }, + { + "epoch": 0.57, + "learning_rate": 1.868555278970311e-06, + "loss": 1.0371, + "step": 22251 + }, + { + "epoch": 0.57, + "learning_rate": 1.8685415653739302e-06, + "loss": 0.9307, + "step": 22252 + }, + { + "epoch": 0.57, + "learning_rate": 1.8685278511125473e-06, + "loss": 0.8936, + "step": 22253 + }, + { + "epoch": 0.57, + "learning_rate": 1.8685141361861724e-06, + "loss": 0.9062, + "step": 22254 + }, + { + "epoch": 0.57, + "learning_rate": 1.8685004205948158e-06, + "loss": 0.7637, + "step": 22255 + }, + { + "epoch": 0.57, + "learning_rate": 1.8684867043384886e-06, + "loss": 0.8096, + "step": 22256 + }, + { + "epoch": 0.57, + "learning_rate": 1.8684729874172011e-06, + "loss": 0.8081, + "step": 22257 + }, + { + "epoch": 0.57, + "learning_rate": 1.8684592698309638e-06, + "loss": 0.876, + "step": 22258 + }, + { + "epoch": 0.57, + "learning_rate": 1.8684455515797872e-06, + "loss": 0.9004, + "step": 22259 + }, + { + "epoch": 0.57, + "learning_rate": 1.8684318326636817e-06, + "loss": 0.8818, + "step": 22260 + }, + { + "epoch": 0.57, + "learning_rate": 1.8684181130826579e-06, + "loss": 0.6812, + "step": 22261 + }, + { + "epoch": 0.57, + "learning_rate": 1.8684043928367263e-06, + "loss": 0.8438, + "step": 22262 + }, + { + "epoch": 0.57, + "learning_rate": 1.8683906719258973e-06, + "loss": 1.0732, + "step": 22263 + }, + { + "epoch": 0.57, + "learning_rate": 1.8683769503501816e-06, + "loss": 0.749, + "step": 22264 + }, + { + "epoch": 0.57, + "learning_rate": 1.8683632281095895e-06, + "loss": 0.6318, + "step": 22265 + }, + { + "epoch": 0.57, + "learning_rate": 1.8683495052041318e-06, + "loss": 0.7822, + "step": 22266 + }, + { + "epoch": 0.57, + "learning_rate": 1.8683357816338185e-06, + "loss": 1.0137, + "step": 22267 + }, + { + "epoch": 0.57, + "learning_rate": 1.8683220573986608e-06, + "loss": 0.8359, + "step": 22268 + }, + { + "epoch": 0.57, + "learning_rate": 1.8683083324986683e-06, + "loss": 0.9863, + "step": 22269 + }, + { + "epoch": 0.57, + "learning_rate": 1.8682946069338526e-06, + "loss": 1.043, + "step": 22270 + }, + { + "epoch": 0.57, + "learning_rate": 1.8682808807042233e-06, + "loss": 1.0605, + "step": 22271 + }, + { + "epoch": 0.57, + "learning_rate": 1.8682671538097914e-06, + "loss": 0.7422, + "step": 22272 + }, + { + "epoch": 0.57, + "learning_rate": 1.8682534262505674e-06, + "loss": 0.8115, + "step": 22273 + }, + { + "epoch": 0.57, + "learning_rate": 1.8682396980265614e-06, + "loss": 0.6792, + "step": 22274 + }, + { + "epoch": 0.57, + "learning_rate": 1.8682259691377841e-06, + "loss": 0.8564, + "step": 22275 + }, + { + "epoch": 0.57, + "learning_rate": 1.8682122395842463e-06, + "loss": 0.7734, + "step": 22276 + }, + { + "epoch": 0.57, + "learning_rate": 1.8681985093659582e-06, + "loss": 0.8252, + "step": 22277 + }, + { + "epoch": 0.57, + "learning_rate": 1.8681847784829308e-06, + "loss": 0.9263, + "step": 22278 + }, + { + "epoch": 0.57, + "learning_rate": 1.8681710469351737e-06, + "loss": 0.8145, + "step": 22279 + }, + { + "epoch": 0.57, + "learning_rate": 1.8681573147226984e-06, + "loss": 0.8013, + "step": 22280 + }, + { + "epoch": 0.57, + "learning_rate": 1.8681435818455146e-06, + "loss": 0.8486, + "step": 22281 + }, + { + "epoch": 0.57, + "learning_rate": 1.8681298483036332e-06, + "loss": 0.8945, + "step": 22282 + }, + { + "epoch": 0.57, + "learning_rate": 1.868116114097065e-06, + "loss": 0.8057, + "step": 22283 + }, + { + "epoch": 0.57, + "learning_rate": 1.8681023792258198e-06, + "loss": 0.6941, + "step": 22284 + }, + { + "epoch": 0.57, + "learning_rate": 1.8680886436899091e-06, + "loss": 0.9072, + "step": 22285 + }, + { + "epoch": 0.57, + "learning_rate": 1.8680749074893422e-06, + "loss": 0.6508, + "step": 22286 + }, + { + "epoch": 0.57, + "learning_rate": 1.8680611706241306e-06, + "loss": 1.1074, + "step": 22287 + }, + { + "epoch": 0.57, + "learning_rate": 1.8680474330942847e-06, + "loss": 0.7295, + "step": 22288 + }, + { + "epoch": 0.57, + "learning_rate": 1.8680336948998145e-06, + "loss": 0.8101, + "step": 22289 + }, + { + "epoch": 0.57, + "learning_rate": 1.8680199560407308e-06, + "loss": 0.9521, + "step": 22290 + }, + { + "epoch": 0.57, + "learning_rate": 1.868006216517044e-06, + "loss": 0.9062, + "step": 22291 + }, + { + "epoch": 0.57, + "learning_rate": 1.8679924763287648e-06, + "loss": 0.6934, + "step": 22292 + }, + { + "epoch": 0.57, + "learning_rate": 1.867978735475904e-06, + "loss": 0.9346, + "step": 22293 + }, + { + "epoch": 0.57, + "learning_rate": 1.8679649939584717e-06, + "loss": 0.7607, + "step": 22294 + }, + { + "epoch": 0.57, + "learning_rate": 1.8679512517764783e-06, + "loss": 0.9062, + "step": 22295 + }, + { + "epoch": 0.57, + "learning_rate": 1.8679375089299344e-06, + "loss": 0.9287, + "step": 22296 + }, + { + "epoch": 0.57, + "learning_rate": 1.867923765418851e-06, + "loss": 0.8838, + "step": 22297 + }, + { + "epoch": 0.57, + "learning_rate": 1.8679100212432384e-06, + "loss": 1.0, + "step": 22298 + }, + { + "epoch": 0.57, + "learning_rate": 1.8678962764031066e-06, + "loss": 1.0088, + "step": 22299 + }, + { + "epoch": 0.57, + "learning_rate": 1.8678825308984668e-06, + "loss": 0.9375, + "step": 22300 + }, + { + "epoch": 0.57, + "learning_rate": 1.867868784729329e-06, + "loss": 0.7549, + "step": 22301 + }, + { + "epoch": 0.57, + "learning_rate": 1.8678550378957043e-06, + "loss": 1.002, + "step": 22302 + }, + { + "epoch": 0.57, + "learning_rate": 1.8678412903976026e-06, + "loss": 0.6218, + "step": 22303 + }, + { + "epoch": 0.57, + "learning_rate": 1.8678275422350352e-06, + "loss": 0.8169, + "step": 22304 + }, + { + "epoch": 0.57, + "learning_rate": 1.8678137934080116e-06, + "loss": 1.0117, + "step": 22305 + }, + { + "epoch": 0.57, + "learning_rate": 1.8678000439165432e-06, + "loss": 0.7666, + "step": 22306 + }, + { + "epoch": 0.57, + "learning_rate": 1.86778629376064e-06, + "loss": 0.9238, + "step": 22307 + }, + { + "epoch": 0.57, + "learning_rate": 1.8677725429403132e-06, + "loss": 0.6807, + "step": 22308 + }, + { + "epoch": 0.57, + "learning_rate": 1.8677587914555723e-06, + "loss": 0.8086, + "step": 22309 + }, + { + "epoch": 0.57, + "learning_rate": 1.8677450393064285e-06, + "loss": 0.8228, + "step": 22310 + }, + { + "epoch": 0.57, + "learning_rate": 1.8677312864928924e-06, + "loss": 0.7852, + "step": 22311 + }, + { + "epoch": 0.57, + "learning_rate": 1.8677175330149742e-06, + "loss": 0.8721, + "step": 22312 + }, + { + "epoch": 0.57, + "learning_rate": 1.8677037788726846e-06, + "loss": 0.6538, + "step": 22313 + }, + { + "epoch": 0.57, + "learning_rate": 1.8676900240660342e-06, + "loss": 0.8838, + "step": 22314 + }, + { + "epoch": 0.57, + "learning_rate": 1.8676762685950337e-06, + "loss": 0.9834, + "step": 22315 + }, + { + "epoch": 0.57, + "learning_rate": 1.867662512459693e-06, + "loss": 0.7749, + "step": 22316 + }, + { + "epoch": 0.57, + "learning_rate": 1.867648755660023e-06, + "loss": 0.8613, + "step": 22317 + }, + { + "epoch": 0.57, + "learning_rate": 1.8676349981960344e-06, + "loss": 0.8418, + "step": 22318 + }, + { + "epoch": 0.57, + "learning_rate": 1.8676212400677375e-06, + "loss": 0.7998, + "step": 22319 + }, + { + "epoch": 0.57, + "learning_rate": 1.867607481275143e-06, + "loss": 0.6826, + "step": 22320 + }, + { + "epoch": 0.57, + "learning_rate": 1.8675937218182613e-06, + "loss": 1.0381, + "step": 22321 + }, + { + "epoch": 0.57, + "learning_rate": 1.8675799616971028e-06, + "loss": 1.0518, + "step": 22322 + }, + { + "epoch": 0.57, + "learning_rate": 1.8675662009116786e-06, + "loss": 0.999, + "step": 22323 + }, + { + "epoch": 0.57, + "learning_rate": 1.8675524394619985e-06, + "loss": 0.7363, + "step": 22324 + }, + { + "epoch": 0.57, + "learning_rate": 1.8675386773480737e-06, + "loss": 1.0156, + "step": 22325 + }, + { + "epoch": 0.57, + "learning_rate": 1.8675249145699143e-06, + "loss": 0.8804, + "step": 22326 + }, + { + "epoch": 0.57, + "learning_rate": 1.8675111511275308e-06, + "loss": 0.9766, + "step": 22327 + }, + { + "epoch": 0.57, + "learning_rate": 1.867497387020934e-06, + "loss": 0.7251, + "step": 22328 + }, + { + "epoch": 0.57, + "learning_rate": 1.8674836222501345e-06, + "loss": 1.1387, + "step": 22329 + }, + { + "epoch": 0.57, + "learning_rate": 1.8674698568151426e-06, + "loss": 0.9365, + "step": 22330 + }, + { + "epoch": 0.57, + "learning_rate": 1.8674560907159687e-06, + "loss": 1.0049, + "step": 22331 + }, + { + "epoch": 0.57, + "learning_rate": 1.8674423239526239e-06, + "loss": 0.96, + "step": 22332 + }, + { + "epoch": 0.57, + "learning_rate": 1.8674285565251182e-06, + "loss": 0.6721, + "step": 22333 + }, + { + "epoch": 0.57, + "learning_rate": 1.867414788433462e-06, + "loss": 0.9688, + "step": 22334 + }, + { + "epoch": 0.57, + "learning_rate": 1.8674010196776667e-06, + "loss": 1.0078, + "step": 22335 + }, + { + "epoch": 0.57, + "learning_rate": 1.8673872502577424e-06, + "loss": 0.8604, + "step": 22336 + }, + { + "epoch": 0.57, + "learning_rate": 1.8673734801736992e-06, + "loss": 0.6338, + "step": 22337 + }, + { + "epoch": 0.57, + "learning_rate": 1.867359709425548e-06, + "loss": 0.6416, + "step": 22338 + }, + { + "epoch": 0.57, + "learning_rate": 1.8673459380132996e-06, + "loss": 0.9053, + "step": 22339 + }, + { + "epoch": 0.57, + "learning_rate": 1.8673321659369643e-06, + "loss": 0.877, + "step": 22340 + }, + { + "epoch": 0.57, + "learning_rate": 1.8673183931965523e-06, + "loss": 0.8262, + "step": 22341 + }, + { + "epoch": 0.57, + "learning_rate": 1.8673046197920747e-06, + "loss": 0.9727, + "step": 22342 + }, + { + "epoch": 0.57, + "learning_rate": 1.867290845723542e-06, + "loss": 0.7891, + "step": 22343 + }, + { + "epoch": 0.57, + "learning_rate": 1.8672770709909641e-06, + "loss": 1.0625, + "step": 22344 + }, + { + "epoch": 0.57, + "learning_rate": 1.8672632955943525e-06, + "loss": 0.7334, + "step": 22345 + }, + { + "epoch": 0.57, + "learning_rate": 1.8672495195337172e-06, + "loss": 0.9023, + "step": 22346 + }, + { + "epoch": 0.57, + "learning_rate": 1.8672357428090689e-06, + "loss": 0.8672, + "step": 22347 + }, + { + "epoch": 0.57, + "learning_rate": 1.8672219654204179e-06, + "loss": 0.9355, + "step": 22348 + }, + { + "epoch": 0.57, + "learning_rate": 1.8672081873677748e-06, + "loss": 0.8379, + "step": 22349 + }, + { + "epoch": 0.57, + "learning_rate": 1.8671944086511504e-06, + "loss": 1.0908, + "step": 22350 + }, + { + "epoch": 0.57, + "learning_rate": 1.867180629270555e-06, + "loss": 0.8701, + "step": 22351 + }, + { + "epoch": 0.57, + "learning_rate": 1.8671668492259994e-06, + "loss": 0.7773, + "step": 22352 + }, + { + "epoch": 0.57, + "learning_rate": 1.867153068517494e-06, + "loss": 1.0391, + "step": 22353 + }, + { + "epoch": 0.57, + "learning_rate": 1.8671392871450493e-06, + "loss": 0.8066, + "step": 22354 + }, + { + "epoch": 0.57, + "learning_rate": 1.8671255051086762e-06, + "loss": 0.644, + "step": 22355 + }, + { + "epoch": 0.57, + "learning_rate": 1.8671117224083845e-06, + "loss": 0.8594, + "step": 22356 + }, + { + "epoch": 0.57, + "learning_rate": 1.8670979390441856e-06, + "loss": 0.7949, + "step": 22357 + }, + { + "epoch": 0.57, + "learning_rate": 1.8670841550160895e-06, + "loss": 0.7969, + "step": 22358 + }, + { + "epoch": 0.57, + "learning_rate": 1.867070370324107e-06, + "loss": 0.6465, + "step": 22359 + }, + { + "epoch": 0.57, + "learning_rate": 1.8670565849682486e-06, + "loss": 0.9736, + "step": 22360 + }, + { + "epoch": 0.57, + "learning_rate": 1.8670427989485248e-06, + "loss": 0.8877, + "step": 22361 + }, + { + "epoch": 0.57, + "learning_rate": 1.8670290122649463e-06, + "loss": 0.8496, + "step": 22362 + }, + { + "epoch": 0.57, + "learning_rate": 1.8670152249175235e-06, + "loss": 0.7363, + "step": 22363 + }, + { + "epoch": 0.57, + "learning_rate": 1.8670014369062668e-06, + "loss": 0.7646, + "step": 22364 + }, + { + "epoch": 0.57, + "learning_rate": 1.8669876482311872e-06, + "loss": 0.79, + "step": 22365 + }, + { + "epoch": 0.57, + "learning_rate": 1.866973858892295e-06, + "loss": 0.6689, + "step": 22366 + }, + { + "epoch": 0.57, + "learning_rate": 1.8669600688896009e-06, + "loss": 0.8057, + "step": 22367 + }, + { + "epoch": 0.57, + "learning_rate": 1.866946278223115e-06, + "loss": 0.8594, + "step": 22368 + }, + { + "epoch": 0.57, + "learning_rate": 1.8669324868928485e-06, + "loss": 1.0283, + "step": 22369 + }, + { + "epoch": 0.57, + "learning_rate": 1.8669186948988113e-06, + "loss": 1.0205, + "step": 22370 + }, + { + "epoch": 0.57, + "learning_rate": 1.8669049022410146e-06, + "loss": 0.8081, + "step": 22371 + }, + { + "epoch": 0.57, + "learning_rate": 1.8668911089194687e-06, + "loss": 0.9482, + "step": 22372 + }, + { + "epoch": 0.57, + "learning_rate": 1.8668773149341841e-06, + "loss": 0.8091, + "step": 22373 + }, + { + "epoch": 0.57, + "learning_rate": 1.8668635202851713e-06, + "loss": 0.9922, + "step": 22374 + }, + { + "epoch": 0.57, + "learning_rate": 1.866849724972441e-06, + "loss": 0.9473, + "step": 22375 + }, + { + "epoch": 0.57, + "learning_rate": 1.8668359289960038e-06, + "loss": 0.9736, + "step": 22376 + }, + { + "epoch": 0.57, + "learning_rate": 1.8668221323558702e-06, + "loss": 0.8105, + "step": 22377 + }, + { + "epoch": 0.57, + "learning_rate": 1.8668083350520507e-06, + "loss": 0.9111, + "step": 22378 + }, + { + "epoch": 0.57, + "learning_rate": 1.866794537084556e-06, + "loss": 0.8418, + "step": 22379 + }, + { + "epoch": 0.57, + "learning_rate": 1.8667807384533965e-06, + "loss": 0.9551, + "step": 22380 + }, + { + "epoch": 0.57, + "learning_rate": 1.8667669391585825e-06, + "loss": 0.8799, + "step": 22381 + }, + { + "epoch": 0.57, + "learning_rate": 1.8667531392001255e-06, + "loss": 0.8716, + "step": 22382 + }, + { + "epoch": 0.57, + "learning_rate": 1.8667393385780352e-06, + "loss": 0.9648, + "step": 22383 + }, + { + "epoch": 0.57, + "learning_rate": 1.8667255372923223e-06, + "loss": 0.9502, + "step": 22384 + }, + { + "epoch": 0.57, + "learning_rate": 1.8667117353429977e-06, + "loss": 1.1357, + "step": 22385 + }, + { + "epoch": 0.57, + "learning_rate": 1.8666979327300719e-06, + "loss": 0.8262, + "step": 22386 + }, + { + "epoch": 0.57, + "learning_rate": 1.8666841294535552e-06, + "loss": 0.9219, + "step": 22387 + }, + { + "epoch": 0.57, + "learning_rate": 1.8666703255134581e-06, + "loss": 0.9834, + "step": 22388 + }, + { + "epoch": 0.57, + "learning_rate": 1.8666565209097916e-06, + "loss": 0.8984, + "step": 22389 + }, + { + "epoch": 0.57, + "learning_rate": 1.866642715642566e-06, + "loss": 0.874, + "step": 22390 + }, + { + "epoch": 0.57, + "learning_rate": 1.866628909711792e-06, + "loss": 1.042, + "step": 22391 + }, + { + "epoch": 0.57, + "learning_rate": 1.8666151031174802e-06, + "loss": 0.9033, + "step": 22392 + }, + { + "epoch": 0.57, + "learning_rate": 1.8666012958596408e-06, + "loss": 0.8438, + "step": 22393 + }, + { + "epoch": 0.57, + "learning_rate": 1.8665874879382847e-06, + "loss": 0.9248, + "step": 22394 + }, + { + "epoch": 0.57, + "learning_rate": 1.8665736793534226e-06, + "loss": 0.9834, + "step": 22395 + }, + { + "epoch": 0.57, + "learning_rate": 1.8665598701050647e-06, + "loss": 0.8574, + "step": 22396 + }, + { + "epoch": 0.57, + "learning_rate": 1.8665460601932218e-06, + "loss": 0.9707, + "step": 22397 + }, + { + "epoch": 0.57, + "learning_rate": 1.8665322496179044e-06, + "loss": 0.7207, + "step": 22398 + }, + { + "epoch": 0.57, + "learning_rate": 1.866518438379123e-06, + "loss": 0.918, + "step": 22399 + }, + { + "epoch": 0.57, + "learning_rate": 1.8665046264768885e-06, + "loss": 0.9814, + "step": 22400 + }, + { + "epoch": 0.57, + "learning_rate": 1.866490813911211e-06, + "loss": 0.4138, + "step": 22401 + }, + { + "epoch": 0.57, + "learning_rate": 1.8664770006821015e-06, + "loss": 1.0068, + "step": 22402 + }, + { + "epoch": 0.57, + "learning_rate": 1.8664631867895704e-06, + "loss": 0.7598, + "step": 22403 + }, + { + "epoch": 0.57, + "learning_rate": 1.8664493722336284e-06, + "loss": 0.9893, + "step": 22404 + }, + { + "epoch": 0.57, + "learning_rate": 1.8664355570142858e-06, + "loss": 0.998, + "step": 22405 + }, + { + "epoch": 0.57, + "learning_rate": 1.8664217411315533e-06, + "loss": 0.7764, + "step": 22406 + }, + { + "epoch": 0.57, + "learning_rate": 1.8664079245854416e-06, + "loss": 0.6892, + "step": 22407 + }, + { + "epoch": 0.57, + "learning_rate": 1.866394107375961e-06, + "loss": 0.8623, + "step": 22408 + }, + { + "epoch": 0.57, + "learning_rate": 1.8663802895031223e-06, + "loss": 0.9746, + "step": 22409 + }, + { + "epoch": 0.57, + "learning_rate": 1.8663664709669361e-06, + "loss": 0.8105, + "step": 22410 + }, + { + "epoch": 0.57, + "learning_rate": 1.8663526517674132e-06, + "loss": 0.772, + "step": 22411 + }, + { + "epoch": 0.57, + "learning_rate": 1.8663388319045636e-06, + "loss": 0.7852, + "step": 22412 + }, + { + "epoch": 0.57, + "learning_rate": 1.8663250113783984e-06, + "loss": 0.6189, + "step": 22413 + }, + { + "epoch": 0.57, + "learning_rate": 1.866311190188928e-06, + "loss": 0.7456, + "step": 22414 + }, + { + "epoch": 0.57, + "learning_rate": 1.8662973683361626e-06, + "loss": 0.8374, + "step": 22415 + }, + { + "epoch": 0.57, + "learning_rate": 1.8662835458201136e-06, + "loss": 0.6641, + "step": 22416 + }, + { + "epoch": 0.57, + "learning_rate": 1.8662697226407907e-06, + "loss": 0.7842, + "step": 22417 + }, + { + "epoch": 0.57, + "learning_rate": 1.866255898798205e-06, + "loss": 0.9336, + "step": 22418 + }, + { + "epoch": 0.57, + "learning_rate": 1.8662420742923672e-06, + "loss": 0.8936, + "step": 22419 + }, + { + "epoch": 0.57, + "learning_rate": 1.8662282491232877e-06, + "loss": 0.7969, + "step": 22420 + }, + { + "epoch": 0.57, + "learning_rate": 1.8662144232909767e-06, + "loss": 1.103, + "step": 22421 + }, + { + "epoch": 0.57, + "learning_rate": 1.8662005967954455e-06, + "loss": 0.8018, + "step": 22422 + }, + { + "epoch": 0.57, + "learning_rate": 1.8661867696367043e-06, + "loss": 0.8926, + "step": 22423 + }, + { + "epoch": 0.57, + "learning_rate": 1.8661729418147635e-06, + "loss": 0.7803, + "step": 22424 + }, + { + "epoch": 0.57, + "learning_rate": 1.866159113329634e-06, + "loss": 0.875, + "step": 22425 + }, + { + "epoch": 0.57, + "learning_rate": 1.8661452841813264e-06, + "loss": 0.7554, + "step": 22426 + }, + { + "epoch": 0.57, + "learning_rate": 1.866131454369851e-06, + "loss": 0.6938, + "step": 22427 + }, + { + "epoch": 0.57, + "learning_rate": 1.8661176238952186e-06, + "loss": 0.7451, + "step": 22428 + }, + { + "epoch": 0.57, + "learning_rate": 1.86610379275744e-06, + "loss": 0.9541, + "step": 22429 + }, + { + "epoch": 0.57, + "learning_rate": 1.866089960956525e-06, + "loss": 0.8623, + "step": 22430 + }, + { + "epoch": 0.57, + "learning_rate": 1.8660761284924853e-06, + "loss": 0.749, + "step": 22431 + }, + { + "epoch": 0.57, + "learning_rate": 1.8660622953653307e-06, + "loss": 0.9756, + "step": 22432 + }, + { + "epoch": 0.57, + "learning_rate": 1.866048461575072e-06, + "loss": 0.8604, + "step": 22433 + }, + { + "epoch": 0.57, + "learning_rate": 1.86603462712172e-06, + "loss": 0.9805, + "step": 22434 + }, + { + "epoch": 0.58, + "learning_rate": 1.866020792005285e-06, + "loss": 0.9131, + "step": 22435 + }, + { + "epoch": 0.58, + "learning_rate": 1.8660069562257777e-06, + "loss": 0.4907, + "step": 22436 + }, + { + "epoch": 0.58, + "learning_rate": 1.8659931197832085e-06, + "loss": 0.7881, + "step": 22437 + }, + { + "epoch": 0.58, + "learning_rate": 1.8659792826775887e-06, + "loss": 1.0127, + "step": 22438 + }, + { + "epoch": 0.58, + "learning_rate": 1.865965444908928e-06, + "loss": 0.7852, + "step": 22439 + }, + { + "epoch": 0.58, + "learning_rate": 1.8659516064772374e-06, + "loss": 0.5471, + "step": 22440 + }, + { + "epoch": 0.58, + "learning_rate": 1.8659377673825274e-06, + "loss": 0.7437, + "step": 22441 + }, + { + "epoch": 0.58, + "learning_rate": 1.8659239276248089e-06, + "loss": 0.6433, + "step": 22442 + }, + { + "epoch": 0.58, + "learning_rate": 1.865910087204092e-06, + "loss": 1.0371, + "step": 22443 + }, + { + "epoch": 0.58, + "learning_rate": 1.8658962461203877e-06, + "loss": 0.9043, + "step": 22444 + }, + { + "epoch": 0.58, + "learning_rate": 1.8658824043737064e-06, + "loss": 0.8662, + "step": 22445 + }, + { + "epoch": 0.58, + "learning_rate": 1.865868561964059e-06, + "loss": 0.8247, + "step": 22446 + }, + { + "epoch": 0.58, + "learning_rate": 1.8658547188914557e-06, + "loss": 0.9854, + "step": 22447 + }, + { + "epoch": 0.58, + "learning_rate": 1.8658408751559071e-06, + "loss": 0.7336, + "step": 22448 + }, + { + "epoch": 0.58, + "learning_rate": 1.865827030757424e-06, + "loss": 0.9629, + "step": 22449 + }, + { + "epoch": 0.58, + "learning_rate": 1.865813185696017e-06, + "loss": 0.8564, + "step": 22450 + }, + { + "epoch": 0.58, + "learning_rate": 1.865799339971697e-06, + "loss": 0.8906, + "step": 22451 + }, + { + "epoch": 0.58, + "learning_rate": 1.865785493584474e-06, + "loss": 0.7065, + "step": 22452 + }, + { + "epoch": 0.58, + "learning_rate": 1.8657716465343584e-06, + "loss": 1.0625, + "step": 22453 + }, + { + "epoch": 0.58, + "learning_rate": 1.8657577988213617e-06, + "loss": 0.7666, + "step": 22454 + }, + { + "epoch": 0.58, + "learning_rate": 1.8657439504454942e-06, + "loss": 0.7949, + "step": 22455 + }, + { + "epoch": 0.58, + "learning_rate": 1.8657301014067662e-06, + "loss": 1.0684, + "step": 22456 + }, + { + "epoch": 0.58, + "learning_rate": 1.8657162517051886e-06, + "loss": 0.6709, + "step": 22457 + }, + { + "epoch": 0.58, + "learning_rate": 1.8657024013407714e-06, + "loss": 0.9395, + "step": 22458 + }, + { + "epoch": 0.58, + "learning_rate": 1.8656885503135262e-06, + "loss": 0.8755, + "step": 22459 + }, + { + "epoch": 0.58, + "learning_rate": 1.8656746986234627e-06, + "loss": 0.7344, + "step": 22460 + }, + { + "epoch": 0.58, + "learning_rate": 1.8656608462705923e-06, + "loss": 0.9087, + "step": 22461 + }, + { + "epoch": 0.58, + "learning_rate": 1.8656469932549248e-06, + "loss": 1.0586, + "step": 22462 + }, + { + "epoch": 0.58, + "learning_rate": 1.8656331395764716e-06, + "loss": 0.9287, + "step": 22463 + }, + { + "epoch": 0.58, + "learning_rate": 1.8656192852352426e-06, + "loss": 1.0195, + "step": 22464 + }, + { + "epoch": 0.58, + "learning_rate": 1.8656054302312487e-06, + "loss": 0.9746, + "step": 22465 + }, + { + "epoch": 0.58, + "learning_rate": 1.8655915745645006e-06, + "loss": 0.9385, + "step": 22466 + }, + { + "epoch": 0.58, + "learning_rate": 1.865577718235009e-06, + "loss": 0.7803, + "step": 22467 + }, + { + "epoch": 0.58, + "learning_rate": 1.8655638612427843e-06, + "loss": 0.7979, + "step": 22468 + }, + { + "epoch": 0.58, + "learning_rate": 1.8655500035878368e-06, + "loss": 0.9893, + "step": 22469 + }, + { + "epoch": 0.58, + "learning_rate": 1.8655361452701776e-06, + "loss": 0.9531, + "step": 22470 + }, + { + "epoch": 0.58, + "learning_rate": 1.8655222862898175e-06, + "loss": 0.9014, + "step": 22471 + }, + { + "epoch": 0.58, + "learning_rate": 1.8655084266467664e-06, + "loss": 0.8438, + "step": 22472 + }, + { + "epoch": 0.58, + "learning_rate": 1.8654945663410355e-06, + "loss": 0.5171, + "step": 22473 + }, + { + "epoch": 0.58, + "learning_rate": 1.8654807053726352e-06, + "loss": 1.0586, + "step": 22474 + }, + { + "epoch": 0.58, + "learning_rate": 1.8654668437415762e-06, + "loss": 1.1445, + "step": 22475 + }, + { + "epoch": 0.58, + "learning_rate": 1.8654529814478689e-06, + "loss": 1.0381, + "step": 22476 + }, + { + "epoch": 0.58, + "learning_rate": 1.8654391184915239e-06, + "loss": 1.2275, + "step": 22477 + }, + { + "epoch": 0.58, + "learning_rate": 1.8654252548725522e-06, + "loss": 0.9316, + "step": 22478 + }, + { + "epoch": 0.58, + "learning_rate": 1.865411390590964e-06, + "loss": 0.6797, + "step": 22479 + }, + { + "epoch": 0.58, + "learning_rate": 1.8653975256467702e-06, + "loss": 0.8584, + "step": 22480 + }, + { + "epoch": 0.58, + "learning_rate": 1.8653836600399812e-06, + "loss": 0.6362, + "step": 22481 + }, + { + "epoch": 0.58, + "learning_rate": 1.865369793770608e-06, + "loss": 0.7998, + "step": 22482 + }, + { + "epoch": 0.58, + "learning_rate": 1.865355926838661e-06, + "loss": 0.8115, + "step": 22483 + }, + { + "epoch": 0.58, + "learning_rate": 1.8653420592441504e-06, + "loss": 0.9854, + "step": 22484 + }, + { + "epoch": 0.58, + "learning_rate": 1.8653281909870872e-06, + "loss": 0.7041, + "step": 22485 + }, + { + "epoch": 0.58, + "learning_rate": 1.865314322067482e-06, + "loss": 0.7676, + "step": 22486 + }, + { + "epoch": 0.58, + "learning_rate": 1.8653004524853455e-06, + "loss": 0.6011, + "step": 22487 + }, + { + "epoch": 0.58, + "learning_rate": 1.8652865822406882e-06, + "loss": 0.8574, + "step": 22488 + }, + { + "epoch": 0.58, + "learning_rate": 1.8652727113335209e-06, + "loss": 0.8271, + "step": 22489 + }, + { + "epoch": 0.58, + "learning_rate": 1.8652588397638537e-06, + "loss": 0.7734, + "step": 22490 + }, + { + "epoch": 0.58, + "learning_rate": 1.8652449675316982e-06, + "loss": 0.6787, + "step": 22491 + }, + { + "epoch": 0.58, + "learning_rate": 1.865231094637064e-06, + "loss": 0.6409, + "step": 22492 + }, + { + "epoch": 0.58, + "learning_rate": 1.865217221079962e-06, + "loss": 0.8828, + "step": 22493 + }, + { + "epoch": 0.58, + "learning_rate": 1.8652033468604032e-06, + "loss": 0.9346, + "step": 22494 + }, + { + "epoch": 0.58, + "learning_rate": 1.865189471978398e-06, + "loss": 0.9287, + "step": 22495 + }, + { + "epoch": 0.58, + "learning_rate": 1.8651755964339571e-06, + "loss": 0.6641, + "step": 22496 + }, + { + "epoch": 0.58, + "learning_rate": 1.8651617202270908e-06, + "loss": 0.6897, + "step": 22497 + }, + { + "epoch": 0.58, + "learning_rate": 1.86514784335781e-06, + "loss": 0.9404, + "step": 22498 + }, + { + "epoch": 0.58, + "learning_rate": 1.8651339658261252e-06, + "loss": 0.9141, + "step": 22499 + }, + { + "epoch": 0.58, + "learning_rate": 1.8651200876320472e-06, + "loss": 0.7891, + "step": 22500 + }, + { + "epoch": 0.58, + "learning_rate": 1.8651062087755864e-06, + "loss": 0.9561, + "step": 22501 + }, + { + "epoch": 0.58, + "learning_rate": 1.865092329256754e-06, + "loss": 0.8223, + "step": 22502 + }, + { + "epoch": 0.58, + "learning_rate": 1.8650784490755598e-06, + "loss": 0.9131, + "step": 22503 + }, + { + "epoch": 0.58, + "learning_rate": 1.8650645682320146e-06, + "loss": 0.9639, + "step": 22504 + }, + { + "epoch": 0.58, + "learning_rate": 1.8650506867261298e-06, + "loss": 1.0117, + "step": 22505 + }, + { + "epoch": 0.58, + "learning_rate": 1.865036804557915e-06, + "loss": 0.9346, + "step": 22506 + }, + { + "epoch": 0.58, + "learning_rate": 1.8650229217273817e-06, + "loss": 0.8311, + "step": 22507 + }, + { + "epoch": 0.58, + "learning_rate": 1.8650090382345395e-06, + "loss": 0.9717, + "step": 22508 + }, + { + "epoch": 0.58, + "learning_rate": 1.8649951540794002e-06, + "loss": 0.9355, + "step": 22509 + }, + { + "epoch": 0.58, + "learning_rate": 1.8649812692619738e-06, + "loss": 0.9492, + "step": 22510 + }, + { + "epoch": 0.58, + "learning_rate": 1.8649673837822708e-06, + "loss": 0.875, + "step": 22511 + }, + { + "epoch": 0.58, + "learning_rate": 1.864953497640302e-06, + "loss": 0.9502, + "step": 22512 + }, + { + "epoch": 0.58, + "learning_rate": 1.8649396108360787e-06, + "loss": 1.0479, + "step": 22513 + }, + { + "epoch": 0.58, + "learning_rate": 1.8649257233696102e-06, + "loss": 0.8193, + "step": 22514 + }, + { + "epoch": 0.58, + "learning_rate": 1.8649118352409082e-06, + "loss": 0.8623, + "step": 22515 + }, + { + "epoch": 0.58, + "learning_rate": 1.8648979464499827e-06, + "loss": 0.8076, + "step": 22516 + }, + { + "epoch": 0.58, + "learning_rate": 1.864884056996845e-06, + "loss": 0.9453, + "step": 22517 + }, + { + "epoch": 0.58, + "learning_rate": 1.8648701668815052e-06, + "loss": 0.8584, + "step": 22518 + }, + { + "epoch": 0.58, + "learning_rate": 1.8648562761039739e-06, + "loss": 0.7803, + "step": 22519 + }, + { + "epoch": 0.58, + "learning_rate": 1.864842384664262e-06, + "loss": 1.0146, + "step": 22520 + }, + { + "epoch": 0.58, + "learning_rate": 1.8648284925623803e-06, + "loss": 0.7256, + "step": 22521 + }, + { + "epoch": 0.58, + "learning_rate": 1.864814599798339e-06, + "loss": 0.5488, + "step": 22522 + }, + { + "epoch": 0.58, + "learning_rate": 1.864800706372149e-06, + "loss": 0.7671, + "step": 22523 + }, + { + "epoch": 0.58, + "learning_rate": 1.8647868122838206e-06, + "loss": 0.9238, + "step": 22524 + }, + { + "epoch": 0.58, + "learning_rate": 1.8647729175333648e-06, + "loss": 0.8696, + "step": 22525 + }, + { + "epoch": 0.58, + "learning_rate": 1.8647590221207923e-06, + "loss": 0.9307, + "step": 22526 + }, + { + "epoch": 0.58, + "learning_rate": 1.8647451260461137e-06, + "loss": 0.8105, + "step": 22527 + }, + { + "epoch": 0.58, + "learning_rate": 1.8647312293093392e-06, + "loss": 0.6636, + "step": 22528 + }, + { + "epoch": 0.58, + "learning_rate": 1.86471733191048e-06, + "loss": 0.7358, + "step": 22529 + }, + { + "epoch": 0.58, + "learning_rate": 1.8647034338495463e-06, + "loss": 0.8311, + "step": 22530 + }, + { + "epoch": 0.58, + "learning_rate": 1.864689535126549e-06, + "loss": 0.9834, + "step": 22531 + }, + { + "epoch": 0.58, + "learning_rate": 1.8646756357414985e-06, + "loss": 0.6426, + "step": 22532 + }, + { + "epoch": 0.58, + "learning_rate": 1.8646617356944058e-06, + "loss": 0.9199, + "step": 22533 + }, + { + "epoch": 0.58, + "learning_rate": 1.8646478349852814e-06, + "loss": 0.8467, + "step": 22534 + }, + { + "epoch": 0.58, + "learning_rate": 1.8646339336141362e-06, + "loss": 0.8623, + "step": 22535 + }, + { + "epoch": 0.58, + "learning_rate": 1.8646200315809801e-06, + "loss": 0.958, + "step": 22536 + }, + { + "epoch": 0.58, + "learning_rate": 1.8646061288858244e-06, + "loss": 0.873, + "step": 22537 + }, + { + "epoch": 0.58, + "learning_rate": 1.8645922255286794e-06, + "loss": 0.9014, + "step": 22538 + }, + { + "epoch": 0.58, + "learning_rate": 1.864578321509556e-06, + "loss": 1.0195, + "step": 22539 + }, + { + "epoch": 0.58, + "learning_rate": 1.8645644168284647e-06, + "loss": 0.9971, + "step": 22540 + }, + { + "epoch": 0.58, + "learning_rate": 1.864550511485416e-06, + "loss": 0.8525, + "step": 22541 + }, + { + "epoch": 0.58, + "learning_rate": 1.864536605480421e-06, + "loss": 0.9648, + "step": 22542 + }, + { + "epoch": 0.58, + "learning_rate": 1.86452269881349e-06, + "loss": 1.0527, + "step": 22543 + }, + { + "epoch": 0.58, + "learning_rate": 1.864508791484634e-06, + "loss": 0.958, + "step": 22544 + }, + { + "epoch": 0.58, + "learning_rate": 1.864494883493863e-06, + "loss": 0.9375, + "step": 22545 + }, + { + "epoch": 0.58, + "learning_rate": 1.8644809748411881e-06, + "loss": 0.793, + "step": 22546 + }, + { + "epoch": 0.58, + "learning_rate": 1.8644670655266198e-06, + "loss": 0.9248, + "step": 22547 + }, + { + "epoch": 0.58, + "learning_rate": 1.8644531555501688e-06, + "loss": 0.7646, + "step": 22548 + }, + { + "epoch": 0.58, + "learning_rate": 1.864439244911846e-06, + "loss": 1.0898, + "step": 22549 + }, + { + "epoch": 0.58, + "learning_rate": 1.8644253336116617e-06, + "loss": 0.8828, + "step": 22550 + }, + { + "epoch": 0.58, + "learning_rate": 1.8644114216496268e-06, + "loss": 0.6279, + "step": 22551 + }, + { + "epoch": 0.58, + "learning_rate": 1.8643975090257516e-06, + "loss": 0.7881, + "step": 22552 + }, + { + "epoch": 0.58, + "learning_rate": 1.8643835957400472e-06, + "loss": 0.8555, + "step": 22553 + }, + { + "epoch": 0.58, + "learning_rate": 1.8643696817925235e-06, + "loss": 0.8447, + "step": 22554 + }, + { + "epoch": 0.58, + "learning_rate": 1.8643557671831923e-06, + "loss": 0.6514, + "step": 22555 + }, + { + "epoch": 0.58, + "learning_rate": 1.8643418519120632e-06, + "loss": 0.7563, + "step": 22556 + }, + { + "epoch": 0.58, + "learning_rate": 1.8643279359791475e-06, + "loss": 0.8809, + "step": 22557 + }, + { + "epoch": 0.58, + "learning_rate": 1.8643140193844556e-06, + "loss": 0.8013, + "step": 22558 + }, + { + "epoch": 0.58, + "learning_rate": 1.8643001021279984e-06, + "loss": 0.8848, + "step": 22559 + }, + { + "epoch": 0.58, + "learning_rate": 1.8642861842097859e-06, + "loss": 0.7324, + "step": 22560 + }, + { + "epoch": 0.58, + "learning_rate": 1.8642722656298295e-06, + "loss": 0.7656, + "step": 22561 + }, + { + "epoch": 0.58, + "learning_rate": 1.8642583463881397e-06, + "loss": 0.9258, + "step": 22562 + }, + { + "epoch": 0.58, + "learning_rate": 1.8642444264847268e-06, + "loss": 1.002, + "step": 22563 + }, + { + "epoch": 0.58, + "learning_rate": 1.8642305059196017e-06, + "loss": 0.9229, + "step": 22564 + }, + { + "epoch": 0.58, + "learning_rate": 1.864216584692775e-06, + "loss": 0.9023, + "step": 22565 + }, + { + "epoch": 0.58, + "learning_rate": 1.8642026628042578e-06, + "loss": 0.9609, + "step": 22566 + }, + { + "epoch": 0.58, + "learning_rate": 1.86418874025406e-06, + "loss": 0.9639, + "step": 22567 + }, + { + "epoch": 0.58, + "learning_rate": 1.8641748170421925e-06, + "loss": 1.1895, + "step": 22568 + }, + { + "epoch": 0.58, + "learning_rate": 1.8641608931686663e-06, + "loss": 1.0381, + "step": 22569 + }, + { + "epoch": 0.58, + "learning_rate": 1.864146968633492e-06, + "loss": 0.7427, + "step": 22570 + }, + { + "epoch": 0.58, + "learning_rate": 1.8641330434366798e-06, + "loss": 0.5322, + "step": 22571 + }, + { + "epoch": 0.58, + "learning_rate": 1.8641191175782405e-06, + "loss": 0.8579, + "step": 22572 + }, + { + "epoch": 0.58, + "learning_rate": 1.8641051910581852e-06, + "loss": 0.8965, + "step": 22573 + }, + { + "epoch": 0.58, + "learning_rate": 1.8640912638765243e-06, + "loss": 0.999, + "step": 22574 + }, + { + "epoch": 0.58, + "learning_rate": 1.8640773360332685e-06, + "loss": 1.0684, + "step": 22575 + }, + { + "epoch": 0.58, + "learning_rate": 1.864063407528428e-06, + "loss": 0.8408, + "step": 22576 + }, + { + "epoch": 0.58, + "learning_rate": 1.8640494783620144e-06, + "loss": 0.9258, + "step": 22577 + }, + { + "epoch": 0.58, + "learning_rate": 1.8640355485340376e-06, + "loss": 1.0166, + "step": 22578 + }, + { + "epoch": 0.58, + "learning_rate": 1.8640216180445085e-06, + "loss": 0.9521, + "step": 22579 + }, + { + "epoch": 0.58, + "learning_rate": 1.864007686893438e-06, + "loss": 0.9165, + "step": 22580 + }, + { + "epoch": 0.58, + "learning_rate": 1.8639937550808361e-06, + "loss": 0.8237, + "step": 22581 + }, + { + "epoch": 0.58, + "learning_rate": 1.8639798226067142e-06, + "loss": 0.7471, + "step": 22582 + }, + { + "epoch": 0.58, + "learning_rate": 1.8639658894710828e-06, + "loss": 0.8867, + "step": 22583 + }, + { + "epoch": 0.58, + "learning_rate": 1.8639519556739525e-06, + "loss": 0.7373, + "step": 22584 + }, + { + "epoch": 0.58, + "learning_rate": 1.8639380212153336e-06, + "loss": 0.7705, + "step": 22585 + }, + { + "epoch": 0.58, + "learning_rate": 1.863924086095237e-06, + "loss": 1.1221, + "step": 22586 + }, + { + "epoch": 0.58, + "learning_rate": 1.863910150313674e-06, + "loss": 1.0547, + "step": 22587 + }, + { + "epoch": 0.58, + "learning_rate": 1.8638962138706541e-06, + "loss": 0.6602, + "step": 22588 + }, + { + "epoch": 0.58, + "learning_rate": 1.8638822767661889e-06, + "loss": 0.6733, + "step": 22589 + }, + { + "epoch": 0.58, + "learning_rate": 1.8638683390002887e-06, + "loss": 0.9824, + "step": 22590 + }, + { + "epoch": 0.58, + "learning_rate": 1.8638544005729645e-06, + "loss": 0.9141, + "step": 22591 + }, + { + "epoch": 0.58, + "learning_rate": 1.8638404614842265e-06, + "loss": 1.0566, + "step": 22592 + }, + { + "epoch": 0.58, + "learning_rate": 1.8638265217340854e-06, + "loss": 1.0225, + "step": 22593 + }, + { + "epoch": 0.58, + "learning_rate": 1.8638125813225521e-06, + "loss": 0.9961, + "step": 22594 + }, + { + "epoch": 0.58, + "learning_rate": 1.8637986402496373e-06, + "loss": 0.6484, + "step": 22595 + }, + { + "epoch": 0.58, + "learning_rate": 1.8637846985153516e-06, + "loss": 0.9307, + "step": 22596 + }, + { + "epoch": 0.58, + "learning_rate": 1.8637707561197057e-06, + "loss": 0.6343, + "step": 22597 + }, + { + "epoch": 0.58, + "learning_rate": 1.8637568130627103e-06, + "loss": 0.917, + "step": 22598 + }, + { + "epoch": 0.58, + "learning_rate": 1.863742869344376e-06, + "loss": 0.6523, + "step": 22599 + }, + { + "epoch": 0.58, + "learning_rate": 1.8637289249647137e-06, + "loss": 0.9346, + "step": 22600 + }, + { + "epoch": 0.58, + "learning_rate": 1.8637149799237335e-06, + "loss": 0.9746, + "step": 22601 + }, + { + "epoch": 0.58, + "learning_rate": 1.8637010342214466e-06, + "loss": 0.7397, + "step": 22602 + }, + { + "epoch": 0.58, + "learning_rate": 1.8636870878578636e-06, + "loss": 0.6698, + "step": 22603 + }, + { + "epoch": 0.58, + "learning_rate": 1.8636731408329949e-06, + "loss": 0.8306, + "step": 22604 + }, + { + "epoch": 0.58, + "learning_rate": 1.8636591931468515e-06, + "loss": 0.8594, + "step": 22605 + }, + { + "epoch": 0.58, + "learning_rate": 1.8636452447994441e-06, + "loss": 1.0771, + "step": 22606 + }, + { + "epoch": 0.58, + "learning_rate": 1.8636312957907831e-06, + "loss": 0.7781, + "step": 22607 + }, + { + "epoch": 0.58, + "learning_rate": 1.8636173461208795e-06, + "loss": 0.8828, + "step": 22608 + }, + { + "epoch": 0.58, + "learning_rate": 1.8636033957897434e-06, + "loss": 0.7021, + "step": 22609 + }, + { + "epoch": 0.58, + "learning_rate": 1.8635894447973863e-06, + "loss": 0.7715, + "step": 22610 + }, + { + "epoch": 0.58, + "learning_rate": 1.8635754931438183e-06, + "loss": 0.8057, + "step": 22611 + }, + { + "epoch": 0.58, + "learning_rate": 1.8635615408290503e-06, + "loss": 0.8875, + "step": 22612 + }, + { + "epoch": 0.58, + "learning_rate": 1.863547587853093e-06, + "loss": 0.7139, + "step": 22613 + }, + { + "epoch": 0.58, + "learning_rate": 1.8635336342159568e-06, + "loss": 1.0371, + "step": 22614 + }, + { + "epoch": 0.58, + "learning_rate": 1.863519679917653e-06, + "loss": 0.792, + "step": 22615 + }, + { + "epoch": 0.58, + "learning_rate": 1.8635057249581917e-06, + "loss": 0.7739, + "step": 22616 + }, + { + "epoch": 0.58, + "learning_rate": 1.8634917693375836e-06, + "loss": 0.9062, + "step": 22617 + }, + { + "epoch": 0.58, + "learning_rate": 1.8634778130558397e-06, + "loss": 0.7666, + "step": 22618 + }, + { + "epoch": 0.58, + "learning_rate": 1.8634638561129705e-06, + "loss": 1.0566, + "step": 22619 + }, + { + "epoch": 0.58, + "learning_rate": 1.8634498985089867e-06, + "loss": 0.957, + "step": 22620 + }, + { + "epoch": 0.58, + "learning_rate": 1.863435940243899e-06, + "loss": 0.6963, + "step": 22621 + }, + { + "epoch": 0.58, + "learning_rate": 1.8634219813177183e-06, + "loss": 0.873, + "step": 22622 + }, + { + "epoch": 0.58, + "learning_rate": 1.863408021730455e-06, + "loss": 0.9316, + "step": 22623 + }, + { + "epoch": 0.58, + "learning_rate": 1.8633940614821197e-06, + "loss": 0.9072, + "step": 22624 + }, + { + "epoch": 0.58, + "learning_rate": 1.8633801005727235e-06, + "loss": 0.8291, + "step": 22625 + }, + { + "epoch": 0.58, + "learning_rate": 1.8633661390022767e-06, + "loss": 1.0459, + "step": 22626 + }, + { + "epoch": 0.58, + "learning_rate": 1.8633521767707902e-06, + "loss": 0.7603, + "step": 22627 + }, + { + "epoch": 0.58, + "learning_rate": 1.8633382138782747e-06, + "loss": 0.7007, + "step": 22628 + }, + { + "epoch": 0.58, + "learning_rate": 1.8633242503247409e-06, + "loss": 0.96, + "step": 22629 + }, + { + "epoch": 0.58, + "learning_rate": 1.863310286110199e-06, + "loss": 1.0293, + "step": 22630 + }, + { + "epoch": 0.58, + "learning_rate": 1.8632963212346604e-06, + "loss": 0.9053, + "step": 22631 + }, + { + "epoch": 0.58, + "learning_rate": 1.8632823556981356e-06, + "loss": 0.9434, + "step": 22632 + }, + { + "epoch": 0.58, + "learning_rate": 1.8632683895006348e-06, + "loss": 0.7729, + "step": 22633 + }, + { + "epoch": 0.58, + "learning_rate": 1.8632544226421696e-06, + "loss": 0.8965, + "step": 22634 + }, + { + "epoch": 0.58, + "learning_rate": 1.8632404551227498e-06, + "loss": 1.0459, + "step": 22635 + }, + { + "epoch": 0.58, + "learning_rate": 1.8632264869423868e-06, + "loss": 0.9219, + "step": 22636 + }, + { + "epoch": 0.58, + "learning_rate": 1.8632125181010907e-06, + "loss": 0.8184, + "step": 22637 + }, + { + "epoch": 0.58, + "learning_rate": 1.8631985485988727e-06, + "loss": 1.0283, + "step": 22638 + }, + { + "epoch": 0.58, + "learning_rate": 1.8631845784357432e-06, + "loss": 1.0674, + "step": 22639 + }, + { + "epoch": 0.58, + "learning_rate": 1.8631706076117128e-06, + "loss": 0.915, + "step": 22640 + }, + { + "epoch": 0.58, + "learning_rate": 1.8631566361267926e-06, + "loss": 0.9062, + "step": 22641 + }, + { + "epoch": 0.58, + "learning_rate": 1.8631426639809928e-06, + "loss": 0.7949, + "step": 22642 + }, + { + "epoch": 0.58, + "learning_rate": 1.8631286911743245e-06, + "loss": 0.7578, + "step": 22643 + }, + { + "epoch": 0.58, + "learning_rate": 1.8631147177067983e-06, + "loss": 0.7715, + "step": 22644 + }, + { + "epoch": 0.58, + "learning_rate": 1.8631007435784247e-06, + "loss": 0.9189, + "step": 22645 + }, + { + "epoch": 0.58, + "learning_rate": 1.8630867687892145e-06, + "loss": 0.8203, + "step": 22646 + }, + { + "epoch": 0.58, + "learning_rate": 1.8630727933391786e-06, + "loss": 0.7202, + "step": 22647 + }, + { + "epoch": 0.58, + "learning_rate": 1.8630588172283275e-06, + "loss": 0.8467, + "step": 22648 + }, + { + "epoch": 0.58, + "learning_rate": 1.863044840456672e-06, + "loss": 0.769, + "step": 22649 + }, + { + "epoch": 0.58, + "learning_rate": 1.8630308630242224e-06, + "loss": 0.8706, + "step": 22650 + }, + { + "epoch": 0.58, + "learning_rate": 1.8630168849309903e-06, + "loss": 0.8643, + "step": 22651 + }, + { + "epoch": 0.58, + "learning_rate": 1.8630029061769854e-06, + "loss": 0.9482, + "step": 22652 + }, + { + "epoch": 0.58, + "learning_rate": 1.862988926762219e-06, + "loss": 1.0322, + "step": 22653 + }, + { + "epoch": 0.58, + "learning_rate": 1.8629749466867018e-06, + "loss": 0.7402, + "step": 22654 + }, + { + "epoch": 0.58, + "learning_rate": 1.8629609659504442e-06, + "loss": 0.9111, + "step": 22655 + }, + { + "epoch": 0.58, + "learning_rate": 1.8629469845534574e-06, + "loss": 0.9697, + "step": 22656 + }, + { + "epoch": 0.58, + "learning_rate": 1.8629330024957515e-06, + "loss": 0.8799, + "step": 22657 + }, + { + "epoch": 0.58, + "learning_rate": 1.8629190197773372e-06, + "loss": 0.7725, + "step": 22658 + }, + { + "epoch": 0.58, + "learning_rate": 1.862905036398226e-06, + "loss": 0.6572, + "step": 22659 + }, + { + "epoch": 0.58, + "learning_rate": 1.8628910523584278e-06, + "loss": 0.9482, + "step": 22660 + }, + { + "epoch": 0.58, + "learning_rate": 1.8628770676579537e-06, + "loss": 0.5835, + "step": 22661 + }, + { + "epoch": 0.58, + "learning_rate": 1.862863082296814e-06, + "loss": 0.8857, + "step": 22662 + }, + { + "epoch": 0.58, + "learning_rate": 1.8628490962750201e-06, + "loss": 0.9531, + "step": 22663 + }, + { + "epoch": 0.58, + "learning_rate": 1.8628351095925825e-06, + "loss": 1.0977, + "step": 22664 + }, + { + "epoch": 0.58, + "learning_rate": 1.862821122249511e-06, + "loss": 0.7144, + "step": 22665 + }, + { + "epoch": 0.58, + "learning_rate": 1.8628071342458179e-06, + "loss": 0.7793, + "step": 22666 + }, + { + "epoch": 0.58, + "learning_rate": 1.8627931455815125e-06, + "loss": 0.8125, + "step": 22667 + }, + { + "epoch": 0.58, + "learning_rate": 1.8627791562566063e-06, + "loss": 0.8394, + "step": 22668 + }, + { + "epoch": 0.58, + "learning_rate": 1.8627651662711094e-06, + "loss": 1.0801, + "step": 22669 + }, + { + "epoch": 0.58, + "learning_rate": 1.8627511756250334e-06, + "loss": 0.9785, + "step": 22670 + }, + { + "epoch": 0.58, + "learning_rate": 1.8627371843183882e-06, + "loss": 0.8086, + "step": 22671 + }, + { + "epoch": 0.58, + "learning_rate": 1.8627231923511845e-06, + "loss": 0.9121, + "step": 22672 + }, + { + "epoch": 0.58, + "learning_rate": 1.8627091997234339e-06, + "loss": 0.8613, + "step": 22673 + }, + { + "epoch": 0.58, + "learning_rate": 1.8626952064351462e-06, + "loss": 0.7048, + "step": 22674 + }, + { + "epoch": 0.58, + "learning_rate": 1.8626812124863327e-06, + "loss": 0.9697, + "step": 22675 + }, + { + "epoch": 0.58, + "learning_rate": 1.8626672178770035e-06, + "loss": 1.0293, + "step": 22676 + }, + { + "epoch": 0.58, + "learning_rate": 1.86265322260717e-06, + "loss": 0.8379, + "step": 22677 + }, + { + "epoch": 0.58, + "learning_rate": 1.8626392266768424e-06, + "loss": 0.9004, + "step": 22678 + }, + { + "epoch": 0.58, + "learning_rate": 1.8626252300860319e-06, + "loss": 0.7383, + "step": 22679 + }, + { + "epoch": 0.58, + "learning_rate": 1.8626112328347485e-06, + "loss": 0.8281, + "step": 22680 + }, + { + "epoch": 0.58, + "learning_rate": 1.8625972349230036e-06, + "loss": 0.7178, + "step": 22681 + }, + { + "epoch": 0.58, + "learning_rate": 1.8625832363508075e-06, + "loss": 0.8232, + "step": 22682 + }, + { + "epoch": 0.58, + "learning_rate": 1.8625692371181713e-06, + "loss": 0.791, + "step": 22683 + }, + { + "epoch": 0.58, + "learning_rate": 1.8625552372251057e-06, + "loss": 0.9248, + "step": 22684 + }, + { + "epoch": 0.58, + "learning_rate": 1.8625412366716207e-06, + "loss": 0.7627, + "step": 22685 + }, + { + "epoch": 0.58, + "learning_rate": 1.8625272354577279e-06, + "loss": 1.0791, + "step": 22686 + }, + { + "epoch": 0.58, + "learning_rate": 1.8625132335834376e-06, + "loss": 0.918, + "step": 22687 + }, + { + "epoch": 0.58, + "learning_rate": 1.8624992310487601e-06, + "loss": 0.7725, + "step": 22688 + }, + { + "epoch": 0.58, + "learning_rate": 1.8624852278537074e-06, + "loss": 0.8359, + "step": 22689 + }, + { + "epoch": 0.58, + "learning_rate": 1.862471223998289e-06, + "loss": 0.8027, + "step": 22690 + }, + { + "epoch": 0.58, + "learning_rate": 1.8624572194825156e-06, + "loss": 0.9541, + "step": 22691 + }, + { + "epoch": 0.58, + "learning_rate": 1.8624432143063991e-06, + "loss": 0.7383, + "step": 22692 + }, + { + "epoch": 0.58, + "learning_rate": 1.8624292084699491e-06, + "loss": 1.0918, + "step": 22693 + }, + { + "epoch": 0.58, + "learning_rate": 1.8624152019731766e-06, + "loss": 0.8789, + "step": 22694 + }, + { + "epoch": 0.58, + "learning_rate": 1.8624011948160928e-06, + "loss": 0.8018, + "step": 22695 + }, + { + "epoch": 0.58, + "learning_rate": 1.862387186998708e-06, + "loss": 0.9102, + "step": 22696 + }, + { + "epoch": 0.58, + "learning_rate": 1.862373178521033e-06, + "loss": 1.1152, + "step": 22697 + }, + { + "epoch": 0.58, + "learning_rate": 1.8623591693830782e-06, + "loss": 0.6367, + "step": 22698 + }, + { + "epoch": 0.58, + "learning_rate": 1.862345159584855e-06, + "loss": 0.812, + "step": 22699 + }, + { + "epoch": 0.58, + "learning_rate": 1.8623311491263735e-06, + "loss": 0.8398, + "step": 22700 + }, + { + "epoch": 0.58, + "learning_rate": 1.8623171380076447e-06, + "loss": 0.8, + "step": 22701 + }, + { + "epoch": 0.58, + "learning_rate": 1.8623031262286795e-06, + "loss": 0.9082, + "step": 22702 + }, + { + "epoch": 0.58, + "learning_rate": 1.8622891137894882e-06, + "loss": 0.8838, + "step": 22703 + }, + { + "epoch": 0.58, + "learning_rate": 1.8622751006900818e-06, + "loss": 0.7891, + "step": 22704 + }, + { + "epoch": 0.58, + "learning_rate": 1.8622610869304714e-06, + "loss": 0.7954, + "step": 22705 + }, + { + "epoch": 0.58, + "learning_rate": 1.862247072510667e-06, + "loss": 0.7715, + "step": 22706 + }, + { + "epoch": 0.58, + "learning_rate": 1.8622330574306797e-06, + "loss": 0.7944, + "step": 22707 + }, + { + "epoch": 0.58, + "learning_rate": 1.8622190416905204e-06, + "loss": 0.8213, + "step": 22708 + }, + { + "epoch": 0.58, + "learning_rate": 1.8622050252901993e-06, + "loss": 0.75, + "step": 22709 + }, + { + "epoch": 0.58, + "learning_rate": 1.8621910082297275e-06, + "loss": 1.0059, + "step": 22710 + }, + { + "epoch": 0.58, + "learning_rate": 1.8621769905091158e-06, + "loss": 1.1211, + "step": 22711 + }, + { + "epoch": 0.58, + "learning_rate": 1.8621629721283747e-06, + "loss": 1.0488, + "step": 22712 + }, + { + "epoch": 0.58, + "learning_rate": 1.8621489530875154e-06, + "loss": 0.8477, + "step": 22713 + }, + { + "epoch": 0.58, + "learning_rate": 1.8621349333865478e-06, + "loss": 0.7832, + "step": 22714 + }, + { + "epoch": 0.58, + "learning_rate": 1.8621209130254835e-06, + "loss": 1.0068, + "step": 22715 + }, + { + "epoch": 0.58, + "learning_rate": 1.8621068920043327e-06, + "loss": 0.916, + "step": 22716 + }, + { + "epoch": 0.58, + "learning_rate": 1.8620928703231065e-06, + "loss": 0.7227, + "step": 22717 + }, + { + "epoch": 0.58, + "learning_rate": 1.8620788479818153e-06, + "loss": 0.8271, + "step": 22718 + }, + { + "epoch": 0.58, + "learning_rate": 1.8620648249804699e-06, + "loss": 0.7578, + "step": 22719 + }, + { + "epoch": 0.58, + "learning_rate": 1.862050801319081e-06, + "loss": 1.0068, + "step": 22720 + }, + { + "epoch": 0.58, + "learning_rate": 1.8620367769976597e-06, + "loss": 0.8564, + "step": 22721 + }, + { + "epoch": 0.58, + "learning_rate": 1.862022752016216e-06, + "loss": 0.7485, + "step": 22722 + }, + { + "epoch": 0.58, + "learning_rate": 1.8620087263747617e-06, + "loss": 0.9893, + "step": 22723 + }, + { + "epoch": 0.58, + "learning_rate": 1.8619947000733066e-06, + "loss": 0.8838, + "step": 22724 + }, + { + "epoch": 0.58, + "learning_rate": 1.8619806731118621e-06, + "loss": 0.9688, + "step": 22725 + }, + { + "epoch": 0.58, + "learning_rate": 1.8619666454904384e-06, + "loss": 0.8418, + "step": 22726 + }, + { + "epoch": 0.58, + "learning_rate": 1.8619526172090466e-06, + "loss": 0.9023, + "step": 22727 + }, + { + "epoch": 0.58, + "learning_rate": 1.861938588267697e-06, + "loss": 0.5967, + "step": 22728 + }, + { + "epoch": 0.58, + "learning_rate": 1.861924558666401e-06, + "loss": 0.8425, + "step": 22729 + }, + { + "epoch": 0.58, + "learning_rate": 1.8619105284051689e-06, + "loss": 0.6704, + "step": 22730 + }, + { + "epoch": 0.58, + "learning_rate": 1.8618964974840114e-06, + "loss": 0.9092, + "step": 22731 + }, + { + "epoch": 0.58, + "learning_rate": 1.8618824659029398e-06, + "loss": 0.7568, + "step": 22732 + }, + { + "epoch": 0.58, + "learning_rate": 1.861868433661964e-06, + "loss": 0.8022, + "step": 22733 + }, + { + "epoch": 0.58, + "learning_rate": 1.8618544007610952e-06, + "loss": 0.9062, + "step": 22734 + }, + { + "epoch": 0.58, + "learning_rate": 1.8618403672003442e-06, + "loss": 1.0234, + "step": 22735 + }, + { + "epoch": 0.58, + "learning_rate": 1.8618263329797216e-06, + "loss": 1.0117, + "step": 22736 + }, + { + "epoch": 0.58, + "learning_rate": 1.8618122980992384e-06, + "loss": 0.8037, + "step": 22737 + }, + { + "epoch": 0.58, + "learning_rate": 1.8617982625589051e-06, + "loss": 0.75, + "step": 22738 + }, + { + "epoch": 0.58, + "learning_rate": 1.8617842263587323e-06, + "loss": 0.875, + "step": 22739 + }, + { + "epoch": 0.58, + "learning_rate": 1.8617701894987312e-06, + "loss": 1.0498, + "step": 22740 + }, + { + "epoch": 0.58, + "learning_rate": 1.8617561519789121e-06, + "loss": 0.832, + "step": 22741 + }, + { + "epoch": 0.58, + "learning_rate": 1.861742113799286e-06, + "loss": 0.9082, + "step": 22742 + }, + { + "epoch": 0.58, + "learning_rate": 1.8617280749598633e-06, + "loss": 0.8848, + "step": 22743 + }, + { + "epoch": 0.58, + "learning_rate": 1.8617140354606558e-06, + "loss": 0.9619, + "step": 22744 + }, + { + "epoch": 0.58, + "learning_rate": 1.8616999953016727e-06, + "loss": 0.9033, + "step": 22745 + }, + { + "epoch": 0.58, + "learning_rate": 1.861685954482926e-06, + "loss": 0.8389, + "step": 22746 + }, + { + "epoch": 0.58, + "learning_rate": 1.861671913004426e-06, + "loss": 0.9033, + "step": 22747 + }, + { + "epoch": 0.58, + "learning_rate": 1.861657870866183e-06, + "loss": 0.9902, + "step": 22748 + }, + { + "epoch": 0.58, + "learning_rate": 1.8616438280682084e-06, + "loss": 0.8809, + "step": 22749 + }, + { + "epoch": 0.58, + "learning_rate": 1.861629784610513e-06, + "loss": 0.7412, + "step": 22750 + }, + { + "epoch": 0.58, + "learning_rate": 1.861615740493107e-06, + "loss": 0.877, + "step": 22751 + }, + { + "epoch": 0.58, + "learning_rate": 1.8616016957160014e-06, + "loss": 0.8506, + "step": 22752 + }, + { + "epoch": 0.58, + "learning_rate": 1.8615876502792075e-06, + "loss": 0.9512, + "step": 22753 + }, + { + "epoch": 0.58, + "learning_rate": 1.861573604182735e-06, + "loss": 0.9805, + "step": 22754 + }, + { + "epoch": 0.58, + "learning_rate": 1.8615595574265953e-06, + "loss": 0.8955, + "step": 22755 + }, + { + "epoch": 0.58, + "learning_rate": 1.8615455100107993e-06, + "loss": 0.7588, + "step": 22756 + }, + { + "epoch": 0.58, + "learning_rate": 1.8615314619353573e-06, + "loss": 0.6196, + "step": 22757 + }, + { + "epoch": 0.58, + "learning_rate": 1.8615174132002801e-06, + "loss": 0.6995, + "step": 22758 + }, + { + "epoch": 0.58, + "learning_rate": 1.8615033638055793e-06, + "loss": 0.8193, + "step": 22759 + }, + { + "epoch": 0.58, + "learning_rate": 1.8614893137512644e-06, + "loss": 0.8892, + "step": 22760 + }, + { + "epoch": 0.58, + "learning_rate": 1.861475263037347e-06, + "loss": 0.6191, + "step": 22761 + }, + { + "epoch": 0.58, + "learning_rate": 1.8614612116638374e-06, + "loss": 0.6011, + "step": 22762 + }, + { + "epoch": 0.58, + "learning_rate": 1.8614471596307466e-06, + "loss": 0.8496, + "step": 22763 + }, + { + "epoch": 0.58, + "learning_rate": 1.8614331069380855e-06, + "loss": 0.8418, + "step": 22764 + }, + { + "epoch": 0.58, + "learning_rate": 1.8614190535858648e-06, + "loss": 0.7656, + "step": 22765 + }, + { + "epoch": 0.58, + "learning_rate": 1.861404999574095e-06, + "loss": 0.9761, + "step": 22766 + }, + { + "epoch": 0.58, + "learning_rate": 1.8613909449027866e-06, + "loss": 0.7822, + "step": 22767 + }, + { + "epoch": 0.58, + "learning_rate": 1.861376889571951e-06, + "loss": 0.7383, + "step": 22768 + }, + { + "epoch": 0.58, + "learning_rate": 1.861362833581599e-06, + "loss": 0.8945, + "step": 22769 + }, + { + "epoch": 0.58, + "learning_rate": 1.8613487769317407e-06, + "loss": 0.6841, + "step": 22770 + }, + { + "epoch": 0.58, + "learning_rate": 1.8613347196223877e-06, + "loss": 0.9678, + "step": 22771 + }, + { + "epoch": 0.58, + "learning_rate": 1.8613206616535498e-06, + "loss": 0.8662, + "step": 22772 + }, + { + "epoch": 0.58, + "learning_rate": 1.8613066030252384e-06, + "loss": 0.8652, + "step": 22773 + }, + { + "epoch": 0.58, + "learning_rate": 1.8612925437374644e-06, + "loss": 0.8198, + "step": 22774 + }, + { + "epoch": 0.58, + "learning_rate": 1.8612784837902382e-06, + "loss": 0.6934, + "step": 22775 + }, + { + "epoch": 0.58, + "learning_rate": 1.8612644231835706e-06, + "loss": 1.0205, + "step": 22776 + }, + { + "epoch": 0.58, + "learning_rate": 1.8612503619174723e-06, + "loss": 0.877, + "step": 22777 + }, + { + "epoch": 0.58, + "learning_rate": 1.8612362999919547e-06, + "loss": 0.8652, + "step": 22778 + }, + { + "epoch": 0.58, + "learning_rate": 1.8612222374070274e-06, + "loss": 0.9971, + "step": 22779 + }, + { + "epoch": 0.58, + "learning_rate": 1.8612081741627024e-06, + "loss": 0.8467, + "step": 22780 + }, + { + "epoch": 0.58, + "learning_rate": 1.8611941102589897e-06, + "loss": 1.082, + "step": 22781 + }, + { + "epoch": 0.58, + "learning_rate": 1.8611800456958998e-06, + "loss": 0.8362, + "step": 22782 + }, + { + "epoch": 0.58, + "learning_rate": 1.8611659804734447e-06, + "loss": 0.8066, + "step": 22783 + }, + { + "epoch": 0.58, + "learning_rate": 1.8611519145916338e-06, + "loss": 0.8994, + "step": 22784 + }, + { + "epoch": 0.58, + "learning_rate": 1.8611378480504789e-06, + "loss": 0.6802, + "step": 22785 + }, + { + "epoch": 0.58, + "learning_rate": 1.8611237808499903e-06, + "loss": 1.0205, + "step": 22786 + }, + { + "epoch": 0.58, + "learning_rate": 1.8611097129901787e-06, + "loss": 0.9648, + "step": 22787 + }, + { + "epoch": 0.58, + "learning_rate": 1.8610956444710549e-06, + "loss": 0.8955, + "step": 22788 + }, + { + "epoch": 0.58, + "learning_rate": 1.8610815752926298e-06, + "loss": 1.0342, + "step": 22789 + }, + { + "epoch": 0.58, + "learning_rate": 1.8610675054549143e-06, + "loss": 0.7158, + "step": 22790 + }, + { + "epoch": 0.58, + "learning_rate": 1.861053434957919e-06, + "loss": 1.042, + "step": 22791 + }, + { + "epoch": 0.58, + "learning_rate": 1.8610393638016544e-06, + "loss": 0.8418, + "step": 22792 + }, + { + "epoch": 0.58, + "learning_rate": 1.8610252919861319e-06, + "loss": 1.0967, + "step": 22793 + }, + { + "epoch": 0.58, + "learning_rate": 1.8610112195113616e-06, + "loss": 0.8965, + "step": 22794 + }, + { + "epoch": 0.58, + "learning_rate": 1.8609971463773547e-06, + "loss": 0.8359, + "step": 22795 + }, + { + "epoch": 0.58, + "learning_rate": 1.860983072584122e-06, + "loss": 0.9229, + "step": 22796 + }, + { + "epoch": 0.58, + "learning_rate": 1.860968998131674e-06, + "loss": 0.7832, + "step": 22797 + }, + { + "epoch": 0.58, + "learning_rate": 1.8609549230200217e-06, + "loss": 1.0293, + "step": 22798 + }, + { + "epoch": 0.58, + "learning_rate": 1.8609408472491758e-06, + "loss": 0.9746, + "step": 22799 + }, + { + "epoch": 0.58, + "learning_rate": 1.860926770819147e-06, + "loss": 0.8184, + "step": 22800 + }, + { + "epoch": 0.58, + "learning_rate": 1.8609126937299463e-06, + "loss": 0.7227, + "step": 22801 + }, + { + "epoch": 0.58, + "learning_rate": 1.8608986159815846e-06, + "loss": 1.0479, + "step": 22802 + }, + { + "epoch": 0.58, + "learning_rate": 1.8608845375740719e-06, + "loss": 0.8203, + "step": 22803 + }, + { + "epoch": 0.58, + "learning_rate": 1.8608704585074196e-06, + "loss": 0.7214, + "step": 22804 + }, + { + "epoch": 0.58, + "learning_rate": 1.8608563787816384e-06, + "loss": 0.71, + "step": 22805 + }, + { + "epoch": 0.58, + "learning_rate": 1.8608422983967392e-06, + "loss": 0.8379, + "step": 22806 + }, + { + "epoch": 0.58, + "learning_rate": 1.8608282173527323e-06, + "loss": 0.9326, + "step": 22807 + }, + { + "epoch": 0.58, + "learning_rate": 1.8608141356496291e-06, + "loss": 1.0254, + "step": 22808 + }, + { + "epoch": 0.58, + "learning_rate": 1.8608000532874401e-06, + "loss": 0.9814, + "step": 22809 + }, + { + "epoch": 0.58, + "learning_rate": 1.860785970266176e-06, + "loss": 0.8359, + "step": 22810 + }, + { + "epoch": 0.58, + "learning_rate": 1.860771886585848e-06, + "loss": 0.7842, + "step": 22811 + }, + { + "epoch": 0.58, + "learning_rate": 1.8607578022464661e-06, + "loss": 0.8594, + "step": 22812 + }, + { + "epoch": 0.58, + "learning_rate": 1.8607437172480416e-06, + "loss": 0.6685, + "step": 22813 + }, + { + "epoch": 0.58, + "learning_rate": 1.8607296315905853e-06, + "loss": 0.8682, + "step": 22814 + }, + { + "epoch": 0.58, + "learning_rate": 1.860715545274108e-06, + "loss": 0.9326, + "step": 22815 + }, + { + "epoch": 0.58, + "learning_rate": 1.8607014582986202e-06, + "loss": 0.7705, + "step": 22816 + }, + { + "epoch": 0.58, + "learning_rate": 1.860687370664133e-06, + "loss": 0.8154, + "step": 22817 + }, + { + "epoch": 0.58, + "learning_rate": 1.860673282370657e-06, + "loss": 0.8975, + "step": 22818 + }, + { + "epoch": 0.58, + "learning_rate": 1.860659193418203e-06, + "loss": 0.6465, + "step": 22819 + }, + { + "epoch": 0.58, + "learning_rate": 1.8606451038067818e-06, + "loss": 0.9141, + "step": 22820 + }, + { + "epoch": 0.58, + "learning_rate": 1.8606310135364046e-06, + "loss": 0.9209, + "step": 22821 + }, + { + "epoch": 0.58, + "learning_rate": 1.8606169226070812e-06, + "loss": 0.8154, + "step": 22822 + }, + { + "epoch": 0.58, + "learning_rate": 1.8606028310188232e-06, + "loss": 1.1621, + "step": 22823 + }, + { + "epoch": 0.58, + "learning_rate": 1.8605887387716416e-06, + "loss": 0.981, + "step": 22824 + }, + { + "epoch": 0.59, + "learning_rate": 1.8605746458655462e-06, + "loss": 0.8926, + "step": 22825 + }, + { + "epoch": 0.59, + "learning_rate": 1.8605605523005488e-06, + "loss": 0.9824, + "step": 22826 + }, + { + "epoch": 0.59, + "learning_rate": 1.8605464580766594e-06, + "loss": 0.8945, + "step": 22827 + }, + { + "epoch": 0.59, + "learning_rate": 1.8605323631938892e-06, + "loss": 0.9121, + "step": 22828 + }, + { + "epoch": 0.59, + "learning_rate": 1.8605182676522491e-06, + "loss": 0.877, + "step": 22829 + }, + { + "epoch": 0.59, + "learning_rate": 1.8605041714517498e-06, + "loss": 0.8057, + "step": 22830 + }, + { + "epoch": 0.59, + "learning_rate": 1.860490074592402e-06, + "loss": 0.9326, + "step": 22831 + }, + { + "epoch": 0.59, + "learning_rate": 1.8604759770742162e-06, + "loss": 1.1182, + "step": 22832 + }, + { + "epoch": 0.59, + "learning_rate": 1.8604618788972038e-06, + "loss": 0.8821, + "step": 22833 + }, + { + "epoch": 0.59, + "learning_rate": 1.860447780061375e-06, + "loss": 0.7881, + "step": 22834 + }, + { + "epoch": 0.59, + "learning_rate": 1.8604336805667413e-06, + "loss": 0.8032, + "step": 22835 + }, + { + "epoch": 0.59, + "learning_rate": 1.860419580413313e-06, + "loss": 0.8516, + "step": 22836 + }, + { + "epoch": 0.59, + "learning_rate": 1.8604054796011008e-06, + "loss": 0.9844, + "step": 22837 + }, + { + "epoch": 0.59, + "learning_rate": 1.860391378130116e-06, + "loss": 1.0479, + "step": 22838 + }, + { + "epoch": 0.59, + "learning_rate": 1.8603772760003688e-06, + "loss": 0.9873, + "step": 22839 + }, + { + "epoch": 0.59, + "learning_rate": 1.8603631732118704e-06, + "loss": 0.6646, + "step": 22840 + }, + { + "epoch": 0.59, + "learning_rate": 1.8603490697646313e-06, + "loss": 0.8135, + "step": 22841 + }, + { + "epoch": 0.59, + "learning_rate": 1.8603349656586627e-06, + "loss": 1.0781, + "step": 22842 + }, + { + "epoch": 0.59, + "learning_rate": 1.8603208608939752e-06, + "loss": 1.0156, + "step": 22843 + }, + { + "epoch": 0.59, + "learning_rate": 1.8603067554705794e-06, + "loss": 0.7871, + "step": 22844 + }, + { + "epoch": 0.59, + "learning_rate": 1.8602926493884863e-06, + "loss": 0.8535, + "step": 22845 + }, + { + "epoch": 0.59, + "learning_rate": 1.8602785426477067e-06, + "loss": 0.8428, + "step": 22846 + }, + { + "epoch": 0.59, + "learning_rate": 1.8602644352482514e-06, + "loss": 0.8701, + "step": 22847 + }, + { + "epoch": 0.59, + "learning_rate": 1.860250327190131e-06, + "loss": 0.6709, + "step": 22848 + }, + { + "epoch": 0.59, + "learning_rate": 1.8602362184733566e-06, + "loss": 0.7236, + "step": 22849 + }, + { + "epoch": 0.59, + "learning_rate": 1.860222109097939e-06, + "loss": 0.8457, + "step": 22850 + }, + { + "epoch": 0.59, + "learning_rate": 1.860207999063889e-06, + "loss": 1.1279, + "step": 22851 + }, + { + "epoch": 0.59, + "learning_rate": 1.8601938883712171e-06, + "loss": 0.8315, + "step": 22852 + }, + { + "epoch": 0.59, + "learning_rate": 1.8601797770199343e-06, + "loss": 0.7271, + "step": 22853 + }, + { + "epoch": 0.59, + "learning_rate": 1.8601656650100512e-06, + "loss": 0.7314, + "step": 22854 + }, + { + "epoch": 0.59, + "learning_rate": 1.8601515523415792e-06, + "loss": 0.8462, + "step": 22855 + }, + { + "epoch": 0.59, + "learning_rate": 1.8601374390145285e-06, + "loss": 0.6802, + "step": 22856 + }, + { + "epoch": 0.59, + "learning_rate": 1.86012332502891e-06, + "loss": 1.1279, + "step": 22857 + }, + { + "epoch": 0.59, + "learning_rate": 1.8601092103847348e-06, + "loss": 0.9619, + "step": 22858 + }, + { + "epoch": 0.59, + "learning_rate": 1.8600950950820136e-06, + "loss": 0.8369, + "step": 22859 + }, + { + "epoch": 0.59, + "learning_rate": 1.8600809791207567e-06, + "loss": 0.9346, + "step": 22860 + }, + { + "epoch": 0.59, + "learning_rate": 1.8600668625009758e-06, + "loss": 1.0029, + "step": 22861 + }, + { + "epoch": 0.59, + "learning_rate": 1.8600527452226813e-06, + "loss": 1.1152, + "step": 22862 + }, + { + "epoch": 0.59, + "learning_rate": 1.8600386272858836e-06, + "loss": 0.9658, + "step": 22863 + }, + { + "epoch": 0.59, + "learning_rate": 1.8600245086905942e-06, + "loss": 0.7476, + "step": 22864 + }, + { + "epoch": 0.59, + "learning_rate": 1.8600103894368232e-06, + "loss": 0.9092, + "step": 22865 + }, + { + "epoch": 0.59, + "learning_rate": 1.859996269524582e-06, + "loss": 0.9707, + "step": 22866 + }, + { + "epoch": 0.59, + "learning_rate": 1.859982148953881e-06, + "loss": 0.9248, + "step": 22867 + }, + { + "epoch": 0.59, + "learning_rate": 1.8599680277247317e-06, + "loss": 0.8369, + "step": 22868 + }, + { + "epoch": 0.59, + "learning_rate": 1.8599539058371442e-06, + "loss": 0.7217, + "step": 22869 + }, + { + "epoch": 0.59, + "learning_rate": 1.8599397832911294e-06, + "loss": 1.0244, + "step": 22870 + }, + { + "epoch": 0.59, + "learning_rate": 1.8599256600866981e-06, + "loss": 0.8076, + "step": 22871 + }, + { + "epoch": 0.59, + "learning_rate": 1.8599115362238616e-06, + "loss": 0.8286, + "step": 22872 + }, + { + "epoch": 0.59, + "learning_rate": 1.8598974117026304e-06, + "loss": 1.0137, + "step": 22873 + }, + { + "epoch": 0.59, + "learning_rate": 1.859883286523015e-06, + "loss": 1.0098, + "step": 22874 + }, + { + "epoch": 0.59, + "learning_rate": 1.8598691606850268e-06, + "loss": 0.8613, + "step": 22875 + }, + { + "epoch": 0.59, + "learning_rate": 1.859855034188676e-06, + "loss": 1.124, + "step": 22876 + }, + { + "epoch": 0.59, + "learning_rate": 1.859840907033974e-06, + "loss": 0.8066, + "step": 22877 + }, + { + "epoch": 0.59, + "learning_rate": 1.8598267792209312e-06, + "loss": 0.9668, + "step": 22878 + }, + { + "epoch": 0.59, + "learning_rate": 1.8598126507495586e-06, + "loss": 0.9629, + "step": 22879 + }, + { + "epoch": 0.59, + "learning_rate": 1.859798521619867e-06, + "loss": 1.042, + "step": 22880 + }, + { + "epoch": 0.59, + "learning_rate": 1.8597843918318672e-06, + "loss": 0.7881, + "step": 22881 + }, + { + "epoch": 0.59, + "learning_rate": 1.8597702613855702e-06, + "loss": 0.9131, + "step": 22882 + }, + { + "epoch": 0.59, + "learning_rate": 1.8597561302809865e-06, + "loss": 0.9023, + "step": 22883 + }, + { + "epoch": 0.59, + "learning_rate": 1.8597419985181271e-06, + "loss": 0.9092, + "step": 22884 + }, + { + "epoch": 0.59, + "learning_rate": 1.8597278660970029e-06, + "loss": 0.791, + "step": 22885 + }, + { + "epoch": 0.59, + "learning_rate": 1.8597137330176243e-06, + "loss": 0.6963, + "step": 22886 + }, + { + "epoch": 0.59, + "learning_rate": 1.8596995992800025e-06, + "loss": 0.7522, + "step": 22887 + }, + { + "epoch": 0.59, + "learning_rate": 1.8596854648841482e-06, + "loss": 1.1123, + "step": 22888 + }, + { + "epoch": 0.59, + "learning_rate": 1.8596713298300726e-06, + "loss": 0.8379, + "step": 22889 + }, + { + "epoch": 0.59, + "learning_rate": 1.859657194117786e-06, + "loss": 0.6836, + "step": 22890 + }, + { + "epoch": 0.59, + "learning_rate": 1.8596430577472994e-06, + "loss": 1.2021, + "step": 22891 + }, + { + "epoch": 0.59, + "learning_rate": 1.8596289207186236e-06, + "loss": 0.9121, + "step": 22892 + }, + { + "epoch": 0.59, + "learning_rate": 1.8596147830317693e-06, + "loss": 0.9795, + "step": 22893 + }, + { + "epoch": 0.59, + "learning_rate": 1.8596006446867478e-06, + "loss": 0.9678, + "step": 22894 + }, + { + "epoch": 0.59, + "learning_rate": 1.8595865056835694e-06, + "loss": 0.9893, + "step": 22895 + }, + { + "epoch": 0.59, + "learning_rate": 1.8595723660222453e-06, + "loss": 0.9092, + "step": 22896 + }, + { + "epoch": 0.59, + "learning_rate": 1.859558225702786e-06, + "loss": 0.9014, + "step": 22897 + }, + { + "epoch": 0.59, + "learning_rate": 1.859544084725203e-06, + "loss": 0.791, + "step": 22898 + }, + { + "epoch": 0.59, + "learning_rate": 1.859529943089506e-06, + "loss": 0.9111, + "step": 22899 + }, + { + "epoch": 0.59, + "learning_rate": 1.8595158007957066e-06, + "loss": 0.9121, + "step": 22900 + }, + { + "epoch": 0.59, + "learning_rate": 1.8595016578438156e-06, + "loss": 1.0156, + "step": 22901 + }, + { + "epoch": 0.59, + "learning_rate": 1.8594875142338435e-06, + "loss": 0.7881, + "step": 22902 + }, + { + "epoch": 0.59, + "learning_rate": 1.8594733699658014e-06, + "loss": 0.6758, + "step": 22903 + }, + { + "epoch": 0.59, + "learning_rate": 1.8594592250397004e-06, + "loss": 0.7949, + "step": 22904 + }, + { + "epoch": 0.59, + "learning_rate": 1.8594450794555505e-06, + "loss": 0.8027, + "step": 22905 + }, + { + "epoch": 0.59, + "learning_rate": 1.8594309332133632e-06, + "loss": 0.8853, + "step": 22906 + }, + { + "epoch": 0.59, + "learning_rate": 1.8594167863131492e-06, + "loss": 0.917, + "step": 22907 + }, + { + "epoch": 0.59, + "learning_rate": 1.8594026387549194e-06, + "loss": 1.0391, + "step": 22908 + }, + { + "epoch": 0.59, + "learning_rate": 1.8593884905386843e-06, + "loss": 0.9541, + "step": 22909 + }, + { + "epoch": 0.59, + "learning_rate": 1.859374341664455e-06, + "loss": 0.6118, + "step": 22910 + }, + { + "epoch": 0.59, + "learning_rate": 1.8593601921322421e-06, + "loss": 0.7056, + "step": 22911 + }, + { + "epoch": 0.59, + "learning_rate": 1.859346041942057e-06, + "loss": 0.8813, + "step": 22912 + }, + { + "epoch": 0.59, + "learning_rate": 1.8593318910939098e-06, + "loss": 0.7695, + "step": 22913 + }, + { + "epoch": 0.59, + "learning_rate": 1.859317739587812e-06, + "loss": 0.8691, + "step": 22914 + }, + { + "epoch": 0.59, + "learning_rate": 1.8593035874237739e-06, + "loss": 0.7773, + "step": 22915 + }, + { + "epoch": 0.59, + "learning_rate": 1.8592894346018067e-06, + "loss": 0.8325, + "step": 22916 + }, + { + "epoch": 0.59, + "learning_rate": 1.859275281121921e-06, + "loss": 0.9062, + "step": 22917 + }, + { + "epoch": 0.59, + "learning_rate": 1.8592611269841277e-06, + "loss": 1.0859, + "step": 22918 + }, + { + "epoch": 0.59, + "learning_rate": 1.8592469721884378e-06, + "loss": 0.7725, + "step": 22919 + }, + { + "epoch": 0.59, + "learning_rate": 1.8592328167348618e-06, + "loss": 0.7632, + "step": 22920 + }, + { + "epoch": 0.59, + "learning_rate": 1.8592186606234108e-06, + "loss": 0.9883, + "step": 22921 + }, + { + "epoch": 0.59, + "learning_rate": 1.8592045038540958e-06, + "loss": 1.0332, + "step": 22922 + }, + { + "epoch": 0.59, + "learning_rate": 1.8591903464269273e-06, + "loss": 0.8066, + "step": 22923 + }, + { + "epoch": 0.59, + "learning_rate": 1.8591761883419162e-06, + "loss": 0.8652, + "step": 22924 + }, + { + "epoch": 0.59, + "learning_rate": 1.8591620295990733e-06, + "loss": 0.9883, + "step": 22925 + }, + { + "epoch": 0.59, + "learning_rate": 1.8591478701984098e-06, + "loss": 0.8613, + "step": 22926 + }, + { + "epoch": 0.59, + "learning_rate": 1.859133710139936e-06, + "loss": 0.7407, + "step": 22927 + }, + { + "epoch": 0.59, + "learning_rate": 1.8591195494236632e-06, + "loss": 0.7124, + "step": 22928 + }, + { + "epoch": 0.59, + "learning_rate": 1.8591053880496022e-06, + "loss": 0.6921, + "step": 22929 + }, + { + "epoch": 0.59, + "learning_rate": 1.8590912260177634e-06, + "loss": 0.6821, + "step": 22930 + }, + { + "epoch": 0.59, + "learning_rate": 1.859077063328158e-06, + "loss": 0.7617, + "step": 22931 + }, + { + "epoch": 0.59, + "learning_rate": 1.859062899980797e-06, + "loss": 0.876, + "step": 22932 + }, + { + "epoch": 0.59, + "learning_rate": 1.8590487359756909e-06, + "loss": 0.8682, + "step": 22933 + }, + { + "epoch": 0.59, + "learning_rate": 1.8590345713128506e-06, + "loss": 0.8813, + "step": 22934 + }, + { + "epoch": 0.59, + "learning_rate": 1.859020405992287e-06, + "loss": 0.875, + "step": 22935 + }, + { + "epoch": 0.59, + "learning_rate": 1.8590062400140113e-06, + "loss": 0.8564, + "step": 22936 + }, + { + "epoch": 0.59, + "learning_rate": 1.8589920733780338e-06, + "loss": 0.8213, + "step": 22937 + }, + { + "epoch": 0.59, + "learning_rate": 1.8589779060843656e-06, + "loss": 0.877, + "step": 22938 + }, + { + "epoch": 0.59, + "learning_rate": 1.8589637381330175e-06, + "loss": 0.8301, + "step": 22939 + }, + { + "epoch": 0.59, + "learning_rate": 1.8589495695240002e-06, + "loss": 0.5767, + "step": 22940 + }, + { + "epoch": 0.59, + "learning_rate": 1.8589354002573248e-06, + "loss": 0.8096, + "step": 22941 + }, + { + "epoch": 0.59, + "learning_rate": 1.8589212303330021e-06, + "loss": 0.8408, + "step": 22942 + }, + { + "epoch": 0.59, + "learning_rate": 1.858907059751043e-06, + "loss": 0.8135, + "step": 22943 + }, + { + "epoch": 0.59, + "learning_rate": 1.8588928885114581e-06, + "loss": 0.9854, + "step": 22944 + }, + { + "epoch": 0.59, + "learning_rate": 1.8588787166142587e-06, + "loss": 0.7891, + "step": 22945 + }, + { + "epoch": 0.59, + "learning_rate": 1.8588645440594552e-06, + "loss": 1.0781, + "step": 22946 + }, + { + "epoch": 0.59, + "learning_rate": 1.8588503708470584e-06, + "loss": 0.7791, + "step": 22947 + }, + { + "epoch": 0.59, + "learning_rate": 1.8588361969770795e-06, + "loss": 0.8721, + "step": 22948 + }, + { + "epoch": 0.59, + "learning_rate": 1.8588220224495292e-06, + "loss": 0.9717, + "step": 22949 + }, + { + "epoch": 0.59, + "learning_rate": 1.8588078472644186e-06, + "loss": 0.8132, + "step": 22950 + }, + { + "epoch": 0.59, + "learning_rate": 1.858793671421758e-06, + "loss": 0.793, + "step": 22951 + }, + { + "epoch": 0.59, + "learning_rate": 1.858779494921559e-06, + "loss": 0.8491, + "step": 22952 + }, + { + "epoch": 0.59, + "learning_rate": 1.8587653177638316e-06, + "loss": 1.0293, + "step": 22953 + }, + { + "epoch": 0.59, + "learning_rate": 1.8587511399485871e-06, + "loss": 0.8877, + "step": 22954 + }, + { + "epoch": 0.59, + "learning_rate": 1.8587369614758367e-06, + "loss": 0.8096, + "step": 22955 + }, + { + "epoch": 0.59, + "learning_rate": 1.8587227823455904e-06, + "loss": 1.0264, + "step": 22956 + }, + { + "epoch": 0.59, + "learning_rate": 1.85870860255786e-06, + "loss": 0.9307, + "step": 22957 + }, + { + "epoch": 0.59, + "learning_rate": 1.8586944221126558e-06, + "loss": 0.8555, + "step": 22958 + }, + { + "epoch": 0.59, + "learning_rate": 1.8586802410099885e-06, + "loss": 0.7012, + "step": 22959 + }, + { + "epoch": 0.59, + "learning_rate": 1.8586660592498693e-06, + "loss": 0.8613, + "step": 22960 + }, + { + "epoch": 0.59, + "learning_rate": 1.858651876832309e-06, + "loss": 0.894, + "step": 22961 + }, + { + "epoch": 0.59, + "learning_rate": 1.8586376937573185e-06, + "loss": 0.8916, + "step": 22962 + }, + { + "epoch": 0.59, + "learning_rate": 1.8586235100249085e-06, + "loss": 0.7871, + "step": 22963 + }, + { + "epoch": 0.59, + "learning_rate": 1.8586093256350904e-06, + "loss": 0.9893, + "step": 22964 + }, + { + "epoch": 0.59, + "learning_rate": 1.8585951405878744e-06, + "loss": 0.8779, + "step": 22965 + }, + { + "epoch": 0.59, + "learning_rate": 1.8585809548832714e-06, + "loss": 0.7402, + "step": 22966 + }, + { + "epoch": 0.59, + "learning_rate": 1.8585667685212925e-06, + "loss": 0.9766, + "step": 22967 + }, + { + "epoch": 0.59, + "learning_rate": 1.8585525815019483e-06, + "loss": 0.8018, + "step": 22968 + }, + { + "epoch": 0.59, + "learning_rate": 1.8585383938252503e-06, + "loss": 0.7178, + "step": 22969 + }, + { + "epoch": 0.59, + "learning_rate": 1.8585242054912087e-06, + "loss": 0.8291, + "step": 22970 + }, + { + "epoch": 0.59, + "learning_rate": 1.8585100164998346e-06, + "loss": 0.8535, + "step": 22971 + }, + { + "epoch": 0.59, + "learning_rate": 1.858495826851139e-06, + "loss": 0.8496, + "step": 22972 + }, + { + "epoch": 0.59, + "learning_rate": 1.8584816365451324e-06, + "loss": 0.9258, + "step": 22973 + }, + { + "epoch": 0.59, + "learning_rate": 1.858467445581826e-06, + "loss": 0.7476, + "step": 22974 + }, + { + "epoch": 0.59, + "learning_rate": 1.8584532539612306e-06, + "loss": 0.9229, + "step": 22975 + }, + { + "epoch": 0.59, + "learning_rate": 1.8584390616833567e-06, + "loss": 0.9014, + "step": 22976 + }, + { + "epoch": 0.59, + "learning_rate": 1.8584248687482158e-06, + "loss": 0.7639, + "step": 22977 + }, + { + "epoch": 0.59, + "learning_rate": 1.8584106751558184e-06, + "loss": 0.6694, + "step": 22978 + }, + { + "epoch": 0.59, + "learning_rate": 1.8583964809061751e-06, + "loss": 0.8643, + "step": 22979 + }, + { + "epoch": 0.59, + "learning_rate": 1.8583822859992976e-06, + "loss": 0.8535, + "step": 22980 + }, + { + "epoch": 0.59, + "learning_rate": 1.858368090435196e-06, + "loss": 0.9668, + "step": 22981 + }, + { + "epoch": 0.59, + "learning_rate": 1.8583538942138812e-06, + "loss": 0.8242, + "step": 22982 + }, + { + "epoch": 0.59, + "learning_rate": 1.8583396973353647e-06, + "loss": 0.7949, + "step": 22983 + }, + { + "epoch": 0.59, + "learning_rate": 1.8583254997996568e-06, + "loss": 0.8008, + "step": 22984 + }, + { + "epoch": 0.59, + "learning_rate": 1.8583113016067683e-06, + "loss": 0.7793, + "step": 22985 + }, + { + "epoch": 0.59, + "learning_rate": 1.8582971027567108e-06, + "loss": 0.6836, + "step": 22986 + }, + { + "epoch": 0.59, + "learning_rate": 1.8582829032494942e-06, + "loss": 0.9541, + "step": 22987 + }, + { + "epoch": 0.59, + "learning_rate": 1.8582687030851303e-06, + "loss": 0.792, + "step": 22988 + }, + { + "epoch": 0.59, + "learning_rate": 1.858254502263629e-06, + "loss": 0.8994, + "step": 22989 + }, + { + "epoch": 0.59, + "learning_rate": 1.858240300785002e-06, + "loss": 0.7129, + "step": 22990 + }, + { + "epoch": 0.59, + "learning_rate": 1.85822609864926e-06, + "loss": 0.7295, + "step": 22991 + }, + { + "epoch": 0.59, + "learning_rate": 1.8582118958564135e-06, + "loss": 0.7666, + "step": 22992 + }, + { + "epoch": 0.59, + "learning_rate": 1.8581976924064737e-06, + "loss": 0.8916, + "step": 22993 + }, + { + "epoch": 0.59, + "learning_rate": 1.8581834882994514e-06, + "loss": 0.8652, + "step": 22994 + }, + { + "epoch": 0.59, + "learning_rate": 1.8581692835353576e-06, + "loss": 0.6829, + "step": 22995 + }, + { + "epoch": 0.59, + "learning_rate": 1.8581550781142026e-06, + "loss": 0.9355, + "step": 22996 + }, + { + "epoch": 0.59, + "learning_rate": 1.8581408720359981e-06, + "loss": 0.7217, + "step": 22997 + }, + { + "epoch": 0.59, + "learning_rate": 1.8581266653007544e-06, + "loss": 0.9395, + "step": 22998 + }, + { + "epoch": 0.59, + "learning_rate": 1.8581124579084827e-06, + "loss": 0.8633, + "step": 22999 + }, + { + "epoch": 0.59, + "learning_rate": 1.8580982498591937e-06, + "loss": 0.813, + "step": 23000 + }, + { + "epoch": 0.59, + "learning_rate": 1.8580840411528982e-06, + "loss": 0.96, + "step": 23001 + }, + { + "epoch": 0.59, + "learning_rate": 1.8580698317896073e-06, + "loss": 1.0879, + "step": 23002 + }, + { + "epoch": 0.59, + "learning_rate": 1.8580556217693318e-06, + "loss": 1.0977, + "step": 23003 + }, + { + "epoch": 0.59, + "learning_rate": 1.8580414110920827e-06, + "loss": 0.8652, + "step": 23004 + }, + { + "epoch": 0.59, + "learning_rate": 1.8580271997578706e-06, + "loss": 1.0967, + "step": 23005 + }, + { + "epoch": 0.59, + "learning_rate": 1.8580129877667065e-06, + "loss": 0.8242, + "step": 23006 + }, + { + "epoch": 0.59, + "learning_rate": 1.8579987751186013e-06, + "loss": 0.8691, + "step": 23007 + }, + { + "epoch": 0.59, + "learning_rate": 1.8579845618135659e-06, + "loss": 0.8906, + "step": 23008 + }, + { + "epoch": 0.59, + "learning_rate": 1.8579703478516113e-06, + "loss": 0.9023, + "step": 23009 + }, + { + "epoch": 0.59, + "learning_rate": 1.857956133232748e-06, + "loss": 1.1748, + "step": 23010 + }, + { + "epoch": 0.59, + "learning_rate": 1.8579419179569875e-06, + "loss": 0.9043, + "step": 23011 + }, + { + "epoch": 0.59, + "learning_rate": 1.85792770202434e-06, + "loss": 0.6423, + "step": 23012 + }, + { + "epoch": 0.59, + "learning_rate": 1.857913485434817e-06, + "loss": 0.8486, + "step": 23013 + }, + { + "epoch": 0.59, + "learning_rate": 1.857899268188429e-06, + "loss": 0.678, + "step": 23014 + }, + { + "epoch": 0.59, + "learning_rate": 1.857885050285187e-06, + "loss": 0.7349, + "step": 23015 + }, + { + "epoch": 0.59, + "learning_rate": 1.8578708317251015e-06, + "loss": 0.8887, + "step": 23016 + }, + { + "epoch": 0.59, + "learning_rate": 1.857856612508184e-06, + "loss": 0.8789, + "step": 23017 + }, + { + "epoch": 0.59, + "learning_rate": 1.8578423926344451e-06, + "loss": 0.7686, + "step": 23018 + }, + { + "epoch": 0.59, + "learning_rate": 1.857828172103896e-06, + "loss": 0.793, + "step": 23019 + }, + { + "epoch": 0.59, + "learning_rate": 1.8578139509165468e-06, + "loss": 0.5762, + "step": 23020 + }, + { + "epoch": 0.59, + "learning_rate": 1.8577997290724095e-06, + "loss": 0.8809, + "step": 23021 + }, + { + "epoch": 0.59, + "learning_rate": 1.8577855065714937e-06, + "loss": 1.0342, + "step": 23022 + }, + { + "epoch": 0.59, + "learning_rate": 1.8577712834138115e-06, + "loss": 0.8511, + "step": 23023 + }, + { + "epoch": 0.59, + "learning_rate": 1.8577570595993732e-06, + "loss": 0.9678, + "step": 23024 + }, + { + "epoch": 0.59, + "learning_rate": 1.8577428351281896e-06, + "loss": 0.8887, + "step": 23025 + }, + { + "epoch": 0.59, + "learning_rate": 1.857728610000272e-06, + "loss": 0.6992, + "step": 23026 + }, + { + "epoch": 0.59, + "learning_rate": 1.857714384215631e-06, + "loss": 0.8086, + "step": 23027 + }, + { + "epoch": 0.59, + "learning_rate": 1.8577001577742773e-06, + "loss": 0.9541, + "step": 23028 + }, + { + "epoch": 0.59, + "learning_rate": 1.8576859306762222e-06, + "loss": 0.665, + "step": 23029 + }, + { + "epoch": 0.59, + "learning_rate": 1.8576717029214764e-06, + "loss": 0.7759, + "step": 23030 + }, + { + "epoch": 0.59, + "learning_rate": 1.8576574745100508e-06, + "loss": 0.9531, + "step": 23031 + }, + { + "epoch": 0.59, + "learning_rate": 1.8576432454419562e-06, + "loss": 0.6509, + "step": 23032 + }, + { + "epoch": 0.59, + "learning_rate": 1.8576290157172037e-06, + "loss": 0.9521, + "step": 23033 + }, + { + "epoch": 0.59, + "learning_rate": 1.8576147853358043e-06, + "loss": 0.7515, + "step": 23034 + }, + { + "epoch": 0.59, + "learning_rate": 1.8576005542977682e-06, + "loss": 0.9961, + "step": 23035 + }, + { + "epoch": 0.59, + "learning_rate": 1.8575863226031073e-06, + "loss": 0.7007, + "step": 23036 + }, + { + "epoch": 0.59, + "learning_rate": 1.8575720902518316e-06, + "loss": 1.0703, + "step": 23037 + }, + { + "epoch": 0.59, + "learning_rate": 1.8575578572439526e-06, + "loss": 1.2432, + "step": 23038 + }, + { + "epoch": 0.59, + "learning_rate": 1.857543623579481e-06, + "loss": 1.0059, + "step": 23039 + }, + { + "epoch": 0.59, + "learning_rate": 1.8575293892584276e-06, + "loss": 0.8926, + "step": 23040 + }, + { + "epoch": 0.59, + "learning_rate": 1.8575151542808034e-06, + "loss": 0.9443, + "step": 23041 + }, + { + "epoch": 0.59, + "learning_rate": 1.857500918646619e-06, + "loss": 0.6099, + "step": 23042 + }, + { + "epoch": 0.59, + "learning_rate": 1.8574866823558862e-06, + "loss": 0.9404, + "step": 23043 + }, + { + "epoch": 0.59, + "learning_rate": 1.8574724454086147e-06, + "loss": 0.7817, + "step": 23044 + }, + { + "epoch": 0.59, + "learning_rate": 1.8574582078048163e-06, + "loss": 0.7617, + "step": 23045 + }, + { + "epoch": 0.59, + "learning_rate": 1.8574439695445015e-06, + "loss": 0.8174, + "step": 23046 + }, + { + "epoch": 0.59, + "learning_rate": 1.8574297306276811e-06, + "loss": 0.7275, + "step": 23047 + }, + { + "epoch": 0.59, + "learning_rate": 1.8574154910543661e-06, + "loss": 1.0068, + "step": 23048 + }, + { + "epoch": 0.59, + "learning_rate": 1.857401250824568e-06, + "loss": 0.8057, + "step": 23049 + }, + { + "epoch": 0.59, + "learning_rate": 1.857387009938297e-06, + "loss": 0.9258, + "step": 23050 + }, + { + "epoch": 0.59, + "learning_rate": 1.8573727683955639e-06, + "loss": 0.9658, + "step": 23051 + }, + { + "epoch": 0.59, + "learning_rate": 1.85735852619638e-06, + "loss": 0.7979, + "step": 23052 + }, + { + "epoch": 0.59, + "learning_rate": 1.8573442833407563e-06, + "loss": 0.918, + "step": 23053 + }, + { + "epoch": 0.59, + "learning_rate": 1.8573300398287032e-06, + "loss": 0.7559, + "step": 23054 + }, + { + "epoch": 0.59, + "learning_rate": 1.8573157956602321e-06, + "loss": 0.8623, + "step": 23055 + }, + { + "epoch": 0.59, + "learning_rate": 1.8573015508353537e-06, + "loss": 0.7109, + "step": 23056 + }, + { + "epoch": 0.59, + "learning_rate": 1.857287305354079e-06, + "loss": 0.793, + "step": 23057 + }, + { + "epoch": 0.59, + "learning_rate": 1.8572730592164188e-06, + "loss": 0.8984, + "step": 23058 + }, + { + "epoch": 0.59, + "learning_rate": 1.8572588124223839e-06, + "loss": 0.8975, + "step": 23059 + }, + { + "epoch": 0.59, + "learning_rate": 1.8572445649719854e-06, + "loss": 0.9424, + "step": 23060 + }, + { + "epoch": 0.59, + "learning_rate": 1.8572303168652343e-06, + "loss": 0.8267, + "step": 23061 + }, + { + "epoch": 0.59, + "learning_rate": 1.8572160681021412e-06, + "loss": 0.8652, + "step": 23062 + }, + { + "epoch": 0.59, + "learning_rate": 1.8572018186827172e-06, + "loss": 0.8652, + "step": 23063 + }, + { + "epoch": 0.59, + "learning_rate": 1.8571875686069732e-06, + "loss": 0.9932, + "step": 23064 + }, + { + "epoch": 0.59, + "learning_rate": 1.85717331787492e-06, + "loss": 0.8467, + "step": 23065 + }, + { + "epoch": 0.59, + "learning_rate": 1.857159066486569e-06, + "loss": 0.8999, + "step": 23066 + }, + { + "epoch": 0.59, + "learning_rate": 1.8571448144419302e-06, + "loss": 0.8711, + "step": 23067 + }, + { + "epoch": 0.59, + "learning_rate": 1.8571305617410153e-06, + "loss": 0.9326, + "step": 23068 + }, + { + "epoch": 0.59, + "learning_rate": 1.8571163083838347e-06, + "loss": 0.715, + "step": 23069 + }, + { + "epoch": 0.59, + "learning_rate": 1.8571020543704e-06, + "loss": 0.9277, + "step": 23070 + }, + { + "epoch": 0.59, + "learning_rate": 1.8570877997007212e-06, + "loss": 0.7886, + "step": 23071 + }, + { + "epoch": 0.59, + "learning_rate": 1.85707354437481e-06, + "loss": 0.6389, + "step": 23072 + }, + { + "epoch": 0.59, + "learning_rate": 1.8570592883926767e-06, + "loss": 0.9883, + "step": 23073 + }, + { + "epoch": 0.59, + "learning_rate": 1.857045031754333e-06, + "loss": 0.9473, + "step": 23074 + }, + { + "epoch": 0.59, + "learning_rate": 1.857030774459789e-06, + "loss": 0.8418, + "step": 23075 + }, + { + "epoch": 0.59, + "learning_rate": 1.857016516509056e-06, + "loss": 1.1289, + "step": 23076 + }, + { + "epoch": 0.59, + "learning_rate": 1.8570022579021447e-06, + "loss": 0.894, + "step": 23077 + }, + { + "epoch": 0.59, + "learning_rate": 1.8569879986390663e-06, + "loss": 1.0049, + "step": 23078 + }, + { + "epoch": 0.59, + "learning_rate": 1.8569737387198317e-06, + "loss": 0.9434, + "step": 23079 + }, + { + "epoch": 0.59, + "learning_rate": 1.8569594781444514e-06, + "loss": 0.8506, + "step": 23080 + }, + { + "epoch": 0.59, + "learning_rate": 1.8569452169129368e-06, + "loss": 0.9941, + "step": 23081 + }, + { + "epoch": 0.59, + "learning_rate": 1.8569309550252989e-06, + "loss": 0.7163, + "step": 23082 + }, + { + "epoch": 0.59, + "learning_rate": 1.8569166924815481e-06, + "loss": 0.8701, + "step": 23083 + }, + { + "epoch": 0.59, + "learning_rate": 1.8569024292816956e-06, + "loss": 0.8413, + "step": 23084 + }, + { + "epoch": 0.59, + "learning_rate": 1.8568881654257528e-06, + "loss": 0.7661, + "step": 23085 + }, + { + "epoch": 0.59, + "learning_rate": 1.8568739009137295e-06, + "loss": 0.8481, + "step": 23086 + }, + { + "epoch": 0.59, + "learning_rate": 1.8568596357456374e-06, + "loss": 0.8213, + "step": 23087 + }, + { + "epoch": 0.59, + "learning_rate": 1.8568453699214875e-06, + "loss": 0.6665, + "step": 23088 + }, + { + "epoch": 0.59, + "learning_rate": 1.8568311034412902e-06, + "loss": 0.6992, + "step": 23089 + }, + { + "epoch": 0.59, + "learning_rate": 1.8568168363050568e-06, + "loss": 0.7656, + "step": 23090 + }, + { + "epoch": 0.59, + "learning_rate": 1.8568025685127981e-06, + "loss": 0.9453, + "step": 23091 + }, + { + "epoch": 0.59, + "learning_rate": 1.8567883000645253e-06, + "loss": 0.9219, + "step": 23092 + }, + { + "epoch": 0.59, + "learning_rate": 1.8567740309602488e-06, + "loss": 0.7979, + "step": 23093 + }, + { + "epoch": 0.59, + "learning_rate": 1.85675976119998e-06, + "loss": 0.7798, + "step": 23094 + }, + { + "epoch": 0.59, + "learning_rate": 1.8567454907837297e-06, + "loss": 0.8994, + "step": 23095 + }, + { + "epoch": 0.59, + "learning_rate": 1.8567312197115087e-06, + "loss": 0.8389, + "step": 23096 + }, + { + "epoch": 0.59, + "learning_rate": 1.856716947983328e-06, + "loss": 0.5874, + "step": 23097 + }, + { + "epoch": 0.59, + "learning_rate": 1.8567026755991985e-06, + "loss": 0.8838, + "step": 23098 + }, + { + "epoch": 0.59, + "learning_rate": 1.8566884025591313e-06, + "loss": 0.9561, + "step": 23099 + }, + { + "epoch": 0.59, + "learning_rate": 1.8566741288631369e-06, + "loss": 0.6821, + "step": 23100 + }, + { + "epoch": 0.59, + "learning_rate": 1.8566598545112267e-06, + "loss": 0.9609, + "step": 23101 + }, + { + "epoch": 0.59, + "learning_rate": 1.8566455795034116e-06, + "loss": 1.0264, + "step": 23102 + }, + { + "epoch": 0.59, + "learning_rate": 1.8566313038397022e-06, + "loss": 0.7949, + "step": 23103 + }, + { + "epoch": 0.59, + "learning_rate": 1.8566170275201093e-06, + "loss": 0.7998, + "step": 23104 + }, + { + "epoch": 0.59, + "learning_rate": 1.8566027505446447e-06, + "loss": 0.7583, + "step": 23105 + }, + { + "epoch": 0.59, + "learning_rate": 1.8565884729133184e-06, + "loss": 0.9658, + "step": 23106 + }, + { + "epoch": 0.59, + "learning_rate": 1.8565741946261417e-06, + "loss": 0.7227, + "step": 23107 + }, + { + "epoch": 0.59, + "learning_rate": 1.8565599156831256e-06, + "loss": 0.7998, + "step": 23108 + }, + { + "epoch": 0.59, + "learning_rate": 1.856545636084281e-06, + "loss": 0.8828, + "step": 23109 + }, + { + "epoch": 0.59, + "learning_rate": 1.8565313558296186e-06, + "loss": 0.8848, + "step": 23110 + }, + { + "epoch": 0.59, + "learning_rate": 1.8565170749191496e-06, + "loss": 0.6885, + "step": 23111 + }, + { + "epoch": 0.59, + "learning_rate": 1.8565027933528852e-06, + "loss": 0.5383, + "step": 23112 + }, + { + "epoch": 0.59, + "learning_rate": 1.8564885111308357e-06, + "loss": 0.9863, + "step": 23113 + }, + { + "epoch": 0.59, + "learning_rate": 1.8564742282530124e-06, + "loss": 1.1865, + "step": 23114 + }, + { + "epoch": 0.59, + "learning_rate": 1.856459944719426e-06, + "loss": 1.0459, + "step": 23115 + }, + { + "epoch": 0.59, + "learning_rate": 1.8564456605300878e-06, + "loss": 0.9473, + "step": 23116 + }, + { + "epoch": 0.59, + "learning_rate": 1.8564313756850086e-06, + "loss": 0.7998, + "step": 23117 + }, + { + "epoch": 0.59, + "learning_rate": 1.8564170901841988e-06, + "loss": 0.8154, + "step": 23118 + }, + { + "epoch": 0.59, + "learning_rate": 1.8564028040276702e-06, + "loss": 1.2607, + "step": 23119 + }, + { + "epoch": 0.59, + "learning_rate": 1.8563885172154334e-06, + "loss": 0.9258, + "step": 23120 + }, + { + "epoch": 0.59, + "learning_rate": 1.856374229747499e-06, + "loss": 0.918, + "step": 23121 + }, + { + "epoch": 0.59, + "learning_rate": 1.8563599416238787e-06, + "loss": 0.7744, + "step": 23122 + }, + { + "epoch": 0.59, + "learning_rate": 1.8563456528445824e-06, + "loss": 0.8906, + "step": 23123 + }, + { + "epoch": 0.59, + "learning_rate": 1.856331363409622e-06, + "loss": 0.8066, + "step": 23124 + }, + { + "epoch": 0.59, + "learning_rate": 1.856317073319008e-06, + "loss": 0.9473, + "step": 23125 + }, + { + "epoch": 0.59, + "learning_rate": 1.8563027825727512e-06, + "loss": 0.8398, + "step": 23126 + }, + { + "epoch": 0.59, + "learning_rate": 1.856288491170863e-06, + "loss": 0.8281, + "step": 23127 + }, + { + "epoch": 0.59, + "learning_rate": 1.856274199113354e-06, + "loss": 1.0381, + "step": 23128 + }, + { + "epoch": 0.59, + "learning_rate": 1.856259906400235e-06, + "loss": 0.7236, + "step": 23129 + }, + { + "epoch": 0.59, + "learning_rate": 1.8562456130315173e-06, + "loss": 0.8105, + "step": 23130 + }, + { + "epoch": 0.59, + "learning_rate": 1.8562313190072118e-06, + "loss": 1.0234, + "step": 23131 + }, + { + "epoch": 0.59, + "learning_rate": 1.8562170243273294e-06, + "loss": 0.8135, + "step": 23132 + }, + { + "epoch": 0.59, + "learning_rate": 1.8562027289918807e-06, + "loss": 0.7744, + "step": 23133 + }, + { + "epoch": 0.59, + "learning_rate": 1.8561884330008773e-06, + "loss": 0.9785, + "step": 23134 + }, + { + "epoch": 0.59, + "learning_rate": 1.8561741363543294e-06, + "loss": 0.9375, + "step": 23135 + }, + { + "epoch": 0.59, + "learning_rate": 1.8561598390522486e-06, + "loss": 0.6208, + "step": 23136 + }, + { + "epoch": 0.59, + "learning_rate": 1.8561455410946456e-06, + "loss": 0.7256, + "step": 23137 + }, + { + "epoch": 0.59, + "learning_rate": 1.8561312424815312e-06, + "loss": 0.959, + "step": 23138 + }, + { + "epoch": 0.59, + "learning_rate": 1.8561169432129164e-06, + "loss": 1.0479, + "step": 23139 + }, + { + "epoch": 0.59, + "learning_rate": 1.8561026432888123e-06, + "loss": 0.9805, + "step": 23140 + }, + { + "epoch": 0.59, + "learning_rate": 1.85608834270923e-06, + "loss": 0.8955, + "step": 23141 + }, + { + "epoch": 0.59, + "learning_rate": 1.85607404147418e-06, + "loss": 0.8145, + "step": 23142 + }, + { + "epoch": 0.59, + "learning_rate": 1.8560597395836735e-06, + "loss": 0.7808, + "step": 23143 + }, + { + "epoch": 0.59, + "learning_rate": 1.8560454370377214e-06, + "loss": 0.874, + "step": 23144 + }, + { + "epoch": 0.59, + "learning_rate": 1.8560311338363346e-06, + "loss": 0.8457, + "step": 23145 + }, + { + "epoch": 0.59, + "learning_rate": 1.856016829979524e-06, + "loss": 0.8643, + "step": 23146 + }, + { + "epoch": 0.59, + "learning_rate": 1.8560025254673011e-06, + "loss": 0.9355, + "step": 23147 + }, + { + "epoch": 0.59, + "learning_rate": 1.8559882202996762e-06, + "loss": 1.1523, + "step": 23148 + }, + { + "epoch": 0.59, + "learning_rate": 1.8559739144766605e-06, + "loss": 0.7578, + "step": 23149 + }, + { + "epoch": 0.59, + "learning_rate": 1.855959607998265e-06, + "loss": 0.7773, + "step": 23150 + }, + { + "epoch": 0.59, + "learning_rate": 1.8559453008645006e-06, + "loss": 0.9155, + "step": 23151 + }, + { + "epoch": 0.59, + "learning_rate": 1.8559309930753779e-06, + "loss": 0.7031, + "step": 23152 + }, + { + "epoch": 0.59, + "learning_rate": 1.8559166846309085e-06, + "loss": 0.9912, + "step": 23153 + }, + { + "epoch": 0.59, + "learning_rate": 1.855902375531103e-06, + "loss": 0.66, + "step": 23154 + }, + { + "epoch": 0.59, + "learning_rate": 1.8558880657759723e-06, + "loss": 0.9893, + "step": 23155 + }, + { + "epoch": 0.59, + "learning_rate": 1.8558737553655276e-06, + "loss": 0.9629, + "step": 23156 + }, + { + "epoch": 0.59, + "learning_rate": 1.8558594442997797e-06, + "loss": 0.9033, + "step": 23157 + }, + { + "epoch": 0.59, + "learning_rate": 1.8558451325787394e-06, + "loss": 0.7891, + "step": 23158 + }, + { + "epoch": 0.59, + "learning_rate": 1.855830820202418e-06, + "loss": 0.8359, + "step": 23159 + }, + { + "epoch": 0.59, + "learning_rate": 1.8558165071708266e-06, + "loss": 1.0215, + "step": 23160 + }, + { + "epoch": 0.59, + "learning_rate": 1.8558021934839752e-06, + "loss": 0.9663, + "step": 23161 + }, + { + "epoch": 0.59, + "learning_rate": 1.855787879141876e-06, + "loss": 0.7061, + "step": 23162 + }, + { + "epoch": 0.59, + "learning_rate": 1.855773564144539e-06, + "loss": 0.8564, + "step": 23163 + }, + { + "epoch": 0.59, + "learning_rate": 1.8557592484919756e-06, + "loss": 0.8018, + "step": 23164 + }, + { + "epoch": 0.59, + "learning_rate": 1.8557449321841969e-06, + "loss": 0.8418, + "step": 23165 + }, + { + "epoch": 0.59, + "learning_rate": 1.8557306152212133e-06, + "loss": 0.8184, + "step": 23166 + }, + { + "epoch": 0.59, + "learning_rate": 1.8557162976030364e-06, + "loss": 0.8398, + "step": 23167 + }, + { + "epoch": 0.59, + "learning_rate": 1.8557019793296766e-06, + "loss": 0.9814, + "step": 23168 + }, + { + "epoch": 0.59, + "learning_rate": 1.8556876604011453e-06, + "loss": 0.7549, + "step": 23169 + }, + { + "epoch": 0.59, + "learning_rate": 1.8556733408174536e-06, + "loss": 0.9375, + "step": 23170 + }, + { + "epoch": 0.59, + "learning_rate": 1.8556590205786119e-06, + "loss": 0.4932, + "step": 23171 + }, + { + "epoch": 0.59, + "learning_rate": 1.8556446996846314e-06, + "loss": 0.9346, + "step": 23172 + }, + { + "epoch": 0.59, + "learning_rate": 1.8556303781355229e-06, + "loss": 0.833, + "step": 23173 + }, + { + "epoch": 0.59, + "learning_rate": 1.855616055931298e-06, + "loss": 0.8438, + "step": 23174 + }, + { + "epoch": 0.59, + "learning_rate": 1.855601733071967e-06, + "loss": 0.8896, + "step": 23175 + }, + { + "epoch": 0.59, + "learning_rate": 1.855587409557541e-06, + "loss": 1.0762, + "step": 23176 + }, + { + "epoch": 0.59, + "learning_rate": 1.8555730853880315e-06, + "loss": 0.6772, + "step": 23177 + }, + { + "epoch": 0.59, + "learning_rate": 1.8555587605634484e-06, + "loss": 0.7373, + "step": 23178 + }, + { + "epoch": 0.59, + "learning_rate": 1.8555444350838037e-06, + "loss": 1.1572, + "step": 23179 + }, + { + "epoch": 0.59, + "learning_rate": 1.8555301089491078e-06, + "loss": 0.9346, + "step": 23180 + }, + { + "epoch": 0.59, + "learning_rate": 1.855515782159372e-06, + "loss": 0.7852, + "step": 23181 + }, + { + "epoch": 0.59, + "learning_rate": 1.855501454714607e-06, + "loss": 0.8579, + "step": 23182 + }, + { + "epoch": 0.59, + "learning_rate": 1.8554871266148237e-06, + "loss": 0.8818, + "step": 23183 + }, + { + "epoch": 0.59, + "learning_rate": 1.8554727978600336e-06, + "loss": 0.9658, + "step": 23184 + }, + { + "epoch": 0.59, + "learning_rate": 1.8554584684502471e-06, + "loss": 0.7983, + "step": 23185 + }, + { + "epoch": 0.59, + "learning_rate": 1.8554441383854752e-06, + "loss": 1.1074, + "step": 23186 + }, + { + "epoch": 0.59, + "learning_rate": 1.8554298076657292e-06, + "loss": 0.853, + "step": 23187 + }, + { + "epoch": 0.59, + "learning_rate": 1.85541547629102e-06, + "loss": 0.8259, + "step": 23188 + }, + { + "epoch": 0.59, + "learning_rate": 1.8554011442613588e-06, + "loss": 0.9893, + "step": 23189 + }, + { + "epoch": 0.59, + "learning_rate": 1.855386811576756e-06, + "loss": 0.8174, + "step": 23190 + }, + { + "epoch": 0.59, + "learning_rate": 1.8553724782372225e-06, + "loss": 0.8818, + "step": 23191 + }, + { + "epoch": 0.59, + "learning_rate": 1.8553581442427703e-06, + "loss": 0.8916, + "step": 23192 + }, + { + "epoch": 0.59, + "learning_rate": 1.8553438095934093e-06, + "loss": 0.7759, + "step": 23193 + }, + { + "epoch": 0.59, + "learning_rate": 1.8553294742891508e-06, + "loss": 0.8652, + "step": 23194 + }, + { + "epoch": 0.59, + "learning_rate": 1.855315138330006e-06, + "loss": 0.9863, + "step": 23195 + }, + { + "epoch": 0.59, + "learning_rate": 1.8553008017159856e-06, + "loss": 0.7568, + "step": 23196 + }, + { + "epoch": 0.59, + "learning_rate": 1.8552864644471011e-06, + "loss": 0.9209, + "step": 23197 + }, + { + "epoch": 0.59, + "learning_rate": 1.8552721265233625e-06, + "loss": 0.8711, + "step": 23198 + }, + { + "epoch": 0.59, + "learning_rate": 1.855257787944782e-06, + "loss": 0.8574, + "step": 23199 + }, + { + "epoch": 0.59, + "learning_rate": 1.8552434487113695e-06, + "loss": 0.8877, + "step": 23200 + }, + { + "epoch": 0.59, + "learning_rate": 1.8552291088231366e-06, + "loss": 0.8135, + "step": 23201 + }, + { + "epoch": 0.59, + "learning_rate": 1.8552147682800937e-06, + "loss": 0.8062, + "step": 23202 + }, + { + "epoch": 0.59, + "learning_rate": 1.8552004270822528e-06, + "loss": 0.8691, + "step": 23203 + }, + { + "epoch": 0.59, + "learning_rate": 1.855186085229624e-06, + "loss": 0.8389, + "step": 23204 + }, + { + "epoch": 0.59, + "learning_rate": 1.8551717427222182e-06, + "loss": 0.9521, + "step": 23205 + }, + { + "epoch": 0.59, + "learning_rate": 1.855157399560047e-06, + "loss": 1.0137, + "step": 23206 + }, + { + "epoch": 0.59, + "learning_rate": 1.8551430557431211e-06, + "loss": 0.7124, + "step": 23207 + }, + { + "epoch": 0.59, + "learning_rate": 1.8551287112714515e-06, + "loss": 0.9492, + "step": 23208 + }, + { + "epoch": 0.59, + "learning_rate": 1.8551143661450492e-06, + "loss": 0.7354, + "step": 23209 + }, + { + "epoch": 0.59, + "learning_rate": 1.855100020363925e-06, + "loss": 1.0186, + "step": 23210 + }, + { + "epoch": 0.59, + "learning_rate": 1.8550856739280902e-06, + "loss": 0.7451, + "step": 23211 + }, + { + "epoch": 0.59, + "learning_rate": 1.8550713268375557e-06, + "loss": 1.0879, + "step": 23212 + }, + { + "epoch": 0.59, + "learning_rate": 1.8550569790923322e-06, + "loss": 0.8027, + "step": 23213 + }, + { + "epoch": 0.59, + "learning_rate": 1.8550426306924307e-06, + "loss": 0.7617, + "step": 23214 + }, + { + "epoch": 0.6, + "learning_rate": 1.8550282816378626e-06, + "loss": 0.8369, + "step": 23215 + }, + { + "epoch": 0.6, + "learning_rate": 1.855013931928639e-06, + "loss": 1.041, + "step": 23216 + }, + { + "epoch": 0.6, + "learning_rate": 1.8549995815647701e-06, + "loss": 0.8066, + "step": 23217 + }, + { + "epoch": 0.6, + "learning_rate": 1.8549852305462675e-06, + "loss": 0.9189, + "step": 23218 + }, + { + "epoch": 0.6, + "learning_rate": 1.854970878873142e-06, + "loss": 0.6304, + "step": 23219 + }, + { + "epoch": 0.6, + "learning_rate": 1.8549565265454046e-06, + "loss": 0.8975, + "step": 23220 + }, + { + "epoch": 0.6, + "learning_rate": 1.8549421735630662e-06, + "loss": 0.9736, + "step": 23221 + }, + { + "epoch": 0.6, + "learning_rate": 1.854927819926138e-06, + "loss": 0.9043, + "step": 23222 + }, + { + "epoch": 0.6, + "learning_rate": 1.8549134656346306e-06, + "loss": 0.9951, + "step": 23223 + }, + { + "epoch": 0.6, + "learning_rate": 1.8548991106885556e-06, + "loss": 0.8994, + "step": 23224 + }, + { + "epoch": 0.6, + "learning_rate": 1.8548847550879236e-06, + "loss": 0.9551, + "step": 23225 + }, + { + "epoch": 0.6, + "learning_rate": 1.8548703988327456e-06, + "loss": 0.8584, + "step": 23226 + }, + { + "epoch": 0.6, + "learning_rate": 1.8548560419230329e-06, + "loss": 0.8906, + "step": 23227 + }, + { + "epoch": 0.6, + "learning_rate": 1.8548416843587958e-06, + "loss": 0.9551, + "step": 23228 + }, + { + "epoch": 0.6, + "learning_rate": 1.854827326140046e-06, + "loss": 0.812, + "step": 23229 + }, + { + "epoch": 0.6, + "learning_rate": 1.8548129672667941e-06, + "loss": 0.8975, + "step": 23230 + }, + { + "epoch": 0.6, + "learning_rate": 1.8547986077390512e-06, + "loss": 1.0205, + "step": 23231 + }, + { + "epoch": 0.6, + "learning_rate": 1.8547842475568286e-06, + "loss": 0.9648, + "step": 23232 + }, + { + "epoch": 0.6, + "learning_rate": 1.8547698867201367e-06, + "loss": 0.8311, + "step": 23233 + }, + { + "epoch": 0.6, + "learning_rate": 1.8547555252289868e-06, + "loss": 0.9424, + "step": 23234 + }, + { + "epoch": 0.6, + "learning_rate": 1.8547411630833901e-06, + "loss": 1.0771, + "step": 23235 + }, + { + "epoch": 0.6, + "learning_rate": 1.8547268002833571e-06, + "loss": 0.9619, + "step": 23236 + }, + { + "epoch": 0.6, + "learning_rate": 1.8547124368288993e-06, + "loss": 0.8779, + "step": 23237 + }, + { + "epoch": 0.6, + "learning_rate": 1.8546980727200276e-06, + "loss": 0.9297, + "step": 23238 + }, + { + "epoch": 0.6, + "learning_rate": 1.8546837079567528e-06, + "loss": 0.5815, + "step": 23239 + }, + { + "epoch": 0.6, + "learning_rate": 1.8546693425390858e-06, + "loss": 0.9131, + "step": 23240 + }, + { + "epoch": 0.6, + "learning_rate": 1.8546549764670378e-06, + "loss": 0.8838, + "step": 23241 + }, + { + "epoch": 0.6, + "learning_rate": 1.85464060974062e-06, + "loss": 0.791, + "step": 23242 + }, + { + "epoch": 0.6, + "learning_rate": 1.8546262423598432e-06, + "loss": 0.8711, + "step": 23243 + }, + { + "epoch": 0.6, + "learning_rate": 1.8546118743247182e-06, + "loss": 1.0332, + "step": 23244 + }, + { + "epoch": 0.6, + "learning_rate": 1.8545975056352562e-06, + "loss": 0.7803, + "step": 23245 + }, + { + "epoch": 0.6, + "learning_rate": 1.854583136291468e-06, + "loss": 0.8018, + "step": 23246 + }, + { + "epoch": 0.6, + "learning_rate": 1.8545687662933654e-06, + "loss": 0.7939, + "step": 23247 + }, + { + "epoch": 0.6, + "learning_rate": 1.8545543956409584e-06, + "loss": 0.9131, + "step": 23248 + }, + { + "epoch": 0.6, + "learning_rate": 1.8545400243342582e-06, + "loss": 0.9512, + "step": 23249 + }, + { + "epoch": 0.6, + "learning_rate": 1.8545256523732765e-06, + "loss": 0.9932, + "step": 23250 + }, + { + "epoch": 0.6, + "learning_rate": 1.8545112797580233e-06, + "loss": 0.8008, + "step": 23251 + }, + { + "epoch": 0.6, + "learning_rate": 1.8544969064885104e-06, + "loss": 0.8203, + "step": 23252 + }, + { + "epoch": 0.6, + "learning_rate": 1.8544825325647481e-06, + "loss": 0.9092, + "step": 23253 + }, + { + "epoch": 0.6, + "learning_rate": 1.8544681579867483e-06, + "loss": 0.7158, + "step": 23254 + }, + { + "epoch": 0.6, + "learning_rate": 1.8544537827545215e-06, + "loss": 0.8984, + "step": 23255 + }, + { + "epoch": 0.6, + "learning_rate": 1.8544394068680785e-06, + "loss": 0.7705, + "step": 23256 + }, + { + "epoch": 0.6, + "learning_rate": 1.8544250303274307e-06, + "loss": 0.9531, + "step": 23257 + }, + { + "epoch": 0.6, + "learning_rate": 1.8544106531325888e-06, + "loss": 0.7969, + "step": 23258 + }, + { + "epoch": 0.6, + "learning_rate": 1.8543962752835639e-06, + "loss": 0.9648, + "step": 23259 + }, + { + "epoch": 0.6, + "learning_rate": 1.8543818967803672e-06, + "loss": 0.9795, + "step": 23260 + }, + { + "epoch": 0.6, + "learning_rate": 1.8543675176230097e-06, + "loss": 0.7715, + "step": 23261 + }, + { + "epoch": 0.6, + "learning_rate": 1.8543531378115017e-06, + "loss": 0.8076, + "step": 23262 + }, + { + "epoch": 0.6, + "learning_rate": 1.8543387573458555e-06, + "loss": 0.7085, + "step": 23263 + }, + { + "epoch": 0.6, + "learning_rate": 1.854324376226081e-06, + "loss": 1.041, + "step": 23264 + }, + { + "epoch": 0.6, + "learning_rate": 1.8543099944521896e-06, + "loss": 0.9854, + "step": 23265 + }, + { + "epoch": 0.6, + "learning_rate": 1.8542956120241927e-06, + "loss": 0.7939, + "step": 23266 + }, + { + "epoch": 0.6, + "learning_rate": 1.8542812289421006e-06, + "loss": 0.7793, + "step": 23267 + }, + { + "epoch": 0.6, + "learning_rate": 1.8542668452059246e-06, + "loss": 1.0225, + "step": 23268 + }, + { + "epoch": 0.6, + "learning_rate": 1.8542524608156757e-06, + "loss": 0.728, + "step": 23269 + }, + { + "epoch": 0.6, + "learning_rate": 1.854238075771365e-06, + "loss": 1.0117, + "step": 23270 + }, + { + "epoch": 0.6, + "learning_rate": 1.8542236900730038e-06, + "loss": 1.0371, + "step": 23271 + }, + { + "epoch": 0.6, + "learning_rate": 1.8542093037206026e-06, + "loss": 0.752, + "step": 23272 + }, + { + "epoch": 0.6, + "learning_rate": 1.8541949167141726e-06, + "loss": 0.7397, + "step": 23273 + }, + { + "epoch": 0.6, + "learning_rate": 1.8541805290537247e-06, + "loss": 0.8872, + "step": 23274 + }, + { + "epoch": 0.6, + "learning_rate": 1.8541661407392704e-06, + "loss": 0.8369, + "step": 23275 + }, + { + "epoch": 0.6, + "learning_rate": 1.85415175177082e-06, + "loss": 1.0049, + "step": 23276 + }, + { + "epoch": 0.6, + "learning_rate": 1.854137362148385e-06, + "loss": 0.7432, + "step": 23277 + }, + { + "epoch": 0.6, + "learning_rate": 1.8541229718719763e-06, + "loss": 0.7822, + "step": 23278 + }, + { + "epoch": 0.6, + "learning_rate": 1.854108580941605e-06, + "loss": 0.9727, + "step": 23279 + }, + { + "epoch": 0.6, + "learning_rate": 1.854094189357282e-06, + "loss": 0.8779, + "step": 23280 + }, + { + "epoch": 0.6, + "learning_rate": 1.8540797971190183e-06, + "loss": 0.9014, + "step": 23281 + }, + { + "epoch": 0.6, + "learning_rate": 1.854065404226825e-06, + "loss": 0.9307, + "step": 23282 + }, + { + "epoch": 0.6, + "learning_rate": 1.8540510106807133e-06, + "loss": 0.9121, + "step": 23283 + }, + { + "epoch": 0.6, + "learning_rate": 1.8540366164806937e-06, + "loss": 0.8701, + "step": 23284 + }, + { + "epoch": 0.6, + "learning_rate": 1.8540222216267775e-06, + "loss": 0.8096, + "step": 23285 + }, + { + "epoch": 0.6, + "learning_rate": 1.854007826118976e-06, + "loss": 0.9971, + "step": 23286 + }, + { + "epoch": 0.6, + "learning_rate": 1.8539934299572998e-06, + "loss": 0.5437, + "step": 23287 + }, + { + "epoch": 0.6, + "learning_rate": 1.85397903314176e-06, + "loss": 0.8906, + "step": 23288 + }, + { + "epoch": 0.6, + "learning_rate": 1.8539646356723679e-06, + "loss": 0.7759, + "step": 23289 + }, + { + "epoch": 0.6, + "learning_rate": 1.8539502375491344e-06, + "loss": 0.8135, + "step": 23290 + }, + { + "epoch": 0.6, + "learning_rate": 1.8539358387720705e-06, + "loss": 0.8467, + "step": 23291 + }, + { + "epoch": 0.6, + "learning_rate": 1.853921439341187e-06, + "loss": 0.8457, + "step": 23292 + }, + { + "epoch": 0.6, + "learning_rate": 1.8539070392564953e-06, + "loss": 0.876, + "step": 23293 + }, + { + "epoch": 0.6, + "learning_rate": 1.853892638518006e-06, + "loss": 0.6216, + "step": 23294 + }, + { + "epoch": 0.6, + "learning_rate": 1.8538782371257305e-06, + "loss": 1.0479, + "step": 23295 + }, + { + "epoch": 0.6, + "learning_rate": 1.85386383507968e-06, + "loss": 0.7129, + "step": 23296 + }, + { + "epoch": 0.6, + "learning_rate": 1.8538494323798645e-06, + "loss": 0.9541, + "step": 23297 + }, + { + "epoch": 0.6, + "learning_rate": 1.8538350290262966e-06, + "loss": 0.8818, + "step": 23298 + }, + { + "epoch": 0.6, + "learning_rate": 1.853820625018986e-06, + "loss": 1.0244, + "step": 23299 + }, + { + "epoch": 0.6, + "learning_rate": 1.8538062203579441e-06, + "loss": 0.7832, + "step": 23300 + }, + { + "epoch": 0.6, + "learning_rate": 1.8537918150431824e-06, + "loss": 0.6724, + "step": 23301 + }, + { + "epoch": 0.6, + "learning_rate": 1.8537774090747113e-06, + "loss": 0.7803, + "step": 23302 + }, + { + "epoch": 0.6, + "learning_rate": 1.8537630024525422e-06, + "loss": 0.8877, + "step": 23303 + }, + { + "epoch": 0.6, + "learning_rate": 1.8537485951766861e-06, + "loss": 0.7773, + "step": 23304 + }, + { + "epoch": 0.6, + "learning_rate": 1.8537341872471538e-06, + "loss": 0.8872, + "step": 23305 + }, + { + "epoch": 0.6, + "learning_rate": 1.8537197786639562e-06, + "loss": 0.7227, + "step": 23306 + }, + { + "epoch": 0.6, + "learning_rate": 1.8537053694271052e-06, + "loss": 0.876, + "step": 23307 + }, + { + "epoch": 0.6, + "learning_rate": 1.8536909595366109e-06, + "loss": 1.0, + "step": 23308 + }, + { + "epoch": 0.6, + "learning_rate": 1.8536765489924848e-06, + "loss": 1.0669, + "step": 23309 + }, + { + "epoch": 0.6, + "learning_rate": 1.8536621377947379e-06, + "loss": 0.7432, + "step": 23310 + }, + { + "epoch": 0.6, + "learning_rate": 1.853647725943381e-06, + "loss": 1.0391, + "step": 23311 + }, + { + "epoch": 0.6, + "learning_rate": 1.8536333134384255e-06, + "loss": 0.9717, + "step": 23312 + }, + { + "epoch": 0.6, + "learning_rate": 1.853618900279882e-06, + "loss": 1.0039, + "step": 23313 + }, + { + "epoch": 0.6, + "learning_rate": 1.8536044864677618e-06, + "loss": 0.686, + "step": 23314 + }, + { + "epoch": 0.6, + "learning_rate": 1.8535900720020758e-06, + "loss": 1.0176, + "step": 23315 + }, + { + "epoch": 0.6, + "learning_rate": 1.8535756568828353e-06, + "loss": 0.834, + "step": 23316 + }, + { + "epoch": 0.6, + "learning_rate": 1.8535612411100514e-06, + "loss": 1.085, + "step": 23317 + }, + { + "epoch": 0.6, + "learning_rate": 1.8535468246837345e-06, + "loss": 0.8408, + "step": 23318 + }, + { + "epoch": 0.6, + "learning_rate": 1.8535324076038962e-06, + "loss": 0.708, + "step": 23319 + }, + { + "epoch": 0.6, + "learning_rate": 1.8535179898705473e-06, + "loss": 0.6953, + "step": 23320 + }, + { + "epoch": 0.6, + "learning_rate": 1.853503571483699e-06, + "loss": 0.875, + "step": 23321 + }, + { + "epoch": 0.6, + "learning_rate": 1.8534891524433624e-06, + "loss": 0.7148, + "step": 23322 + }, + { + "epoch": 0.6, + "learning_rate": 1.853474732749548e-06, + "loss": 0.8135, + "step": 23323 + }, + { + "epoch": 0.6, + "learning_rate": 1.8534603124022675e-06, + "loss": 0.8057, + "step": 23324 + }, + { + "epoch": 0.6, + "learning_rate": 1.8534458914015318e-06, + "loss": 0.9268, + "step": 23325 + }, + { + "epoch": 0.6, + "learning_rate": 1.8534314697473516e-06, + "loss": 1.0596, + "step": 23326 + }, + { + "epoch": 0.6, + "learning_rate": 1.8534170474397384e-06, + "loss": 0.7988, + "step": 23327 + }, + { + "epoch": 0.6, + "learning_rate": 1.853402624478703e-06, + "loss": 0.7837, + "step": 23328 + }, + { + "epoch": 0.6, + "learning_rate": 1.853388200864256e-06, + "loss": 0.9854, + "step": 23329 + }, + { + "epoch": 0.6, + "learning_rate": 1.8533737765964093e-06, + "loss": 0.7456, + "step": 23330 + }, + { + "epoch": 0.6, + "learning_rate": 1.8533593516751735e-06, + "loss": 0.9258, + "step": 23331 + }, + { + "epoch": 0.6, + "learning_rate": 1.8533449261005596e-06, + "loss": 0.6421, + "step": 23332 + }, + { + "epoch": 0.6, + "learning_rate": 1.853330499872579e-06, + "loss": 0.7612, + "step": 23333 + }, + { + "epoch": 0.6, + "learning_rate": 1.853316072991242e-06, + "loss": 0.71, + "step": 23334 + }, + { + "epoch": 0.6, + "learning_rate": 1.8533016454565603e-06, + "loss": 0.9375, + "step": 23335 + }, + { + "epoch": 0.6, + "learning_rate": 1.853287217268545e-06, + "loss": 0.9106, + "step": 23336 + }, + { + "epoch": 0.6, + "learning_rate": 1.8532727884272067e-06, + "loss": 1.0967, + "step": 23337 + }, + { + "epoch": 0.6, + "learning_rate": 1.8532583589325568e-06, + "loss": 0.8394, + "step": 23338 + }, + { + "epoch": 0.6, + "learning_rate": 1.853243928784606e-06, + "loss": 0.8633, + "step": 23339 + }, + { + "epoch": 0.6, + "learning_rate": 1.8532294979833655e-06, + "loss": 1.1152, + "step": 23340 + }, + { + "epoch": 0.6, + "learning_rate": 1.8532150665288466e-06, + "loss": 0.8467, + "step": 23341 + }, + { + "epoch": 0.6, + "learning_rate": 1.8532006344210602e-06, + "loss": 0.9043, + "step": 23342 + }, + { + "epoch": 0.6, + "learning_rate": 1.853186201660017e-06, + "loss": 0.8379, + "step": 23343 + }, + { + "epoch": 0.6, + "learning_rate": 1.8531717682457289e-06, + "loss": 1.0, + "step": 23344 + }, + { + "epoch": 0.6, + "learning_rate": 1.853157334178206e-06, + "loss": 1.0312, + "step": 23345 + }, + { + "epoch": 0.6, + "learning_rate": 1.8531428994574598e-06, + "loss": 0.8926, + "step": 23346 + }, + { + "epoch": 0.6, + "learning_rate": 1.8531284640835014e-06, + "loss": 1.0088, + "step": 23347 + }, + { + "epoch": 0.6, + "learning_rate": 1.8531140280563418e-06, + "loss": 0.998, + "step": 23348 + }, + { + "epoch": 0.6, + "learning_rate": 1.853099591375992e-06, + "loss": 0.7383, + "step": 23349 + }, + { + "epoch": 0.6, + "learning_rate": 1.8530851540424628e-06, + "loss": 0.7139, + "step": 23350 + }, + { + "epoch": 0.6, + "learning_rate": 1.8530707160557659e-06, + "loss": 0.6792, + "step": 23351 + }, + { + "epoch": 0.6, + "learning_rate": 1.8530562774159118e-06, + "loss": 0.7686, + "step": 23352 + }, + { + "epoch": 0.6, + "learning_rate": 1.8530418381229115e-06, + "loss": 0.8291, + "step": 23353 + }, + { + "epoch": 0.6, + "learning_rate": 1.8530273981767768e-06, + "loss": 1.0049, + "step": 23354 + }, + { + "epoch": 0.6, + "learning_rate": 1.8530129575775178e-06, + "loss": 0.6597, + "step": 23355 + }, + { + "epoch": 0.6, + "learning_rate": 1.8529985163251463e-06, + "loss": 0.916, + "step": 23356 + }, + { + "epoch": 0.6, + "learning_rate": 1.8529840744196728e-06, + "loss": 0.8311, + "step": 23357 + }, + { + "epoch": 0.6, + "learning_rate": 1.8529696318611089e-06, + "loss": 0.8887, + "step": 23358 + }, + { + "epoch": 0.6, + "learning_rate": 1.8529551886494652e-06, + "loss": 0.5752, + "step": 23359 + }, + { + "epoch": 0.6, + "learning_rate": 1.852940744784753e-06, + "loss": 0.7783, + "step": 23360 + }, + { + "epoch": 0.6, + "learning_rate": 1.8529263002669833e-06, + "loss": 0.5933, + "step": 23361 + }, + { + "epoch": 0.6, + "learning_rate": 1.8529118550961668e-06, + "loss": 0.8242, + "step": 23362 + }, + { + "epoch": 0.6, + "learning_rate": 1.8528974092723153e-06, + "loss": 0.8438, + "step": 23363 + }, + { + "epoch": 0.6, + "learning_rate": 1.8528829627954394e-06, + "loss": 0.9414, + "step": 23364 + }, + { + "epoch": 0.6, + "learning_rate": 1.8528685156655501e-06, + "loss": 0.7637, + "step": 23365 + }, + { + "epoch": 0.6, + "learning_rate": 1.8528540678826587e-06, + "loss": 0.7324, + "step": 23366 + }, + { + "epoch": 0.6, + "learning_rate": 1.8528396194467763e-06, + "loss": 0.9805, + "step": 23367 + }, + { + "epoch": 0.6, + "learning_rate": 1.8528251703579137e-06, + "loss": 0.9521, + "step": 23368 + }, + { + "epoch": 0.6, + "learning_rate": 1.8528107206160822e-06, + "loss": 0.6919, + "step": 23369 + }, + { + "epoch": 0.6, + "learning_rate": 1.8527962702212925e-06, + "loss": 0.8867, + "step": 23370 + }, + { + "epoch": 0.6, + "learning_rate": 1.8527818191735559e-06, + "loss": 0.8447, + "step": 23371 + }, + { + "epoch": 0.6, + "learning_rate": 1.8527673674728836e-06, + "loss": 0.96, + "step": 23372 + }, + { + "epoch": 0.6, + "learning_rate": 1.8527529151192866e-06, + "loss": 0.8916, + "step": 23373 + }, + { + "epoch": 0.6, + "learning_rate": 1.8527384621127757e-06, + "loss": 0.9619, + "step": 23374 + }, + { + "epoch": 0.6, + "learning_rate": 1.8527240084533622e-06, + "loss": 0.7432, + "step": 23375 + }, + { + "epoch": 0.6, + "learning_rate": 1.8527095541410572e-06, + "loss": 0.9375, + "step": 23376 + }, + { + "epoch": 0.6, + "learning_rate": 1.8526950991758722e-06, + "loss": 0.9141, + "step": 23377 + }, + { + "epoch": 0.6, + "learning_rate": 1.852680643557817e-06, + "loss": 0.8047, + "step": 23378 + }, + { + "epoch": 0.6, + "learning_rate": 1.8526661872869037e-06, + "loss": 0.8926, + "step": 23379 + }, + { + "epoch": 0.6, + "learning_rate": 1.8526517303631432e-06, + "loss": 0.7012, + "step": 23380 + }, + { + "epoch": 0.6, + "learning_rate": 1.8526372727865465e-06, + "loss": 0.8164, + "step": 23381 + }, + { + "epoch": 0.6, + "learning_rate": 1.8526228145571245e-06, + "loss": 0.8848, + "step": 23382 + }, + { + "epoch": 0.6, + "learning_rate": 1.8526083556748885e-06, + "loss": 0.8516, + "step": 23383 + }, + { + "epoch": 0.6, + "learning_rate": 1.8525938961398495e-06, + "loss": 0.8916, + "step": 23384 + }, + { + "epoch": 0.6, + "learning_rate": 1.8525794359520183e-06, + "loss": 0.5647, + "step": 23385 + }, + { + "epoch": 0.6, + "learning_rate": 1.8525649751114068e-06, + "loss": 0.876, + "step": 23386 + }, + { + "epoch": 0.6, + "learning_rate": 1.852550513618025e-06, + "loss": 0.5786, + "step": 23387 + }, + { + "epoch": 0.6, + "learning_rate": 1.8525360514718847e-06, + "loss": 0.5396, + "step": 23388 + }, + { + "epoch": 0.6, + "learning_rate": 1.8525215886729965e-06, + "loss": 0.8018, + "step": 23389 + }, + { + "epoch": 0.6, + "learning_rate": 1.852507125221372e-06, + "loss": 0.9375, + "step": 23390 + }, + { + "epoch": 0.6, + "learning_rate": 1.8524926611170218e-06, + "loss": 0.7988, + "step": 23391 + }, + { + "epoch": 0.6, + "learning_rate": 1.8524781963599574e-06, + "loss": 0.7705, + "step": 23392 + }, + { + "epoch": 0.6, + "learning_rate": 1.8524637309501895e-06, + "loss": 0.7627, + "step": 23393 + }, + { + "epoch": 0.6, + "learning_rate": 1.8524492648877293e-06, + "loss": 0.7754, + "step": 23394 + }, + { + "epoch": 0.6, + "learning_rate": 1.852434798172588e-06, + "loss": 0.9434, + "step": 23395 + }, + { + "epoch": 0.6, + "learning_rate": 1.8524203308047763e-06, + "loss": 1.0547, + "step": 23396 + }, + { + "epoch": 0.6, + "learning_rate": 1.8524058627843058e-06, + "loss": 0.603, + "step": 23397 + }, + { + "epoch": 0.6, + "learning_rate": 1.8523913941111872e-06, + "loss": 0.875, + "step": 23398 + }, + { + "epoch": 0.6, + "learning_rate": 1.8523769247854318e-06, + "loss": 0.7681, + "step": 23399 + }, + { + "epoch": 0.6, + "learning_rate": 1.8523624548070505e-06, + "loss": 0.9727, + "step": 23400 + }, + { + "epoch": 0.6, + "learning_rate": 1.8523479841760548e-06, + "loss": 0.9424, + "step": 23401 + }, + { + "epoch": 0.6, + "learning_rate": 1.852333512892455e-06, + "loss": 0.6812, + "step": 23402 + }, + { + "epoch": 0.6, + "learning_rate": 1.8523190409562628e-06, + "loss": 0.6714, + "step": 23403 + }, + { + "epoch": 0.6, + "learning_rate": 1.852304568367489e-06, + "loss": 0.6383, + "step": 23404 + }, + { + "epoch": 0.6, + "learning_rate": 1.8522900951261448e-06, + "loss": 0.7168, + "step": 23405 + }, + { + "epoch": 0.6, + "learning_rate": 1.8522756212322412e-06, + "loss": 0.8867, + "step": 23406 + }, + { + "epoch": 0.6, + "learning_rate": 1.8522611466857896e-06, + "loss": 0.7593, + "step": 23407 + }, + { + "epoch": 0.6, + "learning_rate": 1.8522466714868007e-06, + "loss": 1.0234, + "step": 23408 + }, + { + "epoch": 0.6, + "learning_rate": 1.8522321956352855e-06, + "loss": 0.8584, + "step": 23409 + }, + { + "epoch": 0.6, + "learning_rate": 1.8522177191312556e-06, + "loss": 0.7842, + "step": 23410 + }, + { + "epoch": 0.6, + "learning_rate": 1.8522032419747217e-06, + "loss": 0.9473, + "step": 23411 + }, + { + "epoch": 0.6, + "learning_rate": 1.852188764165695e-06, + "loss": 0.7811, + "step": 23412 + }, + { + "epoch": 0.6, + "learning_rate": 1.8521742857041864e-06, + "loss": 0.8916, + "step": 23413 + }, + { + "epoch": 0.6, + "learning_rate": 1.8521598065902074e-06, + "loss": 0.7466, + "step": 23414 + }, + { + "epoch": 0.6, + "learning_rate": 1.8521453268237685e-06, + "loss": 0.9199, + "step": 23415 + }, + { + "epoch": 0.6, + "learning_rate": 1.8521308464048812e-06, + "loss": 0.8955, + "step": 23416 + }, + { + "epoch": 0.6, + "learning_rate": 1.8521163653335565e-06, + "loss": 0.9111, + "step": 23417 + }, + { + "epoch": 0.6, + "learning_rate": 1.8521018836098055e-06, + "loss": 0.835, + "step": 23418 + }, + { + "epoch": 0.6, + "learning_rate": 1.8520874012336394e-06, + "loss": 0.9912, + "step": 23419 + }, + { + "epoch": 0.6, + "learning_rate": 1.852072918205069e-06, + "loss": 0.9336, + "step": 23420 + }, + { + "epoch": 0.6, + "learning_rate": 1.8520584345241055e-06, + "loss": 0.7236, + "step": 23421 + }, + { + "epoch": 0.6, + "learning_rate": 1.8520439501907603e-06, + "loss": 0.8877, + "step": 23422 + }, + { + "epoch": 0.6, + "learning_rate": 1.8520294652050439e-06, + "loss": 0.7002, + "step": 23423 + }, + { + "epoch": 0.6, + "learning_rate": 1.8520149795669679e-06, + "loss": 1.0801, + "step": 23424 + }, + { + "epoch": 0.6, + "learning_rate": 1.8520004932765431e-06, + "loss": 0.7583, + "step": 23425 + }, + { + "epoch": 0.6, + "learning_rate": 1.8519860063337806e-06, + "loss": 0.9248, + "step": 23426 + }, + { + "epoch": 0.6, + "learning_rate": 1.8519715187386922e-06, + "loss": 0.8154, + "step": 23427 + }, + { + "epoch": 0.6, + "learning_rate": 1.8519570304912878e-06, + "loss": 0.8726, + "step": 23428 + }, + { + "epoch": 0.6, + "learning_rate": 1.8519425415915793e-06, + "loss": 0.7148, + "step": 23429 + }, + { + "epoch": 0.6, + "learning_rate": 1.8519280520395773e-06, + "loss": 0.8281, + "step": 23430 + }, + { + "epoch": 0.6, + "learning_rate": 1.8519135618352935e-06, + "loss": 0.8018, + "step": 23431 + }, + { + "epoch": 0.6, + "learning_rate": 1.8518990709787383e-06, + "loss": 0.8271, + "step": 23432 + }, + { + "epoch": 0.6, + "learning_rate": 1.8518845794699234e-06, + "loss": 0.9844, + "step": 23433 + }, + { + "epoch": 0.6, + "learning_rate": 1.8518700873088596e-06, + "loss": 0.9131, + "step": 23434 + }, + { + "epoch": 0.6, + "learning_rate": 1.851855594495558e-06, + "loss": 0.9609, + "step": 23435 + }, + { + "epoch": 0.6, + "learning_rate": 1.85184110103003e-06, + "loss": 0.8848, + "step": 23436 + }, + { + "epoch": 0.6, + "learning_rate": 1.8518266069122862e-06, + "loss": 0.8447, + "step": 23437 + }, + { + "epoch": 0.6, + "learning_rate": 1.8518121121423378e-06, + "loss": 0.8379, + "step": 23438 + }, + { + "epoch": 0.6, + "learning_rate": 1.8517976167201964e-06, + "loss": 1.2822, + "step": 23439 + }, + { + "epoch": 0.6, + "learning_rate": 1.8517831206458725e-06, + "loss": 0.4434, + "step": 23440 + }, + { + "epoch": 0.6, + "learning_rate": 1.8517686239193772e-06, + "loss": 0.7192, + "step": 23441 + }, + { + "epoch": 0.6, + "learning_rate": 1.8517541265407224e-06, + "loss": 0.9014, + "step": 23442 + }, + { + "epoch": 0.6, + "learning_rate": 1.851739628509918e-06, + "loss": 1.1426, + "step": 23443 + }, + { + "epoch": 0.6, + "learning_rate": 1.8517251298269763e-06, + "loss": 0.7417, + "step": 23444 + }, + { + "epoch": 0.6, + "learning_rate": 1.8517106304919074e-06, + "loss": 0.9824, + "step": 23445 + }, + { + "epoch": 0.6, + "learning_rate": 1.8516961305047231e-06, + "loss": 0.8242, + "step": 23446 + }, + { + "epoch": 0.6, + "learning_rate": 1.851681629865434e-06, + "loss": 0.8525, + "step": 23447 + }, + { + "epoch": 0.6, + "learning_rate": 1.8516671285740518e-06, + "loss": 0.8936, + "step": 23448 + }, + { + "epoch": 0.6, + "learning_rate": 1.851652626630587e-06, + "loss": 0.8232, + "step": 23449 + }, + { + "epoch": 0.6, + "learning_rate": 1.8516381240350509e-06, + "loss": 0.96, + "step": 23450 + }, + { + "epoch": 0.6, + "learning_rate": 1.8516236207874547e-06, + "loss": 0.8936, + "step": 23451 + }, + { + "epoch": 0.6, + "learning_rate": 1.8516091168878093e-06, + "loss": 0.9639, + "step": 23452 + }, + { + "epoch": 0.6, + "learning_rate": 1.8515946123361263e-06, + "loss": 0.9844, + "step": 23453 + }, + { + "epoch": 0.6, + "learning_rate": 1.8515801071324164e-06, + "loss": 1.0225, + "step": 23454 + }, + { + "epoch": 0.6, + "learning_rate": 1.8515656012766905e-06, + "loss": 0.7959, + "step": 23455 + }, + { + "epoch": 0.6, + "learning_rate": 1.8515510947689603e-06, + "loss": 0.9854, + "step": 23456 + }, + { + "epoch": 0.6, + "learning_rate": 1.8515365876092363e-06, + "loss": 0.79, + "step": 23457 + }, + { + "epoch": 0.6, + "learning_rate": 1.85152207979753e-06, + "loss": 1.1094, + "step": 23458 + }, + { + "epoch": 0.6, + "learning_rate": 1.8515075713338523e-06, + "loss": 0.7466, + "step": 23459 + }, + { + "epoch": 0.6, + "learning_rate": 1.8514930622182145e-06, + "loss": 0.8848, + "step": 23460 + }, + { + "epoch": 0.6, + "learning_rate": 1.8514785524506278e-06, + "loss": 0.7676, + "step": 23461 + }, + { + "epoch": 0.6, + "learning_rate": 1.851464042031103e-06, + "loss": 1.0771, + "step": 23462 + }, + { + "epoch": 0.6, + "learning_rate": 1.8514495309596511e-06, + "loss": 0.9424, + "step": 23463 + }, + { + "epoch": 0.6, + "learning_rate": 1.8514350192362837e-06, + "loss": 0.7578, + "step": 23464 + }, + { + "epoch": 0.6, + "learning_rate": 1.8514205068610116e-06, + "loss": 0.8516, + "step": 23465 + }, + { + "epoch": 0.6, + "learning_rate": 1.851405993833846e-06, + "loss": 0.7563, + "step": 23466 + }, + { + "epoch": 0.6, + "learning_rate": 1.851391480154798e-06, + "loss": 0.8691, + "step": 23467 + }, + { + "epoch": 0.6, + "learning_rate": 1.8513769658238784e-06, + "loss": 1.0146, + "step": 23468 + }, + { + "epoch": 0.6, + "learning_rate": 1.851362450841099e-06, + "loss": 0.8789, + "step": 23469 + }, + { + "epoch": 0.6, + "learning_rate": 1.8513479352064703e-06, + "loss": 0.5679, + "step": 23470 + }, + { + "epoch": 0.6, + "learning_rate": 1.8513334189200038e-06, + "loss": 0.8306, + "step": 23471 + }, + { + "epoch": 0.6, + "learning_rate": 1.8513189019817101e-06, + "loss": 1.0195, + "step": 23472 + }, + { + "epoch": 0.6, + "learning_rate": 1.8513043843916009e-06, + "loss": 0.7324, + "step": 23473 + }, + { + "epoch": 0.6, + "learning_rate": 1.8512898661496873e-06, + "loss": 0.915, + "step": 23474 + }, + { + "epoch": 0.6, + "learning_rate": 1.8512753472559797e-06, + "loss": 1.041, + "step": 23475 + }, + { + "epoch": 0.6, + "learning_rate": 1.8512608277104902e-06, + "loss": 0.8457, + "step": 23476 + }, + { + "epoch": 0.6, + "learning_rate": 1.8512463075132292e-06, + "loss": 0.7471, + "step": 23477 + }, + { + "epoch": 0.6, + "learning_rate": 1.8512317866642077e-06, + "loss": 0.8408, + "step": 23478 + }, + { + "epoch": 0.6, + "learning_rate": 1.8512172651634378e-06, + "loss": 0.8203, + "step": 23479 + }, + { + "epoch": 0.6, + "learning_rate": 1.8512027430109293e-06, + "loss": 0.7388, + "step": 23480 + }, + { + "epoch": 0.6, + "learning_rate": 1.8511882202066947e-06, + "loss": 0.9551, + "step": 23481 + }, + { + "epoch": 0.6, + "learning_rate": 1.8511736967507438e-06, + "loss": 1.1182, + "step": 23482 + }, + { + "epoch": 0.6, + "learning_rate": 1.8511591726430889e-06, + "loss": 0.9141, + "step": 23483 + }, + { + "epoch": 0.6, + "learning_rate": 1.8511446478837402e-06, + "loss": 0.8296, + "step": 23484 + }, + { + "epoch": 0.6, + "learning_rate": 1.8511301224727091e-06, + "loss": 0.7861, + "step": 23485 + }, + { + "epoch": 0.6, + "learning_rate": 1.8511155964100071e-06, + "loss": 0.8809, + "step": 23486 + }, + { + "epoch": 0.6, + "learning_rate": 1.851101069695645e-06, + "loss": 0.7725, + "step": 23487 + }, + { + "epoch": 0.6, + "learning_rate": 1.8510865423296337e-06, + "loss": 0.7738, + "step": 23488 + }, + { + "epoch": 0.6, + "learning_rate": 1.8510720143119848e-06, + "loss": 0.7245, + "step": 23489 + }, + { + "epoch": 0.6, + "learning_rate": 1.8510574856427091e-06, + "loss": 0.8979, + "step": 23490 + }, + { + "epoch": 0.6, + "learning_rate": 1.8510429563218178e-06, + "loss": 0.8516, + "step": 23491 + }, + { + "epoch": 0.6, + "learning_rate": 1.851028426349322e-06, + "loss": 0.7095, + "step": 23492 + }, + { + "epoch": 0.6, + "learning_rate": 1.851013895725233e-06, + "loss": 0.9131, + "step": 23493 + }, + { + "epoch": 0.6, + "learning_rate": 1.8509993644495619e-06, + "loss": 1.0332, + "step": 23494 + }, + { + "epoch": 0.6, + "learning_rate": 1.8509848325223195e-06, + "loss": 0.5791, + "step": 23495 + }, + { + "epoch": 0.6, + "learning_rate": 1.850970299943517e-06, + "loss": 0.6465, + "step": 23496 + }, + { + "epoch": 0.6, + "learning_rate": 1.8509557667131657e-06, + "loss": 1.001, + "step": 23497 + }, + { + "epoch": 0.6, + "learning_rate": 1.850941232831277e-06, + "loss": 0.7158, + "step": 23498 + }, + { + "epoch": 0.6, + "learning_rate": 1.8509266982978615e-06, + "loss": 0.8281, + "step": 23499 + }, + { + "epoch": 0.6, + "learning_rate": 1.8509121631129308e-06, + "loss": 0.856, + "step": 23500 + }, + { + "epoch": 0.6, + "learning_rate": 1.8508976272764954e-06, + "loss": 1.0039, + "step": 23501 + }, + { + "epoch": 0.6, + "learning_rate": 1.8508830907885671e-06, + "loss": 0.874, + "step": 23502 + }, + { + "epoch": 0.6, + "learning_rate": 1.8508685536491566e-06, + "loss": 0.8955, + "step": 23503 + }, + { + "epoch": 0.6, + "learning_rate": 1.8508540158582753e-06, + "loss": 1.0166, + "step": 23504 + }, + { + "epoch": 0.6, + "learning_rate": 1.850839477415934e-06, + "loss": 0.8076, + "step": 23505 + }, + { + "epoch": 0.6, + "learning_rate": 1.8508249383221442e-06, + "loss": 0.7266, + "step": 23506 + }, + { + "epoch": 0.6, + "learning_rate": 1.8508103985769168e-06, + "loss": 1.0215, + "step": 23507 + }, + { + "epoch": 0.6, + "learning_rate": 1.850795858180263e-06, + "loss": 0.958, + "step": 23508 + }, + { + "epoch": 0.6, + "learning_rate": 1.8507813171321941e-06, + "loss": 0.6426, + "step": 23509 + }, + { + "epoch": 0.6, + "learning_rate": 1.8507667754327208e-06, + "loss": 0.7305, + "step": 23510 + }, + { + "epoch": 0.6, + "learning_rate": 1.8507522330818547e-06, + "loss": 0.8906, + "step": 23511 + }, + { + "epoch": 0.6, + "learning_rate": 1.8507376900796067e-06, + "loss": 0.9453, + "step": 23512 + }, + { + "epoch": 0.6, + "learning_rate": 1.8507231464259881e-06, + "loss": 0.9424, + "step": 23513 + }, + { + "epoch": 0.6, + "learning_rate": 1.8507086021210097e-06, + "loss": 1.0186, + "step": 23514 + }, + { + "epoch": 0.6, + "learning_rate": 1.8506940571646827e-06, + "loss": 0.9648, + "step": 23515 + }, + { + "epoch": 0.6, + "learning_rate": 1.8506795115570186e-06, + "loss": 1.002, + "step": 23516 + }, + { + "epoch": 0.6, + "learning_rate": 1.8506649652980281e-06, + "loss": 1.0918, + "step": 23517 + }, + { + "epoch": 0.6, + "learning_rate": 1.850650418387723e-06, + "loss": 0.7051, + "step": 23518 + }, + { + "epoch": 0.6, + "learning_rate": 1.8506358708261136e-06, + "loss": 0.8564, + "step": 23519 + }, + { + "epoch": 0.6, + "learning_rate": 1.8506213226132114e-06, + "loss": 1.1924, + "step": 23520 + }, + { + "epoch": 0.6, + "learning_rate": 1.8506067737490279e-06, + "loss": 0.7539, + "step": 23521 + }, + { + "epoch": 0.6, + "learning_rate": 1.8505922242335736e-06, + "loss": 0.9736, + "step": 23522 + }, + { + "epoch": 0.6, + "learning_rate": 1.85057767406686e-06, + "loss": 0.8789, + "step": 23523 + }, + { + "epoch": 0.6, + "learning_rate": 1.8505631232488984e-06, + "loss": 0.9746, + "step": 23524 + }, + { + "epoch": 0.6, + "learning_rate": 1.8505485717796993e-06, + "loss": 1.0332, + "step": 23525 + }, + { + "epoch": 0.6, + "learning_rate": 1.8505340196592747e-06, + "loss": 0.8701, + "step": 23526 + }, + { + "epoch": 0.6, + "learning_rate": 1.8505194668876348e-06, + "loss": 0.7588, + "step": 23527 + }, + { + "epoch": 0.6, + "learning_rate": 1.8505049134647918e-06, + "loss": 0.9409, + "step": 23528 + }, + { + "epoch": 0.6, + "learning_rate": 1.8504903593907562e-06, + "loss": 0.6562, + "step": 23529 + }, + { + "epoch": 0.6, + "learning_rate": 1.850475804665539e-06, + "loss": 0.9395, + "step": 23530 + }, + { + "epoch": 0.6, + "learning_rate": 1.850461249289152e-06, + "loss": 0.7959, + "step": 23531 + }, + { + "epoch": 0.6, + "learning_rate": 1.8504466932616055e-06, + "loss": 0.8159, + "step": 23532 + }, + { + "epoch": 0.6, + "learning_rate": 1.8504321365829111e-06, + "loss": 0.7656, + "step": 23533 + }, + { + "epoch": 0.6, + "learning_rate": 1.8504175792530801e-06, + "loss": 0.9531, + "step": 23534 + }, + { + "epoch": 0.6, + "learning_rate": 1.8504030212721233e-06, + "loss": 0.7725, + "step": 23535 + }, + { + "epoch": 0.6, + "learning_rate": 1.8503884626400522e-06, + "loss": 0.9375, + "step": 23536 + }, + { + "epoch": 0.6, + "learning_rate": 1.8503739033568774e-06, + "loss": 0.8438, + "step": 23537 + }, + { + "epoch": 0.6, + "learning_rate": 1.850359343422611e-06, + "loss": 0.6885, + "step": 23538 + }, + { + "epoch": 0.6, + "learning_rate": 1.8503447828372632e-06, + "loss": 0.7786, + "step": 23539 + }, + { + "epoch": 0.6, + "learning_rate": 1.850330221600845e-06, + "loss": 0.7246, + "step": 23540 + }, + { + "epoch": 0.6, + "learning_rate": 1.8503156597133689e-06, + "loss": 0.8389, + "step": 23541 + }, + { + "epoch": 0.6, + "learning_rate": 1.850301097174845e-06, + "loss": 0.7529, + "step": 23542 + }, + { + "epoch": 0.6, + "learning_rate": 1.8502865339852842e-06, + "loss": 0.957, + "step": 23543 + }, + { + "epoch": 0.6, + "learning_rate": 1.8502719701446985e-06, + "loss": 0.6409, + "step": 23544 + }, + { + "epoch": 0.6, + "learning_rate": 1.8502574056530987e-06, + "loss": 0.7622, + "step": 23545 + }, + { + "epoch": 0.6, + "learning_rate": 1.8502428405104956e-06, + "loss": 0.8652, + "step": 23546 + }, + { + "epoch": 0.6, + "learning_rate": 1.8502282747169007e-06, + "loss": 0.7939, + "step": 23547 + }, + { + "epoch": 0.6, + "learning_rate": 1.8502137082723252e-06, + "loss": 0.8604, + "step": 23548 + }, + { + "epoch": 0.6, + "learning_rate": 1.8501991411767803e-06, + "loss": 0.5881, + "step": 23549 + }, + { + "epoch": 0.6, + "learning_rate": 1.8501845734302768e-06, + "loss": 0.7351, + "step": 23550 + }, + { + "epoch": 0.6, + "learning_rate": 1.8501700050328261e-06, + "loss": 0.7441, + "step": 23551 + }, + { + "epoch": 0.6, + "learning_rate": 1.8501554359844394e-06, + "loss": 0.873, + "step": 23552 + }, + { + "epoch": 0.6, + "learning_rate": 1.8501408662851277e-06, + "loss": 0.6919, + "step": 23553 + }, + { + "epoch": 0.6, + "learning_rate": 1.8501262959349023e-06, + "loss": 0.915, + "step": 23554 + }, + { + "epoch": 0.6, + "learning_rate": 1.8501117249337743e-06, + "loss": 0.8262, + "step": 23555 + }, + { + "epoch": 0.6, + "learning_rate": 1.8500971532817547e-06, + "loss": 0.873, + "step": 23556 + }, + { + "epoch": 0.6, + "learning_rate": 1.8500825809788548e-06, + "loss": 0.8447, + "step": 23557 + }, + { + "epoch": 0.6, + "learning_rate": 1.850068008025086e-06, + "loss": 0.9307, + "step": 23558 + }, + { + "epoch": 0.6, + "learning_rate": 1.850053434420459e-06, + "loss": 0.7559, + "step": 23559 + }, + { + "epoch": 0.6, + "learning_rate": 1.8500388601649853e-06, + "loss": 0.791, + "step": 23560 + }, + { + "epoch": 0.6, + "learning_rate": 1.8500242852586756e-06, + "loss": 0.8828, + "step": 23561 + }, + { + "epoch": 0.6, + "learning_rate": 1.850009709701542e-06, + "loss": 0.8604, + "step": 23562 + }, + { + "epoch": 0.6, + "learning_rate": 1.8499951334935946e-06, + "loss": 0.999, + "step": 23563 + }, + { + "epoch": 0.6, + "learning_rate": 1.849980556634845e-06, + "loss": 0.8271, + "step": 23564 + }, + { + "epoch": 0.6, + "learning_rate": 1.8499659791253044e-06, + "loss": 0.6973, + "step": 23565 + }, + { + "epoch": 0.6, + "learning_rate": 1.8499514009649842e-06, + "loss": 0.8584, + "step": 23566 + }, + { + "epoch": 0.6, + "learning_rate": 1.849936822153895e-06, + "loss": 0.9609, + "step": 23567 + }, + { + "epoch": 0.6, + "learning_rate": 1.8499222426920484e-06, + "loss": 0.96, + "step": 23568 + }, + { + "epoch": 0.6, + "learning_rate": 1.8499076625794551e-06, + "loss": 0.999, + "step": 23569 + }, + { + "epoch": 0.6, + "learning_rate": 1.849893081816127e-06, + "loss": 0.9404, + "step": 23570 + }, + { + "epoch": 0.6, + "learning_rate": 1.8498785004020747e-06, + "loss": 0.9229, + "step": 23571 + }, + { + "epoch": 0.6, + "learning_rate": 1.8498639183373095e-06, + "loss": 0.667, + "step": 23572 + }, + { + "epoch": 0.6, + "learning_rate": 1.8498493356218424e-06, + "loss": 0.8787, + "step": 23573 + }, + { + "epoch": 0.6, + "learning_rate": 1.8498347522556853e-06, + "loss": 0.4851, + "step": 23574 + }, + { + "epoch": 0.6, + "learning_rate": 1.8498201682388484e-06, + "loss": 0.8867, + "step": 23575 + }, + { + "epoch": 0.6, + "learning_rate": 1.849805583571343e-06, + "loss": 0.7739, + "step": 23576 + }, + { + "epoch": 0.6, + "learning_rate": 1.849790998253181e-06, + "loss": 0.9004, + "step": 23577 + }, + { + "epoch": 0.6, + "learning_rate": 1.8497764122843731e-06, + "loss": 0.9131, + "step": 23578 + }, + { + "epoch": 0.6, + "learning_rate": 1.8497618256649301e-06, + "loss": 0.6724, + "step": 23579 + }, + { + "epoch": 0.6, + "learning_rate": 1.849747238394864e-06, + "loss": 0.8125, + "step": 23580 + }, + { + "epoch": 0.6, + "learning_rate": 1.8497326504741853e-06, + "loss": 0.6045, + "step": 23581 + }, + { + "epoch": 0.6, + "learning_rate": 1.8497180619029052e-06, + "loss": 0.5042, + "step": 23582 + }, + { + "epoch": 0.6, + "learning_rate": 1.8497034726810352e-06, + "loss": 1.0215, + "step": 23583 + }, + { + "epoch": 0.6, + "learning_rate": 1.8496888828085863e-06, + "loss": 0.8457, + "step": 23584 + }, + { + "epoch": 0.6, + "learning_rate": 1.8496742922855697e-06, + "loss": 0.7725, + "step": 23585 + }, + { + "epoch": 0.6, + "learning_rate": 1.8496597011119967e-06, + "loss": 0.7949, + "step": 23586 + }, + { + "epoch": 0.6, + "learning_rate": 1.8496451092878782e-06, + "loss": 0.7876, + "step": 23587 + }, + { + "epoch": 0.6, + "learning_rate": 1.8496305168132255e-06, + "loss": 0.7812, + "step": 23588 + }, + { + "epoch": 0.6, + "learning_rate": 1.84961592368805e-06, + "loss": 0.7793, + "step": 23589 + }, + { + "epoch": 0.6, + "learning_rate": 1.8496013299123626e-06, + "loss": 0.8623, + "step": 23590 + }, + { + "epoch": 0.6, + "learning_rate": 1.8495867354861741e-06, + "loss": 1.0391, + "step": 23591 + }, + { + "epoch": 0.6, + "learning_rate": 1.8495721404094966e-06, + "loss": 0.9111, + "step": 23592 + }, + { + "epoch": 0.6, + "learning_rate": 1.8495575446823403e-06, + "loss": 1.0996, + "step": 23593 + }, + { + "epoch": 0.6, + "learning_rate": 1.8495429483047173e-06, + "loss": 1.0312, + "step": 23594 + }, + { + "epoch": 0.6, + "learning_rate": 1.8495283512766383e-06, + "loss": 1.0635, + "step": 23595 + }, + { + "epoch": 0.6, + "learning_rate": 1.8495137535981142e-06, + "loss": 0.7109, + "step": 23596 + }, + { + "epoch": 0.6, + "learning_rate": 1.8494991552691568e-06, + "loss": 0.8955, + "step": 23597 + }, + { + "epoch": 0.6, + "learning_rate": 1.8494845562897767e-06, + "loss": 0.7871, + "step": 23598 + }, + { + "epoch": 0.6, + "learning_rate": 1.8494699566599853e-06, + "loss": 0.8301, + "step": 23599 + }, + { + "epoch": 0.6, + "learning_rate": 1.849455356379794e-06, + "loss": 0.6226, + "step": 23600 + }, + { + "epoch": 0.6, + "learning_rate": 1.8494407554492137e-06, + "loss": 1.0127, + "step": 23601 + }, + { + "epoch": 0.6, + "learning_rate": 1.8494261538682557e-06, + "loss": 0.8994, + "step": 23602 + }, + { + "epoch": 0.6, + "learning_rate": 1.8494115516369314e-06, + "loss": 1.0068, + "step": 23603 + }, + { + "epoch": 0.6, + "learning_rate": 1.8493969487552512e-06, + "loss": 0.8574, + "step": 23604 + }, + { + "epoch": 0.61, + "learning_rate": 1.8493823452232271e-06, + "loss": 0.9287, + "step": 23605 + }, + { + "epoch": 0.61, + "learning_rate": 1.8493677410408702e-06, + "loss": 0.7642, + "step": 23606 + }, + { + "epoch": 0.61, + "learning_rate": 1.849353136208191e-06, + "loss": 0.8975, + "step": 23607 + }, + { + "epoch": 0.61, + "learning_rate": 1.8493385307252017e-06, + "loss": 0.8799, + "step": 23608 + }, + { + "epoch": 0.61, + "learning_rate": 1.8493239245919128e-06, + "loss": 0.9082, + "step": 23609 + }, + { + "epoch": 0.61, + "learning_rate": 1.8493093178083354e-06, + "loss": 0.7568, + "step": 23610 + }, + { + "epoch": 0.61, + "learning_rate": 1.849294710374481e-06, + "loss": 0.9043, + "step": 23611 + }, + { + "epoch": 0.61, + "learning_rate": 1.8492801022903606e-06, + "loss": 0.9775, + "step": 23612 + }, + { + "epoch": 0.61, + "learning_rate": 1.8492654935559858e-06, + "loss": 0.9414, + "step": 23613 + }, + { + "epoch": 0.61, + "learning_rate": 1.8492508841713672e-06, + "loss": 1.0332, + "step": 23614 + }, + { + "epoch": 0.61, + "learning_rate": 1.8492362741365162e-06, + "loss": 0.917, + "step": 23615 + }, + { + "epoch": 0.61, + "learning_rate": 1.849221663451444e-06, + "loss": 0.9033, + "step": 23616 + }, + { + "epoch": 0.61, + "learning_rate": 1.849207052116162e-06, + "loss": 0.8145, + "step": 23617 + }, + { + "epoch": 0.61, + "learning_rate": 1.849192440130681e-06, + "loss": 0.6821, + "step": 23618 + }, + { + "epoch": 0.61, + "learning_rate": 1.8491778274950128e-06, + "loss": 0.9727, + "step": 23619 + }, + { + "epoch": 0.61, + "learning_rate": 1.8491632142091678e-06, + "loss": 0.5784, + "step": 23620 + }, + { + "epoch": 0.61, + "learning_rate": 1.8491486002731579e-06, + "loss": 0.7568, + "step": 23621 + }, + { + "epoch": 0.61, + "learning_rate": 1.8491339856869936e-06, + "loss": 1.0098, + "step": 23622 + }, + { + "epoch": 0.61, + "learning_rate": 1.8491193704506867e-06, + "loss": 0.8799, + "step": 23623 + }, + { + "epoch": 0.61, + "learning_rate": 1.849104754564248e-06, + "loss": 0.9629, + "step": 23624 + }, + { + "epoch": 0.61, + "learning_rate": 1.8490901380276889e-06, + "loss": 0.8066, + "step": 23625 + }, + { + "epoch": 0.61, + "learning_rate": 1.8490755208410204e-06, + "loss": 0.9268, + "step": 23626 + }, + { + "epoch": 0.61, + "learning_rate": 1.8490609030042542e-06, + "loss": 0.9434, + "step": 23627 + }, + { + "epoch": 0.61, + "learning_rate": 1.8490462845174007e-06, + "loss": 1.0059, + "step": 23628 + }, + { + "epoch": 0.61, + "learning_rate": 1.8490316653804715e-06, + "loss": 0.9619, + "step": 23629 + }, + { + "epoch": 0.61, + "learning_rate": 1.849017045593478e-06, + "loss": 0.8555, + "step": 23630 + }, + { + "epoch": 0.61, + "learning_rate": 1.8490024251564311e-06, + "loss": 0.707, + "step": 23631 + }, + { + "epoch": 0.61, + "learning_rate": 1.8489878040693422e-06, + "loss": 0.9473, + "step": 23632 + }, + { + "epoch": 0.61, + "learning_rate": 1.8489731823322221e-06, + "loss": 1.0117, + "step": 23633 + }, + { + "epoch": 0.61, + "learning_rate": 1.8489585599450822e-06, + "loss": 0.8022, + "step": 23634 + }, + { + "epoch": 0.61, + "learning_rate": 1.8489439369079343e-06, + "loss": 0.7886, + "step": 23635 + }, + { + "epoch": 0.61, + "learning_rate": 1.8489293132207888e-06, + "loss": 0.8291, + "step": 23636 + }, + { + "epoch": 0.61, + "learning_rate": 1.848914688883657e-06, + "loss": 1.042, + "step": 23637 + }, + { + "epoch": 0.61, + "learning_rate": 1.8489000638965506e-06, + "loss": 0.8745, + "step": 23638 + }, + { + "epoch": 0.61, + "learning_rate": 1.84888543825948e-06, + "loss": 0.8945, + "step": 23639 + }, + { + "epoch": 0.61, + "learning_rate": 1.8488708119724572e-06, + "loss": 0.7852, + "step": 23640 + }, + { + "epoch": 0.61, + "learning_rate": 1.8488561850354932e-06, + "loss": 0.7354, + "step": 23641 + }, + { + "epoch": 0.61, + "learning_rate": 1.8488415574485985e-06, + "loss": 0.8164, + "step": 23642 + }, + { + "epoch": 0.61, + "learning_rate": 1.8488269292117853e-06, + "loss": 0.9941, + "step": 23643 + }, + { + "epoch": 0.61, + "learning_rate": 1.848812300325064e-06, + "loss": 0.8203, + "step": 23644 + }, + { + "epoch": 0.61, + "learning_rate": 1.8487976707884462e-06, + "loss": 0.7876, + "step": 23645 + }, + { + "epoch": 0.61, + "learning_rate": 1.8487830406019436e-06, + "loss": 1.0107, + "step": 23646 + }, + { + "epoch": 0.61, + "learning_rate": 1.8487684097655664e-06, + "loss": 0.8555, + "step": 23647 + }, + { + "epoch": 0.61, + "learning_rate": 1.848753778279326e-06, + "loss": 0.8809, + "step": 23648 + }, + { + "epoch": 0.61, + "learning_rate": 1.8487391461432344e-06, + "loss": 0.9229, + "step": 23649 + }, + { + "epoch": 0.61, + "learning_rate": 1.848724513357302e-06, + "loss": 0.7158, + "step": 23650 + }, + { + "epoch": 0.61, + "learning_rate": 1.8487098799215404e-06, + "loss": 0.9082, + "step": 23651 + }, + { + "epoch": 0.61, + "learning_rate": 1.8486952458359605e-06, + "loss": 0.6719, + "step": 23652 + }, + { + "epoch": 0.61, + "learning_rate": 1.8486806111005738e-06, + "loss": 0.877, + "step": 23653 + }, + { + "epoch": 0.61, + "learning_rate": 1.848665975715391e-06, + "loss": 0.5486, + "step": 23654 + }, + { + "epoch": 0.61, + "learning_rate": 1.8486513396804243e-06, + "loss": 0.9902, + "step": 23655 + }, + { + "epoch": 0.61, + "learning_rate": 1.848636702995684e-06, + "loss": 0.8398, + "step": 23656 + }, + { + "epoch": 0.61, + "learning_rate": 1.8486220656611815e-06, + "loss": 0.9023, + "step": 23657 + }, + { + "epoch": 0.61, + "learning_rate": 1.8486074276769283e-06, + "loss": 0.7949, + "step": 23658 + }, + { + "epoch": 0.61, + "learning_rate": 1.8485927890429354e-06, + "loss": 0.9775, + "step": 23659 + }, + { + "epoch": 0.61, + "learning_rate": 1.8485781497592136e-06, + "loss": 0.9473, + "step": 23660 + }, + { + "epoch": 0.61, + "learning_rate": 1.848563509825775e-06, + "loss": 0.8096, + "step": 23661 + }, + { + "epoch": 0.61, + "learning_rate": 1.8485488692426304e-06, + "loss": 0.8643, + "step": 23662 + }, + { + "epoch": 0.61, + "learning_rate": 1.8485342280097907e-06, + "loss": 0.8428, + "step": 23663 + }, + { + "epoch": 0.61, + "learning_rate": 1.8485195861272674e-06, + "loss": 1.0459, + "step": 23664 + }, + { + "epoch": 0.61, + "learning_rate": 1.8485049435950716e-06, + "loss": 0.8018, + "step": 23665 + }, + { + "epoch": 0.61, + "learning_rate": 1.8484903004132146e-06, + "loss": 0.8965, + "step": 23666 + }, + { + "epoch": 0.61, + "learning_rate": 1.8484756565817077e-06, + "loss": 1.0732, + "step": 23667 + }, + { + "epoch": 0.61, + "learning_rate": 1.8484610121005619e-06, + "loss": 0.8193, + "step": 23668 + }, + { + "epoch": 0.61, + "learning_rate": 1.8484463669697888e-06, + "loss": 0.8115, + "step": 23669 + }, + { + "epoch": 0.61, + "learning_rate": 1.848431721189399e-06, + "loss": 0.8672, + "step": 23670 + }, + { + "epoch": 0.61, + "learning_rate": 1.848417074759404e-06, + "loss": 0.9902, + "step": 23671 + }, + { + "epoch": 0.61, + "learning_rate": 1.848402427679815e-06, + "loss": 0.8711, + "step": 23672 + }, + { + "epoch": 0.61, + "learning_rate": 1.8483877799506437e-06, + "loss": 0.8735, + "step": 23673 + }, + { + "epoch": 0.61, + "learning_rate": 1.8483731315719008e-06, + "loss": 0.8682, + "step": 23674 + }, + { + "epoch": 0.61, + "learning_rate": 1.848358482543597e-06, + "loss": 0.9414, + "step": 23675 + }, + { + "epoch": 0.61, + "learning_rate": 1.848343832865745e-06, + "loss": 0.8304, + "step": 23676 + }, + { + "epoch": 0.61, + "learning_rate": 1.8483291825383546e-06, + "loss": 0.9106, + "step": 23677 + }, + { + "epoch": 0.61, + "learning_rate": 1.8483145315614376e-06, + "loss": 0.8164, + "step": 23678 + }, + { + "epoch": 0.61, + "learning_rate": 1.8482998799350052e-06, + "loss": 0.71, + "step": 23679 + }, + { + "epoch": 0.61, + "learning_rate": 1.8482852276590685e-06, + "loss": 0.5186, + "step": 23680 + }, + { + "epoch": 0.61, + "learning_rate": 1.848270574733639e-06, + "loss": 0.6631, + "step": 23681 + }, + { + "epoch": 0.61, + "learning_rate": 1.8482559211587279e-06, + "loss": 0.6753, + "step": 23682 + }, + { + "epoch": 0.61, + "learning_rate": 1.8482412669343459e-06, + "loss": 0.9746, + "step": 23683 + }, + { + "epoch": 0.61, + "learning_rate": 1.8482266120605047e-06, + "loss": 0.918, + "step": 23684 + }, + { + "epoch": 0.61, + "learning_rate": 1.848211956537215e-06, + "loss": 0.7949, + "step": 23685 + }, + { + "epoch": 0.61, + "learning_rate": 1.848197300364489e-06, + "loss": 0.7778, + "step": 23686 + }, + { + "epoch": 0.61, + "learning_rate": 1.8481826435423372e-06, + "loss": 0.668, + "step": 23687 + }, + { + "epoch": 0.61, + "learning_rate": 1.848167986070771e-06, + "loss": 0.8867, + "step": 23688 + }, + { + "epoch": 0.61, + "learning_rate": 1.8481533279498013e-06, + "loss": 0.9199, + "step": 23689 + }, + { + "epoch": 0.61, + "learning_rate": 1.8481386691794396e-06, + "loss": 0.9287, + "step": 23690 + }, + { + "epoch": 0.61, + "learning_rate": 1.8481240097596974e-06, + "loss": 0.7852, + "step": 23691 + }, + { + "epoch": 0.61, + "learning_rate": 1.8481093496905854e-06, + "loss": 0.7427, + "step": 23692 + }, + { + "epoch": 0.61, + "learning_rate": 1.8480946889721149e-06, + "loss": 0.79, + "step": 23693 + }, + { + "epoch": 0.61, + "learning_rate": 1.8480800276042977e-06, + "loss": 0.8975, + "step": 23694 + }, + { + "epoch": 0.61, + "learning_rate": 1.8480653655871444e-06, + "loss": 0.9287, + "step": 23695 + }, + { + "epoch": 0.61, + "learning_rate": 1.8480507029206664e-06, + "loss": 0.8306, + "step": 23696 + }, + { + "epoch": 0.61, + "learning_rate": 1.848036039604875e-06, + "loss": 0.9512, + "step": 23697 + }, + { + "epoch": 0.61, + "learning_rate": 1.8480213756397816e-06, + "loss": 0.8096, + "step": 23698 + }, + { + "epoch": 0.61, + "learning_rate": 1.848006711025397e-06, + "loss": 0.9707, + "step": 23699 + }, + { + "epoch": 0.61, + "learning_rate": 1.8479920457617329e-06, + "loss": 1.0312, + "step": 23700 + }, + { + "epoch": 0.61, + "learning_rate": 1.8479773798488e-06, + "loss": 0.864, + "step": 23701 + }, + { + "epoch": 0.61, + "learning_rate": 1.84796271328661e-06, + "loss": 0.6738, + "step": 23702 + }, + { + "epoch": 0.61, + "learning_rate": 1.8479480460751739e-06, + "loss": 1.0762, + "step": 23703 + }, + { + "epoch": 0.61, + "learning_rate": 1.847933378214503e-06, + "loss": 0.9609, + "step": 23704 + }, + { + "epoch": 0.61, + "learning_rate": 1.8479187097046083e-06, + "loss": 0.7285, + "step": 23705 + }, + { + "epoch": 0.61, + "learning_rate": 1.8479040405455012e-06, + "loss": 0.7227, + "step": 23706 + }, + { + "epoch": 0.61, + "learning_rate": 1.8478893707371932e-06, + "loss": 0.6631, + "step": 23707 + }, + { + "epoch": 0.61, + "learning_rate": 1.8478747002796954e-06, + "loss": 0.9395, + "step": 23708 + }, + { + "epoch": 0.61, + "learning_rate": 1.8478600291730188e-06, + "loss": 1.0039, + "step": 23709 + }, + { + "epoch": 0.61, + "learning_rate": 1.8478453574171747e-06, + "loss": 0.9717, + "step": 23710 + }, + { + "epoch": 0.61, + "learning_rate": 1.8478306850121746e-06, + "loss": 0.8203, + "step": 23711 + }, + { + "epoch": 0.61, + "learning_rate": 1.847816011958029e-06, + "loss": 1.0059, + "step": 23712 + }, + { + "epoch": 0.61, + "learning_rate": 1.8478013382547501e-06, + "loss": 0.9131, + "step": 23713 + }, + { + "epoch": 0.61, + "learning_rate": 1.8477866639023488e-06, + "loss": 0.9443, + "step": 23714 + }, + { + "epoch": 0.61, + "learning_rate": 1.847771988900836e-06, + "loss": 0.6748, + "step": 23715 + }, + { + "epoch": 0.61, + "learning_rate": 1.847757313250223e-06, + "loss": 0.7051, + "step": 23716 + }, + { + "epoch": 0.61, + "learning_rate": 1.8477426369505215e-06, + "loss": 0.7939, + "step": 23717 + }, + { + "epoch": 0.61, + "learning_rate": 1.8477279600017425e-06, + "loss": 0.876, + "step": 23718 + }, + { + "epoch": 0.61, + "learning_rate": 1.8477132824038969e-06, + "loss": 0.7461, + "step": 23719 + }, + { + "epoch": 0.61, + "learning_rate": 1.8476986041569964e-06, + "loss": 0.877, + "step": 23720 + }, + { + "epoch": 0.61, + "learning_rate": 1.847683925261052e-06, + "loss": 0.9668, + "step": 23721 + }, + { + "epoch": 0.61, + "learning_rate": 1.847669245716075e-06, + "loss": 0.9736, + "step": 23722 + }, + { + "epoch": 0.61, + "learning_rate": 1.8476545655220765e-06, + "loss": 0.752, + "step": 23723 + }, + { + "epoch": 0.61, + "learning_rate": 1.8476398846790682e-06, + "loss": 1.085, + "step": 23724 + }, + { + "epoch": 0.61, + "learning_rate": 1.847625203187061e-06, + "loss": 1.0195, + "step": 23725 + }, + { + "epoch": 0.61, + "learning_rate": 1.8476105210460657e-06, + "loss": 0.8535, + "step": 23726 + }, + { + "epoch": 0.61, + "learning_rate": 1.8475958382560943e-06, + "loss": 0.8086, + "step": 23727 + }, + { + "epoch": 0.61, + "learning_rate": 1.847581154817158e-06, + "loss": 0.7734, + "step": 23728 + }, + { + "epoch": 0.61, + "learning_rate": 1.8475664707292674e-06, + "loss": 0.8965, + "step": 23729 + }, + { + "epoch": 0.61, + "learning_rate": 1.8475517859924344e-06, + "loss": 1.0928, + "step": 23730 + }, + { + "epoch": 0.61, + "learning_rate": 1.8475371006066696e-06, + "loss": 0.9307, + "step": 23731 + }, + { + "epoch": 0.61, + "learning_rate": 1.8475224145719847e-06, + "loss": 0.6807, + "step": 23732 + }, + { + "epoch": 0.61, + "learning_rate": 1.8475077278883913e-06, + "loss": 0.8638, + "step": 23733 + }, + { + "epoch": 0.61, + "learning_rate": 1.8474930405559e-06, + "loss": 1.0117, + "step": 23734 + }, + { + "epoch": 0.61, + "learning_rate": 1.847478352574522e-06, + "loss": 0.9844, + "step": 23735 + }, + { + "epoch": 0.61, + "learning_rate": 1.8474636639442688e-06, + "loss": 0.8467, + "step": 23736 + }, + { + "epoch": 0.61, + "learning_rate": 1.8474489746651518e-06, + "loss": 0.9219, + "step": 23737 + }, + { + "epoch": 0.61, + "learning_rate": 1.847434284737182e-06, + "loss": 0.8584, + "step": 23738 + }, + { + "epoch": 0.61, + "learning_rate": 1.8474195941603709e-06, + "loss": 0.8237, + "step": 23739 + }, + { + "epoch": 0.61, + "learning_rate": 1.8474049029347293e-06, + "loss": 0.8203, + "step": 23740 + }, + { + "epoch": 0.61, + "learning_rate": 1.847390211060269e-06, + "loss": 0.834, + "step": 23741 + }, + { + "epoch": 0.61, + "learning_rate": 1.847375518537001e-06, + "loss": 0.6045, + "step": 23742 + }, + { + "epoch": 0.61, + "learning_rate": 1.8473608253649365e-06, + "loss": 0.6957, + "step": 23743 + }, + { + "epoch": 0.61, + "learning_rate": 1.8473461315440866e-06, + "loss": 0.9043, + "step": 23744 + }, + { + "epoch": 0.61, + "learning_rate": 1.8473314370744628e-06, + "loss": 0.8809, + "step": 23745 + }, + { + "epoch": 0.61, + "learning_rate": 1.8473167419560763e-06, + "loss": 0.7383, + "step": 23746 + }, + { + "epoch": 0.61, + "learning_rate": 1.8473020461889384e-06, + "loss": 0.9297, + "step": 23747 + }, + { + "epoch": 0.61, + "learning_rate": 1.8472873497730601e-06, + "loss": 0.9365, + "step": 23748 + }, + { + "epoch": 0.61, + "learning_rate": 1.8472726527084528e-06, + "loss": 0.7725, + "step": 23749 + }, + { + "epoch": 0.61, + "learning_rate": 1.8472579549951282e-06, + "loss": 0.7324, + "step": 23750 + }, + { + "epoch": 0.61, + "learning_rate": 1.8472432566330966e-06, + "loss": 0.9893, + "step": 23751 + }, + { + "epoch": 0.61, + "learning_rate": 1.8472285576223704e-06, + "loss": 0.8691, + "step": 23752 + }, + { + "epoch": 0.61, + "learning_rate": 1.8472138579629596e-06, + "loss": 0.7944, + "step": 23753 + }, + { + "epoch": 0.61, + "learning_rate": 1.8471991576548764e-06, + "loss": 0.8311, + "step": 23754 + }, + { + "epoch": 0.61, + "learning_rate": 1.847184456698132e-06, + "loss": 0.833, + "step": 23755 + }, + { + "epoch": 0.61, + "learning_rate": 1.8471697550927371e-06, + "loss": 0.8438, + "step": 23756 + }, + { + "epoch": 0.61, + "learning_rate": 1.8471550528387035e-06, + "loss": 0.8271, + "step": 23757 + }, + { + "epoch": 0.61, + "learning_rate": 1.8471403499360421e-06, + "loss": 0.7148, + "step": 23758 + }, + { + "epoch": 0.61, + "learning_rate": 1.8471256463847642e-06, + "loss": 0.5522, + "step": 23759 + }, + { + "epoch": 0.61, + "learning_rate": 1.8471109421848814e-06, + "loss": 0.9092, + "step": 23760 + }, + { + "epoch": 0.61, + "learning_rate": 1.8470962373364043e-06, + "loss": 0.8398, + "step": 23761 + }, + { + "epoch": 0.61, + "learning_rate": 1.847081531839345e-06, + "loss": 0.8652, + "step": 23762 + }, + { + "epoch": 0.61, + "learning_rate": 1.8470668256937142e-06, + "loss": 0.7222, + "step": 23763 + }, + { + "epoch": 0.61, + "learning_rate": 1.8470521188995232e-06, + "loss": 0.9053, + "step": 23764 + }, + { + "epoch": 0.61, + "learning_rate": 1.847037411456783e-06, + "loss": 0.5882, + "step": 23765 + }, + { + "epoch": 0.61, + "learning_rate": 1.8470227033655057e-06, + "loss": 0.9233, + "step": 23766 + }, + { + "epoch": 0.61, + "learning_rate": 1.8470079946257018e-06, + "loss": 0.959, + "step": 23767 + }, + { + "epoch": 0.61, + "learning_rate": 1.846993285237383e-06, + "loss": 1.0752, + "step": 23768 + }, + { + "epoch": 0.61, + "learning_rate": 1.8469785752005604e-06, + "loss": 0.8516, + "step": 23769 + }, + { + "epoch": 0.61, + "learning_rate": 1.8469638645152451e-06, + "loss": 0.7144, + "step": 23770 + }, + { + "epoch": 0.61, + "learning_rate": 1.8469491531814488e-06, + "loss": 0.915, + "step": 23771 + }, + { + "epoch": 0.61, + "learning_rate": 1.846934441199182e-06, + "loss": 0.9043, + "step": 23772 + }, + { + "epoch": 0.61, + "learning_rate": 1.8469197285684568e-06, + "loss": 1.1318, + "step": 23773 + }, + { + "epoch": 0.61, + "learning_rate": 1.846905015289284e-06, + "loss": 0.5453, + "step": 23774 + }, + { + "epoch": 0.61, + "learning_rate": 1.846890301361675e-06, + "loss": 0.5605, + "step": 23775 + }, + { + "epoch": 0.61, + "learning_rate": 1.846875586785641e-06, + "loss": 1.0322, + "step": 23776 + }, + { + "epoch": 0.61, + "learning_rate": 1.8468608715611933e-06, + "loss": 0.9209, + "step": 23777 + }, + { + "epoch": 0.61, + "learning_rate": 1.8468461556883433e-06, + "loss": 1.1152, + "step": 23778 + }, + { + "epoch": 0.61, + "learning_rate": 1.846831439167102e-06, + "loss": 0.8975, + "step": 23779 + }, + { + "epoch": 0.61, + "learning_rate": 1.8468167219974809e-06, + "loss": 0.9326, + "step": 23780 + }, + { + "epoch": 0.61, + "learning_rate": 1.8468020041794913e-06, + "loss": 0.8652, + "step": 23781 + }, + { + "epoch": 0.61, + "learning_rate": 1.846787285713144e-06, + "loss": 1.0117, + "step": 23782 + }, + { + "epoch": 0.61, + "learning_rate": 1.8467725665984509e-06, + "loss": 0.918, + "step": 23783 + }, + { + "epoch": 0.61, + "learning_rate": 1.8467578468354225e-06, + "loss": 0.9316, + "step": 23784 + }, + { + "epoch": 0.61, + "learning_rate": 1.8467431264240708e-06, + "loss": 1.1514, + "step": 23785 + }, + { + "epoch": 0.61, + "learning_rate": 1.846728405364407e-06, + "loss": 0.9863, + "step": 23786 + }, + { + "epoch": 0.61, + "learning_rate": 1.8467136836564423e-06, + "loss": 0.8779, + "step": 23787 + }, + { + "epoch": 0.61, + "learning_rate": 1.8466989613001876e-06, + "loss": 0.7451, + "step": 23788 + }, + { + "epoch": 0.61, + "learning_rate": 1.8466842382956543e-06, + "loss": 0.8535, + "step": 23789 + }, + { + "epoch": 0.61, + "learning_rate": 1.8466695146428544e-06, + "loss": 0.8467, + "step": 23790 + }, + { + "epoch": 0.61, + "learning_rate": 1.846654790341798e-06, + "loss": 0.5918, + "step": 23791 + }, + { + "epoch": 0.61, + "learning_rate": 1.8466400653924973e-06, + "loss": 0.8291, + "step": 23792 + }, + { + "epoch": 0.61, + "learning_rate": 1.8466253397949632e-06, + "loss": 0.7871, + "step": 23793 + }, + { + "epoch": 0.61, + "learning_rate": 1.8466106135492065e-06, + "loss": 1.0269, + "step": 23794 + }, + { + "epoch": 0.61, + "learning_rate": 1.8465958866552396e-06, + "loss": 0.75, + "step": 23795 + }, + { + "epoch": 0.61, + "learning_rate": 1.846581159113073e-06, + "loss": 0.9102, + "step": 23796 + }, + { + "epoch": 0.61, + "learning_rate": 1.8465664309227181e-06, + "loss": 0.8691, + "step": 23797 + }, + { + "epoch": 0.61, + "learning_rate": 1.8465517020841861e-06, + "loss": 0.7842, + "step": 23798 + }, + { + "epoch": 0.61, + "learning_rate": 1.8465369725974887e-06, + "loss": 0.5786, + "step": 23799 + }, + { + "epoch": 0.61, + "learning_rate": 1.8465222424626363e-06, + "loss": 1.002, + "step": 23800 + }, + { + "epoch": 0.61, + "learning_rate": 1.846507511679641e-06, + "loss": 0.7227, + "step": 23801 + }, + { + "epoch": 0.61, + "learning_rate": 1.8464927802485143e-06, + "loss": 0.717, + "step": 23802 + }, + { + "epoch": 0.61, + "learning_rate": 1.8464780481692666e-06, + "loss": 0.8877, + "step": 23803 + }, + { + "epoch": 0.61, + "learning_rate": 1.8464633154419094e-06, + "loss": 0.8418, + "step": 23804 + }, + { + "epoch": 0.61, + "learning_rate": 1.8464485820664545e-06, + "loss": 0.9502, + "step": 23805 + }, + { + "epoch": 0.61, + "learning_rate": 1.8464338480429124e-06, + "loss": 1.3145, + "step": 23806 + }, + { + "epoch": 0.61, + "learning_rate": 1.8464191133712952e-06, + "loss": 0.8652, + "step": 23807 + }, + { + "epoch": 0.61, + "learning_rate": 1.8464043780516135e-06, + "loss": 0.7224, + "step": 23808 + }, + { + "epoch": 0.61, + "learning_rate": 1.846389642083879e-06, + "loss": 0.957, + "step": 23809 + }, + { + "epoch": 0.61, + "learning_rate": 1.8463749054681032e-06, + "loss": 0.7505, + "step": 23810 + }, + { + "epoch": 0.61, + "learning_rate": 1.8463601682042969e-06, + "loss": 0.8711, + "step": 23811 + }, + { + "epoch": 0.61, + "learning_rate": 1.8463454302924714e-06, + "loss": 0.8408, + "step": 23812 + }, + { + "epoch": 0.61, + "learning_rate": 1.8463306917326382e-06, + "loss": 0.833, + "step": 23813 + }, + { + "epoch": 0.61, + "learning_rate": 1.8463159525248083e-06, + "loss": 0.7725, + "step": 23814 + }, + { + "epoch": 0.61, + "learning_rate": 1.8463012126689936e-06, + "loss": 0.9238, + "step": 23815 + }, + { + "epoch": 0.61, + "learning_rate": 1.8462864721652047e-06, + "loss": 1.1191, + "step": 23816 + }, + { + "epoch": 0.61, + "learning_rate": 1.8462717310134533e-06, + "loss": 0.79, + "step": 23817 + }, + { + "epoch": 0.61, + "learning_rate": 1.8462569892137502e-06, + "loss": 0.8936, + "step": 23818 + }, + { + "epoch": 0.61, + "learning_rate": 1.8462422467661076e-06, + "loss": 0.6787, + "step": 23819 + }, + { + "epoch": 0.61, + "learning_rate": 1.846227503670536e-06, + "loss": 1.0586, + "step": 23820 + }, + { + "epoch": 0.61, + "learning_rate": 1.8462127599270467e-06, + "loss": 0.9961, + "step": 23821 + }, + { + "epoch": 0.61, + "learning_rate": 1.846198015535651e-06, + "loss": 1.0156, + "step": 23822 + }, + { + "epoch": 0.61, + "learning_rate": 1.8461832704963612e-06, + "loss": 1.0215, + "step": 23823 + }, + { + "epoch": 0.61, + "learning_rate": 1.8461685248091873e-06, + "loss": 0.6826, + "step": 23824 + }, + { + "epoch": 0.61, + "learning_rate": 1.8461537784741407e-06, + "loss": 0.6343, + "step": 23825 + }, + { + "epoch": 0.61, + "learning_rate": 1.8461390314912336e-06, + "loss": 0.8877, + "step": 23826 + }, + { + "epoch": 0.61, + "learning_rate": 1.8461242838604765e-06, + "loss": 0.9219, + "step": 23827 + }, + { + "epoch": 0.61, + "learning_rate": 1.846109535581881e-06, + "loss": 0.8516, + "step": 23828 + }, + { + "epoch": 0.61, + "learning_rate": 1.8460947866554584e-06, + "loss": 0.8311, + "step": 23829 + }, + { + "epoch": 0.61, + "learning_rate": 1.84608003708122e-06, + "loss": 0.7764, + "step": 23830 + }, + { + "epoch": 0.61, + "learning_rate": 1.8460652868591767e-06, + "loss": 1.0098, + "step": 23831 + }, + { + "epoch": 0.61, + "learning_rate": 1.8460505359893404e-06, + "loss": 0.792, + "step": 23832 + }, + { + "epoch": 0.61, + "learning_rate": 1.8460357844717217e-06, + "loss": 0.8711, + "step": 23833 + }, + { + "epoch": 0.61, + "learning_rate": 1.846021032306333e-06, + "loss": 0.7627, + "step": 23834 + }, + { + "epoch": 0.61, + "learning_rate": 1.8460062794931845e-06, + "loss": 0.7886, + "step": 23835 + }, + { + "epoch": 0.61, + "learning_rate": 1.8459915260322878e-06, + "loss": 0.8828, + "step": 23836 + }, + { + "epoch": 0.61, + "learning_rate": 1.8459767719236546e-06, + "loss": 0.9746, + "step": 23837 + }, + { + "epoch": 0.61, + "learning_rate": 1.8459620171672955e-06, + "loss": 0.9297, + "step": 23838 + }, + { + "epoch": 0.61, + "learning_rate": 1.8459472617632224e-06, + "loss": 0.7842, + "step": 23839 + }, + { + "epoch": 0.61, + "learning_rate": 1.8459325057114463e-06, + "loss": 0.9883, + "step": 23840 + }, + { + "epoch": 0.61, + "learning_rate": 1.8459177490119786e-06, + "loss": 0.8701, + "step": 23841 + }, + { + "epoch": 0.61, + "learning_rate": 1.8459029916648308e-06, + "loss": 0.7266, + "step": 23842 + }, + { + "epoch": 0.61, + "learning_rate": 1.8458882336700134e-06, + "loss": 0.5732, + "step": 23843 + }, + { + "epoch": 0.61, + "learning_rate": 1.8458734750275387e-06, + "loss": 1.1016, + "step": 23844 + }, + { + "epoch": 0.61, + "learning_rate": 1.8458587157374174e-06, + "loss": 0.8789, + "step": 23845 + }, + { + "epoch": 0.61, + "learning_rate": 1.8458439557996612e-06, + "loss": 0.9346, + "step": 23846 + }, + { + "epoch": 0.61, + "learning_rate": 1.8458291952142812e-06, + "loss": 0.8647, + "step": 23847 + }, + { + "epoch": 0.61, + "learning_rate": 1.8458144339812884e-06, + "loss": 0.9258, + "step": 23848 + }, + { + "epoch": 0.61, + "learning_rate": 1.8457996721006945e-06, + "loss": 0.8057, + "step": 23849 + }, + { + "epoch": 0.61, + "learning_rate": 1.8457849095725108e-06, + "loss": 0.7014, + "step": 23850 + }, + { + "epoch": 0.61, + "learning_rate": 1.8457701463967484e-06, + "loss": 0.6836, + "step": 23851 + }, + { + "epoch": 0.61, + "learning_rate": 1.8457553825734188e-06, + "loss": 0.8359, + "step": 23852 + }, + { + "epoch": 0.61, + "learning_rate": 1.8457406181025328e-06, + "loss": 0.8125, + "step": 23853 + }, + { + "epoch": 0.61, + "learning_rate": 1.8457258529841025e-06, + "loss": 0.8887, + "step": 23854 + }, + { + "epoch": 0.61, + "learning_rate": 1.8457110872181386e-06, + "loss": 0.9561, + "step": 23855 + }, + { + "epoch": 0.61, + "learning_rate": 1.8456963208046527e-06, + "loss": 0.8447, + "step": 23856 + }, + { + "epoch": 0.61, + "learning_rate": 1.845681553743656e-06, + "loss": 0.8281, + "step": 23857 + }, + { + "epoch": 0.61, + "learning_rate": 1.8456667860351599e-06, + "loss": 0.9023, + "step": 23858 + }, + { + "epoch": 0.61, + "learning_rate": 1.8456520176791754e-06, + "loss": 0.5925, + "step": 23859 + }, + { + "epoch": 0.61, + "learning_rate": 1.8456372486757142e-06, + "loss": 0.7529, + "step": 23860 + }, + { + "epoch": 0.61, + "learning_rate": 1.8456224790247874e-06, + "loss": 0.9639, + "step": 23861 + }, + { + "epoch": 0.61, + "learning_rate": 1.8456077087264065e-06, + "loss": 0.6323, + "step": 23862 + }, + { + "epoch": 0.61, + "learning_rate": 1.8455929377805824e-06, + "loss": 0.9336, + "step": 23863 + }, + { + "epoch": 0.61, + "learning_rate": 1.8455781661873266e-06, + "loss": 1.0088, + "step": 23864 + }, + { + "epoch": 0.61, + "learning_rate": 1.845563393946651e-06, + "loss": 0.9824, + "step": 23865 + }, + { + "epoch": 0.61, + "learning_rate": 1.8455486210585658e-06, + "loss": 1.0205, + "step": 23866 + }, + { + "epoch": 0.61, + "learning_rate": 1.8455338475230833e-06, + "loss": 0.8877, + "step": 23867 + }, + { + "epoch": 0.61, + "learning_rate": 1.8455190733402142e-06, + "loss": 0.9355, + "step": 23868 + }, + { + "epoch": 0.61, + "learning_rate": 1.84550429850997e-06, + "loss": 0.76, + "step": 23869 + }, + { + "epoch": 0.61, + "learning_rate": 1.8454895230323623e-06, + "loss": 0.9033, + "step": 23870 + }, + { + "epoch": 0.61, + "learning_rate": 1.8454747469074019e-06, + "loss": 1.0049, + "step": 23871 + }, + { + "epoch": 0.61, + "learning_rate": 1.8454599701351005e-06, + "loss": 0.8418, + "step": 23872 + }, + { + "epoch": 0.61, + "learning_rate": 1.8454451927154692e-06, + "loss": 0.9229, + "step": 23873 + }, + { + "epoch": 0.61, + "learning_rate": 1.8454304146485193e-06, + "loss": 0.8892, + "step": 23874 + }, + { + "epoch": 0.61, + "learning_rate": 1.8454156359342625e-06, + "loss": 0.7451, + "step": 23875 + }, + { + "epoch": 0.61, + "learning_rate": 1.8454008565727098e-06, + "loss": 0.708, + "step": 23876 + }, + { + "epoch": 0.61, + "learning_rate": 1.845386076563872e-06, + "loss": 0.835, + "step": 23877 + }, + { + "epoch": 0.61, + "learning_rate": 1.8453712959077615e-06, + "loss": 0.9883, + "step": 23878 + }, + { + "epoch": 0.61, + "learning_rate": 1.8453565146043889e-06, + "loss": 1.0488, + "step": 23879 + }, + { + "epoch": 0.61, + "learning_rate": 1.8453417326537658e-06, + "loss": 0.9297, + "step": 23880 + }, + { + "epoch": 0.61, + "learning_rate": 1.8453269500559032e-06, + "loss": 0.7842, + "step": 23881 + }, + { + "epoch": 0.61, + "learning_rate": 1.8453121668108128e-06, + "loss": 1.1113, + "step": 23882 + }, + { + "epoch": 0.61, + "learning_rate": 1.8452973829185056e-06, + "loss": 0.8604, + "step": 23883 + }, + { + "epoch": 0.61, + "learning_rate": 1.845282598378993e-06, + "loss": 0.8506, + "step": 23884 + }, + { + "epoch": 0.61, + "learning_rate": 1.8452678131922866e-06, + "loss": 0.8965, + "step": 23885 + }, + { + "epoch": 0.61, + "learning_rate": 1.8452530273583973e-06, + "loss": 0.7324, + "step": 23886 + }, + { + "epoch": 0.61, + "learning_rate": 1.8452382408773368e-06, + "loss": 0.6506, + "step": 23887 + }, + { + "epoch": 0.61, + "learning_rate": 1.8452234537491163e-06, + "loss": 0.7578, + "step": 23888 + }, + { + "epoch": 0.61, + "learning_rate": 1.8452086659737467e-06, + "loss": 0.9561, + "step": 23889 + }, + { + "epoch": 0.61, + "learning_rate": 1.8451938775512402e-06, + "loss": 0.8848, + "step": 23890 + }, + { + "epoch": 0.61, + "learning_rate": 1.8451790884816071e-06, + "loss": 1.0361, + "step": 23891 + }, + { + "epoch": 0.61, + "learning_rate": 1.8451642987648595e-06, + "loss": 0.9297, + "step": 23892 + }, + { + "epoch": 0.61, + "learning_rate": 1.8451495084010084e-06, + "loss": 1.0078, + "step": 23893 + }, + { + "epoch": 0.61, + "learning_rate": 1.8451347173900652e-06, + "loss": 0.7969, + "step": 23894 + }, + { + "epoch": 0.61, + "learning_rate": 1.8451199257320411e-06, + "loss": 0.8193, + "step": 23895 + }, + { + "epoch": 0.61, + "learning_rate": 1.8451051334269478e-06, + "loss": 0.7451, + "step": 23896 + }, + { + "epoch": 0.61, + "learning_rate": 1.845090340474796e-06, + "loss": 1.0186, + "step": 23897 + }, + { + "epoch": 0.61, + "learning_rate": 1.8450755468755976e-06, + "loss": 0.8828, + "step": 23898 + }, + { + "epoch": 0.61, + "learning_rate": 1.8450607526293638e-06, + "loss": 0.7544, + "step": 23899 + }, + { + "epoch": 0.61, + "learning_rate": 1.8450459577361058e-06, + "loss": 1.0752, + "step": 23900 + }, + { + "epoch": 0.61, + "learning_rate": 1.8450311621958347e-06, + "loss": 0.7056, + "step": 23901 + }, + { + "epoch": 0.61, + "learning_rate": 1.8450163660085624e-06, + "loss": 0.9609, + "step": 23902 + }, + { + "epoch": 0.61, + "learning_rate": 1.8450015691742999e-06, + "loss": 0.8994, + "step": 23903 + }, + { + "epoch": 0.61, + "learning_rate": 1.8449867716930583e-06, + "loss": 0.9131, + "step": 23904 + }, + { + "epoch": 0.61, + "learning_rate": 1.8449719735648494e-06, + "loss": 0.9033, + "step": 23905 + }, + { + "epoch": 0.61, + "learning_rate": 1.8449571747896844e-06, + "loss": 0.8965, + "step": 23906 + }, + { + "epoch": 0.61, + "learning_rate": 1.8449423753675744e-06, + "loss": 1.0889, + "step": 23907 + }, + { + "epoch": 0.61, + "learning_rate": 1.8449275752985307e-06, + "loss": 0.6511, + "step": 23908 + }, + { + "epoch": 0.61, + "learning_rate": 1.844912774582565e-06, + "loss": 0.8271, + "step": 23909 + }, + { + "epoch": 0.61, + "learning_rate": 1.8448979732196884e-06, + "loss": 0.7524, + "step": 23910 + }, + { + "epoch": 0.61, + "learning_rate": 1.8448831712099125e-06, + "loss": 0.9307, + "step": 23911 + }, + { + "epoch": 0.61, + "learning_rate": 1.8448683685532482e-06, + "loss": 0.8525, + "step": 23912 + }, + { + "epoch": 0.61, + "learning_rate": 1.8448535652497071e-06, + "loss": 0.8652, + "step": 23913 + }, + { + "epoch": 0.61, + "learning_rate": 1.8448387612993002e-06, + "loss": 1.0264, + "step": 23914 + }, + { + "epoch": 0.61, + "learning_rate": 1.8448239567020395e-06, + "loss": 1.0273, + "step": 23915 + }, + { + "epoch": 0.61, + "learning_rate": 1.8448091514579356e-06, + "loss": 0.8594, + "step": 23916 + }, + { + "epoch": 0.61, + "learning_rate": 1.8447943455670005e-06, + "loss": 0.9785, + "step": 23917 + }, + { + "epoch": 0.61, + "learning_rate": 1.8447795390292452e-06, + "loss": 0.9814, + "step": 23918 + }, + { + "epoch": 0.61, + "learning_rate": 1.844764731844681e-06, + "loss": 0.7729, + "step": 23919 + }, + { + "epoch": 0.61, + "learning_rate": 1.8447499240133189e-06, + "loss": 0.7402, + "step": 23920 + }, + { + "epoch": 0.61, + "learning_rate": 1.844735115535171e-06, + "loss": 0.7166, + "step": 23921 + }, + { + "epoch": 0.61, + "learning_rate": 1.8447203064102482e-06, + "loss": 0.9902, + "step": 23922 + }, + { + "epoch": 0.61, + "learning_rate": 1.8447054966385618e-06, + "loss": 0.9766, + "step": 23923 + }, + { + "epoch": 0.61, + "learning_rate": 1.8446906862201233e-06, + "loss": 0.7832, + "step": 23924 + }, + { + "epoch": 0.61, + "learning_rate": 1.844675875154944e-06, + "loss": 0.832, + "step": 23925 + }, + { + "epoch": 0.61, + "learning_rate": 1.8446610634430353e-06, + "loss": 0.8438, + "step": 23926 + }, + { + "epoch": 0.61, + "learning_rate": 1.8446462510844084e-06, + "loss": 0.8118, + "step": 23927 + }, + { + "epoch": 0.61, + "learning_rate": 1.8446314380790748e-06, + "loss": 0.7998, + "step": 23928 + }, + { + "epoch": 0.61, + "learning_rate": 1.8446166244270455e-06, + "loss": 0.9883, + "step": 23929 + }, + { + "epoch": 0.61, + "learning_rate": 1.8446018101283324e-06, + "loss": 0.8584, + "step": 23930 + }, + { + "epoch": 0.61, + "learning_rate": 1.8445869951829462e-06, + "loss": 0.7891, + "step": 23931 + }, + { + "epoch": 0.61, + "learning_rate": 1.844572179590899e-06, + "loss": 1.083, + "step": 23932 + }, + { + "epoch": 0.61, + "learning_rate": 1.844557363352201e-06, + "loss": 0.8398, + "step": 23933 + }, + { + "epoch": 0.61, + "learning_rate": 1.844542546466865e-06, + "loss": 0.8965, + "step": 23934 + }, + { + "epoch": 0.61, + "learning_rate": 1.8445277289349013e-06, + "loss": 0.916, + "step": 23935 + }, + { + "epoch": 0.61, + "learning_rate": 1.8445129107563216e-06, + "loss": 0.8418, + "step": 23936 + }, + { + "epoch": 0.61, + "learning_rate": 1.844498091931137e-06, + "loss": 0.7827, + "step": 23937 + }, + { + "epoch": 0.61, + "learning_rate": 1.8444832724593593e-06, + "loss": 0.9971, + "step": 23938 + }, + { + "epoch": 0.61, + "learning_rate": 1.8444684523409994e-06, + "loss": 0.918, + "step": 23939 + }, + { + "epoch": 0.61, + "learning_rate": 1.8444536315760691e-06, + "loss": 0.8398, + "step": 23940 + }, + { + "epoch": 0.61, + "learning_rate": 1.8444388101645792e-06, + "loss": 0.874, + "step": 23941 + }, + { + "epoch": 0.61, + "learning_rate": 1.8444239881065416e-06, + "loss": 0.9502, + "step": 23942 + }, + { + "epoch": 0.61, + "learning_rate": 1.844409165401967e-06, + "loss": 0.8887, + "step": 23943 + }, + { + "epoch": 0.61, + "learning_rate": 1.8443943420508674e-06, + "loss": 1.0547, + "step": 23944 + }, + { + "epoch": 0.61, + "learning_rate": 1.844379518053254e-06, + "loss": 0.9551, + "step": 23945 + }, + { + "epoch": 0.61, + "learning_rate": 1.8443646934091377e-06, + "loss": 0.7285, + "step": 23946 + }, + { + "epoch": 0.61, + "learning_rate": 1.8443498681185305e-06, + "loss": 0.7427, + "step": 23947 + }, + { + "epoch": 0.61, + "learning_rate": 1.8443350421814433e-06, + "loss": 0.9395, + "step": 23948 + }, + { + "epoch": 0.61, + "learning_rate": 1.8443202155978873e-06, + "loss": 0.6846, + "step": 23949 + }, + { + "epoch": 0.61, + "learning_rate": 1.8443053883678746e-06, + "loss": 0.7588, + "step": 23950 + }, + { + "epoch": 0.61, + "learning_rate": 1.8442905604914158e-06, + "loss": 0.8252, + "step": 23951 + }, + { + "epoch": 0.61, + "learning_rate": 1.8442757319685227e-06, + "loss": 1.001, + "step": 23952 + }, + { + "epoch": 0.61, + "learning_rate": 1.8442609027992062e-06, + "loss": 0.7793, + "step": 23953 + }, + { + "epoch": 0.61, + "learning_rate": 1.8442460729834784e-06, + "loss": 0.79, + "step": 23954 + }, + { + "epoch": 0.61, + "learning_rate": 1.8442312425213497e-06, + "loss": 0.8535, + "step": 23955 + }, + { + "epoch": 0.61, + "learning_rate": 1.8442164114128324e-06, + "loss": 0.7402, + "step": 23956 + }, + { + "epoch": 0.61, + "learning_rate": 1.844201579657937e-06, + "loss": 0.915, + "step": 23957 + }, + { + "epoch": 0.61, + "learning_rate": 1.8441867472566757e-06, + "loss": 1.0098, + "step": 23958 + }, + { + "epoch": 0.61, + "learning_rate": 1.8441719142090592e-06, + "loss": 0.877, + "step": 23959 + }, + { + "epoch": 0.61, + "learning_rate": 1.844157080515099e-06, + "loss": 0.7163, + "step": 23960 + }, + { + "epoch": 0.61, + "learning_rate": 1.8441422461748068e-06, + "loss": 0.8779, + "step": 23961 + }, + { + "epoch": 0.61, + "learning_rate": 1.8441274111881934e-06, + "loss": 0.8848, + "step": 23962 + }, + { + "epoch": 0.61, + "learning_rate": 1.8441125755552706e-06, + "loss": 0.8359, + "step": 23963 + }, + { + "epoch": 0.61, + "learning_rate": 1.8440977392760497e-06, + "loss": 0.8223, + "step": 23964 + }, + { + "epoch": 0.61, + "learning_rate": 1.8440829023505417e-06, + "loss": 0.8389, + "step": 23965 + }, + { + "epoch": 0.61, + "learning_rate": 1.8440680647787583e-06, + "loss": 0.6802, + "step": 23966 + }, + { + "epoch": 0.61, + "learning_rate": 1.8440532265607112e-06, + "loss": 0.9756, + "step": 23967 + }, + { + "epoch": 0.61, + "learning_rate": 1.8440383876964109e-06, + "loss": 0.8452, + "step": 23968 + }, + { + "epoch": 0.61, + "learning_rate": 1.8440235481858694e-06, + "loss": 0.9629, + "step": 23969 + }, + { + "epoch": 0.61, + "learning_rate": 1.844008708029098e-06, + "loss": 0.8052, + "step": 23970 + }, + { + "epoch": 0.61, + "learning_rate": 1.8439938672261075e-06, + "loss": 0.8325, + "step": 23971 + }, + { + "epoch": 0.61, + "learning_rate": 1.8439790257769104e-06, + "loss": 0.8071, + "step": 23972 + }, + { + "epoch": 0.61, + "learning_rate": 1.8439641836815168e-06, + "loss": 0.7057, + "step": 23973 + }, + { + "epoch": 0.61, + "learning_rate": 1.8439493409399388e-06, + "loss": 0.9253, + "step": 23974 + }, + { + "epoch": 0.61, + "learning_rate": 1.8439344975521875e-06, + "loss": 0.6787, + "step": 23975 + }, + { + "epoch": 0.61, + "learning_rate": 1.8439196535182745e-06, + "loss": 0.9453, + "step": 23976 + }, + { + "epoch": 0.61, + "learning_rate": 1.843904808838211e-06, + "loss": 0.7402, + "step": 23977 + }, + { + "epoch": 0.61, + "learning_rate": 1.8438899635120083e-06, + "loss": 0.874, + "step": 23978 + }, + { + "epoch": 0.61, + "learning_rate": 1.843875117539678e-06, + "loss": 1.0215, + "step": 23979 + }, + { + "epoch": 0.61, + "learning_rate": 1.8438602709212313e-06, + "loss": 0.7959, + "step": 23980 + }, + { + "epoch": 0.61, + "learning_rate": 1.8438454236566794e-06, + "loss": 0.7446, + "step": 23981 + }, + { + "epoch": 0.61, + "learning_rate": 1.8438305757460339e-06, + "loss": 0.7256, + "step": 23982 + }, + { + "epoch": 0.61, + "learning_rate": 1.8438157271893064e-06, + "loss": 1.0508, + "step": 23983 + }, + { + "epoch": 0.61, + "learning_rate": 1.8438008779865077e-06, + "loss": 0.8672, + "step": 23984 + }, + { + "epoch": 0.61, + "learning_rate": 1.8437860281376496e-06, + "loss": 0.8223, + "step": 23985 + }, + { + "epoch": 0.61, + "learning_rate": 1.8437711776427434e-06, + "loss": 0.8721, + "step": 23986 + }, + { + "epoch": 0.61, + "learning_rate": 1.8437563265018003e-06, + "loss": 0.8438, + "step": 23987 + }, + { + "epoch": 0.61, + "learning_rate": 1.843741474714832e-06, + "loss": 0.8398, + "step": 23988 + }, + { + "epoch": 0.61, + "learning_rate": 1.8437266222818492e-06, + "loss": 0.833, + "step": 23989 + }, + { + "epoch": 0.61, + "learning_rate": 1.843711769202864e-06, + "loss": 0.8262, + "step": 23990 + }, + { + "epoch": 0.61, + "learning_rate": 1.8436969154778877e-06, + "loss": 0.8555, + "step": 23991 + }, + { + "epoch": 0.61, + "learning_rate": 1.8436820611069312e-06, + "loss": 0.8955, + "step": 23992 + }, + { + "epoch": 0.61, + "learning_rate": 1.8436672060900062e-06, + "loss": 0.876, + "step": 23993 + }, + { + "epoch": 0.61, + "learning_rate": 1.843652350427124e-06, + "loss": 0.876, + "step": 23994 + }, + { + "epoch": 0.62, + "learning_rate": 1.8436374941182959e-06, + "loss": 0.8857, + "step": 23995 + }, + { + "epoch": 0.62, + "learning_rate": 1.8436226371635336e-06, + "loss": 0.9883, + "step": 23996 + }, + { + "epoch": 0.62, + "learning_rate": 1.843607779562848e-06, + "loss": 0.9756, + "step": 23997 + }, + { + "epoch": 0.62, + "learning_rate": 1.8435929213162508e-06, + "loss": 0.7578, + "step": 23998 + }, + { + "epoch": 0.62, + "learning_rate": 1.843578062423753e-06, + "loss": 0.9893, + "step": 23999 + }, + { + "epoch": 0.62, + "learning_rate": 1.8435632028853666e-06, + "loss": 0.9102, + "step": 24000 + }, + { + "epoch": 0.62, + "learning_rate": 1.8435483427011028e-06, + "loss": 0.8403, + "step": 24001 + }, + { + "epoch": 0.62, + "learning_rate": 1.8435334818709727e-06, + "loss": 0.7024, + "step": 24002 + }, + { + "epoch": 0.62, + "learning_rate": 1.8435186203949878e-06, + "loss": 0.8369, + "step": 24003 + }, + { + "epoch": 0.62, + "learning_rate": 1.8435037582731593e-06, + "loss": 0.6826, + "step": 24004 + }, + { + "epoch": 0.62, + "learning_rate": 1.8434888955054987e-06, + "loss": 0.8657, + "step": 24005 + }, + { + "epoch": 0.62, + "learning_rate": 1.8434740320920177e-06, + "loss": 0.8218, + "step": 24006 + }, + { + "epoch": 0.62, + "learning_rate": 1.8434591680327274e-06, + "loss": 1.0127, + "step": 24007 + }, + { + "epoch": 0.62, + "learning_rate": 1.843444303327639e-06, + "loss": 0.8174, + "step": 24008 + }, + { + "epoch": 0.62, + "learning_rate": 1.843429437976764e-06, + "loss": 0.7793, + "step": 24009 + }, + { + "epoch": 0.62, + "learning_rate": 1.8434145719801141e-06, + "loss": 0.9443, + "step": 24010 + }, + { + "epoch": 0.62, + "learning_rate": 1.8433997053377005e-06, + "loss": 1.1689, + "step": 24011 + }, + { + "epoch": 0.62, + "learning_rate": 1.8433848380495345e-06, + "loss": 0.8906, + "step": 24012 + }, + { + "epoch": 0.62, + "learning_rate": 1.8433699701156273e-06, + "loss": 1.1309, + "step": 24013 + }, + { + "epoch": 0.62, + "learning_rate": 1.8433551015359907e-06, + "loss": 0.6279, + "step": 24014 + }, + { + "epoch": 0.62, + "learning_rate": 1.843340232310636e-06, + "loss": 0.6929, + "step": 24015 + }, + { + "epoch": 0.62, + "learning_rate": 1.843325362439574e-06, + "loss": 0.8418, + "step": 24016 + }, + { + "epoch": 0.62, + "learning_rate": 1.8433104919228168e-06, + "loss": 0.6382, + "step": 24017 + }, + { + "epoch": 0.62, + "learning_rate": 1.8432956207603755e-06, + "loss": 0.812, + "step": 24018 + }, + { + "epoch": 0.62, + "learning_rate": 1.8432807489522618e-06, + "loss": 0.7861, + "step": 24019 + }, + { + "epoch": 0.62, + "learning_rate": 1.8432658764984864e-06, + "loss": 0.7197, + "step": 24020 + }, + { + "epoch": 0.62, + "learning_rate": 1.8432510033990614e-06, + "loss": 0.8711, + "step": 24021 + }, + { + "epoch": 0.62, + "learning_rate": 1.8432361296539978e-06, + "loss": 0.8125, + "step": 24022 + }, + { + "epoch": 0.62, + "learning_rate": 1.8432212552633069e-06, + "loss": 0.8105, + "step": 24023 + }, + { + "epoch": 0.62, + "learning_rate": 1.8432063802270004e-06, + "loss": 0.9688, + "step": 24024 + }, + { + "epoch": 0.62, + "learning_rate": 1.8431915045450895e-06, + "loss": 0.8833, + "step": 24025 + }, + { + "epoch": 0.62, + "learning_rate": 1.8431766282175855e-06, + "loss": 0.7744, + "step": 24026 + }, + { + "epoch": 0.62, + "learning_rate": 1.8431617512445001e-06, + "loss": 0.7402, + "step": 24027 + }, + { + "epoch": 0.62, + "learning_rate": 1.8431468736258443e-06, + "loss": 0.5737, + "step": 24028 + }, + { + "epoch": 0.62, + "learning_rate": 1.84313199536163e-06, + "loss": 0.729, + "step": 24029 + }, + { + "epoch": 0.62, + "learning_rate": 1.8431171164518684e-06, + "loss": 1.0859, + "step": 24030 + }, + { + "epoch": 0.62, + "learning_rate": 1.8431022368965704e-06, + "loss": 1.0439, + "step": 24031 + }, + { + "epoch": 0.62, + "learning_rate": 1.843087356695748e-06, + "loss": 0.9062, + "step": 24032 + }, + { + "epoch": 0.62, + "learning_rate": 1.8430724758494125e-06, + "loss": 0.8467, + "step": 24033 + }, + { + "epoch": 0.62, + "learning_rate": 1.843057594357575e-06, + "loss": 0.7334, + "step": 24034 + }, + { + "epoch": 0.62, + "learning_rate": 1.8430427122202469e-06, + "loss": 0.9463, + "step": 24035 + }, + { + "epoch": 0.62, + "learning_rate": 1.8430278294374402e-06, + "loss": 0.6714, + "step": 24036 + }, + { + "epoch": 0.62, + "learning_rate": 1.8430129460091655e-06, + "loss": 0.8379, + "step": 24037 + }, + { + "epoch": 0.62, + "learning_rate": 1.8429980619354346e-06, + "loss": 0.9473, + "step": 24038 + }, + { + "epoch": 0.62, + "learning_rate": 1.842983177216259e-06, + "loss": 1.0244, + "step": 24039 + }, + { + "epoch": 0.62, + "learning_rate": 1.8429682918516497e-06, + "loss": 0.686, + "step": 24040 + }, + { + "epoch": 0.62, + "learning_rate": 1.8429534058416185e-06, + "loss": 0.8447, + "step": 24041 + }, + { + "epoch": 0.62, + "learning_rate": 1.8429385191861768e-06, + "loss": 0.6729, + "step": 24042 + }, + { + "epoch": 0.62, + "learning_rate": 1.8429236318853354e-06, + "loss": 0.6252, + "step": 24043 + }, + { + "epoch": 0.62, + "learning_rate": 1.8429087439391067e-06, + "loss": 0.8125, + "step": 24044 + }, + { + "epoch": 0.62, + "learning_rate": 1.842893855347501e-06, + "loss": 1.0156, + "step": 24045 + }, + { + "epoch": 0.62, + "learning_rate": 1.8428789661105305e-06, + "loss": 0.9463, + "step": 24046 + }, + { + "epoch": 0.62, + "learning_rate": 1.8428640762282064e-06, + "loss": 0.916, + "step": 24047 + }, + { + "epoch": 0.62, + "learning_rate": 1.8428491857005396e-06, + "loss": 0.751, + "step": 24048 + }, + { + "epoch": 0.62, + "learning_rate": 1.8428342945275426e-06, + "loss": 0.9941, + "step": 24049 + }, + { + "epoch": 0.62, + "learning_rate": 1.8428194027092256e-06, + "loss": 0.8389, + "step": 24050 + }, + { + "epoch": 0.62, + "learning_rate": 1.8428045102456006e-06, + "loss": 0.7915, + "step": 24051 + }, + { + "epoch": 0.62, + "learning_rate": 1.8427896171366792e-06, + "loss": 0.7461, + "step": 24052 + }, + { + "epoch": 0.62, + "learning_rate": 1.8427747233824725e-06, + "loss": 0.874, + "step": 24053 + }, + { + "epoch": 0.62, + "learning_rate": 1.8427598289829918e-06, + "loss": 0.8877, + "step": 24054 + }, + { + "epoch": 0.62, + "learning_rate": 1.8427449339382487e-06, + "loss": 0.8633, + "step": 24055 + }, + { + "epoch": 0.62, + "learning_rate": 1.8427300382482544e-06, + "loss": 0.8657, + "step": 24056 + }, + { + "epoch": 0.62, + "learning_rate": 1.8427151419130208e-06, + "loss": 1.1113, + "step": 24057 + }, + { + "epoch": 0.62, + "learning_rate": 1.8427002449325587e-06, + "loss": 0.9248, + "step": 24058 + }, + { + "epoch": 0.62, + "learning_rate": 1.8426853473068799e-06, + "loss": 0.76, + "step": 24059 + }, + { + "epoch": 0.62, + "learning_rate": 1.8426704490359955e-06, + "loss": 1.041, + "step": 24060 + }, + { + "epoch": 0.62, + "learning_rate": 1.8426555501199173e-06, + "loss": 0.6992, + "step": 24061 + }, + { + "epoch": 0.62, + "learning_rate": 1.8426406505586566e-06, + "loss": 0.9805, + "step": 24062 + }, + { + "epoch": 0.62, + "learning_rate": 1.8426257503522242e-06, + "loss": 0.8379, + "step": 24063 + }, + { + "epoch": 0.62, + "learning_rate": 1.8426108495006325e-06, + "loss": 0.6748, + "step": 24064 + }, + { + "epoch": 0.62, + "learning_rate": 1.842595948003892e-06, + "loss": 1.0693, + "step": 24065 + }, + { + "epoch": 0.62, + "learning_rate": 1.8425810458620147e-06, + "loss": 0.9453, + "step": 24066 + }, + { + "epoch": 0.62, + "learning_rate": 1.8425661430750118e-06, + "loss": 0.8809, + "step": 24067 + }, + { + "epoch": 0.62, + "learning_rate": 1.842551239642895e-06, + "loss": 0.8545, + "step": 24068 + }, + { + "epoch": 0.62, + "learning_rate": 1.8425363355656754e-06, + "loss": 0.8789, + "step": 24069 + }, + { + "epoch": 0.62, + "learning_rate": 1.8425214308433644e-06, + "loss": 0.7837, + "step": 24070 + }, + { + "epoch": 0.62, + "learning_rate": 1.8425065254759732e-06, + "loss": 0.6953, + "step": 24071 + }, + { + "epoch": 0.62, + "learning_rate": 1.842491619463514e-06, + "loss": 0.751, + "step": 24072 + }, + { + "epoch": 0.62, + "learning_rate": 1.8424767128059973e-06, + "loss": 0.5405, + "step": 24073 + }, + { + "epoch": 0.62, + "learning_rate": 1.842461805503435e-06, + "loss": 0.9873, + "step": 24074 + }, + { + "epoch": 0.62, + "learning_rate": 1.8424468975558386e-06, + "loss": 0.9502, + "step": 24075 + }, + { + "epoch": 0.62, + "learning_rate": 1.8424319889632191e-06, + "loss": 0.7937, + "step": 24076 + }, + { + "epoch": 0.62, + "learning_rate": 1.8424170797255885e-06, + "loss": 0.7959, + "step": 24077 + }, + { + "epoch": 0.62, + "learning_rate": 1.8424021698429575e-06, + "loss": 0.8672, + "step": 24078 + }, + { + "epoch": 0.62, + "learning_rate": 1.842387259315338e-06, + "loss": 0.7554, + "step": 24079 + }, + { + "epoch": 0.62, + "learning_rate": 1.8423723481427414e-06, + "loss": 0.9746, + "step": 24080 + }, + { + "epoch": 0.62, + "learning_rate": 1.842357436325179e-06, + "loss": 0.9092, + "step": 24081 + }, + { + "epoch": 0.62, + "learning_rate": 1.8423425238626625e-06, + "loss": 0.9785, + "step": 24082 + }, + { + "epoch": 0.62, + "learning_rate": 1.8423276107552026e-06, + "loss": 0.7988, + "step": 24083 + }, + { + "epoch": 0.62, + "learning_rate": 1.8423126970028116e-06, + "loss": 0.6211, + "step": 24084 + }, + { + "epoch": 0.62, + "learning_rate": 1.8422977826055002e-06, + "loss": 0.8711, + "step": 24085 + }, + { + "epoch": 0.62, + "learning_rate": 1.8422828675632802e-06, + "loss": 0.8955, + "step": 24086 + }, + { + "epoch": 0.62, + "learning_rate": 1.8422679518761629e-06, + "loss": 0.7393, + "step": 24087 + }, + { + "epoch": 0.62, + "learning_rate": 1.84225303554416e-06, + "loss": 1.1055, + "step": 24088 + }, + { + "epoch": 0.62, + "learning_rate": 1.8422381185672822e-06, + "loss": 0.9209, + "step": 24089 + }, + { + "epoch": 0.62, + "learning_rate": 1.8422232009455416e-06, + "loss": 0.8672, + "step": 24090 + }, + { + "epoch": 0.62, + "learning_rate": 1.8422082826789497e-06, + "loss": 0.8281, + "step": 24091 + }, + { + "epoch": 0.62, + "learning_rate": 1.8421933637675174e-06, + "loss": 0.4834, + "step": 24092 + }, + { + "epoch": 0.62, + "learning_rate": 1.8421784442112564e-06, + "loss": 0.9102, + "step": 24093 + }, + { + "epoch": 0.62, + "learning_rate": 1.842163524010178e-06, + "loss": 0.9043, + "step": 24094 + }, + { + "epoch": 0.62, + "learning_rate": 1.8421486031642938e-06, + "loss": 0.5576, + "step": 24095 + }, + { + "epoch": 0.62, + "learning_rate": 1.8421336816736152e-06, + "loss": 0.9326, + "step": 24096 + }, + { + "epoch": 0.62, + "learning_rate": 1.8421187595381536e-06, + "loss": 0.9316, + "step": 24097 + }, + { + "epoch": 0.62, + "learning_rate": 1.8421038367579205e-06, + "loss": 0.5676, + "step": 24098 + }, + { + "epoch": 0.62, + "learning_rate": 1.842088913332927e-06, + "loss": 0.8882, + "step": 24099 + }, + { + "epoch": 0.62, + "learning_rate": 1.8420739892631847e-06, + "loss": 0.7666, + "step": 24100 + }, + { + "epoch": 0.62, + "learning_rate": 1.8420590645487048e-06, + "loss": 0.7222, + "step": 24101 + }, + { + "epoch": 0.62, + "learning_rate": 1.8420441391894995e-06, + "loss": 0.7539, + "step": 24102 + }, + { + "epoch": 0.62, + "learning_rate": 1.8420292131855795e-06, + "loss": 1.1328, + "step": 24103 + }, + { + "epoch": 0.62, + "learning_rate": 1.8420142865369565e-06, + "loss": 0.8994, + "step": 24104 + }, + { + "epoch": 0.62, + "learning_rate": 1.8419993592436418e-06, + "loss": 0.957, + "step": 24105 + }, + { + "epoch": 0.62, + "learning_rate": 1.8419844313056472e-06, + "loss": 1.0518, + "step": 24106 + }, + { + "epoch": 0.62, + "learning_rate": 1.8419695027229833e-06, + "loss": 0.9678, + "step": 24107 + }, + { + "epoch": 0.62, + "learning_rate": 1.8419545734956625e-06, + "loss": 0.7451, + "step": 24108 + }, + { + "epoch": 0.62, + "learning_rate": 1.8419396436236956e-06, + "loss": 1.124, + "step": 24109 + }, + { + "epoch": 0.62, + "learning_rate": 1.8419247131070943e-06, + "loss": 0.7412, + "step": 24110 + }, + { + "epoch": 0.62, + "learning_rate": 1.84190978194587e-06, + "loss": 0.9541, + "step": 24111 + }, + { + "epoch": 0.62, + "learning_rate": 1.8418948501400343e-06, + "loss": 0.8447, + "step": 24112 + }, + { + "epoch": 0.62, + "learning_rate": 1.841879917689598e-06, + "loss": 0.8052, + "step": 24113 + }, + { + "epoch": 0.62, + "learning_rate": 1.841864984594573e-06, + "loss": 0.8506, + "step": 24114 + }, + { + "epoch": 0.62, + "learning_rate": 1.8418500508549709e-06, + "loss": 0.5151, + "step": 24115 + }, + { + "epoch": 0.62, + "learning_rate": 1.8418351164708027e-06, + "loss": 0.8428, + "step": 24116 + }, + { + "epoch": 0.62, + "learning_rate": 1.8418201814420804e-06, + "loss": 0.8428, + "step": 24117 + }, + { + "epoch": 0.62, + "learning_rate": 1.841805245768815e-06, + "loss": 0.9463, + "step": 24118 + }, + { + "epoch": 0.62, + "learning_rate": 1.841790309451018e-06, + "loss": 0.8809, + "step": 24119 + }, + { + "epoch": 0.62, + "learning_rate": 1.8417753724887006e-06, + "loss": 0.8252, + "step": 24120 + }, + { + "epoch": 0.62, + "learning_rate": 1.8417604348818747e-06, + "loss": 0.772, + "step": 24121 + }, + { + "epoch": 0.62, + "learning_rate": 1.8417454966305516e-06, + "loss": 0.8584, + "step": 24122 + }, + { + "epoch": 0.62, + "learning_rate": 1.8417305577347427e-06, + "loss": 0.7852, + "step": 24123 + }, + { + "epoch": 0.62, + "learning_rate": 1.8417156181944593e-06, + "loss": 0.8242, + "step": 24124 + }, + { + "epoch": 0.62, + "learning_rate": 1.8417006780097131e-06, + "loss": 0.958, + "step": 24125 + }, + { + "epoch": 0.62, + "learning_rate": 1.8416857371805151e-06, + "loss": 0.9766, + "step": 24126 + }, + { + "epoch": 0.62, + "learning_rate": 1.8416707957068773e-06, + "loss": 0.9219, + "step": 24127 + }, + { + "epoch": 0.62, + "learning_rate": 1.8416558535888106e-06, + "loss": 0.8311, + "step": 24128 + }, + { + "epoch": 0.62, + "learning_rate": 1.841640910826327e-06, + "loss": 0.9189, + "step": 24129 + }, + { + "epoch": 0.62, + "learning_rate": 1.8416259674194375e-06, + "loss": 1.0684, + "step": 24130 + }, + { + "epoch": 0.62, + "learning_rate": 1.841611023368154e-06, + "loss": 0.958, + "step": 24131 + }, + { + "epoch": 0.62, + "learning_rate": 1.841596078672487e-06, + "loss": 0.75, + "step": 24132 + }, + { + "epoch": 0.62, + "learning_rate": 1.8415811333324491e-06, + "loss": 0.9893, + "step": 24133 + }, + { + "epoch": 0.62, + "learning_rate": 1.8415661873480513e-06, + "loss": 0.9229, + "step": 24134 + }, + { + "epoch": 0.62, + "learning_rate": 1.8415512407193048e-06, + "loss": 0.7363, + "step": 24135 + }, + { + "epoch": 0.62, + "learning_rate": 1.841536293446221e-06, + "loss": 1.0088, + "step": 24136 + }, + { + "epoch": 0.62, + "learning_rate": 1.8415213455288119e-06, + "loss": 0.9648, + "step": 24137 + }, + { + "epoch": 0.62, + "learning_rate": 1.8415063969670884e-06, + "loss": 0.6465, + "step": 24138 + }, + { + "epoch": 0.62, + "learning_rate": 1.8414914477610621e-06, + "loss": 0.9082, + "step": 24139 + }, + { + "epoch": 0.62, + "learning_rate": 1.8414764979107447e-06, + "loss": 0.7881, + "step": 24140 + }, + { + "epoch": 0.62, + "learning_rate": 1.8414615474161473e-06, + "loss": 0.9111, + "step": 24141 + }, + { + "epoch": 0.62, + "learning_rate": 1.8414465962772812e-06, + "loss": 0.9854, + "step": 24142 + }, + { + "epoch": 0.62, + "learning_rate": 1.8414316444941585e-06, + "loss": 0.9932, + "step": 24143 + }, + { + "epoch": 0.62, + "learning_rate": 1.84141669206679e-06, + "loss": 1.0566, + "step": 24144 + }, + { + "epoch": 0.62, + "learning_rate": 1.841401738995188e-06, + "loss": 0.79, + "step": 24145 + }, + { + "epoch": 0.62, + "learning_rate": 1.8413867852793628e-06, + "loss": 0.9297, + "step": 24146 + }, + { + "epoch": 0.62, + "learning_rate": 1.8413718309193267e-06, + "loss": 0.9023, + "step": 24147 + }, + { + "epoch": 0.62, + "learning_rate": 1.8413568759150908e-06, + "loss": 0.9805, + "step": 24148 + }, + { + "epoch": 0.62, + "learning_rate": 1.8413419202666666e-06, + "loss": 1.0098, + "step": 24149 + }, + { + "epoch": 0.62, + "learning_rate": 1.8413269639740656e-06, + "loss": 0.9717, + "step": 24150 + }, + { + "epoch": 0.62, + "learning_rate": 1.8413120070372994e-06, + "loss": 0.8447, + "step": 24151 + }, + { + "epoch": 0.62, + "learning_rate": 1.8412970494563789e-06, + "loss": 1.0781, + "step": 24152 + }, + { + "epoch": 0.62, + "learning_rate": 1.8412820912313162e-06, + "loss": 1.0361, + "step": 24153 + }, + { + "epoch": 0.62, + "learning_rate": 1.8412671323621225e-06, + "loss": 0.9238, + "step": 24154 + }, + { + "epoch": 0.62, + "learning_rate": 1.8412521728488094e-06, + "loss": 0.8452, + "step": 24155 + }, + { + "epoch": 0.62, + "learning_rate": 1.8412372126913878e-06, + "loss": 0.8115, + "step": 24156 + }, + { + "epoch": 0.62, + "learning_rate": 1.8412222518898697e-06, + "loss": 0.9678, + "step": 24157 + }, + { + "epoch": 0.62, + "learning_rate": 1.8412072904442665e-06, + "loss": 0.7192, + "step": 24158 + }, + { + "epoch": 0.62, + "learning_rate": 1.8411923283545893e-06, + "loss": 0.8623, + "step": 24159 + }, + { + "epoch": 0.62, + "learning_rate": 1.84117736562085e-06, + "loss": 1.0059, + "step": 24160 + }, + { + "epoch": 0.62, + "learning_rate": 1.84116240224306e-06, + "loss": 0.9131, + "step": 24161 + }, + { + "epoch": 0.62, + "learning_rate": 1.8411474382212304e-06, + "loss": 0.9189, + "step": 24162 + }, + { + "epoch": 0.62, + "learning_rate": 1.841132473555373e-06, + "loss": 0.8096, + "step": 24163 + }, + { + "epoch": 0.62, + "learning_rate": 1.841117508245499e-06, + "loss": 1.0078, + "step": 24164 + }, + { + "epoch": 0.62, + "learning_rate": 1.8411025422916203e-06, + "loss": 0.7783, + "step": 24165 + }, + { + "epoch": 0.62, + "learning_rate": 1.8410875756937477e-06, + "loss": 0.9551, + "step": 24166 + }, + { + "epoch": 0.62, + "learning_rate": 1.8410726084518933e-06, + "loss": 0.6167, + "step": 24167 + }, + { + "epoch": 0.62, + "learning_rate": 1.841057640566068e-06, + "loss": 0.9062, + "step": 24168 + }, + { + "epoch": 0.62, + "learning_rate": 1.8410426720362837e-06, + "loss": 0.7661, + "step": 24169 + }, + { + "epoch": 0.62, + "learning_rate": 1.8410277028625516e-06, + "loss": 0.8916, + "step": 24170 + }, + { + "epoch": 0.62, + "learning_rate": 1.8410127330448834e-06, + "loss": 0.8809, + "step": 24171 + }, + { + "epoch": 0.62, + "learning_rate": 1.8409977625832904e-06, + "loss": 0.9604, + "step": 24172 + }, + { + "epoch": 0.62, + "learning_rate": 1.840982791477784e-06, + "loss": 0.8037, + "step": 24173 + }, + { + "epoch": 0.62, + "learning_rate": 1.840967819728376e-06, + "loss": 0.9131, + "step": 24174 + }, + { + "epoch": 0.62, + "learning_rate": 1.8409528473350773e-06, + "loss": 0.791, + "step": 24175 + }, + { + "epoch": 0.62, + "learning_rate": 1.8409378742979e-06, + "loss": 0.9844, + "step": 24176 + }, + { + "epoch": 0.62, + "learning_rate": 1.840922900616855e-06, + "loss": 0.6982, + "step": 24177 + }, + { + "epoch": 0.62, + "learning_rate": 1.8409079262919538e-06, + "loss": 1.0742, + "step": 24178 + }, + { + "epoch": 0.62, + "learning_rate": 1.8408929513232083e-06, + "loss": 0.6924, + "step": 24179 + }, + { + "epoch": 0.62, + "learning_rate": 1.8408779757106298e-06, + "loss": 0.6636, + "step": 24180 + }, + { + "epoch": 0.62, + "learning_rate": 1.8408629994542296e-06, + "loss": 0.4438, + "step": 24181 + }, + { + "epoch": 0.62, + "learning_rate": 1.8408480225540192e-06, + "loss": 0.8398, + "step": 24182 + }, + { + "epoch": 0.62, + "learning_rate": 1.8408330450100102e-06, + "loss": 1.0596, + "step": 24183 + }, + { + "epoch": 0.62, + "learning_rate": 1.8408180668222144e-06, + "loss": 0.8104, + "step": 24184 + }, + { + "epoch": 0.62, + "learning_rate": 1.8408030879906424e-06, + "loss": 0.6152, + "step": 24185 + }, + { + "epoch": 0.62, + "learning_rate": 1.8407881085153063e-06, + "loss": 1.1191, + "step": 24186 + }, + { + "epoch": 0.62, + "learning_rate": 1.8407731283962172e-06, + "loss": 0.7095, + "step": 24187 + }, + { + "epoch": 0.62, + "learning_rate": 1.8407581476333868e-06, + "loss": 0.9409, + "step": 24188 + }, + { + "epoch": 0.62, + "learning_rate": 1.8407431662268266e-06, + "loss": 0.8555, + "step": 24189 + }, + { + "epoch": 0.62, + "learning_rate": 1.840728184176548e-06, + "loss": 0.8867, + "step": 24190 + }, + { + "epoch": 0.62, + "learning_rate": 1.8407132014825629e-06, + "loss": 0.6929, + "step": 24191 + }, + { + "epoch": 0.62, + "learning_rate": 1.8406982181448817e-06, + "loss": 0.8223, + "step": 24192 + }, + { + "epoch": 0.62, + "learning_rate": 1.840683234163517e-06, + "loss": 0.7661, + "step": 24193 + }, + { + "epoch": 0.62, + "learning_rate": 1.8406682495384795e-06, + "loss": 0.915, + "step": 24194 + }, + { + "epoch": 0.62, + "learning_rate": 1.8406532642697811e-06, + "loss": 0.7559, + "step": 24195 + }, + { + "epoch": 0.62, + "learning_rate": 1.8406382783574334e-06, + "loss": 0.9512, + "step": 24196 + }, + { + "epoch": 0.62, + "learning_rate": 1.8406232918014472e-06, + "loss": 0.918, + "step": 24197 + }, + { + "epoch": 0.62, + "learning_rate": 1.8406083046018348e-06, + "loss": 0.79, + "step": 24198 + }, + { + "epoch": 0.62, + "learning_rate": 1.840593316758607e-06, + "loss": 0.8691, + "step": 24199 + }, + { + "epoch": 0.62, + "learning_rate": 1.8405783282717758e-06, + "loss": 0.9385, + "step": 24200 + }, + { + "epoch": 0.62, + "learning_rate": 1.8405633391413521e-06, + "loss": 0.7655, + "step": 24201 + }, + { + "epoch": 0.62, + "learning_rate": 1.840548349367348e-06, + "loss": 1.0654, + "step": 24202 + }, + { + "epoch": 0.62, + "learning_rate": 1.8405333589497745e-06, + "loss": 0.8125, + "step": 24203 + }, + { + "epoch": 0.62, + "learning_rate": 1.8405183678886433e-06, + "loss": 0.5774, + "step": 24204 + }, + { + "epoch": 0.62, + "learning_rate": 1.8405033761839658e-06, + "loss": 1.0391, + "step": 24205 + }, + { + "epoch": 0.62, + "learning_rate": 1.8404883838357535e-06, + "loss": 0.6519, + "step": 24206 + }, + { + "epoch": 0.62, + "learning_rate": 1.8404733908440178e-06, + "loss": 0.771, + "step": 24207 + }, + { + "epoch": 0.62, + "learning_rate": 1.8404583972087707e-06, + "loss": 0.9229, + "step": 24208 + }, + { + "epoch": 0.62, + "learning_rate": 1.8404434029300226e-06, + "loss": 0.7568, + "step": 24209 + }, + { + "epoch": 0.62, + "learning_rate": 1.8404284080077858e-06, + "loss": 0.5801, + "step": 24210 + }, + { + "epoch": 0.62, + "learning_rate": 1.8404134124420721e-06, + "loss": 0.7109, + "step": 24211 + }, + { + "epoch": 0.62, + "learning_rate": 1.840398416232892e-06, + "loss": 0.7705, + "step": 24212 + }, + { + "epoch": 0.62, + "learning_rate": 1.8403834193802577e-06, + "loss": 0.7959, + "step": 24213 + }, + { + "epoch": 0.62, + "learning_rate": 1.8403684218841805e-06, + "loss": 0.9922, + "step": 24214 + }, + { + "epoch": 0.62, + "learning_rate": 1.8403534237446717e-06, + "loss": 0.6833, + "step": 24215 + }, + { + "epoch": 0.62, + "learning_rate": 1.840338424961743e-06, + "loss": 0.9385, + "step": 24216 + }, + { + "epoch": 0.62, + "learning_rate": 1.8403234255354056e-06, + "loss": 0.7178, + "step": 24217 + }, + { + "epoch": 0.62, + "learning_rate": 1.8403084254656716e-06, + "loss": 0.8198, + "step": 24218 + }, + { + "epoch": 0.62, + "learning_rate": 1.8402934247525518e-06, + "loss": 0.9404, + "step": 24219 + }, + { + "epoch": 0.62, + "learning_rate": 1.840278423396058e-06, + "loss": 0.7266, + "step": 24220 + }, + { + "epoch": 0.62, + "learning_rate": 1.8402634213962015e-06, + "loss": 0.7329, + "step": 24221 + }, + { + "epoch": 0.62, + "learning_rate": 1.8402484187529944e-06, + "loss": 0.9844, + "step": 24222 + }, + { + "epoch": 0.62, + "learning_rate": 1.8402334154664474e-06, + "loss": 1.0137, + "step": 24223 + }, + { + "epoch": 0.62, + "learning_rate": 1.8402184115365725e-06, + "loss": 0.9287, + "step": 24224 + }, + { + "epoch": 0.62, + "learning_rate": 1.8402034069633806e-06, + "loss": 0.6816, + "step": 24225 + }, + { + "epoch": 0.62, + "learning_rate": 1.840188401746884e-06, + "loss": 0.8232, + "step": 24226 + }, + { + "epoch": 0.62, + "learning_rate": 1.8401733958870933e-06, + "loss": 0.7842, + "step": 24227 + }, + { + "epoch": 0.62, + "learning_rate": 1.8401583893840207e-06, + "loss": 0.7373, + "step": 24228 + }, + { + "epoch": 0.62, + "learning_rate": 1.8401433822376777e-06, + "loss": 0.7002, + "step": 24229 + }, + { + "epoch": 0.62, + "learning_rate": 1.8401283744480751e-06, + "loss": 1.043, + "step": 24230 + }, + { + "epoch": 0.62, + "learning_rate": 1.8401133660152252e-06, + "loss": 0.6255, + "step": 24231 + }, + { + "epoch": 0.62, + "learning_rate": 1.8400983569391388e-06, + "loss": 0.9053, + "step": 24232 + }, + { + "epoch": 0.62, + "learning_rate": 1.8400833472198284e-06, + "loss": 0.7271, + "step": 24233 + }, + { + "epoch": 0.62, + "learning_rate": 1.840068336857304e-06, + "loss": 0.8643, + "step": 24234 + }, + { + "epoch": 0.62, + "learning_rate": 1.8400533258515783e-06, + "loss": 0.7578, + "step": 24235 + }, + { + "epoch": 0.62, + "learning_rate": 1.8400383142026624e-06, + "loss": 0.9414, + "step": 24236 + }, + { + "epoch": 0.62, + "learning_rate": 1.8400233019105675e-06, + "loss": 0.9189, + "step": 24237 + }, + { + "epoch": 0.62, + "learning_rate": 1.8400082889753057e-06, + "loss": 0.7969, + "step": 24238 + }, + { + "epoch": 0.62, + "learning_rate": 1.8399932753968881e-06, + "loss": 0.875, + "step": 24239 + }, + { + "epoch": 0.62, + "learning_rate": 1.839978261175326e-06, + "loss": 1.1123, + "step": 24240 + }, + { + "epoch": 0.62, + "learning_rate": 1.8399632463106316e-06, + "loss": 0.8975, + "step": 24241 + }, + { + "epoch": 0.62, + "learning_rate": 1.8399482308028157e-06, + "loss": 1.0078, + "step": 24242 + }, + { + "epoch": 0.62, + "learning_rate": 1.8399332146518903e-06, + "loss": 0.6758, + "step": 24243 + }, + { + "epoch": 0.62, + "learning_rate": 1.8399181978578665e-06, + "loss": 0.6562, + "step": 24244 + }, + { + "epoch": 0.62, + "learning_rate": 1.8399031804207558e-06, + "loss": 0.7939, + "step": 24245 + }, + { + "epoch": 0.62, + "learning_rate": 1.83988816234057e-06, + "loss": 0.7441, + "step": 24246 + }, + { + "epoch": 0.62, + "learning_rate": 1.8398731436173204e-06, + "loss": 0.6924, + "step": 24247 + }, + { + "epoch": 0.62, + "learning_rate": 1.8398581242510187e-06, + "loss": 0.8579, + "step": 24248 + }, + { + "epoch": 0.62, + "learning_rate": 1.8398431042416763e-06, + "loss": 0.7178, + "step": 24249 + }, + { + "epoch": 0.62, + "learning_rate": 1.8398280835893046e-06, + "loss": 0.8896, + "step": 24250 + }, + { + "epoch": 0.62, + "learning_rate": 1.839813062293915e-06, + "loss": 0.7188, + "step": 24251 + }, + { + "epoch": 0.62, + "learning_rate": 1.8397980403555192e-06, + "loss": 1.1348, + "step": 24252 + }, + { + "epoch": 0.62, + "learning_rate": 1.8397830177741287e-06, + "loss": 0.9785, + "step": 24253 + }, + { + "epoch": 0.62, + "learning_rate": 1.8397679945497548e-06, + "loss": 1.0059, + "step": 24254 + }, + { + "epoch": 0.62, + "learning_rate": 1.8397529706824094e-06, + "loss": 0.8877, + "step": 24255 + }, + { + "epoch": 0.62, + "learning_rate": 1.8397379461721037e-06, + "loss": 0.811, + "step": 24256 + }, + { + "epoch": 0.62, + "learning_rate": 1.8397229210188492e-06, + "loss": 0.8047, + "step": 24257 + }, + { + "epoch": 0.62, + "learning_rate": 1.8397078952226575e-06, + "loss": 0.9102, + "step": 24258 + }, + { + "epoch": 0.62, + "learning_rate": 1.83969286878354e-06, + "loss": 0.9092, + "step": 24259 + }, + { + "epoch": 0.62, + "learning_rate": 1.8396778417015084e-06, + "loss": 0.9482, + "step": 24260 + }, + { + "epoch": 0.62, + "learning_rate": 1.8396628139765742e-06, + "loss": 1.0947, + "step": 24261 + }, + { + "epoch": 0.62, + "learning_rate": 1.8396477856087485e-06, + "loss": 0.6851, + "step": 24262 + }, + { + "epoch": 0.62, + "learning_rate": 1.8396327565980431e-06, + "loss": 0.8267, + "step": 24263 + }, + { + "epoch": 0.62, + "learning_rate": 1.8396177269444698e-06, + "loss": 0.8428, + "step": 24264 + }, + { + "epoch": 0.62, + "learning_rate": 1.8396026966480397e-06, + "loss": 0.9229, + "step": 24265 + }, + { + "epoch": 0.62, + "learning_rate": 1.8395876657087643e-06, + "loss": 0.7703, + "step": 24266 + }, + { + "epoch": 0.62, + "learning_rate": 1.8395726341266553e-06, + "loss": 0.8975, + "step": 24267 + }, + { + "epoch": 0.62, + "learning_rate": 1.8395576019017241e-06, + "loss": 1.1133, + "step": 24268 + }, + { + "epoch": 0.62, + "learning_rate": 1.8395425690339824e-06, + "loss": 0.8857, + "step": 24269 + }, + { + "epoch": 0.62, + "learning_rate": 1.8395275355234413e-06, + "loss": 0.8286, + "step": 24270 + }, + { + "epoch": 0.62, + "learning_rate": 1.839512501370113e-06, + "loss": 0.8232, + "step": 24271 + }, + { + "epoch": 0.62, + "learning_rate": 1.839497466574008e-06, + "loss": 0.7427, + "step": 24272 + }, + { + "epoch": 0.62, + "learning_rate": 1.8394824311351386e-06, + "loss": 1.0352, + "step": 24273 + }, + { + "epoch": 0.62, + "learning_rate": 1.8394673950535165e-06, + "loss": 0.8877, + "step": 24274 + }, + { + "epoch": 0.62, + "learning_rate": 1.8394523583291525e-06, + "loss": 0.8096, + "step": 24275 + }, + { + "epoch": 0.62, + "learning_rate": 1.8394373209620583e-06, + "loss": 0.8057, + "step": 24276 + }, + { + "epoch": 0.62, + "learning_rate": 1.8394222829522455e-06, + "loss": 0.665, + "step": 24277 + }, + { + "epoch": 0.62, + "learning_rate": 1.839407244299726e-06, + "loss": 0.7705, + "step": 24278 + }, + { + "epoch": 0.62, + "learning_rate": 1.8393922050045108e-06, + "loss": 0.7725, + "step": 24279 + }, + { + "epoch": 0.62, + "learning_rate": 1.8393771650666117e-06, + "loss": 0.7041, + "step": 24280 + }, + { + "epoch": 0.62, + "learning_rate": 1.8393621244860397e-06, + "loss": 0.9443, + "step": 24281 + }, + { + "epoch": 0.62, + "learning_rate": 1.8393470832628071e-06, + "loss": 0.8545, + "step": 24282 + }, + { + "epoch": 0.62, + "learning_rate": 1.8393320413969251e-06, + "loss": 0.9482, + "step": 24283 + }, + { + "epoch": 0.62, + "learning_rate": 1.839316998888405e-06, + "loss": 0.8281, + "step": 24284 + }, + { + "epoch": 0.62, + "learning_rate": 1.8393019557372582e-06, + "loss": 0.9824, + "step": 24285 + }, + { + "epoch": 0.62, + "learning_rate": 1.8392869119434968e-06, + "loss": 0.7573, + "step": 24286 + }, + { + "epoch": 0.62, + "learning_rate": 1.839271867507132e-06, + "loss": 0.7029, + "step": 24287 + }, + { + "epoch": 0.62, + "learning_rate": 1.8392568224281753e-06, + "loss": 0.8657, + "step": 24288 + }, + { + "epoch": 0.62, + "learning_rate": 1.8392417767066381e-06, + "loss": 1.0645, + "step": 24289 + }, + { + "epoch": 0.62, + "learning_rate": 1.8392267303425322e-06, + "loss": 0.6738, + "step": 24290 + }, + { + "epoch": 0.62, + "learning_rate": 1.839211683335869e-06, + "loss": 0.8975, + "step": 24291 + }, + { + "epoch": 0.62, + "learning_rate": 1.83919663568666e-06, + "loss": 0.9062, + "step": 24292 + }, + { + "epoch": 0.62, + "learning_rate": 1.8391815873949165e-06, + "loss": 1.1279, + "step": 24293 + }, + { + "epoch": 0.62, + "learning_rate": 1.8391665384606505e-06, + "loss": 0.8545, + "step": 24294 + }, + { + "epoch": 0.62, + "learning_rate": 1.839151488883873e-06, + "loss": 1.0117, + "step": 24295 + }, + { + "epoch": 0.62, + "learning_rate": 1.839136438664596e-06, + "loss": 0.9736, + "step": 24296 + }, + { + "epoch": 0.62, + "learning_rate": 1.8391213878028308e-06, + "loss": 0.8887, + "step": 24297 + }, + { + "epoch": 0.62, + "learning_rate": 1.839106336298589e-06, + "loss": 0.7725, + "step": 24298 + }, + { + "epoch": 0.62, + "learning_rate": 1.839091284151882e-06, + "loss": 1.0625, + "step": 24299 + }, + { + "epoch": 0.62, + "learning_rate": 1.8390762313627213e-06, + "loss": 0.7715, + "step": 24300 + }, + { + "epoch": 0.62, + "learning_rate": 1.8390611779311187e-06, + "loss": 0.9023, + "step": 24301 + }, + { + "epoch": 0.62, + "learning_rate": 1.8390461238570853e-06, + "loss": 0.9131, + "step": 24302 + }, + { + "epoch": 0.62, + "learning_rate": 1.839031069140633e-06, + "loss": 0.8418, + "step": 24303 + }, + { + "epoch": 0.62, + "learning_rate": 1.8390160137817731e-06, + "loss": 0.6846, + "step": 24304 + }, + { + "epoch": 0.62, + "learning_rate": 1.8390009577805174e-06, + "loss": 0.7598, + "step": 24305 + }, + { + "epoch": 0.62, + "learning_rate": 1.8389859011368772e-06, + "loss": 0.8154, + "step": 24306 + }, + { + "epoch": 0.62, + "learning_rate": 1.838970843850864e-06, + "loss": 0.8691, + "step": 24307 + }, + { + "epoch": 0.62, + "learning_rate": 1.8389557859224893e-06, + "loss": 0.9365, + "step": 24308 + }, + { + "epoch": 0.62, + "learning_rate": 1.838940727351765e-06, + "loss": 0.8896, + "step": 24309 + }, + { + "epoch": 0.62, + "learning_rate": 1.8389256681387019e-06, + "loss": 0.958, + "step": 24310 + }, + { + "epoch": 0.62, + "learning_rate": 1.8389106082833124e-06, + "loss": 1.0361, + "step": 24311 + }, + { + "epoch": 0.62, + "learning_rate": 1.8388955477856073e-06, + "loss": 0.6885, + "step": 24312 + }, + { + "epoch": 0.62, + "learning_rate": 1.838880486645599e-06, + "loss": 0.8887, + "step": 24313 + }, + { + "epoch": 0.62, + "learning_rate": 1.838865424863298e-06, + "loss": 0.9893, + "step": 24314 + }, + { + "epoch": 0.62, + "learning_rate": 1.8388503624387167e-06, + "loss": 0.8335, + "step": 24315 + }, + { + "epoch": 0.62, + "learning_rate": 1.8388352993718658e-06, + "loss": 0.7241, + "step": 24316 + }, + { + "epoch": 0.62, + "learning_rate": 1.8388202356627577e-06, + "loss": 0.8281, + "step": 24317 + }, + { + "epoch": 0.62, + "learning_rate": 1.8388051713114033e-06, + "loss": 0.7695, + "step": 24318 + }, + { + "epoch": 0.62, + "learning_rate": 1.8387901063178142e-06, + "loss": 0.7476, + "step": 24319 + }, + { + "epoch": 0.62, + "learning_rate": 1.838775040682002e-06, + "loss": 0.7271, + "step": 24320 + }, + { + "epoch": 0.62, + "learning_rate": 1.8387599744039788e-06, + "loss": 0.915, + "step": 24321 + }, + { + "epoch": 0.62, + "learning_rate": 1.8387449074837554e-06, + "loss": 0.9385, + "step": 24322 + }, + { + "epoch": 0.62, + "learning_rate": 1.8387298399213438e-06, + "loss": 0.9453, + "step": 24323 + }, + { + "epoch": 0.62, + "learning_rate": 1.8387147717167548e-06, + "loss": 0.8862, + "step": 24324 + }, + { + "epoch": 0.62, + "learning_rate": 1.838699702870001e-06, + "loss": 0.8428, + "step": 24325 + }, + { + "epoch": 0.62, + "learning_rate": 1.838684633381093e-06, + "loss": 0.8975, + "step": 24326 + }, + { + "epoch": 0.62, + "learning_rate": 1.8386695632500432e-06, + "loss": 0.8643, + "step": 24327 + }, + { + "epoch": 0.62, + "learning_rate": 1.8386544924768623e-06, + "loss": 0.7153, + "step": 24328 + }, + { + "epoch": 0.62, + "learning_rate": 1.8386394210615624e-06, + "loss": 0.5708, + "step": 24329 + }, + { + "epoch": 0.62, + "learning_rate": 1.8386243490041547e-06, + "loss": 0.8281, + "step": 24330 + }, + { + "epoch": 0.62, + "learning_rate": 1.8386092763046511e-06, + "loss": 0.9629, + "step": 24331 + }, + { + "epoch": 0.62, + "learning_rate": 1.8385942029630627e-06, + "loss": 0.9727, + "step": 24332 + }, + { + "epoch": 0.62, + "learning_rate": 1.8385791289794015e-06, + "loss": 0.9014, + "step": 24333 + }, + { + "epoch": 0.62, + "learning_rate": 1.8385640543536787e-06, + "loss": 0.9561, + "step": 24334 + }, + { + "epoch": 0.62, + "learning_rate": 1.8385489790859058e-06, + "loss": 0.9922, + "step": 24335 + }, + { + "epoch": 0.62, + "learning_rate": 1.8385339031760949e-06, + "loss": 0.8496, + "step": 24336 + }, + { + "epoch": 0.62, + "learning_rate": 1.838518826624257e-06, + "loss": 0.918, + "step": 24337 + }, + { + "epoch": 0.62, + "learning_rate": 1.8385037494304037e-06, + "loss": 1.0918, + "step": 24338 + }, + { + "epoch": 0.62, + "learning_rate": 1.8384886715945468e-06, + "loss": 0.9258, + "step": 24339 + }, + { + "epoch": 0.62, + "learning_rate": 1.8384735931166975e-06, + "loss": 0.6108, + "step": 24340 + }, + { + "epoch": 0.62, + "learning_rate": 1.8384585139968674e-06, + "loss": 0.8398, + "step": 24341 + }, + { + "epoch": 0.62, + "learning_rate": 1.8384434342350684e-06, + "loss": 0.8779, + "step": 24342 + }, + { + "epoch": 0.62, + "learning_rate": 1.8384283538313117e-06, + "loss": 0.8027, + "step": 24343 + }, + { + "epoch": 0.62, + "learning_rate": 1.838413272785609e-06, + "loss": 0.7549, + "step": 24344 + }, + { + "epoch": 0.62, + "learning_rate": 1.8383981910979718e-06, + "loss": 0.7129, + "step": 24345 + }, + { + "epoch": 0.62, + "learning_rate": 1.8383831087684117e-06, + "loss": 0.9736, + "step": 24346 + }, + { + "epoch": 0.62, + "learning_rate": 1.83836802579694e-06, + "loss": 0.751, + "step": 24347 + }, + { + "epoch": 0.62, + "learning_rate": 1.8383529421835688e-06, + "loss": 0.7532, + "step": 24348 + }, + { + "epoch": 0.62, + "learning_rate": 1.8383378579283094e-06, + "loss": 0.8701, + "step": 24349 + }, + { + "epoch": 0.62, + "learning_rate": 1.8383227730311725e-06, + "loss": 0.8564, + "step": 24350 + }, + { + "epoch": 0.62, + "learning_rate": 1.8383076874921711e-06, + "loss": 0.959, + "step": 24351 + }, + { + "epoch": 0.62, + "learning_rate": 1.8382926013113157e-06, + "loss": 0.7412, + "step": 24352 + }, + { + "epoch": 0.62, + "learning_rate": 1.8382775144886184e-06, + "loss": 0.876, + "step": 24353 + }, + { + "epoch": 0.62, + "learning_rate": 1.8382624270240905e-06, + "loss": 0.8555, + "step": 24354 + }, + { + "epoch": 0.62, + "learning_rate": 1.8382473389177435e-06, + "loss": 0.8682, + "step": 24355 + }, + { + "epoch": 0.62, + "learning_rate": 1.8382322501695895e-06, + "loss": 0.8965, + "step": 24356 + }, + { + "epoch": 0.62, + "learning_rate": 1.838217160779639e-06, + "loss": 0.9854, + "step": 24357 + }, + { + "epoch": 0.62, + "learning_rate": 1.8382020707479046e-06, + "loss": 0.7163, + "step": 24358 + }, + { + "epoch": 0.62, + "learning_rate": 1.838186980074397e-06, + "loss": 0.8311, + "step": 24359 + }, + { + "epoch": 0.62, + "learning_rate": 1.8381718887591284e-06, + "loss": 0.8203, + "step": 24360 + }, + { + "epoch": 0.62, + "learning_rate": 1.8381567968021104e-06, + "loss": 0.792, + "step": 24361 + }, + { + "epoch": 0.62, + "learning_rate": 1.838141704203354e-06, + "loss": 0.874, + "step": 24362 + }, + { + "epoch": 0.62, + "learning_rate": 1.8381266109628708e-06, + "loss": 0.8105, + "step": 24363 + }, + { + "epoch": 0.62, + "learning_rate": 1.8381115170806729e-06, + "loss": 0.7471, + "step": 24364 + }, + { + "epoch": 0.62, + "learning_rate": 1.8380964225567715e-06, + "loss": 0.9229, + "step": 24365 + }, + { + "epoch": 0.62, + "learning_rate": 1.8380813273911784e-06, + "loss": 1.0918, + "step": 24366 + }, + { + "epoch": 0.62, + "learning_rate": 1.8380662315839043e-06, + "loss": 0.9189, + "step": 24367 + }, + { + "epoch": 0.62, + "learning_rate": 1.8380511351349621e-06, + "loss": 0.876, + "step": 24368 + }, + { + "epoch": 0.62, + "learning_rate": 1.8380360380443624e-06, + "loss": 0.7051, + "step": 24369 + }, + { + "epoch": 0.62, + "learning_rate": 1.8380209403121172e-06, + "loss": 0.79, + "step": 24370 + }, + { + "epoch": 0.62, + "learning_rate": 1.8380058419382378e-06, + "loss": 0.8818, + "step": 24371 + }, + { + "epoch": 0.62, + "learning_rate": 1.8379907429227358e-06, + "loss": 0.9971, + "step": 24372 + }, + { + "epoch": 0.62, + "learning_rate": 1.837975643265623e-06, + "loss": 1.1055, + "step": 24373 + }, + { + "epoch": 0.62, + "learning_rate": 1.8379605429669108e-06, + "loss": 0.9844, + "step": 24374 + }, + { + "epoch": 0.62, + "learning_rate": 1.8379454420266103e-06, + "loss": 0.7383, + "step": 24375 + }, + { + "epoch": 0.62, + "learning_rate": 1.837930340444734e-06, + "loss": 0.7275, + "step": 24376 + }, + { + "epoch": 0.62, + "learning_rate": 1.8379152382212927e-06, + "loss": 0.8887, + "step": 24377 + }, + { + "epoch": 0.62, + "learning_rate": 1.8379001353562985e-06, + "loss": 0.8955, + "step": 24378 + }, + { + "epoch": 0.62, + "learning_rate": 1.8378850318497623e-06, + "loss": 0.6724, + "step": 24379 + }, + { + "epoch": 0.62, + "learning_rate": 1.8378699277016962e-06, + "loss": 0.6929, + "step": 24380 + }, + { + "epoch": 0.62, + "learning_rate": 1.8378548229121118e-06, + "loss": 0.8662, + "step": 24381 + }, + { + "epoch": 0.62, + "learning_rate": 1.8378397174810202e-06, + "loss": 0.8184, + "step": 24382 + }, + { + "epoch": 0.62, + "learning_rate": 1.8378246114084334e-06, + "loss": 0.8789, + "step": 24383 + }, + { + "epoch": 0.62, + "learning_rate": 1.8378095046943628e-06, + "loss": 0.8447, + "step": 24384 + }, + { + "epoch": 0.62, + "learning_rate": 1.83779439733882e-06, + "loss": 0.9795, + "step": 24385 + }, + { + "epoch": 0.63, + "learning_rate": 1.837779289341817e-06, + "loss": 0.8818, + "step": 24386 + }, + { + "epoch": 0.63, + "learning_rate": 1.8377641807033642e-06, + "loss": 0.7124, + "step": 24387 + }, + { + "epoch": 0.63, + "learning_rate": 1.8377490714234741e-06, + "loss": 0.9004, + "step": 24388 + }, + { + "epoch": 0.63, + "learning_rate": 1.8377339615021582e-06, + "loss": 0.7607, + "step": 24389 + }, + { + "epoch": 0.63, + "learning_rate": 1.837718850939428e-06, + "loss": 0.916, + "step": 24390 + }, + { + "epoch": 0.63, + "learning_rate": 1.8377037397352948e-06, + "loss": 0.9009, + "step": 24391 + }, + { + "epoch": 0.63, + "learning_rate": 1.8376886278897703e-06, + "loss": 0.7139, + "step": 24392 + }, + { + "epoch": 0.63, + "learning_rate": 1.8376735154028664e-06, + "loss": 0.7852, + "step": 24393 + }, + { + "epoch": 0.63, + "learning_rate": 1.8376584022745942e-06, + "loss": 0.7524, + "step": 24394 + }, + { + "epoch": 0.63, + "learning_rate": 1.8376432885049656e-06, + "loss": 1.0283, + "step": 24395 + }, + { + "epoch": 0.63, + "learning_rate": 1.837628174093992e-06, + "loss": 0.9658, + "step": 24396 + }, + { + "epoch": 0.63, + "learning_rate": 1.8376130590416849e-06, + "loss": 0.833, + "step": 24397 + }, + { + "epoch": 0.63, + "learning_rate": 1.8375979433480563e-06, + "loss": 0.792, + "step": 24398 + }, + { + "epoch": 0.63, + "learning_rate": 1.8375828270131172e-06, + "loss": 0.9746, + "step": 24399 + }, + { + "epoch": 0.63, + "learning_rate": 1.8375677100368794e-06, + "loss": 0.8584, + "step": 24400 + }, + { + "epoch": 0.63, + "learning_rate": 1.837552592419355e-06, + "loss": 0.9541, + "step": 24401 + }, + { + "epoch": 0.63, + "learning_rate": 1.8375374741605544e-06, + "loss": 0.8506, + "step": 24402 + }, + { + "epoch": 0.63, + "learning_rate": 1.8375223552604902e-06, + "loss": 0.8096, + "step": 24403 + }, + { + "epoch": 0.63, + "learning_rate": 1.8375072357191738e-06, + "loss": 0.7585, + "step": 24404 + }, + { + "epoch": 0.63, + "learning_rate": 1.8374921155366164e-06, + "loss": 0.9512, + "step": 24405 + }, + { + "epoch": 0.63, + "learning_rate": 1.8374769947128299e-06, + "loss": 0.9023, + "step": 24406 + }, + { + "epoch": 0.63, + "learning_rate": 1.8374618732478258e-06, + "loss": 1.0615, + "step": 24407 + }, + { + "epoch": 0.63, + "learning_rate": 1.8374467511416155e-06, + "loss": 1.0098, + "step": 24408 + }, + { + "epoch": 0.63, + "learning_rate": 1.8374316283942108e-06, + "loss": 0.7559, + "step": 24409 + }, + { + "epoch": 0.63, + "learning_rate": 1.8374165050056233e-06, + "loss": 1.0186, + "step": 24410 + }, + { + "epoch": 0.63, + "learning_rate": 1.8374013809758644e-06, + "loss": 0.8711, + "step": 24411 + }, + { + "epoch": 0.63, + "learning_rate": 1.8373862563049455e-06, + "loss": 0.751, + "step": 24412 + }, + { + "epoch": 0.63, + "learning_rate": 1.8373711309928788e-06, + "loss": 0.7466, + "step": 24413 + }, + { + "epoch": 0.63, + "learning_rate": 1.8373560050396754e-06, + "loss": 0.6603, + "step": 24414 + }, + { + "epoch": 0.63, + "learning_rate": 1.8373408784453473e-06, + "loss": 0.8198, + "step": 24415 + }, + { + "epoch": 0.63, + "learning_rate": 1.8373257512099055e-06, + "loss": 0.8486, + "step": 24416 + }, + { + "epoch": 0.63, + "learning_rate": 1.8373106233333617e-06, + "loss": 0.8193, + "step": 24417 + }, + { + "epoch": 0.63, + "learning_rate": 1.837295494815728e-06, + "loss": 0.7461, + "step": 24418 + }, + { + "epoch": 0.63, + "learning_rate": 1.8372803656570155e-06, + "loss": 1.1348, + "step": 24419 + }, + { + "epoch": 0.63, + "learning_rate": 1.837265235857236e-06, + "loss": 0.873, + "step": 24420 + }, + { + "epoch": 0.63, + "learning_rate": 1.837250105416401e-06, + "loss": 0.8398, + "step": 24421 + }, + { + "epoch": 0.63, + "learning_rate": 1.8372349743345219e-06, + "loss": 0.8086, + "step": 24422 + }, + { + "epoch": 0.63, + "learning_rate": 1.8372198426116109e-06, + "loss": 0.9346, + "step": 24423 + }, + { + "epoch": 0.63, + "learning_rate": 1.8372047102476787e-06, + "loss": 0.8496, + "step": 24424 + }, + { + "epoch": 0.63, + "learning_rate": 1.8371895772427376e-06, + "loss": 0.8994, + "step": 24425 + }, + { + "epoch": 0.63, + "learning_rate": 1.8371744435967988e-06, + "loss": 0.8623, + "step": 24426 + }, + { + "epoch": 0.63, + "learning_rate": 1.8371593093098744e-06, + "loss": 0.7686, + "step": 24427 + }, + { + "epoch": 0.63, + "learning_rate": 1.8371441743819751e-06, + "loss": 0.8379, + "step": 24428 + }, + { + "epoch": 0.63, + "learning_rate": 1.8371290388131131e-06, + "loss": 0.8076, + "step": 24429 + }, + { + "epoch": 0.63, + "learning_rate": 1.8371139026033e-06, + "loss": 0.8379, + "step": 24430 + }, + { + "epoch": 0.63, + "learning_rate": 1.837098765752547e-06, + "loss": 1.1357, + "step": 24431 + }, + { + "epoch": 0.63, + "learning_rate": 1.8370836282608665e-06, + "loss": 0.8306, + "step": 24432 + }, + { + "epoch": 0.63, + "learning_rate": 1.8370684901282694e-06, + "loss": 0.9199, + "step": 24433 + }, + { + "epoch": 0.63, + "learning_rate": 1.8370533513547673e-06, + "loss": 0.7065, + "step": 24434 + }, + { + "epoch": 0.63, + "learning_rate": 1.837038211940372e-06, + "loss": 1.0703, + "step": 24435 + }, + { + "epoch": 0.63, + "learning_rate": 1.8370230718850949e-06, + "loss": 0.5249, + "step": 24436 + }, + { + "epoch": 0.63, + "learning_rate": 1.8370079311889479e-06, + "loss": 0.9258, + "step": 24437 + }, + { + "epoch": 0.63, + "learning_rate": 1.8369927898519423e-06, + "loss": 0.7969, + "step": 24438 + }, + { + "epoch": 0.63, + "learning_rate": 1.83697764787409e-06, + "loss": 0.7007, + "step": 24439 + }, + { + "epoch": 0.63, + "learning_rate": 1.836962505255402e-06, + "loss": 0.9844, + "step": 24440 + }, + { + "epoch": 0.63, + "learning_rate": 1.8369473619958906e-06, + "loss": 0.8594, + "step": 24441 + }, + { + "epoch": 0.63, + "learning_rate": 1.8369322180955668e-06, + "loss": 0.9053, + "step": 24442 + }, + { + "epoch": 0.63, + "learning_rate": 1.8369170735544431e-06, + "loss": 0.9902, + "step": 24443 + }, + { + "epoch": 0.63, + "learning_rate": 1.83690192837253e-06, + "loss": 0.5806, + "step": 24444 + }, + { + "epoch": 0.63, + "learning_rate": 1.8368867825498398e-06, + "loss": 0.9307, + "step": 24445 + }, + { + "epoch": 0.63, + "learning_rate": 1.8368716360863833e-06, + "loss": 1.1504, + "step": 24446 + }, + { + "epoch": 0.63, + "learning_rate": 1.8368564889821733e-06, + "loss": 1.0879, + "step": 24447 + }, + { + "epoch": 0.63, + "learning_rate": 1.8368413412372205e-06, + "loss": 0.9316, + "step": 24448 + }, + { + "epoch": 0.63, + "learning_rate": 1.836826192851537e-06, + "loss": 1.1582, + "step": 24449 + }, + { + "epoch": 0.63, + "learning_rate": 1.836811043825134e-06, + "loss": 0.9033, + "step": 24450 + }, + { + "epoch": 0.63, + "learning_rate": 1.836795894158023e-06, + "loss": 0.6831, + "step": 24451 + }, + { + "epoch": 0.63, + "learning_rate": 1.8367807438502164e-06, + "loss": 0.8213, + "step": 24452 + }, + { + "epoch": 0.63, + "learning_rate": 1.8367655929017246e-06, + "loss": 0.8701, + "step": 24453 + }, + { + "epoch": 0.63, + "learning_rate": 1.8367504413125605e-06, + "loss": 0.8271, + "step": 24454 + }, + { + "epoch": 0.63, + "learning_rate": 1.8367352890827347e-06, + "loss": 0.9365, + "step": 24455 + }, + { + "epoch": 0.63, + "learning_rate": 1.8367201362122594e-06, + "loss": 0.9404, + "step": 24456 + }, + { + "epoch": 0.63, + "learning_rate": 1.836704982701146e-06, + "loss": 1.1289, + "step": 24457 + }, + { + "epoch": 0.63, + "learning_rate": 1.8366898285494058e-06, + "loss": 0.7646, + "step": 24458 + }, + { + "epoch": 0.63, + "learning_rate": 1.8366746737570506e-06, + "loss": 0.999, + "step": 24459 + }, + { + "epoch": 0.63, + "learning_rate": 1.8366595183240922e-06, + "loss": 0.8965, + "step": 24460 + }, + { + "epoch": 0.63, + "learning_rate": 1.836644362250542e-06, + "loss": 1.1172, + "step": 24461 + }, + { + "epoch": 0.63, + "learning_rate": 1.836629205536412e-06, + "loss": 0.8525, + "step": 24462 + }, + { + "epoch": 0.63, + "learning_rate": 1.8366140481817132e-06, + "loss": 0.9678, + "step": 24463 + }, + { + "epoch": 0.63, + "learning_rate": 1.8365988901864577e-06, + "loss": 0.6216, + "step": 24464 + }, + { + "epoch": 0.63, + "learning_rate": 1.8365837315506568e-06, + "loss": 1.0068, + "step": 24465 + }, + { + "epoch": 0.63, + "learning_rate": 1.8365685722743223e-06, + "loss": 0.7695, + "step": 24466 + }, + { + "epoch": 0.63, + "learning_rate": 1.8365534123574654e-06, + "loss": 0.9658, + "step": 24467 + }, + { + "epoch": 0.63, + "learning_rate": 1.8365382518000983e-06, + "loss": 1.1211, + "step": 24468 + }, + { + "epoch": 0.63, + "learning_rate": 1.8365230906022322e-06, + "loss": 0.9346, + "step": 24469 + }, + { + "epoch": 0.63, + "learning_rate": 1.8365079287638787e-06, + "loss": 0.998, + "step": 24470 + }, + { + "epoch": 0.63, + "learning_rate": 1.8364927662850498e-06, + "loss": 0.876, + "step": 24471 + }, + { + "epoch": 0.63, + "learning_rate": 1.8364776031657568e-06, + "loss": 0.8135, + "step": 24472 + }, + { + "epoch": 0.63, + "learning_rate": 1.8364624394060114e-06, + "loss": 0.8022, + "step": 24473 + }, + { + "epoch": 0.63, + "learning_rate": 1.836447275005825e-06, + "loss": 0.9229, + "step": 24474 + }, + { + "epoch": 0.63, + "learning_rate": 1.8364321099652095e-06, + "loss": 0.8896, + "step": 24475 + }, + { + "epoch": 0.63, + "learning_rate": 1.8364169442841763e-06, + "loss": 0.9004, + "step": 24476 + }, + { + "epoch": 0.63, + "learning_rate": 1.8364017779627371e-06, + "loss": 0.7637, + "step": 24477 + }, + { + "epoch": 0.63, + "learning_rate": 1.8363866110009037e-06, + "loss": 0.6924, + "step": 24478 + }, + { + "epoch": 0.63, + "learning_rate": 1.8363714433986874e-06, + "loss": 0.8418, + "step": 24479 + }, + { + "epoch": 0.63, + "learning_rate": 1.8363562751561e-06, + "loss": 0.8203, + "step": 24480 + }, + { + "epoch": 0.63, + "learning_rate": 1.836341106273153e-06, + "loss": 1.0342, + "step": 24481 + }, + { + "epoch": 0.63, + "learning_rate": 1.8363259367498581e-06, + "loss": 1.0283, + "step": 24482 + }, + { + "epoch": 0.63, + "learning_rate": 1.836310766586227e-06, + "loss": 0.9463, + "step": 24483 + }, + { + "epoch": 0.63, + "learning_rate": 1.836295595782271e-06, + "loss": 0.9541, + "step": 24484 + }, + { + "epoch": 0.63, + "learning_rate": 1.836280424338002e-06, + "loss": 0.6885, + "step": 24485 + }, + { + "epoch": 0.63, + "learning_rate": 1.8362652522534315e-06, + "loss": 1.1562, + "step": 24486 + }, + { + "epoch": 0.63, + "learning_rate": 1.8362500795285712e-06, + "loss": 0.8809, + "step": 24487 + }, + { + "epoch": 0.63, + "learning_rate": 1.8362349061634328e-06, + "loss": 0.7568, + "step": 24488 + }, + { + "epoch": 0.63, + "learning_rate": 1.8362197321580274e-06, + "loss": 0.5571, + "step": 24489 + }, + { + "epoch": 0.63, + "learning_rate": 1.8362045575123673e-06, + "loss": 0.8877, + "step": 24490 + }, + { + "epoch": 0.63, + "learning_rate": 1.8361893822264637e-06, + "loss": 0.7725, + "step": 24491 + }, + { + "epoch": 0.63, + "learning_rate": 1.8361742063003286e-06, + "loss": 0.8599, + "step": 24492 + }, + { + "epoch": 0.63, + "learning_rate": 1.8361590297339731e-06, + "loss": 1.0146, + "step": 24493 + }, + { + "epoch": 0.63, + "learning_rate": 1.8361438525274088e-06, + "loss": 0.9863, + "step": 24494 + }, + { + "epoch": 0.63, + "learning_rate": 1.836128674680648e-06, + "loss": 0.7666, + "step": 24495 + }, + { + "epoch": 0.63, + "learning_rate": 1.8361134961937022e-06, + "loss": 0.6621, + "step": 24496 + }, + { + "epoch": 0.63, + "learning_rate": 1.836098317066582e-06, + "loss": 0.959, + "step": 24497 + }, + { + "epoch": 0.63, + "learning_rate": 1.8360831372993002e-06, + "loss": 0.5742, + "step": 24498 + }, + { + "epoch": 0.63, + "learning_rate": 1.8360679568918682e-06, + "loss": 0.9238, + "step": 24499 + }, + { + "epoch": 0.63, + "learning_rate": 1.836052775844297e-06, + "loss": 0.9326, + "step": 24500 + }, + { + "epoch": 0.63, + "learning_rate": 1.8360375941565987e-06, + "loss": 0.7773, + "step": 24501 + }, + { + "epoch": 0.63, + "learning_rate": 1.836022411828785e-06, + "loss": 0.6582, + "step": 24502 + }, + { + "epoch": 0.63, + "learning_rate": 1.8360072288608674e-06, + "loss": 0.6377, + "step": 24503 + }, + { + "epoch": 0.63, + "learning_rate": 1.8359920452528575e-06, + "loss": 0.9482, + "step": 24504 + }, + { + "epoch": 0.63, + "learning_rate": 1.8359768610047666e-06, + "loss": 0.8037, + "step": 24505 + }, + { + "epoch": 0.63, + "learning_rate": 1.835961676116607e-06, + "loss": 0.8594, + "step": 24506 + }, + { + "epoch": 0.63, + "learning_rate": 1.83594649058839e-06, + "loss": 0.8408, + "step": 24507 + }, + { + "epoch": 0.63, + "learning_rate": 1.835931304420127e-06, + "loss": 1.0127, + "step": 24508 + }, + { + "epoch": 0.63, + "learning_rate": 1.8359161176118299e-06, + "loss": 0.9248, + "step": 24509 + }, + { + "epoch": 0.63, + "learning_rate": 1.8359009301635102e-06, + "loss": 0.8564, + "step": 24510 + }, + { + "epoch": 0.63, + "learning_rate": 1.8358857420751797e-06, + "loss": 0.7959, + "step": 24511 + }, + { + "epoch": 0.63, + "learning_rate": 1.83587055334685e-06, + "loss": 0.6982, + "step": 24512 + }, + { + "epoch": 0.63, + "learning_rate": 1.8358553639785325e-06, + "loss": 0.7842, + "step": 24513 + }, + { + "epoch": 0.63, + "learning_rate": 1.8358401739702392e-06, + "loss": 0.8789, + "step": 24514 + }, + { + "epoch": 0.63, + "learning_rate": 1.8358249833219813e-06, + "loss": 0.9678, + "step": 24515 + }, + { + "epoch": 0.63, + "learning_rate": 1.8358097920337708e-06, + "loss": 0.7842, + "step": 24516 + }, + { + "epoch": 0.63, + "learning_rate": 1.835794600105619e-06, + "loss": 0.7437, + "step": 24517 + }, + { + "epoch": 0.63, + "learning_rate": 1.835779407537538e-06, + "loss": 0.709, + "step": 24518 + }, + { + "epoch": 0.63, + "learning_rate": 1.8357642143295387e-06, + "loss": 0.6934, + "step": 24519 + }, + { + "epoch": 0.63, + "learning_rate": 1.8357490204816335e-06, + "loss": 0.7793, + "step": 24520 + }, + { + "epoch": 0.63, + "learning_rate": 1.8357338259938335e-06, + "loss": 0.7588, + "step": 24521 + }, + { + "epoch": 0.63, + "learning_rate": 1.8357186308661508e-06, + "loss": 0.877, + "step": 24522 + }, + { + "epoch": 0.63, + "learning_rate": 1.8357034350985962e-06, + "loss": 1.0264, + "step": 24523 + }, + { + "epoch": 0.63, + "learning_rate": 1.8356882386911824e-06, + "loss": 0.8457, + "step": 24524 + }, + { + "epoch": 0.63, + "learning_rate": 1.8356730416439206e-06, + "loss": 0.8784, + "step": 24525 + }, + { + "epoch": 0.63, + "learning_rate": 1.8356578439568223e-06, + "loss": 0.8711, + "step": 24526 + }, + { + "epoch": 0.63, + "learning_rate": 1.835642645629899e-06, + "loss": 0.8213, + "step": 24527 + }, + { + "epoch": 0.63, + "learning_rate": 1.8356274466631627e-06, + "loss": 1.0596, + "step": 24528 + }, + { + "epoch": 0.63, + "learning_rate": 1.835612247056625e-06, + "loss": 0.728, + "step": 24529 + }, + { + "epoch": 0.63, + "learning_rate": 1.8355970468102973e-06, + "loss": 0.7881, + "step": 24530 + }, + { + "epoch": 0.63, + "learning_rate": 1.8355818459241915e-06, + "loss": 0.6787, + "step": 24531 + }, + { + "epoch": 0.63, + "learning_rate": 1.8355666443983187e-06, + "loss": 0.7422, + "step": 24532 + }, + { + "epoch": 0.63, + "learning_rate": 1.8355514422326915e-06, + "loss": 0.8428, + "step": 24533 + }, + { + "epoch": 0.63, + "learning_rate": 1.8355362394273204e-06, + "loss": 0.7317, + "step": 24534 + }, + { + "epoch": 0.63, + "learning_rate": 1.835521035982218e-06, + "loss": 0.7075, + "step": 24535 + }, + { + "epoch": 0.63, + "learning_rate": 1.8355058318973955e-06, + "loss": 1.0566, + "step": 24536 + }, + { + "epoch": 0.63, + "learning_rate": 1.8354906271728644e-06, + "loss": 0.8281, + "step": 24537 + }, + { + "epoch": 0.63, + "learning_rate": 1.835475421808637e-06, + "loss": 0.7749, + "step": 24538 + }, + { + "epoch": 0.63, + "learning_rate": 1.8354602158047241e-06, + "loss": 0.9053, + "step": 24539 + }, + { + "epoch": 0.63, + "learning_rate": 1.835445009161138e-06, + "loss": 0.9121, + "step": 24540 + }, + { + "epoch": 0.63, + "learning_rate": 1.8354298018778898e-06, + "loss": 0.7871, + "step": 24541 + }, + { + "epoch": 0.63, + "learning_rate": 1.8354145939549915e-06, + "loss": 0.957, + "step": 24542 + }, + { + "epoch": 0.63, + "learning_rate": 1.8353993853924545e-06, + "loss": 0.9639, + "step": 24543 + }, + { + "epoch": 0.63, + "learning_rate": 1.835384176190291e-06, + "loss": 1.1055, + "step": 24544 + }, + { + "epoch": 0.63, + "learning_rate": 1.8353689663485118e-06, + "loss": 0.9082, + "step": 24545 + }, + { + "epoch": 0.63, + "learning_rate": 1.8353537558671293e-06, + "loss": 0.8564, + "step": 24546 + }, + { + "epoch": 0.63, + "learning_rate": 1.8353385447461548e-06, + "loss": 0.9785, + "step": 24547 + }, + { + "epoch": 0.63, + "learning_rate": 1.8353233329855999e-06, + "loss": 0.9648, + "step": 24548 + }, + { + "epoch": 0.63, + "learning_rate": 1.8353081205854766e-06, + "loss": 0.9229, + "step": 24549 + }, + { + "epoch": 0.63, + "learning_rate": 1.8352929075457959e-06, + "loss": 0.9873, + "step": 24550 + }, + { + "epoch": 0.63, + "learning_rate": 1.8352776938665699e-06, + "loss": 0.6741, + "step": 24551 + }, + { + "epoch": 0.63, + "learning_rate": 1.8352624795478105e-06, + "loss": 1.0361, + "step": 24552 + }, + { + "epoch": 0.63, + "learning_rate": 1.8352472645895287e-06, + "loss": 0.9434, + "step": 24553 + }, + { + "epoch": 0.63, + "learning_rate": 1.8352320489917365e-06, + "loss": 0.752, + "step": 24554 + }, + { + "epoch": 0.63, + "learning_rate": 1.8352168327544458e-06, + "loss": 0.9609, + "step": 24555 + }, + { + "epoch": 0.63, + "learning_rate": 1.8352016158776674e-06, + "loss": 0.6709, + "step": 24556 + }, + { + "epoch": 0.63, + "learning_rate": 1.8351863983614142e-06, + "loss": 0.9062, + "step": 24557 + }, + { + "epoch": 0.63, + "learning_rate": 1.8351711802056967e-06, + "loss": 0.6914, + "step": 24558 + }, + { + "epoch": 0.63, + "learning_rate": 1.8351559614105275e-06, + "loss": 0.8672, + "step": 24559 + }, + { + "epoch": 0.63, + "learning_rate": 1.8351407419759174e-06, + "loss": 0.9951, + "step": 24560 + }, + { + "epoch": 0.63, + "learning_rate": 1.8351255219018785e-06, + "loss": 0.9619, + "step": 24561 + }, + { + "epoch": 0.63, + "learning_rate": 1.8351103011884223e-06, + "loss": 0.9395, + "step": 24562 + }, + { + "epoch": 0.63, + "learning_rate": 1.8350950798355606e-06, + "loss": 1.0049, + "step": 24563 + }, + { + "epoch": 0.63, + "learning_rate": 1.835079857843305e-06, + "loss": 0.9111, + "step": 24564 + }, + { + "epoch": 0.63, + "learning_rate": 1.8350646352116671e-06, + "loss": 0.9297, + "step": 24565 + }, + { + "epoch": 0.63, + "learning_rate": 1.835049411940659e-06, + "loss": 0.9922, + "step": 24566 + }, + { + "epoch": 0.63, + "learning_rate": 1.8350341880302915e-06, + "loss": 0.6758, + "step": 24567 + }, + { + "epoch": 0.63, + "learning_rate": 1.835018963480577e-06, + "loss": 0.709, + "step": 24568 + }, + { + "epoch": 0.63, + "learning_rate": 1.8350037382915267e-06, + "loss": 1.2734, + "step": 24569 + }, + { + "epoch": 0.63, + "learning_rate": 1.8349885124631524e-06, + "loss": 0.7627, + "step": 24570 + }, + { + "epoch": 0.63, + "learning_rate": 1.8349732859954661e-06, + "loss": 0.6855, + "step": 24571 + }, + { + "epoch": 0.63, + "learning_rate": 1.8349580588884788e-06, + "loss": 0.8809, + "step": 24572 + }, + { + "epoch": 0.63, + "learning_rate": 1.8349428311422027e-06, + "loss": 0.8096, + "step": 24573 + }, + { + "epoch": 0.63, + "learning_rate": 1.834927602756649e-06, + "loss": 0.8228, + "step": 24574 + }, + { + "epoch": 0.63, + "learning_rate": 1.83491237373183e-06, + "loss": 0.7568, + "step": 24575 + }, + { + "epoch": 0.63, + "learning_rate": 1.8348971440677567e-06, + "loss": 0.915, + "step": 24576 + }, + { + "epoch": 0.63, + "learning_rate": 1.834881913764441e-06, + "loss": 0.9062, + "step": 24577 + }, + { + "epoch": 0.63, + "learning_rate": 1.8348666828218948e-06, + "loss": 0.9756, + "step": 24578 + }, + { + "epoch": 0.63, + "learning_rate": 1.8348514512401296e-06, + "loss": 0.8398, + "step": 24579 + }, + { + "epoch": 0.63, + "learning_rate": 1.8348362190191571e-06, + "loss": 0.958, + "step": 24580 + }, + { + "epoch": 0.63, + "learning_rate": 1.8348209861589888e-06, + "loss": 0.8364, + "step": 24581 + }, + { + "epoch": 0.63, + "learning_rate": 1.8348057526596365e-06, + "loss": 0.9131, + "step": 24582 + }, + { + "epoch": 0.63, + "learning_rate": 1.8347905185211117e-06, + "loss": 0.7383, + "step": 24583 + }, + { + "epoch": 0.63, + "learning_rate": 1.834775283743426e-06, + "loss": 0.5994, + "step": 24584 + }, + { + "epoch": 0.63, + "learning_rate": 1.8347600483265917e-06, + "loss": 0.999, + "step": 24585 + }, + { + "epoch": 0.63, + "learning_rate": 1.8347448122706197e-06, + "loss": 0.709, + "step": 24586 + }, + { + "epoch": 0.63, + "learning_rate": 1.834729575575522e-06, + "loss": 0.9131, + "step": 24587 + }, + { + "epoch": 0.63, + "learning_rate": 1.8347143382413105e-06, + "loss": 0.9521, + "step": 24588 + }, + { + "epoch": 0.63, + "learning_rate": 1.834699100267996e-06, + "loss": 1.0127, + "step": 24589 + }, + { + "epoch": 0.63, + "learning_rate": 1.8346838616555912e-06, + "loss": 0.5786, + "step": 24590 + }, + { + "epoch": 0.63, + "learning_rate": 1.8346686224041074e-06, + "loss": 1.0625, + "step": 24591 + }, + { + "epoch": 0.63, + "learning_rate": 1.8346533825135564e-06, + "loss": 0.7295, + "step": 24592 + }, + { + "epoch": 0.63, + "learning_rate": 1.8346381419839494e-06, + "loss": 0.9766, + "step": 24593 + }, + { + "epoch": 0.63, + "learning_rate": 1.8346229008152983e-06, + "loss": 0.5874, + "step": 24594 + }, + { + "epoch": 0.63, + "learning_rate": 1.8346076590076152e-06, + "loss": 0.917, + "step": 24595 + }, + { + "epoch": 0.63, + "learning_rate": 1.8345924165609107e-06, + "loss": 0.7759, + "step": 24596 + }, + { + "epoch": 0.63, + "learning_rate": 1.8345771734751978e-06, + "loss": 0.8711, + "step": 24597 + }, + { + "epoch": 0.63, + "learning_rate": 1.8345619297504873e-06, + "loss": 0.9023, + "step": 24598 + }, + { + "epoch": 0.63, + "learning_rate": 1.8345466853867913e-06, + "loss": 0.8853, + "step": 24599 + }, + { + "epoch": 0.63, + "learning_rate": 1.834531440384121e-06, + "loss": 0.7725, + "step": 24600 + }, + { + "epoch": 0.63, + "learning_rate": 1.8345161947424886e-06, + "loss": 0.5884, + "step": 24601 + }, + { + "epoch": 0.63, + "learning_rate": 1.834500948461905e-06, + "loss": 0.9824, + "step": 24602 + }, + { + "epoch": 0.63, + "learning_rate": 1.8344857015423828e-06, + "loss": 0.835, + "step": 24603 + }, + { + "epoch": 0.63, + "learning_rate": 1.8344704539839332e-06, + "loss": 0.7456, + "step": 24604 + }, + { + "epoch": 0.63, + "learning_rate": 1.8344552057865681e-06, + "loss": 0.8701, + "step": 24605 + }, + { + "epoch": 0.63, + "learning_rate": 1.8344399569502988e-06, + "loss": 0.7661, + "step": 24606 + }, + { + "epoch": 0.63, + "learning_rate": 1.8344247074751373e-06, + "loss": 0.7549, + "step": 24607 + }, + { + "epoch": 0.63, + "learning_rate": 1.834409457361095e-06, + "loss": 1.0137, + "step": 24608 + }, + { + "epoch": 0.63, + "learning_rate": 1.8343942066081842e-06, + "loss": 0.9658, + "step": 24609 + }, + { + "epoch": 0.63, + "learning_rate": 1.8343789552164158e-06, + "loss": 0.7319, + "step": 24610 + }, + { + "epoch": 0.63, + "learning_rate": 1.8343637031858017e-06, + "loss": 0.8623, + "step": 24611 + }, + { + "epoch": 0.63, + "learning_rate": 1.8343484505163538e-06, + "loss": 0.6284, + "step": 24612 + }, + { + "epoch": 0.63, + "learning_rate": 1.8343331972080836e-06, + "loss": 0.7847, + "step": 24613 + }, + { + "epoch": 0.63, + "learning_rate": 1.834317943261003e-06, + "loss": 0.9961, + "step": 24614 + }, + { + "epoch": 0.63, + "learning_rate": 1.8343026886751233e-06, + "loss": 0.7734, + "step": 24615 + }, + { + "epoch": 0.63, + "learning_rate": 1.8342874334504566e-06, + "loss": 0.8799, + "step": 24616 + }, + { + "epoch": 0.63, + "learning_rate": 1.8342721775870143e-06, + "loss": 0.8516, + "step": 24617 + }, + { + "epoch": 0.63, + "learning_rate": 1.834256921084808e-06, + "loss": 0.9688, + "step": 24618 + }, + { + "epoch": 0.63, + "learning_rate": 1.8342416639438496e-06, + "loss": 0.9395, + "step": 24619 + }, + { + "epoch": 0.63, + "learning_rate": 1.8342264061641508e-06, + "loss": 0.915, + "step": 24620 + }, + { + "epoch": 0.63, + "learning_rate": 1.8342111477457234e-06, + "loss": 0.5981, + "step": 24621 + }, + { + "epoch": 0.63, + "learning_rate": 1.8341958886885783e-06, + "loss": 0.8174, + "step": 24622 + }, + { + "epoch": 0.63, + "learning_rate": 1.8341806289927283e-06, + "loss": 0.9189, + "step": 24623 + }, + { + "epoch": 0.63, + "learning_rate": 1.8341653686581843e-06, + "loss": 0.8921, + "step": 24624 + }, + { + "epoch": 0.63, + "learning_rate": 1.8341501076849584e-06, + "loss": 0.8462, + "step": 24625 + }, + { + "epoch": 0.63, + "learning_rate": 1.8341348460730618e-06, + "loss": 0.8613, + "step": 24626 + }, + { + "epoch": 0.63, + "learning_rate": 1.834119583822507e-06, + "loss": 0.6748, + "step": 24627 + }, + { + "epoch": 0.63, + "learning_rate": 1.8341043209333049e-06, + "loss": 0.8926, + "step": 24628 + }, + { + "epoch": 0.63, + "learning_rate": 1.8340890574054674e-06, + "loss": 0.958, + "step": 24629 + }, + { + "epoch": 0.63, + "learning_rate": 1.8340737932390065e-06, + "loss": 0.8521, + "step": 24630 + }, + { + "epoch": 0.63, + "learning_rate": 1.8340585284339333e-06, + "loss": 1.0137, + "step": 24631 + }, + { + "epoch": 0.63, + "learning_rate": 1.83404326299026e-06, + "loss": 0.8057, + "step": 24632 + }, + { + "epoch": 0.63, + "learning_rate": 1.8340279969079982e-06, + "loss": 1.0244, + "step": 24633 + }, + { + "epoch": 0.63, + "learning_rate": 1.8340127301871595e-06, + "loss": 0.8232, + "step": 24634 + }, + { + "epoch": 0.63, + "learning_rate": 1.8339974628277558e-06, + "loss": 1.0371, + "step": 24635 + }, + { + "epoch": 0.63, + "learning_rate": 1.8339821948297983e-06, + "loss": 0.7197, + "step": 24636 + }, + { + "epoch": 0.63, + "learning_rate": 1.833966926193299e-06, + "loss": 0.873, + "step": 24637 + }, + { + "epoch": 0.63, + "learning_rate": 1.8339516569182694e-06, + "loss": 1.0132, + "step": 24638 + }, + { + "epoch": 0.63, + "learning_rate": 1.8339363870047215e-06, + "loss": 0.7944, + "step": 24639 + }, + { + "epoch": 0.63, + "learning_rate": 1.8339211164526672e-06, + "loss": 0.9512, + "step": 24640 + }, + { + "epoch": 0.63, + "learning_rate": 1.8339058452621174e-06, + "loss": 0.8301, + "step": 24641 + }, + { + "epoch": 0.63, + "learning_rate": 1.8338905734330845e-06, + "loss": 0.73, + "step": 24642 + }, + { + "epoch": 0.63, + "learning_rate": 1.8338753009655798e-06, + "loss": 0.7197, + "step": 24643 + }, + { + "epoch": 0.63, + "learning_rate": 1.8338600278596153e-06, + "loss": 0.7412, + "step": 24644 + }, + { + "epoch": 0.63, + "learning_rate": 1.8338447541152023e-06, + "loss": 0.8525, + "step": 24645 + }, + { + "epoch": 0.63, + "learning_rate": 1.8338294797323528e-06, + "loss": 0.7686, + "step": 24646 + }, + { + "epoch": 0.63, + "learning_rate": 1.8338142047110784e-06, + "loss": 0.8311, + "step": 24647 + }, + { + "epoch": 0.63, + "learning_rate": 1.833798929051391e-06, + "loss": 0.8379, + "step": 24648 + }, + { + "epoch": 0.63, + "learning_rate": 1.8337836527533017e-06, + "loss": 0.9756, + "step": 24649 + }, + { + "epoch": 0.63, + "learning_rate": 1.833768375816823e-06, + "loss": 0.9668, + "step": 24650 + }, + { + "epoch": 0.63, + "learning_rate": 1.8337530982419658e-06, + "loss": 0.8291, + "step": 24651 + }, + { + "epoch": 0.63, + "learning_rate": 1.8337378200287423e-06, + "loss": 0.9824, + "step": 24652 + }, + { + "epoch": 0.63, + "learning_rate": 1.8337225411771642e-06, + "loss": 0.7754, + "step": 24653 + }, + { + "epoch": 0.63, + "learning_rate": 1.8337072616872432e-06, + "loss": 0.8076, + "step": 24654 + }, + { + "epoch": 0.63, + "learning_rate": 1.8336919815589909e-06, + "loss": 0.9453, + "step": 24655 + }, + { + "epoch": 0.63, + "learning_rate": 1.8336767007924187e-06, + "loss": 0.8481, + "step": 24656 + }, + { + "epoch": 0.63, + "learning_rate": 1.8336614193875386e-06, + "loss": 0.7891, + "step": 24657 + }, + { + "epoch": 0.63, + "learning_rate": 1.8336461373443624e-06, + "loss": 0.8154, + "step": 24658 + }, + { + "epoch": 0.63, + "learning_rate": 1.8336308546629016e-06, + "loss": 0.7427, + "step": 24659 + }, + { + "epoch": 0.63, + "learning_rate": 1.8336155713431682e-06, + "loss": 0.8416, + "step": 24660 + }, + { + "epoch": 0.63, + "learning_rate": 1.8336002873851734e-06, + "loss": 0.9814, + "step": 24661 + }, + { + "epoch": 0.63, + "learning_rate": 1.8335850027889294e-06, + "loss": 0.7168, + "step": 24662 + }, + { + "epoch": 0.63, + "learning_rate": 1.8335697175544477e-06, + "loss": 0.9854, + "step": 24663 + }, + { + "epoch": 0.63, + "learning_rate": 1.8335544316817399e-06, + "loss": 0.7979, + "step": 24664 + }, + { + "epoch": 0.63, + "learning_rate": 1.833539145170818e-06, + "loss": 0.9688, + "step": 24665 + }, + { + "epoch": 0.63, + "learning_rate": 1.8335238580216932e-06, + "loss": 0.8193, + "step": 24666 + }, + { + "epoch": 0.63, + "learning_rate": 1.8335085702343775e-06, + "loss": 1.0049, + "step": 24667 + }, + { + "epoch": 0.63, + "learning_rate": 1.833493281808883e-06, + "loss": 0.9219, + "step": 24668 + }, + { + "epoch": 0.63, + "learning_rate": 1.833477992745221e-06, + "loss": 0.8174, + "step": 24669 + }, + { + "epoch": 0.63, + "learning_rate": 1.8334627030434028e-06, + "loss": 0.6846, + "step": 24670 + }, + { + "epoch": 0.63, + "learning_rate": 1.8334474127034407e-06, + "loss": 1.0156, + "step": 24671 + }, + { + "epoch": 0.63, + "learning_rate": 1.8334321217253463e-06, + "loss": 0.8965, + "step": 24672 + }, + { + "epoch": 0.63, + "learning_rate": 1.8334168301091313e-06, + "loss": 0.8975, + "step": 24673 + }, + { + "epoch": 0.63, + "learning_rate": 1.833401537854807e-06, + "loss": 0.9258, + "step": 24674 + }, + { + "epoch": 0.63, + "learning_rate": 1.8333862449623859e-06, + "loss": 0.7939, + "step": 24675 + }, + { + "epoch": 0.63, + "learning_rate": 1.833370951431879e-06, + "loss": 0.7954, + "step": 24676 + }, + { + "epoch": 0.63, + "learning_rate": 1.8333556572632984e-06, + "loss": 0.9482, + "step": 24677 + }, + { + "epoch": 0.63, + "learning_rate": 1.8333403624566558e-06, + "loss": 0.8652, + "step": 24678 + }, + { + "epoch": 0.63, + "learning_rate": 1.8333250670119627e-06, + "loss": 0.8193, + "step": 24679 + }, + { + "epoch": 0.63, + "learning_rate": 1.8333097709292309e-06, + "loss": 0.9863, + "step": 24680 + }, + { + "epoch": 0.63, + "learning_rate": 1.833294474208472e-06, + "loss": 0.5255, + "step": 24681 + }, + { + "epoch": 0.63, + "learning_rate": 1.833279176849698e-06, + "loss": 0.8965, + "step": 24682 + }, + { + "epoch": 0.63, + "learning_rate": 1.8332638788529204e-06, + "loss": 0.9746, + "step": 24683 + }, + { + "epoch": 0.63, + "learning_rate": 1.833248580218151e-06, + "loss": 0.7339, + "step": 24684 + }, + { + "epoch": 0.63, + "learning_rate": 1.8332332809454013e-06, + "loss": 0.9824, + "step": 24685 + }, + { + "epoch": 0.63, + "learning_rate": 1.8332179810346834e-06, + "loss": 1.0459, + "step": 24686 + }, + { + "epoch": 0.63, + "learning_rate": 1.8332026804860087e-06, + "loss": 0.7632, + "step": 24687 + }, + { + "epoch": 0.63, + "learning_rate": 1.8331873792993892e-06, + "loss": 0.5436, + "step": 24688 + }, + { + "epoch": 0.63, + "learning_rate": 1.8331720774748362e-06, + "loss": 0.8477, + "step": 24689 + }, + { + "epoch": 0.63, + "learning_rate": 1.833156775012362e-06, + "loss": 0.7949, + "step": 24690 + }, + { + "epoch": 0.63, + "learning_rate": 1.8331414719119776e-06, + "loss": 0.6436, + "step": 24691 + }, + { + "epoch": 0.63, + "learning_rate": 1.8331261681736955e-06, + "loss": 0.7739, + "step": 24692 + }, + { + "epoch": 0.63, + "learning_rate": 1.8331108637975264e-06, + "loss": 0.7827, + "step": 24693 + }, + { + "epoch": 0.63, + "learning_rate": 1.8330955587834829e-06, + "loss": 0.8135, + "step": 24694 + }, + { + "epoch": 0.63, + "learning_rate": 1.8330802531315765e-06, + "loss": 0.6802, + "step": 24695 + }, + { + "epoch": 0.63, + "learning_rate": 1.8330649468418188e-06, + "loss": 0.834, + "step": 24696 + }, + { + "epoch": 0.63, + "learning_rate": 1.8330496399142215e-06, + "loss": 0.7778, + "step": 24697 + }, + { + "epoch": 0.63, + "learning_rate": 1.8330343323487964e-06, + "loss": 0.9277, + "step": 24698 + }, + { + "epoch": 0.63, + "learning_rate": 1.8330190241455555e-06, + "loss": 0.8105, + "step": 24699 + }, + { + "epoch": 0.63, + "learning_rate": 1.83300371530451e-06, + "loss": 1.0176, + "step": 24700 + }, + { + "epoch": 0.63, + "learning_rate": 1.8329884058256719e-06, + "loss": 0.8604, + "step": 24701 + }, + { + "epoch": 0.63, + "learning_rate": 1.832973095709053e-06, + "loss": 0.9253, + "step": 24702 + }, + { + "epoch": 0.63, + "learning_rate": 1.8329577849546646e-06, + "loss": 0.5271, + "step": 24703 + }, + { + "epoch": 0.63, + "learning_rate": 1.8329424735625189e-06, + "loss": 1.2119, + "step": 24704 + }, + { + "epoch": 0.63, + "learning_rate": 1.8329271615326275e-06, + "loss": 0.7109, + "step": 24705 + }, + { + "epoch": 0.63, + "learning_rate": 1.832911848865002e-06, + "loss": 0.9609, + "step": 24706 + }, + { + "epoch": 0.63, + "learning_rate": 1.8328965355596542e-06, + "loss": 1.1348, + "step": 24707 + }, + { + "epoch": 0.63, + "learning_rate": 1.832881221616596e-06, + "loss": 0.7244, + "step": 24708 + }, + { + "epoch": 0.63, + "learning_rate": 1.8328659070358388e-06, + "loss": 0.7793, + "step": 24709 + }, + { + "epoch": 0.63, + "learning_rate": 1.8328505918173943e-06, + "loss": 0.9014, + "step": 24710 + }, + { + "epoch": 0.63, + "learning_rate": 1.8328352759612744e-06, + "loss": 1.2148, + "step": 24711 + }, + { + "epoch": 0.63, + "learning_rate": 1.8328199594674912e-06, + "loss": 0.9434, + "step": 24712 + }, + { + "epoch": 0.63, + "learning_rate": 1.8328046423360556e-06, + "loss": 1.0039, + "step": 24713 + }, + { + "epoch": 0.63, + "learning_rate": 1.83278932456698e-06, + "loss": 1.1074, + "step": 24714 + }, + { + "epoch": 0.63, + "learning_rate": 1.8327740061602762e-06, + "loss": 0.5813, + "step": 24715 + }, + { + "epoch": 0.63, + "learning_rate": 1.8327586871159552e-06, + "loss": 0.8018, + "step": 24716 + }, + { + "epoch": 0.63, + "learning_rate": 1.8327433674340293e-06, + "loss": 0.6177, + "step": 24717 + }, + { + "epoch": 0.63, + "learning_rate": 1.8327280471145102e-06, + "loss": 0.999, + "step": 24718 + }, + { + "epoch": 0.63, + "learning_rate": 1.8327127261574093e-06, + "loss": 0.7197, + "step": 24719 + }, + { + "epoch": 0.63, + "learning_rate": 1.8326974045627388e-06, + "loss": 0.5278, + "step": 24720 + }, + { + "epoch": 0.63, + "learning_rate": 1.83268208233051e-06, + "loss": 0.999, + "step": 24721 + }, + { + "epoch": 0.63, + "learning_rate": 1.8326667594607347e-06, + "loss": 0.8818, + "step": 24722 + }, + { + "epoch": 0.63, + "learning_rate": 1.8326514359534251e-06, + "loss": 0.873, + "step": 24723 + }, + { + "epoch": 0.63, + "learning_rate": 1.8326361118085925e-06, + "loss": 0.9746, + "step": 24724 + }, + { + "epoch": 0.63, + "learning_rate": 1.8326207870262484e-06, + "loss": 0.8789, + "step": 24725 + }, + { + "epoch": 0.63, + "learning_rate": 1.8326054616064051e-06, + "loss": 0.6001, + "step": 24726 + }, + { + "epoch": 0.63, + "learning_rate": 1.8325901355490742e-06, + "loss": 0.8022, + "step": 24727 + }, + { + "epoch": 0.63, + "learning_rate": 1.8325748088542672e-06, + "loss": 0.8408, + "step": 24728 + }, + { + "epoch": 0.63, + "learning_rate": 1.8325594815219958e-06, + "loss": 0.9736, + "step": 24729 + }, + { + "epoch": 0.63, + "learning_rate": 1.832544153552272e-06, + "loss": 1.0352, + "step": 24730 + }, + { + "epoch": 0.63, + "learning_rate": 1.8325288249451077e-06, + "loss": 1.0215, + "step": 24731 + }, + { + "epoch": 0.63, + "learning_rate": 1.832513495700514e-06, + "loss": 0.9502, + "step": 24732 + }, + { + "epoch": 0.63, + "learning_rate": 1.832498165818503e-06, + "loss": 0.4979, + "step": 24733 + }, + { + "epoch": 0.63, + "learning_rate": 1.8324828352990866e-06, + "loss": 1.1084, + "step": 24734 + }, + { + "epoch": 0.63, + "learning_rate": 1.8324675041422764e-06, + "loss": 0.8687, + "step": 24735 + }, + { + "epoch": 0.63, + "learning_rate": 1.832452172348084e-06, + "loss": 0.9473, + "step": 24736 + }, + { + "epoch": 0.63, + "learning_rate": 1.8324368399165211e-06, + "loss": 0.8711, + "step": 24737 + }, + { + "epoch": 0.63, + "learning_rate": 1.8324215068476e-06, + "loss": 0.8164, + "step": 24738 + }, + { + "epoch": 0.63, + "learning_rate": 1.8324061731413315e-06, + "loss": 1.0146, + "step": 24739 + }, + { + "epoch": 0.63, + "learning_rate": 1.8323908387977283e-06, + "loss": 0.9014, + "step": 24740 + }, + { + "epoch": 0.63, + "learning_rate": 1.8323755038168015e-06, + "loss": 0.8301, + "step": 24741 + }, + { + "epoch": 0.63, + "learning_rate": 1.832360168198563e-06, + "loss": 1.1113, + "step": 24742 + }, + { + "epoch": 0.63, + "learning_rate": 1.8323448319430248e-06, + "loss": 0.9492, + "step": 24743 + }, + { + "epoch": 0.63, + "learning_rate": 1.832329495050198e-06, + "loss": 0.8062, + "step": 24744 + }, + { + "epoch": 0.63, + "learning_rate": 1.8323141575200954e-06, + "loss": 1.0332, + "step": 24745 + }, + { + "epoch": 0.63, + "learning_rate": 1.8322988193527279e-06, + "loss": 0.8374, + "step": 24746 + }, + { + "epoch": 0.63, + "learning_rate": 1.8322834805481074e-06, + "loss": 1.0146, + "step": 24747 + }, + { + "epoch": 0.63, + "learning_rate": 1.8322681411062456e-06, + "loss": 0.678, + "step": 24748 + }, + { + "epoch": 0.63, + "learning_rate": 1.8322528010271546e-06, + "loss": 0.9219, + "step": 24749 + }, + { + "epoch": 0.63, + "learning_rate": 1.8322374603108458e-06, + "loss": 0.8496, + "step": 24750 + }, + { + "epoch": 0.63, + "learning_rate": 1.8322221189573308e-06, + "loss": 0.6663, + "step": 24751 + }, + { + "epoch": 0.63, + "learning_rate": 1.832206776966622e-06, + "loss": 0.8525, + "step": 24752 + }, + { + "epoch": 0.63, + "learning_rate": 1.8321914343387304e-06, + "loss": 0.7393, + "step": 24753 + }, + { + "epoch": 0.63, + "learning_rate": 1.8321760910736681e-06, + "loss": 0.9785, + "step": 24754 + }, + { + "epoch": 0.63, + "learning_rate": 1.832160747171447e-06, + "loss": 0.9072, + "step": 24755 + }, + { + "epoch": 0.63, + "learning_rate": 1.8321454026320786e-06, + "loss": 0.9502, + "step": 24756 + }, + { + "epoch": 0.63, + "learning_rate": 1.8321300574555746e-06, + "loss": 0.718, + "step": 24757 + }, + { + "epoch": 0.63, + "learning_rate": 1.8321147116419473e-06, + "loss": 0.8574, + "step": 24758 + }, + { + "epoch": 0.63, + "learning_rate": 1.8320993651912079e-06, + "loss": 0.8906, + "step": 24759 + }, + { + "epoch": 0.63, + "learning_rate": 1.832084018103368e-06, + "loss": 0.6675, + "step": 24760 + }, + { + "epoch": 0.63, + "learning_rate": 1.8320686703784396e-06, + "loss": 0.9639, + "step": 24761 + }, + { + "epoch": 0.63, + "learning_rate": 1.8320533220164346e-06, + "loss": 0.7661, + "step": 24762 + }, + { + "epoch": 0.63, + "learning_rate": 1.8320379730173648e-06, + "loss": 0.9873, + "step": 24763 + }, + { + "epoch": 0.63, + "learning_rate": 1.8320226233812417e-06, + "loss": 0.8877, + "step": 24764 + }, + { + "epoch": 0.63, + "learning_rate": 1.832007273108077e-06, + "loss": 0.6638, + "step": 24765 + }, + { + "epoch": 0.63, + "learning_rate": 1.8319919221978827e-06, + "loss": 0.8574, + "step": 24766 + }, + { + "epoch": 0.63, + "learning_rate": 1.8319765706506703e-06, + "loss": 0.9189, + "step": 24767 + }, + { + "epoch": 0.63, + "learning_rate": 1.8319612184664516e-06, + "loss": 0.9277, + "step": 24768 + }, + { + "epoch": 0.63, + "learning_rate": 1.8319458656452388e-06, + "loss": 0.8887, + "step": 24769 + }, + { + "epoch": 0.63, + "learning_rate": 1.8319305121870432e-06, + "loss": 0.7153, + "step": 24770 + }, + { + "epoch": 0.63, + "learning_rate": 1.8319151580918767e-06, + "loss": 0.6699, + "step": 24771 + }, + { + "epoch": 0.63, + "learning_rate": 1.831899803359751e-06, + "loss": 0.7148, + "step": 24772 + }, + { + "epoch": 0.63, + "learning_rate": 1.8318844479906779e-06, + "loss": 0.9023, + "step": 24773 + }, + { + "epoch": 0.63, + "learning_rate": 1.8318690919846688e-06, + "loss": 0.6768, + "step": 24774 + }, + { + "epoch": 0.63, + "learning_rate": 1.831853735341736e-06, + "loss": 0.7954, + "step": 24775 + }, + { + "epoch": 0.64, + "learning_rate": 1.831838378061891e-06, + "loss": 1.0459, + "step": 24776 + }, + { + "epoch": 0.64, + "learning_rate": 1.831823020145146e-06, + "loss": 0.9395, + "step": 24777 + }, + { + "epoch": 0.64, + "learning_rate": 1.8318076615915118e-06, + "loss": 0.644, + "step": 24778 + }, + { + "epoch": 0.64, + "learning_rate": 1.831792302401001e-06, + "loss": 0.7637, + "step": 24779 + }, + { + "epoch": 0.64, + "learning_rate": 1.8317769425736249e-06, + "loss": 0.9541, + "step": 24780 + }, + { + "epoch": 0.64, + "learning_rate": 1.8317615821093957e-06, + "loss": 0.6021, + "step": 24781 + }, + { + "epoch": 0.64, + "learning_rate": 1.8317462210083247e-06, + "loss": 0.9092, + "step": 24782 + }, + { + "epoch": 0.64, + "learning_rate": 1.831730859270424e-06, + "loss": 1.0137, + "step": 24783 + }, + { + "epoch": 0.64, + "learning_rate": 1.8317154968957054e-06, + "loss": 0.8789, + "step": 24784 + }, + { + "epoch": 0.64, + "learning_rate": 1.8317001338841801e-06, + "loss": 0.9111, + "step": 24785 + }, + { + "epoch": 0.64, + "learning_rate": 1.8316847702358603e-06, + "loss": 0.7637, + "step": 24786 + }, + { + "epoch": 0.64, + "learning_rate": 1.8316694059507581e-06, + "loss": 0.936, + "step": 24787 + }, + { + "epoch": 0.64, + "learning_rate": 1.8316540410288845e-06, + "loss": 0.709, + "step": 24788 + }, + { + "epoch": 0.64, + "learning_rate": 1.8316386754702515e-06, + "loss": 0.8137, + "step": 24789 + }, + { + "epoch": 0.64, + "learning_rate": 1.8316233092748714e-06, + "loss": 0.958, + "step": 24790 + }, + { + "epoch": 0.64, + "learning_rate": 1.8316079424427553e-06, + "loss": 0.8555, + "step": 24791 + }, + { + "epoch": 0.64, + "learning_rate": 1.8315925749739154e-06, + "loss": 0.998, + "step": 24792 + }, + { + "epoch": 0.64, + "learning_rate": 1.8315772068683632e-06, + "loss": 0.9023, + "step": 24793 + }, + { + "epoch": 0.64, + "learning_rate": 1.8315618381261107e-06, + "loss": 0.9585, + "step": 24794 + }, + { + "epoch": 0.64, + "learning_rate": 1.8315464687471694e-06, + "loss": 1.0166, + "step": 24795 + }, + { + "epoch": 0.64, + "learning_rate": 1.8315310987315513e-06, + "loss": 0.491, + "step": 24796 + }, + { + "epoch": 0.64, + "learning_rate": 1.831515728079268e-06, + "loss": 0.916, + "step": 24797 + }, + { + "epoch": 0.64, + "learning_rate": 1.8315003567903315e-06, + "loss": 0.8164, + "step": 24798 + }, + { + "epoch": 0.64, + "learning_rate": 1.8314849848647534e-06, + "loss": 1.0322, + "step": 24799 + }, + { + "epoch": 0.64, + "learning_rate": 1.8314696123025452e-06, + "loss": 0.6526, + "step": 24800 + }, + { + "epoch": 0.64, + "learning_rate": 1.831454239103719e-06, + "loss": 0.6172, + "step": 24801 + }, + { + "epoch": 0.64, + "learning_rate": 1.8314388652682867e-06, + "loss": 0.6885, + "step": 24802 + }, + { + "epoch": 0.64, + "learning_rate": 1.8314234907962597e-06, + "loss": 0.73, + "step": 24803 + }, + { + "epoch": 0.64, + "learning_rate": 1.8314081156876502e-06, + "loss": 0.9131, + "step": 24804 + }, + { + "epoch": 0.64, + "learning_rate": 1.8313927399424696e-06, + "loss": 0.7183, + "step": 24805 + }, + { + "epoch": 0.64, + "learning_rate": 1.83137736356073e-06, + "loss": 1.0713, + "step": 24806 + }, + { + "epoch": 0.64, + "learning_rate": 1.8313619865424428e-06, + "loss": 0.918, + "step": 24807 + }, + { + "epoch": 0.64, + "learning_rate": 1.83134660888762e-06, + "loss": 0.916, + "step": 24808 + }, + { + "epoch": 0.64, + "learning_rate": 1.8313312305962732e-06, + "loss": 0.9043, + "step": 24809 + }, + { + "epoch": 0.64, + "learning_rate": 1.8313158516684144e-06, + "loss": 0.8867, + "step": 24810 + }, + { + "epoch": 0.64, + "learning_rate": 1.8313004721040552e-06, + "loss": 0.9961, + "step": 24811 + }, + { + "epoch": 0.64, + "learning_rate": 1.8312850919032075e-06, + "loss": 0.9346, + "step": 24812 + }, + { + "epoch": 0.64, + "learning_rate": 1.8312697110658831e-06, + "loss": 0.7012, + "step": 24813 + }, + { + "epoch": 0.64, + "learning_rate": 1.8312543295920938e-06, + "loss": 1.0352, + "step": 24814 + }, + { + "epoch": 0.64, + "learning_rate": 1.831238947481851e-06, + "loss": 1.2207, + "step": 24815 + }, + { + "epoch": 0.64, + "learning_rate": 1.831223564735167e-06, + "loss": 0.9297, + "step": 24816 + }, + { + "epoch": 0.64, + "learning_rate": 1.831208181352053e-06, + "loss": 0.7246, + "step": 24817 + }, + { + "epoch": 0.64, + "learning_rate": 1.8311927973325214e-06, + "loss": 0.9175, + "step": 24818 + }, + { + "epoch": 0.64, + "learning_rate": 1.8311774126765838e-06, + "loss": 0.8457, + "step": 24819 + }, + { + "epoch": 0.64, + "learning_rate": 1.8311620273842516e-06, + "loss": 0.562, + "step": 24820 + }, + { + "epoch": 0.64, + "learning_rate": 1.8311466414555369e-06, + "loss": 0.8887, + "step": 24821 + }, + { + "epoch": 0.64, + "learning_rate": 1.8311312548904519e-06, + "loss": 0.9336, + "step": 24822 + }, + { + "epoch": 0.64, + "learning_rate": 1.8311158676890073e-06, + "loss": 0.9043, + "step": 24823 + }, + { + "epoch": 0.64, + "learning_rate": 1.8311004798512157e-06, + "loss": 0.9004, + "step": 24824 + }, + { + "epoch": 0.64, + "learning_rate": 1.8310850913770889e-06, + "loss": 0.9834, + "step": 24825 + }, + { + "epoch": 0.64, + "learning_rate": 1.8310697022666378e-06, + "loss": 0.9941, + "step": 24826 + }, + { + "epoch": 0.64, + "learning_rate": 1.8310543125198756e-06, + "loss": 0.7744, + "step": 24827 + }, + { + "epoch": 0.64, + "learning_rate": 1.831038922136813e-06, + "loss": 0.8398, + "step": 24828 + }, + { + "epoch": 0.64, + "learning_rate": 1.8310235311174621e-06, + "loss": 0.9873, + "step": 24829 + }, + { + "epoch": 0.64, + "learning_rate": 1.8310081394618349e-06, + "loss": 0.8867, + "step": 24830 + }, + { + "epoch": 0.64, + "learning_rate": 1.8309927471699427e-06, + "loss": 0.6353, + "step": 24831 + }, + { + "epoch": 0.64, + "learning_rate": 1.8309773542417978e-06, + "loss": 0.8916, + "step": 24832 + }, + { + "epoch": 0.64, + "learning_rate": 1.8309619606774116e-06, + "loss": 0.8228, + "step": 24833 + }, + { + "epoch": 0.64, + "learning_rate": 1.830946566476796e-06, + "loss": 0.8457, + "step": 24834 + }, + { + "epoch": 0.64, + "learning_rate": 1.8309311716399626e-06, + "loss": 1.1934, + "step": 24835 + }, + { + "epoch": 0.64, + "learning_rate": 1.830915776166924e-06, + "loss": 0.8789, + "step": 24836 + }, + { + "epoch": 0.64, + "learning_rate": 1.830900380057691e-06, + "loss": 0.8955, + "step": 24837 + }, + { + "epoch": 0.64, + "learning_rate": 1.8308849833122756e-06, + "loss": 0.9492, + "step": 24838 + }, + { + "epoch": 0.64, + "learning_rate": 1.8308695859306904e-06, + "loss": 0.6826, + "step": 24839 + }, + { + "epoch": 0.64, + "learning_rate": 1.830854187912946e-06, + "loss": 1.0273, + "step": 24840 + }, + { + "epoch": 0.64, + "learning_rate": 1.830838789259055e-06, + "loss": 0.9961, + "step": 24841 + }, + { + "epoch": 0.64, + "learning_rate": 1.8308233899690291e-06, + "loss": 1.041, + "step": 24842 + }, + { + "epoch": 0.64, + "learning_rate": 1.8308079900428796e-06, + "loss": 0.8018, + "step": 24843 + }, + { + "epoch": 0.64, + "learning_rate": 1.8307925894806186e-06, + "loss": 0.834, + "step": 24844 + }, + { + "epoch": 0.64, + "learning_rate": 1.8307771882822582e-06, + "loss": 0.7666, + "step": 24845 + }, + { + "epoch": 0.64, + "learning_rate": 1.8307617864478098e-06, + "loss": 0.8169, + "step": 24846 + }, + { + "epoch": 0.64, + "learning_rate": 1.8307463839772853e-06, + "loss": 0.833, + "step": 24847 + }, + { + "epoch": 0.64, + "learning_rate": 1.8307309808706966e-06, + "loss": 1.0068, + "step": 24848 + }, + { + "epoch": 0.64, + "learning_rate": 1.830715577128055e-06, + "loss": 0.5728, + "step": 24849 + }, + { + "epoch": 0.64, + "learning_rate": 1.8307001727493731e-06, + "loss": 0.8418, + "step": 24850 + }, + { + "epoch": 0.64, + "learning_rate": 1.8306847677346622e-06, + "loss": 0.957, + "step": 24851 + }, + { + "epoch": 0.64, + "learning_rate": 1.830669362083934e-06, + "loss": 0.9873, + "step": 24852 + }, + { + "epoch": 0.64, + "learning_rate": 1.8306539557972006e-06, + "loss": 0.9365, + "step": 24853 + }, + { + "epoch": 0.64, + "learning_rate": 1.8306385488744736e-06, + "loss": 0.7925, + "step": 24854 + }, + { + "epoch": 0.64, + "learning_rate": 1.8306231413157649e-06, + "loss": 0.6875, + "step": 24855 + }, + { + "epoch": 0.64, + "learning_rate": 1.830607733121086e-06, + "loss": 0.9688, + "step": 24856 + }, + { + "epoch": 0.64, + "learning_rate": 1.8305923242904493e-06, + "loss": 0.8311, + "step": 24857 + }, + { + "epoch": 0.64, + "learning_rate": 1.8305769148238662e-06, + "loss": 0.8438, + "step": 24858 + }, + { + "epoch": 0.64, + "learning_rate": 1.8305615047213483e-06, + "loss": 0.8301, + "step": 24859 + }, + { + "epoch": 0.64, + "learning_rate": 1.8305460939829075e-06, + "loss": 0.9473, + "step": 24860 + }, + { + "epoch": 0.64, + "learning_rate": 1.8305306826085563e-06, + "loss": 0.8682, + "step": 24861 + }, + { + "epoch": 0.64, + "learning_rate": 1.8305152705983055e-06, + "loss": 0.6018, + "step": 24862 + }, + { + "epoch": 0.64, + "learning_rate": 1.8304998579521678e-06, + "loss": 0.9277, + "step": 24863 + }, + { + "epoch": 0.64, + "learning_rate": 1.8304844446701542e-06, + "loss": 0.9541, + "step": 24864 + }, + { + "epoch": 0.64, + "learning_rate": 1.830469030752277e-06, + "loss": 0.791, + "step": 24865 + }, + { + "epoch": 0.64, + "learning_rate": 1.8304536161985477e-06, + "loss": 0.729, + "step": 24866 + }, + { + "epoch": 0.64, + "learning_rate": 1.8304382010089782e-06, + "loss": 0.9873, + "step": 24867 + }, + { + "epoch": 0.64, + "learning_rate": 1.8304227851835807e-06, + "loss": 0.5605, + "step": 24868 + }, + { + "epoch": 0.64, + "learning_rate": 1.8304073687223666e-06, + "loss": 0.9248, + "step": 24869 + }, + { + "epoch": 0.64, + "learning_rate": 1.8303919516253475e-06, + "loss": 0.5918, + "step": 24870 + }, + { + "epoch": 0.64, + "learning_rate": 1.8303765338925357e-06, + "loss": 0.7197, + "step": 24871 + }, + { + "epoch": 0.64, + "learning_rate": 1.8303611155239428e-06, + "loss": 0.7744, + "step": 24872 + }, + { + "epoch": 0.64, + "learning_rate": 1.83034569651958e-06, + "loss": 0.6045, + "step": 24873 + }, + { + "epoch": 0.64, + "learning_rate": 1.8303302768794601e-06, + "loss": 0.8906, + "step": 24874 + }, + { + "epoch": 0.64, + "learning_rate": 1.8303148566035946e-06, + "loss": 0.9688, + "step": 24875 + }, + { + "epoch": 0.64, + "learning_rate": 1.830299435691995e-06, + "loss": 0.835, + "step": 24876 + }, + { + "epoch": 0.64, + "learning_rate": 1.8302840141446735e-06, + "loss": 0.9766, + "step": 24877 + }, + { + "epoch": 0.64, + "learning_rate": 1.8302685919616415e-06, + "loss": 0.9805, + "step": 24878 + }, + { + "epoch": 0.64, + "learning_rate": 1.8302531691429111e-06, + "loss": 0.873, + "step": 24879 + }, + { + "epoch": 0.64, + "learning_rate": 1.830237745688494e-06, + "loss": 0.8506, + "step": 24880 + }, + { + "epoch": 0.64, + "learning_rate": 1.8302223215984021e-06, + "loss": 0.9082, + "step": 24881 + }, + { + "epoch": 0.64, + "learning_rate": 1.8302068968726471e-06, + "loss": 0.7949, + "step": 24882 + }, + { + "epoch": 0.64, + "learning_rate": 1.8301914715112407e-06, + "loss": 0.8306, + "step": 24883 + }, + { + "epoch": 0.64, + "learning_rate": 1.8301760455141953e-06, + "loss": 0.5898, + "step": 24884 + }, + { + "epoch": 0.64, + "learning_rate": 1.830160618881522e-06, + "loss": 0.6821, + "step": 24885 + }, + { + "epoch": 0.64, + "learning_rate": 1.8301451916132326e-06, + "loss": 0.6733, + "step": 24886 + }, + { + "epoch": 0.64, + "learning_rate": 1.8301297637093396e-06, + "loss": 0.6862, + "step": 24887 + }, + { + "epoch": 0.64, + "learning_rate": 1.8301143351698545e-06, + "loss": 0.6182, + "step": 24888 + }, + { + "epoch": 0.64, + "learning_rate": 1.8300989059947887e-06, + "loss": 0.7832, + "step": 24889 + }, + { + "epoch": 0.64, + "learning_rate": 1.8300834761841543e-06, + "loss": 0.8384, + "step": 24890 + }, + { + "epoch": 0.64, + "learning_rate": 1.8300680457379634e-06, + "loss": 0.7959, + "step": 24891 + }, + { + "epoch": 0.64, + "learning_rate": 1.8300526146562275e-06, + "loss": 0.9492, + "step": 24892 + }, + { + "epoch": 0.64, + "learning_rate": 1.8300371829389585e-06, + "loss": 0.8442, + "step": 24893 + }, + { + "epoch": 0.64, + "learning_rate": 1.8300217505861682e-06, + "loss": 0.8022, + "step": 24894 + }, + { + "epoch": 0.64, + "learning_rate": 1.8300063175978685e-06, + "loss": 0.9268, + "step": 24895 + }, + { + "epoch": 0.64, + "learning_rate": 1.8299908839740706e-06, + "loss": 0.6934, + "step": 24896 + }, + { + "epoch": 0.64, + "learning_rate": 1.8299754497147872e-06, + "loss": 0.8564, + "step": 24897 + }, + { + "epoch": 0.64, + "learning_rate": 1.8299600148200298e-06, + "loss": 0.7896, + "step": 24898 + }, + { + "epoch": 0.64, + "learning_rate": 1.8299445792898103e-06, + "loss": 0.8486, + "step": 24899 + }, + { + "epoch": 0.64, + "learning_rate": 1.8299291431241403e-06, + "loss": 0.8564, + "step": 24900 + }, + { + "epoch": 0.64, + "learning_rate": 1.8299137063230317e-06, + "loss": 0.8447, + "step": 24901 + }, + { + "epoch": 0.64, + "learning_rate": 1.8298982688864961e-06, + "loss": 0.749, + "step": 24902 + }, + { + "epoch": 0.64, + "learning_rate": 1.829882830814546e-06, + "loss": 1.0449, + "step": 24903 + }, + { + "epoch": 0.64, + "learning_rate": 1.8298673921071926e-06, + "loss": 0.8369, + "step": 24904 + }, + { + "epoch": 0.64, + "learning_rate": 1.829851952764448e-06, + "loss": 0.8604, + "step": 24905 + }, + { + "epoch": 0.64, + "learning_rate": 1.8298365127863233e-06, + "loss": 0.8379, + "step": 24906 + }, + { + "epoch": 0.64, + "learning_rate": 1.8298210721728316e-06, + "loss": 0.8672, + "step": 24907 + }, + { + "epoch": 0.64, + "learning_rate": 1.8298056309239837e-06, + "loss": 0.7041, + "step": 24908 + }, + { + "epoch": 0.64, + "learning_rate": 1.829790189039792e-06, + "loss": 0.7441, + "step": 24909 + }, + { + "epoch": 0.64, + "learning_rate": 1.8297747465202683e-06, + "loss": 0.9053, + "step": 24910 + }, + { + "epoch": 0.64, + "learning_rate": 1.8297593033654239e-06, + "loss": 1.085, + "step": 24911 + }, + { + "epoch": 0.64, + "learning_rate": 1.829743859575271e-06, + "loss": 0.9355, + "step": 24912 + }, + { + "epoch": 0.64, + "learning_rate": 1.8297284151498214e-06, + "loss": 0.9268, + "step": 24913 + }, + { + "epoch": 0.64, + "learning_rate": 1.829712970089087e-06, + "loss": 0.835, + "step": 24914 + }, + { + "epoch": 0.64, + "learning_rate": 1.8296975243930791e-06, + "loss": 0.998, + "step": 24915 + }, + { + "epoch": 0.64, + "learning_rate": 1.8296820780618106e-06, + "loss": 0.8066, + "step": 24916 + }, + { + "epoch": 0.64, + "learning_rate": 1.8296666310952925e-06, + "loss": 0.7886, + "step": 24917 + }, + { + "epoch": 0.64, + "learning_rate": 1.8296511834935363e-06, + "loss": 0.7603, + "step": 24918 + }, + { + "epoch": 0.64, + "learning_rate": 1.8296357352565548e-06, + "loss": 0.9492, + "step": 24919 + }, + { + "epoch": 0.64, + "learning_rate": 1.8296202863843595e-06, + "loss": 0.9844, + "step": 24920 + }, + { + "epoch": 0.64, + "learning_rate": 1.8296048368769616e-06, + "loss": 0.8379, + "step": 24921 + }, + { + "epoch": 0.64, + "learning_rate": 1.8295893867343738e-06, + "loss": 0.8154, + "step": 24922 + }, + { + "epoch": 0.64, + "learning_rate": 1.8295739359566075e-06, + "loss": 0.8262, + "step": 24923 + }, + { + "epoch": 0.64, + "learning_rate": 1.8295584845436744e-06, + "loss": 0.7637, + "step": 24924 + }, + { + "epoch": 0.64, + "learning_rate": 1.8295430324955867e-06, + "loss": 0.7314, + "step": 24925 + }, + { + "epoch": 0.64, + "learning_rate": 1.8295275798123563e-06, + "loss": 0.7529, + "step": 24926 + }, + { + "epoch": 0.64, + "learning_rate": 1.8295121264939942e-06, + "loss": 0.9082, + "step": 24927 + }, + { + "epoch": 0.64, + "learning_rate": 1.8294966725405131e-06, + "loss": 1.0029, + "step": 24928 + }, + { + "epoch": 0.64, + "learning_rate": 1.8294812179519248e-06, + "loss": 1.1426, + "step": 24929 + }, + { + "epoch": 0.64, + "learning_rate": 1.8294657627282403e-06, + "loss": 1.0635, + "step": 24930 + }, + { + "epoch": 0.64, + "learning_rate": 1.8294503068694725e-06, + "loss": 0.9688, + "step": 24931 + }, + { + "epoch": 0.64, + "learning_rate": 1.8294348503756324e-06, + "loss": 0.9502, + "step": 24932 + }, + { + "epoch": 0.64, + "learning_rate": 1.8294193932467324e-06, + "loss": 0.874, + "step": 24933 + }, + { + "epoch": 0.64, + "learning_rate": 1.8294039354827842e-06, + "loss": 0.9004, + "step": 24934 + }, + { + "epoch": 0.64, + "learning_rate": 1.8293884770837993e-06, + "loss": 0.8408, + "step": 24935 + }, + { + "epoch": 0.64, + "learning_rate": 1.8293730180497896e-06, + "loss": 1.0117, + "step": 24936 + }, + { + "epoch": 0.64, + "learning_rate": 1.8293575583807676e-06, + "loss": 0.7588, + "step": 24937 + }, + { + "epoch": 0.64, + "learning_rate": 1.8293420980767444e-06, + "loss": 0.7937, + "step": 24938 + }, + { + "epoch": 0.64, + "learning_rate": 1.829326637137732e-06, + "loss": 0.8184, + "step": 24939 + }, + { + "epoch": 0.64, + "learning_rate": 1.8293111755637426e-06, + "loss": 0.874, + "step": 24940 + }, + { + "epoch": 0.64, + "learning_rate": 1.8292957133547876e-06, + "loss": 0.9834, + "step": 24941 + }, + { + "epoch": 0.64, + "learning_rate": 1.829280250510879e-06, + "loss": 0.8398, + "step": 24942 + }, + { + "epoch": 0.64, + "learning_rate": 1.8292647870320285e-06, + "loss": 1.0488, + "step": 24943 + }, + { + "epoch": 0.64, + "learning_rate": 1.8292493229182485e-06, + "loss": 0.7363, + "step": 24944 + }, + { + "epoch": 0.64, + "learning_rate": 1.82923385816955e-06, + "loss": 0.9717, + "step": 24945 + }, + { + "epoch": 0.64, + "learning_rate": 1.8292183927859452e-06, + "loss": 0.8921, + "step": 24946 + }, + { + "epoch": 0.64, + "learning_rate": 1.8292029267674462e-06, + "loss": 0.8008, + "step": 24947 + }, + { + "epoch": 0.64, + "learning_rate": 1.8291874601140647e-06, + "loss": 0.7617, + "step": 24948 + }, + { + "epoch": 0.64, + "learning_rate": 1.8291719928258125e-06, + "loss": 0.9482, + "step": 24949 + }, + { + "epoch": 0.64, + "learning_rate": 1.8291565249027015e-06, + "loss": 0.7871, + "step": 24950 + }, + { + "epoch": 0.64, + "learning_rate": 1.8291410563447433e-06, + "loss": 0.8232, + "step": 24951 + }, + { + "epoch": 0.64, + "learning_rate": 1.82912558715195e-06, + "loss": 0.8164, + "step": 24952 + }, + { + "epoch": 0.64, + "learning_rate": 1.8291101173243333e-06, + "loss": 0.9971, + "step": 24953 + }, + { + "epoch": 0.64, + "learning_rate": 1.8290946468619052e-06, + "loss": 0.9531, + "step": 24954 + }, + { + "epoch": 0.64, + "learning_rate": 1.8290791757646774e-06, + "loss": 1.0869, + "step": 24955 + }, + { + "epoch": 0.64, + "learning_rate": 1.8290637040326618e-06, + "loss": 0.8438, + "step": 24956 + }, + { + "epoch": 0.64, + "learning_rate": 1.82904823166587e-06, + "loss": 0.7822, + "step": 24957 + }, + { + "epoch": 0.64, + "learning_rate": 1.8290327586643146e-06, + "loss": 0.605, + "step": 24958 + }, + { + "epoch": 0.64, + "learning_rate": 1.8290172850280066e-06, + "loss": 0.9443, + "step": 24959 + }, + { + "epoch": 0.64, + "learning_rate": 1.8290018107569582e-06, + "loss": 0.8022, + "step": 24960 + }, + { + "epoch": 0.64, + "learning_rate": 1.8289863358511814e-06, + "loss": 0.9023, + "step": 24961 + }, + { + "epoch": 0.64, + "learning_rate": 1.8289708603106876e-06, + "loss": 0.8047, + "step": 24962 + }, + { + "epoch": 0.64, + "learning_rate": 1.8289553841354892e-06, + "loss": 0.8574, + "step": 24963 + }, + { + "epoch": 0.64, + "learning_rate": 1.8289399073255978e-06, + "loss": 1.1006, + "step": 24964 + }, + { + "epoch": 0.64, + "learning_rate": 1.828924429881025e-06, + "loss": 0.7832, + "step": 24965 + }, + { + "epoch": 0.64, + "learning_rate": 1.828908951801783e-06, + "loss": 0.666, + "step": 24966 + }, + { + "epoch": 0.64, + "learning_rate": 1.8288934730878834e-06, + "loss": 0.71, + "step": 24967 + }, + { + "epoch": 0.64, + "learning_rate": 1.828877993739338e-06, + "loss": 0.8604, + "step": 24968 + }, + { + "epoch": 0.64, + "learning_rate": 1.8288625137561593e-06, + "loss": 0.8379, + "step": 24969 + }, + { + "epoch": 0.64, + "learning_rate": 1.8288470331383586e-06, + "loss": 0.7603, + "step": 24970 + }, + { + "epoch": 0.64, + "learning_rate": 1.8288315518859477e-06, + "loss": 0.8525, + "step": 24971 + }, + { + "epoch": 0.64, + "learning_rate": 1.8288160699989387e-06, + "loss": 0.9707, + "step": 24972 + }, + { + "epoch": 0.64, + "learning_rate": 1.8288005874773434e-06, + "loss": 1.0586, + "step": 24973 + }, + { + "epoch": 0.64, + "learning_rate": 1.8287851043211732e-06, + "loss": 0.8237, + "step": 24974 + }, + { + "epoch": 0.64, + "learning_rate": 1.828769620530441e-06, + "loss": 0.9951, + "step": 24975 + }, + { + "epoch": 0.64, + "learning_rate": 1.8287541361051575e-06, + "loss": 0.9824, + "step": 24976 + }, + { + "epoch": 0.64, + "learning_rate": 1.8287386510453354e-06, + "loss": 0.8613, + "step": 24977 + }, + { + "epoch": 0.64, + "learning_rate": 1.8287231653509857e-06, + "loss": 0.8789, + "step": 24978 + }, + { + "epoch": 0.64, + "learning_rate": 1.8287076790221213e-06, + "loss": 0.7793, + "step": 24979 + }, + { + "epoch": 0.64, + "learning_rate": 1.8286921920587532e-06, + "loss": 0.9277, + "step": 24980 + }, + { + "epoch": 0.64, + "learning_rate": 1.8286767044608937e-06, + "loss": 1.0166, + "step": 24981 + }, + { + "epoch": 0.64, + "learning_rate": 1.8286612162285548e-06, + "loss": 1.0381, + "step": 24982 + }, + { + "epoch": 0.64, + "learning_rate": 1.8286457273617478e-06, + "loss": 0.8379, + "step": 24983 + }, + { + "epoch": 0.64, + "learning_rate": 1.828630237860485e-06, + "loss": 0.9775, + "step": 24984 + }, + { + "epoch": 0.64, + "learning_rate": 1.828614747724778e-06, + "loss": 0.7275, + "step": 24985 + }, + { + "epoch": 0.64, + "learning_rate": 1.828599256954639e-06, + "loss": 0.748, + "step": 24986 + }, + { + "epoch": 0.64, + "learning_rate": 1.8285837655500793e-06, + "loss": 0.8281, + "step": 24987 + }, + { + "epoch": 0.64, + "learning_rate": 1.8285682735111117e-06, + "loss": 0.8975, + "step": 24988 + }, + { + "epoch": 0.64, + "learning_rate": 1.828552780837747e-06, + "loss": 0.8608, + "step": 24989 + }, + { + "epoch": 0.64, + "learning_rate": 1.8285372875299976e-06, + "loss": 0.9238, + "step": 24990 + }, + { + "epoch": 0.64, + "learning_rate": 1.828521793587875e-06, + "loss": 0.6577, + "step": 24991 + }, + { + "epoch": 0.64, + "learning_rate": 1.828506299011392e-06, + "loss": 0.8174, + "step": 24992 + }, + { + "epoch": 0.64, + "learning_rate": 1.8284908038005596e-06, + "loss": 0.7734, + "step": 24993 + }, + { + "epoch": 0.64, + "learning_rate": 1.8284753079553897e-06, + "loss": 0.9209, + "step": 24994 + }, + { + "epoch": 0.64, + "learning_rate": 1.8284598114758944e-06, + "loss": 1.0742, + "step": 24995 + }, + { + "epoch": 0.64, + "learning_rate": 1.8284443143620858e-06, + "loss": 0.9111, + "step": 24996 + }, + { + "epoch": 0.64, + "learning_rate": 1.8284288166139753e-06, + "loss": 0.731, + "step": 24997 + }, + { + "epoch": 0.64, + "learning_rate": 1.8284133182315745e-06, + "loss": 0.8394, + "step": 24998 + }, + { + "epoch": 0.64, + "learning_rate": 1.8283978192148962e-06, + "loss": 0.9048, + "step": 24999 + }, + { + "epoch": 0.64, + "learning_rate": 1.8283823195639518e-06, + "loss": 0.7412, + "step": 25000 + }, + { + "epoch": 0.64, + "learning_rate": 1.8283668192787532e-06, + "loss": 0.8442, + "step": 25001 + }, + { + "epoch": 0.64, + "learning_rate": 1.828351318359312e-06, + "loss": 0.8604, + "step": 25002 + }, + { + "epoch": 0.64, + "learning_rate": 1.8283358168056404e-06, + "loss": 0.792, + "step": 25003 + }, + { + "epoch": 0.64, + "learning_rate": 1.8283203146177502e-06, + "loss": 1.0547, + "step": 25004 + }, + { + "epoch": 0.64, + "learning_rate": 1.828304811795653e-06, + "loss": 0.8408, + "step": 25005 + }, + { + "epoch": 0.64, + "learning_rate": 1.8282893083393609e-06, + "loss": 0.9756, + "step": 25006 + }, + { + "epoch": 0.64, + "learning_rate": 1.8282738042488858e-06, + "loss": 0.96, + "step": 25007 + }, + { + "epoch": 0.64, + "learning_rate": 1.8282582995242397e-06, + "loss": 0.7148, + "step": 25008 + }, + { + "epoch": 0.64, + "learning_rate": 1.8282427941654344e-06, + "loss": 0.9424, + "step": 25009 + }, + { + "epoch": 0.64, + "learning_rate": 1.8282272881724813e-06, + "loss": 1.1211, + "step": 25010 + }, + { + "epoch": 0.64, + "learning_rate": 1.8282117815453929e-06, + "loss": 0.6592, + "step": 25011 + }, + { + "epoch": 0.64, + "learning_rate": 1.8281962742841808e-06, + "loss": 0.604, + "step": 25012 + }, + { + "epoch": 0.64, + "learning_rate": 1.828180766388857e-06, + "loss": 0.7178, + "step": 25013 + }, + { + "epoch": 0.64, + "learning_rate": 1.828165257859433e-06, + "loss": 0.7065, + "step": 25014 + }, + { + "epoch": 0.64, + "learning_rate": 1.828149748695921e-06, + "loss": 1.0059, + "step": 25015 + }, + { + "epoch": 0.64, + "learning_rate": 1.8281342388983329e-06, + "loss": 0.894, + "step": 25016 + }, + { + "epoch": 0.64, + "learning_rate": 1.8281187284666805e-06, + "loss": 0.8428, + "step": 25017 + }, + { + "epoch": 0.64, + "learning_rate": 1.8281032174009757e-06, + "loss": 0.9844, + "step": 25018 + }, + { + "epoch": 0.64, + "learning_rate": 1.8280877057012303e-06, + "loss": 0.7969, + "step": 25019 + }, + { + "epoch": 0.64, + "learning_rate": 1.8280721933674562e-06, + "loss": 0.8242, + "step": 25020 + }, + { + "epoch": 0.64, + "learning_rate": 1.8280566803996652e-06, + "loss": 0.8564, + "step": 25021 + }, + { + "epoch": 0.64, + "learning_rate": 1.8280411667978694e-06, + "loss": 0.7524, + "step": 25022 + }, + { + "epoch": 0.64, + "learning_rate": 1.8280256525620805e-06, + "loss": 0.9854, + "step": 25023 + }, + { + "epoch": 0.64, + "learning_rate": 1.8280101376923105e-06, + "loss": 0.7378, + "step": 25024 + }, + { + "epoch": 0.64, + "learning_rate": 1.8279946221885712e-06, + "loss": 0.7466, + "step": 25025 + }, + { + "epoch": 0.64, + "learning_rate": 1.8279791060508744e-06, + "loss": 0.8809, + "step": 25026 + }, + { + "epoch": 0.64, + "learning_rate": 1.8279635892792323e-06, + "loss": 0.6763, + "step": 25027 + }, + { + "epoch": 0.64, + "learning_rate": 1.8279480718736564e-06, + "loss": 1.0645, + "step": 25028 + }, + { + "epoch": 0.64, + "learning_rate": 1.8279325538341586e-06, + "loss": 0.7749, + "step": 25029 + }, + { + "epoch": 0.64, + "learning_rate": 1.827917035160751e-06, + "loss": 0.9775, + "step": 25030 + }, + { + "epoch": 0.64, + "learning_rate": 1.8279015158534454e-06, + "loss": 0.8203, + "step": 25031 + }, + { + "epoch": 0.64, + "learning_rate": 1.8278859959122537e-06, + "loss": 1.0107, + "step": 25032 + }, + { + "epoch": 0.64, + "learning_rate": 1.8278704753371876e-06, + "loss": 0.8857, + "step": 25033 + }, + { + "epoch": 0.64, + "learning_rate": 1.8278549541282596e-06, + "loss": 0.9443, + "step": 25034 + }, + { + "epoch": 0.64, + "learning_rate": 1.8278394322854806e-06, + "loss": 0.8945, + "step": 25035 + }, + { + "epoch": 0.64, + "learning_rate": 1.8278239098088632e-06, + "loss": 0.8086, + "step": 25036 + }, + { + "epoch": 0.64, + "learning_rate": 1.8278083866984194e-06, + "loss": 0.9131, + "step": 25037 + }, + { + "epoch": 0.64, + "learning_rate": 1.8277928629541606e-06, + "loss": 0.7827, + "step": 25038 + }, + { + "epoch": 0.64, + "learning_rate": 1.8277773385760987e-06, + "loss": 1.0449, + "step": 25039 + }, + { + "epoch": 0.64, + "learning_rate": 1.8277618135642459e-06, + "loss": 0.855, + "step": 25040 + }, + { + "epoch": 0.64, + "learning_rate": 1.8277462879186136e-06, + "loss": 0.9814, + "step": 25041 + }, + { + "epoch": 0.64, + "learning_rate": 1.8277307616392147e-06, + "loss": 0.8037, + "step": 25042 + }, + { + "epoch": 0.64, + "learning_rate": 1.8277152347260598e-06, + "loss": 0.9336, + "step": 25043 + }, + { + "epoch": 0.64, + "learning_rate": 1.8276997071791619e-06, + "loss": 1.1338, + "step": 25044 + }, + { + "epoch": 0.64, + "learning_rate": 1.8276841789985319e-06, + "loss": 0.8838, + "step": 25045 + }, + { + "epoch": 0.64, + "learning_rate": 1.8276686501841825e-06, + "loss": 0.7451, + "step": 25046 + }, + { + "epoch": 0.64, + "learning_rate": 1.827653120736125e-06, + "loss": 0.9297, + "step": 25047 + }, + { + "epoch": 0.64, + "learning_rate": 1.8276375906543718e-06, + "loss": 0.9375, + "step": 25048 + }, + { + "epoch": 0.64, + "learning_rate": 1.8276220599389345e-06, + "loss": 0.9414, + "step": 25049 + }, + { + "epoch": 0.64, + "learning_rate": 1.827606528589825e-06, + "loss": 0.7441, + "step": 25050 + }, + { + "epoch": 0.64, + "learning_rate": 1.8275909966070552e-06, + "loss": 0.6797, + "step": 25051 + }, + { + "epoch": 0.64, + "learning_rate": 1.8275754639906373e-06, + "loss": 0.8447, + "step": 25052 + }, + { + "epoch": 0.64, + "learning_rate": 1.8275599307405827e-06, + "loss": 0.9404, + "step": 25053 + }, + { + "epoch": 0.64, + "learning_rate": 1.8275443968569034e-06, + "loss": 0.7319, + "step": 25054 + }, + { + "epoch": 0.64, + "learning_rate": 1.8275288623396117e-06, + "loss": 1.002, + "step": 25055 + }, + { + "epoch": 0.64, + "learning_rate": 1.8275133271887188e-06, + "loss": 0.8403, + "step": 25056 + }, + { + "epoch": 0.64, + "learning_rate": 1.8274977914042374e-06, + "loss": 0.6787, + "step": 25057 + }, + { + "epoch": 0.64, + "learning_rate": 1.8274822549861787e-06, + "loss": 0.8027, + "step": 25058 + }, + { + "epoch": 0.64, + "learning_rate": 1.8274667179345551e-06, + "loss": 0.8613, + "step": 25059 + }, + { + "epoch": 0.64, + "learning_rate": 1.8274511802493782e-06, + "loss": 0.7886, + "step": 25060 + }, + { + "epoch": 0.64, + "learning_rate": 1.82743564193066e-06, + "loss": 1.0459, + "step": 25061 + }, + { + "epoch": 0.64, + "learning_rate": 1.8274201029784124e-06, + "loss": 0.8931, + "step": 25062 + }, + { + "epoch": 0.64, + "learning_rate": 1.8274045633926472e-06, + "loss": 0.7886, + "step": 25063 + }, + { + "epoch": 0.64, + "learning_rate": 1.8273890231733762e-06, + "loss": 0.729, + "step": 25064 + }, + { + "epoch": 0.64, + "learning_rate": 1.8273734823206117e-06, + "loss": 0.8906, + "step": 25065 + }, + { + "epoch": 0.64, + "learning_rate": 1.8273579408343655e-06, + "loss": 0.9277, + "step": 25066 + }, + { + "epoch": 0.64, + "learning_rate": 1.827342398714649e-06, + "loss": 0.8057, + "step": 25067 + }, + { + "epoch": 0.64, + "learning_rate": 1.8273268559614747e-06, + "loss": 1.0186, + "step": 25068 + }, + { + "epoch": 0.64, + "learning_rate": 1.8273113125748542e-06, + "loss": 0.8276, + "step": 25069 + }, + { + "epoch": 0.64, + "learning_rate": 1.8272957685547996e-06, + "loss": 0.7734, + "step": 25070 + }, + { + "epoch": 0.64, + "learning_rate": 1.8272802239013227e-06, + "loss": 0.792, + "step": 25071 + }, + { + "epoch": 0.64, + "learning_rate": 1.8272646786144352e-06, + "loss": 0.7505, + "step": 25072 + }, + { + "epoch": 0.64, + "learning_rate": 1.827249132694149e-06, + "loss": 0.6992, + "step": 25073 + }, + { + "epoch": 0.64, + "learning_rate": 1.8272335861404765e-06, + "loss": 1.0068, + "step": 25074 + }, + { + "epoch": 0.64, + "learning_rate": 1.827218038953429e-06, + "loss": 0.6348, + "step": 25075 + }, + { + "epoch": 0.64, + "learning_rate": 1.8272024911330192e-06, + "loss": 0.9805, + "step": 25076 + }, + { + "epoch": 0.64, + "learning_rate": 1.827186942679258e-06, + "loss": 0.6914, + "step": 25077 + }, + { + "epoch": 0.64, + "learning_rate": 1.827171393592158e-06, + "loss": 0.7119, + "step": 25078 + }, + { + "epoch": 0.64, + "learning_rate": 1.827155843871731e-06, + "loss": 0.9102, + "step": 25079 + }, + { + "epoch": 0.64, + "learning_rate": 1.8271402935179884e-06, + "loss": 0.9395, + "step": 25080 + }, + { + "epoch": 0.64, + "learning_rate": 1.827124742530943e-06, + "loss": 0.8398, + "step": 25081 + }, + { + "epoch": 0.64, + "learning_rate": 1.8271091909106059e-06, + "loss": 0.7617, + "step": 25082 + }, + { + "epoch": 0.64, + "learning_rate": 1.8270936386569893e-06, + "loss": 0.7783, + "step": 25083 + }, + { + "epoch": 0.64, + "learning_rate": 1.8270780857701053e-06, + "loss": 0.9629, + "step": 25084 + }, + { + "epoch": 0.64, + "learning_rate": 1.8270625322499654e-06, + "loss": 1.0293, + "step": 25085 + }, + { + "epoch": 0.64, + "learning_rate": 1.827046978096582e-06, + "loss": 0.7822, + "step": 25086 + }, + { + "epoch": 0.64, + "learning_rate": 1.8270314233099666e-06, + "loss": 0.7852, + "step": 25087 + }, + { + "epoch": 0.64, + "learning_rate": 1.8270158678901316e-06, + "loss": 0.7837, + "step": 25088 + }, + { + "epoch": 0.64, + "learning_rate": 1.827000311837088e-06, + "loss": 0.9951, + "step": 25089 + }, + { + "epoch": 0.64, + "learning_rate": 1.8269847551508488e-06, + "loss": 0.8906, + "step": 25090 + }, + { + "epoch": 0.64, + "learning_rate": 1.826969197831425e-06, + "loss": 0.7109, + "step": 25091 + }, + { + "epoch": 0.64, + "learning_rate": 1.8269536398788292e-06, + "loss": 0.9912, + "step": 25092 + }, + { + "epoch": 0.64, + "learning_rate": 1.826938081293073e-06, + "loss": 0.7534, + "step": 25093 + }, + { + "epoch": 0.64, + "learning_rate": 1.8269225220741683e-06, + "loss": 1.1621, + "step": 25094 + }, + { + "epoch": 0.64, + "learning_rate": 1.8269069622221269e-06, + "loss": 0.8374, + "step": 25095 + }, + { + "epoch": 0.64, + "learning_rate": 1.8268914017369613e-06, + "loss": 0.9121, + "step": 25096 + }, + { + "epoch": 0.64, + "learning_rate": 1.8268758406186825e-06, + "loss": 0.9365, + "step": 25097 + }, + { + "epoch": 0.64, + "learning_rate": 1.8268602788673028e-06, + "loss": 0.9106, + "step": 25098 + }, + { + "epoch": 0.64, + "learning_rate": 1.8268447164828346e-06, + "loss": 0.7051, + "step": 25099 + }, + { + "epoch": 0.64, + "learning_rate": 1.8268291534652894e-06, + "loss": 0.7852, + "step": 25100 + }, + { + "epoch": 0.64, + "learning_rate": 1.826813589814679e-06, + "loss": 0.873, + "step": 25101 + }, + { + "epoch": 0.64, + "learning_rate": 1.8267980255310153e-06, + "loss": 0.7363, + "step": 25102 + }, + { + "epoch": 0.64, + "learning_rate": 1.8267824606143106e-06, + "loss": 0.6475, + "step": 25103 + }, + { + "epoch": 0.64, + "learning_rate": 1.8267668950645764e-06, + "loss": 0.8652, + "step": 25104 + }, + { + "epoch": 0.64, + "learning_rate": 1.8267513288818251e-06, + "loss": 0.6851, + "step": 25105 + }, + { + "epoch": 0.64, + "learning_rate": 1.826735762066068e-06, + "loss": 0.9141, + "step": 25106 + }, + { + "epoch": 0.64, + "learning_rate": 1.8267201946173174e-06, + "loss": 0.7236, + "step": 25107 + }, + { + "epoch": 0.64, + "learning_rate": 1.8267046265355854e-06, + "loss": 0.7061, + "step": 25108 + }, + { + "epoch": 0.64, + "learning_rate": 1.8266890578208836e-06, + "loss": 0.9033, + "step": 25109 + }, + { + "epoch": 0.64, + "learning_rate": 1.8266734884732237e-06, + "loss": 0.7871, + "step": 25110 + }, + { + "epoch": 0.64, + "learning_rate": 1.8266579184926183e-06, + "loss": 0.8359, + "step": 25111 + }, + { + "epoch": 0.64, + "learning_rate": 1.8266423478790787e-06, + "loss": 0.8398, + "step": 25112 + }, + { + "epoch": 0.64, + "learning_rate": 1.8266267766326173e-06, + "loss": 0.9092, + "step": 25113 + }, + { + "epoch": 0.64, + "learning_rate": 1.8266112047532456e-06, + "loss": 0.6592, + "step": 25114 + }, + { + "epoch": 0.64, + "learning_rate": 1.8265956322409756e-06, + "loss": 0.8623, + "step": 25115 + }, + { + "epoch": 0.64, + "learning_rate": 1.8265800590958195e-06, + "loss": 0.7686, + "step": 25116 + }, + { + "epoch": 0.64, + "learning_rate": 1.826564485317789e-06, + "loss": 0.8486, + "step": 25117 + }, + { + "epoch": 0.64, + "learning_rate": 1.8265489109068963e-06, + "loss": 0.7246, + "step": 25118 + }, + { + "epoch": 0.64, + "learning_rate": 1.8265333358631527e-06, + "loss": 0.8213, + "step": 25119 + }, + { + "epoch": 0.64, + "learning_rate": 1.826517760186571e-06, + "loss": 0.8604, + "step": 25120 + }, + { + "epoch": 0.64, + "learning_rate": 1.8265021838771623e-06, + "loss": 0.8965, + "step": 25121 + }, + { + "epoch": 0.64, + "learning_rate": 1.826486606934939e-06, + "loss": 0.7163, + "step": 25122 + }, + { + "epoch": 0.64, + "learning_rate": 1.8264710293599128e-06, + "loss": 0.7715, + "step": 25123 + }, + { + "epoch": 0.64, + "learning_rate": 1.8264554511520959e-06, + "loss": 0.7861, + "step": 25124 + }, + { + "epoch": 0.64, + "learning_rate": 1.8264398723115e-06, + "loss": 0.8057, + "step": 25125 + }, + { + "epoch": 0.64, + "learning_rate": 1.826424292838137e-06, + "loss": 0.7021, + "step": 25126 + }, + { + "epoch": 0.64, + "learning_rate": 1.8264087127320188e-06, + "loss": 0.9512, + "step": 25127 + }, + { + "epoch": 0.64, + "learning_rate": 1.8263931319931577e-06, + "loss": 0.9424, + "step": 25128 + }, + { + "epoch": 0.64, + "learning_rate": 1.8263775506215656e-06, + "loss": 0.8721, + "step": 25129 + }, + { + "epoch": 0.64, + "learning_rate": 1.8263619686172538e-06, + "loss": 0.7554, + "step": 25130 + }, + { + "epoch": 0.64, + "learning_rate": 1.8263463859802348e-06, + "loss": 0.7061, + "step": 25131 + }, + { + "epoch": 0.64, + "learning_rate": 1.8263308027105202e-06, + "loss": 0.8389, + "step": 25132 + }, + { + "epoch": 0.64, + "learning_rate": 1.8263152188081223e-06, + "loss": 1.0342, + "step": 25133 + }, + { + "epoch": 0.64, + "learning_rate": 1.8262996342730529e-06, + "loss": 0.8105, + "step": 25134 + }, + { + "epoch": 0.64, + "learning_rate": 1.8262840491053235e-06, + "loss": 1.002, + "step": 25135 + }, + { + "epoch": 0.64, + "learning_rate": 1.8262684633049467e-06, + "loss": 0.9414, + "step": 25136 + }, + { + "epoch": 0.64, + "learning_rate": 1.8262528768719342e-06, + "loss": 0.9678, + "step": 25137 + }, + { + "epoch": 0.64, + "learning_rate": 1.8262372898062977e-06, + "loss": 0.8926, + "step": 25138 + }, + { + "epoch": 0.64, + "learning_rate": 1.8262217021080494e-06, + "loss": 0.8232, + "step": 25139 + }, + { + "epoch": 0.64, + "learning_rate": 1.8262061137772008e-06, + "loss": 0.7871, + "step": 25140 + }, + { + "epoch": 0.64, + "learning_rate": 1.8261905248137646e-06, + "loss": 0.8877, + "step": 25141 + }, + { + "epoch": 0.64, + "learning_rate": 1.826174935217752e-06, + "loss": 0.8721, + "step": 25142 + }, + { + "epoch": 0.64, + "learning_rate": 1.8261593449891755e-06, + "loss": 0.7266, + "step": 25143 + }, + { + "epoch": 0.64, + "learning_rate": 1.8261437541280467e-06, + "loss": 0.8364, + "step": 25144 + }, + { + "epoch": 0.64, + "learning_rate": 1.8261281626343776e-06, + "loss": 0.6733, + "step": 25145 + }, + { + "epoch": 0.64, + "learning_rate": 1.82611257050818e-06, + "loss": 0.9414, + "step": 25146 + }, + { + "epoch": 0.64, + "learning_rate": 1.826096977749466e-06, + "loss": 1.0703, + "step": 25147 + }, + { + "epoch": 0.64, + "learning_rate": 1.8260813843582477e-06, + "loss": 0.958, + "step": 25148 + }, + { + "epoch": 0.64, + "learning_rate": 1.8260657903345367e-06, + "loss": 0.7305, + "step": 25149 + }, + { + "epoch": 0.64, + "learning_rate": 1.8260501956783453e-06, + "loss": 0.9102, + "step": 25150 + }, + { + "epoch": 0.64, + "learning_rate": 1.8260346003896852e-06, + "loss": 1.0039, + "step": 25151 + }, + { + "epoch": 0.64, + "learning_rate": 1.8260190044685683e-06, + "loss": 0.6875, + "step": 25152 + }, + { + "epoch": 0.64, + "learning_rate": 1.8260034079150066e-06, + "loss": 0.9082, + "step": 25153 + }, + { + "epoch": 0.64, + "learning_rate": 1.8259878107290123e-06, + "loss": 0.7891, + "step": 25154 + }, + { + "epoch": 0.64, + "learning_rate": 1.8259722129105968e-06, + "loss": 0.7939, + "step": 25155 + }, + { + "epoch": 0.64, + "learning_rate": 1.8259566144597726e-06, + "loss": 0.8994, + "step": 25156 + }, + { + "epoch": 0.64, + "learning_rate": 1.8259410153765512e-06, + "loss": 0.7891, + "step": 25157 + }, + { + "epoch": 0.64, + "learning_rate": 1.825925415660945e-06, + "loss": 0.8672, + "step": 25158 + }, + { + "epoch": 0.64, + "learning_rate": 1.8259098153129656e-06, + "loss": 0.7329, + "step": 25159 + }, + { + "epoch": 0.64, + "learning_rate": 1.825894214332625e-06, + "loss": 0.8877, + "step": 25160 + }, + { + "epoch": 0.64, + "learning_rate": 1.8258786127199351e-06, + "loss": 0.7695, + "step": 25161 + }, + { + "epoch": 0.64, + "learning_rate": 1.825863010474908e-06, + "loss": 0.8779, + "step": 25162 + }, + { + "epoch": 0.64, + "learning_rate": 1.8258474075975556e-06, + "loss": 0.8857, + "step": 25163 + }, + { + "epoch": 0.64, + "learning_rate": 1.8258318040878897e-06, + "loss": 0.7808, + "step": 25164 + }, + { + "epoch": 0.64, + "learning_rate": 1.8258161999459225e-06, + "loss": 0.8604, + "step": 25165 + }, + { + "epoch": 0.65, + "learning_rate": 1.8258005951716657e-06, + "loss": 1.0205, + "step": 25166 + }, + { + "epoch": 0.65, + "learning_rate": 1.8257849897651312e-06, + "loss": 0.8711, + "step": 25167 + }, + { + "epoch": 0.65, + "learning_rate": 1.8257693837263313e-06, + "loss": 0.8232, + "step": 25168 + }, + { + "epoch": 0.65, + "learning_rate": 1.8257537770552777e-06, + "loss": 0.6792, + "step": 25169 + }, + { + "epoch": 0.65, + "learning_rate": 1.8257381697519825e-06, + "loss": 0.7734, + "step": 25170 + }, + { + "epoch": 0.65, + "learning_rate": 1.8257225618164575e-06, + "loss": 0.7695, + "step": 25171 + }, + { + "epoch": 0.65, + "learning_rate": 1.8257069532487148e-06, + "loss": 0.7388, + "step": 25172 + }, + { + "epoch": 0.65, + "learning_rate": 1.8256913440487661e-06, + "loss": 0.8525, + "step": 25173 + }, + { + "epoch": 0.65, + "learning_rate": 1.8256757342166234e-06, + "loss": 1.0547, + "step": 25174 + }, + { + "epoch": 0.65, + "learning_rate": 1.8256601237522991e-06, + "loss": 0.6147, + "step": 25175 + }, + { + "epoch": 0.65, + "learning_rate": 1.8256445126558045e-06, + "loss": 0.9814, + "step": 25176 + }, + { + "epoch": 0.65, + "learning_rate": 1.8256289009271518e-06, + "loss": 0.9385, + "step": 25177 + }, + { + "epoch": 0.65, + "learning_rate": 1.8256132885663536e-06, + "loss": 1.0371, + "step": 25178 + }, + { + "epoch": 0.65, + "learning_rate": 1.8255976755734206e-06, + "loss": 0.877, + "step": 25179 + }, + { + "epoch": 0.65, + "learning_rate": 1.8255820619483658e-06, + "loss": 0.9131, + "step": 25180 + }, + { + "epoch": 0.65, + "learning_rate": 1.8255664476912008e-06, + "loss": 1.0166, + "step": 25181 + }, + { + "epoch": 0.65, + "learning_rate": 1.8255508328019372e-06, + "loss": 0.9395, + "step": 25182 + }, + { + "epoch": 0.65, + "learning_rate": 1.8255352172805876e-06, + "loss": 0.915, + "step": 25183 + }, + { + "epoch": 0.65, + "learning_rate": 1.8255196011271633e-06, + "loss": 0.7627, + "step": 25184 + }, + { + "epoch": 0.65, + "learning_rate": 1.8255039843416768e-06, + "loss": 1.0332, + "step": 25185 + }, + { + "epoch": 0.65, + "learning_rate": 1.82548836692414e-06, + "loss": 0.7651, + "step": 25186 + }, + { + "epoch": 0.65, + "learning_rate": 1.8254727488745644e-06, + "loss": 0.9238, + "step": 25187 + }, + { + "epoch": 0.65, + "learning_rate": 1.8254571301929626e-06, + "loss": 0.7861, + "step": 25188 + }, + { + "epoch": 0.65, + "learning_rate": 1.825441510879346e-06, + "loss": 0.9062, + "step": 25189 + }, + { + "epoch": 0.65, + "learning_rate": 1.8254258909337268e-06, + "loss": 0.7905, + "step": 25190 + }, + { + "epoch": 0.65, + "learning_rate": 1.8254102703561171e-06, + "loss": 0.9082, + "step": 25191 + }, + { + "epoch": 0.65, + "learning_rate": 1.8253946491465285e-06, + "loss": 0.7412, + "step": 25192 + }, + { + "epoch": 0.65, + "learning_rate": 1.8253790273049735e-06, + "loss": 0.8408, + "step": 25193 + }, + { + "epoch": 0.65, + "learning_rate": 1.8253634048314634e-06, + "loss": 0.8291, + "step": 25194 + }, + { + "epoch": 0.65, + "learning_rate": 1.8253477817260107e-06, + "loss": 0.833, + "step": 25195 + }, + { + "epoch": 0.65, + "learning_rate": 1.8253321579886272e-06, + "loss": 1.0254, + "step": 25196 + }, + { + "epoch": 0.65, + "learning_rate": 1.8253165336193245e-06, + "loss": 0.7036, + "step": 25197 + }, + { + "epoch": 0.65, + "learning_rate": 1.8253009086181153e-06, + "loss": 0.79, + "step": 25198 + }, + { + "epoch": 0.65, + "learning_rate": 1.825285282985011e-06, + "loss": 1.0146, + "step": 25199 + }, + { + "epoch": 0.65, + "learning_rate": 1.8252696567200237e-06, + "loss": 0.7686, + "step": 25200 + }, + { + "epoch": 0.65, + "learning_rate": 1.825254029823165e-06, + "loss": 0.73, + "step": 25201 + }, + { + "epoch": 0.65, + "learning_rate": 1.8252384022944476e-06, + "loss": 0.8936, + "step": 25202 + }, + { + "epoch": 0.65, + "learning_rate": 1.825222774133883e-06, + "loss": 0.9443, + "step": 25203 + }, + { + "epoch": 0.65, + "learning_rate": 1.8252071453414835e-06, + "loss": 0.8936, + "step": 25204 + }, + { + "epoch": 0.65, + "learning_rate": 1.8251915159172606e-06, + "loss": 0.7959, + "step": 25205 + }, + { + "epoch": 0.65, + "learning_rate": 1.8251758858612262e-06, + "loss": 1.0381, + "step": 25206 + }, + { + "epoch": 0.65, + "learning_rate": 1.8251602551733932e-06, + "loss": 1.0381, + "step": 25207 + }, + { + "epoch": 0.65, + "learning_rate": 1.8251446238537725e-06, + "loss": 0.8525, + "step": 25208 + }, + { + "epoch": 0.65, + "learning_rate": 1.8251289919023767e-06, + "loss": 0.7285, + "step": 25209 + }, + { + "epoch": 0.65, + "learning_rate": 1.8251133593192175e-06, + "loss": 0.8672, + "step": 25210 + }, + { + "epoch": 0.65, + "learning_rate": 1.825097726104307e-06, + "loss": 0.8408, + "step": 25211 + }, + { + "epoch": 0.65, + "learning_rate": 1.825082092257657e-06, + "loss": 0.8459, + "step": 25212 + }, + { + "epoch": 0.65, + "learning_rate": 1.8250664577792795e-06, + "loss": 0.9785, + "step": 25213 + }, + { + "epoch": 0.65, + "learning_rate": 1.8250508226691868e-06, + "loss": 0.9336, + "step": 25214 + }, + { + "epoch": 0.65, + "learning_rate": 1.8250351869273906e-06, + "loss": 0.8159, + "step": 25215 + }, + { + "epoch": 0.65, + "learning_rate": 1.8250195505539025e-06, + "loss": 1.0859, + "step": 25216 + }, + { + "epoch": 0.65, + "learning_rate": 1.8250039135487355e-06, + "loss": 0.6733, + "step": 25217 + }, + { + "epoch": 0.65, + "learning_rate": 1.8249882759119007e-06, + "loss": 0.8213, + "step": 25218 + }, + { + "epoch": 0.65, + "learning_rate": 1.82497263764341e-06, + "loss": 1.1016, + "step": 25219 + }, + { + "epoch": 0.65, + "learning_rate": 1.8249569987432758e-06, + "loss": 0.9863, + "step": 25220 + }, + { + "epoch": 0.65, + "learning_rate": 1.8249413592115102e-06, + "loss": 0.6221, + "step": 25221 + }, + { + "epoch": 0.65, + "learning_rate": 1.824925719048125e-06, + "loss": 0.7969, + "step": 25222 + }, + { + "epoch": 0.65, + "learning_rate": 1.8249100782531318e-06, + "loss": 1.0264, + "step": 25223 + }, + { + "epoch": 0.65, + "learning_rate": 1.8248944368265428e-06, + "loss": 0.8901, + "step": 25224 + }, + { + "epoch": 0.65, + "learning_rate": 1.8248787947683703e-06, + "loss": 0.8047, + "step": 25225 + }, + { + "epoch": 0.65, + "learning_rate": 1.824863152078626e-06, + "loss": 0.998, + "step": 25226 + }, + { + "epoch": 0.65, + "learning_rate": 1.824847508757322e-06, + "loss": 0.999, + "step": 25227 + }, + { + "epoch": 0.65, + "learning_rate": 1.82483186480447e-06, + "loss": 0.7927, + "step": 25228 + }, + { + "epoch": 0.65, + "learning_rate": 1.8248162202200823e-06, + "loss": 0.666, + "step": 25229 + }, + { + "epoch": 0.65, + "learning_rate": 1.8248005750041705e-06, + "loss": 0.9473, + "step": 25230 + }, + { + "epoch": 0.65, + "learning_rate": 1.8247849291567472e-06, + "loss": 0.834, + "step": 25231 + }, + { + "epoch": 0.65, + "learning_rate": 1.8247692826778238e-06, + "loss": 0.9277, + "step": 25232 + }, + { + "epoch": 0.65, + "learning_rate": 1.8247536355674127e-06, + "loss": 0.9902, + "step": 25233 + }, + { + "epoch": 0.65, + "learning_rate": 1.8247379878255254e-06, + "loss": 0.9287, + "step": 25234 + }, + { + "epoch": 0.65, + "learning_rate": 1.8247223394521743e-06, + "loss": 0.9497, + "step": 25235 + }, + { + "epoch": 0.65, + "learning_rate": 1.8247066904473708e-06, + "loss": 0.8677, + "step": 25236 + }, + { + "epoch": 0.65, + "learning_rate": 1.8246910408111278e-06, + "loss": 0.8765, + "step": 25237 + }, + { + "epoch": 0.65, + "learning_rate": 1.8246753905434567e-06, + "loss": 0.8213, + "step": 25238 + }, + { + "epoch": 0.65, + "learning_rate": 1.8246597396443696e-06, + "loss": 0.8496, + "step": 25239 + }, + { + "epoch": 0.65, + "learning_rate": 1.8246440881138782e-06, + "loss": 0.9502, + "step": 25240 + }, + { + "epoch": 0.65, + "learning_rate": 1.824628435951995e-06, + "loss": 0.7148, + "step": 25241 + }, + { + "epoch": 0.65, + "learning_rate": 1.8246127831587316e-06, + "loss": 1.0273, + "step": 25242 + }, + { + "epoch": 0.65, + "learning_rate": 1.8245971297341e-06, + "loss": 0.709, + "step": 25243 + }, + { + "epoch": 0.65, + "learning_rate": 1.8245814756781127e-06, + "loss": 0.8301, + "step": 25244 + }, + { + "epoch": 0.65, + "learning_rate": 1.824565820990781e-06, + "loss": 0.876, + "step": 25245 + }, + { + "epoch": 0.65, + "learning_rate": 1.824550165672117e-06, + "loss": 0.9424, + "step": 25246 + }, + { + "epoch": 0.65, + "learning_rate": 1.8245345097221333e-06, + "loss": 0.9326, + "step": 25247 + }, + { + "epoch": 0.65, + "learning_rate": 1.824518853140841e-06, + "loss": 1.04, + "step": 25248 + }, + { + "epoch": 0.65, + "learning_rate": 1.8245031959282527e-06, + "loss": 0.9404, + "step": 25249 + }, + { + "epoch": 0.65, + "learning_rate": 1.8244875380843805e-06, + "loss": 0.9131, + "step": 25250 + }, + { + "epoch": 0.65, + "learning_rate": 1.8244718796092355e-06, + "loss": 0.8066, + "step": 25251 + }, + { + "epoch": 0.65, + "learning_rate": 1.8244562205028306e-06, + "loss": 1.0566, + "step": 25252 + }, + { + "epoch": 0.65, + "learning_rate": 1.8244405607651778e-06, + "loss": 0.7524, + "step": 25253 + }, + { + "epoch": 0.65, + "learning_rate": 1.8244249003962883e-06, + "loss": 0.8555, + "step": 25254 + }, + { + "epoch": 0.65, + "learning_rate": 1.8244092393961747e-06, + "loss": 0.8809, + "step": 25255 + }, + { + "epoch": 0.65, + "learning_rate": 1.8243935777648489e-06, + "loss": 0.4637, + "step": 25256 + }, + { + "epoch": 0.65, + "learning_rate": 1.8243779155023228e-06, + "loss": 0.7202, + "step": 25257 + }, + { + "epoch": 0.65, + "learning_rate": 1.8243622526086083e-06, + "loss": 0.823, + "step": 25258 + }, + { + "epoch": 0.65, + "learning_rate": 1.824346589083718e-06, + "loss": 0.8335, + "step": 25259 + }, + { + "epoch": 0.65, + "learning_rate": 1.824330924927663e-06, + "loss": 0.9424, + "step": 25260 + }, + { + "epoch": 0.65, + "learning_rate": 1.8243152601404558e-06, + "loss": 0.9307, + "step": 25261 + }, + { + "epoch": 0.65, + "learning_rate": 1.8242995947221084e-06, + "loss": 0.8594, + "step": 25262 + }, + { + "epoch": 0.65, + "learning_rate": 1.8242839286726327e-06, + "loss": 0.8984, + "step": 25263 + }, + { + "epoch": 0.65, + "learning_rate": 1.8242682619920403e-06, + "loss": 0.8901, + "step": 25264 + }, + { + "epoch": 0.65, + "learning_rate": 1.8242525946803443e-06, + "loss": 0.9043, + "step": 25265 + }, + { + "epoch": 0.65, + "learning_rate": 1.8242369267375554e-06, + "loss": 0.9414, + "step": 25266 + }, + { + "epoch": 0.65, + "learning_rate": 1.8242212581636864e-06, + "loss": 0.9131, + "step": 25267 + }, + { + "epoch": 0.65, + "learning_rate": 1.8242055889587494e-06, + "loss": 0.7148, + "step": 25268 + }, + { + "epoch": 0.65, + "learning_rate": 1.8241899191227556e-06, + "loss": 0.876, + "step": 25269 + }, + { + "epoch": 0.65, + "learning_rate": 1.8241742486557177e-06, + "loss": 0.8613, + "step": 25270 + }, + { + "epoch": 0.65, + "learning_rate": 1.8241585775576473e-06, + "loss": 0.6489, + "step": 25271 + }, + { + "epoch": 0.65, + "learning_rate": 1.8241429058285568e-06, + "loss": 0.9707, + "step": 25272 + }, + { + "epoch": 0.65, + "learning_rate": 1.8241272334684577e-06, + "loss": 0.9053, + "step": 25273 + }, + { + "epoch": 0.65, + "learning_rate": 1.8241115604773624e-06, + "loss": 0.6157, + "step": 25274 + }, + { + "epoch": 0.65, + "learning_rate": 1.824095886855283e-06, + "loss": 1.0117, + "step": 25275 + }, + { + "epoch": 0.65, + "learning_rate": 1.824080212602231e-06, + "loss": 0.9175, + "step": 25276 + }, + { + "epoch": 0.65, + "learning_rate": 1.8240645377182188e-06, + "loss": 0.8662, + "step": 25277 + }, + { + "epoch": 0.65, + "learning_rate": 1.824048862203258e-06, + "loss": 0.8799, + "step": 25278 + }, + { + "epoch": 0.65, + "learning_rate": 1.8240331860573612e-06, + "loss": 0.6228, + "step": 25279 + }, + { + "epoch": 0.65, + "learning_rate": 1.82401750928054e-06, + "loss": 1.0303, + "step": 25280 + }, + { + "epoch": 0.65, + "learning_rate": 1.8240018318728065e-06, + "loss": 0.8667, + "step": 25281 + }, + { + "epoch": 0.65, + "learning_rate": 1.8239861538341725e-06, + "loss": 0.8047, + "step": 25282 + }, + { + "epoch": 0.65, + "learning_rate": 1.8239704751646503e-06, + "loss": 0.8848, + "step": 25283 + }, + { + "epoch": 0.65, + "learning_rate": 1.823954795864252e-06, + "loss": 0.7275, + "step": 25284 + }, + { + "epoch": 0.65, + "learning_rate": 1.8239391159329891e-06, + "loss": 0.7871, + "step": 25285 + }, + { + "epoch": 0.65, + "learning_rate": 1.823923435370874e-06, + "loss": 1.0439, + "step": 25286 + }, + { + "epoch": 0.65, + "learning_rate": 1.8239077541779188e-06, + "loss": 0.8545, + "step": 25287 + }, + { + "epoch": 0.65, + "learning_rate": 1.8238920723541352e-06, + "loss": 0.6514, + "step": 25288 + }, + { + "epoch": 0.65, + "learning_rate": 1.823876389899535e-06, + "loss": 0.8076, + "step": 25289 + }, + { + "epoch": 0.65, + "learning_rate": 1.823860706814131e-06, + "loss": 1.1592, + "step": 25290 + }, + { + "epoch": 0.65, + "learning_rate": 1.8238450230979345e-06, + "loss": 1.0088, + "step": 25291 + }, + { + "epoch": 0.65, + "learning_rate": 1.8238293387509577e-06, + "loss": 1.0566, + "step": 25292 + }, + { + "epoch": 0.65, + "learning_rate": 1.8238136537732128e-06, + "loss": 0.8247, + "step": 25293 + }, + { + "epoch": 0.65, + "learning_rate": 1.8237979681647118e-06, + "loss": 0.876, + "step": 25294 + }, + { + "epoch": 0.65, + "learning_rate": 1.8237822819254665e-06, + "loss": 0.9023, + "step": 25295 + }, + { + "epoch": 0.65, + "learning_rate": 1.8237665950554888e-06, + "loss": 0.9893, + "step": 25296 + }, + { + "epoch": 0.65, + "learning_rate": 1.8237509075547908e-06, + "loss": 0.8516, + "step": 25297 + }, + { + "epoch": 0.65, + "learning_rate": 1.8237352194233847e-06, + "loss": 0.812, + "step": 25298 + }, + { + "epoch": 0.65, + "learning_rate": 1.8237195306612828e-06, + "loss": 0.751, + "step": 25299 + }, + { + "epoch": 0.65, + "learning_rate": 1.8237038412684964e-06, + "loss": 0.959, + "step": 25300 + }, + { + "epoch": 0.65, + "learning_rate": 1.8236881512450379e-06, + "loss": 0.8564, + "step": 25301 + }, + { + "epoch": 0.65, + "learning_rate": 1.8236724605909192e-06, + "loss": 1.083, + "step": 25302 + }, + { + "epoch": 0.65, + "learning_rate": 1.8236567693061524e-06, + "loss": 0.8086, + "step": 25303 + }, + { + "epoch": 0.65, + "learning_rate": 1.8236410773907497e-06, + "loss": 0.8345, + "step": 25304 + }, + { + "epoch": 0.65, + "learning_rate": 1.8236253848447224e-06, + "loss": 0.917, + "step": 25305 + }, + { + "epoch": 0.65, + "learning_rate": 1.8236096916680834e-06, + "loss": 0.6299, + "step": 25306 + }, + { + "epoch": 0.65, + "learning_rate": 1.8235939978608442e-06, + "loss": 1.0078, + "step": 25307 + }, + { + "epoch": 0.65, + "learning_rate": 1.823578303423017e-06, + "loss": 0.8896, + "step": 25308 + }, + { + "epoch": 0.65, + "learning_rate": 1.8235626083546136e-06, + "loss": 0.9766, + "step": 25309 + }, + { + "epoch": 0.65, + "learning_rate": 1.8235469126556464e-06, + "loss": 0.8516, + "step": 25310 + }, + { + "epoch": 0.65, + "learning_rate": 1.823531216326127e-06, + "loss": 0.9541, + "step": 25311 + }, + { + "epoch": 0.65, + "learning_rate": 1.8235155193660678e-06, + "loss": 1.0254, + "step": 25312 + }, + { + "epoch": 0.65, + "learning_rate": 1.8234998217754808e-06, + "loss": 0.9629, + "step": 25313 + }, + { + "epoch": 0.65, + "learning_rate": 1.8234841235543774e-06, + "loss": 0.6943, + "step": 25314 + }, + { + "epoch": 0.65, + "learning_rate": 1.8234684247027703e-06, + "loss": 0.8086, + "step": 25315 + }, + { + "epoch": 0.65, + "learning_rate": 1.8234527252206715e-06, + "loss": 0.9092, + "step": 25316 + }, + { + "epoch": 0.65, + "learning_rate": 1.8234370251080923e-06, + "loss": 0.6479, + "step": 25317 + }, + { + "epoch": 0.65, + "learning_rate": 1.8234213243650456e-06, + "loss": 0.8789, + "step": 25318 + }, + { + "epoch": 0.65, + "learning_rate": 1.8234056229915432e-06, + "loss": 0.731, + "step": 25319 + }, + { + "epoch": 0.65, + "learning_rate": 1.8233899209875966e-06, + "loss": 0.9678, + "step": 25320 + }, + { + "epoch": 0.65, + "learning_rate": 1.8233742183532183e-06, + "loss": 0.8623, + "step": 25321 + }, + { + "epoch": 0.65, + "learning_rate": 1.8233585150884204e-06, + "loss": 0.6382, + "step": 25322 + }, + { + "epoch": 0.65, + "learning_rate": 1.8233428111932145e-06, + "loss": 0.7061, + "step": 25323 + }, + { + "epoch": 0.65, + "learning_rate": 1.823327106667613e-06, + "loss": 0.8086, + "step": 25324 + }, + { + "epoch": 0.65, + "learning_rate": 1.8233114015116277e-06, + "loss": 0.6709, + "step": 25325 + }, + { + "epoch": 0.65, + "learning_rate": 1.823295695725271e-06, + "loss": 0.8696, + "step": 25326 + }, + { + "epoch": 0.65, + "learning_rate": 1.8232799893085543e-06, + "loss": 0.9863, + "step": 25327 + }, + { + "epoch": 0.65, + "learning_rate": 1.82326428226149e-06, + "loss": 0.769, + "step": 25328 + }, + { + "epoch": 0.65, + "learning_rate": 1.8232485745840904e-06, + "loss": 0.814, + "step": 25329 + }, + { + "epoch": 0.65, + "learning_rate": 1.823232866276367e-06, + "loss": 0.7998, + "step": 25330 + }, + { + "epoch": 0.65, + "learning_rate": 1.8232171573383321e-06, + "loss": 0.873, + "step": 25331 + }, + { + "epoch": 0.65, + "learning_rate": 1.8232014477699974e-06, + "loss": 0.6953, + "step": 25332 + }, + { + "epoch": 0.65, + "learning_rate": 1.8231857375713756e-06, + "loss": 0.6384, + "step": 25333 + }, + { + "epoch": 0.65, + "learning_rate": 1.823170026742478e-06, + "loss": 0.7705, + "step": 25334 + }, + { + "epoch": 0.65, + "learning_rate": 1.8231543152833172e-06, + "loss": 0.9668, + "step": 25335 + }, + { + "epoch": 0.65, + "learning_rate": 1.823138603193905e-06, + "loss": 0.8477, + "step": 25336 + }, + { + "epoch": 0.65, + "learning_rate": 1.8231228904742535e-06, + "loss": 0.792, + "step": 25337 + }, + { + "epoch": 0.65, + "learning_rate": 1.8231071771243743e-06, + "loss": 1.0615, + "step": 25338 + }, + { + "epoch": 0.65, + "learning_rate": 1.82309146314428e-06, + "loss": 0.5859, + "step": 25339 + }, + { + "epoch": 0.65, + "learning_rate": 1.8230757485339826e-06, + "loss": 0.9111, + "step": 25340 + }, + { + "epoch": 0.65, + "learning_rate": 1.8230600332934935e-06, + "loss": 0.7441, + "step": 25341 + }, + { + "epoch": 0.65, + "learning_rate": 1.8230443174228256e-06, + "loss": 1.0498, + "step": 25342 + }, + { + "epoch": 0.65, + "learning_rate": 1.8230286009219902e-06, + "loss": 0.873, + "step": 25343 + }, + { + "epoch": 0.65, + "learning_rate": 1.8230128837909998e-06, + "loss": 0.8525, + "step": 25344 + }, + { + "epoch": 0.65, + "learning_rate": 1.8229971660298662e-06, + "loss": 0.9727, + "step": 25345 + }, + { + "epoch": 0.65, + "learning_rate": 1.8229814476386015e-06, + "loss": 1.1367, + "step": 25346 + }, + { + "epoch": 0.65, + "learning_rate": 1.822965728617218e-06, + "loss": 0.5562, + "step": 25347 + }, + { + "epoch": 0.65, + "learning_rate": 1.8229500089657273e-06, + "loss": 0.916, + "step": 25348 + }, + { + "epoch": 0.65, + "learning_rate": 1.8229342886841415e-06, + "loss": 0.7607, + "step": 25349 + }, + { + "epoch": 0.65, + "learning_rate": 1.822918567772473e-06, + "loss": 0.9473, + "step": 25350 + }, + { + "epoch": 0.65, + "learning_rate": 1.8229028462307334e-06, + "loss": 0.7539, + "step": 25351 + }, + { + "epoch": 0.65, + "learning_rate": 1.822887124058935e-06, + "loss": 0.8135, + "step": 25352 + }, + { + "epoch": 0.65, + "learning_rate": 1.8228714012570898e-06, + "loss": 0.8223, + "step": 25353 + }, + { + "epoch": 0.65, + "learning_rate": 1.8228556778252098e-06, + "loss": 0.9473, + "step": 25354 + }, + { + "epoch": 0.65, + "learning_rate": 1.822839953763307e-06, + "loss": 0.9058, + "step": 25355 + }, + { + "epoch": 0.65, + "learning_rate": 1.8228242290713933e-06, + "loss": 0.916, + "step": 25356 + }, + { + "epoch": 0.65, + "learning_rate": 1.8228085037494812e-06, + "loss": 0.8652, + "step": 25357 + }, + { + "epoch": 0.65, + "learning_rate": 1.8227927777975824e-06, + "loss": 0.8428, + "step": 25358 + }, + { + "epoch": 0.65, + "learning_rate": 1.8227770512157088e-06, + "loss": 0.8682, + "step": 25359 + }, + { + "epoch": 0.65, + "learning_rate": 1.8227613240038729e-06, + "loss": 0.7344, + "step": 25360 + }, + { + "epoch": 0.65, + "learning_rate": 1.8227455961620865e-06, + "loss": 0.8057, + "step": 25361 + }, + { + "epoch": 0.65, + "learning_rate": 1.8227298676903615e-06, + "loss": 0.9229, + "step": 25362 + }, + { + "epoch": 0.65, + "learning_rate": 1.82271413858871e-06, + "loss": 0.9941, + "step": 25363 + }, + { + "epoch": 0.65, + "learning_rate": 1.8226984088571443e-06, + "loss": 1.0068, + "step": 25364 + }, + { + "epoch": 0.65, + "learning_rate": 1.822682678495676e-06, + "loss": 0.9609, + "step": 25365 + }, + { + "epoch": 0.65, + "learning_rate": 1.8226669475043177e-06, + "loss": 0.6938, + "step": 25366 + }, + { + "epoch": 0.65, + "learning_rate": 1.822651215883081e-06, + "loss": 0.8633, + "step": 25367 + }, + { + "epoch": 0.65, + "learning_rate": 1.8226354836319783e-06, + "loss": 0.8018, + "step": 25368 + }, + { + "epoch": 0.65, + "learning_rate": 1.8226197507510211e-06, + "loss": 0.7393, + "step": 25369 + }, + { + "epoch": 0.65, + "learning_rate": 1.8226040172402217e-06, + "loss": 0.6812, + "step": 25370 + }, + { + "epoch": 0.65, + "learning_rate": 1.8225882830995927e-06, + "loss": 0.7524, + "step": 25371 + }, + { + "epoch": 0.65, + "learning_rate": 1.8225725483291452e-06, + "loss": 0.8984, + "step": 25372 + }, + { + "epoch": 0.65, + "learning_rate": 1.8225568129288923e-06, + "loss": 0.8711, + "step": 25373 + }, + { + "epoch": 0.65, + "learning_rate": 1.8225410768988447e-06, + "loss": 1.043, + "step": 25374 + }, + { + "epoch": 0.65, + "learning_rate": 1.8225253402390157e-06, + "loss": 0.9287, + "step": 25375 + }, + { + "epoch": 0.65, + "learning_rate": 1.822509602949417e-06, + "loss": 0.874, + "step": 25376 + }, + { + "epoch": 0.65, + "learning_rate": 1.8224938650300604e-06, + "loss": 0.7417, + "step": 25377 + }, + { + "epoch": 0.65, + "learning_rate": 1.822478126480958e-06, + "loss": 1.0557, + "step": 25378 + }, + { + "epoch": 0.65, + "learning_rate": 1.8224623873021216e-06, + "loss": 0.9434, + "step": 25379 + }, + { + "epoch": 0.65, + "learning_rate": 1.822446647493564e-06, + "loss": 0.7959, + "step": 25380 + }, + { + "epoch": 0.65, + "learning_rate": 1.8224309070552967e-06, + "loss": 0.8438, + "step": 25381 + }, + { + "epoch": 0.65, + "learning_rate": 1.8224151659873319e-06, + "loss": 0.916, + "step": 25382 + }, + { + "epoch": 0.65, + "learning_rate": 1.8223994242896816e-06, + "loss": 0.8525, + "step": 25383 + }, + { + "epoch": 0.65, + "learning_rate": 1.8223836819623579e-06, + "loss": 1.0244, + "step": 25384 + }, + { + "epoch": 0.65, + "learning_rate": 1.8223679390053727e-06, + "loss": 0.8809, + "step": 25385 + }, + { + "epoch": 0.65, + "learning_rate": 1.8223521954187384e-06, + "loss": 0.917, + "step": 25386 + }, + { + "epoch": 0.65, + "learning_rate": 1.8223364512024668e-06, + "loss": 0.875, + "step": 25387 + }, + { + "epoch": 0.65, + "learning_rate": 1.8223207063565698e-06, + "loss": 0.7666, + "step": 25388 + }, + { + "epoch": 0.65, + "learning_rate": 1.8223049608810596e-06, + "loss": 0.9199, + "step": 25389 + }, + { + "epoch": 0.65, + "learning_rate": 1.8222892147759486e-06, + "loss": 0.751, + "step": 25390 + }, + { + "epoch": 0.65, + "learning_rate": 1.8222734680412484e-06, + "loss": 1.0312, + "step": 25391 + }, + { + "epoch": 0.65, + "learning_rate": 1.8222577206769712e-06, + "loss": 0.7197, + "step": 25392 + }, + { + "epoch": 0.65, + "learning_rate": 1.822241972683129e-06, + "loss": 0.8809, + "step": 25393 + }, + { + "epoch": 0.65, + "learning_rate": 1.822226224059734e-06, + "loss": 0.9541, + "step": 25394 + }, + { + "epoch": 0.65, + "learning_rate": 1.8222104748067984e-06, + "loss": 0.9102, + "step": 25395 + }, + { + "epoch": 0.65, + "learning_rate": 1.8221947249243338e-06, + "loss": 0.8955, + "step": 25396 + }, + { + "epoch": 0.65, + "learning_rate": 1.8221789744123526e-06, + "loss": 1.0049, + "step": 25397 + }, + { + "epoch": 0.65, + "learning_rate": 1.8221632232708667e-06, + "loss": 0.6216, + "step": 25398 + }, + { + "epoch": 0.65, + "learning_rate": 1.8221474714998882e-06, + "loss": 0.8232, + "step": 25399 + }, + { + "epoch": 0.65, + "learning_rate": 1.8221317190994295e-06, + "loss": 1.0371, + "step": 25400 + }, + { + "epoch": 0.65, + "learning_rate": 1.8221159660695018e-06, + "loss": 0.8657, + "step": 25401 + }, + { + "epoch": 0.65, + "learning_rate": 1.8221002124101181e-06, + "loss": 0.9238, + "step": 25402 + }, + { + "epoch": 0.65, + "learning_rate": 1.8220844581212899e-06, + "loss": 0.7058, + "step": 25403 + }, + { + "epoch": 0.65, + "learning_rate": 1.8220687032030293e-06, + "loss": 0.9141, + "step": 25404 + }, + { + "epoch": 0.65, + "learning_rate": 1.822052947655349e-06, + "loss": 0.999, + "step": 25405 + }, + { + "epoch": 0.65, + "learning_rate": 1.8220371914782602e-06, + "loss": 0.8857, + "step": 25406 + }, + { + "epoch": 0.65, + "learning_rate": 1.8220214346717752e-06, + "loss": 0.6919, + "step": 25407 + }, + { + "epoch": 0.65, + "learning_rate": 1.8220056772359063e-06, + "loss": 0.7954, + "step": 25408 + }, + { + "epoch": 0.65, + "learning_rate": 1.8219899191706655e-06, + "loss": 0.959, + "step": 25409 + }, + { + "epoch": 0.65, + "learning_rate": 1.8219741604760649e-06, + "loss": 0.7759, + "step": 25410 + }, + { + "epoch": 0.65, + "learning_rate": 1.8219584011521164e-06, + "loss": 0.7261, + "step": 25411 + }, + { + "epoch": 0.65, + "learning_rate": 1.8219426411988322e-06, + "loss": 0.9023, + "step": 25412 + }, + { + "epoch": 0.65, + "learning_rate": 1.8219268806162243e-06, + "loss": 0.6807, + "step": 25413 + }, + { + "epoch": 0.65, + "learning_rate": 1.8219111194043046e-06, + "loss": 0.8721, + "step": 25414 + }, + { + "epoch": 0.65, + "learning_rate": 1.8218953575630853e-06, + "loss": 0.9355, + "step": 25415 + }, + { + "epoch": 0.65, + "learning_rate": 1.8218795950925787e-06, + "loss": 0.7588, + "step": 25416 + }, + { + "epoch": 0.65, + "learning_rate": 1.8218638319927968e-06, + "loss": 0.9121, + "step": 25417 + }, + { + "epoch": 0.65, + "learning_rate": 1.8218480682637516e-06, + "loss": 0.7695, + "step": 25418 + }, + { + "epoch": 0.65, + "learning_rate": 1.8218323039054548e-06, + "loss": 0.8379, + "step": 25419 + }, + { + "epoch": 0.65, + "learning_rate": 1.821816538917919e-06, + "loss": 0.8691, + "step": 25420 + }, + { + "epoch": 0.65, + "learning_rate": 1.821800773301156e-06, + "loss": 0.917, + "step": 25421 + }, + { + "epoch": 0.65, + "learning_rate": 1.8217850070551778e-06, + "loss": 0.9775, + "step": 25422 + }, + { + "epoch": 0.65, + "learning_rate": 1.821769240179997e-06, + "loss": 0.7793, + "step": 25423 + }, + { + "epoch": 0.65, + "learning_rate": 1.8217534726756249e-06, + "loss": 0.708, + "step": 25424 + }, + { + "epoch": 0.65, + "learning_rate": 1.821737704542074e-06, + "loss": 0.7778, + "step": 25425 + }, + { + "epoch": 0.65, + "learning_rate": 1.8217219357793564e-06, + "loss": 0.8296, + "step": 25426 + }, + { + "epoch": 0.65, + "learning_rate": 1.8217061663874845e-06, + "loss": 0.8828, + "step": 25427 + }, + { + "epoch": 0.65, + "learning_rate": 1.8216903963664694e-06, + "loss": 0.6934, + "step": 25428 + }, + { + "epoch": 0.65, + "learning_rate": 1.8216746257163237e-06, + "loss": 0.9844, + "step": 25429 + }, + { + "epoch": 0.65, + "learning_rate": 1.82165885443706e-06, + "loss": 0.6143, + "step": 25430 + }, + { + "epoch": 0.65, + "learning_rate": 1.8216430825286894e-06, + "loss": 1.001, + "step": 25431 + }, + { + "epoch": 0.65, + "learning_rate": 1.821627309991225e-06, + "loss": 0.9541, + "step": 25432 + }, + { + "epoch": 0.65, + "learning_rate": 1.8216115368246778e-06, + "loss": 0.7432, + "step": 25433 + }, + { + "epoch": 0.65, + "learning_rate": 1.821595763029061e-06, + "loss": 0.792, + "step": 25434 + }, + { + "epoch": 0.65, + "learning_rate": 1.8215799886043856e-06, + "loss": 0.7412, + "step": 25435 + }, + { + "epoch": 0.65, + "learning_rate": 1.8215642135506643e-06, + "loss": 0.792, + "step": 25436 + }, + { + "epoch": 0.65, + "learning_rate": 1.8215484378679094e-06, + "loss": 0.7041, + "step": 25437 + }, + { + "epoch": 0.65, + "learning_rate": 1.8215326615561322e-06, + "loss": 0.8701, + "step": 25438 + }, + { + "epoch": 0.65, + "learning_rate": 1.8215168846153452e-06, + "loss": 0.8584, + "step": 25439 + }, + { + "epoch": 0.65, + "learning_rate": 1.8215011070455608e-06, + "loss": 0.6178, + "step": 25440 + }, + { + "epoch": 0.65, + "learning_rate": 1.8214853288467907e-06, + "loss": 0.6904, + "step": 25441 + }, + { + "epoch": 0.65, + "learning_rate": 1.8214695500190472e-06, + "loss": 0.7705, + "step": 25442 + }, + { + "epoch": 0.65, + "learning_rate": 1.8214537705623419e-06, + "loss": 1.0811, + "step": 25443 + }, + { + "epoch": 0.65, + "learning_rate": 1.8214379904766873e-06, + "loss": 0.8945, + "step": 25444 + }, + { + "epoch": 0.65, + "learning_rate": 1.8214222097620955e-06, + "loss": 0.9043, + "step": 25445 + }, + { + "epoch": 0.65, + "learning_rate": 1.8214064284185783e-06, + "loss": 0.595, + "step": 25446 + }, + { + "epoch": 0.65, + "learning_rate": 1.8213906464461481e-06, + "loss": 0.6636, + "step": 25447 + }, + { + "epoch": 0.65, + "learning_rate": 1.821374863844817e-06, + "loss": 0.8545, + "step": 25448 + }, + { + "epoch": 0.65, + "learning_rate": 1.8213590806145968e-06, + "loss": 0.7798, + "step": 25449 + }, + { + "epoch": 0.65, + "learning_rate": 1.8213432967554998e-06, + "loss": 0.8291, + "step": 25450 + }, + { + "epoch": 0.65, + "learning_rate": 1.8213275122675378e-06, + "loss": 1.0371, + "step": 25451 + }, + { + "epoch": 0.65, + "learning_rate": 1.8213117271507233e-06, + "loss": 0.9043, + "step": 25452 + }, + { + "epoch": 0.65, + "learning_rate": 1.8212959414050681e-06, + "loss": 0.8701, + "step": 25453 + }, + { + "epoch": 0.65, + "learning_rate": 1.8212801550305844e-06, + "loss": 1.0391, + "step": 25454 + }, + { + "epoch": 0.65, + "learning_rate": 1.8212643680272844e-06, + "loss": 0.8838, + "step": 25455 + }, + { + "epoch": 0.65, + "learning_rate": 1.8212485803951797e-06, + "loss": 0.6284, + "step": 25456 + }, + { + "epoch": 0.65, + "learning_rate": 1.8212327921342826e-06, + "loss": 0.7002, + "step": 25457 + }, + { + "epoch": 0.65, + "learning_rate": 1.8212170032446057e-06, + "loss": 0.7461, + "step": 25458 + }, + { + "epoch": 0.65, + "learning_rate": 1.8212012137261606e-06, + "loss": 0.7012, + "step": 25459 + }, + { + "epoch": 0.65, + "learning_rate": 1.8211854235789595e-06, + "loss": 0.832, + "step": 25460 + }, + { + "epoch": 0.65, + "learning_rate": 1.8211696328030143e-06, + "loss": 0.6621, + "step": 25461 + }, + { + "epoch": 0.65, + "learning_rate": 1.8211538413983373e-06, + "loss": 0.8721, + "step": 25462 + }, + { + "epoch": 0.65, + "learning_rate": 1.8211380493649408e-06, + "loss": 0.6099, + "step": 25463 + }, + { + "epoch": 0.65, + "learning_rate": 1.8211222567028367e-06, + "loss": 1.04, + "step": 25464 + }, + { + "epoch": 0.65, + "learning_rate": 1.8211064634120367e-06, + "loss": 0.645, + "step": 25465 + }, + { + "epoch": 0.65, + "learning_rate": 1.8210906694925536e-06, + "loss": 0.8916, + "step": 25466 + }, + { + "epoch": 0.65, + "learning_rate": 1.8210748749443989e-06, + "loss": 0.7334, + "step": 25467 + }, + { + "epoch": 0.65, + "learning_rate": 1.821059079767585e-06, + "loss": 0.7266, + "step": 25468 + }, + { + "epoch": 0.65, + "learning_rate": 1.821043283962124e-06, + "loss": 0.8066, + "step": 25469 + }, + { + "epoch": 0.65, + "learning_rate": 1.8210274875280275e-06, + "loss": 0.7134, + "step": 25470 + }, + { + "epoch": 0.65, + "learning_rate": 1.8210116904653083e-06, + "loss": 1.001, + "step": 25471 + }, + { + "epoch": 0.65, + "learning_rate": 1.8209958927739784e-06, + "loss": 0.8877, + "step": 25472 + }, + { + "epoch": 0.65, + "learning_rate": 1.8209800944540495e-06, + "loss": 0.7451, + "step": 25473 + }, + { + "epoch": 0.65, + "learning_rate": 1.8209642955055338e-06, + "loss": 0.9224, + "step": 25474 + }, + { + "epoch": 0.65, + "learning_rate": 1.8209484959284437e-06, + "loss": 0.8936, + "step": 25475 + }, + { + "epoch": 0.65, + "learning_rate": 1.820932695722791e-06, + "loss": 0.6396, + "step": 25476 + }, + { + "epoch": 0.65, + "learning_rate": 1.8209168948885876e-06, + "loss": 0.9912, + "step": 25477 + }, + { + "epoch": 0.65, + "learning_rate": 1.8209010934258463e-06, + "loss": 0.9355, + "step": 25478 + }, + { + "epoch": 0.65, + "learning_rate": 1.8208852913345786e-06, + "loss": 0.6162, + "step": 25479 + }, + { + "epoch": 0.65, + "learning_rate": 1.8208694886147967e-06, + "loss": 0.8711, + "step": 25480 + }, + { + "epoch": 0.65, + "learning_rate": 1.8208536852665128e-06, + "loss": 0.8799, + "step": 25481 + }, + { + "epoch": 0.65, + "learning_rate": 1.820837881289739e-06, + "loss": 1.0459, + "step": 25482 + }, + { + "epoch": 0.65, + "learning_rate": 1.8208220766844874e-06, + "loss": 0.8242, + "step": 25483 + }, + { + "epoch": 0.65, + "learning_rate": 1.8208062714507702e-06, + "loss": 0.8408, + "step": 25484 + }, + { + "epoch": 0.65, + "learning_rate": 1.8207904655885992e-06, + "loss": 0.8975, + "step": 25485 + }, + { + "epoch": 0.65, + "learning_rate": 1.8207746590979868e-06, + "loss": 0.6084, + "step": 25486 + }, + { + "epoch": 0.65, + "learning_rate": 1.8207588519789447e-06, + "loss": 0.8413, + "step": 25487 + }, + { + "epoch": 0.65, + "learning_rate": 1.8207430442314857e-06, + "loss": 0.7295, + "step": 25488 + }, + { + "epoch": 0.65, + "learning_rate": 1.8207272358556214e-06, + "loss": 0.7949, + "step": 25489 + }, + { + "epoch": 0.65, + "learning_rate": 1.8207114268513638e-06, + "loss": 1.0635, + "step": 25490 + }, + { + "epoch": 0.65, + "learning_rate": 1.8206956172187252e-06, + "loss": 0.7983, + "step": 25491 + }, + { + "epoch": 0.65, + "learning_rate": 1.820679806957718e-06, + "loss": 0.8818, + "step": 25492 + }, + { + "epoch": 0.65, + "learning_rate": 1.8206639960683537e-06, + "loss": 1.0029, + "step": 25493 + }, + { + "epoch": 0.65, + "learning_rate": 1.8206481845506448e-06, + "loss": 1.0225, + "step": 25494 + }, + { + "epoch": 0.65, + "learning_rate": 1.8206323724046034e-06, + "loss": 0.5024, + "step": 25495 + }, + { + "epoch": 0.65, + "learning_rate": 1.8206165596302414e-06, + "loss": 0.9043, + "step": 25496 + }, + { + "epoch": 0.65, + "learning_rate": 1.820600746227571e-06, + "loss": 0.7373, + "step": 25497 + }, + { + "epoch": 0.65, + "learning_rate": 1.8205849321966046e-06, + "loss": 0.8604, + "step": 25498 + }, + { + "epoch": 0.65, + "learning_rate": 1.820569117537354e-06, + "loss": 0.9102, + "step": 25499 + }, + { + "epoch": 0.65, + "learning_rate": 1.820553302249831e-06, + "loss": 0.8467, + "step": 25500 + }, + { + "epoch": 0.65, + "learning_rate": 1.8205374863340484e-06, + "loss": 0.7822, + "step": 25501 + }, + { + "epoch": 0.65, + "learning_rate": 1.8205216697900178e-06, + "loss": 0.6562, + "step": 25502 + }, + { + "epoch": 0.65, + "learning_rate": 1.8205058526177517e-06, + "loss": 0.875, + "step": 25503 + }, + { + "epoch": 0.65, + "learning_rate": 1.8204900348172619e-06, + "loss": 0.6895, + "step": 25504 + }, + { + "epoch": 0.65, + "learning_rate": 1.8204742163885605e-06, + "loss": 0.6646, + "step": 25505 + }, + { + "epoch": 0.65, + "learning_rate": 1.82045839733166e-06, + "loss": 0.9883, + "step": 25506 + }, + { + "epoch": 0.65, + "learning_rate": 1.8204425776465717e-06, + "loss": 0.8408, + "step": 25507 + }, + { + "epoch": 0.65, + "learning_rate": 1.8204267573333087e-06, + "loss": 0.4619, + "step": 25508 + }, + { + "epoch": 0.65, + "learning_rate": 1.8204109363918824e-06, + "loss": 0.8306, + "step": 25509 + }, + { + "epoch": 0.65, + "learning_rate": 1.8203951148223053e-06, + "loss": 0.9453, + "step": 25510 + }, + { + "epoch": 0.65, + "learning_rate": 1.8203792926245894e-06, + "loss": 0.8613, + "step": 25511 + }, + { + "epoch": 0.65, + "learning_rate": 1.820363469798747e-06, + "loss": 0.7612, + "step": 25512 + }, + { + "epoch": 0.65, + "learning_rate": 1.8203476463447896e-06, + "loss": 0.7764, + "step": 25513 + }, + { + "epoch": 0.65, + "learning_rate": 1.82033182226273e-06, + "loss": 0.9131, + "step": 25514 + }, + { + "epoch": 0.65, + "learning_rate": 1.82031599755258e-06, + "loss": 0.9932, + "step": 25515 + }, + { + "epoch": 0.65, + "learning_rate": 1.8203001722143516e-06, + "loss": 1.0225, + "step": 25516 + }, + { + "epoch": 0.65, + "learning_rate": 1.8202843462480573e-06, + "loss": 0.8037, + "step": 25517 + }, + { + "epoch": 0.65, + "learning_rate": 1.820268519653709e-06, + "loss": 1.1807, + "step": 25518 + }, + { + "epoch": 0.65, + "learning_rate": 1.8202526924313184e-06, + "loss": 0.8564, + "step": 25519 + }, + { + "epoch": 0.65, + "learning_rate": 1.8202368645808982e-06, + "loss": 0.7441, + "step": 25520 + }, + { + "epoch": 0.65, + "learning_rate": 1.8202210361024605e-06, + "loss": 0.7144, + "step": 25521 + }, + { + "epoch": 0.65, + "learning_rate": 1.8202052069960176e-06, + "loss": 1.0752, + "step": 25522 + }, + { + "epoch": 0.65, + "learning_rate": 1.8201893772615808e-06, + "loss": 0.8516, + "step": 25523 + }, + { + "epoch": 0.65, + "learning_rate": 1.8201735468991629e-06, + "loss": 0.9023, + "step": 25524 + }, + { + "epoch": 0.65, + "learning_rate": 1.8201577159087757e-06, + "loss": 0.8779, + "step": 25525 + }, + { + "epoch": 0.65, + "learning_rate": 1.8201418842904316e-06, + "loss": 1.0146, + "step": 25526 + }, + { + "epoch": 0.65, + "learning_rate": 1.8201260520441423e-06, + "loss": 0.5942, + "step": 25527 + }, + { + "epoch": 0.65, + "learning_rate": 1.8201102191699204e-06, + "loss": 0.8408, + "step": 25528 + }, + { + "epoch": 0.65, + "learning_rate": 1.8200943856677777e-06, + "loss": 0.7559, + "step": 25529 + }, + { + "epoch": 0.65, + "learning_rate": 1.8200785515377265e-06, + "loss": 1.0137, + "step": 25530 + }, + { + "epoch": 0.65, + "learning_rate": 1.820062716779779e-06, + "loss": 0.7158, + "step": 25531 + }, + { + "epoch": 0.65, + "learning_rate": 1.820046881393947e-06, + "loss": 1.1621, + "step": 25532 + }, + { + "epoch": 0.65, + "learning_rate": 1.8200310453802433e-06, + "loss": 0.9111, + "step": 25533 + }, + { + "epoch": 0.65, + "learning_rate": 1.8200152087386788e-06, + "loss": 0.9331, + "step": 25534 + }, + { + "epoch": 0.65, + "learning_rate": 1.8199993714692667e-06, + "loss": 0.9473, + "step": 25535 + }, + { + "epoch": 0.65, + "learning_rate": 1.8199835335720187e-06, + "loss": 0.8281, + "step": 25536 + }, + { + "epoch": 0.65, + "learning_rate": 1.8199676950469472e-06, + "loss": 0.9375, + "step": 25537 + }, + { + "epoch": 0.65, + "learning_rate": 1.8199518558940641e-06, + "loss": 0.834, + "step": 25538 + }, + { + "epoch": 0.65, + "learning_rate": 1.8199360161133814e-06, + "loss": 0.3955, + "step": 25539 + }, + { + "epoch": 0.65, + "learning_rate": 1.8199201757049116e-06, + "loss": 0.719, + "step": 25540 + }, + { + "epoch": 0.65, + "learning_rate": 1.8199043346686664e-06, + "loss": 0.7048, + "step": 25541 + }, + { + "epoch": 0.65, + "learning_rate": 1.8198884930046583e-06, + "loss": 0.8203, + "step": 25542 + }, + { + "epoch": 0.65, + "learning_rate": 1.8198726507128992e-06, + "loss": 0.7754, + "step": 25543 + }, + { + "epoch": 0.65, + "learning_rate": 1.8198568077934016e-06, + "loss": 0.6074, + "step": 25544 + }, + { + "epoch": 0.65, + "learning_rate": 1.8198409642461767e-06, + "loss": 0.7349, + "step": 25545 + }, + { + "epoch": 0.65, + "learning_rate": 1.8198251200712378e-06, + "loss": 1.1689, + "step": 25546 + }, + { + "epoch": 0.65, + "learning_rate": 1.8198092752685965e-06, + "loss": 0.8418, + "step": 25547 + }, + { + "epoch": 0.65, + "learning_rate": 1.8197934298382646e-06, + "loss": 0.791, + "step": 25548 + }, + { + "epoch": 0.65, + "learning_rate": 1.819777583780255e-06, + "loss": 1.0, + "step": 25549 + }, + { + "epoch": 0.65, + "learning_rate": 1.8197617370945788e-06, + "loss": 0.7329, + "step": 25550 + }, + { + "epoch": 0.65, + "learning_rate": 1.8197458897812492e-06, + "loss": 0.9395, + "step": 25551 + }, + { + "epoch": 0.65, + "learning_rate": 1.8197300418402776e-06, + "loss": 0.8018, + "step": 25552 + }, + { + "epoch": 0.65, + "learning_rate": 1.8197141932716766e-06, + "loss": 0.9453, + "step": 25553 + }, + { + "epoch": 0.65, + "learning_rate": 1.8196983440754584e-06, + "loss": 0.7334, + "step": 25554 + }, + { + "epoch": 0.65, + "learning_rate": 1.8196824942516344e-06, + "loss": 0.8828, + "step": 25555 + }, + { + "epoch": 0.66, + "learning_rate": 1.8196666438002174e-06, + "loss": 0.9014, + "step": 25556 + }, + { + "epoch": 0.66, + "learning_rate": 1.8196507927212193e-06, + "loss": 0.8691, + "step": 25557 + }, + { + "epoch": 0.66, + "learning_rate": 1.8196349410146521e-06, + "loss": 0.9238, + "step": 25558 + }, + { + "epoch": 0.66, + "learning_rate": 1.8196190886805284e-06, + "loss": 0.939, + "step": 25559 + }, + { + "epoch": 0.66, + "learning_rate": 1.81960323571886e-06, + "loss": 0.8174, + "step": 25560 + }, + { + "epoch": 0.66, + "learning_rate": 1.819587382129659e-06, + "loss": 0.6157, + "step": 25561 + }, + { + "epoch": 0.66, + "learning_rate": 1.8195715279129375e-06, + "loss": 0.9639, + "step": 25562 + }, + { + "epoch": 0.66, + "learning_rate": 1.819555673068708e-06, + "loss": 0.8975, + "step": 25563 + }, + { + "epoch": 0.66, + "learning_rate": 1.8195398175969825e-06, + "loss": 0.9111, + "step": 25564 + }, + { + "epoch": 0.66, + "learning_rate": 1.8195239614977726e-06, + "loss": 0.9229, + "step": 25565 + }, + { + "epoch": 0.66, + "learning_rate": 1.8195081047710912e-06, + "loss": 0.8022, + "step": 25566 + }, + { + "epoch": 0.66, + "learning_rate": 1.8194922474169503e-06, + "loss": 0.9541, + "step": 25567 + }, + { + "epoch": 0.66, + "learning_rate": 1.8194763894353615e-06, + "loss": 1.0059, + "step": 25568 + }, + { + "epoch": 0.66, + "learning_rate": 1.8194605308263375e-06, + "loss": 0.7729, + "step": 25569 + }, + { + "epoch": 0.66, + "learning_rate": 1.81944467158989e-06, + "loss": 0.8066, + "step": 25570 + }, + { + "epoch": 0.66, + "learning_rate": 1.8194288117260319e-06, + "loss": 0.7441, + "step": 25571 + }, + { + "epoch": 0.66, + "learning_rate": 1.8194129512347744e-06, + "loss": 0.791, + "step": 25572 + }, + { + "epoch": 0.66, + "learning_rate": 1.8193970901161305e-06, + "loss": 0.918, + "step": 25573 + }, + { + "epoch": 0.66, + "learning_rate": 1.8193812283701115e-06, + "loss": 0.9102, + "step": 25574 + }, + { + "epoch": 0.66, + "learning_rate": 1.81936536599673e-06, + "loss": 0.665, + "step": 25575 + }, + { + "epoch": 0.66, + "learning_rate": 1.8193495029959984e-06, + "loss": 0.9453, + "step": 25576 + }, + { + "epoch": 0.66, + "learning_rate": 1.819333639367928e-06, + "loss": 0.998, + "step": 25577 + }, + { + "epoch": 0.66, + "learning_rate": 1.8193177751125322e-06, + "loss": 0.917, + "step": 25578 + }, + { + "epoch": 0.66, + "learning_rate": 1.819301910229822e-06, + "loss": 0.7102, + "step": 25579 + }, + { + "epoch": 0.66, + "learning_rate": 1.8192860447198104e-06, + "loss": 0.7793, + "step": 25580 + }, + { + "epoch": 0.66, + "learning_rate": 1.8192701785825087e-06, + "loss": 0.8135, + "step": 25581 + }, + { + "epoch": 0.66, + "learning_rate": 1.81925431181793e-06, + "loss": 0.9609, + "step": 25582 + }, + { + "epoch": 0.66, + "learning_rate": 1.8192384444260855e-06, + "loss": 1.0615, + "step": 25583 + }, + { + "epoch": 0.66, + "learning_rate": 1.819222576406988e-06, + "loss": 0.8926, + "step": 25584 + }, + { + "epoch": 0.66, + "learning_rate": 1.8192067077606495e-06, + "loss": 0.7549, + "step": 25585 + }, + { + "epoch": 0.66, + "learning_rate": 1.8191908384870817e-06, + "loss": 1.1797, + "step": 25586 + }, + { + "epoch": 0.66, + "learning_rate": 1.8191749685862977e-06, + "loss": 0.877, + "step": 25587 + }, + { + "epoch": 0.66, + "learning_rate": 1.8191590980583084e-06, + "loss": 0.7139, + "step": 25588 + }, + { + "epoch": 0.66, + "learning_rate": 1.8191432269031273e-06, + "loss": 0.7441, + "step": 25589 + }, + { + "epoch": 0.66, + "learning_rate": 1.8191273551207656e-06, + "loss": 0.9434, + "step": 25590 + }, + { + "epoch": 0.66, + "learning_rate": 1.8191114827112358e-06, + "loss": 0.7859, + "step": 25591 + }, + { + "epoch": 0.66, + "learning_rate": 1.8190956096745499e-06, + "loss": 0.9932, + "step": 25592 + }, + { + "epoch": 0.66, + "learning_rate": 1.81907973601072e-06, + "loss": 0.9072, + "step": 25593 + }, + { + "epoch": 0.66, + "learning_rate": 1.8190638617197588e-06, + "loss": 0.8164, + "step": 25594 + }, + { + "epoch": 0.66, + "learning_rate": 1.819047986801678e-06, + "loss": 0.7148, + "step": 25595 + }, + { + "epoch": 0.66, + "learning_rate": 1.8190321112564896e-06, + "loss": 0.6992, + "step": 25596 + }, + { + "epoch": 0.66, + "learning_rate": 1.8190162350842063e-06, + "loss": 0.9619, + "step": 25597 + }, + { + "epoch": 0.66, + "learning_rate": 1.8190003582848397e-06, + "loss": 0.791, + "step": 25598 + }, + { + "epoch": 0.66, + "learning_rate": 1.8189844808584024e-06, + "loss": 0.8027, + "step": 25599 + }, + { + "epoch": 0.66, + "learning_rate": 1.8189686028049059e-06, + "loss": 0.7617, + "step": 25600 + }, + { + "epoch": 0.66, + "learning_rate": 1.818952724124363e-06, + "loss": 0.9551, + "step": 25601 + }, + { + "epoch": 0.66, + "learning_rate": 1.818936844816786e-06, + "loss": 0.8643, + "step": 25602 + }, + { + "epoch": 0.66, + "learning_rate": 1.8189209648821864e-06, + "loss": 0.9834, + "step": 25603 + }, + { + "epoch": 0.66, + "learning_rate": 1.8189050843205766e-06, + "loss": 0.9561, + "step": 25604 + }, + { + "epoch": 0.66, + "learning_rate": 1.818889203131969e-06, + "loss": 0.6658, + "step": 25605 + }, + { + "epoch": 0.66, + "learning_rate": 1.8188733213163754e-06, + "loss": 1.0703, + "step": 25606 + }, + { + "epoch": 0.66, + "learning_rate": 1.8188574388738083e-06, + "loss": 0.7822, + "step": 25607 + }, + { + "epoch": 0.66, + "learning_rate": 1.8188415558042797e-06, + "loss": 0.8955, + "step": 25608 + }, + { + "epoch": 0.66, + "learning_rate": 1.8188256721078017e-06, + "loss": 0.7905, + "step": 25609 + }, + { + "epoch": 0.66, + "learning_rate": 1.8188097877843867e-06, + "loss": 0.9727, + "step": 25610 + }, + { + "epoch": 0.66, + "learning_rate": 1.8187939028340464e-06, + "loss": 0.7314, + "step": 25611 + }, + { + "epoch": 0.66, + "learning_rate": 1.8187780172567938e-06, + "loss": 0.8369, + "step": 25612 + }, + { + "epoch": 0.66, + "learning_rate": 1.81876213105264e-06, + "loss": 1.0166, + "step": 25613 + }, + { + "epoch": 0.66, + "learning_rate": 1.8187462442215977e-06, + "loss": 0.7856, + "step": 25614 + }, + { + "epoch": 0.66, + "learning_rate": 1.8187303567636795e-06, + "loss": 0.8169, + "step": 25615 + }, + { + "epoch": 0.66, + "learning_rate": 1.8187144686788965e-06, + "loss": 0.8467, + "step": 25616 + }, + { + "epoch": 0.66, + "learning_rate": 1.8186985799672617e-06, + "loss": 0.9121, + "step": 25617 + }, + { + "epoch": 0.66, + "learning_rate": 1.8186826906287872e-06, + "loss": 0.8291, + "step": 25618 + }, + { + "epoch": 0.66, + "learning_rate": 1.818666800663485e-06, + "loss": 0.9385, + "step": 25619 + }, + { + "epoch": 0.66, + "learning_rate": 1.8186509100713673e-06, + "loss": 0.9502, + "step": 25620 + }, + { + "epoch": 0.66, + "learning_rate": 1.8186350188524461e-06, + "loss": 0.8652, + "step": 25621 + }, + { + "epoch": 0.66, + "learning_rate": 1.8186191270067338e-06, + "loss": 0.8516, + "step": 25622 + }, + { + "epoch": 0.66, + "learning_rate": 1.8186032345342424e-06, + "loss": 0.8506, + "step": 25623 + }, + { + "epoch": 0.66, + "learning_rate": 1.8185873414349842e-06, + "loss": 0.791, + "step": 25624 + }, + { + "epoch": 0.66, + "learning_rate": 1.8185714477089711e-06, + "loss": 0.7988, + "step": 25625 + }, + { + "epoch": 0.66, + "learning_rate": 1.8185555533562158e-06, + "loss": 1.0713, + "step": 25626 + }, + { + "epoch": 0.66, + "learning_rate": 1.81853965837673e-06, + "loss": 0.5459, + "step": 25627 + }, + { + "epoch": 0.66, + "learning_rate": 1.818523762770526e-06, + "loss": 0.7681, + "step": 25628 + }, + { + "epoch": 0.66, + "learning_rate": 1.818507866537616e-06, + "loss": 0.8379, + "step": 25629 + }, + { + "epoch": 0.66, + "learning_rate": 1.8184919696780124e-06, + "loss": 0.748, + "step": 25630 + }, + { + "epoch": 0.66, + "learning_rate": 1.8184760721917268e-06, + "loss": 0.7588, + "step": 25631 + }, + { + "epoch": 0.66, + "learning_rate": 1.818460174078772e-06, + "loss": 0.9043, + "step": 25632 + }, + { + "epoch": 0.66, + "learning_rate": 1.8184442753391596e-06, + "loss": 0.8042, + "step": 25633 + }, + { + "epoch": 0.66, + "learning_rate": 1.8184283759729022e-06, + "loss": 0.96, + "step": 25634 + }, + { + "epoch": 0.66, + "learning_rate": 1.8184124759800117e-06, + "loss": 0.8574, + "step": 25635 + }, + { + "epoch": 0.66, + "learning_rate": 1.8183965753605004e-06, + "loss": 0.8389, + "step": 25636 + }, + { + "epoch": 0.66, + "learning_rate": 1.8183806741143806e-06, + "loss": 0.7988, + "step": 25637 + }, + { + "epoch": 0.66, + "learning_rate": 1.8183647722416644e-06, + "loss": 0.8291, + "step": 25638 + }, + { + "epoch": 0.66, + "learning_rate": 1.8183488697423638e-06, + "loss": 0.6948, + "step": 25639 + }, + { + "epoch": 0.66, + "learning_rate": 1.818332966616491e-06, + "loss": 0.8755, + "step": 25640 + }, + { + "epoch": 0.66, + "learning_rate": 1.8183170628640588e-06, + "loss": 1.0312, + "step": 25641 + }, + { + "epoch": 0.66, + "learning_rate": 1.8183011584850782e-06, + "loss": 1.0146, + "step": 25642 + }, + { + "epoch": 0.66, + "learning_rate": 1.8182852534795623e-06, + "loss": 0.7803, + "step": 25643 + }, + { + "epoch": 0.66, + "learning_rate": 1.818269347847523e-06, + "loss": 0.8857, + "step": 25644 + }, + { + "epoch": 0.66, + "learning_rate": 1.8182534415889725e-06, + "loss": 0.7544, + "step": 25645 + }, + { + "epoch": 0.66, + "learning_rate": 1.818237534703923e-06, + "loss": 0.645, + "step": 25646 + }, + { + "epoch": 0.66, + "learning_rate": 1.8182216271923866e-06, + "loss": 0.7402, + "step": 25647 + }, + { + "epoch": 0.66, + "learning_rate": 1.8182057190543754e-06, + "loss": 0.7134, + "step": 25648 + }, + { + "epoch": 0.66, + "learning_rate": 1.818189810289902e-06, + "loss": 0.9189, + "step": 25649 + }, + { + "epoch": 0.66, + "learning_rate": 1.8181739008989779e-06, + "loss": 0.834, + "step": 25650 + }, + { + "epoch": 0.66, + "learning_rate": 1.8181579908816161e-06, + "loss": 0.7061, + "step": 25651 + }, + { + "epoch": 0.66, + "learning_rate": 1.818142080237828e-06, + "loss": 1.0283, + "step": 25652 + }, + { + "epoch": 0.66, + "learning_rate": 1.8181261689676262e-06, + "loss": 0.9873, + "step": 25653 + }, + { + "epoch": 0.66, + "learning_rate": 1.818110257071023e-06, + "loss": 0.8711, + "step": 25654 + }, + { + "epoch": 0.66, + "learning_rate": 1.8180943445480301e-06, + "loss": 0.7866, + "step": 25655 + }, + { + "epoch": 0.66, + "learning_rate": 1.81807843139866e-06, + "loss": 0.6836, + "step": 25656 + }, + { + "epoch": 0.66, + "learning_rate": 1.8180625176229253e-06, + "loss": 0.8555, + "step": 25657 + }, + { + "epoch": 0.66, + "learning_rate": 1.8180466032208373e-06, + "loss": 0.7183, + "step": 25658 + }, + { + "epoch": 0.66, + "learning_rate": 1.8180306881924086e-06, + "loss": 0.8291, + "step": 25659 + }, + { + "epoch": 0.66, + "learning_rate": 1.8180147725376516e-06, + "loss": 0.8594, + "step": 25660 + }, + { + "epoch": 0.66, + "learning_rate": 1.8179988562565782e-06, + "loss": 0.7037, + "step": 25661 + }, + { + "epoch": 0.66, + "learning_rate": 1.8179829393492008e-06, + "loss": 0.8057, + "step": 25662 + }, + { + "epoch": 0.66, + "learning_rate": 1.8179670218155315e-06, + "loss": 1.0273, + "step": 25663 + }, + { + "epoch": 0.66, + "learning_rate": 1.8179511036555825e-06, + "loss": 1.0137, + "step": 25664 + }, + { + "epoch": 0.66, + "learning_rate": 1.8179351848693658e-06, + "loss": 0.8186, + "step": 25665 + }, + { + "epoch": 0.66, + "learning_rate": 1.8179192654568937e-06, + "loss": 0.9697, + "step": 25666 + }, + { + "epoch": 0.66, + "learning_rate": 1.8179033454181786e-06, + "loss": 1.0693, + "step": 25667 + }, + { + "epoch": 0.66, + "learning_rate": 1.8178874247532322e-06, + "loss": 0.8994, + "step": 25668 + }, + { + "epoch": 0.66, + "learning_rate": 1.8178715034620673e-06, + "loss": 0.9209, + "step": 25669 + }, + { + "epoch": 0.66, + "learning_rate": 1.8178555815446959e-06, + "loss": 0.9111, + "step": 25670 + }, + { + "epoch": 0.66, + "learning_rate": 1.8178396590011297e-06, + "loss": 0.9746, + "step": 25671 + }, + { + "epoch": 0.66, + "learning_rate": 1.8178237358313817e-06, + "loss": 0.8525, + "step": 25672 + }, + { + "epoch": 0.66, + "learning_rate": 1.8178078120354633e-06, + "loss": 0.9111, + "step": 25673 + }, + { + "epoch": 0.66, + "learning_rate": 1.8177918876133873e-06, + "loss": 0.7305, + "step": 25674 + }, + { + "epoch": 0.66, + "learning_rate": 1.8177759625651658e-06, + "loss": 1.1494, + "step": 25675 + }, + { + "epoch": 0.66, + "learning_rate": 1.8177600368908106e-06, + "loss": 0.9634, + "step": 25676 + }, + { + "epoch": 0.66, + "learning_rate": 1.8177441105903342e-06, + "loss": 0.7031, + "step": 25677 + }, + { + "epoch": 0.66, + "learning_rate": 1.8177281836637488e-06, + "loss": 0.582, + "step": 25678 + }, + { + "epoch": 0.66, + "learning_rate": 1.8177122561110663e-06, + "loss": 0.8857, + "step": 25679 + }, + { + "epoch": 0.66, + "learning_rate": 1.8176963279322992e-06, + "loss": 0.8936, + "step": 25680 + }, + { + "epoch": 0.66, + "learning_rate": 1.8176803991274595e-06, + "loss": 0.6755, + "step": 25681 + }, + { + "epoch": 0.66, + "learning_rate": 1.81766446969656e-06, + "loss": 0.8076, + "step": 25682 + }, + { + "epoch": 0.66, + "learning_rate": 1.8176485396396121e-06, + "loss": 0.8135, + "step": 25683 + }, + { + "epoch": 0.66, + "learning_rate": 1.8176326089566283e-06, + "loss": 0.9775, + "step": 25684 + }, + { + "epoch": 0.66, + "learning_rate": 1.8176166776476206e-06, + "loss": 1.0186, + "step": 25685 + }, + { + "epoch": 0.66, + "learning_rate": 1.8176007457126019e-06, + "loss": 1.0488, + "step": 25686 + }, + { + "epoch": 0.66, + "learning_rate": 1.8175848131515836e-06, + "loss": 0.877, + "step": 25687 + }, + { + "epoch": 0.66, + "learning_rate": 1.817568879964578e-06, + "loss": 0.7607, + "step": 25688 + }, + { + "epoch": 0.66, + "learning_rate": 1.8175529461515979e-06, + "loss": 0.864, + "step": 25689 + }, + { + "epoch": 0.66, + "learning_rate": 1.8175370117126548e-06, + "loss": 1.1172, + "step": 25690 + }, + { + "epoch": 0.66, + "learning_rate": 1.8175210766477616e-06, + "loss": 0.9209, + "step": 25691 + }, + { + "epoch": 0.66, + "learning_rate": 1.8175051409569297e-06, + "loss": 0.9141, + "step": 25692 + }, + { + "epoch": 0.66, + "learning_rate": 1.817489204640172e-06, + "loss": 0.9043, + "step": 25693 + }, + { + "epoch": 0.66, + "learning_rate": 1.8174732676975002e-06, + "loss": 1.041, + "step": 25694 + }, + { + "epoch": 0.66, + "learning_rate": 1.8174573301289269e-06, + "loss": 0.8145, + "step": 25695 + }, + { + "epoch": 0.66, + "learning_rate": 1.817441391934464e-06, + "loss": 0.8887, + "step": 25696 + }, + { + "epoch": 0.66, + "learning_rate": 1.8174254531141238e-06, + "loss": 0.8623, + "step": 25697 + }, + { + "epoch": 0.66, + "learning_rate": 1.8174095136679184e-06, + "loss": 0.8623, + "step": 25698 + }, + { + "epoch": 0.66, + "learning_rate": 1.8173935735958604e-06, + "loss": 0.9824, + "step": 25699 + }, + { + "epoch": 0.66, + "learning_rate": 1.8173776328979616e-06, + "loss": 0.7441, + "step": 25700 + }, + { + "epoch": 0.66, + "learning_rate": 1.8173616915742343e-06, + "loss": 0.6372, + "step": 25701 + }, + { + "epoch": 0.66, + "learning_rate": 1.8173457496246906e-06, + "loss": 0.6699, + "step": 25702 + }, + { + "epoch": 0.66, + "learning_rate": 1.8173298070493428e-06, + "loss": 0.9121, + "step": 25703 + }, + { + "epoch": 0.66, + "learning_rate": 1.8173138638482035e-06, + "loss": 0.8311, + "step": 25704 + }, + { + "epoch": 0.66, + "learning_rate": 1.8172979200212843e-06, + "loss": 0.9609, + "step": 25705 + }, + { + "epoch": 0.66, + "learning_rate": 1.8172819755685976e-06, + "loss": 0.9326, + "step": 25706 + }, + { + "epoch": 0.66, + "learning_rate": 1.817266030490156e-06, + "loss": 0.9258, + "step": 25707 + }, + { + "epoch": 0.66, + "learning_rate": 1.8172500847859711e-06, + "loss": 0.7842, + "step": 25708 + }, + { + "epoch": 0.66, + "learning_rate": 1.8172341384560554e-06, + "loss": 0.8262, + "step": 25709 + }, + { + "epoch": 0.66, + "learning_rate": 1.8172181915004213e-06, + "loss": 0.6383, + "step": 25710 + }, + { + "epoch": 0.66, + "learning_rate": 1.8172022439190806e-06, + "loss": 0.7754, + "step": 25711 + }, + { + "epoch": 0.66, + "learning_rate": 1.8171862957120458e-06, + "loss": 1.0596, + "step": 25712 + }, + { + "epoch": 0.66, + "learning_rate": 1.8171703468793292e-06, + "loss": 1.0967, + "step": 25713 + }, + { + "epoch": 0.66, + "learning_rate": 1.8171543974209426e-06, + "loss": 0.772, + "step": 25714 + }, + { + "epoch": 0.66, + "learning_rate": 1.8171384473368984e-06, + "loss": 0.8252, + "step": 25715 + }, + { + "epoch": 0.66, + "learning_rate": 1.817122496627209e-06, + "loss": 0.8096, + "step": 25716 + }, + { + "epoch": 0.66, + "learning_rate": 1.8171065452918866e-06, + "loss": 0.7793, + "step": 25717 + }, + { + "epoch": 0.66, + "learning_rate": 1.8170905933309428e-06, + "loss": 0.7871, + "step": 25718 + }, + { + "epoch": 0.66, + "learning_rate": 1.8170746407443906e-06, + "loss": 0.7334, + "step": 25719 + }, + { + "epoch": 0.66, + "learning_rate": 1.817058687532242e-06, + "loss": 0.915, + "step": 25720 + }, + { + "epoch": 0.66, + "learning_rate": 1.8170427336945092e-06, + "loss": 0.8271, + "step": 25721 + }, + { + "epoch": 0.66, + "learning_rate": 1.8170267792312042e-06, + "loss": 0.9111, + "step": 25722 + }, + { + "epoch": 0.66, + "learning_rate": 1.8170108241423395e-06, + "loss": 0.9609, + "step": 25723 + }, + { + "epoch": 0.66, + "learning_rate": 1.8169948684279271e-06, + "loss": 1.0107, + "step": 25724 + }, + { + "epoch": 0.66, + "learning_rate": 1.8169789120879793e-06, + "loss": 0.7754, + "step": 25725 + }, + { + "epoch": 0.66, + "learning_rate": 1.8169629551225084e-06, + "loss": 0.917, + "step": 25726 + }, + { + "epoch": 0.66, + "learning_rate": 1.8169469975315263e-06, + "loss": 0.8574, + "step": 25727 + }, + { + "epoch": 0.66, + "learning_rate": 1.8169310393150456e-06, + "loss": 0.8281, + "step": 25728 + }, + { + "epoch": 0.66, + "learning_rate": 1.8169150804730783e-06, + "loss": 0.8125, + "step": 25729 + }, + { + "epoch": 0.66, + "learning_rate": 1.8168991210056368e-06, + "loss": 0.9897, + "step": 25730 + }, + { + "epoch": 0.66, + "learning_rate": 1.816883160912733e-06, + "loss": 0.9658, + "step": 25731 + }, + { + "epoch": 0.66, + "learning_rate": 1.8168672001943794e-06, + "loss": 0.7852, + "step": 25732 + }, + { + "epoch": 0.66, + "learning_rate": 1.8168512388505884e-06, + "loss": 0.6357, + "step": 25733 + }, + { + "epoch": 0.66, + "learning_rate": 1.8168352768813716e-06, + "loss": 0.9492, + "step": 25734 + }, + { + "epoch": 0.66, + "learning_rate": 1.816819314286742e-06, + "loss": 0.833, + "step": 25735 + }, + { + "epoch": 0.66, + "learning_rate": 1.816803351066711e-06, + "loss": 0.8965, + "step": 25736 + }, + { + "epoch": 0.66, + "learning_rate": 1.8167873872212914e-06, + "loss": 0.9297, + "step": 25737 + }, + { + "epoch": 0.66, + "learning_rate": 1.8167714227504951e-06, + "loss": 1.002, + "step": 25738 + }, + { + "epoch": 0.66, + "learning_rate": 1.8167554576543349e-06, + "loss": 0.8506, + "step": 25739 + }, + { + "epoch": 0.66, + "learning_rate": 1.816739491932822e-06, + "loss": 0.8076, + "step": 25740 + }, + { + "epoch": 0.66, + "learning_rate": 1.8167235255859698e-06, + "loss": 1.0527, + "step": 25741 + }, + { + "epoch": 0.66, + "learning_rate": 1.8167075586137897e-06, + "loss": 0.8711, + "step": 25742 + }, + { + "epoch": 0.66, + "learning_rate": 1.8166915910162942e-06, + "loss": 0.8799, + "step": 25743 + }, + { + "epoch": 0.66, + "learning_rate": 1.8166756227934954e-06, + "loss": 0.8037, + "step": 25744 + }, + { + "epoch": 0.66, + "learning_rate": 1.8166596539454058e-06, + "loss": 0.79, + "step": 25745 + }, + { + "epoch": 0.66, + "learning_rate": 1.8166436844720372e-06, + "loss": 0.791, + "step": 25746 + }, + { + "epoch": 0.66, + "learning_rate": 1.8166277143734022e-06, + "loss": 0.8682, + "step": 25747 + }, + { + "epoch": 0.66, + "learning_rate": 1.816611743649513e-06, + "loss": 0.8423, + "step": 25748 + }, + { + "epoch": 0.66, + "learning_rate": 1.8165957723003818e-06, + "loss": 0.7191, + "step": 25749 + }, + { + "epoch": 0.66, + "learning_rate": 1.8165798003260203e-06, + "loss": 0.8135, + "step": 25750 + }, + { + "epoch": 0.66, + "learning_rate": 1.816563827726442e-06, + "loss": 0.8706, + "step": 25751 + }, + { + "epoch": 0.66, + "learning_rate": 1.8165478545016576e-06, + "loss": 1.0635, + "step": 25752 + }, + { + "epoch": 0.66, + "learning_rate": 1.8165318806516804e-06, + "loss": 0.9727, + "step": 25753 + }, + { + "epoch": 0.66, + "learning_rate": 1.8165159061765223e-06, + "loss": 0.915, + "step": 25754 + }, + { + "epoch": 0.66, + "learning_rate": 1.8164999310761954e-06, + "loss": 0.8203, + "step": 25755 + }, + { + "epoch": 0.66, + "learning_rate": 1.8164839553507121e-06, + "loss": 0.8447, + "step": 25756 + }, + { + "epoch": 0.66, + "learning_rate": 1.8164679790000846e-06, + "loss": 0.8525, + "step": 25757 + }, + { + "epoch": 0.66, + "learning_rate": 1.816452002024325e-06, + "loss": 0.7959, + "step": 25758 + }, + { + "epoch": 0.66, + "learning_rate": 1.8164360244234459e-06, + "loss": 0.8496, + "step": 25759 + }, + { + "epoch": 0.66, + "learning_rate": 1.8164200461974588e-06, + "loss": 0.7305, + "step": 25760 + }, + { + "epoch": 0.66, + "learning_rate": 1.8164040673463767e-06, + "loss": 0.8672, + "step": 25761 + }, + { + "epoch": 0.66, + "learning_rate": 1.8163880878702116e-06, + "loss": 0.9521, + "step": 25762 + }, + { + "epoch": 0.66, + "learning_rate": 1.8163721077689757e-06, + "loss": 0.7515, + "step": 25763 + }, + { + "epoch": 0.66, + "learning_rate": 1.816356127042681e-06, + "loss": 0.8462, + "step": 25764 + }, + { + "epoch": 0.66, + "learning_rate": 1.8163401456913402e-06, + "loss": 0.9912, + "step": 25765 + }, + { + "epoch": 0.66, + "learning_rate": 1.816324163714965e-06, + "loss": 0.8301, + "step": 25766 + }, + { + "epoch": 0.66, + "learning_rate": 1.8163081811135683e-06, + "loss": 0.999, + "step": 25767 + }, + { + "epoch": 0.66, + "learning_rate": 1.8162921978871616e-06, + "loss": 0.5903, + "step": 25768 + }, + { + "epoch": 0.66, + "learning_rate": 1.8162762140357577e-06, + "loss": 0.7783, + "step": 25769 + }, + { + "epoch": 0.66, + "learning_rate": 1.8162602295593686e-06, + "loss": 0.8936, + "step": 25770 + }, + { + "epoch": 0.66, + "learning_rate": 1.8162442444580064e-06, + "loss": 0.8965, + "step": 25771 + }, + { + "epoch": 0.66, + "learning_rate": 1.8162282587316837e-06, + "loss": 0.7065, + "step": 25772 + }, + { + "epoch": 0.66, + "learning_rate": 1.8162122723804126e-06, + "loss": 0.7158, + "step": 25773 + }, + { + "epoch": 0.66, + "learning_rate": 1.8161962854042052e-06, + "loss": 0.8145, + "step": 25774 + }, + { + "epoch": 0.66, + "learning_rate": 1.8161802978030737e-06, + "loss": 0.6084, + "step": 25775 + }, + { + "epoch": 0.66, + "learning_rate": 1.8161643095770307e-06, + "loss": 0.8198, + "step": 25776 + }, + { + "epoch": 0.66, + "learning_rate": 1.8161483207260883e-06, + "loss": 1.04, + "step": 25777 + }, + { + "epoch": 0.66, + "learning_rate": 1.8161323312502584e-06, + "loss": 0.8564, + "step": 25778 + }, + { + "epoch": 0.66, + "learning_rate": 1.8161163411495538e-06, + "loss": 0.603, + "step": 25779 + }, + { + "epoch": 0.66, + "learning_rate": 1.8161003504239862e-06, + "loss": 0.7246, + "step": 25780 + }, + { + "epoch": 0.66, + "learning_rate": 1.8160843590735682e-06, + "loss": 0.5781, + "step": 25781 + }, + { + "epoch": 0.66, + "learning_rate": 1.8160683670983117e-06, + "loss": 0.8882, + "step": 25782 + }, + { + "epoch": 0.66, + "learning_rate": 1.8160523744982295e-06, + "loss": 0.7627, + "step": 25783 + }, + { + "epoch": 0.66, + "learning_rate": 1.8160363812733333e-06, + "loss": 1.0342, + "step": 25784 + }, + { + "epoch": 0.66, + "learning_rate": 1.8160203874236355e-06, + "loss": 0.7881, + "step": 25785 + }, + { + "epoch": 0.66, + "learning_rate": 1.8160043929491486e-06, + "loss": 0.8818, + "step": 25786 + }, + { + "epoch": 0.66, + "learning_rate": 1.8159883978498845e-06, + "loss": 0.7471, + "step": 25787 + }, + { + "epoch": 0.66, + "learning_rate": 1.815972402125856e-06, + "loss": 1.0322, + "step": 25788 + }, + { + "epoch": 0.66, + "learning_rate": 1.8159564057770744e-06, + "loss": 0.6826, + "step": 25789 + }, + { + "epoch": 0.66, + "learning_rate": 1.8159404088035527e-06, + "loss": 0.8701, + "step": 25790 + }, + { + "epoch": 0.66, + "learning_rate": 1.8159244112053032e-06, + "loss": 1.0215, + "step": 25791 + }, + { + "epoch": 0.66, + "learning_rate": 1.8159084129823376e-06, + "loss": 0.7031, + "step": 25792 + }, + { + "epoch": 0.66, + "learning_rate": 1.8158924141346686e-06, + "loss": 0.6851, + "step": 25793 + }, + { + "epoch": 0.66, + "learning_rate": 1.8158764146623082e-06, + "loss": 1.0088, + "step": 25794 + }, + { + "epoch": 0.66, + "learning_rate": 1.8158604145652687e-06, + "loss": 0.7266, + "step": 25795 + }, + { + "epoch": 0.66, + "learning_rate": 1.8158444138435626e-06, + "loss": 0.9238, + "step": 25796 + }, + { + "epoch": 0.66, + "learning_rate": 1.8158284124972015e-06, + "loss": 0.6162, + "step": 25797 + }, + { + "epoch": 0.66, + "learning_rate": 1.8158124105261984e-06, + "loss": 0.9463, + "step": 25798 + }, + { + "epoch": 0.66, + "learning_rate": 1.8157964079305655e-06, + "loss": 1.0576, + "step": 25799 + }, + { + "epoch": 0.66, + "learning_rate": 1.8157804047103147e-06, + "loss": 1.041, + "step": 25800 + }, + { + "epoch": 0.66, + "learning_rate": 1.8157644008654583e-06, + "loss": 0.7305, + "step": 25801 + }, + { + "epoch": 0.66, + "learning_rate": 1.8157483963960083e-06, + "loss": 1.0137, + "step": 25802 + }, + { + "epoch": 0.66, + "learning_rate": 1.8157323913019775e-06, + "loss": 0.6909, + "step": 25803 + }, + { + "epoch": 0.66, + "learning_rate": 1.815716385583378e-06, + "loss": 0.6221, + "step": 25804 + }, + { + "epoch": 0.66, + "learning_rate": 1.815700379240222e-06, + "loss": 0.8721, + "step": 25805 + }, + { + "epoch": 0.66, + "learning_rate": 1.8156843722725213e-06, + "loss": 0.7314, + "step": 25806 + }, + { + "epoch": 0.66, + "learning_rate": 1.815668364680289e-06, + "loss": 0.7129, + "step": 25807 + }, + { + "epoch": 0.66, + "learning_rate": 1.8156523564635369e-06, + "loss": 0.7588, + "step": 25808 + }, + { + "epoch": 0.66, + "learning_rate": 1.815636347622277e-06, + "loss": 0.7642, + "step": 25809 + }, + { + "epoch": 0.66, + "learning_rate": 1.8156203381565223e-06, + "loss": 0.7959, + "step": 25810 + }, + { + "epoch": 0.66, + "learning_rate": 1.8156043280662842e-06, + "loss": 0.9453, + "step": 25811 + }, + { + "epoch": 0.66, + "learning_rate": 1.8155883173515755e-06, + "loss": 1.248, + "step": 25812 + }, + { + "epoch": 0.66, + "learning_rate": 1.8155723060124086e-06, + "loss": 0.5811, + "step": 25813 + }, + { + "epoch": 0.66, + "learning_rate": 1.8155562940487951e-06, + "loss": 0.7881, + "step": 25814 + }, + { + "epoch": 0.66, + "learning_rate": 1.815540281460748e-06, + "loss": 0.7715, + "step": 25815 + }, + { + "epoch": 0.66, + "learning_rate": 1.8155242682482789e-06, + "loss": 0.8799, + "step": 25816 + }, + { + "epoch": 0.66, + "learning_rate": 1.8155082544114004e-06, + "loss": 0.9482, + "step": 25817 + }, + { + "epoch": 0.66, + "learning_rate": 1.8154922399501248e-06, + "loss": 0.6206, + "step": 25818 + }, + { + "epoch": 0.66, + "learning_rate": 1.8154762248644644e-06, + "loss": 0.9023, + "step": 25819 + }, + { + "epoch": 0.66, + "learning_rate": 1.8154602091544313e-06, + "loss": 0.7881, + "step": 25820 + }, + { + "epoch": 0.66, + "learning_rate": 1.8154441928200376e-06, + "loss": 0.8379, + "step": 25821 + }, + { + "epoch": 0.66, + "learning_rate": 1.815428175861296e-06, + "loss": 1.0215, + "step": 25822 + }, + { + "epoch": 0.66, + "learning_rate": 1.8154121582782184e-06, + "loss": 1.0469, + "step": 25823 + }, + { + "epoch": 0.66, + "learning_rate": 1.8153961400708172e-06, + "loss": 0.9395, + "step": 25824 + }, + { + "epoch": 0.66, + "learning_rate": 1.815380121239105e-06, + "loss": 0.793, + "step": 25825 + }, + { + "epoch": 0.66, + "learning_rate": 1.8153641017830933e-06, + "loss": 0.9053, + "step": 25826 + }, + { + "epoch": 0.66, + "learning_rate": 1.8153480817027951e-06, + "loss": 0.9121, + "step": 25827 + }, + { + "epoch": 0.66, + "learning_rate": 1.8153320609982222e-06, + "loss": 0.6235, + "step": 25828 + }, + { + "epoch": 0.66, + "learning_rate": 1.8153160396693871e-06, + "loss": 0.876, + "step": 25829 + }, + { + "epoch": 0.66, + "learning_rate": 1.815300017716302e-06, + "loss": 0.8408, + "step": 25830 + }, + { + "epoch": 0.66, + "learning_rate": 1.8152839951389791e-06, + "loss": 0.8086, + "step": 25831 + }, + { + "epoch": 0.66, + "learning_rate": 1.8152679719374308e-06, + "loss": 1.042, + "step": 25832 + }, + { + "epoch": 0.66, + "learning_rate": 1.8152519481116694e-06, + "loss": 0.8376, + "step": 25833 + }, + { + "epoch": 0.66, + "learning_rate": 1.815235923661707e-06, + "loss": 0.9453, + "step": 25834 + }, + { + "epoch": 0.66, + "learning_rate": 1.8152198985875558e-06, + "loss": 0.8984, + "step": 25835 + }, + { + "epoch": 0.66, + "learning_rate": 1.8152038728892282e-06, + "loss": 0.8594, + "step": 25836 + }, + { + "epoch": 0.66, + "learning_rate": 1.8151878465667366e-06, + "loss": 0.8115, + "step": 25837 + }, + { + "epoch": 0.66, + "learning_rate": 1.815171819620093e-06, + "loss": 0.9688, + "step": 25838 + }, + { + "epoch": 0.66, + "learning_rate": 1.81515579204931e-06, + "loss": 1.0273, + "step": 25839 + }, + { + "epoch": 0.66, + "learning_rate": 1.8151397638543997e-06, + "loss": 1.0264, + "step": 25840 + }, + { + "epoch": 0.66, + "learning_rate": 1.8151237350353742e-06, + "loss": 0.9844, + "step": 25841 + }, + { + "epoch": 0.66, + "learning_rate": 1.8151077055922462e-06, + "loss": 0.8828, + "step": 25842 + }, + { + "epoch": 0.66, + "learning_rate": 1.8150916755250276e-06, + "loss": 0.9316, + "step": 25843 + }, + { + "epoch": 0.66, + "learning_rate": 1.8150756448337305e-06, + "loss": 0.8477, + "step": 25844 + }, + { + "epoch": 0.66, + "learning_rate": 1.8150596135183678e-06, + "loss": 1.0059, + "step": 25845 + }, + { + "epoch": 0.66, + "learning_rate": 1.8150435815789513e-06, + "loss": 0.8916, + "step": 25846 + }, + { + "epoch": 0.66, + "learning_rate": 1.8150275490154934e-06, + "loss": 0.9102, + "step": 25847 + }, + { + "epoch": 0.66, + "learning_rate": 1.8150115158280066e-06, + "loss": 1.002, + "step": 25848 + }, + { + "epoch": 0.66, + "learning_rate": 1.8149954820165029e-06, + "loss": 0.8364, + "step": 25849 + }, + { + "epoch": 0.66, + "learning_rate": 1.8149794475809942e-06, + "loss": 0.7471, + "step": 25850 + }, + { + "epoch": 0.66, + "learning_rate": 1.8149634125214934e-06, + "loss": 0.6399, + "step": 25851 + }, + { + "epoch": 0.66, + "learning_rate": 1.8149473768380128e-06, + "loss": 0.8203, + "step": 25852 + }, + { + "epoch": 0.66, + "learning_rate": 1.8149313405305644e-06, + "loss": 0.9414, + "step": 25853 + }, + { + "epoch": 0.66, + "learning_rate": 1.8149153035991605e-06, + "loss": 0.8833, + "step": 25854 + }, + { + "epoch": 0.66, + "learning_rate": 1.8148992660438135e-06, + "loss": 0.9072, + "step": 25855 + }, + { + "epoch": 0.66, + "learning_rate": 1.8148832278645354e-06, + "loss": 0.9287, + "step": 25856 + }, + { + "epoch": 0.66, + "learning_rate": 1.814867189061339e-06, + "loss": 0.834, + "step": 25857 + }, + { + "epoch": 0.66, + "learning_rate": 1.814851149634236e-06, + "loss": 0.9824, + "step": 25858 + }, + { + "epoch": 0.66, + "learning_rate": 1.8148351095832389e-06, + "loss": 0.6895, + "step": 25859 + }, + { + "epoch": 0.66, + "learning_rate": 1.8148190689083601e-06, + "loss": 0.8735, + "step": 25860 + }, + { + "epoch": 0.66, + "learning_rate": 1.8148030276096118e-06, + "loss": 0.9092, + "step": 25861 + }, + { + "epoch": 0.66, + "learning_rate": 1.8147869856870065e-06, + "loss": 0.7388, + "step": 25862 + }, + { + "epoch": 0.66, + "learning_rate": 1.814770943140556e-06, + "loss": 0.8848, + "step": 25863 + }, + { + "epoch": 0.66, + "learning_rate": 1.814754899970273e-06, + "loss": 0.8682, + "step": 25864 + }, + { + "epoch": 0.66, + "learning_rate": 1.8147388561761696e-06, + "loss": 0.9502, + "step": 25865 + }, + { + "epoch": 0.66, + "learning_rate": 1.814722811758258e-06, + "loss": 0.7476, + "step": 25866 + }, + { + "epoch": 0.66, + "learning_rate": 1.8147067667165509e-06, + "loss": 0.8223, + "step": 25867 + }, + { + "epoch": 0.66, + "learning_rate": 1.81469072105106e-06, + "loss": 0.7588, + "step": 25868 + }, + { + "epoch": 0.66, + "learning_rate": 1.814674674761798e-06, + "loss": 0.8262, + "step": 25869 + }, + { + "epoch": 0.66, + "learning_rate": 1.814658627848777e-06, + "loss": 0.7471, + "step": 25870 + }, + { + "epoch": 0.66, + "learning_rate": 1.8146425803120095e-06, + "loss": 0.8555, + "step": 25871 + }, + { + "epoch": 0.66, + "learning_rate": 1.8146265321515074e-06, + "loss": 0.8721, + "step": 25872 + }, + { + "epoch": 0.66, + "learning_rate": 1.8146104833672834e-06, + "loss": 0.7236, + "step": 25873 + }, + { + "epoch": 0.66, + "learning_rate": 1.8145944339593495e-06, + "loss": 0.7722, + "step": 25874 + }, + { + "epoch": 0.66, + "learning_rate": 1.8145783839277181e-06, + "loss": 0.9277, + "step": 25875 + }, + { + "epoch": 0.66, + "learning_rate": 1.8145623332724016e-06, + "loss": 0.9326, + "step": 25876 + }, + { + "epoch": 0.66, + "learning_rate": 1.8145462819934121e-06, + "loss": 0.9238, + "step": 25877 + }, + { + "epoch": 0.66, + "learning_rate": 1.814530230090762e-06, + "loss": 0.6428, + "step": 25878 + }, + { + "epoch": 0.66, + "learning_rate": 1.8145141775644634e-06, + "loss": 0.7793, + "step": 25879 + }, + { + "epoch": 0.66, + "learning_rate": 1.8144981244145292e-06, + "loss": 1.1006, + "step": 25880 + }, + { + "epoch": 0.66, + "learning_rate": 1.8144820706409707e-06, + "loss": 1.0049, + "step": 25881 + }, + { + "epoch": 0.66, + "learning_rate": 1.814466016243801e-06, + "loss": 0.9229, + "step": 25882 + }, + { + "epoch": 0.66, + "learning_rate": 1.814449961223032e-06, + "loss": 0.9502, + "step": 25883 + }, + { + "epoch": 0.66, + "learning_rate": 1.8144339055786762e-06, + "loss": 0.6499, + "step": 25884 + }, + { + "epoch": 0.66, + "learning_rate": 1.8144178493107459e-06, + "loss": 0.9883, + "step": 25885 + }, + { + "epoch": 0.66, + "learning_rate": 1.8144017924192532e-06, + "loss": 0.9189, + "step": 25886 + }, + { + "epoch": 0.66, + "learning_rate": 1.8143857349042105e-06, + "loss": 0.9824, + "step": 25887 + }, + { + "epoch": 0.66, + "learning_rate": 1.81436967676563e-06, + "loss": 1.0186, + "step": 25888 + }, + { + "epoch": 0.66, + "learning_rate": 1.8143536180035241e-06, + "loss": 0.7598, + "step": 25889 + }, + { + "epoch": 0.66, + "learning_rate": 1.8143375586179053e-06, + "loss": 0.6914, + "step": 25890 + }, + { + "epoch": 0.66, + "learning_rate": 1.8143214986087854e-06, + "loss": 0.7268, + "step": 25891 + }, + { + "epoch": 0.66, + "learning_rate": 1.8143054379761772e-06, + "loss": 0.8789, + "step": 25892 + }, + { + "epoch": 0.66, + "learning_rate": 1.8142893767200927e-06, + "loss": 0.7861, + "step": 25893 + }, + { + "epoch": 0.66, + "learning_rate": 1.8142733148405442e-06, + "loss": 0.9141, + "step": 25894 + }, + { + "epoch": 0.66, + "learning_rate": 1.8142572523375442e-06, + "loss": 0.8584, + "step": 25895 + }, + { + "epoch": 0.66, + "learning_rate": 1.8142411892111045e-06, + "loss": 1.0225, + "step": 25896 + }, + { + "epoch": 0.66, + "learning_rate": 1.8142251254612381e-06, + "loss": 0.9297, + "step": 25897 + }, + { + "epoch": 0.66, + "learning_rate": 1.8142090610879568e-06, + "loss": 0.8936, + "step": 25898 + }, + { + "epoch": 0.66, + "learning_rate": 1.8141929960912732e-06, + "loss": 0.8389, + "step": 25899 + }, + { + "epoch": 0.66, + "learning_rate": 1.8141769304711994e-06, + "loss": 0.8848, + "step": 25900 + }, + { + "epoch": 0.66, + "learning_rate": 1.8141608642277477e-06, + "loss": 1.1172, + "step": 25901 + }, + { + "epoch": 0.66, + "learning_rate": 1.8141447973609308e-06, + "loss": 0.8867, + "step": 25902 + }, + { + "epoch": 0.66, + "learning_rate": 1.81412872987076e-06, + "loss": 0.8418, + "step": 25903 + }, + { + "epoch": 0.66, + "learning_rate": 1.814112661757249e-06, + "loss": 0.9072, + "step": 25904 + }, + { + "epoch": 0.66, + "learning_rate": 1.8140965930204088e-06, + "loss": 0.8926, + "step": 25905 + }, + { + "epoch": 0.66, + "learning_rate": 1.8140805236602525e-06, + "loss": 1.0654, + "step": 25906 + }, + { + "epoch": 0.66, + "learning_rate": 1.814064453676792e-06, + "loss": 0.9502, + "step": 25907 + }, + { + "epoch": 0.66, + "learning_rate": 1.81404838307004e-06, + "loss": 0.835, + "step": 25908 + }, + { + "epoch": 0.66, + "learning_rate": 1.8140323118400084e-06, + "loss": 0.7847, + "step": 25909 + }, + { + "epoch": 0.66, + "learning_rate": 1.81401623998671e-06, + "loss": 0.9346, + "step": 25910 + }, + { + "epoch": 0.66, + "learning_rate": 1.814000167510157e-06, + "loss": 1.0518, + "step": 25911 + }, + { + "epoch": 0.66, + "learning_rate": 1.8139840944103608e-06, + "loss": 0.9297, + "step": 25912 + }, + { + "epoch": 0.66, + "learning_rate": 1.8139680206873346e-06, + "loss": 0.9268, + "step": 25913 + }, + { + "epoch": 0.66, + "learning_rate": 1.8139519463410905e-06, + "loss": 0.7446, + "step": 25914 + }, + { + "epoch": 0.66, + "learning_rate": 1.8139358713716413e-06, + "loss": 0.8633, + "step": 25915 + }, + { + "epoch": 0.66, + "learning_rate": 1.8139197957789984e-06, + "loss": 0.835, + "step": 25916 + }, + { + "epoch": 0.66, + "learning_rate": 1.8139037195631746e-06, + "loss": 0.8003, + "step": 25917 + }, + { + "epoch": 0.66, + "learning_rate": 1.813887642724182e-06, + "loss": 0.6895, + "step": 25918 + }, + { + "epoch": 0.66, + "learning_rate": 1.8138715652620332e-06, + "loss": 0.9805, + "step": 25919 + }, + { + "epoch": 0.66, + "learning_rate": 1.8138554871767407e-06, + "loss": 0.9072, + "step": 25920 + }, + { + "epoch": 0.66, + "learning_rate": 1.8138394084683162e-06, + "loss": 0.7422, + "step": 25921 + }, + { + "epoch": 0.66, + "learning_rate": 1.8138233291367722e-06, + "loss": 0.9004, + "step": 25922 + }, + { + "epoch": 0.66, + "learning_rate": 1.813807249182121e-06, + "loss": 0.7754, + "step": 25923 + }, + { + "epoch": 0.66, + "learning_rate": 1.8137911686043752e-06, + "loss": 0.749, + "step": 25924 + }, + { + "epoch": 0.66, + "learning_rate": 1.8137750874035469e-06, + "loss": 0.6519, + "step": 25925 + }, + { + "epoch": 0.66, + "learning_rate": 1.8137590055796483e-06, + "loss": 0.7725, + "step": 25926 + }, + { + "epoch": 0.66, + "learning_rate": 1.813742923132692e-06, + "loss": 0.6763, + "step": 25927 + }, + { + "epoch": 0.66, + "learning_rate": 1.8137268400626902e-06, + "loss": 0.8389, + "step": 25928 + }, + { + "epoch": 0.66, + "learning_rate": 1.813710756369655e-06, + "loss": 0.7705, + "step": 25929 + }, + { + "epoch": 0.66, + "learning_rate": 1.813694672053599e-06, + "loss": 0.876, + "step": 25930 + }, + { + "epoch": 0.66, + "learning_rate": 1.8136785871145343e-06, + "loss": 1.0449, + "step": 25931 + }, + { + "epoch": 0.66, + "learning_rate": 1.8136625015524736e-06, + "loss": 0.9087, + "step": 25932 + }, + { + "epoch": 0.66, + "learning_rate": 1.8136464153674287e-06, + "loss": 0.6377, + "step": 25933 + }, + { + "epoch": 0.66, + "learning_rate": 1.813630328559412e-06, + "loss": 0.7549, + "step": 25934 + }, + { + "epoch": 0.66, + "learning_rate": 1.8136142411284362e-06, + "loss": 0.9883, + "step": 25935 + }, + { + "epoch": 0.66, + "learning_rate": 1.8135981530745136e-06, + "loss": 0.6226, + "step": 25936 + }, + { + "epoch": 0.66, + "learning_rate": 1.8135820643976558e-06, + "loss": 1.0234, + "step": 25937 + }, + { + "epoch": 0.66, + "learning_rate": 1.813565975097876e-06, + "loss": 0.7114, + "step": 25938 + }, + { + "epoch": 0.66, + "learning_rate": 1.813549885175186e-06, + "loss": 0.9092, + "step": 25939 + }, + { + "epoch": 0.66, + "learning_rate": 1.8135337946295984e-06, + "loss": 0.8965, + "step": 25940 + }, + { + "epoch": 0.66, + "learning_rate": 1.8135177034611254e-06, + "loss": 0.8623, + "step": 25941 + }, + { + "epoch": 0.66, + "learning_rate": 1.8135016116697787e-06, + "loss": 1.0254, + "step": 25942 + }, + { + "epoch": 0.66, + "learning_rate": 1.8134855192555718e-06, + "loss": 1.0098, + "step": 25943 + }, + { + "epoch": 0.66, + "learning_rate": 1.8134694262185164e-06, + "loss": 1.0225, + "step": 25944 + }, + { + "epoch": 0.66, + "learning_rate": 1.813453332558625e-06, + "loss": 0.7734, + "step": 25945 + }, + { + "epoch": 0.67, + "learning_rate": 1.8134372382759096e-06, + "loss": 0.9834, + "step": 25946 + }, + { + "epoch": 0.67, + "learning_rate": 1.8134211433703825e-06, + "loss": 1.0586, + "step": 25947 + }, + { + "epoch": 0.67, + "learning_rate": 1.8134050478420565e-06, + "loss": 0.7969, + "step": 25948 + }, + { + "epoch": 0.67, + "learning_rate": 1.8133889516909435e-06, + "loss": 0.7744, + "step": 25949 + }, + { + "epoch": 0.67, + "learning_rate": 1.813372854917056e-06, + "loss": 0.9619, + "step": 25950 + }, + { + "epoch": 0.67, + "learning_rate": 1.8133567575204065e-06, + "loss": 0.7827, + "step": 25951 + }, + { + "epoch": 0.67, + "learning_rate": 1.8133406595010067e-06, + "loss": 0.8652, + "step": 25952 + }, + { + "epoch": 0.67, + "learning_rate": 1.8133245608588698e-06, + "loss": 0.6391, + "step": 25953 + }, + { + "epoch": 0.67, + "learning_rate": 1.8133084615940074e-06, + "loss": 0.873, + "step": 25954 + }, + { + "epoch": 0.67, + "learning_rate": 1.8132923617064325e-06, + "loss": 1.0596, + "step": 25955 + }, + { + "epoch": 0.67, + "learning_rate": 1.8132762611961568e-06, + "loss": 1.0635, + "step": 25956 + }, + { + "epoch": 0.67, + "learning_rate": 1.8132601600631927e-06, + "loss": 0.9658, + "step": 25957 + }, + { + "epoch": 0.67, + "learning_rate": 1.813244058307553e-06, + "loss": 0.752, + "step": 25958 + }, + { + "epoch": 0.67, + "learning_rate": 1.8132279559292493e-06, + "loss": 0.6616, + "step": 25959 + }, + { + "epoch": 0.67, + "learning_rate": 1.8132118529282946e-06, + "loss": 0.771, + "step": 25960 + }, + { + "epoch": 0.67, + "learning_rate": 1.8131957493047013e-06, + "loss": 1.252, + "step": 25961 + }, + { + "epoch": 0.67, + "learning_rate": 1.8131796450584807e-06, + "loss": 1.0293, + "step": 25962 + }, + { + "epoch": 0.67, + "learning_rate": 1.8131635401896464e-06, + "loss": 0.7891, + "step": 25963 + }, + { + "epoch": 0.67, + "learning_rate": 1.8131474346982099e-06, + "loss": 0.9111, + "step": 25964 + }, + { + "epoch": 0.67, + "learning_rate": 1.813131328584184e-06, + "loss": 0.8779, + "step": 25965 + }, + { + "epoch": 0.67, + "learning_rate": 1.8131152218475804e-06, + "loss": 0.9834, + "step": 25966 + }, + { + "epoch": 0.67, + "learning_rate": 1.8130991144884123e-06, + "loss": 0.8311, + "step": 25967 + }, + { + "epoch": 0.67, + "learning_rate": 1.8130830065066915e-06, + "loss": 0.8291, + "step": 25968 + }, + { + "epoch": 0.67, + "learning_rate": 1.8130668979024303e-06, + "loss": 0.873, + "step": 25969 + }, + { + "epoch": 0.67, + "learning_rate": 1.8130507886756412e-06, + "loss": 1.0625, + "step": 25970 + }, + { + "epoch": 0.67, + "learning_rate": 1.8130346788263368e-06, + "loss": 0.7964, + "step": 25971 + }, + { + "epoch": 0.67, + "learning_rate": 1.8130185683545287e-06, + "loss": 0.7959, + "step": 25972 + }, + { + "epoch": 0.67, + "learning_rate": 1.81300245726023e-06, + "loss": 0.998, + "step": 25973 + }, + { + "epoch": 0.67, + "learning_rate": 1.8129863455434525e-06, + "loss": 0.9189, + "step": 25974 + }, + { + "epoch": 0.67, + "learning_rate": 1.8129702332042088e-06, + "loss": 0.8799, + "step": 25975 + }, + { + "epoch": 0.67, + "learning_rate": 1.812954120242511e-06, + "loss": 0.7192, + "step": 25976 + }, + { + "epoch": 0.67, + "learning_rate": 1.8129380066583719e-06, + "loss": 0.8857, + "step": 25977 + }, + { + "epoch": 0.67, + "learning_rate": 1.8129218924518032e-06, + "loss": 0.7964, + "step": 25978 + }, + { + "epoch": 0.67, + "learning_rate": 1.812905777622818e-06, + "loss": 0.7471, + "step": 25979 + }, + { + "epoch": 0.67, + "learning_rate": 1.812889662171428e-06, + "loss": 0.9951, + "step": 25980 + }, + { + "epoch": 0.67, + "learning_rate": 1.812873546097646e-06, + "loss": 0.575, + "step": 25981 + }, + { + "epoch": 0.67, + "learning_rate": 1.8128574294014838e-06, + "loss": 0.6853, + "step": 25982 + }, + { + "epoch": 0.67, + "learning_rate": 1.8128413120829541e-06, + "loss": 0.876, + "step": 25983 + }, + { + "epoch": 0.67, + "learning_rate": 1.8128251941420692e-06, + "loss": 0.7646, + "step": 25984 + }, + { + "epoch": 0.67, + "learning_rate": 1.8128090755788414e-06, + "loss": 0.7158, + "step": 25985 + }, + { + "epoch": 0.67, + "learning_rate": 1.812792956393283e-06, + "loss": 0.8096, + "step": 25986 + }, + { + "epoch": 0.67, + "learning_rate": 1.8127768365854066e-06, + "loss": 0.876, + "step": 25987 + }, + { + "epoch": 0.67, + "learning_rate": 1.8127607161552243e-06, + "loss": 0.9492, + "step": 25988 + }, + { + "epoch": 0.67, + "learning_rate": 1.8127445951027484e-06, + "loss": 0.999, + "step": 25989 + }, + { + "epoch": 0.67, + "learning_rate": 1.8127284734279914e-06, + "loss": 0.9355, + "step": 25990 + }, + { + "epoch": 0.67, + "learning_rate": 1.8127123511309657e-06, + "loss": 0.7654, + "step": 25991 + }, + { + "epoch": 0.67, + "learning_rate": 1.8126962282116834e-06, + "loss": 0.9521, + "step": 25992 + }, + { + "epoch": 0.67, + "learning_rate": 1.8126801046701566e-06, + "loss": 0.9287, + "step": 25993 + }, + { + "epoch": 0.67, + "learning_rate": 1.8126639805063989e-06, + "loss": 0.7261, + "step": 25994 + }, + { + "epoch": 0.67, + "learning_rate": 1.812647855720421e-06, + "loss": 1.0332, + "step": 25995 + }, + { + "epoch": 0.67, + "learning_rate": 1.812631730312236e-06, + "loss": 0.8672, + "step": 25996 + }, + { + "epoch": 0.67, + "learning_rate": 1.8126156042818566e-06, + "loss": 0.9375, + "step": 25997 + }, + { + "epoch": 0.67, + "learning_rate": 1.8125994776292948e-06, + "loss": 1.1074, + "step": 25998 + }, + { + "epoch": 0.67, + "learning_rate": 1.8125833503545627e-06, + "loss": 0.7734, + "step": 25999 + }, + { + "epoch": 0.67, + "learning_rate": 1.8125672224576732e-06, + "loss": 1.0771, + "step": 26000 + }, + { + "epoch": 0.67, + "learning_rate": 1.8125510939386382e-06, + "loss": 1.0781, + "step": 26001 + }, + { + "epoch": 0.67, + "learning_rate": 1.8125349647974699e-06, + "loss": 1.0527, + "step": 26002 + }, + { + "epoch": 0.67, + "learning_rate": 1.8125188350341812e-06, + "loss": 0.9023, + "step": 26003 + }, + { + "epoch": 0.67, + "learning_rate": 1.8125027046487841e-06, + "loss": 0.8594, + "step": 26004 + }, + { + "epoch": 0.67, + "learning_rate": 1.8124865736412913e-06, + "loss": 0.8652, + "step": 26005 + }, + { + "epoch": 0.67, + "learning_rate": 1.8124704420117144e-06, + "loss": 0.6719, + "step": 26006 + }, + { + "epoch": 0.67, + "learning_rate": 1.8124543097600666e-06, + "loss": 0.8809, + "step": 26007 + }, + { + "epoch": 0.67, + "learning_rate": 1.8124381768863598e-06, + "loss": 0.7139, + "step": 26008 + }, + { + "epoch": 0.67, + "learning_rate": 1.8124220433906067e-06, + "loss": 0.793, + "step": 26009 + }, + { + "epoch": 0.67, + "learning_rate": 1.8124059092728193e-06, + "loss": 0.8613, + "step": 26010 + }, + { + "epoch": 0.67, + "learning_rate": 1.8123897745330096e-06, + "loss": 0.9453, + "step": 26011 + }, + { + "epoch": 0.67, + "learning_rate": 1.812373639171191e-06, + "loss": 0.9727, + "step": 26012 + }, + { + "epoch": 0.67, + "learning_rate": 1.8123575031873748e-06, + "loss": 0.8652, + "step": 26013 + }, + { + "epoch": 0.67, + "learning_rate": 1.812341366581574e-06, + "loss": 0.8916, + "step": 26014 + }, + { + "epoch": 0.67, + "learning_rate": 1.8123252293538007e-06, + "loss": 0.6719, + "step": 26015 + }, + { + "epoch": 0.67, + "learning_rate": 1.8123090915040677e-06, + "loss": 0.8428, + "step": 26016 + }, + { + "epoch": 0.67, + "learning_rate": 1.8122929530323865e-06, + "loss": 0.6626, + "step": 26017 + }, + { + "epoch": 0.67, + "learning_rate": 1.8122768139387703e-06, + "loss": 0.7739, + "step": 26018 + }, + { + "epoch": 0.67, + "learning_rate": 1.8122606742232307e-06, + "loss": 0.918, + "step": 26019 + }, + { + "epoch": 0.67, + "learning_rate": 1.8122445338857805e-06, + "loss": 0.7842, + "step": 26020 + }, + { + "epoch": 0.67, + "learning_rate": 1.8122283929264324e-06, + "loss": 0.9404, + "step": 26021 + }, + { + "epoch": 0.67, + "learning_rate": 1.812212251345198e-06, + "loss": 0.8867, + "step": 26022 + }, + { + "epoch": 0.67, + "learning_rate": 1.8121961091420902e-06, + "loss": 0.8594, + "step": 26023 + }, + { + "epoch": 0.67, + "learning_rate": 1.812179966317121e-06, + "loss": 0.7549, + "step": 26024 + }, + { + "epoch": 0.67, + "learning_rate": 1.8121638228703033e-06, + "loss": 1.0312, + "step": 26025 + }, + { + "epoch": 0.67, + "learning_rate": 1.812147678801649e-06, + "loss": 0.8447, + "step": 26026 + }, + { + "epoch": 0.67, + "learning_rate": 1.8121315341111703e-06, + "loss": 0.9453, + "step": 26027 + }, + { + "epoch": 0.67, + "learning_rate": 1.81211538879888e-06, + "loss": 0.8057, + "step": 26028 + }, + { + "epoch": 0.67, + "learning_rate": 1.8120992428647903e-06, + "loss": 0.9414, + "step": 26029 + }, + { + "epoch": 0.67, + "learning_rate": 1.8120830963089136e-06, + "loss": 0.8281, + "step": 26030 + }, + { + "epoch": 0.67, + "learning_rate": 1.8120669491312622e-06, + "loss": 0.9707, + "step": 26031 + }, + { + "epoch": 0.67, + "learning_rate": 1.8120508013318482e-06, + "loss": 0.8076, + "step": 26032 + }, + { + "epoch": 0.67, + "learning_rate": 1.8120346529106844e-06, + "loss": 0.9004, + "step": 26033 + }, + { + "epoch": 0.67, + "learning_rate": 1.812018503867783e-06, + "loss": 0.7305, + "step": 26034 + }, + { + "epoch": 0.67, + "learning_rate": 1.8120023542031567e-06, + "loss": 0.9893, + "step": 26035 + }, + { + "epoch": 0.67, + "learning_rate": 1.8119862039168172e-06, + "loss": 0.8984, + "step": 26036 + }, + { + "epoch": 0.67, + "learning_rate": 1.8119700530087772e-06, + "loss": 0.9619, + "step": 26037 + }, + { + "epoch": 0.67, + "learning_rate": 1.811953901479049e-06, + "loss": 1.1406, + "step": 26038 + }, + { + "epoch": 0.67, + "learning_rate": 1.8119377493276453e-06, + "loss": 0.8877, + "step": 26039 + }, + { + "epoch": 0.67, + "learning_rate": 1.811921596554578e-06, + "loss": 0.813, + "step": 26040 + }, + { + "epoch": 0.67, + "learning_rate": 1.8119054431598598e-06, + "loss": 0.9297, + "step": 26041 + }, + { + "epoch": 0.67, + "learning_rate": 1.8118892891435026e-06, + "loss": 0.8145, + "step": 26042 + }, + { + "epoch": 0.67, + "learning_rate": 1.8118731345055196e-06, + "loss": 0.8643, + "step": 26043 + }, + { + "epoch": 0.67, + "learning_rate": 1.8118569792459223e-06, + "loss": 0.9619, + "step": 26044 + }, + { + "epoch": 0.67, + "learning_rate": 1.8118408233647236e-06, + "loss": 0.7549, + "step": 26045 + }, + { + "epoch": 0.67, + "learning_rate": 1.8118246668619357e-06, + "loss": 0.6851, + "step": 26046 + }, + { + "epoch": 0.67, + "learning_rate": 1.8118085097375709e-06, + "loss": 0.8408, + "step": 26047 + }, + { + "epoch": 0.67, + "learning_rate": 1.8117923519916419e-06, + "loss": 0.8223, + "step": 26048 + }, + { + "epoch": 0.67, + "learning_rate": 1.8117761936241607e-06, + "loss": 1.041, + "step": 26049 + }, + { + "epoch": 0.67, + "learning_rate": 1.8117600346351396e-06, + "loss": 0.7979, + "step": 26050 + }, + { + "epoch": 0.67, + "learning_rate": 1.8117438750245912e-06, + "loss": 0.71, + "step": 26051 + }, + { + "epoch": 0.67, + "learning_rate": 1.811727714792528e-06, + "loss": 0.8662, + "step": 26052 + }, + { + "epoch": 0.67, + "learning_rate": 1.8117115539389623e-06, + "loss": 0.9424, + "step": 26053 + }, + { + "epoch": 0.67, + "learning_rate": 1.811695392463906e-06, + "loss": 1.0098, + "step": 26054 + }, + { + "epoch": 0.67, + "learning_rate": 1.8116792303673722e-06, + "loss": 0.8809, + "step": 26055 + }, + { + "epoch": 0.67, + "learning_rate": 1.8116630676493729e-06, + "loss": 0.7061, + "step": 26056 + }, + { + "epoch": 0.67, + "learning_rate": 1.8116469043099205e-06, + "loss": 1.1426, + "step": 26057 + }, + { + "epoch": 0.67, + "learning_rate": 1.8116307403490274e-06, + "loss": 0.8853, + "step": 26058 + }, + { + "epoch": 0.67, + "learning_rate": 1.8116145757667058e-06, + "loss": 0.9453, + "step": 26059 + }, + { + "epoch": 0.67, + "learning_rate": 1.8115984105629683e-06, + "loss": 0.7744, + "step": 26060 + }, + { + "epoch": 0.67, + "learning_rate": 1.8115822447378272e-06, + "loss": 0.748, + "step": 26061 + }, + { + "epoch": 0.67, + "learning_rate": 1.8115660782912952e-06, + "loss": 0.8291, + "step": 26062 + }, + { + "epoch": 0.67, + "learning_rate": 1.8115499112233838e-06, + "loss": 1.0596, + "step": 26063 + }, + { + "epoch": 0.67, + "learning_rate": 1.8115337435341064e-06, + "loss": 0.9443, + "step": 26064 + }, + { + "epoch": 0.67, + "learning_rate": 1.8115175752234749e-06, + "loss": 0.5376, + "step": 26065 + }, + { + "epoch": 0.67, + "learning_rate": 1.8115014062915015e-06, + "loss": 0.8535, + "step": 26066 + }, + { + "epoch": 0.67, + "learning_rate": 1.811485236738199e-06, + "loss": 0.8457, + "step": 26067 + }, + { + "epoch": 0.67, + "learning_rate": 1.8114690665635793e-06, + "loss": 0.7354, + "step": 26068 + }, + { + "epoch": 0.67, + "learning_rate": 1.8114528957676552e-06, + "loss": 0.8154, + "step": 26069 + }, + { + "epoch": 0.67, + "learning_rate": 1.8114367243504389e-06, + "loss": 0.9102, + "step": 26070 + }, + { + "epoch": 0.67, + "learning_rate": 1.8114205523119427e-06, + "loss": 1.0449, + "step": 26071 + }, + { + "epoch": 0.67, + "learning_rate": 1.8114043796521794e-06, + "loss": 1.1445, + "step": 26072 + }, + { + "epoch": 0.67, + "learning_rate": 1.8113882063711609e-06, + "loss": 0.834, + "step": 26073 + }, + { + "epoch": 0.67, + "learning_rate": 1.8113720324689e-06, + "loss": 0.6655, + "step": 26074 + }, + { + "epoch": 0.67, + "learning_rate": 1.8113558579454084e-06, + "loss": 1.0654, + "step": 26075 + }, + { + "epoch": 0.67, + "learning_rate": 1.8113396828006993e-06, + "loss": 0.7891, + "step": 26076 + }, + { + "epoch": 0.67, + "learning_rate": 1.8113235070347846e-06, + "loss": 0.8105, + "step": 26077 + }, + { + "epoch": 0.67, + "learning_rate": 1.8113073306476766e-06, + "loss": 0.7593, + "step": 26078 + }, + { + "epoch": 0.67, + "learning_rate": 1.811291153639388e-06, + "loss": 0.9141, + "step": 26079 + }, + { + "epoch": 0.67, + "learning_rate": 1.811274976009931e-06, + "loss": 0.8193, + "step": 26080 + }, + { + "epoch": 0.67, + "learning_rate": 1.811258797759318e-06, + "loss": 0.5308, + "step": 26081 + }, + { + "epoch": 0.67, + "learning_rate": 1.8112426188875617e-06, + "loss": 0.9111, + "step": 26082 + }, + { + "epoch": 0.67, + "learning_rate": 1.8112264393946744e-06, + "loss": 1.124, + "step": 26083 + }, + { + "epoch": 0.67, + "learning_rate": 1.811210259280668e-06, + "loss": 1.0361, + "step": 26084 + }, + { + "epoch": 0.67, + "learning_rate": 1.811194078545555e-06, + "loss": 0.9648, + "step": 26085 + }, + { + "epoch": 0.67, + "learning_rate": 1.8111778971893484e-06, + "loss": 0.9727, + "step": 26086 + }, + { + "epoch": 0.67, + "learning_rate": 1.81116171521206e-06, + "loss": 0.9326, + "step": 26087 + }, + { + "epoch": 0.67, + "learning_rate": 1.8111455326137022e-06, + "loss": 0.6442, + "step": 26088 + }, + { + "epoch": 0.67, + "learning_rate": 1.8111293493942879e-06, + "loss": 0.8291, + "step": 26089 + }, + { + "epoch": 0.67, + "learning_rate": 1.811113165553829e-06, + "loss": 0.96, + "step": 26090 + }, + { + "epoch": 0.67, + "learning_rate": 1.811096981092338e-06, + "loss": 0.915, + "step": 26091 + }, + { + "epoch": 0.67, + "learning_rate": 1.8110807960098274e-06, + "loss": 0.6978, + "step": 26092 + }, + { + "epoch": 0.67, + "learning_rate": 1.8110646103063094e-06, + "loss": 0.9482, + "step": 26093 + }, + { + "epoch": 0.67, + "learning_rate": 1.8110484239817966e-06, + "loss": 0.8975, + "step": 26094 + }, + { + "epoch": 0.67, + "learning_rate": 1.8110322370363016e-06, + "loss": 0.9111, + "step": 26095 + }, + { + "epoch": 0.67, + "learning_rate": 1.811016049469836e-06, + "loss": 0.8486, + "step": 26096 + }, + { + "epoch": 0.67, + "learning_rate": 1.8109998612824132e-06, + "loss": 0.8564, + "step": 26097 + }, + { + "epoch": 0.67, + "learning_rate": 1.810983672474045e-06, + "loss": 0.8311, + "step": 26098 + }, + { + "epoch": 0.67, + "learning_rate": 1.8109674830447435e-06, + "loss": 0.7048, + "step": 26099 + }, + { + "epoch": 0.67, + "learning_rate": 1.810951292994522e-06, + "loss": 1.1367, + "step": 26100 + }, + { + "epoch": 0.67, + "learning_rate": 1.810935102323392e-06, + "loss": 1.0625, + "step": 26101 + }, + { + "epoch": 0.67, + "learning_rate": 1.8109189110313663e-06, + "loss": 0.9893, + "step": 26102 + }, + { + "epoch": 0.67, + "learning_rate": 1.8109027191184577e-06, + "loss": 0.6396, + "step": 26103 + }, + { + "epoch": 0.67, + "learning_rate": 1.8108865265846776e-06, + "loss": 1.0889, + "step": 26104 + }, + { + "epoch": 0.67, + "learning_rate": 1.8108703334300392e-06, + "loss": 0.5645, + "step": 26105 + }, + { + "epoch": 0.67, + "learning_rate": 1.810854139654555e-06, + "loss": 0.729, + "step": 26106 + }, + { + "epoch": 0.67, + "learning_rate": 1.8108379452582366e-06, + "loss": 0.6665, + "step": 26107 + }, + { + "epoch": 0.67, + "learning_rate": 1.810821750241097e-06, + "loss": 0.9165, + "step": 26108 + }, + { + "epoch": 0.67, + "learning_rate": 1.8108055546031484e-06, + "loss": 0.8394, + "step": 26109 + }, + { + "epoch": 0.67, + "learning_rate": 1.8107893583444034e-06, + "loss": 0.9189, + "step": 26110 + }, + { + "epoch": 0.67, + "learning_rate": 1.8107731614648742e-06, + "loss": 0.8984, + "step": 26111 + }, + { + "epoch": 0.67, + "learning_rate": 1.8107569639645735e-06, + "loss": 1.1328, + "step": 26112 + }, + { + "epoch": 0.67, + "learning_rate": 1.8107407658435132e-06, + "loss": 0.6914, + "step": 26113 + }, + { + "epoch": 0.67, + "learning_rate": 1.810724567101706e-06, + "loss": 0.8345, + "step": 26114 + }, + { + "epoch": 0.67, + "learning_rate": 1.8107083677391644e-06, + "loss": 0.7949, + "step": 26115 + }, + { + "epoch": 0.67, + "learning_rate": 1.8106921677559006e-06, + "loss": 0.8711, + "step": 26116 + }, + { + "epoch": 0.67, + "learning_rate": 1.8106759671519273e-06, + "loss": 0.8965, + "step": 26117 + }, + { + "epoch": 0.67, + "learning_rate": 1.8106597659272564e-06, + "loss": 0.8506, + "step": 26118 + }, + { + "epoch": 0.67, + "learning_rate": 1.8106435640819004e-06, + "loss": 0.7178, + "step": 26119 + }, + { + "epoch": 0.67, + "learning_rate": 1.8106273616158725e-06, + "loss": 0.9287, + "step": 26120 + }, + { + "epoch": 0.67, + "learning_rate": 1.8106111585291842e-06, + "loss": 1.0791, + "step": 26121 + }, + { + "epoch": 0.67, + "learning_rate": 1.810594954821848e-06, + "loss": 1.1143, + "step": 26122 + }, + { + "epoch": 0.67, + "learning_rate": 1.8105787504938768e-06, + "loss": 0.8281, + "step": 26123 + }, + { + "epoch": 0.67, + "learning_rate": 1.8105625455452826e-06, + "loss": 0.8511, + "step": 26124 + }, + { + "epoch": 0.67, + "learning_rate": 1.810546339976078e-06, + "loss": 0.9072, + "step": 26125 + }, + { + "epoch": 0.67, + "learning_rate": 1.8105301337862753e-06, + "loss": 0.9326, + "step": 26126 + }, + { + "epoch": 0.67, + "learning_rate": 1.810513926975887e-06, + "loss": 0.9375, + "step": 26127 + }, + { + "epoch": 0.67, + "learning_rate": 1.810497719544925e-06, + "loss": 0.7383, + "step": 26128 + }, + { + "epoch": 0.67, + "learning_rate": 1.8104815114934029e-06, + "loss": 0.8662, + "step": 26129 + }, + { + "epoch": 0.67, + "learning_rate": 1.8104653028213318e-06, + "loss": 0.918, + "step": 26130 + }, + { + "epoch": 0.67, + "learning_rate": 1.810449093528725e-06, + "loss": 0.9512, + "step": 26131 + }, + { + "epoch": 0.67, + "learning_rate": 1.8104328836155943e-06, + "loss": 0.7866, + "step": 26132 + }, + { + "epoch": 0.67, + "learning_rate": 1.8104166730819529e-06, + "loss": 0.8809, + "step": 26133 + }, + { + "epoch": 0.67, + "learning_rate": 1.8104004619278123e-06, + "loss": 0.9775, + "step": 26134 + }, + { + "epoch": 0.67, + "learning_rate": 1.8103842501531856e-06, + "loss": 0.8428, + "step": 26135 + }, + { + "epoch": 0.67, + "learning_rate": 1.8103680377580848e-06, + "loss": 0.7188, + "step": 26136 + }, + { + "epoch": 0.67, + "learning_rate": 1.8103518247425224e-06, + "loss": 0.9199, + "step": 26137 + }, + { + "epoch": 0.67, + "learning_rate": 1.810335611106511e-06, + "loss": 0.9531, + "step": 26138 + }, + { + "epoch": 0.67, + "learning_rate": 1.8103193968500627e-06, + "loss": 0.9863, + "step": 26139 + }, + { + "epoch": 0.67, + "learning_rate": 1.8103031819731905e-06, + "loss": 0.9561, + "step": 26140 + }, + { + "epoch": 0.67, + "learning_rate": 1.8102869664759059e-06, + "loss": 0.9229, + "step": 26141 + }, + { + "epoch": 0.67, + "learning_rate": 1.8102707503582221e-06, + "loss": 0.6638, + "step": 26142 + }, + { + "epoch": 0.67, + "learning_rate": 1.8102545336201511e-06, + "loss": 0.9756, + "step": 26143 + }, + { + "epoch": 0.67, + "learning_rate": 1.8102383162617056e-06, + "loss": 0.6807, + "step": 26144 + }, + { + "epoch": 0.67, + "learning_rate": 1.8102220982828977e-06, + "loss": 0.7461, + "step": 26145 + }, + { + "epoch": 0.67, + "learning_rate": 1.8102058796837403e-06, + "loss": 0.8169, + "step": 26146 + }, + { + "epoch": 0.67, + "learning_rate": 1.8101896604642452e-06, + "loss": 0.8633, + "step": 26147 + }, + { + "epoch": 0.67, + "learning_rate": 1.8101734406244255e-06, + "loss": 0.8008, + "step": 26148 + }, + { + "epoch": 0.67, + "learning_rate": 1.810157220164293e-06, + "loss": 0.8452, + "step": 26149 + }, + { + "epoch": 0.67, + "learning_rate": 1.8101409990838603e-06, + "loss": 0.9326, + "step": 26150 + }, + { + "epoch": 0.67, + "learning_rate": 1.8101247773831401e-06, + "loss": 1.041, + "step": 26151 + }, + { + "epoch": 0.67, + "learning_rate": 1.8101085550621443e-06, + "loss": 1.0332, + "step": 26152 + }, + { + "epoch": 0.67, + "learning_rate": 1.8100923321208858e-06, + "loss": 0.9287, + "step": 26153 + }, + { + "epoch": 0.67, + "learning_rate": 1.810076108559377e-06, + "loss": 0.6921, + "step": 26154 + }, + { + "epoch": 0.67, + "learning_rate": 1.81005988437763e-06, + "loss": 0.5059, + "step": 26155 + }, + { + "epoch": 0.67, + "learning_rate": 1.8100436595756575e-06, + "loss": 1.0156, + "step": 26156 + }, + { + "epoch": 0.67, + "learning_rate": 1.8100274341534716e-06, + "loss": 0.7588, + "step": 26157 + }, + { + "epoch": 0.67, + "learning_rate": 1.810011208111085e-06, + "loss": 0.7046, + "step": 26158 + }, + { + "epoch": 0.67, + "learning_rate": 1.8099949814485102e-06, + "loss": 0.7988, + "step": 26159 + }, + { + "epoch": 0.67, + "learning_rate": 1.8099787541657595e-06, + "loss": 0.6409, + "step": 26160 + }, + { + "epoch": 0.67, + "learning_rate": 1.8099625262628454e-06, + "loss": 0.8623, + "step": 26161 + }, + { + "epoch": 0.67, + "learning_rate": 1.8099462977397799e-06, + "loss": 0.8682, + "step": 26162 + }, + { + "epoch": 0.67, + "learning_rate": 1.809930068596576e-06, + "loss": 0.9238, + "step": 26163 + }, + { + "epoch": 0.67, + "learning_rate": 1.8099138388332458e-06, + "loss": 0.6104, + "step": 26164 + }, + { + "epoch": 0.67, + "learning_rate": 1.8098976084498018e-06, + "loss": 0.8223, + "step": 26165 + }, + { + "epoch": 0.67, + "learning_rate": 1.8098813774462567e-06, + "loss": 0.9248, + "step": 26166 + }, + { + "epoch": 0.67, + "learning_rate": 1.8098651458226222e-06, + "loss": 1.0186, + "step": 26167 + }, + { + "epoch": 0.67, + "learning_rate": 1.8098489135789118e-06, + "loss": 0.8916, + "step": 26168 + }, + { + "epoch": 0.67, + "learning_rate": 1.8098326807151368e-06, + "loss": 0.8086, + "step": 26169 + }, + { + "epoch": 0.67, + "learning_rate": 1.8098164472313102e-06, + "loss": 0.9688, + "step": 26170 + }, + { + "epoch": 0.67, + "learning_rate": 1.8098002131274446e-06, + "loss": 0.8198, + "step": 26171 + }, + { + "epoch": 0.67, + "learning_rate": 1.8097839784035523e-06, + "loss": 0.8115, + "step": 26172 + }, + { + "epoch": 0.67, + "learning_rate": 1.809767743059645e-06, + "loss": 0.6533, + "step": 26173 + }, + { + "epoch": 0.67, + "learning_rate": 1.8097515070957365e-06, + "loss": 0.8071, + "step": 26174 + }, + { + "epoch": 0.67, + "learning_rate": 1.8097352705118383e-06, + "loss": 0.8535, + "step": 26175 + }, + { + "epoch": 0.67, + "learning_rate": 1.8097190333079629e-06, + "loss": 0.7859, + "step": 26176 + }, + { + "epoch": 0.67, + "learning_rate": 1.809702795484123e-06, + "loss": 0.8311, + "step": 26177 + }, + { + "epoch": 0.67, + "learning_rate": 1.809686557040331e-06, + "loss": 0.7759, + "step": 26178 + }, + { + "epoch": 0.67, + "learning_rate": 1.809670317976599e-06, + "loss": 1.1348, + "step": 26179 + }, + { + "epoch": 0.67, + "learning_rate": 1.8096540782929397e-06, + "loss": 1.0605, + "step": 26180 + }, + { + "epoch": 0.67, + "learning_rate": 1.8096378379893655e-06, + "loss": 0.9375, + "step": 26181 + }, + { + "epoch": 0.67, + "learning_rate": 1.809621597065889e-06, + "loss": 0.7974, + "step": 26182 + }, + { + "epoch": 0.67, + "learning_rate": 1.8096053555225224e-06, + "loss": 1.0918, + "step": 26183 + }, + { + "epoch": 0.67, + "learning_rate": 1.809589113359278e-06, + "loss": 0.8096, + "step": 26184 + }, + { + "epoch": 0.67, + "learning_rate": 1.8095728705761686e-06, + "loss": 0.8662, + "step": 26185 + }, + { + "epoch": 0.67, + "learning_rate": 1.8095566271732065e-06, + "loss": 0.8115, + "step": 26186 + }, + { + "epoch": 0.67, + "learning_rate": 1.809540383150404e-06, + "loss": 0.876, + "step": 26187 + }, + { + "epoch": 0.67, + "learning_rate": 1.809524138507774e-06, + "loss": 0.6855, + "step": 26188 + }, + { + "epoch": 0.67, + "learning_rate": 1.8095078932453282e-06, + "loss": 0.6655, + "step": 26189 + }, + { + "epoch": 0.67, + "learning_rate": 1.8094916473630797e-06, + "loss": 0.8594, + "step": 26190 + }, + { + "epoch": 0.67, + "learning_rate": 1.8094754008610405e-06, + "loss": 0.8701, + "step": 26191 + }, + { + "epoch": 0.67, + "learning_rate": 1.8094591537392234e-06, + "loss": 0.7725, + "step": 26192 + }, + { + "epoch": 0.67, + "learning_rate": 1.8094429059976402e-06, + "loss": 0.8496, + "step": 26193 + }, + { + "epoch": 0.67, + "learning_rate": 1.8094266576363043e-06, + "loss": 0.8555, + "step": 26194 + }, + { + "epoch": 0.67, + "learning_rate": 1.809410408655227e-06, + "loss": 0.8164, + "step": 26195 + }, + { + "epoch": 0.67, + "learning_rate": 1.8093941590544222e-06, + "loss": 0.7246, + "step": 26196 + }, + { + "epoch": 0.67, + "learning_rate": 1.8093779088339009e-06, + "loss": 0.6268, + "step": 26197 + }, + { + "epoch": 0.67, + "learning_rate": 1.8093616579936763e-06, + "loss": 0.8848, + "step": 26198 + }, + { + "epoch": 0.67, + "learning_rate": 1.8093454065337607e-06, + "loss": 1.1348, + "step": 26199 + }, + { + "epoch": 0.67, + "learning_rate": 1.8093291544541666e-06, + "loss": 1.1416, + "step": 26200 + }, + { + "epoch": 0.67, + "learning_rate": 1.8093129017549066e-06, + "loss": 0.9316, + "step": 26201 + }, + { + "epoch": 0.67, + "learning_rate": 1.8092966484359925e-06, + "loss": 0.7568, + "step": 26202 + }, + { + "epoch": 0.67, + "learning_rate": 1.8092803944974373e-06, + "loss": 0.9502, + "step": 26203 + }, + { + "epoch": 0.67, + "learning_rate": 1.8092641399392533e-06, + "loss": 0.7622, + "step": 26204 + }, + { + "epoch": 0.67, + "learning_rate": 1.809247884761453e-06, + "loss": 0.8701, + "step": 26205 + }, + { + "epoch": 0.67, + "learning_rate": 1.8092316289640488e-06, + "loss": 0.9717, + "step": 26206 + }, + { + "epoch": 0.67, + "learning_rate": 1.809215372547053e-06, + "loss": 0.7852, + "step": 26207 + }, + { + "epoch": 0.67, + "learning_rate": 1.8091991155104784e-06, + "loss": 0.915, + "step": 26208 + }, + { + "epoch": 0.67, + "learning_rate": 1.8091828578543375e-06, + "loss": 0.8906, + "step": 26209 + }, + { + "epoch": 0.67, + "learning_rate": 1.8091665995786421e-06, + "loss": 0.7334, + "step": 26210 + }, + { + "epoch": 0.67, + "learning_rate": 1.8091503406834053e-06, + "loss": 0.9048, + "step": 26211 + }, + { + "epoch": 0.67, + "learning_rate": 1.809134081168639e-06, + "loss": 1.0664, + "step": 26212 + }, + { + "epoch": 0.67, + "learning_rate": 1.809117821034356e-06, + "loss": 1.1455, + "step": 26213 + }, + { + "epoch": 0.67, + "learning_rate": 1.8091015602805688e-06, + "loss": 1.0156, + "step": 26214 + }, + { + "epoch": 0.67, + "learning_rate": 1.8090852989072898e-06, + "loss": 1.0586, + "step": 26215 + }, + { + "epoch": 0.67, + "learning_rate": 1.8090690369145312e-06, + "loss": 0.7849, + "step": 26216 + }, + { + "epoch": 0.67, + "learning_rate": 1.8090527743023056e-06, + "loss": 0.9561, + "step": 26217 + }, + { + "epoch": 0.67, + "learning_rate": 1.8090365110706256e-06, + "loss": 0.8047, + "step": 26218 + }, + { + "epoch": 0.67, + "learning_rate": 1.8090202472195037e-06, + "loss": 0.9639, + "step": 26219 + }, + { + "epoch": 0.67, + "learning_rate": 1.809003982748952e-06, + "loss": 1.1172, + "step": 26220 + }, + { + "epoch": 0.67, + "learning_rate": 1.8089877176589834e-06, + "loss": 1.0586, + "step": 26221 + }, + { + "epoch": 0.67, + "learning_rate": 1.8089714519496097e-06, + "loss": 0.6582, + "step": 26222 + }, + { + "epoch": 0.67, + "learning_rate": 1.808955185620844e-06, + "loss": 0.5376, + "step": 26223 + }, + { + "epoch": 0.67, + "learning_rate": 1.8089389186726986e-06, + "loss": 0.8877, + "step": 26224 + }, + { + "epoch": 0.67, + "learning_rate": 1.8089226511051857e-06, + "loss": 0.9951, + "step": 26225 + }, + { + "epoch": 0.67, + "learning_rate": 1.808906382918318e-06, + "loss": 1.0703, + "step": 26226 + }, + { + "epoch": 0.67, + "learning_rate": 1.8088901141121079e-06, + "loss": 0.9453, + "step": 26227 + }, + { + "epoch": 0.67, + "learning_rate": 1.8088738446865676e-06, + "loss": 0.6709, + "step": 26228 + }, + { + "epoch": 0.67, + "learning_rate": 1.80885757464171e-06, + "loss": 0.8789, + "step": 26229 + }, + { + "epoch": 0.67, + "learning_rate": 1.8088413039775473e-06, + "loss": 0.8066, + "step": 26230 + }, + { + "epoch": 0.67, + "learning_rate": 1.808825032694092e-06, + "loss": 1.0547, + "step": 26231 + }, + { + "epoch": 0.67, + "learning_rate": 1.8088087607913568e-06, + "loss": 0.7642, + "step": 26232 + }, + { + "epoch": 0.67, + "learning_rate": 1.8087924882693537e-06, + "loss": 0.8408, + "step": 26233 + }, + { + "epoch": 0.67, + "learning_rate": 1.8087762151280953e-06, + "loss": 1.0332, + "step": 26234 + }, + { + "epoch": 0.67, + "learning_rate": 1.8087599413675943e-06, + "loss": 0.6987, + "step": 26235 + }, + { + "epoch": 0.67, + "learning_rate": 1.808743666987863e-06, + "loss": 0.8447, + "step": 26236 + }, + { + "epoch": 0.67, + "learning_rate": 1.8087273919889136e-06, + "loss": 0.709, + "step": 26237 + }, + { + "epoch": 0.67, + "learning_rate": 1.8087111163707588e-06, + "loss": 1.1611, + "step": 26238 + }, + { + "epoch": 0.67, + "learning_rate": 1.8086948401334116e-06, + "loss": 0.6577, + "step": 26239 + }, + { + "epoch": 0.67, + "learning_rate": 1.8086785632768834e-06, + "loss": 1.0078, + "step": 26240 + }, + { + "epoch": 0.67, + "learning_rate": 1.8086622858011875e-06, + "loss": 0.8291, + "step": 26241 + }, + { + "epoch": 0.67, + "learning_rate": 1.8086460077063362e-06, + "loss": 0.8784, + "step": 26242 + }, + { + "epoch": 0.67, + "learning_rate": 1.8086297289923416e-06, + "loss": 1.0117, + "step": 26243 + }, + { + "epoch": 0.67, + "learning_rate": 1.8086134496592164e-06, + "loss": 0.9062, + "step": 26244 + }, + { + "epoch": 0.67, + "learning_rate": 1.808597169706973e-06, + "loss": 0.7141, + "step": 26245 + }, + { + "epoch": 0.67, + "learning_rate": 1.8085808891356243e-06, + "loss": 0.9883, + "step": 26246 + }, + { + "epoch": 0.67, + "learning_rate": 1.8085646079451822e-06, + "loss": 0.8398, + "step": 26247 + }, + { + "epoch": 0.67, + "learning_rate": 1.8085483261356592e-06, + "loss": 0.8145, + "step": 26248 + }, + { + "epoch": 0.67, + "learning_rate": 1.8085320437070682e-06, + "loss": 0.915, + "step": 26249 + }, + { + "epoch": 0.67, + "learning_rate": 1.808515760659421e-06, + "loss": 0.6724, + "step": 26250 + }, + { + "epoch": 0.67, + "learning_rate": 1.8084994769927306e-06, + "loss": 0.9019, + "step": 26251 + }, + { + "epoch": 0.67, + "learning_rate": 1.8084831927070094e-06, + "loss": 0.834, + "step": 26252 + }, + { + "epoch": 0.67, + "learning_rate": 1.8084669078022698e-06, + "loss": 0.7041, + "step": 26253 + }, + { + "epoch": 0.67, + "learning_rate": 1.8084506222785243e-06, + "loss": 0.7031, + "step": 26254 + }, + { + "epoch": 0.67, + "learning_rate": 1.8084343361357853e-06, + "loss": 0.7881, + "step": 26255 + }, + { + "epoch": 0.67, + "learning_rate": 1.8084180493740653e-06, + "loss": 0.8857, + "step": 26256 + }, + { + "epoch": 0.67, + "learning_rate": 1.8084017619933766e-06, + "loss": 0.8911, + "step": 26257 + }, + { + "epoch": 0.67, + "learning_rate": 1.8083854739937321e-06, + "loss": 0.5557, + "step": 26258 + }, + { + "epoch": 0.67, + "learning_rate": 1.808369185375144e-06, + "loss": 0.8027, + "step": 26259 + }, + { + "epoch": 0.67, + "learning_rate": 1.8083528961376246e-06, + "loss": 0.8672, + "step": 26260 + }, + { + "epoch": 0.67, + "learning_rate": 1.8083366062811867e-06, + "loss": 1.1172, + "step": 26261 + }, + { + "epoch": 0.67, + "learning_rate": 1.8083203158058424e-06, + "loss": 0.6426, + "step": 26262 + }, + { + "epoch": 0.67, + "learning_rate": 1.8083040247116048e-06, + "loss": 0.7988, + "step": 26263 + }, + { + "epoch": 0.67, + "learning_rate": 1.8082877329984857e-06, + "loss": 0.8594, + "step": 26264 + }, + { + "epoch": 0.67, + "learning_rate": 1.808271440666498e-06, + "loss": 0.8594, + "step": 26265 + }, + { + "epoch": 0.67, + "learning_rate": 1.8082551477156538e-06, + "loss": 0.9678, + "step": 26266 + }, + { + "epoch": 0.67, + "learning_rate": 1.808238854145966e-06, + "loss": 0.9551, + "step": 26267 + }, + { + "epoch": 0.67, + "learning_rate": 1.8082225599574468e-06, + "loss": 0.8574, + "step": 26268 + }, + { + "epoch": 0.67, + "learning_rate": 1.8082062651501087e-06, + "loss": 0.6387, + "step": 26269 + }, + { + "epoch": 0.67, + "learning_rate": 1.8081899697239642e-06, + "loss": 0.8623, + "step": 26270 + }, + { + "epoch": 0.67, + "learning_rate": 1.8081736736790259e-06, + "loss": 0.6689, + "step": 26271 + }, + { + "epoch": 0.67, + "learning_rate": 1.8081573770153063e-06, + "loss": 0.833, + "step": 26272 + }, + { + "epoch": 0.67, + "learning_rate": 1.8081410797328177e-06, + "loss": 0.9346, + "step": 26273 + }, + { + "epoch": 0.67, + "learning_rate": 1.8081247818315726e-06, + "loss": 0.7349, + "step": 26274 + }, + { + "epoch": 0.67, + "learning_rate": 1.8081084833115835e-06, + "loss": 0.6982, + "step": 26275 + }, + { + "epoch": 0.67, + "learning_rate": 1.8080921841728624e-06, + "loss": 0.8491, + "step": 26276 + }, + { + "epoch": 0.67, + "learning_rate": 1.808075884415423e-06, + "loss": 0.6011, + "step": 26277 + }, + { + "epoch": 0.67, + "learning_rate": 1.8080595840392767e-06, + "loss": 0.9814, + "step": 26278 + }, + { + "epoch": 0.67, + "learning_rate": 1.8080432830444363e-06, + "loss": 0.7852, + "step": 26279 + }, + { + "epoch": 0.67, + "learning_rate": 1.8080269814309145e-06, + "loss": 0.9355, + "step": 26280 + }, + { + "epoch": 0.67, + "learning_rate": 1.8080106791987234e-06, + "loss": 0.9004, + "step": 26281 + }, + { + "epoch": 0.67, + "learning_rate": 1.807994376347876e-06, + "loss": 0.7871, + "step": 26282 + }, + { + "epoch": 0.67, + "learning_rate": 1.8079780728783841e-06, + "loss": 0.8291, + "step": 26283 + }, + { + "epoch": 0.67, + "learning_rate": 1.8079617687902609e-06, + "loss": 0.8154, + "step": 26284 + }, + { + "epoch": 0.67, + "learning_rate": 1.8079454640835183e-06, + "loss": 0.9453, + "step": 26285 + }, + { + "epoch": 0.67, + "learning_rate": 1.8079291587581688e-06, + "loss": 0.9941, + "step": 26286 + }, + { + "epoch": 0.67, + "learning_rate": 1.8079128528142254e-06, + "loss": 0.7886, + "step": 26287 + }, + { + "epoch": 0.67, + "learning_rate": 1.8078965462517001e-06, + "loss": 0.8604, + "step": 26288 + }, + { + "epoch": 0.67, + "learning_rate": 1.8078802390706058e-06, + "loss": 0.8584, + "step": 26289 + }, + { + "epoch": 0.67, + "learning_rate": 1.8078639312709546e-06, + "loss": 0.7168, + "step": 26290 + }, + { + "epoch": 0.67, + "learning_rate": 1.8078476228527593e-06, + "loss": 0.6382, + "step": 26291 + }, + { + "epoch": 0.67, + "learning_rate": 1.807831313816032e-06, + "loss": 0.7529, + "step": 26292 + }, + { + "epoch": 0.67, + "learning_rate": 1.8078150041607854e-06, + "loss": 0.752, + "step": 26293 + }, + { + "epoch": 0.67, + "learning_rate": 1.8077986938870323e-06, + "loss": 1.0449, + "step": 26294 + }, + { + "epoch": 0.67, + "learning_rate": 1.8077823829947842e-06, + "loss": 0.8682, + "step": 26295 + }, + { + "epoch": 0.67, + "learning_rate": 1.8077660714840551e-06, + "loss": 0.8352, + "step": 26296 + }, + { + "epoch": 0.67, + "learning_rate": 1.807749759354856e-06, + "loss": 0.9062, + "step": 26297 + }, + { + "epoch": 0.67, + "learning_rate": 1.8077334466072003e-06, + "loss": 1.0098, + "step": 26298 + }, + { + "epoch": 0.67, + "learning_rate": 1.8077171332411006e-06, + "loss": 0.9756, + "step": 26299 + }, + { + "epoch": 0.67, + "learning_rate": 1.8077008192565684e-06, + "loss": 0.9834, + "step": 26300 + }, + { + "epoch": 0.67, + "learning_rate": 1.8076845046536172e-06, + "loss": 0.9629, + "step": 26301 + }, + { + "epoch": 0.67, + "learning_rate": 1.807668189432259e-06, + "loss": 0.6904, + "step": 26302 + }, + { + "epoch": 0.67, + "learning_rate": 1.8076518735925066e-06, + "loss": 0.8125, + "step": 26303 + }, + { + "epoch": 0.67, + "learning_rate": 1.8076355571343722e-06, + "loss": 0.687, + "step": 26304 + }, + { + "epoch": 0.67, + "learning_rate": 1.8076192400578682e-06, + "loss": 0.9092, + "step": 26305 + }, + { + "epoch": 0.67, + "learning_rate": 1.8076029223630075e-06, + "loss": 0.7236, + "step": 26306 + }, + { + "epoch": 0.67, + "learning_rate": 1.8075866040498023e-06, + "loss": 0.9521, + "step": 26307 + }, + { + "epoch": 0.67, + "learning_rate": 1.807570285118265e-06, + "loss": 0.8447, + "step": 26308 + }, + { + "epoch": 0.67, + "learning_rate": 1.8075539655684085e-06, + "loss": 0.9736, + "step": 26309 + }, + { + "epoch": 0.67, + "learning_rate": 1.807537645400245e-06, + "loss": 0.8643, + "step": 26310 + }, + { + "epoch": 0.67, + "learning_rate": 1.807521324613787e-06, + "loss": 1.0664, + "step": 26311 + }, + { + "epoch": 0.67, + "learning_rate": 1.807505003209047e-06, + "loss": 0.6953, + "step": 26312 + }, + { + "epoch": 0.67, + "learning_rate": 1.8074886811860376e-06, + "loss": 0.874, + "step": 26313 + }, + { + "epoch": 0.67, + "learning_rate": 1.8074723585447715e-06, + "loss": 0.6323, + "step": 26314 + }, + { + "epoch": 0.67, + "learning_rate": 1.8074560352852605e-06, + "loss": 0.7732, + "step": 26315 + }, + { + "epoch": 0.67, + "learning_rate": 1.807439711407518e-06, + "loss": 0.8047, + "step": 26316 + }, + { + "epoch": 0.67, + "learning_rate": 1.8074233869115559e-06, + "loss": 0.8506, + "step": 26317 + }, + { + "epoch": 0.67, + "learning_rate": 1.8074070617973866e-06, + "loss": 0.5996, + "step": 26318 + }, + { + "epoch": 0.67, + "learning_rate": 1.807390736065023e-06, + "loss": 0.55, + "step": 26319 + }, + { + "epoch": 0.67, + "learning_rate": 1.8073744097144777e-06, + "loss": 0.8584, + "step": 26320 + }, + { + "epoch": 0.67, + "learning_rate": 1.8073580827457624e-06, + "loss": 0.8262, + "step": 26321 + }, + { + "epoch": 0.67, + "learning_rate": 1.8073417551588905e-06, + "loss": 0.9551, + "step": 26322 + }, + { + "epoch": 0.67, + "learning_rate": 1.807325426953874e-06, + "loss": 0.7749, + "step": 26323 + }, + { + "epoch": 0.67, + "learning_rate": 1.8073090981307258e-06, + "loss": 0.9717, + "step": 26324 + }, + { + "epoch": 0.67, + "learning_rate": 1.8072927686894578e-06, + "loss": 0.6816, + "step": 26325 + }, + { + "epoch": 0.67, + "learning_rate": 1.807276438630083e-06, + "loss": 0.8887, + "step": 26326 + }, + { + "epoch": 0.67, + "learning_rate": 1.8072601079526138e-06, + "loss": 0.5869, + "step": 26327 + }, + { + "epoch": 0.67, + "learning_rate": 1.8072437766570625e-06, + "loss": 1.0508, + "step": 26328 + }, + { + "epoch": 0.67, + "learning_rate": 1.8072274447434417e-06, + "loss": 0.9307, + "step": 26329 + }, + { + "epoch": 0.67, + "learning_rate": 1.8072111122117643e-06, + "loss": 0.9961, + "step": 26330 + }, + { + "epoch": 0.67, + "learning_rate": 1.8071947790620422e-06, + "loss": 0.7373, + "step": 26331 + }, + { + "epoch": 0.67, + "learning_rate": 1.8071784452942883e-06, + "loss": 0.9912, + "step": 26332 + }, + { + "epoch": 0.67, + "learning_rate": 1.8071621109085149e-06, + "loss": 0.9121, + "step": 26333 + }, + { + "epoch": 0.67, + "learning_rate": 1.8071457759047347e-06, + "loss": 0.6396, + "step": 26334 + }, + { + "epoch": 0.67, + "learning_rate": 1.80712944028296e-06, + "loss": 1.0254, + "step": 26335 + }, + { + "epoch": 0.68, + "learning_rate": 1.8071131040432033e-06, + "loss": 0.7139, + "step": 26336 + }, + { + "epoch": 0.68, + "learning_rate": 1.8070967671854774e-06, + "loss": 0.9219, + "step": 26337 + }, + { + "epoch": 0.68, + "learning_rate": 1.8070804297097944e-06, + "loss": 0.8662, + "step": 26338 + }, + { + "epoch": 0.68, + "learning_rate": 1.8070640916161674e-06, + "loss": 0.9199, + "step": 26339 + }, + { + "epoch": 0.68, + "learning_rate": 1.8070477529046081e-06, + "loss": 0.7324, + "step": 26340 + }, + { + "epoch": 0.68, + "learning_rate": 1.8070314135751296e-06, + "loss": 0.6992, + "step": 26341 + }, + { + "epoch": 0.68, + "learning_rate": 1.8070150736277445e-06, + "loss": 0.8564, + "step": 26342 + }, + { + "epoch": 0.68, + "learning_rate": 1.8069987330624648e-06, + "loss": 0.8223, + "step": 26343 + }, + { + "epoch": 0.68, + "learning_rate": 1.8069823918793032e-06, + "loss": 0.9463, + "step": 26344 + }, + { + "epoch": 0.68, + "learning_rate": 1.8069660500782727e-06, + "loss": 0.751, + "step": 26345 + }, + { + "epoch": 0.68, + "learning_rate": 1.8069497076593849e-06, + "loss": 0.6519, + "step": 26346 + }, + { + "epoch": 0.68, + "learning_rate": 1.8069333646226532e-06, + "loss": 0.9385, + "step": 26347 + }, + { + "epoch": 0.68, + "learning_rate": 1.8069170209680895e-06, + "loss": 0.9062, + "step": 26348 + }, + { + "epoch": 0.68, + "learning_rate": 1.8069006766957066e-06, + "loss": 0.874, + "step": 26349 + }, + { + "epoch": 0.68, + "learning_rate": 1.806884331805517e-06, + "loss": 0.9512, + "step": 26350 + }, + { + "epoch": 0.68, + "learning_rate": 1.8068679862975332e-06, + "loss": 0.7466, + "step": 26351 + }, + { + "epoch": 0.68, + "learning_rate": 1.8068516401717674e-06, + "loss": 0.6846, + "step": 26352 + }, + { + "epoch": 0.68, + "learning_rate": 1.8068352934282328e-06, + "loss": 0.9385, + "step": 26353 + }, + { + "epoch": 0.68, + "learning_rate": 1.8068189460669413e-06, + "loss": 0.7217, + "step": 26354 + }, + { + "epoch": 0.68, + "learning_rate": 1.8068025980879056e-06, + "loss": 0.8906, + "step": 26355 + }, + { + "epoch": 0.68, + "learning_rate": 1.8067862494911383e-06, + "loss": 0.7241, + "step": 26356 + }, + { + "epoch": 0.68, + "learning_rate": 1.8067699002766518e-06, + "loss": 0.9365, + "step": 26357 + }, + { + "epoch": 0.68, + "learning_rate": 1.8067535504444588e-06, + "loss": 0.8066, + "step": 26358 + }, + { + "epoch": 0.68, + "learning_rate": 1.8067371999945718e-06, + "loss": 0.833, + "step": 26359 + }, + { + "epoch": 0.68, + "learning_rate": 1.8067208489270033e-06, + "loss": 0.7705, + "step": 26360 + }, + { + "epoch": 0.68, + "learning_rate": 1.8067044972417653e-06, + "loss": 0.9463, + "step": 26361 + }, + { + "epoch": 0.68, + "learning_rate": 1.806688144938871e-06, + "loss": 0.959, + "step": 26362 + }, + { + "epoch": 0.68, + "learning_rate": 1.8066717920183325e-06, + "loss": 0.8125, + "step": 26363 + }, + { + "epoch": 0.68, + "learning_rate": 1.8066554384801628e-06, + "loss": 0.9453, + "step": 26364 + }, + { + "epoch": 0.68, + "learning_rate": 1.806639084324374e-06, + "loss": 0.9199, + "step": 26365 + }, + { + "epoch": 0.68, + "learning_rate": 1.8066227295509786e-06, + "loss": 0.8652, + "step": 26366 + }, + { + "epoch": 0.68, + "learning_rate": 1.8066063741599895e-06, + "loss": 0.6909, + "step": 26367 + }, + { + "epoch": 0.68, + "learning_rate": 1.8065900181514188e-06, + "loss": 0.8623, + "step": 26368 + }, + { + "epoch": 0.68, + "learning_rate": 1.8065736615252793e-06, + "loss": 0.8008, + "step": 26369 + }, + { + "epoch": 0.68, + "learning_rate": 1.8065573042815835e-06, + "loss": 0.7178, + "step": 26370 + }, + { + "epoch": 0.68, + "learning_rate": 1.8065409464203438e-06, + "loss": 0.9043, + "step": 26371 + }, + { + "epoch": 0.68, + "learning_rate": 1.8065245879415728e-06, + "loss": 0.9697, + "step": 26372 + }, + { + "epoch": 0.68, + "learning_rate": 1.806508228845283e-06, + "loss": 0.8809, + "step": 26373 + }, + { + "epoch": 0.68, + "learning_rate": 1.8064918691314869e-06, + "loss": 0.75, + "step": 26374 + }, + { + "epoch": 0.68, + "learning_rate": 1.8064755088001968e-06, + "loss": 0.793, + "step": 26375 + }, + { + "epoch": 0.68, + "learning_rate": 1.806459147851426e-06, + "loss": 0.7812, + "step": 26376 + }, + { + "epoch": 0.68, + "learning_rate": 1.8064427862851862e-06, + "loss": 0.7197, + "step": 26377 + }, + { + "epoch": 0.68, + "learning_rate": 1.8064264241014903e-06, + "loss": 0.9746, + "step": 26378 + }, + { + "epoch": 0.68, + "learning_rate": 1.8064100613003508e-06, + "loss": 0.8037, + "step": 26379 + }, + { + "epoch": 0.68, + "learning_rate": 1.8063936978817802e-06, + "loss": 0.9482, + "step": 26380 + }, + { + "epoch": 0.68, + "learning_rate": 1.8063773338457908e-06, + "loss": 0.7061, + "step": 26381 + }, + { + "epoch": 0.68, + "learning_rate": 1.8063609691923959e-06, + "loss": 0.9629, + "step": 26382 + }, + { + "epoch": 0.68, + "learning_rate": 1.806344603921607e-06, + "loss": 0.8755, + "step": 26383 + }, + { + "epoch": 0.68, + "learning_rate": 1.806328238033437e-06, + "loss": 0.7852, + "step": 26384 + }, + { + "epoch": 0.68, + "learning_rate": 1.806311871527899e-06, + "loss": 1.0225, + "step": 26385 + }, + { + "epoch": 0.68, + "learning_rate": 1.8062955044050047e-06, + "loss": 1.0225, + "step": 26386 + }, + { + "epoch": 0.68, + "learning_rate": 1.8062791366647674e-06, + "loss": 0.7988, + "step": 26387 + }, + { + "epoch": 0.68, + "learning_rate": 1.806262768307199e-06, + "loss": 0.7275, + "step": 26388 + }, + { + "epoch": 0.68, + "learning_rate": 1.8062463993323122e-06, + "loss": 0.7686, + "step": 26389 + }, + { + "epoch": 0.68, + "learning_rate": 1.8062300297401195e-06, + "loss": 0.7969, + "step": 26390 + }, + { + "epoch": 0.68, + "learning_rate": 1.806213659530634e-06, + "loss": 0.7859, + "step": 26391 + }, + { + "epoch": 0.68, + "learning_rate": 1.8061972887038675e-06, + "loss": 0.7588, + "step": 26392 + }, + { + "epoch": 0.68, + "learning_rate": 1.8061809172598327e-06, + "loss": 0.7695, + "step": 26393 + }, + { + "epoch": 0.68, + "learning_rate": 1.8061645451985424e-06, + "loss": 0.79, + "step": 26394 + }, + { + "epoch": 0.68, + "learning_rate": 1.8061481725200088e-06, + "loss": 0.8135, + "step": 26395 + }, + { + "epoch": 0.68, + "learning_rate": 1.8061317992242446e-06, + "loss": 0.8652, + "step": 26396 + }, + { + "epoch": 0.68, + "learning_rate": 1.8061154253112627e-06, + "loss": 0.8721, + "step": 26397 + }, + { + "epoch": 0.68, + "learning_rate": 1.806099050781075e-06, + "loss": 0.6992, + "step": 26398 + }, + { + "epoch": 0.68, + "learning_rate": 1.8060826756336945e-06, + "loss": 0.9062, + "step": 26399 + }, + { + "epoch": 0.68, + "learning_rate": 1.8060662998691333e-06, + "loss": 0.9434, + "step": 26400 + }, + { + "epoch": 0.68, + "learning_rate": 1.8060499234874045e-06, + "loss": 0.8311, + "step": 26401 + }, + { + "epoch": 0.68, + "learning_rate": 1.80603354648852e-06, + "loss": 0.8857, + "step": 26402 + }, + { + "epoch": 0.68, + "learning_rate": 1.806017168872493e-06, + "loss": 0.8311, + "step": 26403 + }, + { + "epoch": 0.68, + "learning_rate": 1.8060007906393354e-06, + "loss": 0.9814, + "step": 26404 + }, + { + "epoch": 0.68, + "learning_rate": 1.8059844117890604e-06, + "loss": 0.8262, + "step": 26405 + }, + { + "epoch": 0.68, + "learning_rate": 1.8059680323216798e-06, + "loss": 0.8276, + "step": 26406 + }, + { + "epoch": 0.68, + "learning_rate": 1.8059516522372068e-06, + "loss": 0.8613, + "step": 26407 + }, + { + "epoch": 0.68, + "learning_rate": 1.8059352715356538e-06, + "loss": 0.9863, + "step": 26408 + }, + { + "epoch": 0.68, + "learning_rate": 1.805918890217033e-06, + "loss": 1.0117, + "step": 26409 + }, + { + "epoch": 0.68, + "learning_rate": 1.8059025082813572e-06, + "loss": 0.9614, + "step": 26410 + }, + { + "epoch": 0.68, + "learning_rate": 1.805886125728639e-06, + "loss": 0.8389, + "step": 26411 + }, + { + "epoch": 0.68, + "learning_rate": 1.8058697425588906e-06, + "loss": 0.7031, + "step": 26412 + }, + { + "epoch": 0.68, + "learning_rate": 1.805853358772125e-06, + "loss": 1.0635, + "step": 26413 + }, + { + "epoch": 0.68, + "learning_rate": 1.8058369743683545e-06, + "loss": 0.8486, + "step": 26414 + }, + { + "epoch": 0.68, + "learning_rate": 1.8058205893475918e-06, + "loss": 0.96, + "step": 26415 + }, + { + "epoch": 0.68, + "learning_rate": 1.805804203709849e-06, + "loss": 0.9766, + "step": 26416 + }, + { + "epoch": 0.68, + "learning_rate": 1.8057878174551395e-06, + "loss": 0.645, + "step": 26417 + }, + { + "epoch": 0.68, + "learning_rate": 1.805771430583475e-06, + "loss": 0.7295, + "step": 26418 + }, + { + "epoch": 0.68, + "learning_rate": 1.8057550430948683e-06, + "loss": 0.7324, + "step": 26419 + }, + { + "epoch": 0.68, + "learning_rate": 1.8057386549893321e-06, + "loss": 0.7571, + "step": 26420 + }, + { + "epoch": 0.68, + "learning_rate": 1.805722266266879e-06, + "loss": 0.8594, + "step": 26421 + }, + { + "epoch": 0.68, + "learning_rate": 1.805705876927521e-06, + "loss": 0.8506, + "step": 26422 + }, + { + "epoch": 0.68, + "learning_rate": 1.8056894869712714e-06, + "loss": 0.8145, + "step": 26423 + }, + { + "epoch": 0.68, + "learning_rate": 1.8056730963981423e-06, + "loss": 0.7939, + "step": 26424 + }, + { + "epoch": 0.68, + "learning_rate": 1.8056567052081464e-06, + "loss": 0.8555, + "step": 26425 + }, + { + "epoch": 0.68, + "learning_rate": 1.8056403134012964e-06, + "loss": 0.8154, + "step": 26426 + }, + { + "epoch": 0.68, + "learning_rate": 1.805623920977604e-06, + "loss": 0.6304, + "step": 26427 + }, + { + "epoch": 0.68, + "learning_rate": 1.8056075279370831e-06, + "loss": 0.9717, + "step": 26428 + }, + { + "epoch": 0.68, + "learning_rate": 1.8055911342797453e-06, + "loss": 0.6558, + "step": 26429 + }, + { + "epoch": 0.68, + "learning_rate": 1.8055747400056033e-06, + "loss": 0.7764, + "step": 26430 + }, + { + "epoch": 0.68, + "learning_rate": 1.8055583451146702e-06, + "loss": 0.814, + "step": 26431 + }, + { + "epoch": 0.68, + "learning_rate": 1.8055419496069577e-06, + "loss": 0.7114, + "step": 26432 + }, + { + "epoch": 0.68, + "learning_rate": 1.8055255534824786e-06, + "loss": 0.6299, + "step": 26433 + }, + { + "epoch": 0.68, + "learning_rate": 1.805509156741246e-06, + "loss": 0.7842, + "step": 26434 + }, + { + "epoch": 0.68, + "learning_rate": 1.8054927593832718e-06, + "loss": 0.4966, + "step": 26435 + }, + { + "epoch": 0.68, + "learning_rate": 1.8054763614085693e-06, + "loss": 0.9834, + "step": 26436 + }, + { + "epoch": 0.68, + "learning_rate": 1.8054599628171502e-06, + "loss": 1.0186, + "step": 26437 + }, + { + "epoch": 0.68, + "learning_rate": 1.8054435636090275e-06, + "loss": 0.8064, + "step": 26438 + }, + { + "epoch": 0.68, + "learning_rate": 1.8054271637842139e-06, + "loss": 0.9399, + "step": 26439 + }, + { + "epoch": 0.68, + "learning_rate": 1.8054107633427213e-06, + "loss": 0.8555, + "step": 26440 + }, + { + "epoch": 0.68, + "learning_rate": 1.805394362284563e-06, + "loss": 0.8701, + "step": 26441 + }, + { + "epoch": 0.68, + "learning_rate": 1.8053779606097513e-06, + "loss": 0.8945, + "step": 26442 + }, + { + "epoch": 0.68, + "learning_rate": 1.8053615583182987e-06, + "loss": 0.752, + "step": 26443 + }, + { + "epoch": 0.68, + "learning_rate": 1.805345155410218e-06, + "loss": 0.8994, + "step": 26444 + }, + { + "epoch": 0.68, + "learning_rate": 1.8053287518855212e-06, + "loss": 0.7754, + "step": 26445 + }, + { + "epoch": 0.68, + "learning_rate": 1.805312347744221e-06, + "loss": 0.6875, + "step": 26446 + }, + { + "epoch": 0.68, + "learning_rate": 1.805295942986331e-06, + "loss": 0.7832, + "step": 26447 + }, + { + "epoch": 0.68, + "learning_rate": 1.8052795376118622e-06, + "loss": 0.877, + "step": 26448 + }, + { + "epoch": 0.68, + "learning_rate": 1.805263131620828e-06, + "loss": 0.6953, + "step": 26449 + }, + { + "epoch": 0.68, + "learning_rate": 1.805246725013241e-06, + "loss": 0.9639, + "step": 26450 + }, + { + "epoch": 0.68, + "learning_rate": 1.8052303177891135e-06, + "loss": 0.917, + "step": 26451 + }, + { + "epoch": 0.68, + "learning_rate": 1.8052139099484582e-06, + "loss": 1.1172, + "step": 26452 + }, + { + "epoch": 0.68, + "learning_rate": 1.8051975014912876e-06, + "loss": 0.8618, + "step": 26453 + }, + { + "epoch": 0.68, + "learning_rate": 1.8051810924176145e-06, + "loss": 0.8213, + "step": 26454 + }, + { + "epoch": 0.68, + "learning_rate": 1.8051646827274508e-06, + "loss": 1.082, + "step": 26455 + }, + { + "epoch": 0.68, + "learning_rate": 1.8051482724208103e-06, + "loss": 0.7144, + "step": 26456 + }, + { + "epoch": 0.68, + "learning_rate": 1.805131861497704e-06, + "loss": 0.9023, + "step": 26457 + }, + { + "epoch": 0.68, + "learning_rate": 1.8051154499581458e-06, + "loss": 0.9658, + "step": 26458 + }, + { + "epoch": 0.68, + "learning_rate": 1.8050990378021473e-06, + "loss": 0.5981, + "step": 26459 + }, + { + "epoch": 0.68, + "learning_rate": 1.8050826250297218e-06, + "loss": 0.9258, + "step": 26460 + }, + { + "epoch": 0.68, + "learning_rate": 1.8050662116408815e-06, + "loss": 0.8975, + "step": 26461 + }, + { + "epoch": 0.68, + "learning_rate": 1.8050497976356391e-06, + "loss": 0.9805, + "step": 26462 + }, + { + "epoch": 0.68, + "learning_rate": 1.805033383014007e-06, + "loss": 0.8604, + "step": 26463 + }, + { + "epoch": 0.68, + "learning_rate": 1.8050169677759977e-06, + "loss": 0.8477, + "step": 26464 + }, + { + "epoch": 0.68, + "learning_rate": 1.805000551921624e-06, + "loss": 0.8633, + "step": 26465 + }, + { + "epoch": 0.68, + "learning_rate": 1.8049841354508983e-06, + "loss": 0.8613, + "step": 26466 + }, + { + "epoch": 0.68, + "learning_rate": 1.8049677183638333e-06, + "loss": 1.1426, + "step": 26467 + }, + { + "epoch": 0.68, + "learning_rate": 1.8049513006604418e-06, + "loss": 0.873, + "step": 26468 + }, + { + "epoch": 0.68, + "learning_rate": 1.8049348823407357e-06, + "loss": 0.6055, + "step": 26469 + }, + { + "epoch": 0.68, + "learning_rate": 1.8049184634047283e-06, + "loss": 0.8623, + "step": 26470 + }, + { + "epoch": 0.68, + "learning_rate": 1.804902043852432e-06, + "loss": 0.7822, + "step": 26471 + }, + { + "epoch": 0.68, + "learning_rate": 1.8048856236838587e-06, + "loss": 0.501, + "step": 26472 + }, + { + "epoch": 0.68, + "learning_rate": 1.8048692028990219e-06, + "loss": 0.9175, + "step": 26473 + }, + { + "epoch": 0.68, + "learning_rate": 1.8048527814979336e-06, + "loss": 1.0449, + "step": 26474 + }, + { + "epoch": 0.68, + "learning_rate": 1.8048363594806064e-06, + "loss": 0.8203, + "step": 26475 + }, + { + "epoch": 0.68, + "learning_rate": 1.8048199368470535e-06, + "loss": 0.4724, + "step": 26476 + }, + { + "epoch": 0.68, + "learning_rate": 1.8048035135972863e-06, + "loss": 0.748, + "step": 26477 + }, + { + "epoch": 0.68, + "learning_rate": 1.8047870897313184e-06, + "loss": 0.708, + "step": 26478 + }, + { + "epoch": 0.68, + "learning_rate": 1.8047706652491618e-06, + "loss": 0.7363, + "step": 26479 + }, + { + "epoch": 0.68, + "learning_rate": 1.8047542401508298e-06, + "loss": 0.9004, + "step": 26480 + }, + { + "epoch": 0.68, + "learning_rate": 1.8047378144363342e-06, + "loss": 0.7773, + "step": 26481 + }, + { + "epoch": 0.68, + "learning_rate": 1.8047213881056878e-06, + "loss": 0.8291, + "step": 26482 + }, + { + "epoch": 0.68, + "learning_rate": 1.8047049611589031e-06, + "loss": 0.9199, + "step": 26483 + }, + { + "epoch": 0.68, + "learning_rate": 1.8046885335959932e-06, + "loss": 0.7568, + "step": 26484 + }, + { + "epoch": 0.68, + "learning_rate": 1.80467210541697e-06, + "loss": 0.7065, + "step": 26485 + }, + { + "epoch": 0.68, + "learning_rate": 1.8046556766218463e-06, + "loss": 1.0908, + "step": 26486 + }, + { + "epoch": 0.68, + "learning_rate": 1.8046392472106349e-06, + "loss": 0.873, + "step": 26487 + }, + { + "epoch": 0.68, + "learning_rate": 1.8046228171833482e-06, + "loss": 0.9883, + "step": 26488 + }, + { + "epoch": 0.68, + "learning_rate": 1.804606386539999e-06, + "loss": 0.74, + "step": 26489 + }, + { + "epoch": 0.68, + "learning_rate": 1.8045899552805995e-06, + "loss": 0.9814, + "step": 26490 + }, + { + "epoch": 0.68, + "learning_rate": 1.8045735234051626e-06, + "loss": 0.9023, + "step": 26491 + }, + { + "epoch": 0.68, + "learning_rate": 1.8045570909137004e-06, + "loss": 0.9082, + "step": 26492 + }, + { + "epoch": 0.68, + "learning_rate": 1.8045406578062261e-06, + "loss": 0.8008, + "step": 26493 + }, + { + "epoch": 0.68, + "learning_rate": 1.804524224082752e-06, + "loss": 0.9092, + "step": 26494 + }, + { + "epoch": 0.68, + "learning_rate": 1.8045077897432907e-06, + "loss": 0.8906, + "step": 26495 + }, + { + "epoch": 0.68, + "learning_rate": 1.8044913547878548e-06, + "loss": 1.001, + "step": 26496 + }, + { + "epoch": 0.68, + "learning_rate": 1.804474919216457e-06, + "loss": 0.6318, + "step": 26497 + }, + { + "epoch": 0.68, + "learning_rate": 1.8044584830291095e-06, + "loss": 0.8809, + "step": 26498 + }, + { + "epoch": 0.68, + "learning_rate": 1.8044420462258252e-06, + "loss": 0.6772, + "step": 26499 + }, + { + "epoch": 0.68, + "learning_rate": 1.8044256088066165e-06, + "loss": 0.666, + "step": 26500 + }, + { + "epoch": 0.68, + "learning_rate": 1.8044091707714963e-06, + "loss": 0.8018, + "step": 26501 + }, + { + "epoch": 0.68, + "learning_rate": 1.8043927321204768e-06, + "loss": 0.8086, + "step": 26502 + }, + { + "epoch": 0.68, + "learning_rate": 1.804376292853571e-06, + "loss": 0.9209, + "step": 26503 + }, + { + "epoch": 0.68, + "learning_rate": 1.8043598529707911e-06, + "loss": 0.7749, + "step": 26504 + }, + { + "epoch": 0.68, + "learning_rate": 1.8043434124721499e-06, + "loss": 0.8809, + "step": 26505 + }, + { + "epoch": 0.68, + "learning_rate": 1.8043269713576596e-06, + "loss": 0.6895, + "step": 26506 + }, + { + "epoch": 0.68, + "learning_rate": 1.8043105296273336e-06, + "loss": 0.7959, + "step": 26507 + }, + { + "epoch": 0.68, + "learning_rate": 1.8042940872811839e-06, + "loss": 0.7861, + "step": 26508 + }, + { + "epoch": 0.68, + "learning_rate": 1.804277644319223e-06, + "loss": 0.7793, + "step": 26509 + }, + { + "epoch": 0.68, + "learning_rate": 1.8042612007414637e-06, + "loss": 0.8213, + "step": 26510 + }, + { + "epoch": 0.68, + "learning_rate": 1.804244756547919e-06, + "loss": 0.7861, + "step": 26511 + }, + { + "epoch": 0.68, + "learning_rate": 1.8042283117386008e-06, + "loss": 0.9404, + "step": 26512 + }, + { + "epoch": 0.68, + "learning_rate": 1.8042118663135217e-06, + "loss": 1.0029, + "step": 26513 + }, + { + "epoch": 0.68, + "learning_rate": 1.8041954202726948e-06, + "loss": 0.8652, + "step": 26514 + }, + { + "epoch": 0.68, + "learning_rate": 1.8041789736161323e-06, + "loss": 0.8145, + "step": 26515 + }, + { + "epoch": 0.68, + "learning_rate": 1.8041625263438473e-06, + "loss": 0.4768, + "step": 26516 + }, + { + "epoch": 0.68, + "learning_rate": 1.8041460784558518e-06, + "loss": 0.665, + "step": 26517 + }, + { + "epoch": 0.68, + "learning_rate": 1.8041296299521587e-06, + "loss": 0.6768, + "step": 26518 + }, + { + "epoch": 0.68, + "learning_rate": 1.8041131808327803e-06, + "loss": 0.8604, + "step": 26519 + }, + { + "epoch": 0.68, + "learning_rate": 1.8040967310977297e-06, + "loss": 0.7998, + "step": 26520 + }, + { + "epoch": 0.68, + "learning_rate": 1.804080280747019e-06, + "loss": 0.7021, + "step": 26521 + }, + { + "epoch": 0.68, + "learning_rate": 1.8040638297806611e-06, + "loss": 0.6431, + "step": 26522 + }, + { + "epoch": 0.68, + "learning_rate": 1.8040473781986685e-06, + "loss": 0.9102, + "step": 26523 + }, + { + "epoch": 0.68, + "learning_rate": 1.8040309260010535e-06, + "loss": 0.9121, + "step": 26524 + }, + { + "epoch": 0.68, + "learning_rate": 1.8040144731878292e-06, + "loss": 0.9463, + "step": 26525 + }, + { + "epoch": 0.68, + "learning_rate": 1.8039980197590081e-06, + "loss": 0.6553, + "step": 26526 + }, + { + "epoch": 0.68, + "learning_rate": 1.8039815657146027e-06, + "loss": 0.9961, + "step": 26527 + }, + { + "epoch": 0.68, + "learning_rate": 1.8039651110546256e-06, + "loss": 0.4666, + "step": 26528 + }, + { + "epoch": 0.68, + "learning_rate": 1.8039486557790893e-06, + "loss": 0.553, + "step": 26529 + }, + { + "epoch": 0.68, + "learning_rate": 1.8039321998880063e-06, + "loss": 0.8794, + "step": 26530 + }, + { + "epoch": 0.68, + "learning_rate": 1.8039157433813895e-06, + "loss": 0.6924, + "step": 26531 + }, + { + "epoch": 0.68, + "learning_rate": 1.8038992862592515e-06, + "loss": 0.8711, + "step": 26532 + }, + { + "epoch": 0.68, + "learning_rate": 1.8038828285216048e-06, + "loss": 0.7412, + "step": 26533 + }, + { + "epoch": 0.68, + "learning_rate": 1.8038663701684617e-06, + "loss": 0.873, + "step": 26534 + }, + { + "epoch": 0.68, + "learning_rate": 1.8038499111998353e-06, + "loss": 0.999, + "step": 26535 + }, + { + "epoch": 0.68, + "learning_rate": 1.803833451615738e-06, + "loss": 0.8428, + "step": 26536 + }, + { + "epoch": 0.68, + "learning_rate": 1.8038169914161823e-06, + "loss": 0.585, + "step": 26537 + }, + { + "epoch": 0.68, + "learning_rate": 1.803800530601181e-06, + "loss": 0.8774, + "step": 26538 + }, + { + "epoch": 0.68, + "learning_rate": 1.8037840691707465e-06, + "loss": 0.9902, + "step": 26539 + }, + { + "epoch": 0.68, + "learning_rate": 1.8037676071248915e-06, + "loss": 1.0166, + "step": 26540 + }, + { + "epoch": 0.68, + "learning_rate": 1.8037511444636286e-06, + "loss": 0.8955, + "step": 26541 + }, + { + "epoch": 0.68, + "learning_rate": 1.8037346811869704e-06, + "loss": 0.8125, + "step": 26542 + }, + { + "epoch": 0.68, + "learning_rate": 1.8037182172949294e-06, + "loss": 0.8569, + "step": 26543 + }, + { + "epoch": 0.68, + "learning_rate": 1.8037017527875187e-06, + "loss": 0.8379, + "step": 26544 + }, + { + "epoch": 0.68, + "learning_rate": 1.80368528766475e-06, + "loss": 0.96, + "step": 26545 + }, + { + "epoch": 0.68, + "learning_rate": 1.803668821926637e-06, + "loss": 0.793, + "step": 26546 + }, + { + "epoch": 0.68, + "learning_rate": 1.8036523555731913e-06, + "loss": 0.6216, + "step": 26547 + }, + { + "epoch": 0.68, + "learning_rate": 1.8036358886044263e-06, + "loss": 0.5903, + "step": 26548 + }, + { + "epoch": 0.68, + "learning_rate": 1.803619421020354e-06, + "loss": 0.8428, + "step": 26549 + }, + { + "epoch": 0.68, + "learning_rate": 1.803602952820987e-06, + "loss": 0.5652, + "step": 26550 + }, + { + "epoch": 0.68, + "learning_rate": 1.8035864840063386e-06, + "loss": 0.6675, + "step": 26551 + }, + { + "epoch": 0.68, + "learning_rate": 1.803570014576421e-06, + "loss": 0.646, + "step": 26552 + }, + { + "epoch": 0.68, + "learning_rate": 1.8035535445312466e-06, + "loss": 0.9585, + "step": 26553 + }, + { + "epoch": 0.68, + "learning_rate": 1.8035370738708279e-06, + "loss": 1.0879, + "step": 26554 + }, + { + "epoch": 0.68, + "learning_rate": 1.8035206025951785e-06, + "loss": 0.52, + "step": 26555 + }, + { + "epoch": 0.68, + "learning_rate": 1.8035041307043097e-06, + "loss": 1.0029, + "step": 26556 + }, + { + "epoch": 0.68, + "learning_rate": 1.803487658198235e-06, + "loss": 0.6528, + "step": 26557 + }, + { + "epoch": 0.68, + "learning_rate": 1.803471185076967e-06, + "loss": 0.7939, + "step": 26558 + }, + { + "epoch": 0.68, + "learning_rate": 1.803454711340518e-06, + "loss": 0.7583, + "step": 26559 + }, + { + "epoch": 0.68, + "learning_rate": 1.8034382369889003e-06, + "loss": 0.9961, + "step": 26560 + }, + { + "epoch": 0.68, + "learning_rate": 1.8034217620221267e-06, + "loss": 1.0293, + "step": 26561 + }, + { + "epoch": 0.68, + "learning_rate": 1.8034052864402107e-06, + "loss": 0.8193, + "step": 26562 + }, + { + "epoch": 0.68, + "learning_rate": 1.8033888102431637e-06, + "loss": 0.7725, + "step": 26563 + }, + { + "epoch": 0.68, + "learning_rate": 1.8033723334309992e-06, + "loss": 0.7529, + "step": 26564 + }, + { + "epoch": 0.68, + "learning_rate": 1.803355856003729e-06, + "loss": 0.9893, + "step": 26565 + }, + { + "epoch": 0.68, + "learning_rate": 1.8033393779613667e-06, + "loss": 0.7676, + "step": 26566 + }, + { + "epoch": 0.68, + "learning_rate": 1.8033228993039238e-06, + "loss": 0.8066, + "step": 26567 + }, + { + "epoch": 0.68, + "learning_rate": 1.803306420031414e-06, + "loss": 0.6909, + "step": 26568 + }, + { + "epoch": 0.68, + "learning_rate": 1.803289940143849e-06, + "loss": 0.8691, + "step": 26569 + }, + { + "epoch": 0.68, + "learning_rate": 1.8032734596412422e-06, + "loss": 0.874, + "step": 26570 + }, + { + "epoch": 0.68, + "learning_rate": 1.8032569785236057e-06, + "loss": 0.8398, + "step": 26571 + }, + { + "epoch": 0.68, + "learning_rate": 1.803240496790952e-06, + "loss": 0.7573, + "step": 26572 + }, + { + "epoch": 0.68, + "learning_rate": 1.8032240144432943e-06, + "loss": 1.0273, + "step": 26573 + }, + { + "epoch": 0.68, + "learning_rate": 1.8032075314806447e-06, + "loss": 0.9473, + "step": 26574 + }, + { + "epoch": 0.68, + "learning_rate": 1.8031910479030163e-06, + "loss": 0.8975, + "step": 26575 + }, + { + "epoch": 0.68, + "learning_rate": 1.8031745637104213e-06, + "loss": 0.8535, + "step": 26576 + }, + { + "epoch": 0.68, + "learning_rate": 1.8031580789028725e-06, + "loss": 0.8003, + "step": 26577 + }, + { + "epoch": 0.68, + "learning_rate": 1.8031415934803824e-06, + "loss": 0.875, + "step": 26578 + }, + { + "epoch": 0.68, + "learning_rate": 1.8031251074429638e-06, + "loss": 0.6094, + "step": 26579 + }, + { + "epoch": 0.68, + "learning_rate": 1.8031086207906289e-06, + "loss": 0.5883, + "step": 26580 + }, + { + "epoch": 0.68, + "learning_rate": 1.8030921335233913e-06, + "loss": 0.9033, + "step": 26581 + }, + { + "epoch": 0.68, + "learning_rate": 1.8030756456412626e-06, + "loss": 0.834, + "step": 26582 + }, + { + "epoch": 0.68, + "learning_rate": 1.803059157144256e-06, + "loss": 1.0713, + "step": 26583 + }, + { + "epoch": 0.68, + "learning_rate": 1.8030426680323837e-06, + "loss": 0.6406, + "step": 26584 + }, + { + "epoch": 0.68, + "learning_rate": 1.8030261783056584e-06, + "loss": 0.915, + "step": 26585 + }, + { + "epoch": 0.68, + "learning_rate": 1.803009687964093e-06, + "loss": 0.6758, + "step": 26586 + }, + { + "epoch": 0.68, + "learning_rate": 1.8029931970077e-06, + "loss": 0.7314, + "step": 26587 + }, + { + "epoch": 0.68, + "learning_rate": 1.8029767054364924e-06, + "loss": 0.6099, + "step": 26588 + }, + { + "epoch": 0.68, + "learning_rate": 1.8029602132504822e-06, + "loss": 0.5947, + "step": 26589 + }, + { + "epoch": 0.68, + "learning_rate": 1.8029437204496823e-06, + "loss": 0.877, + "step": 26590 + }, + { + "epoch": 0.68, + "learning_rate": 1.8029272270341053e-06, + "loss": 0.834, + "step": 26591 + }, + { + "epoch": 0.68, + "learning_rate": 1.8029107330037638e-06, + "loss": 0.8838, + "step": 26592 + }, + { + "epoch": 0.68, + "learning_rate": 1.8028942383586708e-06, + "loss": 0.8525, + "step": 26593 + }, + { + "epoch": 0.68, + "learning_rate": 1.802877743098838e-06, + "loss": 0.8652, + "step": 26594 + }, + { + "epoch": 0.68, + "learning_rate": 1.802861247224279e-06, + "loss": 0.8398, + "step": 26595 + }, + { + "epoch": 0.68, + "learning_rate": 1.8028447507350059e-06, + "loss": 0.9531, + "step": 26596 + }, + { + "epoch": 0.68, + "learning_rate": 1.8028282536310315e-06, + "loss": 0.791, + "step": 26597 + }, + { + "epoch": 0.68, + "learning_rate": 1.8028117559123687e-06, + "loss": 0.8799, + "step": 26598 + }, + { + "epoch": 0.68, + "learning_rate": 1.8027952575790298e-06, + "loss": 0.7866, + "step": 26599 + }, + { + "epoch": 0.68, + "learning_rate": 1.8027787586310272e-06, + "loss": 0.8652, + "step": 26600 + }, + { + "epoch": 0.68, + "learning_rate": 1.802762259068374e-06, + "loss": 0.6741, + "step": 26601 + }, + { + "epoch": 0.68, + "learning_rate": 1.8027457588910826e-06, + "loss": 1.0547, + "step": 26602 + }, + { + "epoch": 0.68, + "learning_rate": 1.8027292580991657e-06, + "loss": 0.8252, + "step": 26603 + }, + { + "epoch": 0.68, + "learning_rate": 1.8027127566926358e-06, + "loss": 0.8203, + "step": 26604 + }, + { + "epoch": 0.68, + "learning_rate": 1.8026962546715056e-06, + "loss": 0.6934, + "step": 26605 + }, + { + "epoch": 0.68, + "learning_rate": 1.8026797520357881e-06, + "loss": 0.9053, + "step": 26606 + }, + { + "epoch": 0.68, + "learning_rate": 1.8026632487854956e-06, + "loss": 0.9443, + "step": 26607 + }, + { + "epoch": 0.68, + "learning_rate": 1.8026467449206406e-06, + "loss": 0.915, + "step": 26608 + }, + { + "epoch": 0.68, + "learning_rate": 1.8026302404412359e-06, + "loss": 0.8506, + "step": 26609 + }, + { + "epoch": 0.68, + "learning_rate": 1.8026137353472942e-06, + "loss": 0.7695, + "step": 26610 + }, + { + "epoch": 0.68, + "learning_rate": 1.802597229638828e-06, + "loss": 0.7422, + "step": 26611 + }, + { + "epoch": 0.68, + "learning_rate": 1.80258072331585e-06, + "loss": 0.9707, + "step": 26612 + }, + { + "epoch": 0.68, + "learning_rate": 1.802564216378373e-06, + "loss": 0.8037, + "step": 26613 + }, + { + "epoch": 0.68, + "learning_rate": 1.8025477088264091e-06, + "loss": 0.7539, + "step": 26614 + }, + { + "epoch": 0.68, + "learning_rate": 1.8025312006599719e-06, + "loss": 0.877, + "step": 26615 + }, + { + "epoch": 0.68, + "learning_rate": 1.802514691879073e-06, + "loss": 0.8799, + "step": 26616 + }, + { + "epoch": 0.68, + "learning_rate": 1.8024981824837258e-06, + "loss": 0.9697, + "step": 26617 + }, + { + "epoch": 0.68, + "learning_rate": 1.8024816724739424e-06, + "loss": 0.8115, + "step": 26618 + }, + { + "epoch": 0.68, + "learning_rate": 1.8024651618497354e-06, + "loss": 0.7607, + "step": 26619 + }, + { + "epoch": 0.68, + "learning_rate": 1.8024486506111184e-06, + "loss": 0.9482, + "step": 26620 + }, + { + "epoch": 0.68, + "learning_rate": 1.802432138758103e-06, + "loss": 0.7837, + "step": 26621 + }, + { + "epoch": 0.68, + "learning_rate": 1.8024156262907022e-06, + "loss": 0.9033, + "step": 26622 + }, + { + "epoch": 0.68, + "learning_rate": 1.8023991132089287e-06, + "loss": 0.8848, + "step": 26623 + }, + { + "epoch": 0.68, + "learning_rate": 1.802382599512795e-06, + "loss": 0.8213, + "step": 26624 + }, + { + "epoch": 0.68, + "learning_rate": 1.8023660852023142e-06, + "loss": 0.7612, + "step": 26625 + }, + { + "epoch": 0.68, + "learning_rate": 1.8023495702774983e-06, + "loss": 0.5889, + "step": 26626 + }, + { + "epoch": 0.68, + "learning_rate": 1.8023330547383602e-06, + "loss": 0.9541, + "step": 26627 + }, + { + "epoch": 0.68, + "learning_rate": 1.8023165385849126e-06, + "loss": 0.6699, + "step": 26628 + }, + { + "epoch": 0.68, + "learning_rate": 1.8023000218171683e-06, + "loss": 0.9082, + "step": 26629 + }, + { + "epoch": 0.68, + "learning_rate": 1.8022835044351394e-06, + "loss": 0.9199, + "step": 26630 + }, + { + "epoch": 0.68, + "learning_rate": 1.8022669864388393e-06, + "loss": 0.749, + "step": 26631 + }, + { + "epoch": 0.68, + "learning_rate": 1.80225046782828e-06, + "loss": 1.0713, + "step": 26632 + }, + { + "epoch": 0.68, + "learning_rate": 1.8022339486034745e-06, + "loss": 0.8174, + "step": 26633 + }, + { + "epoch": 0.68, + "learning_rate": 1.8022174287644354e-06, + "loss": 1.1494, + "step": 26634 + }, + { + "epoch": 0.68, + "learning_rate": 1.8022009083111751e-06, + "loss": 0.9619, + "step": 26635 + }, + { + "epoch": 0.68, + "learning_rate": 1.8021843872437067e-06, + "loss": 0.8799, + "step": 26636 + }, + { + "epoch": 0.68, + "learning_rate": 1.8021678655620424e-06, + "loss": 0.7861, + "step": 26637 + }, + { + "epoch": 0.68, + "learning_rate": 1.8021513432661952e-06, + "loss": 0.709, + "step": 26638 + }, + { + "epoch": 0.68, + "learning_rate": 1.8021348203561777e-06, + "loss": 0.7656, + "step": 26639 + }, + { + "epoch": 0.68, + "learning_rate": 1.802118296832002e-06, + "loss": 0.7461, + "step": 26640 + }, + { + "epoch": 0.68, + "learning_rate": 1.8021017726936816e-06, + "loss": 0.7744, + "step": 26641 + }, + { + "epoch": 0.68, + "learning_rate": 1.8020852479412288e-06, + "loss": 0.7588, + "step": 26642 + }, + { + "epoch": 0.68, + "learning_rate": 1.8020687225746559e-06, + "loss": 0.835, + "step": 26643 + }, + { + "epoch": 0.68, + "learning_rate": 1.8020521965939758e-06, + "loss": 0.873, + "step": 26644 + }, + { + "epoch": 0.68, + "learning_rate": 1.8020356699992013e-06, + "loss": 0.9316, + "step": 26645 + }, + { + "epoch": 0.68, + "learning_rate": 1.8020191427903453e-06, + "loss": 0.6826, + "step": 26646 + }, + { + "epoch": 0.68, + "learning_rate": 1.8020026149674199e-06, + "loss": 0.6274, + "step": 26647 + }, + { + "epoch": 0.68, + "learning_rate": 1.801986086530438e-06, + "loss": 0.8643, + "step": 26648 + }, + { + "epoch": 0.68, + "learning_rate": 1.8019695574794125e-06, + "loss": 0.9805, + "step": 26649 + }, + { + "epoch": 0.68, + "learning_rate": 1.8019530278143553e-06, + "loss": 0.8013, + "step": 26650 + }, + { + "epoch": 0.68, + "learning_rate": 1.8019364975352797e-06, + "loss": 1.0654, + "step": 26651 + }, + { + "epoch": 0.68, + "learning_rate": 1.8019199666421984e-06, + "loss": 0.958, + "step": 26652 + }, + { + "epoch": 0.68, + "learning_rate": 1.8019034351351237e-06, + "loss": 0.6455, + "step": 26653 + }, + { + "epoch": 0.68, + "learning_rate": 1.8018869030140685e-06, + "loss": 0.8746, + "step": 26654 + }, + { + "epoch": 0.68, + "learning_rate": 1.8018703702790452e-06, + "loss": 0.812, + "step": 26655 + }, + { + "epoch": 0.68, + "learning_rate": 1.8018538369300666e-06, + "loss": 0.8721, + "step": 26656 + }, + { + "epoch": 0.68, + "learning_rate": 1.8018373029671454e-06, + "loss": 0.9209, + "step": 26657 + }, + { + "epoch": 0.68, + "learning_rate": 1.8018207683902946e-06, + "loss": 0.874, + "step": 26658 + }, + { + "epoch": 0.68, + "learning_rate": 1.801804233199526e-06, + "loss": 0.6738, + "step": 26659 + }, + { + "epoch": 0.68, + "learning_rate": 1.801787697394853e-06, + "loss": 0.7334, + "step": 26660 + }, + { + "epoch": 0.68, + "learning_rate": 1.8017711609762883e-06, + "loss": 0.5825, + "step": 26661 + }, + { + "epoch": 0.68, + "learning_rate": 1.8017546239438438e-06, + "loss": 0.8003, + "step": 26662 + }, + { + "epoch": 0.68, + "learning_rate": 1.801738086297533e-06, + "loss": 0.793, + "step": 26663 + }, + { + "epoch": 0.68, + "learning_rate": 1.801721548037368e-06, + "loss": 1.0146, + "step": 26664 + }, + { + "epoch": 0.68, + "learning_rate": 1.8017050091633616e-06, + "loss": 0.6589, + "step": 26665 + }, + { + "epoch": 0.68, + "learning_rate": 1.8016884696755268e-06, + "loss": 0.9268, + "step": 26666 + }, + { + "epoch": 0.68, + "learning_rate": 1.801671929573876e-06, + "loss": 0.8838, + "step": 26667 + }, + { + "epoch": 0.68, + "learning_rate": 1.8016553888584217e-06, + "loss": 0.7236, + "step": 26668 + }, + { + "epoch": 0.68, + "learning_rate": 1.8016388475291769e-06, + "loss": 0.9648, + "step": 26669 + }, + { + "epoch": 0.68, + "learning_rate": 1.8016223055861542e-06, + "loss": 0.9766, + "step": 26670 + }, + { + "epoch": 0.68, + "learning_rate": 1.8016057630293657e-06, + "loss": 0.8208, + "step": 26671 + }, + { + "epoch": 0.68, + "learning_rate": 1.8015892198588247e-06, + "loss": 0.9224, + "step": 26672 + }, + { + "epoch": 0.68, + "learning_rate": 1.801572676074544e-06, + "loss": 0.8389, + "step": 26673 + }, + { + "epoch": 0.68, + "learning_rate": 1.8015561316765356e-06, + "loss": 0.6396, + "step": 26674 + }, + { + "epoch": 0.68, + "learning_rate": 1.8015395866648127e-06, + "loss": 0.7109, + "step": 26675 + }, + { + "epoch": 0.68, + "learning_rate": 1.8015230410393877e-06, + "loss": 0.748, + "step": 26676 + }, + { + "epoch": 0.68, + "learning_rate": 1.8015064948002734e-06, + "loss": 0.5356, + "step": 26677 + }, + { + "epoch": 0.68, + "learning_rate": 1.8014899479474825e-06, + "loss": 0.7139, + "step": 26678 + }, + { + "epoch": 0.68, + "learning_rate": 1.8014734004810276e-06, + "loss": 1.04, + "step": 26679 + }, + { + "epoch": 0.68, + "learning_rate": 1.8014568524009212e-06, + "loss": 0.7861, + "step": 26680 + }, + { + "epoch": 0.68, + "learning_rate": 1.8014403037071764e-06, + "loss": 0.9443, + "step": 26681 + }, + { + "epoch": 0.68, + "learning_rate": 1.8014237543998055e-06, + "loss": 0.9932, + "step": 26682 + }, + { + "epoch": 0.68, + "learning_rate": 1.801407204478821e-06, + "loss": 0.7236, + "step": 26683 + }, + { + "epoch": 0.68, + "learning_rate": 1.8013906539442362e-06, + "loss": 0.7686, + "step": 26684 + }, + { + "epoch": 0.68, + "learning_rate": 1.8013741027960635e-06, + "loss": 0.8369, + "step": 26685 + }, + { + "epoch": 0.68, + "learning_rate": 1.8013575510343153e-06, + "loss": 0.8972, + "step": 26686 + }, + { + "epoch": 0.68, + "learning_rate": 1.8013409986590044e-06, + "loss": 0.8232, + "step": 26687 + }, + { + "epoch": 0.68, + "learning_rate": 1.8013244456701435e-06, + "loss": 0.9561, + "step": 26688 + }, + { + "epoch": 0.68, + "learning_rate": 1.8013078920677455e-06, + "loss": 0.8359, + "step": 26689 + }, + { + "epoch": 0.68, + "learning_rate": 1.801291337851823e-06, + "loss": 0.9473, + "step": 26690 + }, + { + "epoch": 0.68, + "learning_rate": 1.8012747830223885e-06, + "loss": 1.0068, + "step": 26691 + }, + { + "epoch": 0.68, + "learning_rate": 1.8012582275794546e-06, + "loss": 0.9424, + "step": 26692 + }, + { + "epoch": 0.68, + "learning_rate": 1.801241671523034e-06, + "loss": 1.0107, + "step": 26693 + }, + { + "epoch": 0.68, + "learning_rate": 1.80122511485314e-06, + "loss": 0.9443, + "step": 26694 + }, + { + "epoch": 0.68, + "learning_rate": 1.8012085575697845e-06, + "loss": 1.0439, + "step": 26695 + }, + { + "epoch": 0.68, + "learning_rate": 1.80119199967298e-06, + "loss": 0.874, + "step": 26696 + }, + { + "epoch": 0.68, + "learning_rate": 1.8011754411627402e-06, + "loss": 1.0723, + "step": 26697 + }, + { + "epoch": 0.68, + "learning_rate": 1.801158882039077e-06, + "loss": 0.7764, + "step": 26698 + }, + { + "epoch": 0.68, + "learning_rate": 1.8011423223020032e-06, + "loss": 0.8477, + "step": 26699 + }, + { + "epoch": 0.68, + "learning_rate": 1.8011257619515318e-06, + "loss": 0.7612, + "step": 26700 + }, + { + "epoch": 0.68, + "learning_rate": 1.801109200987675e-06, + "loss": 0.8604, + "step": 26701 + }, + { + "epoch": 0.68, + "learning_rate": 1.801092639410446e-06, + "loss": 0.876, + "step": 26702 + }, + { + "epoch": 0.68, + "learning_rate": 1.8010760772198569e-06, + "loss": 0.8418, + "step": 26703 + }, + { + "epoch": 0.68, + "learning_rate": 1.8010595144159208e-06, + "loss": 0.7402, + "step": 26704 + }, + { + "epoch": 0.68, + "learning_rate": 1.8010429509986503e-06, + "loss": 0.7183, + "step": 26705 + }, + { + "epoch": 0.68, + "learning_rate": 1.801026386968058e-06, + "loss": 1.0635, + "step": 26706 + }, + { + "epoch": 0.68, + "learning_rate": 1.8010098223241568e-06, + "loss": 0.7241, + "step": 26707 + }, + { + "epoch": 0.68, + "learning_rate": 1.8009932570669588e-06, + "loss": 0.9727, + "step": 26708 + }, + { + "epoch": 0.68, + "learning_rate": 1.8009766911964772e-06, + "loss": 0.9502, + "step": 26709 + }, + { + "epoch": 0.68, + "learning_rate": 1.8009601247127248e-06, + "loss": 0.8921, + "step": 26710 + }, + { + "epoch": 0.68, + "learning_rate": 1.800943557615714e-06, + "loss": 0.8545, + "step": 26711 + }, + { + "epoch": 0.68, + "learning_rate": 1.8009269899054576e-06, + "loss": 0.873, + "step": 26712 + }, + { + "epoch": 0.68, + "learning_rate": 1.8009104215819684e-06, + "loss": 0.8359, + "step": 26713 + }, + { + "epoch": 0.68, + "learning_rate": 1.8008938526452586e-06, + "loss": 0.999, + "step": 26714 + }, + { + "epoch": 0.68, + "learning_rate": 1.8008772830953412e-06, + "loss": 0.8975, + "step": 26715 + }, + { + "epoch": 0.68, + "learning_rate": 1.8008607129322288e-06, + "loss": 0.8667, + "step": 26716 + }, + { + "epoch": 0.68, + "learning_rate": 1.8008441421559345e-06, + "loss": 0.8721, + "step": 26717 + }, + { + "epoch": 0.68, + "learning_rate": 1.8008275707664704e-06, + "loss": 0.7705, + "step": 26718 + }, + { + "epoch": 0.68, + "learning_rate": 1.8008109987638495e-06, + "loss": 0.8838, + "step": 26719 + }, + { + "epoch": 0.68, + "learning_rate": 1.8007944261480847e-06, + "loss": 1.0303, + "step": 26720 + }, + { + "epoch": 0.68, + "learning_rate": 1.8007778529191882e-06, + "loss": 0.8877, + "step": 26721 + }, + { + "epoch": 0.68, + "learning_rate": 1.800761279077173e-06, + "loss": 0.9639, + "step": 26722 + }, + { + "epoch": 0.68, + "learning_rate": 1.8007447046220516e-06, + "loss": 1.0488, + "step": 26723 + }, + { + "epoch": 0.68, + "learning_rate": 1.8007281295538368e-06, + "loss": 0.9561, + "step": 26724 + }, + { + "epoch": 0.68, + "learning_rate": 1.8007115538725416e-06, + "loss": 0.8575, + "step": 26725 + }, + { + "epoch": 0.69, + "learning_rate": 1.8006949775781782e-06, + "loss": 0.8047, + "step": 26726 + }, + { + "epoch": 0.69, + "learning_rate": 1.8006784006707592e-06, + "loss": 0.8701, + "step": 26727 + }, + { + "epoch": 0.69, + "learning_rate": 1.8006618231502978e-06, + "loss": 0.8428, + "step": 26728 + }, + { + "epoch": 0.69, + "learning_rate": 1.8006452450168065e-06, + "loss": 1.0518, + "step": 26729 + }, + { + "epoch": 0.69, + "learning_rate": 1.800628666270298e-06, + "loss": 0.8281, + "step": 26730 + }, + { + "epoch": 0.69, + "learning_rate": 1.8006120869107846e-06, + "loss": 1.1143, + "step": 26731 + }, + { + "epoch": 0.69, + "learning_rate": 1.8005955069382798e-06, + "loss": 0.6143, + "step": 26732 + }, + { + "epoch": 0.69, + "learning_rate": 1.8005789263527955e-06, + "loss": 1.0088, + "step": 26733 + }, + { + "epoch": 0.69, + "learning_rate": 1.8005623451543447e-06, + "loss": 0.9092, + "step": 26734 + }, + { + "epoch": 0.69, + "learning_rate": 1.8005457633429404e-06, + "loss": 0.9277, + "step": 26735 + }, + { + "epoch": 0.69, + "learning_rate": 1.8005291809185947e-06, + "loss": 0.8037, + "step": 26736 + }, + { + "epoch": 0.69, + "learning_rate": 1.8005125978813206e-06, + "loss": 0.9707, + "step": 26737 + }, + { + "epoch": 0.69, + "learning_rate": 1.8004960142311313e-06, + "loss": 0.5767, + "step": 26738 + }, + { + "epoch": 0.69, + "learning_rate": 1.8004794299680386e-06, + "loss": 0.9099, + "step": 26739 + }, + { + "epoch": 0.69, + "learning_rate": 1.8004628450920557e-06, + "loss": 0.9761, + "step": 26740 + }, + { + "epoch": 0.69, + "learning_rate": 1.8004462596031954e-06, + "loss": 0.7598, + "step": 26741 + }, + { + "epoch": 0.69, + "learning_rate": 1.8004296735014699e-06, + "loss": 0.7607, + "step": 26742 + }, + { + "epoch": 0.69, + "learning_rate": 1.8004130867868923e-06, + "loss": 0.8994, + "step": 26743 + }, + { + "epoch": 0.69, + "learning_rate": 1.8003964994594752e-06, + "loss": 0.7871, + "step": 26744 + }, + { + "epoch": 0.69, + "learning_rate": 1.8003799115192314e-06, + "loss": 0.9609, + "step": 26745 + }, + { + "epoch": 0.69, + "learning_rate": 1.8003633229661735e-06, + "loss": 0.7539, + "step": 26746 + }, + { + "epoch": 0.69, + "learning_rate": 1.800346733800314e-06, + "loss": 0.8203, + "step": 26747 + }, + { + "epoch": 0.69, + "learning_rate": 1.800330144021666e-06, + "loss": 0.8018, + "step": 26748 + }, + { + "epoch": 0.69, + "learning_rate": 1.8003135536302421e-06, + "loss": 0.7534, + "step": 26749 + }, + { + "epoch": 0.69, + "learning_rate": 1.8002969626260547e-06, + "loss": 0.7339, + "step": 26750 + }, + { + "epoch": 0.69, + "learning_rate": 1.8002803710091166e-06, + "loss": 0.999, + "step": 26751 + }, + { + "epoch": 0.69, + "learning_rate": 1.800263778779441e-06, + "loss": 1.043, + "step": 26752 + }, + { + "epoch": 0.69, + "learning_rate": 1.80024718593704e-06, + "loss": 0.9922, + "step": 26753 + }, + { + "epoch": 0.69, + "learning_rate": 1.8002305924819265e-06, + "loss": 0.6807, + "step": 26754 + }, + { + "epoch": 0.69, + "learning_rate": 1.8002139984141135e-06, + "loss": 0.7021, + "step": 26755 + }, + { + "epoch": 0.69, + "learning_rate": 1.800197403733613e-06, + "loss": 0.7607, + "step": 26756 + }, + { + "epoch": 0.69, + "learning_rate": 1.8001808084404383e-06, + "loss": 1.0488, + "step": 26757 + }, + { + "epoch": 0.69, + "learning_rate": 1.800164212534602e-06, + "loss": 0.5344, + "step": 26758 + }, + { + "epoch": 0.69, + "learning_rate": 1.8001476160161166e-06, + "loss": 0.8467, + "step": 26759 + }, + { + "epoch": 0.69, + "learning_rate": 1.8001310188849953e-06, + "loss": 0.7583, + "step": 26760 + }, + { + "epoch": 0.69, + "learning_rate": 1.8001144211412504e-06, + "loss": 0.8018, + "step": 26761 + }, + { + "epoch": 0.69, + "learning_rate": 1.8000978227848945e-06, + "loss": 1.0205, + "step": 26762 + }, + { + "epoch": 0.69, + "learning_rate": 1.8000812238159404e-06, + "loss": 1.001, + "step": 26763 + }, + { + "epoch": 0.69, + "learning_rate": 1.8000646242344013e-06, + "loss": 0.9697, + "step": 26764 + }, + { + "epoch": 0.69, + "learning_rate": 1.8000480240402892e-06, + "loss": 1.0449, + "step": 26765 + }, + { + "epoch": 0.69, + "learning_rate": 1.800031423233617e-06, + "loss": 0.8867, + "step": 26766 + }, + { + "epoch": 0.69, + "learning_rate": 1.8000148218143978e-06, + "loss": 0.8604, + "step": 26767 + }, + { + "epoch": 0.69, + "learning_rate": 1.799998219782644e-06, + "loss": 0.6729, + "step": 26768 + }, + { + "epoch": 0.69, + "learning_rate": 1.7999816171383682e-06, + "loss": 1.0283, + "step": 26769 + }, + { + "epoch": 0.69, + "learning_rate": 1.7999650138815834e-06, + "loss": 0.6274, + "step": 26770 + }, + { + "epoch": 0.69, + "learning_rate": 1.799948410012302e-06, + "loss": 0.6299, + "step": 26771 + }, + { + "epoch": 0.69, + "learning_rate": 1.799931805530537e-06, + "loss": 0.8926, + "step": 26772 + }, + { + "epoch": 0.69, + "learning_rate": 1.7999152004363012e-06, + "loss": 0.7568, + "step": 26773 + }, + { + "epoch": 0.69, + "learning_rate": 1.7998985947296068e-06, + "loss": 1.1191, + "step": 26774 + }, + { + "epoch": 0.69, + "learning_rate": 1.7998819884104669e-06, + "loss": 0.7808, + "step": 26775 + }, + { + "epoch": 0.69, + "learning_rate": 1.7998653814788942e-06, + "loss": 0.835, + "step": 26776 + }, + { + "epoch": 0.69, + "learning_rate": 1.7998487739349013e-06, + "loss": 0.918, + "step": 26777 + }, + { + "epoch": 0.69, + "learning_rate": 1.799832165778501e-06, + "loss": 0.8848, + "step": 26778 + }, + { + "epoch": 0.69, + "learning_rate": 1.799815557009706e-06, + "loss": 0.7112, + "step": 26779 + }, + { + "epoch": 0.69, + "learning_rate": 1.799798947628529e-06, + "loss": 1.0391, + "step": 26780 + }, + { + "epoch": 0.69, + "learning_rate": 1.7997823376349828e-06, + "loss": 0.9189, + "step": 26781 + }, + { + "epoch": 0.69, + "learning_rate": 1.79976572702908e-06, + "loss": 0.9932, + "step": 26782 + }, + { + "epoch": 0.69, + "learning_rate": 1.7997491158108332e-06, + "loss": 0.8652, + "step": 26783 + }, + { + "epoch": 0.69, + "learning_rate": 1.7997325039802553e-06, + "loss": 0.9053, + "step": 26784 + }, + { + "epoch": 0.69, + "learning_rate": 1.7997158915373594e-06, + "loss": 0.7559, + "step": 26785 + }, + { + "epoch": 0.69, + "learning_rate": 1.7996992784821572e-06, + "loss": 0.7388, + "step": 26786 + }, + { + "epoch": 0.69, + "learning_rate": 1.7996826648146626e-06, + "loss": 0.8486, + "step": 26787 + }, + { + "epoch": 0.69, + "learning_rate": 1.7996660505348873e-06, + "loss": 0.9268, + "step": 26788 + }, + { + "epoch": 0.69, + "learning_rate": 1.7996494356428446e-06, + "loss": 0.7588, + "step": 26789 + }, + { + "epoch": 0.69, + "learning_rate": 1.7996328201385472e-06, + "loss": 0.7783, + "step": 26790 + }, + { + "epoch": 0.69, + "learning_rate": 1.7996162040220078e-06, + "loss": 0.9365, + "step": 26791 + }, + { + "epoch": 0.69, + "learning_rate": 1.7995995872932388e-06, + "loss": 0.8125, + "step": 26792 + }, + { + "epoch": 0.69, + "learning_rate": 1.7995829699522533e-06, + "loss": 0.8081, + "step": 26793 + }, + { + "epoch": 0.69, + "learning_rate": 1.799566351999064e-06, + "loss": 0.9004, + "step": 26794 + }, + { + "epoch": 0.69, + "learning_rate": 1.7995497334336834e-06, + "loss": 0.8994, + "step": 26795 + }, + { + "epoch": 0.69, + "learning_rate": 1.7995331142561243e-06, + "loss": 0.8501, + "step": 26796 + }, + { + "epoch": 0.69, + "learning_rate": 1.7995164944663994e-06, + "loss": 0.8994, + "step": 26797 + }, + { + "epoch": 0.69, + "learning_rate": 1.7994998740645215e-06, + "loss": 0.8379, + "step": 26798 + }, + { + "epoch": 0.69, + "learning_rate": 1.7994832530505033e-06, + "loss": 0.7344, + "step": 26799 + }, + { + "epoch": 0.69, + "learning_rate": 1.7994666314243576e-06, + "loss": 0.8457, + "step": 26800 + }, + { + "epoch": 0.69, + "learning_rate": 1.7994500091860969e-06, + "loss": 0.7734, + "step": 26801 + }, + { + "epoch": 0.69, + "learning_rate": 1.7994333863357345e-06, + "loss": 0.9346, + "step": 26802 + }, + { + "epoch": 0.69, + "learning_rate": 1.7994167628732824e-06, + "loss": 0.7314, + "step": 26803 + }, + { + "epoch": 0.69, + "learning_rate": 1.7994001387987537e-06, + "loss": 0.9238, + "step": 26804 + }, + { + "epoch": 0.69, + "learning_rate": 1.799383514112161e-06, + "loss": 0.7734, + "step": 26805 + }, + { + "epoch": 0.69, + "learning_rate": 1.7993668888135172e-06, + "loss": 0.7944, + "step": 26806 + }, + { + "epoch": 0.69, + "learning_rate": 1.799350262902835e-06, + "loss": 0.8125, + "step": 26807 + }, + { + "epoch": 0.69, + "learning_rate": 1.799333636380127e-06, + "loss": 0.8496, + "step": 26808 + }, + { + "epoch": 0.69, + "learning_rate": 1.7993170092454058e-06, + "loss": 0.7178, + "step": 26809 + }, + { + "epoch": 0.69, + "learning_rate": 1.7993003814986844e-06, + "loss": 0.8916, + "step": 26810 + }, + { + "epoch": 0.69, + "learning_rate": 1.7992837531399757e-06, + "loss": 0.8242, + "step": 26811 + }, + { + "epoch": 0.69, + "learning_rate": 1.799267124169292e-06, + "loss": 0.5588, + "step": 26812 + }, + { + "epoch": 0.69, + "learning_rate": 1.799250494586646e-06, + "loss": 1.0801, + "step": 26813 + }, + { + "epoch": 0.69, + "learning_rate": 1.7992338643920508e-06, + "loss": 0.7959, + "step": 26814 + }, + { + "epoch": 0.69, + "learning_rate": 1.7992172335855194e-06, + "loss": 1.0088, + "step": 26815 + }, + { + "epoch": 0.69, + "learning_rate": 1.7992006021670636e-06, + "loss": 0.6978, + "step": 26816 + }, + { + "epoch": 0.69, + "learning_rate": 1.7991839701366969e-06, + "loss": 0.959, + "step": 26817 + }, + { + "epoch": 0.69, + "learning_rate": 1.7991673374944316e-06, + "loss": 0.6069, + "step": 26818 + }, + { + "epoch": 0.69, + "learning_rate": 1.7991507042402808e-06, + "loss": 0.771, + "step": 26819 + }, + { + "epoch": 0.69, + "learning_rate": 1.7991340703742566e-06, + "loss": 0.7549, + "step": 26820 + }, + { + "epoch": 0.69, + "learning_rate": 1.7991174358963725e-06, + "loss": 0.7705, + "step": 26821 + }, + { + "epoch": 0.69, + "learning_rate": 1.7991008008066411e-06, + "loss": 0.6062, + "step": 26822 + }, + { + "epoch": 0.69, + "learning_rate": 1.799084165105075e-06, + "loss": 1.1152, + "step": 26823 + }, + { + "epoch": 0.69, + "learning_rate": 1.7990675287916866e-06, + "loss": 0.7915, + "step": 26824 + }, + { + "epoch": 0.69, + "learning_rate": 1.799050891866489e-06, + "loss": 0.8379, + "step": 26825 + }, + { + "epoch": 0.69, + "learning_rate": 1.799034254329495e-06, + "loss": 0.748, + "step": 26826 + }, + { + "epoch": 0.69, + "learning_rate": 1.799017616180717e-06, + "loss": 0.7461, + "step": 26827 + }, + { + "epoch": 0.69, + "learning_rate": 1.7990009774201683e-06, + "loss": 0.9492, + "step": 26828 + }, + { + "epoch": 0.69, + "learning_rate": 1.798984338047861e-06, + "loss": 0.874, + "step": 26829 + }, + { + "epoch": 0.69, + "learning_rate": 1.7989676980638082e-06, + "loss": 0.7188, + "step": 26830 + }, + { + "epoch": 0.69, + "learning_rate": 1.7989510574680224e-06, + "loss": 0.8135, + "step": 26831 + }, + { + "epoch": 0.69, + "learning_rate": 1.7989344162605168e-06, + "loss": 0.9648, + "step": 26832 + }, + { + "epoch": 0.69, + "learning_rate": 1.7989177744413037e-06, + "loss": 0.9961, + "step": 26833 + }, + { + "epoch": 0.69, + "learning_rate": 1.7989011320103962e-06, + "loss": 0.8271, + "step": 26834 + }, + { + "epoch": 0.69, + "learning_rate": 1.7988844889678068e-06, + "loss": 1.0176, + "step": 26835 + }, + { + "epoch": 0.69, + "learning_rate": 1.7988678453135479e-06, + "loss": 0.8955, + "step": 26836 + }, + { + "epoch": 0.69, + "learning_rate": 1.798851201047633e-06, + "loss": 0.8169, + "step": 26837 + }, + { + "epoch": 0.69, + "learning_rate": 1.798834556170074e-06, + "loss": 0.9189, + "step": 26838 + }, + { + "epoch": 0.69, + "learning_rate": 1.7988179106808847e-06, + "loss": 0.9873, + "step": 26839 + }, + { + "epoch": 0.69, + "learning_rate": 1.798801264580077e-06, + "loss": 0.655, + "step": 26840 + }, + { + "epoch": 0.69, + "learning_rate": 1.798784617867664e-06, + "loss": 0.8145, + "step": 26841 + }, + { + "epoch": 0.69, + "learning_rate": 1.7987679705436583e-06, + "loss": 1.0161, + "step": 26842 + }, + { + "epoch": 0.69, + "learning_rate": 1.7987513226080725e-06, + "loss": 0.6978, + "step": 26843 + }, + { + "epoch": 0.69, + "learning_rate": 1.7987346740609197e-06, + "loss": 0.748, + "step": 26844 + }, + { + "epoch": 0.69, + "learning_rate": 1.7987180249022127e-06, + "loss": 0.8564, + "step": 26845 + }, + { + "epoch": 0.69, + "learning_rate": 1.7987013751319638e-06, + "loss": 0.6763, + "step": 26846 + }, + { + "epoch": 0.69, + "learning_rate": 1.798684724750186e-06, + "loss": 0.8213, + "step": 26847 + }, + { + "epoch": 0.69, + "learning_rate": 1.798668073756892e-06, + "loss": 0.5027, + "step": 26848 + }, + { + "epoch": 0.69, + "learning_rate": 1.7986514221520945e-06, + "loss": 0.9385, + "step": 26849 + }, + { + "epoch": 0.69, + "learning_rate": 1.7986347699358065e-06, + "loss": 0.9355, + "step": 26850 + }, + { + "epoch": 0.69, + "learning_rate": 1.7986181171080405e-06, + "loss": 0.958, + "step": 26851 + }, + { + "epoch": 0.69, + "learning_rate": 1.7986014636688093e-06, + "loss": 0.8682, + "step": 26852 + }, + { + "epoch": 0.69, + "learning_rate": 1.7985848096181258e-06, + "loss": 0.8306, + "step": 26853 + }, + { + "epoch": 0.69, + "learning_rate": 1.7985681549560026e-06, + "loss": 0.8867, + "step": 26854 + }, + { + "epoch": 0.69, + "learning_rate": 1.7985514996824525e-06, + "loss": 0.9434, + "step": 26855 + }, + { + "epoch": 0.69, + "learning_rate": 1.7985348437974882e-06, + "loss": 0.7617, + "step": 26856 + }, + { + "epoch": 0.69, + "learning_rate": 1.7985181873011226e-06, + "loss": 0.8789, + "step": 26857 + }, + { + "epoch": 0.69, + "learning_rate": 1.7985015301933682e-06, + "loss": 0.8203, + "step": 26858 + }, + { + "epoch": 0.69, + "learning_rate": 1.7984848724742379e-06, + "loss": 1.1396, + "step": 26859 + }, + { + "epoch": 0.69, + "learning_rate": 1.7984682141437442e-06, + "loss": 1.0557, + "step": 26860 + }, + { + "epoch": 0.69, + "learning_rate": 1.7984515552019004e-06, + "loss": 0.9219, + "step": 26861 + }, + { + "epoch": 0.69, + "learning_rate": 1.7984348956487189e-06, + "loss": 0.6011, + "step": 26862 + }, + { + "epoch": 0.69, + "learning_rate": 1.7984182354842125e-06, + "loss": 1.0547, + "step": 26863 + }, + { + "epoch": 0.69, + "learning_rate": 1.798401574708394e-06, + "loss": 0.4355, + "step": 26864 + }, + { + "epoch": 0.69, + "learning_rate": 1.7983849133212762e-06, + "loss": 0.9619, + "step": 26865 + }, + { + "epoch": 0.69, + "learning_rate": 1.7983682513228717e-06, + "loss": 0.8877, + "step": 26866 + }, + { + "epoch": 0.69, + "learning_rate": 1.7983515887131934e-06, + "loss": 0.8975, + "step": 26867 + }, + { + "epoch": 0.69, + "learning_rate": 1.798334925492254e-06, + "loss": 0.8545, + "step": 26868 + }, + { + "epoch": 0.69, + "learning_rate": 1.7983182616600662e-06, + "loss": 1.0586, + "step": 26869 + }, + { + "epoch": 0.69, + "learning_rate": 1.7983015972166426e-06, + "loss": 0.9297, + "step": 26870 + }, + { + "epoch": 0.69, + "learning_rate": 1.7982849321619963e-06, + "loss": 1.0479, + "step": 26871 + }, + { + "epoch": 0.69, + "learning_rate": 1.79826826649614e-06, + "loss": 0.8975, + "step": 26872 + }, + { + "epoch": 0.69, + "learning_rate": 1.7982516002190865e-06, + "loss": 0.876, + "step": 26873 + }, + { + "epoch": 0.69, + "learning_rate": 1.7982349333308485e-06, + "loss": 0.7876, + "step": 26874 + }, + { + "epoch": 0.69, + "learning_rate": 1.7982182658314385e-06, + "loss": 0.9795, + "step": 26875 + }, + { + "epoch": 0.69, + "learning_rate": 1.7982015977208695e-06, + "loss": 0.6941, + "step": 26876 + }, + { + "epoch": 0.69, + "learning_rate": 1.7981849289991545e-06, + "loss": 0.9761, + "step": 26877 + }, + { + "epoch": 0.69, + "learning_rate": 1.7981682596663057e-06, + "loss": 0.8535, + "step": 26878 + }, + { + "epoch": 0.69, + "learning_rate": 1.7981515897223362e-06, + "loss": 0.5573, + "step": 26879 + }, + { + "epoch": 0.69, + "learning_rate": 1.7981349191672589e-06, + "loss": 0.8276, + "step": 26880 + }, + { + "epoch": 0.69, + "learning_rate": 1.7981182480010864e-06, + "loss": 0.876, + "step": 26881 + }, + { + "epoch": 0.69, + "learning_rate": 1.7981015762238312e-06, + "loss": 0.9131, + "step": 26882 + }, + { + "epoch": 0.69, + "learning_rate": 1.7980849038355067e-06, + "loss": 0.7739, + "step": 26883 + }, + { + "epoch": 0.69, + "learning_rate": 1.7980682308361248e-06, + "loss": 0.96, + "step": 26884 + }, + { + "epoch": 0.69, + "learning_rate": 1.7980515572256988e-06, + "loss": 0.687, + "step": 26885 + }, + { + "epoch": 0.69, + "learning_rate": 1.7980348830042417e-06, + "loss": 0.7891, + "step": 26886 + }, + { + "epoch": 0.69, + "learning_rate": 1.798018208171766e-06, + "loss": 0.7393, + "step": 26887 + }, + { + "epoch": 0.69, + "learning_rate": 1.7980015327282843e-06, + "loss": 0.7031, + "step": 26888 + }, + { + "epoch": 0.69, + "learning_rate": 1.7979848566738095e-06, + "loss": 0.9688, + "step": 26889 + }, + { + "epoch": 0.69, + "learning_rate": 1.7979681800083547e-06, + "loss": 0.8662, + "step": 26890 + }, + { + "epoch": 0.69, + "learning_rate": 1.7979515027319318e-06, + "loss": 0.7373, + "step": 26891 + }, + { + "epoch": 0.69, + "learning_rate": 1.7979348248445544e-06, + "loss": 0.9424, + "step": 26892 + }, + { + "epoch": 0.69, + "learning_rate": 1.7979181463462352e-06, + "loss": 0.9375, + "step": 26893 + }, + { + "epoch": 0.69, + "learning_rate": 1.7979014672369868e-06, + "loss": 0.6829, + "step": 26894 + }, + { + "epoch": 0.69, + "learning_rate": 1.7978847875168218e-06, + "loss": 0.9629, + "step": 26895 + }, + { + "epoch": 0.69, + "learning_rate": 1.7978681071857528e-06, + "loss": 1.0615, + "step": 26896 + }, + { + "epoch": 0.69, + "learning_rate": 1.7978514262437932e-06, + "loss": 0.9639, + "step": 26897 + }, + { + "epoch": 0.69, + "learning_rate": 1.7978347446909555e-06, + "loss": 0.8545, + "step": 26898 + }, + { + "epoch": 0.69, + "learning_rate": 1.797818062527252e-06, + "loss": 0.8799, + "step": 26899 + }, + { + "epoch": 0.69, + "learning_rate": 1.7978013797526963e-06, + "loss": 0.7285, + "step": 26900 + }, + { + "epoch": 0.69, + "learning_rate": 1.7977846963673007e-06, + "loss": 0.7319, + "step": 26901 + }, + { + "epoch": 0.69, + "learning_rate": 1.797768012371078e-06, + "loss": 0.7041, + "step": 26902 + }, + { + "epoch": 0.69, + "learning_rate": 1.797751327764041e-06, + "loss": 1.0605, + "step": 26903 + }, + { + "epoch": 0.69, + "learning_rate": 1.7977346425462025e-06, + "loss": 1.0146, + "step": 26904 + }, + { + "epoch": 0.69, + "learning_rate": 1.7977179567175753e-06, + "loss": 1.0059, + "step": 26905 + }, + { + "epoch": 0.69, + "learning_rate": 1.7977012702781723e-06, + "loss": 1.0781, + "step": 26906 + }, + { + "epoch": 0.69, + "learning_rate": 1.7976845832280056e-06, + "loss": 0.9922, + "step": 26907 + }, + { + "epoch": 0.69, + "learning_rate": 1.797667895567089e-06, + "loss": 0.8291, + "step": 26908 + }, + { + "epoch": 0.69, + "learning_rate": 1.7976512072954344e-06, + "loss": 0.8921, + "step": 26909 + }, + { + "epoch": 0.69, + "learning_rate": 1.797634518413055e-06, + "loss": 0.9668, + "step": 26910 + }, + { + "epoch": 0.69, + "learning_rate": 1.797617828919964e-06, + "loss": 0.5967, + "step": 26911 + }, + { + "epoch": 0.69, + "learning_rate": 1.797601138816173e-06, + "loss": 0.793, + "step": 26912 + }, + { + "epoch": 0.69, + "learning_rate": 1.797584448101696e-06, + "loss": 1.1611, + "step": 26913 + }, + { + "epoch": 0.69, + "learning_rate": 1.797567756776545e-06, + "loss": 1.1133, + "step": 26914 + }, + { + "epoch": 0.69, + "learning_rate": 1.7975510648407332e-06, + "loss": 0.9512, + "step": 26915 + }, + { + "epoch": 0.69, + "learning_rate": 1.7975343722942733e-06, + "loss": 0.6719, + "step": 26916 + }, + { + "epoch": 0.69, + "learning_rate": 1.797517679137178e-06, + "loss": 0.8081, + "step": 26917 + }, + { + "epoch": 0.69, + "learning_rate": 1.7975009853694597e-06, + "loss": 0.8965, + "step": 26918 + }, + { + "epoch": 0.69, + "learning_rate": 1.7974842909911318e-06, + "loss": 0.8633, + "step": 26919 + }, + { + "epoch": 0.69, + "learning_rate": 1.797467596002207e-06, + "loss": 0.9463, + "step": 26920 + }, + { + "epoch": 0.69, + "learning_rate": 1.7974509004026976e-06, + "loss": 0.7915, + "step": 26921 + }, + { + "epoch": 0.69, + "learning_rate": 1.7974342041926171e-06, + "loss": 0.8574, + "step": 26922 + }, + { + "epoch": 0.69, + "learning_rate": 1.7974175073719777e-06, + "loss": 0.707, + "step": 26923 + }, + { + "epoch": 0.69, + "learning_rate": 1.7974008099407923e-06, + "loss": 0.6226, + "step": 26924 + }, + { + "epoch": 0.69, + "learning_rate": 1.797384111899074e-06, + "loss": 0.8159, + "step": 26925 + }, + { + "epoch": 0.69, + "learning_rate": 1.7973674132468353e-06, + "loss": 0.9141, + "step": 26926 + }, + { + "epoch": 0.69, + "learning_rate": 1.7973507139840888e-06, + "loss": 1.0273, + "step": 26927 + }, + { + "epoch": 0.69, + "learning_rate": 1.7973340141108477e-06, + "loss": 0.7969, + "step": 26928 + }, + { + "epoch": 0.69, + "learning_rate": 1.7973173136271245e-06, + "loss": 0.7959, + "step": 26929 + }, + { + "epoch": 0.69, + "learning_rate": 1.7973006125329322e-06, + "loss": 0.8799, + "step": 26930 + }, + { + "epoch": 0.69, + "learning_rate": 1.7972839108282837e-06, + "loss": 0.8623, + "step": 26931 + }, + { + "epoch": 0.69, + "learning_rate": 1.797267208513191e-06, + "loss": 0.7866, + "step": 26932 + }, + { + "epoch": 0.69, + "learning_rate": 1.7972505055876677e-06, + "loss": 0.814, + "step": 26933 + }, + { + "epoch": 0.69, + "learning_rate": 1.7972338020517265e-06, + "loss": 0.6987, + "step": 26934 + }, + { + "epoch": 0.69, + "learning_rate": 1.79721709790538e-06, + "loss": 0.5674, + "step": 26935 + }, + { + "epoch": 0.69, + "learning_rate": 1.7972003931486407e-06, + "loss": 0.8887, + "step": 26936 + }, + { + "epoch": 0.69, + "learning_rate": 1.7971836877815223e-06, + "loss": 0.8223, + "step": 26937 + }, + { + "epoch": 0.69, + "learning_rate": 1.7971669818040364e-06, + "loss": 0.8787, + "step": 26938 + }, + { + "epoch": 0.69, + "learning_rate": 1.797150275216197e-06, + "loss": 0.7085, + "step": 26939 + }, + { + "epoch": 0.69, + "learning_rate": 1.7971335680180159e-06, + "loss": 0.9277, + "step": 26940 + }, + { + "epoch": 0.69, + "learning_rate": 1.7971168602095063e-06, + "loss": 0.875, + "step": 26941 + }, + { + "epoch": 0.69, + "learning_rate": 1.7971001517906813e-06, + "loss": 0.7207, + "step": 26942 + }, + { + "epoch": 0.69, + "learning_rate": 1.797083442761553e-06, + "loss": 0.8252, + "step": 26943 + }, + { + "epoch": 0.69, + "learning_rate": 1.7970667331221346e-06, + "loss": 0.6284, + "step": 26944 + }, + { + "epoch": 0.69, + "learning_rate": 1.797050022872439e-06, + "loss": 0.5957, + "step": 26945 + }, + { + "epoch": 0.69, + "learning_rate": 1.7970333120124787e-06, + "loss": 1.0322, + "step": 26946 + }, + { + "epoch": 0.69, + "learning_rate": 1.7970166005422667e-06, + "loss": 0.9102, + "step": 26947 + }, + { + "epoch": 0.69, + "learning_rate": 1.7969998884618156e-06, + "loss": 0.8926, + "step": 26948 + }, + { + "epoch": 0.69, + "learning_rate": 1.7969831757711388e-06, + "loss": 0.7441, + "step": 26949 + }, + { + "epoch": 0.69, + "learning_rate": 1.7969664624702481e-06, + "loss": 0.7827, + "step": 26950 + }, + { + "epoch": 0.69, + "learning_rate": 1.7969497485591569e-06, + "loss": 0.8311, + "step": 26951 + }, + { + "epoch": 0.69, + "learning_rate": 1.7969330340378781e-06, + "loss": 0.8789, + "step": 26952 + }, + { + "epoch": 0.69, + "learning_rate": 1.7969163189064242e-06, + "loss": 0.8672, + "step": 26953 + }, + { + "epoch": 0.69, + "learning_rate": 1.7968996031648085e-06, + "loss": 0.8369, + "step": 26954 + }, + { + "epoch": 0.69, + "learning_rate": 1.796882886813043e-06, + "loss": 1.0459, + "step": 26955 + }, + { + "epoch": 0.69, + "learning_rate": 1.796866169851141e-06, + "loss": 0.6685, + "step": 26956 + }, + { + "epoch": 0.69, + "learning_rate": 1.7968494522791153e-06, + "loss": 0.7588, + "step": 26957 + }, + { + "epoch": 0.69, + "learning_rate": 1.7968327340969785e-06, + "loss": 0.6796, + "step": 26958 + }, + { + "epoch": 0.69, + "learning_rate": 1.7968160153047435e-06, + "loss": 0.9326, + "step": 26959 + }, + { + "epoch": 0.69, + "learning_rate": 1.7967992959024232e-06, + "loss": 0.6421, + "step": 26960 + }, + { + "epoch": 0.69, + "learning_rate": 1.7967825758900301e-06, + "loss": 0.8906, + "step": 26961 + }, + { + "epoch": 0.69, + "learning_rate": 1.7967658552675777e-06, + "loss": 0.6758, + "step": 26962 + }, + { + "epoch": 0.69, + "learning_rate": 1.7967491340350778e-06, + "loss": 0.8867, + "step": 26963 + }, + { + "epoch": 0.69, + "learning_rate": 1.796732412192544e-06, + "loss": 0.877, + "step": 26964 + }, + { + "epoch": 0.69, + "learning_rate": 1.7967156897399889e-06, + "loss": 0.8867, + "step": 26965 + }, + { + "epoch": 0.69, + "learning_rate": 1.7966989666774251e-06, + "loss": 0.7432, + "step": 26966 + }, + { + "epoch": 0.69, + "learning_rate": 1.7966822430048655e-06, + "loss": 0.9482, + "step": 26967 + }, + { + "epoch": 0.69, + "learning_rate": 1.796665518722323e-06, + "loss": 0.6914, + "step": 26968 + }, + { + "epoch": 0.69, + "learning_rate": 1.7966487938298106e-06, + "loss": 0.9717, + "step": 26969 + }, + { + "epoch": 0.69, + "learning_rate": 1.7966320683273403e-06, + "loss": 0.7866, + "step": 26970 + }, + { + "epoch": 0.69, + "learning_rate": 1.7966153422149258e-06, + "loss": 0.8975, + "step": 26971 + }, + { + "epoch": 0.69, + "learning_rate": 1.7965986154925793e-06, + "loss": 0.8066, + "step": 26972 + }, + { + "epoch": 0.69, + "learning_rate": 1.7965818881603144e-06, + "loss": 0.833, + "step": 26973 + }, + { + "epoch": 0.69, + "learning_rate": 1.7965651602181429e-06, + "loss": 0.8711, + "step": 26974 + }, + { + "epoch": 0.69, + "learning_rate": 1.7965484316660784e-06, + "loss": 0.8359, + "step": 26975 + }, + { + "epoch": 0.69, + "learning_rate": 1.796531702504133e-06, + "loss": 0.9297, + "step": 26976 + }, + { + "epoch": 0.69, + "learning_rate": 1.79651497273232e-06, + "loss": 0.8633, + "step": 26977 + }, + { + "epoch": 0.69, + "learning_rate": 1.7964982423506522e-06, + "loss": 0.8521, + "step": 26978 + }, + { + "epoch": 0.69, + "learning_rate": 1.7964815113591424e-06, + "loss": 0.8877, + "step": 26979 + }, + { + "epoch": 0.69, + "learning_rate": 1.7964647797578034e-06, + "loss": 0.8945, + "step": 26980 + }, + { + "epoch": 0.69, + "learning_rate": 1.7964480475466477e-06, + "loss": 0.9004, + "step": 26981 + }, + { + "epoch": 0.69, + "learning_rate": 1.7964313147256887e-06, + "loss": 0.9033, + "step": 26982 + }, + { + "epoch": 0.69, + "learning_rate": 1.7964145812949385e-06, + "loss": 0.8711, + "step": 26983 + }, + { + "epoch": 0.69, + "learning_rate": 1.7963978472544104e-06, + "loss": 0.8257, + "step": 26984 + }, + { + "epoch": 0.69, + "learning_rate": 1.7963811126041172e-06, + "loss": 0.916, + "step": 26985 + }, + { + "epoch": 0.69, + "learning_rate": 1.7963643773440715e-06, + "loss": 0.7568, + "step": 26986 + }, + { + "epoch": 0.69, + "learning_rate": 1.7963476414742861e-06, + "loss": 0.8477, + "step": 26987 + }, + { + "epoch": 0.69, + "learning_rate": 1.7963309049947739e-06, + "loss": 0.606, + "step": 26988 + }, + { + "epoch": 0.69, + "learning_rate": 1.7963141679055482e-06, + "loss": 0.6714, + "step": 26989 + }, + { + "epoch": 0.69, + "learning_rate": 1.796297430206621e-06, + "loss": 0.8071, + "step": 26990 + }, + { + "epoch": 0.69, + "learning_rate": 1.7962806918980053e-06, + "loss": 0.833, + "step": 26991 + }, + { + "epoch": 0.69, + "learning_rate": 1.7962639529797143e-06, + "loss": 0.6493, + "step": 26992 + }, + { + "epoch": 0.69, + "learning_rate": 1.7962472134517607e-06, + "loss": 0.7451, + "step": 26993 + }, + { + "epoch": 0.69, + "learning_rate": 1.796230473314157e-06, + "loss": 0.9707, + "step": 26994 + }, + { + "epoch": 0.69, + "learning_rate": 1.7962137325669167e-06, + "loss": 0.7949, + "step": 26995 + }, + { + "epoch": 0.69, + "learning_rate": 1.7961969912100517e-06, + "loss": 0.7666, + "step": 26996 + }, + { + "epoch": 0.69, + "learning_rate": 1.7961802492435752e-06, + "loss": 1.0029, + "step": 26997 + }, + { + "epoch": 0.69, + "learning_rate": 1.7961635066675003e-06, + "loss": 0.8467, + "step": 26998 + }, + { + "epoch": 0.69, + "learning_rate": 1.7961467634818397e-06, + "loss": 0.7568, + "step": 26999 + }, + { + "epoch": 0.69, + "learning_rate": 1.796130019686606e-06, + "loss": 1.083, + "step": 27000 + }, + { + "epoch": 0.69, + "learning_rate": 1.7961132752818121e-06, + "loss": 0.6743, + "step": 27001 + }, + { + "epoch": 0.69, + "learning_rate": 1.7960965302674711e-06, + "loss": 0.9629, + "step": 27002 + }, + { + "epoch": 0.69, + "learning_rate": 1.7960797846435955e-06, + "loss": 0.918, + "step": 27003 + }, + { + "epoch": 0.69, + "learning_rate": 1.7960630384101982e-06, + "loss": 0.8013, + "step": 27004 + }, + { + "epoch": 0.69, + "learning_rate": 1.7960462915672918e-06, + "loss": 0.9756, + "step": 27005 + }, + { + "epoch": 0.69, + "learning_rate": 1.7960295441148897e-06, + "loss": 0.9229, + "step": 27006 + }, + { + "epoch": 0.69, + "learning_rate": 1.796012796053004e-06, + "loss": 0.8472, + "step": 27007 + }, + { + "epoch": 0.69, + "learning_rate": 1.7959960473816483e-06, + "loss": 0.4858, + "step": 27008 + }, + { + "epoch": 0.69, + "learning_rate": 1.795979298100835e-06, + "loss": 0.8789, + "step": 27009 + }, + { + "epoch": 0.69, + "learning_rate": 1.7959625482105768e-06, + "loss": 0.7983, + "step": 27010 + }, + { + "epoch": 0.69, + "learning_rate": 1.7959457977108864e-06, + "loss": 0.7671, + "step": 27011 + }, + { + "epoch": 0.69, + "learning_rate": 1.7959290466017773e-06, + "loss": 0.8613, + "step": 27012 + }, + { + "epoch": 0.69, + "learning_rate": 1.795912294883262e-06, + "loss": 0.9844, + "step": 27013 + }, + { + "epoch": 0.69, + "learning_rate": 1.795895542555353e-06, + "loss": 0.7734, + "step": 27014 + }, + { + "epoch": 0.69, + "learning_rate": 1.7958787896180633e-06, + "loss": 0.8926, + "step": 27015 + }, + { + "epoch": 0.69, + "learning_rate": 1.7958620360714061e-06, + "loss": 0.8135, + "step": 27016 + }, + { + "epoch": 0.69, + "learning_rate": 1.7958452819153937e-06, + "loss": 0.8926, + "step": 27017 + }, + { + "epoch": 0.69, + "learning_rate": 1.7958285271500392e-06, + "loss": 0.6895, + "step": 27018 + }, + { + "epoch": 0.69, + "learning_rate": 1.7958117717753556e-06, + "loss": 0.9209, + "step": 27019 + }, + { + "epoch": 0.69, + "learning_rate": 1.7957950157913552e-06, + "loss": 0.6777, + "step": 27020 + }, + { + "epoch": 0.69, + "learning_rate": 1.7957782591980512e-06, + "loss": 0.6836, + "step": 27021 + }, + { + "epoch": 0.69, + "learning_rate": 1.7957615019954567e-06, + "loss": 0.7451, + "step": 27022 + }, + { + "epoch": 0.69, + "learning_rate": 1.795744744183584e-06, + "loss": 0.9355, + "step": 27023 + }, + { + "epoch": 0.69, + "learning_rate": 1.7957279857624461e-06, + "loss": 1.0654, + "step": 27024 + }, + { + "epoch": 0.69, + "learning_rate": 1.795711226732056e-06, + "loss": 1.0283, + "step": 27025 + }, + { + "epoch": 0.69, + "learning_rate": 1.795694467092426e-06, + "loss": 0.9268, + "step": 27026 + }, + { + "epoch": 0.69, + "learning_rate": 1.7956777068435697e-06, + "loss": 0.8213, + "step": 27027 + }, + { + "epoch": 0.69, + "learning_rate": 1.7956609459854997e-06, + "loss": 0.8604, + "step": 27028 + }, + { + "epoch": 0.69, + "learning_rate": 1.7956441845182285e-06, + "loss": 0.7554, + "step": 27029 + }, + { + "epoch": 0.69, + "learning_rate": 1.7956274224417691e-06, + "loss": 0.7808, + "step": 27030 + }, + { + "epoch": 0.69, + "learning_rate": 1.7956106597561345e-06, + "loss": 0.9072, + "step": 27031 + }, + { + "epoch": 0.69, + "learning_rate": 1.7955938964613372e-06, + "loss": 0.7822, + "step": 27032 + }, + { + "epoch": 0.69, + "learning_rate": 1.7955771325573903e-06, + "loss": 0.7358, + "step": 27033 + }, + { + "epoch": 0.69, + "learning_rate": 1.7955603680443066e-06, + "loss": 0.9717, + "step": 27034 + }, + { + "epoch": 0.69, + "learning_rate": 1.795543602922099e-06, + "loss": 0.8054, + "step": 27035 + }, + { + "epoch": 0.69, + "learning_rate": 1.79552683719078e-06, + "loss": 0.813, + "step": 27036 + }, + { + "epoch": 0.69, + "learning_rate": 1.795510070850363e-06, + "loss": 0.7705, + "step": 27037 + }, + { + "epoch": 0.69, + "learning_rate": 1.7954933039008604e-06, + "loss": 0.8398, + "step": 27038 + }, + { + "epoch": 0.69, + "learning_rate": 1.795476536342285e-06, + "loss": 0.856, + "step": 27039 + }, + { + "epoch": 0.69, + "learning_rate": 1.79545976817465e-06, + "loss": 0.9033, + "step": 27040 + }, + { + "epoch": 0.69, + "learning_rate": 1.7954429993979679e-06, + "loss": 0.9814, + "step": 27041 + }, + { + "epoch": 0.69, + "learning_rate": 1.7954262300122518e-06, + "loss": 0.8066, + "step": 27042 + }, + { + "epoch": 0.69, + "learning_rate": 1.7954094600175143e-06, + "loss": 0.9434, + "step": 27043 + }, + { + "epoch": 0.69, + "learning_rate": 1.7953926894137682e-06, + "loss": 0.7402, + "step": 27044 + }, + { + "epoch": 0.69, + "learning_rate": 1.7953759182010266e-06, + "loss": 0.7402, + "step": 27045 + }, + { + "epoch": 0.69, + "learning_rate": 1.7953591463793022e-06, + "loss": 0.9053, + "step": 27046 + }, + { + "epoch": 0.69, + "learning_rate": 1.7953423739486081e-06, + "loss": 0.8496, + "step": 27047 + }, + { + "epoch": 0.69, + "learning_rate": 1.7953256009089569e-06, + "loss": 0.9492, + "step": 27048 + }, + { + "epoch": 0.69, + "learning_rate": 1.7953088272603613e-06, + "loss": 0.9102, + "step": 27049 + }, + { + "epoch": 0.69, + "learning_rate": 1.7952920530028345e-06, + "loss": 0.9316, + "step": 27050 + }, + { + "epoch": 0.69, + "learning_rate": 1.7952752781363887e-06, + "loss": 0.7725, + "step": 27051 + }, + { + "epoch": 0.69, + "learning_rate": 1.7952585026610377e-06, + "loss": 0.7441, + "step": 27052 + }, + { + "epoch": 0.69, + "learning_rate": 1.7952417265767936e-06, + "loss": 0.6396, + "step": 27053 + }, + { + "epoch": 0.69, + "learning_rate": 1.7952249498836694e-06, + "loss": 0.7812, + "step": 27054 + }, + { + "epoch": 0.69, + "learning_rate": 1.795208172581678e-06, + "loss": 0.7717, + "step": 27055 + }, + { + "epoch": 0.69, + "learning_rate": 1.7951913946708324e-06, + "loss": 0.959, + "step": 27056 + }, + { + "epoch": 0.69, + "learning_rate": 1.7951746161511454e-06, + "loss": 0.9746, + "step": 27057 + }, + { + "epoch": 0.69, + "learning_rate": 1.7951578370226294e-06, + "loss": 1.0352, + "step": 27058 + }, + { + "epoch": 0.69, + "learning_rate": 1.795141057285298e-06, + "loss": 1.0312, + "step": 27059 + }, + { + "epoch": 0.69, + "learning_rate": 1.7951242769391634e-06, + "loss": 0.6328, + "step": 27060 + }, + { + "epoch": 0.69, + "learning_rate": 1.7951074959842387e-06, + "loss": 0.7236, + "step": 27061 + }, + { + "epoch": 0.69, + "learning_rate": 1.795090714420537e-06, + "loss": 0.811, + "step": 27062 + }, + { + "epoch": 0.69, + "learning_rate": 1.7950739322480708e-06, + "loss": 1.0215, + "step": 27063 + }, + { + "epoch": 0.69, + "learning_rate": 1.7950571494668529e-06, + "loss": 0.7295, + "step": 27064 + }, + { + "epoch": 0.69, + "learning_rate": 1.7950403660768965e-06, + "loss": 0.658, + "step": 27065 + }, + { + "epoch": 0.69, + "learning_rate": 1.795023582078214e-06, + "loss": 0.9551, + "step": 27066 + }, + { + "epoch": 0.69, + "learning_rate": 1.7950067974708188e-06, + "loss": 1.0293, + "step": 27067 + }, + { + "epoch": 0.69, + "learning_rate": 1.7949900122547233e-06, + "loss": 0.8311, + "step": 27068 + }, + { + "epoch": 0.69, + "learning_rate": 1.7949732264299404e-06, + "loss": 0.8975, + "step": 27069 + }, + { + "epoch": 0.69, + "learning_rate": 1.7949564399964833e-06, + "loss": 0.8027, + "step": 27070 + }, + { + "epoch": 0.69, + "learning_rate": 1.7949396529543643e-06, + "loss": 0.7017, + "step": 27071 + }, + { + "epoch": 0.69, + "learning_rate": 1.7949228653035967e-06, + "loss": 0.8394, + "step": 27072 + }, + { + "epoch": 0.69, + "learning_rate": 1.7949060770441932e-06, + "loss": 0.8496, + "step": 27073 + }, + { + "epoch": 0.69, + "learning_rate": 1.7948892881761668e-06, + "loss": 0.9795, + "step": 27074 + }, + { + "epoch": 0.69, + "learning_rate": 1.7948724986995301e-06, + "loss": 0.7334, + "step": 27075 + }, + { + "epoch": 0.69, + "learning_rate": 1.794855708614296e-06, + "loss": 0.7158, + "step": 27076 + }, + { + "epoch": 0.69, + "learning_rate": 1.7948389179204777e-06, + "loss": 0.7666, + "step": 27077 + }, + { + "epoch": 0.69, + "learning_rate": 1.7948221266180873e-06, + "loss": 0.8252, + "step": 27078 + }, + { + "epoch": 0.69, + "learning_rate": 1.7948053347071387e-06, + "loss": 0.8047, + "step": 27079 + }, + { + "epoch": 0.69, + "learning_rate": 1.7947885421876442e-06, + "loss": 0.4888, + "step": 27080 + }, + { + "epoch": 0.69, + "learning_rate": 1.7947717490596162e-06, + "loss": 0.8564, + "step": 27081 + }, + { + "epoch": 0.69, + "learning_rate": 1.7947549553230682e-06, + "loss": 0.6875, + "step": 27082 + }, + { + "epoch": 0.69, + "learning_rate": 1.794738160978013e-06, + "loss": 0.9658, + "step": 27083 + }, + { + "epoch": 0.69, + "learning_rate": 1.794721366024463e-06, + "loss": 0.9482, + "step": 27084 + }, + { + "epoch": 0.69, + "learning_rate": 1.7947045704624317e-06, + "loss": 1.0068, + "step": 27085 + }, + { + "epoch": 0.69, + "learning_rate": 1.7946877742919317e-06, + "loss": 0.4658, + "step": 27086 + }, + { + "epoch": 0.69, + "learning_rate": 1.7946709775129759e-06, + "loss": 0.8218, + "step": 27087 + }, + { + "epoch": 0.69, + "learning_rate": 1.7946541801255768e-06, + "loss": 1.0322, + "step": 27088 + }, + { + "epoch": 0.69, + "learning_rate": 1.7946373821297477e-06, + "loss": 0.9219, + "step": 27089 + }, + { + "epoch": 0.69, + "learning_rate": 1.794620583525501e-06, + "loss": 1.0703, + "step": 27090 + }, + { + "epoch": 0.69, + "learning_rate": 1.79460378431285e-06, + "loss": 0.8018, + "step": 27091 + }, + { + "epoch": 0.69, + "learning_rate": 1.7945869844918076e-06, + "loss": 0.5942, + "step": 27092 + }, + { + "epoch": 0.69, + "learning_rate": 1.7945701840623863e-06, + "loss": 0.7671, + "step": 27093 + }, + { + "epoch": 0.69, + "learning_rate": 1.794553383024599e-06, + "loss": 1.0645, + "step": 27094 + }, + { + "epoch": 0.69, + "learning_rate": 1.794536581378459e-06, + "loss": 0.8174, + "step": 27095 + }, + { + "epoch": 0.69, + "learning_rate": 1.794519779123979e-06, + "loss": 1.0137, + "step": 27096 + }, + { + "epoch": 0.69, + "learning_rate": 1.7945029762611715e-06, + "loss": 0.7236, + "step": 27097 + }, + { + "epoch": 0.69, + "learning_rate": 1.7944861727900496e-06, + "loss": 1.0156, + "step": 27098 + }, + { + "epoch": 0.69, + "learning_rate": 1.7944693687106263e-06, + "loss": 0.8438, + "step": 27099 + }, + { + "epoch": 0.69, + "learning_rate": 1.7944525640229142e-06, + "loss": 0.8184, + "step": 27100 + }, + { + "epoch": 0.69, + "learning_rate": 1.7944357587269263e-06, + "loss": 0.5933, + "step": 27101 + }, + { + "epoch": 0.69, + "learning_rate": 1.7944189528226757e-06, + "loss": 0.8926, + "step": 27102 + }, + { + "epoch": 0.69, + "learning_rate": 1.7944021463101747e-06, + "loss": 0.8672, + "step": 27103 + }, + { + "epoch": 0.69, + "learning_rate": 1.7943853391894366e-06, + "loss": 0.9854, + "step": 27104 + }, + { + "epoch": 0.69, + "learning_rate": 1.7943685314604742e-06, + "loss": 0.8926, + "step": 27105 + }, + { + "epoch": 0.69, + "learning_rate": 1.7943517231233005e-06, + "loss": 0.9897, + "step": 27106 + }, + { + "epoch": 0.69, + "learning_rate": 1.794334914177928e-06, + "loss": 1.0059, + "step": 27107 + }, + { + "epoch": 0.69, + "learning_rate": 1.7943181046243695e-06, + "loss": 0.9404, + "step": 27108 + }, + { + "epoch": 0.69, + "learning_rate": 1.7943012944626388e-06, + "loss": 0.8887, + "step": 27109 + }, + { + "epoch": 0.69, + "learning_rate": 1.7942844836927479e-06, + "loss": 0.8359, + "step": 27110 + }, + { + "epoch": 0.69, + "learning_rate": 1.7942676723147098e-06, + "loss": 0.7305, + "step": 27111 + }, + { + "epoch": 0.69, + "learning_rate": 1.7942508603285374e-06, + "loss": 0.8252, + "step": 27112 + }, + { + "epoch": 0.69, + "learning_rate": 1.7942340477342438e-06, + "loss": 0.7266, + "step": 27113 + }, + { + "epoch": 0.69, + "learning_rate": 1.7942172345318416e-06, + "loss": 0.8013, + "step": 27114 + }, + { + "epoch": 0.69, + "learning_rate": 1.7942004207213438e-06, + "loss": 0.9072, + "step": 27115 + }, + { + "epoch": 0.69, + "learning_rate": 1.7941836063027634e-06, + "loss": 0.6504, + "step": 27116 + }, + { + "epoch": 0.7, + "learning_rate": 1.7941667912761127e-06, + "loss": 0.6875, + "step": 27117 + }, + { + "epoch": 0.7, + "learning_rate": 1.7941499756414053e-06, + "loss": 0.8613, + "step": 27118 + }, + { + "epoch": 0.7, + "learning_rate": 1.794133159398654e-06, + "loss": 0.8354, + "step": 27119 + }, + { + "epoch": 0.7, + "learning_rate": 1.7941163425478712e-06, + "loss": 0.9336, + "step": 27120 + }, + { + "epoch": 0.7, + "learning_rate": 1.79409952508907e-06, + "loss": 0.9814, + "step": 27121 + }, + { + "epoch": 0.7, + "learning_rate": 1.7940827070222634e-06, + "loss": 0.6609, + "step": 27122 + }, + { + "epoch": 0.7, + "learning_rate": 1.7940658883474642e-06, + "loss": 0.9609, + "step": 27123 + }, + { + "epoch": 0.7, + "learning_rate": 1.7940490690646853e-06, + "loss": 0.7954, + "step": 27124 + }, + { + "epoch": 0.7, + "learning_rate": 1.7940322491739392e-06, + "loss": 0.8662, + "step": 27125 + }, + { + "epoch": 0.7, + "learning_rate": 1.7940154286752396e-06, + "loss": 0.7307, + "step": 27126 + }, + { + "epoch": 0.7, + "learning_rate": 1.7939986075685986e-06, + "loss": 0.8086, + "step": 27127 + }, + { + "epoch": 0.7, + "learning_rate": 1.7939817858540294e-06, + "loss": 0.9053, + "step": 27128 + }, + { + "epoch": 0.7, + "learning_rate": 1.793964963531545e-06, + "loss": 0.8857, + "step": 27129 + }, + { + "epoch": 0.7, + "learning_rate": 1.7939481406011582e-06, + "loss": 0.6133, + "step": 27130 + }, + { + "epoch": 0.7, + "learning_rate": 1.7939313170628813e-06, + "loss": 1.0479, + "step": 27131 + }, + { + "epoch": 0.7, + "learning_rate": 1.7939144929167282e-06, + "loss": 0.8018, + "step": 27132 + }, + { + "epoch": 0.7, + "learning_rate": 1.7938976681627111e-06, + "loss": 0.8831, + "step": 27133 + }, + { + "epoch": 0.7, + "learning_rate": 1.793880842800843e-06, + "loss": 0.8008, + "step": 27134 + }, + { + "epoch": 0.7, + "learning_rate": 1.793864016831137e-06, + "loss": 0.7734, + "step": 27135 + }, + { + "epoch": 0.7, + "learning_rate": 1.7938471902536056e-06, + "loss": 0.915, + "step": 27136 + }, + { + "epoch": 0.7, + "learning_rate": 1.7938303630682624e-06, + "loss": 0.7266, + "step": 27137 + }, + { + "epoch": 0.7, + "learning_rate": 1.7938135352751194e-06, + "loss": 1.0146, + "step": 27138 + }, + { + "epoch": 0.7, + "learning_rate": 1.7937967068741897e-06, + "loss": 0.8027, + "step": 27139 + }, + { + "epoch": 0.7, + "learning_rate": 1.7937798778654867e-06, + "loss": 0.8906, + "step": 27140 + }, + { + "epoch": 0.7, + "learning_rate": 1.7937630482490227e-06, + "loss": 0.9551, + "step": 27141 + }, + { + "epoch": 0.7, + "learning_rate": 1.793746218024811e-06, + "loss": 0.999, + "step": 27142 + }, + { + "epoch": 0.7, + "learning_rate": 1.7937293871928642e-06, + "loss": 0.7319, + "step": 27143 + }, + { + "epoch": 0.7, + "learning_rate": 1.7937125557531957e-06, + "loss": 0.9678, + "step": 27144 + }, + { + "epoch": 0.7, + "learning_rate": 1.7936957237058174e-06, + "loss": 0.9678, + "step": 27145 + }, + { + "epoch": 0.7, + "learning_rate": 1.7936788910507433e-06, + "loss": 0.792, + "step": 27146 + }, + { + "epoch": 0.7, + "learning_rate": 1.7936620577879854e-06, + "loss": 0.6633, + "step": 27147 + }, + { + "epoch": 0.7, + "learning_rate": 1.793645223917557e-06, + "loss": 0.7744, + "step": 27148 + }, + { + "epoch": 0.7, + "learning_rate": 1.7936283894394712e-06, + "loss": 0.8252, + "step": 27149 + }, + { + "epoch": 0.7, + "learning_rate": 1.7936115543537405e-06, + "loss": 0.7559, + "step": 27150 + }, + { + "epoch": 0.7, + "learning_rate": 1.793594718660378e-06, + "loss": 0.9512, + "step": 27151 + }, + { + "epoch": 0.7, + "learning_rate": 1.7935778823593964e-06, + "loss": 0.6655, + "step": 27152 + }, + { + "epoch": 0.7, + "learning_rate": 1.7935610454508086e-06, + "loss": 0.8857, + "step": 27153 + }, + { + "epoch": 0.7, + "learning_rate": 1.7935442079346276e-06, + "loss": 0.8164, + "step": 27154 + }, + { + "epoch": 0.7, + "learning_rate": 1.7935273698108665e-06, + "loss": 0.7329, + "step": 27155 + }, + { + "epoch": 0.7, + "learning_rate": 1.793510531079538e-06, + "loss": 0.8193, + "step": 27156 + }, + { + "epoch": 0.7, + "learning_rate": 1.7934936917406547e-06, + "loss": 0.998, + "step": 27157 + }, + { + "epoch": 0.7, + "learning_rate": 1.7934768517942298e-06, + "loss": 0.8721, + "step": 27158 + }, + { + "epoch": 0.7, + "learning_rate": 1.7934600112402763e-06, + "loss": 0.9697, + "step": 27159 + }, + { + "epoch": 0.7, + "learning_rate": 1.7934431700788068e-06, + "loss": 0.8721, + "step": 27160 + }, + { + "epoch": 0.7, + "learning_rate": 1.7934263283098348e-06, + "loss": 1.0234, + "step": 27161 + }, + { + "epoch": 0.7, + "learning_rate": 1.7934094859333721e-06, + "loss": 0.8555, + "step": 27162 + }, + { + "epoch": 0.7, + "learning_rate": 1.7933926429494325e-06, + "loss": 0.959, + "step": 27163 + }, + { + "epoch": 0.7, + "learning_rate": 1.793375799358029e-06, + "loss": 0.751, + "step": 27164 + }, + { + "epoch": 0.7, + "learning_rate": 1.793358955159174e-06, + "loss": 0.998, + "step": 27165 + }, + { + "epoch": 0.7, + "learning_rate": 1.79334211035288e-06, + "loss": 0.8652, + "step": 27166 + }, + { + "epoch": 0.7, + "learning_rate": 1.7933252649391611e-06, + "loss": 0.8809, + "step": 27167 + }, + { + "epoch": 0.7, + "learning_rate": 1.793308418918029e-06, + "loss": 0.9287, + "step": 27168 + }, + { + "epoch": 0.7, + "learning_rate": 1.7932915722894974e-06, + "loss": 0.917, + "step": 27169 + }, + { + "epoch": 0.7, + "learning_rate": 1.7932747250535786e-06, + "loss": 0.9248, + "step": 27170 + }, + { + "epoch": 0.7, + "learning_rate": 1.7932578772102861e-06, + "loss": 0.9365, + "step": 27171 + }, + { + "epoch": 0.7, + "learning_rate": 1.7932410287596327e-06, + "loss": 0.8574, + "step": 27172 + }, + { + "epoch": 0.7, + "learning_rate": 1.7932241797016308e-06, + "loss": 0.7959, + "step": 27173 + }, + { + "epoch": 0.7, + "learning_rate": 1.7932073300362938e-06, + "loss": 0.8418, + "step": 27174 + }, + { + "epoch": 0.7, + "learning_rate": 1.7931904797636342e-06, + "loss": 0.7295, + "step": 27175 + }, + { + "epoch": 0.7, + "learning_rate": 1.7931736288836653e-06, + "loss": 0.624, + "step": 27176 + }, + { + "epoch": 0.7, + "learning_rate": 1.7931567773963998e-06, + "loss": 0.9131, + "step": 27177 + }, + { + "epoch": 0.7, + "learning_rate": 1.7931399253018507e-06, + "loss": 0.8936, + "step": 27178 + }, + { + "epoch": 0.7, + "learning_rate": 1.7931230726000306e-06, + "loss": 0.8496, + "step": 27179 + }, + { + "epoch": 0.7, + "learning_rate": 1.7931062192909527e-06, + "loss": 0.74, + "step": 27180 + }, + { + "epoch": 0.7, + "learning_rate": 1.7930893653746299e-06, + "loss": 0.8584, + "step": 27181 + }, + { + "epoch": 0.7, + "learning_rate": 1.793072510851075e-06, + "loss": 0.832, + "step": 27182 + }, + { + "epoch": 0.7, + "learning_rate": 1.793055655720301e-06, + "loss": 0.5874, + "step": 27183 + }, + { + "epoch": 0.7, + "learning_rate": 1.793038799982321e-06, + "loss": 0.8643, + "step": 27184 + }, + { + "epoch": 0.7, + "learning_rate": 1.7930219436371472e-06, + "loss": 1.0459, + "step": 27185 + }, + { + "epoch": 0.7, + "learning_rate": 1.7930050866847932e-06, + "loss": 0.9473, + "step": 27186 + }, + { + "epoch": 0.7, + "learning_rate": 1.7929882291252715e-06, + "loss": 0.9043, + "step": 27187 + }, + { + "epoch": 0.7, + "learning_rate": 1.7929713709585954e-06, + "loss": 0.8799, + "step": 27188 + }, + { + "epoch": 0.7, + "learning_rate": 1.7929545121847775e-06, + "loss": 0.7891, + "step": 27189 + }, + { + "epoch": 0.7, + "learning_rate": 1.7929376528038307e-06, + "loss": 0.9316, + "step": 27190 + }, + { + "epoch": 0.7, + "learning_rate": 1.7929207928157682e-06, + "loss": 0.7119, + "step": 27191 + }, + { + "epoch": 0.7, + "learning_rate": 1.7929039322206026e-06, + "loss": 0.9502, + "step": 27192 + }, + { + "epoch": 0.7, + "learning_rate": 1.7928870710183468e-06, + "loss": 0.5837, + "step": 27193 + }, + { + "epoch": 0.7, + "learning_rate": 1.792870209209014e-06, + "loss": 0.9775, + "step": 27194 + }, + { + "epoch": 0.7, + "learning_rate": 1.7928533467926168e-06, + "loss": 0.8516, + "step": 27195 + }, + { + "epoch": 0.7, + "learning_rate": 1.7928364837691685e-06, + "loss": 0.8994, + "step": 27196 + }, + { + "epoch": 0.7, + "learning_rate": 1.7928196201386813e-06, + "loss": 0.9639, + "step": 27197 + }, + { + "epoch": 0.7, + "learning_rate": 1.7928027559011689e-06, + "loss": 0.8418, + "step": 27198 + }, + { + "epoch": 0.7, + "learning_rate": 1.7927858910566438e-06, + "loss": 0.9473, + "step": 27199 + }, + { + "epoch": 0.7, + "learning_rate": 1.792769025605119e-06, + "loss": 0.9727, + "step": 27200 + }, + { + "epoch": 0.7, + "learning_rate": 1.7927521595466075e-06, + "loss": 1.0664, + "step": 27201 + }, + { + "epoch": 0.7, + "learning_rate": 1.7927352928811221e-06, + "loss": 0.8809, + "step": 27202 + }, + { + "epoch": 0.7, + "learning_rate": 1.7927184256086756e-06, + "loss": 0.877, + "step": 27203 + }, + { + "epoch": 0.7, + "learning_rate": 1.7927015577292812e-06, + "loss": 0.7324, + "step": 27204 + }, + { + "epoch": 0.7, + "learning_rate": 1.7926846892429515e-06, + "loss": 0.7913, + "step": 27205 + }, + { + "epoch": 0.7, + "learning_rate": 1.7926678201497e-06, + "loss": 1.125, + "step": 27206 + }, + { + "epoch": 0.7, + "learning_rate": 1.7926509504495386e-06, + "loss": 0.7827, + "step": 27207 + }, + { + "epoch": 0.7, + "learning_rate": 1.792634080142481e-06, + "loss": 0.9443, + "step": 27208 + }, + { + "epoch": 0.7, + "learning_rate": 1.7926172092285403e-06, + "loss": 0.7197, + "step": 27209 + }, + { + "epoch": 0.7, + "learning_rate": 1.7926003377077287e-06, + "loss": 0.9688, + "step": 27210 + }, + { + "epoch": 0.7, + "learning_rate": 1.7925834655800599e-06, + "loss": 0.8721, + "step": 27211 + }, + { + "epoch": 0.7, + "learning_rate": 1.7925665928455457e-06, + "loss": 0.6855, + "step": 27212 + }, + { + "epoch": 0.7, + "learning_rate": 1.7925497195042e-06, + "loss": 0.8506, + "step": 27213 + }, + { + "epoch": 0.7, + "learning_rate": 1.7925328455560356e-06, + "loss": 0.7764, + "step": 27214 + }, + { + "epoch": 0.7, + "learning_rate": 1.7925159710010652e-06, + "loss": 0.8027, + "step": 27215 + }, + { + "epoch": 0.7, + "learning_rate": 1.7924990958393016e-06, + "loss": 0.6919, + "step": 27216 + }, + { + "epoch": 0.7, + "learning_rate": 1.7924822200707578e-06, + "loss": 0.7617, + "step": 27217 + }, + { + "epoch": 0.7, + "learning_rate": 1.792465343695447e-06, + "loss": 0.8848, + "step": 27218 + }, + { + "epoch": 0.7, + "learning_rate": 1.792448466713382e-06, + "loss": 0.8623, + "step": 27219 + }, + { + "epoch": 0.7, + "learning_rate": 1.7924315891245754e-06, + "loss": 0.7021, + "step": 27220 + }, + { + "epoch": 0.7, + "learning_rate": 1.7924147109290403e-06, + "loss": 0.6304, + "step": 27221 + }, + { + "epoch": 0.7, + "learning_rate": 1.79239783212679e-06, + "loss": 0.7471, + "step": 27222 + }, + { + "epoch": 0.7, + "learning_rate": 1.792380952717837e-06, + "loss": 0.688, + "step": 27223 + }, + { + "epoch": 0.7, + "learning_rate": 1.7923640727021944e-06, + "loss": 0.8096, + "step": 27224 + }, + { + "epoch": 0.7, + "learning_rate": 1.7923471920798748e-06, + "loss": 0.8203, + "step": 27225 + }, + { + "epoch": 0.7, + "learning_rate": 1.7923303108508918e-06, + "loss": 0.9336, + "step": 27226 + }, + { + "epoch": 0.7, + "learning_rate": 1.7923134290152577e-06, + "loss": 0.9551, + "step": 27227 + }, + { + "epoch": 0.7, + "learning_rate": 1.7922965465729858e-06, + "loss": 0.7434, + "step": 27228 + }, + { + "epoch": 0.7, + "learning_rate": 1.7922796635240887e-06, + "loss": 0.9053, + "step": 27229 + }, + { + "epoch": 0.7, + "learning_rate": 1.7922627798685795e-06, + "loss": 0.6255, + "step": 27230 + }, + { + "epoch": 0.7, + "learning_rate": 1.792245895606471e-06, + "loss": 0.6016, + "step": 27231 + }, + { + "epoch": 0.7, + "learning_rate": 1.7922290107377762e-06, + "loss": 0.8203, + "step": 27232 + }, + { + "epoch": 0.7, + "learning_rate": 1.7922121252625084e-06, + "loss": 1.0146, + "step": 27233 + }, + { + "epoch": 0.7, + "learning_rate": 1.7921952391806801e-06, + "loss": 0.7834, + "step": 27234 + }, + { + "epoch": 0.7, + "learning_rate": 1.7921783524923042e-06, + "loss": 0.8994, + "step": 27235 + }, + { + "epoch": 0.7, + "learning_rate": 1.7921614651973939e-06, + "loss": 0.9854, + "step": 27236 + }, + { + "epoch": 0.7, + "learning_rate": 1.792144577295962e-06, + "loss": 0.6863, + "step": 27237 + }, + { + "epoch": 0.7, + "learning_rate": 1.7921276887880212e-06, + "loss": 0.6853, + "step": 27238 + }, + { + "epoch": 0.7, + "learning_rate": 1.7921107996735846e-06, + "loss": 0.9482, + "step": 27239 + }, + { + "epoch": 0.7, + "learning_rate": 1.7920939099526656e-06, + "loss": 0.7051, + "step": 27240 + }, + { + "epoch": 0.7, + "learning_rate": 1.7920770196252767e-06, + "loss": 0.8975, + "step": 27241 + }, + { + "epoch": 0.7, + "learning_rate": 1.7920601286914306e-06, + "loss": 0.8555, + "step": 27242 + }, + { + "epoch": 0.7, + "learning_rate": 1.7920432371511405e-06, + "loss": 0.9766, + "step": 27243 + }, + { + "epoch": 0.7, + "learning_rate": 1.792026345004419e-06, + "loss": 0.6506, + "step": 27244 + }, + { + "epoch": 0.7, + "learning_rate": 1.7920094522512799e-06, + "loss": 0.8643, + "step": 27245 + }, + { + "epoch": 0.7, + "learning_rate": 1.7919925588917354e-06, + "loss": 0.9004, + "step": 27246 + }, + { + "epoch": 0.7, + "learning_rate": 1.7919756649257985e-06, + "loss": 0.9141, + "step": 27247 + }, + { + "epoch": 0.7, + "learning_rate": 1.7919587703534824e-06, + "loss": 0.8374, + "step": 27248 + }, + { + "epoch": 0.7, + "learning_rate": 1.7919418751747998e-06, + "loss": 0.9375, + "step": 27249 + }, + { + "epoch": 0.7, + "learning_rate": 1.7919249793897637e-06, + "loss": 1.0605, + "step": 27250 + }, + { + "epoch": 0.7, + "learning_rate": 1.791908082998387e-06, + "loss": 0.8887, + "step": 27251 + }, + { + "epoch": 0.7, + "learning_rate": 1.7918911860006829e-06, + "loss": 0.8643, + "step": 27252 + }, + { + "epoch": 0.7, + "learning_rate": 1.791874288396664e-06, + "loss": 0.6016, + "step": 27253 + }, + { + "epoch": 0.7, + "learning_rate": 1.7918573901863434e-06, + "loss": 0.7517, + "step": 27254 + }, + { + "epoch": 0.7, + "learning_rate": 1.7918404913697339e-06, + "loss": 0.9941, + "step": 27255 + }, + { + "epoch": 0.7, + "learning_rate": 1.7918235919468486e-06, + "loss": 0.7988, + "step": 27256 + }, + { + "epoch": 0.7, + "learning_rate": 1.7918066919177004e-06, + "loss": 0.7139, + "step": 27257 + }, + { + "epoch": 0.7, + "learning_rate": 1.7917897912823024e-06, + "loss": 1.0332, + "step": 27258 + }, + { + "epoch": 0.7, + "learning_rate": 1.7917728900406672e-06, + "loss": 0.7534, + "step": 27259 + }, + { + "epoch": 0.7, + "learning_rate": 1.7917559881928077e-06, + "loss": 0.8037, + "step": 27260 + }, + { + "epoch": 0.7, + "learning_rate": 1.7917390857387374e-06, + "loss": 0.8389, + "step": 27261 + }, + { + "epoch": 0.7, + "learning_rate": 1.7917221826784687e-06, + "loss": 0.9268, + "step": 27262 + }, + { + "epoch": 0.7, + "learning_rate": 1.7917052790120149e-06, + "loss": 1.0322, + "step": 27263 + }, + { + "epoch": 0.7, + "learning_rate": 1.7916883747393885e-06, + "loss": 0.8379, + "step": 27264 + }, + { + "epoch": 0.7, + "learning_rate": 1.7916714698606027e-06, + "loss": 0.6572, + "step": 27265 + }, + { + "epoch": 0.7, + "learning_rate": 1.7916545643756708e-06, + "loss": 0.8535, + "step": 27266 + }, + { + "epoch": 0.7, + "learning_rate": 1.7916376582846051e-06, + "loss": 0.9561, + "step": 27267 + }, + { + "epoch": 0.7, + "learning_rate": 1.7916207515874192e-06, + "loss": 1.1133, + "step": 27268 + }, + { + "epoch": 0.7, + "learning_rate": 1.7916038442841252e-06, + "loss": 0.7314, + "step": 27269 + }, + { + "epoch": 0.7, + "learning_rate": 1.7915869363747369e-06, + "loss": 0.9863, + "step": 27270 + }, + { + "epoch": 0.7, + "learning_rate": 1.7915700278592668e-06, + "loss": 0.8306, + "step": 27271 + }, + { + "epoch": 0.7, + "learning_rate": 1.791553118737728e-06, + "loss": 1.0244, + "step": 27272 + }, + { + "epoch": 0.7, + "learning_rate": 1.7915362090101331e-06, + "loss": 0.9775, + "step": 27273 + }, + { + "epoch": 0.7, + "learning_rate": 1.7915192986764956e-06, + "loss": 0.8662, + "step": 27274 + }, + { + "epoch": 0.7, + "learning_rate": 1.7915023877368278e-06, + "loss": 1.1162, + "step": 27275 + }, + { + "epoch": 0.7, + "learning_rate": 1.7914854761911435e-06, + "loss": 1.0098, + "step": 27276 + }, + { + "epoch": 0.7, + "learning_rate": 1.7914685640394548e-06, + "loss": 0.7988, + "step": 27277 + }, + { + "epoch": 0.7, + "learning_rate": 1.7914516512817752e-06, + "loss": 0.9365, + "step": 27278 + }, + { + "epoch": 0.7, + "learning_rate": 1.7914347379181175e-06, + "loss": 0.8794, + "step": 27279 + }, + { + "epoch": 0.7, + "learning_rate": 1.7914178239484942e-06, + "loss": 0.8486, + "step": 27280 + }, + { + "epoch": 0.7, + "learning_rate": 1.7914009093729193e-06, + "loss": 0.7969, + "step": 27281 + }, + { + "epoch": 0.7, + "learning_rate": 1.7913839941914047e-06, + "loss": 1.002, + "step": 27282 + }, + { + "epoch": 0.7, + "learning_rate": 1.791367078403964e-06, + "loss": 0.9189, + "step": 27283 + }, + { + "epoch": 0.7, + "learning_rate": 1.7913501620106097e-06, + "loss": 0.9893, + "step": 27284 + }, + { + "epoch": 0.7, + "learning_rate": 1.791333245011355e-06, + "loss": 0.8818, + "step": 27285 + }, + { + "epoch": 0.7, + "learning_rate": 1.7913163274062128e-06, + "loss": 0.8467, + "step": 27286 + }, + { + "epoch": 0.7, + "learning_rate": 1.7912994091951962e-06, + "loss": 0.9639, + "step": 27287 + }, + { + "epoch": 0.7, + "learning_rate": 1.791282490378318e-06, + "loss": 0.6951, + "step": 27288 + }, + { + "epoch": 0.7, + "learning_rate": 1.7912655709555912e-06, + "loss": 0.8193, + "step": 27289 + }, + { + "epoch": 0.7, + "learning_rate": 1.7912486509270286e-06, + "loss": 1.0186, + "step": 27290 + }, + { + "epoch": 0.7, + "learning_rate": 1.7912317302926433e-06, + "loss": 0.8477, + "step": 27291 + }, + { + "epoch": 0.7, + "learning_rate": 1.7912148090524484e-06, + "loss": 0.8428, + "step": 27292 + }, + { + "epoch": 0.7, + "learning_rate": 1.7911978872064566e-06, + "loss": 0.6992, + "step": 27293 + }, + { + "epoch": 0.7, + "learning_rate": 1.7911809647546812e-06, + "loss": 0.8076, + "step": 27294 + }, + { + "epoch": 0.7, + "learning_rate": 1.7911640416971346e-06, + "loss": 0.876, + "step": 27295 + }, + { + "epoch": 0.7, + "learning_rate": 1.7911471180338302e-06, + "loss": 1.1152, + "step": 27296 + }, + { + "epoch": 0.7, + "learning_rate": 1.7911301937647808e-06, + "loss": 0.6816, + "step": 27297 + }, + { + "epoch": 0.7, + "learning_rate": 1.7911132688899993e-06, + "loss": 0.6689, + "step": 27298 + }, + { + "epoch": 0.7, + "learning_rate": 1.791096343409499e-06, + "loss": 0.7495, + "step": 27299 + }, + { + "epoch": 0.7, + "learning_rate": 1.7910794173232922e-06, + "loss": 0.7676, + "step": 27300 + }, + { + "epoch": 0.7, + "learning_rate": 1.7910624906313925e-06, + "loss": 0.7529, + "step": 27301 + }, + { + "epoch": 0.7, + "learning_rate": 1.7910455633338128e-06, + "loss": 0.9482, + "step": 27302 + }, + { + "epoch": 0.7, + "learning_rate": 1.7910286354305658e-06, + "loss": 0.9199, + "step": 27303 + }, + { + "epoch": 0.7, + "learning_rate": 1.7910117069216644e-06, + "loss": 0.9375, + "step": 27304 + }, + { + "epoch": 0.7, + "learning_rate": 1.7909947778071217e-06, + "loss": 0.8613, + "step": 27305 + }, + { + "epoch": 0.7, + "learning_rate": 1.7909778480869507e-06, + "loss": 0.8936, + "step": 27306 + }, + { + "epoch": 0.7, + "learning_rate": 1.7909609177611644e-06, + "loss": 0.8408, + "step": 27307 + }, + { + "epoch": 0.7, + "learning_rate": 1.7909439868297755e-06, + "loss": 0.8115, + "step": 27308 + }, + { + "epoch": 0.7, + "learning_rate": 1.7909270552927976e-06, + "loss": 0.6313, + "step": 27309 + }, + { + "epoch": 0.7, + "learning_rate": 1.7909101231502427e-06, + "loss": 0.8047, + "step": 27310 + }, + { + "epoch": 0.7, + "learning_rate": 1.7908931904021248e-06, + "loss": 0.8242, + "step": 27311 + }, + { + "epoch": 0.7, + "learning_rate": 1.7908762570484558e-06, + "loss": 0.9736, + "step": 27312 + }, + { + "epoch": 0.7, + "learning_rate": 1.7908593230892498e-06, + "loss": 0.6235, + "step": 27313 + }, + { + "epoch": 0.7, + "learning_rate": 1.7908423885245187e-06, + "loss": 0.6914, + "step": 27314 + }, + { + "epoch": 0.7, + "learning_rate": 1.7908254533542762e-06, + "loss": 0.9004, + "step": 27315 + }, + { + "epoch": 0.7, + "learning_rate": 1.7908085175785349e-06, + "loss": 1.0801, + "step": 27316 + }, + { + "epoch": 0.7, + "learning_rate": 1.790791581197308e-06, + "loss": 0.8354, + "step": 27317 + }, + { + "epoch": 0.7, + "learning_rate": 1.7907746442106082e-06, + "loss": 0.5962, + "step": 27318 + }, + { + "epoch": 0.7, + "learning_rate": 1.7907577066184488e-06, + "loss": 1.0508, + "step": 27319 + }, + { + "epoch": 0.7, + "learning_rate": 1.7907407684208421e-06, + "loss": 0.9482, + "step": 27320 + }, + { + "epoch": 0.7, + "learning_rate": 1.7907238296178021e-06, + "loss": 0.8301, + "step": 27321 + }, + { + "epoch": 0.7, + "learning_rate": 1.7907068902093409e-06, + "loss": 0.6345, + "step": 27322 + }, + { + "epoch": 0.7, + "learning_rate": 1.790689950195472e-06, + "loss": 0.915, + "step": 27323 + }, + { + "epoch": 0.7, + "learning_rate": 1.7906730095762082e-06, + "loss": 0.8945, + "step": 27324 + }, + { + "epoch": 0.7, + "learning_rate": 1.7906560683515625e-06, + "loss": 0.5955, + "step": 27325 + }, + { + "epoch": 0.7, + "learning_rate": 1.7906391265215475e-06, + "loss": 0.7296, + "step": 27326 + }, + { + "epoch": 0.7, + "learning_rate": 1.7906221840861763e-06, + "loss": 0.8018, + "step": 27327 + }, + { + "epoch": 0.7, + "learning_rate": 1.7906052410454627e-06, + "loss": 0.7734, + "step": 27328 + }, + { + "epoch": 0.7, + "learning_rate": 1.7905882973994187e-06, + "loss": 0.7266, + "step": 27329 + }, + { + "epoch": 0.7, + "learning_rate": 1.7905713531480573e-06, + "loss": 0.8672, + "step": 27330 + }, + { + "epoch": 0.7, + "learning_rate": 1.790554408291392e-06, + "loss": 0.7065, + "step": 27331 + }, + { + "epoch": 0.7, + "learning_rate": 1.7905374628294356e-06, + "loss": 0.8643, + "step": 27332 + }, + { + "epoch": 0.7, + "learning_rate": 1.790520516762201e-06, + "loss": 0.7744, + "step": 27333 + }, + { + "epoch": 0.7, + "learning_rate": 1.7905035700897013e-06, + "loss": 0.8105, + "step": 27334 + }, + { + "epoch": 0.7, + "learning_rate": 1.790486622811949e-06, + "loss": 0.8408, + "step": 27335 + }, + { + "epoch": 0.7, + "learning_rate": 1.790469674928958e-06, + "loss": 0.7969, + "step": 27336 + }, + { + "epoch": 0.7, + "learning_rate": 1.7904527264407403e-06, + "loss": 0.8662, + "step": 27337 + }, + { + "epoch": 0.7, + "learning_rate": 1.7904357773473095e-06, + "loss": 0.9121, + "step": 27338 + }, + { + "epoch": 0.7, + "learning_rate": 1.7904188276486782e-06, + "loss": 0.7705, + "step": 27339 + }, + { + "epoch": 0.7, + "learning_rate": 1.7904018773448595e-06, + "loss": 0.8115, + "step": 27340 + }, + { + "epoch": 0.7, + "learning_rate": 1.7903849264358666e-06, + "loss": 0.8203, + "step": 27341 + }, + { + "epoch": 0.7, + "learning_rate": 1.7903679749217122e-06, + "loss": 0.834, + "step": 27342 + }, + { + "epoch": 0.7, + "learning_rate": 1.7903510228024094e-06, + "loss": 0.8818, + "step": 27343 + }, + { + "epoch": 0.7, + "learning_rate": 1.7903340700779712e-06, + "loss": 0.666, + "step": 27344 + }, + { + "epoch": 0.7, + "learning_rate": 1.7903171167484107e-06, + "loss": 0.7451, + "step": 27345 + }, + { + "epoch": 0.7, + "learning_rate": 1.7903001628137403e-06, + "loss": 0.8506, + "step": 27346 + }, + { + "epoch": 0.7, + "learning_rate": 1.7902832082739738e-06, + "loss": 0.8018, + "step": 27347 + }, + { + "epoch": 0.7, + "learning_rate": 1.7902662531291237e-06, + "loss": 0.853, + "step": 27348 + }, + { + "epoch": 0.7, + "learning_rate": 1.790249297379203e-06, + "loss": 0.9219, + "step": 27349 + }, + { + "epoch": 0.7, + "learning_rate": 1.7902323410242249e-06, + "loss": 0.8945, + "step": 27350 + }, + { + "epoch": 0.7, + "learning_rate": 1.790215384064202e-06, + "loss": 0.7402, + "step": 27351 + }, + { + "epoch": 0.7, + "learning_rate": 1.7901984264991477e-06, + "loss": 0.9551, + "step": 27352 + }, + { + "epoch": 0.7, + "learning_rate": 1.7901814683290746e-06, + "loss": 0.7188, + "step": 27353 + }, + { + "epoch": 0.7, + "learning_rate": 1.7901645095539961e-06, + "loss": 1.0889, + "step": 27354 + }, + { + "epoch": 0.7, + "learning_rate": 1.7901475501739248e-06, + "loss": 0.7881, + "step": 27355 + }, + { + "epoch": 0.7, + "learning_rate": 1.7901305901888738e-06, + "loss": 0.7695, + "step": 27356 + }, + { + "epoch": 0.7, + "learning_rate": 1.7901136295988563e-06, + "loss": 0.6953, + "step": 27357 + }, + { + "epoch": 0.7, + "learning_rate": 1.7900966684038852e-06, + "loss": 0.9893, + "step": 27358 + }, + { + "epoch": 0.7, + "learning_rate": 1.790079706603973e-06, + "loss": 0.9053, + "step": 27359 + }, + { + "epoch": 0.7, + "learning_rate": 1.7900627441991336e-06, + "loss": 0.9619, + "step": 27360 + }, + { + "epoch": 0.7, + "learning_rate": 1.7900457811893792e-06, + "loss": 0.9092, + "step": 27361 + }, + { + "epoch": 0.7, + "learning_rate": 1.7900288175747231e-06, + "loss": 0.9082, + "step": 27362 + }, + { + "epoch": 0.7, + "learning_rate": 1.7900118533551782e-06, + "loss": 0.9854, + "step": 27363 + }, + { + "epoch": 0.7, + "learning_rate": 1.789994888530758e-06, + "loss": 0.958, + "step": 27364 + }, + { + "epoch": 0.7, + "learning_rate": 1.7899779231014744e-06, + "loss": 1.165, + "step": 27365 + }, + { + "epoch": 0.7, + "learning_rate": 1.7899609570673416e-06, + "loss": 0.9297, + "step": 27366 + }, + { + "epoch": 0.7, + "learning_rate": 1.7899439904283716e-06, + "loss": 0.7617, + "step": 27367 + }, + { + "epoch": 0.7, + "learning_rate": 1.7899270231845777e-06, + "loss": 0.9082, + "step": 27368 + }, + { + "epoch": 0.7, + "learning_rate": 1.7899100553359735e-06, + "loss": 0.7529, + "step": 27369 + }, + { + "epoch": 0.7, + "learning_rate": 1.789893086882571e-06, + "loss": 0.8584, + "step": 27370 + }, + { + "epoch": 0.7, + "learning_rate": 1.789876117824384e-06, + "loss": 0.752, + "step": 27371 + }, + { + "epoch": 0.7, + "learning_rate": 1.789859148161425e-06, + "loss": 0.9893, + "step": 27372 + }, + { + "epoch": 0.7, + "learning_rate": 1.7898421778937074e-06, + "loss": 0.7354, + "step": 27373 + }, + { + "epoch": 0.7, + "learning_rate": 1.7898252070212439e-06, + "loss": 0.9033, + "step": 27374 + }, + { + "epoch": 0.7, + "learning_rate": 1.7898082355440473e-06, + "loss": 0.709, + "step": 27375 + }, + { + "epoch": 0.7, + "learning_rate": 1.7897912634621312e-06, + "loss": 0.9727, + "step": 27376 + }, + { + "epoch": 0.7, + "learning_rate": 1.789774290775508e-06, + "loss": 0.9053, + "step": 27377 + }, + { + "epoch": 0.7, + "learning_rate": 1.7897573174841912e-06, + "loss": 0.9375, + "step": 27378 + }, + { + "epoch": 0.7, + "learning_rate": 1.7897403435881931e-06, + "loss": 0.8291, + "step": 27379 + }, + { + "epoch": 0.7, + "learning_rate": 1.7897233690875275e-06, + "loss": 0.8164, + "step": 27380 + }, + { + "epoch": 0.7, + "learning_rate": 1.7897063939822071e-06, + "loss": 0.8906, + "step": 27381 + }, + { + "epoch": 0.7, + "learning_rate": 1.7896894182722444e-06, + "loss": 0.7437, + "step": 27382 + }, + { + "epoch": 0.7, + "learning_rate": 1.789672441957653e-06, + "loss": 0.7354, + "step": 27383 + }, + { + "epoch": 0.7, + "learning_rate": 1.7896554650384459e-06, + "loss": 0.8501, + "step": 27384 + }, + { + "epoch": 0.7, + "learning_rate": 1.7896384875146358e-06, + "loss": 0.9336, + "step": 27385 + }, + { + "epoch": 0.7, + "learning_rate": 1.7896215093862358e-06, + "loss": 1.0117, + "step": 27386 + }, + { + "epoch": 0.7, + "learning_rate": 1.789604530653259e-06, + "loss": 0.6309, + "step": 27387 + }, + { + "epoch": 0.7, + "learning_rate": 1.7895875513157184e-06, + "loss": 0.9746, + "step": 27388 + }, + { + "epoch": 0.7, + "learning_rate": 1.7895705713736267e-06, + "loss": 0.9219, + "step": 27389 + }, + { + "epoch": 0.7, + "learning_rate": 1.7895535908269972e-06, + "loss": 0.9258, + "step": 27390 + }, + { + "epoch": 0.7, + "learning_rate": 1.7895366096758426e-06, + "loss": 0.6377, + "step": 27391 + }, + { + "epoch": 0.7, + "learning_rate": 1.7895196279201765e-06, + "loss": 0.875, + "step": 27392 + }, + { + "epoch": 0.7, + "learning_rate": 1.7895026455600113e-06, + "loss": 0.8525, + "step": 27393 + }, + { + "epoch": 0.7, + "learning_rate": 1.7894856625953602e-06, + "loss": 0.7036, + "step": 27394 + }, + { + "epoch": 0.7, + "learning_rate": 1.7894686790262366e-06, + "loss": 0.7915, + "step": 27395 + }, + { + "epoch": 0.7, + "learning_rate": 1.7894516948526529e-06, + "loss": 1.0449, + "step": 27396 + }, + { + "epoch": 0.7, + "learning_rate": 1.789434710074622e-06, + "loss": 0.8213, + "step": 27397 + }, + { + "epoch": 0.7, + "learning_rate": 1.7894177246921575e-06, + "loss": 1.0283, + "step": 27398 + }, + { + "epoch": 0.7, + "learning_rate": 1.7894007387052723e-06, + "loss": 0.9287, + "step": 27399 + }, + { + "epoch": 0.7, + "learning_rate": 1.7893837521139792e-06, + "loss": 0.4854, + "step": 27400 + }, + { + "epoch": 0.7, + "learning_rate": 1.7893667649182912e-06, + "loss": 0.6299, + "step": 27401 + }, + { + "epoch": 0.7, + "learning_rate": 1.7893497771182212e-06, + "loss": 0.998, + "step": 27402 + }, + { + "epoch": 0.7, + "learning_rate": 1.7893327887137825e-06, + "loss": 0.9229, + "step": 27403 + }, + { + "epoch": 0.7, + "learning_rate": 1.789315799704988e-06, + "loss": 0.9224, + "step": 27404 + }, + { + "epoch": 0.7, + "learning_rate": 1.7892988100918509e-06, + "loss": 0.7271, + "step": 27405 + }, + { + "epoch": 0.7, + "learning_rate": 1.7892818198743838e-06, + "loss": 0.8643, + "step": 27406 + }, + { + "epoch": 0.7, + "learning_rate": 1.7892648290525999e-06, + "loss": 0.8262, + "step": 27407 + }, + { + "epoch": 0.7, + "learning_rate": 1.789247837626512e-06, + "loss": 1.083, + "step": 27408 + }, + { + "epoch": 0.7, + "learning_rate": 1.7892308455961337e-06, + "loss": 0.9502, + "step": 27409 + }, + { + "epoch": 0.7, + "learning_rate": 1.7892138529614773e-06, + "loss": 0.9043, + "step": 27410 + }, + { + "epoch": 0.7, + "learning_rate": 1.7891968597225563e-06, + "loss": 0.7822, + "step": 27411 + }, + { + "epoch": 0.7, + "learning_rate": 1.7891798658793835e-06, + "loss": 0.9082, + "step": 27412 + }, + { + "epoch": 0.7, + "learning_rate": 1.789162871431972e-06, + "loss": 0.8145, + "step": 27413 + }, + { + "epoch": 0.7, + "learning_rate": 1.7891458763803349e-06, + "loss": 0.9463, + "step": 27414 + }, + { + "epoch": 0.7, + "learning_rate": 1.7891288807244852e-06, + "loss": 1.0459, + "step": 27415 + }, + { + "epoch": 0.7, + "learning_rate": 1.7891118844644352e-06, + "loss": 0.5898, + "step": 27416 + }, + { + "epoch": 0.7, + "learning_rate": 1.789094887600199e-06, + "loss": 0.6682, + "step": 27417 + }, + { + "epoch": 0.7, + "learning_rate": 1.7890778901317888e-06, + "loss": 0.8623, + "step": 27418 + }, + { + "epoch": 0.7, + "learning_rate": 1.7890608920592186e-06, + "loss": 0.7969, + "step": 27419 + }, + { + "epoch": 0.7, + "learning_rate": 1.7890438933825e-06, + "loss": 1.0156, + "step": 27420 + }, + { + "epoch": 0.7, + "learning_rate": 1.789026894101647e-06, + "loss": 0.792, + "step": 27421 + }, + { + "epoch": 0.7, + "learning_rate": 1.7890098942166728e-06, + "loss": 0.7212, + "step": 27422 + }, + { + "epoch": 0.7, + "learning_rate": 1.7889928937275895e-06, + "loss": 0.8125, + "step": 27423 + }, + { + "epoch": 0.7, + "learning_rate": 1.7889758926344107e-06, + "loss": 0.7812, + "step": 27424 + }, + { + "epoch": 0.7, + "learning_rate": 1.7889588909371495e-06, + "loss": 0.7612, + "step": 27425 + }, + { + "epoch": 0.7, + "learning_rate": 1.7889418886358188e-06, + "loss": 0.8193, + "step": 27426 + }, + { + "epoch": 0.7, + "learning_rate": 1.7889248857304313e-06, + "loss": 0.8325, + "step": 27427 + }, + { + "epoch": 0.7, + "learning_rate": 1.7889078822210006e-06, + "loss": 0.8154, + "step": 27428 + }, + { + "epoch": 0.7, + "learning_rate": 1.7888908781075394e-06, + "loss": 0.7991, + "step": 27429 + }, + { + "epoch": 0.7, + "learning_rate": 1.7888738733900603e-06, + "loss": 0.707, + "step": 27430 + }, + { + "epoch": 0.7, + "learning_rate": 1.7888568680685772e-06, + "loss": 0.8335, + "step": 27431 + }, + { + "epoch": 0.7, + "learning_rate": 1.7888398621431025e-06, + "loss": 0.9531, + "step": 27432 + }, + { + "epoch": 0.7, + "learning_rate": 1.7888228556136493e-06, + "loss": 0.8877, + "step": 27433 + }, + { + "epoch": 0.7, + "learning_rate": 1.7888058484802308e-06, + "loss": 0.8525, + "step": 27434 + }, + { + "epoch": 0.7, + "learning_rate": 1.78878884074286e-06, + "loss": 1.1562, + "step": 27435 + }, + { + "epoch": 0.7, + "learning_rate": 1.78877183240155e-06, + "loss": 0.7383, + "step": 27436 + }, + { + "epoch": 0.7, + "learning_rate": 1.7887548234563132e-06, + "loss": 0.874, + "step": 27437 + }, + { + "epoch": 0.7, + "learning_rate": 1.7887378139071636e-06, + "loss": 0.8877, + "step": 27438 + }, + { + "epoch": 0.7, + "learning_rate": 1.7887208037541135e-06, + "loss": 0.7832, + "step": 27439 + }, + { + "epoch": 0.7, + "learning_rate": 1.788703792997176e-06, + "loss": 0.689, + "step": 27440 + }, + { + "epoch": 0.7, + "learning_rate": 1.7886867816363643e-06, + "loss": 0.8394, + "step": 27441 + }, + { + "epoch": 0.7, + "learning_rate": 1.7886697696716917e-06, + "loss": 0.9355, + "step": 27442 + }, + { + "epoch": 0.7, + "learning_rate": 1.7886527571031707e-06, + "loss": 0.8857, + "step": 27443 + }, + { + "epoch": 0.7, + "learning_rate": 1.7886357439308143e-06, + "loss": 0.749, + "step": 27444 + }, + { + "epoch": 0.7, + "learning_rate": 1.7886187301546363e-06, + "loss": 0.6707, + "step": 27445 + }, + { + "epoch": 0.7, + "learning_rate": 1.788601715774649e-06, + "loss": 1.0137, + "step": 27446 + }, + { + "epoch": 0.7, + "learning_rate": 1.7885847007908654e-06, + "loss": 0.8701, + "step": 27447 + }, + { + "epoch": 0.7, + "learning_rate": 1.788567685203299e-06, + "loss": 0.9277, + "step": 27448 + }, + { + "epoch": 0.7, + "learning_rate": 1.7885506690119624e-06, + "loss": 0.957, + "step": 27449 + }, + { + "epoch": 0.7, + "learning_rate": 1.788533652216869e-06, + "loss": 0.6099, + "step": 27450 + }, + { + "epoch": 0.7, + "learning_rate": 1.7885166348180317e-06, + "loss": 0.8955, + "step": 27451 + }, + { + "epoch": 0.7, + "learning_rate": 1.7884996168154634e-06, + "loss": 0.8555, + "step": 27452 + }, + { + "epoch": 0.7, + "learning_rate": 1.788482598209177e-06, + "loss": 0.8955, + "step": 27453 + }, + { + "epoch": 0.7, + "learning_rate": 1.7884655789991859e-06, + "loss": 0.9941, + "step": 27454 + }, + { + "epoch": 0.7, + "learning_rate": 1.788448559185503e-06, + "loss": 0.9014, + "step": 27455 + }, + { + "epoch": 0.7, + "learning_rate": 1.7884315387681413e-06, + "loss": 0.9824, + "step": 27456 + }, + { + "epoch": 0.7, + "learning_rate": 1.7884145177471135e-06, + "loss": 1.0332, + "step": 27457 + }, + { + "epoch": 0.7, + "learning_rate": 1.7883974961224332e-06, + "loss": 0.7871, + "step": 27458 + }, + { + "epoch": 0.7, + "learning_rate": 1.7883804738941133e-06, + "loss": 0.918, + "step": 27459 + }, + { + "epoch": 0.7, + "learning_rate": 1.7883634510621665e-06, + "loss": 0.875, + "step": 27460 + }, + { + "epoch": 0.7, + "learning_rate": 1.7883464276266062e-06, + "loss": 0.8359, + "step": 27461 + }, + { + "epoch": 0.7, + "learning_rate": 1.7883294035874452e-06, + "loss": 1.043, + "step": 27462 + }, + { + "epoch": 0.7, + "learning_rate": 1.7883123789446968e-06, + "loss": 0.769, + "step": 27463 + }, + { + "epoch": 0.7, + "learning_rate": 1.7882953536983739e-06, + "loss": 0.7314, + "step": 27464 + }, + { + "epoch": 0.7, + "learning_rate": 1.7882783278484891e-06, + "loss": 0.7256, + "step": 27465 + }, + { + "epoch": 0.7, + "learning_rate": 1.788261301395056e-06, + "loss": 0.8174, + "step": 27466 + }, + { + "epoch": 0.7, + "learning_rate": 1.7882442743380875e-06, + "loss": 1.0361, + "step": 27467 + }, + { + "epoch": 0.7, + "learning_rate": 1.7882272466775967e-06, + "loss": 0.9365, + "step": 27468 + }, + { + "epoch": 0.7, + "learning_rate": 1.7882102184135963e-06, + "loss": 0.9185, + "step": 27469 + }, + { + "epoch": 0.7, + "learning_rate": 1.7881931895461e-06, + "loss": 0.9971, + "step": 27470 + }, + { + "epoch": 0.7, + "learning_rate": 1.7881761600751202e-06, + "loss": 0.7358, + "step": 27471 + }, + { + "epoch": 0.7, + "learning_rate": 1.78815913000067e-06, + "loss": 1.0449, + "step": 27472 + }, + { + "epoch": 0.7, + "learning_rate": 1.7881420993227628e-06, + "loss": 0.8008, + "step": 27473 + }, + { + "epoch": 0.7, + "learning_rate": 1.7881250680414112e-06, + "loss": 0.9482, + "step": 27474 + }, + { + "epoch": 0.7, + "learning_rate": 1.7881080361566287e-06, + "loss": 0.7058, + "step": 27475 + }, + { + "epoch": 0.7, + "learning_rate": 1.788091003668428e-06, + "loss": 1.0391, + "step": 27476 + }, + { + "epoch": 0.7, + "learning_rate": 1.7880739705768221e-06, + "loss": 0.8457, + "step": 27477 + }, + { + "epoch": 0.7, + "learning_rate": 1.7880569368818245e-06, + "loss": 0.9473, + "step": 27478 + }, + { + "epoch": 0.7, + "learning_rate": 1.788039902583448e-06, + "loss": 0.8291, + "step": 27479 + }, + { + "epoch": 0.7, + "learning_rate": 1.7880228676817054e-06, + "loss": 0.8633, + "step": 27480 + }, + { + "epoch": 0.7, + "learning_rate": 1.7880058321766098e-06, + "loss": 0.7627, + "step": 27481 + }, + { + "epoch": 0.7, + "learning_rate": 1.7879887960681748e-06, + "loss": 0.9434, + "step": 27482 + }, + { + "epoch": 0.7, + "learning_rate": 1.7879717593564126e-06, + "loss": 0.7212, + "step": 27483 + }, + { + "epoch": 0.7, + "learning_rate": 1.7879547220413368e-06, + "loss": 0.7803, + "step": 27484 + }, + { + "epoch": 0.7, + "learning_rate": 1.7879376841229604e-06, + "loss": 0.9199, + "step": 27485 + }, + { + "epoch": 0.7, + "learning_rate": 1.787920645601296e-06, + "loss": 0.8218, + "step": 27486 + }, + { + "epoch": 0.7, + "learning_rate": 1.7879036064763574e-06, + "loss": 0.7715, + "step": 27487 + }, + { + "epoch": 0.7, + "learning_rate": 1.7878865667481571e-06, + "loss": 0.9736, + "step": 27488 + }, + { + "epoch": 0.7, + "learning_rate": 1.787869526416708e-06, + "loss": 0.7676, + "step": 27489 + }, + { + "epoch": 0.7, + "learning_rate": 1.7878524854820238e-06, + "loss": 1.0156, + "step": 27490 + }, + { + "epoch": 0.7, + "learning_rate": 1.7878354439441169e-06, + "loss": 0.9189, + "step": 27491 + }, + { + "epoch": 0.7, + "learning_rate": 1.7878184018030008e-06, + "loss": 0.8594, + "step": 27492 + }, + { + "epoch": 0.7, + "learning_rate": 1.7878013590586884e-06, + "loss": 0.8701, + "step": 27493 + }, + { + "epoch": 0.7, + "learning_rate": 1.7877843157111924e-06, + "loss": 0.8711, + "step": 27494 + }, + { + "epoch": 0.7, + "learning_rate": 1.7877672717605266e-06, + "loss": 0.8706, + "step": 27495 + }, + { + "epoch": 0.7, + "learning_rate": 1.7877502272067036e-06, + "loss": 0.8936, + "step": 27496 + }, + { + "epoch": 0.7, + "learning_rate": 1.7877331820497364e-06, + "loss": 0.9932, + "step": 27497 + }, + { + "epoch": 0.7, + "learning_rate": 1.7877161362896378e-06, + "loss": 0.6533, + "step": 27498 + }, + { + "epoch": 0.7, + "learning_rate": 1.7876990899264216e-06, + "loss": 1.0195, + "step": 27499 + }, + { + "epoch": 0.7, + "learning_rate": 1.7876820429601003e-06, + "loss": 0.8896, + "step": 27500 + }, + { + "epoch": 0.7, + "learning_rate": 1.787664995390687e-06, + "loss": 0.8018, + "step": 27501 + }, + { + "epoch": 0.7, + "learning_rate": 1.7876479472181946e-06, + "loss": 0.7197, + "step": 27502 + }, + { + "epoch": 0.7, + "learning_rate": 1.7876308984426369e-06, + "loss": 0.998, + "step": 27503 + }, + { + "epoch": 0.7, + "learning_rate": 1.787613849064026e-06, + "loss": 0.9121, + "step": 27504 + }, + { + "epoch": 0.7, + "learning_rate": 1.7875967990823758e-06, + "loss": 0.9346, + "step": 27505 + }, + { + "epoch": 0.7, + "learning_rate": 1.7875797484976986e-06, + "loss": 0.7842, + "step": 27506 + }, + { + "epoch": 0.71, + "learning_rate": 1.787562697310008e-06, + "loss": 0.834, + "step": 27507 + }, + { + "epoch": 0.71, + "learning_rate": 1.7875456455193167e-06, + "loss": 1.0049, + "step": 27508 + }, + { + "epoch": 0.71, + "learning_rate": 1.7875285931256382e-06, + "loss": 0.6953, + "step": 27509 + }, + { + "epoch": 0.71, + "learning_rate": 1.7875115401289849e-06, + "loss": 1.0049, + "step": 27510 + }, + { + "epoch": 0.71, + "learning_rate": 1.7874944865293703e-06, + "loss": 0.9014, + "step": 27511 + }, + { + "epoch": 0.71, + "learning_rate": 1.7874774323268077e-06, + "loss": 0.8789, + "step": 27512 + }, + { + "epoch": 0.71, + "learning_rate": 1.7874603775213096e-06, + "loss": 0.7637, + "step": 27513 + }, + { + "epoch": 0.71, + "learning_rate": 1.7874433221128892e-06, + "loss": 0.5981, + "step": 27514 + }, + { + "epoch": 0.71, + "learning_rate": 1.7874262661015597e-06, + "loss": 0.8857, + "step": 27515 + }, + { + "epoch": 0.71, + "learning_rate": 1.7874092094873343e-06, + "loss": 0.9199, + "step": 27516 + }, + { + "epoch": 0.71, + "learning_rate": 1.7873921522702257e-06, + "loss": 0.9473, + "step": 27517 + }, + { + "epoch": 0.71, + "learning_rate": 1.787375094450247e-06, + "loss": 0.8818, + "step": 27518 + }, + { + "epoch": 0.71, + "learning_rate": 1.7873580360274117e-06, + "loss": 0.8486, + "step": 27519 + }, + { + "epoch": 0.71, + "learning_rate": 1.7873409770017325e-06, + "loss": 0.6167, + "step": 27520 + }, + { + "epoch": 0.71, + "learning_rate": 1.7873239173732225e-06, + "loss": 0.8525, + "step": 27521 + }, + { + "epoch": 0.71, + "learning_rate": 1.7873068571418946e-06, + "loss": 0.917, + "step": 27522 + }, + { + "epoch": 0.71, + "learning_rate": 1.7872897963077623e-06, + "loss": 0.8887, + "step": 27523 + }, + { + "epoch": 0.71, + "learning_rate": 1.787272734870838e-06, + "loss": 0.9775, + "step": 27524 + }, + { + "epoch": 0.71, + "learning_rate": 1.7872556728311356e-06, + "loss": 0.999, + "step": 27525 + }, + { + "epoch": 0.71, + "learning_rate": 1.7872386101886676e-06, + "loss": 0.8682, + "step": 27526 + }, + { + "epoch": 0.71, + "learning_rate": 1.7872215469434471e-06, + "loss": 0.7314, + "step": 27527 + }, + { + "epoch": 0.71, + "learning_rate": 1.7872044830954876e-06, + "loss": 1.0566, + "step": 27528 + }, + { + "epoch": 0.71, + "learning_rate": 1.7871874186448012e-06, + "loss": 0.8604, + "step": 27529 + }, + { + "epoch": 0.71, + "learning_rate": 1.787170353591402e-06, + "loss": 0.7544, + "step": 27530 + }, + { + "epoch": 0.71, + "learning_rate": 1.7871532879353025e-06, + "loss": 0.9482, + "step": 27531 + }, + { + "epoch": 0.71, + "learning_rate": 1.7871362216765161e-06, + "loss": 0.7378, + "step": 27532 + }, + { + "epoch": 0.71, + "learning_rate": 1.7871191548150558e-06, + "loss": 1.0215, + "step": 27533 + }, + { + "epoch": 0.71, + "learning_rate": 1.7871020873509343e-06, + "loss": 1.2529, + "step": 27534 + }, + { + "epoch": 0.71, + "learning_rate": 1.787085019284165e-06, + "loss": 0.7285, + "step": 27535 + }, + { + "epoch": 0.71, + "learning_rate": 1.7870679506147608e-06, + "loss": 0.8975, + "step": 27536 + }, + { + "epoch": 0.71, + "learning_rate": 1.787050881342735e-06, + "loss": 0.8633, + "step": 27537 + }, + { + "epoch": 0.71, + "learning_rate": 1.7870338114681002e-06, + "loss": 0.7295, + "step": 27538 + }, + { + "epoch": 0.71, + "learning_rate": 1.7870167409908703e-06, + "loss": 0.7334, + "step": 27539 + }, + { + "epoch": 0.71, + "learning_rate": 1.7869996699110574e-06, + "loss": 0.9062, + "step": 27540 + }, + { + "epoch": 0.71, + "learning_rate": 1.7869825982286754e-06, + "loss": 0.6338, + "step": 27541 + }, + { + "epoch": 0.71, + "learning_rate": 1.7869655259437368e-06, + "loss": 0.9805, + "step": 27542 + }, + { + "epoch": 0.71, + "learning_rate": 1.7869484530562552e-06, + "loss": 1.0732, + "step": 27543 + }, + { + "epoch": 0.71, + "learning_rate": 1.7869313795662428e-06, + "loss": 0.9004, + "step": 27544 + }, + { + "epoch": 0.71, + "learning_rate": 1.7869143054737137e-06, + "loss": 1.0244, + "step": 27545 + }, + { + "epoch": 0.71, + "learning_rate": 1.7868972307786803e-06, + "loss": 0.9619, + "step": 27546 + }, + { + "epoch": 0.71, + "learning_rate": 1.7868801554811561e-06, + "loss": 0.8936, + "step": 27547 + }, + { + "epoch": 0.71, + "learning_rate": 1.7868630795811538e-06, + "loss": 0.8193, + "step": 27548 + }, + { + "epoch": 0.71, + "learning_rate": 1.7868460030786865e-06, + "loss": 1.0352, + "step": 27549 + }, + { + "epoch": 0.71, + "learning_rate": 1.7868289259737675e-06, + "loss": 0.6919, + "step": 27550 + }, + { + "epoch": 0.71, + "learning_rate": 1.7868118482664096e-06, + "loss": 0.9541, + "step": 27551 + }, + { + "epoch": 0.71, + "learning_rate": 1.7867947699566263e-06, + "loss": 0.8818, + "step": 27552 + }, + { + "epoch": 0.71, + "learning_rate": 1.7867776910444303e-06, + "loss": 0.8486, + "step": 27553 + }, + { + "epoch": 0.71, + "learning_rate": 1.7867606115298347e-06, + "loss": 0.5787, + "step": 27554 + }, + { + "epoch": 0.71, + "learning_rate": 1.786743531412853e-06, + "loss": 1.041, + "step": 27555 + }, + { + "epoch": 0.71, + "learning_rate": 1.7867264506934978e-06, + "loss": 0.9707, + "step": 27556 + }, + { + "epoch": 0.71, + "learning_rate": 1.786709369371782e-06, + "loss": 0.8135, + "step": 27557 + }, + { + "epoch": 0.71, + "learning_rate": 1.7866922874477194e-06, + "loss": 0.8564, + "step": 27558 + }, + { + "epoch": 0.71, + "learning_rate": 1.7866752049213226e-06, + "loss": 0.5417, + "step": 27559 + }, + { + "epoch": 0.71, + "learning_rate": 1.786658121792605e-06, + "loss": 0.9492, + "step": 27560 + }, + { + "epoch": 0.71, + "learning_rate": 1.786641038061579e-06, + "loss": 0.8994, + "step": 27561 + }, + { + "epoch": 0.71, + "learning_rate": 1.7866239537282583e-06, + "loss": 0.7278, + "step": 27562 + }, + { + "epoch": 0.71, + "learning_rate": 1.7866068687926559e-06, + "loss": 0.752, + "step": 27563 + }, + { + "epoch": 0.71, + "learning_rate": 1.7865897832547846e-06, + "loss": 0.7866, + "step": 27564 + }, + { + "epoch": 0.71, + "learning_rate": 1.786572697114658e-06, + "loss": 0.8125, + "step": 27565 + }, + { + "epoch": 0.71, + "learning_rate": 1.7865556103722884e-06, + "loss": 1.0068, + "step": 27566 + }, + { + "epoch": 0.71, + "learning_rate": 1.7865385230276898e-06, + "loss": 0.9717, + "step": 27567 + }, + { + "epoch": 0.71, + "learning_rate": 1.7865214350808744e-06, + "loss": 0.6672, + "step": 27568 + }, + { + "epoch": 0.71, + "learning_rate": 1.7865043465318559e-06, + "loss": 0.8379, + "step": 27569 + }, + { + "epoch": 0.71, + "learning_rate": 1.7864872573806473e-06, + "loss": 0.8657, + "step": 27570 + }, + { + "epoch": 0.71, + "learning_rate": 1.7864701676272614e-06, + "loss": 0.8115, + "step": 27571 + }, + { + "epoch": 0.71, + "learning_rate": 1.7864530772717116e-06, + "loss": 0.9541, + "step": 27572 + }, + { + "epoch": 0.71, + "learning_rate": 1.7864359863140108e-06, + "loss": 0.9268, + "step": 27573 + }, + { + "epoch": 0.71, + "learning_rate": 1.7864188947541718e-06, + "loss": 1.0039, + "step": 27574 + }, + { + "epoch": 0.71, + "learning_rate": 1.7864018025922085e-06, + "loss": 0.7871, + "step": 27575 + }, + { + "epoch": 0.71, + "learning_rate": 1.7863847098281332e-06, + "loss": 0.9395, + "step": 27576 + }, + { + "epoch": 0.71, + "learning_rate": 1.7863676164619595e-06, + "loss": 1.0283, + "step": 27577 + }, + { + "epoch": 0.71, + "learning_rate": 1.7863505224937002e-06, + "loss": 0.8457, + "step": 27578 + }, + { + "epoch": 0.71, + "learning_rate": 1.7863334279233684e-06, + "loss": 0.7881, + "step": 27579 + }, + { + "epoch": 0.71, + "learning_rate": 1.7863163327509772e-06, + "loss": 0.9785, + "step": 27580 + }, + { + "epoch": 0.71, + "learning_rate": 1.7862992369765398e-06, + "loss": 0.96, + "step": 27581 + }, + { + "epoch": 0.71, + "learning_rate": 1.7862821406000692e-06, + "loss": 1.0166, + "step": 27582 + }, + { + "epoch": 0.71, + "learning_rate": 1.7862650436215785e-06, + "loss": 0.7046, + "step": 27583 + }, + { + "epoch": 0.71, + "learning_rate": 1.786247946041081e-06, + "loss": 0.7686, + "step": 27584 + }, + { + "epoch": 0.71, + "learning_rate": 1.7862308478585894e-06, + "loss": 0.8789, + "step": 27585 + }, + { + "epoch": 0.71, + "learning_rate": 1.786213749074117e-06, + "loss": 0.7148, + "step": 27586 + }, + { + "epoch": 0.71, + "learning_rate": 1.786196649687677e-06, + "loss": 0.8018, + "step": 27587 + }, + { + "epoch": 0.71, + "learning_rate": 1.7861795496992824e-06, + "loss": 0.834, + "step": 27588 + }, + { + "epoch": 0.71, + "learning_rate": 1.786162449108946e-06, + "loss": 0.7725, + "step": 27589 + }, + { + "epoch": 0.71, + "learning_rate": 1.7861453479166815e-06, + "loss": 0.9834, + "step": 27590 + }, + { + "epoch": 0.71, + "learning_rate": 1.7861282461225016e-06, + "loss": 0.9395, + "step": 27591 + }, + { + "epoch": 0.71, + "learning_rate": 1.786111143726419e-06, + "loss": 0.6536, + "step": 27592 + }, + { + "epoch": 0.71, + "learning_rate": 1.786094040728448e-06, + "loss": 1.082, + "step": 27593 + }, + { + "epoch": 0.71, + "learning_rate": 1.7860769371286004e-06, + "loss": 0.9756, + "step": 27594 + }, + { + "epoch": 0.71, + "learning_rate": 1.7860598329268899e-06, + "loss": 0.7156, + "step": 27595 + }, + { + "epoch": 0.71, + "learning_rate": 1.7860427281233296e-06, + "loss": 0.9941, + "step": 27596 + }, + { + "epoch": 0.71, + "learning_rate": 1.7860256227179328e-06, + "loss": 0.7356, + "step": 27597 + }, + { + "epoch": 0.71, + "learning_rate": 1.7860085167107118e-06, + "loss": 0.7734, + "step": 27598 + }, + { + "epoch": 0.71, + "learning_rate": 1.7859914101016807e-06, + "loss": 0.9512, + "step": 27599 + }, + { + "epoch": 0.71, + "learning_rate": 1.7859743028908515e-06, + "loss": 0.8086, + "step": 27600 + }, + { + "epoch": 0.71, + "learning_rate": 1.7859571950782387e-06, + "loss": 0.6318, + "step": 27601 + }, + { + "epoch": 0.71, + "learning_rate": 1.7859400866638539e-06, + "loss": 0.8081, + "step": 27602 + }, + { + "epoch": 0.71, + "learning_rate": 1.7859229776477114e-06, + "loss": 0.7959, + "step": 27603 + }, + { + "epoch": 0.71, + "learning_rate": 1.7859058680298236e-06, + "loss": 0.8823, + "step": 27604 + }, + { + "epoch": 0.71, + "learning_rate": 1.7858887578102039e-06, + "loss": 0.6436, + "step": 27605 + }, + { + "epoch": 0.71, + "learning_rate": 1.7858716469888652e-06, + "loss": 0.9229, + "step": 27606 + }, + { + "epoch": 0.71, + "learning_rate": 1.7858545355658208e-06, + "loss": 0.6953, + "step": 27607 + }, + { + "epoch": 0.71, + "learning_rate": 1.7858374235410838e-06, + "loss": 0.998, + "step": 27608 + }, + { + "epoch": 0.71, + "learning_rate": 1.785820310914667e-06, + "loss": 0.9541, + "step": 27609 + }, + { + "epoch": 0.71, + "learning_rate": 1.785803197686584e-06, + "loss": 0.8936, + "step": 27610 + }, + { + "epoch": 0.71, + "learning_rate": 1.7857860838568474e-06, + "loss": 0.9443, + "step": 27611 + }, + { + "epoch": 0.71, + "learning_rate": 1.7857689694254705e-06, + "loss": 1.002, + "step": 27612 + }, + { + "epoch": 0.71, + "learning_rate": 1.7857518543924665e-06, + "loss": 0.7119, + "step": 27613 + }, + { + "epoch": 0.71, + "learning_rate": 1.7857347387578486e-06, + "loss": 0.605, + "step": 27614 + }, + { + "epoch": 0.71, + "learning_rate": 1.7857176225216294e-06, + "loss": 0.71, + "step": 27615 + }, + { + "epoch": 0.71, + "learning_rate": 1.7857005056838226e-06, + "loss": 1.0029, + "step": 27616 + }, + { + "epoch": 0.71, + "learning_rate": 1.785683388244441e-06, + "loss": 0.5664, + "step": 27617 + }, + { + "epoch": 0.71, + "learning_rate": 1.7856662702034977e-06, + "loss": 0.4883, + "step": 27618 + }, + { + "epoch": 0.71, + "learning_rate": 1.7856491515610062e-06, + "loss": 0.9111, + "step": 27619 + }, + { + "epoch": 0.71, + "learning_rate": 1.7856320323169788e-06, + "loss": 0.6033, + "step": 27620 + }, + { + "epoch": 0.71, + "learning_rate": 1.7856149124714293e-06, + "loss": 0.915, + "step": 27621 + }, + { + "epoch": 0.71, + "learning_rate": 1.7855977920243706e-06, + "loss": 0.6858, + "step": 27622 + }, + { + "epoch": 0.71, + "learning_rate": 1.7855806709758157e-06, + "loss": 0.6384, + "step": 27623 + }, + { + "epoch": 0.71, + "learning_rate": 1.7855635493257779e-06, + "loss": 0.6865, + "step": 27624 + }, + { + "epoch": 0.71, + "learning_rate": 1.7855464270742702e-06, + "loss": 0.9414, + "step": 27625 + }, + { + "epoch": 0.71, + "learning_rate": 1.7855293042213052e-06, + "loss": 0.7949, + "step": 27626 + }, + { + "epoch": 0.71, + "learning_rate": 1.7855121807668973e-06, + "loss": 0.8301, + "step": 27627 + }, + { + "epoch": 0.71, + "learning_rate": 1.7854950567110585e-06, + "loss": 0.874, + "step": 27628 + }, + { + "epoch": 0.71, + "learning_rate": 1.7854779320538024e-06, + "loss": 0.8481, + "step": 27629 + }, + { + "epoch": 0.71, + "learning_rate": 1.7854608067951418e-06, + "loss": 0.8223, + "step": 27630 + }, + { + "epoch": 0.71, + "learning_rate": 1.78544368093509e-06, + "loss": 0.8433, + "step": 27631 + }, + { + "epoch": 0.71, + "learning_rate": 1.7854265544736603e-06, + "loss": 0.9697, + "step": 27632 + }, + { + "epoch": 0.71, + "learning_rate": 1.7854094274108653e-06, + "loss": 0.8813, + "step": 27633 + }, + { + "epoch": 0.71, + "learning_rate": 1.7853922997467186e-06, + "loss": 0.9248, + "step": 27634 + }, + { + "epoch": 0.71, + "learning_rate": 1.785375171481233e-06, + "loss": 1.0029, + "step": 27635 + }, + { + "epoch": 0.71, + "learning_rate": 1.785358042614422e-06, + "loss": 0.9316, + "step": 27636 + }, + { + "epoch": 0.71, + "learning_rate": 1.7853409131462982e-06, + "loss": 0.707, + "step": 27637 + }, + { + "epoch": 0.71, + "learning_rate": 1.785323783076875e-06, + "loss": 0.8721, + "step": 27638 + }, + { + "epoch": 0.71, + "learning_rate": 1.7853066524061655e-06, + "loss": 0.9785, + "step": 27639 + }, + { + "epoch": 0.71, + "learning_rate": 1.785289521134183e-06, + "loss": 0.9609, + "step": 27640 + }, + { + "epoch": 0.71, + "learning_rate": 1.7852723892609403e-06, + "loss": 0.8262, + "step": 27641 + }, + { + "epoch": 0.71, + "learning_rate": 1.7852552567864506e-06, + "loss": 0.8262, + "step": 27642 + }, + { + "epoch": 0.71, + "learning_rate": 1.7852381237107271e-06, + "loss": 0.7773, + "step": 27643 + }, + { + "epoch": 0.71, + "learning_rate": 1.7852209900337826e-06, + "loss": 0.9248, + "step": 27644 + }, + { + "epoch": 0.71, + "learning_rate": 1.7852038557556309e-06, + "loss": 0.8545, + "step": 27645 + }, + { + "epoch": 0.71, + "learning_rate": 1.7851867208762846e-06, + "loss": 0.8398, + "step": 27646 + }, + { + "epoch": 0.71, + "learning_rate": 1.7851695853957568e-06, + "loss": 0.7506, + "step": 27647 + }, + { + "epoch": 0.71, + "learning_rate": 1.7851524493140606e-06, + "loss": 1.0098, + "step": 27648 + }, + { + "epoch": 0.71, + "learning_rate": 1.7851353126312096e-06, + "loss": 0.9844, + "step": 27649 + }, + { + "epoch": 0.71, + "learning_rate": 1.7851181753472164e-06, + "loss": 0.8604, + "step": 27650 + }, + { + "epoch": 0.71, + "learning_rate": 1.7851010374620947e-06, + "loss": 0.8633, + "step": 27651 + }, + { + "epoch": 0.71, + "learning_rate": 1.785083898975857e-06, + "loss": 1.0576, + "step": 27652 + }, + { + "epoch": 0.71, + "learning_rate": 1.7850667598885165e-06, + "loss": 0.9258, + "step": 27653 + }, + { + "epoch": 0.71, + "learning_rate": 1.7850496202000866e-06, + "loss": 0.9639, + "step": 27654 + }, + { + "epoch": 0.71, + "learning_rate": 1.7850324799105804e-06, + "loss": 0.7832, + "step": 27655 + }, + { + "epoch": 0.71, + "learning_rate": 1.7850153390200106e-06, + "loss": 1.0742, + "step": 27656 + }, + { + "epoch": 0.71, + "learning_rate": 1.784998197528391e-06, + "loss": 0.8994, + "step": 27657 + }, + { + "epoch": 0.71, + "learning_rate": 1.7849810554357343e-06, + "loss": 0.9141, + "step": 27658 + }, + { + "epoch": 0.71, + "learning_rate": 1.7849639127420534e-06, + "loss": 0.9502, + "step": 27659 + }, + { + "epoch": 0.71, + "learning_rate": 1.7849467694473621e-06, + "loss": 0.8301, + "step": 27660 + }, + { + "epoch": 0.71, + "learning_rate": 1.784929625551673e-06, + "loss": 0.7734, + "step": 27661 + }, + { + "epoch": 0.71, + "learning_rate": 1.7849124810549995e-06, + "loss": 0.9609, + "step": 27662 + }, + { + "epoch": 0.71, + "learning_rate": 1.7848953359573545e-06, + "loss": 1.0381, + "step": 27663 + }, + { + "epoch": 0.71, + "learning_rate": 1.7848781902587511e-06, + "loss": 1.0742, + "step": 27664 + }, + { + "epoch": 0.71, + "learning_rate": 1.7848610439592026e-06, + "loss": 0.5249, + "step": 27665 + }, + { + "epoch": 0.71, + "learning_rate": 1.7848438970587222e-06, + "loss": 0.7588, + "step": 27666 + }, + { + "epoch": 0.71, + "learning_rate": 1.784826749557323e-06, + "loss": 0.7747, + "step": 27667 + }, + { + "epoch": 0.71, + "learning_rate": 1.7848096014550179e-06, + "loss": 0.6714, + "step": 27668 + }, + { + "epoch": 0.71, + "learning_rate": 1.7847924527518203e-06, + "loss": 0.8477, + "step": 27669 + }, + { + "epoch": 0.71, + "learning_rate": 1.784775303447743e-06, + "loss": 0.7471, + "step": 27670 + }, + { + "epoch": 0.71, + "learning_rate": 1.7847581535427994e-06, + "loss": 0.9395, + "step": 27671 + }, + { + "epoch": 0.71, + "learning_rate": 1.7847410030370027e-06, + "loss": 0.7646, + "step": 27672 + }, + { + "epoch": 0.71, + "learning_rate": 1.7847238519303658e-06, + "loss": 0.6123, + "step": 27673 + }, + { + "epoch": 0.71, + "learning_rate": 1.784706700222902e-06, + "loss": 1.1836, + "step": 27674 + }, + { + "epoch": 0.71, + "learning_rate": 1.7846895479146242e-06, + "loss": 0.9229, + "step": 27675 + }, + { + "epoch": 0.71, + "learning_rate": 1.7846723950055457e-06, + "loss": 0.8281, + "step": 27676 + }, + { + "epoch": 0.71, + "learning_rate": 1.7846552414956799e-06, + "loss": 0.9541, + "step": 27677 + }, + { + "epoch": 0.71, + "learning_rate": 1.7846380873850396e-06, + "loss": 0.9141, + "step": 27678 + }, + { + "epoch": 0.71, + "learning_rate": 1.7846209326736376e-06, + "loss": 0.8125, + "step": 27679 + }, + { + "epoch": 0.71, + "learning_rate": 1.784603777361488e-06, + "loss": 0.8633, + "step": 27680 + }, + { + "epoch": 0.71, + "learning_rate": 1.784586621448603e-06, + "loss": 0.7764, + "step": 27681 + }, + { + "epoch": 0.71, + "learning_rate": 1.784569464934996e-06, + "loss": 0.9873, + "step": 27682 + }, + { + "epoch": 0.71, + "learning_rate": 1.7845523078206806e-06, + "loss": 0.9707, + "step": 27683 + }, + { + "epoch": 0.71, + "learning_rate": 1.7845351501056693e-06, + "loss": 0.73, + "step": 27684 + }, + { + "epoch": 0.71, + "learning_rate": 1.7845179917899755e-06, + "loss": 0.9961, + "step": 27685 + }, + { + "epoch": 0.71, + "learning_rate": 1.7845008328736127e-06, + "loss": 1.0127, + "step": 27686 + }, + { + "epoch": 0.71, + "learning_rate": 1.7844836733565932e-06, + "loss": 0.6528, + "step": 27687 + }, + { + "epoch": 0.71, + "learning_rate": 1.7844665132389308e-06, + "loss": 0.7573, + "step": 27688 + }, + { + "epoch": 0.71, + "learning_rate": 1.7844493525206389e-06, + "loss": 0.8408, + "step": 27689 + }, + { + "epoch": 0.71, + "learning_rate": 1.7844321912017296e-06, + "loss": 0.8945, + "step": 27690 + }, + { + "epoch": 0.71, + "learning_rate": 1.7844150292822168e-06, + "loss": 0.8906, + "step": 27691 + }, + { + "epoch": 0.71, + "learning_rate": 1.7843978667621136e-06, + "loss": 0.771, + "step": 27692 + }, + { + "epoch": 0.71, + "learning_rate": 1.7843807036414329e-06, + "loss": 0.8789, + "step": 27693 + }, + { + "epoch": 0.71, + "learning_rate": 1.784363539920188e-06, + "loss": 0.9492, + "step": 27694 + }, + { + "epoch": 0.71, + "learning_rate": 1.7843463755983921e-06, + "loss": 1.1133, + "step": 27695 + }, + { + "epoch": 0.71, + "learning_rate": 1.7843292106760582e-06, + "loss": 0.7407, + "step": 27696 + }, + { + "epoch": 0.71, + "learning_rate": 1.7843120451531994e-06, + "loss": 0.9531, + "step": 27697 + }, + { + "epoch": 0.71, + "learning_rate": 1.7842948790298289e-06, + "loss": 0.8184, + "step": 27698 + }, + { + "epoch": 0.71, + "learning_rate": 1.78427771230596e-06, + "loss": 0.7793, + "step": 27699 + }, + { + "epoch": 0.71, + "learning_rate": 1.7842605449816058e-06, + "loss": 0.9023, + "step": 27700 + }, + { + "epoch": 0.71, + "learning_rate": 1.784243377056779e-06, + "loss": 0.7363, + "step": 27701 + }, + { + "epoch": 0.71, + "learning_rate": 1.7842262085314937e-06, + "loss": 0.9521, + "step": 27702 + }, + { + "epoch": 0.71, + "learning_rate": 1.7842090394057619e-06, + "loss": 0.9717, + "step": 27703 + }, + { + "epoch": 0.71, + "learning_rate": 1.7841918696795975e-06, + "loss": 0.8887, + "step": 27704 + }, + { + "epoch": 0.71, + "learning_rate": 1.7841746993530133e-06, + "loss": 0.7773, + "step": 27705 + }, + { + "epoch": 0.71, + "learning_rate": 1.784157528426023e-06, + "loss": 0.7461, + "step": 27706 + }, + { + "epoch": 0.71, + "learning_rate": 1.784140356898639e-06, + "loss": 0.6714, + "step": 27707 + }, + { + "epoch": 0.71, + "learning_rate": 1.7841231847708745e-06, + "loss": 0.8379, + "step": 27708 + }, + { + "epoch": 0.71, + "learning_rate": 1.7841060120427436e-06, + "loss": 1.0029, + "step": 27709 + }, + { + "epoch": 0.71, + "learning_rate": 1.7840888387142586e-06, + "loss": 0.6686, + "step": 27710 + }, + { + "epoch": 0.71, + "learning_rate": 1.7840716647854324e-06, + "loss": 0.9512, + "step": 27711 + }, + { + "epoch": 0.71, + "learning_rate": 1.7840544902562788e-06, + "loss": 0.957, + "step": 27712 + }, + { + "epoch": 0.71, + "learning_rate": 1.784037315126811e-06, + "loss": 0.9561, + "step": 27713 + }, + { + "epoch": 0.71, + "learning_rate": 1.7840201393970417e-06, + "loss": 0.4406, + "step": 27714 + }, + { + "epoch": 0.71, + "learning_rate": 1.7840029630669843e-06, + "loss": 0.7329, + "step": 27715 + }, + { + "epoch": 0.71, + "learning_rate": 1.7839857861366517e-06, + "loss": 0.7246, + "step": 27716 + }, + { + "epoch": 0.71, + "learning_rate": 1.7839686086060572e-06, + "loss": 1.1064, + "step": 27717 + }, + { + "epoch": 0.71, + "learning_rate": 1.783951430475214e-06, + "loss": 0.7715, + "step": 27718 + }, + { + "epoch": 0.71, + "learning_rate": 1.7839342517441356e-06, + "loss": 0.7461, + "step": 27719 + }, + { + "epoch": 0.71, + "learning_rate": 1.7839170724128346e-06, + "loss": 1.0, + "step": 27720 + }, + { + "epoch": 0.71, + "learning_rate": 1.7838998924813242e-06, + "loss": 0.7529, + "step": 27721 + }, + { + "epoch": 0.71, + "learning_rate": 1.7838827119496176e-06, + "loss": 0.7292, + "step": 27722 + }, + { + "epoch": 0.71, + "learning_rate": 1.7838655308177284e-06, + "loss": 0.7715, + "step": 27723 + }, + { + "epoch": 0.71, + "learning_rate": 1.783848349085669e-06, + "loss": 0.9346, + "step": 27724 + }, + { + "epoch": 0.71, + "learning_rate": 1.7838311667534533e-06, + "loss": 0.8755, + "step": 27725 + }, + { + "epoch": 0.71, + "learning_rate": 1.7838139838210942e-06, + "loss": 0.6641, + "step": 27726 + }, + { + "epoch": 0.71, + "learning_rate": 1.7837968002886043e-06, + "loss": 0.8096, + "step": 27727 + }, + { + "epoch": 0.71, + "learning_rate": 1.7837796161559978e-06, + "loss": 0.6729, + "step": 27728 + }, + { + "epoch": 0.71, + "learning_rate": 1.7837624314232869e-06, + "loss": 1.0293, + "step": 27729 + }, + { + "epoch": 0.71, + "learning_rate": 1.7837452460904851e-06, + "loss": 0.9814, + "step": 27730 + }, + { + "epoch": 0.71, + "learning_rate": 1.7837280601576058e-06, + "loss": 0.9648, + "step": 27731 + }, + { + "epoch": 0.71, + "learning_rate": 1.783710873624662e-06, + "loss": 0.8186, + "step": 27732 + }, + { + "epoch": 0.71, + "learning_rate": 1.7836936864916666e-06, + "loss": 0.6187, + "step": 27733 + }, + { + "epoch": 0.71, + "learning_rate": 1.7836764987586333e-06, + "loss": 0.6562, + "step": 27734 + }, + { + "epoch": 0.71, + "learning_rate": 1.7836593104255745e-06, + "loss": 0.9609, + "step": 27735 + }, + { + "epoch": 0.71, + "learning_rate": 1.783642121492504e-06, + "loss": 1.1172, + "step": 27736 + }, + { + "epoch": 0.71, + "learning_rate": 1.783624931959435e-06, + "loss": 0.9023, + "step": 27737 + }, + { + "epoch": 0.71, + "learning_rate": 1.7836077418263801e-06, + "loss": 0.9082, + "step": 27738 + }, + { + "epoch": 0.71, + "learning_rate": 1.7835905510933529e-06, + "loss": 1.0371, + "step": 27739 + }, + { + "epoch": 0.71, + "learning_rate": 1.7835733597603664e-06, + "loss": 0.8428, + "step": 27740 + }, + { + "epoch": 0.71, + "learning_rate": 1.783556167827434e-06, + "loss": 0.957, + "step": 27741 + }, + { + "epoch": 0.71, + "learning_rate": 1.7835389752945686e-06, + "loss": 0.7676, + "step": 27742 + }, + { + "epoch": 0.71, + "learning_rate": 1.7835217821617833e-06, + "loss": 0.957, + "step": 27743 + }, + { + "epoch": 0.71, + "learning_rate": 1.7835045884290913e-06, + "loss": 0.8047, + "step": 27744 + }, + { + "epoch": 0.71, + "learning_rate": 1.783487394096506e-06, + "loss": 0.7808, + "step": 27745 + }, + { + "epoch": 0.71, + "learning_rate": 1.7834701991640406e-06, + "loss": 1.0186, + "step": 27746 + }, + { + "epoch": 0.71, + "learning_rate": 1.7834530036317079e-06, + "loss": 0.8535, + "step": 27747 + }, + { + "epoch": 0.71, + "learning_rate": 1.7834358074995213e-06, + "loss": 0.7671, + "step": 27748 + }, + { + "epoch": 0.71, + "learning_rate": 1.783418610767494e-06, + "loss": 0.877, + "step": 27749 + }, + { + "epoch": 0.71, + "learning_rate": 1.783401413435639e-06, + "loss": 0.7275, + "step": 27750 + }, + { + "epoch": 0.71, + "learning_rate": 1.7833842155039695e-06, + "loss": 1.0195, + "step": 27751 + }, + { + "epoch": 0.71, + "learning_rate": 1.783367016972499e-06, + "loss": 0.7446, + "step": 27752 + }, + { + "epoch": 0.71, + "learning_rate": 1.7833498178412402e-06, + "loss": 0.8994, + "step": 27753 + }, + { + "epoch": 0.71, + "learning_rate": 1.7833326181102067e-06, + "loss": 0.9678, + "step": 27754 + }, + { + "epoch": 0.71, + "learning_rate": 1.783315417779411e-06, + "loss": 0.9238, + "step": 27755 + }, + { + "epoch": 0.71, + "learning_rate": 1.7832982168488668e-06, + "loss": 0.9258, + "step": 27756 + }, + { + "epoch": 0.71, + "learning_rate": 1.7832810153185873e-06, + "loss": 0.8115, + "step": 27757 + }, + { + "epoch": 0.71, + "learning_rate": 1.7832638131885856e-06, + "loss": 1.0117, + "step": 27758 + }, + { + "epoch": 0.71, + "learning_rate": 1.7832466104588746e-06, + "loss": 0.6506, + "step": 27759 + }, + { + "epoch": 0.71, + "learning_rate": 1.7832294071294677e-06, + "loss": 0.8223, + "step": 27760 + }, + { + "epoch": 0.71, + "learning_rate": 1.7832122032003784e-06, + "loss": 0.9517, + "step": 27761 + }, + { + "epoch": 0.71, + "learning_rate": 1.7831949986716192e-06, + "loss": 0.8555, + "step": 27762 + }, + { + "epoch": 0.71, + "learning_rate": 1.7831777935432037e-06, + "loss": 1.0088, + "step": 27763 + }, + { + "epoch": 0.71, + "learning_rate": 1.783160587815145e-06, + "loss": 0.7217, + "step": 27764 + }, + { + "epoch": 0.71, + "learning_rate": 1.7831433814874563e-06, + "loss": 0.8364, + "step": 27765 + }, + { + "epoch": 0.71, + "learning_rate": 1.7831261745601507e-06, + "loss": 1.1641, + "step": 27766 + }, + { + "epoch": 0.71, + "learning_rate": 1.7831089670332413e-06, + "loss": 1.0166, + "step": 27767 + }, + { + "epoch": 0.71, + "learning_rate": 1.7830917589067417e-06, + "loss": 1.0303, + "step": 27768 + }, + { + "epoch": 0.71, + "learning_rate": 1.7830745501806644e-06, + "loss": 0.7988, + "step": 27769 + }, + { + "epoch": 0.71, + "learning_rate": 1.783057340855023e-06, + "loss": 0.9902, + "step": 27770 + }, + { + "epoch": 0.71, + "learning_rate": 1.7830401309298304e-06, + "loss": 0.7139, + "step": 27771 + }, + { + "epoch": 0.71, + "learning_rate": 1.7830229204051003e-06, + "loss": 0.8857, + "step": 27772 + }, + { + "epoch": 0.71, + "learning_rate": 1.7830057092808452e-06, + "loss": 0.9297, + "step": 27773 + }, + { + "epoch": 0.71, + "learning_rate": 1.782988497557079e-06, + "loss": 0.7578, + "step": 27774 + }, + { + "epoch": 0.71, + "learning_rate": 1.7829712852338146e-06, + "loss": 0.8418, + "step": 27775 + }, + { + "epoch": 0.71, + "learning_rate": 1.7829540723110648e-06, + "loss": 0.8457, + "step": 27776 + }, + { + "epoch": 0.71, + "learning_rate": 1.7829368587888428e-06, + "loss": 0.6592, + "step": 27777 + }, + { + "epoch": 0.71, + "learning_rate": 1.7829196446671625e-06, + "loss": 0.9067, + "step": 27778 + }, + { + "epoch": 0.71, + "learning_rate": 1.7829024299460364e-06, + "loss": 0.7678, + "step": 27779 + }, + { + "epoch": 0.71, + "learning_rate": 1.782885214625478e-06, + "loss": 0.9814, + "step": 27780 + }, + { + "epoch": 0.71, + "learning_rate": 1.7828679987055006e-06, + "loss": 0.6648, + "step": 27781 + }, + { + "epoch": 0.71, + "learning_rate": 1.782850782186117e-06, + "loss": 0.7822, + "step": 27782 + }, + { + "epoch": 0.71, + "learning_rate": 1.7828335650673406e-06, + "loss": 0.9297, + "step": 27783 + }, + { + "epoch": 0.71, + "learning_rate": 1.7828163473491845e-06, + "loss": 0.8145, + "step": 27784 + }, + { + "epoch": 0.71, + "learning_rate": 1.7827991290316617e-06, + "loss": 0.7358, + "step": 27785 + }, + { + "epoch": 0.71, + "learning_rate": 1.7827819101147856e-06, + "loss": 1.0791, + "step": 27786 + }, + { + "epoch": 0.71, + "learning_rate": 1.7827646905985695e-06, + "loss": 0.9922, + "step": 27787 + }, + { + "epoch": 0.71, + "learning_rate": 1.7827474704830268e-06, + "loss": 0.9609, + "step": 27788 + }, + { + "epoch": 0.71, + "learning_rate": 1.78273024976817e-06, + "loss": 0.8477, + "step": 27789 + }, + { + "epoch": 0.71, + "learning_rate": 1.7827130284540128e-06, + "loss": 0.7734, + "step": 27790 + }, + { + "epoch": 0.71, + "learning_rate": 1.7826958065405679e-06, + "loss": 0.7803, + "step": 27791 + }, + { + "epoch": 0.71, + "learning_rate": 1.7826785840278493e-06, + "loss": 0.8652, + "step": 27792 + }, + { + "epoch": 0.71, + "learning_rate": 1.7826613609158693e-06, + "loss": 0.877, + "step": 27793 + }, + { + "epoch": 0.71, + "learning_rate": 1.7826441372046417e-06, + "loss": 1.0107, + "step": 27794 + }, + { + "epoch": 0.71, + "learning_rate": 1.7826269128941795e-06, + "loss": 0.7715, + "step": 27795 + }, + { + "epoch": 0.71, + "learning_rate": 1.7826096879844958e-06, + "loss": 0.8906, + "step": 27796 + }, + { + "epoch": 0.71, + "learning_rate": 1.7825924624756038e-06, + "loss": 1.0566, + "step": 27797 + }, + { + "epoch": 0.71, + "learning_rate": 1.7825752363675166e-06, + "loss": 0.7485, + "step": 27798 + }, + { + "epoch": 0.71, + "learning_rate": 1.782558009660248e-06, + "loss": 0.8242, + "step": 27799 + }, + { + "epoch": 0.71, + "learning_rate": 1.7825407823538101e-06, + "loss": 0.9404, + "step": 27800 + }, + { + "epoch": 0.71, + "learning_rate": 1.7825235544482172e-06, + "loss": 1.1221, + "step": 27801 + }, + { + "epoch": 0.71, + "learning_rate": 1.7825063259434817e-06, + "loss": 0.6758, + "step": 27802 + }, + { + "epoch": 0.71, + "learning_rate": 1.782489096839617e-06, + "loss": 1.002, + "step": 27803 + }, + { + "epoch": 0.71, + "learning_rate": 1.7824718671366368e-06, + "loss": 0.9766, + "step": 27804 + }, + { + "epoch": 0.71, + "learning_rate": 1.7824546368345535e-06, + "loss": 0.6104, + "step": 27805 + }, + { + "epoch": 0.71, + "learning_rate": 1.7824374059333809e-06, + "loss": 0.8447, + "step": 27806 + }, + { + "epoch": 0.71, + "learning_rate": 1.7824201744331318e-06, + "loss": 0.9443, + "step": 27807 + }, + { + "epoch": 0.71, + "learning_rate": 1.7824029423338197e-06, + "loss": 0.9932, + "step": 27808 + }, + { + "epoch": 0.71, + "learning_rate": 1.7823857096354575e-06, + "loss": 0.9287, + "step": 27809 + }, + { + "epoch": 0.71, + "learning_rate": 1.7823684763380585e-06, + "loss": 1.0684, + "step": 27810 + }, + { + "epoch": 0.71, + "learning_rate": 1.7823512424416358e-06, + "loss": 1.0537, + "step": 27811 + }, + { + "epoch": 0.71, + "learning_rate": 1.7823340079462032e-06, + "loss": 0.8555, + "step": 27812 + }, + { + "epoch": 0.71, + "learning_rate": 1.7823167728517729e-06, + "loss": 0.7476, + "step": 27813 + }, + { + "epoch": 0.71, + "learning_rate": 1.7822995371583591e-06, + "loss": 0.8164, + "step": 27814 + }, + { + "epoch": 0.71, + "learning_rate": 1.7822823008659741e-06, + "loss": 1.0654, + "step": 27815 + }, + { + "epoch": 0.71, + "learning_rate": 1.782265063974632e-06, + "loss": 1.0996, + "step": 27816 + }, + { + "epoch": 0.71, + "learning_rate": 1.7822478264843452e-06, + "loss": 1.0732, + "step": 27817 + }, + { + "epoch": 0.71, + "learning_rate": 1.782230588395127e-06, + "loss": 0.8242, + "step": 27818 + }, + { + "epoch": 0.71, + "learning_rate": 1.7822133497069914e-06, + "loss": 1.0908, + "step": 27819 + }, + { + "epoch": 0.71, + "learning_rate": 1.7821961104199504e-06, + "loss": 0.9629, + "step": 27820 + }, + { + "epoch": 0.71, + "learning_rate": 1.7821788705340181e-06, + "loss": 0.897, + "step": 27821 + }, + { + "epoch": 0.71, + "learning_rate": 1.7821616300492073e-06, + "loss": 0.7554, + "step": 27822 + }, + { + "epoch": 0.71, + "learning_rate": 1.7821443889655315e-06, + "loss": 0.8467, + "step": 27823 + }, + { + "epoch": 0.71, + "learning_rate": 1.7821271472830034e-06, + "loss": 0.8862, + "step": 27824 + }, + { + "epoch": 0.71, + "learning_rate": 1.7821099050016366e-06, + "loss": 0.9844, + "step": 27825 + }, + { + "epoch": 0.71, + "learning_rate": 1.7820926621214443e-06, + "loss": 0.8701, + "step": 27826 + }, + { + "epoch": 0.71, + "learning_rate": 1.7820754186424396e-06, + "loss": 0.9307, + "step": 27827 + }, + { + "epoch": 0.71, + "learning_rate": 1.7820581745646357e-06, + "loss": 0.8789, + "step": 27828 + }, + { + "epoch": 0.71, + "learning_rate": 1.7820409298880458e-06, + "loss": 0.8457, + "step": 27829 + }, + { + "epoch": 0.71, + "learning_rate": 1.782023684612683e-06, + "loss": 0.8711, + "step": 27830 + }, + { + "epoch": 0.71, + "learning_rate": 1.782006438738561e-06, + "loss": 0.8164, + "step": 27831 + }, + { + "epoch": 0.71, + "learning_rate": 1.7819891922656922e-06, + "loss": 0.7744, + "step": 27832 + }, + { + "epoch": 0.71, + "learning_rate": 1.7819719451940904e-06, + "loss": 0.7744, + "step": 27833 + }, + { + "epoch": 0.71, + "learning_rate": 1.7819546975237687e-06, + "loss": 0.959, + "step": 27834 + }, + { + "epoch": 0.71, + "learning_rate": 1.7819374492547401e-06, + "loss": 0.8223, + "step": 27835 + }, + { + "epoch": 0.71, + "learning_rate": 1.7819202003870179e-06, + "loss": 0.8135, + "step": 27836 + }, + { + "epoch": 0.71, + "learning_rate": 1.7819029509206157e-06, + "loss": 0.8369, + "step": 27837 + }, + { + "epoch": 0.71, + "learning_rate": 1.781885700855546e-06, + "loss": 0.4861, + "step": 27838 + }, + { + "epoch": 0.71, + "learning_rate": 1.7818684501918226e-06, + "loss": 0.874, + "step": 27839 + }, + { + "epoch": 0.71, + "learning_rate": 1.7818511989294584e-06, + "loss": 0.7812, + "step": 27840 + }, + { + "epoch": 0.71, + "learning_rate": 1.781833947068467e-06, + "loss": 0.959, + "step": 27841 + }, + { + "epoch": 0.71, + "learning_rate": 1.7818166946088607e-06, + "loss": 0.834, + "step": 27842 + }, + { + "epoch": 0.71, + "learning_rate": 1.7817994415506536e-06, + "loss": 0.748, + "step": 27843 + }, + { + "epoch": 0.71, + "learning_rate": 1.7817821878938587e-06, + "loss": 0.6487, + "step": 27844 + }, + { + "epoch": 0.71, + "learning_rate": 1.781764933638489e-06, + "loss": 0.7681, + "step": 27845 + }, + { + "epoch": 0.71, + "learning_rate": 1.781747678784558e-06, + "loss": 0.6362, + "step": 27846 + }, + { + "epoch": 0.71, + "learning_rate": 1.7817304233320784e-06, + "loss": 0.8164, + "step": 27847 + }, + { + "epoch": 0.71, + "learning_rate": 1.781713167281064e-06, + "loss": 0.7285, + "step": 27848 + }, + { + "epoch": 0.71, + "learning_rate": 1.7816959106315279e-06, + "loss": 0.8457, + "step": 27849 + }, + { + "epoch": 0.71, + "learning_rate": 1.7816786533834831e-06, + "loss": 0.8877, + "step": 27850 + }, + { + "epoch": 0.71, + "learning_rate": 1.781661395536943e-06, + "loss": 0.958, + "step": 27851 + }, + { + "epoch": 0.71, + "learning_rate": 1.7816441370919204e-06, + "loss": 0.9053, + "step": 27852 + }, + { + "epoch": 0.71, + "learning_rate": 1.7816268780484288e-06, + "loss": 0.8457, + "step": 27853 + }, + { + "epoch": 0.71, + "learning_rate": 1.7816096184064818e-06, + "loss": 0.9141, + "step": 27854 + }, + { + "epoch": 0.71, + "learning_rate": 1.781592358166092e-06, + "loss": 0.9492, + "step": 27855 + }, + { + "epoch": 0.71, + "learning_rate": 1.781575097327273e-06, + "loss": 0.7842, + "step": 27856 + }, + { + "epoch": 0.71, + "learning_rate": 1.781557835890038e-06, + "loss": 0.7476, + "step": 27857 + }, + { + "epoch": 0.71, + "learning_rate": 1.7815405738543995e-06, + "loss": 0.8979, + "step": 27858 + }, + { + "epoch": 0.71, + "learning_rate": 1.7815233112203721e-06, + "loss": 0.8105, + "step": 27859 + }, + { + "epoch": 0.71, + "learning_rate": 1.7815060479879676e-06, + "loss": 0.7393, + "step": 27860 + }, + { + "epoch": 0.71, + "learning_rate": 1.7814887841572004e-06, + "loss": 0.7598, + "step": 27861 + }, + { + "epoch": 0.71, + "learning_rate": 1.7814715197280828e-06, + "loss": 0.709, + "step": 27862 + }, + { + "epoch": 0.71, + "learning_rate": 1.7814542547006285e-06, + "loss": 0.7949, + "step": 27863 + }, + { + "epoch": 0.71, + "learning_rate": 1.7814369890748506e-06, + "loss": 0.5498, + "step": 27864 + }, + { + "epoch": 0.71, + "learning_rate": 1.7814197228507624e-06, + "loss": 0.7346, + "step": 27865 + }, + { + "epoch": 0.71, + "learning_rate": 1.7814024560283769e-06, + "loss": 0.8955, + "step": 27866 + }, + { + "epoch": 0.71, + "learning_rate": 1.7813851886077074e-06, + "loss": 0.916, + "step": 27867 + }, + { + "epoch": 0.71, + "learning_rate": 1.7813679205887672e-06, + "loss": 0.9121, + "step": 27868 + }, + { + "epoch": 0.71, + "learning_rate": 1.7813506519715697e-06, + "loss": 0.9072, + "step": 27869 + }, + { + "epoch": 0.71, + "learning_rate": 1.781333382756128e-06, + "loss": 0.6814, + "step": 27870 + }, + { + "epoch": 0.71, + "learning_rate": 1.7813161129424552e-06, + "loss": 0.7422, + "step": 27871 + }, + { + "epoch": 0.71, + "learning_rate": 1.7812988425305643e-06, + "loss": 0.6494, + "step": 27872 + }, + { + "epoch": 0.71, + "learning_rate": 1.7812815715204693e-06, + "loss": 0.7832, + "step": 27873 + }, + { + "epoch": 0.71, + "learning_rate": 1.7812642999121827e-06, + "loss": 0.834, + "step": 27874 + }, + { + "epoch": 0.71, + "learning_rate": 1.7812470277057176e-06, + "loss": 0.8203, + "step": 27875 + }, + { + "epoch": 0.71, + "learning_rate": 1.781229754901088e-06, + "loss": 0.8364, + "step": 27876 + }, + { + "epoch": 0.71, + "learning_rate": 1.7812124814983066e-06, + "loss": 0.832, + "step": 27877 + }, + { + "epoch": 0.71, + "learning_rate": 1.7811952074973867e-06, + "loss": 0.9053, + "step": 27878 + }, + { + "epoch": 0.71, + "learning_rate": 1.7811779328983415e-06, + "loss": 1.2246, + "step": 27879 + }, + { + "epoch": 0.71, + "learning_rate": 1.7811606577011844e-06, + "loss": 0.7412, + "step": 27880 + }, + { + "epoch": 0.71, + "learning_rate": 1.7811433819059283e-06, + "loss": 0.8926, + "step": 27881 + }, + { + "epoch": 0.71, + "learning_rate": 1.781126105512587e-06, + "loss": 0.9082, + "step": 27882 + }, + { + "epoch": 0.71, + "learning_rate": 1.781108828521173e-06, + "loss": 0.7485, + "step": 27883 + }, + { + "epoch": 0.71, + "learning_rate": 1.7810915509317e-06, + "loss": 0.9199, + "step": 27884 + }, + { + "epoch": 0.71, + "learning_rate": 1.7810742727441812e-06, + "loss": 0.9541, + "step": 27885 + }, + { + "epoch": 0.71, + "learning_rate": 1.7810569939586295e-06, + "loss": 0.5928, + "step": 27886 + }, + { + "epoch": 0.71, + "learning_rate": 1.7810397145750585e-06, + "loss": 0.7239, + "step": 27887 + }, + { + "epoch": 0.71, + "learning_rate": 1.7810224345934815e-06, + "loss": 0.8877, + "step": 27888 + }, + { + "epoch": 0.71, + "learning_rate": 1.7810051540139113e-06, + "loss": 1.1602, + "step": 27889 + }, + { + "epoch": 0.71, + "learning_rate": 1.7809878728363614e-06, + "loss": 0.6157, + "step": 27890 + }, + { + "epoch": 0.71, + "learning_rate": 1.780970591060845e-06, + "loss": 0.9111, + "step": 27891 + }, + { + "epoch": 0.71, + "learning_rate": 1.7809533086873753e-06, + "loss": 0.8264, + "step": 27892 + }, + { + "epoch": 0.71, + "learning_rate": 1.7809360257159657e-06, + "loss": 0.9219, + "step": 27893 + }, + { + "epoch": 0.71, + "learning_rate": 1.7809187421466292e-06, + "loss": 0.9121, + "step": 27894 + }, + { + "epoch": 0.71, + "learning_rate": 1.7809014579793792e-06, + "loss": 0.9795, + "step": 27895 + }, + { + "epoch": 0.71, + "learning_rate": 1.7808841732142289e-06, + "loss": 1.0918, + "step": 27896 + }, + { + "epoch": 0.72, + "learning_rate": 1.7808668878511913e-06, + "loss": 0.6758, + "step": 27897 + }, + { + "epoch": 0.72, + "learning_rate": 1.78084960189028e-06, + "loss": 0.7363, + "step": 27898 + }, + { + "epoch": 0.72, + "learning_rate": 1.780832315331508e-06, + "loss": 0.8213, + "step": 27899 + }, + { + "epoch": 0.72, + "learning_rate": 1.7808150281748884e-06, + "loss": 0.9326, + "step": 27900 + }, + { + "epoch": 0.72, + "learning_rate": 1.7807977404204348e-06, + "loss": 0.4316, + "step": 27901 + }, + { + "epoch": 0.72, + "learning_rate": 1.7807804520681603e-06, + "loss": 0.9297, + "step": 27902 + }, + { + "epoch": 0.72, + "learning_rate": 1.7807631631180781e-06, + "loss": 0.7607, + "step": 27903 + }, + { + "epoch": 0.72, + "learning_rate": 1.7807458735702014e-06, + "loss": 0.833, + "step": 27904 + }, + { + "epoch": 0.72, + "learning_rate": 1.7807285834245435e-06, + "loss": 0.8574, + "step": 27905 + }, + { + "epoch": 0.72, + "learning_rate": 1.7807112926811179e-06, + "loss": 0.8838, + "step": 27906 + }, + { + "epoch": 0.72, + "learning_rate": 1.7806940013399375e-06, + "loss": 0.8398, + "step": 27907 + }, + { + "epoch": 0.72, + "learning_rate": 1.780676709401015e-06, + "loss": 1.0391, + "step": 27908 + }, + { + "epoch": 0.72, + "learning_rate": 1.7806594168643646e-06, + "loss": 0.5353, + "step": 27909 + }, + { + "epoch": 0.72, + "learning_rate": 1.7806421237299994e-06, + "loss": 0.8799, + "step": 27910 + }, + { + "epoch": 0.72, + "learning_rate": 1.7806248299979322e-06, + "loss": 0.7793, + "step": 27911 + }, + { + "epoch": 0.72, + "learning_rate": 1.7806075356681767e-06, + "loss": 0.8027, + "step": 27912 + }, + { + "epoch": 0.72, + "learning_rate": 1.7805902407407457e-06, + "loss": 0.9326, + "step": 27913 + }, + { + "epoch": 0.72, + "learning_rate": 1.7805729452156526e-06, + "loss": 0.7617, + "step": 27914 + }, + { + "epoch": 0.72, + "learning_rate": 1.7805556490929107e-06, + "loss": 0.8633, + "step": 27915 + }, + { + "epoch": 0.72, + "learning_rate": 1.7805383523725333e-06, + "loss": 0.8203, + "step": 27916 + }, + { + "epoch": 0.72, + "learning_rate": 1.7805210550545334e-06, + "loss": 0.8477, + "step": 27917 + }, + { + "epoch": 0.72, + "learning_rate": 1.7805037571389247e-06, + "loss": 0.6787, + "step": 27918 + }, + { + "epoch": 0.72, + "learning_rate": 1.7804864586257201e-06, + "loss": 0.8359, + "step": 27919 + }, + { + "epoch": 0.72, + "learning_rate": 1.780469159514933e-06, + "loss": 0.7539, + "step": 27920 + }, + { + "epoch": 0.72, + "learning_rate": 1.7804518598065762e-06, + "loss": 0.5693, + "step": 27921 + }, + { + "epoch": 0.72, + "learning_rate": 1.7804345595006636e-06, + "loss": 0.8789, + "step": 27922 + }, + { + "epoch": 0.72, + "learning_rate": 1.7804172585972078e-06, + "loss": 0.6768, + "step": 27923 + }, + { + "epoch": 0.72, + "learning_rate": 1.7803999570962228e-06, + "loss": 0.7891, + "step": 27924 + }, + { + "epoch": 0.72, + "learning_rate": 1.7803826549977213e-06, + "loss": 0.9902, + "step": 27925 + }, + { + "epoch": 0.72, + "learning_rate": 1.7803653523017168e-06, + "loss": 0.5569, + "step": 27926 + }, + { + "epoch": 0.72, + "learning_rate": 1.7803480490082224e-06, + "loss": 1.0137, + "step": 27927 + }, + { + "epoch": 0.72, + "learning_rate": 1.7803307451172511e-06, + "loss": 0.7822, + "step": 27928 + }, + { + "epoch": 0.72, + "learning_rate": 1.7803134406288165e-06, + "loss": 0.8789, + "step": 27929 + }, + { + "epoch": 0.72, + "learning_rate": 1.7802961355429318e-06, + "loss": 0.7007, + "step": 27930 + }, + { + "epoch": 0.72, + "learning_rate": 1.7802788298596102e-06, + "loss": 0.8193, + "step": 27931 + }, + { + "epoch": 0.72, + "learning_rate": 1.7802615235788655e-06, + "loss": 0.6792, + "step": 27932 + }, + { + "epoch": 0.72, + "learning_rate": 1.78024421670071e-06, + "loss": 0.9341, + "step": 27933 + }, + { + "epoch": 0.72, + "learning_rate": 1.7802269092251573e-06, + "loss": 0.8047, + "step": 27934 + }, + { + "epoch": 0.72, + "learning_rate": 1.7802096011522206e-06, + "loss": 0.9248, + "step": 27935 + }, + { + "epoch": 0.72, + "learning_rate": 1.7801922924819136e-06, + "loss": 0.6187, + "step": 27936 + }, + { + "epoch": 0.72, + "learning_rate": 1.7801749832142493e-06, + "loss": 0.7805, + "step": 27937 + }, + { + "epoch": 0.72, + "learning_rate": 1.7801576733492406e-06, + "loss": 0.7012, + "step": 27938 + }, + { + "epoch": 0.72, + "learning_rate": 1.780140362886901e-06, + "loss": 0.853, + "step": 27939 + }, + { + "epoch": 0.72, + "learning_rate": 1.780123051827244e-06, + "loss": 0.6995, + "step": 27940 + }, + { + "epoch": 0.72, + "learning_rate": 1.7801057401702826e-06, + "loss": 0.7617, + "step": 27941 + }, + { + "epoch": 0.72, + "learning_rate": 1.7800884279160303e-06, + "loss": 0.9741, + "step": 27942 + }, + { + "epoch": 0.72, + "learning_rate": 1.7800711150644997e-06, + "loss": 0.7793, + "step": 27943 + }, + { + "epoch": 0.72, + "learning_rate": 1.780053801615705e-06, + "loss": 0.8213, + "step": 27944 + }, + { + "epoch": 0.72, + "learning_rate": 1.7800364875696587e-06, + "loss": 1.0068, + "step": 27945 + }, + { + "epoch": 0.72, + "learning_rate": 1.7800191729263743e-06, + "loss": 0.8828, + "step": 27946 + }, + { + "epoch": 0.72, + "learning_rate": 1.7800018576858652e-06, + "loss": 0.9805, + "step": 27947 + }, + { + "epoch": 0.72, + "learning_rate": 1.7799845418481445e-06, + "loss": 0.6909, + "step": 27948 + }, + { + "epoch": 0.72, + "learning_rate": 1.7799672254132256e-06, + "loss": 1.0283, + "step": 27949 + }, + { + "epoch": 0.72, + "learning_rate": 1.7799499083811215e-06, + "loss": 0.708, + "step": 27950 + }, + { + "epoch": 0.72, + "learning_rate": 1.7799325907518459e-06, + "loss": 0.6514, + "step": 27951 + }, + { + "epoch": 0.72, + "learning_rate": 1.7799152725254114e-06, + "loss": 0.8955, + "step": 27952 + }, + { + "epoch": 0.72, + "learning_rate": 1.7798979537018318e-06, + "loss": 0.8086, + "step": 27953 + }, + { + "epoch": 0.72, + "learning_rate": 1.7798806342811204e-06, + "loss": 0.7256, + "step": 27954 + }, + { + "epoch": 0.72, + "learning_rate": 1.77986331426329e-06, + "loss": 0.7256, + "step": 27955 + }, + { + "epoch": 0.72, + "learning_rate": 1.7798459936483541e-06, + "loss": 0.875, + "step": 27956 + }, + { + "epoch": 0.72, + "learning_rate": 1.7798286724363263e-06, + "loss": 0.8193, + "step": 27957 + }, + { + "epoch": 0.72, + "learning_rate": 1.7798113506272192e-06, + "loss": 1.0439, + "step": 27958 + }, + { + "epoch": 0.72, + "learning_rate": 1.7797940282210464e-06, + "loss": 0.8149, + "step": 27959 + }, + { + "epoch": 0.72, + "learning_rate": 1.7797767052178215e-06, + "loss": 0.8564, + "step": 27960 + }, + { + "epoch": 0.72, + "learning_rate": 1.779759381617557e-06, + "loss": 0.8564, + "step": 27961 + }, + { + "epoch": 0.72, + "learning_rate": 1.779742057420267e-06, + "loss": 0.8867, + "step": 27962 + }, + { + "epoch": 0.72, + "learning_rate": 1.7797247326259641e-06, + "loss": 0.8926, + "step": 27963 + }, + { + "epoch": 0.72, + "learning_rate": 1.7797074072346618e-06, + "loss": 0.7832, + "step": 27964 + }, + { + "epoch": 0.72, + "learning_rate": 1.7796900812463735e-06, + "loss": 0.874, + "step": 27965 + }, + { + "epoch": 0.72, + "learning_rate": 1.7796727546611123e-06, + "loss": 1.0908, + "step": 27966 + }, + { + "epoch": 0.72, + "learning_rate": 1.7796554274788918e-06, + "loss": 0.9893, + "step": 27967 + }, + { + "epoch": 0.72, + "learning_rate": 1.7796380996997247e-06, + "loss": 0.8481, + "step": 27968 + }, + { + "epoch": 0.72, + "learning_rate": 1.7796207713236243e-06, + "loss": 0.9355, + "step": 27969 + }, + { + "epoch": 0.72, + "learning_rate": 1.7796034423506048e-06, + "loss": 0.9043, + "step": 27970 + }, + { + "epoch": 0.72, + "learning_rate": 1.7795861127806782e-06, + "loss": 0.748, + "step": 27971 + }, + { + "epoch": 0.72, + "learning_rate": 1.7795687826138589e-06, + "loss": 0.8818, + "step": 27972 + }, + { + "epoch": 0.72, + "learning_rate": 1.7795514518501592e-06, + "loss": 0.9277, + "step": 27973 + }, + { + "epoch": 0.72, + "learning_rate": 1.7795341204895928e-06, + "loss": 0.7139, + "step": 27974 + }, + { + "epoch": 0.72, + "learning_rate": 1.779516788532173e-06, + "loss": 0.7588, + "step": 27975 + }, + { + "epoch": 0.72, + "learning_rate": 1.779499455977913e-06, + "loss": 1.0371, + "step": 27976 + }, + { + "epoch": 0.72, + "learning_rate": 1.7794821228268264e-06, + "loss": 0.8486, + "step": 27977 + }, + { + "epoch": 0.72, + "learning_rate": 1.779464789078926e-06, + "loss": 0.8965, + "step": 27978 + }, + { + "epoch": 0.72, + "learning_rate": 1.7794474547342254e-06, + "loss": 1.0811, + "step": 27979 + }, + { + "epoch": 0.72, + "learning_rate": 1.7794301197927374e-06, + "loss": 0.9775, + "step": 27980 + }, + { + "epoch": 0.72, + "learning_rate": 1.7794127842544757e-06, + "loss": 0.958, + "step": 27981 + }, + { + "epoch": 0.72, + "learning_rate": 1.7793954481194535e-06, + "loss": 1.0498, + "step": 27982 + }, + { + "epoch": 0.72, + "learning_rate": 1.7793781113876842e-06, + "loss": 1.0732, + "step": 27983 + }, + { + "epoch": 0.72, + "learning_rate": 1.7793607740591808e-06, + "loss": 0.8779, + "step": 27984 + }, + { + "epoch": 0.72, + "learning_rate": 1.7793434361339569e-06, + "loss": 0.9922, + "step": 27985 + }, + { + "epoch": 0.72, + "learning_rate": 1.7793260976120253e-06, + "loss": 0.8457, + "step": 27986 + }, + { + "epoch": 0.72, + "learning_rate": 1.7793087584933995e-06, + "loss": 0.8291, + "step": 27987 + }, + { + "epoch": 0.72, + "learning_rate": 1.7792914187780932e-06, + "loss": 0.9971, + "step": 27988 + }, + { + "epoch": 0.72, + "learning_rate": 1.7792740784661189e-06, + "loss": 1.0967, + "step": 27989 + }, + { + "epoch": 0.72, + "learning_rate": 1.7792567375574903e-06, + "loss": 0.8711, + "step": 27990 + }, + { + "epoch": 0.72, + "learning_rate": 1.7792393960522207e-06, + "loss": 0.7715, + "step": 27991 + }, + { + "epoch": 0.72, + "learning_rate": 1.7792220539503236e-06, + "loss": 0.7407, + "step": 27992 + }, + { + "epoch": 0.72, + "learning_rate": 1.7792047112518116e-06, + "loss": 0.6982, + "step": 27993 + }, + { + "epoch": 0.72, + "learning_rate": 1.7791873679566986e-06, + "loss": 0.7905, + "step": 27994 + }, + { + "epoch": 0.72, + "learning_rate": 1.7791700240649977e-06, + "loss": 0.8213, + "step": 27995 + }, + { + "epoch": 0.72, + "learning_rate": 1.7791526795767217e-06, + "loss": 0.917, + "step": 27996 + }, + { + "epoch": 0.72, + "learning_rate": 1.7791353344918848e-06, + "loss": 0.6597, + "step": 27997 + }, + { + "epoch": 0.72, + "learning_rate": 1.7791179888104999e-06, + "loss": 0.832, + "step": 27998 + }, + { + "epoch": 0.72, + "learning_rate": 1.7791006425325796e-06, + "loss": 0.7598, + "step": 27999 + }, + { + "epoch": 0.72, + "learning_rate": 1.7790832956581384e-06, + "loss": 0.8418, + "step": 28000 + }, + { + "epoch": 0.72, + "learning_rate": 1.7790659481871883e-06, + "loss": 0.7783, + "step": 28001 + }, + { + "epoch": 0.72, + "learning_rate": 1.7790486001197437e-06, + "loss": 0.8994, + "step": 28002 + }, + { + "epoch": 0.72, + "learning_rate": 1.7790312514558172e-06, + "loss": 0.8711, + "step": 28003 + }, + { + "epoch": 0.72, + "learning_rate": 1.7790139021954224e-06, + "loss": 0.8994, + "step": 28004 + }, + { + "epoch": 0.72, + "learning_rate": 1.7789965523385726e-06, + "loss": 0.8633, + "step": 28005 + }, + { + "epoch": 0.72, + "learning_rate": 1.778979201885281e-06, + "loss": 0.9307, + "step": 28006 + }, + { + "epoch": 0.72, + "learning_rate": 1.7789618508355604e-06, + "loss": 0.9209, + "step": 28007 + }, + { + "epoch": 0.72, + "learning_rate": 1.778944499189425e-06, + "loss": 0.7354, + "step": 28008 + }, + { + "epoch": 0.72, + "learning_rate": 1.7789271469468874e-06, + "loss": 0.9482, + "step": 28009 + }, + { + "epoch": 0.72, + "learning_rate": 1.7789097941079609e-06, + "loss": 0.4575, + "step": 28010 + }, + { + "epoch": 0.72, + "learning_rate": 1.778892440672659e-06, + "loss": 0.9062, + "step": 28011 + }, + { + "epoch": 0.72, + "learning_rate": 1.7788750866409954e-06, + "loss": 0.9385, + "step": 28012 + }, + { + "epoch": 0.72, + "learning_rate": 1.7788577320129827e-06, + "loss": 0.709, + "step": 28013 + }, + { + "epoch": 0.72, + "learning_rate": 1.7788403767886344e-06, + "loss": 0.9229, + "step": 28014 + }, + { + "epoch": 0.72, + "learning_rate": 1.7788230209679637e-06, + "loss": 0.7719, + "step": 28015 + }, + { + "epoch": 0.72, + "learning_rate": 1.7788056645509846e-06, + "loss": 0.7451, + "step": 28016 + }, + { + "epoch": 0.72, + "learning_rate": 1.7787883075377093e-06, + "loss": 1.0254, + "step": 28017 + }, + { + "epoch": 0.72, + "learning_rate": 1.7787709499281518e-06, + "loss": 0.7432, + "step": 28018 + }, + { + "epoch": 0.72, + "learning_rate": 1.778753591722325e-06, + "loss": 0.833, + "step": 28019 + }, + { + "epoch": 0.72, + "learning_rate": 1.7787362329202424e-06, + "loss": 0.7959, + "step": 28020 + }, + { + "epoch": 0.72, + "learning_rate": 1.7787188735219175e-06, + "loss": 0.6389, + "step": 28021 + }, + { + "epoch": 0.72, + "learning_rate": 1.7787015135273632e-06, + "loss": 0.8496, + "step": 28022 + }, + { + "epoch": 0.72, + "learning_rate": 1.7786841529365933e-06, + "loss": 1.0718, + "step": 28023 + }, + { + "epoch": 0.72, + "learning_rate": 1.7786667917496203e-06, + "loss": 0.958, + "step": 28024 + }, + { + "epoch": 0.72, + "learning_rate": 1.778649429966458e-06, + "loss": 0.791, + "step": 28025 + }, + { + "epoch": 0.72, + "learning_rate": 1.7786320675871198e-06, + "loss": 0.6709, + "step": 28026 + }, + { + "epoch": 0.72, + "learning_rate": 1.778614704611619e-06, + "loss": 1.0957, + "step": 28027 + }, + { + "epoch": 0.72, + "learning_rate": 1.778597341039968e-06, + "loss": 0.8652, + "step": 28028 + }, + { + "epoch": 0.72, + "learning_rate": 1.7785799768721814e-06, + "loss": 0.853, + "step": 28029 + }, + { + "epoch": 0.72, + "learning_rate": 1.7785626121082719e-06, + "loss": 0.9297, + "step": 28030 + }, + { + "epoch": 0.72, + "learning_rate": 1.7785452467482526e-06, + "loss": 0.9678, + "step": 28031 + }, + { + "epoch": 0.72, + "learning_rate": 1.7785278807921373e-06, + "loss": 0.9014, + "step": 28032 + }, + { + "epoch": 0.72, + "learning_rate": 1.7785105142399388e-06, + "loss": 0.7128, + "step": 28033 + }, + { + "epoch": 0.72, + "learning_rate": 1.7784931470916706e-06, + "loss": 0.8789, + "step": 28034 + }, + { + "epoch": 0.72, + "learning_rate": 1.7784757793473459e-06, + "loss": 1.0254, + "step": 28035 + }, + { + "epoch": 0.72, + "learning_rate": 1.7784584110069783e-06, + "loss": 0.8379, + "step": 28036 + }, + { + "epoch": 0.72, + "learning_rate": 1.778441042070581e-06, + "loss": 0.6826, + "step": 28037 + }, + { + "epoch": 0.72, + "learning_rate": 1.778423672538167e-06, + "loss": 0.748, + "step": 28038 + }, + { + "epoch": 0.72, + "learning_rate": 1.7784063024097496e-06, + "loss": 0.8311, + "step": 28039 + }, + { + "epoch": 0.72, + "learning_rate": 1.7783889316853424e-06, + "loss": 0.5825, + "step": 28040 + }, + { + "epoch": 0.72, + "learning_rate": 1.7783715603649587e-06, + "loss": 0.8608, + "step": 28041 + }, + { + "epoch": 0.72, + "learning_rate": 1.7783541884486116e-06, + "loss": 0.7812, + "step": 28042 + }, + { + "epoch": 0.72, + "learning_rate": 1.7783368159363145e-06, + "loss": 0.709, + "step": 28043 + }, + { + "epoch": 0.72, + "learning_rate": 1.7783194428280808e-06, + "loss": 0.8223, + "step": 28044 + }, + { + "epoch": 0.72, + "learning_rate": 1.7783020691239234e-06, + "loss": 1.0381, + "step": 28045 + }, + { + "epoch": 0.72, + "learning_rate": 1.7782846948238564e-06, + "loss": 0.8145, + "step": 28046 + }, + { + "epoch": 0.72, + "learning_rate": 1.778267319927892e-06, + "loss": 0.7314, + "step": 28047 + }, + { + "epoch": 0.72, + "learning_rate": 1.7782499444360446e-06, + "loss": 1.1201, + "step": 28048 + }, + { + "epoch": 0.72, + "learning_rate": 1.7782325683483266e-06, + "loss": 0.8857, + "step": 28049 + }, + { + "epoch": 0.72, + "learning_rate": 1.7782151916647518e-06, + "loss": 0.6792, + "step": 28050 + }, + { + "epoch": 0.72, + "learning_rate": 1.7781978143853338e-06, + "loss": 1.001, + "step": 28051 + }, + { + "epoch": 0.72, + "learning_rate": 1.7781804365100853e-06, + "loss": 0.7812, + "step": 28052 + }, + { + "epoch": 0.72, + "learning_rate": 1.7781630580390194e-06, + "loss": 0.5264, + "step": 28053 + }, + { + "epoch": 0.72, + "learning_rate": 1.7781456789721504e-06, + "loss": 0.8828, + "step": 28054 + }, + { + "epoch": 0.72, + "learning_rate": 1.7781282993094906e-06, + "loss": 0.6543, + "step": 28055 + }, + { + "epoch": 0.72, + "learning_rate": 1.7781109190510541e-06, + "loss": 0.6685, + "step": 28056 + }, + { + "epoch": 0.72, + "learning_rate": 1.7780935381968537e-06, + "loss": 0.8408, + "step": 28057 + }, + { + "epoch": 0.72, + "learning_rate": 1.778076156746903e-06, + "loss": 0.5991, + "step": 28058 + }, + { + "epoch": 0.72, + "learning_rate": 1.7780587747012149e-06, + "loss": 0.9678, + "step": 28059 + }, + { + "epoch": 0.72, + "learning_rate": 1.778041392059803e-06, + "loss": 0.8311, + "step": 28060 + }, + { + "epoch": 0.72, + "learning_rate": 1.7780240088226806e-06, + "loss": 0.9434, + "step": 28061 + }, + { + "epoch": 0.72, + "learning_rate": 1.7780066249898612e-06, + "loss": 0.8218, + "step": 28062 + }, + { + "epoch": 0.72, + "learning_rate": 1.7779892405613576e-06, + "loss": 0.8223, + "step": 28063 + }, + { + "epoch": 0.72, + "learning_rate": 1.7779718555371837e-06, + "loss": 0.8105, + "step": 28064 + }, + { + "epoch": 0.72, + "learning_rate": 1.7779544699173522e-06, + "loss": 0.752, + "step": 28065 + }, + { + "epoch": 0.72, + "learning_rate": 1.777937083701877e-06, + "loss": 0.8096, + "step": 28066 + }, + { + "epoch": 0.72, + "learning_rate": 1.777919696890771e-06, + "loss": 0.9492, + "step": 28067 + }, + { + "epoch": 0.72, + "learning_rate": 1.7779023094840477e-06, + "loss": 0.6064, + "step": 28068 + }, + { + "epoch": 0.72, + "learning_rate": 1.7778849214817203e-06, + "loss": 0.7891, + "step": 28069 + }, + { + "epoch": 0.72, + "learning_rate": 1.7778675328838023e-06, + "loss": 0.8804, + "step": 28070 + }, + { + "epoch": 0.72, + "learning_rate": 1.7778501436903071e-06, + "loss": 0.6411, + "step": 28071 + }, + { + "epoch": 0.72, + "learning_rate": 1.7778327539012474e-06, + "loss": 0.9844, + "step": 28072 + }, + { + "epoch": 0.72, + "learning_rate": 1.777815363516637e-06, + "loss": 1.0205, + "step": 28073 + }, + { + "epoch": 0.72, + "learning_rate": 1.7777979725364895e-06, + "loss": 0.8906, + "step": 28074 + }, + { + "epoch": 0.72, + "learning_rate": 1.7777805809608174e-06, + "loss": 0.6069, + "step": 28075 + }, + { + "epoch": 0.72, + "learning_rate": 1.7777631887896346e-06, + "loss": 0.7002, + "step": 28076 + }, + { + "epoch": 0.72, + "learning_rate": 1.7777457960229544e-06, + "loss": 0.9751, + "step": 28077 + }, + { + "epoch": 0.72, + "learning_rate": 1.7777284026607901e-06, + "loss": 0.9844, + "step": 28078 + }, + { + "epoch": 0.72, + "learning_rate": 1.7777110087031547e-06, + "loss": 0.7749, + "step": 28079 + }, + { + "epoch": 0.72, + "learning_rate": 1.7776936141500621e-06, + "loss": 0.9482, + "step": 28080 + }, + { + "epoch": 0.72, + "learning_rate": 1.7776762190015248e-06, + "loss": 0.7441, + "step": 28081 + }, + { + "epoch": 0.72, + "learning_rate": 1.7776588232575568e-06, + "loss": 0.8081, + "step": 28082 + }, + { + "epoch": 0.72, + "learning_rate": 1.7776414269181715e-06, + "loss": 0.6748, + "step": 28083 + }, + { + "epoch": 0.72, + "learning_rate": 1.7776240299833813e-06, + "loss": 0.8408, + "step": 28084 + }, + { + "epoch": 0.72, + "learning_rate": 1.7776066324532004e-06, + "loss": 0.6055, + "step": 28085 + }, + { + "epoch": 0.72, + "learning_rate": 1.777589234327642e-06, + "loss": 0.8271, + "step": 28086 + }, + { + "epoch": 0.72, + "learning_rate": 1.777571835606719e-06, + "loss": 0.8687, + "step": 28087 + }, + { + "epoch": 0.72, + "learning_rate": 1.7775544362904453e-06, + "loss": 0.9961, + "step": 28088 + }, + { + "epoch": 0.72, + "learning_rate": 1.7775370363788338e-06, + "loss": 0.7285, + "step": 28089 + }, + { + "epoch": 0.72, + "learning_rate": 1.777519635871898e-06, + "loss": 0.7163, + "step": 28090 + }, + { + "epoch": 0.72, + "learning_rate": 1.777502234769651e-06, + "loss": 1.1113, + "step": 28091 + }, + { + "epoch": 0.72, + "learning_rate": 1.7774848330721063e-06, + "loss": 0.9707, + "step": 28092 + }, + { + "epoch": 0.72, + "learning_rate": 1.7774674307792772e-06, + "loss": 0.8975, + "step": 28093 + }, + { + "epoch": 0.72, + "learning_rate": 1.7774500278911774e-06, + "loss": 0.9307, + "step": 28094 + }, + { + "epoch": 0.72, + "learning_rate": 1.7774326244078194e-06, + "loss": 0.7192, + "step": 28095 + }, + { + "epoch": 0.72, + "learning_rate": 1.7774152203292172e-06, + "loss": 1.0059, + "step": 28096 + }, + { + "epoch": 0.72, + "learning_rate": 1.7773978156553838e-06, + "loss": 0.6453, + "step": 28097 + }, + { + "epoch": 0.72, + "learning_rate": 1.7773804103863328e-06, + "loss": 0.7651, + "step": 28098 + }, + { + "epoch": 0.72, + "learning_rate": 1.7773630045220774e-06, + "loss": 0.8545, + "step": 28099 + }, + { + "epoch": 0.72, + "learning_rate": 1.7773455980626308e-06, + "loss": 0.8516, + "step": 28100 + }, + { + "epoch": 0.72, + "learning_rate": 1.7773281910080064e-06, + "loss": 1.0566, + "step": 28101 + }, + { + "epoch": 0.72, + "learning_rate": 1.7773107833582174e-06, + "loss": 0.8164, + "step": 28102 + }, + { + "epoch": 0.72, + "learning_rate": 1.7772933751132774e-06, + "loss": 0.8032, + "step": 28103 + }, + { + "epoch": 0.72, + "learning_rate": 1.7772759662731999e-06, + "loss": 0.957, + "step": 28104 + }, + { + "epoch": 0.72, + "learning_rate": 1.7772585568379976e-06, + "loss": 0.8672, + "step": 28105 + }, + { + "epoch": 0.72, + "learning_rate": 1.7772411468076843e-06, + "loss": 0.7744, + "step": 28106 + }, + { + "epoch": 0.72, + "learning_rate": 1.777223736182273e-06, + "loss": 0.8594, + "step": 28107 + }, + { + "epoch": 0.72, + "learning_rate": 1.7772063249617775e-06, + "loss": 1.0054, + "step": 28108 + }, + { + "epoch": 0.72, + "learning_rate": 1.7771889131462106e-06, + "loss": 0.8574, + "step": 28109 + }, + { + "epoch": 0.72, + "learning_rate": 1.777171500735586e-06, + "loss": 1.0137, + "step": 28110 + }, + { + "epoch": 0.72, + "learning_rate": 1.777154087729917e-06, + "loss": 0.873, + "step": 28111 + }, + { + "epoch": 0.72, + "learning_rate": 1.7771366741292165e-06, + "loss": 0.5957, + "step": 28112 + }, + { + "epoch": 0.72, + "learning_rate": 1.7771192599334985e-06, + "loss": 0.9346, + "step": 28113 + }, + { + "epoch": 0.72, + "learning_rate": 1.777101845142776e-06, + "loss": 0.7383, + "step": 28114 + }, + { + "epoch": 0.72, + "learning_rate": 1.7770844297570622e-06, + "loss": 0.9434, + "step": 28115 + }, + { + "epoch": 0.72, + "learning_rate": 1.7770670137763707e-06, + "loss": 0.7559, + "step": 28116 + }, + { + "epoch": 0.72, + "learning_rate": 1.7770495972007145e-06, + "loss": 1.0225, + "step": 28117 + }, + { + "epoch": 0.72, + "learning_rate": 1.7770321800301073e-06, + "loss": 1.0205, + "step": 28118 + }, + { + "epoch": 0.72, + "learning_rate": 1.7770147622645623e-06, + "loss": 0.7041, + "step": 28119 + }, + { + "epoch": 0.72, + "learning_rate": 1.776997343904093e-06, + "loss": 0.6548, + "step": 28120 + }, + { + "epoch": 0.72, + "learning_rate": 1.7769799249487126e-06, + "loss": 0.9814, + "step": 28121 + }, + { + "epoch": 0.72, + "learning_rate": 1.776962505398434e-06, + "loss": 1.0898, + "step": 28122 + }, + { + "epoch": 0.72, + "learning_rate": 1.7769450852532712e-06, + "loss": 0.9268, + "step": 28123 + }, + { + "epoch": 0.72, + "learning_rate": 1.7769276645132374e-06, + "loss": 1.0283, + "step": 28124 + }, + { + "epoch": 0.72, + "learning_rate": 1.7769102431783454e-06, + "loss": 0.7585, + "step": 28125 + }, + { + "epoch": 0.72, + "learning_rate": 1.7768928212486092e-06, + "loss": 0.9912, + "step": 28126 + }, + { + "epoch": 0.72, + "learning_rate": 1.776875398724042e-06, + "loss": 0.7549, + "step": 28127 + }, + { + "epoch": 0.72, + "learning_rate": 1.7768579756046568e-06, + "loss": 0.8066, + "step": 28128 + }, + { + "epoch": 0.72, + "learning_rate": 1.7768405518904674e-06, + "loss": 0.9414, + "step": 28129 + }, + { + "epoch": 0.72, + "learning_rate": 1.7768231275814869e-06, + "loss": 0.7715, + "step": 28130 + }, + { + "epoch": 0.72, + "learning_rate": 1.7768057026777284e-06, + "loss": 0.8828, + "step": 28131 + }, + { + "epoch": 0.72, + "learning_rate": 1.7767882771792055e-06, + "loss": 0.8105, + "step": 28132 + }, + { + "epoch": 0.72, + "learning_rate": 1.7767708510859318e-06, + "loss": 0.7012, + "step": 28133 + }, + { + "epoch": 0.72, + "learning_rate": 1.77675342439792e-06, + "loss": 0.5427, + "step": 28134 + }, + { + "epoch": 0.72, + "learning_rate": 1.7767359971151843e-06, + "loss": 1.125, + "step": 28135 + }, + { + "epoch": 0.72, + "learning_rate": 1.7767185692377371e-06, + "loss": 1.0518, + "step": 28136 + }, + { + "epoch": 0.72, + "learning_rate": 1.7767011407655926e-06, + "loss": 0.9551, + "step": 28137 + }, + { + "epoch": 0.72, + "learning_rate": 1.7766837116987636e-06, + "loss": 0.8174, + "step": 28138 + }, + { + "epoch": 0.72, + "learning_rate": 1.7766662820372635e-06, + "loss": 1.0449, + "step": 28139 + }, + { + "epoch": 0.72, + "learning_rate": 1.7766488517811058e-06, + "loss": 0.918, + "step": 28140 + }, + { + "epoch": 0.72, + "learning_rate": 1.776631420930304e-06, + "loss": 0.9785, + "step": 28141 + }, + { + "epoch": 0.72, + "learning_rate": 1.7766139894848708e-06, + "loss": 0.9043, + "step": 28142 + }, + { + "epoch": 0.72, + "learning_rate": 1.7765965574448204e-06, + "loss": 0.9951, + "step": 28143 + }, + { + "epoch": 0.72, + "learning_rate": 1.7765791248101654e-06, + "loss": 1.0117, + "step": 28144 + }, + { + "epoch": 0.72, + "learning_rate": 1.7765616915809197e-06, + "loss": 0.6462, + "step": 28145 + }, + { + "epoch": 0.72, + "learning_rate": 1.7765442577570965e-06, + "loss": 0.6685, + "step": 28146 + }, + { + "epoch": 0.72, + "learning_rate": 1.7765268233387088e-06, + "loss": 0.8794, + "step": 28147 + }, + { + "epoch": 0.72, + "learning_rate": 1.77650938832577e-06, + "loss": 0.9238, + "step": 28148 + }, + { + "epoch": 0.72, + "learning_rate": 1.776491952718294e-06, + "loss": 0.8516, + "step": 28149 + }, + { + "epoch": 0.72, + "learning_rate": 1.776474516516294e-06, + "loss": 1.0146, + "step": 28150 + }, + { + "epoch": 0.72, + "learning_rate": 1.7764570797197829e-06, + "loss": 1.0898, + "step": 28151 + }, + { + "epoch": 0.72, + "learning_rate": 1.7764396423287744e-06, + "loss": 0.6934, + "step": 28152 + }, + { + "epoch": 0.72, + "learning_rate": 1.7764222043432816e-06, + "loss": 0.8789, + "step": 28153 + }, + { + "epoch": 0.72, + "learning_rate": 1.7764047657633184e-06, + "loss": 0.6484, + "step": 28154 + }, + { + "epoch": 0.72, + "learning_rate": 1.7763873265888974e-06, + "loss": 0.8416, + "step": 28155 + }, + { + "epoch": 0.72, + "learning_rate": 1.7763698868200324e-06, + "loss": 0.7632, + "step": 28156 + }, + { + "epoch": 0.72, + "learning_rate": 1.7763524464567368e-06, + "loss": 0.8838, + "step": 28157 + }, + { + "epoch": 0.72, + "learning_rate": 1.7763350054990238e-06, + "loss": 1.0088, + "step": 28158 + }, + { + "epoch": 0.72, + "learning_rate": 1.7763175639469065e-06, + "loss": 0.7588, + "step": 28159 + }, + { + "epoch": 0.72, + "learning_rate": 1.776300121800399e-06, + "loss": 0.6562, + "step": 28160 + }, + { + "epoch": 0.72, + "learning_rate": 1.776282679059514e-06, + "loss": 1.0059, + "step": 28161 + }, + { + "epoch": 0.72, + "learning_rate": 1.7762652357242649e-06, + "loss": 0.75, + "step": 28162 + }, + { + "epoch": 0.72, + "learning_rate": 1.7762477917946654e-06, + "loss": 0.9248, + "step": 28163 + }, + { + "epoch": 0.72, + "learning_rate": 1.7762303472707286e-06, + "loss": 0.7271, + "step": 28164 + }, + { + "epoch": 0.72, + "learning_rate": 1.7762129021524679e-06, + "loss": 0.7866, + "step": 28165 + }, + { + "epoch": 0.72, + "learning_rate": 1.7761954564398965e-06, + "loss": 0.9268, + "step": 28166 + }, + { + "epoch": 0.72, + "learning_rate": 1.7761780101330281e-06, + "loss": 0.8125, + "step": 28167 + }, + { + "epoch": 0.72, + "learning_rate": 1.776160563231876e-06, + "loss": 0.7979, + "step": 28168 + }, + { + "epoch": 0.72, + "learning_rate": 1.7761431157364533e-06, + "loss": 0.6687, + "step": 28169 + }, + { + "epoch": 0.72, + "learning_rate": 1.7761256676467735e-06, + "loss": 0.6309, + "step": 28170 + }, + { + "epoch": 0.72, + "learning_rate": 1.77610821896285e-06, + "loss": 0.7676, + "step": 28171 + }, + { + "epoch": 0.72, + "learning_rate": 1.776090769684696e-06, + "loss": 0.8496, + "step": 28172 + }, + { + "epoch": 0.72, + "learning_rate": 1.7760733198123253e-06, + "loss": 1.0244, + "step": 28173 + }, + { + "epoch": 0.72, + "learning_rate": 1.7760558693457507e-06, + "loss": 0.9365, + "step": 28174 + }, + { + "epoch": 0.72, + "learning_rate": 1.776038418284986e-06, + "loss": 0.9053, + "step": 28175 + }, + { + "epoch": 0.72, + "learning_rate": 1.7760209666300441e-06, + "loss": 0.9189, + "step": 28176 + }, + { + "epoch": 0.72, + "learning_rate": 1.7760035143809387e-06, + "loss": 0.874, + "step": 28177 + }, + { + "epoch": 0.72, + "learning_rate": 1.7759860615376831e-06, + "loss": 0.9258, + "step": 28178 + }, + { + "epoch": 0.72, + "learning_rate": 1.7759686081002907e-06, + "loss": 0.9111, + "step": 28179 + }, + { + "epoch": 0.72, + "learning_rate": 1.775951154068775e-06, + "loss": 0.8955, + "step": 28180 + }, + { + "epoch": 0.72, + "learning_rate": 1.7759336994431488e-06, + "loss": 0.9609, + "step": 28181 + }, + { + "epoch": 0.72, + "learning_rate": 1.775916244223426e-06, + "loss": 0.8506, + "step": 28182 + }, + { + "epoch": 0.72, + "learning_rate": 1.77589878840962e-06, + "loss": 0.8496, + "step": 28183 + }, + { + "epoch": 0.72, + "learning_rate": 1.7758813320017437e-06, + "loss": 0.7471, + "step": 28184 + }, + { + "epoch": 0.72, + "learning_rate": 1.7758638749998108e-06, + "loss": 1.0146, + "step": 28185 + }, + { + "epoch": 0.72, + "learning_rate": 1.7758464174038345e-06, + "loss": 0.9814, + "step": 28186 + }, + { + "epoch": 0.72, + "learning_rate": 1.7758289592138285e-06, + "loss": 0.9248, + "step": 28187 + }, + { + "epoch": 0.72, + "learning_rate": 1.775811500429806e-06, + "loss": 0.8955, + "step": 28188 + }, + { + "epoch": 0.72, + "learning_rate": 1.77579404105178e-06, + "loss": 0.8662, + "step": 28189 + }, + { + "epoch": 0.72, + "learning_rate": 1.7757765810797647e-06, + "loss": 0.7144, + "step": 28190 + }, + { + "epoch": 0.72, + "learning_rate": 1.7757591205137724e-06, + "loss": 0.7207, + "step": 28191 + }, + { + "epoch": 0.72, + "learning_rate": 1.7757416593538173e-06, + "loss": 0.8057, + "step": 28192 + }, + { + "epoch": 0.72, + "learning_rate": 1.7757241975999121e-06, + "loss": 0.7891, + "step": 28193 + }, + { + "epoch": 0.72, + "learning_rate": 1.775706735252071e-06, + "loss": 1.002, + "step": 28194 + }, + { + "epoch": 0.72, + "learning_rate": 1.775689272310307e-06, + "loss": 1.0654, + "step": 28195 + }, + { + "epoch": 0.72, + "learning_rate": 1.775671808774633e-06, + "loss": 0.6621, + "step": 28196 + }, + { + "epoch": 0.72, + "learning_rate": 1.775654344645063e-06, + "loss": 1.0293, + "step": 28197 + }, + { + "epoch": 0.72, + "learning_rate": 1.77563687992161e-06, + "loss": 0.7451, + "step": 28198 + }, + { + "epoch": 0.72, + "learning_rate": 1.7756194146042876e-06, + "loss": 0.7905, + "step": 28199 + }, + { + "epoch": 0.72, + "learning_rate": 1.775601948693109e-06, + "loss": 0.7178, + "step": 28200 + }, + { + "epoch": 0.72, + "learning_rate": 1.7755844821880877e-06, + "loss": 0.9277, + "step": 28201 + }, + { + "epoch": 0.72, + "learning_rate": 1.775567015089237e-06, + "loss": 0.8984, + "step": 28202 + }, + { + "epoch": 0.72, + "learning_rate": 1.7755495473965703e-06, + "loss": 0.8184, + "step": 28203 + }, + { + "epoch": 0.72, + "learning_rate": 1.7755320791101007e-06, + "loss": 0.7197, + "step": 28204 + }, + { + "epoch": 0.72, + "learning_rate": 1.7755146102298424e-06, + "loss": 0.8149, + "step": 28205 + }, + { + "epoch": 0.72, + "learning_rate": 1.775497140755808e-06, + "loss": 0.9404, + "step": 28206 + }, + { + "epoch": 0.72, + "learning_rate": 1.775479670688011e-06, + "loss": 0.9375, + "step": 28207 + }, + { + "epoch": 0.72, + "learning_rate": 1.7754622000264648e-06, + "loss": 0.9082, + "step": 28208 + }, + { + "epoch": 0.72, + "learning_rate": 1.775444728771183e-06, + "loss": 0.8516, + "step": 28209 + }, + { + "epoch": 0.72, + "learning_rate": 1.775427256922179e-06, + "loss": 0.8516, + "step": 28210 + }, + { + "epoch": 0.72, + "learning_rate": 1.7754097844794656e-06, + "loss": 0.9775, + "step": 28211 + }, + { + "epoch": 0.72, + "learning_rate": 1.7753923114430566e-06, + "loss": 0.9668, + "step": 28212 + }, + { + "epoch": 0.72, + "learning_rate": 1.7753748378129658e-06, + "loss": 0.9346, + "step": 28213 + }, + { + "epoch": 0.72, + "learning_rate": 1.7753573635892059e-06, + "loss": 0.7666, + "step": 28214 + }, + { + "epoch": 0.72, + "learning_rate": 1.7753398887717906e-06, + "loss": 0.8477, + "step": 28215 + }, + { + "epoch": 0.72, + "learning_rate": 1.775322413360733e-06, + "loss": 0.958, + "step": 28216 + }, + { + "epoch": 0.72, + "learning_rate": 1.7753049373560467e-06, + "loss": 0.7095, + "step": 28217 + }, + { + "epoch": 0.72, + "learning_rate": 1.7752874607577453e-06, + "loss": 0.8779, + "step": 28218 + }, + { + "epoch": 0.72, + "learning_rate": 1.7752699835658415e-06, + "loss": 0.8213, + "step": 28219 + }, + { + "epoch": 0.72, + "learning_rate": 1.7752525057803496e-06, + "loss": 0.7275, + "step": 28220 + }, + { + "epoch": 0.72, + "learning_rate": 1.7752350274012824e-06, + "loss": 0.8662, + "step": 28221 + }, + { + "epoch": 0.72, + "learning_rate": 1.7752175484286532e-06, + "loss": 0.8555, + "step": 28222 + }, + { + "epoch": 0.72, + "learning_rate": 1.7752000688624756e-06, + "loss": 0.7153, + "step": 28223 + }, + { + "epoch": 0.72, + "learning_rate": 1.775182588702763e-06, + "loss": 0.877, + "step": 28224 + }, + { + "epoch": 0.72, + "learning_rate": 1.7751651079495287e-06, + "loss": 0.9141, + "step": 28225 + }, + { + "epoch": 0.72, + "learning_rate": 1.775147626602786e-06, + "loss": 0.6384, + "step": 28226 + }, + { + "epoch": 0.72, + "learning_rate": 1.7751301446625488e-06, + "loss": 0.8184, + "step": 28227 + }, + { + "epoch": 0.72, + "learning_rate": 1.7751126621288298e-06, + "loss": 0.8242, + "step": 28228 + }, + { + "epoch": 0.72, + "learning_rate": 1.7750951790016425e-06, + "loss": 0.8506, + "step": 28229 + }, + { + "epoch": 0.72, + "learning_rate": 1.7750776952810009e-06, + "loss": 0.793, + "step": 28230 + }, + { + "epoch": 0.72, + "learning_rate": 1.7750602109669178e-06, + "loss": 0.9346, + "step": 28231 + }, + { + "epoch": 0.72, + "learning_rate": 1.7750427260594068e-06, + "loss": 0.8994, + "step": 28232 + }, + { + "epoch": 0.72, + "learning_rate": 1.7750252405584808e-06, + "loss": 0.7185, + "step": 28233 + }, + { + "epoch": 0.72, + "learning_rate": 1.775007754464154e-06, + "loss": 0.8794, + "step": 28234 + }, + { + "epoch": 0.72, + "learning_rate": 1.7749902677764394e-06, + "loss": 0.8545, + "step": 28235 + }, + { + "epoch": 0.72, + "learning_rate": 1.7749727804953503e-06, + "loss": 0.8115, + "step": 28236 + }, + { + "epoch": 0.72, + "learning_rate": 1.7749552926209001e-06, + "loss": 0.8887, + "step": 28237 + }, + { + "epoch": 0.72, + "learning_rate": 1.7749378041531023e-06, + "loss": 0.792, + "step": 28238 + }, + { + "epoch": 0.72, + "learning_rate": 1.7749203150919705e-06, + "loss": 0.915, + "step": 28239 + }, + { + "epoch": 0.72, + "learning_rate": 1.7749028254375174e-06, + "loss": 0.7847, + "step": 28240 + }, + { + "epoch": 0.72, + "learning_rate": 1.774885335189757e-06, + "loss": 0.8291, + "step": 28241 + }, + { + "epoch": 0.72, + "learning_rate": 1.774867844348703e-06, + "loss": 0.8501, + "step": 28242 + }, + { + "epoch": 0.72, + "learning_rate": 1.7748503529143677e-06, + "loss": 0.7437, + "step": 28243 + }, + { + "epoch": 0.72, + "learning_rate": 1.7748328608867653e-06, + "loss": 0.9014, + "step": 28244 + }, + { + "epoch": 0.72, + "learning_rate": 1.774815368265909e-06, + "loss": 0.6998, + "step": 28245 + }, + { + "epoch": 0.72, + "learning_rate": 1.7747978750518123e-06, + "loss": 0.8535, + "step": 28246 + }, + { + "epoch": 0.72, + "learning_rate": 1.7747803812444887e-06, + "loss": 1.0498, + "step": 28247 + }, + { + "epoch": 0.72, + "learning_rate": 1.7747628868439508e-06, + "loss": 0.8274, + "step": 28248 + }, + { + "epoch": 0.72, + "learning_rate": 1.7747453918502129e-06, + "loss": 0.9053, + "step": 28249 + }, + { + "epoch": 0.72, + "learning_rate": 1.774727896263288e-06, + "loss": 0.9238, + "step": 28250 + }, + { + "epoch": 0.72, + "learning_rate": 1.7747104000831898e-06, + "loss": 0.9004, + "step": 28251 + }, + { + "epoch": 0.72, + "learning_rate": 1.7746929033099312e-06, + "loss": 0.7935, + "step": 28252 + }, + { + "epoch": 0.72, + "learning_rate": 1.774675405943526e-06, + "loss": 0.8911, + "step": 28253 + }, + { + "epoch": 0.72, + "learning_rate": 1.7746579079839874e-06, + "loss": 0.8867, + "step": 28254 + }, + { + "epoch": 0.72, + "learning_rate": 1.774640409431329e-06, + "loss": 0.897, + "step": 28255 + }, + { + "epoch": 0.72, + "learning_rate": 1.774622910285564e-06, + "loss": 1.1309, + "step": 28256 + }, + { + "epoch": 0.72, + "learning_rate": 1.7746054105467058e-06, + "loss": 0.8926, + "step": 28257 + }, + { + "epoch": 0.72, + "learning_rate": 1.7745879102147679e-06, + "loss": 1.0752, + "step": 28258 + }, + { + "epoch": 0.72, + "learning_rate": 1.7745704092897634e-06, + "loss": 0.9492, + "step": 28259 + }, + { + "epoch": 0.72, + "learning_rate": 1.7745529077717066e-06, + "loss": 0.7939, + "step": 28260 + }, + { + "epoch": 0.72, + "learning_rate": 1.7745354056606096e-06, + "loss": 0.7329, + "step": 28261 + }, + { + "epoch": 0.72, + "learning_rate": 1.7745179029564868e-06, + "loss": 0.9189, + "step": 28262 + }, + { + "epoch": 0.72, + "learning_rate": 1.774500399659351e-06, + "loss": 1.0811, + "step": 28263 + }, + { + "epoch": 0.72, + "learning_rate": 1.7744828957692163e-06, + "loss": 0.7529, + "step": 28264 + }, + { + "epoch": 0.72, + "learning_rate": 1.7744653912860952e-06, + "loss": 0.9541, + "step": 28265 + }, + { + "epoch": 0.72, + "learning_rate": 1.7744478862100019e-06, + "loss": 0.9668, + "step": 28266 + }, + { + "epoch": 0.72, + "learning_rate": 1.7744303805409491e-06, + "loss": 1.1348, + "step": 28267 + }, + { + "epoch": 0.72, + "learning_rate": 1.7744128742789508e-06, + "loss": 0.5928, + "step": 28268 + }, + { + "epoch": 0.72, + "learning_rate": 1.7743953674240202e-06, + "loss": 0.8936, + "step": 28269 + }, + { + "epoch": 0.72, + "learning_rate": 1.7743778599761705e-06, + "loss": 0.7432, + "step": 28270 + }, + { + "epoch": 0.72, + "learning_rate": 1.7743603519354155e-06, + "loss": 0.8252, + "step": 28271 + }, + { + "epoch": 0.72, + "learning_rate": 1.7743428433017682e-06, + "loss": 1.0215, + "step": 28272 + }, + { + "epoch": 0.72, + "learning_rate": 1.7743253340752422e-06, + "loss": 0.7866, + "step": 28273 + }, + { + "epoch": 0.72, + "learning_rate": 1.7743078242558509e-06, + "loss": 0.8994, + "step": 28274 + }, + { + "epoch": 0.72, + "learning_rate": 1.7742903138436078e-06, + "loss": 0.8477, + "step": 28275 + }, + { + "epoch": 0.72, + "learning_rate": 1.7742728028385261e-06, + "loss": 0.8301, + "step": 28276 + }, + { + "epoch": 0.72, + "learning_rate": 1.7742552912406196e-06, + "loss": 0.8867, + "step": 28277 + }, + { + "epoch": 0.72, + "learning_rate": 1.7742377790499013e-06, + "loss": 0.8604, + "step": 28278 + }, + { + "epoch": 0.72, + "learning_rate": 1.7742202662663846e-06, + "loss": 0.9385, + "step": 28279 + }, + { + "epoch": 0.72, + "learning_rate": 1.7742027528900829e-06, + "loss": 0.96, + "step": 28280 + }, + { + "epoch": 0.72, + "learning_rate": 1.77418523892101e-06, + "loss": 0.9072, + "step": 28281 + }, + { + "epoch": 0.72, + "learning_rate": 1.7741677243591791e-06, + "loss": 0.8623, + "step": 28282 + }, + { + "epoch": 0.72, + "learning_rate": 1.7741502092046034e-06, + "loss": 0.7568, + "step": 28283 + }, + { + "epoch": 0.72, + "learning_rate": 1.7741326934572964e-06, + "loss": 0.8867, + "step": 28284 + }, + { + "epoch": 0.72, + "learning_rate": 1.774115177117272e-06, + "loss": 1.084, + "step": 28285 + }, + { + "epoch": 0.72, + "learning_rate": 1.7740976601845427e-06, + "loss": 0.6455, + "step": 28286 + }, + { + "epoch": 0.73, + "learning_rate": 1.7740801426591228e-06, + "loss": 0.9033, + "step": 28287 + }, + { + "epoch": 0.73, + "learning_rate": 1.774062624541025e-06, + "loss": 0.6909, + "step": 28288 + }, + { + "epoch": 0.73, + "learning_rate": 1.7740451058302633e-06, + "loss": 0.874, + "step": 28289 + }, + { + "epoch": 0.73, + "learning_rate": 1.7740275865268509e-06, + "loss": 0.8682, + "step": 28290 + }, + { + "epoch": 0.73, + "learning_rate": 1.7740100666308009e-06, + "loss": 0.7368, + "step": 28291 + }, + { + "epoch": 0.73, + "learning_rate": 1.7739925461421272e-06, + "loss": 0.9834, + "step": 28292 + }, + { + "epoch": 0.73, + "learning_rate": 1.7739750250608428e-06, + "loss": 1.0488, + "step": 28293 + }, + { + "epoch": 0.73, + "learning_rate": 1.7739575033869617e-06, + "loss": 0.8477, + "step": 28294 + }, + { + "epoch": 0.73, + "learning_rate": 1.7739399811204965e-06, + "loss": 0.917, + "step": 28295 + }, + { + "epoch": 0.73, + "learning_rate": 1.773922458261461e-06, + "loss": 0.8955, + "step": 28296 + }, + { + "epoch": 0.73, + "learning_rate": 1.773904934809869e-06, + "loss": 0.8086, + "step": 28297 + }, + { + "epoch": 0.73, + "learning_rate": 1.7738874107657336e-06, + "loss": 0.7295, + "step": 28298 + }, + { + "epoch": 0.73, + "learning_rate": 1.7738698861290678e-06, + "loss": 1.0371, + "step": 28299 + }, + { + "epoch": 0.73, + "learning_rate": 1.7738523608998857e-06, + "loss": 0.7632, + "step": 28300 + }, + { + "epoch": 0.73, + "learning_rate": 1.7738348350782003e-06, + "loss": 0.5583, + "step": 28301 + }, + { + "epoch": 0.73, + "learning_rate": 1.7738173086640253e-06, + "loss": 0.5886, + "step": 28302 + }, + { + "epoch": 0.73, + "learning_rate": 1.773799781657374e-06, + "loss": 1.0371, + "step": 28303 + }, + { + "epoch": 0.73, + "learning_rate": 1.7737822540582596e-06, + "loss": 0.7471, + "step": 28304 + }, + { + "epoch": 0.73, + "learning_rate": 1.7737647258666959e-06, + "loss": 0.8945, + "step": 28305 + }, + { + "epoch": 0.73, + "learning_rate": 1.773747197082696e-06, + "loss": 0.8262, + "step": 28306 + }, + { + "epoch": 0.73, + "learning_rate": 1.7737296677062734e-06, + "loss": 0.8975, + "step": 28307 + }, + { + "epoch": 0.73, + "learning_rate": 1.7737121377374416e-06, + "loss": 0.5657, + "step": 28308 + }, + { + "epoch": 0.73, + "learning_rate": 1.773694607176214e-06, + "loss": 0.7314, + "step": 28309 + }, + { + "epoch": 0.73, + "learning_rate": 1.7736770760226043e-06, + "loss": 0.6685, + "step": 28310 + }, + { + "epoch": 0.73, + "learning_rate": 1.7736595442766253e-06, + "loss": 0.6243, + "step": 28311 + }, + { + "epoch": 0.73, + "learning_rate": 1.7736420119382909e-06, + "loss": 0.7432, + "step": 28312 + }, + { + "epoch": 0.73, + "learning_rate": 1.7736244790076142e-06, + "loss": 0.958, + "step": 28313 + }, + { + "epoch": 0.73, + "learning_rate": 1.7736069454846087e-06, + "loss": 0.9297, + "step": 28314 + }, + { + "epoch": 0.73, + "learning_rate": 1.7735894113692882e-06, + "loss": 0.9932, + "step": 28315 + }, + { + "epoch": 0.73, + "learning_rate": 1.7735718766616658e-06, + "loss": 0.7324, + "step": 28316 + }, + { + "epoch": 0.73, + "learning_rate": 1.773554341361755e-06, + "loss": 0.7759, + "step": 28317 + }, + { + "epoch": 0.73, + "learning_rate": 1.7735368054695695e-06, + "loss": 0.7056, + "step": 28318 + }, + { + "epoch": 0.73, + "learning_rate": 1.773519268985122e-06, + "loss": 1.0518, + "step": 28319 + }, + { + "epoch": 0.73, + "learning_rate": 1.7735017319084266e-06, + "loss": 0.8018, + "step": 28320 + }, + { + "epoch": 0.73, + "learning_rate": 1.7734841942394963e-06, + "loss": 0.9678, + "step": 28321 + }, + { + "epoch": 0.73, + "learning_rate": 1.773466655978345e-06, + "loss": 0.7524, + "step": 28322 + }, + { + "epoch": 0.73, + "learning_rate": 1.7734491171249854e-06, + "loss": 0.8916, + "step": 28323 + }, + { + "epoch": 0.73, + "learning_rate": 1.7734315776794317e-06, + "loss": 1.0098, + "step": 28324 + }, + { + "epoch": 0.73, + "learning_rate": 1.7734140376416972e-06, + "loss": 0.7749, + "step": 28325 + }, + { + "epoch": 0.73, + "learning_rate": 1.7733964970117947e-06, + "loss": 0.8696, + "step": 28326 + }, + { + "epoch": 0.73, + "learning_rate": 1.7733789557897384e-06, + "loss": 0.9238, + "step": 28327 + }, + { + "epoch": 0.73, + "learning_rate": 1.7733614139755413e-06, + "loss": 0.9741, + "step": 28328 + }, + { + "epoch": 0.73, + "learning_rate": 1.7733438715692168e-06, + "loss": 1.0068, + "step": 28329 + }, + { + "epoch": 0.73, + "learning_rate": 1.7733263285707785e-06, + "loss": 0.9609, + "step": 28330 + }, + { + "epoch": 0.73, + "learning_rate": 1.77330878498024e-06, + "loss": 0.6895, + "step": 28331 + }, + { + "epoch": 0.73, + "learning_rate": 1.773291240797614e-06, + "loss": 0.604, + "step": 28332 + }, + { + "epoch": 0.73, + "learning_rate": 1.773273696022915e-06, + "loss": 0.7949, + "step": 28333 + }, + { + "epoch": 0.73, + "learning_rate": 1.7732561506561555e-06, + "loss": 0.8672, + "step": 28334 + }, + { + "epoch": 0.73, + "learning_rate": 1.7732386046973496e-06, + "loss": 0.6846, + "step": 28335 + }, + { + "epoch": 0.73, + "learning_rate": 1.7732210581465104e-06, + "loss": 0.9883, + "step": 28336 + }, + { + "epoch": 0.73, + "learning_rate": 1.7732035110036513e-06, + "loss": 0.8428, + "step": 28337 + }, + { + "epoch": 0.73, + "learning_rate": 1.7731859632687858e-06, + "loss": 0.7925, + "step": 28338 + }, + { + "epoch": 0.73, + "learning_rate": 1.7731684149419275e-06, + "loss": 0.8057, + "step": 28339 + }, + { + "epoch": 0.73, + "learning_rate": 1.7731508660230896e-06, + "loss": 1.0723, + "step": 28340 + }, + { + "epoch": 0.73, + "learning_rate": 1.7731333165122857e-06, + "loss": 1.0376, + "step": 28341 + }, + { + "epoch": 0.73, + "learning_rate": 1.773115766409529e-06, + "loss": 1.1201, + "step": 28342 + }, + { + "epoch": 0.73, + "learning_rate": 1.7730982157148333e-06, + "loss": 0.7041, + "step": 28343 + }, + { + "epoch": 0.73, + "learning_rate": 1.7730806644282118e-06, + "loss": 0.8037, + "step": 28344 + }, + { + "epoch": 0.73, + "learning_rate": 1.773063112549678e-06, + "loss": 0.8291, + "step": 28345 + }, + { + "epoch": 0.73, + "learning_rate": 1.7730455600792453e-06, + "loss": 0.9854, + "step": 28346 + }, + { + "epoch": 0.73, + "learning_rate": 1.773028007016927e-06, + "loss": 0.9102, + "step": 28347 + }, + { + "epoch": 0.73, + "learning_rate": 1.773010453362737e-06, + "loss": 0.8535, + "step": 28348 + }, + { + "epoch": 0.73, + "learning_rate": 1.772992899116688e-06, + "loss": 0.8926, + "step": 28349 + }, + { + "epoch": 0.73, + "learning_rate": 1.7729753442787945e-06, + "loss": 0.7061, + "step": 28350 + }, + { + "epoch": 0.73, + "learning_rate": 1.7729577888490688e-06, + "loss": 0.8301, + "step": 28351 + }, + { + "epoch": 0.73, + "learning_rate": 1.7729402328275252e-06, + "loss": 0.6719, + "step": 28352 + }, + { + "epoch": 0.73, + "learning_rate": 1.7729226762141764e-06, + "loss": 0.7588, + "step": 28353 + }, + { + "epoch": 0.73, + "learning_rate": 1.7729051190090364e-06, + "loss": 0.8232, + "step": 28354 + }, + { + "epoch": 0.73, + "learning_rate": 1.7728875612121187e-06, + "loss": 0.8071, + "step": 28355 + }, + { + "epoch": 0.73, + "learning_rate": 1.7728700028234365e-06, + "loss": 1.0391, + "step": 28356 + }, + { + "epoch": 0.73, + "learning_rate": 1.7728524438430032e-06, + "loss": 1.0098, + "step": 28357 + }, + { + "epoch": 0.73, + "learning_rate": 1.7728348842708325e-06, + "loss": 0.8418, + "step": 28358 + }, + { + "epoch": 0.73, + "learning_rate": 1.7728173241069372e-06, + "loss": 0.9316, + "step": 28359 + }, + { + "epoch": 0.73, + "learning_rate": 1.7727997633513314e-06, + "loss": 0.7993, + "step": 28360 + }, + { + "epoch": 0.73, + "learning_rate": 1.7727822020040287e-06, + "loss": 0.9043, + "step": 28361 + }, + { + "epoch": 0.73, + "learning_rate": 1.7727646400650418e-06, + "loss": 0.7803, + "step": 28362 + }, + { + "epoch": 0.73, + "learning_rate": 1.7727470775343846e-06, + "loss": 0.7925, + "step": 28363 + }, + { + "epoch": 0.73, + "learning_rate": 1.7727295144120706e-06, + "loss": 0.6357, + "step": 28364 + }, + { + "epoch": 0.73, + "learning_rate": 1.7727119506981133e-06, + "loss": 0.9629, + "step": 28365 + }, + { + "epoch": 0.73, + "learning_rate": 1.7726943863925258e-06, + "loss": 0.834, + "step": 28366 + }, + { + "epoch": 0.73, + "learning_rate": 1.7726768214953217e-06, + "loss": 1.0693, + "step": 28367 + }, + { + "epoch": 0.73, + "learning_rate": 1.7726592560065145e-06, + "loss": 0.635, + "step": 28368 + }, + { + "epoch": 0.73, + "learning_rate": 1.7726416899261176e-06, + "loss": 0.9717, + "step": 28369 + }, + { + "epoch": 0.73, + "learning_rate": 1.7726241232541447e-06, + "loss": 0.8984, + "step": 28370 + }, + { + "epoch": 0.73, + "learning_rate": 1.772606555990609e-06, + "loss": 0.6272, + "step": 28371 + }, + { + "epoch": 0.73, + "learning_rate": 1.7725889881355238e-06, + "loss": 0.7471, + "step": 28372 + }, + { + "epoch": 0.73, + "learning_rate": 1.7725714196889029e-06, + "loss": 0.8242, + "step": 28373 + }, + { + "epoch": 0.73, + "learning_rate": 1.7725538506507594e-06, + "loss": 0.7251, + "step": 28374 + }, + { + "epoch": 0.73, + "learning_rate": 1.7725362810211072e-06, + "loss": 0.8721, + "step": 28375 + }, + { + "epoch": 0.73, + "learning_rate": 1.7725187107999592e-06, + "loss": 0.892, + "step": 28376 + }, + { + "epoch": 0.73, + "learning_rate": 1.7725011399873293e-06, + "loss": 0.8066, + "step": 28377 + }, + { + "epoch": 0.73, + "learning_rate": 1.772483568583231e-06, + "loss": 0.6992, + "step": 28378 + }, + { + "epoch": 0.73, + "learning_rate": 1.7724659965876773e-06, + "loss": 0.9365, + "step": 28379 + }, + { + "epoch": 0.73, + "learning_rate": 1.772448424000682e-06, + "loss": 0.9917, + "step": 28380 + }, + { + "epoch": 0.73, + "learning_rate": 1.7724308508222584e-06, + "loss": 0.7612, + "step": 28381 + }, + { + "epoch": 0.73, + "learning_rate": 1.7724132770524199e-06, + "loss": 0.9268, + "step": 28382 + }, + { + "epoch": 0.73, + "learning_rate": 1.77239570269118e-06, + "loss": 0.7739, + "step": 28383 + }, + { + "epoch": 0.73, + "learning_rate": 1.7723781277385523e-06, + "loss": 0.9844, + "step": 28384 + }, + { + "epoch": 0.73, + "learning_rate": 1.7723605521945504e-06, + "loss": 1.1016, + "step": 28385 + }, + { + "epoch": 0.73, + "learning_rate": 1.7723429760591875e-06, + "loss": 1.0674, + "step": 28386 + }, + { + "epoch": 0.73, + "learning_rate": 1.7723253993324772e-06, + "loss": 0.8096, + "step": 28387 + }, + { + "epoch": 0.73, + "learning_rate": 1.7723078220144325e-06, + "loss": 0.8301, + "step": 28388 + }, + { + "epoch": 0.73, + "learning_rate": 1.7722902441050674e-06, + "loss": 0.6316, + "step": 28389 + }, + { + "epoch": 0.73, + "learning_rate": 1.772272665604395e-06, + "loss": 0.665, + "step": 28390 + }, + { + "epoch": 0.73, + "learning_rate": 1.772255086512429e-06, + "loss": 0.9673, + "step": 28391 + }, + { + "epoch": 0.73, + "learning_rate": 1.772237506829183e-06, + "loss": 0.9551, + "step": 28392 + }, + { + "epoch": 0.73, + "learning_rate": 1.7722199265546702e-06, + "loss": 1.0098, + "step": 28393 + }, + { + "epoch": 0.73, + "learning_rate": 1.772202345688904e-06, + "loss": 0.6725, + "step": 28394 + }, + { + "epoch": 0.73, + "learning_rate": 1.772184764231898e-06, + "loss": 0.8462, + "step": 28395 + }, + { + "epoch": 0.73, + "learning_rate": 1.7721671821836659e-06, + "loss": 0.8555, + "step": 28396 + }, + { + "epoch": 0.73, + "learning_rate": 1.7721495995442205e-06, + "loss": 0.6299, + "step": 28397 + }, + { + "epoch": 0.73, + "learning_rate": 1.7721320163135759e-06, + "loss": 0.6807, + "step": 28398 + }, + { + "epoch": 0.73, + "learning_rate": 1.7721144324917452e-06, + "loss": 0.874, + "step": 28399 + }, + { + "epoch": 0.73, + "learning_rate": 1.772096848078742e-06, + "loss": 0.7529, + "step": 28400 + }, + { + "epoch": 0.73, + "learning_rate": 1.7720792630745796e-06, + "loss": 0.7061, + "step": 28401 + }, + { + "epoch": 0.73, + "learning_rate": 1.7720616774792717e-06, + "loss": 0.9189, + "step": 28402 + }, + { + "epoch": 0.73, + "learning_rate": 1.7720440912928319e-06, + "loss": 0.752, + "step": 28403 + }, + { + "epoch": 0.73, + "learning_rate": 1.7720265045152734e-06, + "loss": 1.0293, + "step": 28404 + }, + { + "epoch": 0.73, + "learning_rate": 1.7720089171466093e-06, + "loss": 0.7578, + "step": 28405 + }, + { + "epoch": 0.73, + "learning_rate": 1.7719913291868537e-06, + "loss": 0.7749, + "step": 28406 + }, + { + "epoch": 0.73, + "learning_rate": 1.77197374063602e-06, + "loss": 0.957, + "step": 28407 + }, + { + "epoch": 0.73, + "learning_rate": 1.7719561514941215e-06, + "loss": 0.4404, + "step": 28408 + }, + { + "epoch": 0.73, + "learning_rate": 1.7719385617611713e-06, + "loss": 0.709, + "step": 28409 + }, + { + "epoch": 0.73, + "learning_rate": 1.7719209714371836e-06, + "loss": 0.7334, + "step": 28410 + }, + { + "epoch": 0.73, + "learning_rate": 1.7719033805221716e-06, + "loss": 0.6255, + "step": 28411 + }, + { + "epoch": 0.73, + "learning_rate": 1.7718857890161482e-06, + "loss": 0.7327, + "step": 28412 + }, + { + "epoch": 0.73, + "learning_rate": 1.7718681969191275e-06, + "loss": 0.9404, + "step": 28413 + }, + { + "epoch": 0.73, + "learning_rate": 1.771850604231123e-06, + "loss": 0.9766, + "step": 28414 + }, + { + "epoch": 0.73, + "learning_rate": 1.771833010952148e-06, + "loss": 0.7466, + "step": 28415 + }, + { + "epoch": 0.73, + "learning_rate": 1.771815417082216e-06, + "loss": 1.0039, + "step": 28416 + }, + { + "epoch": 0.73, + "learning_rate": 1.7717978226213402e-06, + "loss": 0.7783, + "step": 28417 + }, + { + "epoch": 0.73, + "learning_rate": 1.7717802275695344e-06, + "loss": 1.0586, + "step": 28418 + }, + { + "epoch": 0.73, + "learning_rate": 1.771762631926812e-06, + "loss": 0.7246, + "step": 28419 + }, + { + "epoch": 0.73, + "learning_rate": 1.7717450356931863e-06, + "loss": 0.7666, + "step": 28420 + }, + { + "epoch": 0.73, + "learning_rate": 1.771727438868671e-06, + "loss": 0.7578, + "step": 28421 + }, + { + "epoch": 0.73, + "learning_rate": 1.7717098414532794e-06, + "loss": 0.6885, + "step": 28422 + }, + { + "epoch": 0.73, + "learning_rate": 1.771692243447025e-06, + "loss": 1.0391, + "step": 28423 + }, + { + "epoch": 0.73, + "learning_rate": 1.7716746448499216e-06, + "loss": 0.9453, + "step": 28424 + }, + { + "epoch": 0.73, + "learning_rate": 1.7716570456619823e-06, + "loss": 0.8105, + "step": 28425 + }, + { + "epoch": 0.73, + "learning_rate": 1.7716394458832207e-06, + "loss": 0.7129, + "step": 28426 + }, + { + "epoch": 0.73, + "learning_rate": 1.7716218455136501e-06, + "loss": 0.7163, + "step": 28427 + }, + { + "epoch": 0.73, + "learning_rate": 1.771604244553284e-06, + "loss": 0.957, + "step": 28428 + }, + { + "epoch": 0.73, + "learning_rate": 1.7715866430021365e-06, + "loss": 0.7842, + "step": 28429 + }, + { + "epoch": 0.73, + "learning_rate": 1.7715690408602204e-06, + "loss": 0.5476, + "step": 28430 + }, + { + "epoch": 0.73, + "learning_rate": 1.7715514381275493e-06, + "loss": 0.8564, + "step": 28431 + }, + { + "epoch": 0.73, + "learning_rate": 1.7715338348041367e-06, + "loss": 0.9736, + "step": 28432 + }, + { + "epoch": 0.73, + "learning_rate": 1.7715162308899963e-06, + "loss": 0.6665, + "step": 28433 + }, + { + "epoch": 0.73, + "learning_rate": 1.7714986263851412e-06, + "loss": 1.0205, + "step": 28434 + }, + { + "epoch": 0.73, + "learning_rate": 1.7714810212895853e-06, + "loss": 0.9463, + "step": 28435 + }, + { + "epoch": 0.73, + "learning_rate": 1.7714634156033416e-06, + "loss": 1.0762, + "step": 28436 + }, + { + "epoch": 0.73, + "learning_rate": 1.771445809326424e-06, + "loss": 1.0801, + "step": 28437 + }, + { + "epoch": 0.73, + "learning_rate": 1.771428202458846e-06, + "loss": 0.874, + "step": 28438 + }, + { + "epoch": 0.73, + "learning_rate": 1.7714105950006203e-06, + "loss": 0.9502, + "step": 28439 + }, + { + "epoch": 0.73, + "learning_rate": 1.7713929869517612e-06, + "loss": 0.7793, + "step": 28440 + }, + { + "epoch": 0.73, + "learning_rate": 1.7713753783122821e-06, + "loss": 0.4625, + "step": 28441 + }, + { + "epoch": 0.73, + "learning_rate": 1.7713577690821966e-06, + "loss": 0.8457, + "step": 28442 + }, + { + "epoch": 0.73, + "learning_rate": 1.7713401592615176e-06, + "loss": 0.5254, + "step": 28443 + }, + { + "epoch": 0.73, + "learning_rate": 1.771322548850259e-06, + "loss": 0.8215, + "step": 28444 + }, + { + "epoch": 0.73, + "learning_rate": 1.7713049378484343e-06, + "loss": 0.9238, + "step": 28445 + }, + { + "epoch": 0.73, + "learning_rate": 1.7712873262560564e-06, + "loss": 0.7319, + "step": 28446 + }, + { + "epoch": 0.73, + "learning_rate": 1.7712697140731397e-06, + "loss": 0.6562, + "step": 28447 + }, + { + "epoch": 0.73, + "learning_rate": 1.771252101299697e-06, + "loss": 0.73, + "step": 28448 + }, + { + "epoch": 0.73, + "learning_rate": 1.7712344879357422e-06, + "loss": 1.0195, + "step": 28449 + }, + { + "epoch": 0.73, + "learning_rate": 1.7712168739812885e-06, + "loss": 0.4001, + "step": 28450 + }, + { + "epoch": 0.73, + "learning_rate": 1.7711992594363497e-06, + "loss": 0.9062, + "step": 28451 + }, + { + "epoch": 0.73, + "learning_rate": 1.771181644300939e-06, + "loss": 0.7422, + "step": 28452 + }, + { + "epoch": 0.73, + "learning_rate": 1.7711640285750698e-06, + "loss": 0.8389, + "step": 28453 + }, + { + "epoch": 0.73, + "learning_rate": 1.7711464122587557e-06, + "loss": 0.9111, + "step": 28454 + }, + { + "epoch": 0.73, + "learning_rate": 1.7711287953520106e-06, + "loss": 0.9092, + "step": 28455 + }, + { + "epoch": 0.73, + "learning_rate": 1.7711111778548475e-06, + "loss": 0.9053, + "step": 28456 + }, + { + "epoch": 0.73, + "learning_rate": 1.77109355976728e-06, + "loss": 0.645, + "step": 28457 + }, + { + "epoch": 0.73, + "learning_rate": 1.7710759410893217e-06, + "loss": 0.5415, + "step": 28458 + }, + { + "epoch": 0.73, + "learning_rate": 1.7710583218209858e-06, + "loss": 0.9717, + "step": 28459 + }, + { + "epoch": 0.73, + "learning_rate": 1.7710407019622862e-06, + "loss": 0.7129, + "step": 28460 + }, + { + "epoch": 0.73, + "learning_rate": 1.7710230815132362e-06, + "loss": 0.9863, + "step": 28461 + }, + { + "epoch": 0.73, + "learning_rate": 1.7710054604738493e-06, + "loss": 0.9189, + "step": 28462 + }, + { + "epoch": 0.73, + "learning_rate": 1.7709878388441388e-06, + "loss": 0.8799, + "step": 28463 + }, + { + "epoch": 0.73, + "learning_rate": 1.7709702166241185e-06, + "loss": 0.8838, + "step": 28464 + }, + { + "epoch": 0.73, + "learning_rate": 1.7709525938138015e-06, + "loss": 0.9297, + "step": 28465 + }, + { + "epoch": 0.73, + "learning_rate": 1.7709349704132018e-06, + "loss": 0.9175, + "step": 28466 + }, + { + "epoch": 0.73, + "learning_rate": 1.7709173464223326e-06, + "loss": 0.8789, + "step": 28467 + }, + { + "epoch": 0.73, + "learning_rate": 1.7708997218412075e-06, + "loss": 0.7129, + "step": 28468 + }, + { + "epoch": 0.73, + "learning_rate": 1.77088209666984e-06, + "loss": 0.6321, + "step": 28469 + }, + { + "epoch": 0.73, + "learning_rate": 1.7708644709082433e-06, + "loss": 0.9062, + "step": 28470 + }, + { + "epoch": 0.73, + "learning_rate": 1.7708468445564311e-06, + "loss": 0.7183, + "step": 28471 + }, + { + "epoch": 0.73, + "learning_rate": 1.770829217614417e-06, + "loss": 0.834, + "step": 28472 + }, + { + "epoch": 0.73, + "learning_rate": 1.7708115900822142e-06, + "loss": 1.0625, + "step": 28473 + }, + { + "epoch": 0.73, + "learning_rate": 1.7707939619598368e-06, + "loss": 0.9512, + "step": 28474 + }, + { + "epoch": 0.73, + "learning_rate": 1.770776333247298e-06, + "loss": 0.8174, + "step": 28475 + }, + { + "epoch": 0.73, + "learning_rate": 1.7707587039446106e-06, + "loss": 0.7578, + "step": 28476 + }, + { + "epoch": 0.73, + "learning_rate": 1.7707410740517893e-06, + "loss": 0.7881, + "step": 28477 + }, + { + "epoch": 0.73, + "learning_rate": 1.7707234435688464e-06, + "loss": 0.7932, + "step": 28478 + }, + { + "epoch": 0.73, + "learning_rate": 1.7707058124957963e-06, + "loss": 0.8525, + "step": 28479 + }, + { + "epoch": 0.73, + "learning_rate": 1.7706881808326524e-06, + "loss": 0.8369, + "step": 28480 + }, + { + "epoch": 0.73, + "learning_rate": 1.7706705485794279e-06, + "loss": 0.8154, + "step": 28481 + }, + { + "epoch": 0.73, + "learning_rate": 1.7706529157361362e-06, + "loss": 0.7461, + "step": 28482 + }, + { + "epoch": 0.73, + "learning_rate": 1.7706352823027913e-06, + "loss": 0.8223, + "step": 28483 + }, + { + "epoch": 0.73, + "learning_rate": 1.7706176482794062e-06, + "loss": 0.8735, + "step": 28484 + }, + { + "epoch": 0.73, + "learning_rate": 1.7706000136659945e-06, + "loss": 0.8359, + "step": 28485 + }, + { + "epoch": 0.73, + "learning_rate": 1.7705823784625698e-06, + "loss": 1.0166, + "step": 28486 + }, + { + "epoch": 0.73, + "learning_rate": 1.770564742669146e-06, + "loss": 0.9404, + "step": 28487 + }, + { + "epoch": 0.73, + "learning_rate": 1.7705471062857358e-06, + "loss": 0.8887, + "step": 28488 + }, + { + "epoch": 0.73, + "learning_rate": 1.7705294693123532e-06, + "loss": 0.7202, + "step": 28489 + }, + { + "epoch": 0.73, + "learning_rate": 1.7705118317490118e-06, + "loss": 0.7129, + "step": 28490 + }, + { + "epoch": 0.73, + "learning_rate": 1.7704941935957244e-06, + "loss": 1.0273, + "step": 28491 + }, + { + "epoch": 0.73, + "learning_rate": 1.7704765548525055e-06, + "loss": 0.9038, + "step": 28492 + }, + { + "epoch": 0.73, + "learning_rate": 1.7704589155193684e-06, + "loss": 0.8545, + "step": 28493 + }, + { + "epoch": 0.73, + "learning_rate": 1.7704412755963255e-06, + "loss": 0.9336, + "step": 28494 + }, + { + "epoch": 0.73, + "learning_rate": 1.770423635083392e-06, + "loss": 0.7988, + "step": 28495 + }, + { + "epoch": 0.73, + "learning_rate": 1.77040599398058e-06, + "loss": 0.9619, + "step": 28496 + }, + { + "epoch": 0.73, + "learning_rate": 1.7703883522879037e-06, + "loss": 0.9668, + "step": 28497 + }, + { + "epoch": 0.73, + "learning_rate": 1.7703707100053764e-06, + "loss": 0.8955, + "step": 28498 + }, + { + "epoch": 0.73, + "learning_rate": 1.770353067133012e-06, + "loss": 0.8965, + "step": 28499 + }, + { + "epoch": 0.73, + "learning_rate": 1.7703354236708235e-06, + "loss": 0.8369, + "step": 28500 + }, + { + "epoch": 0.73, + "learning_rate": 1.7703177796188243e-06, + "loss": 0.9482, + "step": 28501 + }, + { + "epoch": 0.73, + "learning_rate": 1.7703001349770284e-06, + "loss": 0.8564, + "step": 28502 + }, + { + "epoch": 0.73, + "learning_rate": 1.770282489745449e-06, + "loss": 0.7803, + "step": 28503 + }, + { + "epoch": 0.73, + "learning_rate": 1.7702648439240999e-06, + "loss": 0.7285, + "step": 28504 + }, + { + "epoch": 0.73, + "learning_rate": 1.7702471975129945e-06, + "loss": 0.7344, + "step": 28505 + }, + { + "epoch": 0.73, + "learning_rate": 1.770229550512146e-06, + "loss": 0.835, + "step": 28506 + }, + { + "epoch": 0.73, + "learning_rate": 1.7702119029215682e-06, + "loss": 0.8477, + "step": 28507 + }, + { + "epoch": 0.73, + "learning_rate": 1.7701942547412747e-06, + "loss": 0.8311, + "step": 28508 + }, + { + "epoch": 0.73, + "learning_rate": 1.7701766059712789e-06, + "loss": 0.873, + "step": 28509 + }, + { + "epoch": 0.73, + "learning_rate": 1.770158956611594e-06, + "loss": 0.9033, + "step": 28510 + }, + { + "epoch": 0.73, + "learning_rate": 1.770141306662234e-06, + "loss": 0.7773, + "step": 28511 + }, + { + "epoch": 0.73, + "learning_rate": 1.7701236561232122e-06, + "loss": 0.7021, + "step": 28512 + }, + { + "epoch": 0.73, + "learning_rate": 1.7701060049945422e-06, + "loss": 0.9072, + "step": 28513 + }, + { + "epoch": 0.73, + "learning_rate": 1.7700883532762371e-06, + "loss": 0.9033, + "step": 28514 + }, + { + "epoch": 0.73, + "learning_rate": 1.7700707009683111e-06, + "loss": 0.6938, + "step": 28515 + }, + { + "epoch": 0.73, + "learning_rate": 1.7700530480707774e-06, + "loss": 0.7808, + "step": 28516 + }, + { + "epoch": 0.73, + "learning_rate": 1.7700353945836492e-06, + "loss": 0.7598, + "step": 28517 + }, + { + "epoch": 0.73, + "learning_rate": 1.7700177405069405e-06, + "loss": 0.7422, + "step": 28518 + }, + { + "epoch": 0.73, + "learning_rate": 1.7700000858406647e-06, + "loss": 0.9141, + "step": 28519 + }, + { + "epoch": 0.73, + "learning_rate": 1.769982430584835e-06, + "loss": 0.7578, + "step": 28520 + }, + { + "epoch": 0.73, + "learning_rate": 1.7699647747394652e-06, + "loss": 0.7998, + "step": 28521 + }, + { + "epoch": 0.73, + "learning_rate": 1.769947118304569e-06, + "loss": 0.8784, + "step": 28522 + }, + { + "epoch": 0.73, + "learning_rate": 1.7699294612801596e-06, + "loss": 1.001, + "step": 28523 + }, + { + "epoch": 0.73, + "learning_rate": 1.7699118036662506e-06, + "loss": 0.9141, + "step": 28524 + }, + { + "epoch": 0.73, + "learning_rate": 1.7698941454628555e-06, + "loss": 0.73, + "step": 28525 + }, + { + "epoch": 0.73, + "learning_rate": 1.7698764866699878e-06, + "loss": 0.9043, + "step": 28526 + }, + { + "epoch": 0.73, + "learning_rate": 1.769858827287661e-06, + "loss": 0.9971, + "step": 28527 + }, + { + "epoch": 0.73, + "learning_rate": 1.769841167315889e-06, + "loss": 0.564, + "step": 28528 + }, + { + "epoch": 0.73, + "learning_rate": 1.7698235067546849e-06, + "loss": 0.8262, + "step": 28529 + }, + { + "epoch": 0.73, + "learning_rate": 1.7698058456040623e-06, + "loss": 1.0127, + "step": 28530 + }, + { + "epoch": 0.73, + "learning_rate": 1.7697881838640348e-06, + "loss": 0.8965, + "step": 28531 + }, + { + "epoch": 0.73, + "learning_rate": 1.7697705215346157e-06, + "loss": 0.6958, + "step": 28532 + }, + { + "epoch": 0.73, + "learning_rate": 1.7697528586158189e-06, + "loss": 0.8047, + "step": 28533 + }, + { + "epoch": 0.73, + "learning_rate": 1.7697351951076577e-06, + "loss": 0.6235, + "step": 28534 + }, + { + "epoch": 0.73, + "learning_rate": 1.7697175310101455e-06, + "loss": 0.9424, + "step": 28535 + }, + { + "epoch": 0.73, + "learning_rate": 1.7696998663232963e-06, + "loss": 1.0527, + "step": 28536 + }, + { + "epoch": 0.73, + "learning_rate": 1.7696822010471229e-06, + "loss": 0.9238, + "step": 28537 + }, + { + "epoch": 0.73, + "learning_rate": 1.7696645351816394e-06, + "loss": 0.7646, + "step": 28538 + }, + { + "epoch": 0.73, + "learning_rate": 1.7696468687268592e-06, + "loss": 0.7085, + "step": 28539 + }, + { + "epoch": 0.73, + "learning_rate": 1.769629201682796e-06, + "loss": 0.605, + "step": 28540 + }, + { + "epoch": 0.73, + "learning_rate": 1.7696115340494626e-06, + "loss": 0.8545, + "step": 28541 + }, + { + "epoch": 0.73, + "learning_rate": 1.7695938658268736e-06, + "loss": 0.8906, + "step": 28542 + }, + { + "epoch": 0.73, + "learning_rate": 1.7695761970150415e-06, + "loss": 0.606, + "step": 28543 + }, + { + "epoch": 0.73, + "learning_rate": 1.7695585276139807e-06, + "loss": 0.6021, + "step": 28544 + }, + { + "epoch": 0.73, + "learning_rate": 1.769540857623704e-06, + "loss": 0.8047, + "step": 28545 + }, + { + "epoch": 0.73, + "learning_rate": 1.7695231870442254e-06, + "loss": 0.8057, + "step": 28546 + }, + { + "epoch": 0.73, + "learning_rate": 1.7695055158755582e-06, + "loss": 0.7651, + "step": 28547 + }, + { + "epoch": 0.73, + "learning_rate": 1.7694878441177159e-06, + "loss": 0.9932, + "step": 28548 + }, + { + "epoch": 0.73, + "learning_rate": 1.7694701717707124e-06, + "loss": 0.77, + "step": 28549 + }, + { + "epoch": 0.73, + "learning_rate": 1.769452498834561e-06, + "loss": 0.7285, + "step": 28550 + }, + { + "epoch": 0.73, + "learning_rate": 1.7694348253092748e-06, + "loss": 0.9639, + "step": 28551 + }, + { + "epoch": 0.73, + "learning_rate": 1.769417151194868e-06, + "loss": 0.7324, + "step": 28552 + }, + { + "epoch": 0.73, + "learning_rate": 1.7693994764913538e-06, + "loss": 0.7114, + "step": 28553 + }, + { + "epoch": 0.73, + "learning_rate": 1.769381801198746e-06, + "loss": 0.9561, + "step": 28554 + }, + { + "epoch": 0.73, + "learning_rate": 1.7693641253170577e-06, + "loss": 0.9189, + "step": 28555 + }, + { + "epoch": 0.73, + "learning_rate": 1.7693464488463029e-06, + "loss": 0.8945, + "step": 28556 + }, + { + "epoch": 0.73, + "learning_rate": 1.7693287717864947e-06, + "loss": 1.085, + "step": 28557 + }, + { + "epoch": 0.73, + "learning_rate": 1.7693110941376468e-06, + "loss": 0.8975, + "step": 28558 + }, + { + "epoch": 0.73, + "learning_rate": 1.7692934158997727e-06, + "loss": 1.04, + "step": 28559 + }, + { + "epoch": 0.73, + "learning_rate": 1.769275737072886e-06, + "loss": 0.8867, + "step": 28560 + }, + { + "epoch": 0.73, + "learning_rate": 1.7692580576570006e-06, + "loss": 0.791, + "step": 28561 + }, + { + "epoch": 0.73, + "learning_rate": 1.7692403776521294e-06, + "loss": 0.769, + "step": 28562 + }, + { + "epoch": 0.73, + "learning_rate": 1.7692226970582862e-06, + "loss": 0.8076, + "step": 28563 + }, + { + "epoch": 0.73, + "learning_rate": 1.7692050158754848e-06, + "loss": 0.9824, + "step": 28564 + }, + { + "epoch": 0.73, + "learning_rate": 1.7691873341037384e-06, + "loss": 0.8389, + "step": 28565 + }, + { + "epoch": 0.73, + "learning_rate": 1.7691696517430606e-06, + "loss": 0.9473, + "step": 28566 + }, + { + "epoch": 0.73, + "learning_rate": 1.7691519687934649e-06, + "loss": 0.6777, + "step": 28567 + }, + { + "epoch": 0.73, + "learning_rate": 1.7691342852549646e-06, + "loss": 0.9717, + "step": 28568 + }, + { + "epoch": 0.73, + "learning_rate": 1.7691166011275743e-06, + "loss": 0.874, + "step": 28569 + }, + { + "epoch": 0.73, + "learning_rate": 1.7690989164113059e-06, + "loss": 0.7949, + "step": 28570 + }, + { + "epoch": 0.73, + "learning_rate": 1.7690812311061744e-06, + "loss": 0.9756, + "step": 28571 + }, + { + "epoch": 0.73, + "learning_rate": 1.7690635452121927e-06, + "loss": 0.8584, + "step": 28572 + }, + { + "epoch": 0.73, + "learning_rate": 1.7690458587293744e-06, + "loss": 0.615, + "step": 28573 + }, + { + "epoch": 0.73, + "learning_rate": 1.7690281716577329e-06, + "loss": 0.7026, + "step": 28574 + }, + { + "epoch": 0.73, + "learning_rate": 1.769010483997282e-06, + "loss": 0.667, + "step": 28575 + }, + { + "epoch": 0.73, + "learning_rate": 1.7689927957480353e-06, + "loss": 1.0088, + "step": 28576 + }, + { + "epoch": 0.73, + "learning_rate": 1.7689751069100059e-06, + "loss": 0.9092, + "step": 28577 + }, + { + "epoch": 0.73, + "learning_rate": 1.7689574174832077e-06, + "loss": 0.9541, + "step": 28578 + }, + { + "epoch": 0.73, + "learning_rate": 1.768939727467654e-06, + "loss": 0.8862, + "step": 28579 + }, + { + "epoch": 0.73, + "learning_rate": 1.7689220368633589e-06, + "loss": 0.8613, + "step": 28580 + }, + { + "epoch": 0.73, + "learning_rate": 1.768904345670335e-06, + "loss": 0.6733, + "step": 28581 + }, + { + "epoch": 0.73, + "learning_rate": 1.7688866538885967e-06, + "loss": 0.9375, + "step": 28582 + }, + { + "epoch": 0.73, + "learning_rate": 1.7688689615181572e-06, + "loss": 0.686, + "step": 28583 + }, + { + "epoch": 0.73, + "learning_rate": 1.7688512685590303e-06, + "loss": 0.7427, + "step": 28584 + }, + { + "epoch": 0.73, + "learning_rate": 1.7688335750112292e-06, + "loss": 0.8225, + "step": 28585 + }, + { + "epoch": 0.73, + "learning_rate": 1.7688158808747677e-06, + "loss": 0.7017, + "step": 28586 + }, + { + "epoch": 0.73, + "learning_rate": 1.768798186149659e-06, + "loss": 0.9521, + "step": 28587 + }, + { + "epoch": 0.73, + "learning_rate": 1.768780490835917e-06, + "loss": 1.0703, + "step": 28588 + }, + { + "epoch": 0.73, + "learning_rate": 1.768762794933555e-06, + "loss": 0.9414, + "step": 28589 + }, + { + "epoch": 0.73, + "learning_rate": 1.7687450984425868e-06, + "loss": 1.0908, + "step": 28590 + }, + { + "epoch": 0.73, + "learning_rate": 1.768727401363026e-06, + "loss": 0.7344, + "step": 28591 + }, + { + "epoch": 0.73, + "learning_rate": 1.7687097036948858e-06, + "loss": 0.8076, + "step": 28592 + }, + { + "epoch": 0.73, + "learning_rate": 1.7686920054381797e-06, + "loss": 1.0596, + "step": 28593 + }, + { + "epoch": 0.73, + "learning_rate": 1.7686743065929219e-06, + "loss": 0.8086, + "step": 28594 + }, + { + "epoch": 0.73, + "learning_rate": 1.768656607159125e-06, + "loss": 1.0742, + "step": 28595 + }, + { + "epoch": 0.73, + "learning_rate": 1.7686389071368035e-06, + "loss": 0.79, + "step": 28596 + }, + { + "epoch": 0.73, + "learning_rate": 1.7686212065259706e-06, + "loss": 0.9082, + "step": 28597 + }, + { + "epoch": 0.73, + "learning_rate": 1.7686035053266396e-06, + "loss": 0.8447, + "step": 28598 + }, + { + "epoch": 0.73, + "learning_rate": 1.768585803538824e-06, + "loss": 1.1465, + "step": 28599 + }, + { + "epoch": 0.73, + "learning_rate": 1.768568101162538e-06, + "loss": 0.9082, + "step": 28600 + }, + { + "epoch": 0.73, + "learning_rate": 1.7685503981977946e-06, + "loss": 0.73, + "step": 28601 + }, + { + "epoch": 0.73, + "learning_rate": 1.7685326946446074e-06, + "loss": 0.9111, + "step": 28602 + }, + { + "epoch": 0.73, + "learning_rate": 1.7685149905029904e-06, + "loss": 0.8984, + "step": 28603 + }, + { + "epoch": 0.73, + "learning_rate": 1.7684972857729564e-06, + "loss": 0.8682, + "step": 28604 + }, + { + "epoch": 0.73, + "learning_rate": 1.7684795804545197e-06, + "loss": 0.9756, + "step": 28605 + }, + { + "epoch": 0.73, + "learning_rate": 1.768461874547693e-06, + "loss": 0.4963, + "step": 28606 + }, + { + "epoch": 0.73, + "learning_rate": 1.7684441680524908e-06, + "loss": 0.9277, + "step": 28607 + }, + { + "epoch": 0.73, + "learning_rate": 1.7684264609689264e-06, + "loss": 0.9453, + "step": 28608 + }, + { + "epoch": 0.73, + "learning_rate": 1.7684087532970127e-06, + "loss": 0.7529, + "step": 28609 + }, + { + "epoch": 0.73, + "learning_rate": 1.768391045036764e-06, + "loss": 0.8066, + "step": 28610 + }, + { + "epoch": 0.73, + "learning_rate": 1.7683733361881937e-06, + "loss": 1.0029, + "step": 28611 + }, + { + "epoch": 0.73, + "learning_rate": 1.7683556267513153e-06, + "loss": 0.7441, + "step": 28612 + }, + { + "epoch": 0.73, + "learning_rate": 1.768337916726142e-06, + "loss": 0.9365, + "step": 28613 + }, + { + "epoch": 0.73, + "learning_rate": 1.7683202061126879e-06, + "loss": 0.8818, + "step": 28614 + }, + { + "epoch": 0.73, + "learning_rate": 1.7683024949109664e-06, + "loss": 1.0605, + "step": 28615 + }, + { + "epoch": 0.73, + "learning_rate": 1.768284783120991e-06, + "loss": 0.845, + "step": 28616 + }, + { + "epoch": 0.73, + "learning_rate": 1.7682670707427751e-06, + "loss": 0.8467, + "step": 28617 + }, + { + "epoch": 0.73, + "learning_rate": 1.7682493577763324e-06, + "loss": 0.8955, + "step": 28618 + }, + { + "epoch": 0.73, + "learning_rate": 1.7682316442216769e-06, + "loss": 1.002, + "step": 28619 + }, + { + "epoch": 0.73, + "learning_rate": 1.7682139300788213e-06, + "loss": 1.0234, + "step": 28620 + }, + { + "epoch": 0.73, + "learning_rate": 1.7681962153477799e-06, + "loss": 0.8584, + "step": 28621 + }, + { + "epoch": 0.73, + "learning_rate": 1.7681785000285658e-06, + "loss": 0.8079, + "step": 28622 + }, + { + "epoch": 0.73, + "learning_rate": 1.7681607841211927e-06, + "loss": 0.9014, + "step": 28623 + }, + { + "epoch": 0.73, + "learning_rate": 1.7681430676256746e-06, + "loss": 0.5098, + "step": 28624 + }, + { + "epoch": 0.73, + "learning_rate": 1.7681253505420241e-06, + "loss": 0.8633, + "step": 28625 + }, + { + "epoch": 0.73, + "learning_rate": 1.7681076328702558e-06, + "loss": 0.9756, + "step": 28626 + }, + { + "epoch": 0.73, + "learning_rate": 1.7680899146103826e-06, + "loss": 0.7739, + "step": 28627 + }, + { + "epoch": 0.73, + "learning_rate": 1.7680721957624183e-06, + "loss": 0.8066, + "step": 28628 + }, + { + "epoch": 0.73, + "learning_rate": 1.7680544763263765e-06, + "loss": 0.9375, + "step": 28629 + }, + { + "epoch": 0.73, + "learning_rate": 1.7680367563022707e-06, + "loss": 1.0244, + "step": 28630 + }, + { + "epoch": 0.73, + "learning_rate": 1.7680190356901143e-06, + "loss": 1.0713, + "step": 28631 + }, + { + "epoch": 0.73, + "learning_rate": 1.768001314489921e-06, + "loss": 0.8975, + "step": 28632 + }, + { + "epoch": 0.73, + "learning_rate": 1.7679835927017046e-06, + "loss": 0.8936, + "step": 28633 + }, + { + "epoch": 0.73, + "learning_rate": 1.7679658703254785e-06, + "loss": 0.8662, + "step": 28634 + }, + { + "epoch": 0.73, + "learning_rate": 1.7679481473612563e-06, + "loss": 0.8101, + "step": 28635 + }, + { + "epoch": 0.73, + "learning_rate": 1.7679304238090515e-06, + "loss": 0.7378, + "step": 28636 + }, + { + "epoch": 0.73, + "learning_rate": 1.7679126996688776e-06, + "loss": 0.6943, + "step": 28637 + }, + { + "epoch": 0.73, + "learning_rate": 1.767894974940748e-06, + "loss": 0.7212, + "step": 28638 + }, + { + "epoch": 0.73, + "learning_rate": 1.767877249624677e-06, + "loss": 0.9053, + "step": 28639 + }, + { + "epoch": 0.73, + "learning_rate": 1.7678595237206775e-06, + "loss": 0.9756, + "step": 28640 + }, + { + "epoch": 0.73, + "learning_rate": 1.7678417972287632e-06, + "loss": 0.9424, + "step": 28641 + }, + { + "epoch": 0.73, + "learning_rate": 1.7678240701489477e-06, + "loss": 0.6455, + "step": 28642 + }, + { + "epoch": 0.73, + "learning_rate": 1.767806342481245e-06, + "loss": 0.8965, + "step": 28643 + }, + { + "epoch": 0.73, + "learning_rate": 1.767788614225668e-06, + "loss": 1.0713, + "step": 28644 + }, + { + "epoch": 0.73, + "learning_rate": 1.7677708853822302e-06, + "loss": 0.7583, + "step": 28645 + }, + { + "epoch": 0.73, + "learning_rate": 1.767753155950946e-06, + "loss": 0.9434, + "step": 28646 + }, + { + "epoch": 0.73, + "learning_rate": 1.7677354259318285e-06, + "loss": 0.9326, + "step": 28647 + }, + { + "epoch": 0.73, + "learning_rate": 1.767717695324891e-06, + "loss": 0.9922, + "step": 28648 + }, + { + "epoch": 0.73, + "learning_rate": 1.7676999641301476e-06, + "loss": 0.7239, + "step": 28649 + }, + { + "epoch": 0.73, + "learning_rate": 1.7676822323476115e-06, + "loss": 0.7559, + "step": 28650 + }, + { + "epoch": 0.73, + "learning_rate": 1.7676644999772968e-06, + "loss": 0.6885, + "step": 28651 + }, + { + "epoch": 0.73, + "learning_rate": 1.7676467670192162e-06, + "loss": 0.4807, + "step": 28652 + }, + { + "epoch": 0.73, + "learning_rate": 1.7676290334733838e-06, + "loss": 0.8125, + "step": 28653 + }, + { + "epoch": 0.73, + "learning_rate": 1.7676112993398134e-06, + "loss": 0.8926, + "step": 28654 + }, + { + "epoch": 0.73, + "learning_rate": 1.7675935646185183e-06, + "loss": 0.8193, + "step": 28655 + }, + { + "epoch": 0.73, + "learning_rate": 1.7675758293095119e-06, + "loss": 0.8633, + "step": 28656 + }, + { + "epoch": 0.73, + "learning_rate": 1.7675580934128082e-06, + "loss": 0.6816, + "step": 28657 + }, + { + "epoch": 0.73, + "learning_rate": 1.7675403569284204e-06, + "loss": 0.8457, + "step": 28658 + }, + { + "epoch": 0.73, + "learning_rate": 1.7675226198563622e-06, + "loss": 0.9609, + "step": 28659 + }, + { + "epoch": 0.73, + "learning_rate": 1.7675048821966473e-06, + "loss": 0.6328, + "step": 28660 + }, + { + "epoch": 0.73, + "learning_rate": 1.7674871439492894e-06, + "loss": 0.9434, + "step": 28661 + }, + { + "epoch": 0.73, + "learning_rate": 1.7674694051143017e-06, + "loss": 1.0508, + "step": 28662 + }, + { + "epoch": 0.73, + "learning_rate": 1.767451665691698e-06, + "loss": 0.7324, + "step": 28663 + }, + { + "epoch": 0.73, + "learning_rate": 1.767433925681492e-06, + "loss": 0.6621, + "step": 28664 + }, + { + "epoch": 0.73, + "learning_rate": 1.7674161850836966e-06, + "loss": 0.792, + "step": 28665 + }, + { + "epoch": 0.73, + "learning_rate": 1.7673984438983265e-06, + "loss": 0.8594, + "step": 28666 + }, + { + "epoch": 0.73, + "learning_rate": 1.7673807021253944e-06, + "loss": 0.8086, + "step": 28667 + }, + { + "epoch": 0.73, + "learning_rate": 1.7673629597649142e-06, + "loss": 0.8975, + "step": 28668 + }, + { + "epoch": 0.73, + "learning_rate": 1.7673452168168997e-06, + "loss": 0.7334, + "step": 28669 + }, + { + "epoch": 0.73, + "learning_rate": 1.7673274732813638e-06, + "loss": 0.9902, + "step": 28670 + }, + { + "epoch": 0.73, + "learning_rate": 1.7673097291583209e-06, + "loss": 0.9893, + "step": 28671 + }, + { + "epoch": 0.73, + "learning_rate": 1.7672919844477843e-06, + "loss": 0.9512, + "step": 28672 + }, + { + "epoch": 0.73, + "learning_rate": 1.7672742391497673e-06, + "loss": 0.9297, + "step": 28673 + }, + { + "epoch": 0.73, + "learning_rate": 1.7672564932642836e-06, + "loss": 0.7871, + "step": 28674 + }, + { + "epoch": 0.73, + "learning_rate": 1.767238746791347e-06, + "loss": 1.1465, + "step": 28675 + }, + { + "epoch": 0.73, + "learning_rate": 1.767220999730971e-06, + "loss": 1.0508, + "step": 28676 + }, + { + "epoch": 0.74, + "learning_rate": 1.7672032520831693e-06, + "loss": 0.7471, + "step": 28677 + }, + { + "epoch": 0.74, + "learning_rate": 1.7671855038479548e-06, + "loss": 0.7051, + "step": 28678 + }, + { + "epoch": 0.74, + "learning_rate": 1.7671677550253424e-06, + "loss": 0.8848, + "step": 28679 + }, + { + "epoch": 0.74, + "learning_rate": 1.7671500056153445e-06, + "loss": 0.793, + "step": 28680 + }, + { + "epoch": 0.74, + "learning_rate": 1.7671322556179751e-06, + "loss": 0.9229, + "step": 28681 + }, + { + "epoch": 0.74, + "learning_rate": 1.767114505033248e-06, + "loss": 0.77, + "step": 28682 + }, + { + "epoch": 0.74, + "learning_rate": 1.7670967538611762e-06, + "loss": 0.6047, + "step": 28683 + }, + { + "epoch": 0.74, + "learning_rate": 1.767079002101774e-06, + "loss": 0.9746, + "step": 28684 + }, + { + "epoch": 0.74, + "learning_rate": 1.7670612497550548e-06, + "loss": 0.8271, + "step": 28685 + }, + { + "epoch": 0.74, + "learning_rate": 1.767043496821032e-06, + "loss": 0.7988, + "step": 28686 + }, + { + "epoch": 0.74, + "learning_rate": 1.7670257432997189e-06, + "loss": 1.0869, + "step": 28687 + }, + { + "epoch": 0.74, + "learning_rate": 1.7670079891911299e-06, + "loss": 0.6846, + "step": 28688 + }, + { + "epoch": 0.74, + "learning_rate": 1.766990234495278e-06, + "loss": 0.9434, + "step": 28689 + }, + { + "epoch": 0.74, + "learning_rate": 1.7669724792121769e-06, + "loss": 0.7817, + "step": 28690 + }, + { + "epoch": 0.74, + "learning_rate": 1.7669547233418402e-06, + "loss": 0.6108, + "step": 28691 + }, + { + "epoch": 0.74, + "learning_rate": 1.7669369668842817e-06, + "loss": 0.877, + "step": 28692 + }, + { + "epoch": 0.74, + "learning_rate": 1.7669192098395148e-06, + "loss": 1.1484, + "step": 28693 + }, + { + "epoch": 0.74, + "learning_rate": 1.7669014522075529e-06, + "loss": 0.9238, + "step": 28694 + }, + { + "epoch": 0.74, + "learning_rate": 1.76688369398841e-06, + "loss": 1.1055, + "step": 28695 + }, + { + "epoch": 0.74, + "learning_rate": 1.7668659351820993e-06, + "loss": 0.8311, + "step": 28696 + }, + { + "epoch": 0.74, + "learning_rate": 1.7668481757886348e-06, + "loss": 1.0156, + "step": 28697 + }, + { + "epoch": 0.74, + "learning_rate": 1.76683041580803e-06, + "loss": 0.6953, + "step": 28698 + }, + { + "epoch": 0.74, + "learning_rate": 1.7668126552402982e-06, + "loss": 0.7529, + "step": 28699 + }, + { + "epoch": 0.74, + "learning_rate": 1.7667948940854536e-06, + "loss": 0.8281, + "step": 28700 + }, + { + "epoch": 0.74, + "learning_rate": 1.766777132343509e-06, + "loss": 0.7891, + "step": 28701 + }, + { + "epoch": 0.74, + "learning_rate": 1.7667593700144785e-06, + "loss": 0.9023, + "step": 28702 + }, + { + "epoch": 0.74, + "learning_rate": 1.7667416070983757e-06, + "loss": 0.6768, + "step": 28703 + }, + { + "epoch": 0.74, + "learning_rate": 1.766723843595214e-06, + "loss": 0.9434, + "step": 28704 + }, + { + "epoch": 0.74, + "learning_rate": 1.7667060795050073e-06, + "loss": 1.041, + "step": 28705 + }, + { + "epoch": 0.74, + "learning_rate": 1.766688314827769e-06, + "loss": 0.9258, + "step": 28706 + }, + { + "epoch": 0.74, + "learning_rate": 1.7666705495635123e-06, + "loss": 0.8047, + "step": 28707 + }, + { + "epoch": 0.74, + "learning_rate": 1.7666527837122515e-06, + "loss": 0.9209, + "step": 28708 + }, + { + "epoch": 0.74, + "learning_rate": 1.766635017274e-06, + "loss": 0.7061, + "step": 28709 + }, + { + "epoch": 0.74, + "learning_rate": 1.7666172502487713e-06, + "loss": 1.0918, + "step": 28710 + }, + { + "epoch": 0.74, + "learning_rate": 1.766599482636579e-06, + "loss": 0.9043, + "step": 28711 + }, + { + "epoch": 0.74, + "learning_rate": 1.7665817144374367e-06, + "loss": 0.8555, + "step": 28712 + }, + { + "epoch": 0.74, + "learning_rate": 1.7665639456513579e-06, + "loss": 0.8564, + "step": 28713 + }, + { + "epoch": 0.74, + "learning_rate": 1.7665461762783564e-06, + "loss": 1.1133, + "step": 28714 + }, + { + "epoch": 0.74, + "learning_rate": 1.766528406318446e-06, + "loss": 0.998, + "step": 28715 + }, + { + "epoch": 0.74, + "learning_rate": 1.7665106357716395e-06, + "loss": 0.9209, + "step": 28716 + }, + { + "epoch": 0.74, + "learning_rate": 1.7664928646379516e-06, + "loss": 0.8545, + "step": 28717 + }, + { + "epoch": 0.74, + "learning_rate": 1.7664750929173953e-06, + "loss": 0.772, + "step": 28718 + }, + { + "epoch": 0.74, + "learning_rate": 1.7664573206099837e-06, + "loss": 0.7686, + "step": 28719 + }, + { + "epoch": 0.74, + "learning_rate": 1.7664395477157315e-06, + "loss": 0.7988, + "step": 28720 + }, + { + "epoch": 0.74, + "learning_rate": 1.7664217742346516e-06, + "loss": 0.7979, + "step": 28721 + }, + { + "epoch": 0.74, + "learning_rate": 1.766404000166758e-06, + "loss": 0.8438, + "step": 28722 + }, + { + "epoch": 0.74, + "learning_rate": 1.7663862255120639e-06, + "loss": 0.8848, + "step": 28723 + }, + { + "epoch": 0.74, + "learning_rate": 1.7663684502705832e-06, + "loss": 0.8691, + "step": 28724 + }, + { + "epoch": 0.74, + "learning_rate": 1.7663506744423292e-06, + "loss": 0.8838, + "step": 28725 + }, + { + "epoch": 0.74, + "learning_rate": 1.7663328980273162e-06, + "loss": 0.5798, + "step": 28726 + }, + { + "epoch": 0.74, + "learning_rate": 1.766315121025557e-06, + "loss": 0.9756, + "step": 28727 + }, + { + "epoch": 0.74, + "learning_rate": 1.7662973434370655e-06, + "loss": 0.9082, + "step": 28728 + }, + { + "epoch": 0.74, + "learning_rate": 1.7662795652618554e-06, + "loss": 0.8955, + "step": 28729 + }, + { + "epoch": 0.74, + "learning_rate": 1.7662617864999402e-06, + "loss": 0.9951, + "step": 28730 + }, + { + "epoch": 0.74, + "learning_rate": 1.7662440071513339e-06, + "loss": 0.8359, + "step": 28731 + }, + { + "epoch": 0.74, + "learning_rate": 1.7662262272160496e-06, + "loss": 0.7856, + "step": 28732 + }, + { + "epoch": 0.74, + "learning_rate": 1.766208446694101e-06, + "loss": 1.0264, + "step": 28733 + }, + { + "epoch": 0.74, + "learning_rate": 1.7661906655855018e-06, + "loss": 0.7051, + "step": 28734 + }, + { + "epoch": 0.74, + "learning_rate": 1.7661728838902658e-06, + "loss": 1.0059, + "step": 28735 + }, + { + "epoch": 0.74, + "learning_rate": 1.7661551016084064e-06, + "loss": 0.917, + "step": 28736 + }, + { + "epoch": 0.74, + "learning_rate": 1.7661373187399372e-06, + "loss": 0.7891, + "step": 28737 + }, + { + "epoch": 0.74, + "learning_rate": 1.7661195352848722e-06, + "loss": 0.7646, + "step": 28738 + }, + { + "epoch": 0.74, + "learning_rate": 1.7661017512432243e-06, + "loss": 0.6455, + "step": 28739 + }, + { + "epoch": 0.74, + "learning_rate": 1.7660839666150077e-06, + "loss": 0.8418, + "step": 28740 + }, + { + "epoch": 0.74, + "learning_rate": 1.766066181400236e-06, + "loss": 0.7314, + "step": 28741 + }, + { + "epoch": 0.74, + "learning_rate": 1.7660483955989222e-06, + "loss": 0.7598, + "step": 28742 + }, + { + "epoch": 0.74, + "learning_rate": 1.766030609211081e-06, + "loss": 0.7012, + "step": 28743 + }, + { + "epoch": 0.74, + "learning_rate": 1.7660128222367248e-06, + "loss": 0.6318, + "step": 28744 + }, + { + "epoch": 0.74, + "learning_rate": 1.765995034675868e-06, + "loss": 0.9326, + "step": 28745 + }, + { + "epoch": 0.74, + "learning_rate": 1.7659772465285242e-06, + "loss": 0.604, + "step": 28746 + }, + { + "epoch": 0.74, + "learning_rate": 1.7659594577947065e-06, + "loss": 0.6709, + "step": 28747 + }, + { + "epoch": 0.74, + "learning_rate": 1.7659416684744291e-06, + "loss": 0.8945, + "step": 28748 + }, + { + "epoch": 0.74, + "learning_rate": 1.7659238785677053e-06, + "loss": 0.9619, + "step": 28749 + }, + { + "epoch": 0.74, + "learning_rate": 1.7659060880745486e-06, + "loss": 0.8364, + "step": 28750 + }, + { + "epoch": 0.74, + "learning_rate": 1.7658882969949734e-06, + "loss": 0.7427, + "step": 28751 + }, + { + "epoch": 0.74, + "learning_rate": 1.7658705053289924e-06, + "loss": 0.9785, + "step": 28752 + }, + { + "epoch": 0.74, + "learning_rate": 1.7658527130766194e-06, + "loss": 0.6172, + "step": 28753 + }, + { + "epoch": 0.74, + "learning_rate": 1.7658349202378684e-06, + "loss": 0.9771, + "step": 28754 + }, + { + "epoch": 0.74, + "learning_rate": 1.7658171268127529e-06, + "loss": 0.584, + "step": 28755 + }, + { + "epoch": 0.74, + "learning_rate": 1.7657993328012864e-06, + "loss": 0.7871, + "step": 28756 + }, + { + "epoch": 0.74, + "learning_rate": 1.7657815382034821e-06, + "loss": 0.8276, + "step": 28757 + }, + { + "epoch": 0.74, + "learning_rate": 1.7657637430193547e-06, + "loss": 0.7441, + "step": 28758 + }, + { + "epoch": 0.74, + "learning_rate": 1.765745947248917e-06, + "loss": 0.6885, + "step": 28759 + }, + { + "epoch": 0.74, + "learning_rate": 1.765728150892183e-06, + "loss": 1.0078, + "step": 28760 + }, + { + "epoch": 0.74, + "learning_rate": 1.7657103539491657e-06, + "loss": 0.7119, + "step": 28761 + }, + { + "epoch": 0.74, + "learning_rate": 1.7656925564198795e-06, + "loss": 1.0127, + "step": 28762 + }, + { + "epoch": 0.74, + "learning_rate": 1.7656747583043377e-06, + "loss": 1.0195, + "step": 28763 + }, + { + "epoch": 0.74, + "learning_rate": 1.765656959602554e-06, + "loss": 0.8877, + "step": 28764 + }, + { + "epoch": 0.74, + "learning_rate": 1.7656391603145417e-06, + "loss": 0.7051, + "step": 28765 + }, + { + "epoch": 0.74, + "learning_rate": 1.7656213604403151e-06, + "loss": 1.041, + "step": 28766 + }, + { + "epoch": 0.74, + "learning_rate": 1.7656035599798873e-06, + "loss": 0.7886, + "step": 28767 + }, + { + "epoch": 0.74, + "learning_rate": 1.7655857589332718e-06, + "loss": 0.8477, + "step": 28768 + }, + { + "epoch": 0.74, + "learning_rate": 1.7655679573004826e-06, + "loss": 0.8135, + "step": 28769 + }, + { + "epoch": 0.74, + "learning_rate": 1.7655501550815335e-06, + "loss": 0.9834, + "step": 28770 + }, + { + "epoch": 0.74, + "learning_rate": 1.7655323522764376e-06, + "loss": 0.8574, + "step": 28771 + }, + { + "epoch": 0.74, + "learning_rate": 1.7655145488852088e-06, + "loss": 0.9004, + "step": 28772 + }, + { + "epoch": 0.74, + "learning_rate": 1.7654967449078608e-06, + "loss": 0.8975, + "step": 28773 + }, + { + "epoch": 0.74, + "learning_rate": 1.7654789403444071e-06, + "loss": 0.9199, + "step": 28774 + }, + { + "epoch": 0.74, + "learning_rate": 1.7654611351948612e-06, + "loss": 0.9375, + "step": 28775 + }, + { + "epoch": 0.74, + "learning_rate": 1.7654433294592371e-06, + "loss": 0.8408, + "step": 28776 + }, + { + "epoch": 0.74, + "learning_rate": 1.7654255231375484e-06, + "loss": 0.9473, + "step": 28777 + }, + { + "epoch": 0.74, + "learning_rate": 1.7654077162298084e-06, + "loss": 0.7715, + "step": 28778 + }, + { + "epoch": 0.74, + "learning_rate": 1.7653899087360306e-06, + "loss": 0.6406, + "step": 28779 + }, + { + "epoch": 0.74, + "learning_rate": 1.7653721006562291e-06, + "loss": 0.7703, + "step": 28780 + }, + { + "epoch": 0.74, + "learning_rate": 1.7653542919904178e-06, + "loss": 0.6851, + "step": 28781 + }, + { + "epoch": 0.74, + "learning_rate": 1.7653364827386094e-06, + "loss": 0.8613, + "step": 28782 + }, + { + "epoch": 0.74, + "learning_rate": 1.7653186729008183e-06, + "loss": 0.8569, + "step": 28783 + }, + { + "epoch": 0.74, + "learning_rate": 1.765300862477058e-06, + "loss": 0.564, + "step": 28784 + }, + { + "epoch": 0.74, + "learning_rate": 1.7652830514673418e-06, + "loss": 0.7744, + "step": 28785 + }, + { + "epoch": 0.74, + "learning_rate": 1.7652652398716836e-06, + "loss": 0.8643, + "step": 28786 + }, + { + "epoch": 0.74, + "learning_rate": 1.765247427690097e-06, + "loss": 0.9922, + "step": 28787 + }, + { + "epoch": 0.74, + "learning_rate": 1.7652296149225956e-06, + "loss": 0.999, + "step": 28788 + }, + { + "epoch": 0.74, + "learning_rate": 1.765211801569193e-06, + "loss": 0.7461, + "step": 28789 + }, + { + "epoch": 0.74, + "learning_rate": 1.7651939876299032e-06, + "loss": 0.6838, + "step": 28790 + }, + { + "epoch": 0.74, + "learning_rate": 1.7651761731047391e-06, + "loss": 1.1689, + "step": 28791 + }, + { + "epoch": 0.74, + "learning_rate": 1.765158357993715e-06, + "loss": 0.9043, + "step": 28792 + }, + { + "epoch": 0.74, + "learning_rate": 1.7651405422968443e-06, + "loss": 0.6729, + "step": 28793 + }, + { + "epoch": 0.74, + "learning_rate": 1.7651227260141411e-06, + "loss": 0.834, + "step": 28794 + }, + { + "epoch": 0.74, + "learning_rate": 1.765104909145618e-06, + "loss": 0.916, + "step": 28795 + }, + { + "epoch": 0.74, + "learning_rate": 1.7650870916912898e-06, + "loss": 1.0742, + "step": 28796 + }, + { + "epoch": 0.74, + "learning_rate": 1.7650692736511692e-06, + "loss": 1.002, + "step": 28797 + }, + { + "epoch": 0.74, + "learning_rate": 1.7650514550252704e-06, + "loss": 0.6519, + "step": 28798 + }, + { + "epoch": 0.74, + "learning_rate": 1.7650336358136067e-06, + "loss": 0.7915, + "step": 28799 + }, + { + "epoch": 0.74, + "learning_rate": 1.765015816016192e-06, + "loss": 0.8623, + "step": 28800 + }, + { + "epoch": 0.74, + "learning_rate": 1.76499799563304e-06, + "loss": 0.8057, + "step": 28801 + }, + { + "epoch": 0.74, + "learning_rate": 1.764980174664164e-06, + "loss": 0.9229, + "step": 28802 + }, + { + "epoch": 0.74, + "learning_rate": 1.764962353109578e-06, + "loss": 0.9629, + "step": 28803 + }, + { + "epoch": 0.74, + "learning_rate": 1.7649445309692954e-06, + "loss": 0.5957, + "step": 28804 + }, + { + "epoch": 0.74, + "learning_rate": 1.76492670824333e-06, + "loss": 0.6455, + "step": 28805 + }, + { + "epoch": 0.74, + "learning_rate": 1.7649088849316954e-06, + "loss": 1.04, + "step": 28806 + }, + { + "epoch": 0.74, + "learning_rate": 1.7648910610344053e-06, + "loss": 0.8276, + "step": 28807 + }, + { + "epoch": 0.74, + "learning_rate": 1.7648732365514732e-06, + "loss": 1.083, + "step": 28808 + }, + { + "epoch": 0.74, + "learning_rate": 1.764855411482913e-06, + "loss": 0.8584, + "step": 28809 + }, + { + "epoch": 0.74, + "learning_rate": 1.7648375858287378e-06, + "loss": 1.0859, + "step": 28810 + }, + { + "epoch": 0.74, + "learning_rate": 1.764819759588962e-06, + "loss": 0.917, + "step": 28811 + }, + { + "epoch": 0.74, + "learning_rate": 1.7648019327635986e-06, + "loss": 0.835, + "step": 28812 + }, + { + "epoch": 0.74, + "learning_rate": 1.7647841053526618e-06, + "loss": 1.0029, + "step": 28813 + }, + { + "epoch": 0.74, + "learning_rate": 1.7647662773561648e-06, + "loss": 0.8799, + "step": 28814 + }, + { + "epoch": 0.74, + "learning_rate": 1.7647484487741214e-06, + "loss": 0.6875, + "step": 28815 + }, + { + "epoch": 0.74, + "learning_rate": 1.7647306196065455e-06, + "loss": 0.8408, + "step": 28816 + }, + { + "epoch": 0.74, + "learning_rate": 1.7647127898534504e-06, + "loss": 0.6523, + "step": 28817 + }, + { + "epoch": 0.74, + "learning_rate": 1.7646949595148498e-06, + "loss": 1.0361, + "step": 28818 + }, + { + "epoch": 0.74, + "learning_rate": 1.7646771285907573e-06, + "loss": 0.8145, + "step": 28819 + }, + { + "epoch": 0.74, + "learning_rate": 1.7646592970811871e-06, + "loss": 0.9541, + "step": 28820 + }, + { + "epoch": 0.74, + "learning_rate": 1.7646414649861523e-06, + "loss": 0.8887, + "step": 28821 + }, + { + "epoch": 0.74, + "learning_rate": 1.7646236323056664e-06, + "loss": 0.9756, + "step": 28822 + }, + { + "epoch": 0.74, + "learning_rate": 1.7646057990397436e-06, + "loss": 0.9375, + "step": 28823 + }, + { + "epoch": 0.74, + "learning_rate": 1.7645879651883972e-06, + "loss": 0.6938, + "step": 28824 + }, + { + "epoch": 0.74, + "learning_rate": 1.764570130751641e-06, + "loss": 0.8203, + "step": 28825 + }, + { + "epoch": 0.74, + "learning_rate": 1.7645522957294886e-06, + "loss": 1.0127, + "step": 28826 + }, + { + "epoch": 0.74, + "learning_rate": 1.7645344601219535e-06, + "loss": 0.9258, + "step": 28827 + }, + { + "epoch": 0.74, + "learning_rate": 1.7645166239290497e-06, + "loss": 0.9014, + "step": 28828 + }, + { + "epoch": 0.74, + "learning_rate": 1.7644987871507909e-06, + "loss": 1.0039, + "step": 28829 + }, + { + "epoch": 0.74, + "learning_rate": 1.7644809497871899e-06, + "loss": 0.793, + "step": 28830 + }, + { + "epoch": 0.74, + "learning_rate": 1.7644631118382616e-06, + "loss": 0.6304, + "step": 28831 + }, + { + "epoch": 0.74, + "learning_rate": 1.7644452733040188e-06, + "loss": 0.8223, + "step": 28832 + }, + { + "epoch": 0.74, + "learning_rate": 1.7644274341844753e-06, + "loss": 0.8379, + "step": 28833 + }, + { + "epoch": 0.74, + "learning_rate": 1.7644095944796452e-06, + "loss": 0.9688, + "step": 28834 + }, + { + "epoch": 0.74, + "learning_rate": 1.7643917541895414e-06, + "loss": 0.8525, + "step": 28835 + }, + { + "epoch": 0.74, + "learning_rate": 1.7643739133141784e-06, + "loss": 0.8096, + "step": 28836 + }, + { + "epoch": 0.74, + "learning_rate": 1.764356071853569e-06, + "loss": 0.7275, + "step": 28837 + }, + { + "epoch": 0.74, + "learning_rate": 1.764338229807728e-06, + "loss": 1.0352, + "step": 28838 + }, + { + "epoch": 0.74, + "learning_rate": 1.7643203871766677e-06, + "loss": 0.7988, + "step": 28839 + }, + { + "epoch": 0.74, + "learning_rate": 1.7643025439604024e-06, + "loss": 0.8242, + "step": 28840 + }, + { + "epoch": 0.74, + "learning_rate": 1.7642847001589463e-06, + "loss": 0.79, + "step": 28841 + }, + { + "epoch": 0.74, + "learning_rate": 1.764266855772312e-06, + "loss": 0.6621, + "step": 28842 + }, + { + "epoch": 0.74, + "learning_rate": 1.7642490108005142e-06, + "loss": 0.8145, + "step": 28843 + }, + { + "epoch": 0.74, + "learning_rate": 1.7642311652435654e-06, + "loss": 0.8291, + "step": 28844 + }, + { + "epoch": 0.74, + "learning_rate": 1.7642133191014806e-06, + "loss": 0.9824, + "step": 28845 + }, + { + "epoch": 0.74, + "learning_rate": 1.7641954723742724e-06, + "loss": 0.5688, + "step": 28846 + }, + { + "epoch": 0.74, + "learning_rate": 1.7641776250619552e-06, + "loss": 0.8076, + "step": 28847 + }, + { + "epoch": 0.74, + "learning_rate": 1.7641597771645422e-06, + "loss": 0.7188, + "step": 28848 + }, + { + "epoch": 0.74, + "learning_rate": 1.764141928682047e-06, + "loss": 0.8975, + "step": 28849 + }, + { + "epoch": 0.74, + "learning_rate": 1.7641240796144836e-06, + "loss": 0.9902, + "step": 28850 + }, + { + "epoch": 0.74, + "learning_rate": 1.7641062299618656e-06, + "loss": 0.8721, + "step": 28851 + }, + { + "epoch": 0.74, + "learning_rate": 1.7640883797242067e-06, + "loss": 0.8018, + "step": 28852 + }, + { + "epoch": 0.74, + "learning_rate": 1.7640705289015203e-06, + "loss": 0.7217, + "step": 28853 + }, + { + "epoch": 0.74, + "learning_rate": 1.76405267749382e-06, + "loss": 0.9287, + "step": 28854 + }, + { + "epoch": 0.74, + "learning_rate": 1.76403482550112e-06, + "loss": 0.9873, + "step": 28855 + }, + { + "epoch": 0.74, + "learning_rate": 1.7640169729234337e-06, + "loss": 1.0098, + "step": 28856 + }, + { + "epoch": 0.74, + "learning_rate": 1.7639991197607746e-06, + "loss": 0.75, + "step": 28857 + }, + { + "epoch": 0.74, + "learning_rate": 1.7639812660131565e-06, + "loss": 0.8418, + "step": 28858 + }, + { + "epoch": 0.74, + "learning_rate": 1.763963411680593e-06, + "loss": 0.9648, + "step": 28859 + }, + { + "epoch": 0.74, + "learning_rate": 1.7639455567630982e-06, + "loss": 0.9277, + "step": 28860 + }, + { + "epoch": 0.74, + "learning_rate": 1.7639277012606852e-06, + "loss": 0.8359, + "step": 28861 + }, + { + "epoch": 0.74, + "learning_rate": 1.7639098451733675e-06, + "loss": 0.7778, + "step": 28862 + }, + { + "epoch": 0.74, + "learning_rate": 1.7638919885011599e-06, + "loss": 0.5789, + "step": 28863 + }, + { + "epoch": 0.74, + "learning_rate": 1.763874131244075e-06, + "loss": 0.7666, + "step": 28864 + }, + { + "epoch": 0.74, + "learning_rate": 1.7638562734021264e-06, + "loss": 0.8994, + "step": 28865 + }, + { + "epoch": 0.74, + "learning_rate": 1.7638384149753288e-06, + "loss": 1.0381, + "step": 28866 + }, + { + "epoch": 0.74, + "learning_rate": 1.7638205559636949e-06, + "loss": 0.9785, + "step": 28867 + }, + { + "epoch": 0.74, + "learning_rate": 1.7638026963672387e-06, + "loss": 0.8608, + "step": 28868 + }, + { + "epoch": 0.74, + "learning_rate": 1.763784836185974e-06, + "loss": 0.9199, + "step": 28869 + }, + { + "epoch": 0.74, + "learning_rate": 1.7637669754199146e-06, + "loss": 0.8857, + "step": 28870 + }, + { + "epoch": 0.74, + "learning_rate": 1.7637491140690734e-06, + "loss": 0.8359, + "step": 28871 + }, + { + "epoch": 0.74, + "learning_rate": 1.763731252133465e-06, + "loss": 0.6514, + "step": 28872 + }, + { + "epoch": 0.74, + "learning_rate": 1.7637133896131027e-06, + "loss": 0.708, + "step": 28873 + }, + { + "epoch": 0.74, + "learning_rate": 1.763695526508e-06, + "loss": 0.751, + "step": 28874 + }, + { + "epoch": 0.74, + "learning_rate": 1.763677662818171e-06, + "loss": 0.8613, + "step": 28875 + }, + { + "epoch": 0.74, + "learning_rate": 1.7636597985436287e-06, + "loss": 0.8213, + "step": 28876 + }, + { + "epoch": 0.74, + "learning_rate": 1.7636419336843875e-06, + "loss": 0.9736, + "step": 28877 + }, + { + "epoch": 0.74, + "learning_rate": 1.7636240682404608e-06, + "loss": 0.8379, + "step": 28878 + }, + { + "epoch": 0.74, + "learning_rate": 1.7636062022118622e-06, + "loss": 0.9512, + "step": 28879 + }, + { + "epoch": 0.74, + "learning_rate": 1.7635883355986057e-06, + "loss": 0.8965, + "step": 28880 + }, + { + "epoch": 0.74, + "learning_rate": 1.7635704684007044e-06, + "loss": 0.9824, + "step": 28881 + }, + { + "epoch": 0.74, + "learning_rate": 1.7635526006181722e-06, + "loss": 0.7212, + "step": 28882 + }, + { + "epoch": 0.74, + "learning_rate": 1.7635347322510232e-06, + "loss": 0.8262, + "step": 28883 + }, + { + "epoch": 0.74, + "learning_rate": 1.7635168632992707e-06, + "loss": 0.875, + "step": 28884 + }, + { + "epoch": 0.74, + "learning_rate": 1.7634989937629283e-06, + "loss": 0.6846, + "step": 28885 + }, + { + "epoch": 0.74, + "learning_rate": 1.76348112364201e-06, + "loss": 0.9355, + "step": 28886 + }, + { + "epoch": 0.74, + "learning_rate": 1.7634632529365292e-06, + "loss": 1.2227, + "step": 28887 + }, + { + "epoch": 0.74, + "learning_rate": 1.7634453816464995e-06, + "loss": 0.7319, + "step": 28888 + }, + { + "epoch": 0.74, + "learning_rate": 1.763427509771935e-06, + "loss": 0.8945, + "step": 28889 + }, + { + "epoch": 0.74, + "learning_rate": 1.7634096373128493e-06, + "loss": 0.6328, + "step": 28890 + }, + { + "epoch": 0.74, + "learning_rate": 1.7633917642692558e-06, + "loss": 0.8857, + "step": 28891 + }, + { + "epoch": 0.74, + "learning_rate": 1.7633738906411684e-06, + "loss": 1.0508, + "step": 28892 + }, + { + "epoch": 0.74, + "learning_rate": 1.7633560164286006e-06, + "loss": 0.7222, + "step": 28893 + }, + { + "epoch": 0.74, + "learning_rate": 1.763338141631566e-06, + "loss": 0.7842, + "step": 28894 + }, + { + "epoch": 0.74, + "learning_rate": 1.763320266250079e-06, + "loss": 0.6125, + "step": 28895 + }, + { + "epoch": 0.74, + "learning_rate": 1.7633023902841524e-06, + "loss": 0.832, + "step": 28896 + }, + { + "epoch": 0.74, + "learning_rate": 1.7632845137338005e-06, + "loss": 0.9805, + "step": 28897 + }, + { + "epoch": 0.74, + "learning_rate": 1.7632666365990363e-06, + "loss": 0.5728, + "step": 28898 + }, + { + "epoch": 0.74, + "learning_rate": 1.7632487588798743e-06, + "loss": 0.8057, + "step": 28899 + }, + { + "epoch": 0.74, + "learning_rate": 1.763230880576328e-06, + "loss": 0.9316, + "step": 28900 + }, + { + "epoch": 0.74, + "learning_rate": 1.7632130016884103e-06, + "loss": 0.8555, + "step": 28901 + }, + { + "epoch": 0.74, + "learning_rate": 1.763195122216136e-06, + "loss": 0.7764, + "step": 28902 + }, + { + "epoch": 0.74, + "learning_rate": 1.7631772421595178e-06, + "loss": 0.7246, + "step": 28903 + }, + { + "epoch": 0.74, + "learning_rate": 1.7631593615185705e-06, + "loss": 0.8379, + "step": 28904 + }, + { + "epoch": 0.74, + "learning_rate": 1.763141480293307e-06, + "loss": 0.7043, + "step": 28905 + }, + { + "epoch": 0.74, + "learning_rate": 1.7631235984837409e-06, + "loss": 1.0771, + "step": 28906 + }, + { + "epoch": 0.74, + "learning_rate": 1.7631057160898864e-06, + "loss": 0.8701, + "step": 28907 + }, + { + "epoch": 0.74, + "learning_rate": 1.7630878331117566e-06, + "loss": 1.1611, + "step": 28908 + }, + { + "epoch": 0.74, + "learning_rate": 1.763069949549366e-06, + "loss": 0.709, + "step": 28909 + }, + { + "epoch": 0.74, + "learning_rate": 1.7630520654027275e-06, + "loss": 0.9658, + "step": 28910 + }, + { + "epoch": 0.74, + "learning_rate": 1.763034180671855e-06, + "loss": 0.9102, + "step": 28911 + }, + { + "epoch": 0.74, + "learning_rate": 1.7630162953567627e-06, + "loss": 0.8691, + "step": 28912 + }, + { + "epoch": 0.74, + "learning_rate": 1.7629984094574636e-06, + "loss": 0.8516, + "step": 28913 + }, + { + "epoch": 0.74, + "learning_rate": 1.7629805229739718e-06, + "loss": 1.1572, + "step": 28914 + }, + { + "epoch": 0.74, + "learning_rate": 1.762962635906301e-06, + "loss": 0.8701, + "step": 28915 + }, + { + "epoch": 0.74, + "learning_rate": 1.7629447482544648e-06, + "loss": 0.7905, + "step": 28916 + }, + { + "epoch": 0.74, + "learning_rate": 1.7629268600184769e-06, + "loss": 0.8857, + "step": 28917 + }, + { + "epoch": 0.74, + "learning_rate": 1.7629089711983507e-06, + "loss": 0.9951, + "step": 28918 + }, + { + "epoch": 0.74, + "learning_rate": 1.7628910817941004e-06, + "loss": 0.6168, + "step": 28919 + }, + { + "epoch": 0.74, + "learning_rate": 1.7628731918057396e-06, + "loss": 0.8262, + "step": 28920 + }, + { + "epoch": 0.74, + "learning_rate": 1.7628553012332814e-06, + "loss": 0.9668, + "step": 28921 + }, + { + "epoch": 0.74, + "learning_rate": 1.7628374100767404e-06, + "loss": 0.9238, + "step": 28922 + }, + { + "epoch": 0.74, + "learning_rate": 1.76281951833613e-06, + "loss": 0.8721, + "step": 28923 + }, + { + "epoch": 0.74, + "learning_rate": 1.7628016260114634e-06, + "loss": 1.0332, + "step": 28924 + }, + { + "epoch": 0.74, + "learning_rate": 1.7627837331027547e-06, + "loss": 0.9395, + "step": 28925 + }, + { + "epoch": 0.74, + "learning_rate": 1.7627658396100178e-06, + "loss": 0.8496, + "step": 28926 + }, + { + "epoch": 0.74, + "learning_rate": 1.762747945533266e-06, + "loss": 0.834, + "step": 28927 + }, + { + "epoch": 0.74, + "learning_rate": 1.7627300508725132e-06, + "loss": 0.9551, + "step": 28928 + }, + { + "epoch": 0.74, + "learning_rate": 1.762712155627773e-06, + "loss": 0.8643, + "step": 28929 + }, + { + "epoch": 0.74, + "learning_rate": 1.7626942597990592e-06, + "loss": 0.9062, + "step": 28930 + }, + { + "epoch": 0.74, + "learning_rate": 1.7626763633863857e-06, + "loss": 0.7007, + "step": 28931 + }, + { + "epoch": 0.74, + "learning_rate": 1.762658466389766e-06, + "loss": 0.9502, + "step": 28932 + }, + { + "epoch": 0.74, + "learning_rate": 1.7626405688092134e-06, + "loss": 0.8584, + "step": 28933 + }, + { + "epoch": 0.74, + "learning_rate": 1.7626226706447421e-06, + "loss": 0.7898, + "step": 28934 + }, + { + "epoch": 0.74, + "learning_rate": 1.762604771896366e-06, + "loss": 0.9727, + "step": 28935 + }, + { + "epoch": 0.74, + "learning_rate": 1.762586872564098e-06, + "loss": 0.9346, + "step": 28936 + }, + { + "epoch": 0.74, + "learning_rate": 1.7625689726479526e-06, + "loss": 0.916, + "step": 28937 + }, + { + "epoch": 0.74, + "learning_rate": 1.7625510721479432e-06, + "loss": 0.9658, + "step": 28938 + }, + { + "epoch": 0.74, + "learning_rate": 1.7625331710640833e-06, + "loss": 0.7969, + "step": 28939 + }, + { + "epoch": 0.74, + "learning_rate": 1.762515269396387e-06, + "loss": 0.5625, + "step": 28940 + }, + { + "epoch": 0.74, + "learning_rate": 1.762497367144868e-06, + "loss": 0.9785, + "step": 28941 + }, + { + "epoch": 0.74, + "learning_rate": 1.7624794643095396e-06, + "loss": 0.918, + "step": 28942 + }, + { + "epoch": 0.74, + "learning_rate": 1.7624615608904156e-06, + "loss": 0.6248, + "step": 28943 + }, + { + "epoch": 0.74, + "learning_rate": 1.76244365688751e-06, + "loss": 0.7446, + "step": 28944 + }, + { + "epoch": 0.74, + "learning_rate": 1.7624257523008363e-06, + "loss": 0.915, + "step": 28945 + }, + { + "epoch": 0.74, + "learning_rate": 1.7624078471304084e-06, + "loss": 0.7585, + "step": 28946 + }, + { + "epoch": 0.74, + "learning_rate": 1.7623899413762399e-06, + "loss": 0.9648, + "step": 28947 + }, + { + "epoch": 0.74, + "learning_rate": 1.7623720350383443e-06, + "loss": 0.9551, + "step": 28948 + }, + { + "epoch": 0.74, + "learning_rate": 1.7623541281167356e-06, + "loss": 0.8584, + "step": 28949 + }, + { + "epoch": 0.74, + "learning_rate": 1.762336220611427e-06, + "loss": 0.572, + "step": 28950 + }, + { + "epoch": 0.74, + "learning_rate": 1.7623183125224332e-06, + "loss": 0.8203, + "step": 28951 + }, + { + "epoch": 0.74, + "learning_rate": 1.762300403849767e-06, + "loss": 0.9492, + "step": 28952 + }, + { + "epoch": 0.74, + "learning_rate": 1.7622824945934424e-06, + "loss": 0.8242, + "step": 28953 + }, + { + "epoch": 0.74, + "learning_rate": 1.7622645847534732e-06, + "loss": 0.7251, + "step": 28954 + }, + { + "epoch": 0.74, + "learning_rate": 1.7622466743298733e-06, + "loss": 1.0977, + "step": 28955 + }, + { + "epoch": 0.74, + "learning_rate": 1.7622287633226561e-06, + "loss": 0.7427, + "step": 28956 + }, + { + "epoch": 0.74, + "learning_rate": 1.7622108517318351e-06, + "loss": 0.8652, + "step": 28957 + }, + { + "epoch": 0.74, + "learning_rate": 1.7621929395574245e-06, + "loss": 1.0088, + "step": 28958 + }, + { + "epoch": 0.74, + "learning_rate": 1.7621750267994378e-06, + "loss": 0.6919, + "step": 28959 + }, + { + "epoch": 0.74, + "learning_rate": 1.7621571134578884e-06, + "loss": 0.8984, + "step": 28960 + }, + { + "epoch": 0.74, + "learning_rate": 1.7621391995327907e-06, + "loss": 0.7231, + "step": 28961 + }, + { + "epoch": 0.74, + "learning_rate": 1.762121285024158e-06, + "loss": 0.8564, + "step": 28962 + }, + { + "epoch": 0.74, + "learning_rate": 1.762103369932004e-06, + "loss": 0.7334, + "step": 28963 + }, + { + "epoch": 0.74, + "learning_rate": 1.7620854542563427e-06, + "loss": 0.7515, + "step": 28964 + }, + { + "epoch": 0.74, + "learning_rate": 1.7620675379971874e-06, + "loss": 0.7783, + "step": 28965 + }, + { + "epoch": 0.74, + "learning_rate": 1.762049621154552e-06, + "loss": 0.9316, + "step": 28966 + }, + { + "epoch": 0.74, + "learning_rate": 1.7620317037284504e-06, + "loss": 0.8184, + "step": 28967 + }, + { + "epoch": 0.74, + "learning_rate": 1.762013785718896e-06, + "loss": 0.6533, + "step": 28968 + }, + { + "epoch": 0.74, + "learning_rate": 1.761995867125903e-06, + "loss": 0.7495, + "step": 28969 + }, + { + "epoch": 0.74, + "learning_rate": 1.7619779479494845e-06, + "loss": 0.7974, + "step": 28970 + }, + { + "epoch": 0.74, + "learning_rate": 1.7619600281896548e-06, + "loss": 0.9521, + "step": 28971 + }, + { + "epoch": 0.74, + "learning_rate": 1.7619421078464269e-06, + "loss": 0.9062, + "step": 28972 + }, + { + "epoch": 0.74, + "learning_rate": 1.7619241869198154e-06, + "loss": 1.1006, + "step": 28973 + }, + { + "epoch": 0.74, + "learning_rate": 1.7619062654098333e-06, + "loss": 0.9277, + "step": 28974 + }, + { + "epoch": 0.74, + "learning_rate": 1.7618883433164947e-06, + "loss": 1.1689, + "step": 28975 + }, + { + "epoch": 0.74, + "learning_rate": 1.7618704206398132e-06, + "loss": 0.999, + "step": 28976 + }, + { + "epoch": 0.74, + "learning_rate": 1.7618524973798028e-06, + "loss": 0.7275, + "step": 28977 + }, + { + "epoch": 0.74, + "learning_rate": 1.7618345735364767e-06, + "loss": 1.0312, + "step": 28978 + }, + { + "epoch": 0.74, + "learning_rate": 1.761816649109849e-06, + "loss": 0.9375, + "step": 28979 + }, + { + "epoch": 0.74, + "learning_rate": 1.761798724099933e-06, + "loss": 0.957, + "step": 28980 + }, + { + "epoch": 0.74, + "learning_rate": 1.7617807985067432e-06, + "loss": 1.0137, + "step": 28981 + }, + { + "epoch": 0.74, + "learning_rate": 1.7617628723302927e-06, + "loss": 0.8359, + "step": 28982 + }, + { + "epoch": 0.74, + "learning_rate": 1.7617449455705954e-06, + "loss": 0.8828, + "step": 28983 + }, + { + "epoch": 0.74, + "learning_rate": 1.761727018227665e-06, + "loss": 0.8096, + "step": 28984 + }, + { + "epoch": 0.74, + "learning_rate": 1.7617090903015153e-06, + "loss": 0.4728, + "step": 28985 + }, + { + "epoch": 0.74, + "learning_rate": 1.7616911617921598e-06, + "loss": 0.9346, + "step": 28986 + }, + { + "epoch": 0.74, + "learning_rate": 1.7616732326996125e-06, + "loss": 0.6895, + "step": 28987 + }, + { + "epoch": 0.74, + "learning_rate": 1.761655303023887e-06, + "loss": 0.6963, + "step": 28988 + }, + { + "epoch": 0.74, + "learning_rate": 1.7616373727649974e-06, + "loss": 0.916, + "step": 28989 + }, + { + "epoch": 0.74, + "learning_rate": 1.7616194419229566e-06, + "loss": 0.792, + "step": 28990 + }, + { + "epoch": 0.74, + "learning_rate": 1.761601510497779e-06, + "loss": 0.7827, + "step": 28991 + }, + { + "epoch": 0.74, + "learning_rate": 1.761583578489478e-06, + "loss": 0.8691, + "step": 28992 + }, + { + "epoch": 0.74, + "learning_rate": 1.761565645898068e-06, + "loss": 0.8555, + "step": 28993 + }, + { + "epoch": 0.74, + "learning_rate": 1.7615477127235616e-06, + "loss": 0.8252, + "step": 28994 + }, + { + "epoch": 0.74, + "learning_rate": 1.7615297789659733e-06, + "loss": 0.9458, + "step": 28995 + }, + { + "epoch": 0.74, + "learning_rate": 1.7615118446253167e-06, + "loss": 0.6492, + "step": 28996 + }, + { + "epoch": 0.74, + "learning_rate": 1.7614939097016057e-06, + "loss": 0.9023, + "step": 28997 + }, + { + "epoch": 0.74, + "learning_rate": 1.7614759741948534e-06, + "loss": 0.709, + "step": 28998 + }, + { + "epoch": 0.74, + "learning_rate": 1.7614580381050743e-06, + "loss": 0.9658, + "step": 28999 + }, + { + "epoch": 0.74, + "learning_rate": 1.7614401014322819e-06, + "loss": 0.7598, + "step": 29000 + }, + { + "epoch": 0.74, + "learning_rate": 1.7614221641764896e-06, + "loss": 0.8569, + "step": 29001 + }, + { + "epoch": 0.74, + "learning_rate": 1.7614042263377113e-06, + "loss": 0.877, + "step": 29002 + }, + { + "epoch": 0.74, + "learning_rate": 1.7613862879159612e-06, + "loss": 0.9736, + "step": 29003 + }, + { + "epoch": 0.74, + "learning_rate": 1.7613683489112522e-06, + "loss": 0.874, + "step": 29004 + }, + { + "epoch": 0.74, + "learning_rate": 1.7613504093235985e-06, + "loss": 0.9951, + "step": 29005 + }, + { + "epoch": 0.74, + "learning_rate": 1.7613324691530139e-06, + "loss": 0.73, + "step": 29006 + }, + { + "epoch": 0.74, + "learning_rate": 1.761314528399512e-06, + "loss": 1.002, + "step": 29007 + }, + { + "epoch": 0.74, + "learning_rate": 1.7612965870631065e-06, + "loss": 0.8442, + "step": 29008 + }, + { + "epoch": 0.74, + "learning_rate": 1.7612786451438113e-06, + "loss": 0.8057, + "step": 29009 + }, + { + "epoch": 0.74, + "learning_rate": 1.7612607026416399e-06, + "loss": 0.8633, + "step": 29010 + }, + { + "epoch": 0.74, + "learning_rate": 1.7612427595566067e-06, + "loss": 0.9805, + "step": 29011 + }, + { + "epoch": 0.74, + "learning_rate": 1.7612248158887244e-06, + "loss": 0.5591, + "step": 29012 + }, + { + "epoch": 0.74, + "learning_rate": 1.7612068716380072e-06, + "loss": 0.9121, + "step": 29013 + }, + { + "epoch": 0.74, + "learning_rate": 1.7611889268044694e-06, + "loss": 0.937, + "step": 29014 + }, + { + "epoch": 0.74, + "learning_rate": 1.7611709813881239e-06, + "loss": 0.751, + "step": 29015 + }, + { + "epoch": 0.74, + "learning_rate": 1.7611530353889848e-06, + "loss": 0.8179, + "step": 29016 + }, + { + "epoch": 0.74, + "learning_rate": 1.7611350888070657e-06, + "loss": 0.9209, + "step": 29017 + }, + { + "epoch": 0.74, + "learning_rate": 1.7611171416423807e-06, + "loss": 0.9854, + "step": 29018 + }, + { + "epoch": 0.74, + "learning_rate": 1.7610991938949431e-06, + "loss": 0.8584, + "step": 29019 + }, + { + "epoch": 0.74, + "learning_rate": 1.761081245564767e-06, + "loss": 0.9219, + "step": 29020 + }, + { + "epoch": 0.74, + "learning_rate": 1.761063296651866e-06, + "loss": 0.8975, + "step": 29021 + }, + { + "epoch": 0.74, + "learning_rate": 1.7610453471562537e-06, + "loss": 0.6143, + "step": 29022 + }, + { + "epoch": 0.74, + "learning_rate": 1.761027397077944e-06, + "loss": 0.9453, + "step": 29023 + }, + { + "epoch": 0.74, + "learning_rate": 1.7610094464169506e-06, + "loss": 0.8301, + "step": 29024 + }, + { + "epoch": 0.74, + "learning_rate": 1.7609914951732874e-06, + "loss": 0.8457, + "step": 29025 + }, + { + "epoch": 0.74, + "learning_rate": 1.760973543346968e-06, + "loss": 0.9805, + "step": 29026 + }, + { + "epoch": 0.74, + "learning_rate": 1.760955590938006e-06, + "loss": 0.7656, + "step": 29027 + }, + { + "epoch": 0.74, + "learning_rate": 1.7609376379464153e-06, + "loss": 0.835, + "step": 29028 + }, + { + "epoch": 0.74, + "learning_rate": 1.7609196843722098e-06, + "loss": 0.8643, + "step": 29029 + }, + { + "epoch": 0.74, + "learning_rate": 1.7609017302154027e-06, + "loss": 0.9414, + "step": 29030 + }, + { + "epoch": 0.74, + "learning_rate": 1.7608837754760084e-06, + "loss": 0.7358, + "step": 29031 + }, + { + "epoch": 0.74, + "learning_rate": 1.7608658201540404e-06, + "loss": 0.8262, + "step": 29032 + }, + { + "epoch": 0.74, + "learning_rate": 1.7608478642495125e-06, + "loss": 0.8057, + "step": 29033 + }, + { + "epoch": 0.74, + "learning_rate": 1.7608299077624382e-06, + "loss": 0.7715, + "step": 29034 + }, + { + "epoch": 0.74, + "learning_rate": 1.7608119506928317e-06, + "loss": 0.9414, + "step": 29035 + }, + { + "epoch": 0.74, + "learning_rate": 1.7607939930407064e-06, + "loss": 0.832, + "step": 29036 + }, + { + "epoch": 0.74, + "learning_rate": 1.760776034806076e-06, + "loss": 0.9043, + "step": 29037 + }, + { + "epoch": 0.74, + "learning_rate": 1.7607580759889542e-06, + "loss": 0.5695, + "step": 29038 + }, + { + "epoch": 0.74, + "learning_rate": 1.7607401165893551e-06, + "loss": 0.9551, + "step": 29039 + }, + { + "epoch": 0.74, + "learning_rate": 1.7607221566072924e-06, + "loss": 0.7397, + "step": 29040 + }, + { + "epoch": 0.74, + "learning_rate": 1.7607041960427795e-06, + "loss": 0.7357, + "step": 29041 + }, + { + "epoch": 0.74, + "learning_rate": 1.7606862348958305e-06, + "loss": 0.875, + "step": 29042 + }, + { + "epoch": 0.74, + "learning_rate": 1.760668273166459e-06, + "loss": 0.6616, + "step": 29043 + }, + { + "epoch": 0.74, + "learning_rate": 1.7606503108546788e-06, + "loss": 0.8525, + "step": 29044 + }, + { + "epoch": 0.74, + "learning_rate": 1.7606323479605037e-06, + "loss": 0.8867, + "step": 29045 + }, + { + "epoch": 0.74, + "learning_rate": 1.7606143844839472e-06, + "loss": 0.9365, + "step": 29046 + }, + { + "epoch": 0.74, + "learning_rate": 1.7605964204250234e-06, + "loss": 0.7786, + "step": 29047 + }, + { + "epoch": 0.74, + "learning_rate": 1.760578455783746e-06, + "loss": 0.957, + "step": 29048 + }, + { + "epoch": 0.74, + "learning_rate": 1.7605604905601282e-06, + "loss": 0.8955, + "step": 29049 + }, + { + "epoch": 0.74, + "learning_rate": 1.7605425247541846e-06, + "loss": 1.0684, + "step": 29050 + }, + { + "epoch": 0.74, + "learning_rate": 1.7605245583659285e-06, + "loss": 0.8877, + "step": 29051 + }, + { + "epoch": 0.74, + "learning_rate": 1.7605065913953736e-06, + "loss": 0.9404, + "step": 29052 + }, + { + "epoch": 0.74, + "learning_rate": 1.7604886238425338e-06, + "loss": 0.9023, + "step": 29053 + }, + { + "epoch": 0.74, + "learning_rate": 1.7604706557074227e-06, + "loss": 0.918, + "step": 29054 + }, + { + "epoch": 0.74, + "learning_rate": 1.7604526869900545e-06, + "loss": 0.958, + "step": 29055 + }, + { + "epoch": 0.74, + "learning_rate": 1.7604347176904426e-06, + "loss": 0.7583, + "step": 29056 + }, + { + "epoch": 0.74, + "learning_rate": 1.7604167478086005e-06, + "loss": 0.9443, + "step": 29057 + }, + { + "epoch": 0.74, + "learning_rate": 1.7603987773445425e-06, + "loss": 0.7319, + "step": 29058 + }, + { + "epoch": 0.74, + "learning_rate": 1.7603808062982822e-06, + "loss": 0.9111, + "step": 29059 + }, + { + "epoch": 0.74, + "learning_rate": 1.7603628346698332e-06, + "loss": 1.0088, + "step": 29060 + }, + { + "epoch": 0.74, + "learning_rate": 1.7603448624592092e-06, + "loss": 0.9678, + "step": 29061 + }, + { + "epoch": 0.74, + "learning_rate": 1.7603268896664243e-06, + "loss": 0.7949, + "step": 29062 + }, + { + "epoch": 0.74, + "learning_rate": 1.7603089162914918e-06, + "loss": 0.7637, + "step": 29063 + }, + { + "epoch": 0.74, + "learning_rate": 1.7602909423344258e-06, + "loss": 0.7803, + "step": 29064 + }, + { + "epoch": 0.74, + "learning_rate": 1.7602729677952405e-06, + "loss": 0.791, + "step": 29065 + }, + { + "epoch": 0.74, + "learning_rate": 1.7602549926739484e-06, + "loss": 0.8042, + "step": 29066 + }, + { + "epoch": 0.75, + "learning_rate": 1.7602370169705646e-06, + "loss": 0.8438, + "step": 29067 + }, + { + "epoch": 0.75, + "learning_rate": 1.7602190406851016e-06, + "loss": 0.875, + "step": 29068 + }, + { + "epoch": 0.75, + "learning_rate": 1.7602010638175745e-06, + "loss": 0.7871, + "step": 29069 + }, + { + "epoch": 0.75, + "learning_rate": 1.7601830863679962e-06, + "loss": 1.0615, + "step": 29070 + }, + { + "epoch": 0.75, + "learning_rate": 1.7601651083363805e-06, + "loss": 0.8926, + "step": 29071 + }, + { + "epoch": 0.75, + "learning_rate": 1.7601471297227413e-06, + "loss": 0.5347, + "step": 29072 + }, + { + "epoch": 0.75, + "learning_rate": 1.7601291505270925e-06, + "loss": 0.7402, + "step": 29073 + }, + { + "epoch": 0.75, + "learning_rate": 1.7601111707494477e-06, + "loss": 0.7852, + "step": 29074 + }, + { + "epoch": 0.75, + "learning_rate": 1.760093190389821e-06, + "loss": 0.7744, + "step": 29075 + }, + { + "epoch": 0.75, + "learning_rate": 1.7600752094482255e-06, + "loss": 0.6675, + "step": 29076 + }, + { + "epoch": 0.75, + "learning_rate": 1.7600572279246756e-06, + "loss": 0.8599, + "step": 29077 + }, + { + "epoch": 0.75, + "learning_rate": 1.7600392458191849e-06, + "loss": 0.7728, + "step": 29078 + }, + { + "epoch": 0.75, + "learning_rate": 1.760021263131767e-06, + "loss": 0.8916, + "step": 29079 + }, + { + "epoch": 0.75, + "learning_rate": 1.7600032798624358e-06, + "loss": 0.8867, + "step": 29080 + }, + { + "epoch": 0.75, + "learning_rate": 1.7599852960112049e-06, + "loss": 0.8906, + "step": 29081 + }, + { + "epoch": 0.75, + "learning_rate": 1.7599673115780883e-06, + "loss": 0.8633, + "step": 29082 + }, + { + "epoch": 0.75, + "learning_rate": 1.7599493265630997e-06, + "loss": 0.7314, + "step": 29083 + }, + { + "epoch": 0.75, + "learning_rate": 1.7599313409662529e-06, + "loss": 0.9375, + "step": 29084 + }, + { + "epoch": 0.75, + "learning_rate": 1.7599133547875615e-06, + "loss": 0.7451, + "step": 29085 + }, + { + "epoch": 0.75, + "learning_rate": 1.7598953680270394e-06, + "loss": 1.043, + "step": 29086 + }, + { + "epoch": 0.75, + "learning_rate": 1.7598773806847005e-06, + "loss": 0.9629, + "step": 29087 + }, + { + "epoch": 0.75, + "learning_rate": 1.7598593927605582e-06, + "loss": 0.5767, + "step": 29088 + }, + { + "epoch": 0.75, + "learning_rate": 1.7598414042546265e-06, + "loss": 0.7192, + "step": 29089 + }, + { + "epoch": 0.75, + "learning_rate": 1.7598234151669193e-06, + "loss": 0.8457, + "step": 29090 + }, + { + "epoch": 0.75, + "learning_rate": 1.7598054254974501e-06, + "loss": 0.8135, + "step": 29091 + }, + { + "epoch": 0.75, + "learning_rate": 1.7597874352462332e-06, + "loss": 0.8828, + "step": 29092 + }, + { + "epoch": 0.75, + "learning_rate": 1.7597694444132815e-06, + "loss": 1.0449, + "step": 29093 + }, + { + "epoch": 0.75, + "learning_rate": 1.7597514529986096e-06, + "loss": 0.749, + "step": 29094 + }, + { + "epoch": 0.75, + "learning_rate": 1.7597334610022309e-06, + "loss": 0.624, + "step": 29095 + }, + { + "epoch": 0.75, + "learning_rate": 1.7597154684241592e-06, + "loss": 0.6152, + "step": 29096 + }, + { + "epoch": 0.75, + "learning_rate": 1.7596974752644082e-06, + "loss": 0.7871, + "step": 29097 + }, + { + "epoch": 0.75, + "learning_rate": 1.7596794815229919e-06, + "loss": 0.9248, + "step": 29098 + }, + { + "epoch": 0.75, + "learning_rate": 1.7596614871999237e-06, + "loss": 0.8799, + "step": 29099 + }, + { + "epoch": 0.75, + "learning_rate": 1.7596434922952182e-06, + "loss": 0.8403, + "step": 29100 + }, + { + "epoch": 0.75, + "learning_rate": 1.759625496808888e-06, + "loss": 1.04, + "step": 29101 + }, + { + "epoch": 0.75, + "learning_rate": 1.759607500740948e-06, + "loss": 0.8457, + "step": 29102 + }, + { + "epoch": 0.75, + "learning_rate": 1.7595895040914113e-06, + "loss": 0.9229, + "step": 29103 + }, + { + "epoch": 0.75, + "learning_rate": 1.7595715068602916e-06, + "loss": 0.8125, + "step": 29104 + }, + { + "epoch": 0.75, + "learning_rate": 1.7595535090476031e-06, + "loss": 0.8115, + "step": 29105 + }, + { + "epoch": 0.75, + "learning_rate": 1.7595355106533592e-06, + "loss": 1.0215, + "step": 29106 + }, + { + "epoch": 0.75, + "learning_rate": 1.7595175116775742e-06, + "loss": 0.9268, + "step": 29107 + }, + { + "epoch": 0.75, + "learning_rate": 1.7594995121202613e-06, + "loss": 1.0742, + "step": 29108 + }, + { + "epoch": 0.75, + "learning_rate": 1.7594815119814346e-06, + "loss": 1.0049, + "step": 29109 + }, + { + "epoch": 0.75, + "learning_rate": 1.759463511261108e-06, + "loss": 0.6343, + "step": 29110 + }, + { + "epoch": 0.75, + "learning_rate": 1.7594455099592952e-06, + "loss": 0.8242, + "step": 29111 + }, + { + "epoch": 0.75, + "learning_rate": 1.7594275080760097e-06, + "loss": 0.7976, + "step": 29112 + }, + { + "epoch": 0.75, + "learning_rate": 1.7594095056112655e-06, + "loss": 0.8623, + "step": 29113 + }, + { + "epoch": 0.75, + "learning_rate": 1.7593915025650761e-06, + "loss": 0.7393, + "step": 29114 + }, + { + "epoch": 0.75, + "learning_rate": 1.7593734989374559e-06, + "loss": 0.8096, + "step": 29115 + }, + { + "epoch": 0.75, + "learning_rate": 1.7593554947284182e-06, + "loss": 0.5864, + "step": 29116 + }, + { + "epoch": 0.75, + "learning_rate": 1.7593374899379767e-06, + "loss": 0.6895, + "step": 29117 + }, + { + "epoch": 0.75, + "learning_rate": 1.7593194845661458e-06, + "loss": 1.0146, + "step": 29118 + }, + { + "epoch": 0.75, + "learning_rate": 1.7593014786129388e-06, + "loss": 1.0586, + "step": 29119 + }, + { + "epoch": 0.75, + "learning_rate": 1.7592834720783694e-06, + "loss": 0.8369, + "step": 29120 + }, + { + "epoch": 0.75, + "learning_rate": 1.7592654649624517e-06, + "loss": 1.1377, + "step": 29121 + }, + { + "epoch": 0.75, + "learning_rate": 1.7592474572651992e-06, + "loss": 0.8574, + "step": 29122 + }, + { + "epoch": 0.75, + "learning_rate": 1.759229448986626e-06, + "loss": 0.9082, + "step": 29123 + }, + { + "epoch": 0.75, + "learning_rate": 1.7592114401267454e-06, + "loss": 1.0522, + "step": 29124 + }, + { + "epoch": 0.75, + "learning_rate": 1.7591934306855719e-06, + "loss": 0.7241, + "step": 29125 + }, + { + "epoch": 0.75, + "learning_rate": 1.7591754206631186e-06, + "loss": 0.6106, + "step": 29126 + }, + { + "epoch": 0.75, + "learning_rate": 1.7591574100593998e-06, + "loss": 0.6812, + "step": 29127 + }, + { + "epoch": 0.75, + "learning_rate": 1.759139398874429e-06, + "loss": 0.8848, + "step": 29128 + }, + { + "epoch": 0.75, + "learning_rate": 1.75912138710822e-06, + "loss": 0.876, + "step": 29129 + }, + { + "epoch": 0.75, + "learning_rate": 1.7591033747607868e-06, + "loss": 0.7852, + "step": 29130 + }, + { + "epoch": 0.75, + "learning_rate": 1.7590853618321431e-06, + "loss": 0.9756, + "step": 29131 + }, + { + "epoch": 0.75, + "learning_rate": 1.7590673483223023e-06, + "loss": 0.8701, + "step": 29132 + }, + { + "epoch": 0.75, + "learning_rate": 1.7590493342312788e-06, + "loss": 0.6606, + "step": 29133 + }, + { + "epoch": 0.75, + "learning_rate": 1.759031319559086e-06, + "loss": 0.7891, + "step": 29134 + }, + { + "epoch": 0.75, + "learning_rate": 1.7590133043057382e-06, + "loss": 0.8857, + "step": 29135 + }, + { + "epoch": 0.75, + "learning_rate": 1.7589952884712485e-06, + "loss": 0.8506, + "step": 29136 + }, + { + "epoch": 0.75, + "learning_rate": 1.7589772720556312e-06, + "loss": 0.835, + "step": 29137 + }, + { + "epoch": 0.75, + "learning_rate": 1.7589592550588996e-06, + "loss": 0.9941, + "step": 29138 + }, + { + "epoch": 0.75, + "learning_rate": 1.7589412374810677e-06, + "loss": 1.0068, + "step": 29139 + }, + { + "epoch": 0.75, + "learning_rate": 1.7589232193221498e-06, + "loss": 0.7666, + "step": 29140 + }, + { + "epoch": 0.75, + "learning_rate": 1.7589052005821592e-06, + "loss": 0.7715, + "step": 29141 + }, + { + "epoch": 0.75, + "learning_rate": 1.7588871812611095e-06, + "loss": 1.0645, + "step": 29142 + }, + { + "epoch": 0.75, + "learning_rate": 1.758869161359015e-06, + "loss": 0.9414, + "step": 29143 + }, + { + "epoch": 0.75, + "learning_rate": 1.758851140875889e-06, + "loss": 0.7241, + "step": 29144 + }, + { + "epoch": 0.75, + "learning_rate": 1.7588331198117462e-06, + "loss": 0.7964, + "step": 29145 + }, + { + "epoch": 0.75, + "learning_rate": 1.7588150981665992e-06, + "loss": 0.7803, + "step": 29146 + }, + { + "epoch": 0.75, + "learning_rate": 1.7587970759404627e-06, + "loss": 0.834, + "step": 29147 + }, + { + "epoch": 0.75, + "learning_rate": 1.75877905313335e-06, + "loss": 0.5481, + "step": 29148 + }, + { + "epoch": 0.75, + "learning_rate": 1.7587610297452748e-06, + "loss": 0.9141, + "step": 29149 + }, + { + "epoch": 0.75, + "learning_rate": 1.7587430057762517e-06, + "loss": 0.7401, + "step": 29150 + }, + { + "epoch": 0.75, + "learning_rate": 1.7587249812262938e-06, + "loss": 0.7393, + "step": 29151 + }, + { + "epoch": 0.75, + "learning_rate": 1.758706956095415e-06, + "loss": 0.7266, + "step": 29152 + }, + { + "epoch": 0.75, + "learning_rate": 1.758688930383629e-06, + "loss": 0.8599, + "step": 29153 + }, + { + "epoch": 0.75, + "learning_rate": 1.75867090409095e-06, + "loss": 0.832, + "step": 29154 + }, + { + "epoch": 0.75, + "learning_rate": 1.7586528772173917e-06, + "loss": 0.8955, + "step": 29155 + }, + { + "epoch": 0.75, + "learning_rate": 1.7586348497629676e-06, + "loss": 0.9717, + "step": 29156 + }, + { + "epoch": 0.75, + "learning_rate": 1.7586168217276916e-06, + "loss": 0.8164, + "step": 29157 + }, + { + "epoch": 0.75, + "learning_rate": 1.7585987931115777e-06, + "loss": 0.793, + "step": 29158 + }, + { + "epoch": 0.75, + "learning_rate": 1.7585807639146395e-06, + "loss": 0.9199, + "step": 29159 + }, + { + "epoch": 0.75, + "learning_rate": 1.758562734136891e-06, + "loss": 1.0996, + "step": 29160 + }, + { + "epoch": 0.75, + "learning_rate": 1.7585447037783458e-06, + "loss": 0.7407, + "step": 29161 + }, + { + "epoch": 0.75, + "learning_rate": 1.7585266728390179e-06, + "loss": 0.8291, + "step": 29162 + }, + { + "epoch": 0.75, + "learning_rate": 1.7585086413189207e-06, + "loss": 0.9473, + "step": 29163 + }, + { + "epoch": 0.75, + "learning_rate": 1.7584906092180685e-06, + "loss": 0.7959, + "step": 29164 + }, + { + "epoch": 0.75, + "learning_rate": 1.7584725765364751e-06, + "loss": 0.7188, + "step": 29165 + }, + { + "epoch": 0.75, + "learning_rate": 1.758454543274154e-06, + "loss": 0.7344, + "step": 29166 + }, + { + "epoch": 0.75, + "learning_rate": 1.7584365094311192e-06, + "loss": 0.8555, + "step": 29167 + }, + { + "epoch": 0.75, + "learning_rate": 1.7584184750073842e-06, + "loss": 0.7559, + "step": 29168 + }, + { + "epoch": 0.75, + "learning_rate": 1.7584004400029632e-06, + "loss": 0.749, + "step": 29169 + }, + { + "epoch": 0.75, + "learning_rate": 1.7583824044178698e-06, + "loss": 0.9541, + "step": 29170 + }, + { + "epoch": 0.75, + "learning_rate": 1.758364368252118e-06, + "loss": 0.7866, + "step": 29171 + }, + { + "epoch": 0.75, + "learning_rate": 1.7583463315057214e-06, + "loss": 0.834, + "step": 29172 + }, + { + "epoch": 0.75, + "learning_rate": 1.7583282941786938e-06, + "loss": 0.7803, + "step": 29173 + }, + { + "epoch": 0.75, + "learning_rate": 1.7583102562710492e-06, + "loss": 0.7549, + "step": 29174 + }, + { + "epoch": 0.75, + "learning_rate": 1.7582922177828014e-06, + "loss": 0.771, + "step": 29175 + }, + { + "epoch": 0.75, + "learning_rate": 1.758274178713964e-06, + "loss": 1.0029, + "step": 29176 + }, + { + "epoch": 0.75, + "learning_rate": 1.7582561390645507e-06, + "loss": 0.8105, + "step": 29177 + }, + { + "epoch": 0.75, + "learning_rate": 1.758238098834576e-06, + "loss": 0.7988, + "step": 29178 + }, + { + "epoch": 0.75, + "learning_rate": 1.7582200580240529e-06, + "loss": 0.8135, + "step": 29179 + }, + { + "epoch": 0.75, + "learning_rate": 1.7582020166329956e-06, + "loss": 0.8154, + "step": 29180 + }, + { + "epoch": 0.75, + "learning_rate": 1.758183974661418e-06, + "loss": 0.7646, + "step": 29181 + }, + { + "epoch": 0.75, + "learning_rate": 1.7581659321093338e-06, + "loss": 0.9268, + "step": 29182 + }, + { + "epoch": 0.75, + "learning_rate": 1.7581478889767567e-06, + "loss": 0.6875, + "step": 29183 + }, + { + "epoch": 0.75, + "learning_rate": 1.7581298452637005e-06, + "loss": 0.8169, + "step": 29184 + }, + { + "epoch": 0.75, + "learning_rate": 1.7581118009701794e-06, + "loss": 1.1191, + "step": 29185 + }, + { + "epoch": 0.75, + "learning_rate": 1.758093756096207e-06, + "loss": 0.9551, + "step": 29186 + }, + { + "epoch": 0.75, + "learning_rate": 1.7580757106417968e-06, + "loss": 0.7451, + "step": 29187 + }, + { + "epoch": 0.75, + "learning_rate": 1.7580576646069632e-06, + "loss": 0.9619, + "step": 29188 + }, + { + "epoch": 0.75, + "learning_rate": 1.7580396179917195e-06, + "loss": 0.8945, + "step": 29189 + }, + { + "epoch": 0.75, + "learning_rate": 1.7580215707960795e-06, + "loss": 0.793, + "step": 29190 + }, + { + "epoch": 0.75, + "learning_rate": 1.7580035230200576e-06, + "loss": 0.8936, + "step": 29191 + }, + { + "epoch": 0.75, + "learning_rate": 1.757985474663667e-06, + "loss": 0.917, + "step": 29192 + }, + { + "epoch": 0.75, + "learning_rate": 1.7579674257269218e-06, + "loss": 0.9131, + "step": 29193 + }, + { + "epoch": 0.75, + "learning_rate": 1.757949376209836e-06, + "loss": 0.873, + "step": 29194 + }, + { + "epoch": 0.75, + "learning_rate": 1.7579313261124234e-06, + "loss": 1.0, + "step": 29195 + }, + { + "epoch": 0.75, + "learning_rate": 1.7579132754346972e-06, + "loss": 0.7949, + "step": 29196 + }, + { + "epoch": 0.75, + "learning_rate": 1.7578952241766718e-06, + "loss": 0.9951, + "step": 29197 + }, + { + "epoch": 0.75, + "learning_rate": 1.757877172338361e-06, + "loss": 0.8633, + "step": 29198 + }, + { + "epoch": 0.75, + "learning_rate": 1.7578591199197782e-06, + "loss": 0.9844, + "step": 29199 + }, + { + "epoch": 0.75, + "learning_rate": 1.757841066920938e-06, + "loss": 0.7407, + "step": 29200 + }, + { + "epoch": 0.75, + "learning_rate": 1.7578230133418533e-06, + "loss": 0.7402, + "step": 29201 + }, + { + "epoch": 0.75, + "learning_rate": 1.7578049591825386e-06, + "loss": 0.96, + "step": 29202 + }, + { + "epoch": 0.75, + "learning_rate": 1.7577869044430074e-06, + "loss": 0.9541, + "step": 29203 + }, + { + "epoch": 0.75, + "learning_rate": 1.7577688491232737e-06, + "loss": 0.9297, + "step": 29204 + }, + { + "epoch": 0.75, + "learning_rate": 1.757750793223351e-06, + "loss": 0.8105, + "step": 29205 + }, + { + "epoch": 0.75, + "learning_rate": 1.7577327367432535e-06, + "loss": 0.873, + "step": 29206 + }, + { + "epoch": 0.75, + "learning_rate": 1.7577146796829948e-06, + "loss": 0.9424, + "step": 29207 + }, + { + "epoch": 0.75, + "learning_rate": 1.7576966220425888e-06, + "loss": 0.8271, + "step": 29208 + }, + { + "epoch": 0.75, + "learning_rate": 1.7576785638220497e-06, + "loss": 0.998, + "step": 29209 + }, + { + "epoch": 0.75, + "learning_rate": 1.7576605050213905e-06, + "loss": 0.9941, + "step": 29210 + }, + { + "epoch": 0.75, + "learning_rate": 1.7576424456406259e-06, + "loss": 1.1641, + "step": 29211 + }, + { + "epoch": 0.75, + "learning_rate": 1.7576243856797689e-06, + "loss": 0.8906, + "step": 29212 + }, + { + "epoch": 0.75, + "learning_rate": 1.757606325138834e-06, + "loss": 0.9492, + "step": 29213 + }, + { + "epoch": 0.75, + "learning_rate": 1.7575882640178348e-06, + "loss": 0.6353, + "step": 29214 + }, + { + "epoch": 0.75, + "learning_rate": 1.7575702023167848e-06, + "loss": 0.5163, + "step": 29215 + }, + { + "epoch": 0.75, + "learning_rate": 1.7575521400356986e-06, + "loss": 0.7764, + "step": 29216 + }, + { + "epoch": 0.75, + "learning_rate": 1.7575340771745893e-06, + "loss": 0.9102, + "step": 29217 + }, + { + "epoch": 0.75, + "learning_rate": 1.757516013733471e-06, + "loss": 0.79, + "step": 29218 + }, + { + "epoch": 0.75, + "learning_rate": 1.7574979497123574e-06, + "loss": 1.001, + "step": 29219 + }, + { + "epoch": 0.75, + "learning_rate": 1.7574798851112625e-06, + "loss": 0.7822, + "step": 29220 + }, + { + "epoch": 0.75, + "learning_rate": 1.7574618199302004e-06, + "loss": 0.7891, + "step": 29221 + }, + { + "epoch": 0.75, + "learning_rate": 1.7574437541691842e-06, + "loss": 1.0166, + "step": 29222 + }, + { + "epoch": 0.75, + "learning_rate": 1.7574256878282284e-06, + "loss": 0.7227, + "step": 29223 + }, + { + "epoch": 0.75, + "learning_rate": 1.7574076209073466e-06, + "loss": 0.6729, + "step": 29224 + }, + { + "epoch": 0.75, + "learning_rate": 1.7573895534065523e-06, + "loss": 0.8105, + "step": 29225 + }, + { + "epoch": 0.75, + "learning_rate": 1.7573714853258598e-06, + "loss": 0.7021, + "step": 29226 + }, + { + "epoch": 0.75, + "learning_rate": 1.7573534166652829e-06, + "loss": 0.8154, + "step": 29227 + }, + { + "epoch": 0.75, + "learning_rate": 1.7573353474248354e-06, + "loss": 0.9531, + "step": 29228 + }, + { + "epoch": 0.75, + "learning_rate": 1.7573172776045306e-06, + "loss": 0.9756, + "step": 29229 + }, + { + "epoch": 0.75, + "learning_rate": 1.757299207204383e-06, + "loss": 0.7393, + "step": 29230 + }, + { + "epoch": 0.75, + "learning_rate": 1.7572811362244064e-06, + "loss": 0.9814, + "step": 29231 + }, + { + "epoch": 0.75, + "learning_rate": 1.7572630646646144e-06, + "loss": 0.7002, + "step": 29232 + }, + { + "epoch": 0.75, + "learning_rate": 1.7572449925250207e-06, + "loss": 0.9224, + "step": 29233 + }, + { + "epoch": 0.75, + "learning_rate": 1.7572269198056395e-06, + "loss": 1.0605, + "step": 29234 + }, + { + "epoch": 0.75, + "learning_rate": 1.7572088465064844e-06, + "loss": 0.9443, + "step": 29235 + }, + { + "epoch": 0.75, + "learning_rate": 1.7571907726275693e-06, + "loss": 0.7275, + "step": 29236 + }, + { + "epoch": 0.75, + "learning_rate": 1.757172698168908e-06, + "loss": 1.043, + "step": 29237 + }, + { + "epoch": 0.75, + "learning_rate": 1.7571546231305146e-06, + "loss": 1.0615, + "step": 29238 + }, + { + "epoch": 0.75, + "learning_rate": 1.7571365475124024e-06, + "loss": 0.7061, + "step": 29239 + }, + { + "epoch": 0.75, + "learning_rate": 1.757118471314586e-06, + "loss": 0.9043, + "step": 29240 + }, + { + "epoch": 0.75, + "learning_rate": 1.7571003945370784e-06, + "loss": 0.79, + "step": 29241 + }, + { + "epoch": 0.75, + "learning_rate": 1.7570823171798941e-06, + "loss": 0.9521, + "step": 29242 + }, + { + "epoch": 0.75, + "learning_rate": 1.7570642392430464e-06, + "loss": 0.8242, + "step": 29243 + }, + { + "epoch": 0.75, + "learning_rate": 1.7570461607265497e-06, + "loss": 0.8428, + "step": 29244 + }, + { + "epoch": 0.75, + "learning_rate": 1.7570280816304176e-06, + "loss": 0.8057, + "step": 29245 + }, + { + "epoch": 0.75, + "learning_rate": 1.7570100019546636e-06, + "loss": 0.7437, + "step": 29246 + }, + { + "epoch": 0.75, + "learning_rate": 1.7569919216993018e-06, + "loss": 0.9785, + "step": 29247 + }, + { + "epoch": 0.75, + "learning_rate": 1.7569738408643463e-06, + "loss": 0.9473, + "step": 29248 + }, + { + "epoch": 0.75, + "learning_rate": 1.756955759449811e-06, + "loss": 0.9258, + "step": 29249 + }, + { + "epoch": 0.75, + "learning_rate": 1.756937677455709e-06, + "loss": 0.8325, + "step": 29250 + }, + { + "epoch": 0.75, + "learning_rate": 1.756919594882055e-06, + "loss": 0.9531, + "step": 29251 + }, + { + "epoch": 0.75, + "learning_rate": 1.756901511728862e-06, + "loss": 0.6982, + "step": 29252 + }, + { + "epoch": 0.75, + "learning_rate": 1.7568834279961448e-06, + "loss": 0.7842, + "step": 29253 + }, + { + "epoch": 0.75, + "learning_rate": 1.7568653436839167e-06, + "loss": 0.8945, + "step": 29254 + }, + { + "epoch": 0.75, + "learning_rate": 1.7568472587921911e-06, + "loss": 0.9531, + "step": 29255 + }, + { + "epoch": 0.75, + "learning_rate": 1.756829173320983e-06, + "loss": 0.7832, + "step": 29256 + }, + { + "epoch": 0.75, + "learning_rate": 1.7568110872703055e-06, + "loss": 0.7363, + "step": 29257 + }, + { + "epoch": 0.75, + "learning_rate": 1.7567930006401723e-06, + "loss": 0.7891, + "step": 29258 + }, + { + "epoch": 0.75, + "learning_rate": 1.7567749134305977e-06, + "loss": 0.6631, + "step": 29259 + }, + { + "epoch": 0.75, + "learning_rate": 1.7567568256415953e-06, + "loss": 0.9561, + "step": 29260 + }, + { + "epoch": 0.75, + "learning_rate": 1.7567387372731788e-06, + "loss": 0.6631, + "step": 29261 + }, + { + "epoch": 0.75, + "learning_rate": 1.7567206483253623e-06, + "loss": 0.9473, + "step": 29262 + }, + { + "epoch": 0.75, + "learning_rate": 1.7567025587981596e-06, + "loss": 0.9482, + "step": 29263 + }, + { + "epoch": 0.75, + "learning_rate": 1.7566844686915847e-06, + "loss": 0.8569, + "step": 29264 + }, + { + "epoch": 0.75, + "learning_rate": 1.7566663780056513e-06, + "loss": 0.9736, + "step": 29265 + }, + { + "epoch": 0.75, + "learning_rate": 1.756648286740373e-06, + "loss": 0.8721, + "step": 29266 + }, + { + "epoch": 0.75, + "learning_rate": 1.7566301948957643e-06, + "loss": 0.7852, + "step": 29267 + }, + { + "epoch": 0.75, + "learning_rate": 1.7566121024718381e-06, + "loss": 0.7271, + "step": 29268 + }, + { + "epoch": 0.75, + "learning_rate": 1.7565940094686091e-06, + "loss": 0.8105, + "step": 29269 + }, + { + "epoch": 0.75, + "learning_rate": 1.7565759158860911e-06, + "loss": 0.8633, + "step": 29270 + }, + { + "epoch": 0.75, + "learning_rate": 1.7565578217242973e-06, + "loss": 0.8267, + "step": 29271 + }, + { + "epoch": 0.75, + "learning_rate": 1.7565397269832423e-06, + "loss": 0.8193, + "step": 29272 + }, + { + "epoch": 0.75, + "learning_rate": 1.7565216316629395e-06, + "loss": 0.8867, + "step": 29273 + }, + { + "epoch": 0.75, + "learning_rate": 1.7565035357634029e-06, + "loss": 0.9229, + "step": 29274 + }, + { + "epoch": 0.75, + "learning_rate": 1.756485439284646e-06, + "loss": 0.9668, + "step": 29275 + }, + { + "epoch": 0.75, + "learning_rate": 1.7564673422266833e-06, + "loss": 0.7998, + "step": 29276 + }, + { + "epoch": 0.75, + "learning_rate": 1.7564492445895283e-06, + "loss": 0.7866, + "step": 29277 + }, + { + "epoch": 0.75, + "learning_rate": 1.7564311463731948e-06, + "loss": 0.959, + "step": 29278 + }, + { + "epoch": 0.75, + "learning_rate": 1.756413047577697e-06, + "loss": 0.999, + "step": 29279 + }, + { + "epoch": 0.75, + "learning_rate": 1.7563949482030483e-06, + "loss": 0.8594, + "step": 29280 + }, + { + "epoch": 0.75, + "learning_rate": 1.7563768482492626e-06, + "loss": 0.7036, + "step": 29281 + }, + { + "epoch": 0.75, + "learning_rate": 1.7563587477163542e-06, + "loss": 0.6567, + "step": 29282 + }, + { + "epoch": 0.75, + "learning_rate": 1.7563406466043367e-06, + "loss": 0.6025, + "step": 29283 + }, + { + "epoch": 0.75, + "learning_rate": 1.7563225449132238e-06, + "loss": 0.8086, + "step": 29284 + }, + { + "epoch": 0.75, + "learning_rate": 1.7563044426430296e-06, + "loss": 0.9141, + "step": 29285 + }, + { + "epoch": 0.75, + "learning_rate": 1.756286339793768e-06, + "loss": 0.9805, + "step": 29286 + }, + { + "epoch": 0.75, + "learning_rate": 1.7562682363654524e-06, + "loss": 0.9287, + "step": 29287 + }, + { + "epoch": 0.75, + "learning_rate": 1.7562501323580971e-06, + "loss": 0.9355, + "step": 29288 + }, + { + "epoch": 0.75, + "learning_rate": 1.7562320277717159e-06, + "loss": 1.0068, + "step": 29289 + }, + { + "epoch": 0.75, + "learning_rate": 1.7562139226063226e-06, + "loss": 0.7764, + "step": 29290 + }, + { + "epoch": 0.75, + "learning_rate": 1.756195816861931e-06, + "loss": 0.8174, + "step": 29291 + }, + { + "epoch": 0.75, + "learning_rate": 1.756177710538555e-06, + "loss": 0.6621, + "step": 29292 + }, + { + "epoch": 0.75, + "learning_rate": 1.7561596036362087e-06, + "loss": 0.8389, + "step": 29293 + }, + { + "epoch": 0.75, + "learning_rate": 1.756141496154906e-06, + "loss": 0.7896, + "step": 29294 + }, + { + "epoch": 0.75, + "learning_rate": 1.7561233880946599e-06, + "loss": 0.7705, + "step": 29295 + }, + { + "epoch": 0.75, + "learning_rate": 1.7561052794554852e-06, + "loss": 0.8027, + "step": 29296 + }, + { + "epoch": 0.75, + "learning_rate": 1.7560871702373954e-06, + "loss": 0.8867, + "step": 29297 + }, + { + "epoch": 0.75, + "learning_rate": 1.7560690604404044e-06, + "loss": 0.8789, + "step": 29298 + }, + { + "epoch": 0.75, + "learning_rate": 1.7560509500645263e-06, + "loss": 0.8442, + "step": 29299 + }, + { + "epoch": 0.75, + "learning_rate": 1.7560328391097744e-06, + "loss": 0.9785, + "step": 29300 + }, + { + "epoch": 0.75, + "learning_rate": 1.7560147275761632e-06, + "loss": 0.6812, + "step": 29301 + }, + { + "epoch": 0.75, + "learning_rate": 1.7559966154637062e-06, + "loss": 0.7842, + "step": 29302 + }, + { + "epoch": 0.75, + "learning_rate": 1.7559785027724171e-06, + "loss": 0.791, + "step": 29303 + }, + { + "epoch": 0.75, + "learning_rate": 1.7559603895023104e-06, + "loss": 0.8164, + "step": 29304 + }, + { + "epoch": 0.75, + "learning_rate": 1.7559422756533997e-06, + "loss": 1.0254, + "step": 29305 + }, + { + "epoch": 0.75, + "learning_rate": 1.7559241612256984e-06, + "loss": 0.9922, + "step": 29306 + }, + { + "epoch": 0.75, + "learning_rate": 1.7559060462192207e-06, + "loss": 0.6636, + "step": 29307 + }, + { + "epoch": 0.75, + "learning_rate": 1.755887930633981e-06, + "loss": 0.7988, + "step": 29308 + }, + { + "epoch": 0.75, + "learning_rate": 1.7558698144699919e-06, + "loss": 0.7832, + "step": 29309 + }, + { + "epoch": 0.75, + "learning_rate": 1.7558516977272686e-06, + "loss": 0.7783, + "step": 29310 + }, + { + "epoch": 0.75, + "learning_rate": 1.7558335804058241e-06, + "loss": 0.6406, + "step": 29311 + }, + { + "epoch": 0.75, + "learning_rate": 1.755815462505673e-06, + "loss": 0.916, + "step": 29312 + }, + { + "epoch": 0.75, + "learning_rate": 1.7557973440268284e-06, + "loss": 0.958, + "step": 29313 + }, + { + "epoch": 0.75, + "learning_rate": 1.7557792249693047e-06, + "loss": 0.8291, + "step": 29314 + }, + { + "epoch": 0.75, + "learning_rate": 1.7557611053331154e-06, + "loss": 0.9023, + "step": 29315 + }, + { + "epoch": 0.75, + "learning_rate": 1.7557429851182748e-06, + "loss": 0.9961, + "step": 29316 + }, + { + "epoch": 0.75, + "learning_rate": 1.7557248643247964e-06, + "loss": 0.9648, + "step": 29317 + }, + { + "epoch": 0.75, + "learning_rate": 1.7557067429526942e-06, + "loss": 0.8691, + "step": 29318 + }, + { + "epoch": 0.75, + "learning_rate": 1.7556886210019822e-06, + "loss": 0.7041, + "step": 29319 + }, + { + "epoch": 0.75, + "learning_rate": 1.755670498472674e-06, + "loss": 1.0322, + "step": 29320 + }, + { + "epoch": 0.75, + "learning_rate": 1.7556523753647838e-06, + "loss": 0.7217, + "step": 29321 + }, + { + "epoch": 0.75, + "learning_rate": 1.7556342516783254e-06, + "loss": 0.9082, + "step": 29322 + }, + { + "epoch": 0.75, + "learning_rate": 1.7556161274133124e-06, + "loss": 0.4453, + "step": 29323 + }, + { + "epoch": 0.75, + "learning_rate": 1.755598002569759e-06, + "loss": 0.5957, + "step": 29324 + }, + { + "epoch": 0.75, + "learning_rate": 1.7555798771476788e-06, + "loss": 0.7715, + "step": 29325 + }, + { + "epoch": 0.75, + "learning_rate": 1.755561751147086e-06, + "loss": 0.8984, + "step": 29326 + }, + { + "epoch": 0.75, + "learning_rate": 1.7555436245679943e-06, + "loss": 0.811, + "step": 29327 + }, + { + "epoch": 0.75, + "learning_rate": 1.7555254974104173e-06, + "loss": 0.6172, + "step": 29328 + }, + { + "epoch": 0.75, + "learning_rate": 1.7555073696743696e-06, + "loss": 0.8291, + "step": 29329 + }, + { + "epoch": 0.75, + "learning_rate": 1.7554892413598643e-06, + "loss": 0.9629, + "step": 29330 + }, + { + "epoch": 0.75, + "learning_rate": 1.755471112466916e-06, + "loss": 0.9648, + "step": 29331 + }, + { + "epoch": 0.75, + "learning_rate": 1.7554529829955378e-06, + "loss": 0.833, + "step": 29332 + }, + { + "epoch": 0.75, + "learning_rate": 1.7554348529457444e-06, + "loss": 0.6108, + "step": 29333 + }, + { + "epoch": 0.75, + "learning_rate": 1.755416722317549e-06, + "loss": 0.7832, + "step": 29334 + }, + { + "epoch": 0.75, + "learning_rate": 1.7553985911109658e-06, + "loss": 0.9634, + "step": 29335 + }, + { + "epoch": 0.75, + "learning_rate": 1.7553804593260087e-06, + "loss": 0.9707, + "step": 29336 + }, + { + "epoch": 0.75, + "learning_rate": 1.7553623269626914e-06, + "loss": 0.8564, + "step": 29337 + }, + { + "epoch": 0.75, + "learning_rate": 1.7553441940210278e-06, + "loss": 1.1221, + "step": 29338 + }, + { + "epoch": 0.75, + "learning_rate": 1.7553260605010323e-06, + "loss": 0.9502, + "step": 29339 + }, + { + "epoch": 0.75, + "learning_rate": 1.7553079264027177e-06, + "loss": 0.8457, + "step": 29340 + }, + { + "epoch": 0.75, + "learning_rate": 1.7552897917260992e-06, + "loss": 0.9775, + "step": 29341 + }, + { + "epoch": 0.75, + "learning_rate": 1.7552716564711899e-06, + "loss": 0.8379, + "step": 29342 + }, + { + "epoch": 0.75, + "learning_rate": 1.7552535206380035e-06, + "loss": 0.9189, + "step": 29343 + }, + { + "epoch": 0.75, + "learning_rate": 1.7552353842265544e-06, + "loss": 0.9004, + "step": 29344 + }, + { + "epoch": 0.75, + "learning_rate": 1.7552172472368562e-06, + "loss": 0.8789, + "step": 29345 + }, + { + "epoch": 0.75, + "learning_rate": 1.7551991096689229e-06, + "loss": 0.6431, + "step": 29346 + }, + { + "epoch": 0.75, + "learning_rate": 1.7551809715227685e-06, + "loss": 0.7124, + "step": 29347 + }, + { + "epoch": 0.75, + "learning_rate": 1.7551628327984067e-06, + "loss": 0.667, + "step": 29348 + }, + { + "epoch": 0.75, + "learning_rate": 1.7551446934958516e-06, + "loss": 0.9844, + "step": 29349 + }, + { + "epoch": 0.75, + "learning_rate": 1.7551265536151166e-06, + "loss": 0.8096, + "step": 29350 + }, + { + "epoch": 0.75, + "learning_rate": 1.7551084131562162e-06, + "loss": 0.8408, + "step": 29351 + }, + { + "epoch": 0.75, + "learning_rate": 1.755090272119164e-06, + "loss": 0.9844, + "step": 29352 + }, + { + "epoch": 0.75, + "learning_rate": 1.7550721305039734e-06, + "loss": 1.0488, + "step": 29353 + }, + { + "epoch": 0.75, + "learning_rate": 1.7550539883106596e-06, + "loss": 0.8457, + "step": 29354 + }, + { + "epoch": 0.75, + "learning_rate": 1.7550358455392352e-06, + "loss": 0.9697, + "step": 29355 + }, + { + "epoch": 0.75, + "learning_rate": 1.7550177021897146e-06, + "loss": 0.8506, + "step": 29356 + }, + { + "epoch": 0.75, + "learning_rate": 1.7549995582621118e-06, + "loss": 0.71, + "step": 29357 + }, + { + "epoch": 0.75, + "learning_rate": 1.7549814137564402e-06, + "loss": 0.8711, + "step": 29358 + }, + { + "epoch": 0.75, + "learning_rate": 1.7549632686727145e-06, + "loss": 0.7583, + "step": 29359 + }, + { + "epoch": 0.75, + "learning_rate": 1.7549451230109477e-06, + "loss": 0.6836, + "step": 29360 + }, + { + "epoch": 0.75, + "learning_rate": 1.7549269767711548e-06, + "loss": 0.9102, + "step": 29361 + }, + { + "epoch": 0.75, + "learning_rate": 1.7549088299533484e-06, + "loss": 0.917, + "step": 29362 + }, + { + "epoch": 0.75, + "learning_rate": 1.7548906825575431e-06, + "loss": 0.8975, + "step": 29363 + }, + { + "epoch": 0.75, + "learning_rate": 1.754872534583753e-06, + "loss": 0.7061, + "step": 29364 + }, + { + "epoch": 0.75, + "learning_rate": 1.7548543860319916e-06, + "loss": 0.9521, + "step": 29365 + }, + { + "epoch": 0.75, + "learning_rate": 1.7548362369022727e-06, + "loss": 0.8506, + "step": 29366 + }, + { + "epoch": 0.75, + "learning_rate": 1.7548180871946102e-06, + "loss": 0.9023, + "step": 29367 + }, + { + "epoch": 0.75, + "learning_rate": 1.754799936909019e-06, + "loss": 1.1436, + "step": 29368 + }, + { + "epoch": 0.75, + "learning_rate": 1.7547817860455116e-06, + "loss": 0.7109, + "step": 29369 + }, + { + "epoch": 0.75, + "learning_rate": 1.7547636346041025e-06, + "loss": 0.8813, + "step": 29370 + }, + { + "epoch": 0.75, + "learning_rate": 1.754745482584806e-06, + "loss": 0.8096, + "step": 29371 + }, + { + "epoch": 0.75, + "learning_rate": 1.7547273299876354e-06, + "loss": 0.7495, + "step": 29372 + }, + { + "epoch": 0.75, + "learning_rate": 1.7547091768126046e-06, + "loss": 0.791, + "step": 29373 + }, + { + "epoch": 0.75, + "learning_rate": 1.7546910230597275e-06, + "loss": 0.8853, + "step": 29374 + }, + { + "epoch": 0.75, + "learning_rate": 1.7546728687290185e-06, + "loss": 1.1035, + "step": 29375 + }, + { + "epoch": 0.75, + "learning_rate": 1.7546547138204914e-06, + "loss": 0.9053, + "step": 29376 + }, + { + "epoch": 0.75, + "learning_rate": 1.7546365583341595e-06, + "loss": 0.5188, + "step": 29377 + }, + { + "epoch": 0.75, + "learning_rate": 1.7546184022700372e-06, + "loss": 0.6292, + "step": 29378 + }, + { + "epoch": 0.75, + "learning_rate": 1.7546002456281383e-06, + "loss": 0.6953, + "step": 29379 + }, + { + "epoch": 0.75, + "learning_rate": 1.7545820884084767e-06, + "loss": 1.0127, + "step": 29380 + }, + { + "epoch": 0.75, + "learning_rate": 1.7545639306110664e-06, + "loss": 0.7896, + "step": 29381 + }, + { + "epoch": 0.75, + "learning_rate": 1.7545457722359212e-06, + "loss": 1.001, + "step": 29382 + }, + { + "epoch": 0.75, + "learning_rate": 1.754527613283055e-06, + "loss": 0.8984, + "step": 29383 + }, + { + "epoch": 0.75, + "learning_rate": 1.7545094537524814e-06, + "loss": 0.7871, + "step": 29384 + }, + { + "epoch": 0.75, + "learning_rate": 1.7544912936442149e-06, + "loss": 1.0811, + "step": 29385 + }, + { + "epoch": 0.75, + "learning_rate": 1.7544731329582687e-06, + "loss": 1.0518, + "step": 29386 + }, + { + "epoch": 0.75, + "learning_rate": 1.7544549716946576e-06, + "loss": 0.8188, + "step": 29387 + }, + { + "epoch": 0.75, + "learning_rate": 1.7544368098533947e-06, + "loss": 1.0039, + "step": 29388 + }, + { + "epoch": 0.75, + "learning_rate": 1.7544186474344943e-06, + "loss": 0.9717, + "step": 29389 + }, + { + "epoch": 0.75, + "learning_rate": 1.7544004844379706e-06, + "loss": 0.7891, + "step": 29390 + }, + { + "epoch": 0.75, + "learning_rate": 1.7543823208638367e-06, + "loss": 0.7471, + "step": 29391 + }, + { + "epoch": 0.75, + "learning_rate": 1.754364156712107e-06, + "loss": 0.7793, + "step": 29392 + }, + { + "epoch": 0.75, + "learning_rate": 1.7543459919827953e-06, + "loss": 0.7075, + "step": 29393 + }, + { + "epoch": 0.75, + "learning_rate": 1.7543278266759158e-06, + "loss": 0.7285, + "step": 29394 + }, + { + "epoch": 0.75, + "learning_rate": 1.754309660791482e-06, + "loss": 0.7979, + "step": 29395 + }, + { + "epoch": 0.75, + "learning_rate": 1.7542914943295082e-06, + "loss": 0.9033, + "step": 29396 + }, + { + "epoch": 0.75, + "learning_rate": 1.7542733272900078e-06, + "loss": 0.958, + "step": 29397 + }, + { + "epoch": 0.75, + "learning_rate": 1.7542551596729952e-06, + "loss": 0.6611, + "step": 29398 + }, + { + "epoch": 0.75, + "learning_rate": 1.754236991478484e-06, + "loss": 1.042, + "step": 29399 + }, + { + "epoch": 0.75, + "learning_rate": 1.7542188227064881e-06, + "loss": 0.8096, + "step": 29400 + }, + { + "epoch": 0.75, + "learning_rate": 1.7542006533570216e-06, + "loss": 0.6611, + "step": 29401 + }, + { + "epoch": 0.75, + "learning_rate": 1.7541824834300987e-06, + "loss": 0.79, + "step": 29402 + }, + { + "epoch": 0.75, + "learning_rate": 1.7541643129257327e-06, + "loss": 0.8662, + "step": 29403 + }, + { + "epoch": 0.75, + "learning_rate": 1.7541461418439373e-06, + "loss": 0.8027, + "step": 29404 + }, + { + "epoch": 0.75, + "learning_rate": 1.7541279701847276e-06, + "loss": 0.876, + "step": 29405 + }, + { + "epoch": 0.75, + "learning_rate": 1.7541097979481165e-06, + "loss": 0.8462, + "step": 29406 + }, + { + "epoch": 0.75, + "learning_rate": 1.754091625134118e-06, + "loss": 0.7949, + "step": 29407 + }, + { + "epoch": 0.75, + "learning_rate": 1.7540734517427465e-06, + "loss": 0.9512, + "step": 29408 + }, + { + "epoch": 0.75, + "learning_rate": 1.7540552777740155e-06, + "loss": 1.0781, + "step": 29409 + }, + { + "epoch": 0.75, + "learning_rate": 1.7540371032279388e-06, + "loss": 0.6641, + "step": 29410 + }, + { + "epoch": 0.75, + "learning_rate": 1.7540189281045312e-06, + "loss": 0.8691, + "step": 29411 + }, + { + "epoch": 0.75, + "learning_rate": 1.7540007524038054e-06, + "loss": 0.9502, + "step": 29412 + }, + { + "epoch": 0.75, + "learning_rate": 1.753982576125776e-06, + "loss": 0.606, + "step": 29413 + }, + { + "epoch": 0.75, + "learning_rate": 1.7539643992704572e-06, + "loss": 0.75, + "step": 29414 + }, + { + "epoch": 0.75, + "learning_rate": 1.7539462218378622e-06, + "loss": 1.0166, + "step": 29415 + }, + { + "epoch": 0.75, + "learning_rate": 1.7539280438280052e-06, + "loss": 0.9229, + "step": 29416 + }, + { + "epoch": 0.75, + "learning_rate": 1.7539098652409004e-06, + "loss": 0.7842, + "step": 29417 + }, + { + "epoch": 0.75, + "learning_rate": 1.7538916860765612e-06, + "loss": 0.792, + "step": 29418 + }, + { + "epoch": 0.75, + "learning_rate": 1.7538735063350018e-06, + "loss": 0.8506, + "step": 29419 + }, + { + "epoch": 0.75, + "learning_rate": 1.7538553260162363e-06, + "loss": 0.9268, + "step": 29420 + }, + { + "epoch": 0.75, + "learning_rate": 1.7538371451202787e-06, + "loss": 0.8828, + "step": 29421 + }, + { + "epoch": 0.75, + "learning_rate": 1.7538189636471424e-06, + "loss": 0.9434, + "step": 29422 + }, + { + "epoch": 0.75, + "learning_rate": 1.7538007815968415e-06, + "loss": 0.9033, + "step": 29423 + }, + { + "epoch": 0.75, + "learning_rate": 1.7537825989693896e-06, + "loss": 0.7178, + "step": 29424 + }, + { + "epoch": 0.75, + "learning_rate": 1.7537644157648017e-06, + "loss": 0.9062, + "step": 29425 + }, + { + "epoch": 0.75, + "learning_rate": 1.753746231983091e-06, + "loss": 0.877, + "step": 29426 + }, + { + "epoch": 0.75, + "learning_rate": 1.7537280476242711e-06, + "loss": 1.0537, + "step": 29427 + }, + { + "epoch": 0.75, + "learning_rate": 1.7537098626883564e-06, + "loss": 0.6348, + "step": 29428 + }, + { + "epoch": 0.75, + "learning_rate": 1.7536916771753608e-06, + "loss": 0.7307, + "step": 29429 + }, + { + "epoch": 0.75, + "learning_rate": 1.7536734910852982e-06, + "loss": 1.0488, + "step": 29430 + }, + { + "epoch": 0.75, + "learning_rate": 1.7536553044181824e-06, + "loss": 0.8643, + "step": 29431 + }, + { + "epoch": 0.75, + "learning_rate": 1.7536371171740273e-06, + "loss": 0.9619, + "step": 29432 + }, + { + "epoch": 0.75, + "learning_rate": 1.753618929352847e-06, + "loss": 0.8525, + "step": 29433 + }, + { + "epoch": 0.75, + "learning_rate": 1.7536007409546554e-06, + "loss": 1.0293, + "step": 29434 + }, + { + "epoch": 0.75, + "learning_rate": 1.7535825519794663e-06, + "loss": 0.7007, + "step": 29435 + }, + { + "epoch": 0.75, + "learning_rate": 1.7535643624272935e-06, + "loss": 0.7144, + "step": 29436 + }, + { + "epoch": 0.75, + "learning_rate": 1.7535461722981514e-06, + "loss": 0.7832, + "step": 29437 + }, + { + "epoch": 0.75, + "learning_rate": 1.7535279815920534e-06, + "loss": 0.6006, + "step": 29438 + }, + { + "epoch": 0.75, + "learning_rate": 1.7535097903090139e-06, + "loss": 0.8789, + "step": 29439 + }, + { + "epoch": 0.75, + "learning_rate": 1.7534915984490465e-06, + "loss": 1.0684, + "step": 29440 + }, + { + "epoch": 0.75, + "learning_rate": 1.7534734060121652e-06, + "loss": 1.0664, + "step": 29441 + }, + { + "epoch": 0.75, + "learning_rate": 1.753455212998384e-06, + "loss": 0.9766, + "step": 29442 + }, + { + "epoch": 0.75, + "learning_rate": 1.753437019407717e-06, + "loss": 0.8174, + "step": 29443 + }, + { + "epoch": 0.75, + "learning_rate": 1.7534188252401777e-06, + "loss": 0.8789, + "step": 29444 + }, + { + "epoch": 0.75, + "learning_rate": 1.75340063049578e-06, + "loss": 0.8896, + "step": 29445 + }, + { + "epoch": 0.75, + "learning_rate": 1.7533824351745385e-06, + "loss": 0.8389, + "step": 29446 + }, + { + "epoch": 0.75, + "learning_rate": 1.7533642392764665e-06, + "loss": 1.0459, + "step": 29447 + }, + { + "epoch": 0.75, + "learning_rate": 1.7533460428015784e-06, + "loss": 0.667, + "step": 29448 + }, + { + "epoch": 0.75, + "learning_rate": 1.7533278457498875e-06, + "loss": 0.9297, + "step": 29449 + }, + { + "epoch": 0.75, + "learning_rate": 1.7533096481214083e-06, + "loss": 0.8447, + "step": 29450 + }, + { + "epoch": 0.75, + "learning_rate": 1.7532914499161544e-06, + "loss": 0.8418, + "step": 29451 + }, + { + "epoch": 0.75, + "learning_rate": 1.7532732511341402e-06, + "loss": 0.6748, + "step": 29452 + }, + { + "epoch": 0.75, + "learning_rate": 1.7532550517753787e-06, + "loss": 0.8347, + "step": 29453 + }, + { + "epoch": 0.75, + "learning_rate": 1.753236851839885e-06, + "loss": 0.8389, + "step": 29454 + }, + { + "epoch": 0.75, + "learning_rate": 1.7532186513276724e-06, + "loss": 0.8604, + "step": 29455 + }, + { + "epoch": 0.75, + "learning_rate": 1.7532004502387548e-06, + "loss": 1.0938, + "step": 29456 + }, + { + "epoch": 0.75, + "learning_rate": 1.7531822485731463e-06, + "loss": 0.9287, + "step": 29457 + }, + { + "epoch": 0.76, + "learning_rate": 1.7531640463308608e-06, + "loss": 0.6924, + "step": 29458 + }, + { + "epoch": 0.76, + "learning_rate": 1.7531458435119122e-06, + "loss": 0.7363, + "step": 29459 + }, + { + "epoch": 0.76, + "learning_rate": 1.7531276401163142e-06, + "loss": 0.8262, + "step": 29460 + }, + { + "epoch": 0.76, + "learning_rate": 1.7531094361440815e-06, + "loss": 0.8555, + "step": 29461 + }, + { + "epoch": 0.76, + "learning_rate": 1.753091231595227e-06, + "loss": 0.7959, + "step": 29462 + }, + { + "epoch": 0.76, + "learning_rate": 1.7530730264697655e-06, + "loss": 0.9111, + "step": 29463 + }, + { + "epoch": 0.76, + "learning_rate": 1.7530548207677106e-06, + "loss": 0.9795, + "step": 29464 + }, + { + "epoch": 0.76, + "learning_rate": 1.7530366144890762e-06, + "loss": 0.644, + "step": 29465 + }, + { + "epoch": 0.76, + "learning_rate": 1.7530184076338764e-06, + "loss": 0.6816, + "step": 29466 + }, + { + "epoch": 0.76, + "learning_rate": 1.7530002002021246e-06, + "loss": 1.2051, + "step": 29467 + }, + { + "epoch": 0.76, + "learning_rate": 1.7529819921938358e-06, + "loss": 0.7744, + "step": 29468 + }, + { + "epoch": 0.76, + "learning_rate": 1.752963783609023e-06, + "loss": 0.9229, + "step": 29469 + }, + { + "epoch": 0.76, + "learning_rate": 1.7529455744477005e-06, + "loss": 0.8184, + "step": 29470 + }, + { + "epoch": 0.76, + "learning_rate": 1.7529273647098821e-06, + "loss": 0.6426, + "step": 29471 + }, + { + "epoch": 0.76, + "learning_rate": 1.752909154395582e-06, + "loss": 0.8984, + "step": 29472 + }, + { + "epoch": 0.76, + "learning_rate": 1.7528909435048137e-06, + "loss": 0.5981, + "step": 29473 + }, + { + "epoch": 0.76, + "learning_rate": 1.7528727320375917e-06, + "loss": 0.8496, + "step": 29474 + }, + { + "epoch": 0.76, + "learning_rate": 1.7528545199939293e-06, + "loss": 0.7744, + "step": 29475 + }, + { + "epoch": 0.76, + "learning_rate": 1.7528363073738412e-06, + "loss": 0.7383, + "step": 29476 + }, + { + "epoch": 0.76, + "learning_rate": 1.752818094177341e-06, + "loss": 1.0117, + "step": 29477 + }, + { + "epoch": 0.76, + "learning_rate": 1.752799880404442e-06, + "loss": 0.9727, + "step": 29478 + }, + { + "epoch": 0.76, + "learning_rate": 1.7527816660551596e-06, + "loss": 0.8359, + "step": 29479 + }, + { + "epoch": 0.76, + "learning_rate": 1.7527634511295063e-06, + "loss": 0.8633, + "step": 29480 + }, + { + "epoch": 0.76, + "learning_rate": 1.7527452356274967e-06, + "loss": 1.0498, + "step": 29481 + }, + { + "epoch": 0.76, + "learning_rate": 1.752727019549145e-06, + "loss": 0.7632, + "step": 29482 + }, + { + "epoch": 0.76, + "learning_rate": 1.7527088028944646e-06, + "loss": 0.9736, + "step": 29483 + }, + { + "epoch": 0.76, + "learning_rate": 1.7526905856634695e-06, + "loss": 0.9062, + "step": 29484 + }, + { + "epoch": 0.76, + "learning_rate": 1.7526723678561741e-06, + "loss": 0.9092, + "step": 29485 + }, + { + "epoch": 0.76, + "learning_rate": 1.752654149472592e-06, + "loss": 0.9521, + "step": 29486 + }, + { + "epoch": 0.76, + "learning_rate": 1.7526359305127373e-06, + "loss": 0.7148, + "step": 29487 + }, + { + "epoch": 0.76, + "learning_rate": 1.7526177109766237e-06, + "loss": 0.7881, + "step": 29488 + }, + { + "epoch": 0.76, + "learning_rate": 1.7525994908642656e-06, + "loss": 0.6658, + "step": 29489 + }, + { + "epoch": 0.76, + "learning_rate": 1.7525812701756763e-06, + "loss": 0.6611, + "step": 29490 + }, + { + "epoch": 0.76, + "learning_rate": 1.7525630489108704e-06, + "loss": 0.7969, + "step": 29491 + }, + { + "epoch": 0.76, + "learning_rate": 1.7525448270698618e-06, + "loss": 0.8018, + "step": 29492 + }, + { + "epoch": 0.76, + "learning_rate": 1.752526604652664e-06, + "loss": 0.9424, + "step": 29493 + }, + { + "epoch": 0.76, + "learning_rate": 1.752508381659291e-06, + "loss": 0.7817, + "step": 29494 + }, + { + "epoch": 0.76, + "learning_rate": 1.752490158089757e-06, + "loss": 0.7847, + "step": 29495 + }, + { + "epoch": 0.76, + "learning_rate": 1.752471933944076e-06, + "loss": 0.9717, + "step": 29496 + }, + { + "epoch": 0.76, + "learning_rate": 1.7524537092222617e-06, + "loss": 0.749, + "step": 29497 + }, + { + "epoch": 0.76, + "learning_rate": 1.7524354839243283e-06, + "loss": 0.8311, + "step": 29498 + }, + { + "epoch": 0.76, + "learning_rate": 1.7524172580502895e-06, + "loss": 0.5977, + "step": 29499 + }, + { + "epoch": 0.76, + "learning_rate": 1.7523990316001594e-06, + "loss": 0.8506, + "step": 29500 + }, + { + "epoch": 0.76, + "learning_rate": 1.7523808045739523e-06, + "loss": 0.4318, + "step": 29501 + }, + { + "epoch": 0.76, + "learning_rate": 1.7523625769716814e-06, + "loss": 0.9082, + "step": 29502 + }, + { + "epoch": 0.76, + "learning_rate": 1.7523443487933614e-06, + "loss": 1.0898, + "step": 29503 + }, + { + "epoch": 0.76, + "learning_rate": 1.752326120039006e-06, + "loss": 0.7676, + "step": 29504 + }, + { + "epoch": 0.76, + "learning_rate": 1.7523078907086286e-06, + "loss": 0.6621, + "step": 29505 + }, + { + "epoch": 0.76, + "learning_rate": 1.7522896608022439e-06, + "loss": 0.6895, + "step": 29506 + }, + { + "epoch": 0.76, + "learning_rate": 1.7522714303198655e-06, + "loss": 0.9055, + "step": 29507 + }, + { + "epoch": 0.76, + "learning_rate": 1.7522531992615078e-06, + "loss": 0.9941, + "step": 29508 + }, + { + "epoch": 0.76, + "learning_rate": 1.752234967627184e-06, + "loss": 0.8857, + "step": 29509 + }, + { + "epoch": 0.76, + "learning_rate": 1.752216735416909e-06, + "loss": 0.8691, + "step": 29510 + }, + { + "epoch": 0.76, + "learning_rate": 1.7521985026306956e-06, + "loss": 0.8711, + "step": 29511 + }, + { + "epoch": 0.76, + "learning_rate": 1.7521802692685586e-06, + "loss": 0.9111, + "step": 29512 + }, + { + "epoch": 0.76, + "learning_rate": 1.752162035330512e-06, + "loss": 0.6248, + "step": 29513 + }, + { + "epoch": 0.76, + "learning_rate": 1.7521438008165692e-06, + "loss": 0.9434, + "step": 29514 + }, + { + "epoch": 0.76, + "learning_rate": 1.752125565726745e-06, + "loss": 1.0957, + "step": 29515 + }, + { + "epoch": 0.76, + "learning_rate": 1.7521073300610523e-06, + "loss": 0.6787, + "step": 29516 + }, + { + "epoch": 0.76, + "learning_rate": 1.7520890938195057e-06, + "loss": 0.9248, + "step": 29517 + }, + { + "epoch": 0.76, + "learning_rate": 1.7520708570021193e-06, + "loss": 0.915, + "step": 29518 + }, + { + "epoch": 0.76, + "learning_rate": 1.7520526196089065e-06, + "loss": 0.9199, + "step": 29519 + }, + { + "epoch": 0.76, + "learning_rate": 1.7520343816398817e-06, + "loss": 0.8164, + "step": 29520 + }, + { + "epoch": 0.76, + "learning_rate": 1.7520161430950586e-06, + "loss": 0.8467, + "step": 29521 + }, + { + "epoch": 0.76, + "learning_rate": 1.7519979039744517e-06, + "loss": 0.8379, + "step": 29522 + }, + { + "epoch": 0.76, + "learning_rate": 1.7519796642780744e-06, + "loss": 0.8828, + "step": 29523 + }, + { + "epoch": 0.76, + "learning_rate": 1.7519614240059408e-06, + "loss": 1.0059, + "step": 29524 + }, + { + "epoch": 0.76, + "learning_rate": 1.751943183158065e-06, + "loss": 0.7744, + "step": 29525 + }, + { + "epoch": 0.76, + "learning_rate": 1.7519249417344608e-06, + "loss": 0.939, + "step": 29526 + }, + { + "epoch": 0.76, + "learning_rate": 1.7519066997351422e-06, + "loss": 0.8701, + "step": 29527 + }, + { + "epoch": 0.76, + "learning_rate": 1.7518884571601236e-06, + "loss": 1.0098, + "step": 29528 + }, + { + "epoch": 0.76, + "learning_rate": 1.751870214009418e-06, + "loss": 1.0693, + "step": 29529 + }, + { + "epoch": 0.76, + "learning_rate": 1.7518519702830402e-06, + "loss": 0.8208, + "step": 29530 + }, + { + "epoch": 0.76, + "learning_rate": 1.751833725981004e-06, + "loss": 1.0537, + "step": 29531 + }, + { + "epoch": 0.76, + "learning_rate": 1.7518154811033235e-06, + "loss": 0.8398, + "step": 29532 + }, + { + "epoch": 0.76, + "learning_rate": 1.7517972356500122e-06, + "loss": 0.7773, + "step": 29533 + }, + { + "epoch": 0.76, + "learning_rate": 1.751778989621084e-06, + "loss": 0.8359, + "step": 29534 + }, + { + "epoch": 0.76, + "learning_rate": 1.7517607430165535e-06, + "loss": 1.0156, + "step": 29535 + }, + { + "epoch": 0.76, + "learning_rate": 1.7517424958364346e-06, + "loss": 0.6748, + "step": 29536 + }, + { + "epoch": 0.76, + "learning_rate": 1.7517242480807406e-06, + "loss": 1.0234, + "step": 29537 + }, + { + "epoch": 0.76, + "learning_rate": 1.7517059997494862e-06, + "loss": 0.8281, + "step": 29538 + }, + { + "epoch": 0.76, + "learning_rate": 1.751687750842685e-06, + "loss": 0.8701, + "step": 29539 + }, + { + "epoch": 0.76, + "learning_rate": 1.751669501360351e-06, + "loss": 0.8965, + "step": 29540 + }, + { + "epoch": 0.76, + "learning_rate": 1.7516512513024983e-06, + "loss": 0.8008, + "step": 29541 + }, + { + "epoch": 0.76, + "learning_rate": 1.751633000669141e-06, + "loss": 0.8921, + "step": 29542 + }, + { + "epoch": 0.76, + "learning_rate": 1.7516147494602924e-06, + "loss": 0.7842, + "step": 29543 + }, + { + "epoch": 0.76, + "learning_rate": 1.7515964976759672e-06, + "loss": 0.7959, + "step": 29544 + }, + { + "epoch": 0.76, + "learning_rate": 1.7515782453161792e-06, + "loss": 0.7881, + "step": 29545 + }, + { + "epoch": 0.76, + "learning_rate": 1.751559992380942e-06, + "loss": 0.7671, + "step": 29546 + }, + { + "epoch": 0.76, + "learning_rate": 1.7515417388702703e-06, + "loss": 0.8047, + "step": 29547 + }, + { + "epoch": 0.76, + "learning_rate": 1.7515234847841773e-06, + "loss": 0.9033, + "step": 29548 + }, + { + "epoch": 0.76, + "learning_rate": 1.7515052301226777e-06, + "loss": 0.9497, + "step": 29549 + }, + { + "epoch": 0.76, + "learning_rate": 1.7514869748857848e-06, + "loss": 0.8047, + "step": 29550 + }, + { + "epoch": 0.76, + "learning_rate": 1.751468719073513e-06, + "loss": 0.8535, + "step": 29551 + }, + { + "epoch": 0.76, + "learning_rate": 1.751450462685876e-06, + "loss": 0.7329, + "step": 29552 + }, + { + "epoch": 0.76, + "learning_rate": 1.7514322057228879e-06, + "loss": 0.6675, + "step": 29553 + }, + { + "epoch": 0.76, + "learning_rate": 1.7514139481845628e-06, + "loss": 0.9463, + "step": 29554 + }, + { + "epoch": 0.76, + "learning_rate": 1.7513956900709146e-06, + "loss": 0.7471, + "step": 29555 + }, + { + "epoch": 0.76, + "learning_rate": 1.7513774313819573e-06, + "loss": 0.9033, + "step": 29556 + }, + { + "epoch": 0.76, + "learning_rate": 1.751359172117705e-06, + "loss": 0.8193, + "step": 29557 + }, + { + "epoch": 0.76, + "learning_rate": 1.7513409122781716e-06, + "loss": 0.6587, + "step": 29558 + }, + { + "epoch": 0.76, + "learning_rate": 1.7513226518633705e-06, + "loss": 0.8027, + "step": 29559 + }, + { + "epoch": 0.76, + "learning_rate": 1.7513043908733165e-06, + "loss": 0.916, + "step": 29560 + }, + { + "epoch": 0.76, + "learning_rate": 1.7512861293080232e-06, + "loss": 0.6597, + "step": 29561 + }, + { + "epoch": 0.76, + "learning_rate": 1.7512678671675047e-06, + "loss": 0.666, + "step": 29562 + }, + { + "epoch": 0.76, + "learning_rate": 1.751249604451775e-06, + "loss": 0.7783, + "step": 29563 + }, + { + "epoch": 0.76, + "learning_rate": 1.751231341160848e-06, + "loss": 0.9736, + "step": 29564 + }, + { + "epoch": 0.76, + "learning_rate": 1.7512130772947376e-06, + "loss": 0.8369, + "step": 29565 + }, + { + "epoch": 0.76, + "learning_rate": 1.7511948128534582e-06, + "loss": 0.6826, + "step": 29566 + }, + { + "epoch": 0.76, + "learning_rate": 1.751176547837023e-06, + "loss": 0.9629, + "step": 29567 + }, + { + "epoch": 0.76, + "learning_rate": 1.7511582822454468e-06, + "loss": 0.9502, + "step": 29568 + }, + { + "epoch": 0.76, + "learning_rate": 1.751140016078743e-06, + "loss": 0.6616, + "step": 29569 + }, + { + "epoch": 0.76, + "learning_rate": 1.751121749336926e-06, + "loss": 0.8291, + "step": 29570 + }, + { + "epoch": 0.76, + "learning_rate": 1.7511034820200097e-06, + "loss": 0.5261, + "step": 29571 + }, + { + "epoch": 0.76, + "learning_rate": 1.7510852141280078e-06, + "loss": 0.8838, + "step": 29572 + }, + { + "epoch": 0.76, + "learning_rate": 1.7510669456609346e-06, + "loss": 0.7559, + "step": 29573 + }, + { + "epoch": 0.76, + "learning_rate": 1.751048676618804e-06, + "loss": 0.5625, + "step": 29574 + }, + { + "epoch": 0.76, + "learning_rate": 1.7510304070016298e-06, + "loss": 0.8389, + "step": 29575 + }, + { + "epoch": 0.76, + "learning_rate": 1.7510121368094262e-06, + "loss": 0.998, + "step": 29576 + }, + { + "epoch": 0.76, + "learning_rate": 1.7509938660422073e-06, + "loss": 0.6504, + "step": 29577 + }, + { + "epoch": 0.76, + "learning_rate": 1.750975594699987e-06, + "loss": 0.7788, + "step": 29578 + }, + { + "epoch": 0.76, + "learning_rate": 1.7509573227827788e-06, + "loss": 0.6208, + "step": 29579 + }, + { + "epoch": 0.76, + "learning_rate": 1.7509390502905971e-06, + "loss": 0.8252, + "step": 29580 + }, + { + "epoch": 0.76, + "learning_rate": 1.7509207772234565e-06, + "loss": 0.7727, + "step": 29581 + }, + { + "epoch": 0.76, + "learning_rate": 1.7509025035813699e-06, + "loss": 0.9609, + "step": 29582 + }, + { + "epoch": 0.76, + "learning_rate": 1.750884229364352e-06, + "loss": 0.6948, + "step": 29583 + }, + { + "epoch": 0.76, + "learning_rate": 1.7508659545724164e-06, + "loss": 0.7246, + "step": 29584 + }, + { + "epoch": 0.76, + "learning_rate": 1.7508476792055773e-06, + "loss": 0.9795, + "step": 29585 + }, + { + "epoch": 0.76, + "learning_rate": 1.750829403263849e-06, + "loss": 0.7744, + "step": 29586 + }, + { + "epoch": 0.76, + "learning_rate": 1.7508111267472448e-06, + "loss": 0.7866, + "step": 29587 + }, + { + "epoch": 0.76, + "learning_rate": 1.7507928496557789e-06, + "loss": 0.7422, + "step": 29588 + }, + { + "epoch": 0.76, + "learning_rate": 1.7507745719894658e-06, + "loss": 0.999, + "step": 29589 + }, + { + "epoch": 0.76, + "learning_rate": 1.7507562937483189e-06, + "loss": 0.9097, + "step": 29590 + }, + { + "epoch": 0.76, + "learning_rate": 1.7507380149323523e-06, + "loss": 0.9229, + "step": 29591 + }, + { + "epoch": 0.76, + "learning_rate": 1.7507197355415803e-06, + "loss": 0.6128, + "step": 29592 + }, + { + "epoch": 0.76, + "learning_rate": 1.7507014555760168e-06, + "loss": 0.7725, + "step": 29593 + }, + { + "epoch": 0.76, + "learning_rate": 1.7506831750356756e-06, + "loss": 0.6284, + "step": 29594 + }, + { + "epoch": 0.76, + "learning_rate": 1.750664893920571e-06, + "loss": 0.6504, + "step": 29595 + }, + { + "epoch": 0.76, + "learning_rate": 1.7506466122307166e-06, + "loss": 0.8711, + "step": 29596 + }, + { + "epoch": 0.76, + "learning_rate": 1.7506283299661266e-06, + "loss": 0.6694, + "step": 29597 + }, + { + "epoch": 0.76, + "learning_rate": 1.7506100471268152e-06, + "loss": 0.9863, + "step": 29598 + }, + { + "epoch": 0.76, + "learning_rate": 1.7505917637127961e-06, + "loss": 0.7939, + "step": 29599 + }, + { + "epoch": 0.76, + "learning_rate": 1.7505734797240832e-06, + "loss": 0.9229, + "step": 29600 + }, + { + "epoch": 0.76, + "learning_rate": 1.7505551951606908e-06, + "loss": 0.8672, + "step": 29601 + }, + { + "epoch": 0.76, + "learning_rate": 1.750536910022633e-06, + "loss": 0.9443, + "step": 29602 + }, + { + "epoch": 0.76, + "learning_rate": 1.7505186243099237e-06, + "loss": 0.834, + "step": 29603 + }, + { + "epoch": 0.76, + "learning_rate": 1.7505003380225764e-06, + "loss": 0.9062, + "step": 29604 + }, + { + "epoch": 0.76, + "learning_rate": 1.7504820511606057e-06, + "loss": 0.8374, + "step": 29605 + }, + { + "epoch": 0.76, + "learning_rate": 1.7504637637240253e-06, + "loss": 0.7803, + "step": 29606 + }, + { + "epoch": 0.76, + "learning_rate": 1.7504454757128495e-06, + "loss": 0.6929, + "step": 29607 + }, + { + "epoch": 0.76, + "learning_rate": 1.7504271871270918e-06, + "loss": 0.9609, + "step": 29608 + }, + { + "epoch": 0.76, + "learning_rate": 1.7504088979667668e-06, + "loss": 1.0303, + "step": 29609 + }, + { + "epoch": 0.76, + "learning_rate": 1.7503906082318882e-06, + "loss": 0.7412, + "step": 29610 + }, + { + "epoch": 0.76, + "learning_rate": 1.7503723179224696e-06, + "loss": 1.0029, + "step": 29611 + }, + { + "epoch": 0.76, + "learning_rate": 1.7503540270385258e-06, + "loss": 0.8223, + "step": 29612 + }, + { + "epoch": 0.76, + "learning_rate": 1.7503357355800705e-06, + "loss": 0.8232, + "step": 29613 + }, + { + "epoch": 0.76, + "learning_rate": 1.7503174435471175e-06, + "loss": 0.7749, + "step": 29614 + }, + { + "epoch": 0.76, + "learning_rate": 1.7502991509396809e-06, + "loss": 0.8145, + "step": 29615 + }, + { + "epoch": 0.76, + "learning_rate": 1.7502808577577749e-06, + "loss": 0.9424, + "step": 29616 + }, + { + "epoch": 0.76, + "learning_rate": 1.750262564001413e-06, + "loss": 0.9297, + "step": 29617 + }, + { + "epoch": 0.76, + "learning_rate": 1.7502442696706097e-06, + "loss": 0.4971, + "step": 29618 + }, + { + "epoch": 0.76, + "learning_rate": 1.750225974765379e-06, + "loss": 0.5254, + "step": 29619 + }, + { + "epoch": 0.76, + "learning_rate": 1.7502076792857347e-06, + "loss": 1.0547, + "step": 29620 + }, + { + "epoch": 0.76, + "learning_rate": 1.750189383231691e-06, + "loss": 0.8193, + "step": 29621 + }, + { + "epoch": 0.76, + "learning_rate": 1.7501710866032614e-06, + "loss": 0.8457, + "step": 29622 + }, + { + "epoch": 0.76, + "learning_rate": 1.7501527894004608e-06, + "loss": 0.9854, + "step": 29623 + }, + { + "epoch": 0.76, + "learning_rate": 1.7501344916233024e-06, + "loss": 0.7227, + "step": 29624 + }, + { + "epoch": 0.76, + "learning_rate": 1.7501161932718005e-06, + "loss": 0.9121, + "step": 29625 + }, + { + "epoch": 0.76, + "learning_rate": 1.750097894345969e-06, + "loss": 0.9102, + "step": 29626 + }, + { + "epoch": 0.76, + "learning_rate": 1.7500795948458222e-06, + "loss": 0.9551, + "step": 29627 + }, + { + "epoch": 0.76, + "learning_rate": 1.750061294771374e-06, + "loss": 0.5867, + "step": 29628 + }, + { + "epoch": 0.76, + "learning_rate": 1.7500429941226384e-06, + "loss": 0.8857, + "step": 29629 + }, + { + "epoch": 0.76, + "learning_rate": 1.7500246928996294e-06, + "loss": 0.7852, + "step": 29630 + }, + { + "epoch": 0.76, + "learning_rate": 1.7500063911023605e-06, + "loss": 0.7856, + "step": 29631 + }, + { + "epoch": 0.76, + "learning_rate": 1.7499880887308467e-06, + "loss": 0.7595, + "step": 29632 + }, + { + "epoch": 0.76, + "learning_rate": 1.7499697857851015e-06, + "loss": 0.6714, + "step": 29633 + }, + { + "epoch": 0.76, + "learning_rate": 1.7499514822651386e-06, + "loss": 0.7622, + "step": 29634 + }, + { + "epoch": 0.76, + "learning_rate": 1.7499331781709726e-06, + "loss": 0.8994, + "step": 29635 + }, + { + "epoch": 0.76, + "learning_rate": 1.7499148735026173e-06, + "loss": 0.6841, + "step": 29636 + }, + { + "epoch": 0.76, + "learning_rate": 1.7498965682600861e-06, + "loss": 0.9238, + "step": 29637 + }, + { + "epoch": 0.76, + "learning_rate": 1.7498782624433943e-06, + "loss": 1.001, + "step": 29638 + }, + { + "epoch": 0.76, + "learning_rate": 1.7498599560525546e-06, + "loss": 0.875, + "step": 29639 + }, + { + "epoch": 0.76, + "learning_rate": 1.7498416490875823e-06, + "loss": 0.9346, + "step": 29640 + }, + { + "epoch": 0.76, + "learning_rate": 1.74982334154849e-06, + "loss": 1.0322, + "step": 29641 + }, + { + "epoch": 0.76, + "learning_rate": 1.7498050334352929e-06, + "loss": 0.6284, + "step": 29642 + }, + { + "epoch": 0.76, + "learning_rate": 1.7497867247480045e-06, + "loss": 0.8047, + "step": 29643 + }, + { + "epoch": 0.76, + "learning_rate": 1.7497684154866387e-06, + "loss": 0.8105, + "step": 29644 + }, + { + "epoch": 0.76, + "learning_rate": 1.74975010565121e-06, + "loss": 0.7979, + "step": 29645 + }, + { + "epoch": 0.76, + "learning_rate": 1.749731795241732e-06, + "loss": 0.8857, + "step": 29646 + }, + { + "epoch": 0.76, + "learning_rate": 1.7497134842582186e-06, + "loss": 0.7852, + "step": 29647 + }, + { + "epoch": 0.76, + "learning_rate": 1.7496951727006843e-06, + "loss": 0.999, + "step": 29648 + }, + { + "epoch": 0.76, + "learning_rate": 1.7496768605691427e-06, + "loss": 0.7305, + "step": 29649 + }, + { + "epoch": 0.76, + "learning_rate": 1.7496585478636084e-06, + "loss": 0.8994, + "step": 29650 + }, + { + "epoch": 0.76, + "learning_rate": 1.7496402345840946e-06, + "loss": 0.9805, + "step": 29651 + }, + { + "epoch": 0.76, + "learning_rate": 1.7496219207306157e-06, + "loss": 0.7627, + "step": 29652 + }, + { + "epoch": 0.76, + "learning_rate": 1.7496036063031858e-06, + "loss": 0.9033, + "step": 29653 + }, + { + "epoch": 0.76, + "learning_rate": 1.7495852913018193e-06, + "loss": 0.9834, + "step": 29654 + }, + { + "epoch": 0.76, + "learning_rate": 1.7495669757265295e-06, + "loss": 0.8135, + "step": 29655 + }, + { + "epoch": 0.76, + "learning_rate": 1.7495486595773308e-06, + "loss": 1.0586, + "step": 29656 + }, + { + "epoch": 0.76, + "learning_rate": 1.7495303428542368e-06, + "loss": 0.8311, + "step": 29657 + }, + { + "epoch": 0.76, + "learning_rate": 1.7495120255572624e-06, + "loss": 0.9062, + "step": 29658 + }, + { + "epoch": 0.76, + "learning_rate": 1.749493707686421e-06, + "loss": 1.0068, + "step": 29659 + }, + { + "epoch": 0.76, + "learning_rate": 1.7494753892417266e-06, + "loss": 1.2227, + "step": 29660 + }, + { + "epoch": 0.76, + "learning_rate": 1.7494570702231935e-06, + "loss": 0.562, + "step": 29661 + }, + { + "epoch": 0.76, + "learning_rate": 1.7494387506308353e-06, + "loss": 0.8643, + "step": 29662 + }, + { + "epoch": 0.76, + "learning_rate": 1.7494204304646665e-06, + "loss": 0.874, + "step": 29663 + }, + { + "epoch": 0.76, + "learning_rate": 1.749402109724701e-06, + "loss": 0.6768, + "step": 29664 + }, + { + "epoch": 0.76, + "learning_rate": 1.7493837884109526e-06, + "loss": 0.7266, + "step": 29665 + }, + { + "epoch": 0.76, + "learning_rate": 1.7493654665234355e-06, + "loss": 0.9175, + "step": 29666 + }, + { + "epoch": 0.76, + "learning_rate": 1.7493471440621638e-06, + "loss": 0.7529, + "step": 29667 + }, + { + "epoch": 0.76, + "learning_rate": 1.7493288210271516e-06, + "loss": 0.8994, + "step": 29668 + }, + { + "epoch": 0.76, + "learning_rate": 1.7493104974184125e-06, + "loss": 0.6943, + "step": 29669 + }, + { + "epoch": 0.76, + "learning_rate": 1.7492921732359612e-06, + "loss": 0.9531, + "step": 29670 + }, + { + "epoch": 0.76, + "learning_rate": 1.7492738484798108e-06, + "loss": 0.8809, + "step": 29671 + }, + { + "epoch": 0.76, + "learning_rate": 1.7492555231499761e-06, + "loss": 0.9673, + "step": 29672 + }, + { + "epoch": 0.76, + "learning_rate": 1.749237197246471e-06, + "loss": 0.9658, + "step": 29673 + }, + { + "epoch": 0.76, + "learning_rate": 1.7492188707693094e-06, + "loss": 0.6162, + "step": 29674 + }, + { + "epoch": 0.76, + "learning_rate": 1.7492005437185053e-06, + "loss": 0.9541, + "step": 29675 + }, + { + "epoch": 0.76, + "learning_rate": 1.7491822160940725e-06, + "loss": 0.9092, + "step": 29676 + }, + { + "epoch": 0.76, + "learning_rate": 1.7491638878960259e-06, + "loss": 0.9053, + "step": 29677 + }, + { + "epoch": 0.76, + "learning_rate": 1.7491455591243786e-06, + "loss": 0.8271, + "step": 29678 + }, + { + "epoch": 0.76, + "learning_rate": 1.749127229779145e-06, + "loss": 0.9209, + "step": 29679 + }, + { + "epoch": 0.76, + "learning_rate": 1.749108899860339e-06, + "loss": 0.8232, + "step": 29680 + }, + { + "epoch": 0.76, + "learning_rate": 1.7490905693679751e-06, + "loss": 0.8467, + "step": 29681 + }, + { + "epoch": 0.76, + "learning_rate": 1.7490722383020668e-06, + "loss": 0.9287, + "step": 29682 + }, + { + "epoch": 0.76, + "learning_rate": 1.7490539066626286e-06, + "loss": 0.7192, + "step": 29683 + }, + { + "epoch": 0.76, + "learning_rate": 1.749035574449674e-06, + "loss": 0.9141, + "step": 29684 + }, + { + "epoch": 0.76, + "learning_rate": 1.7490172416632176e-06, + "loss": 0.9268, + "step": 29685 + }, + { + "epoch": 0.76, + "learning_rate": 1.7489989083032727e-06, + "loss": 0.9043, + "step": 29686 + }, + { + "epoch": 0.76, + "learning_rate": 1.748980574369854e-06, + "loss": 0.9434, + "step": 29687 + }, + { + "epoch": 0.76, + "learning_rate": 1.7489622398629754e-06, + "loss": 0.7881, + "step": 29688 + }, + { + "epoch": 0.76, + "learning_rate": 1.7489439047826507e-06, + "loss": 0.8447, + "step": 29689 + }, + { + "epoch": 0.76, + "learning_rate": 1.748925569128894e-06, + "loss": 0.8052, + "step": 29690 + }, + { + "epoch": 0.76, + "learning_rate": 1.7489072329017196e-06, + "loss": 0.7446, + "step": 29691 + }, + { + "epoch": 0.76, + "learning_rate": 1.7488888961011413e-06, + "loss": 1.0049, + "step": 29692 + }, + { + "epoch": 0.76, + "learning_rate": 1.7488705587271736e-06, + "loss": 1.0156, + "step": 29693 + }, + { + "epoch": 0.76, + "learning_rate": 1.7488522207798296e-06, + "loss": 1.0068, + "step": 29694 + }, + { + "epoch": 0.76, + "learning_rate": 1.748833882259124e-06, + "loss": 0.7559, + "step": 29695 + }, + { + "epoch": 0.76, + "learning_rate": 1.7488155431650707e-06, + "loss": 0.8188, + "step": 29696 + }, + { + "epoch": 0.76, + "learning_rate": 1.748797203497684e-06, + "loss": 0.7139, + "step": 29697 + }, + { + "epoch": 0.76, + "learning_rate": 1.7487788632569775e-06, + "loss": 0.9629, + "step": 29698 + }, + { + "epoch": 0.76, + "learning_rate": 1.7487605224429657e-06, + "loss": 0.8242, + "step": 29699 + }, + { + "epoch": 0.76, + "learning_rate": 1.748742181055662e-06, + "loss": 0.8691, + "step": 29700 + }, + { + "epoch": 0.76, + "learning_rate": 1.748723839095081e-06, + "loss": 0.6353, + "step": 29701 + }, + { + "epoch": 0.76, + "learning_rate": 1.7487054965612367e-06, + "loss": 0.7803, + "step": 29702 + }, + { + "epoch": 0.76, + "learning_rate": 1.748687153454143e-06, + "loss": 0.6091, + "step": 29703 + }, + { + "epoch": 0.76, + "learning_rate": 1.748668809773814e-06, + "loss": 0.8984, + "step": 29704 + }, + { + "epoch": 0.76, + "learning_rate": 1.7486504655202636e-06, + "loss": 0.9062, + "step": 29705 + }, + { + "epoch": 0.76, + "learning_rate": 1.748632120693506e-06, + "loss": 0.5796, + "step": 29706 + }, + { + "epoch": 0.76, + "learning_rate": 1.7486137752935553e-06, + "loss": 0.7773, + "step": 29707 + }, + { + "epoch": 0.76, + "learning_rate": 1.7485954293204255e-06, + "loss": 0.8037, + "step": 29708 + }, + { + "epoch": 0.76, + "learning_rate": 1.7485770827741305e-06, + "loss": 0.6772, + "step": 29709 + }, + { + "epoch": 0.76, + "learning_rate": 1.7485587356546843e-06, + "loss": 0.7783, + "step": 29710 + }, + { + "epoch": 0.76, + "learning_rate": 1.7485403879621012e-06, + "loss": 0.9072, + "step": 29711 + }, + { + "epoch": 0.76, + "learning_rate": 1.7485220396963954e-06, + "loss": 0.7417, + "step": 29712 + }, + { + "epoch": 0.76, + "learning_rate": 1.7485036908575803e-06, + "loss": 0.9053, + "step": 29713 + }, + { + "epoch": 0.76, + "learning_rate": 1.7484853414456706e-06, + "loss": 0.8936, + "step": 29714 + }, + { + "epoch": 0.76, + "learning_rate": 1.74846699146068e-06, + "loss": 0.9346, + "step": 29715 + }, + { + "epoch": 0.76, + "learning_rate": 1.7484486409026228e-06, + "loss": 1.126, + "step": 29716 + }, + { + "epoch": 0.76, + "learning_rate": 1.7484302897715125e-06, + "loss": 1.1035, + "step": 29717 + }, + { + "epoch": 0.76, + "learning_rate": 1.7484119380673639e-06, + "loss": 0.751, + "step": 29718 + }, + { + "epoch": 0.76, + "learning_rate": 1.7483935857901907e-06, + "loss": 0.8906, + "step": 29719 + }, + { + "epoch": 0.76, + "learning_rate": 1.7483752329400065e-06, + "loss": 0.823, + "step": 29720 + }, + { + "epoch": 0.76, + "learning_rate": 1.7483568795168263e-06, + "loss": 0.9033, + "step": 29721 + }, + { + "epoch": 0.76, + "learning_rate": 1.7483385255206633e-06, + "loss": 0.9219, + "step": 29722 + }, + { + "epoch": 0.76, + "learning_rate": 1.748320170951532e-06, + "loss": 0.834, + "step": 29723 + }, + { + "epoch": 0.76, + "learning_rate": 1.7483018158094465e-06, + "loss": 0.9561, + "step": 29724 + }, + { + "epoch": 0.76, + "learning_rate": 1.7482834600944204e-06, + "loss": 0.9629, + "step": 29725 + }, + { + "epoch": 0.76, + "learning_rate": 1.7482651038064685e-06, + "loss": 0.9551, + "step": 29726 + }, + { + "epoch": 0.76, + "learning_rate": 1.748246746945604e-06, + "loss": 0.8301, + "step": 29727 + }, + { + "epoch": 0.76, + "learning_rate": 1.748228389511842e-06, + "loss": 0.6792, + "step": 29728 + }, + { + "epoch": 0.76, + "learning_rate": 1.7482100315051953e-06, + "loss": 0.9243, + "step": 29729 + }, + { + "epoch": 0.76, + "learning_rate": 1.748191672925679e-06, + "loss": 0.8896, + "step": 29730 + }, + { + "epoch": 0.76, + "learning_rate": 1.7481733137733063e-06, + "loss": 0.8984, + "step": 29731 + }, + { + "epoch": 0.76, + "learning_rate": 1.748154954048092e-06, + "loss": 0.9414, + "step": 29732 + }, + { + "epoch": 0.76, + "learning_rate": 1.7481365937500497e-06, + "loss": 0.7822, + "step": 29733 + }, + { + "epoch": 0.76, + "learning_rate": 1.7481182328791934e-06, + "loss": 0.5864, + "step": 29734 + }, + { + "epoch": 0.76, + "learning_rate": 1.7480998714355379e-06, + "loss": 0.7852, + "step": 29735 + }, + { + "epoch": 0.76, + "learning_rate": 1.7480815094190966e-06, + "loss": 0.937, + "step": 29736 + }, + { + "epoch": 0.76, + "learning_rate": 1.7480631468298835e-06, + "loss": 0.9473, + "step": 29737 + }, + { + "epoch": 0.76, + "learning_rate": 1.7480447836679128e-06, + "loss": 1.041, + "step": 29738 + }, + { + "epoch": 0.76, + "learning_rate": 1.7480264199331987e-06, + "loss": 0.8164, + "step": 29739 + }, + { + "epoch": 0.76, + "learning_rate": 1.7480080556257553e-06, + "loss": 0.9004, + "step": 29740 + }, + { + "epoch": 0.76, + "learning_rate": 1.7479896907455962e-06, + "loss": 0.7808, + "step": 29741 + }, + { + "epoch": 0.76, + "learning_rate": 1.747971325292736e-06, + "loss": 0.8369, + "step": 29742 + }, + { + "epoch": 0.76, + "learning_rate": 1.7479529592671885e-06, + "loss": 0.9014, + "step": 29743 + }, + { + "epoch": 0.76, + "learning_rate": 1.747934592668968e-06, + "loss": 0.7783, + "step": 29744 + }, + { + "epoch": 0.76, + "learning_rate": 1.747916225498088e-06, + "loss": 0.8115, + "step": 29745 + }, + { + "epoch": 0.76, + "learning_rate": 1.7478978577545634e-06, + "loss": 0.77, + "step": 29746 + }, + { + "epoch": 0.76, + "learning_rate": 1.7478794894384072e-06, + "loss": 1.0186, + "step": 29747 + }, + { + "epoch": 0.76, + "learning_rate": 1.7478611205496346e-06, + "loss": 0.7617, + "step": 29748 + }, + { + "epoch": 0.76, + "learning_rate": 1.747842751088259e-06, + "loss": 0.9844, + "step": 29749 + }, + { + "epoch": 0.76, + "learning_rate": 1.7478243810542944e-06, + "loss": 0.665, + "step": 29750 + }, + { + "epoch": 0.76, + "learning_rate": 1.7478060104477552e-06, + "loss": 0.9102, + "step": 29751 + }, + { + "epoch": 0.76, + "learning_rate": 1.7477876392686555e-06, + "loss": 0.8818, + "step": 29752 + }, + { + "epoch": 0.76, + "learning_rate": 1.7477692675170088e-06, + "loss": 0.5962, + "step": 29753 + }, + { + "epoch": 0.76, + "learning_rate": 1.7477508951928299e-06, + "loss": 0.9434, + "step": 29754 + }, + { + "epoch": 0.76, + "learning_rate": 1.7477325222961325e-06, + "loss": 0.8555, + "step": 29755 + }, + { + "epoch": 0.76, + "learning_rate": 1.7477141488269304e-06, + "loss": 0.7612, + "step": 29756 + }, + { + "epoch": 0.76, + "learning_rate": 1.7476957747852384e-06, + "loss": 0.6255, + "step": 29757 + }, + { + "epoch": 0.76, + "learning_rate": 1.7476774001710697e-06, + "loss": 1.0117, + "step": 29758 + }, + { + "epoch": 0.76, + "learning_rate": 1.7476590249844389e-06, + "loss": 0.96, + "step": 29759 + }, + { + "epoch": 0.76, + "learning_rate": 1.74764064922536e-06, + "loss": 1.0811, + "step": 29760 + }, + { + "epoch": 0.76, + "learning_rate": 1.747622272893847e-06, + "loss": 0.9346, + "step": 29761 + }, + { + "epoch": 0.76, + "learning_rate": 1.747603895989914e-06, + "loss": 0.7231, + "step": 29762 + }, + { + "epoch": 0.76, + "learning_rate": 1.7475855185135753e-06, + "loss": 0.6377, + "step": 29763 + }, + { + "epoch": 0.76, + "learning_rate": 1.7475671404648445e-06, + "loss": 0.8174, + "step": 29764 + }, + { + "epoch": 0.76, + "learning_rate": 1.7475487618437358e-06, + "loss": 0.8574, + "step": 29765 + }, + { + "epoch": 0.76, + "learning_rate": 1.7475303826502637e-06, + "loss": 0.9795, + "step": 29766 + }, + { + "epoch": 0.76, + "learning_rate": 1.7475120028844419e-06, + "loss": 0.8672, + "step": 29767 + }, + { + "epoch": 0.76, + "learning_rate": 1.747493622546284e-06, + "loss": 0.8604, + "step": 29768 + }, + { + "epoch": 0.76, + "learning_rate": 1.7474752416358055e-06, + "loss": 0.8242, + "step": 29769 + }, + { + "epoch": 0.76, + "learning_rate": 1.747456860153019e-06, + "loss": 0.6777, + "step": 29770 + }, + { + "epoch": 0.76, + "learning_rate": 1.7474384780979393e-06, + "loss": 0.7402, + "step": 29771 + }, + { + "epoch": 0.76, + "learning_rate": 1.7474200954705803e-06, + "loss": 0.7075, + "step": 29772 + }, + { + "epoch": 0.76, + "learning_rate": 1.7474017122709562e-06, + "loss": 0.7068, + "step": 29773 + }, + { + "epoch": 0.76, + "learning_rate": 1.7473833284990808e-06, + "loss": 0.6768, + "step": 29774 + }, + { + "epoch": 0.76, + "learning_rate": 1.7473649441549686e-06, + "loss": 0.71, + "step": 29775 + }, + { + "epoch": 0.76, + "learning_rate": 1.7473465592386331e-06, + "loss": 1.0293, + "step": 29776 + }, + { + "epoch": 0.76, + "learning_rate": 1.747328173750089e-06, + "loss": 0.6071, + "step": 29777 + }, + { + "epoch": 0.76, + "learning_rate": 1.74730978768935e-06, + "loss": 1.002, + "step": 29778 + }, + { + "epoch": 0.76, + "learning_rate": 1.74729140105643e-06, + "loss": 0.6572, + "step": 29779 + }, + { + "epoch": 0.76, + "learning_rate": 1.7472730138513435e-06, + "loss": 0.8477, + "step": 29780 + }, + { + "epoch": 0.76, + "learning_rate": 1.7472546260741045e-06, + "loss": 0.6689, + "step": 29781 + }, + { + "epoch": 0.76, + "learning_rate": 1.747236237724727e-06, + "loss": 0.8203, + "step": 29782 + }, + { + "epoch": 0.76, + "learning_rate": 1.747217848803225e-06, + "loss": 0.8447, + "step": 29783 + }, + { + "epoch": 0.76, + "learning_rate": 1.7471994593096126e-06, + "loss": 0.771, + "step": 29784 + }, + { + "epoch": 0.76, + "learning_rate": 1.7471810692439042e-06, + "loss": 0.8535, + "step": 29785 + }, + { + "epoch": 0.76, + "learning_rate": 1.7471626786061134e-06, + "loss": 0.8516, + "step": 29786 + }, + { + "epoch": 0.76, + "learning_rate": 1.7471442873962543e-06, + "loss": 0.5986, + "step": 29787 + }, + { + "epoch": 0.76, + "learning_rate": 1.7471258956143413e-06, + "loss": 1.0, + "step": 29788 + }, + { + "epoch": 0.76, + "learning_rate": 1.7471075032603885e-06, + "loss": 0.9111, + "step": 29789 + }, + { + "epoch": 0.76, + "learning_rate": 1.74708911033441e-06, + "loss": 0.7559, + "step": 29790 + }, + { + "epoch": 0.76, + "learning_rate": 1.7470707168364195e-06, + "loss": 0.9609, + "step": 29791 + }, + { + "epoch": 0.76, + "learning_rate": 1.747052322766431e-06, + "loss": 1.0625, + "step": 29792 + }, + { + "epoch": 0.76, + "learning_rate": 1.7470339281244592e-06, + "loss": 1.0166, + "step": 29793 + }, + { + "epoch": 0.76, + "learning_rate": 1.747015532910518e-06, + "loss": 0.8174, + "step": 29794 + }, + { + "epoch": 0.76, + "learning_rate": 1.7469971371246213e-06, + "loss": 0.96, + "step": 29795 + }, + { + "epoch": 0.76, + "learning_rate": 1.7469787407667828e-06, + "loss": 0.7593, + "step": 29796 + }, + { + "epoch": 0.76, + "learning_rate": 1.7469603438370174e-06, + "loss": 0.6311, + "step": 29797 + }, + { + "epoch": 0.76, + "learning_rate": 1.746941946335339e-06, + "loss": 0.8613, + "step": 29798 + }, + { + "epoch": 0.76, + "learning_rate": 1.7469235482617612e-06, + "loss": 0.8267, + "step": 29799 + }, + { + "epoch": 0.76, + "learning_rate": 1.7469051496162985e-06, + "loss": 0.6553, + "step": 29800 + }, + { + "epoch": 0.76, + "learning_rate": 1.7468867503989648e-06, + "loss": 0.8535, + "step": 29801 + }, + { + "epoch": 0.76, + "learning_rate": 1.7468683506097743e-06, + "loss": 0.7217, + "step": 29802 + }, + { + "epoch": 0.76, + "learning_rate": 1.746849950248741e-06, + "loss": 0.7896, + "step": 29803 + }, + { + "epoch": 0.76, + "learning_rate": 1.7468315493158793e-06, + "loss": 0.7366, + "step": 29804 + }, + { + "epoch": 0.76, + "learning_rate": 1.7468131478112027e-06, + "loss": 0.8525, + "step": 29805 + }, + { + "epoch": 0.76, + "learning_rate": 1.7467947457347255e-06, + "loss": 0.8135, + "step": 29806 + }, + { + "epoch": 0.76, + "learning_rate": 1.7467763430864624e-06, + "loss": 0.7271, + "step": 29807 + }, + { + "epoch": 0.76, + "learning_rate": 1.7467579398664266e-06, + "loss": 0.8096, + "step": 29808 + }, + { + "epoch": 0.76, + "learning_rate": 1.7467395360746327e-06, + "loss": 0.7397, + "step": 29809 + }, + { + "epoch": 0.76, + "learning_rate": 1.7467211317110946e-06, + "loss": 0.8984, + "step": 29810 + }, + { + "epoch": 0.76, + "learning_rate": 1.7467027267758266e-06, + "loss": 0.7266, + "step": 29811 + }, + { + "epoch": 0.76, + "learning_rate": 1.7466843212688425e-06, + "loss": 0.9678, + "step": 29812 + }, + { + "epoch": 0.76, + "learning_rate": 1.7466659151901566e-06, + "loss": 0.748, + "step": 29813 + }, + { + "epoch": 0.76, + "learning_rate": 1.7466475085397829e-06, + "loss": 0.8936, + "step": 29814 + }, + { + "epoch": 0.76, + "learning_rate": 1.7466291013177358e-06, + "loss": 0.8174, + "step": 29815 + }, + { + "epoch": 0.76, + "learning_rate": 1.7466106935240289e-06, + "loss": 0.8115, + "step": 29816 + }, + { + "epoch": 0.76, + "learning_rate": 1.7465922851586766e-06, + "loss": 0.7314, + "step": 29817 + }, + { + "epoch": 0.76, + "learning_rate": 1.7465738762216927e-06, + "loss": 0.9541, + "step": 29818 + }, + { + "epoch": 0.76, + "learning_rate": 1.7465554667130918e-06, + "loss": 0.9922, + "step": 29819 + }, + { + "epoch": 0.76, + "learning_rate": 1.7465370566328876e-06, + "loss": 0.834, + "step": 29820 + }, + { + "epoch": 0.76, + "learning_rate": 1.7465186459810942e-06, + "loss": 1.0449, + "step": 29821 + }, + { + "epoch": 0.76, + "learning_rate": 1.7465002347577257e-06, + "loss": 0.7734, + "step": 29822 + }, + { + "epoch": 0.76, + "learning_rate": 1.7464818229627966e-06, + "loss": 0.6428, + "step": 29823 + }, + { + "epoch": 0.76, + "learning_rate": 1.7464634105963207e-06, + "loss": 0.8813, + "step": 29824 + }, + { + "epoch": 0.76, + "learning_rate": 1.7464449976583119e-06, + "loss": 0.8062, + "step": 29825 + }, + { + "epoch": 0.76, + "learning_rate": 1.7464265841487845e-06, + "loss": 0.8115, + "step": 29826 + }, + { + "epoch": 0.76, + "learning_rate": 1.7464081700677528e-06, + "loss": 0.7783, + "step": 29827 + }, + { + "epoch": 0.76, + "learning_rate": 1.7463897554152305e-06, + "loss": 0.9531, + "step": 29828 + }, + { + "epoch": 0.76, + "learning_rate": 1.7463713401912318e-06, + "loss": 0.8037, + "step": 29829 + }, + { + "epoch": 0.76, + "learning_rate": 1.746352924395771e-06, + "loss": 0.9043, + "step": 29830 + }, + { + "epoch": 0.76, + "learning_rate": 1.7463345080288622e-06, + "loss": 0.7769, + "step": 29831 + }, + { + "epoch": 0.76, + "learning_rate": 1.7463160910905192e-06, + "loss": 0.6768, + "step": 29832 + }, + { + "epoch": 0.76, + "learning_rate": 1.7462976735807561e-06, + "loss": 1.0225, + "step": 29833 + }, + { + "epoch": 0.76, + "learning_rate": 1.7462792554995876e-06, + "loss": 0.7656, + "step": 29834 + }, + { + "epoch": 0.76, + "learning_rate": 1.7462608368470272e-06, + "loss": 0.7314, + "step": 29835 + }, + { + "epoch": 0.76, + "learning_rate": 1.7462424176230892e-06, + "loss": 0.9121, + "step": 29836 + }, + { + "epoch": 0.76, + "learning_rate": 1.7462239978277877e-06, + "loss": 0.646, + "step": 29837 + }, + { + "epoch": 0.76, + "learning_rate": 1.746205577461137e-06, + "loss": 0.6738, + "step": 29838 + }, + { + "epoch": 0.76, + "learning_rate": 1.7461871565231507e-06, + "loss": 0.8467, + "step": 29839 + }, + { + "epoch": 0.76, + "learning_rate": 1.7461687350138434e-06, + "loss": 0.7559, + "step": 29840 + }, + { + "epoch": 0.76, + "learning_rate": 1.7461503129332286e-06, + "loss": 0.957, + "step": 29841 + }, + { + "epoch": 0.76, + "learning_rate": 1.7461318902813214e-06, + "loss": 0.8384, + "step": 29842 + }, + { + "epoch": 0.76, + "learning_rate": 1.746113467058135e-06, + "loss": 0.6167, + "step": 29843 + }, + { + "epoch": 0.76, + "learning_rate": 1.746095043263684e-06, + "loss": 0.8359, + "step": 29844 + }, + { + "epoch": 0.76, + "learning_rate": 1.7460766188979822e-06, + "loss": 0.9277, + "step": 29845 + }, + { + "epoch": 0.76, + "learning_rate": 1.7460581939610438e-06, + "loss": 0.7959, + "step": 29846 + }, + { + "epoch": 0.76, + "learning_rate": 1.7460397684528828e-06, + "loss": 0.7222, + "step": 29847 + }, + { + "epoch": 0.77, + "learning_rate": 1.7460213423735138e-06, + "loss": 0.7222, + "step": 29848 + }, + { + "epoch": 0.77, + "learning_rate": 1.7460029157229504e-06, + "loss": 0.8032, + "step": 29849 + }, + { + "epoch": 0.77, + "learning_rate": 1.745984488501207e-06, + "loss": 0.5918, + "step": 29850 + }, + { + "epoch": 0.77, + "learning_rate": 1.7459660607082974e-06, + "loss": 0.8516, + "step": 29851 + }, + { + "epoch": 0.77, + "learning_rate": 1.745947632344236e-06, + "loss": 0.8623, + "step": 29852 + }, + { + "epoch": 0.77, + "learning_rate": 1.7459292034090365e-06, + "loss": 0.5393, + "step": 29853 + }, + { + "epoch": 0.77, + "learning_rate": 1.7459107739027136e-06, + "loss": 0.8398, + "step": 29854 + }, + { + "epoch": 0.77, + "learning_rate": 1.745892343825281e-06, + "loss": 0.9502, + "step": 29855 + }, + { + "epoch": 0.77, + "learning_rate": 1.7458739131767531e-06, + "loss": 0.7354, + "step": 29856 + }, + { + "epoch": 0.77, + "learning_rate": 1.7458554819571437e-06, + "loss": 0.8062, + "step": 29857 + }, + { + "epoch": 0.77, + "learning_rate": 1.7458370501664672e-06, + "loss": 1.0176, + "step": 29858 + }, + { + "epoch": 0.77, + "learning_rate": 1.7458186178047374e-06, + "loss": 0.8369, + "step": 29859 + }, + { + "epoch": 0.77, + "learning_rate": 1.7458001848719687e-06, + "loss": 0.9443, + "step": 29860 + }, + { + "epoch": 0.77, + "learning_rate": 1.7457817513681748e-06, + "loss": 1.0635, + "step": 29861 + }, + { + "epoch": 0.77, + "learning_rate": 1.7457633172933704e-06, + "loss": 0.8076, + "step": 29862 + }, + { + "epoch": 0.77, + "learning_rate": 1.7457448826475694e-06, + "loss": 0.8193, + "step": 29863 + }, + { + "epoch": 0.77, + "learning_rate": 1.7457264474307855e-06, + "loss": 0.9805, + "step": 29864 + }, + { + "epoch": 0.77, + "learning_rate": 1.7457080116430333e-06, + "loss": 0.6702, + "step": 29865 + }, + { + "epoch": 0.77, + "learning_rate": 1.7456895752843268e-06, + "loss": 0.7588, + "step": 29866 + }, + { + "epoch": 0.77, + "learning_rate": 1.7456711383546802e-06, + "loss": 0.811, + "step": 29867 + }, + { + "epoch": 0.77, + "learning_rate": 1.7456527008541074e-06, + "loss": 0.9297, + "step": 29868 + }, + { + "epoch": 0.77, + "learning_rate": 1.7456342627826227e-06, + "loss": 0.7451, + "step": 29869 + }, + { + "epoch": 0.77, + "learning_rate": 1.74561582414024e-06, + "loss": 0.6326, + "step": 29870 + }, + { + "epoch": 0.77, + "learning_rate": 1.7455973849269735e-06, + "loss": 0.7314, + "step": 29871 + }, + { + "epoch": 0.77, + "learning_rate": 1.7455789451428373e-06, + "loss": 0.5981, + "step": 29872 + }, + { + "epoch": 0.77, + "learning_rate": 1.7455605047878458e-06, + "loss": 0.7852, + "step": 29873 + }, + { + "epoch": 0.77, + "learning_rate": 1.7455420638620128e-06, + "loss": 0.8359, + "step": 29874 + }, + { + "epoch": 0.77, + "learning_rate": 1.7455236223653524e-06, + "loss": 0.9395, + "step": 29875 + }, + { + "epoch": 0.77, + "learning_rate": 1.745505180297879e-06, + "loss": 1.127, + "step": 29876 + }, + { + "epoch": 0.77, + "learning_rate": 1.7454867376596067e-06, + "loss": 0.7246, + "step": 29877 + }, + { + "epoch": 0.77, + "learning_rate": 1.7454682944505491e-06, + "loss": 1.0547, + "step": 29878 + }, + { + "epoch": 0.77, + "learning_rate": 1.7454498506707212e-06, + "loss": 1.082, + "step": 29879 + }, + { + "epoch": 0.77, + "learning_rate": 1.7454314063201362e-06, + "loss": 0.9951, + "step": 29880 + }, + { + "epoch": 0.77, + "learning_rate": 1.745412961398809e-06, + "loss": 0.9941, + "step": 29881 + }, + { + "epoch": 0.77, + "learning_rate": 1.745394515906753e-06, + "loss": 0.9307, + "step": 29882 + }, + { + "epoch": 0.77, + "learning_rate": 1.7453760698439827e-06, + "loss": 0.7988, + "step": 29883 + }, + { + "epoch": 0.77, + "learning_rate": 1.7453576232105124e-06, + "loss": 0.7881, + "step": 29884 + }, + { + "epoch": 0.77, + "learning_rate": 1.745339176006356e-06, + "loss": 0.9463, + "step": 29885 + }, + { + "epoch": 0.77, + "learning_rate": 1.7453207282315278e-06, + "loss": 0.8535, + "step": 29886 + }, + { + "epoch": 0.77, + "learning_rate": 1.7453022798860417e-06, + "loss": 1.0156, + "step": 29887 + }, + { + "epoch": 0.77, + "learning_rate": 1.745283830969912e-06, + "loss": 0.8672, + "step": 29888 + }, + { + "epoch": 0.77, + "learning_rate": 1.7452653814831524e-06, + "loss": 0.6631, + "step": 29889 + }, + { + "epoch": 0.77, + "learning_rate": 1.7452469314257775e-06, + "loss": 0.9512, + "step": 29890 + }, + { + "epoch": 0.77, + "learning_rate": 1.7452284807978015e-06, + "loss": 0.9307, + "step": 29891 + }, + { + "epoch": 0.77, + "learning_rate": 1.7452100295992382e-06, + "loss": 0.7808, + "step": 29892 + }, + { + "epoch": 0.77, + "learning_rate": 1.7451915778301021e-06, + "loss": 0.6035, + "step": 29893 + }, + { + "epoch": 0.77, + "learning_rate": 1.7451731254904067e-06, + "loss": 0.9062, + "step": 29894 + }, + { + "epoch": 0.77, + "learning_rate": 1.7451546725801667e-06, + "loss": 0.9502, + "step": 29895 + }, + { + "epoch": 0.77, + "learning_rate": 1.745136219099396e-06, + "loss": 0.4932, + "step": 29896 + }, + { + "epoch": 0.77, + "learning_rate": 1.7451177650481087e-06, + "loss": 0.9023, + "step": 29897 + }, + { + "epoch": 0.77, + "learning_rate": 1.745099310426319e-06, + "loss": 0.8926, + "step": 29898 + }, + { + "epoch": 0.77, + "learning_rate": 1.745080855234041e-06, + "loss": 1.0068, + "step": 29899 + }, + { + "epoch": 0.77, + "learning_rate": 1.7450623994712888e-06, + "loss": 0.7202, + "step": 29900 + }, + { + "epoch": 0.77, + "learning_rate": 1.7450439431380768e-06, + "loss": 0.9067, + "step": 29901 + }, + { + "epoch": 0.77, + "learning_rate": 1.7450254862344186e-06, + "loss": 0.8398, + "step": 29902 + }, + { + "epoch": 0.77, + "learning_rate": 1.7450070287603289e-06, + "loss": 0.7612, + "step": 29903 + }, + { + "epoch": 0.77, + "learning_rate": 1.7449885707158215e-06, + "loss": 0.7778, + "step": 29904 + }, + { + "epoch": 0.77, + "learning_rate": 1.7449701121009107e-06, + "loss": 0.8008, + "step": 29905 + }, + { + "epoch": 0.77, + "learning_rate": 1.7449516529156104e-06, + "loss": 1.0, + "step": 29906 + }, + { + "epoch": 0.77, + "learning_rate": 1.7449331931599347e-06, + "loss": 0.7734, + "step": 29907 + }, + { + "epoch": 0.77, + "learning_rate": 1.7449147328338983e-06, + "loss": 0.7949, + "step": 29908 + }, + { + "epoch": 0.77, + "learning_rate": 1.7448962719375146e-06, + "loss": 0.7424, + "step": 29909 + }, + { + "epoch": 0.77, + "learning_rate": 1.7448778104707983e-06, + "loss": 1.1328, + "step": 29910 + }, + { + "epoch": 0.77, + "learning_rate": 1.7448593484337632e-06, + "loss": 0.5593, + "step": 29911 + }, + { + "epoch": 0.77, + "learning_rate": 1.7448408858264236e-06, + "loss": 0.833, + "step": 29912 + }, + { + "epoch": 0.77, + "learning_rate": 1.7448224226487936e-06, + "loss": 0.7529, + "step": 29913 + }, + { + "epoch": 0.77, + "learning_rate": 1.7448039589008873e-06, + "loss": 0.9893, + "step": 29914 + }, + { + "epoch": 0.77, + "learning_rate": 1.744785494582719e-06, + "loss": 0.9951, + "step": 29915 + }, + { + "epoch": 0.77, + "learning_rate": 1.7447670296943025e-06, + "loss": 0.7666, + "step": 29916 + }, + { + "epoch": 0.77, + "learning_rate": 1.7447485642356522e-06, + "loss": 0.873, + "step": 29917 + }, + { + "epoch": 0.77, + "learning_rate": 1.7447300982067818e-06, + "loss": 0.7261, + "step": 29918 + }, + { + "epoch": 0.77, + "learning_rate": 1.7447116316077063e-06, + "loss": 1.0508, + "step": 29919 + }, + { + "epoch": 0.77, + "learning_rate": 1.744693164438439e-06, + "loss": 0.9287, + "step": 29920 + }, + { + "epoch": 0.77, + "learning_rate": 1.7446746966989948e-06, + "loss": 0.7476, + "step": 29921 + }, + { + "epoch": 0.77, + "learning_rate": 1.744656228389387e-06, + "loss": 0.8433, + "step": 29922 + }, + { + "epoch": 0.77, + "learning_rate": 1.7446377595096304e-06, + "loss": 0.8926, + "step": 29923 + }, + { + "epoch": 0.77, + "learning_rate": 1.744619290059739e-06, + "loss": 0.8047, + "step": 29924 + }, + { + "epoch": 0.77, + "learning_rate": 1.7446008200397267e-06, + "loss": 0.9526, + "step": 29925 + }, + { + "epoch": 0.77, + "learning_rate": 1.7445823494496076e-06, + "loss": 0.8037, + "step": 29926 + }, + { + "epoch": 0.77, + "learning_rate": 1.7445638782893965e-06, + "loss": 1.0908, + "step": 29927 + }, + { + "epoch": 0.77, + "learning_rate": 1.7445454065591067e-06, + "loss": 0.9551, + "step": 29928 + }, + { + "epoch": 0.77, + "learning_rate": 1.744526934258753e-06, + "loss": 1.1055, + "step": 29929 + }, + { + "epoch": 0.77, + "learning_rate": 1.744508461388349e-06, + "loss": 0.9199, + "step": 29930 + }, + { + "epoch": 0.77, + "learning_rate": 1.744489987947909e-06, + "loss": 0.7983, + "step": 29931 + }, + { + "epoch": 0.77, + "learning_rate": 1.7444715139374475e-06, + "loss": 1.0137, + "step": 29932 + }, + { + "epoch": 0.77, + "learning_rate": 1.7444530393569784e-06, + "loss": 0.9023, + "step": 29933 + }, + { + "epoch": 0.77, + "learning_rate": 1.744434564206516e-06, + "loss": 0.8413, + "step": 29934 + }, + { + "epoch": 0.77, + "learning_rate": 1.744416088486074e-06, + "loss": 0.8428, + "step": 29935 + }, + { + "epoch": 0.77, + "learning_rate": 1.7443976121956667e-06, + "loss": 0.8252, + "step": 29936 + }, + { + "epoch": 0.77, + "learning_rate": 1.7443791353353086e-06, + "loss": 0.9414, + "step": 29937 + }, + { + "epoch": 0.77, + "learning_rate": 1.7443606579050137e-06, + "loss": 1.0234, + "step": 29938 + }, + { + "epoch": 0.77, + "learning_rate": 1.744342179904796e-06, + "loss": 0.6484, + "step": 29939 + }, + { + "epoch": 0.77, + "learning_rate": 1.7443237013346696e-06, + "loss": 0.6494, + "step": 29940 + }, + { + "epoch": 0.77, + "learning_rate": 1.744305222194649e-06, + "loss": 0.7832, + "step": 29941 + }, + { + "epoch": 0.77, + "learning_rate": 1.744286742484748e-06, + "loss": 1.0371, + "step": 29942 + }, + { + "epoch": 0.77, + "learning_rate": 1.7442682622049807e-06, + "loss": 0.8955, + "step": 29943 + }, + { + "epoch": 0.77, + "learning_rate": 1.7442497813553617e-06, + "loss": 0.6309, + "step": 29944 + }, + { + "epoch": 0.77, + "learning_rate": 1.7442312999359046e-06, + "loss": 0.9629, + "step": 29945 + }, + { + "epoch": 0.77, + "learning_rate": 1.7442128179466239e-06, + "loss": 0.9639, + "step": 29946 + }, + { + "epoch": 0.77, + "learning_rate": 1.7441943353875335e-06, + "loss": 0.7236, + "step": 29947 + }, + { + "epoch": 0.77, + "learning_rate": 1.7441758522586481e-06, + "loss": 0.8506, + "step": 29948 + }, + { + "epoch": 0.77, + "learning_rate": 1.744157368559981e-06, + "loss": 1.002, + "step": 29949 + }, + { + "epoch": 0.77, + "learning_rate": 1.7441388842915474e-06, + "loss": 0.9414, + "step": 29950 + }, + { + "epoch": 0.77, + "learning_rate": 1.7441203994533604e-06, + "loss": 0.6055, + "step": 29951 + }, + { + "epoch": 0.77, + "learning_rate": 1.744101914045435e-06, + "loss": 0.9619, + "step": 29952 + }, + { + "epoch": 0.77, + "learning_rate": 1.7440834280677844e-06, + "loss": 0.8281, + "step": 29953 + }, + { + "epoch": 0.77, + "learning_rate": 1.744064941520424e-06, + "loss": 0.7891, + "step": 29954 + }, + { + "epoch": 0.77, + "learning_rate": 1.744046454403367e-06, + "loss": 0.8262, + "step": 29955 + }, + { + "epoch": 0.77, + "learning_rate": 1.7440279667166277e-06, + "loss": 0.8477, + "step": 29956 + }, + { + "epoch": 0.77, + "learning_rate": 1.7440094784602206e-06, + "loss": 0.7871, + "step": 29957 + }, + { + "epoch": 0.77, + "learning_rate": 1.7439909896341596e-06, + "loss": 0.8604, + "step": 29958 + }, + { + "epoch": 0.77, + "learning_rate": 1.743972500238459e-06, + "loss": 1.0059, + "step": 29959 + }, + { + "epoch": 0.77, + "learning_rate": 1.7439540102731325e-06, + "loss": 0.8955, + "step": 29960 + }, + { + "epoch": 0.77, + "learning_rate": 1.743935519738195e-06, + "loss": 0.6138, + "step": 29961 + }, + { + "epoch": 0.77, + "learning_rate": 1.7439170286336601e-06, + "loss": 0.9482, + "step": 29962 + }, + { + "epoch": 0.77, + "learning_rate": 1.7438985369595424e-06, + "loss": 0.874, + "step": 29963 + }, + { + "epoch": 0.77, + "learning_rate": 1.7438800447158553e-06, + "loss": 0.8545, + "step": 29964 + }, + { + "epoch": 0.77, + "learning_rate": 1.7438615519026139e-06, + "loss": 0.7124, + "step": 29965 + }, + { + "epoch": 0.77, + "learning_rate": 1.7438430585198316e-06, + "loss": 0.7646, + "step": 29966 + }, + { + "epoch": 0.77, + "learning_rate": 1.7438245645675232e-06, + "loss": 0.958, + "step": 29967 + }, + { + "epoch": 0.77, + "learning_rate": 1.7438060700457022e-06, + "loss": 0.5366, + "step": 29968 + }, + { + "epoch": 0.77, + "learning_rate": 1.7437875749543833e-06, + "loss": 0.8408, + "step": 29969 + }, + { + "epoch": 0.77, + "learning_rate": 1.7437690792935805e-06, + "loss": 0.6396, + "step": 29970 + }, + { + "epoch": 0.77, + "learning_rate": 1.7437505830633076e-06, + "loss": 0.9971, + "step": 29971 + }, + { + "epoch": 0.77, + "learning_rate": 1.7437320862635793e-06, + "loss": 0.9893, + "step": 29972 + }, + { + "epoch": 0.77, + "learning_rate": 1.7437135888944097e-06, + "loss": 0.7593, + "step": 29973 + }, + { + "epoch": 0.77, + "learning_rate": 1.7436950909558128e-06, + "loss": 0.874, + "step": 29974 + }, + { + "epoch": 0.77, + "learning_rate": 1.7436765924478025e-06, + "loss": 0.728, + "step": 29975 + }, + { + "epoch": 0.77, + "learning_rate": 1.7436580933703936e-06, + "loss": 0.6943, + "step": 29976 + }, + { + "epoch": 0.77, + "learning_rate": 1.7436395937235996e-06, + "loss": 0.9238, + "step": 29977 + }, + { + "epoch": 0.77, + "learning_rate": 1.7436210935074347e-06, + "loss": 0.793, + "step": 29978 + }, + { + "epoch": 0.77, + "learning_rate": 1.7436025927219137e-06, + "loss": 0.7437, + "step": 29979 + }, + { + "epoch": 0.77, + "learning_rate": 1.7435840913670504e-06, + "loss": 0.8682, + "step": 29980 + }, + { + "epoch": 0.77, + "learning_rate": 1.7435655894428586e-06, + "loss": 0.5166, + "step": 29981 + }, + { + "epoch": 0.77, + "learning_rate": 1.7435470869493533e-06, + "loss": 0.9609, + "step": 29982 + }, + { + "epoch": 0.77, + "learning_rate": 1.7435285838865478e-06, + "loss": 0.7979, + "step": 29983 + }, + { + "epoch": 0.77, + "learning_rate": 1.7435100802544568e-06, + "loss": 0.8105, + "step": 29984 + }, + { + "epoch": 0.77, + "learning_rate": 1.7434915760530944e-06, + "loss": 0.9551, + "step": 29985 + }, + { + "epoch": 0.77, + "learning_rate": 1.7434730712824746e-06, + "loss": 0.6812, + "step": 29986 + }, + { + "epoch": 0.77, + "learning_rate": 1.7434545659426117e-06, + "loss": 0.6943, + "step": 29987 + }, + { + "epoch": 0.77, + "learning_rate": 1.74343606003352e-06, + "loss": 0.9707, + "step": 29988 + }, + { + "epoch": 0.77, + "learning_rate": 1.743417553555213e-06, + "loss": 0.9004, + "step": 29989 + }, + { + "epoch": 0.77, + "learning_rate": 1.7433990465077057e-06, + "loss": 0.9434, + "step": 29990 + }, + { + "epoch": 0.77, + "learning_rate": 1.743380538891012e-06, + "loss": 0.8809, + "step": 29991 + }, + { + "epoch": 0.77, + "learning_rate": 1.7433620307051458e-06, + "loss": 0.7568, + "step": 29992 + }, + { + "epoch": 0.77, + "learning_rate": 1.7433435219501214e-06, + "loss": 0.8203, + "step": 29993 + }, + { + "epoch": 0.77, + "learning_rate": 1.743325012625953e-06, + "loss": 0.8721, + "step": 29994 + }, + { + "epoch": 0.77, + "learning_rate": 1.7433065027326553e-06, + "loss": 0.7441, + "step": 29995 + }, + { + "epoch": 0.77, + "learning_rate": 1.7432879922702416e-06, + "loss": 0.9316, + "step": 29996 + }, + { + "epoch": 0.77, + "learning_rate": 1.7432694812387267e-06, + "loss": 0.7119, + "step": 29997 + }, + { + "epoch": 0.77, + "learning_rate": 1.7432509696381244e-06, + "loss": 0.8809, + "step": 29998 + }, + { + "epoch": 0.77, + "learning_rate": 1.743232457468449e-06, + "loss": 0.96, + "step": 29999 + }, + { + "epoch": 0.77, + "learning_rate": 1.7432139447297147e-06, + "loss": 0.6895, + "step": 30000 + }, + { + "epoch": 0.77, + "learning_rate": 1.7431954314219354e-06, + "loss": 0.73, + "step": 30001 + }, + { + "epoch": 0.77, + "learning_rate": 1.7431769175451262e-06, + "loss": 0.8896, + "step": 30002 + }, + { + "epoch": 0.77, + "learning_rate": 1.7431584030992999e-06, + "loss": 0.8604, + "step": 30003 + }, + { + "epoch": 0.77, + "learning_rate": 1.7431398880844718e-06, + "loss": 0.9375, + "step": 30004 + }, + { + "epoch": 0.77, + "learning_rate": 1.7431213725006555e-06, + "loss": 1.0127, + "step": 30005 + }, + { + "epoch": 0.77, + "learning_rate": 1.7431028563478653e-06, + "loss": 0.9746, + "step": 30006 + }, + { + "epoch": 0.77, + "learning_rate": 1.7430843396261155e-06, + "loss": 1.0654, + "step": 30007 + }, + { + "epoch": 0.77, + "learning_rate": 1.7430658223354202e-06, + "loss": 0.8325, + "step": 30008 + }, + { + "epoch": 0.77, + "learning_rate": 1.7430473044757934e-06, + "loss": 0.8613, + "step": 30009 + }, + { + "epoch": 0.77, + "learning_rate": 1.7430287860472497e-06, + "loss": 0.7666, + "step": 30010 + }, + { + "epoch": 0.77, + "learning_rate": 1.7430102670498027e-06, + "loss": 0.9316, + "step": 30011 + }, + { + "epoch": 0.77, + "learning_rate": 1.742991747483467e-06, + "loss": 0.8403, + "step": 30012 + }, + { + "epoch": 0.77, + "learning_rate": 1.742973227348257e-06, + "loss": 0.8047, + "step": 30013 + }, + { + "epoch": 0.77, + "learning_rate": 1.7429547066441862e-06, + "loss": 0.8672, + "step": 30014 + }, + { + "epoch": 0.77, + "learning_rate": 1.742936185371269e-06, + "loss": 1.0479, + "step": 30015 + }, + { + "epoch": 0.77, + "learning_rate": 1.7429176635295204e-06, + "loss": 0.8672, + "step": 30016 + }, + { + "epoch": 0.77, + "learning_rate": 1.7428991411189535e-06, + "loss": 0.792, + "step": 30017 + }, + { + "epoch": 0.77, + "learning_rate": 1.742880618139583e-06, + "loss": 1.0469, + "step": 30018 + }, + { + "epoch": 0.77, + "learning_rate": 1.7428620945914228e-06, + "loss": 0.9912, + "step": 30019 + }, + { + "epoch": 0.77, + "learning_rate": 1.7428435704744873e-06, + "loss": 0.9141, + "step": 30020 + }, + { + "epoch": 0.77, + "learning_rate": 1.7428250457887907e-06, + "loss": 0.8887, + "step": 30021 + }, + { + "epoch": 0.77, + "learning_rate": 1.742806520534347e-06, + "loss": 0.9609, + "step": 30022 + }, + { + "epoch": 0.77, + "learning_rate": 1.7427879947111705e-06, + "loss": 0.7607, + "step": 30023 + }, + { + "epoch": 0.77, + "learning_rate": 1.7427694683192758e-06, + "loss": 0.9001, + "step": 30024 + }, + { + "epoch": 0.77, + "learning_rate": 1.742750941358676e-06, + "loss": 0.9395, + "step": 30025 + }, + { + "epoch": 0.77, + "learning_rate": 1.7427324138293865e-06, + "loss": 0.6309, + "step": 30026 + }, + { + "epoch": 0.77, + "learning_rate": 1.7427138857314207e-06, + "loss": 0.9854, + "step": 30027 + }, + { + "epoch": 0.77, + "learning_rate": 1.742695357064793e-06, + "loss": 0.7715, + "step": 30028 + }, + { + "epoch": 0.77, + "learning_rate": 1.7426768278295175e-06, + "loss": 0.5098, + "step": 30029 + }, + { + "epoch": 0.77, + "learning_rate": 1.742658298025609e-06, + "loss": 0.8594, + "step": 30030 + }, + { + "epoch": 0.77, + "learning_rate": 1.7426397676530806e-06, + "loss": 0.6719, + "step": 30031 + }, + { + "epoch": 0.77, + "learning_rate": 1.7426212367119475e-06, + "loss": 1.0283, + "step": 30032 + }, + { + "epoch": 0.77, + "learning_rate": 1.7426027052022234e-06, + "loss": 0.8555, + "step": 30033 + }, + { + "epoch": 0.77, + "learning_rate": 1.7425841731239223e-06, + "loss": 0.8174, + "step": 30034 + }, + { + "epoch": 0.77, + "learning_rate": 1.7425656404770588e-06, + "loss": 0.9258, + "step": 30035 + }, + { + "epoch": 0.77, + "learning_rate": 1.7425471072616471e-06, + "loss": 0.9824, + "step": 30036 + }, + { + "epoch": 0.77, + "learning_rate": 1.7425285734777008e-06, + "loss": 0.9385, + "step": 30037 + }, + { + "epoch": 0.77, + "learning_rate": 1.742510039125235e-06, + "loss": 1.1328, + "step": 30038 + }, + { + "epoch": 0.77, + "learning_rate": 1.7424915042042632e-06, + "loss": 0.9463, + "step": 30039 + }, + { + "epoch": 0.77, + "learning_rate": 1.7424729687147997e-06, + "loss": 1.1299, + "step": 30040 + }, + { + "epoch": 0.77, + "learning_rate": 1.742454432656859e-06, + "loss": 0.8906, + "step": 30041 + }, + { + "epoch": 0.77, + "learning_rate": 1.7424358960304549e-06, + "loss": 0.8525, + "step": 30042 + }, + { + "epoch": 0.77, + "learning_rate": 1.7424173588356017e-06, + "loss": 1.0215, + "step": 30043 + }, + { + "epoch": 0.77, + "learning_rate": 1.7423988210723136e-06, + "loss": 0.9785, + "step": 30044 + }, + { + "epoch": 0.77, + "learning_rate": 1.7423802827406052e-06, + "loss": 1.0156, + "step": 30045 + }, + { + "epoch": 0.77, + "learning_rate": 1.7423617438404903e-06, + "loss": 0.9365, + "step": 30046 + }, + { + "epoch": 0.77, + "learning_rate": 1.7423432043719833e-06, + "loss": 0.7378, + "step": 30047 + }, + { + "epoch": 0.77, + "learning_rate": 1.7423246643350978e-06, + "loss": 0.96, + "step": 30048 + }, + { + "epoch": 0.77, + "learning_rate": 1.7423061237298486e-06, + "loss": 0.7695, + "step": 30049 + }, + { + "epoch": 0.77, + "learning_rate": 1.7422875825562498e-06, + "loss": 0.7852, + "step": 30050 + }, + { + "epoch": 0.77, + "learning_rate": 1.7422690408143154e-06, + "loss": 1.0078, + "step": 30051 + }, + { + "epoch": 0.77, + "learning_rate": 1.74225049850406e-06, + "loss": 0.8975, + "step": 30052 + }, + { + "epoch": 0.77, + "learning_rate": 1.7422319556254972e-06, + "loss": 0.8242, + "step": 30053 + }, + { + "epoch": 0.77, + "learning_rate": 1.7422134121786415e-06, + "loss": 0.6711, + "step": 30054 + }, + { + "epoch": 0.77, + "learning_rate": 1.7421948681635075e-06, + "loss": 0.8564, + "step": 30055 + }, + { + "epoch": 0.77, + "learning_rate": 1.7421763235801085e-06, + "loss": 0.8779, + "step": 30056 + }, + { + "epoch": 0.77, + "learning_rate": 1.7421577784284595e-06, + "loss": 1.0498, + "step": 30057 + }, + { + "epoch": 0.77, + "learning_rate": 1.7421392327085746e-06, + "loss": 0.8994, + "step": 30058 + }, + { + "epoch": 0.77, + "learning_rate": 1.7421206864204679e-06, + "loss": 0.8682, + "step": 30059 + }, + { + "epoch": 0.77, + "learning_rate": 1.742102139564153e-06, + "loss": 0.6389, + "step": 30060 + }, + { + "epoch": 0.77, + "learning_rate": 1.7420835921396448e-06, + "loss": 0.9697, + "step": 30061 + }, + { + "epoch": 0.77, + "learning_rate": 1.7420650441469573e-06, + "loss": 0.6621, + "step": 30062 + }, + { + "epoch": 0.77, + "learning_rate": 1.7420464955861049e-06, + "loss": 0.9287, + "step": 30063 + }, + { + "epoch": 0.77, + "learning_rate": 1.7420279464571017e-06, + "loss": 0.8994, + "step": 30064 + }, + { + "epoch": 0.77, + "learning_rate": 1.7420093967599616e-06, + "loss": 0.9678, + "step": 30065 + }, + { + "epoch": 0.77, + "learning_rate": 1.741990846494699e-06, + "loss": 0.8489, + "step": 30066 + }, + { + "epoch": 0.77, + "learning_rate": 1.7419722956613284e-06, + "loss": 0.9453, + "step": 30067 + }, + { + "epoch": 0.77, + "learning_rate": 1.7419537442598633e-06, + "loss": 0.728, + "step": 30068 + }, + { + "epoch": 0.77, + "learning_rate": 1.7419351922903184e-06, + "loss": 0.8184, + "step": 30069 + }, + { + "epoch": 0.77, + "learning_rate": 1.7419166397527083e-06, + "loss": 0.8877, + "step": 30070 + }, + { + "epoch": 0.77, + "learning_rate": 1.7418980866470464e-06, + "loss": 0.6064, + "step": 30071 + }, + { + "epoch": 0.77, + "learning_rate": 1.741879532973347e-06, + "loss": 0.8477, + "step": 30072 + }, + { + "epoch": 0.77, + "learning_rate": 1.741860978731625e-06, + "loss": 0.7124, + "step": 30073 + }, + { + "epoch": 0.77, + "learning_rate": 1.741842423921894e-06, + "loss": 0.7188, + "step": 30074 + }, + { + "epoch": 0.77, + "learning_rate": 1.7418238685441684e-06, + "loss": 0.6265, + "step": 30075 + }, + { + "epoch": 0.77, + "learning_rate": 1.7418053125984624e-06, + "loss": 0.6475, + "step": 30076 + }, + { + "epoch": 0.77, + "learning_rate": 1.7417867560847901e-06, + "loss": 0.6787, + "step": 30077 + }, + { + "epoch": 0.77, + "learning_rate": 1.741768199003166e-06, + "loss": 0.9756, + "step": 30078 + }, + { + "epoch": 0.77, + "learning_rate": 1.7417496413536034e-06, + "loss": 1.0234, + "step": 30079 + }, + { + "epoch": 0.77, + "learning_rate": 1.741731083136118e-06, + "loss": 0.9351, + "step": 30080 + }, + { + "epoch": 0.77, + "learning_rate": 1.741712524350723e-06, + "loss": 0.9102, + "step": 30081 + }, + { + "epoch": 0.77, + "learning_rate": 1.7416939649974327e-06, + "loss": 1.0098, + "step": 30082 + }, + { + "epoch": 0.77, + "learning_rate": 1.7416754050762612e-06, + "loss": 0.8119, + "step": 30083 + }, + { + "epoch": 0.77, + "learning_rate": 1.7416568445872235e-06, + "loss": 0.8242, + "step": 30084 + }, + { + "epoch": 0.77, + "learning_rate": 1.7416382835303329e-06, + "loss": 0.917, + "step": 30085 + }, + { + "epoch": 0.77, + "learning_rate": 1.741619721905604e-06, + "loss": 1.0117, + "step": 30086 + }, + { + "epoch": 0.77, + "learning_rate": 1.741601159713051e-06, + "loss": 0.916, + "step": 30087 + }, + { + "epoch": 0.77, + "learning_rate": 1.7415825969526882e-06, + "loss": 0.6831, + "step": 30088 + }, + { + "epoch": 0.77, + "learning_rate": 1.7415640336245297e-06, + "loss": 0.9668, + "step": 30089 + }, + { + "epoch": 0.77, + "learning_rate": 1.7415454697285896e-06, + "loss": 0.8506, + "step": 30090 + }, + { + "epoch": 0.77, + "learning_rate": 1.7415269052648825e-06, + "loss": 0.9053, + "step": 30091 + }, + { + "epoch": 0.77, + "learning_rate": 1.7415083402334219e-06, + "loss": 0.7109, + "step": 30092 + }, + { + "epoch": 0.77, + "learning_rate": 1.7414897746342226e-06, + "loss": 1.0107, + "step": 30093 + }, + { + "epoch": 0.77, + "learning_rate": 1.741471208467299e-06, + "loss": 0.7842, + "step": 30094 + }, + { + "epoch": 0.77, + "learning_rate": 1.7414526417326645e-06, + "loss": 0.7759, + "step": 30095 + }, + { + "epoch": 0.77, + "learning_rate": 1.7414340744303341e-06, + "loss": 0.9102, + "step": 30096 + }, + { + "epoch": 0.77, + "learning_rate": 1.7414155065603217e-06, + "loss": 0.7686, + "step": 30097 + }, + { + "epoch": 0.77, + "learning_rate": 1.7413969381226416e-06, + "loss": 0.9473, + "step": 30098 + }, + { + "epoch": 0.77, + "learning_rate": 1.7413783691173079e-06, + "loss": 1.0576, + "step": 30099 + }, + { + "epoch": 0.77, + "learning_rate": 1.7413597995443349e-06, + "loss": 0.605, + "step": 30100 + }, + { + "epoch": 0.77, + "learning_rate": 1.7413412294037367e-06, + "loss": 1.0273, + "step": 30101 + }, + { + "epoch": 0.77, + "learning_rate": 1.7413226586955275e-06, + "loss": 0.8276, + "step": 30102 + }, + { + "epoch": 0.77, + "learning_rate": 1.7413040874197216e-06, + "loss": 0.8486, + "step": 30103 + }, + { + "epoch": 0.77, + "learning_rate": 1.7412855155763335e-06, + "loss": 0.9004, + "step": 30104 + }, + { + "epoch": 0.77, + "learning_rate": 1.7412669431653773e-06, + "loss": 0.6589, + "step": 30105 + }, + { + "epoch": 0.77, + "learning_rate": 1.7412483701868668e-06, + "loss": 1.0703, + "step": 30106 + }, + { + "epoch": 0.77, + "learning_rate": 1.7412297966408165e-06, + "loss": 0.9082, + "step": 30107 + }, + { + "epoch": 0.77, + "learning_rate": 1.7412112225272405e-06, + "loss": 0.9766, + "step": 30108 + }, + { + "epoch": 0.77, + "learning_rate": 1.7411926478461534e-06, + "loss": 0.9307, + "step": 30109 + }, + { + "epoch": 0.77, + "learning_rate": 1.7411740725975692e-06, + "loss": 0.8652, + "step": 30110 + }, + { + "epoch": 0.77, + "learning_rate": 1.7411554967815021e-06, + "loss": 0.8672, + "step": 30111 + }, + { + "epoch": 0.77, + "learning_rate": 1.7411369203979662e-06, + "loss": 0.9072, + "step": 30112 + }, + { + "epoch": 0.77, + "learning_rate": 1.7411183434469758e-06, + "loss": 1.04, + "step": 30113 + }, + { + "epoch": 0.77, + "learning_rate": 1.741099765928545e-06, + "loss": 0.8672, + "step": 30114 + }, + { + "epoch": 0.77, + "learning_rate": 1.7410811878426887e-06, + "loss": 0.7842, + "step": 30115 + }, + { + "epoch": 0.77, + "learning_rate": 1.7410626091894202e-06, + "loss": 0.8511, + "step": 30116 + }, + { + "epoch": 0.77, + "learning_rate": 1.7410440299687544e-06, + "loss": 0.9414, + "step": 30117 + }, + { + "epoch": 0.77, + "learning_rate": 1.741025450180705e-06, + "loss": 0.7871, + "step": 30118 + }, + { + "epoch": 0.77, + "learning_rate": 1.7410068698252866e-06, + "loss": 0.9775, + "step": 30119 + }, + { + "epoch": 0.77, + "learning_rate": 1.7409882889025134e-06, + "loss": 0.9014, + "step": 30120 + }, + { + "epoch": 0.77, + "learning_rate": 1.7409697074123994e-06, + "loss": 0.7017, + "step": 30121 + }, + { + "epoch": 0.77, + "learning_rate": 1.740951125354959e-06, + "loss": 1.0225, + "step": 30122 + }, + { + "epoch": 0.77, + "learning_rate": 1.7409325427302064e-06, + "loss": 0.7537, + "step": 30123 + }, + { + "epoch": 0.77, + "learning_rate": 1.7409139595381559e-06, + "loss": 0.853, + "step": 30124 + }, + { + "epoch": 0.77, + "learning_rate": 1.7408953757788214e-06, + "loss": 0.8369, + "step": 30125 + }, + { + "epoch": 0.77, + "learning_rate": 1.7408767914522177e-06, + "loss": 0.8428, + "step": 30126 + }, + { + "epoch": 0.77, + "learning_rate": 1.7408582065583585e-06, + "loss": 0.9619, + "step": 30127 + }, + { + "epoch": 0.77, + "learning_rate": 1.7408396210972582e-06, + "loss": 1.0498, + "step": 30128 + }, + { + "epoch": 0.77, + "learning_rate": 1.7408210350689314e-06, + "loss": 0.8613, + "step": 30129 + }, + { + "epoch": 0.77, + "learning_rate": 1.7408024484733916e-06, + "loss": 0.8013, + "step": 30130 + }, + { + "epoch": 0.77, + "learning_rate": 1.7407838613106537e-06, + "loss": 0.8193, + "step": 30131 + }, + { + "epoch": 0.77, + "learning_rate": 1.7407652735807313e-06, + "loss": 0.9072, + "step": 30132 + }, + { + "epoch": 0.77, + "learning_rate": 1.7407466852836395e-06, + "loss": 0.875, + "step": 30133 + }, + { + "epoch": 0.77, + "learning_rate": 1.7407280964193918e-06, + "loss": 1.0312, + "step": 30134 + }, + { + "epoch": 0.77, + "learning_rate": 1.7407095069880024e-06, + "loss": 0.9639, + "step": 30135 + }, + { + "epoch": 0.77, + "learning_rate": 1.7406909169894863e-06, + "loss": 0.7524, + "step": 30136 + }, + { + "epoch": 0.77, + "learning_rate": 1.7406723264238567e-06, + "loss": 0.6846, + "step": 30137 + }, + { + "epoch": 0.77, + "learning_rate": 1.7406537352911287e-06, + "loss": 0.8516, + "step": 30138 + }, + { + "epoch": 0.77, + "learning_rate": 1.7406351435913163e-06, + "loss": 0.6411, + "step": 30139 + }, + { + "epoch": 0.77, + "learning_rate": 1.7406165513244332e-06, + "loss": 0.8232, + "step": 30140 + }, + { + "epoch": 0.77, + "learning_rate": 1.7405979584904945e-06, + "loss": 0.8765, + "step": 30141 + }, + { + "epoch": 0.77, + "learning_rate": 1.7405793650895135e-06, + "loss": 1.0625, + "step": 30142 + }, + { + "epoch": 0.77, + "learning_rate": 1.7405607711215054e-06, + "loss": 1.0586, + "step": 30143 + }, + { + "epoch": 0.77, + "learning_rate": 1.7405421765864837e-06, + "loss": 0.6953, + "step": 30144 + }, + { + "epoch": 0.77, + "learning_rate": 1.740523581484463e-06, + "loss": 0.8872, + "step": 30145 + }, + { + "epoch": 0.77, + "learning_rate": 1.7405049858154573e-06, + "loss": 1.042, + "step": 30146 + }, + { + "epoch": 0.77, + "learning_rate": 1.7404863895794813e-06, + "loss": 0.7988, + "step": 30147 + }, + { + "epoch": 0.77, + "learning_rate": 1.7404677927765485e-06, + "loss": 0.9473, + "step": 30148 + }, + { + "epoch": 0.77, + "learning_rate": 1.7404491954066738e-06, + "loss": 0.7305, + "step": 30149 + }, + { + "epoch": 0.77, + "learning_rate": 1.7404305974698712e-06, + "loss": 0.8945, + "step": 30150 + }, + { + "epoch": 0.77, + "learning_rate": 1.740411998966155e-06, + "loss": 0.8506, + "step": 30151 + }, + { + "epoch": 0.77, + "learning_rate": 1.7403933998955393e-06, + "loss": 0.8779, + "step": 30152 + }, + { + "epoch": 0.77, + "learning_rate": 1.7403748002580386e-06, + "loss": 0.7495, + "step": 30153 + }, + { + "epoch": 0.77, + "learning_rate": 1.7403562000536668e-06, + "loss": 0.9785, + "step": 30154 + }, + { + "epoch": 0.77, + "learning_rate": 1.740337599282438e-06, + "loss": 0.9492, + "step": 30155 + }, + { + "epoch": 0.77, + "learning_rate": 1.740318997944367e-06, + "loss": 0.7407, + "step": 30156 + }, + { + "epoch": 0.77, + "learning_rate": 1.7403003960394678e-06, + "loss": 1.1143, + "step": 30157 + }, + { + "epoch": 0.77, + "learning_rate": 1.7402817935677545e-06, + "loss": 0.657, + "step": 30158 + }, + { + "epoch": 0.77, + "learning_rate": 1.7402631905292418e-06, + "loss": 0.9424, + "step": 30159 + }, + { + "epoch": 0.77, + "learning_rate": 1.7402445869239434e-06, + "loss": 0.6904, + "step": 30160 + }, + { + "epoch": 0.77, + "learning_rate": 1.7402259827518738e-06, + "loss": 0.6812, + "step": 30161 + }, + { + "epoch": 0.77, + "learning_rate": 1.740207378013047e-06, + "loss": 0.8228, + "step": 30162 + }, + { + "epoch": 0.77, + "learning_rate": 1.7401887727074777e-06, + "loss": 0.9106, + "step": 30163 + }, + { + "epoch": 0.77, + "learning_rate": 1.7401701668351799e-06, + "loss": 0.75, + "step": 30164 + }, + { + "epoch": 0.77, + "learning_rate": 1.7401515603961676e-06, + "loss": 0.7104, + "step": 30165 + }, + { + "epoch": 0.77, + "learning_rate": 1.7401329533904554e-06, + "loss": 1.0049, + "step": 30166 + }, + { + "epoch": 0.77, + "learning_rate": 1.7401143458180573e-06, + "loss": 0.9951, + "step": 30167 + }, + { + "epoch": 0.77, + "learning_rate": 1.7400957376789881e-06, + "loss": 0.6538, + "step": 30168 + }, + { + "epoch": 0.77, + "learning_rate": 1.7400771289732613e-06, + "loss": 0.873, + "step": 30169 + }, + { + "epoch": 0.77, + "learning_rate": 1.7400585197008914e-06, + "loss": 1.0586, + "step": 30170 + }, + { + "epoch": 0.77, + "learning_rate": 1.740039909861893e-06, + "loss": 0.7783, + "step": 30171 + }, + { + "epoch": 0.77, + "learning_rate": 1.7400212994562796e-06, + "loss": 0.999, + "step": 30172 + }, + { + "epoch": 0.77, + "learning_rate": 1.7400026884840667e-06, + "loss": 0.9355, + "step": 30173 + }, + { + "epoch": 0.77, + "learning_rate": 1.739984076945267e-06, + "loss": 0.8682, + "step": 30174 + }, + { + "epoch": 0.77, + "learning_rate": 1.739965464839896e-06, + "loss": 0.8291, + "step": 30175 + }, + { + "epoch": 0.77, + "learning_rate": 1.7399468521679672e-06, + "loss": 0.6477, + "step": 30176 + }, + { + "epoch": 0.77, + "learning_rate": 1.7399282389294952e-06, + "loss": 0.9854, + "step": 30177 + }, + { + "epoch": 0.77, + "learning_rate": 1.7399096251244943e-06, + "loss": 0.8579, + "step": 30178 + }, + { + "epoch": 0.77, + "learning_rate": 1.7398910107529785e-06, + "loss": 0.7935, + "step": 30179 + }, + { + "epoch": 0.77, + "learning_rate": 1.7398723958149621e-06, + "loss": 0.9609, + "step": 30180 + }, + { + "epoch": 0.77, + "learning_rate": 1.7398537803104593e-06, + "loss": 0.7815, + "step": 30181 + }, + { + "epoch": 0.77, + "learning_rate": 1.739835164239485e-06, + "loss": 0.8408, + "step": 30182 + }, + { + "epoch": 0.77, + "learning_rate": 1.7398165476020522e-06, + "loss": 0.6514, + "step": 30183 + }, + { + "epoch": 0.77, + "learning_rate": 1.7397979303981764e-06, + "loss": 0.9893, + "step": 30184 + }, + { + "epoch": 0.77, + "learning_rate": 1.7397793126278714e-06, + "loss": 0.8281, + "step": 30185 + }, + { + "epoch": 0.77, + "learning_rate": 1.7397606942911513e-06, + "loss": 0.7368, + "step": 30186 + }, + { + "epoch": 0.77, + "learning_rate": 1.7397420753880306e-06, + "loss": 0.8271, + "step": 30187 + }, + { + "epoch": 0.77, + "learning_rate": 1.739723455918523e-06, + "loss": 0.8574, + "step": 30188 + }, + { + "epoch": 0.77, + "learning_rate": 1.7397048358826432e-06, + "loss": 0.7236, + "step": 30189 + }, + { + "epoch": 0.77, + "learning_rate": 1.7396862152804057e-06, + "loss": 0.7354, + "step": 30190 + }, + { + "epoch": 0.77, + "learning_rate": 1.7396675941118245e-06, + "loss": 0.8447, + "step": 30191 + }, + { + "epoch": 0.77, + "learning_rate": 1.7396489723769134e-06, + "loss": 0.9609, + "step": 30192 + }, + { + "epoch": 0.77, + "learning_rate": 1.7396303500756875e-06, + "loss": 0.6792, + "step": 30193 + }, + { + "epoch": 0.77, + "learning_rate": 1.7396117272081606e-06, + "loss": 0.8379, + "step": 30194 + }, + { + "epoch": 0.77, + "learning_rate": 1.739593103774347e-06, + "loss": 0.8652, + "step": 30195 + }, + { + "epoch": 0.77, + "learning_rate": 1.7395744797742609e-06, + "loss": 0.7949, + "step": 30196 + }, + { + "epoch": 0.77, + "learning_rate": 1.7395558552079166e-06, + "loss": 0.6934, + "step": 30197 + }, + { + "epoch": 0.77, + "learning_rate": 1.7395372300753283e-06, + "loss": 0.8174, + "step": 30198 + }, + { + "epoch": 0.77, + "learning_rate": 1.7395186043765103e-06, + "loss": 0.9131, + "step": 30199 + }, + { + "epoch": 0.77, + "learning_rate": 1.7394999781114773e-06, + "loss": 0.8418, + "step": 30200 + }, + { + "epoch": 0.77, + "learning_rate": 1.739481351280243e-06, + "loss": 1.0859, + "step": 30201 + }, + { + "epoch": 0.77, + "learning_rate": 1.7394627238828216e-06, + "loss": 0.7998, + "step": 30202 + }, + { + "epoch": 0.77, + "learning_rate": 1.7394440959192279e-06, + "loss": 0.729, + "step": 30203 + }, + { + "epoch": 0.77, + "learning_rate": 1.7394254673894757e-06, + "loss": 0.7725, + "step": 30204 + }, + { + "epoch": 0.77, + "learning_rate": 1.7394068382935796e-06, + "loss": 0.875, + "step": 30205 + }, + { + "epoch": 0.77, + "learning_rate": 1.7393882086315535e-06, + "loss": 0.7285, + "step": 30206 + }, + { + "epoch": 0.77, + "learning_rate": 1.7393695784034117e-06, + "loss": 0.793, + "step": 30207 + }, + { + "epoch": 0.77, + "learning_rate": 1.739350947609169e-06, + "loss": 0.8779, + "step": 30208 + }, + { + "epoch": 0.77, + "learning_rate": 1.7393323162488392e-06, + "loss": 0.9805, + "step": 30209 + }, + { + "epoch": 0.77, + "learning_rate": 1.7393136843224363e-06, + "loss": 0.6309, + "step": 30210 + }, + { + "epoch": 0.77, + "learning_rate": 1.7392950518299751e-06, + "loss": 0.7703, + "step": 30211 + }, + { + "epoch": 0.77, + "learning_rate": 1.7392764187714696e-06, + "loss": 0.8018, + "step": 30212 + }, + { + "epoch": 0.77, + "learning_rate": 1.7392577851469343e-06, + "loss": 0.7725, + "step": 30213 + }, + { + "epoch": 0.77, + "learning_rate": 1.7392391509563834e-06, + "loss": 0.7744, + "step": 30214 + }, + { + "epoch": 0.77, + "learning_rate": 1.7392205161998308e-06, + "loss": 0.8311, + "step": 30215 + }, + { + "epoch": 0.77, + "learning_rate": 1.739201880877291e-06, + "loss": 0.8701, + "step": 30216 + }, + { + "epoch": 0.77, + "learning_rate": 1.7391832449887784e-06, + "loss": 0.7534, + "step": 30217 + }, + { + "epoch": 0.77, + "learning_rate": 1.7391646085343075e-06, + "loss": 0.6035, + "step": 30218 + }, + { + "epoch": 0.77, + "learning_rate": 1.739145971513892e-06, + "loss": 0.7715, + "step": 30219 + }, + { + "epoch": 0.77, + "learning_rate": 1.7391273339275463e-06, + "loss": 0.8525, + "step": 30220 + }, + { + "epoch": 0.77, + "learning_rate": 1.7391086957752847e-06, + "loss": 0.8438, + "step": 30221 + }, + { + "epoch": 0.77, + "learning_rate": 1.7390900570571218e-06, + "loss": 0.7949, + "step": 30222 + }, + { + "epoch": 0.77, + "learning_rate": 1.7390714177730717e-06, + "loss": 0.7783, + "step": 30223 + }, + { + "epoch": 0.77, + "learning_rate": 1.7390527779231485e-06, + "loss": 0.8828, + "step": 30224 + }, + { + "epoch": 0.77, + "learning_rate": 1.7390341375073664e-06, + "loss": 0.6558, + "step": 30225 + }, + { + "epoch": 0.77, + "learning_rate": 1.7390154965257399e-06, + "loss": 0.8223, + "step": 30226 + }, + { + "epoch": 0.77, + "learning_rate": 1.7389968549782835e-06, + "loss": 1.0234, + "step": 30227 + }, + { + "epoch": 0.77, + "learning_rate": 1.7389782128650107e-06, + "loss": 1.001, + "step": 30228 + }, + { + "epoch": 0.77, + "learning_rate": 1.7389595701859367e-06, + "loss": 0.8154, + "step": 30229 + }, + { + "epoch": 0.77, + "learning_rate": 1.7389409269410752e-06, + "loss": 1.0703, + "step": 30230 + }, + { + "epoch": 0.77, + "learning_rate": 1.7389222831304406e-06, + "loss": 1.1436, + "step": 30231 + }, + { + "epoch": 0.77, + "learning_rate": 1.7389036387540472e-06, + "loss": 0.8828, + "step": 30232 + }, + { + "epoch": 0.77, + "learning_rate": 1.7388849938119093e-06, + "loss": 0.4924, + "step": 30233 + }, + { + "epoch": 0.77, + "learning_rate": 1.7388663483040409e-06, + "loss": 0.792, + "step": 30234 + }, + { + "epoch": 0.77, + "learning_rate": 1.7388477022304567e-06, + "loss": 0.8311, + "step": 30235 + }, + { + "epoch": 0.77, + "learning_rate": 1.7388290555911706e-06, + "loss": 1.0156, + "step": 30236 + }, + { + "epoch": 0.77, + "learning_rate": 1.7388104083861975e-06, + "loss": 0.6714, + "step": 30237 + }, + { + "epoch": 0.78, + "learning_rate": 1.7387917606155509e-06, + "loss": 0.8828, + "step": 30238 + }, + { + "epoch": 0.78, + "learning_rate": 1.7387731122792454e-06, + "loss": 0.7871, + "step": 30239 + }, + { + "epoch": 0.78, + "learning_rate": 1.7387544633772952e-06, + "loss": 0.8174, + "step": 30240 + }, + { + "epoch": 0.78, + "learning_rate": 1.7387358139097153e-06, + "loss": 1.0166, + "step": 30241 + }, + { + "epoch": 0.78, + "learning_rate": 1.7387171638765189e-06, + "loss": 0.9453, + "step": 30242 + }, + { + "epoch": 0.78, + "learning_rate": 1.7386985132777205e-06, + "loss": 1.0244, + "step": 30243 + }, + { + "epoch": 0.78, + "learning_rate": 1.7386798621133349e-06, + "loss": 0.8242, + "step": 30244 + }, + { + "epoch": 0.78, + "learning_rate": 1.738661210383376e-06, + "loss": 0.8535, + "step": 30245 + }, + { + "epoch": 0.78, + "learning_rate": 1.7386425580878585e-06, + "loss": 1.0713, + "step": 30246 + }, + { + "epoch": 0.78, + "learning_rate": 1.738623905226796e-06, + "loss": 0.9316, + "step": 30247 + }, + { + "epoch": 0.78, + "learning_rate": 1.7386052518002033e-06, + "loss": 0.8516, + "step": 30248 + }, + { + "epoch": 0.78, + "learning_rate": 1.7385865978080942e-06, + "loss": 0.6208, + "step": 30249 + }, + { + "epoch": 0.78, + "learning_rate": 1.7385679432504836e-06, + "loss": 0.8916, + "step": 30250 + }, + { + "epoch": 0.78, + "learning_rate": 1.7385492881273855e-06, + "loss": 0.8545, + "step": 30251 + }, + { + "epoch": 0.78, + "learning_rate": 1.738530632438814e-06, + "loss": 0.9424, + "step": 30252 + }, + { + "epoch": 0.78, + "learning_rate": 1.738511976184784e-06, + "loss": 0.5132, + "step": 30253 + }, + { + "epoch": 0.78, + "learning_rate": 1.7384933193653088e-06, + "loss": 0.9106, + "step": 30254 + }, + { + "epoch": 0.78, + "learning_rate": 1.7384746619804034e-06, + "loss": 0.9678, + "step": 30255 + }, + { + "epoch": 0.78, + "learning_rate": 1.738456004030082e-06, + "loss": 0.9316, + "step": 30256 + }, + { + "epoch": 0.78, + "learning_rate": 1.7384373455143586e-06, + "loss": 0.7559, + "step": 30257 + }, + { + "epoch": 0.78, + "learning_rate": 1.738418686433248e-06, + "loss": 0.7959, + "step": 30258 + }, + { + "epoch": 0.78, + "learning_rate": 1.7384000267867638e-06, + "loss": 0.9883, + "step": 30259 + }, + { + "epoch": 0.78, + "learning_rate": 1.738381366574921e-06, + "loss": 0.835, + "step": 30260 + }, + { + "epoch": 0.78, + "learning_rate": 1.7383627057977332e-06, + "loss": 0.8623, + "step": 30261 + }, + { + "epoch": 0.78, + "learning_rate": 1.7383440444552152e-06, + "loss": 0.9297, + "step": 30262 + }, + { + "epoch": 0.78, + "learning_rate": 1.7383253825473814e-06, + "loss": 0.8213, + "step": 30263 + }, + { + "epoch": 0.78, + "learning_rate": 1.7383067200742452e-06, + "loss": 0.8599, + "step": 30264 + }, + { + "epoch": 0.78, + "learning_rate": 1.738288057035822e-06, + "loss": 0.8857, + "step": 30265 + }, + { + "epoch": 0.78, + "learning_rate": 1.7382693934321253e-06, + "loss": 0.832, + "step": 30266 + }, + { + "epoch": 0.78, + "learning_rate": 1.7382507292631696e-06, + "loss": 0.7212, + "step": 30267 + }, + { + "epoch": 0.78, + "learning_rate": 1.7382320645289697e-06, + "loss": 0.8838, + "step": 30268 + }, + { + "epoch": 0.78, + "learning_rate": 1.738213399229539e-06, + "loss": 0.8926, + "step": 30269 + }, + { + "epoch": 0.78, + "learning_rate": 1.7381947333648923e-06, + "loss": 1.0518, + "step": 30270 + }, + { + "epoch": 0.78, + "learning_rate": 1.7381760669350443e-06, + "loss": 0.9883, + "step": 30271 + }, + { + "epoch": 0.78, + "learning_rate": 1.7381573999400082e-06, + "loss": 0.458, + "step": 30272 + }, + { + "epoch": 0.78, + "learning_rate": 1.7381387323797994e-06, + "loss": 0.8584, + "step": 30273 + }, + { + "epoch": 0.78, + "learning_rate": 1.7381200642544314e-06, + "loss": 0.7959, + "step": 30274 + }, + { + "epoch": 0.78, + "learning_rate": 1.7381013955639188e-06, + "loss": 0.7988, + "step": 30275 + }, + { + "epoch": 0.78, + "learning_rate": 1.738082726308276e-06, + "loss": 0.6157, + "step": 30276 + }, + { + "epoch": 0.78, + "learning_rate": 1.7380640564875172e-06, + "loss": 0.5559, + "step": 30277 + }, + { + "epoch": 0.78, + "learning_rate": 1.7380453861016569e-06, + "loss": 0.9351, + "step": 30278 + }, + { + "epoch": 0.78, + "learning_rate": 1.738026715150709e-06, + "loss": 0.999, + "step": 30279 + }, + { + "epoch": 0.78, + "learning_rate": 1.738008043634688e-06, + "loss": 1.0986, + "step": 30280 + }, + { + "epoch": 0.78, + "learning_rate": 1.737989371553608e-06, + "loss": 0.7803, + "step": 30281 + }, + { + "epoch": 0.78, + "learning_rate": 1.7379706989074835e-06, + "loss": 0.874, + "step": 30282 + }, + { + "epoch": 0.78, + "learning_rate": 1.737952025696329e-06, + "loss": 1.1289, + "step": 30283 + }, + { + "epoch": 0.78, + "learning_rate": 1.7379333519201584e-06, + "loss": 1.0225, + "step": 30284 + }, + { + "epoch": 0.78, + "learning_rate": 1.737914677578986e-06, + "loss": 0.67, + "step": 30285 + }, + { + "epoch": 0.78, + "learning_rate": 1.7378960026728269e-06, + "loss": 0.9209, + "step": 30286 + }, + { + "epoch": 0.78, + "learning_rate": 1.7378773272016941e-06, + "loss": 1.0312, + "step": 30287 + }, + { + "epoch": 0.78, + "learning_rate": 1.7378586511656027e-06, + "loss": 0.7856, + "step": 30288 + }, + { + "epoch": 0.78, + "learning_rate": 1.737839974564567e-06, + "loss": 0.8936, + "step": 30289 + }, + { + "epoch": 0.78, + "learning_rate": 1.737821297398601e-06, + "loss": 0.9736, + "step": 30290 + }, + { + "epoch": 0.78, + "learning_rate": 1.7378026196677197e-06, + "loss": 1.0264, + "step": 30291 + }, + { + "epoch": 0.78, + "learning_rate": 1.7377839413719362e-06, + "loss": 0.6729, + "step": 30292 + }, + { + "epoch": 0.78, + "learning_rate": 1.7377652625112658e-06, + "loss": 0.8789, + "step": 30293 + }, + { + "epoch": 0.78, + "learning_rate": 1.7377465830857223e-06, + "loss": 0.8611, + "step": 30294 + }, + { + "epoch": 0.78, + "learning_rate": 1.7377279030953202e-06, + "loss": 0.8027, + "step": 30295 + }, + { + "epoch": 0.78, + "learning_rate": 1.7377092225400738e-06, + "loss": 0.7178, + "step": 30296 + }, + { + "epoch": 0.78, + "learning_rate": 1.7376905414199975e-06, + "loss": 0.7063, + "step": 30297 + }, + { + "epoch": 0.78, + "learning_rate": 1.7376718597351052e-06, + "loss": 0.9229, + "step": 30298 + }, + { + "epoch": 0.78, + "learning_rate": 1.7376531774854115e-06, + "loss": 0.4912, + "step": 30299 + }, + { + "epoch": 0.78, + "learning_rate": 1.7376344946709306e-06, + "loss": 1.0498, + "step": 30300 + }, + { + "epoch": 0.78, + "learning_rate": 1.7376158112916772e-06, + "loss": 0.957, + "step": 30301 + }, + { + "epoch": 0.78, + "learning_rate": 1.7375971273476653e-06, + "loss": 0.7397, + "step": 30302 + }, + { + "epoch": 0.78, + "learning_rate": 1.737578442838909e-06, + "loss": 0.9224, + "step": 30303 + }, + { + "epoch": 0.78, + "learning_rate": 1.737559757765423e-06, + "loss": 0.6968, + "step": 30304 + }, + { + "epoch": 0.78, + "learning_rate": 1.737541072127221e-06, + "loss": 0.8496, + "step": 30305 + }, + { + "epoch": 0.78, + "learning_rate": 1.737522385924318e-06, + "loss": 0.8818, + "step": 30306 + }, + { + "epoch": 0.78, + "learning_rate": 1.737503699156728e-06, + "loss": 0.834, + "step": 30307 + }, + { + "epoch": 0.78, + "learning_rate": 1.7374850118244653e-06, + "loss": 1.0293, + "step": 30308 + }, + { + "epoch": 0.78, + "learning_rate": 1.7374663239275443e-06, + "loss": 0.9229, + "step": 30309 + }, + { + "epoch": 0.78, + "learning_rate": 1.7374476354659793e-06, + "loss": 0.7646, + "step": 30310 + }, + { + "epoch": 0.78, + "learning_rate": 1.7374289464397842e-06, + "loss": 0.9375, + "step": 30311 + }, + { + "epoch": 0.78, + "learning_rate": 1.7374102568489742e-06, + "loss": 0.9668, + "step": 30312 + }, + { + "epoch": 0.78, + "learning_rate": 1.7373915666935628e-06, + "loss": 0.8223, + "step": 30313 + }, + { + "epoch": 0.78, + "learning_rate": 1.7373728759735645e-06, + "loss": 1.0098, + "step": 30314 + }, + { + "epoch": 0.78, + "learning_rate": 1.7373541846889937e-06, + "loss": 0.8125, + "step": 30315 + }, + { + "epoch": 0.78, + "learning_rate": 1.7373354928398648e-06, + "loss": 0.7646, + "step": 30316 + }, + { + "epoch": 0.78, + "learning_rate": 1.737316800426192e-06, + "loss": 0.8721, + "step": 30317 + }, + { + "epoch": 0.78, + "learning_rate": 1.7372981074479895e-06, + "loss": 0.8506, + "step": 30318 + }, + { + "epoch": 0.78, + "learning_rate": 1.737279413905272e-06, + "loss": 0.5801, + "step": 30319 + }, + { + "epoch": 0.78, + "learning_rate": 1.7372607197980533e-06, + "loss": 0.9014, + "step": 30320 + }, + { + "epoch": 0.78, + "learning_rate": 1.7372420251263482e-06, + "loss": 0.6562, + "step": 30321 + }, + { + "epoch": 0.78, + "learning_rate": 1.7372233298901705e-06, + "loss": 0.6641, + "step": 30322 + }, + { + "epoch": 0.78, + "learning_rate": 1.737204634089535e-06, + "loss": 0.8643, + "step": 30323 + }, + { + "epoch": 0.78, + "learning_rate": 1.7371859377244558e-06, + "loss": 0.9082, + "step": 30324 + }, + { + "epoch": 0.78, + "learning_rate": 1.7371672407949474e-06, + "loss": 0.8652, + "step": 30325 + }, + { + "epoch": 0.78, + "learning_rate": 1.7371485433010235e-06, + "loss": 0.9053, + "step": 30326 + }, + { + "epoch": 0.78, + "learning_rate": 1.7371298452426993e-06, + "loss": 0.8364, + "step": 30327 + }, + { + "epoch": 0.78, + "learning_rate": 1.7371111466199881e-06, + "loss": 0.8066, + "step": 30328 + }, + { + "epoch": 0.78, + "learning_rate": 1.7370924474329055e-06, + "loss": 0.6079, + "step": 30329 + }, + { + "epoch": 0.78, + "learning_rate": 1.7370737476814645e-06, + "loss": 0.8218, + "step": 30330 + }, + { + "epoch": 0.78, + "learning_rate": 1.7370550473656804e-06, + "loss": 0.811, + "step": 30331 + }, + { + "epoch": 0.78, + "learning_rate": 1.7370363464855671e-06, + "loss": 0.8223, + "step": 30332 + }, + { + "epoch": 0.78, + "learning_rate": 1.737017645041139e-06, + "loss": 0.6294, + "step": 30333 + }, + { + "epoch": 0.78, + "learning_rate": 1.7369989430324102e-06, + "loss": 0.9473, + "step": 30334 + }, + { + "epoch": 0.78, + "learning_rate": 1.736980240459395e-06, + "loss": 0.9619, + "step": 30335 + }, + { + "epoch": 0.78, + "learning_rate": 1.7369615373221082e-06, + "loss": 0.8083, + "step": 30336 + }, + { + "epoch": 0.78, + "learning_rate": 1.7369428336205638e-06, + "loss": 0.6841, + "step": 30337 + }, + { + "epoch": 0.78, + "learning_rate": 1.7369241293547764e-06, + "loss": 0.7646, + "step": 30338 + }, + { + "epoch": 0.78, + "learning_rate": 1.7369054245247596e-06, + "loss": 0.9561, + "step": 30339 + }, + { + "epoch": 0.78, + "learning_rate": 1.7368867191305285e-06, + "loss": 0.9238, + "step": 30340 + }, + { + "epoch": 0.78, + "learning_rate": 1.736868013172097e-06, + "loss": 0.9028, + "step": 30341 + }, + { + "epoch": 0.78, + "learning_rate": 1.7368493066494796e-06, + "loss": 0.6772, + "step": 30342 + }, + { + "epoch": 0.78, + "learning_rate": 1.7368305995626905e-06, + "loss": 0.8584, + "step": 30343 + }, + { + "epoch": 0.78, + "learning_rate": 1.7368118919117442e-06, + "loss": 0.8086, + "step": 30344 + }, + { + "epoch": 0.78, + "learning_rate": 1.736793183696655e-06, + "loss": 0.8525, + "step": 30345 + }, + { + "epoch": 0.78, + "learning_rate": 1.7367744749174368e-06, + "loss": 0.9971, + "step": 30346 + }, + { + "epoch": 0.78, + "learning_rate": 1.7367557655741045e-06, + "loss": 0.8477, + "step": 30347 + }, + { + "epoch": 0.78, + "learning_rate": 1.7367370556666722e-06, + "loss": 0.9004, + "step": 30348 + }, + { + "epoch": 0.78, + "learning_rate": 1.7367183451951545e-06, + "loss": 0.9785, + "step": 30349 + }, + { + "epoch": 0.78, + "learning_rate": 1.736699634159565e-06, + "loss": 0.6392, + "step": 30350 + }, + { + "epoch": 0.78, + "learning_rate": 1.7366809225599183e-06, + "loss": 0.9531, + "step": 30351 + }, + { + "epoch": 0.78, + "learning_rate": 1.7366622103962293e-06, + "loss": 0.8154, + "step": 30352 + }, + { + "epoch": 0.78, + "learning_rate": 1.7366434976685118e-06, + "loss": 0.7285, + "step": 30353 + }, + { + "epoch": 0.78, + "learning_rate": 1.7366247843767803e-06, + "loss": 0.8096, + "step": 30354 + }, + { + "epoch": 0.78, + "learning_rate": 1.736606070521049e-06, + "loss": 0.7668, + "step": 30355 + }, + { + "epoch": 0.78, + "learning_rate": 1.7365873561013324e-06, + "loss": 0.9199, + "step": 30356 + }, + { + "epoch": 0.78, + "learning_rate": 1.7365686411176445e-06, + "loss": 0.8145, + "step": 30357 + }, + { + "epoch": 0.78, + "learning_rate": 1.7365499255700002e-06, + "loss": 0.9717, + "step": 30358 + }, + { + "epoch": 0.78, + "learning_rate": 1.736531209458413e-06, + "loss": 0.7241, + "step": 30359 + }, + { + "epoch": 0.78, + "learning_rate": 1.7365124927828982e-06, + "loss": 0.8271, + "step": 30360 + }, + { + "epoch": 0.78, + "learning_rate": 1.7364937755434695e-06, + "loss": 0.7866, + "step": 30361 + }, + { + "epoch": 0.78, + "learning_rate": 1.7364750577401413e-06, + "loss": 1.0381, + "step": 30362 + }, + { + "epoch": 0.78, + "learning_rate": 1.736456339372928e-06, + "loss": 1.0342, + "step": 30363 + }, + { + "epoch": 0.78, + "learning_rate": 1.736437620441844e-06, + "loss": 0.856, + "step": 30364 + }, + { + "epoch": 0.78, + "learning_rate": 1.7364189009469036e-06, + "loss": 0.6858, + "step": 30365 + }, + { + "epoch": 0.78, + "learning_rate": 1.736400180888121e-06, + "loss": 0.7666, + "step": 30366 + }, + { + "epoch": 0.78, + "learning_rate": 1.7363814602655106e-06, + "loss": 0.9805, + "step": 30367 + }, + { + "epoch": 0.78, + "learning_rate": 1.7363627390790869e-06, + "loss": 0.7764, + "step": 30368 + }, + { + "epoch": 0.78, + "learning_rate": 1.7363440173288645e-06, + "loss": 0.7876, + "step": 30369 + }, + { + "epoch": 0.78, + "learning_rate": 1.7363252950148567e-06, + "loss": 0.8164, + "step": 30370 + }, + { + "epoch": 0.78, + "learning_rate": 1.7363065721370789e-06, + "loss": 1.0156, + "step": 30371 + }, + { + "epoch": 0.78, + "learning_rate": 1.7362878486955449e-06, + "loss": 0.8711, + "step": 30372 + }, + { + "epoch": 0.78, + "learning_rate": 1.736269124690269e-06, + "loss": 0.6108, + "step": 30373 + }, + { + "epoch": 0.78, + "learning_rate": 1.7362504001212658e-06, + "loss": 0.793, + "step": 30374 + }, + { + "epoch": 0.78, + "learning_rate": 1.7362316749885494e-06, + "loss": 0.8994, + "step": 30375 + }, + { + "epoch": 0.78, + "learning_rate": 1.7362129492921343e-06, + "loss": 0.8867, + "step": 30376 + }, + { + "epoch": 0.78, + "learning_rate": 1.7361942230320347e-06, + "loss": 0.7246, + "step": 30377 + }, + { + "epoch": 0.78, + "learning_rate": 1.7361754962082653e-06, + "loss": 1.0, + "step": 30378 + }, + { + "epoch": 0.78, + "learning_rate": 1.73615676882084e-06, + "loss": 0.7754, + "step": 30379 + }, + { + "epoch": 0.78, + "learning_rate": 1.7361380408697736e-06, + "loss": 0.7783, + "step": 30380 + }, + { + "epoch": 0.78, + "learning_rate": 1.73611931235508e-06, + "loss": 0.9141, + "step": 30381 + }, + { + "epoch": 0.78, + "learning_rate": 1.7361005832767734e-06, + "loss": 0.7754, + "step": 30382 + }, + { + "epoch": 0.78, + "learning_rate": 1.7360818536348689e-06, + "loss": 0.8477, + "step": 30383 + }, + { + "epoch": 0.78, + "learning_rate": 1.73606312342938e-06, + "loss": 1.002, + "step": 30384 + }, + { + "epoch": 0.78, + "learning_rate": 1.7360443926603216e-06, + "loss": 0.8555, + "step": 30385 + }, + { + "epoch": 0.78, + "learning_rate": 1.7360256613277077e-06, + "loss": 0.8359, + "step": 30386 + }, + { + "epoch": 0.78, + "learning_rate": 1.736006929431553e-06, + "loss": 0.4766, + "step": 30387 + }, + { + "epoch": 0.78, + "learning_rate": 1.7359881969718716e-06, + "loss": 0.8652, + "step": 30388 + }, + { + "epoch": 0.78, + "learning_rate": 1.7359694639486774e-06, + "loss": 0.8398, + "step": 30389 + }, + { + "epoch": 0.78, + "learning_rate": 1.7359507303619859e-06, + "loss": 0.9033, + "step": 30390 + }, + { + "epoch": 0.78, + "learning_rate": 1.7359319962118103e-06, + "loss": 0.793, + "step": 30391 + }, + { + "epoch": 0.78, + "learning_rate": 1.7359132614981658e-06, + "loss": 0.687, + "step": 30392 + }, + { + "epoch": 0.78, + "learning_rate": 1.735894526221066e-06, + "loss": 0.7871, + "step": 30393 + }, + { + "epoch": 0.78, + "learning_rate": 1.735875790380526e-06, + "loss": 0.834, + "step": 30394 + }, + { + "epoch": 0.78, + "learning_rate": 1.7358570539765593e-06, + "loss": 0.7656, + "step": 30395 + }, + { + "epoch": 0.78, + "learning_rate": 1.7358383170091807e-06, + "loss": 0.7188, + "step": 30396 + }, + { + "epoch": 0.78, + "learning_rate": 1.735819579478405e-06, + "loss": 0.9629, + "step": 30397 + }, + { + "epoch": 0.78, + "learning_rate": 1.7358008413842456e-06, + "loss": 0.9473, + "step": 30398 + }, + { + "epoch": 0.78, + "learning_rate": 1.7357821027267177e-06, + "loss": 0.7524, + "step": 30399 + }, + { + "epoch": 0.78, + "learning_rate": 1.735763363505835e-06, + "loss": 1.0625, + "step": 30400 + }, + { + "epoch": 0.78, + "learning_rate": 1.7357446237216123e-06, + "loss": 0.9697, + "step": 30401 + }, + { + "epoch": 0.78, + "learning_rate": 1.7357258833740637e-06, + "loss": 1.0645, + "step": 30402 + }, + { + "epoch": 0.78, + "learning_rate": 1.7357071424632034e-06, + "loss": 0.5676, + "step": 30403 + }, + { + "epoch": 0.78, + "learning_rate": 1.7356884009890465e-06, + "loss": 0.9717, + "step": 30404 + }, + { + "epoch": 0.78, + "learning_rate": 1.7356696589516064e-06, + "loss": 0.9316, + "step": 30405 + }, + { + "epoch": 0.78, + "learning_rate": 1.7356509163508978e-06, + "loss": 1.1523, + "step": 30406 + }, + { + "epoch": 0.78, + "learning_rate": 1.7356321731869354e-06, + "loss": 0.8955, + "step": 30407 + }, + { + "epoch": 0.78, + "learning_rate": 1.7356134294597333e-06, + "loss": 0.8975, + "step": 30408 + }, + { + "epoch": 0.78, + "learning_rate": 1.7355946851693054e-06, + "loss": 0.6885, + "step": 30409 + }, + { + "epoch": 0.78, + "learning_rate": 1.7355759403156669e-06, + "loss": 0.874, + "step": 30410 + }, + { + "epoch": 0.78, + "learning_rate": 1.7355571948988317e-06, + "loss": 0.9355, + "step": 30411 + }, + { + "epoch": 0.78, + "learning_rate": 1.735538448918814e-06, + "loss": 0.9609, + "step": 30412 + }, + { + "epoch": 0.78, + "learning_rate": 1.7355197023756282e-06, + "loss": 0.8965, + "step": 30413 + }, + { + "epoch": 0.78, + "learning_rate": 1.735500955269289e-06, + "loss": 0.9951, + "step": 30414 + }, + { + "epoch": 0.78, + "learning_rate": 1.7354822075998108e-06, + "loss": 0.8281, + "step": 30415 + }, + { + "epoch": 0.78, + "learning_rate": 1.7354634593672073e-06, + "loss": 0.9629, + "step": 30416 + }, + { + "epoch": 0.78, + "learning_rate": 1.7354447105714933e-06, + "loss": 0.7324, + "step": 30417 + }, + { + "epoch": 0.78, + "learning_rate": 1.7354259612126832e-06, + "loss": 0.7095, + "step": 30418 + }, + { + "epoch": 0.78, + "learning_rate": 1.7354072112907912e-06, + "loss": 0.7957, + "step": 30419 + }, + { + "epoch": 0.78, + "learning_rate": 1.7353884608058318e-06, + "loss": 0.9199, + "step": 30420 + }, + { + "epoch": 0.78, + "learning_rate": 1.735369709757819e-06, + "loss": 0.9746, + "step": 30421 + }, + { + "epoch": 0.78, + "learning_rate": 1.7353509581467676e-06, + "loss": 0.9316, + "step": 30422 + }, + { + "epoch": 0.78, + "learning_rate": 1.7353322059726917e-06, + "loss": 1.0078, + "step": 30423 + }, + { + "epoch": 0.78, + "learning_rate": 1.735313453235606e-06, + "loss": 0.6899, + "step": 30424 + }, + { + "epoch": 0.78, + "learning_rate": 1.7352946999355247e-06, + "loss": 0.7977, + "step": 30425 + }, + { + "epoch": 0.78, + "learning_rate": 1.7352759460724617e-06, + "loss": 0.7266, + "step": 30426 + }, + { + "epoch": 0.78, + "learning_rate": 1.7352571916464318e-06, + "loss": 0.8389, + "step": 30427 + }, + { + "epoch": 0.78, + "learning_rate": 1.7352384366574492e-06, + "loss": 0.9033, + "step": 30428 + }, + { + "epoch": 0.78, + "learning_rate": 1.7352196811055287e-06, + "loss": 0.7617, + "step": 30429 + }, + { + "epoch": 0.78, + "learning_rate": 1.735200924990684e-06, + "loss": 0.8818, + "step": 30430 + }, + { + "epoch": 0.78, + "learning_rate": 1.7351821683129298e-06, + "loss": 0.6753, + "step": 30431 + }, + { + "epoch": 0.78, + "learning_rate": 1.7351634110722801e-06, + "loss": 0.8887, + "step": 30432 + }, + { + "epoch": 0.78, + "learning_rate": 1.7351446532687502e-06, + "loss": 0.7773, + "step": 30433 + }, + { + "epoch": 0.78, + "learning_rate": 1.7351258949023536e-06, + "loss": 0.9092, + "step": 30434 + }, + { + "epoch": 0.78, + "learning_rate": 1.7351071359731043e-06, + "loss": 0.9736, + "step": 30435 + }, + { + "epoch": 0.78, + "learning_rate": 1.735088376481018e-06, + "loss": 0.7393, + "step": 30436 + }, + { + "epoch": 0.78, + "learning_rate": 1.735069616426108e-06, + "loss": 0.7231, + "step": 30437 + }, + { + "epoch": 0.78, + "learning_rate": 1.7350508558083892e-06, + "loss": 0.9727, + "step": 30438 + }, + { + "epoch": 0.78, + "learning_rate": 1.7350320946278757e-06, + "loss": 0.8271, + "step": 30439 + }, + { + "epoch": 0.78, + "learning_rate": 1.735013332884582e-06, + "loss": 0.7329, + "step": 30440 + }, + { + "epoch": 0.78, + "learning_rate": 1.7349945705785223e-06, + "loss": 0.7881, + "step": 30441 + }, + { + "epoch": 0.78, + "learning_rate": 1.734975807709711e-06, + "loss": 0.9746, + "step": 30442 + }, + { + "epoch": 0.78, + "learning_rate": 1.7349570442781624e-06, + "loss": 0.6055, + "step": 30443 + }, + { + "epoch": 0.78, + "learning_rate": 1.7349382802838912e-06, + "loss": 0.9287, + "step": 30444 + }, + { + "epoch": 0.78, + "learning_rate": 1.7349195157269117e-06, + "loss": 0.7637, + "step": 30445 + }, + { + "epoch": 0.78, + "learning_rate": 1.7349007506072378e-06, + "loss": 0.7705, + "step": 30446 + }, + { + "epoch": 0.78, + "learning_rate": 1.7348819849248844e-06, + "loss": 0.9512, + "step": 30447 + }, + { + "epoch": 0.78, + "learning_rate": 1.7348632186798656e-06, + "loss": 0.8486, + "step": 30448 + }, + { + "epoch": 0.78, + "learning_rate": 1.7348444518721958e-06, + "loss": 0.7852, + "step": 30449 + }, + { + "epoch": 0.78, + "learning_rate": 1.7348256845018894e-06, + "loss": 0.5398, + "step": 30450 + }, + { + "epoch": 0.78, + "learning_rate": 1.7348069165689607e-06, + "loss": 0.6875, + "step": 30451 + }, + { + "epoch": 0.78, + "learning_rate": 1.734788148073424e-06, + "loss": 1.1006, + "step": 30452 + }, + { + "epoch": 0.78, + "learning_rate": 1.7347693790152941e-06, + "loss": 0.9321, + "step": 30453 + }, + { + "epoch": 0.78, + "learning_rate": 1.734750609394585e-06, + "loss": 0.9775, + "step": 30454 + }, + { + "epoch": 0.78, + "learning_rate": 1.734731839211311e-06, + "loss": 0.9697, + "step": 30455 + }, + { + "epoch": 0.78, + "learning_rate": 1.7347130684654868e-06, + "loss": 0.9287, + "step": 30456 + }, + { + "epoch": 0.78, + "learning_rate": 1.7346942971571266e-06, + "loss": 0.6709, + "step": 30457 + }, + { + "epoch": 0.78, + "learning_rate": 1.7346755252862443e-06, + "loss": 0.5254, + "step": 30458 + }, + { + "epoch": 0.78, + "learning_rate": 1.7346567528528554e-06, + "loss": 0.5513, + "step": 30459 + }, + { + "epoch": 0.78, + "learning_rate": 1.734637979856973e-06, + "loss": 0.9453, + "step": 30460 + }, + { + "epoch": 0.78, + "learning_rate": 1.7346192062986124e-06, + "loss": 0.9609, + "step": 30461 + }, + { + "epoch": 0.78, + "learning_rate": 1.7346004321777875e-06, + "loss": 0.7346, + "step": 30462 + }, + { + "epoch": 0.78, + "learning_rate": 1.7345816574945132e-06, + "loss": 0.915, + "step": 30463 + }, + { + "epoch": 0.78, + "learning_rate": 1.7345628822488031e-06, + "loss": 0.9121, + "step": 30464 + }, + { + "epoch": 0.78, + "learning_rate": 1.7345441064406723e-06, + "loss": 0.8682, + "step": 30465 + }, + { + "epoch": 0.78, + "learning_rate": 1.7345253300701346e-06, + "loss": 0.9775, + "step": 30466 + }, + { + "epoch": 0.78, + "learning_rate": 1.7345065531372048e-06, + "loss": 0.9287, + "step": 30467 + }, + { + "epoch": 0.78, + "learning_rate": 1.734487775641897e-06, + "loss": 0.9219, + "step": 30468 + }, + { + "epoch": 0.78, + "learning_rate": 1.7344689975842255e-06, + "loss": 0.7517, + "step": 30469 + }, + { + "epoch": 0.78, + "learning_rate": 1.7344502189642053e-06, + "loss": 1.0527, + "step": 30470 + }, + { + "epoch": 0.78, + "learning_rate": 1.7344314397818498e-06, + "loss": 0.636, + "step": 30471 + }, + { + "epoch": 0.78, + "learning_rate": 1.7344126600371744e-06, + "loss": 0.8555, + "step": 30472 + }, + { + "epoch": 0.78, + "learning_rate": 1.734393879730193e-06, + "loss": 0.9053, + "step": 30473 + }, + { + "epoch": 0.78, + "learning_rate": 1.7343750988609196e-06, + "loss": 0.9199, + "step": 30474 + }, + { + "epoch": 0.78, + "learning_rate": 1.7343563174293692e-06, + "loss": 0.769, + "step": 30475 + }, + { + "epoch": 0.78, + "learning_rate": 1.7343375354355557e-06, + "loss": 0.8955, + "step": 30476 + }, + { + "epoch": 0.78, + "learning_rate": 1.734318752879494e-06, + "loss": 0.8574, + "step": 30477 + }, + { + "epoch": 0.78, + "learning_rate": 1.7342999697611979e-06, + "loss": 0.8267, + "step": 30478 + }, + { + "epoch": 0.78, + "learning_rate": 1.7342811860806824e-06, + "loss": 0.998, + "step": 30479 + }, + { + "epoch": 0.78, + "learning_rate": 1.7342624018379612e-06, + "loss": 0.7568, + "step": 30480 + }, + { + "epoch": 0.78, + "learning_rate": 1.7342436170330493e-06, + "loss": 0.6804, + "step": 30481 + }, + { + "epoch": 0.78, + "learning_rate": 1.7342248316659606e-06, + "loss": 0.8516, + "step": 30482 + }, + { + "epoch": 0.78, + "learning_rate": 1.7342060457367102e-06, + "loss": 0.9766, + "step": 30483 + }, + { + "epoch": 0.78, + "learning_rate": 1.7341872592453116e-06, + "loss": 1.1631, + "step": 30484 + }, + { + "epoch": 0.78, + "learning_rate": 1.7341684721917797e-06, + "loss": 0.8999, + "step": 30485 + }, + { + "epoch": 0.78, + "learning_rate": 1.7341496845761286e-06, + "loss": 0.8945, + "step": 30486 + }, + { + "epoch": 0.78, + "learning_rate": 1.7341308963983733e-06, + "loss": 0.9268, + "step": 30487 + }, + { + "epoch": 0.78, + "learning_rate": 1.734112107658527e-06, + "loss": 0.7632, + "step": 30488 + }, + { + "epoch": 0.78, + "learning_rate": 1.7340933183566053e-06, + "loss": 0.7451, + "step": 30489 + }, + { + "epoch": 0.78, + "learning_rate": 1.734074528492622e-06, + "loss": 0.791, + "step": 30490 + }, + { + "epoch": 0.78, + "learning_rate": 1.7340557380665916e-06, + "loss": 0.6831, + "step": 30491 + }, + { + "epoch": 0.78, + "learning_rate": 1.7340369470785286e-06, + "loss": 1.0508, + "step": 30492 + }, + { + "epoch": 0.78, + "learning_rate": 1.734018155528447e-06, + "loss": 0.9355, + "step": 30493 + }, + { + "epoch": 0.78, + "learning_rate": 1.7339993634163618e-06, + "loss": 0.8164, + "step": 30494 + }, + { + "epoch": 0.78, + "learning_rate": 1.7339805707422866e-06, + "loss": 0.7178, + "step": 30495 + }, + { + "epoch": 0.78, + "learning_rate": 1.7339617775062364e-06, + "loss": 0.9414, + "step": 30496 + }, + { + "epoch": 0.78, + "learning_rate": 1.7339429837082256e-06, + "loss": 0.8706, + "step": 30497 + }, + { + "epoch": 0.78, + "learning_rate": 1.7339241893482682e-06, + "loss": 0.8223, + "step": 30498 + }, + { + "epoch": 0.78, + "learning_rate": 1.7339053944263787e-06, + "loss": 0.9092, + "step": 30499 + }, + { + "epoch": 0.78, + "learning_rate": 1.7338865989425718e-06, + "loss": 0.8975, + "step": 30500 + }, + { + "epoch": 0.78, + "learning_rate": 1.7338678028968617e-06, + "loss": 0.8462, + "step": 30501 + }, + { + "epoch": 0.78, + "learning_rate": 1.7338490062892625e-06, + "loss": 0.8555, + "step": 30502 + }, + { + "epoch": 0.78, + "learning_rate": 1.7338302091197891e-06, + "loss": 0.7319, + "step": 30503 + }, + { + "epoch": 0.78, + "learning_rate": 1.7338114113884555e-06, + "loss": 0.8154, + "step": 30504 + }, + { + "epoch": 0.78, + "learning_rate": 1.7337926130952764e-06, + "loss": 0.8486, + "step": 30505 + }, + { + "epoch": 0.78, + "learning_rate": 1.733773814240266e-06, + "loss": 0.8848, + "step": 30506 + }, + { + "epoch": 0.78, + "learning_rate": 1.7337550148234387e-06, + "loss": 0.9111, + "step": 30507 + }, + { + "epoch": 0.78, + "learning_rate": 1.733736214844809e-06, + "loss": 0.6182, + "step": 30508 + }, + { + "epoch": 0.78, + "learning_rate": 1.7337174143043911e-06, + "loss": 0.8281, + "step": 30509 + }, + { + "epoch": 0.78, + "learning_rate": 1.7336986132021996e-06, + "loss": 0.9531, + "step": 30510 + }, + { + "epoch": 0.78, + "learning_rate": 1.7336798115382485e-06, + "loss": 0.8115, + "step": 30511 + }, + { + "epoch": 0.78, + "learning_rate": 1.733661009312553e-06, + "loss": 1.0127, + "step": 30512 + }, + { + "epoch": 0.78, + "learning_rate": 1.7336422065251268e-06, + "loss": 0.7402, + "step": 30513 + }, + { + "epoch": 0.78, + "learning_rate": 1.7336234031759841e-06, + "loss": 0.9121, + "step": 30514 + }, + { + "epoch": 0.78, + "learning_rate": 1.7336045992651402e-06, + "loss": 0.6697, + "step": 30515 + }, + { + "epoch": 0.78, + "learning_rate": 1.733585794792609e-06, + "loss": 0.9053, + "step": 30516 + }, + { + "epoch": 0.78, + "learning_rate": 1.7335669897584047e-06, + "loss": 0.9092, + "step": 30517 + }, + { + "epoch": 0.78, + "learning_rate": 1.733548184162542e-06, + "loss": 0.8135, + "step": 30518 + }, + { + "epoch": 0.78, + "learning_rate": 1.733529378005035e-06, + "loss": 0.8057, + "step": 30519 + }, + { + "epoch": 0.78, + "learning_rate": 1.7335105712858983e-06, + "loss": 0.9346, + "step": 30520 + }, + { + "epoch": 0.78, + "learning_rate": 1.7334917640051466e-06, + "loss": 0.8418, + "step": 30521 + }, + { + "epoch": 0.78, + "learning_rate": 1.7334729561627938e-06, + "loss": 0.8701, + "step": 30522 + }, + { + "epoch": 0.78, + "learning_rate": 1.7334541477588545e-06, + "loss": 1.0752, + "step": 30523 + }, + { + "epoch": 0.78, + "learning_rate": 1.7334353387933428e-06, + "loss": 0.7444, + "step": 30524 + }, + { + "epoch": 0.78, + "learning_rate": 1.7334165292662734e-06, + "loss": 0.7549, + "step": 30525 + }, + { + "epoch": 0.78, + "learning_rate": 1.733397719177661e-06, + "loss": 0.8662, + "step": 30526 + }, + { + "epoch": 0.78, + "learning_rate": 1.7333789085275198e-06, + "loss": 0.9736, + "step": 30527 + }, + { + "epoch": 0.78, + "learning_rate": 1.7333600973158637e-06, + "loss": 1.002, + "step": 30528 + }, + { + "epoch": 0.78, + "learning_rate": 1.7333412855427077e-06, + "loss": 0.8721, + "step": 30529 + }, + { + "epoch": 0.78, + "learning_rate": 1.7333224732080661e-06, + "loss": 0.7183, + "step": 30530 + }, + { + "epoch": 0.78, + "learning_rate": 1.7333036603119528e-06, + "loss": 1.3154, + "step": 30531 + }, + { + "epoch": 0.78, + "learning_rate": 1.733284846854383e-06, + "loss": 0.6633, + "step": 30532 + }, + { + "epoch": 0.78, + "learning_rate": 1.7332660328353708e-06, + "loss": 0.9033, + "step": 30533 + }, + { + "epoch": 0.78, + "learning_rate": 1.73324721825493e-06, + "loss": 0.7578, + "step": 30534 + }, + { + "epoch": 0.78, + "learning_rate": 1.733228403113076e-06, + "loss": 0.8159, + "step": 30535 + }, + { + "epoch": 0.78, + "learning_rate": 1.7332095874098224e-06, + "loss": 0.8262, + "step": 30536 + }, + { + "epoch": 0.78, + "learning_rate": 1.733190771145184e-06, + "loss": 0.7373, + "step": 30537 + }, + { + "epoch": 0.78, + "learning_rate": 1.7331719543191755e-06, + "loss": 0.875, + "step": 30538 + }, + { + "epoch": 0.78, + "learning_rate": 1.7331531369318104e-06, + "loss": 0.7832, + "step": 30539 + }, + { + "epoch": 0.78, + "learning_rate": 1.733134318983104e-06, + "loss": 1.0068, + "step": 30540 + }, + { + "epoch": 0.78, + "learning_rate": 1.73311550047307e-06, + "loss": 0.6387, + "step": 30541 + }, + { + "epoch": 0.78, + "learning_rate": 1.733096681401724e-06, + "loss": 0.4897, + "step": 30542 + }, + { + "epoch": 0.78, + "learning_rate": 1.7330778617690788e-06, + "loss": 0.9326, + "step": 30543 + }, + { + "epoch": 0.78, + "learning_rate": 1.7330590415751497e-06, + "loss": 0.7754, + "step": 30544 + }, + { + "epoch": 0.78, + "learning_rate": 1.7330402208199514e-06, + "loss": 0.7222, + "step": 30545 + }, + { + "epoch": 0.78, + "learning_rate": 1.7330213995034975e-06, + "loss": 0.5425, + "step": 30546 + }, + { + "epoch": 0.78, + "learning_rate": 1.733002577625803e-06, + "loss": 0.9404, + "step": 30547 + }, + { + "epoch": 0.78, + "learning_rate": 1.732983755186882e-06, + "loss": 0.8896, + "step": 30548 + }, + { + "epoch": 0.78, + "learning_rate": 1.732964932186749e-06, + "loss": 1.0615, + "step": 30549 + }, + { + "epoch": 0.78, + "learning_rate": 1.7329461086254188e-06, + "loss": 0.752, + "step": 30550 + }, + { + "epoch": 0.78, + "learning_rate": 1.7329272845029053e-06, + "loss": 0.9912, + "step": 30551 + }, + { + "epoch": 0.78, + "learning_rate": 1.7329084598192228e-06, + "loss": 0.915, + "step": 30552 + }, + { + "epoch": 0.78, + "learning_rate": 1.7328896345743864e-06, + "loss": 0.8042, + "step": 30553 + }, + { + "epoch": 0.78, + "learning_rate": 1.7328708087684096e-06, + "loss": 1.0801, + "step": 30554 + }, + { + "epoch": 0.78, + "learning_rate": 1.732851982401308e-06, + "loss": 0.9268, + "step": 30555 + }, + { + "epoch": 0.78, + "learning_rate": 1.7328331554730948e-06, + "loss": 0.7891, + "step": 30556 + }, + { + "epoch": 0.78, + "learning_rate": 1.7328143279837853e-06, + "loss": 0.958, + "step": 30557 + }, + { + "epoch": 0.78, + "learning_rate": 1.732795499933393e-06, + "loss": 0.8281, + "step": 30558 + }, + { + "epoch": 0.78, + "learning_rate": 1.7327766713219334e-06, + "loss": 0.9209, + "step": 30559 + }, + { + "epoch": 0.78, + "learning_rate": 1.7327578421494201e-06, + "loss": 0.8965, + "step": 30560 + }, + { + "epoch": 0.78, + "learning_rate": 1.7327390124158682e-06, + "loss": 0.8203, + "step": 30561 + }, + { + "epoch": 0.78, + "learning_rate": 1.7327201821212916e-06, + "loss": 0.8018, + "step": 30562 + }, + { + "epoch": 0.78, + "learning_rate": 1.7327013512657048e-06, + "loss": 1.082, + "step": 30563 + }, + { + "epoch": 0.78, + "learning_rate": 1.732682519849122e-06, + "loss": 0.6718, + "step": 30564 + }, + { + "epoch": 0.78, + "learning_rate": 1.7326636878715584e-06, + "loss": 0.5869, + "step": 30565 + }, + { + "epoch": 0.78, + "learning_rate": 1.7326448553330274e-06, + "loss": 0.8535, + "step": 30566 + }, + { + "epoch": 0.78, + "learning_rate": 1.732626022233544e-06, + "loss": 0.8374, + "step": 30567 + }, + { + "epoch": 0.78, + "learning_rate": 1.7326071885731228e-06, + "loss": 0.9932, + "step": 30568 + }, + { + "epoch": 0.78, + "learning_rate": 1.732588354351778e-06, + "loss": 0.7178, + "step": 30569 + }, + { + "epoch": 0.78, + "learning_rate": 1.7325695195695236e-06, + "loss": 0.6948, + "step": 30570 + }, + { + "epoch": 0.78, + "learning_rate": 1.7325506842263746e-06, + "loss": 0.8452, + "step": 30571 + }, + { + "epoch": 0.78, + "learning_rate": 1.7325318483223454e-06, + "loss": 0.8237, + "step": 30572 + }, + { + "epoch": 0.78, + "learning_rate": 1.73251301185745e-06, + "loss": 0.6733, + "step": 30573 + }, + { + "epoch": 0.78, + "learning_rate": 1.7324941748317033e-06, + "loss": 0.7646, + "step": 30574 + }, + { + "epoch": 0.78, + "learning_rate": 1.7324753372451192e-06, + "loss": 0.9355, + "step": 30575 + }, + { + "epoch": 0.78, + "learning_rate": 1.7324564990977127e-06, + "loss": 0.8018, + "step": 30576 + }, + { + "epoch": 0.78, + "learning_rate": 1.7324376603894977e-06, + "loss": 0.8105, + "step": 30577 + }, + { + "epoch": 0.78, + "learning_rate": 1.7324188211204889e-06, + "loss": 0.8164, + "step": 30578 + }, + { + "epoch": 0.78, + "learning_rate": 1.7323999812907006e-06, + "loss": 0.8276, + "step": 30579 + }, + { + "epoch": 0.78, + "learning_rate": 1.7323811409001475e-06, + "loss": 0.9834, + "step": 30580 + }, + { + "epoch": 0.78, + "learning_rate": 1.732362299948844e-06, + "loss": 0.9404, + "step": 30581 + }, + { + "epoch": 0.78, + "learning_rate": 1.732343458436804e-06, + "loss": 0.8856, + "step": 30582 + }, + { + "epoch": 0.78, + "learning_rate": 1.7323246163640425e-06, + "loss": 0.9883, + "step": 30583 + }, + { + "epoch": 0.78, + "learning_rate": 1.7323057737305737e-06, + "loss": 0.8076, + "step": 30584 + }, + { + "epoch": 0.78, + "learning_rate": 1.7322869305364121e-06, + "loss": 1.0283, + "step": 30585 + }, + { + "epoch": 0.78, + "learning_rate": 1.7322680867815719e-06, + "loss": 0.8428, + "step": 30586 + }, + { + "epoch": 0.78, + "learning_rate": 1.732249242466068e-06, + "loss": 0.7949, + "step": 30587 + }, + { + "epoch": 0.78, + "learning_rate": 1.7322303975899141e-06, + "loss": 0.7578, + "step": 30588 + }, + { + "epoch": 0.78, + "learning_rate": 1.7322115521531252e-06, + "loss": 0.958, + "step": 30589 + }, + { + "epoch": 0.78, + "learning_rate": 1.7321927061557155e-06, + "loss": 0.689, + "step": 30590 + }, + { + "epoch": 0.78, + "learning_rate": 1.7321738595977e-06, + "loss": 0.7959, + "step": 30591 + }, + { + "epoch": 0.78, + "learning_rate": 1.732155012479092e-06, + "loss": 0.686, + "step": 30592 + }, + { + "epoch": 0.78, + "learning_rate": 1.732136164799907e-06, + "loss": 0.8398, + "step": 30593 + }, + { + "epoch": 0.78, + "learning_rate": 1.7321173165601588e-06, + "loss": 1.126, + "step": 30594 + }, + { + "epoch": 0.78, + "learning_rate": 1.732098467759862e-06, + "loss": 0.5806, + "step": 30595 + }, + { + "epoch": 0.78, + "learning_rate": 1.7320796183990312e-06, + "loss": 0.9243, + "step": 30596 + }, + { + "epoch": 0.78, + "learning_rate": 1.7320607684776807e-06, + "loss": 0.7998, + "step": 30597 + }, + { + "epoch": 0.78, + "learning_rate": 1.7320419179958247e-06, + "loss": 0.7847, + "step": 30598 + }, + { + "epoch": 0.78, + "learning_rate": 1.732023066953478e-06, + "loss": 0.7148, + "step": 30599 + }, + { + "epoch": 0.78, + "learning_rate": 1.7320042153506554e-06, + "loss": 0.9365, + "step": 30600 + }, + { + "epoch": 0.78, + "learning_rate": 1.7319853631873703e-06, + "loss": 0.7783, + "step": 30601 + }, + { + "epoch": 0.78, + "learning_rate": 1.7319665104636378e-06, + "loss": 1.0088, + "step": 30602 + }, + { + "epoch": 0.78, + "learning_rate": 1.731947657179472e-06, + "loss": 0.8848, + "step": 30603 + }, + { + "epoch": 0.78, + "learning_rate": 1.7319288033348877e-06, + "loss": 0.8232, + "step": 30604 + }, + { + "epoch": 0.78, + "learning_rate": 1.7319099489298992e-06, + "loss": 0.7803, + "step": 30605 + }, + { + "epoch": 0.78, + "learning_rate": 1.7318910939645207e-06, + "loss": 0.8047, + "step": 30606 + }, + { + "epoch": 0.78, + "learning_rate": 1.7318722384387673e-06, + "loss": 0.8945, + "step": 30607 + }, + { + "epoch": 0.78, + "learning_rate": 1.7318533823526524e-06, + "loss": 0.7021, + "step": 30608 + }, + { + "epoch": 0.78, + "learning_rate": 1.7318345257061916e-06, + "loss": 0.7354, + "step": 30609 + }, + { + "epoch": 0.78, + "learning_rate": 1.7318156684993983e-06, + "loss": 1.1035, + "step": 30610 + }, + { + "epoch": 0.78, + "learning_rate": 1.7317968107322875e-06, + "loss": 0.9072, + "step": 30611 + }, + { + "epoch": 0.78, + "learning_rate": 1.7317779524048736e-06, + "loss": 1.0566, + "step": 30612 + }, + { + "epoch": 0.78, + "learning_rate": 1.7317590935171708e-06, + "loss": 0.707, + "step": 30613 + }, + { + "epoch": 0.78, + "learning_rate": 1.731740234069194e-06, + "loss": 0.9629, + "step": 30614 + }, + { + "epoch": 0.78, + "learning_rate": 1.731721374060957e-06, + "loss": 1.0205, + "step": 30615 + }, + { + "epoch": 0.78, + "learning_rate": 1.7317025134924749e-06, + "loss": 0.8296, + "step": 30616 + }, + { + "epoch": 0.78, + "learning_rate": 1.7316836523637618e-06, + "loss": 0.8252, + "step": 30617 + }, + { + "epoch": 0.78, + "learning_rate": 1.731664790674832e-06, + "loss": 0.9951, + "step": 30618 + }, + { + "epoch": 0.78, + "learning_rate": 1.7316459284257001e-06, + "loss": 0.874, + "step": 30619 + }, + { + "epoch": 0.78, + "learning_rate": 1.7316270656163807e-06, + "loss": 0.6406, + "step": 30620 + }, + { + "epoch": 0.78, + "learning_rate": 1.731608202246888e-06, + "loss": 0.8818, + "step": 30621 + }, + { + "epoch": 0.78, + "learning_rate": 1.7315893383172369e-06, + "loss": 0.9746, + "step": 30622 + }, + { + "epoch": 0.78, + "learning_rate": 1.731570473827441e-06, + "loss": 0.7412, + "step": 30623 + }, + { + "epoch": 0.78, + "learning_rate": 1.7315516087775156e-06, + "loss": 1.0381, + "step": 30624 + }, + { + "epoch": 0.78, + "learning_rate": 1.7315327431674744e-06, + "loss": 0.6729, + "step": 30625 + }, + { + "epoch": 0.78, + "learning_rate": 1.7315138769973326e-06, + "loss": 1.002, + "step": 30626 + }, + { + "epoch": 0.78, + "learning_rate": 1.7314950102671038e-06, + "loss": 1.1914, + "step": 30627 + }, + { + "epoch": 0.79, + "learning_rate": 1.7314761429768032e-06, + "loss": 0.8379, + "step": 30628 + }, + { + "epoch": 0.79, + "learning_rate": 1.7314572751264448e-06, + "loss": 0.8652, + "step": 30629 + }, + { + "epoch": 0.79, + "learning_rate": 1.7314384067160434e-06, + "loss": 0.8247, + "step": 30630 + }, + { + "epoch": 0.79, + "learning_rate": 1.7314195377456131e-06, + "loss": 0.6304, + "step": 30631 + }, + { + "epoch": 0.79, + "learning_rate": 1.7314006682151688e-06, + "loss": 0.8838, + "step": 30632 + }, + { + "epoch": 0.79, + "learning_rate": 1.7313817981247242e-06, + "loss": 0.7842, + "step": 30633 + }, + { + "epoch": 0.79, + "learning_rate": 1.7313629274742946e-06, + "loss": 0.8135, + "step": 30634 + }, + { + "epoch": 0.79, + "learning_rate": 1.7313440562638935e-06, + "loss": 0.8188, + "step": 30635 + }, + { + "epoch": 0.79, + "learning_rate": 1.7313251844935364e-06, + "loss": 0.6675, + "step": 30636 + }, + { + "epoch": 0.79, + "learning_rate": 1.7313063121632369e-06, + "loss": 0.7959, + "step": 30637 + }, + { + "epoch": 0.79, + "learning_rate": 1.7312874392730099e-06, + "loss": 0.6084, + "step": 30638 + }, + { + "epoch": 0.79, + "learning_rate": 1.7312685658228697e-06, + "loss": 0.7371, + "step": 30639 + }, + { + "epoch": 0.79, + "learning_rate": 1.7312496918128308e-06, + "loss": 0.8535, + "step": 30640 + }, + { + "epoch": 0.79, + "learning_rate": 1.7312308172429076e-06, + "loss": 0.7988, + "step": 30641 + }, + { + "epoch": 0.79, + "learning_rate": 1.7312119421131146e-06, + "loss": 0.7402, + "step": 30642 + }, + { + "epoch": 0.79, + "learning_rate": 1.7311930664234664e-06, + "loss": 0.9268, + "step": 30643 + }, + { + "epoch": 0.79, + "learning_rate": 1.7311741901739772e-06, + "loss": 0.8018, + "step": 30644 + }, + { + "epoch": 0.79, + "learning_rate": 1.7311553133646615e-06, + "loss": 0.8467, + "step": 30645 + }, + { + "epoch": 0.79, + "learning_rate": 1.7311364359955337e-06, + "loss": 0.7932, + "step": 30646 + }, + { + "epoch": 0.79, + "learning_rate": 1.7311175580666085e-06, + "loss": 0.8853, + "step": 30647 + }, + { + "epoch": 0.79, + "learning_rate": 1.7310986795779003e-06, + "loss": 0.8682, + "step": 30648 + }, + { + "epoch": 0.79, + "learning_rate": 1.7310798005294234e-06, + "loss": 0.7578, + "step": 30649 + }, + { + "epoch": 0.79, + "learning_rate": 1.7310609209211919e-06, + "loss": 0.9893, + "step": 30650 + }, + { + "epoch": 0.79, + "learning_rate": 1.7310420407532211e-06, + "loss": 1.0547, + "step": 30651 + }, + { + "epoch": 0.79, + "learning_rate": 1.731023160025525e-06, + "loss": 0.9307, + "step": 30652 + }, + { + "epoch": 0.79, + "learning_rate": 1.7310042787381182e-06, + "loss": 0.8369, + "step": 30653 + }, + { + "epoch": 0.79, + "learning_rate": 1.7309853968910147e-06, + "loss": 0.9434, + "step": 30654 + }, + { + "epoch": 0.79, + "learning_rate": 1.7309665144842294e-06, + "loss": 0.8984, + "step": 30655 + }, + { + "epoch": 0.79, + "learning_rate": 1.7309476315177767e-06, + "loss": 0.9951, + "step": 30656 + }, + { + "epoch": 0.79, + "learning_rate": 1.7309287479916708e-06, + "loss": 0.6865, + "step": 30657 + }, + { + "epoch": 0.79, + "learning_rate": 1.7309098639059268e-06, + "loss": 0.8862, + "step": 30658 + }, + { + "epoch": 0.79, + "learning_rate": 1.7308909792605584e-06, + "loss": 0.9023, + "step": 30659 + }, + { + "epoch": 0.79, + "learning_rate": 1.7308720940555804e-06, + "loss": 0.5674, + "step": 30660 + }, + { + "epoch": 0.79, + "learning_rate": 1.7308532082910072e-06, + "loss": 0.9004, + "step": 30661 + }, + { + "epoch": 0.79, + "learning_rate": 1.7308343219668535e-06, + "loss": 0.9258, + "step": 30662 + }, + { + "epoch": 0.79, + "learning_rate": 1.7308154350831337e-06, + "loss": 0.7988, + "step": 30663 + }, + { + "epoch": 0.79, + "learning_rate": 1.730796547639862e-06, + "loss": 0.9365, + "step": 30664 + }, + { + "epoch": 0.79, + "learning_rate": 1.7307776596370526e-06, + "loss": 0.9473, + "step": 30665 + }, + { + "epoch": 0.79, + "learning_rate": 1.7307587710747207e-06, + "loss": 1.0078, + "step": 30666 + }, + { + "epoch": 0.79, + "learning_rate": 1.7307398819528802e-06, + "loss": 0.9219, + "step": 30667 + }, + { + "epoch": 0.79, + "learning_rate": 1.730720992271546e-06, + "loss": 0.7881, + "step": 30668 + }, + { + "epoch": 0.79, + "learning_rate": 1.7307021020307325e-06, + "loss": 0.8232, + "step": 30669 + }, + { + "epoch": 0.79, + "learning_rate": 1.7306832112304535e-06, + "loss": 0.9795, + "step": 30670 + }, + { + "epoch": 0.79, + "learning_rate": 1.7306643198707243e-06, + "loss": 0.7393, + "step": 30671 + }, + { + "epoch": 0.79, + "learning_rate": 1.730645427951559e-06, + "loss": 0.9336, + "step": 30672 + }, + { + "epoch": 0.79, + "learning_rate": 1.7306265354729722e-06, + "loss": 0.5161, + "step": 30673 + }, + { + "epoch": 0.79, + "learning_rate": 1.730607642434978e-06, + "loss": 0.7217, + "step": 30674 + }, + { + "epoch": 0.79, + "learning_rate": 1.730588748837591e-06, + "loss": 0.998, + "step": 30675 + }, + { + "epoch": 0.79, + "learning_rate": 1.7305698546808261e-06, + "loss": 1.0957, + "step": 30676 + }, + { + "epoch": 0.79, + "learning_rate": 1.7305509599646976e-06, + "loss": 0.9785, + "step": 30677 + }, + { + "epoch": 0.79, + "learning_rate": 1.7305320646892193e-06, + "loss": 0.8037, + "step": 30678 + }, + { + "epoch": 0.79, + "learning_rate": 1.7305131688544065e-06, + "loss": 0.8936, + "step": 30679 + }, + { + "epoch": 0.79, + "learning_rate": 1.7304942724602734e-06, + "loss": 0.9551, + "step": 30680 + }, + { + "epoch": 0.79, + "learning_rate": 1.7304753755068342e-06, + "loss": 0.8755, + "step": 30681 + }, + { + "epoch": 0.79, + "learning_rate": 1.7304564779941039e-06, + "loss": 0.8535, + "step": 30682 + }, + { + "epoch": 0.79, + "learning_rate": 1.7304375799220962e-06, + "loss": 0.9248, + "step": 30683 + }, + { + "epoch": 0.79, + "learning_rate": 1.7304186812908265e-06, + "loss": 0.915, + "step": 30684 + }, + { + "epoch": 0.79, + "learning_rate": 1.7303997821003086e-06, + "loss": 0.9404, + "step": 30685 + }, + { + "epoch": 0.79, + "learning_rate": 1.7303808823505572e-06, + "loss": 0.8135, + "step": 30686 + }, + { + "epoch": 0.79, + "learning_rate": 1.730361982041587e-06, + "loss": 0.8438, + "step": 30687 + }, + { + "epoch": 0.79, + "learning_rate": 1.7303430811734119e-06, + "loss": 0.6401, + "step": 30688 + }, + { + "epoch": 0.79, + "learning_rate": 1.7303241797460468e-06, + "loss": 0.9736, + "step": 30689 + }, + { + "epoch": 0.79, + "learning_rate": 1.730305277759506e-06, + "loss": 0.7427, + "step": 30690 + }, + { + "epoch": 0.79, + "learning_rate": 1.730286375213804e-06, + "loss": 0.6758, + "step": 30691 + }, + { + "epoch": 0.79, + "learning_rate": 1.7302674721089555e-06, + "loss": 0.8867, + "step": 30692 + }, + { + "epoch": 0.79, + "learning_rate": 1.7302485684449745e-06, + "loss": 0.8105, + "step": 30693 + }, + { + "epoch": 0.79, + "learning_rate": 1.7302296642218758e-06, + "loss": 0.959, + "step": 30694 + }, + { + "epoch": 0.79, + "learning_rate": 1.7302107594396738e-06, + "loss": 1.0459, + "step": 30695 + }, + { + "epoch": 0.79, + "learning_rate": 1.7301918540983832e-06, + "loss": 0.7739, + "step": 30696 + }, + { + "epoch": 0.79, + "learning_rate": 1.7301729481980182e-06, + "loss": 0.8809, + "step": 30697 + }, + { + "epoch": 0.79, + "learning_rate": 1.730154041738593e-06, + "loss": 0.7354, + "step": 30698 + }, + { + "epoch": 0.79, + "learning_rate": 1.7301351347201232e-06, + "loss": 0.8906, + "step": 30699 + }, + { + "epoch": 0.79, + "learning_rate": 1.7301162271426218e-06, + "loss": 0.7607, + "step": 30700 + }, + { + "epoch": 0.79, + "learning_rate": 1.7300973190061044e-06, + "loss": 0.7153, + "step": 30701 + }, + { + "epoch": 0.79, + "learning_rate": 1.7300784103105847e-06, + "loss": 0.9541, + "step": 30702 + }, + { + "epoch": 0.79, + "learning_rate": 1.7300595010560777e-06, + "loss": 0.8428, + "step": 30703 + }, + { + "epoch": 0.79, + "learning_rate": 1.7300405912425978e-06, + "loss": 0.8223, + "step": 30704 + }, + { + "epoch": 0.79, + "learning_rate": 1.730021680870159e-06, + "loss": 0.9473, + "step": 30705 + }, + { + "epoch": 0.79, + "learning_rate": 1.7300027699387765e-06, + "loss": 0.8545, + "step": 30706 + }, + { + "epoch": 0.79, + "learning_rate": 1.7299838584484644e-06, + "loss": 0.7676, + "step": 30707 + }, + { + "epoch": 0.79, + "learning_rate": 1.7299649463992374e-06, + "loss": 1.1797, + "step": 30708 + }, + { + "epoch": 0.79, + "learning_rate": 1.7299460337911097e-06, + "loss": 0.7607, + "step": 30709 + }, + { + "epoch": 0.79, + "learning_rate": 1.7299271206240954e-06, + "loss": 0.7832, + "step": 30710 + }, + { + "epoch": 0.79, + "learning_rate": 1.7299082068982101e-06, + "loss": 0.8047, + "step": 30711 + }, + { + "epoch": 0.79, + "learning_rate": 1.7298892926134677e-06, + "loss": 0.7607, + "step": 30712 + }, + { + "epoch": 0.79, + "learning_rate": 1.729870377769882e-06, + "loss": 0.9463, + "step": 30713 + }, + { + "epoch": 0.79, + "learning_rate": 1.7298514623674688e-06, + "loss": 0.8525, + "step": 30714 + }, + { + "epoch": 0.79, + "learning_rate": 1.7298325464062415e-06, + "loss": 0.9541, + "step": 30715 + }, + { + "epoch": 0.79, + "learning_rate": 1.729813629886215e-06, + "loss": 0.8672, + "step": 30716 + }, + { + "epoch": 0.79, + "learning_rate": 1.7297947128074037e-06, + "loss": 1.0127, + "step": 30717 + }, + { + "epoch": 0.79, + "learning_rate": 1.7297757951698224e-06, + "loss": 0.8555, + "step": 30718 + }, + { + "epoch": 0.79, + "learning_rate": 1.729756876973485e-06, + "loss": 0.8232, + "step": 30719 + }, + { + "epoch": 0.79, + "learning_rate": 1.7297379582184066e-06, + "loss": 0.9443, + "step": 30720 + }, + { + "epoch": 0.79, + "learning_rate": 1.7297190389046013e-06, + "loss": 0.8086, + "step": 30721 + }, + { + "epoch": 0.79, + "learning_rate": 1.7297001190320837e-06, + "loss": 0.6499, + "step": 30722 + }, + { + "epoch": 0.79, + "learning_rate": 1.7296811986008681e-06, + "loss": 0.7642, + "step": 30723 + }, + { + "epoch": 0.79, + "learning_rate": 1.7296622776109695e-06, + "loss": 0.8613, + "step": 30724 + }, + { + "epoch": 0.79, + "learning_rate": 1.7296433560624018e-06, + "loss": 0.7678, + "step": 30725 + }, + { + "epoch": 0.79, + "learning_rate": 1.7296244339551797e-06, + "loss": 0.6841, + "step": 30726 + }, + { + "epoch": 0.79, + "learning_rate": 1.7296055112893178e-06, + "loss": 0.835, + "step": 30727 + }, + { + "epoch": 0.79, + "learning_rate": 1.7295865880648304e-06, + "loss": 0.9883, + "step": 30728 + }, + { + "epoch": 0.79, + "learning_rate": 1.7295676642817324e-06, + "loss": 0.917, + "step": 30729 + }, + { + "epoch": 0.79, + "learning_rate": 1.7295487399400376e-06, + "loss": 1.0215, + "step": 30730 + }, + { + "epoch": 0.79, + "learning_rate": 1.7295298150397612e-06, + "loss": 0.5799, + "step": 30731 + }, + { + "epoch": 0.79, + "learning_rate": 1.7295108895809171e-06, + "loss": 0.9072, + "step": 30732 + }, + { + "epoch": 0.79, + "learning_rate": 1.7294919635635203e-06, + "loss": 0.9473, + "step": 30733 + }, + { + "epoch": 0.79, + "learning_rate": 1.7294730369875849e-06, + "loss": 0.9014, + "step": 30734 + }, + { + "epoch": 0.79, + "learning_rate": 1.7294541098531256e-06, + "loss": 0.7461, + "step": 30735 + }, + { + "epoch": 0.79, + "learning_rate": 1.7294351821601566e-06, + "loss": 0.6836, + "step": 30736 + }, + { + "epoch": 0.79, + "learning_rate": 1.7294162539086932e-06, + "loss": 0.6914, + "step": 30737 + }, + { + "epoch": 0.79, + "learning_rate": 1.7293973250987488e-06, + "loss": 0.9395, + "step": 30738 + }, + { + "epoch": 0.79, + "learning_rate": 1.7293783957303387e-06, + "loss": 0.6709, + "step": 30739 + }, + { + "epoch": 0.79, + "learning_rate": 1.7293594658034768e-06, + "loss": 0.7412, + "step": 30740 + }, + { + "epoch": 0.79, + "learning_rate": 1.729340535318178e-06, + "loss": 1.0283, + "step": 30741 + }, + { + "epoch": 0.79, + "learning_rate": 1.7293216042744568e-06, + "loss": 1.0615, + "step": 30742 + }, + { + "epoch": 0.79, + "learning_rate": 1.7293026726723276e-06, + "loss": 1.0049, + "step": 30743 + }, + { + "epoch": 0.79, + "learning_rate": 1.7292837405118048e-06, + "loss": 0.8662, + "step": 30744 + }, + { + "epoch": 0.79, + "learning_rate": 1.729264807792903e-06, + "loss": 0.8394, + "step": 30745 + }, + { + "epoch": 0.79, + "learning_rate": 1.7292458745156365e-06, + "loss": 0.8701, + "step": 30746 + }, + { + "epoch": 0.79, + "learning_rate": 1.72922694068002e-06, + "loss": 0.8379, + "step": 30747 + }, + { + "epoch": 0.79, + "learning_rate": 1.7292080062860681e-06, + "loss": 0.8882, + "step": 30748 + }, + { + "epoch": 0.79, + "learning_rate": 1.729189071333795e-06, + "loss": 0.6709, + "step": 30749 + }, + { + "epoch": 0.79, + "learning_rate": 1.7291701358232155e-06, + "loss": 0.9414, + "step": 30750 + }, + { + "epoch": 0.79, + "learning_rate": 1.729151199754344e-06, + "loss": 0.9365, + "step": 30751 + }, + { + "epoch": 0.79, + "learning_rate": 1.729132263127195e-06, + "loss": 0.6064, + "step": 30752 + }, + { + "epoch": 0.79, + "learning_rate": 1.7291133259417827e-06, + "loss": 0.8164, + "step": 30753 + }, + { + "epoch": 0.79, + "learning_rate": 1.7290943881981221e-06, + "loss": 0.7495, + "step": 30754 + }, + { + "epoch": 0.79, + "learning_rate": 1.7290754498962272e-06, + "loss": 1.1338, + "step": 30755 + }, + { + "epoch": 0.79, + "learning_rate": 1.7290565110361128e-06, + "loss": 0.9697, + "step": 30756 + }, + { + "epoch": 0.79, + "learning_rate": 1.7290375716177938e-06, + "loss": 0.9658, + "step": 30757 + }, + { + "epoch": 0.79, + "learning_rate": 1.7290186316412838e-06, + "loss": 0.917, + "step": 30758 + }, + { + "epoch": 0.79, + "learning_rate": 1.7289996911065977e-06, + "loss": 0.7979, + "step": 30759 + }, + { + "epoch": 0.79, + "learning_rate": 1.7289807500137502e-06, + "loss": 1.0078, + "step": 30760 + }, + { + "epoch": 0.79, + "learning_rate": 1.7289618083627557e-06, + "loss": 0.7764, + "step": 30761 + }, + { + "epoch": 0.79, + "learning_rate": 1.7289428661536286e-06, + "loss": 0.7451, + "step": 30762 + }, + { + "epoch": 0.79, + "learning_rate": 1.7289239233863838e-06, + "loss": 0.7949, + "step": 30763 + }, + { + "epoch": 0.79, + "learning_rate": 1.728904980061035e-06, + "loss": 0.8408, + "step": 30764 + }, + { + "epoch": 0.79, + "learning_rate": 1.7288860361775974e-06, + "loss": 0.9346, + "step": 30765 + }, + { + "epoch": 0.79, + "learning_rate": 1.728867091736085e-06, + "loss": 0.7803, + "step": 30766 + }, + { + "epoch": 0.79, + "learning_rate": 1.728848146736513e-06, + "loss": 0.8271, + "step": 30767 + }, + { + "epoch": 0.79, + "learning_rate": 1.7288292011788955e-06, + "loss": 0.9258, + "step": 30768 + }, + { + "epoch": 0.79, + "learning_rate": 1.7288102550632466e-06, + "loss": 0.7881, + "step": 30769 + }, + { + "epoch": 0.79, + "learning_rate": 1.728791308389581e-06, + "loss": 0.8535, + "step": 30770 + }, + { + "epoch": 0.79, + "learning_rate": 1.7287723611579141e-06, + "loss": 0.9434, + "step": 30771 + }, + { + "epoch": 0.79, + "learning_rate": 1.7287534133682594e-06, + "loss": 1.1094, + "step": 30772 + }, + { + "epoch": 0.79, + "learning_rate": 1.7287344650206317e-06, + "loss": 0.8115, + "step": 30773 + }, + { + "epoch": 0.79, + "learning_rate": 1.7287155161150455e-06, + "loss": 0.9668, + "step": 30774 + }, + { + "epoch": 0.79, + "learning_rate": 1.7286965666515154e-06, + "loss": 0.7739, + "step": 30775 + }, + { + "epoch": 0.79, + "learning_rate": 1.7286776166300557e-06, + "loss": 0.7461, + "step": 30776 + }, + { + "epoch": 0.79, + "learning_rate": 1.7286586660506814e-06, + "loss": 0.8396, + "step": 30777 + }, + { + "epoch": 0.79, + "learning_rate": 1.7286397149134064e-06, + "loss": 1.3643, + "step": 30778 + }, + { + "epoch": 0.79, + "learning_rate": 1.7286207632182455e-06, + "loss": 0.3237, + "step": 30779 + }, + { + "epoch": 0.79, + "learning_rate": 1.7286018109652132e-06, + "loss": 0.8613, + "step": 30780 + }, + { + "epoch": 0.79, + "learning_rate": 1.7285828581543238e-06, + "loss": 0.9844, + "step": 30781 + }, + { + "epoch": 0.79, + "learning_rate": 1.7285639047855923e-06, + "loss": 0.9209, + "step": 30782 + }, + { + "epoch": 0.79, + "learning_rate": 1.7285449508590331e-06, + "loss": 0.6904, + "step": 30783 + }, + { + "epoch": 0.79, + "learning_rate": 1.7285259963746602e-06, + "loss": 0.7217, + "step": 30784 + }, + { + "epoch": 0.79, + "learning_rate": 1.7285070413324885e-06, + "loss": 0.8623, + "step": 30785 + }, + { + "epoch": 0.79, + "learning_rate": 1.7284880857325324e-06, + "loss": 0.7988, + "step": 30786 + }, + { + "epoch": 0.79, + "learning_rate": 1.7284691295748065e-06, + "loss": 0.7505, + "step": 30787 + }, + { + "epoch": 0.79, + "learning_rate": 1.7284501728593252e-06, + "loss": 0.9697, + "step": 30788 + }, + { + "epoch": 0.79, + "learning_rate": 1.7284312155861033e-06, + "loss": 0.5938, + "step": 30789 + }, + { + "epoch": 0.79, + "learning_rate": 1.728412257755155e-06, + "loss": 0.9629, + "step": 30790 + }, + { + "epoch": 0.79, + "learning_rate": 1.7283932993664948e-06, + "loss": 0.7476, + "step": 30791 + }, + { + "epoch": 0.79, + "learning_rate": 1.7283743404201374e-06, + "loss": 0.833, + "step": 30792 + }, + { + "epoch": 0.79, + "learning_rate": 1.7283553809160974e-06, + "loss": 0.7886, + "step": 30793 + }, + { + "epoch": 0.79, + "learning_rate": 1.7283364208543892e-06, + "loss": 0.7654, + "step": 30794 + }, + { + "epoch": 0.79, + "learning_rate": 1.7283174602350271e-06, + "loss": 0.8564, + "step": 30795 + }, + { + "epoch": 0.79, + "learning_rate": 1.728298499058026e-06, + "loss": 0.8252, + "step": 30796 + }, + { + "epoch": 0.79, + "learning_rate": 1.7282795373234002e-06, + "loss": 0.7617, + "step": 30797 + }, + { + "epoch": 0.79, + "learning_rate": 1.728260575031164e-06, + "loss": 1.0146, + "step": 30798 + }, + { + "epoch": 0.79, + "learning_rate": 1.7282416121813326e-06, + "loss": 0.7578, + "step": 30799 + }, + { + "epoch": 0.79, + "learning_rate": 1.72822264877392e-06, + "loss": 0.7676, + "step": 30800 + }, + { + "epoch": 0.79, + "learning_rate": 1.7282036848089404e-06, + "loss": 0.8965, + "step": 30801 + }, + { + "epoch": 0.79, + "learning_rate": 1.728184720286409e-06, + "loss": 0.9629, + "step": 30802 + }, + { + "epoch": 0.79, + "learning_rate": 1.72816575520634e-06, + "loss": 0.667, + "step": 30803 + }, + { + "epoch": 0.79, + "learning_rate": 1.7281467895687481e-06, + "loss": 0.9229, + "step": 30804 + }, + { + "epoch": 0.79, + "learning_rate": 1.7281278233736477e-06, + "loss": 0.9121, + "step": 30805 + }, + { + "epoch": 0.79, + "learning_rate": 1.7281088566210528e-06, + "loss": 0.7524, + "step": 30806 + }, + { + "epoch": 0.79, + "learning_rate": 1.728089889310979e-06, + "loss": 0.8926, + "step": 30807 + }, + { + "epoch": 0.79, + "learning_rate": 1.7280709214434398e-06, + "loss": 0.7563, + "step": 30808 + }, + { + "epoch": 0.79, + "learning_rate": 1.7280519530184506e-06, + "loss": 0.8652, + "step": 30809 + }, + { + "epoch": 0.79, + "learning_rate": 1.7280329840360252e-06, + "loss": 1.0264, + "step": 30810 + }, + { + "epoch": 0.79, + "learning_rate": 1.7280140144961788e-06, + "loss": 0.9258, + "step": 30811 + }, + { + "epoch": 0.79, + "learning_rate": 1.7279950443989252e-06, + "loss": 0.9375, + "step": 30812 + }, + { + "epoch": 0.79, + "learning_rate": 1.7279760737442795e-06, + "loss": 0.9346, + "step": 30813 + }, + { + "epoch": 0.79, + "learning_rate": 1.7279571025322554e-06, + "loss": 0.9365, + "step": 30814 + }, + { + "epoch": 0.79, + "learning_rate": 1.7279381307628686e-06, + "loss": 0.7412, + "step": 30815 + }, + { + "epoch": 0.79, + "learning_rate": 1.727919158436133e-06, + "loss": 0.8342, + "step": 30816 + }, + { + "epoch": 0.79, + "learning_rate": 1.727900185552063e-06, + "loss": 0.9189, + "step": 30817 + }, + { + "epoch": 0.79, + "learning_rate": 1.7278812121106734e-06, + "loss": 0.7227, + "step": 30818 + }, + { + "epoch": 0.79, + "learning_rate": 1.7278622381119784e-06, + "loss": 0.7285, + "step": 30819 + }, + { + "epoch": 0.79, + "learning_rate": 1.727843263555993e-06, + "loss": 1.1104, + "step": 30820 + }, + { + "epoch": 0.79, + "learning_rate": 1.7278242884427316e-06, + "loss": 0.8984, + "step": 30821 + }, + { + "epoch": 0.79, + "learning_rate": 1.7278053127722086e-06, + "loss": 0.8809, + "step": 30822 + }, + { + "epoch": 0.79, + "learning_rate": 1.727786336544438e-06, + "loss": 0.7734, + "step": 30823 + }, + { + "epoch": 0.79, + "learning_rate": 1.7277673597594356e-06, + "loss": 0.7505, + "step": 30824 + }, + { + "epoch": 0.79, + "learning_rate": 1.7277483824172147e-06, + "loss": 0.8125, + "step": 30825 + }, + { + "epoch": 0.79, + "learning_rate": 1.7277294045177903e-06, + "loss": 0.8115, + "step": 30826 + }, + { + "epoch": 0.79, + "learning_rate": 1.7277104260611773e-06, + "loss": 0.8604, + "step": 30827 + }, + { + "epoch": 0.79, + "learning_rate": 1.7276914470473898e-06, + "loss": 0.6641, + "step": 30828 + }, + { + "epoch": 0.79, + "learning_rate": 1.7276724674764422e-06, + "loss": 1.0703, + "step": 30829 + }, + { + "epoch": 0.79, + "learning_rate": 1.7276534873483492e-06, + "loss": 0.6675, + "step": 30830 + }, + { + "epoch": 0.79, + "learning_rate": 1.7276345066631258e-06, + "loss": 0.8984, + "step": 30831 + }, + { + "epoch": 0.79, + "learning_rate": 1.7276155254207857e-06, + "loss": 0.998, + "step": 30832 + }, + { + "epoch": 0.79, + "learning_rate": 1.727596543621344e-06, + "loss": 1.1318, + "step": 30833 + }, + { + "epoch": 0.79, + "learning_rate": 1.7275775612648151e-06, + "loss": 0.7549, + "step": 30834 + }, + { + "epoch": 0.79, + "learning_rate": 1.7275585783512136e-06, + "loss": 0.8301, + "step": 30835 + }, + { + "epoch": 0.79, + "learning_rate": 1.7275395948805539e-06, + "loss": 0.8984, + "step": 30836 + }, + { + "epoch": 0.79, + "learning_rate": 1.7275206108528506e-06, + "loss": 0.915, + "step": 30837 + }, + { + "epoch": 0.79, + "learning_rate": 1.727501626268118e-06, + "loss": 0.8535, + "step": 30838 + }, + { + "epoch": 0.79, + "learning_rate": 1.7274826411263712e-06, + "loss": 0.6948, + "step": 30839 + }, + { + "epoch": 0.79, + "learning_rate": 1.7274636554276243e-06, + "loss": 0.9629, + "step": 30840 + }, + { + "epoch": 0.79, + "learning_rate": 1.727444669171892e-06, + "loss": 0.8662, + "step": 30841 + }, + { + "epoch": 0.79, + "learning_rate": 1.7274256823591883e-06, + "loss": 0.5795, + "step": 30842 + }, + { + "epoch": 0.79, + "learning_rate": 1.7274066949895288e-06, + "loss": 0.7158, + "step": 30843 + }, + { + "epoch": 0.79, + "learning_rate": 1.727387707062927e-06, + "loss": 0.8926, + "step": 30844 + }, + { + "epoch": 0.79, + "learning_rate": 1.7273687185793978e-06, + "loss": 0.9131, + "step": 30845 + }, + { + "epoch": 0.79, + "learning_rate": 1.7273497295389563e-06, + "loss": 0.9062, + "step": 30846 + }, + { + "epoch": 0.79, + "learning_rate": 1.7273307399416162e-06, + "loss": 0.9111, + "step": 30847 + }, + { + "epoch": 0.79, + "learning_rate": 1.7273117497873926e-06, + "loss": 0.917, + "step": 30848 + }, + { + "epoch": 0.79, + "learning_rate": 1.7272927590762997e-06, + "loss": 0.8555, + "step": 30849 + }, + { + "epoch": 0.79, + "learning_rate": 1.7272737678083521e-06, + "loss": 0.6226, + "step": 30850 + }, + { + "epoch": 0.79, + "learning_rate": 1.7272547759835646e-06, + "loss": 0.8052, + "step": 30851 + }, + { + "epoch": 0.79, + "learning_rate": 1.7272357836019516e-06, + "loss": 0.8379, + "step": 30852 + }, + { + "epoch": 0.79, + "learning_rate": 1.7272167906635276e-06, + "loss": 0.8438, + "step": 30853 + }, + { + "epoch": 0.79, + "learning_rate": 1.7271977971683073e-06, + "loss": 1.0205, + "step": 30854 + }, + { + "epoch": 0.79, + "learning_rate": 1.7271788031163044e-06, + "loss": 0.9951, + "step": 30855 + }, + { + "epoch": 0.79, + "learning_rate": 1.7271598085075348e-06, + "loss": 0.6318, + "step": 30856 + }, + { + "epoch": 0.79, + "learning_rate": 1.727140813342012e-06, + "loss": 0.5947, + "step": 30857 + }, + { + "epoch": 0.79, + "learning_rate": 1.7271218176197511e-06, + "loss": 0.6785, + "step": 30858 + }, + { + "epoch": 0.79, + "learning_rate": 1.7271028213407663e-06, + "loss": 1.0205, + "step": 30859 + }, + { + "epoch": 0.79, + "learning_rate": 1.7270838245050725e-06, + "loss": 0.834, + "step": 30860 + }, + { + "epoch": 0.79, + "learning_rate": 1.727064827112684e-06, + "loss": 0.7422, + "step": 30861 + }, + { + "epoch": 0.79, + "learning_rate": 1.7270458291636153e-06, + "loss": 0.9854, + "step": 30862 + }, + { + "epoch": 0.79, + "learning_rate": 1.727026830657881e-06, + "loss": 0.7017, + "step": 30863 + }, + { + "epoch": 0.79, + "learning_rate": 1.727007831595496e-06, + "loss": 0.9648, + "step": 30864 + }, + { + "epoch": 0.79, + "learning_rate": 1.726988831976474e-06, + "loss": 0.9546, + "step": 30865 + }, + { + "epoch": 0.79, + "learning_rate": 1.7269698318008304e-06, + "loss": 0.8252, + "step": 30866 + }, + { + "epoch": 0.79, + "learning_rate": 1.7269508310685794e-06, + "loss": 0.7969, + "step": 30867 + }, + { + "epoch": 0.79, + "learning_rate": 1.7269318297797354e-06, + "loss": 0.7014, + "step": 30868 + }, + { + "epoch": 0.79, + "learning_rate": 1.7269128279343135e-06, + "loss": 0.9746, + "step": 30869 + }, + { + "epoch": 0.79, + "learning_rate": 1.7268938255323277e-06, + "loss": 0.9131, + "step": 30870 + }, + { + "epoch": 0.79, + "learning_rate": 1.7268748225737925e-06, + "loss": 0.5811, + "step": 30871 + }, + { + "epoch": 0.79, + "learning_rate": 1.726855819058723e-06, + "loss": 0.9307, + "step": 30872 + }, + { + "epoch": 0.79, + "learning_rate": 1.7268368149871333e-06, + "loss": 0.6079, + "step": 30873 + }, + { + "epoch": 0.79, + "learning_rate": 1.7268178103590382e-06, + "loss": 0.7808, + "step": 30874 + }, + { + "epoch": 0.79, + "learning_rate": 1.7267988051744519e-06, + "loss": 0.7905, + "step": 30875 + }, + { + "epoch": 0.79, + "learning_rate": 1.7267797994333893e-06, + "loss": 0.8799, + "step": 30876 + }, + { + "epoch": 0.79, + "learning_rate": 1.7267607931358648e-06, + "loss": 0.916, + "step": 30877 + }, + { + "epoch": 0.79, + "learning_rate": 1.7267417862818929e-06, + "loss": 0.8447, + "step": 30878 + }, + { + "epoch": 0.79, + "learning_rate": 1.7267227788714882e-06, + "loss": 0.6489, + "step": 30879 + }, + { + "epoch": 0.79, + "learning_rate": 1.7267037709046655e-06, + "loss": 0.8613, + "step": 30880 + }, + { + "epoch": 0.79, + "learning_rate": 1.726684762381439e-06, + "loss": 0.8574, + "step": 30881 + }, + { + "epoch": 0.79, + "learning_rate": 1.7266657533018231e-06, + "loss": 0.8115, + "step": 30882 + }, + { + "epoch": 0.79, + "learning_rate": 1.7266467436658329e-06, + "loss": 0.8203, + "step": 30883 + }, + { + "epoch": 0.79, + "learning_rate": 1.726627733473483e-06, + "loss": 0.9375, + "step": 30884 + }, + { + "epoch": 0.79, + "learning_rate": 1.7266087227247875e-06, + "loss": 0.8433, + "step": 30885 + }, + { + "epoch": 0.79, + "learning_rate": 1.726589711419761e-06, + "loss": 0.9668, + "step": 30886 + }, + { + "epoch": 0.79, + "learning_rate": 1.726570699558418e-06, + "loss": 0.8721, + "step": 30887 + }, + { + "epoch": 0.79, + "learning_rate": 1.7265516871407736e-06, + "loss": 0.7227, + "step": 30888 + }, + { + "epoch": 0.79, + "learning_rate": 1.7265326741668416e-06, + "loss": 0.8584, + "step": 30889 + }, + { + "epoch": 0.79, + "learning_rate": 1.726513660636637e-06, + "loss": 0.6096, + "step": 30890 + }, + { + "epoch": 0.79, + "learning_rate": 1.7264946465501745e-06, + "loss": 0.9502, + "step": 30891 + }, + { + "epoch": 0.79, + "learning_rate": 1.7264756319074684e-06, + "loss": 1.085, + "step": 30892 + }, + { + "epoch": 0.79, + "learning_rate": 1.7264566167085332e-06, + "loss": 0.668, + "step": 30893 + }, + { + "epoch": 0.79, + "learning_rate": 1.7264376009533838e-06, + "loss": 0.833, + "step": 30894 + }, + { + "epoch": 0.79, + "learning_rate": 1.7264185846420344e-06, + "loss": 0.9814, + "step": 30895 + }, + { + "epoch": 0.79, + "learning_rate": 1.7263995677744997e-06, + "loss": 0.7217, + "step": 30896 + }, + { + "epoch": 0.79, + "learning_rate": 1.7263805503507945e-06, + "loss": 0.6875, + "step": 30897 + }, + { + "epoch": 0.79, + "learning_rate": 1.7263615323709326e-06, + "loss": 0.7966, + "step": 30898 + }, + { + "epoch": 0.79, + "learning_rate": 1.7263425138349295e-06, + "loss": 0.7261, + "step": 30899 + }, + { + "epoch": 0.79, + "learning_rate": 1.726323494742799e-06, + "loss": 0.9727, + "step": 30900 + }, + { + "epoch": 0.79, + "learning_rate": 1.7263044750945563e-06, + "loss": 0.7759, + "step": 30901 + }, + { + "epoch": 0.79, + "learning_rate": 1.7262854548902154e-06, + "loss": 0.8057, + "step": 30902 + }, + { + "epoch": 0.79, + "learning_rate": 1.7262664341297912e-06, + "loss": 0.8311, + "step": 30903 + }, + { + "epoch": 0.79, + "learning_rate": 1.7262474128132983e-06, + "loss": 0.7666, + "step": 30904 + }, + { + "epoch": 0.79, + "learning_rate": 1.726228390940751e-06, + "loss": 0.8926, + "step": 30905 + }, + { + "epoch": 0.79, + "learning_rate": 1.7262093685121642e-06, + "loss": 0.999, + "step": 30906 + }, + { + "epoch": 0.79, + "learning_rate": 1.7261903455275521e-06, + "loss": 0.7432, + "step": 30907 + }, + { + "epoch": 0.79, + "learning_rate": 1.7261713219869295e-06, + "loss": 0.7808, + "step": 30908 + }, + { + "epoch": 0.79, + "learning_rate": 1.726152297890311e-06, + "loss": 1.0039, + "step": 30909 + }, + { + "epoch": 0.79, + "learning_rate": 1.7261332732377109e-06, + "loss": 0.8984, + "step": 30910 + }, + { + "epoch": 0.79, + "learning_rate": 1.726114248029144e-06, + "loss": 0.9717, + "step": 30911 + }, + { + "epoch": 0.79, + "learning_rate": 1.7260952222646249e-06, + "loss": 0.646, + "step": 30912 + }, + { + "epoch": 0.79, + "learning_rate": 1.726076195944168e-06, + "loss": 1.0166, + "step": 30913 + }, + { + "epoch": 0.79, + "learning_rate": 1.7260571690677879e-06, + "loss": 0.5547, + "step": 30914 + }, + { + "epoch": 0.79, + "learning_rate": 1.7260381416354992e-06, + "loss": 0.9209, + "step": 30915 + }, + { + "epoch": 0.79, + "learning_rate": 1.7260191136473168e-06, + "loss": 0.5781, + "step": 30916 + }, + { + "epoch": 0.79, + "learning_rate": 1.7260000851032547e-06, + "loss": 0.7217, + "step": 30917 + }, + { + "epoch": 0.79, + "learning_rate": 1.7259810560033277e-06, + "loss": 0.8848, + "step": 30918 + }, + { + "epoch": 0.79, + "learning_rate": 1.7259620263475503e-06, + "loss": 0.7539, + "step": 30919 + }, + { + "epoch": 0.79, + "learning_rate": 1.7259429961359371e-06, + "loss": 1.0293, + "step": 30920 + }, + { + "epoch": 0.79, + "learning_rate": 1.7259239653685032e-06, + "loss": 0.6611, + "step": 30921 + }, + { + "epoch": 0.79, + "learning_rate": 1.7259049340452622e-06, + "loss": 0.8193, + "step": 30922 + }, + { + "epoch": 0.79, + "learning_rate": 1.7258859021662293e-06, + "loss": 0.6641, + "step": 30923 + }, + { + "epoch": 0.79, + "learning_rate": 1.7258668697314192e-06, + "loss": 0.9102, + "step": 30924 + }, + { + "epoch": 0.79, + "learning_rate": 1.7258478367408459e-06, + "loss": 0.8252, + "step": 30925 + }, + { + "epoch": 0.79, + "learning_rate": 1.7258288031945243e-06, + "loss": 1.0122, + "step": 30926 + }, + { + "epoch": 0.79, + "learning_rate": 1.7258097690924691e-06, + "loss": 0.9561, + "step": 30927 + }, + { + "epoch": 0.79, + "learning_rate": 1.7257907344346947e-06, + "loss": 0.8613, + "step": 30928 + }, + { + "epoch": 0.79, + "learning_rate": 1.7257716992212154e-06, + "loss": 0.79, + "step": 30929 + }, + { + "epoch": 0.79, + "learning_rate": 1.7257526634520464e-06, + "loss": 0.7197, + "step": 30930 + }, + { + "epoch": 0.79, + "learning_rate": 1.725733627127202e-06, + "loss": 0.7122, + "step": 30931 + }, + { + "epoch": 0.79, + "learning_rate": 1.7257145902466967e-06, + "loss": 0.6953, + "step": 30932 + }, + { + "epoch": 0.79, + "learning_rate": 1.7256955528105453e-06, + "loss": 0.7808, + "step": 30933 + }, + { + "epoch": 0.79, + "learning_rate": 1.7256765148187617e-06, + "loss": 0.7471, + "step": 30934 + }, + { + "epoch": 0.79, + "learning_rate": 1.7256574762713614e-06, + "loss": 0.8066, + "step": 30935 + }, + { + "epoch": 0.79, + "learning_rate": 1.7256384371683584e-06, + "loss": 1.1328, + "step": 30936 + }, + { + "epoch": 0.79, + "learning_rate": 1.7256193975097673e-06, + "loss": 0.6895, + "step": 30937 + }, + { + "epoch": 0.79, + "learning_rate": 1.7256003572956028e-06, + "loss": 0.7656, + "step": 30938 + }, + { + "epoch": 0.79, + "learning_rate": 1.7255813165258796e-06, + "loss": 0.7168, + "step": 30939 + }, + { + "epoch": 0.79, + "learning_rate": 1.725562275200612e-06, + "loss": 0.9619, + "step": 30940 + }, + { + "epoch": 0.79, + "learning_rate": 1.725543233319815e-06, + "loss": 0.8496, + "step": 30941 + }, + { + "epoch": 0.79, + "learning_rate": 1.7255241908835027e-06, + "loss": 0.7505, + "step": 30942 + }, + { + "epoch": 0.79, + "learning_rate": 1.72550514789169e-06, + "loss": 0.7407, + "step": 30943 + }, + { + "epoch": 0.79, + "learning_rate": 1.7254861043443911e-06, + "loss": 0.9502, + "step": 30944 + }, + { + "epoch": 0.79, + "learning_rate": 1.725467060241621e-06, + "loss": 0.9121, + "step": 30945 + }, + { + "epoch": 0.79, + "learning_rate": 1.7254480155833942e-06, + "loss": 0.6084, + "step": 30946 + }, + { + "epoch": 0.79, + "learning_rate": 1.725428970369725e-06, + "loss": 0.8867, + "step": 30947 + }, + { + "epoch": 0.79, + "learning_rate": 1.7254099246006283e-06, + "loss": 0.9629, + "step": 30948 + }, + { + "epoch": 0.79, + "learning_rate": 1.7253908782761187e-06, + "loss": 0.9277, + "step": 30949 + }, + { + "epoch": 0.79, + "learning_rate": 1.7253718313962105e-06, + "loss": 0.8975, + "step": 30950 + }, + { + "epoch": 0.79, + "learning_rate": 1.7253527839609188e-06, + "loss": 1.0146, + "step": 30951 + }, + { + "epoch": 0.79, + "learning_rate": 1.7253337359702575e-06, + "loss": 0.9434, + "step": 30952 + }, + { + "epoch": 0.79, + "learning_rate": 1.7253146874242414e-06, + "loss": 0.8203, + "step": 30953 + }, + { + "epoch": 0.79, + "learning_rate": 1.7252956383228857e-06, + "loss": 0.8965, + "step": 30954 + }, + { + "epoch": 0.79, + "learning_rate": 1.7252765886662037e-06, + "loss": 0.915, + "step": 30955 + }, + { + "epoch": 0.79, + "learning_rate": 1.7252575384542114e-06, + "loss": 0.6187, + "step": 30956 + }, + { + "epoch": 0.79, + "learning_rate": 1.7252384876869225e-06, + "loss": 0.7583, + "step": 30957 + }, + { + "epoch": 0.79, + "learning_rate": 1.7252194363643523e-06, + "loss": 0.7102, + "step": 30958 + }, + { + "epoch": 0.79, + "learning_rate": 1.7252003844865143e-06, + "loss": 1.0117, + "step": 30959 + }, + { + "epoch": 0.79, + "learning_rate": 1.725181332053424e-06, + "loss": 0.8633, + "step": 30960 + }, + { + "epoch": 0.79, + "learning_rate": 1.7251622790650954e-06, + "loss": 0.5498, + "step": 30961 + }, + { + "epoch": 0.79, + "learning_rate": 1.7251432255215436e-06, + "loss": 0.9658, + "step": 30962 + }, + { + "epoch": 0.79, + "learning_rate": 1.725124171422783e-06, + "loss": 0.4546, + "step": 30963 + }, + { + "epoch": 0.79, + "learning_rate": 1.7251051167688284e-06, + "loss": 1.1436, + "step": 30964 + }, + { + "epoch": 0.79, + "learning_rate": 1.725086061559694e-06, + "loss": 0.873, + "step": 30965 + }, + { + "epoch": 0.79, + "learning_rate": 1.7250670057953943e-06, + "loss": 0.7964, + "step": 30966 + }, + { + "epoch": 0.79, + "learning_rate": 1.7250479494759442e-06, + "loss": 0.9375, + "step": 30967 + }, + { + "epoch": 0.79, + "learning_rate": 1.7250288926013582e-06, + "loss": 0.7354, + "step": 30968 + }, + { + "epoch": 0.79, + "learning_rate": 1.725009835171651e-06, + "loss": 1.002, + "step": 30969 + }, + { + "epoch": 0.79, + "learning_rate": 1.7249907771868374e-06, + "loss": 1.0029, + "step": 30970 + }, + { + "epoch": 0.79, + "learning_rate": 1.7249717186469313e-06, + "loss": 0.7441, + "step": 30971 + }, + { + "epoch": 0.79, + "learning_rate": 1.7249526595519477e-06, + "loss": 1.0234, + "step": 30972 + }, + { + "epoch": 0.79, + "learning_rate": 1.7249335999019014e-06, + "loss": 1.043, + "step": 30973 + }, + { + "epoch": 0.79, + "learning_rate": 1.7249145396968067e-06, + "loss": 0.7227, + "step": 30974 + }, + { + "epoch": 0.79, + "learning_rate": 1.7248954789366784e-06, + "loss": 0.855, + "step": 30975 + }, + { + "epoch": 0.79, + "learning_rate": 1.7248764176215306e-06, + "loss": 1.1406, + "step": 30976 + }, + { + "epoch": 0.79, + "learning_rate": 1.7248573557513786e-06, + "loss": 0.6768, + "step": 30977 + }, + { + "epoch": 0.79, + "learning_rate": 1.7248382933262365e-06, + "loss": 0.9111, + "step": 30978 + }, + { + "epoch": 0.79, + "learning_rate": 1.7248192303461191e-06, + "loss": 0.9805, + "step": 30979 + }, + { + "epoch": 0.79, + "learning_rate": 1.7248001668110408e-06, + "loss": 0.8467, + "step": 30980 + }, + { + "epoch": 0.79, + "learning_rate": 1.7247811027210163e-06, + "loss": 0.5366, + "step": 30981 + }, + { + "epoch": 0.79, + "learning_rate": 1.7247620380760605e-06, + "loss": 0.6313, + "step": 30982 + }, + { + "epoch": 0.79, + "learning_rate": 1.7247429728761876e-06, + "loss": 1.0205, + "step": 30983 + }, + { + "epoch": 0.79, + "learning_rate": 1.7247239071214124e-06, + "loss": 0.8154, + "step": 30984 + }, + { + "epoch": 0.79, + "learning_rate": 1.7247048408117495e-06, + "loss": 0.9131, + "step": 30985 + }, + { + "epoch": 0.79, + "learning_rate": 1.7246857739472132e-06, + "loss": 0.5234, + "step": 30986 + }, + { + "epoch": 0.79, + "learning_rate": 1.7246667065278183e-06, + "loss": 0.7632, + "step": 30987 + }, + { + "epoch": 0.79, + "learning_rate": 1.7246476385535798e-06, + "loss": 1.042, + "step": 30988 + }, + { + "epoch": 0.79, + "learning_rate": 1.7246285700245115e-06, + "loss": 0.8901, + "step": 30989 + }, + { + "epoch": 0.79, + "learning_rate": 1.7246095009406285e-06, + "loss": 0.9092, + "step": 30990 + }, + { + "epoch": 0.79, + "learning_rate": 1.7245904313019457e-06, + "loss": 0.8096, + "step": 30991 + }, + { + "epoch": 0.79, + "learning_rate": 1.724571361108477e-06, + "loss": 0.791, + "step": 30992 + }, + { + "epoch": 0.79, + "learning_rate": 1.724552290360237e-06, + "loss": 0.9658, + "step": 30993 + }, + { + "epoch": 0.79, + "learning_rate": 1.7245332190572413e-06, + "loss": 0.6792, + "step": 30994 + }, + { + "epoch": 0.79, + "learning_rate": 1.7245141471995033e-06, + "loss": 0.833, + "step": 30995 + }, + { + "epoch": 0.79, + "learning_rate": 1.7244950747870383e-06, + "loss": 0.8691, + "step": 30996 + }, + { + "epoch": 0.79, + "learning_rate": 1.724476001819861e-06, + "loss": 0.7969, + "step": 30997 + }, + { + "epoch": 0.79, + "learning_rate": 1.7244569282979856e-06, + "loss": 0.7949, + "step": 30998 + }, + { + "epoch": 0.79, + "learning_rate": 1.7244378542214267e-06, + "loss": 0.8877, + "step": 30999 + }, + { + "epoch": 0.79, + "learning_rate": 1.724418779590199e-06, + "loss": 0.8154, + "step": 31000 + }, + { + "epoch": 0.79, + "learning_rate": 1.7243997044043176e-06, + "loss": 0.8594, + "step": 31001 + }, + { + "epoch": 0.79, + "learning_rate": 1.724380628663796e-06, + "loss": 0.7969, + "step": 31002 + }, + { + "epoch": 0.79, + "learning_rate": 1.72436155236865e-06, + "loss": 0.9062, + "step": 31003 + }, + { + "epoch": 0.79, + "learning_rate": 1.7243424755188934e-06, + "loss": 1.0107, + "step": 31004 + }, + { + "epoch": 0.79, + "learning_rate": 1.724323398114541e-06, + "loss": 1.0371, + "step": 31005 + }, + { + "epoch": 0.79, + "learning_rate": 1.7243043201556077e-06, + "loss": 0.8467, + "step": 31006 + }, + { + "epoch": 0.79, + "learning_rate": 1.7242852416421076e-06, + "loss": 0.8774, + "step": 31007 + }, + { + "epoch": 0.79, + "learning_rate": 1.724266162574056e-06, + "loss": 0.8994, + "step": 31008 + }, + { + "epoch": 0.79, + "learning_rate": 1.724247082951467e-06, + "loss": 0.998, + "step": 31009 + }, + { + "epoch": 0.79, + "learning_rate": 1.724228002774355e-06, + "loss": 0.7471, + "step": 31010 + }, + { + "epoch": 0.79, + "learning_rate": 1.7242089220427353e-06, + "loss": 0.6445, + "step": 31011 + }, + { + "epoch": 0.79, + "learning_rate": 1.724189840756622e-06, + "loss": 0.8398, + "step": 31012 + }, + { + "epoch": 0.79, + "learning_rate": 1.7241707589160295e-06, + "loss": 0.8652, + "step": 31013 + }, + { + "epoch": 0.79, + "learning_rate": 1.724151676520973e-06, + "loss": 0.7451, + "step": 31014 + }, + { + "epoch": 0.79, + "learning_rate": 1.724132593571467e-06, + "loss": 0.7783, + "step": 31015 + }, + { + "epoch": 0.79, + "learning_rate": 1.724113510067526e-06, + "loss": 0.6699, + "step": 31016 + }, + { + "epoch": 0.79, + "learning_rate": 1.7240944260091643e-06, + "loss": 0.9883, + "step": 31017 + }, + { + "epoch": 0.8, + "learning_rate": 1.724075341396397e-06, + "loss": 0.8984, + "step": 31018 + }, + { + "epoch": 0.8, + "learning_rate": 1.7240562562292383e-06, + "loss": 0.8574, + "step": 31019 + }, + { + "epoch": 0.8, + "learning_rate": 1.724037170507703e-06, + "loss": 0.8887, + "step": 31020 + }, + { + "epoch": 0.8, + "learning_rate": 1.724018084231806e-06, + "loss": 0.6758, + "step": 31021 + }, + { + "epoch": 0.8, + "learning_rate": 1.7239989974015616e-06, + "loss": 0.8203, + "step": 31022 + }, + { + "epoch": 0.8, + "learning_rate": 1.7239799100169844e-06, + "loss": 0.9404, + "step": 31023 + }, + { + "epoch": 0.8, + "learning_rate": 1.723960822078089e-06, + "loss": 0.7275, + "step": 31024 + }, + { + "epoch": 0.8, + "learning_rate": 1.72394173358489e-06, + "loss": 0.8818, + "step": 31025 + }, + { + "epoch": 0.8, + "learning_rate": 1.7239226445374025e-06, + "loss": 0.7051, + "step": 31026 + }, + { + "epoch": 0.8, + "learning_rate": 1.7239035549356405e-06, + "loss": 0.8447, + "step": 31027 + }, + { + "epoch": 0.8, + "learning_rate": 1.7238844647796188e-06, + "loss": 1.0176, + "step": 31028 + }, + { + "epoch": 0.8, + "learning_rate": 1.7238653740693518e-06, + "loss": 0.9102, + "step": 31029 + }, + { + "epoch": 0.8, + "learning_rate": 1.7238462828048548e-06, + "loss": 0.9736, + "step": 31030 + }, + { + "epoch": 0.8, + "learning_rate": 1.7238271909861419e-06, + "loss": 0.8301, + "step": 31031 + }, + { + "epoch": 0.8, + "learning_rate": 1.7238080986132278e-06, + "loss": 0.595, + "step": 31032 + }, + { + "epoch": 0.8, + "learning_rate": 1.723789005686127e-06, + "loss": 0.6909, + "step": 31033 + }, + { + "epoch": 0.8, + "learning_rate": 1.723769912204854e-06, + "loss": 0.8662, + "step": 31034 + }, + { + "epoch": 0.8, + "learning_rate": 1.723750818169424e-06, + "loss": 0.9883, + "step": 31035 + }, + { + "epoch": 0.8, + "learning_rate": 1.7237317235798513e-06, + "loss": 1.0752, + "step": 31036 + }, + { + "epoch": 0.8, + "learning_rate": 1.7237126284361506e-06, + "loss": 0.6611, + "step": 31037 + }, + { + "epoch": 0.8, + "learning_rate": 1.723693532738336e-06, + "loss": 0.7383, + "step": 31038 + }, + { + "epoch": 0.8, + "learning_rate": 1.7236744364864226e-06, + "loss": 1.0088, + "step": 31039 + }, + { + "epoch": 0.8, + "learning_rate": 1.723655339680425e-06, + "loss": 0.8574, + "step": 31040 + }, + { + "epoch": 0.8, + "learning_rate": 1.723636242320358e-06, + "loss": 0.7446, + "step": 31041 + }, + { + "epoch": 0.8, + "learning_rate": 1.723617144406236e-06, + "loss": 0.7732, + "step": 31042 + }, + { + "epoch": 0.8, + "learning_rate": 1.7235980459380736e-06, + "loss": 0.9268, + "step": 31043 + }, + { + "epoch": 0.8, + "learning_rate": 1.7235789469158853e-06, + "loss": 1.0498, + "step": 31044 + }, + { + "epoch": 0.8, + "learning_rate": 1.7235598473396857e-06, + "loss": 0.9502, + "step": 31045 + }, + { + "epoch": 0.8, + "learning_rate": 1.72354074720949e-06, + "loss": 0.7266, + "step": 31046 + }, + { + "epoch": 0.8, + "learning_rate": 1.723521646525312e-06, + "loss": 0.7529, + "step": 31047 + }, + { + "epoch": 0.8, + "learning_rate": 1.7235025452871672e-06, + "loss": 0.5576, + "step": 31048 + }, + { + "epoch": 0.8, + "learning_rate": 1.7234834434950699e-06, + "loss": 0.834, + "step": 31049 + }, + { + "epoch": 0.8, + "learning_rate": 1.7234643411490342e-06, + "loss": 0.9219, + "step": 31050 + }, + { + "epoch": 0.8, + "learning_rate": 1.723445238249075e-06, + "loss": 0.9297, + "step": 31051 + }, + { + "epoch": 0.8, + "learning_rate": 1.7234261347952073e-06, + "loss": 0.9189, + "step": 31052 + }, + { + "epoch": 0.8, + "learning_rate": 1.7234070307874452e-06, + "loss": 0.7417, + "step": 31053 + }, + { + "epoch": 0.8, + "learning_rate": 1.723387926225804e-06, + "loss": 1.0361, + "step": 31054 + }, + { + "epoch": 0.8, + "learning_rate": 1.7233688211102976e-06, + "loss": 0.9922, + "step": 31055 + }, + { + "epoch": 0.8, + "learning_rate": 1.7233497154409413e-06, + "loss": 0.7852, + "step": 31056 + }, + { + "epoch": 0.8, + "learning_rate": 1.723330609217749e-06, + "loss": 0.5734, + "step": 31057 + }, + { + "epoch": 0.8, + "learning_rate": 1.723311502440736e-06, + "loss": 0.8608, + "step": 31058 + }, + { + "epoch": 0.8, + "learning_rate": 1.7232923951099166e-06, + "loss": 0.9209, + "step": 31059 + }, + { + "epoch": 0.8, + "learning_rate": 1.7232732872253051e-06, + "loss": 0.749, + "step": 31060 + }, + { + "epoch": 0.8, + "learning_rate": 1.723254178786917e-06, + "loss": 0.7578, + "step": 31061 + }, + { + "epoch": 0.8, + "learning_rate": 1.7232350697947663e-06, + "loss": 0.8037, + "step": 31062 + }, + { + "epoch": 0.8, + "learning_rate": 1.7232159602488675e-06, + "loss": 0.8643, + "step": 31063 + }, + { + "epoch": 0.8, + "learning_rate": 1.7231968501492356e-06, + "loss": 0.8574, + "step": 31064 + }, + { + "epoch": 0.8, + "learning_rate": 1.7231777394958852e-06, + "loss": 0.8877, + "step": 31065 + }, + { + "epoch": 0.8, + "learning_rate": 1.7231586282888307e-06, + "loss": 0.9082, + "step": 31066 + }, + { + "epoch": 0.8, + "learning_rate": 1.7231395165280874e-06, + "loss": 0.8633, + "step": 31067 + }, + { + "epoch": 0.8, + "learning_rate": 1.723120404213669e-06, + "loss": 0.6313, + "step": 31068 + }, + { + "epoch": 0.8, + "learning_rate": 1.7231012913455905e-06, + "loss": 0.7075, + "step": 31069 + }, + { + "epoch": 0.8, + "learning_rate": 1.723082177923867e-06, + "loss": 0.9971, + "step": 31070 + }, + { + "epoch": 0.8, + "learning_rate": 1.7230630639485124e-06, + "loss": 0.7485, + "step": 31071 + }, + { + "epoch": 0.8, + "learning_rate": 1.7230439494195417e-06, + "loss": 0.8975, + "step": 31072 + }, + { + "epoch": 0.8, + "learning_rate": 1.7230248343369693e-06, + "loss": 0.9707, + "step": 31073 + }, + { + "epoch": 0.8, + "learning_rate": 1.7230057187008103e-06, + "loss": 0.9619, + "step": 31074 + }, + { + "epoch": 0.8, + "learning_rate": 1.7229866025110789e-06, + "loss": 0.8413, + "step": 31075 + }, + { + "epoch": 0.8, + "learning_rate": 1.72296748576779e-06, + "loss": 0.7266, + "step": 31076 + }, + { + "epoch": 0.8, + "learning_rate": 1.7229483684709583e-06, + "loss": 0.5337, + "step": 31077 + }, + { + "epoch": 0.8, + "learning_rate": 1.722929250620598e-06, + "loss": 0.7969, + "step": 31078 + }, + { + "epoch": 0.8, + "learning_rate": 1.7229101322167244e-06, + "loss": 0.9092, + "step": 31079 + }, + { + "epoch": 0.8, + "learning_rate": 1.7228910132593513e-06, + "loss": 0.7441, + "step": 31080 + }, + { + "epoch": 0.8, + "learning_rate": 1.7228718937484939e-06, + "loss": 0.8936, + "step": 31081 + }, + { + "epoch": 0.8, + "learning_rate": 1.7228527736841669e-06, + "loss": 0.6597, + "step": 31082 + }, + { + "epoch": 0.8, + "learning_rate": 1.7228336530663846e-06, + "loss": 0.5833, + "step": 31083 + }, + { + "epoch": 0.8, + "learning_rate": 1.7228145318951617e-06, + "loss": 0.7783, + "step": 31084 + }, + { + "epoch": 0.8, + "learning_rate": 1.7227954101705132e-06, + "loss": 0.7192, + "step": 31085 + }, + { + "epoch": 0.8, + "learning_rate": 1.7227762878924535e-06, + "loss": 0.7881, + "step": 31086 + }, + { + "epoch": 0.8, + "learning_rate": 1.7227571650609972e-06, + "loss": 0.9092, + "step": 31087 + }, + { + "epoch": 0.8, + "learning_rate": 1.722738041676159e-06, + "loss": 0.8828, + "step": 31088 + }, + { + "epoch": 0.8, + "learning_rate": 1.722718917737953e-06, + "loss": 0.9404, + "step": 31089 + }, + { + "epoch": 0.8, + "learning_rate": 1.7226997932463951e-06, + "loss": 1.0361, + "step": 31090 + }, + { + "epoch": 0.8, + "learning_rate": 1.722680668201499e-06, + "loss": 0.5918, + "step": 31091 + }, + { + "epoch": 0.8, + "learning_rate": 1.7226615426032792e-06, + "loss": 0.4253, + "step": 31092 + }, + { + "epoch": 0.8, + "learning_rate": 1.722642416451751e-06, + "loss": 0.9307, + "step": 31093 + }, + { + "epoch": 0.8, + "learning_rate": 1.7226232897469286e-06, + "loss": 0.9893, + "step": 31094 + }, + { + "epoch": 0.8, + "learning_rate": 1.7226041624888268e-06, + "loss": 0.6304, + "step": 31095 + }, + { + "epoch": 0.8, + "learning_rate": 1.7225850346774605e-06, + "loss": 0.873, + "step": 31096 + }, + { + "epoch": 0.8, + "learning_rate": 1.7225659063128438e-06, + "loss": 1.0137, + "step": 31097 + }, + { + "epoch": 0.8, + "learning_rate": 1.7225467773949914e-06, + "loss": 0.8594, + "step": 31098 + }, + { + "epoch": 0.8, + "learning_rate": 1.7225276479239184e-06, + "loss": 0.8682, + "step": 31099 + }, + { + "epoch": 0.8, + "learning_rate": 1.722508517899639e-06, + "loss": 0.875, + "step": 31100 + }, + { + "epoch": 0.8, + "learning_rate": 1.7224893873221685e-06, + "loss": 0.793, + "step": 31101 + }, + { + "epoch": 0.8, + "learning_rate": 1.7224702561915208e-06, + "loss": 0.8086, + "step": 31102 + }, + { + "epoch": 0.8, + "learning_rate": 1.7224511245077107e-06, + "loss": 0.9395, + "step": 31103 + }, + { + "epoch": 0.8, + "learning_rate": 1.7224319922707533e-06, + "loss": 1.0508, + "step": 31104 + }, + { + "epoch": 0.8, + "learning_rate": 1.7224128594806626e-06, + "loss": 0.9375, + "step": 31105 + }, + { + "epoch": 0.8, + "learning_rate": 1.7223937261374539e-06, + "loss": 1.0645, + "step": 31106 + }, + { + "epoch": 0.8, + "learning_rate": 1.7223745922411411e-06, + "loss": 1.0029, + "step": 31107 + }, + { + "epoch": 0.8, + "learning_rate": 1.7223554577917398e-06, + "loss": 0.7744, + "step": 31108 + }, + { + "epoch": 0.8, + "learning_rate": 1.722336322789264e-06, + "loss": 0.7842, + "step": 31109 + }, + { + "epoch": 0.8, + "learning_rate": 1.7223171872337286e-06, + "loss": 0.7246, + "step": 31110 + }, + { + "epoch": 0.8, + "learning_rate": 1.7222980511251479e-06, + "loss": 0.8623, + "step": 31111 + }, + { + "epoch": 0.8, + "learning_rate": 1.7222789144635368e-06, + "loss": 0.8936, + "step": 31112 + }, + { + "epoch": 0.8, + "learning_rate": 1.7222597772489103e-06, + "loss": 0.8115, + "step": 31113 + }, + { + "epoch": 0.8, + "learning_rate": 1.7222406394812824e-06, + "loss": 0.8828, + "step": 31114 + }, + { + "epoch": 0.8, + "learning_rate": 1.7222215011606677e-06, + "loss": 0.7324, + "step": 31115 + }, + { + "epoch": 0.8, + "learning_rate": 1.7222023622870818e-06, + "loss": 1.0391, + "step": 31116 + }, + { + "epoch": 0.8, + "learning_rate": 1.7221832228605386e-06, + "loss": 0.7754, + "step": 31117 + }, + { + "epoch": 0.8, + "learning_rate": 1.722164082881053e-06, + "loss": 0.8711, + "step": 31118 + }, + { + "epoch": 0.8, + "learning_rate": 1.7221449423486392e-06, + "loss": 0.7515, + "step": 31119 + }, + { + "epoch": 0.8, + "learning_rate": 1.7221258012633126e-06, + "loss": 0.6846, + "step": 31120 + }, + { + "epoch": 0.8, + "learning_rate": 1.7221066596250873e-06, + "loss": 0.9746, + "step": 31121 + }, + { + "epoch": 0.8, + "learning_rate": 1.7220875174339779e-06, + "loss": 0.7969, + "step": 31122 + }, + { + "epoch": 0.8, + "learning_rate": 1.7220683746899999e-06, + "loss": 0.7227, + "step": 31123 + }, + { + "epoch": 0.8, + "learning_rate": 1.722049231393167e-06, + "loss": 0.9102, + "step": 31124 + }, + { + "epoch": 0.8, + "learning_rate": 1.7220300875434938e-06, + "loss": 1.0117, + "step": 31125 + }, + { + "epoch": 0.8, + "learning_rate": 1.722010943140996e-06, + "loss": 0.9062, + "step": 31126 + }, + { + "epoch": 0.8, + "learning_rate": 1.7219917981856873e-06, + "loss": 1.0361, + "step": 31127 + }, + { + "epoch": 0.8, + "learning_rate": 1.7219726526775828e-06, + "loss": 0.8508, + "step": 31128 + }, + { + "epoch": 0.8, + "learning_rate": 1.721953506616697e-06, + "loss": 0.8701, + "step": 31129 + }, + { + "epoch": 0.8, + "learning_rate": 1.7219343600030448e-06, + "loss": 0.9492, + "step": 31130 + }, + { + "epoch": 0.8, + "learning_rate": 1.7219152128366404e-06, + "loss": 0.8301, + "step": 31131 + }, + { + "epoch": 0.8, + "learning_rate": 1.7218960651174985e-06, + "loss": 0.9209, + "step": 31132 + }, + { + "epoch": 0.8, + "learning_rate": 1.7218769168456344e-06, + "loss": 0.9873, + "step": 31133 + }, + { + "epoch": 0.8, + "learning_rate": 1.7218577680210622e-06, + "loss": 0.9414, + "step": 31134 + }, + { + "epoch": 0.8, + "learning_rate": 1.7218386186437968e-06, + "loss": 0.9053, + "step": 31135 + }, + { + "epoch": 0.8, + "learning_rate": 1.7218194687138526e-06, + "loss": 0.7891, + "step": 31136 + }, + { + "epoch": 0.8, + "learning_rate": 1.7218003182312443e-06, + "loss": 1.0039, + "step": 31137 + }, + { + "epoch": 0.8, + "learning_rate": 1.721781167195987e-06, + "loss": 0.8545, + "step": 31138 + }, + { + "epoch": 0.8, + "learning_rate": 1.7217620156080948e-06, + "loss": 0.79, + "step": 31139 + }, + { + "epoch": 0.8, + "learning_rate": 1.7217428634675829e-06, + "loss": 0.7031, + "step": 31140 + }, + { + "epoch": 0.8, + "learning_rate": 1.7217237107744653e-06, + "loss": 0.7932, + "step": 31141 + }, + { + "epoch": 0.8, + "learning_rate": 1.7217045575287572e-06, + "loss": 0.6641, + "step": 31142 + }, + { + "epoch": 0.8, + "learning_rate": 1.7216854037304732e-06, + "loss": 0.7141, + "step": 31143 + }, + { + "epoch": 0.8, + "learning_rate": 1.721666249379628e-06, + "loss": 0.9189, + "step": 31144 + }, + { + "epoch": 0.8, + "learning_rate": 1.7216470944762357e-06, + "loss": 0.7861, + "step": 31145 + }, + { + "epoch": 0.8, + "learning_rate": 1.7216279390203118e-06, + "loss": 0.782, + "step": 31146 + }, + { + "epoch": 0.8, + "learning_rate": 1.7216087830118703e-06, + "loss": 0.8867, + "step": 31147 + }, + { + "epoch": 0.8, + "learning_rate": 1.7215896264509263e-06, + "loss": 0.875, + "step": 31148 + }, + { + "epoch": 0.8, + "learning_rate": 1.7215704693374944e-06, + "loss": 0.9834, + "step": 31149 + }, + { + "epoch": 0.8, + "learning_rate": 1.7215513116715888e-06, + "loss": 0.9785, + "step": 31150 + }, + { + "epoch": 0.8, + "learning_rate": 1.7215321534532247e-06, + "loss": 0.8503, + "step": 31151 + }, + { + "epoch": 0.8, + "learning_rate": 1.7215129946824168e-06, + "loss": 0.9756, + "step": 31152 + }, + { + "epoch": 0.8, + "learning_rate": 1.7214938353591792e-06, + "loss": 0.8828, + "step": 31153 + }, + { + "epoch": 0.8, + "learning_rate": 1.7214746754835274e-06, + "loss": 0.5942, + "step": 31154 + }, + { + "epoch": 0.8, + "learning_rate": 1.7214555150554752e-06, + "loss": 0.7822, + "step": 31155 + }, + { + "epoch": 0.8, + "learning_rate": 1.7214363540750381e-06, + "loss": 0.96, + "step": 31156 + }, + { + "epoch": 0.8, + "learning_rate": 1.72141719254223e-06, + "loss": 0.7568, + "step": 31157 + }, + { + "epoch": 0.8, + "learning_rate": 1.7213980304570664e-06, + "loss": 0.8789, + "step": 31158 + }, + { + "epoch": 0.8, + "learning_rate": 1.7213788678195612e-06, + "loss": 1.1016, + "step": 31159 + }, + { + "epoch": 0.8, + "learning_rate": 1.7213597046297293e-06, + "loss": 0.6943, + "step": 31160 + }, + { + "epoch": 0.8, + "learning_rate": 1.7213405408875853e-06, + "loss": 1.0293, + "step": 31161 + }, + { + "epoch": 0.8, + "learning_rate": 1.7213213765931443e-06, + "loss": 0.8545, + "step": 31162 + }, + { + "epoch": 0.8, + "learning_rate": 1.7213022117464205e-06, + "loss": 0.7324, + "step": 31163 + }, + { + "epoch": 0.8, + "learning_rate": 1.7212830463474288e-06, + "loss": 0.6758, + "step": 31164 + }, + { + "epoch": 0.8, + "learning_rate": 1.7212638803961838e-06, + "loss": 0.7542, + "step": 31165 + }, + { + "epoch": 0.8, + "learning_rate": 1.7212447138927003e-06, + "loss": 0.8457, + "step": 31166 + }, + { + "epoch": 0.8, + "learning_rate": 1.721225546836993e-06, + "loss": 0.6719, + "step": 31167 + }, + { + "epoch": 0.8, + "learning_rate": 1.7212063792290766e-06, + "loss": 0.9775, + "step": 31168 + }, + { + "epoch": 0.8, + "learning_rate": 1.7211872110689652e-06, + "loss": 0.9307, + "step": 31169 + }, + { + "epoch": 0.8, + "learning_rate": 1.7211680423566742e-06, + "loss": 0.7358, + "step": 31170 + }, + { + "epoch": 0.8, + "learning_rate": 1.7211488730922176e-06, + "loss": 1.0098, + "step": 31171 + }, + { + "epoch": 0.8, + "learning_rate": 1.721129703275611e-06, + "loss": 0.8804, + "step": 31172 + }, + { + "epoch": 0.8, + "learning_rate": 1.7211105329068682e-06, + "loss": 0.8076, + "step": 31173 + }, + { + "epoch": 0.8, + "learning_rate": 1.7210913619860042e-06, + "loss": 0.8008, + "step": 31174 + }, + { + "epoch": 0.8, + "learning_rate": 1.721072190513034e-06, + "loss": 0.8936, + "step": 31175 + }, + { + "epoch": 0.8, + "learning_rate": 1.7210530184879716e-06, + "loss": 0.7944, + "step": 31176 + }, + { + "epoch": 0.8, + "learning_rate": 1.7210338459108323e-06, + "loss": 0.5916, + "step": 31177 + }, + { + "epoch": 0.8, + "learning_rate": 1.7210146727816306e-06, + "loss": 0.8838, + "step": 31178 + }, + { + "epoch": 0.8, + "learning_rate": 1.720995499100381e-06, + "loss": 0.7119, + "step": 31179 + }, + { + "epoch": 0.8, + "learning_rate": 1.7209763248670983e-06, + "loss": 0.9199, + "step": 31180 + }, + { + "epoch": 0.8, + "learning_rate": 1.7209571500817972e-06, + "loss": 0.8545, + "step": 31181 + }, + { + "epoch": 0.8, + "learning_rate": 1.7209379747444922e-06, + "loss": 0.6396, + "step": 31182 + }, + { + "epoch": 0.8, + "learning_rate": 1.7209187988551985e-06, + "loss": 0.7695, + "step": 31183 + }, + { + "epoch": 0.8, + "learning_rate": 1.7208996224139302e-06, + "loss": 0.8018, + "step": 31184 + }, + { + "epoch": 0.8, + "learning_rate": 1.7208804454207022e-06, + "loss": 0.7725, + "step": 31185 + }, + { + "epoch": 0.8, + "learning_rate": 1.7208612678755292e-06, + "loss": 0.8145, + "step": 31186 + }, + { + "epoch": 0.8, + "learning_rate": 1.720842089778426e-06, + "loss": 0.9014, + "step": 31187 + }, + { + "epoch": 0.8, + "learning_rate": 1.720822911129407e-06, + "loss": 0.7939, + "step": 31188 + }, + { + "epoch": 0.8, + "learning_rate": 1.7208037319284872e-06, + "loss": 0.9883, + "step": 31189 + }, + { + "epoch": 0.8, + "learning_rate": 1.720784552175681e-06, + "loss": 0.8882, + "step": 31190 + }, + { + "epoch": 0.8, + "learning_rate": 1.720765371871003e-06, + "loss": 0.8223, + "step": 31191 + }, + { + "epoch": 0.8, + "learning_rate": 1.7207461910144684e-06, + "loss": 1.0029, + "step": 31192 + }, + { + "epoch": 0.8, + "learning_rate": 1.7207270096060916e-06, + "loss": 0.9209, + "step": 31193 + }, + { + "epoch": 0.8, + "learning_rate": 1.7207078276458872e-06, + "loss": 0.6989, + "step": 31194 + }, + { + "epoch": 0.8, + "learning_rate": 1.7206886451338698e-06, + "loss": 1.2227, + "step": 31195 + }, + { + "epoch": 0.8, + "learning_rate": 1.7206694620700544e-06, + "loss": 1.0215, + "step": 31196 + }, + { + "epoch": 0.8, + "learning_rate": 1.7206502784544554e-06, + "loss": 1.0566, + "step": 31197 + }, + { + "epoch": 0.8, + "learning_rate": 1.7206310942870879e-06, + "loss": 0.9023, + "step": 31198 + }, + { + "epoch": 0.8, + "learning_rate": 1.720611909567966e-06, + "loss": 0.5334, + "step": 31199 + }, + { + "epoch": 0.8, + "learning_rate": 1.7205927242971048e-06, + "loss": 0.9375, + "step": 31200 + }, + { + "epoch": 0.8, + "learning_rate": 1.7205735384745191e-06, + "loss": 0.5137, + "step": 31201 + }, + { + "epoch": 0.8, + "learning_rate": 1.720554352100223e-06, + "loss": 0.8799, + "step": 31202 + }, + { + "epoch": 0.8, + "learning_rate": 1.720535165174232e-06, + "loss": 0.8828, + "step": 31203 + }, + { + "epoch": 0.8, + "learning_rate": 1.7205159776965598e-06, + "loss": 0.7695, + "step": 31204 + }, + { + "epoch": 0.8, + "learning_rate": 1.720496789667222e-06, + "loss": 1.0098, + "step": 31205 + }, + { + "epoch": 0.8, + "learning_rate": 1.7204776010862329e-06, + "loss": 0.7773, + "step": 31206 + }, + { + "epoch": 0.8, + "learning_rate": 1.7204584119536074e-06, + "loss": 0.668, + "step": 31207 + }, + { + "epoch": 0.8, + "learning_rate": 1.7204392222693597e-06, + "loss": 0.7417, + "step": 31208 + }, + { + "epoch": 0.8, + "learning_rate": 1.720420032033505e-06, + "loss": 0.6729, + "step": 31209 + }, + { + "epoch": 0.8, + "learning_rate": 1.7204008412460578e-06, + "loss": 0.8438, + "step": 31210 + }, + { + "epoch": 0.8, + "learning_rate": 1.7203816499070326e-06, + "loss": 1.0723, + "step": 31211 + }, + { + "epoch": 0.8, + "learning_rate": 1.7203624580164444e-06, + "loss": 0.916, + "step": 31212 + }, + { + "epoch": 0.8, + "learning_rate": 1.720343265574308e-06, + "loss": 0.8916, + "step": 31213 + }, + { + "epoch": 0.8, + "learning_rate": 1.7203240725806376e-06, + "loss": 0.9678, + "step": 31214 + }, + { + "epoch": 0.8, + "learning_rate": 1.7203048790354484e-06, + "loss": 0.9229, + "step": 31215 + }, + { + "epoch": 0.8, + "learning_rate": 1.7202856849387548e-06, + "loss": 1.1953, + "step": 31216 + }, + { + "epoch": 0.8, + "learning_rate": 1.7202664902905718e-06, + "loss": 0.6743, + "step": 31217 + }, + { + "epoch": 0.8, + "learning_rate": 1.7202472950909135e-06, + "loss": 0.9336, + "step": 31218 + }, + { + "epoch": 0.8, + "learning_rate": 1.7202280993397951e-06, + "loss": 0.8076, + "step": 31219 + }, + { + "epoch": 0.8, + "learning_rate": 1.7202089030372312e-06, + "loss": 0.9023, + "step": 31220 + }, + { + "epoch": 0.8, + "learning_rate": 1.7201897061832363e-06, + "loss": 0.7285, + "step": 31221 + }, + { + "epoch": 0.8, + "learning_rate": 1.720170508777825e-06, + "loss": 0.6909, + "step": 31222 + }, + { + "epoch": 0.8, + "learning_rate": 1.7201513108210128e-06, + "loss": 0.7114, + "step": 31223 + }, + { + "epoch": 0.8, + "learning_rate": 1.7201321123128136e-06, + "loss": 1.0547, + "step": 31224 + }, + { + "epoch": 0.8, + "learning_rate": 1.7201129132532425e-06, + "loss": 0.606, + "step": 31225 + }, + { + "epoch": 0.8, + "learning_rate": 1.7200937136423142e-06, + "loss": 0.6963, + "step": 31226 + }, + { + "epoch": 0.8, + "learning_rate": 1.7200745134800428e-06, + "loss": 0.8701, + "step": 31227 + }, + { + "epoch": 0.8, + "learning_rate": 1.7200553127664438e-06, + "loss": 1.0273, + "step": 31228 + }, + { + "epoch": 0.8, + "learning_rate": 1.7200361115015315e-06, + "loss": 0.5615, + "step": 31229 + }, + { + "epoch": 0.8, + "learning_rate": 1.7200169096853205e-06, + "loss": 0.9971, + "step": 31230 + }, + { + "epoch": 0.8, + "learning_rate": 1.7199977073178257e-06, + "loss": 0.8672, + "step": 31231 + }, + { + "epoch": 0.8, + "learning_rate": 1.719978504399062e-06, + "loss": 0.4878, + "step": 31232 + }, + { + "epoch": 0.8, + "learning_rate": 1.7199593009290435e-06, + "loss": 0.8447, + "step": 31233 + }, + { + "epoch": 0.8, + "learning_rate": 1.7199400969077856e-06, + "loss": 0.8252, + "step": 31234 + }, + { + "epoch": 0.8, + "learning_rate": 1.7199208923353027e-06, + "loss": 0.917, + "step": 31235 + }, + { + "epoch": 0.8, + "learning_rate": 1.719901687211609e-06, + "loss": 0.8828, + "step": 31236 + }, + { + "epoch": 0.8, + "learning_rate": 1.71988248153672e-06, + "loss": 0.9287, + "step": 31237 + }, + { + "epoch": 0.8, + "learning_rate": 1.71986327531065e-06, + "loss": 0.6245, + "step": 31238 + }, + { + "epoch": 0.8, + "learning_rate": 1.7198440685334141e-06, + "loss": 0.6816, + "step": 31239 + }, + { + "epoch": 0.8, + "learning_rate": 1.7198248612050263e-06, + "loss": 0.7451, + "step": 31240 + }, + { + "epoch": 0.8, + "learning_rate": 1.719805653325502e-06, + "loss": 0.917, + "step": 31241 + }, + { + "epoch": 0.8, + "learning_rate": 1.7197864448948556e-06, + "loss": 0.6787, + "step": 31242 + }, + { + "epoch": 0.8, + "learning_rate": 1.7197672359131014e-06, + "loss": 0.7373, + "step": 31243 + }, + { + "epoch": 0.8, + "learning_rate": 1.7197480263802549e-06, + "loss": 0.8223, + "step": 31244 + }, + { + "epoch": 0.8, + "learning_rate": 1.7197288162963304e-06, + "loss": 0.8359, + "step": 31245 + }, + { + "epoch": 0.8, + "learning_rate": 1.7197096056613424e-06, + "loss": 0.9844, + "step": 31246 + }, + { + "epoch": 0.8, + "learning_rate": 1.719690394475306e-06, + "loss": 0.6466, + "step": 31247 + }, + { + "epoch": 0.8, + "learning_rate": 1.719671182738236e-06, + "loss": 1.0454, + "step": 31248 + }, + { + "epoch": 0.8, + "learning_rate": 1.7196519704501466e-06, + "loss": 0.6433, + "step": 31249 + }, + { + "epoch": 0.8, + "learning_rate": 1.7196327576110527e-06, + "loss": 0.8574, + "step": 31250 + }, + { + "epoch": 0.8, + "learning_rate": 1.7196135442209693e-06, + "loss": 0.7881, + "step": 31251 + }, + { + "epoch": 0.8, + "learning_rate": 1.7195943302799107e-06, + "loss": 0.9221, + "step": 31252 + }, + { + "epoch": 0.8, + "learning_rate": 1.719575115787892e-06, + "loss": 0.6362, + "step": 31253 + }, + { + "epoch": 0.8, + "learning_rate": 1.7195559007449277e-06, + "loss": 0.7678, + "step": 31254 + }, + { + "epoch": 0.8, + "learning_rate": 1.7195366851510325e-06, + "loss": 0.7871, + "step": 31255 + }, + { + "epoch": 0.8, + "learning_rate": 1.719517469006221e-06, + "loss": 0.9639, + "step": 31256 + }, + { + "epoch": 0.8, + "learning_rate": 1.7194982523105081e-06, + "loss": 0.8887, + "step": 31257 + }, + { + "epoch": 0.8, + "learning_rate": 1.7194790350639087e-06, + "loss": 0.9355, + "step": 31258 + }, + { + "epoch": 0.8, + "learning_rate": 1.7194598172664372e-06, + "loss": 1.0605, + "step": 31259 + }, + { + "epoch": 0.8, + "learning_rate": 1.7194405989181082e-06, + "loss": 1.0381, + "step": 31260 + }, + { + "epoch": 0.8, + "learning_rate": 1.7194213800189367e-06, + "loss": 0.9043, + "step": 31261 + }, + { + "epoch": 0.8, + "learning_rate": 1.7194021605689374e-06, + "loss": 0.998, + "step": 31262 + }, + { + "epoch": 0.8, + "learning_rate": 1.719382940568125e-06, + "loss": 0.5486, + "step": 31263 + }, + { + "epoch": 0.8, + "learning_rate": 1.7193637200165139e-06, + "loss": 0.9482, + "step": 31264 + }, + { + "epoch": 0.8, + "learning_rate": 1.7193444989141193e-06, + "loss": 0.791, + "step": 31265 + }, + { + "epoch": 0.8, + "learning_rate": 1.719325277260956e-06, + "loss": 0.7197, + "step": 31266 + }, + { + "epoch": 0.8, + "learning_rate": 1.719306055057038e-06, + "loss": 0.9258, + "step": 31267 + }, + { + "epoch": 0.8, + "learning_rate": 1.71928683230238e-06, + "loss": 0.9844, + "step": 31268 + }, + { + "epoch": 0.8, + "learning_rate": 1.719267608996998e-06, + "loss": 0.6836, + "step": 31269 + }, + { + "epoch": 0.8, + "learning_rate": 1.7192483851409055e-06, + "loss": 1.0176, + "step": 31270 + }, + { + "epoch": 0.8, + "learning_rate": 1.7192291607341174e-06, + "loss": 0.7939, + "step": 31271 + }, + { + "epoch": 0.8, + "learning_rate": 1.7192099357766489e-06, + "loss": 0.7307, + "step": 31272 + }, + { + "epoch": 0.8, + "learning_rate": 1.7191907102685143e-06, + "loss": 1.0488, + "step": 31273 + }, + { + "epoch": 0.8, + "learning_rate": 1.7191714842097284e-06, + "loss": 0.6807, + "step": 31274 + }, + { + "epoch": 0.8, + "learning_rate": 1.7191522576003061e-06, + "loss": 1.0723, + "step": 31275 + }, + { + "epoch": 0.8, + "learning_rate": 1.719133030440262e-06, + "loss": 0.9395, + "step": 31276 + }, + { + "epoch": 0.8, + "learning_rate": 1.7191138027296105e-06, + "loss": 0.8384, + "step": 31277 + }, + { + "epoch": 0.8, + "learning_rate": 1.7190945744683669e-06, + "loss": 1.0303, + "step": 31278 + }, + { + "epoch": 0.8, + "learning_rate": 1.7190753456565456e-06, + "loss": 0.835, + "step": 31279 + }, + { + "epoch": 0.8, + "learning_rate": 1.7190561162941614e-06, + "loss": 1.0078, + "step": 31280 + }, + { + "epoch": 0.8, + "learning_rate": 1.7190368863812287e-06, + "loss": 0.7979, + "step": 31281 + }, + { + "epoch": 0.8, + "learning_rate": 1.719017655917763e-06, + "loss": 0.8311, + "step": 31282 + }, + { + "epoch": 0.8, + "learning_rate": 1.7189984249037784e-06, + "loss": 0.9443, + "step": 31283 + }, + { + "epoch": 0.8, + "learning_rate": 1.7189791933392894e-06, + "loss": 0.8438, + "step": 31284 + }, + { + "epoch": 0.8, + "learning_rate": 1.7189599612243116e-06, + "loss": 0.4159, + "step": 31285 + }, + { + "epoch": 0.8, + "learning_rate": 1.718940728558859e-06, + "loss": 0.7905, + "step": 31286 + }, + { + "epoch": 0.8, + "learning_rate": 1.7189214953429466e-06, + "loss": 0.7554, + "step": 31287 + }, + { + "epoch": 0.8, + "learning_rate": 1.7189022615765887e-06, + "loss": 1.0059, + "step": 31288 + }, + { + "epoch": 0.8, + "learning_rate": 1.7188830272598008e-06, + "loss": 0.8462, + "step": 31289 + }, + { + "epoch": 0.8, + "learning_rate": 1.7188637923925971e-06, + "loss": 0.9072, + "step": 31290 + }, + { + "epoch": 0.8, + "learning_rate": 1.7188445569749925e-06, + "loss": 0.8223, + "step": 31291 + }, + { + "epoch": 0.8, + "learning_rate": 1.7188253210070016e-06, + "loss": 0.833, + "step": 31292 + }, + { + "epoch": 0.8, + "learning_rate": 1.7188060844886391e-06, + "loss": 0.7861, + "step": 31293 + }, + { + "epoch": 0.8, + "learning_rate": 1.7187868474199202e-06, + "loss": 0.9268, + "step": 31294 + }, + { + "epoch": 0.8, + "learning_rate": 1.7187676098008587e-06, + "loss": 0.8213, + "step": 31295 + }, + { + "epoch": 0.8, + "learning_rate": 1.7187483716314704e-06, + "loss": 0.8643, + "step": 31296 + }, + { + "epoch": 0.8, + "learning_rate": 1.7187291329117693e-06, + "loss": 0.8525, + "step": 31297 + }, + { + "epoch": 0.8, + "learning_rate": 1.7187098936417703e-06, + "loss": 0.9199, + "step": 31298 + }, + { + "epoch": 0.8, + "learning_rate": 1.7186906538214886e-06, + "loss": 1.0967, + "step": 31299 + }, + { + "epoch": 0.8, + "learning_rate": 1.718671413450938e-06, + "loss": 0.7021, + "step": 31300 + }, + { + "epoch": 0.8, + "learning_rate": 1.7186521725301339e-06, + "loss": 0.8369, + "step": 31301 + }, + { + "epoch": 0.8, + "learning_rate": 1.718632931059091e-06, + "loss": 0.8867, + "step": 31302 + }, + { + "epoch": 0.8, + "learning_rate": 1.7186136890378238e-06, + "loss": 0.7271, + "step": 31303 + }, + { + "epoch": 0.8, + "learning_rate": 1.718594446466347e-06, + "loss": 0.791, + "step": 31304 + }, + { + "epoch": 0.8, + "learning_rate": 1.7185752033446756e-06, + "loss": 0.8979, + "step": 31305 + }, + { + "epoch": 0.8, + "learning_rate": 1.7185559596728243e-06, + "loss": 0.8838, + "step": 31306 + }, + { + "epoch": 0.8, + "learning_rate": 1.7185367154508077e-06, + "loss": 0.6624, + "step": 31307 + }, + { + "epoch": 0.8, + "learning_rate": 1.7185174706786405e-06, + "loss": 0.6304, + "step": 31308 + }, + { + "epoch": 0.8, + "learning_rate": 1.7184982253563376e-06, + "loss": 1.1016, + "step": 31309 + }, + { + "epoch": 0.8, + "learning_rate": 1.7184789794839135e-06, + "loss": 0.9434, + "step": 31310 + }, + { + "epoch": 0.8, + "learning_rate": 1.7184597330613833e-06, + "loss": 0.8486, + "step": 31311 + }, + { + "epoch": 0.8, + "learning_rate": 1.7184404860887613e-06, + "loss": 0.9023, + "step": 31312 + }, + { + "epoch": 0.8, + "learning_rate": 1.7184212385660625e-06, + "loss": 0.5947, + "step": 31313 + }, + { + "epoch": 0.8, + "learning_rate": 1.7184019904933018e-06, + "loss": 0.9795, + "step": 31314 + }, + { + "epoch": 0.8, + "learning_rate": 1.7183827418704938e-06, + "loss": 1.0469, + "step": 31315 + }, + { + "epoch": 0.8, + "learning_rate": 1.7183634926976528e-06, + "loss": 0.9414, + "step": 31316 + }, + { + "epoch": 0.8, + "learning_rate": 1.718344242974794e-06, + "loss": 1.0869, + "step": 31317 + }, + { + "epoch": 0.8, + "learning_rate": 1.7183249927019321e-06, + "loss": 0.6885, + "step": 31318 + }, + { + "epoch": 0.8, + "learning_rate": 1.7183057418790818e-06, + "loss": 0.9902, + "step": 31319 + }, + { + "epoch": 0.8, + "learning_rate": 1.7182864905062577e-06, + "loss": 0.6494, + "step": 31320 + }, + { + "epoch": 0.8, + "learning_rate": 1.718267238583475e-06, + "loss": 0.832, + "step": 31321 + }, + { + "epoch": 0.8, + "learning_rate": 1.718247986110748e-06, + "loss": 0.8799, + "step": 31322 + }, + { + "epoch": 0.8, + "learning_rate": 1.7182287330880913e-06, + "loss": 0.7402, + "step": 31323 + }, + { + "epoch": 0.8, + "learning_rate": 1.71820947951552e-06, + "loss": 0.5845, + "step": 31324 + }, + { + "epoch": 0.8, + "learning_rate": 1.7181902253930486e-06, + "loss": 0.9385, + "step": 31325 + }, + { + "epoch": 0.8, + "learning_rate": 1.7181709707206921e-06, + "loss": 0.9287, + "step": 31326 + }, + { + "epoch": 0.8, + "learning_rate": 1.7181517154984651e-06, + "loss": 0.9131, + "step": 31327 + }, + { + "epoch": 0.8, + "learning_rate": 1.7181324597263824e-06, + "loss": 0.8965, + "step": 31328 + }, + { + "epoch": 0.8, + "learning_rate": 1.7181132034044587e-06, + "loss": 1.0986, + "step": 31329 + }, + { + "epoch": 0.8, + "learning_rate": 1.7180939465327087e-06, + "loss": 1.0684, + "step": 31330 + }, + { + "epoch": 0.8, + "learning_rate": 1.7180746891111471e-06, + "loss": 0.9248, + "step": 31331 + }, + { + "epoch": 0.8, + "learning_rate": 1.7180554311397887e-06, + "loss": 0.8271, + "step": 31332 + }, + { + "epoch": 0.8, + "learning_rate": 1.7180361726186483e-06, + "loss": 1.0674, + "step": 31333 + }, + { + "epoch": 0.8, + "learning_rate": 1.718016913547741e-06, + "loss": 0.7949, + "step": 31334 + }, + { + "epoch": 0.8, + "learning_rate": 1.717997653927081e-06, + "loss": 0.9697, + "step": 31335 + }, + { + "epoch": 0.8, + "learning_rate": 1.7179783937566827e-06, + "loss": 0.8926, + "step": 31336 + }, + { + "epoch": 0.8, + "learning_rate": 1.7179591330365617e-06, + "loss": 0.7891, + "step": 31337 + }, + { + "epoch": 0.8, + "learning_rate": 1.7179398717667323e-06, + "loss": 0.5605, + "step": 31338 + }, + { + "epoch": 0.8, + "learning_rate": 1.7179206099472096e-06, + "loss": 0.7568, + "step": 31339 + }, + { + "epoch": 0.8, + "learning_rate": 1.7179013475780079e-06, + "loss": 0.6387, + "step": 31340 + }, + { + "epoch": 0.8, + "learning_rate": 1.7178820846591423e-06, + "loss": 0.8613, + "step": 31341 + }, + { + "epoch": 0.8, + "learning_rate": 1.7178628211906275e-06, + "loss": 0.8379, + "step": 31342 + }, + { + "epoch": 0.8, + "learning_rate": 1.7178435571724782e-06, + "loss": 0.8652, + "step": 31343 + }, + { + "epoch": 0.8, + "learning_rate": 1.7178242926047086e-06, + "loss": 0.9834, + "step": 31344 + }, + { + "epoch": 0.8, + "learning_rate": 1.7178050274873343e-06, + "loss": 0.7803, + "step": 31345 + }, + { + "epoch": 0.8, + "learning_rate": 1.7177857618203694e-06, + "loss": 0.8984, + "step": 31346 + }, + { + "epoch": 0.8, + "learning_rate": 1.7177664956038295e-06, + "loss": 0.9199, + "step": 31347 + }, + { + "epoch": 0.8, + "learning_rate": 1.7177472288377284e-06, + "loss": 0.6509, + "step": 31348 + }, + { + "epoch": 0.8, + "learning_rate": 1.7177279615220812e-06, + "loss": 1.0049, + "step": 31349 + }, + { + "epoch": 0.8, + "learning_rate": 1.7177086936569028e-06, + "loss": 0.6841, + "step": 31350 + }, + { + "epoch": 0.8, + "learning_rate": 1.7176894252422078e-06, + "loss": 0.6843, + "step": 31351 + }, + { + "epoch": 0.8, + "learning_rate": 1.717670156278011e-06, + "loss": 0.6846, + "step": 31352 + }, + { + "epoch": 0.8, + "learning_rate": 1.7176508867643274e-06, + "loss": 0.9463, + "step": 31353 + }, + { + "epoch": 0.8, + "learning_rate": 1.7176316167011713e-06, + "loss": 0.7861, + "step": 31354 + }, + { + "epoch": 0.8, + "learning_rate": 1.7176123460885577e-06, + "loss": 1.0273, + "step": 31355 + }, + { + "epoch": 0.8, + "learning_rate": 1.7175930749265013e-06, + "loss": 0.875, + "step": 31356 + }, + { + "epoch": 0.8, + "learning_rate": 1.7175738032150168e-06, + "loss": 0.9062, + "step": 31357 + }, + { + "epoch": 0.8, + "learning_rate": 1.7175545309541192e-06, + "loss": 0.9521, + "step": 31358 + }, + { + "epoch": 0.8, + "learning_rate": 1.7175352581438229e-06, + "loss": 1.0322, + "step": 31359 + }, + { + "epoch": 0.8, + "learning_rate": 1.7175159847841431e-06, + "loss": 0.5898, + "step": 31360 + }, + { + "epoch": 0.8, + "learning_rate": 1.7174967108750943e-06, + "loss": 0.6841, + "step": 31361 + }, + { + "epoch": 0.8, + "learning_rate": 1.7174774364166913e-06, + "loss": 0.8152, + "step": 31362 + }, + { + "epoch": 0.8, + "learning_rate": 1.7174581614089486e-06, + "loss": 0.8486, + "step": 31363 + }, + { + "epoch": 0.8, + "learning_rate": 1.7174388858518811e-06, + "loss": 0.9727, + "step": 31364 + }, + { + "epoch": 0.8, + "learning_rate": 1.717419609745504e-06, + "loss": 0.6404, + "step": 31365 + }, + { + "epoch": 0.8, + "learning_rate": 1.7174003330898311e-06, + "loss": 0.9863, + "step": 31366 + }, + { + "epoch": 0.8, + "learning_rate": 1.7173810558848784e-06, + "loss": 0.8115, + "step": 31367 + }, + { + "epoch": 0.8, + "learning_rate": 1.7173617781306598e-06, + "loss": 0.5669, + "step": 31368 + }, + { + "epoch": 0.8, + "learning_rate": 1.71734249982719e-06, + "loss": 0.9082, + "step": 31369 + }, + { + "epoch": 0.8, + "learning_rate": 1.7173232209744843e-06, + "loss": 0.7622, + "step": 31370 + }, + { + "epoch": 0.8, + "learning_rate": 1.717303941572557e-06, + "loss": 0.896, + "step": 31371 + }, + { + "epoch": 0.8, + "learning_rate": 1.7172846616214232e-06, + "loss": 0.8916, + "step": 31372 + }, + { + "epoch": 0.8, + "learning_rate": 1.7172653811210975e-06, + "loss": 1.0059, + "step": 31373 + }, + { + "epoch": 0.8, + "learning_rate": 1.7172461000715948e-06, + "loss": 0.8335, + "step": 31374 + }, + { + "epoch": 0.8, + "learning_rate": 1.7172268184729295e-06, + "loss": 0.8818, + "step": 31375 + }, + { + "epoch": 0.8, + "learning_rate": 1.717207536325117e-06, + "loss": 0.8125, + "step": 31376 + }, + { + "epoch": 0.8, + "learning_rate": 1.7171882536281712e-06, + "loss": 0.8652, + "step": 31377 + }, + { + "epoch": 0.8, + "learning_rate": 1.7171689703821075e-06, + "loss": 0.8574, + "step": 31378 + }, + { + "epoch": 0.8, + "learning_rate": 1.7171496865869405e-06, + "loss": 0.6934, + "step": 31379 + }, + { + "epoch": 0.8, + "learning_rate": 1.7171304022426849e-06, + "loss": 0.9141, + "step": 31380 + }, + { + "epoch": 0.8, + "learning_rate": 1.7171111173493556e-06, + "loss": 0.5537, + "step": 31381 + }, + { + "epoch": 0.8, + "learning_rate": 1.7170918319069675e-06, + "loss": 1.0625, + "step": 31382 + }, + { + "epoch": 0.8, + "learning_rate": 1.717072545915535e-06, + "loss": 0.9648, + "step": 31383 + }, + { + "epoch": 0.8, + "learning_rate": 1.7170532593750728e-06, + "loss": 0.6079, + "step": 31384 + }, + { + "epoch": 0.8, + "learning_rate": 1.7170339722855962e-06, + "loss": 0.9717, + "step": 31385 + }, + { + "epoch": 0.8, + "learning_rate": 1.7170146846471193e-06, + "loss": 0.793, + "step": 31386 + }, + { + "epoch": 0.8, + "learning_rate": 1.7169953964596575e-06, + "loss": 1.0088, + "step": 31387 + }, + { + "epoch": 0.8, + "learning_rate": 1.7169761077232252e-06, + "loss": 0.7544, + "step": 31388 + }, + { + "epoch": 0.8, + "learning_rate": 1.7169568184378376e-06, + "loss": 1.0225, + "step": 31389 + }, + { + "epoch": 0.8, + "learning_rate": 1.7169375286035086e-06, + "loss": 0.9512, + "step": 31390 + }, + { + "epoch": 0.8, + "learning_rate": 1.7169182382202539e-06, + "loss": 1.1172, + "step": 31391 + }, + { + "epoch": 0.8, + "learning_rate": 1.7168989472880875e-06, + "loss": 0.7344, + "step": 31392 + }, + { + "epoch": 0.8, + "learning_rate": 1.7168796558070246e-06, + "loss": 0.686, + "step": 31393 + }, + { + "epoch": 0.8, + "learning_rate": 1.7168603637770802e-06, + "loss": 1.0449, + "step": 31394 + }, + { + "epoch": 0.8, + "learning_rate": 1.7168410711982686e-06, + "loss": 0.6147, + "step": 31395 + }, + { + "epoch": 0.8, + "learning_rate": 1.7168217780706047e-06, + "loss": 0.8525, + "step": 31396 + }, + { + "epoch": 0.8, + "learning_rate": 1.7168024843941036e-06, + "loss": 0.644, + "step": 31397 + }, + { + "epoch": 0.8, + "learning_rate": 1.7167831901687794e-06, + "loss": 0.792, + "step": 31398 + }, + { + "epoch": 0.8, + "learning_rate": 1.7167638953946477e-06, + "loss": 0.8818, + "step": 31399 + }, + { + "epoch": 0.8, + "learning_rate": 1.7167446000717225e-06, + "loss": 0.8506, + "step": 31400 + }, + { + "epoch": 0.8, + "learning_rate": 1.7167253042000191e-06, + "loss": 0.7822, + "step": 31401 + }, + { + "epoch": 0.8, + "learning_rate": 1.716706007779552e-06, + "loss": 0.7534, + "step": 31402 + }, + { + "epoch": 0.8, + "learning_rate": 1.716686710810336e-06, + "loss": 0.9375, + "step": 31403 + }, + { + "epoch": 0.8, + "learning_rate": 1.716667413292386e-06, + "loss": 0.6499, + "step": 31404 + }, + { + "epoch": 0.8, + "learning_rate": 1.716648115225717e-06, + "loss": 0.939, + "step": 31405 + }, + { + "epoch": 0.8, + "learning_rate": 1.716628816610343e-06, + "loss": 1.0137, + "step": 31406 + }, + { + "epoch": 0.8, + "learning_rate": 1.7166095174462795e-06, + "loss": 0.625, + "step": 31407 + }, + { + "epoch": 0.81, + "learning_rate": 1.7165902177335411e-06, + "loss": 0.7832, + "step": 31408 + }, + { + "epoch": 0.81, + "learning_rate": 1.7165709174721426e-06, + "loss": 0.5706, + "step": 31409 + }, + { + "epoch": 0.81, + "learning_rate": 1.7165516166620986e-06, + "loss": 0.7651, + "step": 31410 + }, + { + "epoch": 0.81, + "learning_rate": 1.716532315303424e-06, + "loss": 0.7783, + "step": 31411 + }, + { + "epoch": 0.81, + "learning_rate": 1.7165130133961335e-06, + "loss": 0.7578, + "step": 31412 + }, + { + "epoch": 0.81, + "learning_rate": 1.7164937109402418e-06, + "loss": 0.8438, + "step": 31413 + }, + { + "epoch": 0.81, + "learning_rate": 1.7164744079357641e-06, + "loss": 0.8545, + "step": 31414 + }, + { + "epoch": 0.81, + "learning_rate": 1.7164551043827147e-06, + "loss": 0.876, + "step": 31415 + }, + { + "epoch": 0.81, + "learning_rate": 1.7164358002811085e-06, + "loss": 0.7622, + "step": 31416 + }, + { + "epoch": 0.81, + "learning_rate": 1.7164164956309604e-06, + "loss": 0.9072, + "step": 31417 + }, + { + "epoch": 0.81, + "learning_rate": 1.7163971904322851e-06, + "loss": 0.8838, + "step": 31418 + }, + { + "epoch": 0.81, + "learning_rate": 1.7163778846850976e-06, + "loss": 0.9639, + "step": 31419 + }, + { + "epoch": 0.81, + "learning_rate": 1.7163585783894123e-06, + "loss": 0.8054, + "step": 31420 + }, + { + "epoch": 0.81, + "learning_rate": 1.7163392715452442e-06, + "loss": 0.769, + "step": 31421 + }, + { + "epoch": 0.81, + "learning_rate": 1.7163199641526082e-06, + "loss": 0.9873, + "step": 31422 + }, + { + "epoch": 0.81, + "learning_rate": 1.7163006562115188e-06, + "loss": 0.9043, + "step": 31423 + }, + { + "epoch": 0.81, + "learning_rate": 1.7162813477219912e-06, + "loss": 0.8301, + "step": 31424 + }, + { + "epoch": 0.81, + "learning_rate": 1.7162620386840394e-06, + "loss": 0.9434, + "step": 31425 + }, + { + "epoch": 0.81, + "learning_rate": 1.716242729097679e-06, + "loss": 0.8174, + "step": 31426 + }, + { + "epoch": 0.81, + "learning_rate": 1.7162234189629246e-06, + "loss": 0.9355, + "step": 31427 + }, + { + "epoch": 0.81, + "learning_rate": 1.7162041082797907e-06, + "loss": 1.0742, + "step": 31428 + }, + { + "epoch": 0.81, + "learning_rate": 1.7161847970482923e-06, + "loss": 0.8662, + "step": 31429 + }, + { + "epoch": 0.81, + "learning_rate": 1.7161654852684443e-06, + "loss": 0.6682, + "step": 31430 + }, + { + "epoch": 0.81, + "learning_rate": 1.716146172940261e-06, + "loss": 0.6797, + "step": 31431 + }, + { + "epoch": 0.81, + "learning_rate": 1.7161268600637574e-06, + "loss": 1.1807, + "step": 31432 + }, + { + "epoch": 0.81, + "learning_rate": 1.7161075466389487e-06, + "loss": 0.8252, + "step": 31433 + }, + { + "epoch": 0.81, + "learning_rate": 1.7160882326658493e-06, + "loss": 0.8311, + "step": 31434 + }, + { + "epoch": 0.81, + "learning_rate": 1.716068918144474e-06, + "loss": 1.0381, + "step": 31435 + }, + { + "epoch": 0.81, + "learning_rate": 1.7160496030748377e-06, + "loss": 0.8467, + "step": 31436 + }, + { + "epoch": 0.81, + "learning_rate": 1.7160302874569552e-06, + "loss": 0.7129, + "step": 31437 + }, + { + "epoch": 0.81, + "learning_rate": 1.7160109712908413e-06, + "loss": 0.8691, + "step": 31438 + }, + { + "epoch": 0.81, + "learning_rate": 1.7159916545765105e-06, + "loss": 0.9678, + "step": 31439 + }, + { + "epoch": 0.81, + "learning_rate": 1.7159723373139778e-06, + "loss": 0.9707, + "step": 31440 + }, + { + "epoch": 0.81, + "learning_rate": 1.7159530195032584e-06, + "loss": 0.873, + "step": 31441 + }, + { + "epoch": 0.81, + "learning_rate": 1.7159337011443663e-06, + "loss": 0.7612, + "step": 31442 + }, + { + "epoch": 0.81, + "learning_rate": 1.7159143822373169e-06, + "loss": 0.8369, + "step": 31443 + }, + { + "epoch": 0.81, + "learning_rate": 1.7158950627821244e-06, + "loss": 0.5562, + "step": 31444 + }, + { + "epoch": 0.81, + "learning_rate": 1.7158757427788045e-06, + "loss": 0.8149, + "step": 31445 + }, + { + "epoch": 0.81, + "learning_rate": 1.715856422227371e-06, + "loss": 0.707, + "step": 31446 + }, + { + "epoch": 0.81, + "learning_rate": 1.7158371011278395e-06, + "loss": 0.915, + "step": 31447 + }, + { + "epoch": 0.81, + "learning_rate": 1.7158177794802242e-06, + "loss": 0.752, + "step": 31448 + }, + { + "epoch": 0.81, + "learning_rate": 1.7157984572845403e-06, + "loss": 1.043, + "step": 31449 + }, + { + "epoch": 0.81, + "learning_rate": 1.7157791345408024e-06, + "loss": 0.7559, + "step": 31450 + }, + { + "epoch": 0.81, + "learning_rate": 1.7157598112490253e-06, + "loss": 0.8271, + "step": 31451 + }, + { + "epoch": 0.81, + "learning_rate": 1.7157404874092238e-06, + "loss": 0.9463, + "step": 31452 + }, + { + "epoch": 0.81, + "learning_rate": 1.7157211630214127e-06, + "loss": 0.7998, + "step": 31453 + }, + { + "epoch": 0.81, + "learning_rate": 1.715701838085607e-06, + "loss": 0.918, + "step": 31454 + }, + { + "epoch": 0.81, + "learning_rate": 1.715682512601821e-06, + "loss": 0.7314, + "step": 31455 + }, + { + "epoch": 0.81, + "learning_rate": 1.7156631865700701e-06, + "loss": 0.8164, + "step": 31456 + }, + { + "epoch": 0.81, + "learning_rate": 1.7156438599903686e-06, + "loss": 0.9609, + "step": 31457 + }, + { + "epoch": 0.81, + "learning_rate": 1.7156245328627316e-06, + "loss": 0.8311, + "step": 31458 + }, + { + "epoch": 0.81, + "learning_rate": 1.7156052051871738e-06, + "loss": 1.0059, + "step": 31459 + }, + { + "epoch": 0.81, + "learning_rate": 1.7155858769637102e-06, + "loss": 0.8428, + "step": 31460 + }, + { + "epoch": 0.81, + "learning_rate": 1.7155665481923552e-06, + "loss": 1.0049, + "step": 31461 + }, + { + "epoch": 0.81, + "learning_rate": 1.7155472188731238e-06, + "loss": 0.8916, + "step": 31462 + }, + { + "epoch": 0.81, + "learning_rate": 1.7155278890060306e-06, + "loss": 0.8086, + "step": 31463 + }, + { + "epoch": 0.81, + "learning_rate": 1.715508558591091e-06, + "loss": 1.0088, + "step": 31464 + }, + { + "epoch": 0.81, + "learning_rate": 1.715489227628319e-06, + "loss": 0.8467, + "step": 31465 + }, + { + "epoch": 0.81, + "learning_rate": 1.71546989611773e-06, + "loss": 0.77, + "step": 31466 + }, + { + "epoch": 0.81, + "learning_rate": 1.7154505640593386e-06, + "loss": 0.7305, + "step": 31467 + }, + { + "epoch": 0.81, + "learning_rate": 1.7154312314531597e-06, + "loss": 0.9707, + "step": 31468 + }, + { + "epoch": 0.81, + "learning_rate": 1.715411898299208e-06, + "loss": 0.9453, + "step": 31469 + }, + { + "epoch": 0.81, + "learning_rate": 1.715392564597498e-06, + "loss": 0.6025, + "step": 31470 + }, + { + "epoch": 0.81, + "learning_rate": 1.715373230348045e-06, + "loss": 0.8965, + "step": 31471 + }, + { + "epoch": 0.81, + "learning_rate": 1.7153538955508635e-06, + "loss": 0.8428, + "step": 31472 + }, + { + "epoch": 0.81, + "learning_rate": 1.7153345602059685e-06, + "loss": 0.6797, + "step": 31473 + }, + { + "epoch": 0.81, + "learning_rate": 1.7153152243133747e-06, + "loss": 0.8174, + "step": 31474 + }, + { + "epoch": 0.81, + "learning_rate": 1.715295887873097e-06, + "loss": 1.0596, + "step": 31475 + }, + { + "epoch": 0.81, + "learning_rate": 1.71527655088515e-06, + "loss": 1.0186, + "step": 31476 + }, + { + "epoch": 0.81, + "learning_rate": 1.715257213349549e-06, + "loss": 0.874, + "step": 31477 + }, + { + "epoch": 0.81, + "learning_rate": 1.715237875266308e-06, + "loss": 0.5916, + "step": 31478 + }, + { + "epoch": 0.81, + "learning_rate": 1.7152185366354424e-06, + "loss": 0.957, + "step": 31479 + }, + { + "epoch": 0.81, + "learning_rate": 1.715199197456967e-06, + "loss": 0.8955, + "step": 31480 + }, + { + "epoch": 0.81, + "learning_rate": 1.7151798577308963e-06, + "loss": 0.958, + "step": 31481 + }, + { + "epoch": 0.81, + "learning_rate": 1.7151605174572455e-06, + "loss": 0.9121, + "step": 31482 + }, + { + "epoch": 0.81, + "learning_rate": 1.715141176636029e-06, + "loss": 0.7686, + "step": 31483 + }, + { + "epoch": 0.81, + "learning_rate": 1.7151218352672613e-06, + "loss": 0.8145, + "step": 31484 + }, + { + "epoch": 0.81, + "learning_rate": 1.715102493350958e-06, + "loss": 0.8984, + "step": 31485 + }, + { + "epoch": 0.81, + "learning_rate": 1.715083150887134e-06, + "loss": 0.7236, + "step": 31486 + }, + { + "epoch": 0.81, + "learning_rate": 1.7150638078758035e-06, + "loss": 0.6587, + "step": 31487 + }, + { + "epoch": 0.81, + "learning_rate": 1.7150444643169816e-06, + "loss": 0.8298, + "step": 31488 + }, + { + "epoch": 0.81, + "learning_rate": 1.7150251202106829e-06, + "loss": 1.0342, + "step": 31489 + }, + { + "epoch": 0.81, + "learning_rate": 1.7150057755569222e-06, + "loss": 0.8936, + "step": 31490 + }, + { + "epoch": 0.81, + "learning_rate": 1.7149864303557147e-06, + "loss": 0.8921, + "step": 31491 + }, + { + "epoch": 0.81, + "learning_rate": 1.7149670846070748e-06, + "loss": 0.8418, + "step": 31492 + }, + { + "epoch": 0.81, + "learning_rate": 1.7149477383110176e-06, + "loss": 0.8203, + "step": 31493 + }, + { + "epoch": 0.81, + "learning_rate": 1.7149283914675578e-06, + "loss": 0.688, + "step": 31494 + }, + { + "epoch": 0.81, + "learning_rate": 1.7149090440767101e-06, + "loss": 1.0928, + "step": 31495 + }, + { + "epoch": 0.81, + "learning_rate": 1.7148896961384892e-06, + "loss": 0.9258, + "step": 31496 + }, + { + "epoch": 0.81, + "learning_rate": 1.7148703476529108e-06, + "loss": 0.8613, + "step": 31497 + }, + { + "epoch": 0.81, + "learning_rate": 1.7148509986199885e-06, + "loss": 0.7852, + "step": 31498 + }, + { + "epoch": 0.81, + "learning_rate": 1.714831649039738e-06, + "loss": 0.9863, + "step": 31499 + }, + { + "epoch": 0.81, + "learning_rate": 1.7148122989121734e-06, + "loss": 1.0596, + "step": 31500 + }, + { + "epoch": 0.81, + "learning_rate": 1.71479294823731e-06, + "loss": 0.7012, + "step": 31501 + }, + { + "epoch": 0.81, + "learning_rate": 1.7147735970151627e-06, + "loss": 0.5493, + "step": 31502 + }, + { + "epoch": 0.81, + "learning_rate": 1.7147542452457459e-06, + "loss": 0.6846, + "step": 31503 + }, + { + "epoch": 0.81, + "learning_rate": 1.7147348929290747e-06, + "loss": 0.8936, + "step": 31504 + }, + { + "epoch": 0.81, + "learning_rate": 1.714715540065164e-06, + "loss": 0.9014, + "step": 31505 + }, + { + "epoch": 0.81, + "learning_rate": 1.7146961866540284e-06, + "loss": 0.7236, + "step": 31506 + }, + { + "epoch": 0.81, + "learning_rate": 1.7146768326956827e-06, + "loss": 0.7188, + "step": 31507 + }, + { + "epoch": 0.81, + "learning_rate": 1.714657478190142e-06, + "loss": 0.8379, + "step": 31508 + }, + { + "epoch": 0.81, + "learning_rate": 1.7146381231374205e-06, + "loss": 0.7852, + "step": 31509 + }, + { + "epoch": 0.81, + "learning_rate": 1.714618767537534e-06, + "loss": 0.8682, + "step": 31510 + }, + { + "epoch": 0.81, + "learning_rate": 1.7145994113904965e-06, + "loss": 0.708, + "step": 31511 + }, + { + "epoch": 0.81, + "learning_rate": 1.7145800546963233e-06, + "loss": 0.7598, + "step": 31512 + }, + { + "epoch": 0.81, + "learning_rate": 1.7145606974550283e-06, + "loss": 0.9678, + "step": 31513 + }, + { + "epoch": 0.81, + "learning_rate": 1.7145413396666278e-06, + "loss": 1.0557, + "step": 31514 + }, + { + "epoch": 0.81, + "learning_rate": 1.7145219813311355e-06, + "loss": 1.0029, + "step": 31515 + }, + { + "epoch": 0.81, + "learning_rate": 1.7145026224485669e-06, + "loss": 0.8096, + "step": 31516 + }, + { + "epoch": 0.81, + "learning_rate": 1.7144832630189363e-06, + "loss": 0.6533, + "step": 31517 + }, + { + "epoch": 0.81, + "learning_rate": 1.7144639030422586e-06, + "loss": 0.8975, + "step": 31518 + }, + { + "epoch": 0.81, + "learning_rate": 1.7144445425185488e-06, + "loss": 0.7808, + "step": 31519 + }, + { + "epoch": 0.81, + "learning_rate": 1.7144251814478217e-06, + "loss": 0.8252, + "step": 31520 + }, + { + "epoch": 0.81, + "learning_rate": 1.714405819830092e-06, + "loss": 0.8594, + "step": 31521 + }, + { + "epoch": 0.81, + "learning_rate": 1.7143864576653748e-06, + "loss": 0.75, + "step": 31522 + }, + { + "epoch": 0.81, + "learning_rate": 1.7143670949536847e-06, + "loss": 0.7554, + "step": 31523 + }, + { + "epoch": 0.81, + "learning_rate": 1.7143477316950366e-06, + "loss": 0.7363, + "step": 31524 + }, + { + "epoch": 0.81, + "learning_rate": 1.714328367889445e-06, + "loss": 1.0303, + "step": 31525 + }, + { + "epoch": 0.81, + "learning_rate": 1.7143090035369253e-06, + "loss": 0.8701, + "step": 31526 + }, + { + "epoch": 0.81, + "learning_rate": 1.714289638637492e-06, + "loss": 0.957, + "step": 31527 + }, + { + "epoch": 0.81, + "learning_rate": 1.7142702731911598e-06, + "loss": 1.167, + "step": 31528 + }, + { + "epoch": 0.81, + "learning_rate": 1.7142509071979437e-06, + "loss": 0.8418, + "step": 31529 + }, + { + "epoch": 0.81, + "learning_rate": 1.7142315406578586e-06, + "loss": 0.8667, + "step": 31530 + }, + { + "epoch": 0.81, + "learning_rate": 1.714212173570919e-06, + "loss": 0.8818, + "step": 31531 + }, + { + "epoch": 0.81, + "learning_rate": 1.7141928059371406e-06, + "loss": 0.7852, + "step": 31532 + }, + { + "epoch": 0.81, + "learning_rate": 1.7141734377565374e-06, + "loss": 0.5671, + "step": 31533 + }, + { + "epoch": 0.81, + "learning_rate": 1.7141540690291244e-06, + "loss": 0.6848, + "step": 31534 + }, + { + "epoch": 0.81, + "learning_rate": 1.7141346997549162e-06, + "loss": 0.7695, + "step": 31535 + }, + { + "epoch": 0.81, + "learning_rate": 1.7141153299339282e-06, + "loss": 0.5859, + "step": 31536 + }, + { + "epoch": 0.81, + "learning_rate": 1.7140959595661745e-06, + "loss": 1.0, + "step": 31537 + }, + { + "epoch": 0.81, + "learning_rate": 1.7140765886516707e-06, + "loss": 0.9492, + "step": 31538 + }, + { + "epoch": 0.81, + "learning_rate": 1.7140572171904314e-06, + "loss": 0.7988, + "step": 31539 + }, + { + "epoch": 0.81, + "learning_rate": 1.7140378451824708e-06, + "loss": 0.8359, + "step": 31540 + }, + { + "epoch": 0.81, + "learning_rate": 1.7140184726278048e-06, + "loss": 1.0283, + "step": 31541 + }, + { + "epoch": 0.81, + "learning_rate": 1.7139990995264475e-06, + "loss": 0.7466, + "step": 31542 + }, + { + "epoch": 0.81, + "learning_rate": 1.7139797258784139e-06, + "loss": 0.791, + "step": 31543 + }, + { + "epoch": 0.81, + "learning_rate": 1.7139603516837192e-06, + "loss": 0.791, + "step": 31544 + }, + { + "epoch": 0.81, + "learning_rate": 1.713940976942377e-06, + "loss": 0.7896, + "step": 31545 + }, + { + "epoch": 0.81, + "learning_rate": 1.713921601654404e-06, + "loss": 0.8594, + "step": 31546 + }, + { + "epoch": 0.81, + "learning_rate": 1.7139022258198135e-06, + "loss": 0.625, + "step": 31547 + }, + { + "epoch": 0.81, + "learning_rate": 1.7138828494386211e-06, + "loss": 0.9971, + "step": 31548 + }, + { + "epoch": 0.81, + "learning_rate": 1.7138634725108414e-06, + "loss": 0.8975, + "step": 31549 + }, + { + "epoch": 0.81, + "learning_rate": 1.713844095036489e-06, + "loss": 0.96, + "step": 31550 + }, + { + "epoch": 0.81, + "learning_rate": 1.7138247170155795e-06, + "loss": 1.043, + "step": 31551 + }, + { + "epoch": 0.81, + "learning_rate": 1.713805338448127e-06, + "loss": 0.7788, + "step": 31552 + }, + { + "epoch": 0.81, + "learning_rate": 1.7137859593341465e-06, + "loss": 0.7385, + "step": 31553 + }, + { + "epoch": 0.81, + "learning_rate": 1.7137665796736527e-06, + "loss": 0.8936, + "step": 31554 + }, + { + "epoch": 0.81, + "learning_rate": 1.713747199466661e-06, + "loss": 0.7202, + "step": 31555 + }, + { + "epoch": 0.81, + "learning_rate": 1.7137278187131858e-06, + "loss": 0.7266, + "step": 31556 + }, + { + "epoch": 0.81, + "learning_rate": 1.713708437413242e-06, + "loss": 0.9395, + "step": 31557 + }, + { + "epoch": 0.81, + "learning_rate": 1.7136890555668444e-06, + "loss": 0.748, + "step": 31558 + }, + { + "epoch": 0.81, + "learning_rate": 1.713669673174008e-06, + "loss": 0.9648, + "step": 31559 + }, + { + "epoch": 0.81, + "learning_rate": 1.7136502902347477e-06, + "loss": 1.0635, + "step": 31560 + }, + { + "epoch": 0.81, + "learning_rate": 1.713630906749078e-06, + "loss": 0.7246, + "step": 31561 + }, + { + "epoch": 0.81, + "learning_rate": 1.7136115227170139e-06, + "loss": 0.9805, + "step": 31562 + }, + { + "epoch": 0.81, + "learning_rate": 1.7135921381385702e-06, + "loss": 0.9756, + "step": 31563 + }, + { + "epoch": 0.81, + "learning_rate": 1.7135727530137621e-06, + "loss": 0.9541, + "step": 31564 + }, + { + "epoch": 0.81, + "learning_rate": 1.713553367342604e-06, + "loss": 0.8057, + "step": 31565 + }, + { + "epoch": 0.81, + "learning_rate": 1.713533981125111e-06, + "loss": 0.666, + "step": 31566 + }, + { + "epoch": 0.81, + "learning_rate": 1.7135145943612974e-06, + "loss": 0.8662, + "step": 31567 + }, + { + "epoch": 0.81, + "learning_rate": 1.7134952070511789e-06, + "loss": 0.8604, + "step": 31568 + }, + { + "epoch": 0.81, + "learning_rate": 1.71347581919477e-06, + "loss": 0.875, + "step": 31569 + }, + { + "epoch": 0.81, + "learning_rate": 1.7134564307920854e-06, + "loss": 0.9893, + "step": 31570 + }, + { + "epoch": 0.81, + "learning_rate": 1.7134370418431395e-06, + "loss": 0.6816, + "step": 31571 + }, + { + "epoch": 0.81, + "learning_rate": 1.7134176523479483e-06, + "loss": 0.8257, + "step": 31572 + }, + { + "epoch": 0.81, + "learning_rate": 1.7133982623065258e-06, + "loss": 0.8652, + "step": 31573 + }, + { + "epoch": 0.81, + "learning_rate": 1.713378871718887e-06, + "loss": 0.8896, + "step": 31574 + }, + { + "epoch": 0.81, + "learning_rate": 1.7133594805850469e-06, + "loss": 0.5898, + "step": 31575 + }, + { + "epoch": 0.81, + "learning_rate": 1.7133400889050203e-06, + "loss": 0.9551, + "step": 31576 + }, + { + "epoch": 0.81, + "learning_rate": 1.7133206966788216e-06, + "loss": 0.6616, + "step": 31577 + }, + { + "epoch": 0.81, + "learning_rate": 1.7133013039064666e-06, + "loss": 0.7788, + "step": 31578 + }, + { + "epoch": 0.81, + "learning_rate": 1.7132819105879692e-06, + "loss": 0.917, + "step": 31579 + }, + { + "epoch": 0.81, + "learning_rate": 1.7132625167233447e-06, + "loss": 0.7202, + "step": 31580 + }, + { + "epoch": 0.81, + "learning_rate": 1.713243122312608e-06, + "loss": 0.877, + "step": 31581 + }, + { + "epoch": 0.81, + "learning_rate": 1.7132237273557737e-06, + "loss": 0.6106, + "step": 31582 + }, + { + "epoch": 0.81, + "learning_rate": 1.7132043318528568e-06, + "loss": 1.0264, + "step": 31583 + }, + { + "epoch": 0.81, + "learning_rate": 1.7131849358038724e-06, + "loss": 0.7744, + "step": 31584 + }, + { + "epoch": 0.81, + "learning_rate": 1.713165539208835e-06, + "loss": 0.8926, + "step": 31585 + }, + { + "epoch": 0.81, + "learning_rate": 1.7131461420677593e-06, + "loss": 0.9385, + "step": 31586 + }, + { + "epoch": 0.81, + "learning_rate": 1.7131267443806606e-06, + "loss": 0.8154, + "step": 31587 + }, + { + "epoch": 0.81, + "learning_rate": 1.713107346147553e-06, + "loss": 0.7803, + "step": 31588 + }, + { + "epoch": 0.81, + "learning_rate": 1.7130879473684527e-06, + "loss": 0.8662, + "step": 31589 + }, + { + "epoch": 0.81, + "learning_rate": 1.7130685480433736e-06, + "loss": 0.8252, + "step": 31590 + }, + { + "epoch": 0.81, + "learning_rate": 1.7130491481723303e-06, + "loss": 0.9609, + "step": 31591 + }, + { + "epoch": 0.81, + "learning_rate": 1.7130297477553382e-06, + "loss": 0.9189, + "step": 31592 + }, + { + "epoch": 0.81, + "learning_rate": 1.7130103467924122e-06, + "loss": 1.002, + "step": 31593 + }, + { + "epoch": 0.81, + "learning_rate": 1.7129909452835668e-06, + "loss": 0.8164, + "step": 31594 + }, + { + "epoch": 0.81, + "learning_rate": 1.712971543228817e-06, + "loss": 0.8394, + "step": 31595 + }, + { + "epoch": 0.81, + "learning_rate": 1.7129521406281778e-06, + "loss": 0.8735, + "step": 31596 + }, + { + "epoch": 0.81, + "learning_rate": 1.7129327374816636e-06, + "loss": 0.6709, + "step": 31597 + }, + { + "epoch": 0.81, + "learning_rate": 1.7129133337892898e-06, + "loss": 0.9795, + "step": 31598 + }, + { + "epoch": 0.81, + "learning_rate": 1.7128939295510714e-06, + "loss": 0.6934, + "step": 31599 + }, + { + "epoch": 0.81, + "learning_rate": 1.7128745247670225e-06, + "loss": 0.6772, + "step": 31600 + }, + { + "epoch": 0.81, + "learning_rate": 1.7128551194371582e-06, + "loss": 0.6548, + "step": 31601 + }, + { + "epoch": 0.81, + "learning_rate": 1.712835713561494e-06, + "loss": 1.0391, + "step": 31602 + }, + { + "epoch": 0.81, + "learning_rate": 1.7128163071400439e-06, + "loss": 0.73, + "step": 31603 + }, + { + "epoch": 0.81, + "learning_rate": 1.7127969001728232e-06, + "loss": 0.9814, + "step": 31604 + }, + { + "epoch": 0.81, + "learning_rate": 1.7127774926598465e-06, + "loss": 0.8389, + "step": 31605 + }, + { + "epoch": 0.81, + "learning_rate": 1.7127580846011295e-06, + "loss": 0.9756, + "step": 31606 + }, + { + "epoch": 0.81, + "learning_rate": 1.712738675996686e-06, + "loss": 0.8025, + "step": 31607 + }, + { + "epoch": 0.81, + "learning_rate": 1.7127192668465312e-06, + "loss": 0.9297, + "step": 31608 + }, + { + "epoch": 0.81, + "learning_rate": 1.71269985715068e-06, + "loss": 0.9409, + "step": 31609 + }, + { + "epoch": 0.81, + "learning_rate": 1.7126804469091473e-06, + "loss": 0.7236, + "step": 31610 + }, + { + "epoch": 0.81, + "learning_rate": 1.7126610361219482e-06, + "loss": 0.7905, + "step": 31611 + }, + { + "epoch": 0.81, + "learning_rate": 1.7126416247890969e-06, + "loss": 0.8906, + "step": 31612 + }, + { + "epoch": 0.81, + "learning_rate": 1.7126222129106091e-06, + "loss": 0.6943, + "step": 31613 + }, + { + "epoch": 0.81, + "learning_rate": 1.712602800486499e-06, + "loss": 0.8184, + "step": 31614 + }, + { + "epoch": 0.81, + "learning_rate": 1.7125833875167817e-06, + "loss": 0.665, + "step": 31615 + }, + { + "epoch": 0.81, + "learning_rate": 1.712563974001472e-06, + "loss": 1.0322, + "step": 31616 + }, + { + "epoch": 0.81, + "learning_rate": 1.7125445599405853e-06, + "loss": 0.7979, + "step": 31617 + }, + { + "epoch": 0.81, + "learning_rate": 1.7125251453341356e-06, + "loss": 0.957, + "step": 31618 + }, + { + "epoch": 0.81, + "learning_rate": 1.7125057301821379e-06, + "loss": 0.5947, + "step": 31619 + }, + { + "epoch": 0.81, + "learning_rate": 1.7124863144846077e-06, + "loss": 0.5942, + "step": 31620 + }, + { + "epoch": 0.81, + "learning_rate": 1.7124668982415595e-06, + "loss": 0.8525, + "step": 31621 + }, + { + "epoch": 0.81, + "learning_rate": 1.7124474814530081e-06, + "loss": 0.804, + "step": 31622 + }, + { + "epoch": 0.81, + "learning_rate": 1.7124280641189684e-06, + "loss": 0.793, + "step": 31623 + }, + { + "epoch": 0.81, + "learning_rate": 1.712408646239455e-06, + "loss": 0.7119, + "step": 31624 + }, + { + "epoch": 0.81, + "learning_rate": 1.7123892278144835e-06, + "loss": 0.9463, + "step": 31625 + }, + { + "epoch": 0.81, + "learning_rate": 1.7123698088440684e-06, + "loss": 0.9053, + "step": 31626 + }, + { + "epoch": 0.81, + "learning_rate": 1.712350389328224e-06, + "loss": 0.8975, + "step": 31627 + }, + { + "epoch": 0.81, + "learning_rate": 1.7123309692669658e-06, + "loss": 0.7656, + "step": 31628 + }, + { + "epoch": 0.81, + "learning_rate": 1.7123115486603088e-06, + "loss": 0.9834, + "step": 31629 + }, + { + "epoch": 0.81, + "learning_rate": 1.7122921275082677e-06, + "loss": 0.9111, + "step": 31630 + }, + { + "epoch": 0.81, + "learning_rate": 1.712272705810857e-06, + "loss": 0.7271, + "step": 31631 + }, + { + "epoch": 0.81, + "learning_rate": 1.7122532835680916e-06, + "loss": 1.124, + "step": 31632 + }, + { + "epoch": 0.81, + "learning_rate": 1.712233860779987e-06, + "loss": 1.2744, + "step": 31633 + }, + { + "epoch": 0.81, + "learning_rate": 1.7122144374465575e-06, + "loss": 0.854, + "step": 31634 + }, + { + "epoch": 0.81, + "learning_rate": 1.7121950135678182e-06, + "loss": 0.8848, + "step": 31635 + }, + { + "epoch": 0.81, + "learning_rate": 1.7121755891437842e-06, + "loss": 0.9111, + "step": 31636 + }, + { + "epoch": 0.81, + "learning_rate": 1.7121561641744696e-06, + "loss": 0.7334, + "step": 31637 + }, + { + "epoch": 0.81, + "learning_rate": 1.71213673865989e-06, + "loss": 0.8086, + "step": 31638 + }, + { + "epoch": 0.81, + "learning_rate": 1.7121173126000602e-06, + "loss": 0.999, + "step": 31639 + }, + { + "epoch": 0.81, + "learning_rate": 1.7120978859949945e-06, + "loss": 1.042, + "step": 31640 + }, + { + "epoch": 0.81, + "learning_rate": 1.7120784588447086e-06, + "loss": 0.5464, + "step": 31641 + }, + { + "epoch": 0.81, + "learning_rate": 1.712059031149217e-06, + "loss": 0.8887, + "step": 31642 + }, + { + "epoch": 0.81, + "learning_rate": 1.712039602908534e-06, + "loss": 0.9321, + "step": 31643 + }, + { + "epoch": 0.81, + "learning_rate": 1.7120201741226756e-06, + "loss": 0.8315, + "step": 31644 + }, + { + "epoch": 0.81, + "learning_rate": 1.7120007447916559e-06, + "loss": 1.0566, + "step": 31645 + }, + { + "epoch": 0.81, + "learning_rate": 1.7119813149154898e-06, + "loss": 0.9346, + "step": 31646 + }, + { + "epoch": 0.81, + "learning_rate": 1.7119618844941926e-06, + "loss": 0.7676, + "step": 31647 + }, + { + "epoch": 0.81, + "learning_rate": 1.7119424535277788e-06, + "loss": 0.8623, + "step": 31648 + }, + { + "epoch": 0.81, + "learning_rate": 1.7119230220162634e-06, + "loss": 0.6523, + "step": 31649 + }, + { + "epoch": 0.81, + "learning_rate": 1.7119035899596615e-06, + "loss": 0.5405, + "step": 31650 + }, + { + "epoch": 0.81, + "learning_rate": 1.7118841573579873e-06, + "loss": 0.9131, + "step": 31651 + }, + { + "epoch": 0.81, + "learning_rate": 1.7118647242112566e-06, + "loss": 0.7017, + "step": 31652 + }, + { + "epoch": 0.81, + "learning_rate": 1.7118452905194834e-06, + "loss": 0.815, + "step": 31653 + }, + { + "epoch": 0.81, + "learning_rate": 1.7118258562826833e-06, + "loss": 0.8887, + "step": 31654 + }, + { + "epoch": 0.81, + "learning_rate": 1.7118064215008707e-06, + "loss": 0.9854, + "step": 31655 + }, + { + "epoch": 0.81, + "learning_rate": 1.7117869861740605e-06, + "loss": 0.5005, + "step": 31656 + }, + { + "epoch": 0.81, + "learning_rate": 1.7117675503022682e-06, + "loss": 0.8979, + "step": 31657 + }, + { + "epoch": 0.81, + "learning_rate": 1.711748113885508e-06, + "loss": 0.7466, + "step": 31658 + }, + { + "epoch": 0.81, + "learning_rate": 1.7117286769237948e-06, + "loss": 1.1523, + "step": 31659 + }, + { + "epoch": 0.81, + "learning_rate": 1.7117092394171438e-06, + "loss": 0.8848, + "step": 31660 + }, + { + "epoch": 0.81, + "learning_rate": 1.71168980136557e-06, + "loss": 0.875, + "step": 31661 + }, + { + "epoch": 0.81, + "learning_rate": 1.7116703627690878e-06, + "loss": 0.4827, + "step": 31662 + }, + { + "epoch": 0.81, + "learning_rate": 1.7116509236277122e-06, + "loss": 0.6553, + "step": 31663 + }, + { + "epoch": 0.81, + "learning_rate": 1.7116314839414585e-06, + "loss": 0.8198, + "step": 31664 + }, + { + "epoch": 0.81, + "learning_rate": 1.7116120437103411e-06, + "loss": 0.7329, + "step": 31665 + }, + { + "epoch": 0.81, + "learning_rate": 1.7115926029343753e-06, + "loss": 0.8428, + "step": 31666 + }, + { + "epoch": 0.81, + "learning_rate": 1.7115731616135754e-06, + "loss": 0.9219, + "step": 31667 + }, + { + "epoch": 0.81, + "learning_rate": 1.7115537197479568e-06, + "loss": 0.9346, + "step": 31668 + }, + { + "epoch": 0.81, + "learning_rate": 1.7115342773375346e-06, + "loss": 0.9229, + "step": 31669 + }, + { + "epoch": 0.81, + "learning_rate": 1.711514834382323e-06, + "loss": 0.8242, + "step": 31670 + }, + { + "epoch": 0.81, + "learning_rate": 1.7114953908823371e-06, + "loss": 0.8301, + "step": 31671 + }, + { + "epoch": 0.81, + "learning_rate": 1.711475946837592e-06, + "loss": 0.9365, + "step": 31672 + }, + { + "epoch": 0.81, + "learning_rate": 1.7114565022481023e-06, + "loss": 0.79, + "step": 31673 + }, + { + "epoch": 0.81, + "learning_rate": 1.7114370571138835e-06, + "loss": 0.6304, + "step": 31674 + }, + { + "epoch": 0.81, + "learning_rate": 1.7114176114349496e-06, + "loss": 0.9043, + "step": 31675 + }, + { + "epoch": 0.81, + "learning_rate": 1.7113981652113163e-06, + "loss": 0.9678, + "step": 31676 + }, + { + "epoch": 0.81, + "learning_rate": 1.711378718442998e-06, + "loss": 0.9453, + "step": 31677 + }, + { + "epoch": 0.81, + "learning_rate": 1.7113592711300098e-06, + "loss": 1.0166, + "step": 31678 + }, + { + "epoch": 0.81, + "learning_rate": 1.7113398232723664e-06, + "loss": 1.0088, + "step": 31679 + }, + { + "epoch": 0.81, + "learning_rate": 1.7113203748700829e-06, + "loss": 0.5432, + "step": 31680 + }, + { + "epoch": 0.81, + "learning_rate": 1.7113009259231741e-06, + "loss": 0.7109, + "step": 31681 + }, + { + "epoch": 0.81, + "learning_rate": 1.7112814764316547e-06, + "loss": 0.7793, + "step": 31682 + }, + { + "epoch": 0.81, + "learning_rate": 1.71126202639554e-06, + "loss": 0.9785, + "step": 31683 + }, + { + "epoch": 0.81, + "learning_rate": 1.7112425758148446e-06, + "loss": 0.7539, + "step": 31684 + }, + { + "epoch": 0.81, + "learning_rate": 1.7112231246895833e-06, + "loss": 0.9238, + "step": 31685 + }, + { + "epoch": 0.81, + "learning_rate": 1.7112036730197713e-06, + "loss": 0.9775, + "step": 31686 + }, + { + "epoch": 0.81, + "learning_rate": 1.7111842208054235e-06, + "loss": 0.918, + "step": 31687 + }, + { + "epoch": 0.81, + "learning_rate": 1.7111647680465543e-06, + "loss": 0.8564, + "step": 31688 + }, + { + "epoch": 0.81, + "learning_rate": 1.7111453147431792e-06, + "loss": 0.8496, + "step": 31689 + }, + { + "epoch": 0.81, + "learning_rate": 1.7111258608953128e-06, + "loss": 1.0068, + "step": 31690 + }, + { + "epoch": 0.81, + "learning_rate": 1.7111064065029698e-06, + "loss": 0.9365, + "step": 31691 + }, + { + "epoch": 0.81, + "learning_rate": 1.7110869515661657e-06, + "loss": 0.8584, + "step": 31692 + }, + { + "epoch": 0.81, + "learning_rate": 1.711067496084915e-06, + "loss": 0.876, + "step": 31693 + }, + { + "epoch": 0.81, + "learning_rate": 1.7110480400592322e-06, + "loss": 0.8271, + "step": 31694 + }, + { + "epoch": 0.81, + "learning_rate": 1.7110285834891332e-06, + "loss": 0.6111, + "step": 31695 + }, + { + "epoch": 0.81, + "learning_rate": 1.7110091263746317e-06, + "loss": 1.0117, + "step": 31696 + }, + { + "epoch": 0.81, + "learning_rate": 1.7109896687157437e-06, + "loss": 0.7432, + "step": 31697 + }, + { + "epoch": 0.81, + "learning_rate": 1.7109702105124833e-06, + "loss": 0.8574, + "step": 31698 + }, + { + "epoch": 0.81, + "learning_rate": 1.7109507517648659e-06, + "loss": 0.4272, + "step": 31699 + }, + { + "epoch": 0.81, + "learning_rate": 1.7109312924729057e-06, + "loss": 0.7622, + "step": 31700 + }, + { + "epoch": 0.81, + "learning_rate": 1.7109118326366187e-06, + "loss": 0.9658, + "step": 31701 + }, + { + "epoch": 0.81, + "learning_rate": 1.710892372256019e-06, + "loss": 1.0967, + "step": 31702 + }, + { + "epoch": 0.81, + "learning_rate": 1.7108729113311218e-06, + "loss": 0.6372, + "step": 31703 + }, + { + "epoch": 0.81, + "learning_rate": 1.7108534498619416e-06, + "loss": 0.707, + "step": 31704 + }, + { + "epoch": 0.81, + "learning_rate": 1.7108339878484936e-06, + "loss": 0.998, + "step": 31705 + }, + { + "epoch": 0.81, + "learning_rate": 1.710814525290793e-06, + "loss": 0.7935, + "step": 31706 + }, + { + "epoch": 0.81, + "learning_rate": 1.7107950621888543e-06, + "loss": 0.8154, + "step": 31707 + }, + { + "epoch": 0.81, + "learning_rate": 1.7107755985426925e-06, + "loss": 0.791, + "step": 31708 + }, + { + "epoch": 0.81, + "learning_rate": 1.7107561343523224e-06, + "loss": 0.9219, + "step": 31709 + }, + { + "epoch": 0.81, + "learning_rate": 1.7107366696177593e-06, + "loss": 1.0156, + "step": 31710 + }, + { + "epoch": 0.81, + "learning_rate": 1.7107172043390175e-06, + "loss": 1.1221, + "step": 31711 + }, + { + "epoch": 0.81, + "learning_rate": 1.7106977385161122e-06, + "loss": 0.875, + "step": 31712 + }, + { + "epoch": 0.81, + "learning_rate": 1.7106782721490585e-06, + "loss": 0.8882, + "step": 31713 + }, + { + "epoch": 0.81, + "learning_rate": 1.710658805237871e-06, + "loss": 0.6064, + "step": 31714 + }, + { + "epoch": 0.81, + "learning_rate": 1.710639337782565e-06, + "loss": 0.707, + "step": 31715 + }, + { + "epoch": 0.81, + "learning_rate": 1.710619869783155e-06, + "loss": 0.7026, + "step": 31716 + }, + { + "epoch": 0.81, + "learning_rate": 1.7106004012396557e-06, + "loss": 1.0264, + "step": 31717 + }, + { + "epoch": 0.81, + "learning_rate": 1.7105809321520827e-06, + "loss": 0.6914, + "step": 31718 + }, + { + "epoch": 0.81, + "learning_rate": 1.7105614625204504e-06, + "loss": 0.9033, + "step": 31719 + }, + { + "epoch": 0.81, + "learning_rate": 1.710541992344774e-06, + "loss": 0.7705, + "step": 31720 + }, + { + "epoch": 0.81, + "learning_rate": 1.7105225216250682e-06, + "loss": 0.605, + "step": 31721 + }, + { + "epoch": 0.81, + "learning_rate": 1.710503050361348e-06, + "loss": 0.7803, + "step": 31722 + }, + { + "epoch": 0.81, + "learning_rate": 1.7104835785536285e-06, + "loss": 0.8516, + "step": 31723 + }, + { + "epoch": 0.81, + "learning_rate": 1.710464106201924e-06, + "loss": 0.6602, + "step": 31724 + }, + { + "epoch": 0.81, + "learning_rate": 1.7104446333062498e-06, + "loss": 1.082, + "step": 31725 + }, + { + "epoch": 0.81, + "learning_rate": 1.710425159866621e-06, + "loss": 0.8154, + "step": 31726 + }, + { + "epoch": 0.81, + "learning_rate": 1.7104056858830523e-06, + "loss": 0.7158, + "step": 31727 + }, + { + "epoch": 0.81, + "learning_rate": 1.7103862113555584e-06, + "loss": 0.8613, + "step": 31728 + }, + { + "epoch": 0.81, + "learning_rate": 1.710366736284155e-06, + "loss": 1.0176, + "step": 31729 + }, + { + "epoch": 0.81, + "learning_rate": 1.710347260668856e-06, + "loss": 0.8447, + "step": 31730 + }, + { + "epoch": 0.81, + "learning_rate": 1.710327784509677e-06, + "loss": 0.8076, + "step": 31731 + }, + { + "epoch": 0.81, + "learning_rate": 1.7103083078066326e-06, + "loss": 0.7773, + "step": 31732 + }, + { + "epoch": 0.81, + "learning_rate": 1.7102888305597377e-06, + "loss": 0.9443, + "step": 31733 + }, + { + "epoch": 0.81, + "learning_rate": 1.7102693527690074e-06, + "loss": 1.0068, + "step": 31734 + }, + { + "epoch": 0.81, + "learning_rate": 1.7102498744344564e-06, + "loss": 0.7344, + "step": 31735 + }, + { + "epoch": 0.81, + "learning_rate": 1.7102303955560998e-06, + "loss": 0.8555, + "step": 31736 + }, + { + "epoch": 0.81, + "learning_rate": 1.7102109161339525e-06, + "loss": 0.8672, + "step": 31737 + }, + { + "epoch": 0.81, + "learning_rate": 1.7101914361680291e-06, + "loss": 0.6929, + "step": 31738 + }, + { + "epoch": 0.81, + "learning_rate": 1.710171955658345e-06, + "loss": 0.9395, + "step": 31739 + }, + { + "epoch": 0.81, + "learning_rate": 1.7101524746049146e-06, + "loss": 0.769, + "step": 31740 + }, + { + "epoch": 0.81, + "learning_rate": 1.7101329930077536e-06, + "loss": 0.6631, + "step": 31741 + }, + { + "epoch": 0.81, + "learning_rate": 1.7101135108668762e-06, + "loss": 0.7695, + "step": 31742 + }, + { + "epoch": 0.81, + "learning_rate": 1.7100940281822975e-06, + "loss": 0.8462, + "step": 31743 + }, + { + "epoch": 0.81, + "learning_rate": 1.7100745449540326e-06, + "loss": 0.7246, + "step": 31744 + }, + { + "epoch": 0.81, + "learning_rate": 1.710055061182096e-06, + "loss": 0.8887, + "step": 31745 + }, + { + "epoch": 0.81, + "learning_rate": 1.710035576866503e-06, + "loss": 0.8125, + "step": 31746 + }, + { + "epoch": 0.81, + "learning_rate": 1.7100160920072687e-06, + "loss": 0.7285, + "step": 31747 + }, + { + "epoch": 0.81, + "learning_rate": 1.7099966066044075e-06, + "loss": 0.7334, + "step": 31748 + }, + { + "epoch": 0.81, + "learning_rate": 1.7099771206579345e-06, + "loss": 0.873, + "step": 31749 + }, + { + "epoch": 0.81, + "learning_rate": 1.7099576341678646e-06, + "loss": 0.9033, + "step": 31750 + }, + { + "epoch": 0.81, + "learning_rate": 1.709938147134213e-06, + "loss": 0.8818, + "step": 31751 + }, + { + "epoch": 0.81, + "learning_rate": 1.7099186595569938e-06, + "loss": 0.6418, + "step": 31752 + }, + { + "epoch": 0.81, + "learning_rate": 1.7098991714362232e-06, + "loss": 1.0029, + "step": 31753 + }, + { + "epoch": 0.81, + "learning_rate": 1.7098796827719152e-06, + "loss": 0.647, + "step": 31754 + }, + { + "epoch": 0.81, + "learning_rate": 1.709860193564085e-06, + "loss": 0.8394, + "step": 31755 + }, + { + "epoch": 0.81, + "learning_rate": 1.7098407038127477e-06, + "loss": 0.6973, + "step": 31756 + }, + { + "epoch": 0.81, + "learning_rate": 1.7098212135179178e-06, + "loss": 0.6797, + "step": 31757 + }, + { + "epoch": 0.81, + "learning_rate": 1.7098017226796103e-06, + "loss": 0.7441, + "step": 31758 + }, + { + "epoch": 0.81, + "learning_rate": 1.7097822312978404e-06, + "loss": 0.8467, + "step": 31759 + }, + { + "epoch": 0.81, + "learning_rate": 1.7097627393726229e-06, + "loss": 0.8086, + "step": 31760 + }, + { + "epoch": 0.81, + "learning_rate": 1.7097432469039727e-06, + "loss": 0.8438, + "step": 31761 + }, + { + "epoch": 0.81, + "learning_rate": 1.7097237538919047e-06, + "loss": 0.6538, + "step": 31762 + }, + { + "epoch": 0.81, + "learning_rate": 1.709704260336434e-06, + "loss": 0.9258, + "step": 31763 + }, + { + "epoch": 0.81, + "learning_rate": 1.7096847662375753e-06, + "loss": 0.9365, + "step": 31764 + }, + { + "epoch": 0.81, + "learning_rate": 1.7096652715953433e-06, + "loss": 1.0283, + "step": 31765 + }, + { + "epoch": 0.81, + "learning_rate": 1.7096457764097536e-06, + "loss": 0.8613, + "step": 31766 + }, + { + "epoch": 0.81, + "learning_rate": 1.7096262806808207e-06, + "loss": 0.8589, + "step": 31767 + }, + { + "epoch": 0.81, + "learning_rate": 1.7096067844085595e-06, + "loss": 0.9688, + "step": 31768 + }, + { + "epoch": 0.81, + "learning_rate": 1.7095872875929852e-06, + "loss": 0.8066, + "step": 31769 + }, + { + "epoch": 0.81, + "learning_rate": 1.709567790234112e-06, + "loss": 0.7622, + "step": 31770 + }, + { + "epoch": 0.81, + "learning_rate": 1.7095482923319562e-06, + "loss": 0.7832, + "step": 31771 + }, + { + "epoch": 0.81, + "learning_rate": 1.7095287938865312e-06, + "loss": 0.8369, + "step": 31772 + }, + { + "epoch": 0.81, + "learning_rate": 1.709509294897853e-06, + "loss": 0.9766, + "step": 31773 + }, + { + "epoch": 0.81, + "learning_rate": 1.709489795365936e-06, + "loss": 0.9248, + "step": 31774 + }, + { + "epoch": 0.81, + "learning_rate": 1.7094702952907953e-06, + "loss": 1.0195, + "step": 31775 + }, + { + "epoch": 0.81, + "learning_rate": 1.7094507946724458e-06, + "loss": 0.8271, + "step": 31776 + }, + { + "epoch": 0.81, + "learning_rate": 1.7094312935109025e-06, + "loss": 0.8057, + "step": 31777 + }, + { + "epoch": 0.81, + "learning_rate": 1.7094117918061803e-06, + "loss": 0.8154, + "step": 31778 + }, + { + "epoch": 0.81, + "learning_rate": 1.7093922895582942e-06, + "loss": 0.8447, + "step": 31779 + }, + { + "epoch": 0.81, + "learning_rate": 1.709372786767259e-06, + "loss": 0.7207, + "step": 31780 + }, + { + "epoch": 0.81, + "learning_rate": 1.7093532834330896e-06, + "loss": 0.7373, + "step": 31781 + }, + { + "epoch": 0.81, + "learning_rate": 1.709333779555801e-06, + "loss": 0.7747, + "step": 31782 + }, + { + "epoch": 0.81, + "learning_rate": 1.709314275135408e-06, + "loss": 0.8599, + "step": 31783 + }, + { + "epoch": 0.81, + "learning_rate": 1.709294770171926e-06, + "loss": 0.958, + "step": 31784 + }, + { + "epoch": 0.81, + "learning_rate": 1.7092752646653695e-06, + "loss": 0.7944, + "step": 31785 + }, + { + "epoch": 0.81, + "learning_rate": 1.7092557586157535e-06, + "loss": 0.8145, + "step": 31786 + }, + { + "epoch": 0.81, + "learning_rate": 1.7092362520230927e-06, + "loss": 0.7646, + "step": 31787 + }, + { + "epoch": 0.81, + "learning_rate": 1.7092167448874028e-06, + "loss": 0.6885, + "step": 31788 + }, + { + "epoch": 0.81, + "learning_rate": 1.709197237208698e-06, + "loss": 0.8525, + "step": 31789 + }, + { + "epoch": 0.81, + "learning_rate": 1.7091777289869933e-06, + "loss": 0.7922, + "step": 31790 + }, + { + "epoch": 0.81, + "learning_rate": 1.7091582202223044e-06, + "loss": 0.8105, + "step": 31791 + }, + { + "epoch": 0.81, + "learning_rate": 1.7091387109146451e-06, + "loss": 0.7158, + "step": 31792 + }, + { + "epoch": 0.81, + "learning_rate": 1.709119201064031e-06, + "loss": 0.916, + "step": 31793 + }, + { + "epoch": 0.81, + "learning_rate": 1.7090996906704768e-06, + "loss": 0.7483, + "step": 31794 + }, + { + "epoch": 0.81, + "learning_rate": 1.709080179733998e-06, + "loss": 0.9883, + "step": 31795 + }, + { + "epoch": 0.81, + "learning_rate": 1.709060668254609e-06, + "loss": 0.9824, + "step": 31796 + }, + { + "epoch": 0.81, + "learning_rate": 1.7090411562323247e-06, + "loss": 0.9082, + "step": 31797 + }, + { + "epoch": 0.81, + "learning_rate": 1.7090216436671603e-06, + "loss": 0.7998, + "step": 31798 + }, + { + "epoch": 0.82, + "learning_rate": 1.7090021305591304e-06, + "loss": 0.9033, + "step": 31799 + }, + { + "epoch": 0.82, + "learning_rate": 1.7089826169082505e-06, + "loss": 0.8164, + "step": 31800 + }, + { + "epoch": 0.82, + "learning_rate": 1.7089631027145348e-06, + "loss": 0.8779, + "step": 31801 + }, + { + "epoch": 0.82, + "learning_rate": 1.708943587977999e-06, + "loss": 0.875, + "step": 31802 + }, + { + "epoch": 0.82, + "learning_rate": 1.7089240726986577e-06, + "loss": 1.1104, + "step": 31803 + }, + { + "epoch": 0.82, + "learning_rate": 1.7089045568765256e-06, + "loss": 0.7979, + "step": 31804 + }, + { + "epoch": 0.82, + "learning_rate": 1.708885040511618e-06, + "loss": 0.8838, + "step": 31805 + }, + { + "epoch": 0.82, + "learning_rate": 1.7088655236039498e-06, + "loss": 0.8828, + "step": 31806 + }, + { + "epoch": 0.82, + "learning_rate": 1.7088460061535356e-06, + "loss": 0.8467, + "step": 31807 + }, + { + "epoch": 0.82, + "learning_rate": 1.7088264881603908e-06, + "loss": 0.9307, + "step": 31808 + }, + { + "epoch": 0.82, + "learning_rate": 1.7088069696245303e-06, + "loss": 0.8203, + "step": 31809 + }, + { + "epoch": 0.82, + "learning_rate": 1.7087874505459687e-06, + "loss": 0.832, + "step": 31810 + }, + { + "epoch": 0.82, + "learning_rate": 1.708767930924721e-06, + "loss": 0.6553, + "step": 31811 + }, + { + "epoch": 0.82, + "learning_rate": 1.7087484107608028e-06, + "loss": 0.8926, + "step": 31812 + }, + { + "epoch": 0.82, + "learning_rate": 1.7087288900542283e-06, + "loss": 0.9512, + "step": 31813 + }, + { + "epoch": 0.82, + "learning_rate": 1.7087093688050124e-06, + "loss": 0.9033, + "step": 31814 + }, + { + "epoch": 0.82, + "learning_rate": 1.7086898470131705e-06, + "loss": 0.8896, + "step": 31815 + }, + { + "epoch": 0.82, + "learning_rate": 1.7086703246787173e-06, + "loss": 0.8843, + "step": 31816 + }, + { + "epoch": 0.82, + "learning_rate": 1.7086508018016682e-06, + "loss": 0.8408, + "step": 31817 + }, + { + "epoch": 0.82, + "learning_rate": 1.7086312783820373e-06, + "loss": 0.6875, + "step": 31818 + }, + { + "epoch": 0.82, + "learning_rate": 1.7086117544198403e-06, + "loss": 0.6951, + "step": 31819 + }, + { + "epoch": 0.82, + "learning_rate": 1.7085922299150917e-06, + "loss": 0.7422, + "step": 31820 + }, + { + "epoch": 0.82, + "learning_rate": 1.7085727048678066e-06, + "loss": 0.8838, + "step": 31821 + }, + { + "epoch": 0.82, + "learning_rate": 1.7085531792779997e-06, + "loss": 0.8037, + "step": 31822 + }, + { + "epoch": 0.82, + "learning_rate": 1.7085336531456867e-06, + "loss": 0.79, + "step": 31823 + }, + { + "epoch": 0.82, + "learning_rate": 1.7085141264708817e-06, + "loss": 0.751, + "step": 31824 + }, + { + "epoch": 0.82, + "learning_rate": 1.7084945992536004e-06, + "loss": 0.8711, + "step": 31825 + }, + { + "epoch": 0.82, + "learning_rate": 1.708475071493857e-06, + "loss": 0.7178, + "step": 31826 + }, + { + "epoch": 0.82, + "learning_rate": 1.708455543191667e-06, + "loss": 0.8516, + "step": 31827 + }, + { + "epoch": 0.82, + "learning_rate": 1.708436014347045e-06, + "loss": 1.0156, + "step": 31828 + }, + { + "epoch": 0.82, + "learning_rate": 1.7084164849600065e-06, + "loss": 0.9229, + "step": 31829 + }, + { + "epoch": 0.82, + "learning_rate": 1.7083969550305657e-06, + "loss": 0.6924, + "step": 31830 + }, + { + "epoch": 0.82, + "learning_rate": 1.7083774245587382e-06, + "loss": 0.8613, + "step": 31831 + }, + { + "epoch": 0.82, + "learning_rate": 1.7083578935445385e-06, + "loss": 0.9736, + "step": 31832 + }, + { + "epoch": 0.82, + "learning_rate": 1.7083383619879817e-06, + "loss": 0.6699, + "step": 31833 + }, + { + "epoch": 0.82, + "learning_rate": 1.7083188298890829e-06, + "loss": 0.9639, + "step": 31834 + }, + { + "epoch": 0.82, + "learning_rate": 1.7082992972478568e-06, + "loss": 0.5278, + "step": 31835 + }, + { + "epoch": 0.82, + "learning_rate": 1.7082797640643185e-06, + "loss": 0.9189, + "step": 31836 + }, + { + "epoch": 0.82, + "learning_rate": 1.708260230338483e-06, + "loss": 0.7744, + "step": 31837 + }, + { + "epoch": 0.82, + "learning_rate": 1.7082406960703652e-06, + "loss": 0.7646, + "step": 31838 + }, + { + "epoch": 0.82, + "learning_rate": 1.7082211612599805e-06, + "loss": 0.7246, + "step": 31839 + }, + { + "epoch": 0.82, + "learning_rate": 1.7082016259073426e-06, + "loss": 0.7881, + "step": 31840 + }, + { + "epoch": 0.82, + "learning_rate": 1.708182090012468e-06, + "loss": 0.7441, + "step": 31841 + }, + { + "epoch": 0.82, + "learning_rate": 1.7081625535753704e-06, + "loss": 0.7156, + "step": 31842 + }, + { + "epoch": 0.82, + "learning_rate": 1.7081430165960655e-06, + "loss": 1.0742, + "step": 31843 + }, + { + "epoch": 0.82, + "learning_rate": 1.708123479074568e-06, + "loss": 1.0654, + "step": 31844 + }, + { + "epoch": 0.82, + "learning_rate": 1.708103941010893e-06, + "loss": 0.7002, + "step": 31845 + }, + { + "epoch": 0.82, + "learning_rate": 1.7080844024050556e-06, + "loss": 0.5337, + "step": 31846 + }, + { + "epoch": 0.82, + "learning_rate": 1.7080648632570702e-06, + "loss": 0.7986, + "step": 31847 + }, + { + "epoch": 0.82, + "learning_rate": 1.7080453235669524e-06, + "loss": 0.6611, + "step": 31848 + }, + { + "epoch": 0.82, + "learning_rate": 1.7080257833347165e-06, + "loss": 1.0635, + "step": 31849 + }, + { + "epoch": 0.82, + "learning_rate": 1.7080062425603781e-06, + "loss": 0.8574, + "step": 31850 + }, + { + "epoch": 0.82, + "learning_rate": 1.7079867012439518e-06, + "loss": 0.877, + "step": 31851 + }, + { + "epoch": 0.82, + "learning_rate": 1.7079671593854523e-06, + "loss": 0.9199, + "step": 31852 + }, + { + "epoch": 0.82, + "learning_rate": 1.7079476169848955e-06, + "loss": 1.0596, + "step": 31853 + }, + { + "epoch": 0.82, + "learning_rate": 1.7079280740422953e-06, + "loss": 0.9561, + "step": 31854 + }, + { + "epoch": 0.82, + "learning_rate": 1.7079085305576672e-06, + "loss": 0.9824, + "step": 31855 + }, + { + "epoch": 0.82, + "learning_rate": 1.7078889865310262e-06, + "loss": 0.6748, + "step": 31856 + }, + { + "epoch": 0.82, + "learning_rate": 1.7078694419623872e-06, + "loss": 0.7803, + "step": 31857 + }, + { + "epoch": 0.82, + "learning_rate": 1.7078498968517648e-06, + "loss": 0.8804, + "step": 31858 + }, + { + "epoch": 0.82, + "learning_rate": 1.7078303511991746e-06, + "loss": 1.0449, + "step": 31859 + }, + { + "epoch": 0.82, + "learning_rate": 1.707810805004631e-06, + "loss": 0.3906, + "step": 31860 + }, + { + "epoch": 0.82, + "learning_rate": 1.7077912582681495e-06, + "loss": 0.8066, + "step": 31861 + }, + { + "epoch": 0.82, + "learning_rate": 1.7077717109897445e-06, + "loss": 0.8311, + "step": 31862 + }, + { + "epoch": 0.82, + "learning_rate": 1.7077521631694314e-06, + "loss": 0.9639, + "step": 31863 + }, + { + "epoch": 0.82, + "learning_rate": 1.707732614807225e-06, + "loss": 1.001, + "step": 31864 + }, + { + "epoch": 0.82, + "learning_rate": 1.7077130659031402e-06, + "loss": 0.8379, + "step": 31865 + }, + { + "epoch": 0.82, + "learning_rate": 1.7076935164571921e-06, + "loss": 0.9541, + "step": 31866 + }, + { + "epoch": 0.82, + "learning_rate": 1.7076739664693958e-06, + "loss": 0.9453, + "step": 31867 + }, + { + "epoch": 0.82, + "learning_rate": 1.7076544159397658e-06, + "loss": 0.8975, + "step": 31868 + }, + { + "epoch": 0.82, + "learning_rate": 1.7076348648683174e-06, + "loss": 0.7393, + "step": 31869 + }, + { + "epoch": 0.82, + "learning_rate": 1.707615313255066e-06, + "loss": 1.041, + "step": 31870 + }, + { + "epoch": 0.82, + "learning_rate": 1.7075957611000256e-06, + "loss": 0.8027, + "step": 31871 + }, + { + "epoch": 0.82, + "learning_rate": 1.7075762084032115e-06, + "loss": 0.9009, + "step": 31872 + }, + { + "epoch": 0.82, + "learning_rate": 1.7075566551646392e-06, + "loss": 0.8486, + "step": 31873 + }, + { + "epoch": 0.82, + "learning_rate": 1.7075371013843232e-06, + "loss": 0.8457, + "step": 31874 + }, + { + "epoch": 0.82, + "learning_rate": 1.7075175470622787e-06, + "loss": 0.813, + "step": 31875 + }, + { + "epoch": 0.82, + "learning_rate": 1.7074979921985203e-06, + "loss": 1.0288, + "step": 31876 + }, + { + "epoch": 0.82, + "learning_rate": 1.7074784367930633e-06, + "loss": 0.7559, + "step": 31877 + }, + { + "epoch": 0.82, + "learning_rate": 1.7074588808459228e-06, + "loss": 0.8662, + "step": 31878 + }, + { + "epoch": 0.82, + "learning_rate": 1.707439324357113e-06, + "loss": 0.7549, + "step": 31879 + }, + { + "epoch": 0.82, + "learning_rate": 1.70741976732665e-06, + "loss": 0.6968, + "step": 31880 + }, + { + "epoch": 0.82, + "learning_rate": 1.7074002097545481e-06, + "loss": 0.9131, + "step": 31881 + }, + { + "epoch": 0.82, + "learning_rate": 1.7073806516408223e-06, + "loss": 0.9131, + "step": 31882 + }, + { + "epoch": 0.82, + "learning_rate": 1.7073610929854877e-06, + "loss": 0.7212, + "step": 31883 + }, + { + "epoch": 0.82, + "learning_rate": 1.707341533788559e-06, + "loss": 1.084, + "step": 31884 + }, + { + "epoch": 0.82, + "learning_rate": 1.7073219740500518e-06, + "loss": 1.0547, + "step": 31885 + }, + { + "epoch": 0.82, + "learning_rate": 1.7073024137699804e-06, + "loss": 0.8545, + "step": 31886 + }, + { + "epoch": 0.82, + "learning_rate": 1.70728285294836e-06, + "loss": 0.8828, + "step": 31887 + }, + { + "epoch": 0.82, + "learning_rate": 1.707263291585206e-06, + "loss": 0.5757, + "step": 31888 + }, + { + "epoch": 0.82, + "learning_rate": 1.7072437296805328e-06, + "loss": 0.877, + "step": 31889 + }, + { + "epoch": 0.82, + "learning_rate": 1.7072241672343556e-06, + "loss": 0.9346, + "step": 31890 + }, + { + "epoch": 0.82, + "learning_rate": 1.7072046042466894e-06, + "loss": 0.9805, + "step": 31891 + }, + { + "epoch": 0.82, + "learning_rate": 1.7071850407175492e-06, + "loss": 0.9268, + "step": 31892 + }, + { + "epoch": 0.82, + "learning_rate": 1.70716547664695e-06, + "loss": 0.6416, + "step": 31893 + }, + { + "epoch": 0.82, + "learning_rate": 1.7071459120349065e-06, + "loss": 0.8438, + "step": 31894 + }, + { + "epoch": 0.82, + "learning_rate": 1.7071263468814341e-06, + "loss": 1.0215, + "step": 31895 + }, + { + "epoch": 0.82, + "learning_rate": 1.7071067811865474e-06, + "loss": 1.0059, + "step": 31896 + }, + { + "epoch": 0.82, + "learning_rate": 1.7070872149502616e-06, + "loss": 0.7842, + "step": 31897 + }, + { + "epoch": 0.82, + "learning_rate": 1.7070676481725915e-06, + "loss": 0.7197, + "step": 31898 + }, + { + "epoch": 0.82, + "learning_rate": 1.7070480808535526e-06, + "loss": 0.9395, + "step": 31899 + }, + { + "epoch": 0.82, + "learning_rate": 1.7070285129931593e-06, + "loss": 0.7822, + "step": 31900 + }, + { + "epoch": 0.82, + "learning_rate": 1.707008944591427e-06, + "loss": 1.2422, + "step": 31901 + }, + { + "epoch": 0.82, + "learning_rate": 1.7069893756483697e-06, + "loss": 1.1035, + "step": 31902 + }, + { + "epoch": 0.82, + "learning_rate": 1.7069698061640039e-06, + "loss": 0.9023, + "step": 31903 + }, + { + "epoch": 0.82, + "learning_rate": 1.7069502361383434e-06, + "loss": 0.6616, + "step": 31904 + }, + { + "epoch": 0.82, + "learning_rate": 1.706930665571404e-06, + "loss": 1.0166, + "step": 31905 + }, + { + "epoch": 0.82, + "learning_rate": 1.7069110944632e-06, + "loss": 0.6484, + "step": 31906 + }, + { + "epoch": 0.82, + "learning_rate": 1.7068915228137465e-06, + "loss": 0.9043, + "step": 31907 + }, + { + "epoch": 0.82, + "learning_rate": 1.706871950623059e-06, + "loss": 0.8369, + "step": 31908 + }, + { + "epoch": 0.82, + "learning_rate": 1.7068523778911522e-06, + "loss": 0.8584, + "step": 31909 + }, + { + "epoch": 0.82, + "learning_rate": 1.7068328046180409e-06, + "loss": 0.5923, + "step": 31910 + }, + { + "epoch": 0.82, + "learning_rate": 1.70681323080374e-06, + "loss": 0.8301, + "step": 31911 + }, + { + "epoch": 0.82, + "learning_rate": 1.7067936564482653e-06, + "loss": 0.9619, + "step": 31912 + }, + { + "epoch": 0.82, + "learning_rate": 1.7067740815516304e-06, + "loss": 0.6206, + "step": 31913 + }, + { + "epoch": 0.82, + "learning_rate": 1.7067545061138517e-06, + "loss": 0.8037, + "step": 31914 + }, + { + "epoch": 0.82, + "learning_rate": 1.7067349301349435e-06, + "loss": 0.8223, + "step": 31915 + }, + { + "epoch": 0.82, + "learning_rate": 1.7067153536149207e-06, + "loss": 0.7354, + "step": 31916 + }, + { + "epoch": 0.82, + "learning_rate": 1.7066957765537984e-06, + "loss": 0.8066, + "step": 31917 + }, + { + "epoch": 0.82, + "learning_rate": 1.706676198951592e-06, + "loss": 0.835, + "step": 31918 + }, + { + "epoch": 0.82, + "learning_rate": 1.7066566208083158e-06, + "loss": 0.7285, + "step": 31919 + }, + { + "epoch": 0.82, + "learning_rate": 1.7066370421239853e-06, + "loss": 0.8311, + "step": 31920 + }, + { + "epoch": 0.82, + "learning_rate": 1.706617462898615e-06, + "loss": 0.6943, + "step": 31921 + }, + { + "epoch": 0.82, + "learning_rate": 1.7065978831322205e-06, + "loss": 0.6741, + "step": 31922 + }, + { + "epoch": 0.82, + "learning_rate": 1.7065783028248163e-06, + "loss": 0.6816, + "step": 31923 + }, + { + "epoch": 0.82, + "learning_rate": 1.7065587219764176e-06, + "loss": 0.8574, + "step": 31924 + }, + { + "epoch": 0.82, + "learning_rate": 1.7065391405870396e-06, + "loss": 0.8809, + "step": 31925 + }, + { + "epoch": 0.82, + "learning_rate": 1.706519558656697e-06, + "loss": 0.9375, + "step": 31926 + }, + { + "epoch": 0.82, + "learning_rate": 1.7064999761854045e-06, + "loss": 0.7651, + "step": 31927 + }, + { + "epoch": 0.82, + "learning_rate": 1.7064803931731778e-06, + "loss": 0.5275, + "step": 31928 + }, + { + "epoch": 0.82, + "learning_rate": 1.7064608096200314e-06, + "loss": 0.9512, + "step": 31929 + }, + { + "epoch": 0.82, + "learning_rate": 1.7064412255259806e-06, + "loss": 0.9268, + "step": 31930 + }, + { + "epoch": 0.82, + "learning_rate": 1.7064216408910401e-06, + "loss": 0.7144, + "step": 31931 + }, + { + "epoch": 0.82, + "learning_rate": 1.706402055715225e-06, + "loss": 0.9492, + "step": 31932 + }, + { + "epoch": 0.82, + "learning_rate": 1.7063824699985505e-06, + "loss": 0.7993, + "step": 31933 + }, + { + "epoch": 0.82, + "learning_rate": 1.7063628837410312e-06, + "loss": 0.9697, + "step": 31934 + }, + { + "epoch": 0.82, + "learning_rate": 1.7063432969426827e-06, + "loss": 0.573, + "step": 31935 + }, + { + "epoch": 0.82, + "learning_rate": 1.7063237096035192e-06, + "loss": 0.8057, + "step": 31936 + }, + { + "epoch": 0.82, + "learning_rate": 1.7063041217235564e-06, + "loss": 0.8486, + "step": 31937 + }, + { + "epoch": 0.82, + "learning_rate": 1.7062845333028085e-06, + "loss": 1.0703, + "step": 31938 + }, + { + "epoch": 0.82, + "learning_rate": 1.7062649443412918e-06, + "loss": 0.686, + "step": 31939 + }, + { + "epoch": 0.82, + "learning_rate": 1.70624535483902e-06, + "loss": 0.9316, + "step": 31940 + }, + { + "epoch": 0.82, + "learning_rate": 1.7062257647960087e-06, + "loss": 0.8564, + "step": 31941 + }, + { + "epoch": 0.82, + "learning_rate": 1.7062061742122728e-06, + "loss": 0.6753, + "step": 31942 + }, + { + "epoch": 0.82, + "learning_rate": 1.7061865830878276e-06, + "loss": 1.0469, + "step": 31943 + }, + { + "epoch": 0.82, + "learning_rate": 1.7061669914226875e-06, + "loss": 0.6016, + "step": 31944 + }, + { + "epoch": 0.82, + "learning_rate": 1.7061473992168675e-06, + "loss": 0.7007, + "step": 31945 + }, + { + "epoch": 0.82, + "learning_rate": 1.7061278064703832e-06, + "loss": 0.887, + "step": 31946 + }, + { + "epoch": 0.82, + "learning_rate": 1.7061082131832495e-06, + "loss": 1.042, + "step": 31947 + }, + { + "epoch": 0.82, + "learning_rate": 1.7060886193554808e-06, + "loss": 0.7671, + "step": 31948 + }, + { + "epoch": 0.82, + "learning_rate": 1.706069024987093e-06, + "loss": 0.8135, + "step": 31949 + }, + { + "epoch": 0.82, + "learning_rate": 1.7060494300781003e-06, + "loss": 0.834, + "step": 31950 + }, + { + "epoch": 0.82, + "learning_rate": 1.7060298346285182e-06, + "loss": 0.6138, + "step": 31951 + }, + { + "epoch": 0.82, + "learning_rate": 1.7060102386383614e-06, + "loss": 0.8486, + "step": 31952 + }, + { + "epoch": 0.82, + "learning_rate": 1.7059906421076452e-06, + "loss": 0.8848, + "step": 31953 + }, + { + "epoch": 0.82, + "learning_rate": 1.7059710450363842e-06, + "loss": 0.6306, + "step": 31954 + }, + { + "epoch": 0.82, + "learning_rate": 1.7059514474245935e-06, + "loss": 0.6919, + "step": 31955 + }, + { + "epoch": 0.82, + "learning_rate": 1.7059318492722885e-06, + "loss": 0.9854, + "step": 31956 + }, + { + "epoch": 0.82, + "learning_rate": 1.7059122505794838e-06, + "loss": 0.5931, + "step": 31957 + }, + { + "epoch": 0.82, + "learning_rate": 1.7058926513461946e-06, + "loss": 0.9678, + "step": 31958 + }, + { + "epoch": 0.82, + "learning_rate": 1.705873051572436e-06, + "loss": 0.7949, + "step": 31959 + }, + { + "epoch": 0.82, + "learning_rate": 1.7058534512582227e-06, + "loss": 0.6143, + "step": 31960 + }, + { + "epoch": 0.82, + "learning_rate": 1.70583385040357e-06, + "loss": 0.7241, + "step": 31961 + }, + { + "epoch": 0.82, + "learning_rate": 1.7058142490084925e-06, + "loss": 0.9766, + "step": 31962 + }, + { + "epoch": 0.82, + "learning_rate": 1.7057946470730058e-06, + "loss": 0.7627, + "step": 31963 + }, + { + "epoch": 0.82, + "learning_rate": 1.7057750445971247e-06, + "loss": 0.7812, + "step": 31964 + }, + { + "epoch": 0.82, + "learning_rate": 1.7057554415808637e-06, + "loss": 0.8066, + "step": 31965 + }, + { + "epoch": 0.82, + "learning_rate": 1.7057358380242383e-06, + "loss": 0.7988, + "step": 31966 + }, + { + "epoch": 0.82, + "learning_rate": 1.7057162339272634e-06, + "loss": 0.8359, + "step": 31967 + }, + { + "epoch": 0.82, + "learning_rate": 1.7056966292899542e-06, + "loss": 0.9619, + "step": 31968 + }, + { + "epoch": 0.82, + "learning_rate": 1.7056770241123256e-06, + "loss": 0.8359, + "step": 31969 + }, + { + "epoch": 0.82, + "learning_rate": 1.7056574183943925e-06, + "loss": 0.9531, + "step": 31970 + }, + { + "epoch": 0.82, + "learning_rate": 1.7056378121361696e-06, + "loss": 1.0078, + "step": 31971 + }, + { + "epoch": 0.82, + "learning_rate": 1.7056182053376725e-06, + "loss": 0.8242, + "step": 31972 + }, + { + "epoch": 0.82, + "learning_rate": 1.7055985979989162e-06, + "loss": 0.8359, + "step": 31973 + }, + { + "epoch": 0.82, + "learning_rate": 1.7055789901199153e-06, + "loss": 1.0156, + "step": 31974 + }, + { + "epoch": 0.82, + "learning_rate": 1.705559381700685e-06, + "loss": 0.5875, + "step": 31975 + }, + { + "epoch": 0.82, + "learning_rate": 1.7055397727412403e-06, + "loss": 0.793, + "step": 31976 + }, + { + "epoch": 0.82, + "learning_rate": 1.7055201632415962e-06, + "loss": 0.7822, + "step": 31977 + }, + { + "epoch": 0.82, + "learning_rate": 1.7055005532017681e-06, + "loss": 0.8364, + "step": 31978 + }, + { + "epoch": 0.82, + "learning_rate": 1.7054809426217704e-06, + "loss": 0.6084, + "step": 31979 + }, + { + "epoch": 0.82, + "learning_rate": 1.7054613315016185e-06, + "loss": 0.874, + "step": 31980 + }, + { + "epoch": 0.82, + "learning_rate": 1.705441719841327e-06, + "loss": 1.1133, + "step": 31981 + }, + { + "epoch": 0.82, + "learning_rate": 1.7054221076409113e-06, + "loss": 0.791, + "step": 31982 + }, + { + "epoch": 0.82, + "learning_rate": 1.7054024949003867e-06, + "loss": 0.9355, + "step": 31983 + }, + { + "epoch": 0.82, + "learning_rate": 1.7053828816197675e-06, + "loss": 1.0479, + "step": 31984 + }, + { + "epoch": 0.82, + "learning_rate": 1.7053632677990693e-06, + "loss": 0.9531, + "step": 31985 + }, + { + "epoch": 0.82, + "learning_rate": 1.7053436534383066e-06, + "loss": 0.8037, + "step": 31986 + }, + { + "epoch": 0.82, + "learning_rate": 1.7053240385374947e-06, + "loss": 0.9531, + "step": 31987 + }, + { + "epoch": 0.82, + "learning_rate": 1.7053044230966486e-06, + "loss": 0.7842, + "step": 31988 + }, + { + "epoch": 0.82, + "learning_rate": 1.7052848071157837e-06, + "loss": 1.1133, + "step": 31989 + }, + { + "epoch": 0.82, + "learning_rate": 1.7052651905949144e-06, + "loss": 0.6694, + "step": 31990 + }, + { + "epoch": 0.82, + "learning_rate": 1.7052455735340558e-06, + "loss": 0.7563, + "step": 31991 + }, + { + "epoch": 0.82, + "learning_rate": 1.7052259559332237e-06, + "loss": 0.6404, + "step": 31992 + }, + { + "epoch": 0.82, + "learning_rate": 1.7052063377924317e-06, + "loss": 0.9736, + "step": 31993 + }, + { + "epoch": 0.82, + "learning_rate": 1.7051867191116961e-06, + "loss": 0.7715, + "step": 31994 + }, + { + "epoch": 0.82, + "learning_rate": 1.7051670998910316e-06, + "loss": 0.8408, + "step": 31995 + }, + { + "epoch": 0.82, + "learning_rate": 1.7051474801304529e-06, + "loss": 0.8926, + "step": 31996 + }, + { + "epoch": 0.82, + "learning_rate": 1.7051278598299751e-06, + "loss": 0.7891, + "step": 31997 + }, + { + "epoch": 0.82, + "learning_rate": 1.7051082389896134e-06, + "loss": 1.1318, + "step": 31998 + }, + { + "epoch": 0.82, + "learning_rate": 1.7050886176093827e-06, + "loss": 0.9248, + "step": 31999 + }, + { + "epoch": 0.82, + "learning_rate": 1.7050689956892981e-06, + "loss": 0.8721, + "step": 32000 + }, + { + "epoch": 0.82, + "learning_rate": 1.7050493732293744e-06, + "loss": 0.6841, + "step": 32001 + }, + { + "epoch": 0.82, + "learning_rate": 1.705029750229627e-06, + "loss": 0.79, + "step": 32002 + }, + { + "epoch": 0.82, + "learning_rate": 1.7050101266900706e-06, + "loss": 0.7979, + "step": 32003 + }, + { + "epoch": 0.82, + "learning_rate": 1.7049905026107208e-06, + "loss": 0.9229, + "step": 32004 + }, + { + "epoch": 0.82, + "learning_rate": 1.704970877991592e-06, + "loss": 0.688, + "step": 32005 + }, + { + "epoch": 0.82, + "learning_rate": 1.704951252832699e-06, + "loss": 0.8115, + "step": 32006 + }, + { + "epoch": 0.82, + "learning_rate": 1.7049316271340576e-06, + "loss": 1.0566, + "step": 32007 + }, + { + "epoch": 0.82, + "learning_rate": 1.7049120008956824e-06, + "loss": 1.0635, + "step": 32008 + }, + { + "epoch": 0.82, + "learning_rate": 1.7048923741175888e-06, + "loss": 0.6826, + "step": 32009 + }, + { + "epoch": 0.82, + "learning_rate": 1.704872746799791e-06, + "loss": 0.7827, + "step": 32010 + }, + { + "epoch": 0.82, + "learning_rate": 1.7048531189423048e-06, + "loss": 0.6406, + "step": 32011 + }, + { + "epoch": 0.82, + "learning_rate": 1.704833490545145e-06, + "loss": 0.7168, + "step": 32012 + }, + { + "epoch": 0.82, + "learning_rate": 1.7048138616083265e-06, + "loss": 0.8682, + "step": 32013 + }, + { + "epoch": 0.82, + "learning_rate": 1.7047942321318644e-06, + "loss": 0.728, + "step": 32014 + }, + { + "epoch": 0.82, + "learning_rate": 1.7047746021157741e-06, + "loss": 0.8643, + "step": 32015 + }, + { + "epoch": 0.82, + "learning_rate": 1.70475497156007e-06, + "loss": 0.8672, + "step": 32016 + }, + { + "epoch": 0.82, + "learning_rate": 1.7047353404647672e-06, + "loss": 0.8008, + "step": 32017 + }, + { + "epoch": 0.82, + "learning_rate": 1.7047157088298814e-06, + "loss": 0.8696, + "step": 32018 + }, + { + "epoch": 0.82, + "learning_rate": 1.704696076655427e-06, + "loss": 0.7451, + "step": 32019 + }, + { + "epoch": 0.82, + "learning_rate": 1.7046764439414193e-06, + "loss": 0.834, + "step": 32020 + }, + { + "epoch": 0.82, + "learning_rate": 1.7046568106878731e-06, + "loss": 0.7339, + "step": 32021 + }, + { + "epoch": 0.82, + "learning_rate": 1.7046371768948036e-06, + "loss": 0.7729, + "step": 32022 + }, + { + "epoch": 0.82, + "learning_rate": 1.704617542562226e-06, + "loss": 0.8945, + "step": 32023 + }, + { + "epoch": 0.82, + "learning_rate": 1.704597907690155e-06, + "loss": 0.9033, + "step": 32024 + }, + { + "epoch": 0.82, + "learning_rate": 1.7045782722786058e-06, + "loss": 0.8525, + "step": 32025 + }, + { + "epoch": 0.82, + "learning_rate": 1.7045586363275932e-06, + "loss": 0.7744, + "step": 32026 + }, + { + "epoch": 0.82, + "learning_rate": 1.7045389998371327e-06, + "loss": 0.8545, + "step": 32027 + }, + { + "epoch": 0.82, + "learning_rate": 1.704519362807239e-06, + "loss": 1.0, + "step": 32028 + }, + { + "epoch": 0.82, + "learning_rate": 1.7044997252379274e-06, + "loss": 0.9346, + "step": 32029 + }, + { + "epoch": 0.82, + "learning_rate": 1.7044800871292124e-06, + "loss": 0.77, + "step": 32030 + }, + { + "epoch": 0.82, + "learning_rate": 1.7044604484811099e-06, + "loss": 0.6118, + "step": 32031 + }, + { + "epoch": 0.82, + "learning_rate": 1.704440809293634e-06, + "loss": 0.874, + "step": 32032 + }, + { + "epoch": 0.82, + "learning_rate": 1.7044211695668003e-06, + "loss": 0.9951, + "step": 32033 + }, + { + "epoch": 0.82, + "learning_rate": 1.7044015293006237e-06, + "loss": 0.7725, + "step": 32034 + }, + { + "epoch": 0.82, + "learning_rate": 1.7043818884951192e-06, + "loss": 0.7949, + "step": 32035 + }, + { + "epoch": 0.82, + "learning_rate": 1.704362247150302e-06, + "loss": 0.9785, + "step": 32036 + }, + { + "epoch": 0.82, + "learning_rate": 1.7043426052661869e-06, + "loss": 0.7197, + "step": 32037 + }, + { + "epoch": 0.82, + "learning_rate": 1.7043229628427889e-06, + "loss": 0.9346, + "step": 32038 + }, + { + "epoch": 0.82, + "learning_rate": 1.7043033198801236e-06, + "loss": 0.7637, + "step": 32039 + }, + { + "epoch": 0.82, + "learning_rate": 1.7042836763782053e-06, + "loss": 0.8779, + "step": 32040 + }, + { + "epoch": 0.82, + "learning_rate": 1.7042640323370496e-06, + "loss": 0.71, + "step": 32041 + }, + { + "epoch": 0.82, + "learning_rate": 1.7042443877566712e-06, + "loss": 0.55, + "step": 32042 + }, + { + "epoch": 0.82, + "learning_rate": 1.7042247426370851e-06, + "loss": 0.8516, + "step": 32043 + }, + { + "epoch": 0.82, + "learning_rate": 1.7042050969783065e-06, + "loss": 0.8301, + "step": 32044 + }, + { + "epoch": 0.82, + "learning_rate": 1.7041854507803506e-06, + "loss": 0.9688, + "step": 32045 + }, + { + "epoch": 0.82, + "learning_rate": 1.7041658040432325e-06, + "loss": 0.8345, + "step": 32046 + }, + { + "epoch": 0.82, + "learning_rate": 1.7041461567669666e-06, + "loss": 0.9609, + "step": 32047 + }, + { + "epoch": 0.82, + "learning_rate": 1.7041265089515688e-06, + "loss": 0.835, + "step": 32048 + }, + { + "epoch": 0.82, + "learning_rate": 1.7041068605970534e-06, + "loss": 0.6689, + "step": 32049 + }, + { + "epoch": 0.82, + "learning_rate": 1.7040872117034357e-06, + "loss": 0.835, + "step": 32050 + }, + { + "epoch": 0.82, + "learning_rate": 1.704067562270731e-06, + "loss": 0.7905, + "step": 32051 + }, + { + "epoch": 0.82, + "learning_rate": 1.7040479122989538e-06, + "loss": 0.8447, + "step": 32052 + }, + { + "epoch": 0.82, + "learning_rate": 1.7040282617881201e-06, + "loss": 0.8638, + "step": 32053 + }, + { + "epoch": 0.82, + "learning_rate": 1.7040086107382439e-06, + "loss": 0.7334, + "step": 32054 + }, + { + "epoch": 0.82, + "learning_rate": 1.7039889591493406e-06, + "loss": 0.9648, + "step": 32055 + }, + { + "epoch": 0.82, + "learning_rate": 1.7039693070214253e-06, + "loss": 0.835, + "step": 32056 + }, + { + "epoch": 0.82, + "learning_rate": 1.7039496543545134e-06, + "loss": 0.8936, + "step": 32057 + }, + { + "epoch": 0.82, + "learning_rate": 1.7039300011486195e-06, + "loss": 0.6211, + "step": 32058 + }, + { + "epoch": 0.82, + "learning_rate": 1.7039103474037586e-06, + "loss": 0.8838, + "step": 32059 + }, + { + "epoch": 0.82, + "learning_rate": 1.7038906931199461e-06, + "loss": 0.7476, + "step": 32060 + }, + { + "epoch": 0.82, + "learning_rate": 1.7038710382971968e-06, + "loss": 0.8726, + "step": 32061 + }, + { + "epoch": 0.82, + "learning_rate": 1.7038513829355256e-06, + "loss": 0.8408, + "step": 32062 + }, + { + "epoch": 0.82, + "learning_rate": 1.7038317270349483e-06, + "loss": 0.9023, + "step": 32063 + }, + { + "epoch": 0.82, + "learning_rate": 1.7038120705954788e-06, + "loss": 0.7056, + "step": 32064 + }, + { + "epoch": 0.82, + "learning_rate": 1.7037924136171332e-06, + "loss": 0.791, + "step": 32065 + }, + { + "epoch": 0.82, + "learning_rate": 1.703772756099926e-06, + "loss": 1.0332, + "step": 32066 + }, + { + "epoch": 0.82, + "learning_rate": 1.703753098043872e-06, + "loss": 1.1289, + "step": 32067 + }, + { + "epoch": 0.82, + "learning_rate": 1.7037334394489871e-06, + "loss": 0.54, + "step": 32068 + }, + { + "epoch": 0.82, + "learning_rate": 1.7037137803152857e-06, + "loss": 0.6609, + "step": 32069 + }, + { + "epoch": 0.82, + "learning_rate": 1.7036941206427828e-06, + "loss": 0.7283, + "step": 32070 + }, + { + "epoch": 0.82, + "learning_rate": 1.703674460431494e-06, + "loss": 0.8408, + "step": 32071 + }, + { + "epoch": 0.82, + "learning_rate": 1.703654799681434e-06, + "loss": 0.8613, + "step": 32072 + }, + { + "epoch": 0.82, + "learning_rate": 1.7036351383926178e-06, + "loss": 0.9185, + "step": 32073 + }, + { + "epoch": 0.82, + "learning_rate": 1.7036154765650602e-06, + "loss": 0.9775, + "step": 32074 + }, + { + "epoch": 0.82, + "learning_rate": 1.7035958141987772e-06, + "loss": 0.6895, + "step": 32075 + }, + { + "epoch": 0.82, + "learning_rate": 1.7035761512937827e-06, + "loss": 0.8779, + "step": 32076 + }, + { + "epoch": 0.82, + "learning_rate": 1.7035564878500925e-06, + "loss": 0.6382, + "step": 32077 + }, + { + "epoch": 0.82, + "learning_rate": 1.7035368238677217e-06, + "loss": 0.8633, + "step": 32078 + }, + { + "epoch": 0.82, + "learning_rate": 1.7035171593466848e-06, + "loss": 0.9658, + "step": 32079 + }, + { + "epoch": 0.82, + "learning_rate": 1.703497494286997e-06, + "loss": 0.9922, + "step": 32080 + }, + { + "epoch": 0.82, + "learning_rate": 1.703477828688674e-06, + "loss": 0.8525, + "step": 32081 + }, + { + "epoch": 0.82, + "learning_rate": 1.7034581625517299e-06, + "loss": 1.0098, + "step": 32082 + }, + { + "epoch": 0.82, + "learning_rate": 1.7034384958761805e-06, + "loss": 0.7983, + "step": 32083 + }, + { + "epoch": 0.82, + "learning_rate": 1.7034188286620403e-06, + "loss": 0.9951, + "step": 32084 + }, + { + "epoch": 0.82, + "learning_rate": 1.703399160909325e-06, + "loss": 1.0908, + "step": 32085 + }, + { + "epoch": 0.82, + "learning_rate": 1.7033794926180495e-06, + "loss": 0.79, + "step": 32086 + }, + { + "epoch": 0.82, + "learning_rate": 1.703359823788228e-06, + "loss": 0.7207, + "step": 32087 + }, + { + "epoch": 0.82, + "learning_rate": 1.7033401544198766e-06, + "loss": 0.9092, + "step": 32088 + }, + { + "epoch": 0.82, + "learning_rate": 1.70332048451301e-06, + "loss": 0.8906, + "step": 32089 + }, + { + "epoch": 0.82, + "learning_rate": 1.703300814067643e-06, + "loss": 0.668, + "step": 32090 + }, + { + "epoch": 0.82, + "learning_rate": 1.7032811430837912e-06, + "loss": 0.8081, + "step": 32091 + }, + { + "epoch": 0.82, + "learning_rate": 1.7032614715614693e-06, + "loss": 0.9651, + "step": 32092 + }, + { + "epoch": 0.82, + "learning_rate": 1.7032417995006926e-06, + "loss": 0.6914, + "step": 32093 + }, + { + "epoch": 0.82, + "learning_rate": 1.7032221269014756e-06, + "loss": 1.0498, + "step": 32094 + }, + { + "epoch": 0.82, + "learning_rate": 1.7032024537638342e-06, + "loss": 0.9326, + "step": 32095 + }, + { + "epoch": 0.82, + "learning_rate": 1.7031827800877825e-06, + "loss": 0.7827, + "step": 32096 + }, + { + "epoch": 0.82, + "learning_rate": 1.7031631058733362e-06, + "loss": 1.2617, + "step": 32097 + }, + { + "epoch": 0.82, + "learning_rate": 1.7031434311205107e-06, + "loss": 0.9619, + "step": 32098 + }, + { + "epoch": 0.82, + "learning_rate": 1.7031237558293201e-06, + "loss": 0.7256, + "step": 32099 + }, + { + "epoch": 0.82, + "learning_rate": 1.7031040799997802e-06, + "loss": 0.8428, + "step": 32100 + }, + { + "epoch": 0.82, + "learning_rate": 1.7030844036319055e-06, + "loss": 0.9209, + "step": 32101 + }, + { + "epoch": 0.82, + "learning_rate": 1.703064726725712e-06, + "loss": 0.8125, + "step": 32102 + }, + { + "epoch": 0.82, + "learning_rate": 1.7030450492812138e-06, + "loss": 0.6917, + "step": 32103 + }, + { + "epoch": 0.82, + "learning_rate": 1.7030253712984263e-06, + "loss": 0.5117, + "step": 32104 + }, + { + "epoch": 0.82, + "learning_rate": 1.7030056927773648e-06, + "loss": 0.8125, + "step": 32105 + }, + { + "epoch": 0.82, + "learning_rate": 1.702986013718044e-06, + "loss": 0.623, + "step": 32106 + }, + { + "epoch": 0.82, + "learning_rate": 1.702966334120479e-06, + "loss": 0.9131, + "step": 32107 + }, + { + "epoch": 0.82, + "learning_rate": 1.7029466539846853e-06, + "loss": 0.8147, + "step": 32108 + }, + { + "epoch": 0.82, + "learning_rate": 1.7029269733106774e-06, + "loss": 0.958, + "step": 32109 + }, + { + "epoch": 0.82, + "learning_rate": 1.7029072920984708e-06, + "loss": 0.9932, + "step": 32110 + }, + { + "epoch": 0.82, + "learning_rate": 1.7028876103480805e-06, + "loss": 0.7432, + "step": 32111 + }, + { + "epoch": 0.82, + "learning_rate": 1.7028679280595216e-06, + "loss": 0.8115, + "step": 32112 + }, + { + "epoch": 0.82, + "learning_rate": 1.7028482452328087e-06, + "loss": 0.8496, + "step": 32113 + }, + { + "epoch": 0.82, + "learning_rate": 1.7028285618679574e-06, + "loss": 0.9688, + "step": 32114 + }, + { + "epoch": 0.82, + "learning_rate": 1.7028088779649824e-06, + "loss": 0.8296, + "step": 32115 + }, + { + "epoch": 0.82, + "learning_rate": 1.702789193523899e-06, + "loss": 0.5969, + "step": 32116 + }, + { + "epoch": 0.82, + "learning_rate": 1.7027695085447224e-06, + "loss": 1.0039, + "step": 32117 + }, + { + "epoch": 0.82, + "learning_rate": 1.7027498230274676e-06, + "loss": 0.7275, + "step": 32118 + }, + { + "epoch": 0.82, + "learning_rate": 1.7027301369721493e-06, + "loss": 0.8086, + "step": 32119 + }, + { + "epoch": 0.82, + "learning_rate": 1.7027104503787828e-06, + "loss": 0.9043, + "step": 32120 + }, + { + "epoch": 0.82, + "learning_rate": 1.7026907632473835e-06, + "loss": 0.8262, + "step": 32121 + }, + { + "epoch": 0.82, + "learning_rate": 1.7026710755779662e-06, + "loss": 0.7026, + "step": 32122 + }, + { + "epoch": 0.82, + "learning_rate": 1.7026513873705458e-06, + "loss": 0.8662, + "step": 32123 + }, + { + "epoch": 0.82, + "learning_rate": 1.7026316986251374e-06, + "loss": 0.9648, + "step": 32124 + }, + { + "epoch": 0.82, + "learning_rate": 1.7026120093417565e-06, + "loss": 0.8867, + "step": 32125 + }, + { + "epoch": 0.82, + "learning_rate": 1.7025923195204177e-06, + "loss": 0.6958, + "step": 32126 + }, + { + "epoch": 0.82, + "learning_rate": 1.702572629161136e-06, + "loss": 0.959, + "step": 32127 + }, + { + "epoch": 0.82, + "learning_rate": 1.7025529382639272e-06, + "loss": 0.8506, + "step": 32128 + }, + { + "epoch": 0.82, + "learning_rate": 1.702533246828806e-06, + "loss": 0.8955, + "step": 32129 + }, + { + "epoch": 0.82, + "learning_rate": 1.702513554855787e-06, + "loss": 0.6958, + "step": 32130 + }, + { + "epoch": 0.82, + "learning_rate": 1.7024938623448862e-06, + "loss": 0.9521, + "step": 32131 + }, + { + "epoch": 0.82, + "learning_rate": 1.7024741692961174e-06, + "loss": 0.918, + "step": 32132 + }, + { + "epoch": 0.82, + "learning_rate": 1.702454475709497e-06, + "loss": 0.7754, + "step": 32133 + }, + { + "epoch": 0.82, + "learning_rate": 1.7024347815850396e-06, + "loss": 0.6245, + "step": 32134 + }, + { + "epoch": 0.82, + "learning_rate": 1.70241508692276e-06, + "loss": 0.7939, + "step": 32135 + }, + { + "epoch": 0.82, + "learning_rate": 1.702395391722673e-06, + "loss": 0.6794, + "step": 32136 + }, + { + "epoch": 0.82, + "learning_rate": 1.7023756959847946e-06, + "loss": 0.7188, + "step": 32137 + }, + { + "epoch": 0.82, + "learning_rate": 1.7023559997091395e-06, + "loss": 0.7832, + "step": 32138 + }, + { + "epoch": 0.82, + "learning_rate": 1.7023363028957225e-06, + "loss": 0.8584, + "step": 32139 + }, + { + "epoch": 0.82, + "learning_rate": 1.702316605544559e-06, + "loss": 0.957, + "step": 32140 + }, + { + "epoch": 0.82, + "learning_rate": 1.702296907655664e-06, + "loss": 0.7002, + "step": 32141 + }, + { + "epoch": 0.82, + "learning_rate": 1.7022772092290523e-06, + "loss": 0.9004, + "step": 32142 + }, + { + "epoch": 0.82, + "learning_rate": 1.7022575102647395e-06, + "loss": 0.6733, + "step": 32143 + }, + { + "epoch": 0.82, + "learning_rate": 1.7022378107627404e-06, + "loss": 0.7734, + "step": 32144 + }, + { + "epoch": 0.82, + "learning_rate": 1.70221811072307e-06, + "loss": 0.8252, + "step": 32145 + }, + { + "epoch": 0.82, + "learning_rate": 1.7021984101457436e-06, + "loss": 0.801, + "step": 32146 + }, + { + "epoch": 0.82, + "learning_rate": 1.702178709030776e-06, + "loss": 0.627, + "step": 32147 + }, + { + "epoch": 0.82, + "learning_rate": 1.7021590073781827e-06, + "loss": 0.9365, + "step": 32148 + }, + { + "epoch": 0.82, + "learning_rate": 1.7021393051879781e-06, + "loss": 0.96, + "step": 32149 + }, + { + "epoch": 0.82, + "learning_rate": 1.7021196024601781e-06, + "loss": 0.8516, + "step": 32150 + }, + { + "epoch": 0.82, + "learning_rate": 1.7020998991947972e-06, + "loss": 0.8809, + "step": 32151 + }, + { + "epoch": 0.82, + "learning_rate": 1.7020801953918506e-06, + "loss": 0.6533, + "step": 32152 + }, + { + "epoch": 0.82, + "learning_rate": 1.7020604910513538e-06, + "loss": 0.8193, + "step": 32153 + }, + { + "epoch": 0.82, + "learning_rate": 1.7020407861733215e-06, + "loss": 0.7256, + "step": 32154 + }, + { + "epoch": 0.82, + "learning_rate": 1.7020210807577686e-06, + "loss": 0.96, + "step": 32155 + }, + { + "epoch": 0.82, + "learning_rate": 1.7020013748047108e-06, + "loss": 0.5815, + "step": 32156 + }, + { + "epoch": 0.82, + "learning_rate": 1.7019816683141626e-06, + "loss": 0.8076, + "step": 32157 + }, + { + "epoch": 0.82, + "learning_rate": 1.7019619612861393e-06, + "loss": 0.8535, + "step": 32158 + }, + { + "epoch": 0.82, + "learning_rate": 1.7019422537206563e-06, + "loss": 0.9414, + "step": 32159 + }, + { + "epoch": 0.82, + "learning_rate": 1.701922545617728e-06, + "loss": 0.8701, + "step": 32160 + }, + { + "epoch": 0.82, + "learning_rate": 1.70190283697737e-06, + "loss": 0.7041, + "step": 32161 + }, + { + "epoch": 0.82, + "learning_rate": 1.701883127799597e-06, + "loss": 0.9775, + "step": 32162 + }, + { + "epoch": 0.82, + "learning_rate": 1.701863418084425e-06, + "loss": 0.7129, + "step": 32163 + }, + { + "epoch": 0.82, + "learning_rate": 1.7018437078318679e-06, + "loss": 0.9688, + "step": 32164 + }, + { + "epoch": 0.82, + "learning_rate": 1.7018239970419418e-06, + "loss": 1.0107, + "step": 32165 + }, + { + "epoch": 0.82, + "learning_rate": 1.701804285714661e-06, + "loss": 0.8535, + "step": 32166 + }, + { + "epoch": 0.82, + "learning_rate": 1.701784573850041e-06, + "loss": 0.7676, + "step": 32167 + }, + { + "epoch": 0.82, + "learning_rate": 1.701764861448097e-06, + "loss": 0.7134, + "step": 32168 + }, + { + "epoch": 0.82, + "learning_rate": 1.7017451485088436e-06, + "loss": 0.7998, + "step": 32169 + }, + { + "epoch": 0.82, + "learning_rate": 1.7017254350322965e-06, + "loss": 0.7646, + "step": 32170 + }, + { + "epoch": 0.82, + "learning_rate": 1.7017057210184702e-06, + "loss": 0.8037, + "step": 32171 + }, + { + "epoch": 0.82, + "learning_rate": 1.7016860064673803e-06, + "loss": 0.9111, + "step": 32172 + }, + { + "epoch": 0.82, + "learning_rate": 1.7016662913790417e-06, + "loss": 0.7803, + "step": 32173 + }, + { + "epoch": 0.82, + "learning_rate": 1.7016465757534695e-06, + "loss": 0.8398, + "step": 32174 + }, + { + "epoch": 0.82, + "learning_rate": 1.7016268595906787e-06, + "loss": 1.1387, + "step": 32175 + }, + { + "epoch": 0.82, + "learning_rate": 1.7016071428906844e-06, + "loss": 0.9141, + "step": 32176 + }, + { + "epoch": 0.82, + "learning_rate": 1.7015874256535018e-06, + "loss": 0.9922, + "step": 32177 + }, + { + "epoch": 0.82, + "learning_rate": 1.701567707879146e-06, + "loss": 0.9766, + "step": 32178 + }, + { + "epoch": 0.82, + "learning_rate": 1.7015479895676322e-06, + "loss": 0.6973, + "step": 32179 + }, + { + "epoch": 0.82, + "learning_rate": 1.7015282707189753e-06, + "loss": 0.8599, + "step": 32180 + }, + { + "epoch": 0.82, + "learning_rate": 1.70150855133319e-06, + "loss": 0.7964, + "step": 32181 + }, + { + "epoch": 0.82, + "learning_rate": 1.7014888314102923e-06, + "loss": 0.9727, + "step": 32182 + }, + { + "epoch": 0.82, + "learning_rate": 1.7014691109502972e-06, + "loss": 0.8164, + "step": 32183 + }, + { + "epoch": 0.82, + "learning_rate": 1.701449389953219e-06, + "loss": 0.6577, + "step": 32184 + }, + { + "epoch": 0.82, + "learning_rate": 1.7014296684190733e-06, + "loss": 0.9092, + "step": 32185 + }, + { + "epoch": 0.82, + "learning_rate": 1.701409946347875e-06, + "loss": 0.7754, + "step": 32186 + }, + { + "epoch": 0.82, + "learning_rate": 1.7013902237396397e-06, + "loss": 0.9316, + "step": 32187 + }, + { + "epoch": 0.82, + "learning_rate": 1.7013705005943821e-06, + "loss": 0.6982, + "step": 32188 + }, + { + "epoch": 0.83, + "learning_rate": 1.7013507769121174e-06, + "loss": 0.7837, + "step": 32189 + }, + { + "epoch": 0.83, + "learning_rate": 1.7013310526928604e-06, + "loss": 1.1074, + "step": 32190 + }, + { + "epoch": 0.83, + "learning_rate": 1.7013113279366266e-06, + "loss": 0.8149, + "step": 32191 + }, + { + "epoch": 0.83, + "learning_rate": 1.701291602643431e-06, + "loss": 1.1914, + "step": 32192 + }, + { + "epoch": 0.83, + "learning_rate": 1.7012718768132886e-06, + "loss": 0.627, + "step": 32193 + }, + { + "epoch": 0.83, + "learning_rate": 1.7012521504462146e-06, + "loss": 0.8379, + "step": 32194 + }, + { + "epoch": 0.83, + "learning_rate": 1.701232423542224e-06, + "loss": 0.8428, + "step": 32195 + }, + { + "epoch": 0.83, + "learning_rate": 1.701212696101332e-06, + "loss": 1.0283, + "step": 32196 + }, + { + "epoch": 0.83, + "learning_rate": 1.7011929681235538e-06, + "loss": 0.6528, + "step": 32197 + }, + { + "epoch": 0.83, + "learning_rate": 1.7011732396089042e-06, + "loss": 0.8926, + "step": 32198 + }, + { + "epoch": 0.83, + "learning_rate": 1.7011535105573985e-06, + "loss": 0.9136, + "step": 32199 + }, + { + "epoch": 0.83, + "learning_rate": 1.7011337809690521e-06, + "loss": 0.9688, + "step": 32200 + }, + { + "epoch": 0.83, + "learning_rate": 1.7011140508438793e-06, + "loss": 0.8379, + "step": 32201 + }, + { + "epoch": 0.83, + "learning_rate": 1.7010943201818961e-06, + "loss": 0.7153, + "step": 32202 + }, + { + "epoch": 0.83, + "learning_rate": 1.7010745889831173e-06, + "loss": 0.998, + "step": 32203 + }, + { + "epoch": 0.83, + "learning_rate": 1.7010548572475578e-06, + "loss": 0.9932, + "step": 32204 + }, + { + "epoch": 0.83, + "learning_rate": 1.7010351249752327e-06, + "loss": 0.9551, + "step": 32205 + }, + { + "epoch": 0.83, + "learning_rate": 1.7010153921661572e-06, + "loss": 0.8633, + "step": 32206 + }, + { + "epoch": 0.83, + "learning_rate": 1.7009956588203466e-06, + "loss": 1.1104, + "step": 32207 + }, + { + "epoch": 0.83, + "learning_rate": 1.7009759249378156e-06, + "loss": 0.875, + "step": 32208 + }, + { + "epoch": 0.83, + "learning_rate": 1.70095619051858e-06, + "loss": 0.6794, + "step": 32209 + }, + { + "epoch": 0.83, + "learning_rate": 1.7009364555626542e-06, + "loss": 0.7539, + "step": 32210 + }, + { + "epoch": 0.83, + "learning_rate": 1.7009167200700536e-06, + "loss": 0.9209, + "step": 32211 + }, + { + "epoch": 0.83, + "learning_rate": 1.7008969840407935e-06, + "loss": 0.7036, + "step": 32212 + }, + { + "epoch": 0.83, + "learning_rate": 1.7008772474748886e-06, + "loss": 0.6338, + "step": 32213 + }, + { + "epoch": 0.83, + "learning_rate": 1.7008575103723541e-06, + "loss": 0.7097, + "step": 32214 + }, + { + "epoch": 0.83, + "learning_rate": 1.7008377727332056e-06, + "loss": 0.5322, + "step": 32215 + }, + { + "epoch": 0.83, + "learning_rate": 1.7008180345574577e-06, + "loss": 0.8844, + "step": 32216 + }, + { + "epoch": 0.83, + "learning_rate": 1.7007982958451254e-06, + "loss": 1.0, + "step": 32217 + }, + { + "epoch": 0.83, + "learning_rate": 1.7007785565962242e-06, + "loss": 0.8975, + "step": 32218 + }, + { + "epoch": 0.83, + "learning_rate": 1.7007588168107691e-06, + "loss": 0.75, + "step": 32219 + }, + { + "epoch": 0.83, + "learning_rate": 1.7007390764887752e-06, + "loss": 0.7549, + "step": 32220 + }, + { + "epoch": 0.83, + "learning_rate": 1.7007193356302578e-06, + "loss": 0.7114, + "step": 32221 + }, + { + "epoch": 0.83, + "learning_rate": 1.7006995942352317e-06, + "loss": 0.6616, + "step": 32222 + }, + { + "epoch": 0.83, + "learning_rate": 1.700679852303712e-06, + "loss": 0.8447, + "step": 32223 + }, + { + "epoch": 0.83, + "learning_rate": 1.7006601098357144e-06, + "loss": 1.1289, + "step": 32224 + }, + { + "epoch": 0.83, + "learning_rate": 1.700640366831253e-06, + "loss": 0.7959, + "step": 32225 + }, + { + "epoch": 0.83, + "learning_rate": 1.7006206232903437e-06, + "loss": 0.7192, + "step": 32226 + }, + { + "epoch": 0.83, + "learning_rate": 1.7006008792130014e-06, + "loss": 0.917, + "step": 32227 + }, + { + "epoch": 0.83, + "learning_rate": 1.7005811345992415e-06, + "loss": 1.0361, + "step": 32228 + }, + { + "epoch": 0.83, + "learning_rate": 1.7005613894490785e-06, + "loss": 0.6829, + "step": 32229 + }, + { + "epoch": 0.83, + "learning_rate": 1.700541643762528e-06, + "loss": 0.7236, + "step": 32230 + }, + { + "epoch": 0.83, + "learning_rate": 1.7005218975396049e-06, + "loss": 0.7773, + "step": 32231 + }, + { + "epoch": 0.83, + "learning_rate": 1.7005021507803243e-06, + "loss": 0.8599, + "step": 32232 + }, + { + "epoch": 0.83, + "learning_rate": 1.7004824034847016e-06, + "loss": 1.0938, + "step": 32233 + }, + { + "epoch": 0.83, + "learning_rate": 1.7004626556527518e-06, + "loss": 0.7676, + "step": 32234 + }, + { + "epoch": 0.83, + "learning_rate": 1.7004429072844897e-06, + "loss": 0.6851, + "step": 32235 + }, + { + "epoch": 0.83, + "learning_rate": 1.7004231583799307e-06, + "loss": 0.7417, + "step": 32236 + }, + { + "epoch": 0.83, + "learning_rate": 1.7004034089390901e-06, + "loss": 0.835, + "step": 32237 + }, + { + "epoch": 0.83, + "learning_rate": 1.7003836589619826e-06, + "loss": 0.7705, + "step": 32238 + }, + { + "epoch": 0.83, + "learning_rate": 1.7003639084486236e-06, + "loss": 0.8604, + "step": 32239 + }, + { + "epoch": 0.83, + "learning_rate": 1.7003441573990282e-06, + "loss": 1.0645, + "step": 32240 + }, + { + "epoch": 0.83, + "learning_rate": 1.7003244058132115e-06, + "loss": 0.8701, + "step": 32241 + }, + { + "epoch": 0.83, + "learning_rate": 1.7003046536911887e-06, + "loss": 0.6855, + "step": 32242 + }, + { + "epoch": 0.83, + "learning_rate": 1.7002849010329748e-06, + "loss": 0.7651, + "step": 32243 + }, + { + "epoch": 0.83, + "learning_rate": 1.7002651478385848e-06, + "loss": 0.7793, + "step": 32244 + }, + { + "epoch": 0.83, + "learning_rate": 1.700245394108034e-06, + "loss": 0.7725, + "step": 32245 + }, + { + "epoch": 0.83, + "learning_rate": 1.7002256398413375e-06, + "loss": 0.8887, + "step": 32246 + }, + { + "epoch": 0.83, + "learning_rate": 1.7002058850385105e-06, + "loss": 0.9199, + "step": 32247 + }, + { + "epoch": 0.83, + "learning_rate": 1.700186129699568e-06, + "loss": 0.8467, + "step": 32248 + }, + { + "epoch": 0.83, + "learning_rate": 1.7001663738245253e-06, + "loss": 0.9678, + "step": 32249 + }, + { + "epoch": 0.83, + "learning_rate": 1.7001466174133972e-06, + "loss": 0.9092, + "step": 32250 + }, + { + "epoch": 0.83, + "learning_rate": 1.7001268604661992e-06, + "loss": 0.7993, + "step": 32251 + }, + { + "epoch": 0.83, + "learning_rate": 1.700107102982946e-06, + "loss": 0.7163, + "step": 32252 + }, + { + "epoch": 0.83, + "learning_rate": 1.7000873449636532e-06, + "loss": 0.9531, + "step": 32253 + }, + { + "epoch": 0.83, + "learning_rate": 1.7000675864083357e-06, + "loss": 0.8521, + "step": 32254 + }, + { + "epoch": 0.83, + "learning_rate": 1.7000478273170086e-06, + "loss": 1.0391, + "step": 32255 + }, + { + "epoch": 0.83, + "learning_rate": 1.700028067689687e-06, + "loss": 0.7715, + "step": 32256 + }, + { + "epoch": 0.83, + "learning_rate": 1.700008307526386e-06, + "loss": 0.688, + "step": 32257 + }, + { + "epoch": 0.83, + "learning_rate": 1.699988546827121e-06, + "loss": 0.8975, + "step": 32258 + }, + { + "epoch": 0.83, + "learning_rate": 1.6999687855919072e-06, + "loss": 0.541, + "step": 32259 + }, + { + "epoch": 0.83, + "learning_rate": 1.6999490238207591e-06, + "loss": 0.9619, + "step": 32260 + }, + { + "epoch": 0.83, + "learning_rate": 1.6999292615136924e-06, + "loss": 0.8457, + "step": 32261 + }, + { + "epoch": 0.83, + "learning_rate": 1.699909498670722e-06, + "loss": 0.593, + "step": 32262 + }, + { + "epoch": 0.83, + "learning_rate": 1.6998897352918632e-06, + "loss": 0.8691, + "step": 32263 + }, + { + "epoch": 0.83, + "learning_rate": 1.6998699713771307e-06, + "loss": 0.7422, + "step": 32264 + }, + { + "epoch": 0.83, + "learning_rate": 1.6998502069265404e-06, + "loss": 0.9219, + "step": 32265 + }, + { + "epoch": 0.83, + "learning_rate": 1.6998304419401066e-06, + "loss": 0.6094, + "step": 32266 + }, + { + "epoch": 0.83, + "learning_rate": 1.699810676417845e-06, + "loss": 0.8804, + "step": 32267 + }, + { + "epoch": 0.83, + "learning_rate": 1.6997909103597703e-06, + "loss": 0.9307, + "step": 32268 + }, + { + "epoch": 0.83, + "learning_rate": 1.699771143765898e-06, + "loss": 0.9756, + "step": 32269 + }, + { + "epoch": 0.83, + "learning_rate": 1.6997513766362433e-06, + "loss": 0.8477, + "step": 32270 + }, + { + "epoch": 0.83, + "learning_rate": 1.699731608970821e-06, + "loss": 0.7915, + "step": 32271 + }, + { + "epoch": 0.83, + "learning_rate": 1.6997118407696463e-06, + "loss": 1.0957, + "step": 32272 + }, + { + "epoch": 0.83, + "learning_rate": 1.6996920720327345e-06, + "loss": 0.7051, + "step": 32273 + }, + { + "epoch": 0.83, + "learning_rate": 1.6996723027601008e-06, + "loss": 0.8506, + "step": 32274 + }, + { + "epoch": 0.83, + "learning_rate": 1.6996525329517599e-06, + "loss": 0.7861, + "step": 32275 + }, + { + "epoch": 0.83, + "learning_rate": 1.6996327626077273e-06, + "loss": 0.6855, + "step": 32276 + }, + { + "epoch": 0.83, + "learning_rate": 1.6996129917280183e-06, + "loss": 0.8545, + "step": 32277 + }, + { + "epoch": 0.83, + "learning_rate": 1.6995932203126477e-06, + "loss": 1.0879, + "step": 32278 + }, + { + "epoch": 0.83, + "learning_rate": 1.6995734483616306e-06, + "loss": 0.6411, + "step": 32279 + }, + { + "epoch": 0.83, + "learning_rate": 1.6995536758749825e-06, + "loss": 0.6772, + "step": 32280 + }, + { + "epoch": 0.83, + "learning_rate": 1.699533902852718e-06, + "loss": 0.7695, + "step": 32281 + }, + { + "epoch": 0.83, + "learning_rate": 1.6995141292948527e-06, + "loss": 0.9795, + "step": 32282 + }, + { + "epoch": 0.83, + "learning_rate": 1.6994943552014015e-06, + "loss": 0.791, + "step": 32283 + }, + { + "epoch": 0.83, + "learning_rate": 1.6994745805723799e-06, + "loss": 0.8457, + "step": 32284 + }, + { + "epoch": 0.83, + "learning_rate": 1.6994548054078026e-06, + "loss": 0.835, + "step": 32285 + }, + { + "epoch": 0.83, + "learning_rate": 1.699435029707685e-06, + "loss": 0.9463, + "step": 32286 + }, + { + "epoch": 0.83, + "learning_rate": 1.699415253472042e-06, + "loss": 0.9951, + "step": 32287 + }, + { + "epoch": 0.83, + "learning_rate": 1.6993954767008891e-06, + "loss": 0.7285, + "step": 32288 + }, + { + "epoch": 0.83, + "learning_rate": 1.699375699394241e-06, + "loss": 0.7822, + "step": 32289 + }, + { + "epoch": 0.83, + "learning_rate": 1.6993559215521133e-06, + "loss": 0.8252, + "step": 32290 + }, + { + "epoch": 0.83, + "learning_rate": 1.6993361431745209e-06, + "loss": 0.542, + "step": 32291 + }, + { + "epoch": 0.83, + "learning_rate": 1.6993163642614787e-06, + "loss": 0.8301, + "step": 32292 + }, + { + "epoch": 0.83, + "learning_rate": 1.6992965848130028e-06, + "loss": 0.6802, + "step": 32293 + }, + { + "epoch": 0.83, + "learning_rate": 1.699276804829107e-06, + "loss": 0.875, + "step": 32294 + }, + { + "epoch": 0.83, + "learning_rate": 1.6992570243098073e-06, + "loss": 0.9189, + "step": 32295 + }, + { + "epoch": 0.83, + "learning_rate": 1.6992372432551188e-06, + "loss": 0.7192, + "step": 32296 + }, + { + "epoch": 0.83, + "learning_rate": 1.6992174616650563e-06, + "loss": 0.8135, + "step": 32297 + }, + { + "epoch": 0.83, + "learning_rate": 1.6991976795396353e-06, + "loss": 0.8828, + "step": 32298 + }, + { + "epoch": 0.83, + "learning_rate": 1.6991778968788706e-06, + "loss": 0.9512, + "step": 32299 + }, + { + "epoch": 0.83, + "learning_rate": 1.6991581136827775e-06, + "loss": 0.8672, + "step": 32300 + }, + { + "epoch": 0.83, + "learning_rate": 1.6991383299513713e-06, + "loss": 1.1553, + "step": 32301 + }, + { + "epoch": 0.83, + "learning_rate": 1.6991185456846671e-06, + "loss": 0.9697, + "step": 32302 + }, + { + "epoch": 0.83, + "learning_rate": 1.69909876088268e-06, + "loss": 0.8926, + "step": 32303 + }, + { + "epoch": 0.83, + "learning_rate": 1.6990789755454249e-06, + "loss": 0.8096, + "step": 32304 + }, + { + "epoch": 0.83, + "learning_rate": 1.6990591896729173e-06, + "loss": 0.8994, + "step": 32305 + }, + { + "epoch": 0.83, + "learning_rate": 1.6990394032651722e-06, + "loss": 0.9053, + "step": 32306 + }, + { + "epoch": 0.83, + "learning_rate": 1.6990196163222047e-06, + "loss": 0.689, + "step": 32307 + }, + { + "epoch": 0.83, + "learning_rate": 1.6989998288440304e-06, + "loss": 0.8389, + "step": 32308 + }, + { + "epoch": 0.83, + "learning_rate": 1.6989800408306636e-06, + "loss": 0.96, + "step": 32309 + }, + { + "epoch": 0.83, + "learning_rate": 1.69896025228212e-06, + "loss": 0.97, + "step": 32310 + }, + { + "epoch": 0.83, + "learning_rate": 1.698940463198415e-06, + "loss": 0.6951, + "step": 32311 + }, + { + "epoch": 0.83, + "learning_rate": 1.698920673579563e-06, + "loss": 1.0059, + "step": 32312 + }, + { + "epoch": 0.83, + "learning_rate": 1.69890088342558e-06, + "loss": 0.8887, + "step": 32313 + }, + { + "epoch": 0.83, + "learning_rate": 1.6988810927364805e-06, + "loss": 0.8247, + "step": 32314 + }, + { + "epoch": 0.83, + "learning_rate": 1.6988613015122799e-06, + "loss": 0.9268, + "step": 32315 + }, + { + "epoch": 0.83, + "learning_rate": 1.6988415097529933e-06, + "loss": 0.9053, + "step": 32316 + }, + { + "epoch": 0.83, + "learning_rate": 1.698821717458636e-06, + "loss": 0.6719, + "step": 32317 + }, + { + "epoch": 0.83, + "learning_rate": 1.6988019246292228e-06, + "loss": 0.7959, + "step": 32318 + }, + { + "epoch": 0.83, + "learning_rate": 1.6987821312647694e-06, + "loss": 0.6631, + "step": 32319 + }, + { + "epoch": 0.83, + "learning_rate": 1.6987623373652906e-06, + "loss": 0.8965, + "step": 32320 + }, + { + "epoch": 0.83, + "learning_rate": 1.6987425429308014e-06, + "loss": 0.8711, + "step": 32321 + }, + { + "epoch": 0.83, + "learning_rate": 1.6987227479613174e-06, + "loss": 0.8438, + "step": 32322 + }, + { + "epoch": 0.83, + "learning_rate": 1.6987029524568532e-06, + "loss": 0.873, + "step": 32323 + }, + { + "epoch": 0.83, + "learning_rate": 1.6986831564174246e-06, + "loss": 0.7769, + "step": 32324 + }, + { + "epoch": 0.83, + "learning_rate": 1.6986633598430463e-06, + "loss": 0.9033, + "step": 32325 + }, + { + "epoch": 0.83, + "learning_rate": 1.6986435627337336e-06, + "loss": 0.9961, + "step": 32326 + }, + { + "epoch": 0.83, + "learning_rate": 1.6986237650895016e-06, + "loss": 0.9014, + "step": 32327 + }, + { + "epoch": 0.83, + "learning_rate": 1.6986039669103657e-06, + "loss": 0.8301, + "step": 32328 + }, + { + "epoch": 0.83, + "learning_rate": 1.6985841681963406e-06, + "loss": 0.9033, + "step": 32329 + }, + { + "epoch": 0.83, + "learning_rate": 1.698564368947442e-06, + "loss": 0.8965, + "step": 32330 + }, + { + "epoch": 0.83, + "learning_rate": 1.6985445691636846e-06, + "loss": 0.9766, + "step": 32331 + }, + { + "epoch": 0.83, + "learning_rate": 1.698524768845084e-06, + "loss": 0.7666, + "step": 32332 + }, + { + "epoch": 0.83, + "learning_rate": 1.6985049679916545e-06, + "loss": 0.7681, + "step": 32333 + }, + { + "epoch": 0.83, + "learning_rate": 1.6984851666034126e-06, + "loss": 0.7793, + "step": 32334 + }, + { + "epoch": 0.83, + "learning_rate": 1.698465364680372e-06, + "loss": 0.834, + "step": 32335 + }, + { + "epoch": 0.83, + "learning_rate": 1.698445562222549e-06, + "loss": 0.8232, + "step": 32336 + }, + { + "epoch": 0.83, + "learning_rate": 1.6984257592299583e-06, + "loss": 0.8447, + "step": 32337 + }, + { + "epoch": 0.83, + "learning_rate": 1.6984059557026153e-06, + "loss": 0.6357, + "step": 32338 + }, + { + "epoch": 0.83, + "learning_rate": 1.698386151640535e-06, + "loss": 0.7979, + "step": 32339 + }, + { + "epoch": 0.83, + "learning_rate": 1.6983663470437322e-06, + "loss": 0.8574, + "step": 32340 + }, + { + "epoch": 0.83, + "learning_rate": 1.6983465419122226e-06, + "loss": 0.7104, + "step": 32341 + }, + { + "epoch": 0.83, + "learning_rate": 1.6983267362460213e-06, + "loss": 0.9609, + "step": 32342 + }, + { + "epoch": 0.83, + "learning_rate": 1.6983069300451427e-06, + "loss": 1.0723, + "step": 32343 + }, + { + "epoch": 0.83, + "learning_rate": 1.698287123309603e-06, + "loss": 0.8525, + "step": 32344 + }, + { + "epoch": 0.83, + "learning_rate": 1.6982673160394172e-06, + "loss": 0.6587, + "step": 32345 + }, + { + "epoch": 0.83, + "learning_rate": 1.6982475082346e-06, + "loss": 1.0449, + "step": 32346 + }, + { + "epoch": 0.83, + "learning_rate": 1.6982276998951668e-06, + "loss": 0.9092, + "step": 32347 + }, + { + "epoch": 0.83, + "learning_rate": 1.6982078910211329e-06, + "loss": 0.8237, + "step": 32348 + }, + { + "epoch": 0.83, + "learning_rate": 1.698188081612513e-06, + "loss": 0.6575, + "step": 32349 + }, + { + "epoch": 0.83, + "learning_rate": 1.6981682716693226e-06, + "loss": 0.4856, + "step": 32350 + }, + { + "epoch": 0.83, + "learning_rate": 1.698148461191577e-06, + "loss": 0.7871, + "step": 32351 + }, + { + "epoch": 0.83, + "learning_rate": 1.6981286501792913e-06, + "loss": 0.9355, + "step": 32352 + }, + { + "epoch": 0.83, + "learning_rate": 1.6981088386324807e-06, + "loss": 0.9824, + "step": 32353 + }, + { + "epoch": 0.83, + "learning_rate": 1.6980890265511598e-06, + "loss": 0.8032, + "step": 32354 + }, + { + "epoch": 0.83, + "learning_rate": 1.6980692139353445e-06, + "loss": 0.9258, + "step": 32355 + }, + { + "epoch": 0.83, + "learning_rate": 1.69804940078505e-06, + "loss": 1.0498, + "step": 32356 + }, + { + "epoch": 0.83, + "learning_rate": 1.6980295871002908e-06, + "loss": 0.9043, + "step": 32357 + }, + { + "epoch": 0.83, + "learning_rate": 1.6980097728810826e-06, + "loss": 0.9121, + "step": 32358 + }, + { + "epoch": 0.83, + "learning_rate": 1.6979899581274402e-06, + "loss": 0.6704, + "step": 32359 + }, + { + "epoch": 0.83, + "learning_rate": 1.6979701428393791e-06, + "loss": 0.792, + "step": 32360 + }, + { + "epoch": 0.83, + "learning_rate": 1.6979503270169144e-06, + "loss": 1.0654, + "step": 32361 + }, + { + "epoch": 0.83, + "learning_rate": 1.6979305106600612e-06, + "loss": 0.8213, + "step": 32362 + }, + { + "epoch": 0.83, + "learning_rate": 1.6979106937688349e-06, + "loss": 0.8652, + "step": 32363 + }, + { + "epoch": 0.83, + "learning_rate": 1.69789087634325e-06, + "loss": 0.6978, + "step": 32364 + }, + { + "epoch": 0.83, + "learning_rate": 1.6978710583833228e-06, + "loss": 1.0186, + "step": 32365 + }, + { + "epoch": 0.83, + "learning_rate": 1.6978512398890673e-06, + "loss": 0.7866, + "step": 32366 + }, + { + "epoch": 0.83, + "learning_rate": 1.6978314208604994e-06, + "loss": 0.7007, + "step": 32367 + }, + { + "epoch": 0.83, + "learning_rate": 1.697811601297634e-06, + "loss": 0.7207, + "step": 32368 + }, + { + "epoch": 0.83, + "learning_rate": 1.6977917812004864e-06, + "loss": 0.7422, + "step": 32369 + }, + { + "epoch": 0.83, + "learning_rate": 1.6977719605690717e-06, + "loss": 0.8359, + "step": 32370 + }, + { + "epoch": 0.83, + "learning_rate": 1.697752139403405e-06, + "loss": 0.9795, + "step": 32371 + }, + { + "epoch": 0.83, + "learning_rate": 1.6977323177035014e-06, + "loss": 0.9033, + "step": 32372 + }, + { + "epoch": 0.83, + "learning_rate": 1.6977124954693767e-06, + "loss": 0.8008, + "step": 32373 + }, + { + "epoch": 0.83, + "learning_rate": 1.6976926727010455e-06, + "loss": 0.814, + "step": 32374 + }, + { + "epoch": 0.83, + "learning_rate": 1.6976728493985228e-06, + "loss": 0.835, + "step": 32375 + }, + { + "epoch": 0.83, + "learning_rate": 1.6976530255618245e-06, + "loss": 1.0059, + "step": 32376 + }, + { + "epoch": 0.83, + "learning_rate": 1.697633201190965e-06, + "loss": 0.9214, + "step": 32377 + }, + { + "epoch": 0.83, + "learning_rate": 1.6976133762859601e-06, + "loss": 0.6667, + "step": 32378 + }, + { + "epoch": 0.83, + "learning_rate": 1.6975935508468245e-06, + "loss": 0.9092, + "step": 32379 + }, + { + "epoch": 0.83, + "learning_rate": 1.6975737248735737e-06, + "loss": 0.8506, + "step": 32380 + }, + { + "epoch": 0.83, + "learning_rate": 1.6975538983662229e-06, + "loss": 1.0098, + "step": 32381 + }, + { + "epoch": 0.83, + "learning_rate": 1.697534071324787e-06, + "loss": 0.7852, + "step": 32382 + }, + { + "epoch": 0.83, + "learning_rate": 1.697514243749281e-06, + "loss": 0.8506, + "step": 32383 + }, + { + "epoch": 0.83, + "learning_rate": 1.697494415639721e-06, + "loss": 0.439, + "step": 32384 + }, + { + "epoch": 0.83, + "learning_rate": 1.6974745869961213e-06, + "loss": 0.7764, + "step": 32385 + }, + { + "epoch": 0.83, + "learning_rate": 1.6974547578184974e-06, + "loss": 0.7871, + "step": 32386 + }, + { + "epoch": 0.83, + "learning_rate": 1.6974349281068648e-06, + "loss": 0.5645, + "step": 32387 + }, + { + "epoch": 0.83, + "learning_rate": 1.697415097861238e-06, + "loss": 0.7637, + "step": 32388 + }, + { + "epoch": 0.83, + "learning_rate": 1.6973952670816325e-06, + "loss": 0.8301, + "step": 32389 + }, + { + "epoch": 0.83, + "learning_rate": 1.6973754357680634e-06, + "loss": 0.9873, + "step": 32390 + }, + { + "epoch": 0.83, + "learning_rate": 1.6973556039205463e-06, + "loss": 0.8613, + "step": 32391 + }, + { + "epoch": 0.83, + "learning_rate": 1.6973357715390961e-06, + "loss": 0.7593, + "step": 32392 + }, + { + "epoch": 0.83, + "learning_rate": 1.6973159386237278e-06, + "loss": 1.0947, + "step": 32393 + }, + { + "epoch": 0.83, + "learning_rate": 1.6972961051744568e-06, + "loss": 0.5903, + "step": 32394 + }, + { + "epoch": 0.83, + "learning_rate": 1.6972762711912982e-06, + "loss": 0.9502, + "step": 32395 + }, + { + "epoch": 0.83, + "learning_rate": 1.6972564366742672e-06, + "loss": 0.9482, + "step": 32396 + }, + { + "epoch": 0.83, + "learning_rate": 1.6972366016233793e-06, + "loss": 0.8867, + "step": 32397 + }, + { + "epoch": 0.83, + "learning_rate": 1.697216766038649e-06, + "loss": 0.9453, + "step": 32398 + }, + { + "epoch": 0.83, + "learning_rate": 1.6971969299200919e-06, + "loss": 1.041, + "step": 32399 + }, + { + "epoch": 0.83, + "learning_rate": 1.6971770932677232e-06, + "loss": 0.8066, + "step": 32400 + }, + { + "epoch": 0.83, + "learning_rate": 1.6971572560815585e-06, + "loss": 0.958, + "step": 32401 + }, + { + "epoch": 0.83, + "learning_rate": 1.6971374183616121e-06, + "loss": 0.7461, + "step": 32402 + }, + { + "epoch": 0.83, + "learning_rate": 1.6971175801078993e-06, + "loss": 1.0215, + "step": 32403 + }, + { + "epoch": 0.83, + "learning_rate": 1.6970977413204364e-06, + "loss": 0.9463, + "step": 32404 + }, + { + "epoch": 0.83, + "learning_rate": 1.6970779019992372e-06, + "loss": 0.8574, + "step": 32405 + }, + { + "epoch": 0.83, + "learning_rate": 1.6970580621443178e-06, + "loss": 0.9648, + "step": 32406 + }, + { + "epoch": 0.83, + "learning_rate": 1.6970382217556934e-06, + "loss": 0.917, + "step": 32407 + }, + { + "epoch": 0.83, + "learning_rate": 1.6970183808333785e-06, + "loss": 0.8574, + "step": 32408 + }, + { + "epoch": 0.83, + "learning_rate": 1.6969985393773887e-06, + "loss": 0.7856, + "step": 32409 + }, + { + "epoch": 0.83, + "learning_rate": 1.6969786973877392e-06, + "loss": 0.9355, + "step": 32410 + }, + { + "epoch": 0.83, + "learning_rate": 1.6969588548644448e-06, + "loss": 0.8506, + "step": 32411 + }, + { + "epoch": 0.83, + "learning_rate": 1.6969390118075216e-06, + "loss": 0.834, + "step": 32412 + }, + { + "epoch": 0.83, + "learning_rate": 1.696919168216984e-06, + "loss": 0.833, + "step": 32413 + }, + { + "epoch": 0.83, + "learning_rate": 1.6968993240928476e-06, + "loss": 0.9414, + "step": 32414 + }, + { + "epoch": 0.83, + "learning_rate": 1.6968794794351272e-06, + "loss": 0.6855, + "step": 32415 + }, + { + "epoch": 0.83, + "learning_rate": 1.6968596342438382e-06, + "loss": 0.8672, + "step": 32416 + }, + { + "epoch": 0.83, + "learning_rate": 1.696839788518996e-06, + "loss": 1.1602, + "step": 32417 + }, + { + "epoch": 0.83, + "learning_rate": 1.6968199422606157e-06, + "loss": 0.7227, + "step": 32418 + }, + { + "epoch": 0.83, + "learning_rate": 1.6968000954687123e-06, + "loss": 0.7236, + "step": 32419 + }, + { + "epoch": 0.83, + "learning_rate": 1.696780248143301e-06, + "loss": 0.7363, + "step": 32420 + }, + { + "epoch": 0.83, + "learning_rate": 1.6967604002843972e-06, + "loss": 0.8301, + "step": 32421 + }, + { + "epoch": 0.83, + "learning_rate": 1.6967405518920161e-06, + "loss": 0.6475, + "step": 32422 + }, + { + "epoch": 0.83, + "learning_rate": 1.6967207029661727e-06, + "loss": 0.9497, + "step": 32423 + }, + { + "epoch": 0.83, + "learning_rate": 1.6967008535068823e-06, + "loss": 0.8315, + "step": 32424 + }, + { + "epoch": 0.83, + "learning_rate": 1.6966810035141598e-06, + "loss": 0.9717, + "step": 32425 + }, + { + "epoch": 0.83, + "learning_rate": 1.696661152988021e-06, + "loss": 0.8223, + "step": 32426 + }, + { + "epoch": 0.83, + "learning_rate": 1.6966413019284809e-06, + "loss": 0.625, + "step": 32427 + }, + { + "epoch": 0.83, + "learning_rate": 1.6966214503355545e-06, + "loss": 0.7445, + "step": 32428 + }, + { + "epoch": 0.83, + "learning_rate": 1.696601598209257e-06, + "loss": 0.9512, + "step": 32429 + }, + { + "epoch": 0.83, + "learning_rate": 1.6965817455496036e-06, + "loss": 0.8232, + "step": 32430 + }, + { + "epoch": 0.83, + "learning_rate": 1.6965618923566098e-06, + "loss": 0.7329, + "step": 32431 + }, + { + "epoch": 0.83, + "learning_rate": 1.6965420386302903e-06, + "loss": 0.7134, + "step": 32432 + }, + { + "epoch": 0.83, + "learning_rate": 1.696522184370661e-06, + "loss": 0.6416, + "step": 32433 + }, + { + "epoch": 0.83, + "learning_rate": 1.6965023295777362e-06, + "loss": 0.8672, + "step": 32434 + }, + { + "epoch": 0.83, + "learning_rate": 1.696482474251532e-06, + "loss": 0.8955, + "step": 32435 + }, + { + "epoch": 0.83, + "learning_rate": 1.696462618392063e-06, + "loss": 0.7227, + "step": 32436 + }, + { + "epoch": 0.83, + "learning_rate": 1.6964427619993447e-06, + "loss": 0.9277, + "step": 32437 + }, + { + "epoch": 0.83, + "learning_rate": 1.6964229050733922e-06, + "loss": 0.6787, + "step": 32438 + }, + { + "epoch": 0.83, + "learning_rate": 1.6964030476142206e-06, + "loss": 1.041, + "step": 32439 + }, + { + "epoch": 0.83, + "learning_rate": 1.6963831896218453e-06, + "loss": 0.6553, + "step": 32440 + }, + { + "epoch": 0.83, + "learning_rate": 1.6963633310962812e-06, + "loss": 0.7954, + "step": 32441 + }, + { + "epoch": 0.83, + "learning_rate": 1.6963434720375442e-06, + "loss": 0.7744, + "step": 32442 + }, + { + "epoch": 0.83, + "learning_rate": 1.6963236124456487e-06, + "loss": 0.833, + "step": 32443 + }, + { + "epoch": 0.83, + "learning_rate": 1.69630375232061e-06, + "loss": 0.8818, + "step": 32444 + }, + { + "epoch": 0.83, + "learning_rate": 1.696283891662444e-06, + "loss": 0.783, + "step": 32445 + }, + { + "epoch": 0.83, + "learning_rate": 1.6962640304711654e-06, + "loss": 0.9336, + "step": 32446 + }, + { + "epoch": 0.83, + "learning_rate": 1.696244168746789e-06, + "loss": 0.9375, + "step": 32447 + }, + { + "epoch": 0.83, + "learning_rate": 1.6962243064893308e-06, + "loss": 1.0742, + "step": 32448 + }, + { + "epoch": 0.83, + "learning_rate": 1.6962044436988054e-06, + "loss": 0.7729, + "step": 32449 + }, + { + "epoch": 0.83, + "learning_rate": 1.6961845803752283e-06, + "loss": 0.8115, + "step": 32450 + }, + { + "epoch": 0.83, + "learning_rate": 1.696164716518615e-06, + "loss": 0.9619, + "step": 32451 + }, + { + "epoch": 0.83, + "learning_rate": 1.6961448521289805e-06, + "loss": 1.0195, + "step": 32452 + }, + { + "epoch": 0.83, + "learning_rate": 1.6961249872063394e-06, + "loss": 0.8789, + "step": 32453 + }, + { + "epoch": 0.83, + "learning_rate": 1.6961051217507077e-06, + "loss": 0.7451, + "step": 32454 + }, + { + "epoch": 0.83, + "learning_rate": 1.6960852557621002e-06, + "loss": 0.644, + "step": 32455 + }, + { + "epoch": 0.83, + "learning_rate": 1.696065389240532e-06, + "loss": 0.8047, + "step": 32456 + }, + { + "epoch": 0.83, + "learning_rate": 1.6960455221860191e-06, + "loss": 0.9346, + "step": 32457 + }, + { + "epoch": 0.83, + "learning_rate": 1.6960256545985758e-06, + "loss": 0.7788, + "step": 32458 + }, + { + "epoch": 0.83, + "learning_rate": 1.6960057864782176e-06, + "loss": 0.9326, + "step": 32459 + }, + { + "epoch": 0.83, + "learning_rate": 1.69598591782496e-06, + "loss": 0.5102, + "step": 32460 + }, + { + "epoch": 0.83, + "learning_rate": 1.6959660486388177e-06, + "loss": 0.8799, + "step": 32461 + }, + { + "epoch": 0.83, + "learning_rate": 1.6959461789198066e-06, + "loss": 0.5645, + "step": 32462 + }, + { + "epoch": 0.83, + "learning_rate": 1.695926308667941e-06, + "loss": 0.8301, + "step": 32463 + }, + { + "epoch": 0.83, + "learning_rate": 1.6959064378832371e-06, + "loss": 0.8379, + "step": 32464 + }, + { + "epoch": 0.83, + "learning_rate": 1.6958865665657093e-06, + "loss": 0.6826, + "step": 32465 + }, + { + "epoch": 0.83, + "learning_rate": 1.6958666947153734e-06, + "loss": 0.8096, + "step": 32466 + }, + { + "epoch": 0.83, + "learning_rate": 1.6958468223322444e-06, + "loss": 0.6465, + "step": 32467 + }, + { + "epoch": 0.83, + "learning_rate": 1.6958269494163374e-06, + "loss": 0.8398, + "step": 32468 + }, + { + "epoch": 0.83, + "learning_rate": 1.6958070759676675e-06, + "loss": 1.0303, + "step": 32469 + }, + { + "epoch": 0.83, + "learning_rate": 1.69578720198625e-06, + "loss": 0.9414, + "step": 32470 + }, + { + "epoch": 0.83, + "learning_rate": 1.6957673274721005e-06, + "loss": 0.9902, + "step": 32471 + }, + { + "epoch": 0.83, + "learning_rate": 1.695747452425234e-06, + "loss": 0.9766, + "step": 32472 + }, + { + "epoch": 0.83, + "learning_rate": 1.6957275768456656e-06, + "loss": 1.0557, + "step": 32473 + }, + { + "epoch": 0.83, + "learning_rate": 1.6957077007334108e-06, + "loss": 0.8438, + "step": 32474 + }, + { + "epoch": 0.83, + "learning_rate": 1.6956878240884842e-06, + "loss": 0.9668, + "step": 32475 + }, + { + "epoch": 0.83, + "learning_rate": 1.6956679469109017e-06, + "loss": 0.9092, + "step": 32476 + }, + { + "epoch": 0.83, + "learning_rate": 1.6956480692006783e-06, + "loss": 0.8086, + "step": 32477 + }, + { + "epoch": 0.83, + "learning_rate": 1.695628190957829e-06, + "loss": 0.5361, + "step": 32478 + }, + { + "epoch": 0.83, + "learning_rate": 1.6956083121823692e-06, + "loss": 0.6602, + "step": 32479 + }, + { + "epoch": 0.83, + "learning_rate": 1.695588432874314e-06, + "loss": 0.8027, + "step": 32480 + }, + { + "epoch": 0.83, + "learning_rate": 1.6955685530336787e-06, + "loss": 0.9365, + "step": 32481 + }, + { + "epoch": 0.83, + "learning_rate": 1.6955486726604789e-06, + "loss": 0.8486, + "step": 32482 + }, + { + "epoch": 0.83, + "learning_rate": 1.6955287917547293e-06, + "loss": 0.8398, + "step": 32483 + }, + { + "epoch": 0.83, + "learning_rate": 1.695508910316445e-06, + "loss": 0.73, + "step": 32484 + }, + { + "epoch": 0.83, + "learning_rate": 1.6954890283456417e-06, + "loss": 0.6985, + "step": 32485 + }, + { + "epoch": 0.83, + "learning_rate": 1.6954691458423346e-06, + "loss": 0.8955, + "step": 32486 + }, + { + "epoch": 0.83, + "learning_rate": 1.6954492628065385e-06, + "loss": 0.7969, + "step": 32487 + }, + { + "epoch": 0.83, + "learning_rate": 1.695429379238269e-06, + "loss": 0.7515, + "step": 32488 + }, + { + "epoch": 0.83, + "learning_rate": 1.6954094951375411e-06, + "loss": 0.8447, + "step": 32489 + }, + { + "epoch": 0.83, + "learning_rate": 1.6953896105043701e-06, + "loss": 1.0205, + "step": 32490 + }, + { + "epoch": 0.83, + "learning_rate": 1.6953697253387715e-06, + "loss": 0.8423, + "step": 32491 + }, + { + "epoch": 0.83, + "learning_rate": 1.6953498396407603e-06, + "loss": 0.8643, + "step": 32492 + }, + { + "epoch": 0.83, + "learning_rate": 1.6953299534103513e-06, + "loss": 0.7881, + "step": 32493 + }, + { + "epoch": 0.83, + "learning_rate": 1.6953100666475605e-06, + "loss": 0.8828, + "step": 32494 + }, + { + "epoch": 0.83, + "learning_rate": 1.6952901793524025e-06, + "loss": 0.8262, + "step": 32495 + }, + { + "epoch": 0.83, + "learning_rate": 1.6952702915248928e-06, + "loss": 0.8726, + "step": 32496 + }, + { + "epoch": 0.83, + "learning_rate": 1.6952504031650468e-06, + "loss": 0.6685, + "step": 32497 + }, + { + "epoch": 0.83, + "learning_rate": 1.6952305142728793e-06, + "loss": 0.9209, + "step": 32498 + }, + { + "epoch": 0.83, + "learning_rate": 1.695210624848406e-06, + "loss": 0.8359, + "step": 32499 + }, + { + "epoch": 0.83, + "learning_rate": 1.6951907348916419e-06, + "loss": 0.8029, + "step": 32500 + }, + { + "epoch": 0.83, + "learning_rate": 1.695170844402602e-06, + "loss": 0.877, + "step": 32501 + }, + { + "epoch": 0.83, + "learning_rate": 1.695150953381302e-06, + "loss": 0.5042, + "step": 32502 + }, + { + "epoch": 0.83, + "learning_rate": 1.6951310618277566e-06, + "loss": 0.9033, + "step": 32503 + }, + { + "epoch": 0.83, + "learning_rate": 1.6951111697419816e-06, + "loss": 0.6904, + "step": 32504 + }, + { + "epoch": 0.83, + "learning_rate": 1.6950912771239917e-06, + "loss": 0.6943, + "step": 32505 + }, + { + "epoch": 0.83, + "learning_rate": 1.6950713839738024e-06, + "loss": 0.7197, + "step": 32506 + }, + { + "epoch": 0.83, + "learning_rate": 1.695051490291429e-06, + "loss": 0.6885, + "step": 32507 + }, + { + "epoch": 0.83, + "learning_rate": 1.6950315960768866e-06, + "loss": 0.7842, + "step": 32508 + }, + { + "epoch": 0.83, + "learning_rate": 1.6950117013301902e-06, + "loss": 0.9268, + "step": 32509 + }, + { + "epoch": 0.83, + "learning_rate": 1.6949918060513558e-06, + "loss": 0.7417, + "step": 32510 + }, + { + "epoch": 0.83, + "learning_rate": 1.694971910240398e-06, + "loss": 0.9336, + "step": 32511 + }, + { + "epoch": 0.83, + "learning_rate": 1.6949520138973318e-06, + "loss": 0.9326, + "step": 32512 + }, + { + "epoch": 0.83, + "learning_rate": 1.694932117022173e-06, + "loss": 0.5508, + "step": 32513 + }, + { + "epoch": 0.83, + "learning_rate": 1.6949122196149368e-06, + "loss": 0.5701, + "step": 32514 + }, + { + "epoch": 0.83, + "learning_rate": 1.6948923216756382e-06, + "loss": 1.0352, + "step": 32515 + }, + { + "epoch": 0.83, + "learning_rate": 1.6948724232042924e-06, + "loss": 1.0107, + "step": 32516 + }, + { + "epoch": 0.83, + "learning_rate": 1.6948525242009147e-06, + "loss": 0.8193, + "step": 32517 + }, + { + "epoch": 0.83, + "learning_rate": 1.6948326246655204e-06, + "loss": 0.7593, + "step": 32518 + }, + { + "epoch": 0.83, + "learning_rate": 1.6948127245981247e-06, + "loss": 0.96, + "step": 32519 + }, + { + "epoch": 0.83, + "learning_rate": 1.694792823998743e-06, + "loss": 0.9023, + "step": 32520 + }, + { + "epoch": 0.83, + "learning_rate": 1.6947729228673904e-06, + "loss": 0.5811, + "step": 32521 + }, + { + "epoch": 0.83, + "learning_rate": 1.694753021204082e-06, + "loss": 0.7451, + "step": 32522 + }, + { + "epoch": 0.83, + "learning_rate": 1.6947331190088333e-06, + "loss": 0.751, + "step": 32523 + }, + { + "epoch": 0.83, + "learning_rate": 1.6947132162816591e-06, + "loss": 0.8633, + "step": 32524 + }, + { + "epoch": 0.83, + "learning_rate": 1.6946933130225752e-06, + "loss": 1.0264, + "step": 32525 + }, + { + "epoch": 0.83, + "learning_rate": 1.6946734092315964e-06, + "loss": 0.7637, + "step": 32526 + }, + { + "epoch": 0.83, + "learning_rate": 1.6946535049087382e-06, + "loss": 1.0039, + "step": 32527 + }, + { + "epoch": 0.83, + "learning_rate": 1.6946336000540159e-06, + "loss": 0.7178, + "step": 32528 + }, + { + "epoch": 0.83, + "learning_rate": 1.6946136946674443e-06, + "loss": 0.8848, + "step": 32529 + }, + { + "epoch": 0.83, + "learning_rate": 1.694593788749039e-06, + "loss": 0.8594, + "step": 32530 + }, + { + "epoch": 0.83, + "learning_rate": 1.6945738822988152e-06, + "loss": 0.6758, + "step": 32531 + }, + { + "epoch": 0.83, + "learning_rate": 1.694553975316788e-06, + "loss": 0.8647, + "step": 32532 + }, + { + "epoch": 0.83, + "learning_rate": 1.6945340678029729e-06, + "loss": 1.0186, + "step": 32533 + }, + { + "epoch": 0.83, + "learning_rate": 1.6945141597573851e-06, + "loss": 0.8086, + "step": 32534 + }, + { + "epoch": 0.83, + "learning_rate": 1.6944942511800394e-06, + "loss": 0.9277, + "step": 32535 + }, + { + "epoch": 0.83, + "learning_rate": 1.694474342070952e-06, + "loss": 0.7588, + "step": 32536 + }, + { + "epoch": 0.83, + "learning_rate": 1.6944544324301372e-06, + "loss": 1.0303, + "step": 32537 + }, + { + "epoch": 0.83, + "learning_rate": 1.6944345222576104e-06, + "loss": 0.915, + "step": 32538 + }, + { + "epoch": 0.83, + "learning_rate": 1.6944146115533872e-06, + "loss": 0.6445, + "step": 32539 + }, + { + "epoch": 0.83, + "learning_rate": 1.6943947003174826e-06, + "loss": 0.6758, + "step": 32540 + }, + { + "epoch": 0.83, + "learning_rate": 1.6943747885499118e-06, + "loss": 0.749, + "step": 32541 + }, + { + "epoch": 0.83, + "learning_rate": 1.6943548762506904e-06, + "loss": 0.7026, + "step": 32542 + }, + { + "epoch": 0.83, + "learning_rate": 1.6943349634198333e-06, + "loss": 0.8047, + "step": 32543 + }, + { + "epoch": 0.83, + "learning_rate": 1.6943150500573558e-06, + "loss": 0.7705, + "step": 32544 + }, + { + "epoch": 0.83, + "learning_rate": 1.6942951361632732e-06, + "loss": 0.8511, + "step": 32545 + }, + { + "epoch": 0.83, + "learning_rate": 1.6942752217376008e-06, + "loss": 0.8447, + "step": 32546 + }, + { + "epoch": 0.83, + "learning_rate": 1.6942553067803538e-06, + "loss": 0.6807, + "step": 32547 + }, + { + "epoch": 0.83, + "learning_rate": 1.6942353912915474e-06, + "loss": 0.8936, + "step": 32548 + }, + { + "epoch": 0.83, + "learning_rate": 1.6942154752711968e-06, + "loss": 0.874, + "step": 32549 + }, + { + "epoch": 0.83, + "learning_rate": 1.6941955587193173e-06, + "loss": 0.8142, + "step": 32550 + }, + { + "epoch": 0.83, + "learning_rate": 1.6941756416359242e-06, + "loss": 0.8174, + "step": 32551 + }, + { + "epoch": 0.83, + "learning_rate": 1.6941557240210328e-06, + "loss": 0.8535, + "step": 32552 + }, + { + "epoch": 0.83, + "learning_rate": 1.6941358058746583e-06, + "loss": 0.9795, + "step": 32553 + }, + { + "epoch": 0.83, + "learning_rate": 1.6941158871968159e-06, + "loss": 0.8047, + "step": 32554 + }, + { + "epoch": 0.83, + "learning_rate": 1.694095967987521e-06, + "loss": 0.8359, + "step": 32555 + }, + { + "epoch": 0.83, + "learning_rate": 1.6940760482467887e-06, + "loss": 0.9775, + "step": 32556 + }, + { + "epoch": 0.83, + "learning_rate": 1.6940561279746342e-06, + "loss": 0.8145, + "step": 32557 + }, + { + "epoch": 0.83, + "learning_rate": 1.6940362071710729e-06, + "loss": 0.8857, + "step": 32558 + }, + { + "epoch": 0.83, + "learning_rate": 1.6940162858361195e-06, + "loss": 0.8945, + "step": 32559 + }, + { + "epoch": 0.83, + "learning_rate": 1.6939963639697903e-06, + "loss": 0.793, + "step": 32560 + }, + { + "epoch": 0.83, + "learning_rate": 1.6939764415720998e-06, + "loss": 0.8169, + "step": 32561 + }, + { + "epoch": 0.83, + "learning_rate": 1.6939565186430636e-06, + "loss": 0.9189, + "step": 32562 + }, + { + "epoch": 0.83, + "learning_rate": 1.6939365951826966e-06, + "loss": 0.752, + "step": 32563 + }, + { + "epoch": 0.83, + "learning_rate": 1.6939166711910144e-06, + "loss": 0.8604, + "step": 32564 + }, + { + "epoch": 0.83, + "learning_rate": 1.6938967466680323e-06, + "loss": 0.959, + "step": 32565 + }, + { + "epoch": 0.83, + "learning_rate": 1.6938768216137648e-06, + "loss": 0.8018, + "step": 32566 + }, + { + "epoch": 0.83, + "learning_rate": 1.6938568960282286e-06, + "loss": 0.7383, + "step": 32567 + }, + { + "epoch": 0.83, + "learning_rate": 1.6938369699114375e-06, + "loss": 0.8379, + "step": 32568 + }, + { + "epoch": 0.83, + "learning_rate": 1.6938170432634072e-06, + "loss": 0.7842, + "step": 32569 + }, + { + "epoch": 0.83, + "learning_rate": 1.6937971160841533e-06, + "loss": 0.9688, + "step": 32570 + }, + { + "epoch": 0.83, + "learning_rate": 1.6937771883736906e-06, + "loss": 0.9102, + "step": 32571 + }, + { + "epoch": 0.83, + "learning_rate": 1.693757260132035e-06, + "loss": 0.8286, + "step": 32572 + }, + { + "epoch": 0.83, + "learning_rate": 1.6937373313592015e-06, + "loss": 0.7295, + "step": 32573 + }, + { + "epoch": 0.83, + "learning_rate": 1.6937174020552047e-06, + "loss": 0.8594, + "step": 32574 + }, + { + "epoch": 0.83, + "learning_rate": 1.6936974722200606e-06, + "loss": 1.043, + "step": 32575 + }, + { + "epoch": 0.83, + "learning_rate": 1.6936775418537842e-06, + "loss": 0.874, + "step": 32576 + }, + { + "epoch": 0.83, + "learning_rate": 1.693657610956391e-06, + "loss": 0.7769, + "step": 32577 + }, + { + "epoch": 0.83, + "learning_rate": 1.6936376795278959e-06, + "loss": 0.7236, + "step": 32578 + }, + { + "epoch": 0.84, + "learning_rate": 1.6936177475683143e-06, + "loss": 0.8418, + "step": 32579 + }, + { + "epoch": 0.84, + "learning_rate": 1.6935978150776613e-06, + "loss": 0.876, + "step": 32580 + }, + { + "epoch": 0.84, + "learning_rate": 1.6935778820559527e-06, + "loss": 0.8398, + "step": 32581 + }, + { + "epoch": 0.84, + "learning_rate": 1.6935579485032035e-06, + "loss": 0.8818, + "step": 32582 + }, + { + "epoch": 0.84, + "learning_rate": 1.6935380144194285e-06, + "loss": 0.8472, + "step": 32583 + }, + { + "epoch": 0.84, + "learning_rate": 1.6935180798046434e-06, + "loss": 0.9492, + "step": 32584 + }, + { + "epoch": 0.84, + "learning_rate": 1.6934981446588635e-06, + "loss": 0.9355, + "step": 32585 + }, + { + "epoch": 0.84, + "learning_rate": 1.693478208982104e-06, + "loss": 0.9341, + "step": 32586 + }, + { + "epoch": 0.84, + "learning_rate": 1.69345827277438e-06, + "loss": 0.6836, + "step": 32587 + }, + { + "epoch": 0.84, + "learning_rate": 1.6934383360357072e-06, + "loss": 0.9756, + "step": 32588 + }, + { + "epoch": 0.84, + "learning_rate": 1.6934183987661002e-06, + "loss": 0.8457, + "step": 32589 + }, + { + "epoch": 0.84, + "learning_rate": 1.6933984609655747e-06, + "loss": 0.793, + "step": 32590 + }, + { + "epoch": 0.84, + "learning_rate": 1.6933785226341458e-06, + "loss": 0.7036, + "step": 32591 + }, + { + "epoch": 0.84, + "learning_rate": 1.6933585837718289e-06, + "loss": 0.7363, + "step": 32592 + }, + { + "epoch": 0.84, + "learning_rate": 1.6933386443786396e-06, + "loss": 0.8477, + "step": 32593 + }, + { + "epoch": 0.84, + "learning_rate": 1.693318704454592e-06, + "loss": 1.0586, + "step": 32594 + }, + { + "epoch": 0.84, + "learning_rate": 1.6932987639997028e-06, + "loss": 0.5798, + "step": 32595 + }, + { + "epoch": 0.84, + "learning_rate": 1.6932788230139863e-06, + "loss": 0.9023, + "step": 32596 + }, + { + "epoch": 0.84, + "learning_rate": 1.6932588814974582e-06, + "loss": 1.0205, + "step": 32597 + }, + { + "epoch": 0.84, + "learning_rate": 1.6932389394501337e-06, + "loss": 0.6011, + "step": 32598 + }, + { + "epoch": 0.84, + "learning_rate": 1.6932189968720279e-06, + "loss": 0.6641, + "step": 32599 + }, + { + "epoch": 0.84, + "learning_rate": 1.6931990537631564e-06, + "loss": 0.8779, + "step": 32600 + }, + { + "epoch": 0.84, + "learning_rate": 1.693179110123534e-06, + "loss": 0.8223, + "step": 32601 + }, + { + "epoch": 0.84, + "learning_rate": 1.6931591659531763e-06, + "loss": 0.7847, + "step": 32602 + }, + { + "epoch": 0.84, + "learning_rate": 1.6931392212520986e-06, + "loss": 0.8242, + "step": 32603 + }, + { + "epoch": 0.84, + "learning_rate": 1.6931192760203159e-06, + "loss": 0.6538, + "step": 32604 + }, + { + "epoch": 0.84, + "learning_rate": 1.6930993302578439e-06, + "loss": 1.0166, + "step": 32605 + }, + { + "epoch": 0.84, + "learning_rate": 1.6930793839646973e-06, + "loss": 0.7764, + "step": 32606 + }, + { + "epoch": 0.84, + "learning_rate": 1.6930594371408917e-06, + "loss": 0.8213, + "step": 32607 + }, + { + "epoch": 0.84, + "learning_rate": 1.6930394897864427e-06, + "loss": 1.0322, + "step": 32608 + }, + { + "epoch": 0.84, + "learning_rate": 1.693019541901365e-06, + "loss": 1.2217, + "step": 32609 + }, + { + "epoch": 0.84, + "learning_rate": 1.692999593485674e-06, + "loss": 0.7891, + "step": 32610 + }, + { + "epoch": 0.84, + "learning_rate": 1.692979644539385e-06, + "loss": 0.8867, + "step": 32611 + }, + { + "epoch": 0.84, + "learning_rate": 1.6929596950625137e-06, + "loss": 1.1074, + "step": 32612 + }, + { + "epoch": 0.84, + "learning_rate": 1.692939745055075e-06, + "loss": 0.8477, + "step": 32613 + }, + { + "epoch": 0.84, + "learning_rate": 1.6929197945170841e-06, + "loss": 0.8271, + "step": 32614 + }, + { + "epoch": 0.84, + "learning_rate": 1.6928998434485563e-06, + "loss": 0.9463, + "step": 32615 + }, + { + "epoch": 0.84, + "learning_rate": 1.692879891849507e-06, + "loss": 0.7681, + "step": 32616 + }, + { + "epoch": 0.84, + "learning_rate": 1.6928599397199515e-06, + "loss": 0.6245, + "step": 32617 + }, + { + "epoch": 0.84, + "learning_rate": 1.6928399870599052e-06, + "loss": 0.8633, + "step": 32618 + }, + { + "epoch": 0.84, + "learning_rate": 1.6928200338693826e-06, + "loss": 0.9141, + "step": 32619 + }, + { + "epoch": 0.84, + "learning_rate": 1.6928000801484e-06, + "loss": 0.7495, + "step": 32620 + }, + { + "epoch": 0.84, + "learning_rate": 1.6927801258969718e-06, + "loss": 0.6797, + "step": 32621 + }, + { + "epoch": 0.84, + "learning_rate": 1.6927601711151143e-06, + "loss": 0.9307, + "step": 32622 + }, + { + "epoch": 0.84, + "learning_rate": 1.692740215802842e-06, + "loss": 0.5938, + "step": 32623 + }, + { + "epoch": 0.84, + "learning_rate": 1.6927202599601699e-06, + "loss": 0.7573, + "step": 32624 + }, + { + "epoch": 0.84, + "learning_rate": 1.6927003035871144e-06, + "loss": 0.6396, + "step": 32625 + }, + { + "epoch": 0.84, + "learning_rate": 1.6926803466836896e-06, + "loss": 0.9355, + "step": 32626 + }, + { + "epoch": 0.84, + "learning_rate": 1.6926603892499119e-06, + "loss": 1.0977, + "step": 32627 + }, + { + "epoch": 0.84, + "learning_rate": 1.6926404312857954e-06, + "loss": 0.5513, + "step": 32628 + }, + { + "epoch": 0.84, + "learning_rate": 1.6926204727913562e-06, + "loss": 0.7222, + "step": 32629 + }, + { + "epoch": 0.84, + "learning_rate": 1.6926005137666092e-06, + "loss": 1.1328, + "step": 32630 + }, + { + "epoch": 0.84, + "learning_rate": 1.69258055421157e-06, + "loss": 0.6992, + "step": 32631 + }, + { + "epoch": 0.84, + "learning_rate": 1.692560594126254e-06, + "loss": 1.0674, + "step": 32632 + }, + { + "epoch": 0.84, + "learning_rate": 1.692540633510676e-06, + "loss": 0.7119, + "step": 32633 + }, + { + "epoch": 0.84, + "learning_rate": 1.6925206723648513e-06, + "loss": 0.9014, + "step": 32634 + }, + { + "epoch": 0.84, + "learning_rate": 1.6925007106887955e-06, + "loss": 0.8447, + "step": 32635 + }, + { + "epoch": 0.84, + "learning_rate": 1.6924807484825237e-06, + "loss": 1.0742, + "step": 32636 + }, + { + "epoch": 0.84, + "learning_rate": 1.6924607857460514e-06, + "loss": 0.811, + "step": 32637 + }, + { + "epoch": 0.84, + "learning_rate": 1.6924408224793933e-06, + "loss": 0.8398, + "step": 32638 + }, + { + "epoch": 0.84, + "learning_rate": 1.6924208586825651e-06, + "loss": 0.8789, + "step": 32639 + }, + { + "epoch": 0.84, + "learning_rate": 1.6924008943555825e-06, + "loss": 0.7852, + "step": 32640 + }, + { + "epoch": 0.84, + "learning_rate": 1.6923809294984603e-06, + "loss": 0.6685, + "step": 32641 + }, + { + "epoch": 0.84, + "learning_rate": 1.6923609641112137e-06, + "loss": 0.7725, + "step": 32642 + }, + { + "epoch": 0.84, + "learning_rate": 1.6923409981938583e-06, + "loss": 0.8467, + "step": 32643 + }, + { + "epoch": 0.84, + "learning_rate": 1.692321031746409e-06, + "loss": 0.8252, + "step": 32644 + }, + { + "epoch": 0.84, + "learning_rate": 1.6923010647688818e-06, + "loss": 0.8311, + "step": 32645 + }, + { + "epoch": 0.84, + "learning_rate": 1.692281097261291e-06, + "loss": 1.1221, + "step": 32646 + }, + { + "epoch": 0.84, + "learning_rate": 1.6922611292236527e-06, + "loss": 0.8213, + "step": 32647 + }, + { + "epoch": 0.84, + "learning_rate": 1.6922411606559816e-06, + "loss": 0.9199, + "step": 32648 + }, + { + "epoch": 0.84, + "learning_rate": 1.6922211915582936e-06, + "loss": 0.6226, + "step": 32649 + }, + { + "epoch": 0.84, + "learning_rate": 1.6922012219306035e-06, + "loss": 1.0371, + "step": 32650 + }, + { + "epoch": 0.84, + "learning_rate": 1.6921812517729266e-06, + "loss": 0.8081, + "step": 32651 + }, + { + "epoch": 0.84, + "learning_rate": 1.6921612810852786e-06, + "loss": 0.7993, + "step": 32652 + }, + { + "epoch": 0.84, + "learning_rate": 1.6921413098676744e-06, + "loss": 0.7378, + "step": 32653 + }, + { + "epoch": 0.84, + "learning_rate": 1.6921213381201294e-06, + "loss": 1.001, + "step": 32654 + }, + { + "epoch": 0.84, + "learning_rate": 1.692101365842659e-06, + "loss": 0.835, + "step": 32655 + }, + { + "epoch": 0.84, + "learning_rate": 1.6920813930352785e-06, + "loss": 0.791, + "step": 32656 + }, + { + "epoch": 0.84, + "learning_rate": 1.692061419698003e-06, + "loss": 0.8696, + "step": 32657 + }, + { + "epoch": 0.84, + "learning_rate": 1.6920414458308478e-06, + "loss": 0.7393, + "step": 32658 + }, + { + "epoch": 0.84, + "learning_rate": 1.6920214714338284e-06, + "loss": 1.0811, + "step": 32659 + }, + { + "epoch": 0.84, + "learning_rate": 1.6920014965069598e-06, + "loss": 0.9404, + "step": 32660 + }, + { + "epoch": 0.84, + "learning_rate": 1.6919815210502577e-06, + "loss": 0.4829, + "step": 32661 + }, + { + "epoch": 0.84, + "learning_rate": 1.6919615450637371e-06, + "loss": 0.9502, + "step": 32662 + }, + { + "epoch": 0.84, + "learning_rate": 1.6919415685474135e-06, + "loss": 0.9092, + "step": 32663 + }, + { + "epoch": 0.84, + "learning_rate": 1.6919215915013015e-06, + "loss": 0.8848, + "step": 32664 + }, + { + "epoch": 0.84, + "learning_rate": 1.6919016139254177e-06, + "loss": 0.677, + "step": 32665 + }, + { + "epoch": 0.84, + "learning_rate": 1.6918816358197763e-06, + "loss": 0.8066, + "step": 32666 + }, + { + "epoch": 0.84, + "learning_rate": 1.691861657184393e-06, + "loss": 0.9316, + "step": 32667 + }, + { + "epoch": 0.84, + "learning_rate": 1.6918416780192825e-06, + "loss": 0.7729, + "step": 32668 + }, + { + "epoch": 0.84, + "learning_rate": 1.6918216983244612e-06, + "loss": 0.7424, + "step": 32669 + }, + { + "epoch": 0.84, + "learning_rate": 1.6918017180999437e-06, + "loss": 0.9834, + "step": 32670 + }, + { + "epoch": 0.84, + "learning_rate": 1.6917817373457457e-06, + "loss": 0.8486, + "step": 32671 + }, + { + "epoch": 0.84, + "learning_rate": 1.691761756061882e-06, + "loss": 0.7158, + "step": 32672 + }, + { + "epoch": 0.84, + "learning_rate": 1.6917417742483682e-06, + "loss": 1.0215, + "step": 32673 + }, + { + "epoch": 0.84, + "learning_rate": 1.6917217919052194e-06, + "loss": 0.9209, + "step": 32674 + }, + { + "epoch": 0.84, + "learning_rate": 1.691701809032451e-06, + "loss": 0.8516, + "step": 32675 + }, + { + "epoch": 0.84, + "learning_rate": 1.6916818256300787e-06, + "loss": 0.6421, + "step": 32676 + }, + { + "epoch": 0.84, + "learning_rate": 1.6916618416981171e-06, + "loss": 0.7856, + "step": 32677 + }, + { + "epoch": 0.84, + "learning_rate": 1.6916418572365817e-06, + "loss": 0.833, + "step": 32678 + }, + { + "epoch": 0.84, + "learning_rate": 1.6916218722454883e-06, + "loss": 0.6514, + "step": 32679 + }, + { + "epoch": 0.84, + "learning_rate": 1.6916018867248515e-06, + "loss": 1.0576, + "step": 32680 + }, + { + "epoch": 0.84, + "learning_rate": 1.6915819006746874e-06, + "loss": 1.0625, + "step": 32681 + }, + { + "epoch": 0.84, + "learning_rate": 1.6915619140950106e-06, + "loss": 0.6445, + "step": 32682 + }, + { + "epoch": 0.84, + "learning_rate": 1.6915419269858365e-06, + "loss": 0.7544, + "step": 32683 + }, + { + "epoch": 0.84, + "learning_rate": 1.6915219393471807e-06, + "loss": 0.8557, + "step": 32684 + }, + { + "epoch": 0.84, + "learning_rate": 1.6915019511790583e-06, + "loss": 0.5503, + "step": 32685 + }, + { + "epoch": 0.84, + "learning_rate": 1.6914819624814847e-06, + "loss": 0.7061, + "step": 32686 + }, + { + "epoch": 0.84, + "learning_rate": 1.691461973254475e-06, + "loss": 0.7959, + "step": 32687 + }, + { + "epoch": 0.84, + "learning_rate": 1.6914419834980447e-06, + "loss": 0.8188, + "step": 32688 + }, + { + "epoch": 0.84, + "learning_rate": 1.6914219932122091e-06, + "loss": 0.7051, + "step": 32689 + }, + { + "epoch": 0.84, + "learning_rate": 1.6914020023969835e-06, + "loss": 0.7407, + "step": 32690 + }, + { + "epoch": 0.84, + "learning_rate": 1.6913820110523834e-06, + "loss": 0.9854, + "step": 32691 + }, + { + "epoch": 0.84, + "learning_rate": 1.6913620191784235e-06, + "loss": 0.8574, + "step": 32692 + }, + { + "epoch": 0.84, + "learning_rate": 1.6913420267751194e-06, + "loss": 0.8633, + "step": 32693 + }, + { + "epoch": 0.84, + "learning_rate": 1.691322033842487e-06, + "loss": 0.9883, + "step": 32694 + }, + { + "epoch": 0.84, + "learning_rate": 1.6913020403805408e-06, + "loss": 0.668, + "step": 32695 + }, + { + "epoch": 0.84, + "learning_rate": 1.6912820463892964e-06, + "loss": 0.6665, + "step": 32696 + }, + { + "epoch": 0.84, + "learning_rate": 1.6912620518687692e-06, + "loss": 0.8506, + "step": 32697 + }, + { + "epoch": 0.84, + "learning_rate": 1.6912420568189744e-06, + "loss": 0.8237, + "step": 32698 + }, + { + "epoch": 0.84, + "learning_rate": 1.6912220612399275e-06, + "loss": 0.9629, + "step": 32699 + }, + { + "epoch": 0.84, + "learning_rate": 1.6912020651316435e-06, + "loss": 0.8994, + "step": 32700 + }, + { + "epoch": 0.84, + "learning_rate": 1.6911820684941378e-06, + "loss": 0.6746, + "step": 32701 + }, + { + "epoch": 0.84, + "learning_rate": 1.691162071327426e-06, + "loss": 1.001, + "step": 32702 + }, + { + "epoch": 0.84, + "learning_rate": 1.691142073631523e-06, + "loss": 0.8535, + "step": 32703 + }, + { + "epoch": 0.84, + "learning_rate": 1.6911220754064442e-06, + "loss": 0.7261, + "step": 32704 + }, + { + "epoch": 0.84, + "learning_rate": 1.6911020766522051e-06, + "loss": 0.8379, + "step": 32705 + }, + { + "epoch": 0.84, + "learning_rate": 1.6910820773688211e-06, + "loss": 0.9697, + "step": 32706 + }, + { + "epoch": 0.84, + "learning_rate": 1.691062077556307e-06, + "loss": 0.8252, + "step": 32707 + }, + { + "epoch": 0.84, + "learning_rate": 1.6910420772146786e-06, + "loss": 0.7197, + "step": 32708 + }, + { + "epoch": 0.84, + "learning_rate": 1.691022076343951e-06, + "loss": 0.7344, + "step": 32709 + }, + { + "epoch": 0.84, + "learning_rate": 1.6910020749441399e-06, + "loss": 0.7603, + "step": 32710 + }, + { + "epoch": 0.84, + "learning_rate": 1.69098207301526e-06, + "loss": 0.9014, + "step": 32711 + }, + { + "epoch": 0.84, + "learning_rate": 1.690962070557327e-06, + "loss": 0.8418, + "step": 32712 + }, + { + "epoch": 0.84, + "learning_rate": 1.6909420675703558e-06, + "loss": 0.8428, + "step": 32713 + }, + { + "epoch": 0.84, + "learning_rate": 1.6909220640543621e-06, + "loss": 0.8369, + "step": 32714 + }, + { + "epoch": 0.84, + "learning_rate": 1.6909020600093614e-06, + "loss": 0.8701, + "step": 32715 + }, + { + "epoch": 0.84, + "learning_rate": 1.6908820554353688e-06, + "loss": 1.0547, + "step": 32716 + }, + { + "epoch": 0.84, + "learning_rate": 1.6908620503323996e-06, + "loss": 0.6548, + "step": 32717 + }, + { + "epoch": 0.84, + "learning_rate": 1.690842044700469e-06, + "loss": 0.7949, + "step": 32718 + }, + { + "epoch": 0.84, + "learning_rate": 1.6908220385395923e-06, + "loss": 0.8369, + "step": 32719 + }, + { + "epoch": 0.84, + "learning_rate": 1.6908020318497848e-06, + "loss": 0.9326, + "step": 32720 + }, + { + "epoch": 0.84, + "learning_rate": 1.6907820246310624e-06, + "loss": 0.6157, + "step": 32721 + }, + { + "epoch": 0.84, + "learning_rate": 1.6907620168834397e-06, + "loss": 0.8066, + "step": 32722 + }, + { + "epoch": 0.84, + "learning_rate": 1.6907420086069322e-06, + "loss": 0.8926, + "step": 32723 + }, + { + "epoch": 0.84, + "learning_rate": 1.6907219998015554e-06, + "loss": 0.9893, + "step": 32724 + }, + { + "epoch": 0.84, + "learning_rate": 1.6907019904673244e-06, + "loss": 0.7612, + "step": 32725 + }, + { + "epoch": 0.84, + "learning_rate": 1.690681980604255e-06, + "loss": 0.9502, + "step": 32726 + }, + { + "epoch": 0.84, + "learning_rate": 1.6906619702123618e-06, + "loss": 0.8428, + "step": 32727 + }, + { + "epoch": 0.84, + "learning_rate": 1.6906419592916606e-06, + "loss": 0.8506, + "step": 32728 + }, + { + "epoch": 0.84, + "learning_rate": 1.6906219478421666e-06, + "loss": 1.0342, + "step": 32729 + }, + { + "epoch": 0.84, + "learning_rate": 1.6906019358638951e-06, + "loss": 0.9082, + "step": 32730 + }, + { + "epoch": 0.84, + "learning_rate": 1.6905819233568617e-06, + "loss": 0.6787, + "step": 32731 + }, + { + "epoch": 0.84, + "learning_rate": 1.6905619103210812e-06, + "loss": 0.9209, + "step": 32732 + }, + { + "epoch": 0.84, + "learning_rate": 1.6905418967565693e-06, + "loss": 0.9453, + "step": 32733 + }, + { + "epoch": 0.84, + "learning_rate": 1.690521882663341e-06, + "loss": 0.9717, + "step": 32734 + }, + { + "epoch": 0.84, + "learning_rate": 1.6905018680414122e-06, + "loss": 0.959, + "step": 32735 + }, + { + "epoch": 0.84, + "learning_rate": 1.6904818528907978e-06, + "loss": 0.5698, + "step": 32736 + }, + { + "epoch": 0.84, + "learning_rate": 1.6904618372115131e-06, + "loss": 0.832, + "step": 32737 + }, + { + "epoch": 0.84, + "learning_rate": 1.6904418210035733e-06, + "loss": 0.541, + "step": 32738 + }, + { + "epoch": 0.84, + "learning_rate": 1.6904218042669944e-06, + "loss": 0.79, + "step": 32739 + }, + { + "epoch": 0.84, + "learning_rate": 1.690401787001791e-06, + "loss": 0.9102, + "step": 32740 + }, + { + "epoch": 0.84, + "learning_rate": 1.690381769207979e-06, + "loss": 0.9531, + "step": 32741 + }, + { + "epoch": 0.84, + "learning_rate": 1.690361750885573e-06, + "loss": 0.8096, + "step": 32742 + }, + { + "epoch": 0.84, + "learning_rate": 1.690341732034589e-06, + "loss": 0.9004, + "step": 32743 + }, + { + "epoch": 0.84, + "learning_rate": 1.690321712655042e-06, + "loss": 1.1875, + "step": 32744 + }, + { + "epoch": 0.84, + "learning_rate": 1.690301692746947e-06, + "loss": 0.9346, + "step": 32745 + }, + { + "epoch": 0.84, + "learning_rate": 1.6902816723103206e-06, + "loss": 0.6777, + "step": 32746 + }, + { + "epoch": 0.84, + "learning_rate": 1.6902616513451768e-06, + "loss": 0.6724, + "step": 32747 + }, + { + "epoch": 0.84, + "learning_rate": 1.6902416298515312e-06, + "loss": 0.832, + "step": 32748 + }, + { + "epoch": 0.84, + "learning_rate": 1.6902216078293997e-06, + "loss": 0.9062, + "step": 32749 + }, + { + "epoch": 0.84, + "learning_rate": 1.690201585278797e-06, + "loss": 0.9248, + "step": 32750 + }, + { + "epoch": 0.84, + "learning_rate": 1.6901815621997388e-06, + "loss": 0.9785, + "step": 32751 + }, + { + "epoch": 0.84, + "learning_rate": 1.6901615385922403e-06, + "loss": 0.6389, + "step": 32752 + }, + { + "epoch": 0.84, + "learning_rate": 1.6901415144563167e-06, + "loss": 0.6914, + "step": 32753 + }, + { + "epoch": 0.84, + "learning_rate": 1.6901214897919837e-06, + "loss": 0.5713, + "step": 32754 + }, + { + "epoch": 0.84, + "learning_rate": 1.6901014645992563e-06, + "loss": 0.7368, + "step": 32755 + }, + { + "epoch": 0.84, + "learning_rate": 1.69008143887815e-06, + "loss": 0.813, + "step": 32756 + }, + { + "epoch": 0.84, + "learning_rate": 1.6900614126286798e-06, + "loss": 0.8262, + "step": 32757 + }, + { + "epoch": 0.84, + "learning_rate": 1.6900413858508615e-06, + "loss": 0.7095, + "step": 32758 + }, + { + "epoch": 0.84, + "learning_rate": 1.6900213585447103e-06, + "loss": 1.1133, + "step": 32759 + }, + { + "epoch": 0.84, + "learning_rate": 1.6900013307102414e-06, + "loss": 0.9297, + "step": 32760 + }, + { + "epoch": 0.84, + "learning_rate": 1.6899813023474706e-06, + "loss": 0.8818, + "step": 32761 + }, + { + "epoch": 0.84, + "learning_rate": 1.6899612734564122e-06, + "loss": 0.7549, + "step": 32762 + }, + { + "epoch": 0.84, + "learning_rate": 1.6899412440370825e-06, + "loss": 0.8662, + "step": 32763 + }, + { + "epoch": 0.84, + "learning_rate": 1.6899212140894962e-06, + "loss": 0.6445, + "step": 32764 + }, + { + "epoch": 0.84, + "learning_rate": 1.6899011836136693e-06, + "loss": 0.8975, + "step": 32765 + }, + { + "epoch": 0.84, + "learning_rate": 1.689881152609617e-06, + "loss": 0.8535, + "step": 32766 + }, + { + "epoch": 0.84, + "learning_rate": 1.6898611210773538e-06, + "loss": 0.9395, + "step": 32767 + }, + { + "epoch": 0.84, + "learning_rate": 1.6898410890168962e-06, + "loss": 0.7998, + "step": 32768 + }, + { + "epoch": 0.84, + "learning_rate": 1.6898210564282586e-06, + "loss": 0.6821, + "step": 32769 + }, + { + "epoch": 0.84, + "learning_rate": 1.689801023311457e-06, + "loss": 0.5591, + "step": 32770 + }, + { + "epoch": 0.84, + "learning_rate": 1.6897809896665068e-06, + "loss": 0.876, + "step": 32771 + }, + { + "epoch": 0.84, + "learning_rate": 1.6897609554934221e-06, + "loss": 0.7334, + "step": 32772 + }, + { + "epoch": 0.84, + "learning_rate": 1.6897409207922198e-06, + "loss": 0.9072, + "step": 32773 + }, + { + "epoch": 0.84, + "learning_rate": 1.6897208855629145e-06, + "loss": 0.8491, + "step": 32774 + }, + { + "epoch": 0.84, + "learning_rate": 1.6897008498055217e-06, + "loss": 0.9688, + "step": 32775 + }, + { + "epoch": 0.84, + "learning_rate": 1.6896808135200567e-06, + "loss": 0.7336, + "step": 32776 + }, + { + "epoch": 0.84, + "learning_rate": 1.6896607767065344e-06, + "loss": 0.7573, + "step": 32777 + }, + { + "epoch": 0.84, + "learning_rate": 1.6896407393649708e-06, + "loss": 1.1504, + "step": 32778 + }, + { + "epoch": 0.84, + "learning_rate": 1.6896207014953812e-06, + "loss": 0.8164, + "step": 32779 + }, + { + "epoch": 0.84, + "learning_rate": 1.6896006630977807e-06, + "loss": 0.8149, + "step": 32780 + }, + { + "epoch": 0.84, + "learning_rate": 1.6895806241721843e-06, + "loss": 0.877, + "step": 32781 + }, + { + "epoch": 0.84, + "learning_rate": 1.689560584718608e-06, + "loss": 0.6904, + "step": 32782 + }, + { + "epoch": 0.84, + "learning_rate": 1.6895405447370669e-06, + "loss": 0.8906, + "step": 32783 + }, + { + "epoch": 0.84, + "learning_rate": 1.6895205042275763e-06, + "loss": 0.7686, + "step": 32784 + }, + { + "epoch": 0.84, + "learning_rate": 1.6895004631901512e-06, + "loss": 0.8672, + "step": 32785 + }, + { + "epoch": 0.84, + "learning_rate": 1.689480421624808e-06, + "loss": 0.6331, + "step": 32786 + }, + { + "epoch": 0.84, + "learning_rate": 1.6894603795315606e-06, + "loss": 0.8574, + "step": 32787 + }, + { + "epoch": 0.84, + "learning_rate": 1.6894403369104256e-06, + "loss": 0.6338, + "step": 32788 + }, + { + "epoch": 0.84, + "learning_rate": 1.6894202937614177e-06, + "loss": 0.667, + "step": 32789 + }, + { + "epoch": 0.84, + "learning_rate": 1.6894002500845522e-06, + "loss": 0.8154, + "step": 32790 + }, + { + "epoch": 0.84, + "learning_rate": 1.689380205879845e-06, + "loss": 0.8027, + "step": 32791 + }, + { + "epoch": 0.84, + "learning_rate": 1.6893601611473108e-06, + "loss": 0.7673, + "step": 32792 + }, + { + "epoch": 0.84, + "learning_rate": 1.6893401158869653e-06, + "loss": 0.8066, + "step": 32793 + }, + { + "epoch": 0.84, + "learning_rate": 1.6893200700988238e-06, + "loss": 0.6328, + "step": 32794 + }, + { + "epoch": 0.84, + "learning_rate": 1.6893000237829016e-06, + "loss": 0.749, + "step": 32795 + }, + { + "epoch": 0.84, + "learning_rate": 1.689279976939214e-06, + "loss": 0.8584, + "step": 32796 + }, + { + "epoch": 0.84, + "learning_rate": 1.6892599295677762e-06, + "loss": 1.0449, + "step": 32797 + }, + { + "epoch": 0.84, + "learning_rate": 1.6892398816686042e-06, + "loss": 1.1133, + "step": 32798 + }, + { + "epoch": 0.84, + "learning_rate": 1.6892198332417126e-06, + "loss": 0.8936, + "step": 32799 + }, + { + "epoch": 0.84, + "learning_rate": 1.6891997842871172e-06, + "loss": 0.856, + "step": 32800 + }, + { + "epoch": 0.84, + "learning_rate": 1.6891797348048334e-06, + "loss": 0.7666, + "step": 32801 + }, + { + "epoch": 0.84, + "learning_rate": 1.6891596847948762e-06, + "loss": 0.9814, + "step": 32802 + }, + { + "epoch": 0.84, + "learning_rate": 1.6891396342572609e-06, + "loss": 0.8652, + "step": 32803 + }, + { + "epoch": 0.84, + "learning_rate": 1.6891195831920034e-06, + "loss": 0.8926, + "step": 32804 + }, + { + "epoch": 0.84, + "learning_rate": 1.6890995315991186e-06, + "loss": 0.856, + "step": 32805 + }, + { + "epoch": 0.84, + "learning_rate": 1.6890794794786222e-06, + "loss": 0.8374, + "step": 32806 + }, + { + "epoch": 0.84, + "learning_rate": 1.689059426830529e-06, + "loss": 0.9067, + "step": 32807 + }, + { + "epoch": 0.84, + "learning_rate": 1.6890393736548546e-06, + "loss": 0.6797, + "step": 32808 + }, + { + "epoch": 0.84, + "learning_rate": 1.6890193199516146e-06, + "loss": 0.9697, + "step": 32809 + }, + { + "epoch": 0.84, + "learning_rate": 1.688999265720824e-06, + "loss": 0.6309, + "step": 32810 + }, + { + "epoch": 0.84, + "learning_rate": 1.6889792109624988e-06, + "loss": 1.1328, + "step": 32811 + }, + { + "epoch": 0.84, + "learning_rate": 1.6889591556766535e-06, + "loss": 0.6685, + "step": 32812 + }, + { + "epoch": 0.84, + "learning_rate": 1.688939099863304e-06, + "loss": 0.96, + "step": 32813 + }, + { + "epoch": 0.84, + "learning_rate": 1.6889190435224654e-06, + "loss": 0.6001, + "step": 32814 + }, + { + "epoch": 0.84, + "learning_rate": 1.6888989866541533e-06, + "loss": 1.0146, + "step": 32815 + }, + { + "epoch": 0.84, + "learning_rate": 1.688878929258383e-06, + "loss": 1.0586, + "step": 32816 + }, + { + "epoch": 0.84, + "learning_rate": 1.6888588713351697e-06, + "loss": 0.8428, + "step": 32817 + }, + { + "epoch": 0.84, + "learning_rate": 1.6888388128845288e-06, + "loss": 0.9707, + "step": 32818 + }, + { + "epoch": 0.84, + "learning_rate": 1.6888187539064756e-06, + "loss": 0.8301, + "step": 32819 + }, + { + "epoch": 0.84, + "learning_rate": 1.6887986944010258e-06, + "loss": 0.7666, + "step": 32820 + }, + { + "epoch": 0.84, + "learning_rate": 1.6887786343681942e-06, + "loss": 0.9443, + "step": 32821 + }, + { + "epoch": 0.84, + "learning_rate": 1.6887585738079966e-06, + "loss": 0.8281, + "step": 32822 + }, + { + "epoch": 0.84, + "learning_rate": 1.688738512720448e-06, + "loss": 1.0312, + "step": 32823 + }, + { + "epoch": 0.84, + "learning_rate": 1.6887184511055646e-06, + "loss": 0.8008, + "step": 32824 + }, + { + "epoch": 0.84, + "learning_rate": 1.6886983889633605e-06, + "loss": 0.6516, + "step": 32825 + }, + { + "epoch": 0.84, + "learning_rate": 1.6886783262938522e-06, + "loss": 1.0273, + "step": 32826 + }, + { + "epoch": 0.84, + "learning_rate": 1.6886582630970544e-06, + "loss": 0.7251, + "step": 32827 + }, + { + "epoch": 0.84, + "learning_rate": 1.6886381993729825e-06, + "loss": 0.8887, + "step": 32828 + }, + { + "epoch": 0.84, + "learning_rate": 1.6886181351216522e-06, + "loss": 0.6699, + "step": 32829 + }, + { + "epoch": 0.84, + "learning_rate": 1.6885980703430786e-06, + "loss": 0.7305, + "step": 32830 + }, + { + "epoch": 0.84, + "learning_rate": 1.6885780050372772e-06, + "loss": 0.6895, + "step": 32831 + }, + { + "epoch": 0.84, + "learning_rate": 1.688557939204263e-06, + "loss": 1.1113, + "step": 32832 + }, + { + "epoch": 0.84, + "learning_rate": 1.6885378728440518e-06, + "loss": 0.8867, + "step": 32833 + }, + { + "epoch": 0.84, + "learning_rate": 1.688517805956659e-06, + "loss": 0.7852, + "step": 32834 + }, + { + "epoch": 0.84, + "learning_rate": 1.6884977385420992e-06, + "loss": 1.0957, + "step": 32835 + }, + { + "epoch": 0.84, + "learning_rate": 1.6884776706003891e-06, + "loss": 0.793, + "step": 32836 + }, + { + "epoch": 0.84, + "learning_rate": 1.688457602131543e-06, + "loss": 0.96, + "step": 32837 + }, + { + "epoch": 0.84, + "learning_rate": 1.6884375331355764e-06, + "loss": 0.7458, + "step": 32838 + }, + { + "epoch": 0.84, + "learning_rate": 1.6884174636125051e-06, + "loss": 0.4956, + "step": 32839 + }, + { + "epoch": 0.84, + "learning_rate": 1.6883973935623439e-06, + "loss": 0.7754, + "step": 32840 + }, + { + "epoch": 0.84, + "learning_rate": 1.6883773229851087e-06, + "loss": 0.7852, + "step": 32841 + }, + { + "epoch": 0.84, + "learning_rate": 1.6883572518808148e-06, + "loss": 0.7513, + "step": 32842 + }, + { + "epoch": 0.84, + "learning_rate": 1.6883371802494768e-06, + "loss": 0.6484, + "step": 32843 + }, + { + "epoch": 0.84, + "learning_rate": 1.6883171080911111e-06, + "loss": 0.8135, + "step": 32844 + }, + { + "epoch": 0.84, + "learning_rate": 1.6882970354057327e-06, + "loss": 1.0049, + "step": 32845 + }, + { + "epoch": 0.84, + "learning_rate": 1.6882769621933565e-06, + "loss": 0.8623, + "step": 32846 + }, + { + "epoch": 0.84, + "learning_rate": 1.6882568884539987e-06, + "loss": 1.1406, + "step": 32847 + }, + { + "epoch": 0.84, + "learning_rate": 1.6882368141876742e-06, + "loss": 0.8477, + "step": 32848 + }, + { + "epoch": 0.84, + "learning_rate": 1.6882167393943983e-06, + "loss": 0.9629, + "step": 32849 + }, + { + "epoch": 0.84, + "learning_rate": 1.6881966640741865e-06, + "loss": 0.8477, + "step": 32850 + }, + { + "epoch": 0.84, + "learning_rate": 1.6881765882270541e-06, + "loss": 0.8225, + "step": 32851 + }, + { + "epoch": 0.84, + "learning_rate": 1.6881565118530167e-06, + "loss": 0.8418, + "step": 32852 + }, + { + "epoch": 0.84, + "learning_rate": 1.6881364349520894e-06, + "loss": 0.9404, + "step": 32853 + }, + { + "epoch": 0.84, + "learning_rate": 1.6881163575242877e-06, + "loss": 1.1133, + "step": 32854 + }, + { + "epoch": 0.84, + "learning_rate": 1.6880962795696268e-06, + "loss": 0.8408, + "step": 32855 + }, + { + "epoch": 0.84, + "learning_rate": 1.6880762010881227e-06, + "loss": 0.6523, + "step": 32856 + }, + { + "epoch": 0.84, + "learning_rate": 1.6880561220797897e-06, + "loss": 0.8691, + "step": 32857 + }, + { + "epoch": 0.84, + "learning_rate": 1.688036042544644e-06, + "loss": 0.9619, + "step": 32858 + }, + { + "epoch": 0.84, + "learning_rate": 1.6880159624827006e-06, + "loss": 0.854, + "step": 32859 + }, + { + "epoch": 0.84, + "learning_rate": 1.6879958818939753e-06, + "loss": 0.8608, + "step": 32860 + }, + { + "epoch": 0.84, + "learning_rate": 1.6879758007784833e-06, + "loss": 0.8159, + "step": 32861 + }, + { + "epoch": 0.84, + "learning_rate": 1.6879557191362395e-06, + "loss": 0.689, + "step": 32862 + }, + { + "epoch": 0.84, + "learning_rate": 1.6879356369672598e-06, + "loss": 0.9434, + "step": 32863 + }, + { + "epoch": 0.84, + "learning_rate": 1.687915554271559e-06, + "loss": 0.9492, + "step": 32864 + }, + { + "epoch": 0.84, + "learning_rate": 1.6878954710491533e-06, + "loss": 0.7939, + "step": 32865 + }, + { + "epoch": 0.84, + "learning_rate": 1.6878753873000578e-06, + "loss": 0.627, + "step": 32866 + }, + { + "epoch": 0.84, + "learning_rate": 1.6878553030242875e-06, + "loss": 0.8281, + "step": 32867 + }, + { + "epoch": 0.84, + "learning_rate": 1.687835218221858e-06, + "loss": 0.8682, + "step": 32868 + }, + { + "epoch": 0.84, + "learning_rate": 1.6878151328927848e-06, + "loss": 0.8232, + "step": 32869 + }, + { + "epoch": 0.84, + "learning_rate": 1.6877950470370832e-06, + "loss": 0.8723, + "step": 32870 + }, + { + "epoch": 0.84, + "learning_rate": 1.6877749606547687e-06, + "loss": 0.8711, + "step": 32871 + }, + { + "epoch": 0.84, + "learning_rate": 1.687754873745856e-06, + "loss": 0.7817, + "step": 32872 + }, + { + "epoch": 0.84, + "learning_rate": 1.6877347863103615e-06, + "loss": 0.958, + "step": 32873 + }, + { + "epoch": 0.84, + "learning_rate": 1.6877146983482999e-06, + "loss": 0.8174, + "step": 32874 + }, + { + "epoch": 0.84, + "learning_rate": 1.6876946098596868e-06, + "loss": 0.7344, + "step": 32875 + }, + { + "epoch": 0.84, + "learning_rate": 1.6876745208445379e-06, + "loss": 0.8105, + "step": 32876 + }, + { + "epoch": 0.84, + "learning_rate": 1.6876544313028678e-06, + "loss": 0.79, + "step": 32877 + }, + { + "epoch": 0.84, + "learning_rate": 1.6876343412346926e-06, + "loss": 1.0615, + "step": 32878 + }, + { + "epoch": 0.84, + "learning_rate": 1.6876142506400272e-06, + "loss": 0.9375, + "step": 32879 + }, + { + "epoch": 0.84, + "learning_rate": 1.6875941595188871e-06, + "loss": 1.0381, + "step": 32880 + }, + { + "epoch": 0.84, + "learning_rate": 1.6875740678712882e-06, + "loss": 0.7832, + "step": 32881 + }, + { + "epoch": 0.84, + "learning_rate": 1.687553975697245e-06, + "loss": 0.791, + "step": 32882 + }, + { + "epoch": 0.84, + "learning_rate": 1.6875338829967736e-06, + "loss": 0.8457, + "step": 32883 + }, + { + "epoch": 0.84, + "learning_rate": 1.687513789769889e-06, + "loss": 0.6855, + "step": 32884 + }, + { + "epoch": 0.84, + "learning_rate": 1.6874936960166067e-06, + "loss": 0.8247, + "step": 32885 + }, + { + "epoch": 0.84, + "learning_rate": 1.6874736017369422e-06, + "loss": 0.9189, + "step": 32886 + }, + { + "epoch": 0.84, + "learning_rate": 1.6874535069309106e-06, + "loss": 0.7178, + "step": 32887 + }, + { + "epoch": 0.84, + "learning_rate": 1.6874334115985276e-06, + "loss": 0.8477, + "step": 32888 + }, + { + "epoch": 0.84, + "learning_rate": 1.6874133157398084e-06, + "loss": 0.8438, + "step": 32889 + }, + { + "epoch": 0.84, + "learning_rate": 1.6873932193547683e-06, + "loss": 0.8223, + "step": 32890 + }, + { + "epoch": 0.84, + "learning_rate": 1.687373122443423e-06, + "loss": 0.9658, + "step": 32891 + }, + { + "epoch": 0.84, + "learning_rate": 1.6873530250057877e-06, + "loss": 0.8418, + "step": 32892 + }, + { + "epoch": 0.84, + "learning_rate": 1.687332927041878e-06, + "loss": 1.0166, + "step": 32893 + }, + { + "epoch": 0.84, + "learning_rate": 1.6873128285517084e-06, + "loss": 0.8496, + "step": 32894 + }, + { + "epoch": 0.84, + "learning_rate": 1.6872927295352955e-06, + "loss": 0.8174, + "step": 32895 + }, + { + "epoch": 0.84, + "learning_rate": 1.6872726299926543e-06, + "loss": 0.6748, + "step": 32896 + }, + { + "epoch": 0.84, + "learning_rate": 1.6872525299238e-06, + "loss": 0.8047, + "step": 32897 + }, + { + "epoch": 0.84, + "learning_rate": 1.6872324293287474e-06, + "loss": 0.7783, + "step": 32898 + }, + { + "epoch": 0.84, + "learning_rate": 1.6872123282075133e-06, + "loss": 0.7334, + "step": 32899 + }, + { + "epoch": 0.84, + "learning_rate": 1.6871922265601118e-06, + "loss": 0.7119, + "step": 32900 + }, + { + "epoch": 0.84, + "learning_rate": 1.6871721243865592e-06, + "loss": 0.6597, + "step": 32901 + }, + { + "epoch": 0.84, + "learning_rate": 1.6871520216868703e-06, + "loss": 0.8379, + "step": 32902 + }, + { + "epoch": 0.84, + "learning_rate": 1.6871319184610606e-06, + "loss": 0.6753, + "step": 32903 + }, + { + "epoch": 0.84, + "learning_rate": 1.6871118147091457e-06, + "loss": 1.0, + "step": 32904 + }, + { + "epoch": 0.84, + "learning_rate": 1.687091710431141e-06, + "loss": 0.9551, + "step": 32905 + }, + { + "epoch": 0.84, + "learning_rate": 1.6870716056270618e-06, + "loss": 1.1973, + "step": 32906 + }, + { + "epoch": 0.84, + "learning_rate": 1.6870515002969233e-06, + "loss": 0.7393, + "step": 32907 + }, + { + "epoch": 0.84, + "learning_rate": 1.6870313944407407e-06, + "loss": 0.8398, + "step": 32908 + }, + { + "epoch": 0.84, + "learning_rate": 1.6870112880585304e-06, + "loss": 0.6387, + "step": 32909 + }, + { + "epoch": 0.84, + "learning_rate": 1.6869911811503066e-06, + "loss": 0.8613, + "step": 32910 + }, + { + "epoch": 0.84, + "learning_rate": 1.6869710737160856e-06, + "loss": 0.8574, + "step": 32911 + }, + { + "epoch": 0.84, + "learning_rate": 1.6869509657558823e-06, + "loss": 0.9893, + "step": 32912 + }, + { + "epoch": 0.84, + "learning_rate": 1.6869308572697124e-06, + "loss": 0.8926, + "step": 32913 + }, + { + "epoch": 0.84, + "learning_rate": 1.6869107482575911e-06, + "loss": 0.7959, + "step": 32914 + }, + { + "epoch": 0.84, + "learning_rate": 1.6868906387195335e-06, + "loss": 0.9473, + "step": 32915 + }, + { + "epoch": 0.84, + "learning_rate": 1.6868705286555556e-06, + "loss": 0.8304, + "step": 32916 + }, + { + "epoch": 0.84, + "learning_rate": 1.6868504180656724e-06, + "loss": 0.8965, + "step": 32917 + }, + { + "epoch": 0.84, + "learning_rate": 1.6868303069498995e-06, + "loss": 0.9424, + "step": 32918 + }, + { + "epoch": 0.84, + "learning_rate": 1.6868101953082521e-06, + "loss": 1.0, + "step": 32919 + }, + { + "epoch": 0.84, + "learning_rate": 1.686790083140746e-06, + "loss": 0.833, + "step": 32920 + }, + { + "epoch": 0.84, + "learning_rate": 1.686769970447396e-06, + "loss": 0.9629, + "step": 32921 + }, + { + "epoch": 0.84, + "learning_rate": 1.686749857228218e-06, + "loss": 0.6719, + "step": 32922 + }, + { + "epoch": 0.84, + "learning_rate": 1.686729743483227e-06, + "loss": 0.5156, + "step": 32923 + }, + { + "epoch": 0.84, + "learning_rate": 1.686709629212439e-06, + "loss": 0.8965, + "step": 32924 + }, + { + "epoch": 0.84, + "learning_rate": 1.6866895144158686e-06, + "loss": 0.917, + "step": 32925 + }, + { + "epoch": 0.84, + "learning_rate": 1.6866693990935319e-06, + "loss": 0.8877, + "step": 32926 + }, + { + "epoch": 0.84, + "learning_rate": 1.686649283245444e-06, + "loss": 0.8633, + "step": 32927 + }, + { + "epoch": 0.84, + "learning_rate": 1.6866291668716202e-06, + "loss": 0.9434, + "step": 32928 + }, + { + "epoch": 0.84, + "learning_rate": 1.686609049972076e-06, + "loss": 0.8276, + "step": 32929 + }, + { + "epoch": 0.84, + "learning_rate": 1.6865889325468268e-06, + "loss": 0.6685, + "step": 32930 + }, + { + "epoch": 0.84, + "learning_rate": 1.6865688145958881e-06, + "loss": 0.6406, + "step": 32931 + }, + { + "epoch": 0.84, + "learning_rate": 1.6865486961192753e-06, + "loss": 0.6655, + "step": 32932 + }, + { + "epoch": 0.84, + "learning_rate": 1.6865285771170035e-06, + "loss": 0.7617, + "step": 32933 + }, + { + "epoch": 0.84, + "learning_rate": 1.6865084575890887e-06, + "loss": 0.9463, + "step": 32934 + }, + { + "epoch": 0.84, + "learning_rate": 1.6864883375355457e-06, + "loss": 0.8516, + "step": 32935 + }, + { + "epoch": 0.84, + "learning_rate": 1.6864682169563902e-06, + "loss": 0.8828, + "step": 32936 + }, + { + "epoch": 0.84, + "learning_rate": 1.6864480958516371e-06, + "loss": 0.8049, + "step": 32937 + }, + { + "epoch": 0.84, + "learning_rate": 1.6864279742213027e-06, + "loss": 0.8262, + "step": 32938 + }, + { + "epoch": 0.84, + "learning_rate": 1.6864078520654021e-06, + "loss": 0.8213, + "step": 32939 + }, + { + "epoch": 0.84, + "learning_rate": 1.6863877293839504e-06, + "loss": 0.7539, + "step": 32940 + }, + { + "epoch": 0.84, + "learning_rate": 1.6863676061769635e-06, + "loss": 0.7534, + "step": 32941 + }, + { + "epoch": 0.84, + "learning_rate": 1.686347482444456e-06, + "loss": 0.9746, + "step": 32942 + }, + { + "epoch": 0.84, + "learning_rate": 1.6863273581864438e-06, + "loss": 0.8174, + "step": 32943 + }, + { + "epoch": 0.84, + "learning_rate": 1.6863072334029424e-06, + "loss": 0.8125, + "step": 32944 + }, + { + "epoch": 0.84, + "learning_rate": 1.6862871080939674e-06, + "loss": 0.4692, + "step": 32945 + }, + { + "epoch": 0.84, + "learning_rate": 1.6862669822595336e-06, + "loss": 0.9492, + "step": 32946 + }, + { + "epoch": 0.84, + "learning_rate": 1.6862468558996569e-06, + "loss": 0.9443, + "step": 32947 + }, + { + "epoch": 0.84, + "learning_rate": 1.6862267290143525e-06, + "loss": 0.8301, + "step": 32948 + }, + { + "epoch": 0.84, + "learning_rate": 1.6862066016036357e-06, + "loss": 0.9546, + "step": 32949 + }, + { + "epoch": 0.84, + "learning_rate": 1.686186473667522e-06, + "loss": 0.6885, + "step": 32950 + }, + { + "epoch": 0.84, + "learning_rate": 1.6861663452060273e-06, + "loss": 0.8369, + "step": 32951 + }, + { + "epoch": 0.84, + "learning_rate": 1.6861462162191662e-06, + "loss": 0.7227, + "step": 32952 + }, + { + "epoch": 0.84, + "learning_rate": 1.6861260867069547e-06, + "loss": 0.6719, + "step": 32953 + }, + { + "epoch": 0.84, + "learning_rate": 1.6861059566694076e-06, + "loss": 0.7261, + "step": 32954 + }, + { + "epoch": 0.84, + "learning_rate": 1.6860858261065412e-06, + "loss": 0.9727, + "step": 32955 + }, + { + "epoch": 0.84, + "learning_rate": 1.68606569501837e-06, + "loss": 1.0176, + "step": 32956 + }, + { + "epoch": 0.84, + "learning_rate": 1.6860455634049102e-06, + "loss": 0.8096, + "step": 32957 + }, + { + "epoch": 0.84, + "learning_rate": 1.6860254312661768e-06, + "loss": 0.9648, + "step": 32958 + }, + { + "epoch": 0.84, + "learning_rate": 1.6860052986021854e-06, + "loss": 0.9102, + "step": 32959 + }, + { + "epoch": 0.84, + "learning_rate": 1.685985165412951e-06, + "loss": 0.6504, + "step": 32960 + }, + { + "epoch": 0.84, + "learning_rate": 1.6859650316984895e-06, + "loss": 0.8618, + "step": 32961 + }, + { + "epoch": 0.84, + "learning_rate": 1.6859448974588157e-06, + "loss": 0.9023, + "step": 32962 + }, + { + "epoch": 0.84, + "learning_rate": 1.685924762693946e-06, + "loss": 0.7427, + "step": 32963 + }, + { + "epoch": 0.84, + "learning_rate": 1.685904627403895e-06, + "loss": 0.8936, + "step": 32964 + }, + { + "epoch": 0.84, + "learning_rate": 1.6858844915886784e-06, + "loss": 0.7671, + "step": 32965 + }, + { + "epoch": 0.84, + "learning_rate": 1.6858643552483115e-06, + "loss": 0.7935, + "step": 32966 + }, + { + "epoch": 0.84, + "learning_rate": 1.6858442183828099e-06, + "loss": 1.0396, + "step": 32967 + }, + { + "epoch": 0.84, + "learning_rate": 1.6858240809921887e-06, + "loss": 0.5015, + "step": 32968 + }, + { + "epoch": 0.85, + "learning_rate": 1.6858039430764638e-06, + "loss": 0.9209, + "step": 32969 + }, + { + "epoch": 0.85, + "learning_rate": 1.6857838046356503e-06, + "loss": 1.127, + "step": 32970 + }, + { + "epoch": 0.85, + "learning_rate": 1.6857636656697638e-06, + "loss": 0.7959, + "step": 32971 + }, + { + "epoch": 0.85, + "learning_rate": 1.6857435261788192e-06, + "loss": 0.8398, + "step": 32972 + }, + { + "epoch": 0.85, + "learning_rate": 1.6857233861628327e-06, + "loss": 0.9268, + "step": 32973 + }, + { + "epoch": 0.85, + "learning_rate": 1.685703245621819e-06, + "loss": 0.7295, + "step": 32974 + }, + { + "epoch": 0.85, + "learning_rate": 1.6856831045557941e-06, + "loss": 0.8877, + "step": 32975 + }, + { + "epoch": 0.85, + "learning_rate": 1.685662962964773e-06, + "loss": 0.9961, + "step": 32976 + }, + { + "epoch": 0.85, + "learning_rate": 1.6856428208487716e-06, + "loss": 1.0312, + "step": 32977 + }, + { + "epoch": 0.85, + "learning_rate": 1.6856226782078046e-06, + "loss": 0.8877, + "step": 32978 + }, + { + "epoch": 0.85, + "learning_rate": 1.6856025350418883e-06, + "loss": 0.7644, + "step": 32979 + }, + { + "epoch": 0.85, + "learning_rate": 1.6855823913510373e-06, + "loss": 0.7227, + "step": 32980 + }, + { + "epoch": 0.85, + "learning_rate": 1.6855622471352675e-06, + "loss": 0.8848, + "step": 32981 + }, + { + "epoch": 0.85, + "learning_rate": 1.6855421023945944e-06, + "loss": 1.0703, + "step": 32982 + }, + { + "epoch": 0.85, + "learning_rate": 1.685521957129033e-06, + "loss": 0.9648, + "step": 32983 + }, + { + "epoch": 0.85, + "learning_rate": 1.6855018113385988e-06, + "loss": 0.6128, + "step": 32984 + }, + { + "epoch": 0.85, + "learning_rate": 1.6854816650233077e-06, + "loss": 0.9639, + "step": 32985 + }, + { + "epoch": 0.85, + "learning_rate": 1.6854615181831746e-06, + "loss": 1.0244, + "step": 32986 + }, + { + "epoch": 0.85, + "learning_rate": 1.6854413708182153e-06, + "loss": 1.1152, + "step": 32987 + }, + { + "epoch": 0.85, + "learning_rate": 1.685421222928445e-06, + "loss": 0.8672, + "step": 32988 + }, + { + "epoch": 0.85, + "learning_rate": 1.685401074513879e-06, + "loss": 0.7832, + "step": 32989 + }, + { + "epoch": 0.85, + "learning_rate": 1.6853809255745335e-06, + "loss": 0.6543, + "step": 32990 + }, + { + "epoch": 0.85, + "learning_rate": 1.6853607761104226e-06, + "loss": 0.7881, + "step": 32991 + }, + { + "epoch": 0.85, + "learning_rate": 1.685340626121563e-06, + "loss": 0.8008, + "step": 32992 + }, + { + "epoch": 0.85, + "learning_rate": 1.6853204756079694e-06, + "loss": 0.7383, + "step": 32993 + }, + { + "epoch": 0.85, + "learning_rate": 1.6853003245696575e-06, + "loss": 0.9893, + "step": 32994 + }, + { + "epoch": 0.85, + "learning_rate": 1.6852801730066426e-06, + "loss": 0.7168, + "step": 32995 + }, + { + "epoch": 0.85, + "learning_rate": 1.6852600209189403e-06, + "loss": 0.8623, + "step": 32996 + }, + { + "epoch": 0.85, + "learning_rate": 1.6852398683065655e-06, + "loss": 0.9941, + "step": 32997 + }, + { + "epoch": 0.85, + "learning_rate": 1.6852197151695343e-06, + "loss": 0.6924, + "step": 32998 + }, + { + "epoch": 0.85, + "learning_rate": 1.6851995615078619e-06, + "loss": 0.8154, + "step": 32999 + }, + { + "epoch": 0.85, + "learning_rate": 1.6851794073215637e-06, + "loss": 0.7725, + "step": 33000 + }, + { + "epoch": 0.85, + "learning_rate": 1.685159252610655e-06, + "loss": 0.791, + "step": 33001 + }, + { + "epoch": 0.85, + "learning_rate": 1.6851390973751515e-06, + "loss": 0.6465, + "step": 33002 + }, + { + "epoch": 0.85, + "learning_rate": 1.6851189416150687e-06, + "loss": 0.7275, + "step": 33003 + }, + { + "epoch": 0.85, + "learning_rate": 1.6850987853304215e-06, + "loss": 0.7603, + "step": 33004 + }, + { + "epoch": 0.85, + "learning_rate": 1.685078628521226e-06, + "loss": 0.8052, + "step": 33005 + }, + { + "epoch": 0.85, + "learning_rate": 1.6850584711874969e-06, + "loss": 1.1309, + "step": 33006 + }, + { + "epoch": 0.85, + "learning_rate": 1.68503831332925e-06, + "loss": 0.9556, + "step": 33007 + }, + { + "epoch": 0.85, + "learning_rate": 1.6850181549465013e-06, + "loss": 1.0557, + "step": 33008 + }, + { + "epoch": 0.85, + "learning_rate": 1.6849979960392652e-06, + "loss": 0.9238, + "step": 33009 + }, + { + "epoch": 0.85, + "learning_rate": 1.6849778366075577e-06, + "loss": 0.8906, + "step": 33010 + }, + { + "epoch": 0.85, + "learning_rate": 1.6849576766513941e-06, + "loss": 0.8467, + "step": 33011 + }, + { + "epoch": 0.85, + "learning_rate": 1.68493751617079e-06, + "loss": 0.646, + "step": 33012 + }, + { + "epoch": 0.85, + "learning_rate": 1.684917355165761e-06, + "loss": 0.9404, + "step": 33013 + }, + { + "epoch": 0.85, + "learning_rate": 1.6848971936363221e-06, + "loss": 0.8027, + "step": 33014 + }, + { + "epoch": 0.85, + "learning_rate": 1.6848770315824888e-06, + "loss": 0.7627, + "step": 33015 + }, + { + "epoch": 0.85, + "learning_rate": 1.6848568690042768e-06, + "loss": 0.9258, + "step": 33016 + }, + { + "epoch": 0.85, + "learning_rate": 1.6848367059017013e-06, + "loss": 0.8154, + "step": 33017 + }, + { + "epoch": 0.85, + "learning_rate": 1.684816542274778e-06, + "loss": 0.9072, + "step": 33018 + }, + { + "epoch": 0.85, + "learning_rate": 1.6847963781235217e-06, + "loss": 0.9854, + "step": 33019 + }, + { + "epoch": 0.85, + "learning_rate": 1.6847762134479489e-06, + "loss": 0.5991, + "step": 33020 + }, + { + "epoch": 0.85, + "learning_rate": 1.684756048248074e-06, + "loss": 0.7129, + "step": 33021 + }, + { + "epoch": 0.85, + "learning_rate": 1.684735882523913e-06, + "loss": 0.9492, + "step": 33022 + }, + { + "epoch": 0.85, + "learning_rate": 1.6847157162754814e-06, + "loss": 0.6731, + "step": 33023 + }, + { + "epoch": 0.85, + "learning_rate": 1.684695549502794e-06, + "loss": 1.0938, + "step": 33024 + }, + { + "epoch": 0.85, + "learning_rate": 1.6846753822058673e-06, + "loss": 0.7378, + "step": 33025 + }, + { + "epoch": 0.85, + "learning_rate": 1.6846552143847157e-06, + "loss": 0.8301, + "step": 33026 + }, + { + "epoch": 0.85, + "learning_rate": 1.6846350460393553e-06, + "loss": 0.9346, + "step": 33027 + }, + { + "epoch": 0.85, + "learning_rate": 1.6846148771698013e-06, + "loss": 0.9893, + "step": 33028 + }, + { + "epoch": 0.85, + "learning_rate": 1.6845947077760688e-06, + "loss": 0.8042, + "step": 33029 + }, + { + "epoch": 0.85, + "learning_rate": 1.6845745378581744e-06, + "loss": 0.7773, + "step": 33030 + }, + { + "epoch": 0.85, + "learning_rate": 1.684554367416132e-06, + "loss": 0.9111, + "step": 33031 + }, + { + "epoch": 0.85, + "learning_rate": 1.6845341964499582e-06, + "loss": 0.7764, + "step": 33032 + }, + { + "epoch": 0.85, + "learning_rate": 1.684514024959668e-06, + "loss": 0.8506, + "step": 33033 + }, + { + "epoch": 0.85, + "learning_rate": 1.6844938529452766e-06, + "loss": 0.8271, + "step": 33034 + }, + { + "epoch": 0.85, + "learning_rate": 1.6844736804068e-06, + "loss": 0.8682, + "step": 33035 + }, + { + "epoch": 0.85, + "learning_rate": 1.6844535073442534e-06, + "loss": 0.853, + "step": 33036 + }, + { + "epoch": 0.85, + "learning_rate": 1.684433333757652e-06, + "loss": 0.7705, + "step": 33037 + }, + { + "epoch": 0.85, + "learning_rate": 1.6844131596470117e-06, + "loss": 0.9111, + "step": 33038 + }, + { + "epoch": 0.85, + "learning_rate": 1.6843929850123474e-06, + "loss": 1.0742, + "step": 33039 + }, + { + "epoch": 0.85, + "learning_rate": 1.6843728098536754e-06, + "loss": 0.7861, + "step": 33040 + }, + { + "epoch": 0.85, + "learning_rate": 1.6843526341710103e-06, + "loss": 1.1553, + "step": 33041 + }, + { + "epoch": 0.85, + "learning_rate": 1.6843324579643676e-06, + "loss": 0.8789, + "step": 33042 + }, + { + "epoch": 0.85, + "learning_rate": 1.6843122812337634e-06, + "loss": 0.75, + "step": 33043 + }, + { + "epoch": 0.85, + "learning_rate": 1.6842921039792124e-06, + "loss": 0.8799, + "step": 33044 + }, + { + "epoch": 0.85, + "learning_rate": 1.6842719262007309e-06, + "loss": 1.165, + "step": 33045 + }, + { + "epoch": 0.85, + "learning_rate": 1.6842517478983334e-06, + "loss": 0.9961, + "step": 33046 + }, + { + "epoch": 0.85, + "learning_rate": 1.6842315690720359e-06, + "loss": 0.585, + "step": 33047 + }, + { + "epoch": 0.85, + "learning_rate": 1.6842113897218538e-06, + "loss": 0.8301, + "step": 33048 + }, + { + "epoch": 0.85, + "learning_rate": 1.6841912098478024e-06, + "loss": 0.7686, + "step": 33049 + }, + { + "epoch": 0.85, + "learning_rate": 1.6841710294498977e-06, + "loss": 0.9238, + "step": 33050 + }, + { + "epoch": 0.85, + "learning_rate": 1.6841508485281542e-06, + "loss": 0.6978, + "step": 33051 + }, + { + "epoch": 0.85, + "learning_rate": 1.684130667082588e-06, + "loss": 0.9678, + "step": 33052 + }, + { + "epoch": 0.85, + "learning_rate": 1.6841104851132143e-06, + "loss": 0.9258, + "step": 33053 + }, + { + "epoch": 0.85, + "learning_rate": 1.6840903026200487e-06, + "loss": 0.8008, + "step": 33054 + }, + { + "epoch": 0.85, + "learning_rate": 1.6840701196031068e-06, + "loss": 0.8726, + "step": 33055 + }, + { + "epoch": 0.85, + "learning_rate": 1.6840499360624039e-06, + "loss": 0.7959, + "step": 33056 + }, + { + "epoch": 0.85, + "learning_rate": 1.684029751997955e-06, + "loss": 0.8506, + "step": 33057 + }, + { + "epoch": 0.85, + "learning_rate": 1.6840095674097763e-06, + "loss": 0.7681, + "step": 33058 + }, + { + "epoch": 0.85, + "learning_rate": 1.6839893822978828e-06, + "loss": 0.7649, + "step": 33059 + }, + { + "epoch": 0.85, + "learning_rate": 1.6839691966622901e-06, + "loss": 0.8281, + "step": 33060 + }, + { + "epoch": 0.85, + "learning_rate": 1.683949010503014e-06, + "loss": 0.9473, + "step": 33061 + }, + { + "epoch": 0.85, + "learning_rate": 1.683928823820069e-06, + "loss": 0.9902, + "step": 33062 + }, + { + "epoch": 0.85, + "learning_rate": 1.6839086366134713e-06, + "loss": 0.7407, + "step": 33063 + }, + { + "epoch": 0.85, + "learning_rate": 1.6838884488832363e-06, + "loss": 0.8203, + "step": 33064 + }, + { + "epoch": 0.85, + "learning_rate": 1.6838682606293797e-06, + "loss": 0.9014, + "step": 33065 + }, + { + "epoch": 0.85, + "learning_rate": 1.6838480718519162e-06, + "loss": 0.793, + "step": 33066 + }, + { + "epoch": 0.85, + "learning_rate": 1.6838278825508615e-06, + "loss": 0.7197, + "step": 33067 + }, + { + "epoch": 0.85, + "learning_rate": 1.6838076927262317e-06, + "loss": 0.6079, + "step": 33068 + }, + { + "epoch": 0.85, + "learning_rate": 1.6837875023780415e-06, + "loss": 0.7148, + "step": 33069 + }, + { + "epoch": 0.85, + "learning_rate": 1.683767311506307e-06, + "loss": 0.8965, + "step": 33070 + }, + { + "epoch": 0.85, + "learning_rate": 1.683747120111043e-06, + "loss": 0.9375, + "step": 33071 + }, + { + "epoch": 0.85, + "learning_rate": 1.6837269281922652e-06, + "loss": 0.9648, + "step": 33072 + }, + { + "epoch": 0.85, + "learning_rate": 1.6837067357499893e-06, + "loss": 0.7793, + "step": 33073 + }, + { + "epoch": 0.85, + "learning_rate": 1.6836865427842303e-06, + "loss": 0.7131, + "step": 33074 + }, + { + "epoch": 0.85, + "learning_rate": 1.6836663492950045e-06, + "loss": 0.9531, + "step": 33075 + }, + { + "epoch": 0.85, + "learning_rate": 1.6836461552823266e-06, + "loss": 0.8735, + "step": 33076 + }, + { + "epoch": 0.85, + "learning_rate": 1.6836259607462119e-06, + "loss": 0.8232, + "step": 33077 + }, + { + "epoch": 0.85, + "learning_rate": 1.6836057656866766e-06, + "loss": 0.731, + "step": 33078 + }, + { + "epoch": 0.85, + "learning_rate": 1.6835855701037355e-06, + "loss": 1.0254, + "step": 33079 + }, + { + "epoch": 0.85, + "learning_rate": 1.6835653739974047e-06, + "loss": 0.686, + "step": 33080 + }, + { + "epoch": 0.85, + "learning_rate": 1.6835451773676993e-06, + "loss": 0.7408, + "step": 33081 + }, + { + "epoch": 0.85, + "learning_rate": 1.6835249802146348e-06, + "loss": 0.6836, + "step": 33082 + }, + { + "epoch": 0.85, + "learning_rate": 1.6835047825382262e-06, + "loss": 0.6543, + "step": 33083 + }, + { + "epoch": 0.85, + "learning_rate": 1.6834845843384899e-06, + "loss": 0.8091, + "step": 33084 + }, + { + "epoch": 0.85, + "learning_rate": 1.683464385615441e-06, + "loss": 0.9424, + "step": 33085 + }, + { + "epoch": 0.85, + "learning_rate": 1.6834441863690944e-06, + "loss": 0.8721, + "step": 33086 + }, + { + "epoch": 0.85, + "learning_rate": 1.6834239865994664e-06, + "loss": 0.8496, + "step": 33087 + }, + { + "epoch": 0.85, + "learning_rate": 1.6834037863065715e-06, + "loss": 0.9551, + "step": 33088 + }, + { + "epoch": 0.85, + "learning_rate": 1.6833835854904263e-06, + "loss": 0.7783, + "step": 33089 + }, + { + "epoch": 0.85, + "learning_rate": 1.6833633841510455e-06, + "loss": 0.8135, + "step": 33090 + }, + { + "epoch": 0.85, + "learning_rate": 1.683343182288445e-06, + "loss": 0.6313, + "step": 33091 + }, + { + "epoch": 0.85, + "learning_rate": 1.6833229799026397e-06, + "loss": 0.8213, + "step": 33092 + }, + { + "epoch": 0.85, + "learning_rate": 1.6833027769936456e-06, + "loss": 0.7988, + "step": 33093 + }, + { + "epoch": 0.85, + "learning_rate": 1.683282573561478e-06, + "loss": 0.9873, + "step": 33094 + }, + { + "epoch": 0.85, + "learning_rate": 1.6832623696061523e-06, + "loss": 0.7393, + "step": 33095 + }, + { + "epoch": 0.85, + "learning_rate": 1.6832421651276839e-06, + "loss": 0.6987, + "step": 33096 + }, + { + "epoch": 0.85, + "learning_rate": 1.6832219601260883e-06, + "loss": 0.9785, + "step": 33097 + }, + { + "epoch": 0.85, + "learning_rate": 1.6832017546013814e-06, + "loss": 0.8916, + "step": 33098 + }, + { + "epoch": 0.85, + "learning_rate": 1.6831815485535784e-06, + "loss": 0.7324, + "step": 33099 + }, + { + "epoch": 0.85, + "learning_rate": 1.6831613419826947e-06, + "loss": 0.729, + "step": 33100 + }, + { + "epoch": 0.85, + "learning_rate": 1.6831411348887455e-06, + "loss": 0.8213, + "step": 33101 + }, + { + "epoch": 0.85, + "learning_rate": 1.6831209272717466e-06, + "loss": 0.9209, + "step": 33102 + }, + { + "epoch": 0.85, + "learning_rate": 1.6831007191317132e-06, + "loss": 0.9404, + "step": 33103 + }, + { + "epoch": 0.85, + "learning_rate": 1.6830805104686615e-06, + "loss": 0.8926, + "step": 33104 + }, + { + "epoch": 0.85, + "learning_rate": 1.683060301282606e-06, + "loss": 0.9678, + "step": 33105 + }, + { + "epoch": 0.85, + "learning_rate": 1.683040091573563e-06, + "loss": 0.8755, + "step": 33106 + }, + { + "epoch": 0.85, + "learning_rate": 1.6830198813415472e-06, + "loss": 0.7759, + "step": 33107 + }, + { + "epoch": 0.85, + "learning_rate": 1.6829996705865749e-06, + "loss": 0.7783, + "step": 33108 + }, + { + "epoch": 0.85, + "learning_rate": 1.6829794593086609e-06, + "loss": 0.6855, + "step": 33109 + }, + { + "epoch": 0.85, + "learning_rate": 1.6829592475078211e-06, + "loss": 0.73, + "step": 33110 + }, + { + "epoch": 0.85, + "learning_rate": 1.6829390351840707e-06, + "loss": 0.9014, + "step": 33111 + }, + { + "epoch": 0.85, + "learning_rate": 1.6829188223374252e-06, + "loss": 0.7861, + "step": 33112 + }, + { + "epoch": 0.85, + "learning_rate": 1.6828986089679004e-06, + "loss": 0.7031, + "step": 33113 + }, + { + "epoch": 0.85, + "learning_rate": 1.6828783950755112e-06, + "loss": 0.7275, + "step": 33114 + }, + { + "epoch": 0.85, + "learning_rate": 1.6828581806602738e-06, + "loss": 0.9932, + "step": 33115 + }, + { + "epoch": 0.85, + "learning_rate": 1.682837965722203e-06, + "loss": 0.7563, + "step": 33116 + }, + { + "epoch": 0.85, + "learning_rate": 1.6828177502613148e-06, + "loss": 0.9473, + "step": 33117 + }, + { + "epoch": 0.85, + "learning_rate": 1.6827975342776241e-06, + "loss": 0.833, + "step": 33118 + }, + { + "epoch": 0.85, + "learning_rate": 1.6827773177711468e-06, + "loss": 0.9365, + "step": 33119 + }, + { + "epoch": 0.85, + "learning_rate": 1.6827571007418988e-06, + "loss": 0.6934, + "step": 33120 + }, + { + "epoch": 0.85, + "learning_rate": 1.6827368831898947e-06, + "loss": 0.874, + "step": 33121 + }, + { + "epoch": 0.85, + "learning_rate": 1.68271666511515e-06, + "loss": 0.9941, + "step": 33122 + }, + { + "epoch": 0.85, + "learning_rate": 1.6826964465176812e-06, + "loss": 0.8525, + "step": 33123 + }, + { + "epoch": 0.85, + "learning_rate": 1.6826762273975029e-06, + "loss": 0.9023, + "step": 33124 + }, + { + "epoch": 0.85, + "learning_rate": 1.6826560077546307e-06, + "loss": 0.9131, + "step": 33125 + }, + { + "epoch": 0.85, + "learning_rate": 1.6826357875890802e-06, + "loss": 0.7744, + "step": 33126 + }, + { + "epoch": 0.85, + "learning_rate": 1.6826155669008669e-06, + "loss": 0.7793, + "step": 33127 + }, + { + "epoch": 0.85, + "learning_rate": 1.6825953456900061e-06, + "loss": 0.793, + "step": 33128 + }, + { + "epoch": 0.85, + "learning_rate": 1.6825751239565137e-06, + "loss": 0.7681, + "step": 33129 + }, + { + "epoch": 0.85, + "learning_rate": 1.6825549017004047e-06, + "loss": 0.8477, + "step": 33130 + }, + { + "epoch": 0.85, + "learning_rate": 1.682534678921695e-06, + "loss": 0.9199, + "step": 33131 + }, + { + "epoch": 0.85, + "learning_rate": 1.6825144556203998e-06, + "loss": 0.7627, + "step": 33132 + }, + { + "epoch": 0.85, + "learning_rate": 1.6824942317965345e-06, + "loss": 0.7891, + "step": 33133 + }, + { + "epoch": 0.85, + "learning_rate": 1.6824740074501148e-06, + "loss": 0.9326, + "step": 33134 + }, + { + "epoch": 0.85, + "learning_rate": 1.6824537825811565e-06, + "loss": 0.9678, + "step": 33135 + }, + { + "epoch": 0.85, + "learning_rate": 1.6824335571896744e-06, + "loss": 0.9785, + "step": 33136 + }, + { + "epoch": 0.85, + "learning_rate": 1.682413331275684e-06, + "loss": 0.8301, + "step": 33137 + }, + { + "epoch": 0.85, + "learning_rate": 1.6823931048392014e-06, + "loss": 0.8281, + "step": 33138 + }, + { + "epoch": 0.85, + "learning_rate": 1.6823728778802419e-06, + "loss": 0.8213, + "step": 33139 + }, + { + "epoch": 0.85, + "learning_rate": 1.6823526503988208e-06, + "loss": 0.9023, + "step": 33140 + }, + { + "epoch": 0.85, + "learning_rate": 1.6823324223949537e-06, + "loss": 0.915, + "step": 33141 + }, + { + "epoch": 0.85, + "learning_rate": 1.682312193868656e-06, + "loss": 1.0244, + "step": 33142 + }, + { + "epoch": 0.85, + "learning_rate": 1.6822919648199432e-06, + "loss": 1.0049, + "step": 33143 + }, + { + "epoch": 0.85, + "learning_rate": 1.6822717352488308e-06, + "loss": 1.0215, + "step": 33144 + }, + { + "epoch": 0.85, + "learning_rate": 1.6822515051553343e-06, + "loss": 0.8232, + "step": 33145 + }, + { + "epoch": 0.85, + "learning_rate": 1.682231274539469e-06, + "loss": 0.918, + "step": 33146 + }, + { + "epoch": 0.85, + "learning_rate": 1.682211043401251e-06, + "loss": 0.7617, + "step": 33147 + }, + { + "epoch": 0.85, + "learning_rate": 1.6821908117406951e-06, + "loss": 0.6885, + "step": 33148 + }, + { + "epoch": 0.85, + "learning_rate": 1.682170579557817e-06, + "loss": 0.8613, + "step": 33149 + }, + { + "epoch": 0.85, + "learning_rate": 1.6821503468526325e-06, + "loss": 0.6475, + "step": 33150 + }, + { + "epoch": 0.85, + "learning_rate": 1.6821301136251567e-06, + "loss": 0.6631, + "step": 33151 + }, + { + "epoch": 0.85, + "learning_rate": 1.6821098798754055e-06, + "loss": 0.8555, + "step": 33152 + }, + { + "epoch": 0.85, + "learning_rate": 1.6820896456033936e-06, + "loss": 0.7539, + "step": 33153 + }, + { + "epoch": 0.85, + "learning_rate": 1.6820694108091373e-06, + "loss": 0.7744, + "step": 33154 + }, + { + "epoch": 0.85, + "learning_rate": 1.682049175492652e-06, + "loss": 0.7549, + "step": 33155 + }, + { + "epoch": 0.85, + "learning_rate": 1.6820289396539526e-06, + "loss": 1.0459, + "step": 33156 + }, + { + "epoch": 0.85, + "learning_rate": 1.6820087032930555e-06, + "loss": 0.7656, + "step": 33157 + }, + { + "epoch": 0.85, + "learning_rate": 1.6819884664099752e-06, + "loss": 1.0586, + "step": 33158 + }, + { + "epoch": 0.85, + "learning_rate": 1.681968229004728e-06, + "loss": 0.915, + "step": 33159 + }, + { + "epoch": 0.85, + "learning_rate": 1.681947991077329e-06, + "loss": 0.9492, + "step": 33160 + }, + { + "epoch": 0.85, + "learning_rate": 1.6819277526277937e-06, + "loss": 0.9062, + "step": 33161 + }, + { + "epoch": 0.85, + "learning_rate": 1.6819075136561377e-06, + "loss": 1.0029, + "step": 33162 + }, + { + "epoch": 0.85, + "learning_rate": 1.6818872741623764e-06, + "loss": 0.8159, + "step": 33163 + }, + { + "epoch": 0.85, + "learning_rate": 1.6818670341465255e-06, + "loss": 0.7871, + "step": 33164 + }, + { + "epoch": 0.85, + "learning_rate": 1.6818467936086007e-06, + "loss": 0.8281, + "step": 33165 + }, + { + "epoch": 0.85, + "learning_rate": 1.6818265525486166e-06, + "loss": 0.8115, + "step": 33166 + }, + { + "epoch": 0.85, + "learning_rate": 1.6818063109665897e-06, + "loss": 0.6548, + "step": 33167 + }, + { + "epoch": 0.85, + "learning_rate": 1.6817860688625345e-06, + "loss": 0.8984, + "step": 33168 + }, + { + "epoch": 0.85, + "learning_rate": 1.6817658262364675e-06, + "loss": 0.707, + "step": 33169 + }, + { + "epoch": 0.85, + "learning_rate": 1.6817455830884038e-06, + "loss": 0.917, + "step": 33170 + }, + { + "epoch": 0.85, + "learning_rate": 1.6817253394183587e-06, + "loss": 0.874, + "step": 33171 + }, + { + "epoch": 0.85, + "learning_rate": 1.6817050952263476e-06, + "loss": 0.9023, + "step": 33172 + }, + { + "epoch": 0.85, + "learning_rate": 1.6816848505123866e-06, + "loss": 0.8389, + "step": 33173 + }, + { + "epoch": 0.85, + "learning_rate": 1.6816646052764906e-06, + "loss": 0.9404, + "step": 33174 + }, + { + "epoch": 0.85, + "learning_rate": 1.681644359518676e-06, + "loss": 0.9727, + "step": 33175 + }, + { + "epoch": 0.85, + "learning_rate": 1.6816241132389571e-06, + "loss": 0.6934, + "step": 33176 + }, + { + "epoch": 0.85, + "learning_rate": 1.6816038664373498e-06, + "loss": 0.7507, + "step": 33177 + }, + { + "epoch": 0.85, + "learning_rate": 1.6815836191138701e-06, + "loss": 0.7729, + "step": 33178 + }, + { + "epoch": 0.85, + "learning_rate": 1.6815633712685329e-06, + "loss": 0.8086, + "step": 33179 + }, + { + "epoch": 0.85, + "learning_rate": 1.6815431229013543e-06, + "loss": 0.71, + "step": 33180 + }, + { + "epoch": 0.85, + "learning_rate": 1.6815228740123492e-06, + "loss": 0.8608, + "step": 33181 + }, + { + "epoch": 0.85, + "learning_rate": 1.6815026246015335e-06, + "loss": 0.7344, + "step": 33182 + }, + { + "epoch": 0.85, + "learning_rate": 1.6814823746689224e-06, + "loss": 0.7432, + "step": 33183 + }, + { + "epoch": 0.85, + "learning_rate": 1.6814621242145318e-06, + "loss": 0.8691, + "step": 33184 + }, + { + "epoch": 0.85, + "learning_rate": 1.681441873238377e-06, + "loss": 0.5488, + "step": 33185 + }, + { + "epoch": 0.85, + "learning_rate": 1.6814216217404735e-06, + "loss": 0.8955, + "step": 33186 + }, + { + "epoch": 0.85, + "learning_rate": 1.6814013697208366e-06, + "loss": 0.7581, + "step": 33187 + }, + { + "epoch": 0.85, + "learning_rate": 1.681381117179482e-06, + "loss": 0.9512, + "step": 33188 + }, + { + "epoch": 0.85, + "learning_rate": 1.6813608641164251e-06, + "loss": 0.9043, + "step": 33189 + }, + { + "epoch": 0.85, + "learning_rate": 1.681340610531682e-06, + "loss": 0.8809, + "step": 33190 + }, + { + "epoch": 0.85, + "learning_rate": 1.6813203564252673e-06, + "loss": 1.0215, + "step": 33191 + }, + { + "epoch": 0.85, + "learning_rate": 1.6813001017971973e-06, + "loss": 0.7627, + "step": 33192 + }, + { + "epoch": 0.85, + "learning_rate": 1.6812798466474869e-06, + "loss": 0.8882, + "step": 33193 + }, + { + "epoch": 0.85, + "learning_rate": 1.6812595909761517e-06, + "loss": 0.7344, + "step": 33194 + }, + { + "epoch": 0.85, + "learning_rate": 1.6812393347832078e-06, + "loss": 0.7754, + "step": 33195 + }, + { + "epoch": 0.85, + "learning_rate": 1.6812190780686699e-06, + "loss": 0.8457, + "step": 33196 + }, + { + "epoch": 0.85, + "learning_rate": 1.681198820832554e-06, + "loss": 1.0049, + "step": 33197 + }, + { + "epoch": 0.85, + "learning_rate": 1.6811785630748753e-06, + "loss": 0.6338, + "step": 33198 + }, + { + "epoch": 0.85, + "learning_rate": 1.6811583047956496e-06, + "loss": 0.6562, + "step": 33199 + }, + { + "epoch": 0.85, + "learning_rate": 1.6811380459948924e-06, + "loss": 0.7144, + "step": 33200 + }, + { + "epoch": 0.85, + "learning_rate": 1.6811177866726191e-06, + "loss": 0.7598, + "step": 33201 + }, + { + "epoch": 0.85, + "learning_rate": 1.6810975268288453e-06, + "loss": 1.0488, + "step": 33202 + }, + { + "epoch": 0.85, + "learning_rate": 1.6810772664635864e-06, + "loss": 0.9961, + "step": 33203 + }, + { + "epoch": 0.85, + "learning_rate": 1.681057005576858e-06, + "loss": 0.8359, + "step": 33204 + }, + { + "epoch": 0.85, + "learning_rate": 1.6810367441686751e-06, + "loss": 0.8447, + "step": 33205 + }, + { + "epoch": 0.85, + "learning_rate": 1.6810164822390542e-06, + "loss": 0.582, + "step": 33206 + }, + { + "epoch": 0.85, + "learning_rate": 1.68099621978801e-06, + "loss": 0.8047, + "step": 33207 + }, + { + "epoch": 0.85, + "learning_rate": 1.6809759568155586e-06, + "loss": 0.9658, + "step": 33208 + }, + { + "epoch": 0.85, + "learning_rate": 1.680955693321715e-06, + "loss": 0.9199, + "step": 33209 + }, + { + "epoch": 0.85, + "learning_rate": 1.680935429306495e-06, + "loss": 0.6914, + "step": 33210 + }, + { + "epoch": 0.85, + "learning_rate": 1.6809151647699142e-06, + "loss": 0.7314, + "step": 33211 + }, + { + "epoch": 0.85, + "learning_rate": 1.6808948997119878e-06, + "loss": 0.8447, + "step": 33212 + }, + { + "epoch": 0.85, + "learning_rate": 1.6808746341327313e-06, + "loss": 0.6143, + "step": 33213 + }, + { + "epoch": 0.85, + "learning_rate": 1.6808543680321607e-06, + "loss": 0.9023, + "step": 33214 + }, + { + "epoch": 0.85, + "learning_rate": 1.6808341014102911e-06, + "loss": 1.0264, + "step": 33215 + }, + { + "epoch": 0.85, + "learning_rate": 1.6808138342671384e-06, + "loss": 0.7598, + "step": 33216 + }, + { + "epoch": 0.85, + "learning_rate": 1.6807935666027175e-06, + "loss": 0.9209, + "step": 33217 + }, + { + "epoch": 0.85, + "learning_rate": 1.6807732984170443e-06, + "loss": 1.0049, + "step": 33218 + }, + { + "epoch": 0.85, + "learning_rate": 1.6807530297101345e-06, + "loss": 0.7026, + "step": 33219 + }, + { + "epoch": 0.85, + "learning_rate": 1.6807327604820031e-06, + "loss": 0.792, + "step": 33220 + }, + { + "epoch": 0.85, + "learning_rate": 1.6807124907326662e-06, + "loss": 1.0156, + "step": 33221 + }, + { + "epoch": 0.85, + "learning_rate": 1.6806922204621388e-06, + "loss": 0.8369, + "step": 33222 + }, + { + "epoch": 0.85, + "learning_rate": 1.680671949670437e-06, + "loss": 0.8574, + "step": 33223 + }, + { + "epoch": 0.85, + "learning_rate": 1.6806516783575757e-06, + "loss": 0.9097, + "step": 33224 + }, + { + "epoch": 0.85, + "learning_rate": 1.6806314065235708e-06, + "loss": 1.0117, + "step": 33225 + }, + { + "epoch": 0.85, + "learning_rate": 1.6806111341684378e-06, + "loss": 1.0801, + "step": 33226 + }, + { + "epoch": 0.85, + "learning_rate": 1.6805908612921919e-06, + "loss": 0.9609, + "step": 33227 + }, + { + "epoch": 0.85, + "learning_rate": 1.680570587894849e-06, + "loss": 0.8115, + "step": 33228 + }, + { + "epoch": 0.85, + "learning_rate": 1.6805503139764248e-06, + "loss": 0.8906, + "step": 33229 + }, + { + "epoch": 0.85, + "learning_rate": 1.6805300395369342e-06, + "loss": 0.7266, + "step": 33230 + }, + { + "epoch": 0.85, + "learning_rate": 1.680509764576393e-06, + "loss": 0.9287, + "step": 33231 + }, + { + "epoch": 0.85, + "learning_rate": 1.680489489094817e-06, + "loss": 0.7158, + "step": 33232 + }, + { + "epoch": 0.85, + "learning_rate": 1.6804692130922212e-06, + "loss": 0.7407, + "step": 33233 + }, + { + "epoch": 0.85, + "learning_rate": 1.6804489365686218e-06, + "loss": 0.9541, + "step": 33234 + }, + { + "epoch": 0.85, + "learning_rate": 1.6804286595240336e-06, + "loss": 0.751, + "step": 33235 + }, + { + "epoch": 0.85, + "learning_rate": 1.6804083819584727e-06, + "loss": 0.9629, + "step": 33236 + }, + { + "epoch": 0.85, + "learning_rate": 1.6803881038719543e-06, + "loss": 0.8926, + "step": 33237 + }, + { + "epoch": 0.85, + "learning_rate": 1.6803678252644938e-06, + "loss": 0.8525, + "step": 33238 + }, + { + "epoch": 0.85, + "learning_rate": 1.680347546136107e-06, + "loss": 0.6763, + "step": 33239 + }, + { + "epoch": 0.85, + "learning_rate": 1.6803272664868096e-06, + "loss": 0.751, + "step": 33240 + }, + { + "epoch": 0.85, + "learning_rate": 1.6803069863166169e-06, + "loss": 0.7988, + "step": 33241 + }, + { + "epoch": 0.85, + "learning_rate": 1.6802867056255444e-06, + "loss": 0.9204, + "step": 33242 + }, + { + "epoch": 0.85, + "learning_rate": 1.6802664244136072e-06, + "loss": 0.8428, + "step": 33243 + }, + { + "epoch": 0.85, + "learning_rate": 1.6802461426808217e-06, + "loss": 0.8276, + "step": 33244 + }, + { + "epoch": 0.85, + "learning_rate": 1.6802258604272028e-06, + "loss": 0.9004, + "step": 33245 + }, + { + "epoch": 0.85, + "learning_rate": 1.6802055776527664e-06, + "loss": 0.583, + "step": 33246 + }, + { + "epoch": 0.85, + "learning_rate": 1.6801852943575278e-06, + "loss": 0.9385, + "step": 33247 + }, + { + "epoch": 0.85, + "learning_rate": 1.6801650105415028e-06, + "loss": 0.9316, + "step": 33248 + }, + { + "epoch": 0.85, + "learning_rate": 1.6801447262047065e-06, + "loss": 0.7104, + "step": 33249 + }, + { + "epoch": 0.85, + "learning_rate": 1.6801244413471548e-06, + "loss": 0.8486, + "step": 33250 + }, + { + "epoch": 0.85, + "learning_rate": 1.680104155968863e-06, + "loss": 0.8867, + "step": 33251 + }, + { + "epoch": 0.85, + "learning_rate": 1.6800838700698465e-06, + "loss": 0.9092, + "step": 33252 + }, + { + "epoch": 0.85, + "learning_rate": 1.6800635836501214e-06, + "loss": 0.8369, + "step": 33253 + }, + { + "epoch": 0.85, + "learning_rate": 1.680043296709703e-06, + "loss": 0.9355, + "step": 33254 + }, + { + "epoch": 0.85, + "learning_rate": 1.6800230092486062e-06, + "loss": 0.833, + "step": 33255 + }, + { + "epoch": 0.85, + "learning_rate": 1.6800027212668476e-06, + "loss": 0.7441, + "step": 33256 + }, + { + "epoch": 0.85, + "learning_rate": 1.6799824327644417e-06, + "loss": 0.8389, + "step": 33257 + }, + { + "epoch": 0.85, + "learning_rate": 1.6799621437414046e-06, + "loss": 0.9277, + "step": 33258 + }, + { + "epoch": 0.85, + "learning_rate": 1.6799418541977521e-06, + "loss": 0.8242, + "step": 33259 + }, + { + "epoch": 0.85, + "learning_rate": 1.6799215641334993e-06, + "loss": 0.8945, + "step": 33260 + }, + { + "epoch": 0.85, + "learning_rate": 1.6799012735486614e-06, + "loss": 0.9219, + "step": 33261 + }, + { + "epoch": 0.85, + "learning_rate": 1.6798809824432547e-06, + "loss": 0.9707, + "step": 33262 + }, + { + "epoch": 0.85, + "learning_rate": 1.6798606908172944e-06, + "loss": 0.8154, + "step": 33263 + }, + { + "epoch": 0.85, + "learning_rate": 1.6798403986707959e-06, + "loss": 0.709, + "step": 33264 + }, + { + "epoch": 0.85, + "learning_rate": 1.6798201060037749e-06, + "loss": 0.8877, + "step": 33265 + }, + { + "epoch": 0.85, + "learning_rate": 1.679799812816247e-06, + "loss": 0.3755, + "step": 33266 + }, + { + "epoch": 0.85, + "learning_rate": 1.6797795191082276e-06, + "loss": 0.8027, + "step": 33267 + }, + { + "epoch": 0.85, + "learning_rate": 1.6797592248797323e-06, + "loss": 0.8984, + "step": 33268 + }, + { + "epoch": 0.85, + "learning_rate": 1.6797389301307766e-06, + "loss": 1.0361, + "step": 33269 + }, + { + "epoch": 0.85, + "learning_rate": 1.6797186348613758e-06, + "loss": 0.8281, + "step": 33270 + }, + { + "epoch": 0.85, + "learning_rate": 1.6796983390715461e-06, + "loss": 0.8125, + "step": 33271 + }, + { + "epoch": 0.85, + "learning_rate": 1.6796780427613024e-06, + "loss": 0.9863, + "step": 33272 + }, + { + "epoch": 0.85, + "learning_rate": 1.6796577459306604e-06, + "loss": 0.8379, + "step": 33273 + }, + { + "epoch": 0.85, + "learning_rate": 1.6796374485796362e-06, + "loss": 0.853, + "step": 33274 + }, + { + "epoch": 0.85, + "learning_rate": 1.6796171507082444e-06, + "loss": 0.8848, + "step": 33275 + }, + { + "epoch": 0.85, + "learning_rate": 1.6795968523165008e-06, + "loss": 0.8428, + "step": 33276 + }, + { + "epoch": 0.85, + "learning_rate": 1.6795765534044218e-06, + "loss": 0.9375, + "step": 33277 + }, + { + "epoch": 0.85, + "learning_rate": 1.6795562539720218e-06, + "loss": 0.7969, + "step": 33278 + }, + { + "epoch": 0.85, + "learning_rate": 1.679535954019317e-06, + "loss": 0.917, + "step": 33279 + }, + { + "epoch": 0.85, + "learning_rate": 1.6795156535463226e-06, + "loss": 0.9771, + "step": 33280 + }, + { + "epoch": 0.85, + "learning_rate": 1.6794953525530543e-06, + "loss": 0.876, + "step": 33281 + }, + { + "epoch": 0.85, + "learning_rate": 1.6794750510395278e-06, + "loss": 0.6279, + "step": 33282 + }, + { + "epoch": 0.85, + "learning_rate": 1.6794547490057584e-06, + "loss": 0.5913, + "step": 33283 + }, + { + "epoch": 0.85, + "learning_rate": 1.6794344464517622e-06, + "loss": 0.6807, + "step": 33284 + }, + { + "epoch": 0.85, + "learning_rate": 1.6794141433775536e-06, + "loss": 0.8994, + "step": 33285 + }, + { + "epoch": 0.85, + "learning_rate": 1.6793938397831493e-06, + "loss": 1.0391, + "step": 33286 + }, + { + "epoch": 0.85, + "learning_rate": 1.6793735356685642e-06, + "loss": 0.7295, + "step": 33287 + }, + { + "epoch": 0.85, + "learning_rate": 1.679353231033814e-06, + "loss": 0.8076, + "step": 33288 + }, + { + "epoch": 0.85, + "learning_rate": 1.6793329258789145e-06, + "loss": 0.8486, + "step": 33289 + }, + { + "epoch": 0.85, + "learning_rate": 1.6793126202038806e-06, + "loss": 0.8132, + "step": 33290 + }, + { + "epoch": 0.85, + "learning_rate": 1.6792923140087285e-06, + "loss": 0.8467, + "step": 33291 + }, + { + "epoch": 0.85, + "learning_rate": 1.6792720072934734e-06, + "loss": 0.918, + "step": 33292 + }, + { + "epoch": 0.85, + "learning_rate": 1.6792517000581313e-06, + "loss": 0.9561, + "step": 33293 + }, + { + "epoch": 0.85, + "learning_rate": 1.679231392302717e-06, + "loss": 0.8306, + "step": 33294 + }, + { + "epoch": 0.85, + "learning_rate": 1.6792110840272464e-06, + "loss": 0.7542, + "step": 33295 + }, + { + "epoch": 0.85, + "learning_rate": 1.6791907752317353e-06, + "loss": 0.6335, + "step": 33296 + }, + { + "epoch": 0.85, + "learning_rate": 1.6791704659161992e-06, + "loss": 0.7988, + "step": 33297 + }, + { + "epoch": 0.85, + "learning_rate": 1.6791501560806532e-06, + "loss": 0.7451, + "step": 33298 + }, + { + "epoch": 0.85, + "learning_rate": 1.6791298457251135e-06, + "loss": 0.9902, + "step": 33299 + }, + { + "epoch": 0.85, + "learning_rate": 1.6791095348495952e-06, + "loss": 0.9248, + "step": 33300 + }, + { + "epoch": 0.85, + "learning_rate": 1.6790892234541135e-06, + "loss": 0.9844, + "step": 33301 + }, + { + "epoch": 0.85, + "learning_rate": 1.679068911538685e-06, + "loss": 0.8154, + "step": 33302 + }, + { + "epoch": 0.85, + "learning_rate": 1.6790485991033246e-06, + "loss": 0.6509, + "step": 33303 + }, + { + "epoch": 0.85, + "learning_rate": 1.6790282861480476e-06, + "loss": 0.8652, + "step": 33304 + }, + { + "epoch": 0.85, + "learning_rate": 1.6790079726728701e-06, + "loss": 0.8857, + "step": 33305 + }, + { + "epoch": 0.85, + "learning_rate": 1.6789876586778073e-06, + "loss": 0.7856, + "step": 33306 + }, + { + "epoch": 0.85, + "learning_rate": 1.678967344162875e-06, + "loss": 0.9023, + "step": 33307 + }, + { + "epoch": 0.85, + "learning_rate": 1.6789470291280883e-06, + "loss": 1.0332, + "step": 33308 + }, + { + "epoch": 0.85, + "learning_rate": 1.6789267135734635e-06, + "loss": 0.9043, + "step": 33309 + }, + { + "epoch": 0.85, + "learning_rate": 1.6789063974990154e-06, + "loss": 0.585, + "step": 33310 + }, + { + "epoch": 0.85, + "learning_rate": 1.67888608090476e-06, + "loss": 0.8901, + "step": 33311 + }, + { + "epoch": 0.85, + "learning_rate": 1.6788657637907128e-06, + "loss": 0.8667, + "step": 33312 + }, + { + "epoch": 0.85, + "learning_rate": 1.6788454461568896e-06, + "loss": 0.8633, + "step": 33313 + }, + { + "epoch": 0.85, + "learning_rate": 1.678825128003305e-06, + "loss": 0.9668, + "step": 33314 + }, + { + "epoch": 0.85, + "learning_rate": 1.6788048093299756e-06, + "loss": 0.5161, + "step": 33315 + }, + { + "epoch": 0.85, + "learning_rate": 1.6787844901369165e-06, + "loss": 1.0068, + "step": 33316 + }, + { + "epoch": 0.85, + "learning_rate": 1.6787641704241432e-06, + "loss": 0.707, + "step": 33317 + }, + { + "epoch": 0.85, + "learning_rate": 1.6787438501916714e-06, + "loss": 0.8232, + "step": 33318 + }, + { + "epoch": 0.85, + "learning_rate": 1.6787235294395172e-06, + "loss": 0.71, + "step": 33319 + }, + { + "epoch": 0.85, + "learning_rate": 1.678703208167695e-06, + "loss": 0.7375, + "step": 33320 + }, + { + "epoch": 0.85, + "learning_rate": 1.678682886376221e-06, + "loss": 0.5332, + "step": 33321 + }, + { + "epoch": 0.85, + "learning_rate": 1.678662564065111e-06, + "loss": 0.5955, + "step": 33322 + }, + { + "epoch": 0.85, + "learning_rate": 1.67864224123438e-06, + "loss": 0.8965, + "step": 33323 + }, + { + "epoch": 0.85, + "learning_rate": 1.6786219178840442e-06, + "loss": 0.8994, + "step": 33324 + }, + { + "epoch": 0.85, + "learning_rate": 1.6786015940141185e-06, + "loss": 0.71, + "step": 33325 + }, + { + "epoch": 0.85, + "learning_rate": 1.6785812696246189e-06, + "loss": 0.8076, + "step": 33326 + }, + { + "epoch": 0.85, + "learning_rate": 1.6785609447155606e-06, + "loss": 0.7991, + "step": 33327 + }, + { + "epoch": 0.85, + "learning_rate": 1.6785406192869595e-06, + "loss": 0.7686, + "step": 33328 + }, + { + "epoch": 0.85, + "learning_rate": 1.678520293338831e-06, + "loss": 0.7979, + "step": 33329 + }, + { + "epoch": 0.85, + "learning_rate": 1.678499966871191e-06, + "loss": 0.5913, + "step": 33330 + }, + { + "epoch": 0.85, + "learning_rate": 1.6784796398840547e-06, + "loss": 0.9912, + "step": 33331 + }, + { + "epoch": 0.85, + "learning_rate": 1.6784593123774376e-06, + "loss": 0.7812, + "step": 33332 + }, + { + "epoch": 0.85, + "learning_rate": 1.6784389843513553e-06, + "loss": 0.8271, + "step": 33333 + }, + { + "epoch": 0.85, + "learning_rate": 1.6784186558058236e-06, + "loss": 0.6426, + "step": 33334 + }, + { + "epoch": 0.85, + "learning_rate": 1.678398326740858e-06, + "loss": 0.8594, + "step": 33335 + }, + { + "epoch": 0.85, + "learning_rate": 1.6783779971564737e-06, + "loss": 0.8105, + "step": 33336 + }, + { + "epoch": 0.85, + "learning_rate": 1.6783576670526869e-06, + "loss": 0.8984, + "step": 33337 + }, + { + "epoch": 0.85, + "learning_rate": 1.6783373364295126e-06, + "loss": 0.8584, + "step": 33338 + }, + { + "epoch": 0.85, + "learning_rate": 1.6783170052869668e-06, + "loss": 0.6719, + "step": 33339 + }, + { + "epoch": 0.85, + "learning_rate": 1.6782966736250648e-06, + "loss": 0.8203, + "step": 33340 + }, + { + "epoch": 0.85, + "learning_rate": 1.678276341443822e-06, + "loss": 0.7598, + "step": 33341 + }, + { + "epoch": 0.85, + "learning_rate": 1.6782560087432544e-06, + "loss": 0.9834, + "step": 33342 + }, + { + "epoch": 0.85, + "learning_rate": 1.6782356755233772e-06, + "loss": 0.8525, + "step": 33343 + }, + { + "epoch": 0.85, + "learning_rate": 1.6782153417842063e-06, + "loss": 0.728, + "step": 33344 + }, + { + "epoch": 0.85, + "learning_rate": 1.6781950075257572e-06, + "loss": 0.8896, + "step": 33345 + }, + { + "epoch": 0.85, + "learning_rate": 1.678174672748045e-06, + "loss": 1.0469, + "step": 33346 + }, + { + "epoch": 0.85, + "learning_rate": 1.678154337451086e-06, + "loss": 0.6934, + "step": 33347 + }, + { + "epoch": 0.85, + "learning_rate": 1.6781340016348953e-06, + "loss": 0.9082, + "step": 33348 + }, + { + "epoch": 0.85, + "learning_rate": 1.6781136652994886e-06, + "loss": 0.7231, + "step": 33349 + }, + { + "epoch": 0.85, + "learning_rate": 1.6780933284448814e-06, + "loss": 0.8418, + "step": 33350 + }, + { + "epoch": 0.85, + "learning_rate": 1.6780729910710894e-06, + "loss": 0.5332, + "step": 33351 + }, + { + "epoch": 0.85, + "learning_rate": 1.6780526531781278e-06, + "loss": 0.9795, + "step": 33352 + }, + { + "epoch": 0.85, + "learning_rate": 1.6780323147660127e-06, + "loss": 0.999, + "step": 33353 + }, + { + "epoch": 0.85, + "learning_rate": 1.6780119758347592e-06, + "loss": 0.8115, + "step": 33354 + }, + { + "epoch": 0.85, + "learning_rate": 1.6779916363843834e-06, + "loss": 0.8037, + "step": 33355 + }, + { + "epoch": 0.85, + "learning_rate": 1.6779712964149004e-06, + "loss": 0.8867, + "step": 33356 + }, + { + "epoch": 0.85, + "learning_rate": 1.6779509559263262e-06, + "loss": 0.9023, + "step": 33357 + }, + { + "epoch": 0.85, + "learning_rate": 1.6779306149186758e-06, + "loss": 0.791, + "step": 33358 + }, + { + "epoch": 0.86, + "learning_rate": 1.6779102733919653e-06, + "loss": 0.9678, + "step": 33359 + }, + { + "epoch": 0.86, + "learning_rate": 1.67788993134621e-06, + "loss": 0.6895, + "step": 33360 + }, + { + "epoch": 0.86, + "learning_rate": 1.6778695887814257e-06, + "loss": 0.875, + "step": 33361 + }, + { + "epoch": 0.86, + "learning_rate": 1.6778492456976276e-06, + "loss": 0.999, + "step": 33362 + }, + { + "epoch": 0.86, + "learning_rate": 1.6778289020948316e-06, + "loss": 1.0293, + "step": 33363 + }, + { + "epoch": 0.86, + "learning_rate": 1.6778085579730533e-06, + "loss": 0.9482, + "step": 33364 + }, + { + "epoch": 0.86, + "learning_rate": 1.6777882133323077e-06, + "loss": 0.8486, + "step": 33365 + }, + { + "epoch": 0.86, + "learning_rate": 1.6777678681726113e-06, + "loss": 0.6895, + "step": 33366 + }, + { + "epoch": 0.86, + "learning_rate": 1.6777475224939793e-06, + "loss": 0.77, + "step": 33367 + }, + { + "epoch": 0.86, + "learning_rate": 1.6777271762964268e-06, + "loss": 0.832, + "step": 33368 + }, + { + "epoch": 0.86, + "learning_rate": 1.6777068295799702e-06, + "loss": 0.915, + "step": 33369 + }, + { + "epoch": 0.86, + "learning_rate": 1.6776864823446242e-06, + "loss": 0.811, + "step": 33370 + }, + { + "epoch": 0.86, + "learning_rate": 1.6776661345904049e-06, + "loss": 0.7017, + "step": 33371 + }, + { + "epoch": 0.86, + "learning_rate": 1.6776457863173277e-06, + "loss": 0.6433, + "step": 33372 + }, + { + "epoch": 0.86, + "learning_rate": 1.6776254375254087e-06, + "loss": 0.9736, + "step": 33373 + }, + { + "epoch": 0.86, + "learning_rate": 1.6776050882146628e-06, + "loss": 0.8145, + "step": 33374 + }, + { + "epoch": 0.86, + "learning_rate": 1.6775847383851058e-06, + "loss": 0.6987, + "step": 33375 + }, + { + "epoch": 0.86, + "learning_rate": 1.6775643880367534e-06, + "loss": 0.835, + "step": 33376 + }, + { + "epoch": 0.86, + "learning_rate": 1.677544037169621e-06, + "loss": 0.6592, + "step": 33377 + }, + { + "epoch": 0.86, + "learning_rate": 1.6775236857837243e-06, + "loss": 0.6748, + "step": 33378 + }, + { + "epoch": 0.86, + "learning_rate": 1.6775033338790791e-06, + "loss": 0.8242, + "step": 33379 + }, + { + "epoch": 0.86, + "learning_rate": 1.6774829814557006e-06, + "loss": 0.6904, + "step": 33380 + }, + { + "epoch": 0.86, + "learning_rate": 1.6774626285136043e-06, + "loss": 0.7246, + "step": 33381 + }, + { + "epoch": 0.86, + "learning_rate": 1.6774422750528063e-06, + "loss": 0.793, + "step": 33382 + }, + { + "epoch": 0.86, + "learning_rate": 1.6774219210733217e-06, + "loss": 0.834, + "step": 33383 + }, + { + "epoch": 0.86, + "learning_rate": 1.677401566575167e-06, + "loss": 0.8174, + "step": 33384 + }, + { + "epoch": 0.86, + "learning_rate": 1.677381211558356e-06, + "loss": 0.8281, + "step": 33385 + }, + { + "epoch": 0.86, + "learning_rate": 1.677360856022906e-06, + "loss": 0.833, + "step": 33386 + }, + { + "epoch": 0.86, + "learning_rate": 1.6773404999688317e-06, + "loss": 0.7412, + "step": 33387 + }, + { + "epoch": 0.86, + "learning_rate": 1.677320143396149e-06, + "loss": 0.792, + "step": 33388 + }, + { + "epoch": 0.86, + "learning_rate": 1.6772997863048737e-06, + "loss": 0.7031, + "step": 33389 + }, + { + "epoch": 0.86, + "learning_rate": 1.6772794286950207e-06, + "loss": 0.9229, + "step": 33390 + }, + { + "epoch": 0.86, + "learning_rate": 1.6772590705666062e-06, + "loss": 0.8154, + "step": 33391 + }, + { + "epoch": 0.86, + "learning_rate": 1.6772387119196454e-06, + "loss": 0.6592, + "step": 33392 + }, + { + "epoch": 0.86, + "learning_rate": 1.6772183527541542e-06, + "loss": 0.7715, + "step": 33393 + }, + { + "epoch": 0.86, + "learning_rate": 1.677197993070148e-06, + "loss": 1.335, + "step": 33394 + }, + { + "epoch": 0.86, + "learning_rate": 1.677177632867642e-06, + "loss": 0.6533, + "step": 33395 + }, + { + "epoch": 0.86, + "learning_rate": 1.677157272146653e-06, + "loss": 0.9365, + "step": 33396 + }, + { + "epoch": 0.86, + "learning_rate": 1.6771369109071954e-06, + "loss": 0.7124, + "step": 33397 + }, + { + "epoch": 0.86, + "learning_rate": 1.6771165491492851e-06, + "loss": 0.8945, + "step": 33398 + }, + { + "epoch": 0.86, + "learning_rate": 1.6770961868729381e-06, + "loss": 0.8779, + "step": 33399 + }, + { + "epoch": 0.86, + "learning_rate": 1.6770758240781695e-06, + "loss": 0.7217, + "step": 33400 + }, + { + "epoch": 0.86, + "learning_rate": 1.677055460764995e-06, + "loss": 0.8096, + "step": 33401 + }, + { + "epoch": 0.86, + "learning_rate": 1.6770350969334303e-06, + "loss": 0.8164, + "step": 33402 + }, + { + "epoch": 0.86, + "learning_rate": 1.677014732583491e-06, + "loss": 0.8203, + "step": 33403 + }, + { + "epoch": 0.86, + "learning_rate": 1.6769943677151927e-06, + "loss": 0.9692, + "step": 33404 + }, + { + "epoch": 0.86, + "learning_rate": 1.676974002328551e-06, + "loss": 0.7939, + "step": 33405 + }, + { + "epoch": 0.86, + "learning_rate": 1.6769536364235814e-06, + "loss": 0.9336, + "step": 33406 + }, + { + "epoch": 0.86, + "learning_rate": 1.6769332700002994e-06, + "loss": 0.7109, + "step": 33407 + }, + { + "epoch": 0.86, + "learning_rate": 1.6769129030587209e-06, + "loss": 0.728, + "step": 33408 + }, + { + "epoch": 0.86, + "learning_rate": 1.6768925355988613e-06, + "loss": 0.8345, + "step": 33409 + }, + { + "epoch": 0.86, + "learning_rate": 1.6768721676207357e-06, + "loss": 0.8555, + "step": 33410 + }, + { + "epoch": 0.86, + "learning_rate": 1.676851799124361e-06, + "loss": 0.9521, + "step": 33411 + }, + { + "epoch": 0.86, + "learning_rate": 1.6768314301097514e-06, + "loss": 1.0361, + "step": 33412 + }, + { + "epoch": 0.86, + "learning_rate": 1.6768110605769233e-06, + "loss": 0.795, + "step": 33413 + }, + { + "epoch": 0.86, + "learning_rate": 1.6767906905258924e-06, + "loss": 0.6631, + "step": 33414 + }, + { + "epoch": 0.86, + "learning_rate": 1.6767703199566733e-06, + "loss": 0.7822, + "step": 33415 + }, + { + "epoch": 0.86, + "learning_rate": 1.676749948869283e-06, + "loss": 0.6885, + "step": 33416 + }, + { + "epoch": 0.86, + "learning_rate": 1.676729577263736e-06, + "loss": 0.9277, + "step": 33417 + }, + { + "epoch": 0.86, + "learning_rate": 1.6767092051400482e-06, + "loss": 0.7983, + "step": 33418 + }, + { + "epoch": 0.86, + "learning_rate": 1.6766888324982355e-06, + "loss": 0.8223, + "step": 33419 + }, + { + "epoch": 0.86, + "learning_rate": 1.6766684593383134e-06, + "loss": 0.8799, + "step": 33420 + }, + { + "epoch": 0.86, + "learning_rate": 1.6766480856602971e-06, + "loss": 1.0107, + "step": 33421 + }, + { + "epoch": 0.86, + "learning_rate": 1.6766277114642024e-06, + "loss": 0.918, + "step": 33422 + }, + { + "epoch": 0.86, + "learning_rate": 1.6766073367500452e-06, + "loss": 0.8672, + "step": 33423 + }, + { + "epoch": 0.86, + "learning_rate": 1.6765869615178408e-06, + "loss": 0.6785, + "step": 33424 + }, + { + "epoch": 0.86, + "learning_rate": 1.6765665857676047e-06, + "loss": 0.8867, + "step": 33425 + }, + { + "epoch": 0.86, + "learning_rate": 1.676546209499353e-06, + "loss": 0.9707, + "step": 33426 + }, + { + "epoch": 0.86, + "learning_rate": 1.6765258327131008e-06, + "loss": 0.9033, + "step": 33427 + }, + { + "epoch": 0.86, + "learning_rate": 1.676505455408864e-06, + "loss": 0.8447, + "step": 33428 + }, + { + "epoch": 0.86, + "learning_rate": 1.676485077586658e-06, + "loss": 0.6846, + "step": 33429 + }, + { + "epoch": 0.86, + "learning_rate": 1.6764646992464984e-06, + "loss": 0.8213, + "step": 33430 + }, + { + "epoch": 0.86, + "learning_rate": 1.6764443203884008e-06, + "loss": 0.7783, + "step": 33431 + }, + { + "epoch": 0.86, + "learning_rate": 1.676423941012381e-06, + "loss": 0.7092, + "step": 33432 + }, + { + "epoch": 0.86, + "learning_rate": 1.6764035611184546e-06, + "loss": 0.5874, + "step": 33433 + }, + { + "epoch": 0.86, + "learning_rate": 1.6763831807066372e-06, + "loss": 0.8203, + "step": 33434 + }, + { + "epoch": 0.86, + "learning_rate": 1.676362799776944e-06, + "loss": 1.0713, + "step": 33435 + }, + { + "epoch": 0.86, + "learning_rate": 1.676342418329391e-06, + "loss": 0.7881, + "step": 33436 + }, + { + "epoch": 0.86, + "learning_rate": 1.6763220363639938e-06, + "loss": 0.6855, + "step": 33437 + }, + { + "epoch": 0.86, + "learning_rate": 1.6763016538807676e-06, + "loss": 0.6611, + "step": 33438 + }, + { + "epoch": 0.86, + "learning_rate": 1.6762812708797286e-06, + "loss": 0.9248, + "step": 33439 + }, + { + "epoch": 0.86, + "learning_rate": 1.6762608873608924e-06, + "loss": 0.7915, + "step": 33440 + }, + { + "epoch": 0.86, + "learning_rate": 1.6762405033242739e-06, + "loss": 0.8135, + "step": 33441 + }, + { + "epoch": 0.86, + "learning_rate": 1.6762201187698893e-06, + "loss": 0.9414, + "step": 33442 + }, + { + "epoch": 0.86, + "learning_rate": 1.6761997336977541e-06, + "loss": 0.7559, + "step": 33443 + }, + { + "epoch": 0.86, + "learning_rate": 1.6761793481078836e-06, + "loss": 0.7629, + "step": 33444 + }, + { + "epoch": 0.86, + "learning_rate": 1.676158962000294e-06, + "loss": 0.9014, + "step": 33445 + }, + { + "epoch": 0.86, + "learning_rate": 1.6761385753750003e-06, + "loss": 0.8838, + "step": 33446 + }, + { + "epoch": 0.86, + "learning_rate": 1.6761181882320185e-06, + "loss": 0.8252, + "step": 33447 + }, + { + "epoch": 0.86, + "learning_rate": 1.676097800571364e-06, + "loss": 1.0391, + "step": 33448 + }, + { + "epoch": 0.86, + "learning_rate": 1.6760774123930529e-06, + "loss": 1.0986, + "step": 33449 + }, + { + "epoch": 0.86, + "learning_rate": 1.6760570236970998e-06, + "loss": 0.7783, + "step": 33450 + }, + { + "epoch": 0.86, + "learning_rate": 1.676036634483521e-06, + "loss": 0.8389, + "step": 33451 + }, + { + "epoch": 0.86, + "learning_rate": 1.6760162447523323e-06, + "loss": 0.8154, + "step": 33452 + }, + { + "epoch": 0.86, + "learning_rate": 1.6759958545035491e-06, + "loss": 0.793, + "step": 33453 + }, + { + "epoch": 0.86, + "learning_rate": 1.675975463737187e-06, + "loss": 0.6865, + "step": 33454 + }, + { + "epoch": 0.86, + "learning_rate": 1.6759550724532613e-06, + "loss": 0.9346, + "step": 33455 + }, + { + "epoch": 0.86, + "learning_rate": 1.675934680651788e-06, + "loss": 0.7568, + "step": 33456 + }, + { + "epoch": 0.86, + "learning_rate": 1.6759142883327826e-06, + "loss": 0.7637, + "step": 33457 + }, + { + "epoch": 0.86, + "learning_rate": 1.6758938954962606e-06, + "loss": 0.9258, + "step": 33458 + }, + { + "epoch": 0.86, + "learning_rate": 1.6758735021422381e-06, + "loss": 0.7695, + "step": 33459 + }, + { + "epoch": 0.86, + "learning_rate": 1.6758531082707302e-06, + "loss": 0.9668, + "step": 33460 + }, + { + "epoch": 0.86, + "learning_rate": 1.6758327138817525e-06, + "loss": 0.9355, + "step": 33461 + }, + { + "epoch": 0.86, + "learning_rate": 1.6758123189753207e-06, + "loss": 0.8779, + "step": 33462 + }, + { + "epoch": 0.86, + "learning_rate": 1.6757919235514506e-06, + "loss": 0.9541, + "step": 33463 + }, + { + "epoch": 0.86, + "learning_rate": 1.6757715276101577e-06, + "loss": 0.8623, + "step": 33464 + }, + { + "epoch": 0.86, + "learning_rate": 1.6757511311514575e-06, + "loss": 0.8184, + "step": 33465 + }, + { + "epoch": 0.86, + "learning_rate": 1.6757307341753659e-06, + "loss": 0.7969, + "step": 33466 + }, + { + "epoch": 0.86, + "learning_rate": 1.675710336681898e-06, + "loss": 0.9785, + "step": 33467 + }, + { + "epoch": 0.86, + "learning_rate": 1.6756899386710701e-06, + "loss": 0.8037, + "step": 33468 + }, + { + "epoch": 0.86, + "learning_rate": 1.6756695401428976e-06, + "loss": 0.8193, + "step": 33469 + }, + { + "epoch": 0.86, + "learning_rate": 1.6756491410973958e-06, + "loss": 0.8623, + "step": 33470 + }, + { + "epoch": 0.86, + "learning_rate": 1.6756287415345803e-06, + "loss": 0.6733, + "step": 33471 + }, + { + "epoch": 0.86, + "learning_rate": 1.6756083414544672e-06, + "loss": 0.9189, + "step": 33472 + }, + { + "epoch": 0.86, + "learning_rate": 1.675587940857072e-06, + "loss": 0.6123, + "step": 33473 + }, + { + "epoch": 0.86, + "learning_rate": 1.6755675397424097e-06, + "loss": 0.9268, + "step": 33474 + }, + { + "epoch": 0.86, + "learning_rate": 1.6755471381104971e-06, + "loss": 0.8398, + "step": 33475 + }, + { + "epoch": 0.86, + "learning_rate": 1.6755267359613485e-06, + "loss": 0.6865, + "step": 33476 + }, + { + "epoch": 0.86, + "learning_rate": 1.6755063332949804e-06, + "loss": 1.0703, + "step": 33477 + }, + { + "epoch": 0.86, + "learning_rate": 1.675485930111408e-06, + "loss": 0.7715, + "step": 33478 + }, + { + "epoch": 0.86, + "learning_rate": 1.6754655264106475e-06, + "loss": 0.7202, + "step": 33479 + }, + { + "epoch": 0.86, + "learning_rate": 1.6754451221927136e-06, + "loss": 0.7148, + "step": 33480 + }, + { + "epoch": 0.86, + "learning_rate": 1.6754247174576225e-06, + "loss": 0.8857, + "step": 33481 + }, + { + "epoch": 0.86, + "learning_rate": 1.6754043122053903e-06, + "loss": 0.8428, + "step": 33482 + }, + { + "epoch": 0.86, + "learning_rate": 1.6753839064360315e-06, + "loss": 0.8291, + "step": 33483 + }, + { + "epoch": 0.86, + "learning_rate": 1.6753635001495625e-06, + "loss": 0.9326, + "step": 33484 + }, + { + "epoch": 0.86, + "learning_rate": 1.6753430933459986e-06, + "loss": 1.1074, + "step": 33485 + }, + { + "epoch": 0.86, + "learning_rate": 1.6753226860253557e-06, + "loss": 0.8115, + "step": 33486 + }, + { + "epoch": 0.86, + "learning_rate": 1.6753022781876492e-06, + "loss": 0.793, + "step": 33487 + }, + { + "epoch": 0.86, + "learning_rate": 1.6752818698328948e-06, + "loss": 0.8457, + "step": 33488 + }, + { + "epoch": 0.86, + "learning_rate": 1.6752614609611082e-06, + "loss": 0.8154, + "step": 33489 + }, + { + "epoch": 0.86, + "learning_rate": 1.6752410515723048e-06, + "loss": 0.7715, + "step": 33490 + }, + { + "epoch": 0.86, + "learning_rate": 1.6752206416665005e-06, + "loss": 0.5874, + "step": 33491 + }, + { + "epoch": 0.86, + "learning_rate": 1.6752002312437106e-06, + "loss": 0.5474, + "step": 33492 + }, + { + "epoch": 0.86, + "learning_rate": 1.6751798203039511e-06, + "loss": 0.4722, + "step": 33493 + }, + { + "epoch": 0.86, + "learning_rate": 1.6751594088472377e-06, + "loss": 0.8633, + "step": 33494 + }, + { + "epoch": 0.86, + "learning_rate": 1.6751389968735854e-06, + "loss": 0.7891, + "step": 33495 + }, + { + "epoch": 0.86, + "learning_rate": 1.6751185843830102e-06, + "loss": 0.8311, + "step": 33496 + }, + { + "epoch": 0.86, + "learning_rate": 1.675098171375528e-06, + "loss": 0.8374, + "step": 33497 + }, + { + "epoch": 0.86, + "learning_rate": 1.675077757851154e-06, + "loss": 0.8574, + "step": 33498 + }, + { + "epoch": 0.86, + "learning_rate": 1.6750573438099043e-06, + "loss": 0.8999, + "step": 33499 + }, + { + "epoch": 0.86, + "learning_rate": 1.6750369292517935e-06, + "loss": 0.8418, + "step": 33500 + }, + { + "epoch": 0.86, + "learning_rate": 1.6750165141768387e-06, + "loss": 0.9521, + "step": 33501 + }, + { + "epoch": 0.86, + "learning_rate": 1.6749960985850544e-06, + "loss": 0.6766, + "step": 33502 + }, + { + "epoch": 0.86, + "learning_rate": 1.674975682476457e-06, + "loss": 0.8789, + "step": 33503 + }, + { + "epoch": 0.86, + "learning_rate": 1.6749552658510615e-06, + "loss": 0.9287, + "step": 33504 + }, + { + "epoch": 0.86, + "learning_rate": 1.6749348487088838e-06, + "loss": 0.9141, + "step": 33505 + }, + { + "epoch": 0.86, + "learning_rate": 1.6749144310499394e-06, + "loss": 1.0781, + "step": 33506 + }, + { + "epoch": 0.86, + "learning_rate": 1.6748940128742444e-06, + "loss": 0.7676, + "step": 33507 + }, + { + "epoch": 0.86, + "learning_rate": 1.6748735941818137e-06, + "loss": 0.9209, + "step": 33508 + }, + { + "epoch": 0.86, + "learning_rate": 1.6748531749726636e-06, + "loss": 0.7344, + "step": 33509 + }, + { + "epoch": 0.86, + "learning_rate": 1.6748327552468093e-06, + "loss": 0.7588, + "step": 33510 + }, + { + "epoch": 0.86, + "learning_rate": 1.6748123350042667e-06, + "loss": 0.7998, + "step": 33511 + }, + { + "epoch": 0.86, + "learning_rate": 1.674791914245051e-06, + "loss": 0.8125, + "step": 33512 + }, + { + "epoch": 0.86, + "learning_rate": 1.6747714929691785e-06, + "loss": 0.6616, + "step": 33513 + }, + { + "epoch": 0.86, + "learning_rate": 1.6747510711766645e-06, + "loss": 0.9229, + "step": 33514 + }, + { + "epoch": 0.86, + "learning_rate": 1.6747306488675244e-06, + "loss": 0.8521, + "step": 33515 + }, + { + "epoch": 0.86, + "learning_rate": 1.6747102260417743e-06, + "loss": 0.918, + "step": 33516 + }, + { + "epoch": 0.86, + "learning_rate": 1.6746898026994293e-06, + "loss": 0.7686, + "step": 33517 + }, + { + "epoch": 0.86, + "learning_rate": 1.6746693788405058e-06, + "loss": 0.7197, + "step": 33518 + }, + { + "epoch": 0.86, + "learning_rate": 1.674648954465019e-06, + "loss": 0.7744, + "step": 33519 + }, + { + "epoch": 0.86, + "learning_rate": 1.6746285295729838e-06, + "loss": 0.9414, + "step": 33520 + }, + { + "epoch": 0.86, + "learning_rate": 1.6746081041644171e-06, + "loss": 0.9219, + "step": 33521 + }, + { + "epoch": 0.86, + "learning_rate": 1.6745876782393338e-06, + "loss": 1.0752, + "step": 33522 + }, + { + "epoch": 0.86, + "learning_rate": 1.67456725179775e-06, + "loss": 0.9727, + "step": 33523 + }, + { + "epoch": 0.86, + "learning_rate": 1.6745468248396807e-06, + "loss": 0.8662, + "step": 33524 + }, + { + "epoch": 0.86, + "learning_rate": 1.6745263973651423e-06, + "loss": 0.7534, + "step": 33525 + }, + { + "epoch": 0.86, + "learning_rate": 1.6745059693741499e-06, + "loss": 0.834, + "step": 33526 + }, + { + "epoch": 0.86, + "learning_rate": 1.6744855408667191e-06, + "loss": 0.8604, + "step": 33527 + }, + { + "epoch": 0.86, + "learning_rate": 1.6744651118428662e-06, + "loss": 0.7637, + "step": 33528 + }, + { + "epoch": 0.86, + "learning_rate": 1.6744446823026062e-06, + "loss": 0.8975, + "step": 33529 + }, + { + "epoch": 0.86, + "learning_rate": 1.6744242522459543e-06, + "loss": 0.8613, + "step": 33530 + }, + { + "epoch": 0.86, + "learning_rate": 1.6744038216729274e-06, + "loss": 1.0049, + "step": 33531 + }, + { + "epoch": 0.86, + "learning_rate": 1.6743833905835404e-06, + "loss": 1.042, + "step": 33532 + }, + { + "epoch": 0.86, + "learning_rate": 1.674362958977809e-06, + "loss": 0.7812, + "step": 33533 + }, + { + "epoch": 0.86, + "learning_rate": 1.674342526855749e-06, + "loss": 0.8555, + "step": 33534 + }, + { + "epoch": 0.86, + "learning_rate": 1.6743220942173757e-06, + "loss": 0.8042, + "step": 33535 + }, + { + "epoch": 0.86, + "learning_rate": 1.6743016610627052e-06, + "loss": 0.915, + "step": 33536 + }, + { + "epoch": 0.86, + "learning_rate": 1.6742812273917527e-06, + "loss": 0.6133, + "step": 33537 + }, + { + "epoch": 0.86, + "learning_rate": 1.6742607932045343e-06, + "loss": 0.6862, + "step": 33538 + }, + { + "epoch": 0.86, + "learning_rate": 1.6742403585010654e-06, + "loss": 0.7766, + "step": 33539 + }, + { + "epoch": 0.86, + "learning_rate": 1.6742199232813614e-06, + "loss": 0.9561, + "step": 33540 + }, + { + "epoch": 0.86, + "learning_rate": 1.6741994875454383e-06, + "loss": 0.8325, + "step": 33541 + }, + { + "epoch": 0.86, + "learning_rate": 1.6741790512933118e-06, + "loss": 0.6388, + "step": 33542 + }, + { + "epoch": 0.86, + "learning_rate": 1.6741586145249976e-06, + "loss": 0.916, + "step": 33543 + }, + { + "epoch": 0.86, + "learning_rate": 1.6741381772405109e-06, + "loss": 0.8252, + "step": 33544 + }, + { + "epoch": 0.86, + "learning_rate": 1.6741177394398672e-06, + "loss": 0.8047, + "step": 33545 + }, + { + "epoch": 0.86, + "learning_rate": 1.674097301123083e-06, + "loss": 0.8193, + "step": 33546 + }, + { + "epoch": 0.86, + "learning_rate": 1.6740768622901735e-06, + "loss": 0.8535, + "step": 33547 + }, + { + "epoch": 0.86, + "learning_rate": 1.6740564229411543e-06, + "loss": 0.6626, + "step": 33548 + }, + { + "epoch": 0.86, + "learning_rate": 1.674035983076041e-06, + "loss": 1.2129, + "step": 33549 + }, + { + "epoch": 0.86, + "learning_rate": 1.6740155426948495e-06, + "loss": 0.7812, + "step": 33550 + }, + { + "epoch": 0.86, + "learning_rate": 1.6739951017975951e-06, + "loss": 0.9883, + "step": 33551 + }, + { + "epoch": 0.86, + "learning_rate": 1.6739746603842937e-06, + "loss": 0.9941, + "step": 33552 + }, + { + "epoch": 0.86, + "learning_rate": 1.6739542184549608e-06, + "loss": 0.8604, + "step": 33553 + }, + { + "epoch": 0.86, + "learning_rate": 1.6739337760096124e-06, + "loss": 0.8682, + "step": 33554 + }, + { + "epoch": 0.86, + "learning_rate": 1.6739133330482637e-06, + "loss": 0.8311, + "step": 33555 + }, + { + "epoch": 0.86, + "learning_rate": 1.6738928895709306e-06, + "loss": 0.8877, + "step": 33556 + }, + { + "epoch": 0.86, + "learning_rate": 1.6738724455776287e-06, + "loss": 0.835, + "step": 33557 + }, + { + "epoch": 0.86, + "learning_rate": 1.6738520010683738e-06, + "loss": 0.9238, + "step": 33558 + }, + { + "epoch": 0.86, + "learning_rate": 1.673831556043181e-06, + "loss": 0.8105, + "step": 33559 + }, + { + "epoch": 0.86, + "learning_rate": 1.6738111105020667e-06, + "loss": 0.7007, + "step": 33560 + }, + { + "epoch": 0.86, + "learning_rate": 1.6737906644450461e-06, + "loss": 0.8174, + "step": 33561 + }, + { + "epoch": 0.86, + "learning_rate": 1.6737702178721352e-06, + "loss": 1.0771, + "step": 33562 + }, + { + "epoch": 0.86, + "learning_rate": 1.6737497707833493e-06, + "loss": 0.8594, + "step": 33563 + }, + { + "epoch": 0.86, + "learning_rate": 1.673729323178704e-06, + "loss": 1.1504, + "step": 33564 + }, + { + "epoch": 0.86, + "learning_rate": 1.6737088750582152e-06, + "loss": 0.8813, + "step": 33565 + }, + { + "epoch": 0.86, + "learning_rate": 1.6736884264218985e-06, + "loss": 0.7053, + "step": 33566 + }, + { + "epoch": 0.86, + "learning_rate": 1.6736679772697696e-06, + "loss": 0.751, + "step": 33567 + }, + { + "epoch": 0.86, + "learning_rate": 1.6736475276018443e-06, + "loss": 0.918, + "step": 33568 + }, + { + "epoch": 0.86, + "learning_rate": 1.6736270774181378e-06, + "loss": 1.0, + "step": 33569 + }, + { + "epoch": 0.86, + "learning_rate": 1.6736066267186662e-06, + "loss": 0.6814, + "step": 33570 + }, + { + "epoch": 0.86, + "learning_rate": 1.6735861755034447e-06, + "loss": 0.8506, + "step": 33571 + }, + { + "epoch": 0.86, + "learning_rate": 1.6735657237724894e-06, + "loss": 0.8311, + "step": 33572 + }, + { + "epoch": 0.86, + "learning_rate": 1.6735452715258158e-06, + "loss": 0.565, + "step": 33573 + }, + { + "epoch": 0.86, + "learning_rate": 1.6735248187634397e-06, + "loss": 0.9463, + "step": 33574 + }, + { + "epoch": 0.86, + "learning_rate": 1.6735043654853764e-06, + "loss": 0.6903, + "step": 33575 + }, + { + "epoch": 0.86, + "learning_rate": 1.6734839116916417e-06, + "loss": 0.8809, + "step": 33576 + }, + { + "epoch": 0.86, + "learning_rate": 1.6734634573822514e-06, + "loss": 0.8496, + "step": 33577 + }, + { + "epoch": 0.86, + "learning_rate": 1.6734430025572213e-06, + "loss": 0.959, + "step": 33578 + }, + { + "epoch": 0.86, + "learning_rate": 1.6734225472165665e-06, + "loss": 0.8945, + "step": 33579 + }, + { + "epoch": 0.86, + "learning_rate": 1.6734020913603035e-06, + "loss": 0.8125, + "step": 33580 + }, + { + "epoch": 0.86, + "learning_rate": 1.673381634988447e-06, + "loss": 0.7466, + "step": 33581 + }, + { + "epoch": 0.86, + "learning_rate": 1.6733611781010135e-06, + "loss": 0.8711, + "step": 33582 + }, + { + "epoch": 0.86, + "learning_rate": 1.673340720698018e-06, + "loss": 0.8936, + "step": 33583 + }, + { + "epoch": 0.86, + "learning_rate": 1.673320262779477e-06, + "loss": 0.8008, + "step": 33584 + }, + { + "epoch": 0.86, + "learning_rate": 1.6732998043454053e-06, + "loss": 0.6743, + "step": 33585 + }, + { + "epoch": 0.86, + "learning_rate": 1.6732793453958188e-06, + "loss": 1.0273, + "step": 33586 + }, + { + "epoch": 0.86, + "learning_rate": 1.6732588859307333e-06, + "loss": 0.8896, + "step": 33587 + }, + { + "epoch": 0.86, + "learning_rate": 1.6732384259501646e-06, + "loss": 0.7021, + "step": 33588 + }, + { + "epoch": 0.86, + "learning_rate": 1.673217965454128e-06, + "loss": 0.8955, + "step": 33589 + }, + { + "epoch": 0.86, + "learning_rate": 1.6731975044426395e-06, + "loss": 0.6929, + "step": 33590 + }, + { + "epoch": 0.86, + "learning_rate": 1.6731770429157145e-06, + "loss": 0.9639, + "step": 33591 + }, + { + "epoch": 0.86, + "learning_rate": 1.673156580873369e-06, + "loss": 0.9541, + "step": 33592 + }, + { + "epoch": 0.86, + "learning_rate": 1.6731361183156183e-06, + "loss": 0.8286, + "step": 33593 + }, + { + "epoch": 0.86, + "learning_rate": 1.673115655242478e-06, + "loss": 0.7393, + "step": 33594 + }, + { + "epoch": 0.86, + "learning_rate": 1.6730951916539644e-06, + "loss": 0.8115, + "step": 33595 + }, + { + "epoch": 0.86, + "learning_rate": 1.6730747275500927e-06, + "loss": 0.6504, + "step": 33596 + }, + { + "epoch": 0.86, + "learning_rate": 1.6730542629308784e-06, + "loss": 0.8945, + "step": 33597 + }, + { + "epoch": 0.86, + "learning_rate": 1.6730337977963376e-06, + "loss": 0.9736, + "step": 33598 + }, + { + "epoch": 0.86, + "learning_rate": 1.6730133321464857e-06, + "loss": 1.0479, + "step": 33599 + }, + { + "epoch": 0.86, + "learning_rate": 1.6729928659813385e-06, + "loss": 0.8643, + "step": 33600 + }, + { + "epoch": 0.86, + "learning_rate": 1.6729723993009115e-06, + "loss": 0.835, + "step": 33601 + }, + { + "epoch": 0.86, + "learning_rate": 1.6729519321052204e-06, + "loss": 0.5422, + "step": 33602 + }, + { + "epoch": 0.86, + "learning_rate": 1.672931464394281e-06, + "loss": 0.7734, + "step": 33603 + }, + { + "epoch": 0.86, + "learning_rate": 1.6729109961681091e-06, + "loss": 1.1172, + "step": 33604 + }, + { + "epoch": 0.86, + "learning_rate": 1.67289052742672e-06, + "loss": 0.9463, + "step": 33605 + }, + { + "epoch": 0.86, + "learning_rate": 1.6728700581701297e-06, + "loss": 0.6938, + "step": 33606 + }, + { + "epoch": 0.86, + "learning_rate": 1.6728495883983537e-06, + "loss": 0.9014, + "step": 33607 + }, + { + "epoch": 0.86, + "learning_rate": 1.6728291181114078e-06, + "loss": 0.8936, + "step": 33608 + }, + { + "epoch": 0.86, + "learning_rate": 1.6728086473093072e-06, + "loss": 0.8818, + "step": 33609 + }, + { + "epoch": 0.86, + "learning_rate": 1.6727881759920684e-06, + "loss": 0.8359, + "step": 33610 + }, + { + "epoch": 0.86, + "learning_rate": 1.6727677041597064e-06, + "loss": 0.636, + "step": 33611 + }, + { + "epoch": 0.86, + "learning_rate": 1.672747231812237e-06, + "loss": 0.79, + "step": 33612 + }, + { + "epoch": 0.86, + "learning_rate": 1.6727267589496764e-06, + "loss": 0.8604, + "step": 33613 + }, + { + "epoch": 0.86, + "learning_rate": 1.6727062855720396e-06, + "loss": 0.7842, + "step": 33614 + }, + { + "epoch": 0.86, + "learning_rate": 1.6726858116793422e-06, + "loss": 0.6167, + "step": 33615 + }, + { + "epoch": 0.86, + "learning_rate": 1.6726653372716007e-06, + "loss": 0.9092, + "step": 33616 + }, + { + "epoch": 0.86, + "learning_rate": 1.67264486234883e-06, + "loss": 0.9707, + "step": 33617 + }, + { + "epoch": 0.86, + "learning_rate": 1.6726243869110464e-06, + "loss": 0.8604, + "step": 33618 + }, + { + "epoch": 0.86, + "learning_rate": 1.6726039109582648e-06, + "loss": 0.7773, + "step": 33619 + }, + { + "epoch": 0.86, + "learning_rate": 1.6725834344905017e-06, + "loss": 0.9111, + "step": 33620 + }, + { + "epoch": 0.86, + "learning_rate": 1.672562957507772e-06, + "loss": 0.9482, + "step": 33621 + }, + { + "epoch": 0.86, + "learning_rate": 1.672542480010092e-06, + "loss": 0.8105, + "step": 33622 + }, + { + "epoch": 0.86, + "learning_rate": 1.672522001997477e-06, + "loss": 0.7139, + "step": 33623 + }, + { + "epoch": 0.86, + "learning_rate": 1.672501523469943e-06, + "loss": 0.8584, + "step": 33624 + }, + { + "epoch": 0.86, + "learning_rate": 1.6724810444275055e-06, + "loss": 0.6855, + "step": 33625 + }, + { + "epoch": 0.86, + "learning_rate": 1.6724605648701802e-06, + "loss": 0.7969, + "step": 33626 + }, + { + "epoch": 0.86, + "learning_rate": 1.6724400847979828e-06, + "loss": 0.9199, + "step": 33627 + }, + { + "epoch": 0.86, + "learning_rate": 1.6724196042109286e-06, + "loss": 0.7871, + "step": 33628 + }, + { + "epoch": 0.86, + "learning_rate": 1.672399123109034e-06, + "loss": 0.5742, + "step": 33629 + }, + { + "epoch": 0.86, + "learning_rate": 1.672378641492314e-06, + "loss": 0.8262, + "step": 33630 + }, + { + "epoch": 0.86, + "learning_rate": 1.672358159360785e-06, + "loss": 0.7588, + "step": 33631 + }, + { + "epoch": 0.86, + "learning_rate": 1.6723376767144619e-06, + "loss": 0.8447, + "step": 33632 + }, + { + "epoch": 0.86, + "learning_rate": 1.672317193553361e-06, + "loss": 0.6621, + "step": 33633 + }, + { + "epoch": 0.86, + "learning_rate": 1.6722967098774976e-06, + "loss": 0.9209, + "step": 33634 + }, + { + "epoch": 0.86, + "learning_rate": 1.6722762256868875e-06, + "loss": 0.791, + "step": 33635 + }, + { + "epoch": 0.86, + "learning_rate": 1.6722557409815465e-06, + "loss": 0.9678, + "step": 33636 + }, + { + "epoch": 0.86, + "learning_rate": 1.67223525576149e-06, + "loss": 0.918, + "step": 33637 + }, + { + "epoch": 0.86, + "learning_rate": 1.6722147700267341e-06, + "loss": 0.7017, + "step": 33638 + }, + { + "epoch": 0.86, + "learning_rate": 1.6721942837772941e-06, + "loss": 0.7935, + "step": 33639 + }, + { + "epoch": 0.86, + "learning_rate": 1.672173797013186e-06, + "loss": 0.8774, + "step": 33640 + }, + { + "epoch": 0.86, + "learning_rate": 1.6721533097344254e-06, + "loss": 0.8369, + "step": 33641 + }, + { + "epoch": 0.86, + "learning_rate": 1.6721328219410276e-06, + "loss": 0.6992, + "step": 33642 + }, + { + "epoch": 0.86, + "learning_rate": 1.672112333633009e-06, + "loss": 0.875, + "step": 33643 + }, + { + "epoch": 0.86, + "learning_rate": 1.6720918448103847e-06, + "loss": 0.8213, + "step": 33644 + }, + { + "epoch": 0.86, + "learning_rate": 1.6720713554731704e-06, + "loss": 0.8818, + "step": 33645 + }, + { + "epoch": 0.86, + "learning_rate": 1.6720508656213821e-06, + "loss": 0.8574, + "step": 33646 + }, + { + "epoch": 0.86, + "learning_rate": 1.6720303752550353e-06, + "loss": 1.0352, + "step": 33647 + }, + { + "epoch": 0.86, + "learning_rate": 1.672009884374146e-06, + "loss": 1.0029, + "step": 33648 + }, + { + "epoch": 0.86, + "learning_rate": 1.6719893929787295e-06, + "loss": 0.6704, + "step": 33649 + }, + { + "epoch": 0.86, + "learning_rate": 1.6719689010688013e-06, + "loss": 0.7422, + "step": 33650 + }, + { + "epoch": 0.86, + "learning_rate": 1.6719484086443779e-06, + "loss": 0.9766, + "step": 33651 + }, + { + "epoch": 0.86, + "learning_rate": 1.6719279157054742e-06, + "loss": 1.1641, + "step": 33652 + }, + { + "epoch": 0.86, + "learning_rate": 1.6719074222521065e-06, + "loss": 0.7783, + "step": 33653 + }, + { + "epoch": 0.86, + "learning_rate": 1.6718869282842897e-06, + "loss": 0.958, + "step": 33654 + }, + { + "epoch": 0.86, + "learning_rate": 1.6718664338020404e-06, + "loss": 0.9287, + "step": 33655 + }, + { + "epoch": 0.86, + "learning_rate": 1.6718459388053736e-06, + "loss": 0.9893, + "step": 33656 + }, + { + "epoch": 0.86, + "learning_rate": 1.6718254432943053e-06, + "loss": 0.8291, + "step": 33657 + }, + { + "epoch": 0.86, + "learning_rate": 1.6718049472688513e-06, + "loss": 0.6533, + "step": 33658 + }, + { + "epoch": 0.86, + "learning_rate": 1.671784450729027e-06, + "loss": 0.6348, + "step": 33659 + }, + { + "epoch": 0.86, + "learning_rate": 1.6717639536748483e-06, + "loss": 0.9531, + "step": 33660 + }, + { + "epoch": 0.86, + "learning_rate": 1.671743456106331e-06, + "loss": 0.832, + "step": 33661 + }, + { + "epoch": 0.86, + "learning_rate": 1.6717229580234902e-06, + "loss": 0.7559, + "step": 33662 + }, + { + "epoch": 0.86, + "learning_rate": 1.6717024594263425e-06, + "loss": 0.8789, + "step": 33663 + }, + { + "epoch": 0.86, + "learning_rate": 1.6716819603149025e-06, + "loss": 0.9424, + "step": 33664 + }, + { + "epoch": 0.86, + "learning_rate": 1.671661460689187e-06, + "loss": 1.0264, + "step": 33665 + }, + { + "epoch": 0.86, + "learning_rate": 1.6716409605492112e-06, + "loss": 0.9893, + "step": 33666 + }, + { + "epoch": 0.86, + "learning_rate": 1.6716204598949905e-06, + "loss": 0.876, + "step": 33667 + }, + { + "epoch": 0.86, + "learning_rate": 1.6715999587265413e-06, + "loss": 0.5815, + "step": 33668 + }, + { + "epoch": 0.86, + "learning_rate": 1.6715794570438786e-06, + "loss": 0.8643, + "step": 33669 + }, + { + "epoch": 0.86, + "learning_rate": 1.6715589548470183e-06, + "loss": 0.8779, + "step": 33670 + }, + { + "epoch": 0.86, + "learning_rate": 1.6715384521359765e-06, + "loss": 0.9541, + "step": 33671 + }, + { + "epoch": 0.86, + "learning_rate": 1.6715179489107683e-06, + "loss": 1.0352, + "step": 33672 + }, + { + "epoch": 0.86, + "learning_rate": 1.67149744517141e-06, + "loss": 0.7578, + "step": 33673 + }, + { + "epoch": 0.86, + "learning_rate": 1.6714769409179165e-06, + "loss": 0.7666, + "step": 33674 + }, + { + "epoch": 0.86, + "learning_rate": 1.6714564361503043e-06, + "loss": 0.7949, + "step": 33675 + }, + { + "epoch": 0.86, + "learning_rate": 1.6714359308685888e-06, + "loss": 0.9482, + "step": 33676 + }, + { + "epoch": 0.86, + "learning_rate": 1.6714154250727855e-06, + "loss": 0.689, + "step": 33677 + }, + { + "epoch": 0.86, + "learning_rate": 1.6713949187629107e-06, + "loss": 0.8604, + "step": 33678 + }, + { + "epoch": 0.86, + "learning_rate": 1.6713744119389795e-06, + "loss": 0.9092, + "step": 33679 + }, + { + "epoch": 0.86, + "learning_rate": 1.6713539046010074e-06, + "loss": 0.9805, + "step": 33680 + }, + { + "epoch": 0.86, + "learning_rate": 1.6713333967490107e-06, + "loss": 0.8511, + "step": 33681 + }, + { + "epoch": 0.86, + "learning_rate": 1.671312888383005e-06, + "loss": 0.8398, + "step": 33682 + }, + { + "epoch": 0.86, + "learning_rate": 1.671292379503006e-06, + "loss": 0.8828, + "step": 33683 + }, + { + "epoch": 0.86, + "learning_rate": 1.6712718701090293e-06, + "loss": 0.79, + "step": 33684 + }, + { + "epoch": 0.86, + "learning_rate": 1.67125136020109e-06, + "loss": 0.8867, + "step": 33685 + }, + { + "epoch": 0.86, + "learning_rate": 1.6712308497792049e-06, + "loss": 1.0195, + "step": 33686 + }, + { + "epoch": 0.86, + "learning_rate": 1.6712103388433892e-06, + "loss": 0.8438, + "step": 33687 + }, + { + "epoch": 0.86, + "learning_rate": 1.6711898273936586e-06, + "loss": 0.835, + "step": 33688 + }, + { + "epoch": 0.86, + "learning_rate": 1.6711693154300286e-06, + "loss": 0.9277, + "step": 33689 + }, + { + "epoch": 0.86, + "learning_rate": 1.6711488029525154e-06, + "loss": 0.5605, + "step": 33690 + }, + { + "epoch": 0.86, + "learning_rate": 1.671128289961134e-06, + "loss": 0.9229, + "step": 33691 + }, + { + "epoch": 0.86, + "learning_rate": 1.6711077764559009e-06, + "loss": 0.8369, + "step": 33692 + }, + { + "epoch": 0.86, + "learning_rate": 1.6710872624368316e-06, + "loss": 0.8701, + "step": 33693 + }, + { + "epoch": 0.86, + "learning_rate": 1.6710667479039412e-06, + "loss": 1.0156, + "step": 33694 + }, + { + "epoch": 0.86, + "learning_rate": 1.671046232857246e-06, + "loss": 0.9004, + "step": 33695 + }, + { + "epoch": 0.86, + "learning_rate": 1.6710257172967616e-06, + "loss": 0.8213, + "step": 33696 + }, + { + "epoch": 0.86, + "learning_rate": 1.6710052012225036e-06, + "loss": 0.9277, + "step": 33697 + }, + { + "epoch": 0.86, + "learning_rate": 1.670984684634488e-06, + "loss": 0.8857, + "step": 33698 + }, + { + "epoch": 0.86, + "learning_rate": 1.67096416753273e-06, + "loss": 0.7559, + "step": 33699 + }, + { + "epoch": 0.86, + "learning_rate": 1.6709436499172458e-06, + "loss": 0.8164, + "step": 33700 + }, + { + "epoch": 0.86, + "learning_rate": 1.6709231317880508e-06, + "loss": 0.9531, + "step": 33701 + }, + { + "epoch": 0.86, + "learning_rate": 1.6709026131451607e-06, + "loss": 0.8804, + "step": 33702 + }, + { + "epoch": 0.86, + "learning_rate": 1.6708820939885918e-06, + "loss": 1.0303, + "step": 33703 + }, + { + "epoch": 0.86, + "learning_rate": 1.6708615743183585e-06, + "loss": 0.8232, + "step": 33704 + }, + { + "epoch": 0.86, + "learning_rate": 1.670841054134478e-06, + "loss": 0.9111, + "step": 33705 + }, + { + "epoch": 0.86, + "learning_rate": 1.6708205334369652e-06, + "loss": 1.1113, + "step": 33706 + }, + { + "epoch": 0.86, + "learning_rate": 1.6708000122258357e-06, + "loss": 0.6646, + "step": 33707 + }, + { + "epoch": 0.86, + "learning_rate": 1.6707794905011058e-06, + "loss": 0.812, + "step": 33708 + }, + { + "epoch": 0.86, + "learning_rate": 1.6707589682627907e-06, + "loss": 0.3755, + "step": 33709 + }, + { + "epoch": 0.86, + "learning_rate": 1.6707384455109063e-06, + "loss": 0.8438, + "step": 33710 + }, + { + "epoch": 0.86, + "learning_rate": 1.6707179222454684e-06, + "loss": 1.0342, + "step": 33711 + }, + { + "epoch": 0.86, + "learning_rate": 1.6706973984664926e-06, + "loss": 1.0049, + "step": 33712 + }, + { + "epoch": 0.86, + "learning_rate": 1.6706768741739947e-06, + "loss": 0.8315, + "step": 33713 + }, + { + "epoch": 0.86, + "learning_rate": 1.6706563493679902e-06, + "loss": 0.8945, + "step": 33714 + }, + { + "epoch": 0.86, + "learning_rate": 1.670635824048495e-06, + "loss": 0.9961, + "step": 33715 + }, + { + "epoch": 0.86, + "learning_rate": 1.6706152982155247e-06, + "loss": 0.9971, + "step": 33716 + }, + { + "epoch": 0.86, + "learning_rate": 1.6705947718690955e-06, + "loss": 0.9697, + "step": 33717 + }, + { + "epoch": 0.86, + "learning_rate": 1.6705742450092225e-06, + "loss": 0.9092, + "step": 33718 + }, + { + "epoch": 0.86, + "learning_rate": 1.6705537176359217e-06, + "loss": 0.7539, + "step": 33719 + }, + { + "epoch": 0.86, + "learning_rate": 1.6705331897492086e-06, + "loss": 0.6257, + "step": 33720 + }, + { + "epoch": 0.86, + "learning_rate": 1.670512661349099e-06, + "loss": 0.9531, + "step": 33721 + }, + { + "epoch": 0.86, + "learning_rate": 1.670492132435609e-06, + "loss": 0.7207, + "step": 33722 + }, + { + "epoch": 0.86, + "learning_rate": 1.6704716030087538e-06, + "loss": 0.6108, + "step": 33723 + }, + { + "epoch": 0.86, + "learning_rate": 1.6704510730685493e-06, + "loss": 0.6836, + "step": 33724 + }, + { + "epoch": 0.86, + "learning_rate": 1.670430542615011e-06, + "loss": 0.8818, + "step": 33725 + }, + { + "epoch": 0.86, + "learning_rate": 1.6704100116481552e-06, + "loss": 0.6943, + "step": 33726 + }, + { + "epoch": 0.86, + "learning_rate": 1.6703894801679974e-06, + "loss": 1.0615, + "step": 33727 + }, + { + "epoch": 0.86, + "learning_rate": 1.670368948174553e-06, + "loss": 0.8408, + "step": 33728 + }, + { + "epoch": 0.86, + "learning_rate": 1.670348415667838e-06, + "loss": 0.9209, + "step": 33729 + }, + { + "epoch": 0.86, + "learning_rate": 1.670327882647868e-06, + "loss": 0.7065, + "step": 33730 + }, + { + "epoch": 0.86, + "learning_rate": 1.6703073491146586e-06, + "loss": 0.9385, + "step": 33731 + }, + { + "epoch": 0.86, + "learning_rate": 1.6702868150682258e-06, + "loss": 0.7939, + "step": 33732 + }, + { + "epoch": 0.86, + "learning_rate": 1.6702662805085855e-06, + "loss": 0.9219, + "step": 33733 + }, + { + "epoch": 0.86, + "learning_rate": 1.6702457454357529e-06, + "loss": 0.8975, + "step": 33734 + }, + { + "epoch": 0.86, + "learning_rate": 1.6702252098497439e-06, + "loss": 0.9326, + "step": 33735 + }, + { + "epoch": 0.86, + "learning_rate": 1.6702046737505741e-06, + "loss": 0.9453, + "step": 33736 + }, + { + "epoch": 0.86, + "learning_rate": 1.6701841371382598e-06, + "loss": 0.7603, + "step": 33737 + }, + { + "epoch": 0.86, + "learning_rate": 1.6701636000128158e-06, + "loss": 0.6826, + "step": 33738 + }, + { + "epoch": 0.86, + "learning_rate": 1.670143062374259e-06, + "loss": 0.6948, + "step": 33739 + }, + { + "epoch": 0.86, + "learning_rate": 1.670122524222604e-06, + "loss": 0.5615, + "step": 33740 + }, + { + "epoch": 0.86, + "learning_rate": 1.6701019855578671e-06, + "loss": 0.7852, + "step": 33741 + }, + { + "epoch": 0.86, + "learning_rate": 1.6700814463800638e-06, + "loss": 0.8604, + "step": 33742 + }, + { + "epoch": 0.86, + "learning_rate": 1.6700609066892101e-06, + "loss": 0.9092, + "step": 33743 + }, + { + "epoch": 0.86, + "learning_rate": 1.6700403664853217e-06, + "loss": 0.7285, + "step": 33744 + }, + { + "epoch": 0.86, + "learning_rate": 1.6700198257684142e-06, + "loss": 0.8071, + "step": 33745 + }, + { + "epoch": 0.86, + "learning_rate": 1.6699992845385032e-06, + "loss": 0.7227, + "step": 33746 + }, + { + "epoch": 0.86, + "learning_rate": 1.6699787427956046e-06, + "loss": 0.6128, + "step": 33747 + }, + { + "epoch": 0.86, + "learning_rate": 1.669958200539734e-06, + "loss": 0.8262, + "step": 33748 + }, + { + "epoch": 0.87, + "learning_rate": 1.6699376577709071e-06, + "loss": 0.9014, + "step": 33749 + }, + { + "epoch": 0.87, + "learning_rate": 1.66991711448914e-06, + "loss": 0.8105, + "step": 33750 + }, + { + "epoch": 0.87, + "learning_rate": 1.6698965706944482e-06, + "loss": 0.8096, + "step": 33751 + }, + { + "epoch": 0.87, + "learning_rate": 1.6698760263868469e-06, + "loss": 1.0361, + "step": 33752 + }, + { + "epoch": 0.87, + "learning_rate": 1.669855481566353e-06, + "loss": 0.999, + "step": 33753 + }, + { + "epoch": 0.87, + "learning_rate": 1.669834936232981e-06, + "loss": 0.8389, + "step": 33754 + }, + { + "epoch": 0.87, + "learning_rate": 1.6698143903867474e-06, + "loss": 1.0508, + "step": 33755 + }, + { + "epoch": 0.87, + "learning_rate": 1.669793844027668e-06, + "loss": 0.9609, + "step": 33756 + }, + { + "epoch": 0.87, + "learning_rate": 1.6697732971557578e-06, + "loss": 0.8242, + "step": 33757 + }, + { + "epoch": 0.87, + "learning_rate": 1.6697527497710332e-06, + "loss": 0.6426, + "step": 33758 + }, + { + "epoch": 0.87, + "learning_rate": 1.6697322018735098e-06, + "loss": 0.9434, + "step": 33759 + }, + { + "epoch": 0.87, + "learning_rate": 1.669711653463203e-06, + "loss": 0.6416, + "step": 33760 + }, + { + "epoch": 0.87, + "learning_rate": 1.6696911045401292e-06, + "loss": 0.8926, + "step": 33761 + }, + { + "epoch": 0.87, + "learning_rate": 1.6696705551043033e-06, + "loss": 0.728, + "step": 33762 + }, + { + "epoch": 0.87, + "learning_rate": 1.6696500051557417e-06, + "loss": 0.8154, + "step": 33763 + }, + { + "epoch": 0.87, + "learning_rate": 1.6696294546944598e-06, + "loss": 0.9795, + "step": 33764 + }, + { + "epoch": 0.87, + "learning_rate": 1.6696089037204732e-06, + "loss": 0.7734, + "step": 33765 + }, + { + "epoch": 0.87, + "learning_rate": 1.6695883522337982e-06, + "loss": 0.7241, + "step": 33766 + }, + { + "epoch": 0.87, + "learning_rate": 1.66956780023445e-06, + "loss": 0.6963, + "step": 33767 + }, + { + "epoch": 0.87, + "learning_rate": 1.6695472477224446e-06, + "loss": 0.9775, + "step": 33768 + }, + { + "epoch": 0.87, + "learning_rate": 1.6695266946977977e-06, + "loss": 0.8975, + "step": 33769 + }, + { + "epoch": 0.87, + "learning_rate": 1.6695061411605246e-06, + "loss": 0.8633, + "step": 33770 + }, + { + "epoch": 0.87, + "learning_rate": 1.669485587110642e-06, + "loss": 0.6726, + "step": 33771 + }, + { + "epoch": 0.87, + "learning_rate": 1.6694650325481646e-06, + "loss": 0.791, + "step": 33772 + }, + { + "epoch": 0.87, + "learning_rate": 1.669444477473109e-06, + "loss": 0.7256, + "step": 33773 + }, + { + "epoch": 0.87, + "learning_rate": 1.6694239218854905e-06, + "loss": 0.8159, + "step": 33774 + }, + { + "epoch": 0.87, + "learning_rate": 1.6694033657853246e-06, + "loss": 0.7339, + "step": 33775 + }, + { + "epoch": 0.87, + "learning_rate": 1.6693828091726275e-06, + "loss": 0.7124, + "step": 33776 + }, + { + "epoch": 0.87, + "learning_rate": 1.6693622520474147e-06, + "loss": 0.8174, + "step": 33777 + }, + { + "epoch": 0.87, + "learning_rate": 1.669341694409702e-06, + "loss": 0.7354, + "step": 33778 + }, + { + "epoch": 0.87, + "learning_rate": 1.6693211362595051e-06, + "loss": 0.9102, + "step": 33779 + }, + { + "epoch": 0.87, + "learning_rate": 1.6693005775968399e-06, + "loss": 0.8027, + "step": 33780 + }, + { + "epoch": 0.87, + "learning_rate": 1.669280018421722e-06, + "loss": 0.8379, + "step": 33781 + }, + { + "epoch": 0.87, + "learning_rate": 1.6692594587341672e-06, + "loss": 0.6938, + "step": 33782 + }, + { + "epoch": 0.87, + "learning_rate": 1.6692388985341912e-06, + "loss": 0.9902, + "step": 33783 + }, + { + "epoch": 0.87, + "learning_rate": 1.6692183378218098e-06, + "loss": 0.7773, + "step": 33784 + }, + { + "epoch": 0.87, + "learning_rate": 1.6691977765970384e-06, + "loss": 0.5803, + "step": 33785 + }, + { + "epoch": 0.87, + "learning_rate": 1.6691772148598932e-06, + "loss": 0.7715, + "step": 33786 + }, + { + "epoch": 0.87, + "learning_rate": 1.6691566526103897e-06, + "loss": 0.5513, + "step": 33787 + }, + { + "epoch": 0.87, + "learning_rate": 1.669136089848544e-06, + "loss": 0.8086, + "step": 33788 + }, + { + "epoch": 0.87, + "learning_rate": 1.6691155265743712e-06, + "loss": 0.7832, + "step": 33789 + }, + { + "epoch": 0.87, + "learning_rate": 1.6690949627878878e-06, + "loss": 0.9395, + "step": 33790 + }, + { + "epoch": 0.87, + "learning_rate": 1.669074398489109e-06, + "loss": 0.7339, + "step": 33791 + }, + { + "epoch": 0.87, + "learning_rate": 1.6690538336780505e-06, + "loss": 0.9902, + "step": 33792 + }, + { + "epoch": 0.87, + "learning_rate": 1.6690332683547283e-06, + "loss": 0.9082, + "step": 33793 + }, + { + "epoch": 0.87, + "learning_rate": 1.6690127025191583e-06, + "loss": 0.7734, + "step": 33794 + }, + { + "epoch": 0.87, + "learning_rate": 1.668992136171356e-06, + "loss": 1.0244, + "step": 33795 + }, + { + "epoch": 0.87, + "learning_rate": 1.668971569311337e-06, + "loss": 0.8408, + "step": 33796 + }, + { + "epoch": 0.87, + "learning_rate": 1.6689510019391173e-06, + "loss": 0.7803, + "step": 33797 + }, + { + "epoch": 0.87, + "learning_rate": 1.6689304340547127e-06, + "loss": 0.7944, + "step": 33798 + }, + { + "epoch": 0.87, + "learning_rate": 1.6689098656581386e-06, + "loss": 0.7148, + "step": 33799 + }, + { + "epoch": 0.87, + "learning_rate": 1.6688892967494113e-06, + "loss": 0.8359, + "step": 33800 + }, + { + "epoch": 0.87, + "learning_rate": 1.668868727328546e-06, + "loss": 0.9785, + "step": 33801 + }, + { + "epoch": 0.87, + "learning_rate": 1.6688481573955586e-06, + "loss": 0.959, + "step": 33802 + }, + { + "epoch": 0.87, + "learning_rate": 1.668827586950465e-06, + "loss": 0.6887, + "step": 33803 + }, + { + "epoch": 0.87, + "learning_rate": 1.668807015993281e-06, + "loss": 0.7109, + "step": 33804 + }, + { + "epoch": 0.87, + "learning_rate": 1.6687864445240218e-06, + "loss": 0.8252, + "step": 33805 + }, + { + "epoch": 0.87, + "learning_rate": 1.668765872542704e-06, + "loss": 0.626, + "step": 33806 + }, + { + "epoch": 0.87, + "learning_rate": 1.668745300049343e-06, + "loss": 0.5913, + "step": 33807 + }, + { + "epoch": 0.87, + "learning_rate": 1.6687247270439543e-06, + "loss": 0.9365, + "step": 33808 + }, + { + "epoch": 0.87, + "learning_rate": 1.6687041535265535e-06, + "loss": 0.7861, + "step": 33809 + }, + { + "epoch": 0.87, + "learning_rate": 1.668683579497157e-06, + "loss": 0.8877, + "step": 33810 + }, + { + "epoch": 0.87, + "learning_rate": 1.6686630049557802e-06, + "loss": 0.8291, + "step": 33811 + }, + { + "epoch": 0.87, + "learning_rate": 1.668642429902439e-06, + "loss": 0.9229, + "step": 33812 + }, + { + "epoch": 0.87, + "learning_rate": 1.6686218543371488e-06, + "loss": 0.8857, + "step": 33813 + }, + { + "epoch": 0.87, + "learning_rate": 1.668601278259926e-06, + "loss": 0.752, + "step": 33814 + }, + { + "epoch": 0.87, + "learning_rate": 1.6685807016707853e-06, + "loss": 0.6377, + "step": 33815 + }, + { + "epoch": 0.87, + "learning_rate": 1.6685601245697436e-06, + "loss": 0.8555, + "step": 33816 + }, + { + "epoch": 0.87, + "learning_rate": 1.668539546956816e-06, + "loss": 0.6631, + "step": 33817 + }, + { + "epoch": 0.87, + "learning_rate": 1.6685189688320186e-06, + "loss": 0.7354, + "step": 33818 + }, + { + "epoch": 0.87, + "learning_rate": 1.6684983901953667e-06, + "loss": 0.7764, + "step": 33819 + }, + { + "epoch": 0.87, + "learning_rate": 1.6684778110468764e-06, + "loss": 0.7715, + "step": 33820 + }, + { + "epoch": 0.87, + "learning_rate": 1.6684572313865634e-06, + "loss": 0.9219, + "step": 33821 + }, + { + "epoch": 0.87, + "learning_rate": 1.6684366512144434e-06, + "loss": 1.0596, + "step": 33822 + }, + { + "epoch": 0.87, + "learning_rate": 1.6684160705305321e-06, + "loss": 1.0381, + "step": 33823 + }, + { + "epoch": 0.87, + "learning_rate": 1.6683954893348457e-06, + "loss": 0.8975, + "step": 33824 + }, + { + "epoch": 0.87, + "learning_rate": 1.6683749076273991e-06, + "loss": 0.8574, + "step": 33825 + }, + { + "epoch": 0.87, + "learning_rate": 1.668354325408209e-06, + "loss": 0.8066, + "step": 33826 + }, + { + "epoch": 0.87, + "learning_rate": 1.6683337426772905e-06, + "loss": 0.7275, + "step": 33827 + }, + { + "epoch": 0.87, + "learning_rate": 1.6683131594346596e-06, + "loss": 0.7725, + "step": 33828 + }, + { + "epoch": 0.87, + "learning_rate": 1.668292575680332e-06, + "loss": 0.9004, + "step": 33829 + }, + { + "epoch": 0.87, + "learning_rate": 1.6682719914143237e-06, + "loss": 0.7031, + "step": 33830 + }, + { + "epoch": 0.87, + "learning_rate": 1.6682514066366502e-06, + "loss": 0.833, + "step": 33831 + }, + { + "epoch": 0.87, + "learning_rate": 1.6682308213473272e-06, + "loss": 0.9648, + "step": 33832 + }, + { + "epoch": 0.87, + "learning_rate": 1.6682102355463707e-06, + "loss": 0.9648, + "step": 33833 + }, + { + "epoch": 0.87, + "learning_rate": 1.6681896492337963e-06, + "loss": 0.8506, + "step": 33834 + }, + { + "epoch": 0.87, + "learning_rate": 1.6681690624096198e-06, + "loss": 0.8779, + "step": 33835 + }, + { + "epoch": 0.87, + "learning_rate": 1.668148475073857e-06, + "loss": 0.8389, + "step": 33836 + }, + { + "epoch": 0.87, + "learning_rate": 1.668127887226524e-06, + "loss": 0.623, + "step": 33837 + }, + { + "epoch": 0.87, + "learning_rate": 1.6681072988676355e-06, + "loss": 0.7891, + "step": 33838 + }, + { + "epoch": 0.87, + "learning_rate": 1.6680867099972082e-06, + "loss": 0.8828, + "step": 33839 + }, + { + "epoch": 0.87, + "learning_rate": 1.6680661206152577e-06, + "loss": 0.7158, + "step": 33840 + }, + { + "epoch": 0.87, + "learning_rate": 1.6680455307217997e-06, + "loss": 0.7144, + "step": 33841 + }, + { + "epoch": 0.87, + "learning_rate": 1.66802494031685e-06, + "loss": 0.96, + "step": 33842 + }, + { + "epoch": 0.87, + "learning_rate": 1.6680043494004244e-06, + "loss": 0.5376, + "step": 33843 + }, + { + "epoch": 0.87, + "learning_rate": 1.6679837579725385e-06, + "loss": 1.0137, + "step": 33844 + }, + { + "epoch": 0.87, + "learning_rate": 1.6679631660332079e-06, + "loss": 0.6233, + "step": 33845 + }, + { + "epoch": 0.87, + "learning_rate": 1.6679425735824488e-06, + "loss": 0.8779, + "step": 33846 + }, + { + "epoch": 0.87, + "learning_rate": 1.667921980620277e-06, + "loss": 0.8184, + "step": 33847 + }, + { + "epoch": 0.87, + "learning_rate": 1.6679013871467078e-06, + "loss": 0.915, + "step": 33848 + }, + { + "epoch": 0.87, + "learning_rate": 1.6678807931617573e-06, + "loss": 0.7607, + "step": 33849 + }, + { + "epoch": 0.87, + "learning_rate": 1.667860198665441e-06, + "loss": 0.8438, + "step": 33850 + }, + { + "epoch": 0.87, + "learning_rate": 1.667839603657775e-06, + "loss": 0.9355, + "step": 33851 + }, + { + "epoch": 0.87, + "learning_rate": 1.667819008138775e-06, + "loss": 0.8867, + "step": 33852 + }, + { + "epoch": 0.87, + "learning_rate": 1.6677984121084567e-06, + "loss": 0.8115, + "step": 33853 + }, + { + "epoch": 0.87, + "learning_rate": 1.6677778155668358e-06, + "loss": 0.6685, + "step": 33854 + }, + { + "epoch": 0.87, + "learning_rate": 1.667757218513928e-06, + "loss": 0.7603, + "step": 33855 + }, + { + "epoch": 0.87, + "learning_rate": 1.6677366209497495e-06, + "loss": 0.8027, + "step": 33856 + }, + { + "epoch": 0.87, + "learning_rate": 1.6677160228743157e-06, + "loss": 1.0596, + "step": 33857 + }, + { + "epoch": 0.87, + "learning_rate": 1.6676954242876425e-06, + "loss": 0.5299, + "step": 33858 + }, + { + "epoch": 0.87, + "learning_rate": 1.6676748251897453e-06, + "loss": 1.0693, + "step": 33859 + }, + { + "epoch": 0.87, + "learning_rate": 1.6676542255806402e-06, + "loss": 0.9697, + "step": 33860 + }, + { + "epoch": 0.87, + "learning_rate": 1.6676336254603432e-06, + "loss": 0.8474, + "step": 33861 + }, + { + "epoch": 0.87, + "learning_rate": 1.6676130248288698e-06, + "loss": 0.8271, + "step": 33862 + }, + { + "epoch": 0.87, + "learning_rate": 1.6675924236862357e-06, + "loss": 0.9268, + "step": 33863 + }, + { + "epoch": 0.87, + "learning_rate": 1.6675718220324568e-06, + "loss": 0.8008, + "step": 33864 + }, + { + "epoch": 0.87, + "learning_rate": 1.667551219867549e-06, + "loss": 0.9443, + "step": 33865 + }, + { + "epoch": 0.87, + "learning_rate": 1.6675306171915278e-06, + "loss": 0.9111, + "step": 33866 + }, + { + "epoch": 0.87, + "learning_rate": 1.6675100140044093e-06, + "loss": 0.9336, + "step": 33867 + }, + { + "epoch": 0.87, + "learning_rate": 1.6674894103062088e-06, + "loss": 1.0215, + "step": 33868 + }, + { + "epoch": 0.87, + "learning_rate": 1.6674688060969423e-06, + "loss": 0.8169, + "step": 33869 + }, + { + "epoch": 0.87, + "learning_rate": 1.6674482013766257e-06, + "loss": 0.9297, + "step": 33870 + }, + { + "epoch": 0.87, + "learning_rate": 1.667427596145275e-06, + "loss": 0.8677, + "step": 33871 + }, + { + "epoch": 0.87, + "learning_rate": 1.6674069904029053e-06, + "loss": 0.9277, + "step": 33872 + }, + { + "epoch": 0.87, + "learning_rate": 1.6673863841495327e-06, + "loss": 1.0693, + "step": 33873 + }, + { + "epoch": 0.87, + "learning_rate": 1.6673657773851732e-06, + "loss": 0.9473, + "step": 33874 + }, + { + "epoch": 0.87, + "learning_rate": 1.6673451701098427e-06, + "loss": 0.7285, + "step": 33875 + }, + { + "epoch": 0.87, + "learning_rate": 1.6673245623235563e-06, + "loss": 0.916, + "step": 33876 + }, + { + "epoch": 0.87, + "learning_rate": 1.6673039540263303e-06, + "loss": 0.6084, + "step": 33877 + }, + { + "epoch": 0.87, + "learning_rate": 1.6672833452181804e-06, + "loss": 1.0, + "step": 33878 + }, + { + "epoch": 0.87, + "learning_rate": 1.6672627358991222e-06, + "loss": 0.8564, + "step": 33879 + }, + { + "epoch": 0.87, + "learning_rate": 1.6672421260691717e-06, + "loss": 1.0342, + "step": 33880 + }, + { + "epoch": 0.87, + "learning_rate": 1.6672215157283445e-06, + "loss": 0.5425, + "step": 33881 + }, + { + "epoch": 0.87, + "learning_rate": 1.6672009048766567e-06, + "loss": 0.7812, + "step": 33882 + }, + { + "epoch": 0.87, + "learning_rate": 1.6671802935141237e-06, + "loss": 1.0332, + "step": 33883 + }, + { + "epoch": 0.87, + "learning_rate": 1.6671596816407614e-06, + "loss": 0.832, + "step": 33884 + }, + { + "epoch": 0.87, + "learning_rate": 1.6671390692565854e-06, + "loss": 0.6567, + "step": 33885 + }, + { + "epoch": 0.87, + "learning_rate": 1.6671184563616118e-06, + "loss": 1.0215, + "step": 33886 + }, + { + "epoch": 0.87, + "learning_rate": 1.6670978429558567e-06, + "loss": 0.916, + "step": 33887 + }, + { + "epoch": 0.87, + "learning_rate": 1.667077229039335e-06, + "loss": 0.9121, + "step": 33888 + }, + { + "epoch": 0.87, + "learning_rate": 1.667056614612063e-06, + "loss": 1.0938, + "step": 33889 + }, + { + "epoch": 0.87, + "learning_rate": 1.6670359996740567e-06, + "loss": 0.9668, + "step": 33890 + }, + { + "epoch": 0.87, + "learning_rate": 1.667015384225331e-06, + "loss": 0.7017, + "step": 33891 + }, + { + "epoch": 0.87, + "learning_rate": 1.6669947682659029e-06, + "loss": 0.959, + "step": 33892 + }, + { + "epoch": 0.87, + "learning_rate": 1.666974151795787e-06, + "loss": 0.7295, + "step": 33893 + }, + { + "epoch": 0.87, + "learning_rate": 1.6669535348150002e-06, + "loss": 0.7363, + "step": 33894 + }, + { + "epoch": 0.87, + "learning_rate": 1.6669329173235576e-06, + "loss": 0.8828, + "step": 33895 + }, + { + "epoch": 0.87, + "learning_rate": 1.666912299321475e-06, + "loss": 0.6953, + "step": 33896 + }, + { + "epoch": 0.87, + "learning_rate": 1.6668916808087684e-06, + "loss": 0.9268, + "step": 33897 + }, + { + "epoch": 0.87, + "learning_rate": 1.6668710617854535e-06, + "loss": 0.8457, + "step": 33898 + }, + { + "epoch": 0.87, + "learning_rate": 1.6668504422515462e-06, + "loss": 0.7227, + "step": 33899 + }, + { + "epoch": 0.87, + "learning_rate": 1.6668298222070623e-06, + "loss": 0.7246, + "step": 33900 + }, + { + "epoch": 0.87, + "learning_rate": 1.666809201652017e-06, + "loss": 0.6772, + "step": 33901 + }, + { + "epoch": 0.87, + "learning_rate": 1.6667885805864271e-06, + "loss": 0.96, + "step": 33902 + }, + { + "epoch": 0.87, + "learning_rate": 1.6667679590103073e-06, + "loss": 0.7852, + "step": 33903 + }, + { + "epoch": 0.87, + "learning_rate": 1.6667473369236742e-06, + "loss": 0.7329, + "step": 33904 + }, + { + "epoch": 0.87, + "learning_rate": 1.6667267143265433e-06, + "loss": 0.9072, + "step": 33905 + }, + { + "epoch": 0.87, + "learning_rate": 1.6667060912189305e-06, + "loss": 0.7114, + "step": 33906 + }, + { + "epoch": 0.87, + "learning_rate": 1.6666854676008515e-06, + "loss": 0.8096, + "step": 33907 + }, + { + "epoch": 0.87, + "learning_rate": 1.666664843472322e-06, + "loss": 0.8438, + "step": 33908 + }, + { + "epoch": 0.87, + "learning_rate": 1.6666442188333578e-06, + "loss": 0.5942, + "step": 33909 + }, + { + "epoch": 0.87, + "learning_rate": 1.6666235936839749e-06, + "loss": 0.8311, + "step": 33910 + }, + { + "epoch": 0.87, + "learning_rate": 1.666602968024189e-06, + "loss": 0.8318, + "step": 33911 + }, + { + "epoch": 0.87, + "learning_rate": 1.6665823418540157e-06, + "loss": 0.6421, + "step": 33912 + }, + { + "epoch": 0.87, + "learning_rate": 1.6665617151734713e-06, + "loss": 0.7598, + "step": 33913 + }, + { + "epoch": 0.87, + "learning_rate": 1.6665410879825708e-06, + "loss": 0.9072, + "step": 33914 + }, + { + "epoch": 0.87, + "learning_rate": 1.6665204602813305e-06, + "loss": 0.999, + "step": 33915 + }, + { + "epoch": 0.87, + "learning_rate": 1.6664998320697664e-06, + "loss": 0.9678, + "step": 33916 + }, + { + "epoch": 0.87, + "learning_rate": 1.666479203347894e-06, + "loss": 0.6821, + "step": 33917 + }, + { + "epoch": 0.87, + "learning_rate": 1.6664585741157288e-06, + "loss": 0.8281, + "step": 33918 + }, + { + "epoch": 0.87, + "learning_rate": 1.6664379443732873e-06, + "loss": 0.7358, + "step": 33919 + }, + { + "epoch": 0.87, + "learning_rate": 1.6664173141205846e-06, + "loss": 0.7783, + "step": 33920 + }, + { + "epoch": 0.87, + "learning_rate": 1.6663966833576368e-06, + "loss": 1.0078, + "step": 33921 + }, + { + "epoch": 0.87, + "learning_rate": 1.6663760520844598e-06, + "loss": 0.8311, + "step": 33922 + }, + { + "epoch": 0.87, + "learning_rate": 1.6663554203010695e-06, + "loss": 0.9355, + "step": 33923 + }, + { + "epoch": 0.87, + "learning_rate": 1.6663347880074814e-06, + "loss": 0.5664, + "step": 33924 + }, + { + "epoch": 0.87, + "learning_rate": 1.666314155203711e-06, + "loss": 0.999, + "step": 33925 + }, + { + "epoch": 0.87, + "learning_rate": 1.6662935218897748e-06, + "loss": 0.9346, + "step": 33926 + }, + { + "epoch": 0.87, + "learning_rate": 1.6662728880656886e-06, + "loss": 0.916, + "step": 33927 + }, + { + "epoch": 0.87, + "learning_rate": 1.6662522537314673e-06, + "loss": 1.0859, + "step": 33928 + }, + { + "epoch": 0.87, + "learning_rate": 1.6662316188871276e-06, + "loss": 0.6875, + "step": 33929 + }, + { + "epoch": 0.87, + "learning_rate": 1.666210983532685e-06, + "loss": 0.8066, + "step": 33930 + }, + { + "epoch": 0.87, + "learning_rate": 1.6661903476681553e-06, + "loss": 0.7222, + "step": 33931 + }, + { + "epoch": 0.87, + "learning_rate": 1.6661697112935543e-06, + "loss": 0.8008, + "step": 33932 + }, + { + "epoch": 0.87, + "learning_rate": 1.6661490744088975e-06, + "loss": 0.8169, + "step": 33933 + }, + { + "epoch": 0.87, + "learning_rate": 1.6661284370142013e-06, + "loss": 0.8252, + "step": 33934 + }, + { + "epoch": 0.87, + "learning_rate": 1.666107799109481e-06, + "loss": 0.7686, + "step": 33935 + }, + { + "epoch": 0.87, + "learning_rate": 1.6660871606947525e-06, + "loss": 0.7463, + "step": 33936 + }, + { + "epoch": 0.87, + "learning_rate": 1.666066521770032e-06, + "loss": 0.7617, + "step": 33937 + }, + { + "epoch": 0.87, + "learning_rate": 1.6660458823353348e-06, + "loss": 0.833, + "step": 33938 + }, + { + "epoch": 0.87, + "learning_rate": 1.666025242390677e-06, + "loss": 0.791, + "step": 33939 + }, + { + "epoch": 0.87, + "learning_rate": 1.6660046019360742e-06, + "loss": 0.7217, + "step": 33940 + }, + { + "epoch": 0.87, + "learning_rate": 1.6659839609715422e-06, + "loss": 0.9678, + "step": 33941 + }, + { + "epoch": 0.87, + "learning_rate": 1.6659633194970972e-06, + "loss": 0.8535, + "step": 33942 + }, + { + "epoch": 0.87, + "learning_rate": 1.6659426775127545e-06, + "loss": 0.8418, + "step": 33943 + }, + { + "epoch": 0.87, + "learning_rate": 1.6659220350185301e-06, + "loss": 0.832, + "step": 33944 + }, + { + "epoch": 0.87, + "learning_rate": 1.6659013920144398e-06, + "loss": 0.8916, + "step": 33945 + }, + { + "epoch": 0.87, + "learning_rate": 1.6658807485004995e-06, + "loss": 0.8408, + "step": 33946 + }, + { + "epoch": 0.87, + "learning_rate": 1.6658601044767249e-06, + "loss": 1.0762, + "step": 33947 + }, + { + "epoch": 0.87, + "learning_rate": 1.6658394599431321e-06, + "loss": 0.9434, + "step": 33948 + }, + { + "epoch": 0.87, + "learning_rate": 1.6658188148997362e-06, + "loss": 0.7783, + "step": 33949 + }, + { + "epoch": 0.87, + "learning_rate": 1.6657981693465536e-06, + "loss": 0.8252, + "step": 33950 + }, + { + "epoch": 0.87, + "learning_rate": 1.6657775232836e-06, + "loss": 0.7393, + "step": 33951 + }, + { + "epoch": 0.87, + "learning_rate": 1.6657568767108913e-06, + "loss": 1.0625, + "step": 33952 + }, + { + "epoch": 0.87, + "learning_rate": 1.665736229628443e-06, + "loss": 0.9893, + "step": 33953 + }, + { + "epoch": 0.87, + "learning_rate": 1.6657155820362712e-06, + "loss": 0.959, + "step": 33954 + }, + { + "epoch": 0.87, + "learning_rate": 1.6656949339343914e-06, + "loss": 0.7354, + "step": 33955 + }, + { + "epoch": 0.87, + "learning_rate": 1.6656742853228197e-06, + "loss": 0.7998, + "step": 33956 + }, + { + "epoch": 0.87, + "learning_rate": 1.6656536362015716e-06, + "loss": 0.6416, + "step": 33957 + }, + { + "epoch": 0.87, + "learning_rate": 1.6656329865706635e-06, + "loss": 0.8125, + "step": 33958 + }, + { + "epoch": 0.87, + "learning_rate": 1.6656123364301107e-06, + "loss": 0.7529, + "step": 33959 + }, + { + "epoch": 0.87, + "learning_rate": 1.665591685779929e-06, + "loss": 0.9512, + "step": 33960 + }, + { + "epoch": 0.87, + "learning_rate": 1.6655710346201346e-06, + "loss": 0.8252, + "step": 33961 + }, + { + "epoch": 0.87, + "learning_rate": 1.6655503829507426e-06, + "loss": 0.7881, + "step": 33962 + }, + { + "epoch": 0.87, + "learning_rate": 1.6655297307717697e-06, + "loss": 0.8213, + "step": 33963 + }, + { + "epoch": 0.87, + "learning_rate": 1.6655090780832312e-06, + "loss": 0.686, + "step": 33964 + }, + { + "epoch": 0.87, + "learning_rate": 1.6654884248851428e-06, + "loss": 0.9434, + "step": 33965 + }, + { + "epoch": 0.87, + "learning_rate": 1.6654677711775208e-06, + "loss": 0.6631, + "step": 33966 + }, + { + "epoch": 0.87, + "learning_rate": 1.6654471169603808e-06, + "loss": 0.9507, + "step": 33967 + }, + { + "epoch": 0.87, + "learning_rate": 1.6654264622337384e-06, + "loss": 0.9062, + "step": 33968 + }, + { + "epoch": 0.87, + "learning_rate": 1.6654058069976094e-06, + "loss": 0.9453, + "step": 33969 + }, + { + "epoch": 0.87, + "learning_rate": 1.6653851512520099e-06, + "loss": 0.6138, + "step": 33970 + }, + { + "epoch": 0.87, + "learning_rate": 1.6653644949969554e-06, + "loss": 0.7046, + "step": 33971 + }, + { + "epoch": 0.87, + "learning_rate": 1.6653438382324622e-06, + "loss": 0.9141, + "step": 33972 + }, + { + "epoch": 0.87, + "learning_rate": 1.6653231809585457e-06, + "loss": 0.6384, + "step": 33973 + }, + { + "epoch": 0.87, + "learning_rate": 1.6653025231752218e-06, + "loss": 0.9229, + "step": 33974 + }, + { + "epoch": 0.87, + "learning_rate": 1.6652818648825063e-06, + "loss": 0.8887, + "step": 33975 + }, + { + "epoch": 0.87, + "learning_rate": 1.665261206080415e-06, + "loss": 0.8008, + "step": 33976 + }, + { + "epoch": 0.87, + "learning_rate": 1.6652405467689641e-06, + "loss": 0.96, + "step": 33977 + }, + { + "epoch": 0.87, + "learning_rate": 1.665219886948169e-06, + "loss": 0.668, + "step": 33978 + }, + { + "epoch": 0.87, + "learning_rate": 1.6651992266180455e-06, + "loss": 1.0566, + "step": 33979 + }, + { + "epoch": 0.87, + "learning_rate": 1.6651785657786094e-06, + "loss": 1.0625, + "step": 33980 + }, + { + "epoch": 0.87, + "learning_rate": 1.665157904429877e-06, + "loss": 1.0889, + "step": 33981 + }, + { + "epoch": 0.87, + "learning_rate": 1.6651372425718634e-06, + "loss": 0.751, + "step": 33982 + }, + { + "epoch": 0.87, + "learning_rate": 1.665116580204585e-06, + "loss": 0.7549, + "step": 33983 + }, + { + "epoch": 0.87, + "learning_rate": 1.6650959173280574e-06, + "loss": 0.6484, + "step": 33984 + }, + { + "epoch": 0.87, + "learning_rate": 1.6650752539422965e-06, + "loss": 0.7437, + "step": 33985 + }, + { + "epoch": 0.87, + "learning_rate": 1.665054590047318e-06, + "loss": 0.917, + "step": 33986 + }, + { + "epoch": 0.87, + "learning_rate": 1.6650339256431378e-06, + "loss": 0.9414, + "step": 33987 + }, + { + "epoch": 0.87, + "learning_rate": 1.6650132607297718e-06, + "loss": 0.6943, + "step": 33988 + }, + { + "epoch": 0.87, + "learning_rate": 1.6649925953072357e-06, + "loss": 0.9365, + "step": 33989 + }, + { + "epoch": 0.87, + "learning_rate": 1.664971929375545e-06, + "loss": 0.8594, + "step": 33990 + }, + { + "epoch": 0.87, + "learning_rate": 1.6649512629347163e-06, + "loss": 0.9658, + "step": 33991 + }, + { + "epoch": 0.87, + "learning_rate": 1.664930595984765e-06, + "loss": 0.9561, + "step": 33992 + }, + { + "epoch": 0.87, + "learning_rate": 1.6649099285257067e-06, + "loss": 1.0322, + "step": 33993 + }, + { + "epoch": 0.87, + "learning_rate": 1.6648892605575573e-06, + "loss": 0.8853, + "step": 33994 + }, + { + "epoch": 0.87, + "learning_rate": 1.664868592080333e-06, + "loss": 0.8916, + "step": 33995 + }, + { + "epoch": 0.87, + "learning_rate": 1.6648479230940493e-06, + "loss": 0.9141, + "step": 33996 + }, + { + "epoch": 0.87, + "learning_rate": 1.6648272535987223e-06, + "loss": 0.6904, + "step": 33997 + }, + { + "epoch": 0.87, + "learning_rate": 1.6648065835943674e-06, + "loss": 0.9785, + "step": 33998 + }, + { + "epoch": 0.87, + "learning_rate": 1.6647859130810007e-06, + "loss": 0.8418, + "step": 33999 + }, + { + "epoch": 0.87, + "learning_rate": 1.6647652420586382e-06, + "loss": 0.7588, + "step": 34000 + }, + { + "epoch": 0.87, + "learning_rate": 1.6647445705272954e-06, + "loss": 0.8711, + "step": 34001 + }, + { + "epoch": 0.87, + "learning_rate": 1.6647238984869883e-06, + "loss": 0.7607, + "step": 34002 + }, + { + "epoch": 0.87, + "learning_rate": 1.6647032259377327e-06, + "loss": 0.6333, + "step": 34003 + }, + { + "epoch": 0.87, + "learning_rate": 1.6646825528795443e-06, + "loss": 0.9658, + "step": 34004 + }, + { + "epoch": 0.87, + "learning_rate": 1.664661879312439e-06, + "loss": 0.7729, + "step": 34005 + }, + { + "epoch": 0.87, + "learning_rate": 1.6646412052364327e-06, + "loss": 1.0166, + "step": 34006 + }, + { + "epoch": 0.87, + "learning_rate": 1.664620530651541e-06, + "loss": 0.7549, + "step": 34007 + }, + { + "epoch": 0.87, + "learning_rate": 1.6645998555577802e-06, + "loss": 1.0312, + "step": 34008 + }, + { + "epoch": 0.87, + "learning_rate": 1.6645791799551657e-06, + "loss": 0.9775, + "step": 34009 + }, + { + "epoch": 0.87, + "learning_rate": 1.6645585038437135e-06, + "loss": 0.7969, + "step": 34010 + }, + { + "epoch": 0.87, + "learning_rate": 1.6645378272234397e-06, + "loss": 0.9482, + "step": 34011 + }, + { + "epoch": 0.87, + "learning_rate": 1.6645171500943595e-06, + "loss": 0.8633, + "step": 34012 + }, + { + "epoch": 0.87, + "learning_rate": 1.6644964724564892e-06, + "loss": 0.8887, + "step": 34013 + }, + { + "epoch": 0.87, + "learning_rate": 1.6644757943098444e-06, + "loss": 0.917, + "step": 34014 + }, + { + "epoch": 0.87, + "learning_rate": 1.664455115654441e-06, + "loss": 0.5789, + "step": 34015 + }, + { + "epoch": 0.87, + "learning_rate": 1.6644344364902952e-06, + "loss": 0.8613, + "step": 34016 + }, + { + "epoch": 0.87, + "learning_rate": 1.6644137568174224e-06, + "loss": 0.8752, + "step": 34017 + }, + { + "epoch": 0.87, + "learning_rate": 1.6643930766358382e-06, + "loss": 0.9766, + "step": 34018 + }, + { + "epoch": 0.87, + "learning_rate": 1.6643723959455592e-06, + "loss": 1.0459, + "step": 34019 + }, + { + "epoch": 0.87, + "learning_rate": 1.6643517147466003e-06, + "loss": 0.8613, + "step": 34020 + }, + { + "epoch": 0.87, + "learning_rate": 1.6643310330389785e-06, + "loss": 0.7397, + "step": 34021 + }, + { + "epoch": 0.87, + "learning_rate": 1.6643103508227084e-06, + "loss": 0.7778, + "step": 34022 + }, + { + "epoch": 0.87, + "learning_rate": 1.6642896680978068e-06, + "loss": 0.9375, + "step": 34023 + }, + { + "epoch": 0.87, + "learning_rate": 1.664268984864289e-06, + "loss": 0.6675, + "step": 34024 + }, + { + "epoch": 0.87, + "learning_rate": 1.6642483011221708e-06, + "loss": 0.7339, + "step": 34025 + }, + { + "epoch": 0.87, + "learning_rate": 1.6642276168714685e-06, + "loss": 0.96, + "step": 34026 + }, + { + "epoch": 0.87, + "learning_rate": 1.6642069321121974e-06, + "loss": 1.0088, + "step": 34027 + }, + { + "epoch": 0.87, + "learning_rate": 1.6641862468443737e-06, + "loss": 0.8916, + "step": 34028 + }, + { + "epoch": 0.87, + "learning_rate": 1.6641655610680131e-06, + "loss": 0.8584, + "step": 34029 + }, + { + "epoch": 0.87, + "learning_rate": 1.6641448747831315e-06, + "loss": 1.0181, + "step": 34030 + }, + { + "epoch": 0.87, + "learning_rate": 1.6641241879897447e-06, + "loss": 0.9648, + "step": 34031 + }, + { + "epoch": 0.87, + "learning_rate": 1.6641035006878688e-06, + "loss": 0.79, + "step": 34032 + }, + { + "epoch": 0.87, + "learning_rate": 1.6640828128775191e-06, + "loss": 0.6348, + "step": 34033 + }, + { + "epoch": 0.87, + "learning_rate": 1.6640621245587117e-06, + "loss": 0.9678, + "step": 34034 + }, + { + "epoch": 0.87, + "learning_rate": 1.6640414357314624e-06, + "loss": 0.8047, + "step": 34035 + }, + { + "epoch": 0.87, + "learning_rate": 1.6640207463957873e-06, + "loss": 0.8896, + "step": 34036 + }, + { + "epoch": 0.87, + "learning_rate": 1.6640000565517023e-06, + "loss": 0.9243, + "step": 34037 + }, + { + "epoch": 0.87, + "learning_rate": 1.6639793661992228e-06, + "loss": 0.8525, + "step": 34038 + }, + { + "epoch": 0.87, + "learning_rate": 1.6639586753383645e-06, + "loss": 0.6357, + "step": 34039 + }, + { + "epoch": 0.87, + "learning_rate": 1.6639379839691437e-06, + "loss": 0.9033, + "step": 34040 + }, + { + "epoch": 0.87, + "learning_rate": 1.6639172920915762e-06, + "loss": 0.833, + "step": 34041 + }, + { + "epoch": 0.87, + "learning_rate": 1.6638965997056779e-06, + "loss": 0.8906, + "step": 34042 + }, + { + "epoch": 0.87, + "learning_rate": 1.6638759068114645e-06, + "loss": 0.752, + "step": 34043 + }, + { + "epoch": 0.87, + "learning_rate": 1.6638552134089517e-06, + "loss": 0.707, + "step": 34044 + }, + { + "epoch": 0.87, + "learning_rate": 1.6638345194981553e-06, + "loss": 0.6777, + "step": 34045 + }, + { + "epoch": 0.87, + "learning_rate": 1.6638138250790916e-06, + "loss": 0.9043, + "step": 34046 + }, + { + "epoch": 0.87, + "learning_rate": 1.663793130151776e-06, + "loss": 0.9619, + "step": 34047 + }, + { + "epoch": 0.87, + "learning_rate": 1.6637724347162248e-06, + "loss": 0.7744, + "step": 34048 + }, + { + "epoch": 0.87, + "learning_rate": 1.6637517387724533e-06, + "loss": 0.9014, + "step": 34049 + }, + { + "epoch": 0.87, + "learning_rate": 1.6637310423204779e-06, + "loss": 0.8701, + "step": 34050 + }, + { + "epoch": 0.87, + "learning_rate": 1.6637103453603138e-06, + "loss": 0.7043, + "step": 34051 + }, + { + "epoch": 0.87, + "learning_rate": 1.6636896478919774e-06, + "loss": 0.7773, + "step": 34052 + }, + { + "epoch": 0.87, + "learning_rate": 1.6636689499154844e-06, + "loss": 0.8462, + "step": 34053 + }, + { + "epoch": 0.87, + "learning_rate": 1.6636482514308506e-06, + "loss": 1.0635, + "step": 34054 + }, + { + "epoch": 0.87, + "learning_rate": 1.6636275524380916e-06, + "loss": 0.8379, + "step": 34055 + }, + { + "epoch": 0.87, + "learning_rate": 1.6636068529372237e-06, + "loss": 0.7974, + "step": 34056 + }, + { + "epoch": 0.87, + "learning_rate": 1.6635861529282626e-06, + "loss": 0.8867, + "step": 34057 + }, + { + "epoch": 0.87, + "learning_rate": 1.6635654524112242e-06, + "loss": 0.8604, + "step": 34058 + }, + { + "epoch": 0.87, + "learning_rate": 1.6635447513861238e-06, + "loss": 0.8193, + "step": 34059 + }, + { + "epoch": 0.87, + "learning_rate": 1.663524049852978e-06, + "loss": 0.7178, + "step": 34060 + }, + { + "epoch": 0.87, + "learning_rate": 1.6635033478118023e-06, + "loss": 0.7812, + "step": 34061 + }, + { + "epoch": 0.87, + "learning_rate": 1.6634826452626127e-06, + "loss": 0.8994, + "step": 34062 + }, + { + "epoch": 0.87, + "learning_rate": 1.663461942205425e-06, + "loss": 0.6953, + "step": 34063 + }, + { + "epoch": 0.87, + "learning_rate": 1.6634412386402548e-06, + "loss": 0.9189, + "step": 34064 + }, + { + "epoch": 0.87, + "learning_rate": 1.663420534567118e-06, + "loss": 0.7246, + "step": 34065 + }, + { + "epoch": 0.87, + "learning_rate": 1.663399829986031e-06, + "loss": 0.9111, + "step": 34066 + }, + { + "epoch": 0.87, + "learning_rate": 1.663379124897009e-06, + "loss": 0.874, + "step": 34067 + }, + { + "epoch": 0.87, + "learning_rate": 1.663358419300068e-06, + "loss": 1.0352, + "step": 34068 + }, + { + "epoch": 0.87, + "learning_rate": 1.6633377131952245e-06, + "loss": 0.6226, + "step": 34069 + }, + { + "epoch": 0.87, + "learning_rate": 1.6633170065824932e-06, + "loss": 1.1113, + "step": 34070 + }, + { + "epoch": 0.87, + "learning_rate": 1.6632962994618907e-06, + "loss": 0.9434, + "step": 34071 + }, + { + "epoch": 0.87, + "learning_rate": 1.6632755918334329e-06, + "loss": 1.0732, + "step": 34072 + }, + { + "epoch": 0.87, + "learning_rate": 1.6632548836971354e-06, + "loss": 0.9053, + "step": 34073 + }, + { + "epoch": 0.87, + "learning_rate": 1.663234175053014e-06, + "loss": 1.0576, + "step": 34074 + }, + { + "epoch": 0.87, + "learning_rate": 1.663213465901085e-06, + "loss": 1.0049, + "step": 34075 + }, + { + "epoch": 0.87, + "learning_rate": 1.6631927562413637e-06, + "loss": 0.7427, + "step": 34076 + }, + { + "epoch": 0.87, + "learning_rate": 1.6631720460738664e-06, + "loss": 0.7285, + "step": 34077 + }, + { + "epoch": 0.87, + "learning_rate": 1.6631513353986084e-06, + "loss": 0.8486, + "step": 34078 + }, + { + "epoch": 0.87, + "learning_rate": 1.6631306242156062e-06, + "loss": 0.8682, + "step": 34079 + }, + { + "epoch": 0.87, + "learning_rate": 1.6631099125248754e-06, + "loss": 0.7439, + "step": 34080 + }, + { + "epoch": 0.87, + "learning_rate": 1.6630892003264317e-06, + "loss": 0.8428, + "step": 34081 + }, + { + "epoch": 0.87, + "learning_rate": 1.6630684876202913e-06, + "loss": 0.9795, + "step": 34082 + }, + { + "epoch": 0.87, + "learning_rate": 1.6630477744064698e-06, + "loss": 0.8501, + "step": 34083 + }, + { + "epoch": 0.87, + "learning_rate": 1.6630270606849827e-06, + "loss": 0.835, + "step": 34084 + }, + { + "epoch": 0.87, + "learning_rate": 1.6630063464558466e-06, + "loss": 0.8242, + "step": 34085 + }, + { + "epoch": 0.87, + "learning_rate": 1.6629856317190768e-06, + "loss": 0.6221, + "step": 34086 + }, + { + "epoch": 0.87, + "learning_rate": 1.66296491647469e-06, + "loss": 0.9678, + "step": 34087 + }, + { + "epoch": 0.87, + "learning_rate": 1.6629442007227008e-06, + "loss": 0.8555, + "step": 34088 + }, + { + "epoch": 0.87, + "learning_rate": 1.662923484463126e-06, + "loss": 0.8154, + "step": 34089 + }, + { + "epoch": 0.87, + "learning_rate": 1.6629027676959811e-06, + "loss": 0.8643, + "step": 34090 + }, + { + "epoch": 0.87, + "learning_rate": 1.6628820504212819e-06, + "loss": 0.7344, + "step": 34091 + }, + { + "epoch": 0.87, + "learning_rate": 1.6628613326390446e-06, + "loss": 0.647, + "step": 34092 + }, + { + "epoch": 0.87, + "learning_rate": 1.6628406143492848e-06, + "loss": 0.8379, + "step": 34093 + }, + { + "epoch": 0.87, + "learning_rate": 1.6628198955520184e-06, + "loss": 0.9717, + "step": 34094 + }, + { + "epoch": 0.87, + "learning_rate": 1.6627991762472614e-06, + "loss": 0.8154, + "step": 34095 + }, + { + "epoch": 0.87, + "learning_rate": 1.6627784564350291e-06, + "loss": 1.0293, + "step": 34096 + }, + { + "epoch": 0.87, + "learning_rate": 1.6627577361153383e-06, + "loss": 0.6709, + "step": 34097 + }, + { + "epoch": 0.87, + "learning_rate": 1.6627370152882043e-06, + "loss": 0.9238, + "step": 34098 + }, + { + "epoch": 0.87, + "learning_rate": 1.6627162939536427e-06, + "loss": 0.6348, + "step": 34099 + }, + { + "epoch": 0.87, + "learning_rate": 1.66269557211167e-06, + "loss": 0.7671, + "step": 34100 + }, + { + "epoch": 0.87, + "learning_rate": 1.6626748497623018e-06, + "loss": 0.8916, + "step": 34101 + }, + { + "epoch": 0.87, + "learning_rate": 1.6626541269055538e-06, + "loss": 0.8242, + "step": 34102 + }, + { + "epoch": 0.87, + "learning_rate": 1.6626334035414422e-06, + "loss": 1.0605, + "step": 34103 + }, + { + "epoch": 0.87, + "learning_rate": 1.6626126796699826e-06, + "loss": 0.7861, + "step": 34104 + }, + { + "epoch": 0.87, + "learning_rate": 1.662591955291191e-06, + "loss": 0.5156, + "step": 34105 + }, + { + "epoch": 0.87, + "learning_rate": 1.6625712304050827e-06, + "loss": 0.957, + "step": 34106 + }, + { + "epoch": 0.87, + "learning_rate": 1.6625505050116745e-06, + "loss": 0.5942, + "step": 34107 + }, + { + "epoch": 0.87, + "learning_rate": 1.662529779110982e-06, + "loss": 1.0264, + "step": 34108 + }, + { + "epoch": 0.87, + "learning_rate": 1.6625090527030208e-06, + "loss": 0.7505, + "step": 34109 + }, + { + "epoch": 0.87, + "learning_rate": 1.6624883257878066e-06, + "loss": 0.9502, + "step": 34110 + }, + { + "epoch": 0.87, + "learning_rate": 1.6624675983653558e-06, + "loss": 0.9355, + "step": 34111 + }, + { + "epoch": 0.87, + "learning_rate": 1.662446870435684e-06, + "loss": 1.0059, + "step": 34112 + }, + { + "epoch": 0.87, + "learning_rate": 1.6624261419988073e-06, + "loss": 0.8018, + "step": 34113 + }, + { + "epoch": 0.87, + "learning_rate": 1.6624054130547412e-06, + "loss": 0.9443, + "step": 34114 + }, + { + "epoch": 0.87, + "learning_rate": 1.6623846836035014e-06, + "loss": 0.8203, + "step": 34115 + }, + { + "epoch": 0.87, + "learning_rate": 1.6623639536451045e-06, + "loss": 0.8438, + "step": 34116 + }, + { + "epoch": 0.87, + "learning_rate": 1.6623432231795658e-06, + "loss": 0.6953, + "step": 34117 + }, + { + "epoch": 0.87, + "learning_rate": 1.6623224922069014e-06, + "loss": 0.8013, + "step": 34118 + }, + { + "epoch": 0.87, + "learning_rate": 1.662301760727127e-06, + "loss": 0.9941, + "step": 34119 + }, + { + "epoch": 0.87, + "learning_rate": 1.6622810287402587e-06, + "loss": 1.0205, + "step": 34120 + }, + { + "epoch": 0.87, + "learning_rate": 1.6622602962463124e-06, + "loss": 0.8984, + "step": 34121 + }, + { + "epoch": 0.87, + "learning_rate": 1.6622395632453037e-06, + "loss": 0.8223, + "step": 34122 + }, + { + "epoch": 0.87, + "learning_rate": 1.6622188297372485e-06, + "loss": 0.7815, + "step": 34123 + }, + { + "epoch": 0.87, + "learning_rate": 1.662198095722163e-06, + "loss": 0.7271, + "step": 34124 + }, + { + "epoch": 0.87, + "learning_rate": 1.662177361200063e-06, + "loss": 0.7939, + "step": 34125 + }, + { + "epoch": 0.87, + "learning_rate": 1.6621566261709638e-06, + "loss": 0.9912, + "step": 34126 + }, + { + "epoch": 0.87, + "learning_rate": 1.6621358906348822e-06, + "loss": 0.8447, + "step": 34127 + }, + { + "epoch": 0.87, + "learning_rate": 1.6621151545918332e-06, + "loss": 0.7881, + "step": 34128 + }, + { + "epoch": 0.87, + "learning_rate": 1.6620944180418333e-06, + "loss": 0.8186, + "step": 34129 + }, + { + "epoch": 0.87, + "learning_rate": 1.6620736809848981e-06, + "loss": 0.7485, + "step": 34130 + }, + { + "epoch": 0.87, + "learning_rate": 1.6620529434210436e-06, + "loss": 0.6404, + "step": 34131 + }, + { + "epoch": 0.87, + "learning_rate": 1.6620322053502854e-06, + "loss": 0.6953, + "step": 34132 + }, + { + "epoch": 0.87, + "learning_rate": 1.6620114667726398e-06, + "loss": 0.9365, + "step": 34133 + }, + { + "epoch": 0.87, + "learning_rate": 1.661990727688122e-06, + "loss": 0.7266, + "step": 34134 + }, + { + "epoch": 0.87, + "learning_rate": 1.6619699880967489e-06, + "loss": 0.6877, + "step": 34135 + }, + { + "epoch": 0.87, + "learning_rate": 1.6619492479985355e-06, + "loss": 0.7134, + "step": 34136 + }, + { + "epoch": 0.87, + "learning_rate": 1.6619285073934981e-06, + "loss": 0.8276, + "step": 34137 + }, + { + "epoch": 0.87, + "learning_rate": 1.6619077662816526e-06, + "loss": 0.8906, + "step": 34138 + }, + { + "epoch": 0.88, + "learning_rate": 1.6618870246630145e-06, + "loss": 0.79, + "step": 34139 + }, + { + "epoch": 0.88, + "learning_rate": 1.6618662825376002e-06, + "loss": 0.6687, + "step": 34140 + }, + { + "epoch": 0.88, + "learning_rate": 1.6618455399054251e-06, + "loss": 1.0576, + "step": 34141 + }, + { + "epoch": 0.88, + "learning_rate": 1.6618247967665054e-06, + "loss": 1.1064, + "step": 34142 + }, + { + "epoch": 0.88, + "learning_rate": 1.661804053120857e-06, + "loss": 0.9277, + "step": 34143 + }, + { + "epoch": 0.88, + "learning_rate": 1.6617833089684955e-06, + "loss": 0.7563, + "step": 34144 + }, + { + "epoch": 0.88, + "learning_rate": 1.6617625643094369e-06, + "loss": 0.8604, + "step": 34145 + }, + { + "epoch": 0.88, + "learning_rate": 1.6617418191436973e-06, + "loss": 0.6997, + "step": 34146 + }, + { + "epoch": 0.88, + "learning_rate": 1.6617210734712923e-06, + "loss": 0.5957, + "step": 34147 + }, + { + "epoch": 0.88, + "learning_rate": 1.661700327292238e-06, + "loss": 0.9844, + "step": 34148 + }, + { + "epoch": 0.88, + "learning_rate": 1.6616795806065503e-06, + "loss": 0.6543, + "step": 34149 + }, + { + "epoch": 0.88, + "learning_rate": 1.6616588334142448e-06, + "loss": 0.6042, + "step": 34150 + }, + { + "epoch": 0.88, + "learning_rate": 1.6616380857153374e-06, + "loss": 0.9121, + "step": 34151 + }, + { + "epoch": 0.88, + "learning_rate": 1.6616173375098444e-06, + "loss": 1.043, + "step": 34152 + }, + { + "epoch": 0.88, + "learning_rate": 1.6615965887977812e-06, + "loss": 0.731, + "step": 34153 + }, + { + "epoch": 0.88, + "learning_rate": 1.6615758395791639e-06, + "loss": 0.8926, + "step": 34154 + }, + { + "epoch": 0.88, + "learning_rate": 1.6615550898540084e-06, + "loss": 0.8369, + "step": 34155 + }, + { + "epoch": 0.88, + "learning_rate": 1.661534339622331e-06, + "loss": 1.0859, + "step": 34156 + }, + { + "epoch": 0.88, + "learning_rate": 1.661513588884147e-06, + "loss": 0.8408, + "step": 34157 + }, + { + "epoch": 0.88, + "learning_rate": 1.6614928376394722e-06, + "loss": 0.8857, + "step": 34158 + }, + { + "epoch": 0.88, + "learning_rate": 1.6614720858883228e-06, + "loss": 0.8896, + "step": 34159 + }, + { + "epoch": 0.88, + "learning_rate": 1.661451333630715e-06, + "loss": 0.9717, + "step": 34160 + }, + { + "epoch": 0.88, + "learning_rate": 1.6614305808666643e-06, + "loss": 0.7896, + "step": 34161 + }, + { + "epoch": 0.88, + "learning_rate": 1.661409827596186e-06, + "loss": 0.7031, + "step": 34162 + }, + { + "epoch": 0.88, + "learning_rate": 1.661389073819297e-06, + "loss": 0.7808, + "step": 34163 + }, + { + "epoch": 0.88, + "learning_rate": 1.6613683195360129e-06, + "loss": 0.771, + "step": 34164 + }, + { + "epoch": 0.88, + "learning_rate": 1.6613475647463494e-06, + "loss": 0.6191, + "step": 34165 + }, + { + "epoch": 0.88, + "learning_rate": 1.6613268094503226e-06, + "loss": 0.8545, + "step": 34166 + }, + { + "epoch": 0.88, + "learning_rate": 1.661306053647948e-06, + "loss": 0.9385, + "step": 34167 + }, + { + "epoch": 0.88, + "learning_rate": 1.661285297339242e-06, + "loss": 0.999, + "step": 34168 + }, + { + "epoch": 0.88, + "learning_rate": 1.66126454052422e-06, + "loss": 1.0996, + "step": 34169 + }, + { + "epoch": 0.88, + "learning_rate": 1.6612437832028982e-06, + "loss": 0.7837, + "step": 34170 + }, + { + "epoch": 0.88, + "learning_rate": 1.661223025375293e-06, + "loss": 0.8516, + "step": 34171 + }, + { + "epoch": 0.88, + "learning_rate": 1.661202267041419e-06, + "loss": 0.73, + "step": 34172 + }, + { + "epoch": 0.88, + "learning_rate": 1.6611815082012933e-06, + "loss": 0.9048, + "step": 34173 + }, + { + "epoch": 0.88, + "learning_rate": 1.661160748854931e-06, + "loss": 0.8672, + "step": 34174 + }, + { + "epoch": 0.88, + "learning_rate": 1.6611399890023484e-06, + "loss": 0.8096, + "step": 34175 + }, + { + "epoch": 0.88, + "learning_rate": 1.6611192286435616e-06, + "loss": 0.8022, + "step": 34176 + }, + { + "epoch": 0.88, + "learning_rate": 1.661098467778586e-06, + "loss": 0.9033, + "step": 34177 + }, + { + "epoch": 0.88, + "learning_rate": 1.6610777064074376e-06, + "loss": 0.8154, + "step": 34178 + }, + { + "epoch": 0.88, + "learning_rate": 1.661056944530132e-06, + "loss": 0.7136, + "step": 34179 + }, + { + "epoch": 0.88, + "learning_rate": 1.6610361821466862e-06, + "loss": 1.0117, + "step": 34180 + }, + { + "epoch": 0.88, + "learning_rate": 1.6610154192571151e-06, + "loss": 0.8477, + "step": 34181 + }, + { + "epoch": 0.88, + "learning_rate": 1.6609946558614349e-06, + "loss": 0.9355, + "step": 34182 + }, + { + "epoch": 0.88, + "learning_rate": 1.6609738919596616e-06, + "loss": 1.0488, + "step": 34183 + }, + { + "epoch": 0.88, + "learning_rate": 1.660953127551811e-06, + "loss": 0.7666, + "step": 34184 + }, + { + "epoch": 0.88, + "learning_rate": 1.6609323626378987e-06, + "loss": 0.729, + "step": 34185 + }, + { + "epoch": 0.88, + "learning_rate": 1.6609115972179412e-06, + "loss": 0.791, + "step": 34186 + }, + { + "epoch": 0.88, + "learning_rate": 1.660890831291954e-06, + "loss": 1.0225, + "step": 34187 + }, + { + "epoch": 0.88, + "learning_rate": 1.660870064859953e-06, + "loss": 0.731, + "step": 34188 + }, + { + "epoch": 0.88, + "learning_rate": 1.660849297921954e-06, + "loss": 0.9365, + "step": 34189 + }, + { + "epoch": 0.88, + "learning_rate": 1.6608285304779735e-06, + "loss": 0.8525, + "step": 34190 + }, + { + "epoch": 0.88, + "learning_rate": 1.6608077625280266e-06, + "loss": 0.7441, + "step": 34191 + }, + { + "epoch": 0.88, + "learning_rate": 1.6607869940721298e-06, + "loss": 0.7393, + "step": 34192 + }, + { + "epoch": 0.88, + "learning_rate": 1.6607662251102988e-06, + "loss": 0.8564, + "step": 34193 + }, + { + "epoch": 0.88, + "learning_rate": 1.6607454556425493e-06, + "loss": 0.9609, + "step": 34194 + }, + { + "epoch": 0.88, + "learning_rate": 1.6607246856688974e-06, + "loss": 1.0518, + "step": 34195 + }, + { + "epoch": 0.88, + "learning_rate": 1.6607039151893592e-06, + "loss": 1.1182, + "step": 34196 + }, + { + "epoch": 0.88, + "learning_rate": 1.6606831442039504e-06, + "loss": 0.8984, + "step": 34197 + }, + { + "epoch": 0.88, + "learning_rate": 1.6606623727126867e-06, + "loss": 0.8828, + "step": 34198 + }, + { + "epoch": 0.88, + "learning_rate": 1.6606416007155844e-06, + "loss": 0.748, + "step": 34199 + }, + { + "epoch": 0.88, + "learning_rate": 1.6606208282126588e-06, + "loss": 1.0342, + "step": 34200 + }, + { + "epoch": 0.88, + "learning_rate": 1.6606000552039267e-06, + "loss": 0.6328, + "step": 34201 + }, + { + "epoch": 0.88, + "learning_rate": 1.660579281689403e-06, + "loss": 0.6836, + "step": 34202 + }, + { + "epoch": 0.88, + "learning_rate": 1.6605585076691048e-06, + "loss": 0.8516, + "step": 34203 + }, + { + "epoch": 0.88, + "learning_rate": 1.6605377331430467e-06, + "loss": 0.79, + "step": 34204 + }, + { + "epoch": 0.88, + "learning_rate": 1.6605169581112454e-06, + "loss": 1.0596, + "step": 34205 + }, + { + "epoch": 0.88, + "learning_rate": 1.6604961825737167e-06, + "loss": 0.9004, + "step": 34206 + }, + { + "epoch": 0.88, + "learning_rate": 1.6604754065304768e-06, + "loss": 0.8594, + "step": 34207 + }, + { + "epoch": 0.88, + "learning_rate": 1.6604546299815408e-06, + "loss": 0.8311, + "step": 34208 + }, + { + "epoch": 0.88, + "learning_rate": 1.6604338529269249e-06, + "loss": 0.8252, + "step": 34209 + }, + { + "epoch": 0.88, + "learning_rate": 1.6604130753666455e-06, + "loss": 0.8525, + "step": 34210 + }, + { + "epoch": 0.88, + "learning_rate": 1.660392297300718e-06, + "loss": 0.9473, + "step": 34211 + }, + { + "epoch": 0.88, + "learning_rate": 1.6603715187291586e-06, + "loss": 0.8445, + "step": 34212 + }, + { + "epoch": 0.88, + "learning_rate": 1.6603507396519832e-06, + "loss": 0.8271, + "step": 34213 + }, + { + "epoch": 0.88, + "learning_rate": 1.6603299600692073e-06, + "loss": 1.0713, + "step": 34214 + }, + { + "epoch": 0.88, + "learning_rate": 1.6603091799808474e-06, + "loss": 0.812, + "step": 34215 + }, + { + "epoch": 0.88, + "learning_rate": 1.6602883993869191e-06, + "loss": 0.9717, + "step": 34216 + }, + { + "epoch": 0.88, + "learning_rate": 1.6602676182874382e-06, + "loss": 0.6768, + "step": 34217 + }, + { + "epoch": 0.88, + "learning_rate": 1.6602468366824206e-06, + "loss": 0.8789, + "step": 34218 + }, + { + "epoch": 0.88, + "learning_rate": 1.6602260545718826e-06, + "loss": 0.7695, + "step": 34219 + }, + { + "epoch": 0.88, + "learning_rate": 1.66020527195584e-06, + "loss": 0.8662, + "step": 34220 + }, + { + "epoch": 0.88, + "learning_rate": 1.6601844888343085e-06, + "loss": 1.041, + "step": 34221 + }, + { + "epoch": 0.88, + "learning_rate": 1.6601637052073039e-06, + "loss": 0.6768, + "step": 34222 + }, + { + "epoch": 0.88, + "learning_rate": 1.6601429210748423e-06, + "loss": 0.8164, + "step": 34223 + }, + { + "epoch": 0.88, + "learning_rate": 1.6601221364369399e-06, + "loss": 1.0566, + "step": 34224 + }, + { + "epoch": 0.88, + "learning_rate": 1.660101351293612e-06, + "loss": 0.8799, + "step": 34225 + }, + { + "epoch": 0.88, + "learning_rate": 1.660080565644875e-06, + "loss": 0.6855, + "step": 34226 + }, + { + "epoch": 0.88, + "learning_rate": 1.6600597794907447e-06, + "loss": 0.6545, + "step": 34227 + }, + { + "epoch": 0.88, + "learning_rate": 1.6600389928312368e-06, + "loss": 0.8516, + "step": 34228 + }, + { + "epoch": 0.88, + "learning_rate": 1.6600182056663674e-06, + "loss": 0.8984, + "step": 34229 + }, + { + "epoch": 0.88, + "learning_rate": 1.6599974179961527e-06, + "loss": 0.7134, + "step": 34230 + }, + { + "epoch": 0.88, + "learning_rate": 1.659976629820608e-06, + "loss": 0.8896, + "step": 34231 + }, + { + "epoch": 0.88, + "learning_rate": 1.6599558411397498e-06, + "loss": 0.9707, + "step": 34232 + }, + { + "epoch": 0.88, + "learning_rate": 1.6599350519535937e-06, + "loss": 0.999, + "step": 34233 + }, + { + "epoch": 0.88, + "learning_rate": 1.6599142622621557e-06, + "loss": 0.9072, + "step": 34234 + }, + { + "epoch": 0.88, + "learning_rate": 1.6598934720654513e-06, + "loss": 0.6304, + "step": 34235 + }, + { + "epoch": 0.88, + "learning_rate": 1.6598726813634975e-06, + "loss": 0.7256, + "step": 34236 + }, + { + "epoch": 0.88, + "learning_rate": 1.659851890156309e-06, + "loss": 0.644, + "step": 34237 + }, + { + "epoch": 0.88, + "learning_rate": 1.6598310984439024e-06, + "loss": 0.8848, + "step": 34238 + }, + { + "epoch": 0.88, + "learning_rate": 1.6598103062262934e-06, + "loss": 0.7117, + "step": 34239 + }, + { + "epoch": 0.88, + "learning_rate": 1.6597895135034983e-06, + "loss": 0.8223, + "step": 34240 + }, + { + "epoch": 0.88, + "learning_rate": 1.6597687202755324e-06, + "loss": 1.0859, + "step": 34241 + }, + { + "epoch": 0.88, + "learning_rate": 1.659747926542412e-06, + "loss": 0.7168, + "step": 34242 + }, + { + "epoch": 0.88, + "learning_rate": 1.6597271323041531e-06, + "loss": 0.8896, + "step": 34243 + }, + { + "epoch": 0.88, + "learning_rate": 1.6597063375607712e-06, + "loss": 0.6392, + "step": 34244 + }, + { + "epoch": 0.88, + "learning_rate": 1.6596855423122827e-06, + "loss": 0.8359, + "step": 34245 + }, + { + "epoch": 0.88, + "learning_rate": 1.6596647465587031e-06, + "loss": 0.8867, + "step": 34246 + }, + { + "epoch": 0.88, + "learning_rate": 1.6596439503000489e-06, + "loss": 0.7271, + "step": 34247 + }, + { + "epoch": 0.88, + "learning_rate": 1.659623153536335e-06, + "loss": 0.8613, + "step": 34248 + }, + { + "epoch": 0.88, + "learning_rate": 1.6596023562675786e-06, + "loss": 0.8936, + "step": 34249 + }, + { + "epoch": 0.88, + "learning_rate": 1.659581558493795e-06, + "loss": 0.5469, + "step": 34250 + }, + { + "epoch": 0.88, + "learning_rate": 1.6595607602149997e-06, + "loss": 0.9058, + "step": 34251 + }, + { + "epoch": 0.88, + "learning_rate": 1.6595399614312094e-06, + "loss": 0.9668, + "step": 34252 + }, + { + "epoch": 0.88, + "learning_rate": 1.6595191621424394e-06, + "loss": 0.8662, + "step": 34253 + }, + { + "epoch": 0.88, + "learning_rate": 1.6594983623487063e-06, + "loss": 0.9834, + "step": 34254 + }, + { + "epoch": 0.88, + "learning_rate": 1.659477562050025e-06, + "loss": 0.9697, + "step": 34255 + }, + { + "epoch": 0.88, + "learning_rate": 1.6594567612464128e-06, + "loss": 0.7827, + "step": 34256 + }, + { + "epoch": 0.88, + "learning_rate": 1.6594359599378845e-06, + "loss": 0.8025, + "step": 34257 + }, + { + "epoch": 0.88, + "learning_rate": 1.6594151581244561e-06, + "loss": 0.7976, + "step": 34258 + }, + { + "epoch": 0.88, + "learning_rate": 1.6593943558061442e-06, + "loss": 0.6943, + "step": 34259 + }, + { + "epoch": 0.88, + "learning_rate": 1.6593735529829645e-06, + "loss": 0.8633, + "step": 34260 + }, + { + "epoch": 0.88, + "learning_rate": 1.6593527496549328e-06, + "loss": 0.9775, + "step": 34261 + }, + { + "epoch": 0.88, + "learning_rate": 1.6593319458220648e-06, + "loss": 0.9199, + "step": 34262 + }, + { + "epoch": 0.88, + "learning_rate": 1.6593111414843769e-06, + "loss": 1.0557, + "step": 34263 + }, + { + "epoch": 0.88, + "learning_rate": 1.6592903366418841e-06, + "loss": 0.9131, + "step": 34264 + }, + { + "epoch": 0.88, + "learning_rate": 1.6592695312946034e-06, + "loss": 1.0869, + "step": 34265 + }, + { + "epoch": 0.88, + "learning_rate": 1.6592487254425508e-06, + "loss": 1.0879, + "step": 34266 + }, + { + "epoch": 0.88, + "learning_rate": 1.6592279190857412e-06, + "loss": 0.563, + "step": 34267 + }, + { + "epoch": 0.88, + "learning_rate": 1.6592071122241913e-06, + "loss": 0.6777, + "step": 34268 + }, + { + "epoch": 0.88, + "learning_rate": 1.6591863048579167e-06, + "loss": 0.8291, + "step": 34269 + }, + { + "epoch": 0.88, + "learning_rate": 1.6591654969869335e-06, + "loss": 0.8408, + "step": 34270 + }, + { + "epoch": 0.88, + "learning_rate": 1.6591446886112578e-06, + "loss": 0.9014, + "step": 34271 + }, + { + "epoch": 0.88, + "learning_rate": 1.659123879730905e-06, + "loss": 0.9023, + "step": 34272 + }, + { + "epoch": 0.88, + "learning_rate": 1.6591030703458917e-06, + "loss": 0.7671, + "step": 34273 + }, + { + "epoch": 0.88, + "learning_rate": 1.659082260456233e-06, + "loss": 0.7471, + "step": 34274 + }, + { + "epoch": 0.88, + "learning_rate": 1.6590614500619457e-06, + "loss": 0.9492, + "step": 34275 + }, + { + "epoch": 0.88, + "learning_rate": 1.6590406391630454e-06, + "loss": 0.916, + "step": 34276 + }, + { + "epoch": 0.88, + "learning_rate": 1.6590198277595477e-06, + "loss": 0.6265, + "step": 34277 + }, + { + "epoch": 0.88, + "learning_rate": 1.6589990158514691e-06, + "loss": 0.9111, + "step": 34278 + }, + { + "epoch": 0.88, + "learning_rate": 1.658978203438825e-06, + "loss": 0.834, + "step": 34279 + }, + { + "epoch": 0.88, + "learning_rate": 1.6589573905216318e-06, + "loss": 0.7124, + "step": 34280 + }, + { + "epoch": 0.88, + "learning_rate": 1.6589365770999053e-06, + "loss": 0.8428, + "step": 34281 + }, + { + "epoch": 0.88, + "learning_rate": 1.658915763173661e-06, + "loss": 1.0938, + "step": 34282 + }, + { + "epoch": 0.88, + "learning_rate": 1.6588949487429154e-06, + "loss": 0.7793, + "step": 34283 + }, + { + "epoch": 0.88, + "learning_rate": 1.6588741338076844e-06, + "loss": 0.9062, + "step": 34284 + }, + { + "epoch": 0.88, + "learning_rate": 1.6588533183679833e-06, + "loss": 0.6089, + "step": 34285 + }, + { + "epoch": 0.88, + "learning_rate": 1.658832502423829e-06, + "loss": 0.8838, + "step": 34286 + }, + { + "epoch": 0.88, + "learning_rate": 1.6588116859752367e-06, + "loss": 0.9971, + "step": 34287 + }, + { + "epoch": 0.88, + "learning_rate": 1.6587908690222227e-06, + "loss": 0.8369, + "step": 34288 + }, + { + "epoch": 0.88, + "learning_rate": 1.6587700515648026e-06, + "loss": 0.9004, + "step": 34289 + }, + { + "epoch": 0.88, + "learning_rate": 1.6587492336029927e-06, + "loss": 0.8691, + "step": 34290 + }, + { + "epoch": 0.88, + "learning_rate": 1.6587284151368093e-06, + "loss": 0.7393, + "step": 34291 + }, + { + "epoch": 0.88, + "learning_rate": 1.6587075961662672e-06, + "loss": 0.7861, + "step": 34292 + }, + { + "epoch": 0.88, + "learning_rate": 1.658686776691383e-06, + "loss": 0.6919, + "step": 34293 + }, + { + "epoch": 0.88, + "learning_rate": 1.6586659567121729e-06, + "loss": 0.5806, + "step": 34294 + }, + { + "epoch": 0.88, + "learning_rate": 1.6586451362286522e-06, + "loss": 0.7402, + "step": 34295 + }, + { + "epoch": 0.88, + "learning_rate": 1.6586243152408376e-06, + "loss": 0.7285, + "step": 34296 + }, + { + "epoch": 0.88, + "learning_rate": 1.6586034937487445e-06, + "loss": 0.6689, + "step": 34297 + }, + { + "epoch": 0.88, + "learning_rate": 1.658582671752389e-06, + "loss": 0.8877, + "step": 34298 + }, + { + "epoch": 0.88, + "learning_rate": 1.6585618492517868e-06, + "loss": 0.7812, + "step": 34299 + }, + { + "epoch": 0.88, + "learning_rate": 1.6585410262469544e-06, + "loss": 0.9775, + "step": 34300 + }, + { + "epoch": 0.88, + "learning_rate": 1.6585202027379075e-06, + "loss": 0.7954, + "step": 34301 + }, + { + "epoch": 0.88, + "learning_rate": 1.6584993787246616e-06, + "loss": 0.876, + "step": 34302 + }, + { + "epoch": 0.88, + "learning_rate": 1.658478554207233e-06, + "loss": 0.8027, + "step": 34303 + }, + { + "epoch": 0.88, + "learning_rate": 1.6584577291856378e-06, + "loss": 0.6594, + "step": 34304 + }, + { + "epoch": 0.88, + "learning_rate": 1.658436903659892e-06, + "loss": 0.8154, + "step": 34305 + }, + { + "epoch": 0.88, + "learning_rate": 1.658416077630011e-06, + "loss": 0.7168, + "step": 34306 + }, + { + "epoch": 0.88, + "learning_rate": 1.6583952510960115e-06, + "loss": 0.959, + "step": 34307 + }, + { + "epoch": 0.88, + "learning_rate": 1.6583744240579085e-06, + "loss": 1.1162, + "step": 34308 + }, + { + "epoch": 0.88, + "learning_rate": 1.6583535965157189e-06, + "loss": 0.7617, + "step": 34309 + }, + { + "epoch": 0.88, + "learning_rate": 1.658332768469458e-06, + "loss": 1.0615, + "step": 34310 + }, + { + "epoch": 0.88, + "learning_rate": 1.6583119399191422e-06, + "loss": 0.8247, + "step": 34311 + }, + { + "epoch": 0.88, + "learning_rate": 1.658291110864787e-06, + "loss": 0.7583, + "step": 34312 + }, + { + "epoch": 0.88, + "learning_rate": 1.6582702813064086e-06, + "loss": 0.7163, + "step": 34313 + }, + { + "epoch": 0.88, + "learning_rate": 1.6582494512440228e-06, + "loss": 0.9092, + "step": 34314 + }, + { + "epoch": 0.88, + "learning_rate": 1.658228620677646e-06, + "loss": 0.6323, + "step": 34315 + }, + { + "epoch": 0.88, + "learning_rate": 1.6582077896072935e-06, + "loss": 1.04, + "step": 34316 + }, + { + "epoch": 0.88, + "learning_rate": 1.6581869580329815e-06, + "loss": 0.7715, + "step": 34317 + }, + { + "epoch": 0.88, + "learning_rate": 1.658166125954726e-06, + "loss": 0.9639, + "step": 34318 + }, + { + "epoch": 0.88, + "learning_rate": 1.6581452933725434e-06, + "loss": 0.7559, + "step": 34319 + }, + { + "epoch": 0.88, + "learning_rate": 1.6581244602864488e-06, + "loss": 0.897, + "step": 34320 + }, + { + "epoch": 0.88, + "learning_rate": 1.6581036266964587e-06, + "loss": 0.9775, + "step": 34321 + }, + { + "epoch": 0.88, + "learning_rate": 1.658082792602589e-06, + "loss": 1.0732, + "step": 34322 + }, + { + "epoch": 0.88, + "learning_rate": 1.6580619580048555e-06, + "loss": 0.8604, + "step": 34323 + }, + { + "epoch": 0.88, + "learning_rate": 1.6580411229032742e-06, + "loss": 0.9775, + "step": 34324 + }, + { + "epoch": 0.88, + "learning_rate": 1.658020287297861e-06, + "loss": 0.6465, + "step": 34325 + }, + { + "epoch": 0.88, + "learning_rate": 1.6579994511886322e-06, + "loss": 0.6143, + "step": 34326 + }, + { + "epoch": 0.88, + "learning_rate": 1.6579786145756031e-06, + "loss": 0.9512, + "step": 34327 + }, + { + "epoch": 0.88, + "learning_rate": 1.6579577774587902e-06, + "loss": 0.874, + "step": 34328 + }, + { + "epoch": 0.88, + "learning_rate": 1.6579369398382093e-06, + "loss": 0.8149, + "step": 34329 + }, + { + "epoch": 0.88, + "learning_rate": 1.6579161017138763e-06, + "loss": 0.875, + "step": 34330 + }, + { + "epoch": 0.88, + "learning_rate": 1.6578952630858073e-06, + "loss": 0.8691, + "step": 34331 + }, + { + "epoch": 0.88, + "learning_rate": 1.6578744239540182e-06, + "loss": 0.873, + "step": 34332 + }, + { + "epoch": 0.88, + "learning_rate": 1.6578535843185246e-06, + "loss": 0.8457, + "step": 34333 + }, + { + "epoch": 0.88, + "learning_rate": 1.657832744179343e-06, + "loss": 0.8789, + "step": 34334 + }, + { + "epoch": 0.88, + "learning_rate": 1.6578119035364888e-06, + "loss": 0.7139, + "step": 34335 + }, + { + "epoch": 0.88, + "learning_rate": 1.6577910623899789e-06, + "loss": 0.7905, + "step": 34336 + }, + { + "epoch": 0.88, + "learning_rate": 1.657770220739828e-06, + "loss": 0.7285, + "step": 34337 + }, + { + "epoch": 0.88, + "learning_rate": 1.657749378586053e-06, + "loss": 0.6013, + "step": 34338 + }, + { + "epoch": 0.88, + "learning_rate": 1.6577285359286694e-06, + "loss": 0.7295, + "step": 34339 + }, + { + "epoch": 0.88, + "learning_rate": 1.6577076927676935e-06, + "loss": 0.75, + "step": 34340 + }, + { + "epoch": 0.88, + "learning_rate": 1.657686849103141e-06, + "loss": 0.9336, + "step": 34341 + }, + { + "epoch": 0.88, + "learning_rate": 1.6576660049350278e-06, + "loss": 0.6709, + "step": 34342 + }, + { + "epoch": 0.88, + "learning_rate": 1.65764516026337e-06, + "loss": 0.7434, + "step": 34343 + }, + { + "epoch": 0.88, + "learning_rate": 1.6576243150881834e-06, + "loss": 0.7891, + "step": 34344 + }, + { + "epoch": 0.88, + "learning_rate": 1.6576034694094845e-06, + "loss": 0.7178, + "step": 34345 + }, + { + "epoch": 0.88, + "learning_rate": 1.6575826232272886e-06, + "loss": 0.603, + "step": 34346 + }, + { + "epoch": 0.88, + "learning_rate": 1.6575617765416122e-06, + "loss": 0.8242, + "step": 34347 + }, + { + "epoch": 0.88, + "learning_rate": 1.6575409293524705e-06, + "loss": 0.9355, + "step": 34348 + }, + { + "epoch": 0.88, + "learning_rate": 1.65752008165988e-06, + "loss": 0.8457, + "step": 34349 + }, + { + "epoch": 0.88, + "learning_rate": 1.657499233463857e-06, + "loss": 0.8154, + "step": 34350 + }, + { + "epoch": 0.88, + "learning_rate": 1.657478384764417e-06, + "loss": 0.7456, + "step": 34351 + }, + { + "epoch": 0.88, + "learning_rate": 1.6574575355615759e-06, + "loss": 0.9551, + "step": 34352 + }, + { + "epoch": 0.88, + "learning_rate": 1.6574366858553497e-06, + "loss": 0.7524, + "step": 34353 + }, + { + "epoch": 0.88, + "learning_rate": 1.6574158356457546e-06, + "loss": 0.9453, + "step": 34354 + }, + { + "epoch": 0.88, + "learning_rate": 1.6573949849328065e-06, + "loss": 0.6885, + "step": 34355 + }, + { + "epoch": 0.88, + "learning_rate": 1.657374133716521e-06, + "loss": 0.9727, + "step": 34356 + }, + { + "epoch": 0.88, + "learning_rate": 1.6573532819969144e-06, + "loss": 0.8408, + "step": 34357 + }, + { + "epoch": 0.88, + "learning_rate": 1.6573324297740028e-06, + "loss": 0.9492, + "step": 34358 + }, + { + "epoch": 0.88, + "learning_rate": 1.6573115770478018e-06, + "loss": 0.8604, + "step": 34359 + }, + { + "epoch": 0.88, + "learning_rate": 1.6572907238183278e-06, + "loss": 0.7578, + "step": 34360 + }, + { + "epoch": 0.88, + "learning_rate": 1.6572698700855962e-06, + "loss": 0.7783, + "step": 34361 + }, + { + "epoch": 0.88, + "learning_rate": 1.6572490158496234e-06, + "loss": 0.6738, + "step": 34362 + }, + { + "epoch": 0.88, + "learning_rate": 1.6572281611104255e-06, + "loss": 0.9385, + "step": 34363 + }, + { + "epoch": 0.88, + "learning_rate": 1.657207305868018e-06, + "loss": 0.8252, + "step": 34364 + }, + { + "epoch": 0.88, + "learning_rate": 1.6571864501224174e-06, + "loss": 0.8149, + "step": 34365 + }, + { + "epoch": 0.88, + "learning_rate": 1.6571655938736391e-06, + "loss": 0.8506, + "step": 34366 + }, + { + "epoch": 0.88, + "learning_rate": 1.657144737121699e-06, + "loss": 1.0176, + "step": 34367 + }, + { + "epoch": 0.88, + "learning_rate": 1.6571238798666137e-06, + "loss": 0.7217, + "step": 34368 + }, + { + "epoch": 0.88, + "learning_rate": 1.6571030221083988e-06, + "loss": 0.7095, + "step": 34369 + }, + { + "epoch": 0.88, + "learning_rate": 1.6570821638470704e-06, + "loss": 0.9229, + "step": 34370 + }, + { + "epoch": 0.88, + "learning_rate": 1.6570613050826445e-06, + "loss": 0.8945, + "step": 34371 + }, + { + "epoch": 0.88, + "learning_rate": 1.6570404458151367e-06, + "loss": 0.7842, + "step": 34372 + }, + { + "epoch": 0.88, + "learning_rate": 1.6570195860445635e-06, + "loss": 0.5664, + "step": 34373 + }, + { + "epoch": 0.88, + "learning_rate": 1.6569987257709403e-06, + "loss": 0.873, + "step": 34374 + }, + { + "epoch": 0.88, + "learning_rate": 1.6569778649942836e-06, + "loss": 0.8633, + "step": 34375 + }, + { + "epoch": 0.88, + "learning_rate": 1.6569570037146095e-06, + "loss": 0.7402, + "step": 34376 + }, + { + "epoch": 0.88, + "learning_rate": 1.6569361419319333e-06, + "loss": 0.5537, + "step": 34377 + }, + { + "epoch": 0.88, + "learning_rate": 1.6569152796462711e-06, + "loss": 0.9297, + "step": 34378 + }, + { + "epoch": 0.88, + "learning_rate": 1.6568944168576393e-06, + "loss": 0.8613, + "step": 34379 + }, + { + "epoch": 0.88, + "learning_rate": 1.6568735535660533e-06, + "loss": 0.9268, + "step": 34380 + }, + { + "epoch": 0.88, + "learning_rate": 1.6568526897715303e-06, + "loss": 0.6685, + "step": 34381 + }, + { + "epoch": 0.88, + "learning_rate": 1.6568318254740844e-06, + "loss": 0.7773, + "step": 34382 + }, + { + "epoch": 0.88, + "learning_rate": 1.656810960673733e-06, + "loss": 0.9326, + "step": 34383 + }, + { + "epoch": 0.88, + "learning_rate": 1.656790095370492e-06, + "loss": 0.8633, + "step": 34384 + }, + { + "epoch": 0.88, + "learning_rate": 1.6567692295643764e-06, + "loss": 0.79, + "step": 34385 + }, + { + "epoch": 0.88, + "learning_rate": 1.656748363255403e-06, + "loss": 0.7639, + "step": 34386 + }, + { + "epoch": 0.88, + "learning_rate": 1.6567274964435877e-06, + "loss": 0.9062, + "step": 34387 + }, + { + "epoch": 0.88, + "learning_rate": 1.6567066291289463e-06, + "loss": 0.8545, + "step": 34388 + }, + { + "epoch": 0.88, + "learning_rate": 1.6566857613114947e-06, + "loss": 0.7612, + "step": 34389 + }, + { + "epoch": 0.88, + "learning_rate": 1.6566648929912493e-06, + "loss": 0.7451, + "step": 34390 + }, + { + "epoch": 0.88, + "learning_rate": 1.6566440241682256e-06, + "loss": 0.8779, + "step": 34391 + }, + { + "epoch": 0.88, + "learning_rate": 1.6566231548424398e-06, + "loss": 0.8506, + "step": 34392 + }, + { + "epoch": 0.88, + "learning_rate": 1.656602285013908e-06, + "loss": 0.9434, + "step": 34393 + }, + { + "epoch": 0.88, + "learning_rate": 1.6565814146826455e-06, + "loss": 0.709, + "step": 34394 + }, + { + "epoch": 0.88, + "learning_rate": 1.6565605438486695e-06, + "loss": 0.7773, + "step": 34395 + }, + { + "epoch": 0.88, + "learning_rate": 1.6565396725119948e-06, + "loss": 0.8291, + "step": 34396 + }, + { + "epoch": 0.88, + "learning_rate": 1.6565188006726381e-06, + "loss": 1.0176, + "step": 34397 + }, + { + "epoch": 0.88, + "learning_rate": 1.6564979283306148e-06, + "loss": 0.8633, + "step": 34398 + }, + { + "epoch": 0.88, + "learning_rate": 1.6564770554859418e-06, + "loss": 0.7114, + "step": 34399 + }, + { + "epoch": 0.88, + "learning_rate": 1.656456182138634e-06, + "loss": 0.8037, + "step": 34400 + }, + { + "epoch": 0.88, + "learning_rate": 1.6564353082887081e-06, + "loss": 0.8174, + "step": 34401 + }, + { + "epoch": 0.88, + "learning_rate": 1.6564144339361799e-06, + "loss": 0.874, + "step": 34402 + }, + { + "epoch": 0.88, + "learning_rate": 1.6563935590810653e-06, + "loss": 0.8428, + "step": 34403 + }, + { + "epoch": 0.88, + "learning_rate": 1.6563726837233802e-06, + "loss": 0.9717, + "step": 34404 + }, + { + "epoch": 0.88, + "learning_rate": 1.6563518078631407e-06, + "loss": 1.0225, + "step": 34405 + }, + { + "epoch": 0.88, + "learning_rate": 1.6563309315003631e-06, + "loss": 0.876, + "step": 34406 + }, + { + "epoch": 0.88, + "learning_rate": 1.6563100546350627e-06, + "loss": 0.6743, + "step": 34407 + }, + { + "epoch": 0.88, + "learning_rate": 1.656289177267256e-06, + "loss": 0.8691, + "step": 34408 + }, + { + "epoch": 0.88, + "learning_rate": 1.656268299396959e-06, + "loss": 0.8047, + "step": 34409 + }, + { + "epoch": 0.88, + "learning_rate": 1.6562474210241878e-06, + "loss": 0.8496, + "step": 34410 + }, + { + "epoch": 0.88, + "learning_rate": 1.6562265421489576e-06, + "loss": 0.7964, + "step": 34411 + }, + { + "epoch": 0.88, + "learning_rate": 1.6562056627712852e-06, + "loss": 0.875, + "step": 34412 + }, + { + "epoch": 0.88, + "learning_rate": 1.6561847828911862e-06, + "loss": 0.8311, + "step": 34413 + }, + { + "epoch": 0.88, + "learning_rate": 1.6561639025086764e-06, + "loss": 0.7568, + "step": 34414 + }, + { + "epoch": 0.88, + "learning_rate": 1.6561430216237726e-06, + "loss": 0.6426, + "step": 34415 + }, + { + "epoch": 0.88, + "learning_rate": 1.65612214023649e-06, + "loss": 0.9707, + "step": 34416 + }, + { + "epoch": 0.88, + "learning_rate": 1.6561012583468448e-06, + "loss": 0.6792, + "step": 34417 + }, + { + "epoch": 0.88, + "learning_rate": 1.6560803759548532e-06, + "loss": 0.9678, + "step": 34418 + }, + { + "epoch": 0.88, + "learning_rate": 1.656059493060531e-06, + "loss": 0.8555, + "step": 34419 + }, + { + "epoch": 0.88, + "learning_rate": 1.6560386096638941e-06, + "loss": 0.7686, + "step": 34420 + }, + { + "epoch": 0.88, + "learning_rate": 1.6560177257649586e-06, + "loss": 0.6611, + "step": 34421 + }, + { + "epoch": 0.88, + "learning_rate": 1.6559968413637405e-06, + "loss": 0.7783, + "step": 34422 + }, + { + "epoch": 0.88, + "learning_rate": 1.6559759564602558e-06, + "loss": 0.8052, + "step": 34423 + }, + { + "epoch": 0.88, + "learning_rate": 1.6559550710545204e-06, + "loss": 0.9814, + "step": 34424 + }, + { + "epoch": 0.88, + "learning_rate": 1.6559341851465504e-06, + "loss": 0.8789, + "step": 34425 + }, + { + "epoch": 0.88, + "learning_rate": 1.6559132987363618e-06, + "loss": 0.9385, + "step": 34426 + }, + { + "epoch": 0.88, + "learning_rate": 1.6558924118239706e-06, + "loss": 0.9199, + "step": 34427 + }, + { + "epoch": 0.88, + "learning_rate": 1.6558715244093928e-06, + "loss": 0.7402, + "step": 34428 + }, + { + "epoch": 0.88, + "learning_rate": 1.655850636492644e-06, + "loss": 0.9121, + "step": 34429 + }, + { + "epoch": 0.88, + "learning_rate": 1.6558297480737408e-06, + "loss": 0.7715, + "step": 34430 + }, + { + "epoch": 0.88, + "learning_rate": 1.655808859152699e-06, + "loss": 1.0635, + "step": 34431 + }, + { + "epoch": 0.88, + "learning_rate": 1.6557879697295342e-06, + "loss": 0.8486, + "step": 34432 + }, + { + "epoch": 0.88, + "learning_rate": 1.655767079804263e-06, + "loss": 0.7126, + "step": 34433 + }, + { + "epoch": 0.88, + "learning_rate": 1.655746189376901e-06, + "loss": 0.6156, + "step": 34434 + }, + { + "epoch": 0.88, + "learning_rate": 1.6557252984474644e-06, + "loss": 0.8584, + "step": 34435 + }, + { + "epoch": 0.88, + "learning_rate": 1.655704407015969e-06, + "loss": 0.7073, + "step": 34436 + }, + { + "epoch": 0.88, + "learning_rate": 1.6556835150824306e-06, + "loss": 0.9824, + "step": 34437 + }, + { + "epoch": 0.88, + "learning_rate": 1.6556626226468657e-06, + "loss": 0.583, + "step": 34438 + }, + { + "epoch": 0.88, + "learning_rate": 1.65564172970929e-06, + "loss": 0.7046, + "step": 34439 + }, + { + "epoch": 0.88, + "learning_rate": 1.65562083626972e-06, + "loss": 0.8652, + "step": 34440 + }, + { + "epoch": 0.88, + "learning_rate": 1.655599942328171e-06, + "loss": 0.9053, + "step": 34441 + }, + { + "epoch": 0.88, + "learning_rate": 1.6555790478846592e-06, + "loss": 0.8408, + "step": 34442 + }, + { + "epoch": 0.88, + "learning_rate": 1.6555581529392004e-06, + "loss": 0.9033, + "step": 34443 + }, + { + "epoch": 0.88, + "learning_rate": 1.6555372574918113e-06, + "loss": 0.833, + "step": 34444 + }, + { + "epoch": 0.88, + "learning_rate": 1.6555163615425075e-06, + "loss": 0.9697, + "step": 34445 + }, + { + "epoch": 0.88, + "learning_rate": 1.6554954650913047e-06, + "loss": 0.8857, + "step": 34446 + }, + { + "epoch": 0.88, + "learning_rate": 1.6554745681382192e-06, + "loss": 0.8018, + "step": 34447 + }, + { + "epoch": 0.88, + "learning_rate": 1.6554536706832671e-06, + "loss": 0.6953, + "step": 34448 + }, + { + "epoch": 0.88, + "learning_rate": 1.655432772726464e-06, + "loss": 0.8008, + "step": 34449 + }, + { + "epoch": 0.88, + "learning_rate": 1.6554118742678265e-06, + "loss": 0.8838, + "step": 34450 + }, + { + "epoch": 0.88, + "learning_rate": 1.65539097530737e-06, + "loss": 0.8467, + "step": 34451 + }, + { + "epoch": 0.88, + "learning_rate": 1.6553700758451109e-06, + "loss": 0.5132, + "step": 34452 + }, + { + "epoch": 0.88, + "learning_rate": 1.6553491758810649e-06, + "loss": 0.7666, + "step": 34453 + }, + { + "epoch": 0.88, + "learning_rate": 1.6553282754152484e-06, + "loss": 0.6992, + "step": 34454 + }, + { + "epoch": 0.88, + "learning_rate": 1.6553073744476772e-06, + "loss": 0.7471, + "step": 34455 + }, + { + "epoch": 0.88, + "learning_rate": 1.655286472978367e-06, + "loss": 0.8159, + "step": 34456 + }, + { + "epoch": 0.88, + "learning_rate": 1.6552655710073342e-06, + "loss": 0.7451, + "step": 34457 + }, + { + "epoch": 0.88, + "learning_rate": 1.655244668534595e-06, + "loss": 0.7764, + "step": 34458 + }, + { + "epoch": 0.88, + "learning_rate": 1.6552237655601645e-06, + "loss": 0.8525, + "step": 34459 + }, + { + "epoch": 0.88, + "learning_rate": 1.6552028620840596e-06, + "loss": 0.4675, + "step": 34460 + }, + { + "epoch": 0.88, + "learning_rate": 1.6551819581062963e-06, + "loss": 0.8809, + "step": 34461 + }, + { + "epoch": 0.88, + "learning_rate": 1.6551610536268896e-06, + "loss": 0.8555, + "step": 34462 + }, + { + "epoch": 0.88, + "learning_rate": 1.6551401486458567e-06, + "loss": 0.8701, + "step": 34463 + }, + { + "epoch": 0.88, + "learning_rate": 1.6551192431632132e-06, + "loss": 0.7832, + "step": 34464 + }, + { + "epoch": 0.88, + "learning_rate": 1.6550983371789747e-06, + "loss": 0.8281, + "step": 34465 + }, + { + "epoch": 0.88, + "learning_rate": 1.6550774306931577e-06, + "loss": 0.8525, + "step": 34466 + }, + { + "epoch": 0.88, + "learning_rate": 1.655056523705778e-06, + "loss": 0.7852, + "step": 34467 + }, + { + "epoch": 0.88, + "learning_rate": 1.6550356162168515e-06, + "loss": 1.082, + "step": 34468 + }, + { + "epoch": 0.88, + "learning_rate": 1.6550147082263944e-06, + "loss": 0.9902, + "step": 34469 + }, + { + "epoch": 0.88, + "learning_rate": 1.6549937997344228e-06, + "loss": 0.7646, + "step": 34470 + }, + { + "epoch": 0.88, + "learning_rate": 1.6549728907409524e-06, + "loss": 0.7188, + "step": 34471 + }, + { + "epoch": 0.88, + "learning_rate": 1.6549519812459996e-06, + "loss": 0.8945, + "step": 34472 + }, + { + "epoch": 0.88, + "learning_rate": 1.65493107124958e-06, + "loss": 0.4934, + "step": 34473 + }, + { + "epoch": 0.88, + "learning_rate": 1.6549101607517098e-06, + "loss": 0.772, + "step": 34474 + }, + { + "epoch": 0.88, + "learning_rate": 1.6548892497524053e-06, + "loss": 0.9111, + "step": 34475 + }, + { + "epoch": 0.88, + "learning_rate": 1.6548683382516816e-06, + "loss": 0.71, + "step": 34476 + }, + { + "epoch": 0.88, + "learning_rate": 1.6548474262495557e-06, + "loss": 0.7188, + "step": 34477 + }, + { + "epoch": 0.88, + "learning_rate": 1.6548265137460433e-06, + "loss": 0.7783, + "step": 34478 + }, + { + "epoch": 0.88, + "learning_rate": 1.6548056007411604e-06, + "loss": 0.7468, + "step": 34479 + }, + { + "epoch": 0.88, + "learning_rate": 1.654784687234923e-06, + "loss": 0.958, + "step": 34480 + }, + { + "epoch": 0.88, + "learning_rate": 1.6547637732273468e-06, + "loss": 0.918, + "step": 34481 + }, + { + "epoch": 0.88, + "learning_rate": 1.6547428587184479e-06, + "loss": 0.6821, + "step": 34482 + }, + { + "epoch": 0.88, + "learning_rate": 1.6547219437082429e-06, + "loss": 0.8057, + "step": 34483 + }, + { + "epoch": 0.88, + "learning_rate": 1.6547010281967473e-06, + "loss": 0.5962, + "step": 34484 + }, + { + "epoch": 0.88, + "learning_rate": 1.6546801121839773e-06, + "loss": 0.875, + "step": 34485 + }, + { + "epoch": 0.88, + "learning_rate": 1.6546591956699488e-06, + "loss": 0.7244, + "step": 34486 + }, + { + "epoch": 0.88, + "learning_rate": 1.6546382786546779e-06, + "loss": 0.8926, + "step": 34487 + }, + { + "epoch": 0.88, + "learning_rate": 1.6546173611381803e-06, + "loss": 1.0742, + "step": 34488 + }, + { + "epoch": 0.88, + "learning_rate": 1.6545964431204724e-06, + "loss": 0.7451, + "step": 34489 + }, + { + "epoch": 0.88, + "learning_rate": 1.6545755246015704e-06, + "loss": 1.0068, + "step": 34490 + }, + { + "epoch": 0.88, + "learning_rate": 1.6545546055814898e-06, + "loss": 1.1768, + "step": 34491 + }, + { + "epoch": 0.88, + "learning_rate": 1.6545336860602467e-06, + "loss": 0.729, + "step": 34492 + }, + { + "epoch": 0.88, + "learning_rate": 1.6545127660378574e-06, + "loss": 0.7874, + "step": 34493 + }, + { + "epoch": 0.88, + "learning_rate": 1.6544918455143376e-06, + "loss": 0.7021, + "step": 34494 + }, + { + "epoch": 0.88, + "learning_rate": 1.6544709244897036e-06, + "loss": 0.8896, + "step": 34495 + }, + { + "epoch": 0.88, + "learning_rate": 1.6544500029639717e-06, + "loss": 0.7539, + "step": 34496 + }, + { + "epoch": 0.88, + "learning_rate": 1.654429080937157e-06, + "loss": 0.8643, + "step": 34497 + }, + { + "epoch": 0.88, + "learning_rate": 1.6544081584092763e-06, + "loss": 1.0723, + "step": 34498 + }, + { + "epoch": 0.88, + "learning_rate": 1.6543872353803453e-06, + "loss": 0.666, + "step": 34499 + }, + { + "epoch": 0.88, + "learning_rate": 1.65436631185038e-06, + "loss": 0.7461, + "step": 34500 + }, + { + "epoch": 0.88, + "learning_rate": 1.6543453878193968e-06, + "loss": 0.9912, + "step": 34501 + }, + { + "epoch": 0.88, + "learning_rate": 1.6543244632874109e-06, + "loss": 0.9854, + "step": 34502 + }, + { + "epoch": 0.88, + "learning_rate": 1.6543035382544393e-06, + "loss": 1.123, + "step": 34503 + }, + { + "epoch": 0.88, + "learning_rate": 1.6542826127204972e-06, + "loss": 0.9912, + "step": 34504 + }, + { + "epoch": 0.88, + "learning_rate": 1.6542616866856017e-06, + "loss": 1.0908, + "step": 34505 + }, + { + "epoch": 0.88, + "learning_rate": 1.6542407601497673e-06, + "loss": 0.8252, + "step": 34506 + }, + { + "epoch": 0.88, + "learning_rate": 1.6542198331130114e-06, + "loss": 0.8906, + "step": 34507 + }, + { + "epoch": 0.88, + "learning_rate": 1.654198905575349e-06, + "loss": 0.6123, + "step": 34508 + }, + { + "epoch": 0.88, + "learning_rate": 1.6541779775367966e-06, + "loss": 0.6273, + "step": 34509 + }, + { + "epoch": 0.88, + "learning_rate": 1.6541570489973707e-06, + "loss": 0.6318, + "step": 34510 + }, + { + "epoch": 0.88, + "learning_rate": 1.6541361199570863e-06, + "loss": 0.9326, + "step": 34511 + }, + { + "epoch": 0.88, + "learning_rate": 1.6541151904159603e-06, + "loss": 0.7979, + "step": 34512 + }, + { + "epoch": 0.88, + "learning_rate": 1.6540942603740081e-06, + "loss": 0.9043, + "step": 34513 + }, + { + "epoch": 0.88, + "learning_rate": 1.654073329831246e-06, + "loss": 0.6992, + "step": 34514 + }, + { + "epoch": 0.88, + "learning_rate": 1.6540523987876903e-06, + "loss": 0.8389, + "step": 34515 + }, + { + "epoch": 0.88, + "learning_rate": 1.6540314672433567e-06, + "loss": 0.7461, + "step": 34516 + }, + { + "epoch": 0.88, + "learning_rate": 1.6540105351982611e-06, + "loss": 0.8623, + "step": 34517 + }, + { + "epoch": 0.88, + "learning_rate": 1.6539896026524199e-06, + "loss": 0.6924, + "step": 34518 + }, + { + "epoch": 0.88, + "learning_rate": 1.6539686696058487e-06, + "loss": 0.5852, + "step": 34519 + }, + { + "epoch": 0.88, + "learning_rate": 1.6539477360585638e-06, + "loss": 0.666, + "step": 34520 + }, + { + "epoch": 0.88, + "learning_rate": 1.6539268020105815e-06, + "loss": 0.448, + "step": 34521 + }, + { + "epoch": 0.88, + "learning_rate": 1.6539058674619173e-06, + "loss": 0.8574, + "step": 34522 + }, + { + "epoch": 0.88, + "learning_rate": 1.6538849324125871e-06, + "loss": 0.8755, + "step": 34523 + }, + { + "epoch": 0.88, + "learning_rate": 1.6538639968626078e-06, + "loss": 0.5488, + "step": 34524 + }, + { + "epoch": 0.88, + "learning_rate": 1.6538430608119947e-06, + "loss": 0.6567, + "step": 34525 + }, + { + "epoch": 0.88, + "learning_rate": 1.6538221242607641e-06, + "loss": 0.7383, + "step": 34526 + }, + { + "epoch": 0.88, + "learning_rate": 1.6538011872089318e-06, + "loss": 0.9766, + "step": 34527 + }, + { + "epoch": 0.88, + "learning_rate": 1.6537802496565143e-06, + "loss": 0.772, + "step": 34528 + }, + { + "epoch": 0.88, + "learning_rate": 1.653759311603527e-06, + "loss": 0.9727, + "step": 34529 + }, + { + "epoch": 0.89, + "learning_rate": 1.6537383730499865e-06, + "loss": 0.7969, + "step": 34530 + }, + { + "epoch": 0.89, + "learning_rate": 1.6537174339959083e-06, + "loss": 0.668, + "step": 34531 + }, + { + "epoch": 0.89, + "learning_rate": 1.653696494441309e-06, + "loss": 0.9717, + "step": 34532 + }, + { + "epoch": 0.89, + "learning_rate": 1.6536755543862042e-06, + "loss": 1.0986, + "step": 34533 + }, + { + "epoch": 0.89, + "learning_rate": 1.6536546138306102e-06, + "loss": 0.8623, + "step": 34534 + }, + { + "epoch": 0.89, + "learning_rate": 1.6536336727745427e-06, + "loss": 1.0361, + "step": 34535 + }, + { + "epoch": 0.89, + "learning_rate": 1.6536127312180183e-06, + "loss": 1.0195, + "step": 34536 + }, + { + "epoch": 0.89, + "learning_rate": 1.6535917891610524e-06, + "loss": 0.915, + "step": 34537 + }, + { + "epoch": 0.89, + "learning_rate": 1.6535708466036616e-06, + "loss": 0.5605, + "step": 34538 + }, + { + "epoch": 0.89, + "learning_rate": 1.653549903545861e-06, + "loss": 0.873, + "step": 34539 + }, + { + "epoch": 0.89, + "learning_rate": 1.653528959987668e-06, + "loss": 1.001, + "step": 34540 + }, + { + "epoch": 0.89, + "learning_rate": 1.6535080159290974e-06, + "loss": 0.96, + "step": 34541 + }, + { + "epoch": 0.89, + "learning_rate": 1.6534870713701662e-06, + "loss": 0.7395, + "step": 34542 + }, + { + "epoch": 0.89, + "learning_rate": 1.65346612631089e-06, + "loss": 0.8906, + "step": 34543 + }, + { + "epoch": 0.89, + "learning_rate": 1.6534451807512847e-06, + "loss": 0.9404, + "step": 34544 + }, + { + "epoch": 0.89, + "learning_rate": 1.6534242346913664e-06, + "loss": 0.9316, + "step": 34545 + }, + { + "epoch": 0.89, + "learning_rate": 1.6534032881311512e-06, + "loss": 0.8945, + "step": 34546 + }, + { + "epoch": 0.89, + "learning_rate": 1.6533823410706552e-06, + "loss": 0.792, + "step": 34547 + }, + { + "epoch": 0.89, + "learning_rate": 1.6533613935098943e-06, + "loss": 0.9717, + "step": 34548 + }, + { + "epoch": 0.89, + "learning_rate": 1.6533404454488847e-06, + "loss": 1.1738, + "step": 34549 + }, + { + "epoch": 0.89, + "learning_rate": 1.6533194968876426e-06, + "loss": 0.627, + "step": 34550 + }, + { + "epoch": 0.89, + "learning_rate": 1.6532985478261835e-06, + "loss": 0.877, + "step": 34551 + }, + { + "epoch": 0.89, + "learning_rate": 1.6532775982645237e-06, + "loss": 0.7944, + "step": 34552 + }, + { + "epoch": 0.89, + "learning_rate": 1.6532566482026793e-06, + "loss": 0.8188, + "step": 34553 + }, + { + "epoch": 0.89, + "learning_rate": 1.6532356976406664e-06, + "loss": 0.8193, + "step": 34554 + }, + { + "epoch": 0.89, + "learning_rate": 1.653214746578501e-06, + "loss": 0.8057, + "step": 34555 + }, + { + "epoch": 0.89, + "learning_rate": 1.6531937950161992e-06, + "loss": 0.7202, + "step": 34556 + }, + { + "epoch": 0.89, + "learning_rate": 1.6531728429537765e-06, + "loss": 0.8789, + "step": 34557 + }, + { + "epoch": 0.89, + "learning_rate": 1.65315189039125e-06, + "loss": 0.8184, + "step": 34558 + }, + { + "epoch": 0.89, + "learning_rate": 1.6531309373286346e-06, + "loss": 0.8301, + "step": 34559 + }, + { + "epoch": 0.89, + "learning_rate": 1.6531099837659475e-06, + "loss": 0.6694, + "step": 34560 + }, + { + "epoch": 0.89, + "learning_rate": 1.6530890297032034e-06, + "loss": 0.9346, + "step": 34561 + }, + { + "epoch": 0.89, + "learning_rate": 1.6530680751404197e-06, + "loss": 0.8008, + "step": 34562 + }, + { + "epoch": 0.89, + "learning_rate": 1.6530471200776112e-06, + "loss": 0.7192, + "step": 34563 + }, + { + "epoch": 0.89, + "learning_rate": 1.653026164514795e-06, + "loss": 0.7217, + "step": 34564 + }, + { + "epoch": 0.89, + "learning_rate": 1.6530052084519865e-06, + "loss": 0.9604, + "step": 34565 + }, + { + "epoch": 0.89, + "learning_rate": 1.6529842518892019e-06, + "loss": 0.8594, + "step": 34566 + }, + { + "epoch": 0.89, + "learning_rate": 1.6529632948264574e-06, + "loss": 0.9287, + "step": 34567 + }, + { + "epoch": 0.89, + "learning_rate": 1.6529423372637688e-06, + "loss": 0.8828, + "step": 34568 + }, + { + "epoch": 0.89, + "learning_rate": 1.6529213792011524e-06, + "loss": 0.7759, + "step": 34569 + }, + { + "epoch": 0.89, + "learning_rate": 1.652900420638624e-06, + "loss": 0.9307, + "step": 34570 + }, + { + "epoch": 0.89, + "learning_rate": 1.6528794615762e-06, + "loss": 0.6533, + "step": 34571 + }, + { + "epoch": 0.89, + "learning_rate": 1.652858502013896e-06, + "loss": 0.7222, + "step": 34572 + }, + { + "epoch": 0.89, + "learning_rate": 1.6528375419517281e-06, + "loss": 0.7236, + "step": 34573 + }, + { + "epoch": 0.89, + "learning_rate": 1.6528165813897129e-06, + "loss": 0.7783, + "step": 34574 + }, + { + "epoch": 0.89, + "learning_rate": 1.6527956203278662e-06, + "loss": 0.8555, + "step": 34575 + }, + { + "epoch": 0.89, + "learning_rate": 1.6527746587662034e-06, + "loss": 0.7231, + "step": 34576 + }, + { + "epoch": 0.89, + "learning_rate": 1.6527536967047412e-06, + "loss": 0.8577, + "step": 34577 + }, + { + "epoch": 0.89, + "learning_rate": 1.6527327341434957e-06, + "loss": 0.9287, + "step": 34578 + }, + { + "epoch": 0.89, + "learning_rate": 1.6527117710824827e-06, + "loss": 0.8848, + "step": 34579 + }, + { + "epoch": 0.89, + "learning_rate": 1.6526908075217184e-06, + "loss": 1.0254, + "step": 34580 + }, + { + "epoch": 0.89, + "learning_rate": 1.6526698434612186e-06, + "loss": 0.8174, + "step": 34581 + }, + { + "epoch": 0.89, + "learning_rate": 1.6526488789009995e-06, + "loss": 0.8506, + "step": 34582 + }, + { + "epoch": 0.89, + "learning_rate": 1.652627913841077e-06, + "loss": 0.8311, + "step": 34583 + }, + { + "epoch": 0.89, + "learning_rate": 1.6526069482814674e-06, + "loss": 0.6572, + "step": 34584 + }, + { + "epoch": 0.89, + "learning_rate": 1.6525859822221867e-06, + "loss": 0.7617, + "step": 34585 + }, + { + "epoch": 0.89, + "learning_rate": 1.652565015663251e-06, + "loss": 0.6914, + "step": 34586 + }, + { + "epoch": 0.89, + "learning_rate": 1.6525440486046765e-06, + "loss": 0.8213, + "step": 34587 + }, + { + "epoch": 0.89, + "learning_rate": 1.6525230810464789e-06, + "loss": 0.8081, + "step": 34588 + }, + { + "epoch": 0.89, + "learning_rate": 1.6525021129886741e-06, + "loss": 0.9814, + "step": 34589 + }, + { + "epoch": 0.89, + "learning_rate": 1.6524811444312787e-06, + "loss": 0.8535, + "step": 34590 + }, + { + "epoch": 0.89, + "learning_rate": 1.6524601753743084e-06, + "loss": 0.9873, + "step": 34591 + }, + { + "epoch": 0.89, + "learning_rate": 1.6524392058177793e-06, + "loss": 0.5947, + "step": 34592 + }, + { + "epoch": 0.89, + "learning_rate": 1.6524182357617073e-06, + "loss": 0.8271, + "step": 34593 + }, + { + "epoch": 0.89, + "learning_rate": 1.652397265206109e-06, + "loss": 0.8145, + "step": 34594 + }, + { + "epoch": 0.89, + "learning_rate": 1.6523762941510002e-06, + "loss": 0.9336, + "step": 34595 + }, + { + "epoch": 0.89, + "learning_rate": 1.6523553225963967e-06, + "loss": 0.7881, + "step": 34596 + }, + { + "epoch": 0.89, + "learning_rate": 1.6523343505423145e-06, + "loss": 0.7051, + "step": 34597 + }, + { + "epoch": 0.89, + "learning_rate": 1.65231337798877e-06, + "loss": 0.8213, + "step": 34598 + }, + { + "epoch": 0.89, + "learning_rate": 1.6522924049357791e-06, + "loss": 0.9521, + "step": 34599 + }, + { + "epoch": 0.89, + "learning_rate": 1.6522714313833583e-06, + "loss": 0.7861, + "step": 34600 + }, + { + "epoch": 0.89, + "learning_rate": 1.6522504573315228e-06, + "loss": 0.8279, + "step": 34601 + }, + { + "epoch": 0.89, + "learning_rate": 1.6522294827802893e-06, + "loss": 0.9619, + "step": 34602 + }, + { + "epoch": 0.89, + "learning_rate": 1.6522085077296737e-06, + "loss": 0.8848, + "step": 34603 + }, + { + "epoch": 0.89, + "learning_rate": 1.6521875321796918e-06, + "loss": 0.9023, + "step": 34604 + }, + { + "epoch": 0.89, + "learning_rate": 1.6521665561303603e-06, + "loss": 0.4976, + "step": 34605 + }, + { + "epoch": 0.89, + "learning_rate": 1.6521455795816947e-06, + "loss": 0.8848, + "step": 34606 + }, + { + "epoch": 0.89, + "learning_rate": 1.6521246025337111e-06, + "loss": 0.9702, + "step": 34607 + }, + { + "epoch": 0.89, + "learning_rate": 1.652103624986426e-06, + "loss": 0.6973, + "step": 34608 + }, + { + "epoch": 0.89, + "learning_rate": 1.6520826469398546e-06, + "loss": 0.8701, + "step": 34609 + }, + { + "epoch": 0.89, + "learning_rate": 1.652061668394014e-06, + "loss": 1.0889, + "step": 34610 + }, + { + "epoch": 0.89, + "learning_rate": 1.6520406893489197e-06, + "loss": 0.7271, + "step": 34611 + }, + { + "epoch": 0.89, + "learning_rate": 1.6520197098045873e-06, + "loss": 0.6699, + "step": 34612 + }, + { + "epoch": 0.89, + "learning_rate": 1.6519987297610339e-06, + "loss": 0.8867, + "step": 34613 + }, + { + "epoch": 0.89, + "learning_rate": 1.651977749218275e-06, + "loss": 0.8252, + "step": 34614 + }, + { + "epoch": 0.89, + "learning_rate": 1.6519567681763267e-06, + "loss": 0.9131, + "step": 34615 + }, + { + "epoch": 0.89, + "learning_rate": 1.6519357866352049e-06, + "loss": 0.9053, + "step": 34616 + }, + { + "epoch": 0.89, + "learning_rate": 1.6519148045949258e-06, + "loss": 0.6357, + "step": 34617 + }, + { + "epoch": 0.89, + "learning_rate": 1.6518938220555057e-06, + "loss": 0.7817, + "step": 34618 + }, + { + "epoch": 0.89, + "learning_rate": 1.6518728390169604e-06, + "loss": 0.8496, + "step": 34619 + }, + { + "epoch": 0.89, + "learning_rate": 1.6518518554793063e-06, + "loss": 0.5593, + "step": 34620 + }, + { + "epoch": 0.89, + "learning_rate": 1.651830871442559e-06, + "loss": 0.5693, + "step": 34621 + }, + { + "epoch": 0.89, + "learning_rate": 1.6518098869067347e-06, + "loss": 1.043, + "step": 34622 + }, + { + "epoch": 0.89, + "learning_rate": 1.6517889018718496e-06, + "loss": 0.5894, + "step": 34623 + }, + { + "epoch": 0.89, + "learning_rate": 1.6517679163379196e-06, + "loss": 0.9209, + "step": 34624 + }, + { + "epoch": 0.89, + "learning_rate": 1.651746930304961e-06, + "loss": 0.8613, + "step": 34625 + }, + { + "epoch": 0.89, + "learning_rate": 1.6517259437729898e-06, + "loss": 1.0381, + "step": 34626 + }, + { + "epoch": 0.89, + "learning_rate": 1.651704956742022e-06, + "loss": 0.9502, + "step": 34627 + }, + { + "epoch": 0.89, + "learning_rate": 1.6516839692120737e-06, + "loss": 0.874, + "step": 34628 + }, + { + "epoch": 0.89, + "learning_rate": 1.6516629811831608e-06, + "loss": 0.7983, + "step": 34629 + }, + { + "epoch": 0.89, + "learning_rate": 1.6516419926553e-06, + "loss": 0.9883, + "step": 34630 + }, + { + "epoch": 0.89, + "learning_rate": 1.6516210036285061e-06, + "loss": 0.8604, + "step": 34631 + }, + { + "epoch": 0.89, + "learning_rate": 1.6516000141027964e-06, + "loss": 0.8813, + "step": 34632 + }, + { + "epoch": 0.89, + "learning_rate": 1.6515790240781864e-06, + "loss": 0.4575, + "step": 34633 + }, + { + "epoch": 0.89, + "learning_rate": 1.6515580335546923e-06, + "loss": 0.8174, + "step": 34634 + }, + { + "epoch": 0.89, + "learning_rate": 1.6515370425323302e-06, + "loss": 0.9043, + "step": 34635 + }, + { + "epoch": 0.89, + "learning_rate": 1.6515160510111163e-06, + "loss": 0.8936, + "step": 34636 + }, + { + "epoch": 0.89, + "learning_rate": 1.6514950589910663e-06, + "loss": 0.7988, + "step": 34637 + }, + { + "epoch": 0.89, + "learning_rate": 1.6514740664721969e-06, + "loss": 0.6274, + "step": 34638 + }, + { + "epoch": 0.89, + "learning_rate": 1.6514530734545233e-06, + "loss": 0.9121, + "step": 34639 + }, + { + "epoch": 0.89, + "learning_rate": 1.6514320799380623e-06, + "loss": 0.8999, + "step": 34640 + }, + { + "epoch": 0.89, + "learning_rate": 1.6514110859228295e-06, + "loss": 0.9233, + "step": 34641 + }, + { + "epoch": 0.89, + "learning_rate": 1.6513900914088413e-06, + "loss": 0.8975, + "step": 34642 + }, + { + "epoch": 0.89, + "learning_rate": 1.6513690963961136e-06, + "loss": 0.8281, + "step": 34643 + }, + { + "epoch": 0.89, + "learning_rate": 1.6513481008846628e-06, + "loss": 0.8379, + "step": 34644 + }, + { + "epoch": 0.89, + "learning_rate": 1.6513271048745044e-06, + "loss": 0.5896, + "step": 34645 + }, + { + "epoch": 0.89, + "learning_rate": 1.651306108365655e-06, + "loss": 0.6904, + "step": 34646 + }, + { + "epoch": 0.89, + "learning_rate": 1.6512851113581303e-06, + "loss": 0.6885, + "step": 34647 + }, + { + "epoch": 0.89, + "learning_rate": 1.6512641138519465e-06, + "loss": 0.8975, + "step": 34648 + }, + { + "epoch": 0.89, + "learning_rate": 1.6512431158471197e-06, + "loss": 0.7646, + "step": 34649 + }, + { + "epoch": 0.89, + "learning_rate": 1.6512221173436663e-06, + "loss": 0.8926, + "step": 34650 + }, + { + "epoch": 0.89, + "learning_rate": 1.6512011183416016e-06, + "loss": 0.8447, + "step": 34651 + }, + { + "epoch": 0.89, + "learning_rate": 1.6511801188409424e-06, + "loss": 0.6069, + "step": 34652 + }, + { + "epoch": 0.89, + "learning_rate": 1.6511591188417046e-06, + "loss": 0.6877, + "step": 34653 + }, + { + "epoch": 0.89, + "learning_rate": 1.6511381183439042e-06, + "loss": 0.5923, + "step": 34654 + }, + { + "epoch": 0.89, + "learning_rate": 1.651117117347557e-06, + "loss": 0.9023, + "step": 34655 + }, + { + "epoch": 0.89, + "learning_rate": 1.6510961158526796e-06, + "loss": 1.0361, + "step": 34656 + }, + { + "epoch": 0.89, + "learning_rate": 1.651075113859288e-06, + "loss": 0.9102, + "step": 34657 + }, + { + "epoch": 0.89, + "learning_rate": 1.6510541113673978e-06, + "loss": 0.8613, + "step": 34658 + }, + { + "epoch": 0.89, + "learning_rate": 1.6510331083770256e-06, + "loss": 0.8516, + "step": 34659 + }, + { + "epoch": 0.89, + "learning_rate": 1.6510121048881875e-06, + "loss": 0.8555, + "step": 34660 + }, + { + "epoch": 0.89, + "learning_rate": 1.650991100900899e-06, + "loss": 0.9463, + "step": 34661 + }, + { + "epoch": 0.89, + "learning_rate": 1.6509700964151767e-06, + "loss": 0.6099, + "step": 34662 + }, + { + "epoch": 0.89, + "learning_rate": 1.6509490914310363e-06, + "loss": 0.8418, + "step": 34663 + }, + { + "epoch": 0.89, + "learning_rate": 1.6509280859484942e-06, + "loss": 0.9824, + "step": 34664 + }, + { + "epoch": 0.89, + "learning_rate": 1.6509070799675667e-06, + "loss": 0.8472, + "step": 34665 + }, + { + "epoch": 0.89, + "learning_rate": 1.6508860734882693e-06, + "loss": 0.7036, + "step": 34666 + }, + { + "epoch": 0.89, + "learning_rate": 1.6508650665106182e-06, + "loss": 0.9365, + "step": 34667 + }, + { + "epoch": 0.89, + "learning_rate": 1.65084405903463e-06, + "loss": 0.7002, + "step": 34668 + }, + { + "epoch": 0.89, + "learning_rate": 1.6508230510603202e-06, + "loss": 0.9199, + "step": 34669 + }, + { + "epoch": 0.89, + "learning_rate": 1.6508020425877055e-06, + "loss": 1.0693, + "step": 34670 + }, + { + "epoch": 0.89, + "learning_rate": 1.6507810336168012e-06, + "loss": 0.8438, + "step": 34671 + }, + { + "epoch": 0.89, + "learning_rate": 1.6507600241476238e-06, + "loss": 0.9746, + "step": 34672 + }, + { + "epoch": 0.89, + "learning_rate": 1.6507390141801895e-06, + "loss": 0.9414, + "step": 34673 + }, + { + "epoch": 0.89, + "learning_rate": 1.6507180037145143e-06, + "loss": 0.8115, + "step": 34674 + }, + { + "epoch": 0.89, + "learning_rate": 1.650696992750614e-06, + "loss": 0.8467, + "step": 34675 + }, + { + "epoch": 0.89, + "learning_rate": 1.650675981288505e-06, + "loss": 0.8223, + "step": 34676 + }, + { + "epoch": 0.89, + "learning_rate": 1.6506549693282036e-06, + "loss": 0.7141, + "step": 34677 + }, + { + "epoch": 0.89, + "learning_rate": 1.6506339568697254e-06, + "loss": 0.9424, + "step": 34678 + }, + { + "epoch": 0.89, + "learning_rate": 1.6506129439130867e-06, + "loss": 0.8506, + "step": 34679 + }, + { + "epoch": 0.89, + "learning_rate": 1.6505919304583038e-06, + "loss": 1.0049, + "step": 34680 + }, + { + "epoch": 0.89, + "learning_rate": 1.6505709165053925e-06, + "loss": 0.8984, + "step": 34681 + }, + { + "epoch": 0.89, + "learning_rate": 1.6505499020543688e-06, + "loss": 0.688, + "step": 34682 + }, + { + "epoch": 0.89, + "learning_rate": 1.6505288871052487e-06, + "loss": 0.6343, + "step": 34683 + }, + { + "epoch": 0.89, + "learning_rate": 1.6505078716580489e-06, + "loss": 0.7324, + "step": 34684 + }, + { + "epoch": 0.89, + "learning_rate": 1.6504868557127854e-06, + "loss": 0.8613, + "step": 34685 + }, + { + "epoch": 0.89, + "learning_rate": 1.6504658392694736e-06, + "loss": 0.7383, + "step": 34686 + }, + { + "epoch": 0.89, + "learning_rate": 1.6504448223281303e-06, + "loss": 0.8701, + "step": 34687 + }, + { + "epoch": 0.89, + "learning_rate": 1.6504238048887708e-06, + "loss": 0.917, + "step": 34688 + }, + { + "epoch": 0.89, + "learning_rate": 1.650402786951412e-06, + "loss": 0.9561, + "step": 34689 + }, + { + "epoch": 0.89, + "learning_rate": 1.65038176851607e-06, + "loss": 0.6553, + "step": 34690 + }, + { + "epoch": 0.89, + "learning_rate": 1.6503607495827603e-06, + "loss": 0.9502, + "step": 34691 + }, + { + "epoch": 0.89, + "learning_rate": 1.6503397301514993e-06, + "loss": 0.7744, + "step": 34692 + }, + { + "epoch": 0.89, + "learning_rate": 1.6503187102223027e-06, + "loss": 1.0029, + "step": 34693 + }, + { + "epoch": 0.89, + "learning_rate": 1.6502976897951874e-06, + "loss": 1.0654, + "step": 34694 + }, + { + "epoch": 0.89, + "learning_rate": 1.6502766688701692e-06, + "loss": 0.9375, + "step": 34695 + }, + { + "epoch": 0.89, + "learning_rate": 1.6502556474472637e-06, + "loss": 0.8018, + "step": 34696 + }, + { + "epoch": 0.89, + "learning_rate": 1.6502346255264875e-06, + "loss": 0.957, + "step": 34697 + }, + { + "epoch": 0.89, + "learning_rate": 1.6502136031078563e-06, + "loss": 0.8652, + "step": 34698 + }, + { + "epoch": 0.89, + "learning_rate": 1.650192580191387e-06, + "loss": 0.9883, + "step": 34699 + }, + { + "epoch": 0.89, + "learning_rate": 1.6501715567770948e-06, + "loss": 0.9268, + "step": 34700 + }, + { + "epoch": 0.89, + "learning_rate": 1.650150532864996e-06, + "loss": 0.7949, + "step": 34701 + }, + { + "epoch": 0.89, + "learning_rate": 1.650129508455107e-06, + "loss": 0.7441, + "step": 34702 + }, + { + "epoch": 0.89, + "learning_rate": 1.6501084835474438e-06, + "loss": 0.7852, + "step": 34703 + }, + { + "epoch": 0.89, + "learning_rate": 1.6500874581420221e-06, + "loss": 1.0254, + "step": 34704 + }, + { + "epoch": 0.89, + "learning_rate": 1.650066432238859e-06, + "loss": 1.0869, + "step": 34705 + }, + { + "epoch": 0.89, + "learning_rate": 1.6500454058379694e-06, + "loss": 1.0352, + "step": 34706 + }, + { + "epoch": 0.89, + "learning_rate": 1.6500243789393697e-06, + "loss": 0.7793, + "step": 34707 + }, + { + "epoch": 0.89, + "learning_rate": 1.6500033515430767e-06, + "loss": 0.8423, + "step": 34708 + }, + { + "epoch": 0.89, + "learning_rate": 1.649982323649106e-06, + "loss": 0.749, + "step": 34709 + }, + { + "epoch": 0.89, + "learning_rate": 1.6499612952574734e-06, + "loss": 0.7607, + "step": 34710 + }, + { + "epoch": 0.89, + "learning_rate": 1.6499402663681955e-06, + "loss": 0.8281, + "step": 34711 + }, + { + "epoch": 0.89, + "learning_rate": 1.6499192369812885e-06, + "loss": 0.8555, + "step": 34712 + }, + { + "epoch": 0.89, + "learning_rate": 1.6498982070967678e-06, + "loss": 0.8159, + "step": 34713 + }, + { + "epoch": 0.89, + "learning_rate": 1.64987717671465e-06, + "loss": 0.592, + "step": 34714 + }, + { + "epoch": 0.89, + "learning_rate": 1.6498561458349514e-06, + "loss": 0.8042, + "step": 34715 + }, + { + "epoch": 0.89, + "learning_rate": 1.6498351144576877e-06, + "loss": 0.6831, + "step": 34716 + }, + { + "epoch": 0.89, + "learning_rate": 1.6498140825828748e-06, + "loss": 0.7793, + "step": 34717 + }, + { + "epoch": 0.89, + "learning_rate": 1.6497930502105292e-06, + "loss": 1.0684, + "step": 34718 + }, + { + "epoch": 0.89, + "learning_rate": 1.6497720173406674e-06, + "loss": 0.8389, + "step": 34719 + }, + { + "epoch": 0.89, + "learning_rate": 1.6497509839733046e-06, + "loss": 0.6382, + "step": 34720 + }, + { + "epoch": 0.89, + "learning_rate": 1.6497299501084576e-06, + "loss": 0.9746, + "step": 34721 + }, + { + "epoch": 0.89, + "learning_rate": 1.6497089157461421e-06, + "loss": 0.8457, + "step": 34722 + }, + { + "epoch": 0.89, + "learning_rate": 1.6496878808863746e-06, + "loss": 0.7871, + "step": 34723 + }, + { + "epoch": 0.89, + "learning_rate": 1.6496668455291709e-06, + "loss": 0.998, + "step": 34724 + }, + { + "epoch": 0.89, + "learning_rate": 1.6496458096745469e-06, + "loss": 1.0186, + "step": 34725 + }, + { + "epoch": 0.89, + "learning_rate": 1.649624773322519e-06, + "loss": 0.9023, + "step": 34726 + }, + { + "epoch": 0.89, + "learning_rate": 1.6496037364731037e-06, + "loss": 0.8682, + "step": 34727 + }, + { + "epoch": 0.89, + "learning_rate": 1.6495826991263164e-06, + "loss": 0.8564, + "step": 34728 + }, + { + "epoch": 0.89, + "learning_rate": 1.6495616612821736e-06, + "loss": 0.8535, + "step": 34729 + }, + { + "epoch": 0.89, + "learning_rate": 1.6495406229406909e-06, + "loss": 0.7988, + "step": 34730 + }, + { + "epoch": 0.89, + "learning_rate": 1.649519584101885e-06, + "loss": 0.9102, + "step": 34731 + }, + { + "epoch": 0.89, + "learning_rate": 1.6494985447657723e-06, + "loss": 0.7368, + "step": 34732 + }, + { + "epoch": 0.89, + "learning_rate": 1.6494775049323679e-06, + "loss": 0.7627, + "step": 34733 + }, + { + "epoch": 0.89, + "learning_rate": 1.6494564646016889e-06, + "loss": 0.5718, + "step": 34734 + }, + { + "epoch": 0.89, + "learning_rate": 1.6494354237737507e-06, + "loss": 0.8506, + "step": 34735 + }, + { + "epoch": 0.89, + "learning_rate": 1.6494143824485693e-06, + "loss": 0.9062, + "step": 34736 + }, + { + "epoch": 0.89, + "learning_rate": 1.6493933406261617e-06, + "loss": 0.7056, + "step": 34737 + }, + { + "epoch": 0.89, + "learning_rate": 1.649372298306543e-06, + "loss": 0.8652, + "step": 34738 + }, + { + "epoch": 0.89, + "learning_rate": 1.6493512554897305e-06, + "loss": 0.9463, + "step": 34739 + }, + { + "epoch": 0.89, + "learning_rate": 1.649330212175739e-06, + "loss": 0.7344, + "step": 34740 + }, + { + "epoch": 0.89, + "learning_rate": 1.6493091683645853e-06, + "loss": 0.5061, + "step": 34741 + }, + { + "epoch": 0.89, + "learning_rate": 1.6492881240562855e-06, + "loss": 0.6191, + "step": 34742 + }, + { + "epoch": 0.89, + "learning_rate": 1.6492670792508555e-06, + "loss": 0.8574, + "step": 34743 + }, + { + "epoch": 0.89, + "learning_rate": 1.6492460339483119e-06, + "loss": 0.7061, + "step": 34744 + }, + { + "epoch": 0.89, + "learning_rate": 1.6492249881486702e-06, + "loss": 0.8154, + "step": 34745 + }, + { + "epoch": 0.89, + "learning_rate": 1.6492039418519468e-06, + "loss": 0.73, + "step": 34746 + }, + { + "epoch": 0.89, + "learning_rate": 1.6491828950581578e-06, + "loss": 1.0762, + "step": 34747 + }, + { + "epoch": 0.89, + "learning_rate": 1.6491618477673193e-06, + "loss": 0.9688, + "step": 34748 + }, + { + "epoch": 0.89, + "learning_rate": 1.6491407999794476e-06, + "loss": 0.9199, + "step": 34749 + }, + { + "epoch": 0.89, + "learning_rate": 1.6491197516945583e-06, + "loss": 0.6592, + "step": 34750 + }, + { + "epoch": 0.89, + "learning_rate": 1.6490987029126682e-06, + "loss": 0.6309, + "step": 34751 + }, + { + "epoch": 0.89, + "learning_rate": 1.649077653633793e-06, + "loss": 0.8359, + "step": 34752 + }, + { + "epoch": 0.89, + "learning_rate": 1.6490566038579487e-06, + "loss": 0.833, + "step": 34753 + }, + { + "epoch": 0.89, + "learning_rate": 1.6490355535851519e-06, + "loss": 1.0088, + "step": 34754 + }, + { + "epoch": 0.89, + "learning_rate": 1.6490145028154182e-06, + "loss": 0.7104, + "step": 34755 + }, + { + "epoch": 0.89, + "learning_rate": 1.6489934515487637e-06, + "loss": 0.9814, + "step": 34756 + }, + { + "epoch": 0.89, + "learning_rate": 1.648972399785205e-06, + "loss": 0.9072, + "step": 34757 + }, + { + "epoch": 0.89, + "learning_rate": 1.6489513475247581e-06, + "loss": 0.8135, + "step": 34758 + }, + { + "epoch": 0.89, + "learning_rate": 1.6489302947674387e-06, + "loss": 0.7178, + "step": 34759 + }, + { + "epoch": 0.89, + "learning_rate": 1.6489092415132638e-06, + "loss": 0.9824, + "step": 34760 + }, + { + "epoch": 0.89, + "learning_rate": 1.6488881877622482e-06, + "loss": 0.6331, + "step": 34761 + }, + { + "epoch": 0.89, + "learning_rate": 1.6488671335144094e-06, + "loss": 0.9092, + "step": 34762 + }, + { + "epoch": 0.89, + "learning_rate": 1.6488460787697624e-06, + "loss": 0.7021, + "step": 34763 + }, + { + "epoch": 0.89, + "learning_rate": 1.648825023528324e-06, + "loss": 0.8076, + "step": 34764 + }, + { + "epoch": 0.89, + "learning_rate": 1.6488039677901097e-06, + "loss": 0.6738, + "step": 34765 + }, + { + "epoch": 0.89, + "learning_rate": 1.6487829115551367e-06, + "loss": 0.8799, + "step": 34766 + }, + { + "epoch": 0.89, + "learning_rate": 1.64876185482342e-06, + "loss": 0.614, + "step": 34767 + }, + { + "epoch": 0.89, + "learning_rate": 1.6487407975949763e-06, + "loss": 0.9126, + "step": 34768 + }, + { + "epoch": 0.89, + "learning_rate": 1.6487197398698216e-06, + "loss": 0.8047, + "step": 34769 + }, + { + "epoch": 0.89, + "learning_rate": 1.6486986816479721e-06, + "loss": 0.7576, + "step": 34770 + }, + { + "epoch": 0.89, + "learning_rate": 1.6486776229294439e-06, + "loss": 0.9404, + "step": 34771 + }, + { + "epoch": 0.89, + "learning_rate": 1.648656563714253e-06, + "loss": 0.6182, + "step": 34772 + }, + { + "epoch": 0.89, + "learning_rate": 1.6486355040024153e-06, + "loss": 0.8237, + "step": 34773 + }, + { + "epoch": 0.89, + "learning_rate": 1.6486144437939477e-06, + "loss": 0.8867, + "step": 34774 + }, + { + "epoch": 0.89, + "learning_rate": 1.6485933830888656e-06, + "loss": 0.8896, + "step": 34775 + }, + { + "epoch": 0.89, + "learning_rate": 1.6485723218871853e-06, + "loss": 0.915, + "step": 34776 + }, + { + "epoch": 0.89, + "learning_rate": 1.648551260188923e-06, + "loss": 0.8555, + "step": 34777 + }, + { + "epoch": 0.89, + "learning_rate": 1.6485301979940952e-06, + "loss": 0.8359, + "step": 34778 + }, + { + "epoch": 0.89, + "learning_rate": 1.6485091353027175e-06, + "loss": 0.6987, + "step": 34779 + }, + { + "epoch": 0.89, + "learning_rate": 1.648488072114806e-06, + "loss": 0.8662, + "step": 34780 + }, + { + "epoch": 0.89, + "learning_rate": 1.648467008430377e-06, + "loss": 0.7627, + "step": 34781 + }, + { + "epoch": 0.89, + "learning_rate": 1.6484459442494465e-06, + "loss": 0.9756, + "step": 34782 + }, + { + "epoch": 0.89, + "learning_rate": 1.648424879572031e-06, + "loss": 0.8418, + "step": 34783 + }, + { + "epoch": 0.89, + "learning_rate": 1.6484038143981462e-06, + "loss": 0.9004, + "step": 34784 + }, + { + "epoch": 0.89, + "learning_rate": 1.6483827487278087e-06, + "loss": 1.042, + "step": 34785 + }, + { + "epoch": 0.89, + "learning_rate": 1.648361682561034e-06, + "loss": 0.7832, + "step": 34786 + }, + { + "epoch": 0.89, + "learning_rate": 1.6483406158978388e-06, + "loss": 0.7886, + "step": 34787 + }, + { + "epoch": 0.89, + "learning_rate": 1.6483195487382391e-06, + "loss": 0.7334, + "step": 34788 + }, + { + "epoch": 0.89, + "learning_rate": 1.6482984810822508e-06, + "loss": 0.8242, + "step": 34789 + }, + { + "epoch": 0.89, + "learning_rate": 1.6482774129298899e-06, + "loss": 0.7471, + "step": 34790 + }, + { + "epoch": 0.89, + "learning_rate": 1.6482563442811732e-06, + "loss": 0.8174, + "step": 34791 + }, + { + "epoch": 0.89, + "learning_rate": 1.6482352751361162e-06, + "loss": 0.8887, + "step": 34792 + }, + { + "epoch": 0.89, + "learning_rate": 1.6482142054947351e-06, + "loss": 0.9229, + "step": 34793 + }, + { + "epoch": 0.89, + "learning_rate": 1.6481931353570465e-06, + "loss": 0.7617, + "step": 34794 + }, + { + "epoch": 0.89, + "learning_rate": 1.6481720647230661e-06, + "loss": 1.0039, + "step": 34795 + }, + { + "epoch": 0.89, + "learning_rate": 1.6481509935928101e-06, + "loss": 0.9365, + "step": 34796 + }, + { + "epoch": 0.89, + "learning_rate": 1.6481299219662947e-06, + "loss": 0.6914, + "step": 34797 + }, + { + "epoch": 0.89, + "learning_rate": 1.6481088498435364e-06, + "loss": 0.7734, + "step": 34798 + }, + { + "epoch": 0.89, + "learning_rate": 1.6480877772245507e-06, + "loss": 0.8271, + "step": 34799 + }, + { + "epoch": 0.89, + "learning_rate": 1.648066704109354e-06, + "loss": 0.957, + "step": 34800 + }, + { + "epoch": 0.89, + "learning_rate": 1.648045630497962e-06, + "loss": 0.8672, + "step": 34801 + }, + { + "epoch": 0.89, + "learning_rate": 1.6480245563903918e-06, + "loss": 0.8193, + "step": 34802 + }, + { + "epoch": 0.89, + "learning_rate": 1.6480034817866585e-06, + "loss": 0.7061, + "step": 34803 + }, + { + "epoch": 0.89, + "learning_rate": 1.647982406686779e-06, + "loss": 0.6987, + "step": 34804 + }, + { + "epoch": 0.89, + "learning_rate": 1.6479613310907695e-06, + "loss": 0.8496, + "step": 34805 + }, + { + "epoch": 0.89, + "learning_rate": 1.6479402549986453e-06, + "loss": 0.9043, + "step": 34806 + }, + { + "epoch": 0.89, + "learning_rate": 1.6479191784104233e-06, + "loss": 0.8608, + "step": 34807 + }, + { + "epoch": 0.89, + "learning_rate": 1.6478981013261195e-06, + "loss": 0.9199, + "step": 34808 + }, + { + "epoch": 0.89, + "learning_rate": 1.6478770237457495e-06, + "loss": 0.8682, + "step": 34809 + }, + { + "epoch": 0.89, + "learning_rate": 1.6478559456693302e-06, + "loss": 0.998, + "step": 34810 + }, + { + "epoch": 0.89, + "learning_rate": 1.6478348670968774e-06, + "loss": 0.8945, + "step": 34811 + }, + { + "epoch": 0.89, + "learning_rate": 1.647813788028407e-06, + "loss": 0.8154, + "step": 34812 + }, + { + "epoch": 0.89, + "learning_rate": 1.6477927084639353e-06, + "loss": 0.6431, + "step": 34813 + }, + { + "epoch": 0.89, + "learning_rate": 1.6477716284034788e-06, + "loss": 0.8174, + "step": 34814 + }, + { + "epoch": 0.89, + "learning_rate": 1.6477505478470533e-06, + "loss": 0.7891, + "step": 34815 + }, + { + "epoch": 0.89, + "learning_rate": 1.6477294667946747e-06, + "loss": 0.9541, + "step": 34816 + }, + { + "epoch": 0.89, + "learning_rate": 1.64770838524636e-06, + "loss": 0.8135, + "step": 34817 + }, + { + "epoch": 0.89, + "learning_rate": 1.6476873032021242e-06, + "loss": 1.0195, + "step": 34818 + }, + { + "epoch": 0.89, + "learning_rate": 1.6476662206619842e-06, + "loss": 0.8926, + "step": 34819 + }, + { + "epoch": 0.89, + "learning_rate": 1.6476451376259561e-06, + "loss": 0.8203, + "step": 34820 + }, + { + "epoch": 0.89, + "learning_rate": 1.6476240540940557e-06, + "loss": 0.8623, + "step": 34821 + }, + { + "epoch": 0.89, + "learning_rate": 1.6476029700662997e-06, + "loss": 0.917, + "step": 34822 + }, + { + "epoch": 0.89, + "learning_rate": 1.6475818855427033e-06, + "loss": 0.8574, + "step": 34823 + }, + { + "epoch": 0.89, + "learning_rate": 1.647560800523284e-06, + "loss": 0.6821, + "step": 34824 + }, + { + "epoch": 0.89, + "learning_rate": 1.6475397150080564e-06, + "loss": 0.8154, + "step": 34825 + }, + { + "epoch": 0.89, + "learning_rate": 1.6475186289970377e-06, + "loss": 0.8633, + "step": 34826 + }, + { + "epoch": 0.89, + "learning_rate": 1.6474975424902437e-06, + "loss": 0.9238, + "step": 34827 + }, + { + "epoch": 0.89, + "learning_rate": 1.6474764554876908e-06, + "loss": 0.9209, + "step": 34828 + }, + { + "epoch": 0.89, + "learning_rate": 1.6474553679893947e-06, + "loss": 0.8428, + "step": 34829 + }, + { + "epoch": 0.89, + "learning_rate": 1.6474342799953722e-06, + "loss": 0.877, + "step": 34830 + }, + { + "epoch": 0.89, + "learning_rate": 1.6474131915056386e-06, + "loss": 0.562, + "step": 34831 + }, + { + "epoch": 0.89, + "learning_rate": 1.6473921025202108e-06, + "loss": 0.8271, + "step": 34832 + }, + { + "epoch": 0.89, + "learning_rate": 1.6473710130391044e-06, + "loss": 1.0723, + "step": 34833 + }, + { + "epoch": 0.89, + "learning_rate": 1.647349923062336e-06, + "loss": 0.6689, + "step": 34834 + }, + { + "epoch": 0.89, + "learning_rate": 1.6473288325899213e-06, + "loss": 1.0234, + "step": 34835 + }, + { + "epoch": 0.89, + "learning_rate": 1.6473077416218769e-06, + "loss": 0.9141, + "step": 34836 + }, + { + "epoch": 0.89, + "learning_rate": 1.6472866501582185e-06, + "loss": 0.999, + "step": 34837 + }, + { + "epoch": 0.89, + "learning_rate": 1.6472655581989624e-06, + "loss": 1.0176, + "step": 34838 + }, + { + "epoch": 0.89, + "learning_rate": 1.6472444657441253e-06, + "loss": 1.0469, + "step": 34839 + }, + { + "epoch": 0.89, + "learning_rate": 1.6472233727937226e-06, + "loss": 1.0645, + "step": 34840 + }, + { + "epoch": 0.89, + "learning_rate": 1.6472022793477708e-06, + "loss": 0.9512, + "step": 34841 + }, + { + "epoch": 0.89, + "learning_rate": 1.6471811854062858e-06, + "loss": 0.8711, + "step": 34842 + }, + { + "epoch": 0.89, + "learning_rate": 1.6471600909692839e-06, + "loss": 0.5391, + "step": 34843 + }, + { + "epoch": 0.89, + "learning_rate": 1.6471389960367816e-06, + "loss": 0.8926, + "step": 34844 + }, + { + "epoch": 0.89, + "learning_rate": 1.6471179006087946e-06, + "loss": 0.8701, + "step": 34845 + }, + { + "epoch": 0.89, + "learning_rate": 1.6470968046853391e-06, + "loss": 0.8862, + "step": 34846 + }, + { + "epoch": 0.89, + "learning_rate": 1.6470757082664313e-06, + "loss": 1.0098, + "step": 34847 + }, + { + "epoch": 0.89, + "learning_rate": 1.6470546113520873e-06, + "loss": 0.7783, + "step": 34848 + }, + { + "epoch": 0.89, + "learning_rate": 1.6470335139423233e-06, + "loss": 0.8477, + "step": 34849 + }, + { + "epoch": 0.89, + "learning_rate": 1.647012416037156e-06, + "loss": 0.7446, + "step": 34850 + }, + { + "epoch": 0.89, + "learning_rate": 1.6469913176366003e-06, + "loss": 0.7861, + "step": 34851 + }, + { + "epoch": 0.89, + "learning_rate": 1.6469702187406736e-06, + "loss": 0.7227, + "step": 34852 + }, + { + "epoch": 0.89, + "learning_rate": 1.6469491193493914e-06, + "loss": 0.9395, + "step": 34853 + }, + { + "epoch": 0.89, + "learning_rate": 1.6469280194627703e-06, + "loss": 0.7993, + "step": 34854 + }, + { + "epoch": 0.89, + "learning_rate": 1.6469069190808256e-06, + "loss": 0.8521, + "step": 34855 + }, + { + "epoch": 0.89, + "learning_rate": 1.6468858182035743e-06, + "loss": 0.6147, + "step": 34856 + }, + { + "epoch": 0.89, + "learning_rate": 1.6468647168310323e-06, + "loss": 0.8613, + "step": 34857 + }, + { + "epoch": 0.89, + "learning_rate": 1.6468436149632157e-06, + "loss": 0.7812, + "step": 34858 + }, + { + "epoch": 0.89, + "learning_rate": 1.6468225126001406e-06, + "loss": 0.752, + "step": 34859 + }, + { + "epoch": 0.89, + "learning_rate": 1.6468014097418234e-06, + "loss": 0.6709, + "step": 34860 + }, + { + "epoch": 0.89, + "learning_rate": 1.64678030638828e-06, + "loss": 0.8633, + "step": 34861 + }, + { + "epoch": 0.89, + "learning_rate": 1.646759202539527e-06, + "loss": 0.8545, + "step": 34862 + }, + { + "epoch": 0.89, + "learning_rate": 1.6467380981955797e-06, + "loss": 0.8218, + "step": 34863 + }, + { + "epoch": 0.89, + "learning_rate": 1.6467169933564554e-06, + "loss": 0.8145, + "step": 34864 + }, + { + "epoch": 0.89, + "learning_rate": 1.6466958880221691e-06, + "loss": 0.6699, + "step": 34865 + }, + { + "epoch": 0.89, + "learning_rate": 1.6466747821927375e-06, + "loss": 0.6982, + "step": 34866 + }, + { + "epoch": 0.89, + "learning_rate": 1.646653675868177e-06, + "loss": 0.8467, + "step": 34867 + }, + { + "epoch": 0.89, + "learning_rate": 1.6466325690485031e-06, + "loss": 0.876, + "step": 34868 + }, + { + "epoch": 0.89, + "learning_rate": 1.646611461733733e-06, + "loss": 0.6685, + "step": 34869 + }, + { + "epoch": 0.89, + "learning_rate": 1.6465903539238818e-06, + "loss": 0.6924, + "step": 34870 + }, + { + "epoch": 0.89, + "learning_rate": 1.6465692456189663e-06, + "loss": 1.0742, + "step": 34871 + }, + { + "epoch": 0.89, + "learning_rate": 1.6465481368190025e-06, + "loss": 1.043, + "step": 34872 + }, + { + "epoch": 0.89, + "learning_rate": 1.6465270275240063e-06, + "loss": 0.8066, + "step": 34873 + }, + { + "epoch": 0.89, + "learning_rate": 1.6465059177339939e-06, + "loss": 0.7104, + "step": 34874 + }, + { + "epoch": 0.89, + "learning_rate": 1.6464848074489822e-06, + "loss": 0.833, + "step": 34875 + }, + { + "epoch": 0.89, + "learning_rate": 1.6464636966689863e-06, + "loss": 0.6382, + "step": 34876 + }, + { + "epoch": 0.89, + "learning_rate": 1.6464425853940234e-06, + "loss": 0.9375, + "step": 34877 + }, + { + "epoch": 0.89, + "learning_rate": 1.6464214736241086e-06, + "loss": 1.1475, + "step": 34878 + }, + { + "epoch": 0.89, + "learning_rate": 1.6464003613592588e-06, + "loss": 0.9736, + "step": 34879 + }, + { + "epoch": 0.89, + "learning_rate": 1.64637924859949e-06, + "loss": 0.8408, + "step": 34880 + }, + { + "epoch": 0.89, + "learning_rate": 1.6463581353448183e-06, + "loss": 0.6826, + "step": 34881 + }, + { + "epoch": 0.89, + "learning_rate": 1.6463370215952602e-06, + "loss": 0.8416, + "step": 34882 + }, + { + "epoch": 0.89, + "learning_rate": 1.6463159073508311e-06, + "loss": 0.7344, + "step": 34883 + }, + { + "epoch": 0.89, + "learning_rate": 1.646294792611548e-06, + "loss": 0.8408, + "step": 34884 + }, + { + "epoch": 0.89, + "learning_rate": 1.6462736773774264e-06, + "loss": 0.606, + "step": 34885 + }, + { + "epoch": 0.89, + "learning_rate": 1.646252561648483e-06, + "loss": 0.6787, + "step": 34886 + }, + { + "epoch": 0.89, + "learning_rate": 1.6462314454247333e-06, + "loss": 0.7695, + "step": 34887 + }, + { + "epoch": 0.89, + "learning_rate": 1.6462103287061942e-06, + "loss": 0.7312, + "step": 34888 + }, + { + "epoch": 0.89, + "learning_rate": 1.6461892114928819e-06, + "loss": 0.7891, + "step": 34889 + }, + { + "epoch": 0.89, + "learning_rate": 1.6461680937848116e-06, + "loss": 0.7979, + "step": 34890 + }, + { + "epoch": 0.89, + "learning_rate": 1.6461469755820006e-06, + "loss": 0.7354, + "step": 34891 + }, + { + "epoch": 0.89, + "learning_rate": 1.6461258568844642e-06, + "loss": 0.9004, + "step": 34892 + }, + { + "epoch": 0.89, + "learning_rate": 1.646104737692219e-06, + "loss": 1.0283, + "step": 34893 + }, + { + "epoch": 0.89, + "learning_rate": 1.6460836180052815e-06, + "loss": 0.8711, + "step": 34894 + }, + { + "epoch": 0.89, + "learning_rate": 1.6460624978236671e-06, + "loss": 1.0186, + "step": 34895 + }, + { + "epoch": 0.89, + "learning_rate": 1.6460413771473927e-06, + "loss": 1.04, + "step": 34896 + }, + { + "epoch": 0.89, + "learning_rate": 1.6460202559764737e-06, + "loss": 0.9912, + "step": 34897 + }, + { + "epoch": 0.89, + "learning_rate": 1.645999134310927e-06, + "loss": 0.8896, + "step": 34898 + }, + { + "epoch": 0.89, + "learning_rate": 1.6459780121507683e-06, + "loss": 0.8164, + "step": 34899 + }, + { + "epoch": 0.89, + "learning_rate": 1.6459568894960138e-06, + "loss": 0.8887, + "step": 34900 + }, + { + "epoch": 0.89, + "learning_rate": 1.64593576634668e-06, + "loss": 0.7109, + "step": 34901 + }, + { + "epoch": 0.89, + "learning_rate": 1.6459146427027828e-06, + "loss": 0.9346, + "step": 34902 + }, + { + "epoch": 0.89, + "learning_rate": 1.6458935185643386e-06, + "loss": 0.7253, + "step": 34903 + }, + { + "epoch": 0.89, + "learning_rate": 1.6458723939313634e-06, + "loss": 0.8721, + "step": 34904 + }, + { + "epoch": 0.89, + "learning_rate": 1.6458512688038735e-06, + "loss": 0.6919, + "step": 34905 + }, + { + "epoch": 0.89, + "learning_rate": 1.6458301431818846e-06, + "loss": 0.7217, + "step": 34906 + }, + { + "epoch": 0.89, + "learning_rate": 1.6458090170654138e-06, + "loss": 0.7236, + "step": 34907 + }, + { + "epoch": 0.89, + "learning_rate": 1.6457878904544763e-06, + "loss": 0.7695, + "step": 34908 + }, + { + "epoch": 0.89, + "learning_rate": 1.6457667633490888e-06, + "loss": 0.8394, + "step": 34909 + }, + { + "epoch": 0.89, + "learning_rate": 1.6457456357492676e-06, + "loss": 0.8887, + "step": 34910 + }, + { + "epoch": 0.89, + "learning_rate": 1.6457245076550286e-06, + "loss": 0.8555, + "step": 34911 + }, + { + "epoch": 0.89, + "learning_rate": 1.6457033790663877e-06, + "loss": 0.7651, + "step": 34912 + }, + { + "epoch": 0.89, + "learning_rate": 1.6456822499833615e-06, + "loss": 0.9336, + "step": 34913 + }, + { + "epoch": 0.89, + "learning_rate": 1.6456611204059666e-06, + "loss": 0.5151, + "step": 34914 + }, + { + "epoch": 0.89, + "learning_rate": 1.6456399903342182e-06, + "loss": 0.9258, + "step": 34915 + }, + { + "epoch": 0.89, + "learning_rate": 1.6456188597681328e-06, + "loss": 0.6289, + "step": 34916 + }, + { + "epoch": 0.89, + "learning_rate": 1.645597728707727e-06, + "loss": 0.6133, + "step": 34917 + }, + { + "epoch": 0.89, + "learning_rate": 1.6455765971530168e-06, + "loss": 0.8037, + "step": 34918 + }, + { + "epoch": 0.89, + "learning_rate": 1.6455554651040183e-06, + "loss": 1.0088, + "step": 34919 + }, + { + "epoch": 0.9, + "learning_rate": 1.6455343325607474e-06, + "loss": 0.8232, + "step": 34920 + }, + { + "epoch": 0.9, + "learning_rate": 1.6455131995232206e-06, + "loss": 0.9209, + "step": 34921 + }, + { + "epoch": 0.9, + "learning_rate": 1.645492065991454e-06, + "loss": 0.6553, + "step": 34922 + }, + { + "epoch": 0.9, + "learning_rate": 1.6454709319654641e-06, + "loss": 0.9639, + "step": 34923 + }, + { + "epoch": 0.9, + "learning_rate": 1.6454497974452667e-06, + "loss": 0.9736, + "step": 34924 + }, + { + "epoch": 0.9, + "learning_rate": 1.6454286624308778e-06, + "loss": 0.9287, + "step": 34925 + }, + { + "epoch": 0.9, + "learning_rate": 1.6454075269223138e-06, + "loss": 0.9844, + "step": 34926 + }, + { + "epoch": 0.9, + "learning_rate": 1.645386390919591e-06, + "loss": 0.875, + "step": 34927 + }, + { + "epoch": 0.9, + "learning_rate": 1.6453652544227259e-06, + "loss": 0.917, + "step": 34928 + }, + { + "epoch": 0.9, + "learning_rate": 1.6453441174317342e-06, + "loss": 0.8345, + "step": 34929 + }, + { + "epoch": 0.9, + "learning_rate": 1.645322979946632e-06, + "loss": 0.7578, + "step": 34930 + }, + { + "epoch": 0.9, + "learning_rate": 1.6453018419674357e-06, + "loss": 0.877, + "step": 34931 + }, + { + "epoch": 0.9, + "learning_rate": 1.6452807034941613e-06, + "loss": 0.8271, + "step": 34932 + }, + { + "epoch": 0.9, + "learning_rate": 1.6452595645268255e-06, + "loss": 0.7957, + "step": 34933 + }, + { + "epoch": 0.9, + "learning_rate": 1.6452384250654438e-06, + "loss": 0.8311, + "step": 34934 + }, + { + "epoch": 0.9, + "learning_rate": 1.645217285110033e-06, + "loss": 0.7666, + "step": 34935 + }, + { + "epoch": 0.9, + "learning_rate": 1.6451961446606085e-06, + "loss": 0.9668, + "step": 34936 + }, + { + "epoch": 0.9, + "learning_rate": 1.6451750037171875e-06, + "loss": 0.73, + "step": 34937 + }, + { + "epoch": 0.9, + "learning_rate": 1.6451538622797854e-06, + "loss": 0.8271, + "step": 34938 + }, + { + "epoch": 0.9, + "learning_rate": 1.6451327203484186e-06, + "loss": 0.811, + "step": 34939 + }, + { + "epoch": 0.9, + "learning_rate": 1.6451115779231036e-06, + "loss": 0.9697, + "step": 34940 + }, + { + "epoch": 0.9, + "learning_rate": 1.6450904350038562e-06, + "loss": 0.9014, + "step": 34941 + }, + { + "epoch": 0.9, + "learning_rate": 1.6450692915906924e-06, + "loss": 0.6943, + "step": 34942 + }, + { + "epoch": 0.9, + "learning_rate": 1.645048147683629e-06, + "loss": 0.9424, + "step": 34943 + }, + { + "epoch": 0.9, + "learning_rate": 1.6450270032826821e-06, + "loss": 0.7573, + "step": 34944 + }, + { + "epoch": 0.9, + "learning_rate": 1.6450058583878674e-06, + "loss": 0.8887, + "step": 34945 + }, + { + "epoch": 0.9, + "learning_rate": 1.6449847129992013e-06, + "loss": 0.8252, + "step": 34946 + }, + { + "epoch": 0.9, + "learning_rate": 1.6449635671167004e-06, + "loss": 0.7979, + "step": 34947 + }, + { + "epoch": 0.9, + "learning_rate": 1.6449424207403801e-06, + "loss": 0.8125, + "step": 34948 + }, + { + "epoch": 0.9, + "learning_rate": 1.6449212738702576e-06, + "loss": 0.7891, + "step": 34949 + }, + { + "epoch": 0.9, + "learning_rate": 1.6449001265063482e-06, + "loss": 0.8945, + "step": 34950 + }, + { + "epoch": 0.9, + "learning_rate": 1.6448789786486685e-06, + "loss": 0.9248, + "step": 34951 + }, + { + "epoch": 0.9, + "learning_rate": 1.6448578302972345e-06, + "loss": 0.8105, + "step": 34952 + }, + { + "epoch": 0.9, + "learning_rate": 1.6448366814520624e-06, + "loss": 0.9453, + "step": 34953 + }, + { + "epoch": 0.9, + "learning_rate": 1.644815532113169e-06, + "loss": 0.9961, + "step": 34954 + }, + { + "epoch": 0.9, + "learning_rate": 1.6447943822805694e-06, + "loss": 0.7529, + "step": 34955 + }, + { + "epoch": 0.9, + "learning_rate": 1.6447732319542808e-06, + "loss": 0.7104, + "step": 34956 + }, + { + "epoch": 0.9, + "learning_rate": 1.6447520811343187e-06, + "loss": 0.8809, + "step": 34957 + }, + { + "epoch": 0.9, + "learning_rate": 1.6447309298207e-06, + "loss": 0.7803, + "step": 34958 + }, + { + "epoch": 0.9, + "learning_rate": 1.6447097780134403e-06, + "loss": 1.1113, + "step": 34959 + }, + { + "epoch": 0.9, + "learning_rate": 1.644688625712556e-06, + "loss": 1.0791, + "step": 34960 + }, + { + "epoch": 0.9, + "learning_rate": 1.6446674729180629e-06, + "loss": 0.7656, + "step": 34961 + }, + { + "epoch": 0.9, + "learning_rate": 1.6446463196299779e-06, + "loss": 0.9141, + "step": 34962 + }, + { + "epoch": 0.9, + "learning_rate": 1.6446251658483169e-06, + "loss": 1.0156, + "step": 34963 + }, + { + "epoch": 0.9, + "learning_rate": 1.6446040115730957e-06, + "loss": 0.9404, + "step": 34964 + }, + { + "epoch": 0.9, + "learning_rate": 1.6445828568043312e-06, + "loss": 0.7363, + "step": 34965 + }, + { + "epoch": 0.9, + "learning_rate": 1.644561701542039e-06, + "loss": 0.8369, + "step": 34966 + }, + { + "epoch": 0.9, + "learning_rate": 1.6445405457862354e-06, + "loss": 0.7876, + "step": 34967 + }, + { + "epoch": 0.9, + "learning_rate": 1.6445193895369372e-06, + "loss": 0.8857, + "step": 34968 + }, + { + "epoch": 0.9, + "learning_rate": 1.64449823279416e-06, + "loss": 0.7725, + "step": 34969 + }, + { + "epoch": 0.9, + "learning_rate": 1.6444770755579201e-06, + "loss": 0.5283, + "step": 34970 + }, + { + "epoch": 0.9, + "learning_rate": 1.6444559178282336e-06, + "loss": 0.7793, + "step": 34971 + }, + { + "epoch": 0.9, + "learning_rate": 1.6444347596051168e-06, + "loss": 1.0898, + "step": 34972 + }, + { + "epoch": 0.9, + "learning_rate": 1.6444136008885861e-06, + "loss": 0.9209, + "step": 34973 + }, + { + "epoch": 0.9, + "learning_rate": 1.6443924416786577e-06, + "loss": 0.9746, + "step": 34974 + }, + { + "epoch": 0.9, + "learning_rate": 1.6443712819753474e-06, + "loss": 0.6064, + "step": 34975 + }, + { + "epoch": 0.9, + "learning_rate": 1.6443501217786718e-06, + "loss": 0.8652, + "step": 34976 + }, + { + "epoch": 0.9, + "learning_rate": 1.6443289610886467e-06, + "loss": 0.8184, + "step": 34977 + }, + { + "epoch": 0.9, + "learning_rate": 1.6443077999052886e-06, + "loss": 0.7471, + "step": 34978 + }, + { + "epoch": 0.9, + "learning_rate": 1.6442866382286139e-06, + "loss": 1.0234, + "step": 34979 + }, + { + "epoch": 0.9, + "learning_rate": 1.6442654760586382e-06, + "loss": 0.876, + "step": 34980 + }, + { + "epoch": 0.9, + "learning_rate": 1.644244313395378e-06, + "loss": 0.916, + "step": 34981 + }, + { + "epoch": 0.9, + "learning_rate": 1.64422315023885e-06, + "loss": 0.8325, + "step": 34982 + }, + { + "epoch": 0.9, + "learning_rate": 1.6442019865890698e-06, + "loss": 0.7144, + "step": 34983 + }, + { + "epoch": 0.9, + "learning_rate": 1.6441808224460537e-06, + "loss": 1.0293, + "step": 34984 + }, + { + "epoch": 0.9, + "learning_rate": 1.6441596578098179e-06, + "loss": 0.8545, + "step": 34985 + }, + { + "epoch": 0.9, + "learning_rate": 1.6441384926803785e-06, + "loss": 0.7983, + "step": 34986 + }, + { + "epoch": 0.9, + "learning_rate": 1.6441173270577521e-06, + "loss": 0.8203, + "step": 34987 + }, + { + "epoch": 0.9, + "learning_rate": 1.6440961609419545e-06, + "loss": 0.7812, + "step": 34988 + }, + { + "epoch": 0.9, + "learning_rate": 1.6440749943330025e-06, + "loss": 0.9209, + "step": 34989 + }, + { + "epoch": 0.9, + "learning_rate": 1.6440538272309117e-06, + "loss": 1.1465, + "step": 34990 + }, + { + "epoch": 0.9, + "learning_rate": 1.6440326596356983e-06, + "loss": 0.8779, + "step": 34991 + }, + { + "epoch": 0.9, + "learning_rate": 1.6440114915473789e-06, + "loss": 0.9116, + "step": 34992 + }, + { + "epoch": 0.9, + "learning_rate": 1.6439903229659696e-06, + "loss": 0.8906, + "step": 34993 + }, + { + "epoch": 0.9, + "learning_rate": 1.6439691538914864e-06, + "loss": 0.9287, + "step": 34994 + }, + { + "epoch": 0.9, + "learning_rate": 1.6439479843239457e-06, + "loss": 0.7588, + "step": 34995 + }, + { + "epoch": 0.9, + "learning_rate": 1.6439268142633634e-06, + "loss": 0.7314, + "step": 34996 + }, + { + "epoch": 0.9, + "learning_rate": 1.6439056437097559e-06, + "loss": 0.8369, + "step": 34997 + }, + { + "epoch": 0.9, + "learning_rate": 1.6438844726631396e-06, + "loss": 0.9453, + "step": 34998 + }, + { + "epoch": 0.9, + "learning_rate": 1.643863301123531e-06, + "loss": 0.7656, + "step": 34999 + }, + { + "epoch": 0.9, + "learning_rate": 1.6438421290909452e-06, + "loss": 0.9951, + "step": 35000 + }, + { + "epoch": 0.9, + "learning_rate": 1.6438209565653996e-06, + "loss": 0.8135, + "step": 35001 + }, + { + "epoch": 0.9, + "learning_rate": 1.6437997835469095e-06, + "loss": 0.7607, + "step": 35002 + }, + { + "epoch": 0.9, + "learning_rate": 1.643778610035492e-06, + "loss": 0.8057, + "step": 35003 + }, + { + "epoch": 0.9, + "learning_rate": 1.6437574360311624e-06, + "loss": 1.0967, + "step": 35004 + }, + { + "epoch": 0.9, + "learning_rate": 1.6437362615339371e-06, + "loss": 0.8838, + "step": 35005 + }, + { + "epoch": 0.9, + "learning_rate": 1.6437150865438332e-06, + "loss": 0.8555, + "step": 35006 + }, + { + "epoch": 0.9, + "learning_rate": 1.6436939110608655e-06, + "loss": 0.957, + "step": 35007 + }, + { + "epoch": 0.9, + "learning_rate": 1.643672735085052e-06, + "loss": 0.8291, + "step": 35008 + }, + { + "epoch": 0.9, + "learning_rate": 1.6436515586164071e-06, + "loss": 0.6753, + "step": 35009 + }, + { + "epoch": 0.9, + "learning_rate": 1.643630381654948e-06, + "loss": 0.7783, + "step": 35010 + }, + { + "epoch": 0.9, + "learning_rate": 1.6436092042006906e-06, + "loss": 0.8076, + "step": 35011 + }, + { + "epoch": 0.9, + "learning_rate": 1.6435880262536512e-06, + "loss": 0.7256, + "step": 35012 + }, + { + "epoch": 0.9, + "learning_rate": 1.6435668478138466e-06, + "loss": 0.7852, + "step": 35013 + }, + { + "epoch": 0.9, + "learning_rate": 1.6435456688812917e-06, + "loss": 0.8643, + "step": 35014 + }, + { + "epoch": 0.9, + "learning_rate": 1.6435244894560038e-06, + "loss": 0.8613, + "step": 35015 + }, + { + "epoch": 0.9, + "learning_rate": 1.6435033095379988e-06, + "loss": 0.7842, + "step": 35016 + }, + { + "epoch": 0.9, + "learning_rate": 1.6434821291272928e-06, + "loss": 0.6729, + "step": 35017 + }, + { + "epoch": 0.9, + "learning_rate": 1.6434609482239024e-06, + "loss": 0.8096, + "step": 35018 + }, + { + "epoch": 0.9, + "learning_rate": 1.6434397668278433e-06, + "loss": 0.9668, + "step": 35019 + }, + { + "epoch": 0.9, + "learning_rate": 1.643418584939132e-06, + "loss": 0.9766, + "step": 35020 + }, + { + "epoch": 0.9, + "learning_rate": 1.6433974025577847e-06, + "loss": 0.6406, + "step": 35021 + }, + { + "epoch": 0.9, + "learning_rate": 1.6433762196838174e-06, + "loss": 0.6526, + "step": 35022 + }, + { + "epoch": 0.9, + "learning_rate": 1.643355036317247e-06, + "loss": 0.8003, + "step": 35023 + }, + { + "epoch": 0.9, + "learning_rate": 1.643333852458089e-06, + "loss": 0.8828, + "step": 35024 + }, + { + "epoch": 0.9, + "learning_rate": 1.6433126681063596e-06, + "loss": 0.998, + "step": 35025 + }, + { + "epoch": 0.9, + "learning_rate": 1.6432914832620753e-06, + "loss": 0.7227, + "step": 35026 + }, + { + "epoch": 0.9, + "learning_rate": 1.6432702979252526e-06, + "loss": 0.8828, + "step": 35027 + }, + { + "epoch": 0.9, + "learning_rate": 1.643249112095907e-06, + "loss": 0.8691, + "step": 35028 + }, + { + "epoch": 0.9, + "learning_rate": 1.6432279257740555e-06, + "loss": 0.8994, + "step": 35029 + }, + { + "epoch": 0.9, + "learning_rate": 1.643206738959714e-06, + "loss": 0.9229, + "step": 35030 + }, + { + "epoch": 0.9, + "learning_rate": 1.6431855516528983e-06, + "loss": 0.9502, + "step": 35031 + }, + { + "epoch": 0.9, + "learning_rate": 1.6431643638536252e-06, + "loss": 1.0684, + "step": 35032 + }, + { + "epoch": 0.9, + "learning_rate": 1.6431431755619109e-06, + "loss": 0.7749, + "step": 35033 + }, + { + "epoch": 0.9, + "learning_rate": 1.6431219867777712e-06, + "loss": 0.6562, + "step": 35034 + }, + { + "epoch": 0.9, + "learning_rate": 1.6431007975012225e-06, + "loss": 0.873, + "step": 35035 + }, + { + "epoch": 0.9, + "learning_rate": 1.6430796077322812e-06, + "loss": 0.6775, + "step": 35036 + }, + { + "epoch": 0.9, + "learning_rate": 1.6430584174709635e-06, + "loss": 0.8301, + "step": 35037 + }, + { + "epoch": 0.9, + "learning_rate": 1.6430372267172854e-06, + "loss": 0.6914, + "step": 35038 + }, + { + "epoch": 0.9, + "learning_rate": 1.6430160354712635e-06, + "loss": 0.5869, + "step": 35039 + }, + { + "epoch": 0.9, + "learning_rate": 1.6429948437329135e-06, + "loss": 0.6592, + "step": 35040 + }, + { + "epoch": 0.9, + "learning_rate": 1.642973651502252e-06, + "loss": 0.7432, + "step": 35041 + }, + { + "epoch": 0.9, + "learning_rate": 1.6429524587792952e-06, + "loss": 0.6467, + "step": 35042 + }, + { + "epoch": 0.9, + "learning_rate": 1.6429312655640596e-06, + "loss": 0.958, + "step": 35043 + }, + { + "epoch": 0.9, + "learning_rate": 1.6429100718565606e-06, + "loss": 0.3379, + "step": 35044 + }, + { + "epoch": 0.9, + "learning_rate": 1.642888877656815e-06, + "loss": 0.646, + "step": 35045 + }, + { + "epoch": 0.9, + "learning_rate": 1.642867682964839e-06, + "loss": 0.8315, + "step": 35046 + }, + { + "epoch": 0.9, + "learning_rate": 1.6428464877806488e-06, + "loss": 0.6299, + "step": 35047 + }, + { + "epoch": 0.9, + "learning_rate": 1.6428252921042605e-06, + "loss": 0.9131, + "step": 35048 + }, + { + "epoch": 0.9, + "learning_rate": 1.6428040959356905e-06, + "loss": 0.7612, + "step": 35049 + }, + { + "epoch": 0.9, + "learning_rate": 1.6427828992749548e-06, + "loss": 0.5732, + "step": 35050 + }, + { + "epoch": 0.9, + "learning_rate": 1.6427617021220701e-06, + "loss": 0.8301, + "step": 35051 + }, + { + "epoch": 0.9, + "learning_rate": 1.642740504477052e-06, + "loss": 1.0225, + "step": 35052 + }, + { + "epoch": 0.9, + "learning_rate": 1.6427193063399174e-06, + "loss": 0.8838, + "step": 35053 + }, + { + "epoch": 0.9, + "learning_rate": 1.642698107710682e-06, + "loss": 0.8428, + "step": 35054 + }, + { + "epoch": 0.9, + "learning_rate": 1.6426769085893622e-06, + "loss": 0.9756, + "step": 35055 + }, + { + "epoch": 0.9, + "learning_rate": 1.6426557089759742e-06, + "loss": 0.7627, + "step": 35056 + }, + { + "epoch": 0.9, + "learning_rate": 1.6426345088705343e-06, + "loss": 0.9775, + "step": 35057 + }, + { + "epoch": 0.9, + "learning_rate": 1.6426133082730588e-06, + "loss": 0.5925, + "step": 35058 + }, + { + "epoch": 0.9, + "learning_rate": 1.6425921071835637e-06, + "loss": 0.9707, + "step": 35059 + }, + { + "epoch": 0.9, + "learning_rate": 1.6425709056020657e-06, + "loss": 0.8047, + "step": 35060 + }, + { + "epoch": 0.9, + "learning_rate": 1.6425497035285805e-06, + "loss": 0.9521, + "step": 35061 + }, + { + "epoch": 0.9, + "learning_rate": 1.6425285009631243e-06, + "loss": 0.71, + "step": 35062 + }, + { + "epoch": 0.9, + "learning_rate": 1.642507297905714e-06, + "loss": 0.835, + "step": 35063 + }, + { + "epoch": 0.9, + "learning_rate": 1.6424860943563653e-06, + "loss": 0.6899, + "step": 35064 + }, + { + "epoch": 0.9, + "learning_rate": 1.6424648903150942e-06, + "loss": 0.875, + "step": 35065 + }, + { + "epoch": 0.9, + "learning_rate": 1.6424436857819174e-06, + "loss": 0.8311, + "step": 35066 + }, + { + "epoch": 0.9, + "learning_rate": 1.642422480756851e-06, + "loss": 0.9268, + "step": 35067 + }, + { + "epoch": 0.9, + "learning_rate": 1.6424012752399117e-06, + "loss": 0.7451, + "step": 35068 + }, + { + "epoch": 0.9, + "learning_rate": 1.6423800692311148e-06, + "loss": 0.6836, + "step": 35069 + }, + { + "epoch": 0.9, + "learning_rate": 1.642358862730477e-06, + "loss": 0.8379, + "step": 35070 + }, + { + "epoch": 0.9, + "learning_rate": 1.6423376557380148e-06, + "loss": 0.7139, + "step": 35071 + }, + { + "epoch": 0.9, + "learning_rate": 1.6423164482537438e-06, + "loss": 0.9766, + "step": 35072 + }, + { + "epoch": 0.9, + "learning_rate": 1.6422952402776811e-06, + "loss": 0.9619, + "step": 35073 + }, + { + "epoch": 0.9, + "learning_rate": 1.6422740318098423e-06, + "loss": 0.7158, + "step": 35074 + }, + { + "epoch": 0.9, + "learning_rate": 1.642252822850244e-06, + "loss": 0.875, + "step": 35075 + }, + { + "epoch": 0.9, + "learning_rate": 1.642231613398902e-06, + "loss": 0.7471, + "step": 35076 + }, + { + "epoch": 0.9, + "learning_rate": 1.6422104034558325e-06, + "loss": 0.9561, + "step": 35077 + }, + { + "epoch": 0.9, + "learning_rate": 1.6421891930210526e-06, + "loss": 0.834, + "step": 35078 + }, + { + "epoch": 0.9, + "learning_rate": 1.6421679820945778e-06, + "loss": 0.958, + "step": 35079 + }, + { + "epoch": 0.9, + "learning_rate": 1.6421467706764242e-06, + "loss": 0.9248, + "step": 35080 + }, + { + "epoch": 0.9, + "learning_rate": 1.6421255587666085e-06, + "loss": 0.8599, + "step": 35081 + }, + { + "epoch": 0.9, + "learning_rate": 1.642104346365147e-06, + "loss": 0.8594, + "step": 35082 + }, + { + "epoch": 0.9, + "learning_rate": 1.6420831334720555e-06, + "loss": 0.8574, + "step": 35083 + }, + { + "epoch": 0.9, + "learning_rate": 1.6420619200873508e-06, + "loss": 1.0703, + "step": 35084 + }, + { + "epoch": 0.9, + "learning_rate": 1.6420407062110484e-06, + "loss": 0.5884, + "step": 35085 + }, + { + "epoch": 0.9, + "learning_rate": 1.6420194918431652e-06, + "loss": 0.7832, + "step": 35086 + }, + { + "epoch": 0.9, + "learning_rate": 1.6419982769837168e-06, + "loss": 0.877, + "step": 35087 + }, + { + "epoch": 0.9, + "learning_rate": 1.6419770616327205e-06, + "loss": 0.4651, + "step": 35088 + }, + { + "epoch": 0.9, + "learning_rate": 1.6419558457901915e-06, + "loss": 0.7671, + "step": 35089 + }, + { + "epoch": 0.9, + "learning_rate": 1.6419346294561463e-06, + "loss": 0.5342, + "step": 35090 + }, + { + "epoch": 0.9, + "learning_rate": 1.6419134126306013e-06, + "loss": 0.7769, + "step": 35091 + }, + { + "epoch": 0.9, + "learning_rate": 1.641892195313573e-06, + "loss": 0.48, + "step": 35092 + }, + { + "epoch": 0.9, + "learning_rate": 1.6418709775050772e-06, + "loss": 0.8687, + "step": 35093 + }, + { + "epoch": 0.9, + "learning_rate": 1.6418497592051303e-06, + "loss": 0.8564, + "step": 35094 + }, + { + "epoch": 0.9, + "learning_rate": 1.6418285404137486e-06, + "loss": 0.9385, + "step": 35095 + }, + { + "epoch": 0.9, + "learning_rate": 1.641807321130948e-06, + "loss": 1.0312, + "step": 35096 + }, + { + "epoch": 0.9, + "learning_rate": 1.6417861013567453e-06, + "loss": 0.7178, + "step": 35097 + }, + { + "epoch": 0.9, + "learning_rate": 1.6417648810911567e-06, + "loss": 0.8867, + "step": 35098 + }, + { + "epoch": 0.9, + "learning_rate": 1.6417436603341978e-06, + "loss": 0.7117, + "step": 35099 + }, + { + "epoch": 0.9, + "learning_rate": 1.6417224390858854e-06, + "loss": 0.626, + "step": 35100 + }, + { + "epoch": 0.9, + "learning_rate": 1.641701217346236e-06, + "loss": 0.7852, + "step": 35101 + }, + { + "epoch": 0.9, + "learning_rate": 1.6416799951152651e-06, + "loss": 0.6909, + "step": 35102 + }, + { + "epoch": 0.9, + "learning_rate": 1.6416587723929894e-06, + "loss": 0.8916, + "step": 35103 + }, + { + "epoch": 0.9, + "learning_rate": 1.6416375491794253e-06, + "loss": 0.8369, + "step": 35104 + }, + { + "epoch": 0.9, + "learning_rate": 1.6416163254745887e-06, + "loss": 0.7222, + "step": 35105 + }, + { + "epoch": 0.9, + "learning_rate": 1.641595101278496e-06, + "loss": 1.0264, + "step": 35106 + }, + { + "epoch": 0.9, + "learning_rate": 1.6415738765911633e-06, + "loss": 0.8701, + "step": 35107 + }, + { + "epoch": 0.9, + "learning_rate": 1.6415526514126073e-06, + "loss": 0.9453, + "step": 35108 + }, + { + "epoch": 0.9, + "learning_rate": 1.6415314257428437e-06, + "loss": 1.0361, + "step": 35109 + }, + { + "epoch": 0.9, + "learning_rate": 1.6415101995818889e-06, + "loss": 0.8223, + "step": 35110 + }, + { + "epoch": 0.9, + "learning_rate": 1.6414889729297594e-06, + "loss": 0.8555, + "step": 35111 + }, + { + "epoch": 0.9, + "learning_rate": 1.6414677457864712e-06, + "loss": 1.0156, + "step": 35112 + }, + { + "epoch": 0.9, + "learning_rate": 1.641446518152041e-06, + "loss": 1.0029, + "step": 35113 + }, + { + "epoch": 0.9, + "learning_rate": 1.641425290026484e-06, + "loss": 0.8262, + "step": 35114 + }, + { + "epoch": 0.9, + "learning_rate": 1.6414040614098177e-06, + "loss": 0.8252, + "step": 35115 + }, + { + "epoch": 0.9, + "learning_rate": 1.6413828323020575e-06, + "loss": 0.7471, + "step": 35116 + }, + { + "epoch": 0.9, + "learning_rate": 1.64136160270322e-06, + "loss": 0.8896, + "step": 35117 + }, + { + "epoch": 0.9, + "learning_rate": 1.6413403726133215e-06, + "loss": 1.083, + "step": 35118 + }, + { + "epoch": 0.9, + "learning_rate": 1.6413191420323783e-06, + "loss": 0.8398, + "step": 35119 + }, + { + "epoch": 0.9, + "learning_rate": 1.6412979109604063e-06, + "loss": 0.7324, + "step": 35120 + }, + { + "epoch": 0.9, + "learning_rate": 1.6412766793974222e-06, + "loss": 0.958, + "step": 35121 + }, + { + "epoch": 0.9, + "learning_rate": 1.6412554473434417e-06, + "loss": 0.9941, + "step": 35122 + }, + { + "epoch": 0.9, + "learning_rate": 1.6412342147984817e-06, + "loss": 0.9204, + "step": 35123 + }, + { + "epoch": 0.9, + "learning_rate": 1.641212981762558e-06, + "loss": 0.8154, + "step": 35124 + }, + { + "epoch": 0.9, + "learning_rate": 1.641191748235687e-06, + "loss": 0.6792, + "step": 35125 + }, + { + "epoch": 0.9, + "learning_rate": 1.6411705142178849e-06, + "loss": 1.0547, + "step": 35126 + }, + { + "epoch": 0.9, + "learning_rate": 1.6411492797091682e-06, + "loss": 0.7646, + "step": 35127 + }, + { + "epoch": 0.9, + "learning_rate": 1.641128044709553e-06, + "loss": 0.8301, + "step": 35128 + }, + { + "epoch": 0.9, + "learning_rate": 1.6411068092190555e-06, + "loss": 1.1201, + "step": 35129 + }, + { + "epoch": 0.9, + "learning_rate": 1.6410855732376918e-06, + "loss": 1.1445, + "step": 35130 + }, + { + "epoch": 0.9, + "learning_rate": 1.6410643367654781e-06, + "loss": 0.8301, + "step": 35131 + }, + { + "epoch": 0.9, + "learning_rate": 1.6410430998024314e-06, + "loss": 0.8975, + "step": 35132 + }, + { + "epoch": 0.9, + "learning_rate": 1.6410218623485673e-06, + "loss": 0.7217, + "step": 35133 + }, + { + "epoch": 0.9, + "learning_rate": 1.6410006244039026e-06, + "loss": 0.7178, + "step": 35134 + }, + { + "epoch": 0.9, + "learning_rate": 1.640979385968453e-06, + "loss": 0.9736, + "step": 35135 + }, + { + "epoch": 0.9, + "learning_rate": 1.6409581470422347e-06, + "loss": 0.9141, + "step": 35136 + }, + { + "epoch": 0.9, + "learning_rate": 1.6409369076252642e-06, + "loss": 0.9121, + "step": 35137 + }, + { + "epoch": 0.9, + "learning_rate": 1.6409156677175583e-06, + "loss": 0.7339, + "step": 35138 + }, + { + "epoch": 0.9, + "learning_rate": 1.6408944273191322e-06, + "loss": 0.875, + "step": 35139 + }, + { + "epoch": 0.9, + "learning_rate": 1.640873186430003e-06, + "loss": 0.9023, + "step": 35140 + }, + { + "epoch": 0.9, + "learning_rate": 1.6408519450501866e-06, + "loss": 0.7695, + "step": 35141 + }, + { + "epoch": 0.9, + "learning_rate": 1.640830703179699e-06, + "loss": 1.082, + "step": 35142 + }, + { + "epoch": 0.9, + "learning_rate": 1.6408094608185572e-06, + "loss": 0.5334, + "step": 35143 + }, + { + "epoch": 0.9, + "learning_rate": 1.6407882179667769e-06, + "loss": 0.8467, + "step": 35144 + }, + { + "epoch": 0.9, + "learning_rate": 1.6407669746243745e-06, + "loss": 0.8125, + "step": 35145 + }, + { + "epoch": 0.9, + "learning_rate": 1.6407457307913663e-06, + "loss": 0.9092, + "step": 35146 + }, + { + "epoch": 0.9, + "learning_rate": 1.6407244864677688e-06, + "loss": 0.8594, + "step": 35147 + }, + { + "epoch": 0.9, + "learning_rate": 1.6407032416535978e-06, + "loss": 0.9941, + "step": 35148 + }, + { + "epoch": 0.9, + "learning_rate": 1.64068199634887e-06, + "loss": 0.877, + "step": 35149 + }, + { + "epoch": 0.9, + "learning_rate": 1.6406607505536012e-06, + "loss": 0.7666, + "step": 35150 + }, + { + "epoch": 0.9, + "learning_rate": 1.640639504267808e-06, + "loss": 0.9551, + "step": 35151 + }, + { + "epoch": 0.9, + "learning_rate": 1.6406182574915066e-06, + "loss": 0.8115, + "step": 35152 + }, + { + "epoch": 0.9, + "learning_rate": 1.6405970102247134e-06, + "loss": 0.8945, + "step": 35153 + }, + { + "epoch": 0.9, + "learning_rate": 1.6405757624674444e-06, + "loss": 0.9175, + "step": 35154 + }, + { + "epoch": 0.9, + "learning_rate": 1.6405545142197159e-06, + "loss": 0.9521, + "step": 35155 + }, + { + "epoch": 0.9, + "learning_rate": 1.6405332654815442e-06, + "loss": 0.7378, + "step": 35156 + }, + { + "epoch": 0.9, + "learning_rate": 1.6405120162529458e-06, + "loss": 0.9805, + "step": 35157 + }, + { + "epoch": 0.9, + "learning_rate": 1.640490766533937e-06, + "loss": 0.8486, + "step": 35158 + }, + { + "epoch": 0.9, + "learning_rate": 1.6404695163245334e-06, + "loss": 0.9004, + "step": 35159 + }, + { + "epoch": 0.9, + "learning_rate": 1.640448265624752e-06, + "loss": 0.874, + "step": 35160 + }, + { + "epoch": 0.9, + "learning_rate": 1.640427014434609e-06, + "loss": 0.9014, + "step": 35161 + }, + { + "epoch": 0.9, + "learning_rate": 1.6404057627541201e-06, + "loss": 1.0771, + "step": 35162 + }, + { + "epoch": 0.9, + "learning_rate": 1.6403845105833024e-06, + "loss": 0.8486, + "step": 35163 + }, + { + "epoch": 0.9, + "learning_rate": 1.6403632579221713e-06, + "loss": 0.9482, + "step": 35164 + }, + { + "epoch": 0.9, + "learning_rate": 1.6403420047707438e-06, + "loss": 0.8516, + "step": 35165 + }, + { + "epoch": 0.9, + "learning_rate": 1.6403207511290353e-06, + "loss": 0.835, + "step": 35166 + }, + { + "epoch": 0.9, + "learning_rate": 1.640299496997063e-06, + "loss": 0.6279, + "step": 35167 + }, + { + "epoch": 0.9, + "learning_rate": 1.640278242374843e-06, + "loss": 0.9033, + "step": 35168 + }, + { + "epoch": 0.9, + "learning_rate": 1.6402569872623912e-06, + "loss": 0.9727, + "step": 35169 + }, + { + "epoch": 0.9, + "learning_rate": 1.6402357316597244e-06, + "loss": 0.7549, + "step": 35170 + }, + { + "epoch": 0.9, + "learning_rate": 1.640214475566858e-06, + "loss": 0.7939, + "step": 35171 + }, + { + "epoch": 0.9, + "learning_rate": 1.6401932189838092e-06, + "loss": 0.6001, + "step": 35172 + }, + { + "epoch": 0.9, + "learning_rate": 1.640171961910594e-06, + "loss": 0.8008, + "step": 35173 + }, + { + "epoch": 0.9, + "learning_rate": 1.6401507043472283e-06, + "loss": 1.0166, + "step": 35174 + }, + { + "epoch": 0.9, + "learning_rate": 1.6401294462937284e-06, + "loss": 0.9346, + "step": 35175 + }, + { + "epoch": 0.9, + "learning_rate": 1.6401081877501113e-06, + "loss": 0.8838, + "step": 35176 + }, + { + "epoch": 0.9, + "learning_rate": 1.6400869287163925e-06, + "loss": 0.9092, + "step": 35177 + }, + { + "epoch": 0.9, + "learning_rate": 1.6400656691925889e-06, + "loss": 0.7393, + "step": 35178 + }, + { + "epoch": 0.9, + "learning_rate": 1.6400444091787161e-06, + "loss": 1.2139, + "step": 35179 + }, + { + "epoch": 0.9, + "learning_rate": 1.6400231486747908e-06, + "loss": 0.7891, + "step": 35180 + }, + { + "epoch": 0.9, + "learning_rate": 1.6400018876808296e-06, + "loss": 0.7551, + "step": 35181 + }, + { + "epoch": 0.9, + "learning_rate": 1.6399806261968477e-06, + "loss": 1.0254, + "step": 35182 + }, + { + "epoch": 0.9, + "learning_rate": 1.6399593642228626e-06, + "loss": 0.958, + "step": 35183 + }, + { + "epoch": 0.9, + "learning_rate": 1.6399381017588896e-06, + "loss": 0.8828, + "step": 35184 + }, + { + "epoch": 0.9, + "learning_rate": 1.6399168388049458e-06, + "loss": 0.9053, + "step": 35185 + }, + { + "epoch": 0.9, + "learning_rate": 1.6398955753610468e-06, + "loss": 0.7695, + "step": 35186 + }, + { + "epoch": 0.9, + "learning_rate": 1.6398743114272096e-06, + "loss": 0.6487, + "step": 35187 + }, + { + "epoch": 0.9, + "learning_rate": 1.6398530470034495e-06, + "loss": 0.8638, + "step": 35188 + }, + { + "epoch": 0.9, + "learning_rate": 1.6398317820897838e-06, + "loss": 0.7881, + "step": 35189 + }, + { + "epoch": 0.9, + "learning_rate": 1.6398105166862282e-06, + "loss": 0.6929, + "step": 35190 + }, + { + "epoch": 0.9, + "learning_rate": 1.6397892507927988e-06, + "loss": 0.9883, + "step": 35191 + }, + { + "epoch": 0.9, + "learning_rate": 1.6397679844095125e-06, + "loss": 0.8896, + "step": 35192 + }, + { + "epoch": 0.9, + "learning_rate": 1.6397467175363854e-06, + "loss": 0.7725, + "step": 35193 + }, + { + "epoch": 0.9, + "learning_rate": 1.6397254501734335e-06, + "loss": 0.7021, + "step": 35194 + }, + { + "epoch": 0.9, + "learning_rate": 1.6397041823206732e-06, + "loss": 0.8457, + "step": 35195 + }, + { + "epoch": 0.9, + "learning_rate": 1.6396829139781207e-06, + "loss": 0.958, + "step": 35196 + }, + { + "epoch": 0.9, + "learning_rate": 1.6396616451457926e-06, + "loss": 0.6938, + "step": 35197 + }, + { + "epoch": 0.9, + "learning_rate": 1.639640375823705e-06, + "loss": 0.9014, + "step": 35198 + }, + { + "epoch": 0.9, + "learning_rate": 1.6396191060118743e-06, + "loss": 0.9434, + "step": 35199 + }, + { + "epoch": 0.9, + "learning_rate": 1.6395978357103163e-06, + "loss": 0.8936, + "step": 35200 + }, + { + "epoch": 0.9, + "learning_rate": 1.6395765649190477e-06, + "loss": 0.6826, + "step": 35201 + }, + { + "epoch": 0.9, + "learning_rate": 1.639555293638085e-06, + "loss": 0.8564, + "step": 35202 + }, + { + "epoch": 0.9, + "learning_rate": 1.639534021867444e-06, + "loss": 0.6855, + "step": 35203 + }, + { + "epoch": 0.9, + "learning_rate": 1.6395127496071415e-06, + "loss": 0.8877, + "step": 35204 + }, + { + "epoch": 0.9, + "learning_rate": 1.6394914768571932e-06, + "loss": 0.7603, + "step": 35205 + }, + { + "epoch": 0.9, + "learning_rate": 1.6394702036176157e-06, + "loss": 1.0459, + "step": 35206 + }, + { + "epoch": 0.9, + "learning_rate": 1.6394489298884254e-06, + "loss": 0.7656, + "step": 35207 + }, + { + "epoch": 0.9, + "learning_rate": 1.6394276556696384e-06, + "loss": 0.8232, + "step": 35208 + }, + { + "epoch": 0.9, + "learning_rate": 1.639406380961271e-06, + "loss": 0.8125, + "step": 35209 + }, + { + "epoch": 0.9, + "learning_rate": 1.6393851057633397e-06, + "loss": 0.9463, + "step": 35210 + }, + { + "epoch": 0.9, + "learning_rate": 1.6393638300758603e-06, + "loss": 0.7568, + "step": 35211 + }, + { + "epoch": 0.9, + "learning_rate": 1.6393425538988498e-06, + "loss": 0.6707, + "step": 35212 + }, + { + "epoch": 0.9, + "learning_rate": 1.639321277232324e-06, + "loss": 0.8809, + "step": 35213 + }, + { + "epoch": 0.9, + "learning_rate": 1.639300000076299e-06, + "loss": 0.6279, + "step": 35214 + }, + { + "epoch": 0.9, + "learning_rate": 1.6392787224307917e-06, + "loss": 0.9902, + "step": 35215 + }, + { + "epoch": 0.9, + "learning_rate": 1.6392574442958177e-06, + "loss": 0.814, + "step": 35216 + }, + { + "epoch": 0.9, + "learning_rate": 1.639236165671394e-06, + "loss": 1.0566, + "step": 35217 + }, + { + "epoch": 0.9, + "learning_rate": 1.6392148865575367e-06, + "loss": 0.9414, + "step": 35218 + }, + { + "epoch": 0.9, + "learning_rate": 1.6391936069542616e-06, + "loss": 0.8169, + "step": 35219 + }, + { + "epoch": 0.9, + "learning_rate": 1.6391723268615855e-06, + "loss": 0.8765, + "step": 35220 + }, + { + "epoch": 0.9, + "learning_rate": 1.6391510462795247e-06, + "loss": 0.8145, + "step": 35221 + }, + { + "epoch": 0.9, + "learning_rate": 1.639129765208095e-06, + "loss": 0.9492, + "step": 35222 + }, + { + "epoch": 0.9, + "learning_rate": 1.6391084836473132e-06, + "loss": 0.917, + "step": 35223 + }, + { + "epoch": 0.9, + "learning_rate": 1.6390872015971955e-06, + "loss": 0.9219, + "step": 35224 + }, + { + "epoch": 0.9, + "learning_rate": 1.6390659190577577e-06, + "loss": 0.6758, + "step": 35225 + }, + { + "epoch": 0.9, + "learning_rate": 1.639044636029017e-06, + "loss": 0.8525, + "step": 35226 + }, + { + "epoch": 0.9, + "learning_rate": 1.639023352510989e-06, + "loss": 0.6753, + "step": 35227 + }, + { + "epoch": 0.9, + "learning_rate": 1.6390020685036905e-06, + "loss": 0.834, + "step": 35228 + }, + { + "epoch": 0.9, + "learning_rate": 1.6389807840071372e-06, + "loss": 0.8604, + "step": 35229 + }, + { + "epoch": 0.9, + "learning_rate": 1.6389594990213457e-06, + "loss": 0.8936, + "step": 35230 + }, + { + "epoch": 0.9, + "learning_rate": 1.6389382135463323e-06, + "loss": 0.8555, + "step": 35231 + }, + { + "epoch": 0.9, + "learning_rate": 1.6389169275821132e-06, + "loss": 0.9258, + "step": 35232 + }, + { + "epoch": 0.9, + "learning_rate": 1.638895641128705e-06, + "loss": 0.667, + "step": 35233 + }, + { + "epoch": 0.9, + "learning_rate": 1.6388743541861239e-06, + "loss": 0.8975, + "step": 35234 + }, + { + "epoch": 0.9, + "learning_rate": 1.6388530667543856e-06, + "loss": 0.9277, + "step": 35235 + }, + { + "epoch": 0.9, + "learning_rate": 1.638831778833507e-06, + "loss": 0.9922, + "step": 35236 + }, + { + "epoch": 0.9, + "learning_rate": 1.6388104904235046e-06, + "loss": 0.7549, + "step": 35237 + }, + { + "epoch": 0.9, + "learning_rate": 1.6387892015243945e-06, + "loss": 0.7266, + "step": 35238 + }, + { + "epoch": 0.9, + "learning_rate": 1.6387679121361925e-06, + "loss": 0.8374, + "step": 35239 + }, + { + "epoch": 0.9, + "learning_rate": 1.6387466222589153e-06, + "loss": 0.8779, + "step": 35240 + }, + { + "epoch": 0.9, + "learning_rate": 1.6387253318925791e-06, + "loss": 0.793, + "step": 35241 + }, + { + "epoch": 0.9, + "learning_rate": 1.6387040410372007e-06, + "loss": 1.0479, + "step": 35242 + }, + { + "epoch": 0.9, + "learning_rate": 1.6386827496927957e-06, + "loss": 1.1123, + "step": 35243 + }, + { + "epoch": 0.9, + "learning_rate": 1.6386614578593807e-06, + "loss": 0.8643, + "step": 35244 + }, + { + "epoch": 0.9, + "learning_rate": 1.638640165536972e-06, + "loss": 0.6284, + "step": 35245 + }, + { + "epoch": 0.9, + "learning_rate": 1.638618872725586e-06, + "loss": 0.9121, + "step": 35246 + }, + { + "epoch": 0.9, + "learning_rate": 1.6385975794252388e-06, + "loss": 1.0576, + "step": 35247 + }, + { + "epoch": 0.9, + "learning_rate": 1.6385762856359467e-06, + "loss": 0.6167, + "step": 35248 + }, + { + "epoch": 0.9, + "learning_rate": 1.6385549913577261e-06, + "loss": 0.7773, + "step": 35249 + }, + { + "epoch": 0.9, + "learning_rate": 1.6385336965905934e-06, + "loss": 0.7881, + "step": 35250 + }, + { + "epoch": 0.9, + "learning_rate": 1.6385124013345647e-06, + "loss": 0.8721, + "step": 35251 + }, + { + "epoch": 0.9, + "learning_rate": 1.6384911055896566e-06, + "loss": 0.958, + "step": 35252 + }, + { + "epoch": 0.9, + "learning_rate": 1.638469809355885e-06, + "loss": 0.8545, + "step": 35253 + }, + { + "epoch": 0.9, + "learning_rate": 1.6384485126332667e-06, + "loss": 0.9082, + "step": 35254 + }, + { + "epoch": 0.9, + "learning_rate": 1.6384272154218177e-06, + "loss": 0.5962, + "step": 35255 + }, + { + "epoch": 0.9, + "learning_rate": 1.6384059177215544e-06, + "loss": 0.7417, + "step": 35256 + }, + { + "epoch": 0.9, + "learning_rate": 1.6383846195324926e-06, + "loss": 0.7163, + "step": 35257 + }, + { + "epoch": 0.9, + "learning_rate": 1.6383633208546495e-06, + "loss": 0.783, + "step": 35258 + }, + { + "epoch": 0.9, + "learning_rate": 1.6383420216880408e-06, + "loss": 0.8193, + "step": 35259 + }, + { + "epoch": 0.9, + "learning_rate": 1.6383207220326826e-06, + "loss": 0.7417, + "step": 35260 + }, + { + "epoch": 0.9, + "learning_rate": 1.638299421888592e-06, + "loss": 1.0186, + "step": 35261 + }, + { + "epoch": 0.9, + "learning_rate": 1.6382781212557849e-06, + "loss": 0.4438, + "step": 35262 + }, + { + "epoch": 0.9, + "learning_rate": 1.6382568201342775e-06, + "loss": 0.916, + "step": 35263 + }, + { + "epoch": 0.9, + "learning_rate": 1.638235518524086e-06, + "loss": 1.0137, + "step": 35264 + }, + { + "epoch": 0.9, + "learning_rate": 1.6382142164252272e-06, + "loss": 0.9717, + "step": 35265 + }, + { + "epoch": 0.9, + "learning_rate": 1.6381929138377171e-06, + "loss": 0.915, + "step": 35266 + }, + { + "epoch": 0.9, + "learning_rate": 1.638171610761572e-06, + "loss": 0.8047, + "step": 35267 + }, + { + "epoch": 0.9, + "learning_rate": 1.6381503071968084e-06, + "loss": 0.6865, + "step": 35268 + }, + { + "epoch": 0.9, + "learning_rate": 1.638129003143442e-06, + "loss": 0.8506, + "step": 35269 + }, + { + "epoch": 0.9, + "learning_rate": 1.63810769860149e-06, + "loss": 0.8213, + "step": 35270 + }, + { + "epoch": 0.9, + "learning_rate": 1.6380863935709679e-06, + "loss": 0.7297, + "step": 35271 + }, + { + "epoch": 0.9, + "learning_rate": 1.6380650880518924e-06, + "loss": 0.9199, + "step": 35272 + }, + { + "epoch": 0.9, + "learning_rate": 1.6380437820442804e-06, + "loss": 0.8174, + "step": 35273 + }, + { + "epoch": 0.9, + "learning_rate": 1.638022475548147e-06, + "loss": 0.6479, + "step": 35274 + }, + { + "epoch": 0.9, + "learning_rate": 1.6380011685635092e-06, + "loss": 0.8662, + "step": 35275 + }, + { + "epoch": 0.9, + "learning_rate": 1.6379798610903834e-06, + "loss": 0.6294, + "step": 35276 + }, + { + "epoch": 0.9, + "learning_rate": 1.6379585531287856e-06, + "loss": 0.8584, + "step": 35277 + }, + { + "epoch": 0.9, + "learning_rate": 1.6379372446787328e-06, + "loss": 0.9453, + "step": 35278 + }, + { + "epoch": 0.9, + "learning_rate": 1.6379159357402402e-06, + "loss": 0.6133, + "step": 35279 + }, + { + "epoch": 0.9, + "learning_rate": 1.637894626313325e-06, + "loss": 0.5513, + "step": 35280 + }, + { + "epoch": 0.9, + "learning_rate": 1.6378733163980028e-06, + "loss": 0.8242, + "step": 35281 + }, + { + "epoch": 0.9, + "learning_rate": 1.6378520059942906e-06, + "loss": 1.0186, + "step": 35282 + }, + { + "epoch": 0.9, + "learning_rate": 1.6378306951022048e-06, + "loss": 0.8779, + "step": 35283 + }, + { + "epoch": 0.9, + "learning_rate": 1.6378093837217609e-06, + "loss": 0.7441, + "step": 35284 + }, + { + "epoch": 0.9, + "learning_rate": 1.6377880718529758e-06, + "loss": 0.8027, + "step": 35285 + }, + { + "epoch": 0.9, + "learning_rate": 1.6377667594958658e-06, + "loss": 0.9824, + "step": 35286 + }, + { + "epoch": 0.9, + "learning_rate": 1.6377454466504469e-06, + "loss": 0.793, + "step": 35287 + }, + { + "epoch": 0.9, + "learning_rate": 1.6377241333167357e-06, + "loss": 0.7422, + "step": 35288 + }, + { + "epoch": 0.9, + "learning_rate": 1.6377028194947487e-06, + "loss": 0.9531, + "step": 35289 + }, + { + "epoch": 0.9, + "learning_rate": 1.6376815051845017e-06, + "loss": 0.8882, + "step": 35290 + }, + { + "epoch": 0.9, + "learning_rate": 1.6376601903860111e-06, + "loss": 0.8818, + "step": 35291 + }, + { + "epoch": 0.9, + "learning_rate": 1.6376388750992937e-06, + "loss": 0.8701, + "step": 35292 + }, + { + "epoch": 0.9, + "learning_rate": 1.637617559324366e-06, + "loss": 0.7676, + "step": 35293 + }, + { + "epoch": 0.9, + "learning_rate": 1.6375962430612433e-06, + "loss": 0.8018, + "step": 35294 + }, + { + "epoch": 0.9, + "learning_rate": 1.6375749263099424e-06, + "loss": 0.9248, + "step": 35295 + }, + { + "epoch": 0.9, + "learning_rate": 1.6375536090704799e-06, + "loss": 0.718, + "step": 35296 + }, + { + "epoch": 0.9, + "learning_rate": 1.6375322913428719e-06, + "loss": 0.9902, + "step": 35297 + }, + { + "epoch": 0.9, + "learning_rate": 1.6375109731271347e-06, + "loss": 0.8145, + "step": 35298 + }, + { + "epoch": 0.9, + "learning_rate": 1.6374896544232848e-06, + "loss": 1.0283, + "step": 35299 + }, + { + "epoch": 0.9, + "learning_rate": 1.637468335231338e-06, + "loss": 0.832, + "step": 35300 + }, + { + "epoch": 0.9, + "learning_rate": 1.6374470155513115e-06, + "loss": 0.9473, + "step": 35301 + }, + { + "epoch": 0.9, + "learning_rate": 1.637425695383221e-06, + "loss": 0.8516, + "step": 35302 + }, + { + "epoch": 0.9, + "learning_rate": 1.6374043747270827e-06, + "loss": 0.6699, + "step": 35303 + }, + { + "epoch": 0.9, + "learning_rate": 1.6373830535829135e-06, + "loss": 0.9316, + "step": 35304 + }, + { + "epoch": 0.9, + "learning_rate": 1.6373617319507288e-06, + "loss": 0.7463, + "step": 35305 + }, + { + "epoch": 0.9, + "learning_rate": 1.637340409830546e-06, + "loss": 0.6592, + "step": 35306 + }, + { + "epoch": 0.9, + "learning_rate": 1.637319087222381e-06, + "loss": 0.6699, + "step": 35307 + }, + { + "epoch": 0.9, + "learning_rate": 1.63729776412625e-06, + "loss": 0.8047, + "step": 35308 + }, + { + "epoch": 0.9, + "learning_rate": 1.6372764405421695e-06, + "loss": 0.5991, + "step": 35309 + }, + { + "epoch": 0.91, + "learning_rate": 1.6372551164701556e-06, + "loss": 0.8096, + "step": 35310 + }, + { + "epoch": 0.91, + "learning_rate": 1.6372337919102246e-06, + "loss": 0.6616, + "step": 35311 + }, + { + "epoch": 0.91, + "learning_rate": 1.6372124668623936e-06, + "loss": 0.7334, + "step": 35312 + }, + { + "epoch": 0.91, + "learning_rate": 1.6371911413266777e-06, + "loss": 1.0059, + "step": 35313 + }, + { + "epoch": 0.91, + "learning_rate": 1.6371698153030939e-06, + "loss": 1.0371, + "step": 35314 + }, + { + "epoch": 0.91, + "learning_rate": 1.6371484887916587e-06, + "loss": 0.8262, + "step": 35315 + }, + { + "epoch": 0.91, + "learning_rate": 1.637127161792388e-06, + "loss": 0.7812, + "step": 35316 + }, + { + "epoch": 0.91, + "learning_rate": 1.6371058343052986e-06, + "loss": 0.5088, + "step": 35317 + }, + { + "epoch": 0.91, + "learning_rate": 1.6370845063304065e-06, + "loss": 0.7944, + "step": 35318 + }, + { + "epoch": 0.91, + "learning_rate": 1.637063177867728e-06, + "loss": 0.7275, + "step": 35319 + }, + { + "epoch": 0.91, + "learning_rate": 1.6370418489172794e-06, + "loss": 0.6138, + "step": 35320 + }, + { + "epoch": 0.91, + "learning_rate": 1.6370205194790771e-06, + "loss": 0.9619, + "step": 35321 + }, + { + "epoch": 0.91, + "learning_rate": 1.6369991895531378e-06, + "loss": 0.9199, + "step": 35322 + }, + { + "epoch": 0.91, + "learning_rate": 1.636977859139477e-06, + "loss": 0.6738, + "step": 35323 + }, + { + "epoch": 0.91, + "learning_rate": 1.636956528238112e-06, + "loss": 1.0508, + "step": 35324 + }, + { + "epoch": 0.91, + "learning_rate": 1.6369351968490586e-06, + "loss": 0.8779, + "step": 35325 + }, + { + "epoch": 0.91, + "learning_rate": 1.636913864972333e-06, + "loss": 0.7002, + "step": 35326 + }, + { + "epoch": 0.91, + "learning_rate": 1.6368925326079521e-06, + "loss": 0.8887, + "step": 35327 + }, + { + "epoch": 0.91, + "learning_rate": 1.6368711997559318e-06, + "loss": 0.9912, + "step": 35328 + }, + { + "epoch": 0.91, + "learning_rate": 1.636849866416288e-06, + "loss": 0.8052, + "step": 35329 + }, + { + "epoch": 0.91, + "learning_rate": 1.636828532589038e-06, + "loss": 0.7588, + "step": 35330 + }, + { + "epoch": 0.91, + "learning_rate": 1.6368071982741975e-06, + "loss": 1.1348, + "step": 35331 + }, + { + "epoch": 0.91, + "learning_rate": 1.6367858634717834e-06, + "loss": 0.9883, + "step": 35332 + }, + { + "epoch": 0.91, + "learning_rate": 1.6367645281818114e-06, + "loss": 0.9189, + "step": 35333 + }, + { + "epoch": 0.91, + "learning_rate": 1.6367431924042978e-06, + "loss": 0.8887, + "step": 35334 + }, + { + "epoch": 0.91, + "learning_rate": 1.6367218561392594e-06, + "loss": 1.041, + "step": 35335 + }, + { + "epoch": 0.91, + "learning_rate": 1.6367005193867125e-06, + "loss": 0.75, + "step": 35336 + }, + { + "epoch": 0.91, + "learning_rate": 1.6366791821466733e-06, + "loss": 0.5796, + "step": 35337 + }, + { + "epoch": 0.91, + "learning_rate": 1.6366578444191582e-06, + "loss": 0.9961, + "step": 35338 + }, + { + "epoch": 0.91, + "learning_rate": 1.6366365062041832e-06, + "loss": 0.7666, + "step": 35339 + }, + { + "epoch": 0.91, + "learning_rate": 1.6366151675017647e-06, + "loss": 0.832, + "step": 35340 + }, + { + "epoch": 0.91, + "learning_rate": 1.6365938283119194e-06, + "loss": 0.9805, + "step": 35341 + }, + { + "epoch": 0.91, + "learning_rate": 1.6365724886346639e-06, + "loss": 0.6187, + "step": 35342 + }, + { + "epoch": 0.91, + "learning_rate": 1.6365511484700137e-06, + "loss": 0.7124, + "step": 35343 + }, + { + "epoch": 0.91, + "learning_rate": 1.6365298078179856e-06, + "loss": 0.7773, + "step": 35344 + }, + { + "epoch": 0.91, + "learning_rate": 1.6365084666785957e-06, + "loss": 0.9512, + "step": 35345 + }, + { + "epoch": 0.91, + "learning_rate": 1.636487125051861e-06, + "loss": 1.0723, + "step": 35346 + }, + { + "epoch": 0.91, + "learning_rate": 1.6364657829377973e-06, + "loss": 0.752, + "step": 35347 + }, + { + "epoch": 0.91, + "learning_rate": 1.636444440336421e-06, + "loss": 0.8281, + "step": 35348 + }, + { + "epoch": 0.91, + "learning_rate": 1.6364230972477482e-06, + "loss": 1.0254, + "step": 35349 + }, + { + "epoch": 0.91, + "learning_rate": 1.6364017536717954e-06, + "loss": 0.6978, + "step": 35350 + }, + { + "epoch": 0.91, + "learning_rate": 1.6363804096085793e-06, + "loss": 0.9697, + "step": 35351 + }, + { + "epoch": 0.91, + "learning_rate": 1.6363590650581162e-06, + "loss": 0.8291, + "step": 35352 + }, + { + "epoch": 0.91, + "learning_rate": 1.6363377200204221e-06, + "loss": 0.8062, + "step": 35353 + }, + { + "epoch": 0.91, + "learning_rate": 1.636316374495513e-06, + "loss": 0.9414, + "step": 35354 + }, + { + "epoch": 0.91, + "learning_rate": 1.636295028483406e-06, + "loss": 0.9502, + "step": 35355 + }, + { + "epoch": 0.91, + "learning_rate": 1.6362736819841172e-06, + "loss": 1.2451, + "step": 35356 + }, + { + "epoch": 0.91, + "learning_rate": 1.6362523349976631e-06, + "loss": 0.8867, + "step": 35357 + }, + { + "epoch": 0.91, + "learning_rate": 1.6362309875240597e-06, + "loss": 0.7905, + "step": 35358 + }, + { + "epoch": 0.91, + "learning_rate": 1.6362096395633233e-06, + "loss": 0.7852, + "step": 35359 + }, + { + "epoch": 0.91, + "learning_rate": 1.6361882911154706e-06, + "loss": 0.8164, + "step": 35360 + }, + { + "epoch": 0.91, + "learning_rate": 1.6361669421805178e-06, + "loss": 0.8916, + "step": 35361 + }, + { + "epoch": 0.91, + "learning_rate": 1.6361455927584813e-06, + "loss": 0.9141, + "step": 35362 + }, + { + "epoch": 0.91, + "learning_rate": 1.636124242849377e-06, + "loss": 0.832, + "step": 35363 + }, + { + "epoch": 0.91, + "learning_rate": 1.6361028924532221e-06, + "loss": 0.6985, + "step": 35364 + }, + { + "epoch": 0.91, + "learning_rate": 1.6360815415700322e-06, + "loss": 0.9185, + "step": 35365 + }, + { + "epoch": 0.91, + "learning_rate": 1.6360601901998239e-06, + "loss": 0.9404, + "step": 35366 + }, + { + "epoch": 0.91, + "learning_rate": 1.6360388383426135e-06, + "loss": 0.874, + "step": 35367 + }, + { + "epoch": 0.91, + "learning_rate": 1.6360174859984175e-06, + "loss": 1.0293, + "step": 35368 + }, + { + "epoch": 0.91, + "learning_rate": 1.6359961331672523e-06, + "loss": 0.709, + "step": 35369 + }, + { + "epoch": 0.91, + "learning_rate": 1.6359747798491338e-06, + "loss": 0.9492, + "step": 35370 + }, + { + "epoch": 0.91, + "learning_rate": 1.6359534260440789e-06, + "loss": 0.627, + "step": 35371 + }, + { + "epoch": 0.91, + "learning_rate": 1.6359320717521037e-06, + "loss": 0.8008, + "step": 35372 + }, + { + "epoch": 0.91, + "learning_rate": 1.6359107169732243e-06, + "loss": 0.9736, + "step": 35373 + }, + { + "epoch": 0.91, + "learning_rate": 1.6358893617074573e-06, + "loss": 0.9424, + "step": 35374 + }, + { + "epoch": 0.91, + "learning_rate": 1.6358680059548193e-06, + "loss": 0.7349, + "step": 35375 + }, + { + "epoch": 0.91, + "learning_rate": 1.6358466497153263e-06, + "loss": 0.6035, + "step": 35376 + }, + { + "epoch": 0.91, + "learning_rate": 1.635825292988995e-06, + "loss": 0.5889, + "step": 35377 + }, + { + "epoch": 0.91, + "learning_rate": 1.6358039357758414e-06, + "loss": 0.8428, + "step": 35378 + }, + { + "epoch": 0.91, + "learning_rate": 1.6357825780758816e-06, + "loss": 0.8252, + "step": 35379 + }, + { + "epoch": 0.91, + "learning_rate": 1.6357612198891327e-06, + "loss": 0.604, + "step": 35380 + }, + { + "epoch": 0.91, + "learning_rate": 1.6357398612156103e-06, + "loss": 0.8652, + "step": 35381 + }, + { + "epoch": 0.91, + "learning_rate": 1.6357185020553316e-06, + "loss": 0.7461, + "step": 35382 + }, + { + "epoch": 0.91, + "learning_rate": 1.6356971424083123e-06, + "loss": 0.6738, + "step": 35383 + }, + { + "epoch": 0.91, + "learning_rate": 1.6356757822745688e-06, + "loss": 0.9043, + "step": 35384 + }, + { + "epoch": 0.91, + "learning_rate": 1.6356544216541178e-06, + "loss": 0.5308, + "step": 35385 + }, + { + "epoch": 0.91, + "learning_rate": 1.6356330605469753e-06, + "loss": 1.0449, + "step": 35386 + }, + { + "epoch": 0.91, + "learning_rate": 1.6356116989531576e-06, + "loss": 0.8789, + "step": 35387 + }, + { + "epoch": 0.91, + "learning_rate": 1.6355903368726813e-06, + "loss": 0.9165, + "step": 35388 + }, + { + "epoch": 0.91, + "learning_rate": 1.6355689743055629e-06, + "loss": 0.8867, + "step": 35389 + }, + { + "epoch": 0.91, + "learning_rate": 1.6355476112518185e-06, + "loss": 0.7925, + "step": 35390 + }, + { + "epoch": 0.91, + "learning_rate": 1.6355262477114646e-06, + "loss": 0.8994, + "step": 35391 + }, + { + "epoch": 0.91, + "learning_rate": 1.6355048836845175e-06, + "loss": 0.7217, + "step": 35392 + }, + { + "epoch": 0.91, + "learning_rate": 1.6354835191709934e-06, + "loss": 0.918, + "step": 35393 + }, + { + "epoch": 0.91, + "learning_rate": 1.6354621541709088e-06, + "loss": 1.0449, + "step": 35394 + }, + { + "epoch": 0.91, + "learning_rate": 1.63544078868428e-06, + "loss": 0.9258, + "step": 35395 + }, + { + "epoch": 0.91, + "learning_rate": 1.6354194227111233e-06, + "loss": 0.8145, + "step": 35396 + }, + { + "epoch": 0.91, + "learning_rate": 1.6353980562514555e-06, + "loss": 0.7151, + "step": 35397 + }, + { + "epoch": 0.91, + "learning_rate": 1.6353766893052926e-06, + "loss": 0.8994, + "step": 35398 + }, + { + "epoch": 0.91, + "learning_rate": 1.635355321872651e-06, + "loss": 0.8379, + "step": 35399 + }, + { + "epoch": 0.91, + "learning_rate": 1.6353339539535463e-06, + "loss": 0.9141, + "step": 35400 + }, + { + "epoch": 0.91, + "learning_rate": 1.6353125855479963e-06, + "loss": 0.7471, + "step": 35401 + }, + { + "epoch": 0.91, + "learning_rate": 1.6352912166560166e-06, + "loss": 0.6362, + "step": 35402 + }, + { + "epoch": 0.91, + "learning_rate": 1.6352698472776236e-06, + "loss": 1.0439, + "step": 35403 + }, + { + "epoch": 0.91, + "learning_rate": 1.635248477412834e-06, + "loss": 0.9736, + "step": 35404 + }, + { + "epoch": 0.91, + "learning_rate": 1.6352271070616632e-06, + "loss": 0.8311, + "step": 35405 + }, + { + "epoch": 0.91, + "learning_rate": 1.6352057362241284e-06, + "loss": 0.8755, + "step": 35406 + }, + { + "epoch": 0.91, + "learning_rate": 1.6351843649002462e-06, + "loss": 0.8789, + "step": 35407 + }, + { + "epoch": 0.91, + "learning_rate": 1.6351629930900321e-06, + "loss": 0.7747, + "step": 35408 + }, + { + "epoch": 0.91, + "learning_rate": 1.6351416207935032e-06, + "loss": 0.7666, + "step": 35409 + }, + { + "epoch": 0.91, + "learning_rate": 1.6351202480106751e-06, + "loss": 0.75, + "step": 35410 + }, + { + "epoch": 0.91, + "learning_rate": 1.635098874741565e-06, + "loss": 0.7888, + "step": 35411 + }, + { + "epoch": 0.91, + "learning_rate": 1.635077500986189e-06, + "loss": 0.8242, + "step": 35412 + }, + { + "epoch": 0.91, + "learning_rate": 1.6350561267445632e-06, + "loss": 0.8098, + "step": 35413 + }, + { + "epoch": 0.91, + "learning_rate": 1.635034752016704e-06, + "loss": 0.876, + "step": 35414 + }, + { + "epoch": 0.91, + "learning_rate": 1.635013376802628e-06, + "loss": 0.9395, + "step": 35415 + }, + { + "epoch": 0.91, + "learning_rate": 1.6349920011023516e-06, + "loss": 0.8877, + "step": 35416 + }, + { + "epoch": 0.91, + "learning_rate": 1.634970624915891e-06, + "loss": 0.9424, + "step": 35417 + }, + { + "epoch": 0.91, + "learning_rate": 1.6349492482432623e-06, + "loss": 1.0205, + "step": 35418 + }, + { + "epoch": 0.91, + "learning_rate": 1.6349278710844822e-06, + "loss": 0.7061, + "step": 35419 + }, + { + "epoch": 0.91, + "learning_rate": 1.6349064934395673e-06, + "loss": 1.0098, + "step": 35420 + }, + { + "epoch": 0.91, + "learning_rate": 1.6348851153085336e-06, + "loss": 0.9414, + "step": 35421 + }, + { + "epoch": 0.91, + "learning_rate": 1.6348637366913976e-06, + "loss": 0.7305, + "step": 35422 + }, + { + "epoch": 0.91, + "learning_rate": 1.6348423575881753e-06, + "loss": 0.9062, + "step": 35423 + }, + { + "epoch": 0.91, + "learning_rate": 1.6348209779988837e-06, + "loss": 0.9131, + "step": 35424 + }, + { + "epoch": 0.91, + "learning_rate": 1.6347995979235388e-06, + "loss": 0.8496, + "step": 35425 + }, + { + "epoch": 0.91, + "learning_rate": 1.6347782173621568e-06, + "loss": 0.8398, + "step": 35426 + }, + { + "epoch": 0.91, + "learning_rate": 1.634756836314755e-06, + "loss": 0.8252, + "step": 35427 + }, + { + "epoch": 0.91, + "learning_rate": 1.6347354547813486e-06, + "loss": 0.7559, + "step": 35428 + }, + { + "epoch": 0.91, + "learning_rate": 1.6347140727619544e-06, + "loss": 0.8623, + "step": 35429 + }, + { + "epoch": 0.91, + "learning_rate": 1.6346926902565887e-06, + "loss": 0.8779, + "step": 35430 + }, + { + "epoch": 0.91, + "learning_rate": 1.6346713072652683e-06, + "loss": 0.5322, + "step": 35431 + }, + { + "epoch": 0.91, + "learning_rate": 1.634649923788009e-06, + "loss": 0.7314, + "step": 35432 + }, + { + "epoch": 0.91, + "learning_rate": 1.6346285398248276e-06, + "loss": 0.6641, + "step": 35433 + }, + { + "epoch": 0.91, + "learning_rate": 1.6346071553757404e-06, + "loss": 1.1748, + "step": 35434 + }, + { + "epoch": 0.91, + "learning_rate": 1.6345857704407636e-06, + "loss": 0.7227, + "step": 35435 + }, + { + "epoch": 0.91, + "learning_rate": 1.6345643850199136e-06, + "loss": 0.6941, + "step": 35436 + }, + { + "epoch": 0.91, + "learning_rate": 1.634542999113207e-06, + "loss": 1.0498, + "step": 35437 + }, + { + "epoch": 0.91, + "learning_rate": 1.6345216127206599e-06, + "loss": 0.8047, + "step": 35438 + }, + { + "epoch": 0.91, + "learning_rate": 1.6345002258422883e-06, + "loss": 0.8081, + "step": 35439 + }, + { + "epoch": 0.91, + "learning_rate": 1.6344788384781097e-06, + "loss": 0.7373, + "step": 35440 + }, + { + "epoch": 0.91, + "learning_rate": 1.6344574506281395e-06, + "loss": 0.8721, + "step": 35441 + }, + { + "epoch": 0.91, + "learning_rate": 1.6344360622923946e-06, + "loss": 0.9629, + "step": 35442 + }, + { + "epoch": 0.91, + "learning_rate": 1.634414673470891e-06, + "loss": 0.7539, + "step": 35443 + }, + { + "epoch": 0.91, + "learning_rate": 1.6343932841636455e-06, + "loss": 0.9111, + "step": 35444 + }, + { + "epoch": 0.91, + "learning_rate": 1.6343718943706742e-06, + "loss": 1.0186, + "step": 35445 + }, + { + "epoch": 0.91, + "learning_rate": 1.634350504091993e-06, + "loss": 0.9023, + "step": 35446 + }, + { + "epoch": 0.91, + "learning_rate": 1.6343291133276194e-06, + "loss": 0.8555, + "step": 35447 + }, + { + "epoch": 0.91, + "learning_rate": 1.634307722077569e-06, + "loss": 0.8428, + "step": 35448 + }, + { + "epoch": 0.91, + "learning_rate": 1.6342863303418582e-06, + "loss": 0.8301, + "step": 35449 + }, + { + "epoch": 0.91, + "learning_rate": 1.6342649381205036e-06, + "loss": 0.7861, + "step": 35450 + }, + { + "epoch": 0.91, + "learning_rate": 1.6342435454135215e-06, + "loss": 0.7803, + "step": 35451 + }, + { + "epoch": 0.91, + "learning_rate": 1.6342221522209285e-06, + "loss": 0.8311, + "step": 35452 + }, + { + "epoch": 0.91, + "learning_rate": 1.6342007585427403e-06, + "loss": 0.563, + "step": 35453 + }, + { + "epoch": 0.91, + "learning_rate": 1.634179364378974e-06, + "loss": 1.1055, + "step": 35454 + }, + { + "epoch": 0.91, + "learning_rate": 1.6341579697296459e-06, + "loss": 0.8311, + "step": 35455 + }, + { + "epoch": 0.91, + "learning_rate": 1.634136574594772e-06, + "loss": 1.0605, + "step": 35456 + }, + { + "epoch": 0.91, + "learning_rate": 1.6341151789743688e-06, + "loss": 0.9707, + "step": 35457 + }, + { + "epoch": 0.91, + "learning_rate": 1.634093782868453e-06, + "loss": 0.6287, + "step": 35458 + }, + { + "epoch": 0.91, + "learning_rate": 1.6340723862770405e-06, + "loss": 0.4653, + "step": 35459 + }, + { + "epoch": 0.91, + "learning_rate": 1.6340509892001479e-06, + "loss": 1.0098, + "step": 35460 + }, + { + "epoch": 0.91, + "learning_rate": 1.6340295916377917e-06, + "loss": 0.7383, + "step": 35461 + }, + { + "epoch": 0.91, + "learning_rate": 1.6340081935899886e-06, + "loss": 0.9365, + "step": 35462 + }, + { + "epoch": 0.91, + "learning_rate": 1.6339867950567542e-06, + "loss": 0.8193, + "step": 35463 + }, + { + "epoch": 0.91, + "learning_rate": 1.6339653960381052e-06, + "loss": 0.7471, + "step": 35464 + }, + { + "epoch": 0.91, + "learning_rate": 1.633943996534058e-06, + "loss": 0.8652, + "step": 35465 + }, + { + "epoch": 0.91, + "learning_rate": 1.6339225965446292e-06, + "loss": 0.7676, + "step": 35466 + }, + { + "epoch": 0.91, + "learning_rate": 1.6339011960698352e-06, + "loss": 0.8428, + "step": 35467 + }, + { + "epoch": 0.91, + "learning_rate": 1.6338797951096918e-06, + "loss": 1.0049, + "step": 35468 + }, + { + "epoch": 0.91, + "learning_rate": 1.6338583936642158e-06, + "loss": 0.9482, + "step": 35469 + }, + { + "epoch": 0.91, + "learning_rate": 1.6338369917334238e-06, + "loss": 0.7578, + "step": 35470 + }, + { + "epoch": 0.91, + "learning_rate": 1.633815589317332e-06, + "loss": 0.7822, + "step": 35471 + }, + { + "epoch": 0.91, + "learning_rate": 1.6337941864159567e-06, + "loss": 0.8022, + "step": 35472 + }, + { + "epoch": 0.91, + "learning_rate": 1.6337727830293143e-06, + "loss": 0.8906, + "step": 35473 + }, + { + "epoch": 0.91, + "learning_rate": 1.6337513791574211e-06, + "loss": 0.9551, + "step": 35474 + }, + { + "epoch": 0.91, + "learning_rate": 1.6337299748002937e-06, + "loss": 0.9546, + "step": 35475 + }, + { + "epoch": 0.91, + "learning_rate": 1.6337085699579485e-06, + "loss": 0.8076, + "step": 35476 + }, + { + "epoch": 0.91, + "learning_rate": 1.6336871646304019e-06, + "loss": 0.7793, + "step": 35477 + }, + { + "epoch": 0.91, + "learning_rate": 1.6336657588176697e-06, + "loss": 0.9414, + "step": 35478 + }, + { + "epoch": 0.91, + "learning_rate": 1.6336443525197691e-06, + "loss": 1.0723, + "step": 35479 + }, + { + "epoch": 0.91, + "learning_rate": 1.6336229457367158e-06, + "loss": 0.8447, + "step": 35480 + }, + { + "epoch": 0.91, + "learning_rate": 1.6336015384685272e-06, + "loss": 1.0527, + "step": 35481 + }, + { + "epoch": 0.91, + "learning_rate": 1.6335801307152188e-06, + "loss": 0.8271, + "step": 35482 + }, + { + "epoch": 0.91, + "learning_rate": 1.633558722476807e-06, + "loss": 0.8096, + "step": 35483 + }, + { + "epoch": 0.91, + "learning_rate": 1.6335373137533084e-06, + "loss": 0.9756, + "step": 35484 + }, + { + "epoch": 0.91, + "learning_rate": 1.6335159045447396e-06, + "loss": 0.8379, + "step": 35485 + }, + { + "epoch": 0.91, + "learning_rate": 1.6334944948511168e-06, + "loss": 0.7627, + "step": 35486 + }, + { + "epoch": 0.91, + "learning_rate": 1.6334730846724562e-06, + "loss": 0.835, + "step": 35487 + }, + { + "epoch": 0.91, + "learning_rate": 1.6334516740087746e-06, + "loss": 0.915, + "step": 35488 + }, + { + "epoch": 0.91, + "learning_rate": 1.633430262860088e-06, + "loss": 0.5811, + "step": 35489 + }, + { + "epoch": 0.91, + "learning_rate": 1.633408851226413e-06, + "loss": 0.8105, + "step": 35490 + }, + { + "epoch": 0.91, + "learning_rate": 1.633387439107766e-06, + "loss": 0.8496, + "step": 35491 + }, + { + "epoch": 0.91, + "learning_rate": 1.6333660265041639e-06, + "loss": 0.8721, + "step": 35492 + }, + { + "epoch": 0.91, + "learning_rate": 1.633344613415622e-06, + "loss": 0.9053, + "step": 35493 + }, + { + "epoch": 0.91, + "learning_rate": 1.633323199842157e-06, + "loss": 0.8701, + "step": 35494 + }, + { + "epoch": 0.91, + "learning_rate": 1.633301785783786e-06, + "loss": 0.8125, + "step": 35495 + }, + { + "epoch": 0.91, + "learning_rate": 1.6332803712405245e-06, + "loss": 0.5515, + "step": 35496 + }, + { + "epoch": 0.91, + "learning_rate": 1.6332589562123898e-06, + "loss": 0.8789, + "step": 35497 + }, + { + "epoch": 0.91, + "learning_rate": 1.633237540699398e-06, + "loss": 0.9326, + "step": 35498 + }, + { + "epoch": 0.91, + "learning_rate": 1.6332161247015645e-06, + "loss": 0.6948, + "step": 35499 + }, + { + "epoch": 0.91, + "learning_rate": 1.6331947082189074e-06, + "loss": 0.7959, + "step": 35500 + }, + { + "epoch": 0.91, + "learning_rate": 1.6331732912514418e-06, + "loss": 0.8047, + "step": 35501 + }, + { + "epoch": 0.91, + "learning_rate": 1.6331518737991846e-06, + "loss": 0.8091, + "step": 35502 + }, + { + "epoch": 0.91, + "learning_rate": 1.633130455862152e-06, + "loss": 0.6245, + "step": 35503 + }, + { + "epoch": 0.91, + "learning_rate": 1.6331090374403607e-06, + "loss": 1.0791, + "step": 35504 + }, + { + "epoch": 0.91, + "learning_rate": 1.6330876185338267e-06, + "loss": 0.8408, + "step": 35505 + }, + { + "epoch": 0.91, + "learning_rate": 1.6330661991425666e-06, + "loss": 0.8438, + "step": 35506 + }, + { + "epoch": 0.91, + "learning_rate": 1.6330447792665973e-06, + "loss": 0.8545, + "step": 35507 + }, + { + "epoch": 0.91, + "learning_rate": 1.6330233589059342e-06, + "loss": 0.8579, + "step": 35508 + }, + { + "epoch": 0.91, + "learning_rate": 1.6330019380605945e-06, + "loss": 0.7583, + "step": 35509 + }, + { + "epoch": 0.91, + "learning_rate": 1.6329805167305942e-06, + "loss": 0.7129, + "step": 35510 + }, + { + "epoch": 0.91, + "learning_rate": 1.6329590949159498e-06, + "loss": 1.1748, + "step": 35511 + }, + { + "epoch": 0.91, + "learning_rate": 1.6329376726166778e-06, + "loss": 0.7666, + "step": 35512 + }, + { + "epoch": 0.91, + "learning_rate": 1.6329162498327946e-06, + "loss": 0.874, + "step": 35513 + }, + { + "epoch": 0.91, + "learning_rate": 1.6328948265643166e-06, + "loss": 0.9346, + "step": 35514 + }, + { + "epoch": 0.91, + "learning_rate": 1.63287340281126e-06, + "loss": 0.7285, + "step": 35515 + }, + { + "epoch": 0.91, + "learning_rate": 1.6328519785736411e-06, + "loss": 0.7949, + "step": 35516 + }, + { + "epoch": 0.91, + "learning_rate": 1.6328305538514772e-06, + "loss": 0.7803, + "step": 35517 + }, + { + "epoch": 0.91, + "learning_rate": 1.6328091286447834e-06, + "loss": 0.8076, + "step": 35518 + }, + { + "epoch": 0.91, + "learning_rate": 1.6327877029535771e-06, + "loss": 0.9277, + "step": 35519 + }, + { + "epoch": 0.91, + "learning_rate": 1.632766276777874e-06, + "loss": 0.7212, + "step": 35520 + }, + { + "epoch": 0.91, + "learning_rate": 1.6327448501176911e-06, + "loss": 0.6763, + "step": 35521 + }, + { + "epoch": 0.91, + "learning_rate": 1.6327234229730444e-06, + "loss": 0.9785, + "step": 35522 + }, + { + "epoch": 0.91, + "learning_rate": 1.6327019953439506e-06, + "loss": 0.9385, + "step": 35523 + }, + { + "epoch": 0.91, + "learning_rate": 1.632680567230426e-06, + "loss": 0.8486, + "step": 35524 + }, + { + "epoch": 0.91, + "learning_rate": 1.632659138632487e-06, + "loss": 0.7944, + "step": 35525 + }, + { + "epoch": 0.91, + "learning_rate": 1.63263770955015e-06, + "loss": 0.8145, + "step": 35526 + }, + { + "epoch": 0.91, + "learning_rate": 1.6326162799834316e-06, + "loss": 0.6875, + "step": 35527 + }, + { + "epoch": 0.91, + "learning_rate": 1.6325948499323477e-06, + "loss": 0.8726, + "step": 35528 + }, + { + "epoch": 0.91, + "learning_rate": 1.6325734193969146e-06, + "loss": 0.6401, + "step": 35529 + }, + { + "epoch": 0.91, + "learning_rate": 1.6325519883771496e-06, + "loss": 0.8115, + "step": 35530 + }, + { + "epoch": 0.91, + "learning_rate": 1.6325305568730688e-06, + "loss": 0.9521, + "step": 35531 + }, + { + "epoch": 0.91, + "learning_rate": 1.6325091248846883e-06, + "loss": 0.8506, + "step": 35532 + }, + { + "epoch": 0.91, + "learning_rate": 1.6324876924120246e-06, + "loss": 0.7568, + "step": 35533 + }, + { + "epoch": 0.91, + "learning_rate": 1.6324662594550942e-06, + "loss": 0.8066, + "step": 35534 + }, + { + "epoch": 0.91, + "learning_rate": 1.6324448260139132e-06, + "loss": 0.7871, + "step": 35535 + }, + { + "epoch": 0.91, + "learning_rate": 1.6324233920884986e-06, + "loss": 1.0068, + "step": 35536 + }, + { + "epoch": 0.91, + "learning_rate": 1.6324019576788667e-06, + "loss": 0.8906, + "step": 35537 + }, + { + "epoch": 0.91, + "learning_rate": 1.632380522785033e-06, + "loss": 0.8379, + "step": 35538 + }, + { + "epoch": 0.91, + "learning_rate": 1.632359087407015e-06, + "loss": 0.8438, + "step": 35539 + }, + { + "epoch": 0.91, + "learning_rate": 1.6323376515448289e-06, + "loss": 0.6968, + "step": 35540 + }, + { + "epoch": 0.91, + "learning_rate": 1.6323162151984904e-06, + "loss": 0.8506, + "step": 35541 + }, + { + "epoch": 0.91, + "learning_rate": 1.632294778368017e-06, + "loss": 0.6729, + "step": 35542 + }, + { + "epoch": 0.91, + "learning_rate": 1.6322733410534245e-06, + "loss": 0.9268, + "step": 35543 + }, + { + "epoch": 0.91, + "learning_rate": 1.632251903254729e-06, + "loss": 0.7568, + "step": 35544 + }, + { + "epoch": 0.91, + "learning_rate": 1.6322304649719474e-06, + "loss": 0.9443, + "step": 35545 + }, + { + "epoch": 0.91, + "learning_rate": 1.6322090262050963e-06, + "loss": 1.0039, + "step": 35546 + }, + { + "epoch": 0.91, + "learning_rate": 1.6321875869541914e-06, + "loss": 0.8135, + "step": 35547 + }, + { + "epoch": 0.91, + "learning_rate": 1.6321661472192497e-06, + "loss": 0.8271, + "step": 35548 + }, + { + "epoch": 0.91, + "learning_rate": 1.6321447070002879e-06, + "loss": 0.8008, + "step": 35549 + }, + { + "epoch": 0.91, + "learning_rate": 1.6321232662973214e-06, + "loss": 0.8389, + "step": 35550 + }, + { + "epoch": 0.91, + "learning_rate": 1.6321018251103673e-06, + "loss": 0.7705, + "step": 35551 + }, + { + "epoch": 0.91, + "learning_rate": 1.632080383439442e-06, + "loss": 0.5488, + "step": 35552 + }, + { + "epoch": 0.91, + "learning_rate": 1.632058941284562e-06, + "loss": 0.9629, + "step": 35553 + }, + { + "epoch": 0.91, + "learning_rate": 1.6320374986457433e-06, + "loss": 0.8018, + "step": 35554 + }, + { + "epoch": 0.91, + "learning_rate": 1.6320160555230023e-06, + "loss": 0.917, + "step": 35555 + }, + { + "epoch": 0.91, + "learning_rate": 1.6319946119163559e-06, + "loss": 0.9116, + "step": 35556 + }, + { + "epoch": 0.91, + "learning_rate": 1.6319731678258207e-06, + "loss": 0.8687, + "step": 35557 + }, + { + "epoch": 0.91, + "learning_rate": 1.6319517232514122e-06, + "loss": 0.8975, + "step": 35558 + }, + { + "epoch": 0.91, + "learning_rate": 1.6319302781931472e-06, + "loss": 0.9082, + "step": 35559 + }, + { + "epoch": 0.91, + "learning_rate": 1.6319088326510427e-06, + "loss": 0.8062, + "step": 35560 + }, + { + "epoch": 0.91, + "learning_rate": 1.6318873866251143e-06, + "loss": 0.873, + "step": 35561 + }, + { + "epoch": 0.91, + "learning_rate": 1.6318659401153791e-06, + "loss": 0.9229, + "step": 35562 + }, + { + "epoch": 0.91, + "learning_rate": 1.6318444931218532e-06, + "loss": 0.8652, + "step": 35563 + }, + { + "epoch": 0.91, + "learning_rate": 1.6318230456445527e-06, + "loss": 0.8145, + "step": 35564 + }, + { + "epoch": 0.91, + "learning_rate": 1.6318015976834946e-06, + "loss": 0.8291, + "step": 35565 + }, + { + "epoch": 0.91, + "learning_rate": 1.6317801492386946e-06, + "loss": 0.7578, + "step": 35566 + }, + { + "epoch": 0.91, + "learning_rate": 1.6317587003101702e-06, + "loss": 0.8726, + "step": 35567 + }, + { + "epoch": 0.91, + "learning_rate": 1.6317372508979369e-06, + "loss": 0.696, + "step": 35568 + }, + { + "epoch": 0.91, + "learning_rate": 1.6317158010020115e-06, + "loss": 0.7939, + "step": 35569 + }, + { + "epoch": 0.91, + "learning_rate": 1.6316943506224104e-06, + "loss": 1.0225, + "step": 35570 + }, + { + "epoch": 0.91, + "learning_rate": 1.6316728997591497e-06, + "loss": 0.9287, + "step": 35571 + }, + { + "epoch": 0.91, + "learning_rate": 1.6316514484122465e-06, + "loss": 0.8486, + "step": 35572 + }, + { + "epoch": 0.91, + "learning_rate": 1.6316299965817168e-06, + "loss": 0.8721, + "step": 35573 + }, + { + "epoch": 0.91, + "learning_rate": 1.631608544267577e-06, + "loss": 0.8708, + "step": 35574 + }, + { + "epoch": 0.91, + "learning_rate": 1.6315870914698433e-06, + "loss": 0.6333, + "step": 35575 + }, + { + "epoch": 0.91, + "learning_rate": 1.6315656381885329e-06, + "loss": 0.6001, + "step": 35576 + }, + { + "epoch": 0.91, + "learning_rate": 1.6315441844236615e-06, + "loss": 0.8193, + "step": 35577 + }, + { + "epoch": 0.91, + "learning_rate": 1.6315227301752454e-06, + "loss": 0.584, + "step": 35578 + }, + { + "epoch": 0.91, + "learning_rate": 1.6315012754433017e-06, + "loss": 0.9424, + "step": 35579 + }, + { + "epoch": 0.91, + "learning_rate": 1.6314798202278466e-06, + "loss": 0.8613, + "step": 35580 + }, + { + "epoch": 0.91, + "learning_rate": 1.6314583645288962e-06, + "loss": 0.8975, + "step": 35581 + }, + { + "epoch": 0.91, + "learning_rate": 1.6314369083464676e-06, + "loss": 0.6929, + "step": 35582 + }, + { + "epoch": 0.91, + "learning_rate": 1.6314154516805766e-06, + "loss": 0.6714, + "step": 35583 + }, + { + "epoch": 0.91, + "learning_rate": 1.6313939945312396e-06, + "loss": 0.9443, + "step": 35584 + }, + { + "epoch": 0.91, + "learning_rate": 1.6313725368984731e-06, + "loss": 0.8579, + "step": 35585 + }, + { + "epoch": 0.91, + "learning_rate": 1.631351078782294e-06, + "loss": 0.9424, + "step": 35586 + }, + { + "epoch": 0.91, + "learning_rate": 1.6313296201827184e-06, + "loss": 0.8906, + "step": 35587 + }, + { + "epoch": 0.91, + "learning_rate": 1.631308161099763e-06, + "loss": 0.7988, + "step": 35588 + }, + { + "epoch": 0.91, + "learning_rate": 1.6312867015334434e-06, + "loss": 0.7666, + "step": 35589 + }, + { + "epoch": 0.91, + "learning_rate": 1.631265241483777e-06, + "loss": 0.8975, + "step": 35590 + }, + { + "epoch": 0.91, + "learning_rate": 1.6312437809507796e-06, + "loss": 1.0293, + "step": 35591 + }, + { + "epoch": 0.91, + "learning_rate": 1.6312223199344678e-06, + "loss": 0.8281, + "step": 35592 + }, + { + "epoch": 0.91, + "learning_rate": 1.6312008584348583e-06, + "loss": 0.8574, + "step": 35593 + }, + { + "epoch": 0.91, + "learning_rate": 1.6311793964519676e-06, + "loss": 0.6997, + "step": 35594 + }, + { + "epoch": 0.91, + "learning_rate": 1.6311579339858112e-06, + "loss": 0.7441, + "step": 35595 + }, + { + "epoch": 0.91, + "learning_rate": 1.6311364710364067e-06, + "loss": 0.9102, + "step": 35596 + }, + { + "epoch": 0.91, + "learning_rate": 1.6311150076037698e-06, + "loss": 0.7148, + "step": 35597 + }, + { + "epoch": 0.91, + "learning_rate": 1.631093543687917e-06, + "loss": 0.5958, + "step": 35598 + }, + { + "epoch": 0.91, + "learning_rate": 1.6310720792888653e-06, + "loss": 0.7622, + "step": 35599 + }, + { + "epoch": 0.91, + "learning_rate": 1.6310506144066306e-06, + "loss": 0.7656, + "step": 35600 + }, + { + "epoch": 0.91, + "learning_rate": 1.6310291490412296e-06, + "loss": 0.8262, + "step": 35601 + }, + { + "epoch": 0.91, + "learning_rate": 1.6310076831926781e-06, + "loss": 0.8037, + "step": 35602 + }, + { + "epoch": 0.91, + "learning_rate": 1.6309862168609936e-06, + "loss": 0.7012, + "step": 35603 + }, + { + "epoch": 0.91, + "learning_rate": 1.6309647500461914e-06, + "loss": 0.8545, + "step": 35604 + }, + { + "epoch": 0.91, + "learning_rate": 1.630943282748289e-06, + "loss": 0.6826, + "step": 35605 + }, + { + "epoch": 0.91, + "learning_rate": 1.6309218149673024e-06, + "loss": 0.75, + "step": 35606 + }, + { + "epoch": 0.91, + "learning_rate": 1.6309003467032473e-06, + "loss": 0.5825, + "step": 35607 + }, + { + "epoch": 0.91, + "learning_rate": 1.6308788779561412e-06, + "loss": 0.9102, + "step": 35608 + }, + { + "epoch": 0.91, + "learning_rate": 1.6308574087260004e-06, + "loss": 0.5508, + "step": 35609 + }, + { + "epoch": 0.91, + "learning_rate": 1.6308359390128408e-06, + "loss": 0.8662, + "step": 35610 + }, + { + "epoch": 0.91, + "learning_rate": 1.6308144688166792e-06, + "loss": 0.6008, + "step": 35611 + }, + { + "epoch": 0.91, + "learning_rate": 1.6307929981375318e-06, + "loss": 0.5984, + "step": 35612 + }, + { + "epoch": 0.91, + "learning_rate": 1.6307715269754154e-06, + "loss": 0.8604, + "step": 35613 + }, + { + "epoch": 0.91, + "learning_rate": 1.6307500553303463e-06, + "loss": 0.6636, + "step": 35614 + }, + { + "epoch": 0.91, + "learning_rate": 1.6307285832023406e-06, + "loss": 0.8506, + "step": 35615 + }, + { + "epoch": 0.91, + "learning_rate": 1.6307071105914156e-06, + "loss": 0.9365, + "step": 35616 + }, + { + "epoch": 0.91, + "learning_rate": 1.6306856374975868e-06, + "loss": 0.7803, + "step": 35617 + }, + { + "epoch": 0.91, + "learning_rate": 1.630664163920871e-06, + "loss": 0.7148, + "step": 35618 + }, + { + "epoch": 0.91, + "learning_rate": 1.6306426898612843e-06, + "loss": 0.8467, + "step": 35619 + }, + { + "epoch": 0.91, + "learning_rate": 1.6306212153188438e-06, + "loss": 0.9707, + "step": 35620 + }, + { + "epoch": 0.91, + "learning_rate": 1.630599740293566e-06, + "loss": 0.9668, + "step": 35621 + }, + { + "epoch": 0.91, + "learning_rate": 1.6305782647854666e-06, + "loss": 0.5068, + "step": 35622 + }, + { + "epoch": 0.91, + "learning_rate": 1.6305567887945623e-06, + "loss": 0.4688, + "step": 35623 + }, + { + "epoch": 0.91, + "learning_rate": 1.6305353123208701e-06, + "loss": 0.791, + "step": 35624 + }, + { + "epoch": 0.91, + "learning_rate": 1.6305138353644054e-06, + "loss": 0.916, + "step": 35625 + }, + { + "epoch": 0.91, + "learning_rate": 1.6304923579251857e-06, + "loss": 0.9521, + "step": 35626 + }, + { + "epoch": 0.91, + "learning_rate": 1.630470880003227e-06, + "loss": 0.7314, + "step": 35627 + }, + { + "epoch": 0.91, + "learning_rate": 1.6304494015985455e-06, + "loss": 0.832, + "step": 35628 + }, + { + "epoch": 0.91, + "learning_rate": 1.630427922711158e-06, + "loss": 1.0269, + "step": 35629 + }, + { + "epoch": 0.91, + "learning_rate": 1.630406443341081e-06, + "loss": 0.9424, + "step": 35630 + }, + { + "epoch": 0.91, + "learning_rate": 1.6303849634883305e-06, + "loss": 0.8984, + "step": 35631 + }, + { + "epoch": 0.91, + "learning_rate": 1.6303634831529232e-06, + "loss": 0.998, + "step": 35632 + }, + { + "epoch": 0.91, + "learning_rate": 1.6303420023348755e-06, + "loss": 0.8291, + "step": 35633 + }, + { + "epoch": 0.91, + "learning_rate": 1.6303205210342043e-06, + "loss": 0.8613, + "step": 35634 + }, + { + "epoch": 0.91, + "learning_rate": 1.6302990392509256e-06, + "loss": 0.752, + "step": 35635 + }, + { + "epoch": 0.91, + "learning_rate": 1.6302775569850555e-06, + "loss": 0.6558, + "step": 35636 + }, + { + "epoch": 0.91, + "learning_rate": 1.6302560742366112e-06, + "loss": 0.8335, + "step": 35637 + }, + { + "epoch": 0.91, + "learning_rate": 1.6302345910056085e-06, + "loss": 1.1309, + "step": 35638 + }, + { + "epoch": 0.91, + "learning_rate": 1.6302131072920645e-06, + "loss": 0.835, + "step": 35639 + }, + { + "epoch": 0.91, + "learning_rate": 1.6301916230959952e-06, + "loss": 0.6473, + "step": 35640 + }, + { + "epoch": 0.91, + "learning_rate": 1.6301701384174172e-06, + "loss": 0.8955, + "step": 35641 + }, + { + "epoch": 0.91, + "learning_rate": 1.630148653256347e-06, + "loss": 0.6694, + "step": 35642 + }, + { + "epoch": 0.91, + "learning_rate": 1.6301271676128004e-06, + "loss": 0.7979, + "step": 35643 + }, + { + "epoch": 0.91, + "learning_rate": 1.6301056814867947e-06, + "loss": 0.9648, + "step": 35644 + }, + { + "epoch": 0.91, + "learning_rate": 1.6300841948783462e-06, + "loss": 0.8062, + "step": 35645 + }, + { + "epoch": 0.91, + "learning_rate": 1.6300627077874713e-06, + "loss": 0.8516, + "step": 35646 + }, + { + "epoch": 0.91, + "learning_rate": 1.6300412202141861e-06, + "loss": 0.9443, + "step": 35647 + }, + { + "epoch": 0.91, + "learning_rate": 1.6300197321585075e-06, + "loss": 0.6758, + "step": 35648 + }, + { + "epoch": 0.91, + "learning_rate": 1.6299982436204514e-06, + "loss": 0.8359, + "step": 35649 + }, + { + "epoch": 0.91, + "learning_rate": 1.629976754600035e-06, + "loss": 0.7021, + "step": 35650 + }, + { + "epoch": 0.91, + "learning_rate": 1.6299552650972744e-06, + "loss": 1.0361, + "step": 35651 + }, + { + "epoch": 0.91, + "learning_rate": 1.6299337751121858e-06, + "loss": 0.8066, + "step": 35652 + }, + { + "epoch": 0.91, + "learning_rate": 1.629912284644786e-06, + "loss": 0.8516, + "step": 35653 + }, + { + "epoch": 0.91, + "learning_rate": 1.629890793695091e-06, + "loss": 0.8799, + "step": 35654 + }, + { + "epoch": 0.91, + "learning_rate": 1.6298693022631177e-06, + "loss": 0.8408, + "step": 35655 + }, + { + "epoch": 0.91, + "learning_rate": 1.6298478103488828e-06, + "loss": 0.6284, + "step": 35656 + }, + { + "epoch": 0.91, + "learning_rate": 1.629826317952402e-06, + "loss": 0.8643, + "step": 35657 + }, + { + "epoch": 0.91, + "learning_rate": 1.6298048250736924e-06, + "loss": 0.7539, + "step": 35658 + }, + { + "epoch": 0.91, + "learning_rate": 1.62978333171277e-06, + "loss": 0.7998, + "step": 35659 + }, + { + "epoch": 0.91, + "learning_rate": 1.6297618378696517e-06, + "loss": 0.7715, + "step": 35660 + }, + { + "epoch": 0.91, + "learning_rate": 1.6297403435443537e-06, + "loss": 0.7168, + "step": 35661 + }, + { + "epoch": 0.91, + "learning_rate": 1.6297188487368922e-06, + "loss": 0.7183, + "step": 35662 + }, + { + "epoch": 0.91, + "learning_rate": 1.629697353447284e-06, + "loss": 0.9443, + "step": 35663 + }, + { + "epoch": 0.91, + "learning_rate": 1.6296758576755459e-06, + "loss": 0.835, + "step": 35664 + }, + { + "epoch": 0.91, + "learning_rate": 1.6296543614216934e-06, + "loss": 0.8584, + "step": 35665 + }, + { + "epoch": 0.91, + "learning_rate": 1.6296328646857437e-06, + "loss": 0.6082, + "step": 35666 + }, + { + "epoch": 0.91, + "learning_rate": 1.6296113674677133e-06, + "loss": 1.0366, + "step": 35667 + }, + { + "epoch": 0.91, + "learning_rate": 1.6295898697676183e-06, + "loss": 0.8364, + "step": 35668 + }, + { + "epoch": 0.91, + "learning_rate": 1.629568371585475e-06, + "loss": 0.9385, + "step": 35669 + }, + { + "epoch": 0.91, + "learning_rate": 1.6295468729213004e-06, + "loss": 0.8662, + "step": 35670 + }, + { + "epoch": 0.91, + "learning_rate": 1.6295253737751108e-06, + "loss": 1.082, + "step": 35671 + }, + { + "epoch": 0.91, + "learning_rate": 1.6295038741469224e-06, + "loss": 0.6631, + "step": 35672 + }, + { + "epoch": 0.91, + "learning_rate": 1.629482374036752e-06, + "loss": 0.8848, + "step": 35673 + }, + { + "epoch": 0.91, + "learning_rate": 1.6294608734446155e-06, + "loss": 0.9609, + "step": 35674 + }, + { + "epoch": 0.91, + "learning_rate": 1.6294393723705302e-06, + "loss": 0.8232, + "step": 35675 + }, + { + "epoch": 0.91, + "learning_rate": 1.629417870814512e-06, + "loss": 0.9258, + "step": 35676 + }, + { + "epoch": 0.91, + "learning_rate": 1.6293963687765776e-06, + "loss": 1.0273, + "step": 35677 + }, + { + "epoch": 0.91, + "learning_rate": 1.629374866256743e-06, + "loss": 0.7314, + "step": 35678 + }, + { + "epoch": 0.91, + "learning_rate": 1.6293533632550252e-06, + "loss": 0.9473, + "step": 35679 + }, + { + "epoch": 0.91, + "learning_rate": 1.6293318597714402e-06, + "loss": 0.75, + "step": 35680 + }, + { + "epoch": 0.91, + "learning_rate": 1.629310355806005e-06, + "loss": 0.8159, + "step": 35681 + }, + { + "epoch": 0.91, + "learning_rate": 1.6292888513587357e-06, + "loss": 0.9355, + "step": 35682 + }, + { + "epoch": 0.91, + "learning_rate": 1.629267346429649e-06, + "loss": 0.875, + "step": 35683 + }, + { + "epoch": 0.91, + "learning_rate": 1.6292458410187613e-06, + "loss": 0.6841, + "step": 35684 + }, + { + "epoch": 0.91, + "learning_rate": 1.6292243351260888e-06, + "loss": 0.8672, + "step": 35685 + }, + { + "epoch": 0.91, + "learning_rate": 1.6292028287516482e-06, + "loss": 0.9131, + "step": 35686 + }, + { + "epoch": 0.91, + "learning_rate": 1.629181321895456e-06, + "loss": 0.8613, + "step": 35687 + }, + { + "epoch": 0.91, + "learning_rate": 1.6291598145575284e-06, + "loss": 0.9111, + "step": 35688 + }, + { + "epoch": 0.91, + "learning_rate": 1.6291383067378822e-06, + "loss": 1.0215, + "step": 35689 + }, + { + "epoch": 0.91, + "learning_rate": 1.6291167984365334e-06, + "loss": 0.7783, + "step": 35690 + }, + { + "epoch": 0.91, + "learning_rate": 1.6290952896534992e-06, + "loss": 0.9512, + "step": 35691 + }, + { + "epoch": 0.91, + "learning_rate": 1.6290737803887957e-06, + "loss": 0.9014, + "step": 35692 + }, + { + "epoch": 0.91, + "learning_rate": 1.6290522706424392e-06, + "loss": 0.8057, + "step": 35693 + }, + { + "epoch": 0.91, + "learning_rate": 1.6290307604144462e-06, + "loss": 0.4137, + "step": 35694 + }, + { + "epoch": 0.91, + "learning_rate": 1.6290092497048335e-06, + "loss": 0.7373, + "step": 35695 + }, + { + "epoch": 0.91, + "learning_rate": 1.6289877385136173e-06, + "loss": 0.8828, + "step": 35696 + }, + { + "epoch": 0.91, + "learning_rate": 1.628966226840814e-06, + "loss": 0.9238, + "step": 35697 + }, + { + "epoch": 0.91, + "learning_rate": 1.6289447146864401e-06, + "loss": 0.7656, + "step": 35698 + }, + { + "epoch": 0.91, + "learning_rate": 1.628923202050512e-06, + "loss": 0.7148, + "step": 35699 + }, + { + "epoch": 0.92, + "learning_rate": 1.628901688933047e-06, + "loss": 0.7354, + "step": 35700 + }, + { + "epoch": 0.92, + "learning_rate": 1.6288801753340602e-06, + "loss": 1.0088, + "step": 35701 + }, + { + "epoch": 0.92, + "learning_rate": 1.6288586612535691e-06, + "loss": 0.7734, + "step": 35702 + }, + { + "epoch": 0.92, + "learning_rate": 1.6288371466915897e-06, + "loss": 0.8252, + "step": 35703 + }, + { + "epoch": 0.92, + "learning_rate": 1.6288156316481386e-06, + "loss": 0.8594, + "step": 35704 + }, + { + "epoch": 0.92, + "learning_rate": 1.6287941161232323e-06, + "loss": 0.7485, + "step": 35705 + }, + { + "epoch": 0.92, + "learning_rate": 1.6287726001168875e-06, + "loss": 0.9912, + "step": 35706 + }, + { + "epoch": 0.92, + "learning_rate": 1.6287510836291203e-06, + "loss": 0.8037, + "step": 35707 + }, + { + "epoch": 0.92, + "learning_rate": 1.6287295666599472e-06, + "loss": 0.9121, + "step": 35708 + }, + { + "epoch": 0.92, + "learning_rate": 1.628708049209385e-06, + "loss": 0.748, + "step": 35709 + }, + { + "epoch": 0.92, + "learning_rate": 1.6286865312774496e-06, + "loss": 0.8809, + "step": 35710 + }, + { + "epoch": 0.92, + "learning_rate": 1.6286650128641582e-06, + "loss": 1.0234, + "step": 35711 + }, + { + "epoch": 0.92, + "learning_rate": 1.628643493969527e-06, + "loss": 0.7886, + "step": 35712 + }, + { + "epoch": 0.92, + "learning_rate": 1.628621974593572e-06, + "loss": 0.8291, + "step": 35713 + }, + { + "epoch": 0.92, + "learning_rate": 1.62860045473631e-06, + "loss": 0.71, + "step": 35714 + }, + { + "epoch": 0.92, + "learning_rate": 1.6285789343977576e-06, + "loss": 0.6509, + "step": 35715 + }, + { + "epoch": 0.92, + "learning_rate": 1.6285574135779316e-06, + "loss": 0.5269, + "step": 35716 + }, + { + "epoch": 0.92, + "learning_rate": 1.6285358922768478e-06, + "loss": 0.8633, + "step": 35717 + }, + { + "epoch": 0.92, + "learning_rate": 1.6285143704945228e-06, + "loss": 0.874, + "step": 35718 + }, + { + "epoch": 0.92, + "learning_rate": 1.6284928482309734e-06, + "loss": 0.8408, + "step": 35719 + }, + { + "epoch": 0.92, + "learning_rate": 1.628471325486216e-06, + "loss": 0.9482, + "step": 35720 + }, + { + "epoch": 0.92, + "learning_rate": 1.628449802260267e-06, + "loss": 0.8398, + "step": 35721 + }, + { + "epoch": 0.92, + "learning_rate": 1.6284282785531426e-06, + "loss": 0.7729, + "step": 35722 + }, + { + "epoch": 0.92, + "learning_rate": 1.62840675436486e-06, + "loss": 0.873, + "step": 35723 + }, + { + "epoch": 0.92, + "learning_rate": 1.628385229695435e-06, + "loss": 0.8311, + "step": 35724 + }, + { + "epoch": 0.92, + "learning_rate": 1.6283637045448844e-06, + "loss": 0.5376, + "step": 35725 + }, + { + "epoch": 0.92, + "learning_rate": 1.6283421789132246e-06, + "loss": 0.9277, + "step": 35726 + }, + { + "epoch": 0.92, + "learning_rate": 1.628320652800472e-06, + "loss": 0.8418, + "step": 35727 + }, + { + "epoch": 0.92, + "learning_rate": 1.6282991262066432e-06, + "loss": 0.7832, + "step": 35728 + }, + { + "epoch": 0.92, + "learning_rate": 1.6282775991317546e-06, + "loss": 0.7725, + "step": 35729 + }, + { + "epoch": 0.92, + "learning_rate": 1.6282560715758229e-06, + "loss": 0.9238, + "step": 35730 + }, + { + "epoch": 0.92, + "learning_rate": 1.6282345435388646e-06, + "loss": 1.0127, + "step": 35731 + }, + { + "epoch": 0.92, + "learning_rate": 1.6282130150208955e-06, + "loss": 0.8965, + "step": 35732 + }, + { + "epoch": 0.92, + "learning_rate": 1.6281914860219328e-06, + "loss": 0.7793, + "step": 35733 + }, + { + "epoch": 0.92, + "learning_rate": 1.6281699565419929e-06, + "loss": 0.8662, + "step": 35734 + }, + { + "epoch": 0.92, + "learning_rate": 1.6281484265810915e-06, + "loss": 0.5859, + "step": 35735 + }, + { + "epoch": 0.92, + "learning_rate": 1.6281268961392468e-06, + "loss": 0.9287, + "step": 35736 + }, + { + "epoch": 0.92, + "learning_rate": 1.6281053652164735e-06, + "loss": 1.1426, + "step": 35737 + }, + { + "epoch": 0.92, + "learning_rate": 1.628083833812789e-06, + "loss": 0.6318, + "step": 35738 + }, + { + "epoch": 0.92, + "learning_rate": 1.6280623019282093e-06, + "loss": 1.04, + "step": 35739 + }, + { + "epoch": 0.92, + "learning_rate": 1.6280407695627516e-06, + "loss": 1.0332, + "step": 35740 + }, + { + "epoch": 0.92, + "learning_rate": 1.628019236716432e-06, + "loss": 0.7007, + "step": 35741 + }, + { + "epoch": 0.92, + "learning_rate": 1.6279977033892664e-06, + "loss": 1.0459, + "step": 35742 + }, + { + "epoch": 0.92, + "learning_rate": 1.6279761695812723e-06, + "loss": 0.9111, + "step": 35743 + }, + { + "epoch": 0.92, + "learning_rate": 1.6279546352924656e-06, + "loss": 0.8086, + "step": 35744 + }, + { + "epoch": 0.92, + "learning_rate": 1.627933100522863e-06, + "loss": 0.7588, + "step": 35745 + }, + { + "epoch": 0.92, + "learning_rate": 1.6279115652724808e-06, + "loss": 0.9238, + "step": 35746 + }, + { + "epoch": 0.92, + "learning_rate": 1.6278900295413354e-06, + "loss": 0.9106, + "step": 35747 + }, + { + "epoch": 0.92, + "learning_rate": 1.6278684933294438e-06, + "loss": 0.7422, + "step": 35748 + }, + { + "epoch": 0.92, + "learning_rate": 1.627846956636822e-06, + "loss": 0.8623, + "step": 35749 + }, + { + "epoch": 0.92, + "learning_rate": 1.6278254194634866e-06, + "loss": 0.7607, + "step": 35750 + }, + { + "epoch": 0.92, + "learning_rate": 1.6278038818094544e-06, + "loss": 0.7417, + "step": 35751 + }, + { + "epoch": 0.92, + "learning_rate": 1.6277823436747413e-06, + "loss": 0.7363, + "step": 35752 + }, + { + "epoch": 0.92, + "learning_rate": 1.6277608050593642e-06, + "loss": 0.7383, + "step": 35753 + }, + { + "epoch": 0.92, + "learning_rate": 1.6277392659633398e-06, + "loss": 0.9395, + "step": 35754 + }, + { + "epoch": 0.92, + "learning_rate": 1.6277177263866841e-06, + "loss": 0.8916, + "step": 35755 + }, + { + "epoch": 0.92, + "learning_rate": 1.627696186329414e-06, + "loss": 0.7601, + "step": 35756 + }, + { + "epoch": 0.92, + "learning_rate": 1.6276746457915454e-06, + "loss": 1.0112, + "step": 35757 + }, + { + "epoch": 0.92, + "learning_rate": 1.6276531047730955e-06, + "loss": 0.9287, + "step": 35758 + }, + { + "epoch": 0.92, + "learning_rate": 1.6276315632740803e-06, + "loss": 0.8357, + "step": 35759 + }, + { + "epoch": 0.92, + "learning_rate": 1.6276100212945165e-06, + "loss": 0.7979, + "step": 35760 + }, + { + "epoch": 0.92, + "learning_rate": 1.6275884788344206e-06, + "loss": 0.9102, + "step": 35761 + }, + { + "epoch": 0.92, + "learning_rate": 1.6275669358938092e-06, + "loss": 0.6953, + "step": 35762 + }, + { + "epoch": 0.92, + "learning_rate": 1.6275453924726984e-06, + "loss": 0.8936, + "step": 35763 + }, + { + "epoch": 0.92, + "learning_rate": 1.627523848571105e-06, + "loss": 0.771, + "step": 35764 + }, + { + "epoch": 0.92, + "learning_rate": 1.6275023041890457e-06, + "loss": 1.001, + "step": 35765 + }, + { + "epoch": 0.92, + "learning_rate": 1.6274807593265366e-06, + "loss": 0.7688, + "step": 35766 + }, + { + "epoch": 0.92, + "learning_rate": 1.6274592139835942e-06, + "loss": 0.9922, + "step": 35767 + }, + { + "epoch": 0.92, + "learning_rate": 1.627437668160235e-06, + "loss": 0.9082, + "step": 35768 + }, + { + "epoch": 0.92, + "learning_rate": 1.6274161218564759e-06, + "loss": 0.9238, + "step": 35769 + }, + { + "epoch": 0.92, + "learning_rate": 1.627394575072333e-06, + "loss": 0.7021, + "step": 35770 + }, + { + "epoch": 0.92, + "learning_rate": 1.6273730278078231e-06, + "loss": 0.7725, + "step": 35771 + }, + { + "epoch": 0.92, + "learning_rate": 1.6273514800629623e-06, + "loss": 0.8491, + "step": 35772 + }, + { + "epoch": 0.92, + "learning_rate": 1.6273299318377676e-06, + "loss": 0.7261, + "step": 35773 + }, + { + "epoch": 0.92, + "learning_rate": 1.627308383132255e-06, + "loss": 0.8232, + "step": 35774 + }, + { + "epoch": 0.92, + "learning_rate": 1.6272868339464412e-06, + "loss": 0.897, + "step": 35775 + }, + { + "epoch": 0.92, + "learning_rate": 1.6272652842803426e-06, + "loss": 0.9209, + "step": 35776 + }, + { + "epoch": 0.92, + "learning_rate": 1.6272437341339762e-06, + "loss": 0.6318, + "step": 35777 + }, + { + "epoch": 0.92, + "learning_rate": 1.6272221835073579e-06, + "loss": 0.8735, + "step": 35778 + }, + { + "epoch": 0.92, + "learning_rate": 1.6272006324005045e-06, + "loss": 0.9678, + "step": 35779 + }, + { + "epoch": 0.92, + "learning_rate": 1.6271790808134322e-06, + "loss": 0.9912, + "step": 35780 + }, + { + "epoch": 0.92, + "learning_rate": 1.6271575287461578e-06, + "loss": 0.752, + "step": 35781 + }, + { + "epoch": 0.92, + "learning_rate": 1.6271359761986977e-06, + "loss": 0.9053, + "step": 35782 + }, + { + "epoch": 0.92, + "learning_rate": 1.6271144231710684e-06, + "loss": 0.6409, + "step": 35783 + }, + { + "epoch": 0.92, + "learning_rate": 1.6270928696632869e-06, + "loss": 0.835, + "step": 35784 + }, + { + "epoch": 0.92, + "learning_rate": 1.6270713156753687e-06, + "loss": 0.7461, + "step": 35785 + }, + { + "epoch": 0.92, + "learning_rate": 1.627049761207331e-06, + "loss": 1.0889, + "step": 35786 + }, + { + "epoch": 0.92, + "learning_rate": 1.6270282062591903e-06, + "loss": 0.6846, + "step": 35787 + }, + { + "epoch": 0.92, + "learning_rate": 1.6270066508309626e-06, + "loss": 0.6914, + "step": 35788 + }, + { + "epoch": 0.92, + "learning_rate": 1.6269850949226647e-06, + "loss": 0.7573, + "step": 35789 + }, + { + "epoch": 0.92, + "learning_rate": 1.6269635385343134e-06, + "loss": 0.9658, + "step": 35790 + }, + { + "epoch": 0.92, + "learning_rate": 1.626941981665925e-06, + "loss": 1.0049, + "step": 35791 + }, + { + "epoch": 0.92, + "learning_rate": 1.6269204243175154e-06, + "loss": 0.7939, + "step": 35792 + }, + { + "epoch": 0.92, + "learning_rate": 1.6268988664891024e-06, + "loss": 0.9277, + "step": 35793 + }, + { + "epoch": 0.92, + "learning_rate": 1.6268773081807012e-06, + "loss": 0.8057, + "step": 35794 + }, + { + "epoch": 0.92, + "learning_rate": 1.6268557493923289e-06, + "loss": 0.5688, + "step": 35795 + }, + { + "epoch": 0.92, + "learning_rate": 1.6268341901240024e-06, + "loss": 0.7695, + "step": 35796 + }, + { + "epoch": 0.92, + "learning_rate": 1.6268126303757374e-06, + "loss": 0.9619, + "step": 35797 + }, + { + "epoch": 0.92, + "learning_rate": 1.626791070147551e-06, + "loss": 0.9141, + "step": 35798 + }, + { + "epoch": 0.92, + "learning_rate": 1.6267695094394596e-06, + "loss": 0.9961, + "step": 35799 + }, + { + "epoch": 0.92, + "learning_rate": 1.6267479482514795e-06, + "loss": 0.5913, + "step": 35800 + }, + { + "epoch": 0.92, + "learning_rate": 1.6267263865836273e-06, + "loss": 0.8213, + "step": 35801 + }, + { + "epoch": 0.92, + "learning_rate": 1.6267048244359193e-06, + "loss": 0.8896, + "step": 35802 + }, + { + "epoch": 0.92, + "learning_rate": 1.6266832618083726e-06, + "loss": 0.8867, + "step": 35803 + }, + { + "epoch": 0.92, + "learning_rate": 1.6266616987010032e-06, + "loss": 0.7466, + "step": 35804 + }, + { + "epoch": 0.92, + "learning_rate": 1.6266401351138275e-06, + "loss": 0.697, + "step": 35805 + }, + { + "epoch": 0.92, + "learning_rate": 1.6266185710468627e-06, + "loss": 0.8066, + "step": 35806 + }, + { + "epoch": 0.92, + "learning_rate": 1.6265970065001246e-06, + "loss": 0.9961, + "step": 35807 + }, + { + "epoch": 0.92, + "learning_rate": 1.6265754414736299e-06, + "loss": 0.7246, + "step": 35808 + }, + { + "epoch": 0.92, + "learning_rate": 1.6265538759673954e-06, + "loss": 0.8994, + "step": 35809 + }, + { + "epoch": 0.92, + "learning_rate": 1.6265323099814372e-06, + "loss": 0.8887, + "step": 35810 + }, + { + "epoch": 0.92, + "learning_rate": 1.626510743515772e-06, + "loss": 0.6855, + "step": 35811 + }, + { + "epoch": 0.92, + "learning_rate": 1.6264891765704167e-06, + "loss": 0.9805, + "step": 35812 + }, + { + "epoch": 0.92, + "learning_rate": 1.6264676091453872e-06, + "loss": 0.9199, + "step": 35813 + }, + { + "epoch": 0.92, + "learning_rate": 1.6264460412407001e-06, + "loss": 0.8965, + "step": 35814 + }, + { + "epoch": 0.92, + "learning_rate": 1.6264244728563724e-06, + "loss": 0.7905, + "step": 35815 + }, + { + "epoch": 0.92, + "learning_rate": 1.6264029039924203e-06, + "loss": 0.7461, + "step": 35816 + }, + { + "epoch": 0.92, + "learning_rate": 1.62638133464886e-06, + "loss": 0.9014, + "step": 35817 + }, + { + "epoch": 0.92, + "learning_rate": 1.6263597648257084e-06, + "loss": 0.5918, + "step": 35818 + }, + { + "epoch": 0.92, + "learning_rate": 1.6263381945229821e-06, + "loss": 0.877, + "step": 35819 + }, + { + "epoch": 0.92, + "learning_rate": 1.6263166237406973e-06, + "loss": 0.8018, + "step": 35820 + }, + { + "epoch": 0.92, + "learning_rate": 1.6262950524788708e-06, + "loss": 0.7278, + "step": 35821 + }, + { + "epoch": 0.92, + "learning_rate": 1.626273480737519e-06, + "loss": 0.9316, + "step": 35822 + }, + { + "epoch": 0.92, + "learning_rate": 1.6262519085166582e-06, + "loss": 0.7974, + "step": 35823 + }, + { + "epoch": 0.92, + "learning_rate": 1.626230335816305e-06, + "loss": 0.71, + "step": 35824 + }, + { + "epoch": 0.92, + "learning_rate": 1.6262087626364762e-06, + "loss": 0.6541, + "step": 35825 + }, + { + "epoch": 0.92, + "learning_rate": 1.6261871889771883e-06, + "loss": 0.792, + "step": 35826 + }, + { + "epoch": 0.92, + "learning_rate": 1.6261656148384574e-06, + "loss": 0.6631, + "step": 35827 + }, + { + "epoch": 0.92, + "learning_rate": 1.6261440402203004e-06, + "loss": 0.7686, + "step": 35828 + }, + { + "epoch": 0.92, + "learning_rate": 1.6261224651227336e-06, + "loss": 0.915, + "step": 35829 + }, + { + "epoch": 0.92, + "learning_rate": 1.6261008895457735e-06, + "loss": 0.7896, + "step": 35830 + }, + { + "epoch": 0.92, + "learning_rate": 1.6260793134894372e-06, + "loss": 0.7163, + "step": 35831 + }, + { + "epoch": 0.92, + "learning_rate": 1.6260577369537404e-06, + "loss": 0.833, + "step": 35832 + }, + { + "epoch": 0.92, + "learning_rate": 1.6260361599387e-06, + "loss": 0.791, + "step": 35833 + }, + { + "epoch": 0.92, + "learning_rate": 1.6260145824443327e-06, + "loss": 0.9277, + "step": 35834 + }, + { + "epoch": 0.92, + "learning_rate": 1.6259930044706547e-06, + "loss": 0.75, + "step": 35835 + }, + { + "epoch": 0.92, + "learning_rate": 1.6259714260176827e-06, + "loss": 0.8379, + "step": 35836 + }, + { + "epoch": 0.92, + "learning_rate": 1.6259498470854329e-06, + "loss": 0.8179, + "step": 35837 + }, + { + "epoch": 0.92, + "learning_rate": 1.6259282676739224e-06, + "loss": 0.6426, + "step": 35838 + }, + { + "epoch": 0.92, + "learning_rate": 1.625906687783167e-06, + "loss": 0.6636, + "step": 35839 + }, + { + "epoch": 0.92, + "learning_rate": 1.6258851074131838e-06, + "loss": 0.96, + "step": 35840 + }, + { + "epoch": 0.92, + "learning_rate": 1.6258635265639895e-06, + "loss": 0.96, + "step": 35841 + }, + { + "epoch": 0.92, + "learning_rate": 1.6258419452356003e-06, + "loss": 0.8145, + "step": 35842 + }, + { + "epoch": 0.92, + "learning_rate": 1.625820363428032e-06, + "loss": 0.8174, + "step": 35843 + }, + { + "epoch": 0.92, + "learning_rate": 1.6257987811413023e-06, + "loss": 0.3842, + "step": 35844 + }, + { + "epoch": 0.92, + "learning_rate": 1.6257771983754273e-06, + "loss": 0.7256, + "step": 35845 + }, + { + "epoch": 0.92, + "learning_rate": 1.6257556151304238e-06, + "loss": 0.7969, + "step": 35846 + }, + { + "epoch": 0.92, + "learning_rate": 1.6257340314063074e-06, + "loss": 0.7661, + "step": 35847 + }, + { + "epoch": 0.92, + "learning_rate": 1.6257124472030953e-06, + "loss": 0.9023, + "step": 35848 + }, + { + "epoch": 0.92, + "learning_rate": 1.6256908625208042e-06, + "loss": 0.5884, + "step": 35849 + }, + { + "epoch": 0.92, + "learning_rate": 1.62566927735945e-06, + "loss": 0.959, + "step": 35850 + }, + { + "epoch": 0.92, + "learning_rate": 1.6256476917190501e-06, + "loss": 0.7642, + "step": 35851 + }, + { + "epoch": 0.92, + "learning_rate": 1.62562610559962e-06, + "loss": 0.8213, + "step": 35852 + }, + { + "epoch": 0.92, + "learning_rate": 1.625604519001177e-06, + "loss": 0.6338, + "step": 35853 + }, + { + "epoch": 0.92, + "learning_rate": 1.6255829319237375e-06, + "loss": 0.8193, + "step": 35854 + }, + { + "epoch": 0.92, + "learning_rate": 1.6255613443673176e-06, + "loss": 0.6411, + "step": 35855 + }, + { + "epoch": 0.92, + "learning_rate": 1.6255397563319346e-06, + "loss": 0.792, + "step": 35856 + }, + { + "epoch": 0.92, + "learning_rate": 1.6255181678176041e-06, + "loss": 0.8252, + "step": 35857 + }, + { + "epoch": 0.92, + "learning_rate": 1.6254965788243435e-06, + "loss": 0.8223, + "step": 35858 + }, + { + "epoch": 0.92, + "learning_rate": 1.625474989352169e-06, + "loss": 0.8672, + "step": 35859 + }, + { + "epoch": 0.92, + "learning_rate": 1.6254533994010966e-06, + "loss": 0.7061, + "step": 35860 + }, + { + "epoch": 0.92, + "learning_rate": 1.6254318089711437e-06, + "loss": 0.9258, + "step": 35861 + }, + { + "epoch": 0.92, + "learning_rate": 1.625410218062326e-06, + "loss": 0.793, + "step": 35862 + }, + { + "epoch": 0.92, + "learning_rate": 1.6253886266746609e-06, + "loss": 0.8623, + "step": 35863 + }, + { + "epoch": 0.92, + "learning_rate": 1.625367034808164e-06, + "loss": 0.8662, + "step": 35864 + }, + { + "epoch": 0.92, + "learning_rate": 1.6253454424628527e-06, + "loss": 0.7969, + "step": 35865 + }, + { + "epoch": 0.92, + "learning_rate": 1.6253238496387432e-06, + "loss": 0.7803, + "step": 35866 + }, + { + "epoch": 0.92, + "learning_rate": 1.6253022563358518e-06, + "loss": 0.8638, + "step": 35867 + }, + { + "epoch": 0.92, + "learning_rate": 1.625280662554195e-06, + "loss": 0.875, + "step": 35868 + }, + { + "epoch": 0.92, + "learning_rate": 1.6252590682937899e-06, + "loss": 0.5085, + "step": 35869 + }, + { + "epoch": 0.92, + "learning_rate": 1.6252374735546526e-06, + "loss": 0.877, + "step": 35870 + }, + { + "epoch": 0.92, + "learning_rate": 1.6252158783368e-06, + "loss": 0.7744, + "step": 35871 + }, + { + "epoch": 0.92, + "learning_rate": 1.6251942826402478e-06, + "loss": 0.6128, + "step": 35872 + }, + { + "epoch": 0.92, + "learning_rate": 1.6251726864650132e-06, + "loss": 0.8467, + "step": 35873 + }, + { + "epoch": 0.92, + "learning_rate": 1.6251510898111129e-06, + "loss": 0.6753, + "step": 35874 + }, + { + "epoch": 0.92, + "learning_rate": 1.6251294926785631e-06, + "loss": 0.6992, + "step": 35875 + }, + { + "epoch": 0.92, + "learning_rate": 1.6251078950673803e-06, + "loss": 0.9277, + "step": 35876 + }, + { + "epoch": 0.92, + "learning_rate": 1.6250862969775812e-06, + "loss": 0.9111, + "step": 35877 + }, + { + "epoch": 0.92, + "learning_rate": 1.625064698409182e-06, + "loss": 0.793, + "step": 35878 + }, + { + "epoch": 0.92, + "learning_rate": 1.6250430993621996e-06, + "loss": 0.8574, + "step": 35879 + }, + { + "epoch": 0.92, + "learning_rate": 1.6250214998366505e-06, + "loss": 0.8545, + "step": 35880 + }, + { + "epoch": 0.92, + "learning_rate": 1.6249998998325513e-06, + "loss": 0.8252, + "step": 35881 + }, + { + "epoch": 0.92, + "learning_rate": 1.624978299349918e-06, + "loss": 0.7783, + "step": 35882 + }, + { + "epoch": 0.92, + "learning_rate": 1.6249566983887682e-06, + "loss": 0.7827, + "step": 35883 + }, + { + "epoch": 0.92, + "learning_rate": 1.6249350969491173e-06, + "loss": 0.9238, + "step": 35884 + }, + { + "epoch": 0.92, + "learning_rate": 1.6249134950309826e-06, + "loss": 0.8159, + "step": 35885 + }, + { + "epoch": 0.92, + "learning_rate": 1.6248918926343804e-06, + "loss": 0.9229, + "step": 35886 + }, + { + "epoch": 0.92, + "learning_rate": 1.624870289759327e-06, + "loss": 0.8447, + "step": 35887 + }, + { + "epoch": 0.92, + "learning_rate": 1.6248486864058392e-06, + "loss": 0.7998, + "step": 35888 + }, + { + "epoch": 0.92, + "learning_rate": 1.6248270825739335e-06, + "loss": 0.958, + "step": 35889 + }, + { + "epoch": 0.92, + "learning_rate": 1.6248054782636268e-06, + "loss": 0.8037, + "step": 35890 + }, + { + "epoch": 0.92, + "learning_rate": 1.6247838734749347e-06, + "loss": 0.8477, + "step": 35891 + }, + { + "epoch": 0.92, + "learning_rate": 1.6247622682078746e-06, + "loss": 0.8887, + "step": 35892 + }, + { + "epoch": 0.92, + "learning_rate": 1.6247406624624626e-06, + "loss": 0.8867, + "step": 35893 + }, + { + "epoch": 0.92, + "learning_rate": 1.6247190562387155e-06, + "loss": 0.8047, + "step": 35894 + }, + { + "epoch": 0.92, + "learning_rate": 1.6246974495366498e-06, + "loss": 0.7056, + "step": 35895 + }, + { + "epoch": 0.92, + "learning_rate": 1.6246758423562819e-06, + "loss": 0.6155, + "step": 35896 + }, + { + "epoch": 0.92, + "learning_rate": 1.6246542346976285e-06, + "loss": 0.8682, + "step": 35897 + }, + { + "epoch": 0.92, + "learning_rate": 1.624632626560706e-06, + "loss": 1.0293, + "step": 35898 + }, + { + "epoch": 0.92, + "learning_rate": 1.624611017945531e-06, + "loss": 0.7607, + "step": 35899 + }, + { + "epoch": 0.92, + "learning_rate": 1.6245894088521202e-06, + "loss": 0.8545, + "step": 35900 + }, + { + "epoch": 0.92, + "learning_rate": 1.6245677992804897e-06, + "loss": 0.8984, + "step": 35901 + }, + { + "epoch": 0.92, + "learning_rate": 1.6245461892306566e-06, + "loss": 0.8438, + "step": 35902 + }, + { + "epoch": 0.92, + "learning_rate": 1.6245245787026374e-06, + "loss": 0.7959, + "step": 35903 + }, + { + "epoch": 0.92, + "learning_rate": 1.6245029676964482e-06, + "loss": 0.9766, + "step": 35904 + }, + { + "epoch": 0.92, + "learning_rate": 1.6244813562121057e-06, + "loss": 0.876, + "step": 35905 + }, + { + "epoch": 0.92, + "learning_rate": 1.6244597442496267e-06, + "loss": 0.9307, + "step": 35906 + }, + { + "epoch": 0.92, + "learning_rate": 1.6244381318090276e-06, + "loss": 0.5574, + "step": 35907 + }, + { + "epoch": 0.92, + "learning_rate": 1.6244165188903249e-06, + "loss": 0.916, + "step": 35908 + }, + { + "epoch": 0.92, + "learning_rate": 1.624394905493535e-06, + "loss": 0.7061, + "step": 35909 + }, + { + "epoch": 0.92, + "learning_rate": 1.624373291618675e-06, + "loss": 0.98, + "step": 35910 + }, + { + "epoch": 0.92, + "learning_rate": 1.6243516772657608e-06, + "loss": 0.9551, + "step": 35911 + }, + { + "epoch": 0.92, + "learning_rate": 1.6243300624348094e-06, + "loss": 0.7532, + "step": 35912 + }, + { + "epoch": 0.92, + "learning_rate": 1.6243084471258368e-06, + "loss": 0.6694, + "step": 35913 + }, + { + "epoch": 0.92, + "learning_rate": 1.6242868313388604e-06, + "loss": 0.9258, + "step": 35914 + }, + { + "epoch": 0.92, + "learning_rate": 1.6242652150738962e-06, + "loss": 0.3662, + "step": 35915 + }, + { + "epoch": 0.92, + "learning_rate": 1.6242435983309606e-06, + "loss": 0.7405, + "step": 35916 + }, + { + "epoch": 0.92, + "learning_rate": 1.6242219811100705e-06, + "loss": 0.751, + "step": 35917 + }, + { + "epoch": 0.92, + "learning_rate": 1.6242003634112425e-06, + "loss": 0.8496, + "step": 35918 + }, + { + "epoch": 0.92, + "learning_rate": 1.6241787452344927e-06, + "loss": 0.6826, + "step": 35919 + }, + { + "epoch": 0.92, + "learning_rate": 1.6241571265798378e-06, + "loss": 0.7412, + "step": 35920 + }, + { + "epoch": 0.92, + "learning_rate": 1.624135507447295e-06, + "loss": 0.4719, + "step": 35921 + }, + { + "epoch": 0.92, + "learning_rate": 1.6241138878368801e-06, + "loss": 0.7598, + "step": 35922 + }, + { + "epoch": 0.92, + "learning_rate": 1.6240922677486099e-06, + "loss": 0.8438, + "step": 35923 + }, + { + "epoch": 0.92, + "learning_rate": 1.624070647182501e-06, + "loss": 0.7114, + "step": 35924 + }, + { + "epoch": 0.92, + "learning_rate": 1.6240490261385697e-06, + "loss": 0.876, + "step": 35925 + }, + { + "epoch": 0.92, + "learning_rate": 1.624027404616833e-06, + "loss": 0.9785, + "step": 35926 + }, + { + "epoch": 0.92, + "learning_rate": 1.6240057826173069e-06, + "loss": 0.6162, + "step": 35927 + }, + { + "epoch": 0.92, + "learning_rate": 1.6239841601400084e-06, + "loss": 0.7671, + "step": 35928 + }, + { + "epoch": 0.92, + "learning_rate": 1.6239625371849539e-06, + "loss": 0.9648, + "step": 35929 + }, + { + "epoch": 0.92, + "learning_rate": 1.6239409137521603e-06, + "loss": 0.7871, + "step": 35930 + }, + { + "epoch": 0.92, + "learning_rate": 1.6239192898416437e-06, + "loss": 0.8477, + "step": 35931 + }, + { + "epoch": 0.92, + "learning_rate": 1.6238976654534207e-06, + "loss": 0.9424, + "step": 35932 + }, + { + "epoch": 0.92, + "learning_rate": 1.6238760405875077e-06, + "loss": 0.8916, + "step": 35933 + }, + { + "epoch": 0.92, + "learning_rate": 1.6238544152439217e-06, + "loss": 0.8999, + "step": 35934 + }, + { + "epoch": 0.92, + "learning_rate": 1.6238327894226792e-06, + "loss": 0.7153, + "step": 35935 + }, + { + "epoch": 0.92, + "learning_rate": 1.6238111631237966e-06, + "loss": 1.0645, + "step": 35936 + }, + { + "epoch": 0.92, + "learning_rate": 1.6237895363472903e-06, + "loss": 0.6816, + "step": 35937 + }, + { + "epoch": 0.92, + "learning_rate": 1.623767909093177e-06, + "loss": 0.9619, + "step": 35938 + }, + { + "epoch": 0.92, + "learning_rate": 1.6237462813614733e-06, + "loss": 0.834, + "step": 35939 + }, + { + "epoch": 0.92, + "learning_rate": 1.623724653152196e-06, + "loss": 0.7617, + "step": 35940 + }, + { + "epoch": 0.92, + "learning_rate": 1.6237030244653614e-06, + "loss": 0.8438, + "step": 35941 + }, + { + "epoch": 0.92, + "learning_rate": 1.6236813953009857e-06, + "loss": 0.79, + "step": 35942 + }, + { + "epoch": 0.92, + "learning_rate": 1.6236597656590861e-06, + "loss": 0.9453, + "step": 35943 + }, + { + "epoch": 0.92, + "learning_rate": 1.623638135539679e-06, + "loss": 0.709, + "step": 35944 + }, + { + "epoch": 0.92, + "learning_rate": 1.6236165049427807e-06, + "loss": 0.8281, + "step": 35945 + }, + { + "epoch": 0.92, + "learning_rate": 1.623594873868408e-06, + "loss": 0.8489, + "step": 35946 + }, + { + "epoch": 0.92, + "learning_rate": 1.6235732423165774e-06, + "loss": 1.0283, + "step": 35947 + }, + { + "epoch": 0.92, + "learning_rate": 1.6235516102873051e-06, + "loss": 0.96, + "step": 35948 + }, + { + "epoch": 0.92, + "learning_rate": 1.6235299777806084e-06, + "loss": 0.5596, + "step": 35949 + }, + { + "epoch": 0.92, + "learning_rate": 1.6235083447965034e-06, + "loss": 0.917, + "step": 35950 + }, + { + "epoch": 0.92, + "learning_rate": 1.6234867113350066e-06, + "loss": 0.6865, + "step": 35951 + }, + { + "epoch": 0.92, + "learning_rate": 1.6234650773961347e-06, + "loss": 0.7715, + "step": 35952 + }, + { + "epoch": 0.92, + "learning_rate": 1.6234434429799043e-06, + "loss": 0.562, + "step": 35953 + }, + { + "epoch": 0.92, + "learning_rate": 1.623421808086332e-06, + "loss": 0.8574, + "step": 35954 + }, + { + "epoch": 0.92, + "learning_rate": 1.623400172715434e-06, + "loss": 0.772, + "step": 35955 + }, + { + "epoch": 0.92, + "learning_rate": 1.6233785368672278e-06, + "loss": 0.8516, + "step": 35956 + }, + { + "epoch": 0.92, + "learning_rate": 1.6233569005417285e-06, + "loss": 0.8516, + "step": 35957 + }, + { + "epoch": 0.92, + "learning_rate": 1.623335263738954e-06, + "loss": 0.9561, + "step": 35958 + }, + { + "epoch": 0.92, + "learning_rate": 1.6233136264589202e-06, + "loss": 0.8008, + "step": 35959 + }, + { + "epoch": 0.92, + "learning_rate": 1.6232919887016441e-06, + "loss": 0.8179, + "step": 35960 + }, + { + "epoch": 0.92, + "learning_rate": 1.6232703504671416e-06, + "loss": 0.8203, + "step": 35961 + }, + { + "epoch": 0.92, + "learning_rate": 1.6232487117554297e-06, + "loss": 0.8037, + "step": 35962 + }, + { + "epoch": 0.92, + "learning_rate": 1.623227072566525e-06, + "loss": 0.8389, + "step": 35963 + }, + { + "epoch": 0.92, + "learning_rate": 1.6232054329004439e-06, + "loss": 0.8779, + "step": 35964 + }, + { + "epoch": 0.92, + "learning_rate": 1.6231837927572032e-06, + "loss": 0.8076, + "step": 35965 + }, + { + "epoch": 0.92, + "learning_rate": 1.6231621521368192e-06, + "loss": 0.6655, + "step": 35966 + }, + { + "epoch": 0.92, + "learning_rate": 1.6231405110393087e-06, + "loss": 0.8594, + "step": 35967 + }, + { + "epoch": 0.92, + "learning_rate": 1.6231188694646881e-06, + "loss": 0.8457, + "step": 35968 + }, + { + "epoch": 0.92, + "learning_rate": 1.6230972274129743e-06, + "loss": 0.8066, + "step": 35969 + }, + { + "epoch": 0.92, + "learning_rate": 1.6230755848841833e-06, + "loss": 0.7324, + "step": 35970 + }, + { + "epoch": 0.92, + "learning_rate": 1.6230539418783317e-06, + "loss": 0.686, + "step": 35971 + }, + { + "epoch": 0.92, + "learning_rate": 1.6230322983954367e-06, + "loss": 0.7676, + "step": 35972 + }, + { + "epoch": 0.92, + "learning_rate": 1.6230106544355143e-06, + "loss": 0.8076, + "step": 35973 + }, + { + "epoch": 0.92, + "learning_rate": 1.6229890099985818e-06, + "loss": 0.7295, + "step": 35974 + }, + { + "epoch": 0.92, + "learning_rate": 1.6229673650846549e-06, + "loss": 0.957, + "step": 35975 + }, + { + "epoch": 0.92, + "learning_rate": 1.6229457196937508e-06, + "loss": 1.0547, + "step": 35976 + }, + { + "epoch": 0.92, + "learning_rate": 1.6229240738258856e-06, + "loss": 0.6523, + "step": 35977 + }, + { + "epoch": 0.92, + "learning_rate": 1.622902427481076e-06, + "loss": 0.874, + "step": 35978 + }, + { + "epoch": 0.92, + "learning_rate": 1.6228807806593386e-06, + "loss": 0.9336, + "step": 35979 + }, + { + "epoch": 0.92, + "learning_rate": 1.6228591333606902e-06, + "loss": 0.7549, + "step": 35980 + }, + { + "epoch": 0.92, + "learning_rate": 1.6228374855851472e-06, + "loss": 0.9668, + "step": 35981 + }, + { + "epoch": 0.92, + "learning_rate": 1.622815837332726e-06, + "loss": 0.9678, + "step": 35982 + }, + { + "epoch": 0.92, + "learning_rate": 1.6227941886034435e-06, + "loss": 0.9287, + "step": 35983 + }, + { + "epoch": 0.92, + "learning_rate": 1.622772539397316e-06, + "loss": 0.875, + "step": 35984 + }, + { + "epoch": 0.92, + "learning_rate": 1.6227508897143605e-06, + "loss": 0.4636, + "step": 35985 + }, + { + "epoch": 0.92, + "learning_rate": 1.6227292395545931e-06, + "loss": 0.5842, + "step": 35986 + }, + { + "epoch": 0.92, + "learning_rate": 1.6227075889180303e-06, + "loss": 0.6948, + "step": 35987 + }, + { + "epoch": 0.92, + "learning_rate": 1.6226859378046894e-06, + "loss": 0.7881, + "step": 35988 + }, + { + "epoch": 0.92, + "learning_rate": 1.622664286214586e-06, + "loss": 0.9004, + "step": 35989 + }, + { + "epoch": 0.92, + "learning_rate": 1.6226426341477378e-06, + "loss": 0.9707, + "step": 35990 + }, + { + "epoch": 0.92, + "learning_rate": 1.6226209816041604e-06, + "loss": 0.8809, + "step": 35991 + }, + { + "epoch": 0.92, + "learning_rate": 1.6225993285838706e-06, + "loss": 0.6445, + "step": 35992 + }, + { + "epoch": 0.92, + "learning_rate": 1.6225776750868852e-06, + "loss": 0.6782, + "step": 35993 + }, + { + "epoch": 0.92, + "learning_rate": 1.6225560211132207e-06, + "loss": 0.8838, + "step": 35994 + }, + { + "epoch": 0.92, + "learning_rate": 1.6225343666628942e-06, + "loss": 0.7773, + "step": 35995 + }, + { + "epoch": 0.92, + "learning_rate": 1.6225127117359213e-06, + "loss": 1.0215, + "step": 35996 + }, + { + "epoch": 0.92, + "learning_rate": 1.6224910563323189e-06, + "loss": 1.0391, + "step": 35997 + }, + { + "epoch": 0.92, + "learning_rate": 1.622469400452104e-06, + "loss": 0.8142, + "step": 35998 + }, + { + "epoch": 0.92, + "learning_rate": 1.6224477440952926e-06, + "loss": 0.8682, + "step": 35999 + }, + { + "epoch": 0.92, + "learning_rate": 1.622426087261902e-06, + "loss": 1.1377, + "step": 36000 + }, + { + "epoch": 0.92, + "learning_rate": 1.6224044299519481e-06, + "loss": 0.9082, + "step": 36001 + }, + { + "epoch": 0.92, + "learning_rate": 1.6223827721654477e-06, + "loss": 0.7227, + "step": 36002 + }, + { + "epoch": 0.92, + "learning_rate": 1.6223611139024175e-06, + "loss": 0.834, + "step": 36003 + }, + { + "epoch": 0.92, + "learning_rate": 1.6223394551628743e-06, + "loss": 0.9082, + "step": 36004 + }, + { + "epoch": 0.92, + "learning_rate": 1.622317795946834e-06, + "loss": 0.8115, + "step": 36005 + }, + { + "epoch": 0.92, + "learning_rate": 1.6222961362543137e-06, + "loss": 0.6672, + "step": 36006 + }, + { + "epoch": 0.92, + "learning_rate": 1.6222744760853297e-06, + "loss": 0.8789, + "step": 36007 + }, + { + "epoch": 0.92, + "learning_rate": 1.622252815439899e-06, + "loss": 0.7617, + "step": 36008 + }, + { + "epoch": 0.92, + "learning_rate": 1.6222311543180378e-06, + "loss": 0.9961, + "step": 36009 + }, + { + "epoch": 0.92, + "learning_rate": 1.6222094927197629e-06, + "loss": 0.9805, + "step": 36010 + }, + { + "epoch": 0.92, + "learning_rate": 1.6221878306450908e-06, + "loss": 0.876, + "step": 36011 + }, + { + "epoch": 0.92, + "learning_rate": 1.6221661680940382e-06, + "loss": 0.6919, + "step": 36012 + }, + { + "epoch": 0.92, + "learning_rate": 1.6221445050666213e-06, + "loss": 0.8901, + "step": 36013 + }, + { + "epoch": 0.92, + "learning_rate": 1.6221228415628573e-06, + "loss": 0.7651, + "step": 36014 + }, + { + "epoch": 0.92, + "learning_rate": 1.622101177582762e-06, + "loss": 0.8262, + "step": 36015 + }, + { + "epoch": 0.92, + "learning_rate": 1.6220795131263528e-06, + "loss": 0.6797, + "step": 36016 + }, + { + "epoch": 0.92, + "learning_rate": 1.6220578481936458e-06, + "loss": 0.6616, + "step": 36017 + }, + { + "epoch": 0.92, + "learning_rate": 1.6220361827846575e-06, + "loss": 0.7373, + "step": 36018 + }, + { + "epoch": 0.92, + "learning_rate": 1.6220145168994048e-06, + "loss": 0.6484, + "step": 36019 + }, + { + "epoch": 0.92, + "learning_rate": 1.6219928505379047e-06, + "loss": 0.7229, + "step": 36020 + }, + { + "epoch": 0.92, + "learning_rate": 1.6219711837001725e-06, + "loss": 0.7456, + "step": 36021 + }, + { + "epoch": 0.92, + "learning_rate": 1.621949516386226e-06, + "loss": 0.9297, + "step": 36022 + }, + { + "epoch": 0.92, + "learning_rate": 1.6219278485960813e-06, + "loss": 0.8027, + "step": 36023 + }, + { + "epoch": 0.92, + "learning_rate": 1.6219061803297549e-06, + "loss": 0.522, + "step": 36024 + }, + { + "epoch": 0.92, + "learning_rate": 1.6218845115872637e-06, + "loss": 0.7083, + "step": 36025 + }, + { + "epoch": 0.92, + "learning_rate": 1.6218628423686243e-06, + "loss": 0.6572, + "step": 36026 + }, + { + "epoch": 0.92, + "learning_rate": 1.6218411726738528e-06, + "loss": 0.8218, + "step": 36027 + }, + { + "epoch": 0.92, + "learning_rate": 1.6218195025029661e-06, + "loss": 0.7678, + "step": 36028 + }, + { + "epoch": 0.92, + "learning_rate": 1.621797831855981e-06, + "loss": 0.8447, + "step": 36029 + }, + { + "epoch": 0.92, + "learning_rate": 1.6217761607329137e-06, + "loss": 1.0107, + "step": 36030 + }, + { + "epoch": 0.92, + "learning_rate": 1.621754489133781e-06, + "loss": 0.8271, + "step": 36031 + }, + { + "epoch": 0.92, + "learning_rate": 1.6217328170585997e-06, + "loss": 0.5933, + "step": 36032 + }, + { + "epoch": 0.92, + "learning_rate": 1.621711144507386e-06, + "loss": 0.9287, + "step": 36033 + }, + { + "epoch": 0.92, + "learning_rate": 1.6216894714801566e-06, + "loss": 1.0537, + "step": 36034 + }, + { + "epoch": 0.92, + "learning_rate": 1.6216677979769282e-06, + "loss": 0.8784, + "step": 36035 + }, + { + "epoch": 0.92, + "learning_rate": 1.6216461239977176e-06, + "loss": 1.0469, + "step": 36036 + }, + { + "epoch": 0.92, + "learning_rate": 1.6216244495425406e-06, + "loss": 0.6504, + "step": 36037 + }, + { + "epoch": 0.92, + "learning_rate": 1.6216027746114146e-06, + "loss": 0.9912, + "step": 36038 + }, + { + "epoch": 0.92, + "learning_rate": 1.6215810992043562e-06, + "loss": 0.9688, + "step": 36039 + }, + { + "epoch": 0.92, + "learning_rate": 1.6215594233213816e-06, + "loss": 0.7178, + "step": 36040 + }, + { + "epoch": 0.92, + "learning_rate": 1.6215377469625072e-06, + "loss": 0.7861, + "step": 36041 + }, + { + "epoch": 0.92, + "learning_rate": 1.6215160701277505e-06, + "loss": 0.7578, + "step": 36042 + }, + { + "epoch": 0.92, + "learning_rate": 1.621494392817127e-06, + "loss": 0.9668, + "step": 36043 + }, + { + "epoch": 0.92, + "learning_rate": 1.621472715030654e-06, + "loss": 1.001, + "step": 36044 + }, + { + "epoch": 0.92, + "learning_rate": 1.6214510367683484e-06, + "loss": 1.0264, + "step": 36045 + }, + { + "epoch": 0.92, + "learning_rate": 1.6214293580302256e-06, + "loss": 0.8076, + "step": 36046 + }, + { + "epoch": 0.92, + "learning_rate": 1.6214076788163032e-06, + "loss": 0.7764, + "step": 36047 + }, + { + "epoch": 0.92, + "learning_rate": 1.6213859991265975e-06, + "loss": 0.7451, + "step": 36048 + }, + { + "epoch": 0.92, + "learning_rate": 1.6213643189611253e-06, + "loss": 0.9678, + "step": 36049 + }, + { + "epoch": 0.92, + "learning_rate": 1.6213426383199029e-06, + "loss": 0.8135, + "step": 36050 + }, + { + "epoch": 0.92, + "learning_rate": 1.621320957202947e-06, + "loss": 0.8906, + "step": 36051 + }, + { + "epoch": 0.92, + "learning_rate": 1.621299275610274e-06, + "loss": 0.9111, + "step": 36052 + }, + { + "epoch": 0.92, + "learning_rate": 1.6212775935419007e-06, + "loss": 1.0537, + "step": 36053 + }, + { + "epoch": 0.92, + "learning_rate": 1.6212559109978438e-06, + "loss": 0.8271, + "step": 36054 + }, + { + "epoch": 0.92, + "learning_rate": 1.6212342279781202e-06, + "loss": 0.646, + "step": 36055 + }, + { + "epoch": 0.92, + "learning_rate": 1.621212544482746e-06, + "loss": 0.8789, + "step": 36056 + }, + { + "epoch": 0.92, + "learning_rate": 1.6211908605117374e-06, + "loss": 0.8965, + "step": 36057 + }, + { + "epoch": 0.92, + "learning_rate": 1.6211691760651119e-06, + "loss": 0.9619, + "step": 36058 + }, + { + "epoch": 0.92, + "learning_rate": 1.6211474911428856e-06, + "loss": 1.1113, + "step": 36059 + }, + { + "epoch": 0.92, + "learning_rate": 1.6211258057450753e-06, + "loss": 0.6841, + "step": 36060 + }, + { + "epoch": 0.92, + "learning_rate": 1.6211041198716977e-06, + "loss": 0.9062, + "step": 36061 + }, + { + "epoch": 0.92, + "learning_rate": 1.621082433522769e-06, + "loss": 0.7319, + "step": 36062 + }, + { + "epoch": 0.92, + "learning_rate": 1.6210607466983062e-06, + "loss": 0.7466, + "step": 36063 + }, + { + "epoch": 0.92, + "learning_rate": 1.6210390593983254e-06, + "loss": 1.0303, + "step": 36064 + }, + { + "epoch": 0.92, + "learning_rate": 1.6210173716228441e-06, + "loss": 0.8867, + "step": 36065 + }, + { + "epoch": 0.92, + "learning_rate": 1.6209956833718779e-06, + "loss": 0.959, + "step": 36066 + }, + { + "epoch": 0.92, + "learning_rate": 1.620973994645444e-06, + "loss": 0.6753, + "step": 36067 + }, + { + "epoch": 0.92, + "learning_rate": 1.6209523054435587e-06, + "loss": 0.8828, + "step": 36068 + }, + { + "epoch": 0.92, + "learning_rate": 1.620930615766239e-06, + "loss": 0.584, + "step": 36069 + }, + { + "epoch": 0.92, + "learning_rate": 1.6209089256135014e-06, + "loss": 0.8887, + "step": 36070 + }, + { + "epoch": 0.92, + "learning_rate": 1.6208872349853622e-06, + "loss": 0.7344, + "step": 36071 + }, + { + "epoch": 0.92, + "learning_rate": 1.6208655438818382e-06, + "loss": 0.6177, + "step": 36072 + }, + { + "epoch": 0.92, + "learning_rate": 1.620843852302946e-06, + "loss": 0.7388, + "step": 36073 + }, + { + "epoch": 0.92, + "learning_rate": 1.6208221602487021e-06, + "loss": 0.9121, + "step": 36074 + }, + { + "epoch": 0.92, + "learning_rate": 1.6208004677191237e-06, + "loss": 0.7397, + "step": 36075 + }, + { + "epoch": 0.92, + "learning_rate": 1.6207787747142265e-06, + "loss": 0.8193, + "step": 36076 + }, + { + "epoch": 0.92, + "learning_rate": 1.6207570812340274e-06, + "loss": 0.7666, + "step": 36077 + }, + { + "epoch": 0.92, + "learning_rate": 1.6207353872785433e-06, + "loss": 0.5269, + "step": 36078 + }, + { + "epoch": 0.92, + "learning_rate": 1.620713692847791e-06, + "loss": 0.853, + "step": 36079 + }, + { + "epoch": 0.92, + "learning_rate": 1.6206919979417864e-06, + "loss": 0.7305, + "step": 36080 + }, + { + "epoch": 0.92, + "learning_rate": 1.6206703025605463e-06, + "loss": 0.9004, + "step": 36081 + }, + { + "epoch": 0.92, + "learning_rate": 1.6206486067040878e-06, + "loss": 0.9316, + "step": 36082 + }, + { + "epoch": 0.92, + "learning_rate": 1.6206269103724272e-06, + "loss": 0.8975, + "step": 36083 + }, + { + "epoch": 0.92, + "learning_rate": 1.620605213565581e-06, + "loss": 0.71, + "step": 36084 + }, + { + "epoch": 0.92, + "learning_rate": 1.620583516283566e-06, + "loss": 0.9717, + "step": 36085 + }, + { + "epoch": 0.92, + "learning_rate": 1.6205618185263988e-06, + "loss": 0.7188, + "step": 36086 + }, + { + "epoch": 0.92, + "learning_rate": 1.6205401202940958e-06, + "loss": 0.6924, + "step": 36087 + }, + { + "epoch": 0.92, + "learning_rate": 1.6205184215866737e-06, + "loss": 0.8896, + "step": 36088 + }, + { + "epoch": 0.92, + "learning_rate": 1.6204967224041494e-06, + "loss": 0.8145, + "step": 36089 + }, + { + "epoch": 0.93, + "learning_rate": 1.620475022746539e-06, + "loss": 0.8896, + "step": 36090 + }, + { + "epoch": 0.93, + "learning_rate": 1.6204533226138599e-06, + "loss": 0.7554, + "step": 36091 + }, + { + "epoch": 0.93, + "learning_rate": 1.6204316220061278e-06, + "loss": 1.0381, + "step": 36092 + }, + { + "epoch": 0.93, + "learning_rate": 1.6204099209233597e-06, + "loss": 0.7832, + "step": 36093 + }, + { + "epoch": 0.93, + "learning_rate": 1.6203882193655726e-06, + "loss": 1.0586, + "step": 36094 + }, + { + "epoch": 0.93, + "learning_rate": 1.6203665173327825e-06, + "loss": 0.8105, + "step": 36095 + }, + { + "epoch": 0.93, + "learning_rate": 1.6203448148250064e-06, + "loss": 0.7578, + "step": 36096 + }, + { + "epoch": 0.93, + "learning_rate": 1.6203231118422606e-06, + "loss": 0.6323, + "step": 36097 + }, + { + "epoch": 0.93, + "learning_rate": 1.620301408384562e-06, + "loss": 0.8896, + "step": 36098 + }, + { + "epoch": 0.93, + "learning_rate": 1.6202797044519275e-06, + "loss": 0.9102, + "step": 36099 + }, + { + "epoch": 0.93, + "learning_rate": 1.6202580000443732e-06, + "loss": 0.8057, + "step": 36100 + }, + { + "epoch": 0.93, + "learning_rate": 1.6202362951619154e-06, + "loss": 0.9707, + "step": 36101 + }, + { + "epoch": 0.93, + "learning_rate": 1.6202145898045717e-06, + "loss": 0.8594, + "step": 36102 + }, + { + "epoch": 0.93, + "learning_rate": 1.6201928839723577e-06, + "loss": 0.6189, + "step": 36103 + }, + { + "epoch": 0.93, + "learning_rate": 1.620171177665291e-06, + "loss": 0.8379, + "step": 36104 + }, + { + "epoch": 0.93, + "learning_rate": 1.6201494708833879e-06, + "loss": 1.0322, + "step": 36105 + }, + { + "epoch": 0.93, + "learning_rate": 1.6201277636266642e-06, + "loss": 0.8457, + "step": 36106 + }, + { + "epoch": 0.93, + "learning_rate": 1.6201060558951376e-06, + "loss": 0.9512, + "step": 36107 + }, + { + "epoch": 0.93, + "learning_rate": 1.6200843476888242e-06, + "loss": 1.0449, + "step": 36108 + }, + { + "epoch": 0.93, + "learning_rate": 1.6200626390077407e-06, + "loss": 1.0049, + "step": 36109 + }, + { + "epoch": 0.93, + "learning_rate": 1.6200409298519039e-06, + "loss": 0.8711, + "step": 36110 + }, + { + "epoch": 0.93, + "learning_rate": 1.6200192202213303e-06, + "loss": 0.752, + "step": 36111 + }, + { + "epoch": 0.93, + "learning_rate": 1.6199975101160363e-06, + "loss": 0.8657, + "step": 36112 + }, + { + "epoch": 0.93, + "learning_rate": 1.6199757995360388e-06, + "loss": 0.9092, + "step": 36113 + }, + { + "epoch": 0.93, + "learning_rate": 1.6199540884813543e-06, + "loss": 0.8457, + "step": 36114 + }, + { + "epoch": 0.93, + "learning_rate": 1.6199323769519997e-06, + "loss": 0.9141, + "step": 36115 + }, + { + "epoch": 0.93, + "learning_rate": 1.6199106649479913e-06, + "loss": 0.9844, + "step": 36116 + }, + { + "epoch": 0.93, + "learning_rate": 1.6198889524693455e-06, + "loss": 0.999, + "step": 36117 + }, + { + "epoch": 0.93, + "learning_rate": 1.6198672395160796e-06, + "loss": 0.8652, + "step": 36118 + }, + { + "epoch": 0.93, + "learning_rate": 1.6198455260882095e-06, + "loss": 0.7026, + "step": 36119 + }, + { + "epoch": 0.93, + "learning_rate": 1.6198238121857523e-06, + "loss": 0.8306, + "step": 36120 + }, + { + "epoch": 0.93, + "learning_rate": 1.6198020978087246e-06, + "loss": 0.7119, + "step": 36121 + }, + { + "epoch": 0.93, + "learning_rate": 1.619780382957143e-06, + "loss": 0.8887, + "step": 36122 + }, + { + "epoch": 0.93, + "learning_rate": 1.6197586676310237e-06, + "loss": 1.1035, + "step": 36123 + }, + { + "epoch": 0.93, + "learning_rate": 1.6197369518303841e-06, + "loss": 0.7285, + "step": 36124 + }, + { + "epoch": 0.93, + "learning_rate": 1.6197152355552403e-06, + "loss": 1.1201, + "step": 36125 + }, + { + "epoch": 0.93, + "learning_rate": 1.619693518805609e-06, + "loss": 0.8301, + "step": 36126 + }, + { + "epoch": 0.93, + "learning_rate": 1.6196718015815068e-06, + "loss": 0.8311, + "step": 36127 + }, + { + "epoch": 0.93, + "learning_rate": 1.6196500838829503e-06, + "loss": 0.6008, + "step": 36128 + }, + { + "epoch": 0.93, + "learning_rate": 1.6196283657099565e-06, + "loss": 0.8721, + "step": 36129 + }, + { + "epoch": 0.93, + "learning_rate": 1.6196066470625417e-06, + "loss": 0.7427, + "step": 36130 + }, + { + "epoch": 0.93, + "learning_rate": 1.6195849279407226e-06, + "loss": 0.7266, + "step": 36131 + }, + { + "epoch": 0.93, + "learning_rate": 1.6195632083445157e-06, + "loss": 0.8701, + "step": 36132 + }, + { + "epoch": 0.93, + "learning_rate": 1.6195414882739375e-06, + "loss": 0.8906, + "step": 36133 + }, + { + "epoch": 0.93, + "learning_rate": 1.6195197677290052e-06, + "loss": 0.9629, + "step": 36134 + }, + { + "epoch": 0.93, + "learning_rate": 1.6194980467097353e-06, + "loss": 0.8213, + "step": 36135 + }, + { + "epoch": 0.93, + "learning_rate": 1.6194763252161439e-06, + "loss": 0.8774, + "step": 36136 + }, + { + "epoch": 0.93, + "learning_rate": 1.6194546032482479e-06, + "loss": 0.8672, + "step": 36137 + }, + { + "epoch": 0.93, + "learning_rate": 1.6194328808060642e-06, + "loss": 0.9336, + "step": 36138 + }, + { + "epoch": 0.93, + "learning_rate": 1.619411157889609e-06, + "loss": 0.9375, + "step": 36139 + }, + { + "epoch": 0.93, + "learning_rate": 1.6193894344988993e-06, + "loss": 0.752, + "step": 36140 + }, + { + "epoch": 0.93, + "learning_rate": 1.6193677106339515e-06, + "loss": 0.7871, + "step": 36141 + }, + { + "epoch": 0.93, + "learning_rate": 1.6193459862947828e-06, + "loss": 0.8672, + "step": 36142 + }, + { + "epoch": 0.93, + "learning_rate": 1.6193242614814088e-06, + "loss": 0.7891, + "step": 36143 + }, + { + "epoch": 0.93, + "learning_rate": 1.6193025361938469e-06, + "loss": 0.8398, + "step": 36144 + }, + { + "epoch": 0.93, + "learning_rate": 1.6192808104321136e-06, + "loss": 0.6797, + "step": 36145 + }, + { + "epoch": 0.93, + "learning_rate": 1.619259084196225e-06, + "loss": 0.8818, + "step": 36146 + }, + { + "epoch": 0.93, + "learning_rate": 1.6192373574861988e-06, + "loss": 0.7966, + "step": 36147 + }, + { + "epoch": 0.93, + "learning_rate": 1.6192156303020507e-06, + "loss": 0.918, + "step": 36148 + }, + { + "epoch": 0.93, + "learning_rate": 1.6191939026437978e-06, + "loss": 0.7119, + "step": 36149 + }, + { + "epoch": 0.93, + "learning_rate": 1.6191721745114567e-06, + "loss": 0.6406, + "step": 36150 + }, + { + "epoch": 0.93, + "learning_rate": 1.6191504459050435e-06, + "loss": 0.793, + "step": 36151 + }, + { + "epoch": 0.93, + "learning_rate": 1.6191287168245754e-06, + "loss": 0.8604, + "step": 36152 + }, + { + "epoch": 0.93, + "learning_rate": 1.6191069872700692e-06, + "loss": 0.9697, + "step": 36153 + }, + { + "epoch": 0.93, + "learning_rate": 1.619085257241541e-06, + "loss": 0.6533, + "step": 36154 + }, + { + "epoch": 0.93, + "learning_rate": 1.619063526739008e-06, + "loss": 0.8359, + "step": 36155 + }, + { + "epoch": 0.93, + "learning_rate": 1.6190417957624863e-06, + "loss": 0.686, + "step": 36156 + }, + { + "epoch": 0.93, + "learning_rate": 1.6190200643119927e-06, + "loss": 0.7314, + "step": 36157 + }, + { + "epoch": 0.93, + "learning_rate": 1.618998332387544e-06, + "loss": 0.8359, + "step": 36158 + }, + { + "epoch": 0.93, + "learning_rate": 1.6189765999891564e-06, + "loss": 0.9033, + "step": 36159 + }, + { + "epoch": 0.93, + "learning_rate": 1.6189548671168475e-06, + "loss": 0.8413, + "step": 36160 + }, + { + "epoch": 0.93, + "learning_rate": 1.618933133770633e-06, + "loss": 0.8223, + "step": 36161 + }, + { + "epoch": 0.93, + "learning_rate": 1.6189113999505298e-06, + "loss": 0.7627, + "step": 36162 + }, + { + "epoch": 0.93, + "learning_rate": 1.6188896656565547e-06, + "loss": 0.7324, + "step": 36163 + }, + { + "epoch": 0.93, + "learning_rate": 1.6188679308887241e-06, + "loss": 0.9434, + "step": 36164 + }, + { + "epoch": 0.93, + "learning_rate": 1.6188461956470549e-06, + "loss": 0.7422, + "step": 36165 + }, + { + "epoch": 0.93, + "learning_rate": 1.6188244599315638e-06, + "loss": 0.7627, + "step": 36166 + }, + { + "epoch": 0.93, + "learning_rate": 1.618802723742267e-06, + "loss": 0.9932, + "step": 36167 + }, + { + "epoch": 0.93, + "learning_rate": 1.6187809870791815e-06, + "loss": 0.8086, + "step": 36168 + }, + { + "epoch": 0.93, + "learning_rate": 1.6187592499423237e-06, + "loss": 0.7295, + "step": 36169 + }, + { + "epoch": 0.93, + "learning_rate": 1.6187375123317106e-06, + "loss": 0.7559, + "step": 36170 + }, + { + "epoch": 0.93, + "learning_rate": 1.6187157742473585e-06, + "loss": 0.8584, + "step": 36171 + }, + { + "epoch": 0.93, + "learning_rate": 1.6186940356892844e-06, + "loss": 1.0635, + "step": 36172 + }, + { + "epoch": 0.93, + "learning_rate": 1.6186722966575044e-06, + "loss": 0.7949, + "step": 36173 + }, + { + "epoch": 0.93, + "learning_rate": 1.6186505571520356e-06, + "loss": 0.9141, + "step": 36174 + }, + { + "epoch": 0.93, + "learning_rate": 1.6186288171728948e-06, + "loss": 0.96, + "step": 36175 + }, + { + "epoch": 0.93, + "learning_rate": 1.6186070767200982e-06, + "loss": 0.546, + "step": 36176 + }, + { + "epoch": 0.93, + "learning_rate": 1.6185853357936624e-06, + "loss": 0.6758, + "step": 36177 + }, + { + "epoch": 0.93, + "learning_rate": 1.6185635943936043e-06, + "loss": 0.9443, + "step": 36178 + }, + { + "epoch": 0.93, + "learning_rate": 1.6185418525199404e-06, + "loss": 0.7969, + "step": 36179 + }, + { + "epoch": 0.93, + "learning_rate": 1.618520110172688e-06, + "loss": 0.7375, + "step": 36180 + }, + { + "epoch": 0.93, + "learning_rate": 1.6184983673518627e-06, + "loss": 0.9453, + "step": 36181 + }, + { + "epoch": 0.93, + "learning_rate": 1.6184766240574817e-06, + "loss": 0.9492, + "step": 36182 + }, + { + "epoch": 0.93, + "learning_rate": 1.6184548802895615e-06, + "loss": 0.8105, + "step": 36183 + }, + { + "epoch": 0.93, + "learning_rate": 1.618433136048119e-06, + "loss": 0.9932, + "step": 36184 + }, + { + "epoch": 0.93, + "learning_rate": 1.6184113913331706e-06, + "loss": 0.5708, + "step": 36185 + }, + { + "epoch": 0.93, + "learning_rate": 1.6183896461447333e-06, + "loss": 0.8906, + "step": 36186 + }, + { + "epoch": 0.93, + "learning_rate": 1.618367900482823e-06, + "loss": 0.9902, + "step": 36187 + }, + { + "epoch": 0.93, + "learning_rate": 1.6183461543474573e-06, + "loss": 0.8096, + "step": 36188 + }, + { + "epoch": 0.93, + "learning_rate": 1.618324407738652e-06, + "loss": 0.6846, + "step": 36189 + }, + { + "epoch": 0.93, + "learning_rate": 1.6183026606564244e-06, + "loss": 0.8359, + "step": 36190 + }, + { + "epoch": 0.93, + "learning_rate": 1.618280913100791e-06, + "loss": 0.9072, + "step": 36191 + }, + { + "epoch": 0.93, + "learning_rate": 1.6182591650717679e-06, + "loss": 0.5708, + "step": 36192 + }, + { + "epoch": 0.93, + "learning_rate": 1.6182374165693724e-06, + "loss": 0.6807, + "step": 36193 + }, + { + "epoch": 0.93, + "learning_rate": 1.618215667593621e-06, + "loss": 0.6753, + "step": 36194 + }, + { + "epoch": 0.93, + "learning_rate": 1.6181939181445303e-06, + "loss": 0.8779, + "step": 36195 + }, + { + "epoch": 0.93, + "learning_rate": 1.6181721682221167e-06, + "loss": 0.7441, + "step": 36196 + }, + { + "epoch": 0.93, + "learning_rate": 1.6181504178263974e-06, + "loss": 0.833, + "step": 36197 + }, + { + "epoch": 0.93, + "learning_rate": 1.6181286669573887e-06, + "loss": 0.8027, + "step": 36198 + }, + { + "epoch": 0.93, + "learning_rate": 1.6181069156151073e-06, + "loss": 0.9863, + "step": 36199 + }, + { + "epoch": 0.93, + "learning_rate": 1.6180851637995695e-06, + "loss": 0.8296, + "step": 36200 + }, + { + "epoch": 0.93, + "learning_rate": 1.6180634115107928e-06, + "loss": 1.0049, + "step": 36201 + }, + { + "epoch": 0.93, + "learning_rate": 1.6180416587487931e-06, + "loss": 0.8345, + "step": 36202 + }, + { + "epoch": 0.93, + "learning_rate": 1.6180199055135875e-06, + "loss": 0.7656, + "step": 36203 + }, + { + "epoch": 0.93, + "learning_rate": 1.6179981518051925e-06, + "loss": 0.876, + "step": 36204 + }, + { + "epoch": 0.93, + "learning_rate": 1.6179763976236242e-06, + "loss": 0.7173, + "step": 36205 + }, + { + "epoch": 0.93, + "learning_rate": 1.6179546429689005e-06, + "loss": 0.7598, + "step": 36206 + }, + { + "epoch": 0.93, + "learning_rate": 1.6179328878410368e-06, + "loss": 0.7495, + "step": 36207 + }, + { + "epoch": 0.93, + "learning_rate": 1.6179111322400506e-06, + "loss": 0.5125, + "step": 36208 + }, + { + "epoch": 0.93, + "learning_rate": 1.6178893761659583e-06, + "loss": 0.8428, + "step": 36209 + }, + { + "epoch": 0.93, + "learning_rate": 1.6178676196187762e-06, + "loss": 0.9209, + "step": 36210 + }, + { + "epoch": 0.93, + "learning_rate": 1.6178458625985214e-06, + "loss": 0.8291, + "step": 36211 + }, + { + "epoch": 0.93, + "learning_rate": 1.6178241051052107e-06, + "loss": 0.6836, + "step": 36212 + }, + { + "epoch": 0.93, + "learning_rate": 1.6178023471388602e-06, + "loss": 0.7969, + "step": 36213 + }, + { + "epoch": 0.93, + "learning_rate": 1.617780588699487e-06, + "loss": 0.7129, + "step": 36214 + }, + { + "epoch": 0.93, + "learning_rate": 1.6177588297871077e-06, + "loss": 0.8076, + "step": 36215 + }, + { + "epoch": 0.93, + "learning_rate": 1.6177370704017386e-06, + "loss": 0.915, + "step": 36216 + }, + { + "epoch": 0.93, + "learning_rate": 1.6177153105433967e-06, + "loss": 0.8594, + "step": 36217 + }, + { + "epoch": 0.93, + "learning_rate": 1.6176935502120986e-06, + "loss": 0.7969, + "step": 36218 + }, + { + "epoch": 0.93, + "learning_rate": 1.617671789407861e-06, + "loss": 0.9248, + "step": 36219 + }, + { + "epoch": 0.93, + "learning_rate": 1.6176500281307006e-06, + "loss": 0.9297, + "step": 36220 + }, + { + "epoch": 0.93, + "learning_rate": 1.6176282663806338e-06, + "loss": 0.79, + "step": 36221 + }, + { + "epoch": 0.93, + "learning_rate": 1.6176065041576776e-06, + "loss": 0.8525, + "step": 36222 + }, + { + "epoch": 0.93, + "learning_rate": 1.617584741461848e-06, + "loss": 0.792, + "step": 36223 + }, + { + "epoch": 0.93, + "learning_rate": 1.6175629782931631e-06, + "loss": 0.9316, + "step": 36224 + }, + { + "epoch": 0.93, + "learning_rate": 1.6175412146516379e-06, + "loss": 0.8457, + "step": 36225 + }, + { + "epoch": 0.93, + "learning_rate": 1.61751945053729e-06, + "loss": 0.9746, + "step": 36226 + }, + { + "epoch": 0.93, + "learning_rate": 1.6174976859501359e-06, + "loss": 0.916, + "step": 36227 + }, + { + "epoch": 0.93, + "learning_rate": 1.6174759208901921e-06, + "loss": 0.9238, + "step": 36228 + }, + { + "epoch": 0.93, + "learning_rate": 1.6174541553574756e-06, + "loss": 0.8262, + "step": 36229 + }, + { + "epoch": 0.93, + "learning_rate": 1.6174323893520026e-06, + "loss": 0.8428, + "step": 36230 + }, + { + "epoch": 0.93, + "learning_rate": 1.6174106228737898e-06, + "loss": 0.7373, + "step": 36231 + }, + { + "epoch": 0.93, + "learning_rate": 1.6173888559228543e-06, + "loss": 0.8418, + "step": 36232 + }, + { + "epoch": 0.93, + "learning_rate": 1.6173670884992129e-06, + "loss": 1.0127, + "step": 36233 + }, + { + "epoch": 0.93, + "learning_rate": 1.6173453206028814e-06, + "loss": 0.6846, + "step": 36234 + }, + { + "epoch": 0.93, + "learning_rate": 1.6173235522338773e-06, + "loss": 0.6431, + "step": 36235 + }, + { + "epoch": 0.93, + "learning_rate": 1.6173017833922167e-06, + "loss": 1.1553, + "step": 36236 + }, + { + "epoch": 0.93, + "learning_rate": 1.6172800140779167e-06, + "loss": 0.9248, + "step": 36237 + }, + { + "epoch": 0.93, + "learning_rate": 1.6172582442909936e-06, + "loss": 0.6699, + "step": 36238 + }, + { + "epoch": 0.93, + "learning_rate": 1.6172364740314646e-06, + "loss": 0.594, + "step": 36239 + }, + { + "epoch": 0.93, + "learning_rate": 1.6172147032993457e-06, + "loss": 0.6385, + "step": 36240 + }, + { + "epoch": 0.93, + "learning_rate": 1.617192932094654e-06, + "loss": 0.9443, + "step": 36241 + }, + { + "epoch": 0.93, + "learning_rate": 1.617171160417406e-06, + "loss": 0.7417, + "step": 36242 + }, + { + "epoch": 0.93, + "learning_rate": 1.6171493882676183e-06, + "loss": 0.8955, + "step": 36243 + }, + { + "epoch": 0.93, + "learning_rate": 1.6171276156453079e-06, + "loss": 0.9307, + "step": 36244 + }, + { + "epoch": 0.93, + "learning_rate": 1.6171058425504911e-06, + "loss": 0.9473, + "step": 36245 + }, + { + "epoch": 0.93, + "learning_rate": 1.6170840689831848e-06, + "loss": 0.8701, + "step": 36246 + }, + { + "epoch": 0.93, + "learning_rate": 1.6170622949434056e-06, + "loss": 0.9277, + "step": 36247 + }, + { + "epoch": 0.93, + "learning_rate": 1.6170405204311704e-06, + "loss": 0.7627, + "step": 36248 + }, + { + "epoch": 0.93, + "learning_rate": 1.6170187454464955e-06, + "loss": 0.8633, + "step": 36249 + }, + { + "epoch": 0.93, + "learning_rate": 1.6169969699893974e-06, + "loss": 0.7759, + "step": 36250 + }, + { + "epoch": 0.93, + "learning_rate": 1.6169751940598934e-06, + "loss": 0.7354, + "step": 36251 + }, + { + "epoch": 0.93, + "learning_rate": 1.6169534176579998e-06, + "loss": 0.9258, + "step": 36252 + }, + { + "epoch": 0.93, + "learning_rate": 1.6169316407837333e-06, + "loss": 0.7549, + "step": 36253 + }, + { + "epoch": 0.93, + "learning_rate": 1.6169098634371107e-06, + "loss": 0.9185, + "step": 36254 + }, + { + "epoch": 0.93, + "learning_rate": 1.6168880856181483e-06, + "loss": 0.9111, + "step": 36255 + }, + { + "epoch": 0.93, + "learning_rate": 1.6168663073268634e-06, + "loss": 0.7178, + "step": 36256 + }, + { + "epoch": 0.93, + "learning_rate": 1.6168445285632721e-06, + "loss": 0.7793, + "step": 36257 + }, + { + "epoch": 0.93, + "learning_rate": 1.6168227493273915e-06, + "loss": 1.0547, + "step": 36258 + }, + { + "epoch": 0.93, + "learning_rate": 1.6168009696192382e-06, + "loss": 0.9746, + "step": 36259 + }, + { + "epoch": 0.93, + "learning_rate": 1.6167791894388284e-06, + "loss": 0.7627, + "step": 36260 + }, + { + "epoch": 0.93, + "learning_rate": 1.6167574087861793e-06, + "loss": 0.752, + "step": 36261 + }, + { + "epoch": 0.93, + "learning_rate": 1.6167356276613075e-06, + "loss": 0.6592, + "step": 36262 + }, + { + "epoch": 0.93, + "learning_rate": 1.6167138460642296e-06, + "loss": 0.6948, + "step": 36263 + }, + { + "epoch": 0.93, + "learning_rate": 1.6166920639949622e-06, + "loss": 0.6924, + "step": 36264 + }, + { + "epoch": 0.93, + "learning_rate": 1.6166702814535218e-06, + "loss": 0.8076, + "step": 36265 + }, + { + "epoch": 0.93, + "learning_rate": 1.6166484984399255e-06, + "loss": 0.8877, + "step": 36266 + }, + { + "epoch": 0.93, + "learning_rate": 1.6166267149541899e-06, + "loss": 0.8555, + "step": 36267 + }, + { + "epoch": 0.93, + "learning_rate": 1.6166049309963314e-06, + "loss": 0.5864, + "step": 36268 + }, + { + "epoch": 0.93, + "learning_rate": 1.6165831465663673e-06, + "loss": 0.6846, + "step": 36269 + }, + { + "epoch": 0.93, + "learning_rate": 1.6165613616643134e-06, + "loss": 0.5808, + "step": 36270 + }, + { + "epoch": 0.93, + "learning_rate": 1.616539576290187e-06, + "loss": 1.0488, + "step": 36271 + }, + { + "epoch": 0.93, + "learning_rate": 1.6165177904440044e-06, + "loss": 0.9189, + "step": 36272 + }, + { + "epoch": 0.93, + "learning_rate": 1.6164960041257825e-06, + "loss": 1.0635, + "step": 36273 + }, + { + "epoch": 0.93, + "learning_rate": 1.6164742173355382e-06, + "loss": 0.8135, + "step": 36274 + }, + { + "epoch": 0.93, + "learning_rate": 1.6164524300732878e-06, + "loss": 0.8975, + "step": 36275 + }, + { + "epoch": 0.93, + "learning_rate": 1.6164306423390479e-06, + "loss": 0.835, + "step": 36276 + }, + { + "epoch": 0.93, + "learning_rate": 1.6164088541328358e-06, + "loss": 0.9072, + "step": 36277 + }, + { + "epoch": 0.93, + "learning_rate": 1.6163870654546675e-06, + "loss": 0.834, + "step": 36278 + }, + { + "epoch": 0.93, + "learning_rate": 1.6163652763045601e-06, + "loss": 0.7007, + "step": 36279 + }, + { + "epoch": 0.93, + "learning_rate": 1.61634348668253e-06, + "loss": 0.9268, + "step": 36280 + }, + { + "epoch": 0.93, + "learning_rate": 1.616321696588594e-06, + "loss": 0.8174, + "step": 36281 + }, + { + "epoch": 0.93, + "learning_rate": 1.616299906022769e-06, + "loss": 0.6924, + "step": 36282 + }, + { + "epoch": 0.93, + "learning_rate": 1.6162781149850715e-06, + "loss": 0.9102, + "step": 36283 + }, + { + "epoch": 0.93, + "learning_rate": 1.6162563234755183e-06, + "loss": 0.9375, + "step": 36284 + }, + { + "epoch": 0.93, + "learning_rate": 1.6162345314941257e-06, + "loss": 0.877, + "step": 36285 + }, + { + "epoch": 0.93, + "learning_rate": 1.6162127390409107e-06, + "loss": 0.8164, + "step": 36286 + }, + { + "epoch": 0.93, + "learning_rate": 1.61619094611589e-06, + "loss": 0.8022, + "step": 36287 + }, + { + "epoch": 0.93, + "learning_rate": 1.6161691527190801e-06, + "loss": 0.7148, + "step": 36288 + }, + { + "epoch": 0.93, + "learning_rate": 1.616147358850498e-06, + "loss": 0.9189, + "step": 36289 + }, + { + "epoch": 0.93, + "learning_rate": 1.6161255645101602e-06, + "loss": 0.9512, + "step": 36290 + }, + { + "epoch": 0.93, + "learning_rate": 1.6161037696980834e-06, + "loss": 0.791, + "step": 36291 + }, + { + "epoch": 0.93, + "learning_rate": 1.6160819744142841e-06, + "loss": 0.5991, + "step": 36292 + }, + { + "epoch": 0.93, + "learning_rate": 1.6160601786587793e-06, + "loss": 0.6641, + "step": 36293 + }, + { + "epoch": 0.93, + "learning_rate": 1.6160383824315855e-06, + "loss": 0.5469, + "step": 36294 + }, + { + "epoch": 0.93, + "learning_rate": 1.6160165857327195e-06, + "loss": 0.5046, + "step": 36295 + }, + { + "epoch": 0.93, + "learning_rate": 1.6159947885621978e-06, + "loss": 0.7725, + "step": 36296 + }, + { + "epoch": 0.93, + "learning_rate": 1.6159729909200372e-06, + "loss": 0.8599, + "step": 36297 + }, + { + "epoch": 0.93, + "learning_rate": 1.6159511928062545e-06, + "loss": 0.8242, + "step": 36298 + }, + { + "epoch": 0.93, + "learning_rate": 1.6159293942208666e-06, + "loss": 0.918, + "step": 36299 + }, + { + "epoch": 0.93, + "learning_rate": 1.6159075951638894e-06, + "loss": 0.9131, + "step": 36300 + }, + { + "epoch": 0.93, + "learning_rate": 1.6158857956353402e-06, + "loss": 1.0127, + "step": 36301 + }, + { + "epoch": 0.93, + "learning_rate": 1.6158639956352355e-06, + "loss": 0.917, + "step": 36302 + }, + { + "epoch": 0.93, + "learning_rate": 1.615842195163592e-06, + "loss": 0.5266, + "step": 36303 + }, + { + "epoch": 0.93, + "learning_rate": 1.615820394220427e-06, + "loss": 0.6777, + "step": 36304 + }, + { + "epoch": 0.93, + "learning_rate": 1.6157985928057562e-06, + "loss": 0.8418, + "step": 36305 + }, + { + "epoch": 0.93, + "learning_rate": 1.6157767909195967e-06, + "loss": 0.751, + "step": 36306 + }, + { + "epoch": 0.93, + "learning_rate": 1.6157549885619653e-06, + "loss": 0.793, + "step": 36307 + }, + { + "epoch": 0.93, + "learning_rate": 1.6157331857328784e-06, + "loss": 0.8154, + "step": 36308 + }, + { + "epoch": 0.93, + "learning_rate": 1.6157113824323534e-06, + "loss": 0.9004, + "step": 36309 + }, + { + "epoch": 0.93, + "learning_rate": 1.6156895786604063e-06, + "loss": 0.9111, + "step": 36310 + }, + { + "epoch": 0.93, + "learning_rate": 1.6156677744170537e-06, + "loss": 0.6958, + "step": 36311 + }, + { + "epoch": 0.93, + "learning_rate": 1.6156459697023127e-06, + "loss": 0.9229, + "step": 36312 + }, + { + "epoch": 0.93, + "learning_rate": 1.6156241645162001e-06, + "loss": 0.9014, + "step": 36313 + }, + { + "epoch": 0.93, + "learning_rate": 1.6156023588587325e-06, + "loss": 0.8311, + "step": 36314 + }, + { + "epoch": 0.93, + "learning_rate": 1.6155805527299262e-06, + "loss": 0.8672, + "step": 36315 + }, + { + "epoch": 0.93, + "learning_rate": 1.6155587461297984e-06, + "loss": 0.6958, + "step": 36316 + }, + { + "epoch": 0.93, + "learning_rate": 1.6155369390583653e-06, + "loss": 0.897, + "step": 36317 + }, + { + "epoch": 0.93, + "learning_rate": 1.615515131515644e-06, + "loss": 0.7812, + "step": 36318 + }, + { + "epoch": 0.93, + "learning_rate": 1.6154933235016513e-06, + "loss": 0.999, + "step": 36319 + }, + { + "epoch": 0.93, + "learning_rate": 1.6154715150164034e-06, + "loss": 0.7578, + "step": 36320 + }, + { + "epoch": 0.93, + "learning_rate": 1.6154497060599173e-06, + "loss": 0.8975, + "step": 36321 + }, + { + "epoch": 0.93, + "learning_rate": 1.6154278966322097e-06, + "loss": 0.8721, + "step": 36322 + }, + { + "epoch": 0.93, + "learning_rate": 1.615406086733297e-06, + "loss": 0.7627, + "step": 36323 + }, + { + "epoch": 0.93, + "learning_rate": 1.6153842763631965e-06, + "loss": 0.9248, + "step": 36324 + }, + { + "epoch": 0.93, + "learning_rate": 1.6153624655219243e-06, + "loss": 0.603, + "step": 36325 + }, + { + "epoch": 0.93, + "learning_rate": 1.6153406542094974e-06, + "loss": 0.873, + "step": 36326 + }, + { + "epoch": 0.93, + "learning_rate": 1.6153188424259328e-06, + "loss": 0.7842, + "step": 36327 + }, + { + "epoch": 0.93, + "learning_rate": 1.6152970301712466e-06, + "loss": 0.9043, + "step": 36328 + }, + { + "epoch": 0.93, + "learning_rate": 1.615275217445456e-06, + "loss": 0.6538, + "step": 36329 + }, + { + "epoch": 0.93, + "learning_rate": 1.6152534042485768e-06, + "loss": 0.7334, + "step": 36330 + }, + { + "epoch": 0.93, + "learning_rate": 1.6152315905806267e-06, + "loss": 0.8984, + "step": 36331 + }, + { + "epoch": 0.93, + "learning_rate": 1.6152097764416221e-06, + "loss": 0.9082, + "step": 36332 + }, + { + "epoch": 0.93, + "learning_rate": 1.6151879618315797e-06, + "loss": 0.9785, + "step": 36333 + }, + { + "epoch": 0.93, + "learning_rate": 1.6151661467505165e-06, + "loss": 0.8398, + "step": 36334 + }, + { + "epoch": 0.93, + "learning_rate": 1.6151443311984484e-06, + "loss": 0.8379, + "step": 36335 + }, + { + "epoch": 0.93, + "learning_rate": 1.6151225151753924e-06, + "loss": 0.7671, + "step": 36336 + }, + { + "epoch": 0.93, + "learning_rate": 1.6151006986813658e-06, + "loss": 0.8584, + "step": 36337 + }, + { + "epoch": 0.93, + "learning_rate": 1.6150788817163848e-06, + "loss": 1.0107, + "step": 36338 + }, + { + "epoch": 0.93, + "learning_rate": 1.6150570642804663e-06, + "loss": 0.9824, + "step": 36339 + }, + { + "epoch": 0.93, + "learning_rate": 1.6150352463736266e-06, + "loss": 0.9424, + "step": 36340 + }, + { + "epoch": 0.93, + "learning_rate": 1.6150134279958828e-06, + "loss": 0.9238, + "step": 36341 + }, + { + "epoch": 0.93, + "learning_rate": 1.6149916091472515e-06, + "loss": 0.8735, + "step": 36342 + }, + { + "epoch": 0.93, + "learning_rate": 1.6149697898277492e-06, + "loss": 0.9297, + "step": 36343 + }, + { + "epoch": 0.93, + "learning_rate": 1.614947970037393e-06, + "loss": 0.8779, + "step": 36344 + }, + { + "epoch": 0.93, + "learning_rate": 1.6149261497761995e-06, + "loss": 0.7388, + "step": 36345 + }, + { + "epoch": 0.93, + "learning_rate": 1.6149043290441852e-06, + "loss": 0.7749, + "step": 36346 + }, + { + "epoch": 0.93, + "learning_rate": 1.614882507841367e-06, + "loss": 0.8848, + "step": 36347 + }, + { + "epoch": 0.93, + "learning_rate": 1.6148606861677615e-06, + "loss": 0.71, + "step": 36348 + }, + { + "epoch": 0.93, + "learning_rate": 1.6148388640233854e-06, + "loss": 0.9463, + "step": 36349 + }, + { + "epoch": 0.93, + "learning_rate": 1.6148170414082558e-06, + "loss": 0.9326, + "step": 36350 + }, + { + "epoch": 0.93, + "learning_rate": 1.6147952183223886e-06, + "loss": 0.9531, + "step": 36351 + }, + { + "epoch": 0.93, + "learning_rate": 1.614773394765801e-06, + "loss": 0.8398, + "step": 36352 + }, + { + "epoch": 0.93, + "learning_rate": 1.6147515707385097e-06, + "loss": 0.8193, + "step": 36353 + }, + { + "epoch": 0.93, + "learning_rate": 1.6147297462405318e-06, + "loss": 0.6724, + "step": 36354 + }, + { + "epoch": 0.93, + "learning_rate": 1.6147079212718832e-06, + "loss": 0.7988, + "step": 36355 + }, + { + "epoch": 0.93, + "learning_rate": 1.6146860958325811e-06, + "loss": 0.999, + "step": 36356 + }, + { + "epoch": 0.93, + "learning_rate": 1.6146642699226423e-06, + "loss": 0.6785, + "step": 36357 + }, + { + "epoch": 0.93, + "learning_rate": 1.6146424435420832e-06, + "loss": 0.5757, + "step": 36358 + }, + { + "epoch": 0.93, + "learning_rate": 1.6146206166909205e-06, + "loss": 0.8086, + "step": 36359 + }, + { + "epoch": 0.93, + "learning_rate": 1.6145987893691712e-06, + "loss": 0.8994, + "step": 36360 + }, + { + "epoch": 0.93, + "learning_rate": 1.6145769615768518e-06, + "loss": 0.7529, + "step": 36361 + }, + { + "epoch": 0.93, + "learning_rate": 1.6145551333139792e-06, + "loss": 0.7925, + "step": 36362 + }, + { + "epoch": 0.93, + "learning_rate": 1.6145333045805698e-06, + "loss": 0.7197, + "step": 36363 + }, + { + "epoch": 0.93, + "learning_rate": 1.6145114753766408e-06, + "loss": 1.1016, + "step": 36364 + }, + { + "epoch": 0.93, + "learning_rate": 1.6144896457022083e-06, + "loss": 0.8711, + "step": 36365 + }, + { + "epoch": 0.93, + "learning_rate": 1.6144678155572894e-06, + "loss": 0.9971, + "step": 36366 + }, + { + "epoch": 0.93, + "learning_rate": 1.614445984941901e-06, + "loss": 0.6147, + "step": 36367 + }, + { + "epoch": 0.93, + "learning_rate": 1.6144241538560594e-06, + "loss": 0.708, + "step": 36368 + }, + { + "epoch": 0.93, + "learning_rate": 1.6144023222997816e-06, + "loss": 0.7153, + "step": 36369 + }, + { + "epoch": 0.93, + "learning_rate": 1.614380490273084e-06, + "loss": 1.166, + "step": 36370 + }, + { + "epoch": 0.93, + "learning_rate": 1.6143586577759834e-06, + "loss": 0.8955, + "step": 36371 + }, + { + "epoch": 0.93, + "learning_rate": 1.6143368248084967e-06, + "loss": 0.8682, + "step": 36372 + }, + { + "epoch": 0.93, + "learning_rate": 1.6143149913706409e-06, + "loss": 0.7754, + "step": 36373 + }, + { + "epoch": 0.93, + "learning_rate": 1.614293157462432e-06, + "loss": 1.0127, + "step": 36374 + }, + { + "epoch": 0.93, + "learning_rate": 1.6142713230838872e-06, + "loss": 0.8086, + "step": 36375 + }, + { + "epoch": 0.93, + "learning_rate": 1.6142494882350231e-06, + "loss": 0.7422, + "step": 36376 + }, + { + "epoch": 0.93, + "learning_rate": 1.6142276529158561e-06, + "loss": 0.7734, + "step": 36377 + }, + { + "epoch": 0.93, + "learning_rate": 1.6142058171264035e-06, + "loss": 0.8174, + "step": 36378 + }, + { + "epoch": 0.93, + "learning_rate": 1.6141839808666816e-06, + "loss": 0.9482, + "step": 36379 + }, + { + "epoch": 0.93, + "learning_rate": 1.6141621441367078e-06, + "loss": 0.6279, + "step": 36380 + }, + { + "epoch": 0.93, + "learning_rate": 1.6141403069364979e-06, + "loss": 0.8018, + "step": 36381 + }, + { + "epoch": 0.93, + "learning_rate": 1.6141184692660688e-06, + "loss": 0.9307, + "step": 36382 + }, + { + "epoch": 0.93, + "learning_rate": 1.6140966311254376e-06, + "loss": 0.6909, + "step": 36383 + }, + { + "epoch": 0.93, + "learning_rate": 1.614074792514621e-06, + "loss": 0.8711, + "step": 36384 + }, + { + "epoch": 0.93, + "learning_rate": 1.6140529534336354e-06, + "loss": 0.7896, + "step": 36385 + }, + { + "epoch": 0.93, + "learning_rate": 1.6140311138824978e-06, + "loss": 0.8745, + "step": 36386 + }, + { + "epoch": 0.93, + "learning_rate": 1.6140092738612246e-06, + "loss": 0.9854, + "step": 36387 + }, + { + "epoch": 0.93, + "learning_rate": 1.6139874333698328e-06, + "loss": 0.9551, + "step": 36388 + }, + { + "epoch": 0.93, + "learning_rate": 1.6139655924083392e-06, + "loss": 0.6592, + "step": 36389 + }, + { + "epoch": 0.93, + "learning_rate": 1.61394375097676e-06, + "loss": 0.8872, + "step": 36390 + }, + { + "epoch": 0.93, + "learning_rate": 1.6139219090751128e-06, + "loss": 0.8662, + "step": 36391 + }, + { + "epoch": 0.93, + "learning_rate": 1.6139000667034138e-06, + "loss": 0.7686, + "step": 36392 + }, + { + "epoch": 0.93, + "learning_rate": 1.6138782238616794e-06, + "loss": 0.8496, + "step": 36393 + }, + { + "epoch": 0.93, + "learning_rate": 1.6138563805499267e-06, + "loss": 0.9512, + "step": 36394 + }, + { + "epoch": 0.93, + "learning_rate": 1.6138345367681727e-06, + "loss": 0.6885, + "step": 36395 + }, + { + "epoch": 0.93, + "learning_rate": 1.6138126925164337e-06, + "loss": 0.8662, + "step": 36396 + }, + { + "epoch": 0.93, + "learning_rate": 1.6137908477947264e-06, + "loss": 0.5215, + "step": 36397 + }, + { + "epoch": 0.93, + "learning_rate": 1.6137690026030677e-06, + "loss": 0.792, + "step": 36398 + }, + { + "epoch": 0.93, + "learning_rate": 1.6137471569414744e-06, + "loss": 0.9824, + "step": 36399 + }, + { + "epoch": 0.93, + "learning_rate": 1.6137253108099632e-06, + "loss": 0.8799, + "step": 36400 + }, + { + "epoch": 0.93, + "learning_rate": 1.6137034642085507e-06, + "loss": 0.8506, + "step": 36401 + }, + { + "epoch": 0.93, + "learning_rate": 1.6136816171372535e-06, + "loss": 0.9365, + "step": 36402 + }, + { + "epoch": 0.93, + "learning_rate": 1.6136597695960888e-06, + "loss": 0.8418, + "step": 36403 + }, + { + "epoch": 0.93, + "learning_rate": 1.6136379215850729e-06, + "loss": 0.8848, + "step": 36404 + }, + { + "epoch": 0.93, + "learning_rate": 1.6136160731042226e-06, + "loss": 1.0, + "step": 36405 + }, + { + "epoch": 0.93, + "learning_rate": 1.6135942241535545e-06, + "loss": 0.7598, + "step": 36406 + }, + { + "epoch": 0.93, + "learning_rate": 1.6135723747330859e-06, + "loss": 0.8457, + "step": 36407 + }, + { + "epoch": 0.93, + "learning_rate": 1.6135505248428327e-06, + "loss": 0.8857, + "step": 36408 + }, + { + "epoch": 0.93, + "learning_rate": 1.6135286744828125e-06, + "loss": 0.6611, + "step": 36409 + }, + { + "epoch": 0.93, + "learning_rate": 1.6135068236530414e-06, + "loss": 0.957, + "step": 36410 + }, + { + "epoch": 0.93, + "learning_rate": 1.6134849723535365e-06, + "loss": 0.614, + "step": 36411 + }, + { + "epoch": 0.93, + "learning_rate": 1.6134631205843142e-06, + "loss": 0.9082, + "step": 36412 + }, + { + "epoch": 0.93, + "learning_rate": 1.6134412683453913e-06, + "loss": 0.7598, + "step": 36413 + }, + { + "epoch": 0.93, + "learning_rate": 1.6134194156367849e-06, + "loss": 0.6328, + "step": 36414 + }, + { + "epoch": 0.93, + "learning_rate": 1.6133975624585111e-06, + "loss": 0.6685, + "step": 36415 + }, + { + "epoch": 0.93, + "learning_rate": 1.6133757088105873e-06, + "loss": 0.707, + "step": 36416 + }, + { + "epoch": 0.93, + "learning_rate": 1.6133538546930298e-06, + "loss": 0.7603, + "step": 36417 + }, + { + "epoch": 0.93, + "learning_rate": 1.6133320001058555e-06, + "loss": 0.874, + "step": 36418 + }, + { + "epoch": 0.93, + "learning_rate": 1.613310145049081e-06, + "loss": 0.9385, + "step": 36419 + }, + { + "epoch": 0.93, + "learning_rate": 1.6132882895227234e-06, + "loss": 0.8369, + "step": 36420 + }, + { + "epoch": 0.93, + "learning_rate": 1.6132664335267988e-06, + "loss": 0.8145, + "step": 36421 + }, + { + "epoch": 0.93, + "learning_rate": 1.6132445770613242e-06, + "loss": 1.0977, + "step": 36422 + }, + { + "epoch": 0.93, + "learning_rate": 1.6132227201263169e-06, + "loss": 0.8232, + "step": 36423 + }, + { + "epoch": 0.93, + "learning_rate": 1.613200862721793e-06, + "loss": 0.9912, + "step": 36424 + }, + { + "epoch": 0.93, + "learning_rate": 1.6131790048477694e-06, + "loss": 0.6582, + "step": 36425 + }, + { + "epoch": 0.93, + "learning_rate": 1.6131571465042627e-06, + "loss": 0.9053, + "step": 36426 + }, + { + "epoch": 0.93, + "learning_rate": 1.61313528769129e-06, + "loss": 0.7568, + "step": 36427 + }, + { + "epoch": 0.93, + "learning_rate": 1.6131134284088675e-06, + "loss": 0.959, + "step": 36428 + }, + { + "epoch": 0.93, + "learning_rate": 1.6130915686570123e-06, + "loss": 0.6694, + "step": 36429 + }, + { + "epoch": 0.93, + "learning_rate": 1.6130697084357411e-06, + "loss": 0.9551, + "step": 36430 + }, + { + "epoch": 0.93, + "learning_rate": 1.6130478477450708e-06, + "loss": 0.8779, + "step": 36431 + }, + { + "epoch": 0.93, + "learning_rate": 1.6130259865850178e-06, + "loss": 0.8945, + "step": 36432 + }, + { + "epoch": 0.93, + "learning_rate": 1.6130041249555988e-06, + "loss": 0.8174, + "step": 36433 + }, + { + "epoch": 0.93, + "learning_rate": 1.612982262856831e-06, + "loss": 0.7461, + "step": 36434 + }, + { + "epoch": 0.93, + "learning_rate": 1.6129604002887309e-06, + "loss": 0.8203, + "step": 36435 + }, + { + "epoch": 0.93, + "learning_rate": 1.612938537251315e-06, + "loss": 0.8223, + "step": 36436 + }, + { + "epoch": 0.93, + "learning_rate": 1.6129166737446005e-06, + "loss": 0.8872, + "step": 36437 + }, + { + "epoch": 0.93, + "learning_rate": 1.6128948097686038e-06, + "loss": 0.7358, + "step": 36438 + }, + { + "epoch": 0.93, + "learning_rate": 1.6128729453233415e-06, + "loss": 0.8672, + "step": 36439 + }, + { + "epoch": 0.93, + "learning_rate": 1.6128510804088307e-06, + "loss": 0.812, + "step": 36440 + }, + { + "epoch": 0.93, + "learning_rate": 1.6128292150250879e-06, + "loss": 0.8135, + "step": 36441 + }, + { + "epoch": 0.93, + "learning_rate": 1.6128073491721303e-06, + "loss": 1.0586, + "step": 36442 + }, + { + "epoch": 0.93, + "learning_rate": 1.6127854828499737e-06, + "loss": 0.9297, + "step": 36443 + }, + { + "epoch": 0.93, + "learning_rate": 1.6127636160586363e-06, + "loss": 0.8623, + "step": 36444 + }, + { + "epoch": 0.93, + "learning_rate": 1.6127417487981334e-06, + "loss": 0.793, + "step": 36445 + }, + { + "epoch": 0.93, + "learning_rate": 1.6127198810684822e-06, + "loss": 0.8301, + "step": 36446 + }, + { + "epoch": 0.93, + "learning_rate": 1.6126980128696998e-06, + "loss": 0.792, + "step": 36447 + }, + { + "epoch": 0.93, + "learning_rate": 1.6126761442018027e-06, + "loss": 0.917, + "step": 36448 + }, + { + "epoch": 0.93, + "learning_rate": 1.6126542750648078e-06, + "loss": 0.8066, + "step": 36449 + }, + { + "epoch": 0.93, + "learning_rate": 1.6126324054587314e-06, + "loss": 0.8169, + "step": 36450 + }, + { + "epoch": 0.93, + "learning_rate": 1.6126105353835905e-06, + "loss": 1.0352, + "step": 36451 + }, + { + "epoch": 0.93, + "learning_rate": 1.6125886648394022e-06, + "loss": 0.8613, + "step": 36452 + }, + { + "epoch": 0.93, + "learning_rate": 1.6125667938261828e-06, + "loss": 0.8398, + "step": 36453 + }, + { + "epoch": 0.93, + "learning_rate": 1.612544922343949e-06, + "loss": 0.9414, + "step": 36454 + }, + { + "epoch": 0.93, + "learning_rate": 1.612523050392718e-06, + "loss": 0.7998, + "step": 36455 + }, + { + "epoch": 0.93, + "learning_rate": 1.612501177972506e-06, + "loss": 0.7534, + "step": 36456 + }, + { + "epoch": 0.93, + "learning_rate": 1.61247930508333e-06, + "loss": 1.0186, + "step": 36457 + }, + { + "epoch": 0.93, + "learning_rate": 1.6124574317252068e-06, + "loss": 0.8975, + "step": 36458 + }, + { + "epoch": 0.93, + "learning_rate": 1.6124355578981534e-06, + "loss": 0.5931, + "step": 36459 + }, + { + "epoch": 0.93, + "learning_rate": 1.612413683602186e-06, + "loss": 1.0215, + "step": 36460 + }, + { + "epoch": 0.93, + "learning_rate": 1.6123918088373217e-06, + "loss": 0.8096, + "step": 36461 + }, + { + "epoch": 0.93, + "learning_rate": 1.612369933603577e-06, + "loss": 0.8633, + "step": 36462 + }, + { + "epoch": 0.93, + "learning_rate": 1.6123480579009688e-06, + "loss": 0.8025, + "step": 36463 + }, + { + "epoch": 0.93, + "learning_rate": 1.612326181729514e-06, + "loss": 0.8633, + "step": 36464 + }, + { + "epoch": 0.93, + "learning_rate": 1.6123043050892293e-06, + "loss": 0.8115, + "step": 36465 + }, + { + "epoch": 0.93, + "learning_rate": 1.612282427980131e-06, + "loss": 1.0059, + "step": 36466 + }, + { + "epoch": 0.93, + "learning_rate": 1.6122605504022365e-06, + "loss": 0.792, + "step": 36467 + }, + { + "epoch": 0.93, + "learning_rate": 1.6122386723555619e-06, + "loss": 0.8232, + "step": 36468 + }, + { + "epoch": 0.93, + "learning_rate": 1.6122167938401248e-06, + "loss": 0.9033, + "step": 36469 + }, + { + "epoch": 0.93, + "learning_rate": 1.612194914855941e-06, + "loss": 0.8867, + "step": 36470 + }, + { + "epoch": 0.93, + "learning_rate": 1.612173035403028e-06, + "loss": 0.9072, + "step": 36471 + }, + { + "epoch": 0.93, + "learning_rate": 1.612151155481402e-06, + "loss": 0.7412, + "step": 36472 + }, + { + "epoch": 0.93, + "learning_rate": 1.6121292750910802e-06, + "loss": 0.8389, + "step": 36473 + }, + { + "epoch": 0.93, + "learning_rate": 1.6121073942320793e-06, + "loss": 0.8525, + "step": 36474 + }, + { + "epoch": 0.93, + "learning_rate": 1.6120855129044158e-06, + "loss": 0.7393, + "step": 36475 + }, + { + "epoch": 0.93, + "learning_rate": 1.6120636311081063e-06, + "loss": 1.0225, + "step": 36476 + }, + { + "epoch": 0.93, + "learning_rate": 1.612041748843168e-06, + "loss": 0.7546, + "step": 36477 + }, + { + "epoch": 0.93, + "learning_rate": 1.6120198661096173e-06, + "loss": 0.7568, + "step": 36478 + }, + { + "epoch": 0.93, + "learning_rate": 1.6119979829074714e-06, + "loss": 0.8965, + "step": 36479 + }, + { + "epoch": 0.94, + "learning_rate": 1.6119760992367468e-06, + "loss": 0.8564, + "step": 36480 + }, + { + "epoch": 0.94, + "learning_rate": 1.61195421509746e-06, + "loss": 0.9961, + "step": 36481 + }, + { + "epoch": 0.94, + "learning_rate": 1.6119323304896282e-06, + "loss": 0.7666, + "step": 36482 + }, + { + "epoch": 0.94, + "learning_rate": 1.6119104454132679e-06, + "loss": 1.0234, + "step": 36483 + }, + { + "epoch": 0.94, + "learning_rate": 1.611888559868396e-06, + "loss": 0.8223, + "step": 36484 + }, + { + "epoch": 0.94, + "learning_rate": 1.611866673855029e-06, + "loss": 0.6924, + "step": 36485 + }, + { + "epoch": 0.94, + "learning_rate": 1.611844787373184e-06, + "loss": 0.8252, + "step": 36486 + }, + { + "epoch": 0.94, + "learning_rate": 1.6118229004228772e-06, + "loss": 0.7607, + "step": 36487 + }, + { + "epoch": 0.94, + "learning_rate": 1.6118010130041263e-06, + "loss": 1.1455, + "step": 36488 + }, + { + "epoch": 0.94, + "learning_rate": 1.611779125116947e-06, + "loss": 0.8955, + "step": 36489 + }, + { + "epoch": 0.94, + "learning_rate": 1.6117572367613567e-06, + "loss": 0.8438, + "step": 36490 + }, + { + "epoch": 0.94, + "learning_rate": 1.6117353479373721e-06, + "loss": 0.832, + "step": 36491 + }, + { + "epoch": 0.94, + "learning_rate": 1.61171345864501e-06, + "loss": 0.8848, + "step": 36492 + }, + { + "epoch": 0.94, + "learning_rate": 1.6116915688842868e-06, + "loss": 0.8066, + "step": 36493 + }, + { + "epoch": 0.94, + "learning_rate": 1.6116696786552195e-06, + "loss": 0.6528, + "step": 36494 + }, + { + "epoch": 0.94, + "learning_rate": 1.611647787957825e-06, + "loss": 0.8599, + "step": 36495 + }, + { + "epoch": 0.94, + "learning_rate": 1.6116258967921197e-06, + "loss": 1.0117, + "step": 36496 + }, + { + "epoch": 0.94, + "learning_rate": 1.6116040051581207e-06, + "loss": 0.7578, + "step": 36497 + }, + { + "epoch": 0.94, + "learning_rate": 1.6115821130558449e-06, + "loss": 0.7754, + "step": 36498 + }, + { + "epoch": 0.94, + "learning_rate": 1.6115602204853084e-06, + "loss": 0.7686, + "step": 36499 + }, + { + "epoch": 0.94, + "learning_rate": 1.6115383274465284e-06, + "loss": 0.8447, + "step": 36500 + }, + { + "epoch": 0.94, + "learning_rate": 1.6115164339395217e-06, + "loss": 0.9902, + "step": 36501 + }, + { + "epoch": 0.94, + "learning_rate": 1.611494539964305e-06, + "loss": 0.7695, + "step": 36502 + }, + { + "epoch": 0.94, + "learning_rate": 1.6114726455208951e-06, + "loss": 1.0117, + "step": 36503 + }, + { + "epoch": 0.94, + "learning_rate": 1.6114507506093085e-06, + "loss": 0.8887, + "step": 36504 + }, + { + "epoch": 0.94, + "learning_rate": 1.6114288552295623e-06, + "loss": 0.9053, + "step": 36505 + }, + { + "epoch": 0.94, + "learning_rate": 1.6114069593816733e-06, + "loss": 0.7656, + "step": 36506 + }, + { + "epoch": 0.94, + "learning_rate": 1.6113850630656578e-06, + "loss": 0.8359, + "step": 36507 + }, + { + "epoch": 0.94, + "learning_rate": 1.6113631662815332e-06, + "loss": 0.7705, + "step": 36508 + }, + { + "epoch": 0.94, + "learning_rate": 1.611341269029316e-06, + "loss": 0.7153, + "step": 36509 + }, + { + "epoch": 0.94, + "learning_rate": 1.6113193713090226e-06, + "loss": 0.9111, + "step": 36510 + }, + { + "epoch": 0.94, + "learning_rate": 1.6112974731206702e-06, + "loss": 0.7969, + "step": 36511 + }, + { + "epoch": 0.94, + "learning_rate": 1.6112755744642751e-06, + "loss": 0.6035, + "step": 36512 + }, + { + "epoch": 0.94, + "learning_rate": 1.611253675339855e-06, + "loss": 1.0859, + "step": 36513 + }, + { + "epoch": 0.94, + "learning_rate": 1.6112317757474256e-06, + "loss": 0.7871, + "step": 36514 + }, + { + "epoch": 0.94, + "learning_rate": 1.6112098756870043e-06, + "loss": 0.6855, + "step": 36515 + }, + { + "epoch": 0.94, + "learning_rate": 1.6111879751586078e-06, + "loss": 0.9609, + "step": 36516 + }, + { + "epoch": 0.94, + "learning_rate": 1.6111660741622526e-06, + "loss": 0.7441, + "step": 36517 + }, + { + "epoch": 0.94, + "learning_rate": 1.6111441726979558e-06, + "loss": 0.8223, + "step": 36518 + }, + { + "epoch": 0.94, + "learning_rate": 1.6111222707657337e-06, + "loss": 0.8047, + "step": 36519 + }, + { + "epoch": 0.94, + "learning_rate": 1.6111003683656038e-06, + "loss": 0.8955, + "step": 36520 + }, + { + "epoch": 0.94, + "learning_rate": 1.611078465497582e-06, + "loss": 0.9355, + "step": 36521 + }, + { + "epoch": 0.94, + "learning_rate": 1.6110565621616856e-06, + "loss": 0.9248, + "step": 36522 + }, + { + "epoch": 0.94, + "learning_rate": 1.6110346583579318e-06, + "loss": 0.7515, + "step": 36523 + }, + { + "epoch": 0.94, + "learning_rate": 1.6110127540863364e-06, + "loss": 0.8643, + "step": 36524 + }, + { + "epoch": 0.94, + "learning_rate": 1.6109908493469166e-06, + "loss": 0.8965, + "step": 36525 + }, + { + "epoch": 0.94, + "learning_rate": 1.6109689441396892e-06, + "loss": 0.9834, + "step": 36526 + }, + { + "epoch": 0.94, + "learning_rate": 1.6109470384646713e-06, + "loss": 0.8516, + "step": 36527 + }, + { + "epoch": 0.94, + "learning_rate": 1.610925132321879e-06, + "loss": 0.6544, + "step": 36528 + }, + { + "epoch": 0.94, + "learning_rate": 1.6109032257113294e-06, + "loss": 0.9062, + "step": 36529 + }, + { + "epoch": 0.94, + "learning_rate": 1.6108813186330397e-06, + "loss": 0.7104, + "step": 36530 + }, + { + "epoch": 0.94, + "learning_rate": 1.610859411087026e-06, + "loss": 0.6309, + "step": 36531 + }, + { + "epoch": 0.94, + "learning_rate": 1.6108375030733053e-06, + "loss": 0.8071, + "step": 36532 + }, + { + "epoch": 0.94, + "learning_rate": 1.6108155945918945e-06, + "loss": 0.7695, + "step": 36533 + }, + { + "epoch": 0.94, + "learning_rate": 1.61079368564281e-06, + "loss": 0.6934, + "step": 36534 + }, + { + "epoch": 0.94, + "learning_rate": 1.6107717762260693e-06, + "loss": 0.8555, + "step": 36535 + }, + { + "epoch": 0.94, + "learning_rate": 1.6107498663416886e-06, + "loss": 0.6992, + "step": 36536 + }, + { + "epoch": 0.94, + "learning_rate": 1.6107279559896845e-06, + "loss": 0.9014, + "step": 36537 + }, + { + "epoch": 0.94, + "learning_rate": 1.6107060451700748e-06, + "loss": 1.0371, + "step": 36538 + }, + { + "epoch": 0.94, + "learning_rate": 1.610684133882875e-06, + "loss": 0.8467, + "step": 36539 + }, + { + "epoch": 0.94, + "learning_rate": 1.6106622221281024e-06, + "loss": 0.7715, + "step": 36540 + }, + { + "epoch": 0.94, + "learning_rate": 1.610640309905774e-06, + "loss": 1.0537, + "step": 36541 + }, + { + "epoch": 0.94, + "learning_rate": 1.6106183972159062e-06, + "loss": 0.7109, + "step": 36542 + }, + { + "epoch": 0.94, + "learning_rate": 1.6105964840585163e-06, + "loss": 0.8887, + "step": 36543 + }, + { + "epoch": 0.94, + "learning_rate": 1.6105745704336205e-06, + "loss": 0.8457, + "step": 36544 + }, + { + "epoch": 0.94, + "learning_rate": 1.6105526563412358e-06, + "loss": 0.7256, + "step": 36545 + }, + { + "epoch": 0.94, + "learning_rate": 1.610530741781379e-06, + "loss": 1.0742, + "step": 36546 + }, + { + "epoch": 0.94, + "learning_rate": 1.6105088267540672e-06, + "loss": 0.6411, + "step": 36547 + }, + { + "epoch": 0.94, + "learning_rate": 1.6104869112593167e-06, + "loss": 0.8853, + "step": 36548 + }, + { + "epoch": 0.94, + "learning_rate": 1.610464995297144e-06, + "loss": 0.7915, + "step": 36549 + }, + { + "epoch": 0.94, + "learning_rate": 1.6104430788675668e-06, + "loss": 0.5938, + "step": 36550 + }, + { + "epoch": 0.94, + "learning_rate": 1.6104211619706014e-06, + "loss": 1.0566, + "step": 36551 + }, + { + "epoch": 0.94, + "learning_rate": 1.6103992446062643e-06, + "loss": 1.2383, + "step": 36552 + }, + { + "epoch": 0.94, + "learning_rate": 1.6103773267745729e-06, + "loss": 0.8545, + "step": 36553 + }, + { + "epoch": 0.94, + "learning_rate": 1.6103554084755435e-06, + "loss": 0.6982, + "step": 36554 + }, + { + "epoch": 0.94, + "learning_rate": 1.6103334897091928e-06, + "loss": 0.6545, + "step": 36555 + }, + { + "epoch": 0.94, + "learning_rate": 1.6103115704755384e-06, + "loss": 0.8867, + "step": 36556 + }, + { + "epoch": 0.94, + "learning_rate": 1.610289650774596e-06, + "loss": 0.8193, + "step": 36557 + }, + { + "epoch": 0.94, + "learning_rate": 1.6102677306063832e-06, + "loss": 0.7656, + "step": 36558 + }, + { + "epoch": 0.94, + "learning_rate": 1.6102458099709163e-06, + "loss": 0.8994, + "step": 36559 + }, + { + "epoch": 0.94, + "learning_rate": 1.610223888868212e-06, + "loss": 0.7017, + "step": 36560 + }, + { + "epoch": 0.94, + "learning_rate": 1.6102019672982876e-06, + "loss": 1.0264, + "step": 36561 + }, + { + "epoch": 0.94, + "learning_rate": 1.6101800452611593e-06, + "loss": 0.8643, + "step": 36562 + }, + { + "epoch": 0.94, + "learning_rate": 1.6101581227568449e-06, + "loss": 0.7559, + "step": 36563 + }, + { + "epoch": 0.94, + "learning_rate": 1.61013619978536e-06, + "loss": 0.7031, + "step": 36564 + }, + { + "epoch": 0.94, + "learning_rate": 1.6101142763467217e-06, + "loss": 0.9399, + "step": 36565 + }, + { + "epoch": 0.94, + "learning_rate": 1.6100923524409474e-06, + "loss": 0.7574, + "step": 36566 + }, + { + "epoch": 0.94, + "learning_rate": 1.6100704280680529e-06, + "loss": 0.7783, + "step": 36567 + }, + { + "epoch": 0.94, + "learning_rate": 1.610048503228056e-06, + "loss": 0.8164, + "step": 36568 + }, + { + "epoch": 0.94, + "learning_rate": 1.6100265779209728e-06, + "loss": 0.96, + "step": 36569 + }, + { + "epoch": 0.94, + "learning_rate": 1.6100046521468204e-06, + "loss": 0.9277, + "step": 36570 + }, + { + "epoch": 0.94, + "learning_rate": 1.6099827259056154e-06, + "loss": 0.7808, + "step": 36571 + }, + { + "epoch": 0.94, + "learning_rate": 1.6099607991973744e-06, + "loss": 0.7339, + "step": 36572 + }, + { + "epoch": 0.94, + "learning_rate": 1.609938872022115e-06, + "loss": 0.803, + "step": 36573 + }, + { + "epoch": 0.94, + "learning_rate": 1.609916944379853e-06, + "loss": 0.8701, + "step": 36574 + }, + { + "epoch": 0.94, + "learning_rate": 1.609895016270606e-06, + "loss": 0.833, + "step": 36575 + }, + { + "epoch": 0.94, + "learning_rate": 1.6098730876943903e-06, + "loss": 0.9854, + "step": 36576 + }, + { + "epoch": 0.94, + "learning_rate": 1.6098511586512228e-06, + "loss": 0.8145, + "step": 36577 + }, + { + "epoch": 0.94, + "learning_rate": 1.6098292291411202e-06, + "loss": 0.9766, + "step": 36578 + }, + { + "epoch": 0.94, + "learning_rate": 1.6098072991640996e-06, + "loss": 0.8779, + "step": 36579 + }, + { + "epoch": 0.94, + "learning_rate": 1.6097853687201774e-06, + "loss": 0.9072, + "step": 36580 + }, + { + "epoch": 0.94, + "learning_rate": 1.6097634378093705e-06, + "loss": 0.9937, + "step": 36581 + }, + { + "epoch": 0.94, + "learning_rate": 1.609741506431696e-06, + "loss": 0.8452, + "step": 36582 + }, + { + "epoch": 0.94, + "learning_rate": 1.6097195745871707e-06, + "loss": 0.8408, + "step": 36583 + }, + { + "epoch": 0.94, + "learning_rate": 1.6096976422758108e-06, + "loss": 0.6943, + "step": 36584 + }, + { + "epoch": 0.94, + "learning_rate": 1.6096757094976334e-06, + "loss": 0.8311, + "step": 36585 + }, + { + "epoch": 0.94, + "learning_rate": 1.6096537762526556e-06, + "loss": 0.8184, + "step": 36586 + }, + { + "epoch": 0.94, + "learning_rate": 1.6096318425408938e-06, + "loss": 0.71, + "step": 36587 + }, + { + "epoch": 0.94, + "learning_rate": 1.6096099083623649e-06, + "loss": 0.7852, + "step": 36588 + }, + { + "epoch": 0.94, + "learning_rate": 1.609587973717086e-06, + "loss": 0.8721, + "step": 36589 + }, + { + "epoch": 0.94, + "learning_rate": 1.6095660386050732e-06, + "loss": 0.6183, + "step": 36590 + }, + { + "epoch": 0.94, + "learning_rate": 1.6095441030263438e-06, + "loss": 0.6328, + "step": 36591 + }, + { + "epoch": 0.94, + "learning_rate": 1.6095221669809145e-06, + "loss": 0.9648, + "step": 36592 + }, + { + "epoch": 0.94, + "learning_rate": 1.6095002304688024e-06, + "loss": 0.9092, + "step": 36593 + }, + { + "epoch": 0.94, + "learning_rate": 1.6094782934900235e-06, + "loss": 0.7471, + "step": 36594 + }, + { + "epoch": 0.94, + "learning_rate": 1.6094563560445955e-06, + "loss": 0.9199, + "step": 36595 + }, + { + "epoch": 0.94, + "learning_rate": 1.6094344181325345e-06, + "loss": 0.8066, + "step": 36596 + }, + { + "epoch": 0.94, + "learning_rate": 1.6094124797538577e-06, + "loss": 0.9619, + "step": 36597 + }, + { + "epoch": 0.94, + "learning_rate": 1.6093905409085822e-06, + "loss": 0.7197, + "step": 36598 + }, + { + "epoch": 0.94, + "learning_rate": 1.6093686015967238e-06, + "loss": 0.8809, + "step": 36599 + }, + { + "epoch": 0.94, + "learning_rate": 1.6093466618183003e-06, + "loss": 0.8491, + "step": 36600 + }, + { + "epoch": 0.94, + "learning_rate": 1.6093247215733276e-06, + "loss": 0.7925, + "step": 36601 + }, + { + "epoch": 0.94, + "learning_rate": 1.6093027808618235e-06, + "loss": 0.9189, + "step": 36602 + }, + { + "epoch": 0.94, + "learning_rate": 1.6092808396838042e-06, + "loss": 0.6055, + "step": 36603 + }, + { + "epoch": 0.94, + "learning_rate": 1.6092588980392864e-06, + "loss": 1.0059, + "step": 36604 + }, + { + "epoch": 0.94, + "learning_rate": 1.609236955928287e-06, + "loss": 0.6143, + "step": 36605 + }, + { + "epoch": 0.94, + "learning_rate": 1.609215013350823e-06, + "loss": 0.7993, + "step": 36606 + }, + { + "epoch": 0.94, + "learning_rate": 1.609193070306911e-06, + "loss": 0.79, + "step": 36607 + }, + { + "epoch": 0.94, + "learning_rate": 1.6091711267965683e-06, + "loss": 0.769, + "step": 36608 + }, + { + "epoch": 0.94, + "learning_rate": 1.6091491828198107e-06, + "loss": 0.814, + "step": 36609 + }, + { + "epoch": 0.94, + "learning_rate": 1.6091272383766557e-06, + "loss": 0.4893, + "step": 36610 + }, + { + "epoch": 0.94, + "learning_rate": 1.60910529346712e-06, + "loss": 0.7451, + "step": 36611 + }, + { + "epoch": 0.94, + "learning_rate": 1.6090833480912205e-06, + "loss": 0.3989, + "step": 36612 + }, + { + "epoch": 0.94, + "learning_rate": 1.6090614022489738e-06, + "loss": 0.7778, + "step": 36613 + }, + { + "epoch": 0.94, + "learning_rate": 1.609039455940397e-06, + "loss": 0.7949, + "step": 36614 + }, + { + "epoch": 0.94, + "learning_rate": 1.6090175091655065e-06, + "loss": 0.7178, + "step": 36615 + }, + { + "epoch": 0.94, + "learning_rate": 1.6089955619243193e-06, + "loss": 0.916, + "step": 36616 + }, + { + "epoch": 0.94, + "learning_rate": 1.6089736142168523e-06, + "loss": 0.8428, + "step": 36617 + }, + { + "epoch": 0.94, + "learning_rate": 1.6089516660431222e-06, + "loss": 0.7793, + "step": 36618 + }, + { + "epoch": 0.94, + "learning_rate": 1.6089297174031456e-06, + "loss": 1.0469, + "step": 36619 + }, + { + "epoch": 0.94, + "learning_rate": 1.6089077682969397e-06, + "loss": 1.0537, + "step": 36620 + }, + { + "epoch": 0.94, + "learning_rate": 1.6088858187245208e-06, + "loss": 0.8252, + "step": 36621 + }, + { + "epoch": 0.94, + "learning_rate": 1.6088638686859065e-06, + "loss": 0.958, + "step": 36622 + }, + { + "epoch": 0.94, + "learning_rate": 1.608841918181113e-06, + "loss": 0.8555, + "step": 36623 + }, + { + "epoch": 0.94, + "learning_rate": 1.6088199672101572e-06, + "loss": 0.71, + "step": 36624 + }, + { + "epoch": 0.94, + "learning_rate": 1.608798015773056e-06, + "loss": 0.7476, + "step": 36625 + }, + { + "epoch": 0.94, + "learning_rate": 1.608776063869826e-06, + "loss": 0.9004, + "step": 36626 + }, + { + "epoch": 0.94, + "learning_rate": 1.608754111500484e-06, + "loss": 0.7598, + "step": 36627 + }, + { + "epoch": 0.94, + "learning_rate": 1.6087321586650476e-06, + "loss": 0.8975, + "step": 36628 + }, + { + "epoch": 0.94, + "learning_rate": 1.6087102053635324e-06, + "loss": 0.6021, + "step": 36629 + }, + { + "epoch": 0.94, + "learning_rate": 1.6086882515959559e-06, + "loss": 0.8247, + "step": 36630 + }, + { + "epoch": 0.94, + "learning_rate": 1.6086662973623348e-06, + "loss": 0.8789, + "step": 36631 + }, + { + "epoch": 0.94, + "learning_rate": 1.608644342662686e-06, + "loss": 0.7148, + "step": 36632 + }, + { + "epoch": 0.94, + "learning_rate": 1.6086223874970264e-06, + "loss": 0.8369, + "step": 36633 + }, + { + "epoch": 0.94, + "learning_rate": 1.6086004318653724e-06, + "loss": 0.8047, + "step": 36634 + }, + { + "epoch": 0.94, + "learning_rate": 1.6085784757677408e-06, + "loss": 0.6885, + "step": 36635 + }, + { + "epoch": 0.94, + "learning_rate": 1.608556519204149e-06, + "loss": 0.8848, + "step": 36636 + }, + { + "epoch": 0.94, + "learning_rate": 1.6085345621746132e-06, + "loss": 0.8364, + "step": 36637 + }, + { + "epoch": 0.94, + "learning_rate": 1.6085126046791507e-06, + "loss": 0.7988, + "step": 36638 + }, + { + "epoch": 0.94, + "learning_rate": 1.608490646717778e-06, + "loss": 0.8408, + "step": 36639 + }, + { + "epoch": 0.94, + "learning_rate": 1.6084686882905118e-06, + "loss": 0.9219, + "step": 36640 + }, + { + "epoch": 0.94, + "learning_rate": 1.6084467293973693e-06, + "loss": 0.7549, + "step": 36641 + }, + { + "epoch": 0.94, + "learning_rate": 1.608424770038367e-06, + "loss": 0.7939, + "step": 36642 + }, + { + "epoch": 0.94, + "learning_rate": 1.6084028102135221e-06, + "loss": 0.7041, + "step": 36643 + }, + { + "epoch": 0.94, + "learning_rate": 1.608380849922851e-06, + "loss": 0.6001, + "step": 36644 + }, + { + "epoch": 0.94, + "learning_rate": 1.6083588891663706e-06, + "loss": 0.9277, + "step": 36645 + }, + { + "epoch": 0.94, + "learning_rate": 1.6083369279440976e-06, + "loss": 0.7925, + "step": 36646 + }, + { + "epoch": 0.94, + "learning_rate": 1.6083149662560494e-06, + "loss": 0.7212, + "step": 36647 + }, + { + "epoch": 0.94, + "learning_rate": 1.6082930041022421e-06, + "loss": 0.8271, + "step": 36648 + }, + { + "epoch": 0.94, + "learning_rate": 1.608271041482693e-06, + "loss": 0.9668, + "step": 36649 + }, + { + "epoch": 0.94, + "learning_rate": 1.6082490783974186e-06, + "loss": 0.6892, + "step": 36650 + }, + { + "epoch": 0.94, + "learning_rate": 1.6082271148464358e-06, + "loss": 0.9375, + "step": 36651 + }, + { + "epoch": 0.94, + "learning_rate": 1.6082051508297615e-06, + "loss": 0.8096, + "step": 36652 + }, + { + "epoch": 0.94, + "learning_rate": 1.6081831863474124e-06, + "loss": 0.7368, + "step": 36653 + }, + { + "epoch": 0.94, + "learning_rate": 1.6081612213994058e-06, + "loss": 0.7031, + "step": 36654 + }, + { + "epoch": 0.94, + "learning_rate": 1.6081392559857576e-06, + "loss": 0.876, + "step": 36655 + }, + { + "epoch": 0.94, + "learning_rate": 1.6081172901064855e-06, + "loss": 0.6968, + "step": 36656 + }, + { + "epoch": 0.94, + "learning_rate": 1.6080953237616056e-06, + "loss": 0.9873, + "step": 36657 + }, + { + "epoch": 0.94, + "learning_rate": 1.6080733569511352e-06, + "loss": 0.7666, + "step": 36658 + }, + { + "epoch": 0.94, + "learning_rate": 1.6080513896750913e-06, + "loss": 1.0215, + "step": 36659 + }, + { + "epoch": 0.94, + "learning_rate": 1.6080294219334902e-06, + "loss": 0.7705, + "step": 36660 + }, + { + "epoch": 0.94, + "learning_rate": 1.608007453726349e-06, + "loss": 0.9844, + "step": 36661 + }, + { + "epoch": 0.94, + "learning_rate": 1.6079854850536842e-06, + "loss": 0.771, + "step": 36662 + }, + { + "epoch": 0.94, + "learning_rate": 1.6079635159155132e-06, + "loss": 0.8599, + "step": 36663 + }, + { + "epoch": 0.94, + "learning_rate": 1.6079415463118524e-06, + "loss": 0.8887, + "step": 36664 + }, + { + "epoch": 0.94, + "learning_rate": 1.6079195762427185e-06, + "loss": 0.9824, + "step": 36665 + }, + { + "epoch": 0.94, + "learning_rate": 1.6078976057081288e-06, + "loss": 0.8301, + "step": 36666 + }, + { + "epoch": 0.94, + "learning_rate": 1.6078756347080997e-06, + "loss": 0.6367, + "step": 36667 + }, + { + "epoch": 0.94, + "learning_rate": 1.6078536632426483e-06, + "loss": 1.0039, + "step": 36668 + }, + { + "epoch": 0.94, + "learning_rate": 1.607831691311791e-06, + "loss": 0.8564, + "step": 36669 + }, + { + "epoch": 0.94, + "learning_rate": 1.6078097189155452e-06, + "loss": 0.6245, + "step": 36670 + }, + { + "epoch": 0.94, + "learning_rate": 1.6077877460539273e-06, + "loss": 1.0015, + "step": 36671 + }, + { + "epoch": 0.94, + "learning_rate": 1.6077657727269544e-06, + "loss": 0.8506, + "step": 36672 + }, + { + "epoch": 0.94, + "learning_rate": 1.6077437989346434e-06, + "loss": 0.7358, + "step": 36673 + }, + { + "epoch": 0.94, + "learning_rate": 1.6077218246770104e-06, + "loss": 0.8584, + "step": 36674 + }, + { + "epoch": 0.94, + "learning_rate": 1.607699849954073e-06, + "loss": 0.9551, + "step": 36675 + }, + { + "epoch": 0.94, + "learning_rate": 1.6076778747658479e-06, + "loss": 0.9688, + "step": 36676 + }, + { + "epoch": 0.94, + "learning_rate": 1.6076558991123514e-06, + "loss": 0.8584, + "step": 36677 + }, + { + "epoch": 0.94, + "learning_rate": 1.6076339229936013e-06, + "loss": 0.8662, + "step": 36678 + }, + { + "epoch": 0.94, + "learning_rate": 1.6076119464096137e-06, + "loss": 0.9351, + "step": 36679 + }, + { + "epoch": 0.94, + "learning_rate": 1.6075899693604051e-06, + "loss": 0.9873, + "step": 36680 + }, + { + "epoch": 0.94, + "learning_rate": 1.6075679918459933e-06, + "loss": 0.7842, + "step": 36681 + }, + { + "epoch": 0.94, + "learning_rate": 1.6075460138663942e-06, + "loss": 0.6494, + "step": 36682 + }, + { + "epoch": 0.94, + "learning_rate": 1.6075240354216254e-06, + "loss": 0.9121, + "step": 36683 + }, + { + "epoch": 0.94, + "learning_rate": 1.6075020565117033e-06, + "loss": 0.7881, + "step": 36684 + }, + { + "epoch": 0.94, + "learning_rate": 1.6074800771366445e-06, + "loss": 0.7578, + "step": 36685 + }, + { + "epoch": 0.94, + "learning_rate": 1.6074580972964666e-06, + "loss": 0.8975, + "step": 36686 + }, + { + "epoch": 0.94, + "learning_rate": 1.6074361169911857e-06, + "loss": 0.7451, + "step": 36687 + }, + { + "epoch": 0.94, + "learning_rate": 1.6074141362208188e-06, + "loss": 0.771, + "step": 36688 + }, + { + "epoch": 0.94, + "learning_rate": 1.607392154985383e-06, + "loss": 0.6157, + "step": 36689 + }, + { + "epoch": 0.94, + "learning_rate": 1.6073701732848953e-06, + "loss": 0.8564, + "step": 36690 + }, + { + "epoch": 0.94, + "learning_rate": 1.6073481911193716e-06, + "loss": 0.9326, + "step": 36691 + }, + { + "epoch": 0.94, + "learning_rate": 1.6073262084888295e-06, + "loss": 1.1191, + "step": 36692 + }, + { + "epoch": 0.94, + "learning_rate": 1.6073042253932859e-06, + "loss": 0.9004, + "step": 36693 + }, + { + "epoch": 0.94, + "learning_rate": 1.6072822418327572e-06, + "loss": 0.8833, + "step": 36694 + }, + { + "epoch": 0.94, + "learning_rate": 1.6072602578072603e-06, + "loss": 0.8877, + "step": 36695 + }, + { + "epoch": 0.94, + "learning_rate": 1.6072382733168122e-06, + "loss": 0.7676, + "step": 36696 + }, + { + "epoch": 0.94, + "learning_rate": 1.6072162883614294e-06, + "loss": 0.6724, + "step": 36697 + }, + { + "epoch": 0.94, + "learning_rate": 1.6071943029411298e-06, + "loss": 0.8506, + "step": 36698 + }, + { + "epoch": 0.94, + "learning_rate": 1.6071723170559288e-06, + "loss": 0.7041, + "step": 36699 + }, + { + "epoch": 0.94, + "learning_rate": 1.607150330705844e-06, + "loss": 0.8057, + "step": 36700 + }, + { + "epoch": 0.94, + "learning_rate": 1.607128343890892e-06, + "loss": 0.749, + "step": 36701 + }, + { + "epoch": 0.94, + "learning_rate": 1.60710635661109e-06, + "loss": 0.9736, + "step": 36702 + }, + { + "epoch": 0.94, + "learning_rate": 1.6070843688664546e-06, + "loss": 0.8691, + "step": 36703 + }, + { + "epoch": 0.94, + "learning_rate": 1.6070623806570023e-06, + "loss": 1.082, + "step": 36704 + }, + { + "epoch": 0.94, + "learning_rate": 1.6070403919827506e-06, + "loss": 1.0273, + "step": 36705 + }, + { + "epoch": 0.94, + "learning_rate": 1.6070184028437156e-06, + "loss": 0.8838, + "step": 36706 + }, + { + "epoch": 0.94, + "learning_rate": 1.6069964132399147e-06, + "loss": 0.7666, + "step": 36707 + }, + { + "epoch": 0.94, + "learning_rate": 1.6069744231713646e-06, + "loss": 0.8135, + "step": 36708 + }, + { + "epoch": 0.94, + "learning_rate": 1.6069524326380823e-06, + "loss": 0.7568, + "step": 36709 + }, + { + "epoch": 0.94, + "learning_rate": 1.6069304416400842e-06, + "loss": 0.7734, + "step": 36710 + }, + { + "epoch": 0.94, + "learning_rate": 1.6069084501773873e-06, + "loss": 0.9238, + "step": 36711 + }, + { + "epoch": 0.94, + "learning_rate": 1.6068864582500086e-06, + "loss": 0.5776, + "step": 36712 + }, + { + "epoch": 0.94, + "learning_rate": 1.606864465857965e-06, + "loss": 0.876, + "step": 36713 + }, + { + "epoch": 0.94, + "learning_rate": 1.6068424730012731e-06, + "loss": 0.9404, + "step": 36714 + }, + { + "epoch": 0.94, + "learning_rate": 1.6068204796799494e-06, + "loss": 1.002, + "step": 36715 + }, + { + "epoch": 0.94, + "learning_rate": 1.6067984858940116e-06, + "loss": 0.6699, + "step": 36716 + }, + { + "epoch": 0.94, + "learning_rate": 1.606776491643476e-06, + "loss": 0.7275, + "step": 36717 + }, + { + "epoch": 0.94, + "learning_rate": 1.6067544969283597e-06, + "loss": 0.9316, + "step": 36718 + }, + { + "epoch": 0.94, + "learning_rate": 1.606732501748679e-06, + "loss": 1.0498, + "step": 36719 + }, + { + "epoch": 0.94, + "learning_rate": 1.6067105061044514e-06, + "loss": 0.709, + "step": 36720 + }, + { + "epoch": 0.94, + "learning_rate": 1.6066885099956933e-06, + "loss": 0.9033, + "step": 36721 + }, + { + "epoch": 0.94, + "learning_rate": 1.606666513422422e-06, + "loss": 0.6382, + "step": 36722 + }, + { + "epoch": 0.94, + "learning_rate": 1.6066445163846539e-06, + "loss": 0.7324, + "step": 36723 + }, + { + "epoch": 0.94, + "learning_rate": 1.6066225188824058e-06, + "loss": 0.958, + "step": 36724 + }, + { + "epoch": 0.94, + "learning_rate": 1.606600520915695e-06, + "loss": 0.8828, + "step": 36725 + }, + { + "epoch": 0.94, + "learning_rate": 1.6065785224845378e-06, + "loss": 0.8789, + "step": 36726 + }, + { + "epoch": 0.94, + "learning_rate": 1.6065565235889515e-06, + "loss": 0.7031, + "step": 36727 + }, + { + "epoch": 0.94, + "learning_rate": 1.6065345242289527e-06, + "loss": 0.835, + "step": 36728 + }, + { + "epoch": 0.94, + "learning_rate": 1.6065125244045583e-06, + "loss": 0.6587, + "step": 36729 + }, + { + "epoch": 0.94, + "learning_rate": 1.6064905241157853e-06, + "loss": 0.5886, + "step": 36730 + }, + { + "epoch": 0.94, + "learning_rate": 1.60646852336265e-06, + "loss": 0.9912, + "step": 36731 + }, + { + "epoch": 0.94, + "learning_rate": 1.60644652214517e-06, + "loss": 0.9395, + "step": 36732 + }, + { + "epoch": 0.94, + "learning_rate": 1.6064245204633617e-06, + "loss": 0.8467, + "step": 36733 + }, + { + "epoch": 0.94, + "learning_rate": 1.606402518317242e-06, + "loss": 0.7959, + "step": 36734 + }, + { + "epoch": 0.94, + "learning_rate": 1.606380515706828e-06, + "loss": 0.9189, + "step": 36735 + }, + { + "epoch": 0.94, + "learning_rate": 1.6063585126321359e-06, + "loss": 0.7979, + "step": 36736 + }, + { + "epoch": 0.94, + "learning_rate": 1.6063365090931833e-06, + "loss": 0.8721, + "step": 36737 + }, + { + "epoch": 0.94, + "learning_rate": 1.6063145050899866e-06, + "loss": 0.6851, + "step": 36738 + }, + { + "epoch": 0.94, + "learning_rate": 1.6062925006225627e-06, + "loss": 0.7402, + "step": 36739 + }, + { + "epoch": 0.94, + "learning_rate": 1.6062704956909286e-06, + "loss": 0.8086, + "step": 36740 + }, + { + "epoch": 0.94, + "learning_rate": 1.606248490295101e-06, + "loss": 0.7065, + "step": 36741 + }, + { + "epoch": 0.94, + "learning_rate": 1.6062264844350968e-06, + "loss": 0.8516, + "step": 36742 + }, + { + "epoch": 0.94, + "learning_rate": 1.606204478110933e-06, + "loss": 0.8457, + "step": 36743 + }, + { + "epoch": 0.94, + "learning_rate": 1.6061824713226262e-06, + "loss": 0.9531, + "step": 36744 + }, + { + "epoch": 0.94, + "learning_rate": 1.6061604640701933e-06, + "loss": 0.8525, + "step": 36745 + }, + { + "epoch": 0.94, + "learning_rate": 1.6061384563536512e-06, + "loss": 0.6855, + "step": 36746 + }, + { + "epoch": 0.94, + "learning_rate": 1.606116448173017e-06, + "loss": 0.5852, + "step": 36747 + }, + { + "epoch": 0.94, + "learning_rate": 1.6060944395283072e-06, + "loss": 0.8467, + "step": 36748 + }, + { + "epoch": 0.94, + "learning_rate": 1.6060724304195383e-06, + "loss": 1.0449, + "step": 36749 + }, + { + "epoch": 0.94, + "learning_rate": 1.6060504208467283e-06, + "loss": 0.8496, + "step": 36750 + }, + { + "epoch": 0.94, + "learning_rate": 1.606028410809893e-06, + "loss": 0.5876, + "step": 36751 + }, + { + "epoch": 0.94, + "learning_rate": 1.6060064003090496e-06, + "loss": 0.9053, + "step": 36752 + }, + { + "epoch": 0.94, + "learning_rate": 1.6059843893442149e-06, + "loss": 0.8291, + "step": 36753 + }, + { + "epoch": 0.94, + "learning_rate": 1.6059623779154058e-06, + "loss": 0.9688, + "step": 36754 + }, + { + "epoch": 0.94, + "learning_rate": 1.6059403660226395e-06, + "loss": 0.8379, + "step": 36755 + }, + { + "epoch": 0.94, + "learning_rate": 1.6059183536659324e-06, + "loss": 0.8281, + "step": 36756 + }, + { + "epoch": 0.94, + "learning_rate": 1.6058963408453012e-06, + "loss": 0.7578, + "step": 36757 + }, + { + "epoch": 0.94, + "learning_rate": 1.6058743275607634e-06, + "loss": 0.8101, + "step": 36758 + }, + { + "epoch": 0.94, + "learning_rate": 1.6058523138123352e-06, + "loss": 0.9409, + "step": 36759 + }, + { + "epoch": 0.94, + "learning_rate": 1.605830299600034e-06, + "loss": 0.8242, + "step": 36760 + }, + { + "epoch": 0.94, + "learning_rate": 1.6058082849238761e-06, + "loss": 0.9248, + "step": 36761 + }, + { + "epoch": 0.94, + "learning_rate": 1.6057862697838788e-06, + "loss": 1.0156, + "step": 36762 + }, + { + "epoch": 0.94, + "learning_rate": 1.605764254180059e-06, + "loss": 0.9922, + "step": 36763 + }, + { + "epoch": 0.94, + "learning_rate": 1.605742238112433e-06, + "loss": 0.6904, + "step": 36764 + }, + { + "epoch": 0.94, + "learning_rate": 1.6057202215810183e-06, + "loss": 0.9961, + "step": 36765 + }, + { + "epoch": 0.94, + "learning_rate": 1.6056982045858315e-06, + "loss": 0.7861, + "step": 36766 + }, + { + "epoch": 0.94, + "learning_rate": 1.6056761871268894e-06, + "loss": 0.8516, + "step": 36767 + }, + { + "epoch": 0.94, + "learning_rate": 1.6056541692042086e-06, + "loss": 0.7261, + "step": 36768 + }, + { + "epoch": 0.94, + "learning_rate": 1.6056321508178066e-06, + "loss": 0.7871, + "step": 36769 + }, + { + "epoch": 0.94, + "learning_rate": 1.6056101319676997e-06, + "loss": 0.8682, + "step": 36770 + }, + { + "epoch": 0.94, + "learning_rate": 1.605588112653905e-06, + "loss": 0.9756, + "step": 36771 + }, + { + "epoch": 0.94, + "learning_rate": 1.6055660928764393e-06, + "loss": 0.9844, + "step": 36772 + }, + { + "epoch": 0.94, + "learning_rate": 1.6055440726353195e-06, + "loss": 0.873, + "step": 36773 + }, + { + "epoch": 0.94, + "learning_rate": 1.6055220519305626e-06, + "loss": 0.835, + "step": 36774 + }, + { + "epoch": 0.94, + "learning_rate": 1.6055000307621853e-06, + "loss": 1.001, + "step": 36775 + }, + { + "epoch": 0.94, + "learning_rate": 1.6054780091302043e-06, + "loss": 0.8506, + "step": 36776 + }, + { + "epoch": 0.94, + "learning_rate": 1.6054559870346367e-06, + "loss": 0.8115, + "step": 36777 + }, + { + "epoch": 0.94, + "learning_rate": 1.6054339644754996e-06, + "loss": 0.7075, + "step": 36778 + }, + { + "epoch": 0.94, + "learning_rate": 1.6054119414528091e-06, + "loss": 0.7642, + "step": 36779 + }, + { + "epoch": 0.94, + "learning_rate": 1.6053899179665824e-06, + "loss": 0.9297, + "step": 36780 + }, + { + "epoch": 0.94, + "learning_rate": 1.6053678940168366e-06, + "loss": 0.9375, + "step": 36781 + }, + { + "epoch": 0.94, + "learning_rate": 1.6053458696035889e-06, + "loss": 0.833, + "step": 36782 + }, + { + "epoch": 0.94, + "learning_rate": 1.6053238447268553e-06, + "loss": 0.8701, + "step": 36783 + }, + { + "epoch": 0.94, + "learning_rate": 1.6053018193866532e-06, + "loss": 0.9707, + "step": 36784 + }, + { + "epoch": 0.94, + "learning_rate": 1.6052797935829992e-06, + "loss": 0.7939, + "step": 36785 + }, + { + "epoch": 0.94, + "learning_rate": 1.6052577673159104e-06, + "loss": 0.8198, + "step": 36786 + }, + { + "epoch": 0.94, + "learning_rate": 1.6052357405854035e-06, + "loss": 0.7764, + "step": 36787 + }, + { + "epoch": 0.94, + "learning_rate": 1.6052137133914956e-06, + "loss": 0.9912, + "step": 36788 + }, + { + "epoch": 0.94, + "learning_rate": 1.6051916857342032e-06, + "loss": 0.75, + "step": 36789 + }, + { + "epoch": 0.94, + "learning_rate": 1.6051696576135435e-06, + "loss": 1.0244, + "step": 36790 + }, + { + "epoch": 0.94, + "learning_rate": 1.6051476290295328e-06, + "loss": 0.7441, + "step": 36791 + }, + { + "epoch": 0.94, + "learning_rate": 1.6051255999821888e-06, + "loss": 0.8013, + "step": 36792 + }, + { + "epoch": 0.94, + "learning_rate": 1.605103570471528e-06, + "loss": 0.7422, + "step": 36793 + }, + { + "epoch": 0.94, + "learning_rate": 1.6050815404975671e-06, + "loss": 1.0225, + "step": 36794 + }, + { + "epoch": 0.94, + "learning_rate": 1.6050595100603231e-06, + "loss": 0.6857, + "step": 36795 + }, + { + "epoch": 0.94, + "learning_rate": 1.6050374791598127e-06, + "loss": 0.792, + "step": 36796 + }, + { + "epoch": 0.94, + "learning_rate": 1.6050154477960531e-06, + "loss": 0.8867, + "step": 36797 + }, + { + "epoch": 0.94, + "learning_rate": 1.6049934159690608e-06, + "loss": 0.7871, + "step": 36798 + }, + { + "epoch": 0.94, + "learning_rate": 1.604971383678853e-06, + "loss": 0.6265, + "step": 36799 + }, + { + "epoch": 0.94, + "learning_rate": 1.6049493509254463e-06, + "loss": 0.8262, + "step": 36800 + }, + { + "epoch": 0.94, + "learning_rate": 1.604927317708858e-06, + "loss": 0.9629, + "step": 36801 + }, + { + "epoch": 0.94, + "learning_rate": 1.6049052840291047e-06, + "loss": 0.9238, + "step": 36802 + }, + { + "epoch": 0.94, + "learning_rate": 1.604883249886203e-06, + "loss": 0.8799, + "step": 36803 + }, + { + "epoch": 0.94, + "learning_rate": 1.6048612152801698e-06, + "loss": 0.8721, + "step": 36804 + }, + { + "epoch": 0.94, + "learning_rate": 1.6048391802110223e-06, + "loss": 0.8535, + "step": 36805 + }, + { + "epoch": 0.94, + "learning_rate": 1.6048171446787775e-06, + "loss": 0.7969, + "step": 36806 + }, + { + "epoch": 0.94, + "learning_rate": 1.604795108683452e-06, + "loss": 0.6964, + "step": 36807 + }, + { + "epoch": 0.94, + "learning_rate": 1.6047730722250626e-06, + "loss": 0.7656, + "step": 36808 + }, + { + "epoch": 0.94, + "learning_rate": 1.604751035303626e-06, + "loss": 0.8096, + "step": 36809 + }, + { + "epoch": 0.94, + "learning_rate": 1.6047289979191598e-06, + "loss": 0.6191, + "step": 36810 + }, + { + "epoch": 0.94, + "learning_rate": 1.60470696007168e-06, + "loss": 0.6587, + "step": 36811 + }, + { + "epoch": 0.94, + "learning_rate": 1.6046849217612043e-06, + "loss": 0.9971, + "step": 36812 + }, + { + "epoch": 0.94, + "learning_rate": 1.604662882987749e-06, + "loss": 1.0283, + "step": 36813 + }, + { + "epoch": 0.94, + "learning_rate": 1.6046408437513308e-06, + "loss": 0.7471, + "step": 36814 + }, + { + "epoch": 0.94, + "learning_rate": 1.6046188040519673e-06, + "loss": 0.9785, + "step": 36815 + }, + { + "epoch": 0.94, + "learning_rate": 1.604596763889675e-06, + "loss": 0.7725, + "step": 36816 + }, + { + "epoch": 0.94, + "learning_rate": 1.6045747232644703e-06, + "loss": 0.8447, + "step": 36817 + }, + { + "epoch": 0.94, + "learning_rate": 1.6045526821763708e-06, + "loss": 0.8359, + "step": 36818 + }, + { + "epoch": 0.94, + "learning_rate": 1.6045306406253933e-06, + "loss": 0.8906, + "step": 36819 + }, + { + "epoch": 0.94, + "learning_rate": 1.6045085986115543e-06, + "loss": 1.0557, + "step": 36820 + }, + { + "epoch": 0.94, + "learning_rate": 1.6044865561348711e-06, + "loss": 0.7002, + "step": 36821 + }, + { + "epoch": 0.94, + "learning_rate": 1.60446451319536e-06, + "loss": 0.9922, + "step": 36822 + }, + { + "epoch": 0.94, + "learning_rate": 1.6044424697930382e-06, + "loss": 0.9639, + "step": 36823 + }, + { + "epoch": 0.94, + "learning_rate": 1.604420425927923e-06, + "loss": 0.5459, + "step": 36824 + }, + { + "epoch": 0.94, + "learning_rate": 1.6043983816000305e-06, + "loss": 0.6255, + "step": 36825 + }, + { + "epoch": 0.94, + "learning_rate": 1.604376336809378e-06, + "loss": 0.96, + "step": 36826 + }, + { + "epoch": 0.94, + "learning_rate": 1.6043542915559826e-06, + "loss": 0.8955, + "step": 36827 + }, + { + "epoch": 0.94, + "learning_rate": 1.6043322458398607e-06, + "loss": 0.7725, + "step": 36828 + }, + { + "epoch": 0.94, + "learning_rate": 1.6043101996610293e-06, + "loss": 0.8262, + "step": 36829 + }, + { + "epoch": 0.94, + "learning_rate": 1.6042881530195056e-06, + "loss": 0.9531, + "step": 36830 + }, + { + "epoch": 0.94, + "learning_rate": 1.6042661059153061e-06, + "loss": 0.7095, + "step": 36831 + }, + { + "epoch": 0.94, + "learning_rate": 1.604244058348448e-06, + "loss": 0.9463, + "step": 36832 + }, + { + "epoch": 0.94, + "learning_rate": 1.604222010318948e-06, + "loss": 1.0156, + "step": 36833 + }, + { + "epoch": 0.94, + "learning_rate": 1.6041999618268225e-06, + "loss": 0.8057, + "step": 36834 + }, + { + "epoch": 0.94, + "learning_rate": 1.6041779128720894e-06, + "loss": 0.7979, + "step": 36835 + }, + { + "epoch": 0.94, + "learning_rate": 1.604155863454765e-06, + "loss": 0.8701, + "step": 36836 + }, + { + "epoch": 0.94, + "learning_rate": 1.6041338135748662e-06, + "loss": 0.834, + "step": 36837 + }, + { + "epoch": 0.94, + "learning_rate": 1.6041117632324096e-06, + "loss": 0.9258, + "step": 36838 + }, + { + "epoch": 0.94, + "learning_rate": 1.6040897124274126e-06, + "loss": 0.9775, + "step": 36839 + }, + { + "epoch": 0.94, + "learning_rate": 1.6040676611598918e-06, + "loss": 0.6758, + "step": 36840 + }, + { + "epoch": 0.94, + "learning_rate": 1.6040456094298645e-06, + "loss": 0.9102, + "step": 36841 + }, + { + "epoch": 0.94, + "learning_rate": 1.6040235572373471e-06, + "loss": 0.8223, + "step": 36842 + }, + { + "epoch": 0.94, + "learning_rate": 1.6040015045823565e-06, + "loss": 0.8047, + "step": 36843 + }, + { + "epoch": 0.94, + "learning_rate": 1.6039794514649096e-06, + "loss": 0.6562, + "step": 36844 + }, + { + "epoch": 0.94, + "learning_rate": 1.6039573978850236e-06, + "loss": 0.9961, + "step": 36845 + }, + { + "epoch": 0.94, + "learning_rate": 1.603935343842715e-06, + "loss": 0.8184, + "step": 36846 + }, + { + "epoch": 0.94, + "learning_rate": 1.6039132893380013e-06, + "loss": 0.752, + "step": 36847 + }, + { + "epoch": 0.94, + "learning_rate": 1.6038912343708985e-06, + "loss": 0.9023, + "step": 36848 + }, + { + "epoch": 0.94, + "learning_rate": 1.6038691789414242e-06, + "loss": 0.9316, + "step": 36849 + }, + { + "epoch": 0.94, + "learning_rate": 1.6038471230495952e-06, + "loss": 1.0342, + "step": 36850 + }, + { + "epoch": 0.94, + "learning_rate": 1.603825066695428e-06, + "loss": 0.9771, + "step": 36851 + }, + { + "epoch": 0.94, + "learning_rate": 1.6038030098789398e-06, + "loss": 0.7437, + "step": 36852 + }, + { + "epoch": 0.94, + "learning_rate": 1.6037809526001473e-06, + "loss": 0.6604, + "step": 36853 + }, + { + "epoch": 0.94, + "learning_rate": 1.6037588948590678e-06, + "loss": 0.7939, + "step": 36854 + }, + { + "epoch": 0.94, + "learning_rate": 1.6037368366557174e-06, + "loss": 0.792, + "step": 36855 + }, + { + "epoch": 0.94, + "learning_rate": 1.6037147779901137e-06, + "loss": 0.8369, + "step": 36856 + }, + { + "epoch": 0.94, + "learning_rate": 1.6036927188622732e-06, + "loss": 0.8408, + "step": 36857 + }, + { + "epoch": 0.94, + "learning_rate": 1.603670659272213e-06, + "loss": 0.8857, + "step": 36858 + }, + { + "epoch": 0.94, + "learning_rate": 1.6036485992199503e-06, + "loss": 0.8906, + "step": 36859 + }, + { + "epoch": 0.94, + "learning_rate": 1.6036265387055013e-06, + "loss": 0.835, + "step": 36860 + }, + { + "epoch": 0.94, + "learning_rate": 1.603604477728883e-06, + "loss": 0.7085, + "step": 36861 + }, + { + "epoch": 0.94, + "learning_rate": 1.6035824162901127e-06, + "loss": 0.73, + "step": 36862 + }, + { + "epoch": 0.94, + "learning_rate": 1.6035603543892071e-06, + "loss": 0.9736, + "step": 36863 + }, + { + "epoch": 0.94, + "learning_rate": 1.6035382920261832e-06, + "loss": 0.5967, + "step": 36864 + }, + { + "epoch": 0.94, + "learning_rate": 1.6035162292010578e-06, + "loss": 0.729, + "step": 36865 + }, + { + "epoch": 0.94, + "learning_rate": 1.6034941659138474e-06, + "loss": 0.647, + "step": 36866 + }, + { + "epoch": 0.94, + "learning_rate": 1.6034721021645698e-06, + "loss": 0.8613, + "step": 36867 + }, + { + "epoch": 0.94, + "learning_rate": 1.6034500379532412e-06, + "loss": 0.8281, + "step": 36868 + }, + { + "epoch": 0.94, + "learning_rate": 1.6034279732798784e-06, + "loss": 0.7393, + "step": 36869 + }, + { + "epoch": 0.94, + "learning_rate": 1.6034059081444988e-06, + "loss": 0.8281, + "step": 36870 + }, + { + "epoch": 0.95, + "learning_rate": 1.603383842547119e-06, + "loss": 0.5913, + "step": 36871 + }, + { + "epoch": 0.95, + "learning_rate": 1.6033617764877559e-06, + "loss": 0.7466, + "step": 36872 + }, + { + "epoch": 0.95, + "learning_rate": 1.6033397099664266e-06, + "loss": 0.8008, + "step": 36873 + }, + { + "epoch": 0.95, + "learning_rate": 1.6033176429831473e-06, + "loss": 0.6978, + "step": 36874 + }, + { + "epoch": 0.95, + "learning_rate": 1.6032955755379361e-06, + "loss": 0.7944, + "step": 36875 + }, + { + "epoch": 0.95, + "learning_rate": 1.6032735076308086e-06, + "loss": 0.8018, + "step": 36876 + }, + { + "epoch": 0.95, + "learning_rate": 1.6032514392617826e-06, + "loss": 0.9102, + "step": 36877 + }, + { + "epoch": 0.95, + "learning_rate": 1.603229370430875e-06, + "loss": 0.9385, + "step": 36878 + }, + { + "epoch": 0.95, + "learning_rate": 1.603207301138102e-06, + "loss": 0.9297, + "step": 36879 + }, + { + "epoch": 0.95, + "learning_rate": 1.603185231383481e-06, + "loss": 0.8027, + "step": 36880 + }, + { + "epoch": 0.95, + "learning_rate": 1.6031631611670288e-06, + "loss": 0.8359, + "step": 36881 + }, + { + "epoch": 0.95, + "learning_rate": 1.6031410904887623e-06, + "loss": 0.855, + "step": 36882 + }, + { + "epoch": 0.95, + "learning_rate": 1.6031190193486985e-06, + "loss": 0.8154, + "step": 36883 + }, + { + "epoch": 0.95, + "learning_rate": 1.6030969477468541e-06, + "loss": 0.644, + "step": 36884 + }, + { + "epoch": 0.95, + "learning_rate": 1.6030748756832462e-06, + "loss": 0.4723, + "step": 36885 + }, + { + "epoch": 0.95, + "learning_rate": 1.6030528031578915e-06, + "loss": 0.7651, + "step": 36886 + }, + { + "epoch": 0.95, + "learning_rate": 1.603030730170807e-06, + "loss": 0.9414, + "step": 36887 + }, + { + "epoch": 0.95, + "learning_rate": 1.6030086567220096e-06, + "loss": 0.8838, + "step": 36888 + }, + { + "epoch": 0.95, + "learning_rate": 1.6029865828115164e-06, + "loss": 0.7988, + "step": 36889 + }, + { + "epoch": 0.95, + "learning_rate": 1.6029645084393437e-06, + "loss": 0.9004, + "step": 36890 + }, + { + "epoch": 0.95, + "learning_rate": 1.602942433605509e-06, + "loss": 0.9619, + "step": 36891 + }, + { + "epoch": 0.95, + "learning_rate": 1.6029203583100292e-06, + "loss": 0.8252, + "step": 36892 + }, + { + "epoch": 0.95, + "learning_rate": 1.6028982825529207e-06, + "loss": 1.0684, + "step": 36893 + }, + { + "epoch": 0.95, + "learning_rate": 1.6028762063342009e-06, + "loss": 0.709, + "step": 36894 + }, + { + "epoch": 0.95, + "learning_rate": 1.6028541296538864e-06, + "loss": 0.7715, + "step": 36895 + }, + { + "epoch": 0.95, + "learning_rate": 1.6028320525119943e-06, + "loss": 0.8818, + "step": 36896 + }, + { + "epoch": 0.95, + "learning_rate": 1.6028099749085416e-06, + "loss": 0.6101, + "step": 36897 + }, + { + "epoch": 0.95, + "learning_rate": 1.6027878968435447e-06, + "loss": 0.9248, + "step": 36898 + }, + { + "epoch": 0.95, + "learning_rate": 1.602765818317021e-06, + "loss": 1.082, + "step": 36899 + }, + { + "epoch": 0.95, + "learning_rate": 1.6027437393289868e-06, + "loss": 1.0117, + "step": 36900 + }, + { + "epoch": 0.95, + "learning_rate": 1.6027216598794597e-06, + "loss": 0.9033, + "step": 36901 + }, + { + "epoch": 0.95, + "learning_rate": 1.6026995799684566e-06, + "loss": 0.8828, + "step": 36902 + }, + { + "epoch": 0.95, + "learning_rate": 1.6026774995959941e-06, + "loss": 0.8711, + "step": 36903 + }, + { + "epoch": 0.95, + "learning_rate": 1.6026554187620889e-06, + "loss": 0.8574, + "step": 36904 + }, + { + "epoch": 0.95, + "learning_rate": 1.6026333374667584e-06, + "loss": 0.9961, + "step": 36905 + }, + { + "epoch": 0.95, + "learning_rate": 1.6026112557100188e-06, + "loss": 0.749, + "step": 36906 + }, + { + "epoch": 0.95, + "learning_rate": 1.6025891734918878e-06, + "loss": 0.7681, + "step": 36907 + }, + { + "epoch": 0.95, + "learning_rate": 1.602567090812382e-06, + "loss": 0.9629, + "step": 36908 + }, + { + "epoch": 0.95, + "learning_rate": 1.6025450076715186e-06, + "loss": 0.6606, + "step": 36909 + }, + { + "epoch": 0.95, + "learning_rate": 1.6025229240693136e-06, + "loss": 1.082, + "step": 36910 + }, + { + "epoch": 0.95, + "learning_rate": 1.6025008400057848e-06, + "loss": 0.7183, + "step": 36911 + }, + { + "epoch": 0.95, + "learning_rate": 1.602478755480949e-06, + "loss": 0.7002, + "step": 36912 + }, + { + "epoch": 0.95, + "learning_rate": 1.6024566704948225e-06, + "loss": 0.7344, + "step": 36913 + }, + { + "epoch": 0.95, + "learning_rate": 1.602434585047423e-06, + "loss": 0.7388, + "step": 36914 + }, + { + "epoch": 0.95, + "learning_rate": 1.6024124991387669e-06, + "loss": 0.8162, + "step": 36915 + }, + { + "epoch": 0.95, + "learning_rate": 1.602390412768871e-06, + "loss": 0.6685, + "step": 36916 + }, + { + "epoch": 0.95, + "learning_rate": 1.602368325937753e-06, + "loss": 0.873, + "step": 36917 + }, + { + "epoch": 0.95, + "learning_rate": 1.6023462386454286e-06, + "loss": 1.0195, + "step": 36918 + }, + { + "epoch": 0.95, + "learning_rate": 1.6023241508919158e-06, + "loss": 0.8916, + "step": 36919 + }, + { + "epoch": 0.95, + "learning_rate": 1.602302062677231e-06, + "loss": 0.7959, + "step": 36920 + }, + { + "epoch": 0.95, + "learning_rate": 1.6022799740013913e-06, + "loss": 0.5293, + "step": 36921 + }, + { + "epoch": 0.95, + "learning_rate": 1.6022578848644134e-06, + "loss": 0.832, + "step": 36922 + }, + { + "epoch": 0.95, + "learning_rate": 1.6022357952663144e-06, + "loss": 0.6704, + "step": 36923 + }, + { + "epoch": 0.95, + "learning_rate": 1.6022137052071111e-06, + "loss": 0.9746, + "step": 36924 + }, + { + "epoch": 0.95, + "learning_rate": 1.6021916146868204e-06, + "loss": 0.958, + "step": 36925 + }, + { + "epoch": 0.95, + "learning_rate": 1.6021695237054594e-06, + "loss": 0.709, + "step": 36926 + }, + { + "epoch": 0.95, + "learning_rate": 1.6021474322630448e-06, + "loss": 0.8838, + "step": 36927 + }, + { + "epoch": 0.95, + "learning_rate": 1.6021253403595938e-06, + "loss": 0.7129, + "step": 36928 + }, + { + "epoch": 0.95, + "learning_rate": 1.6021032479951226e-06, + "loss": 0.9561, + "step": 36929 + }, + { + "epoch": 0.95, + "learning_rate": 1.602081155169649e-06, + "loss": 0.8027, + "step": 36930 + }, + { + "epoch": 0.95, + "learning_rate": 1.6020590618831897e-06, + "loss": 0.7109, + "step": 36931 + }, + { + "epoch": 0.95, + "learning_rate": 1.6020369681357613e-06, + "loss": 0.8711, + "step": 36932 + }, + { + "epoch": 0.95, + "learning_rate": 1.6020148739273807e-06, + "loss": 0.4648, + "step": 36933 + }, + { + "epoch": 0.95, + "learning_rate": 1.6019927792580651e-06, + "loss": 0.5925, + "step": 36934 + }, + { + "epoch": 0.95, + "learning_rate": 1.6019706841278313e-06, + "loss": 0.8691, + "step": 36935 + }, + { + "epoch": 0.95, + "learning_rate": 1.6019485885366963e-06, + "loss": 0.8359, + "step": 36936 + }, + { + "epoch": 0.95, + "learning_rate": 1.6019264924846772e-06, + "loss": 0.915, + "step": 36937 + }, + { + "epoch": 0.95, + "learning_rate": 1.6019043959717901e-06, + "loss": 0.5112, + "step": 36938 + }, + { + "epoch": 0.95, + "learning_rate": 1.601882298998053e-06, + "loss": 0.6816, + "step": 36939 + }, + { + "epoch": 0.95, + "learning_rate": 1.601860201563482e-06, + "loss": 0.7905, + "step": 36940 + }, + { + "epoch": 0.95, + "learning_rate": 1.6018381036680944e-06, + "loss": 0.8301, + "step": 36941 + }, + { + "epoch": 0.95, + "learning_rate": 1.6018160053119072e-06, + "loss": 0.7598, + "step": 36942 + }, + { + "epoch": 0.95, + "learning_rate": 1.6017939064949366e-06, + "loss": 0.7134, + "step": 36943 + }, + { + "epoch": 0.95, + "learning_rate": 1.6017718072172006e-06, + "loss": 0.8945, + "step": 36944 + }, + { + "epoch": 0.95, + "learning_rate": 1.6017497074787153e-06, + "loss": 0.9561, + "step": 36945 + }, + { + "epoch": 0.95, + "learning_rate": 1.6017276072794981e-06, + "loss": 1.001, + "step": 36946 + }, + { + "epoch": 0.95, + "learning_rate": 1.6017055066195658e-06, + "loss": 0.6128, + "step": 36947 + }, + { + "epoch": 0.95, + "learning_rate": 1.6016834054989351e-06, + "loss": 0.8828, + "step": 36948 + }, + { + "epoch": 0.95, + "learning_rate": 1.6016613039176232e-06, + "loss": 0.9219, + "step": 36949 + }, + { + "epoch": 0.95, + "learning_rate": 1.6016392018756468e-06, + "loss": 0.9316, + "step": 36950 + }, + { + "epoch": 0.95, + "learning_rate": 1.601617099373023e-06, + "loss": 0.8945, + "step": 36951 + }, + { + "epoch": 0.95, + "learning_rate": 1.6015949964097688e-06, + "loss": 0.8838, + "step": 36952 + }, + { + "epoch": 0.95, + "learning_rate": 1.6015728929859008e-06, + "loss": 0.6816, + "step": 36953 + }, + { + "epoch": 0.95, + "learning_rate": 1.601550789101436e-06, + "loss": 0.9443, + "step": 36954 + }, + { + "epoch": 0.95, + "learning_rate": 1.6015286847563914e-06, + "loss": 0.5864, + "step": 36955 + }, + { + "epoch": 0.95, + "learning_rate": 1.6015065799507842e-06, + "loss": 0.7354, + "step": 36956 + }, + { + "epoch": 0.95, + "learning_rate": 1.6014844746846307e-06, + "loss": 0.5762, + "step": 36957 + }, + { + "epoch": 0.95, + "learning_rate": 1.6014623689579486e-06, + "loss": 1.0107, + "step": 36958 + }, + { + "epoch": 0.95, + "learning_rate": 1.6014402627707542e-06, + "loss": 1.0137, + "step": 36959 + }, + { + "epoch": 0.95, + "learning_rate": 1.6014181561230648e-06, + "loss": 0.8457, + "step": 36960 + }, + { + "epoch": 0.95, + "learning_rate": 1.6013960490148968e-06, + "loss": 0.874, + "step": 36961 + }, + { + "epoch": 0.95, + "learning_rate": 1.601373941446268e-06, + "loss": 0.6431, + "step": 36962 + }, + { + "epoch": 0.95, + "learning_rate": 1.6013518334171945e-06, + "loss": 0.8721, + "step": 36963 + }, + { + "epoch": 0.95, + "learning_rate": 1.6013297249276936e-06, + "loss": 1.04, + "step": 36964 + }, + { + "epoch": 0.95, + "learning_rate": 1.6013076159777822e-06, + "loss": 0.8447, + "step": 36965 + }, + { + "epoch": 0.95, + "learning_rate": 1.6012855065674773e-06, + "loss": 0.8105, + "step": 36966 + }, + { + "epoch": 0.95, + "learning_rate": 1.6012633966967956e-06, + "loss": 0.8721, + "step": 36967 + }, + { + "epoch": 0.95, + "learning_rate": 1.6012412863657544e-06, + "loss": 0.7739, + "step": 36968 + }, + { + "epoch": 0.95, + "learning_rate": 1.60121917557437e-06, + "loss": 0.8516, + "step": 36969 + }, + { + "epoch": 0.95, + "learning_rate": 1.60119706432266e-06, + "loss": 0.7993, + "step": 36970 + }, + { + "epoch": 0.95, + "learning_rate": 1.601174952610641e-06, + "loss": 0.7471, + "step": 36971 + }, + { + "epoch": 0.95, + "learning_rate": 1.60115284043833e-06, + "loss": 0.7302, + "step": 36972 + }, + { + "epoch": 0.95, + "learning_rate": 1.6011307278057439e-06, + "loss": 0.8721, + "step": 36973 + }, + { + "epoch": 0.95, + "learning_rate": 1.6011086147128997e-06, + "loss": 0.7686, + "step": 36974 + }, + { + "epoch": 0.95, + "learning_rate": 1.601086501159814e-06, + "loss": 0.873, + "step": 36975 + }, + { + "epoch": 0.95, + "learning_rate": 1.6010643871465044e-06, + "loss": 0.8516, + "step": 36976 + }, + { + "epoch": 0.95, + "learning_rate": 1.6010422726729874e-06, + "loss": 0.9727, + "step": 36977 + }, + { + "epoch": 0.95, + "learning_rate": 1.6010201577392797e-06, + "loss": 0.7666, + "step": 36978 + }, + { + "epoch": 0.95, + "learning_rate": 1.6009980423453985e-06, + "loss": 0.8423, + "step": 36979 + }, + { + "epoch": 0.95, + "learning_rate": 1.600975926491361e-06, + "loss": 0.8867, + "step": 36980 + }, + { + "epoch": 0.95, + "learning_rate": 1.6009538101771836e-06, + "loss": 0.9297, + "step": 36981 + }, + { + "epoch": 0.95, + "learning_rate": 1.6009316934028837e-06, + "loss": 0.9395, + "step": 36982 + }, + { + "epoch": 0.95, + "learning_rate": 1.6009095761684778e-06, + "loss": 0.8469, + "step": 36983 + }, + { + "epoch": 0.95, + "learning_rate": 1.6008874584739834e-06, + "loss": 0.771, + "step": 36984 + }, + { + "epoch": 0.95, + "learning_rate": 1.6008653403194168e-06, + "loss": 0.9502, + "step": 36985 + }, + { + "epoch": 0.95, + "learning_rate": 1.6008432217047953e-06, + "loss": 0.8203, + "step": 36986 + }, + { + "epoch": 0.95, + "learning_rate": 1.600821102630136e-06, + "loss": 1.0371, + "step": 36987 + }, + { + "epoch": 0.95, + "learning_rate": 1.6007989830954553e-06, + "loss": 0.8936, + "step": 36988 + }, + { + "epoch": 0.95, + "learning_rate": 1.6007768631007705e-06, + "loss": 0.9678, + "step": 36989 + }, + { + "epoch": 0.95, + "learning_rate": 1.6007547426460987e-06, + "loss": 0.7598, + "step": 36990 + }, + { + "epoch": 0.95, + "learning_rate": 1.6007326217314562e-06, + "loss": 0.7393, + "step": 36991 + }, + { + "epoch": 0.95, + "learning_rate": 1.600710500356861e-06, + "loss": 0.8271, + "step": 36992 + }, + { + "epoch": 0.95, + "learning_rate": 1.6006883785223288e-06, + "loss": 0.9668, + "step": 36993 + }, + { + "epoch": 0.95, + "learning_rate": 1.6006662562278775e-06, + "loss": 0.6816, + "step": 36994 + }, + { + "epoch": 0.95, + "learning_rate": 1.6006441334735235e-06, + "loss": 0.8276, + "step": 36995 + }, + { + "epoch": 0.95, + "learning_rate": 1.600622010259284e-06, + "loss": 1.0215, + "step": 36996 + }, + { + "epoch": 0.95, + "learning_rate": 1.6005998865851757e-06, + "loss": 0.7607, + "step": 36997 + }, + { + "epoch": 0.95, + "learning_rate": 1.6005777624512157e-06, + "loss": 0.6421, + "step": 36998 + }, + { + "epoch": 0.95, + "learning_rate": 1.600555637857421e-06, + "loss": 0.7539, + "step": 36999 + }, + { + "epoch": 0.95, + "learning_rate": 1.6005335128038082e-06, + "loss": 0.8047, + "step": 37000 + }, + { + "epoch": 0.95, + "learning_rate": 1.6005113872903947e-06, + "loss": 0.7422, + "step": 37001 + }, + { + "epoch": 0.95, + "learning_rate": 1.6004892613171976e-06, + "loss": 0.7754, + "step": 37002 + }, + { + "epoch": 0.95, + "learning_rate": 1.6004671348842331e-06, + "loss": 0.8169, + "step": 37003 + }, + { + "epoch": 0.95, + "learning_rate": 1.6004450079915186e-06, + "loss": 0.7969, + "step": 37004 + }, + { + "epoch": 0.95, + "learning_rate": 1.6004228806390708e-06, + "loss": 0.7515, + "step": 37005 + }, + { + "epoch": 0.95, + "learning_rate": 1.600400752826907e-06, + "loss": 0.9072, + "step": 37006 + }, + { + "epoch": 0.95, + "learning_rate": 1.600378624555044e-06, + "loss": 0.8022, + "step": 37007 + }, + { + "epoch": 0.95, + "learning_rate": 1.6003564958234988e-06, + "loss": 0.7007, + "step": 37008 + }, + { + "epoch": 0.95, + "learning_rate": 1.600334366632288e-06, + "loss": 0.877, + "step": 37009 + }, + { + "epoch": 0.95, + "learning_rate": 1.6003122369814288e-06, + "loss": 0.9131, + "step": 37010 + }, + { + "epoch": 0.95, + "learning_rate": 1.600290106870938e-06, + "loss": 0.7988, + "step": 37011 + }, + { + "epoch": 0.95, + "learning_rate": 1.6002679763008331e-06, + "loss": 0.8706, + "step": 37012 + }, + { + "epoch": 0.95, + "learning_rate": 1.60024584527113e-06, + "loss": 0.9385, + "step": 37013 + }, + { + "epoch": 0.95, + "learning_rate": 1.6002237137818467e-06, + "loss": 0.959, + "step": 37014 + }, + { + "epoch": 0.95, + "learning_rate": 1.6002015818329998e-06, + "loss": 0.9014, + "step": 37015 + }, + { + "epoch": 0.95, + "learning_rate": 1.6001794494246058e-06, + "loss": 1.0156, + "step": 37016 + }, + { + "epoch": 0.95, + "learning_rate": 1.600157316556682e-06, + "loss": 0.9766, + "step": 37017 + }, + { + "epoch": 0.95, + "learning_rate": 1.6001351832292456e-06, + "loss": 0.7002, + "step": 37018 + }, + { + "epoch": 0.95, + "learning_rate": 1.6001130494423131e-06, + "loss": 0.8052, + "step": 37019 + }, + { + "epoch": 0.95, + "learning_rate": 1.6000909151959015e-06, + "loss": 0.9062, + "step": 37020 + }, + { + "epoch": 0.95, + "learning_rate": 1.6000687804900284e-06, + "loss": 0.6924, + "step": 37021 + }, + { + "epoch": 0.95, + "learning_rate": 1.60004664532471e-06, + "loss": 0.7876, + "step": 37022 + }, + { + "epoch": 0.95, + "learning_rate": 1.600024509699963e-06, + "loss": 0.6509, + "step": 37023 + }, + { + "epoch": 0.95, + "learning_rate": 1.6000023736158052e-06, + "loss": 1.0332, + "step": 37024 + }, + { + "epoch": 0.95, + "learning_rate": 1.5999802370722533e-06, + "loss": 0.9082, + "step": 37025 + }, + { + "epoch": 0.95, + "learning_rate": 1.599958100069324e-06, + "loss": 0.8169, + "step": 37026 + }, + { + "epoch": 0.95, + "learning_rate": 1.5999359626070343e-06, + "loss": 0.874, + "step": 37027 + }, + { + "epoch": 0.95, + "learning_rate": 1.5999138246854012e-06, + "loss": 0.8486, + "step": 37028 + }, + { + "epoch": 0.95, + "learning_rate": 1.5998916863044417e-06, + "loss": 0.6304, + "step": 37029 + }, + { + "epoch": 0.95, + "learning_rate": 1.5998695474641729e-06, + "loss": 0.7261, + "step": 37030 + }, + { + "epoch": 0.95, + "learning_rate": 1.5998474081646115e-06, + "loss": 0.8047, + "step": 37031 + }, + { + "epoch": 0.95, + "learning_rate": 1.5998252684057744e-06, + "loss": 1.1895, + "step": 37032 + }, + { + "epoch": 0.95, + "learning_rate": 1.5998031281876786e-06, + "loss": 0.6655, + "step": 37033 + }, + { + "epoch": 0.95, + "learning_rate": 1.5997809875103412e-06, + "loss": 1.0215, + "step": 37034 + }, + { + "epoch": 0.95, + "learning_rate": 1.599758846373779e-06, + "loss": 0.8398, + "step": 37035 + }, + { + "epoch": 0.95, + "learning_rate": 1.5997367047780094e-06, + "loss": 0.8027, + "step": 37036 + }, + { + "epoch": 0.95, + "learning_rate": 1.5997145627230487e-06, + "loss": 0.689, + "step": 37037 + }, + { + "epoch": 0.95, + "learning_rate": 1.599692420208914e-06, + "loss": 0.6787, + "step": 37038 + }, + { + "epoch": 0.95, + "learning_rate": 1.5996702772356225e-06, + "loss": 0.7278, + "step": 37039 + }, + { + "epoch": 0.95, + "learning_rate": 1.5996481338031913e-06, + "loss": 0.9404, + "step": 37040 + }, + { + "epoch": 0.95, + "learning_rate": 1.5996259899116366e-06, + "loss": 0.8789, + "step": 37041 + }, + { + "epoch": 0.95, + "learning_rate": 1.5996038455609763e-06, + "loss": 0.7661, + "step": 37042 + }, + { + "epoch": 0.95, + "learning_rate": 1.599581700751227e-06, + "loss": 1.2041, + "step": 37043 + }, + { + "epoch": 0.95, + "learning_rate": 1.599559555482405e-06, + "loss": 0.6016, + "step": 37044 + }, + { + "epoch": 0.95, + "learning_rate": 1.5995374097545282e-06, + "loss": 0.873, + "step": 37045 + }, + { + "epoch": 0.95, + "learning_rate": 1.599515263567613e-06, + "loss": 0.6299, + "step": 37046 + }, + { + "epoch": 0.95, + "learning_rate": 1.5994931169216768e-06, + "loss": 0.8477, + "step": 37047 + }, + { + "epoch": 0.95, + "learning_rate": 1.5994709698167362e-06, + "loss": 0.8955, + "step": 37048 + }, + { + "epoch": 0.95, + "learning_rate": 1.599448822252808e-06, + "loss": 0.7988, + "step": 37049 + }, + { + "epoch": 0.95, + "learning_rate": 1.5994266742299094e-06, + "loss": 0.769, + "step": 37050 + }, + { + "epoch": 0.95, + "learning_rate": 1.5994045257480577e-06, + "loss": 0.8877, + "step": 37051 + }, + { + "epoch": 0.95, + "learning_rate": 1.5993823768072693e-06, + "loss": 1.0166, + "step": 37052 + }, + { + "epoch": 0.95, + "learning_rate": 1.5993602274075615e-06, + "loss": 0.8066, + "step": 37053 + }, + { + "epoch": 0.95, + "learning_rate": 1.599338077548951e-06, + "loss": 1.042, + "step": 37054 + }, + { + "epoch": 0.95, + "learning_rate": 1.5993159272314549e-06, + "loss": 0.9238, + "step": 37055 + }, + { + "epoch": 0.95, + "learning_rate": 1.5992937764550902e-06, + "loss": 0.834, + "step": 37056 + }, + { + "epoch": 0.95, + "learning_rate": 1.5992716252198738e-06, + "loss": 0.6201, + "step": 37057 + }, + { + "epoch": 0.95, + "learning_rate": 1.5992494735258229e-06, + "loss": 1.1162, + "step": 37058 + }, + { + "epoch": 0.95, + "learning_rate": 1.5992273213729539e-06, + "loss": 1.1816, + "step": 37059 + }, + { + "epoch": 0.95, + "learning_rate": 1.599205168761284e-06, + "loss": 0.7622, + "step": 37060 + }, + { + "epoch": 0.95, + "learning_rate": 1.5991830156908303e-06, + "loss": 0.7979, + "step": 37061 + }, + { + "epoch": 0.95, + "learning_rate": 1.5991608621616098e-06, + "loss": 1.042, + "step": 37062 + }, + { + "epoch": 0.95, + "learning_rate": 1.5991387081736395e-06, + "loss": 1.0508, + "step": 37063 + }, + { + "epoch": 0.95, + "learning_rate": 1.5991165537269363e-06, + "loss": 0.75, + "step": 37064 + }, + { + "epoch": 0.95, + "learning_rate": 1.599094398821517e-06, + "loss": 0.8047, + "step": 37065 + }, + { + "epoch": 0.95, + "learning_rate": 1.5990722434573987e-06, + "loss": 0.9678, + "step": 37066 + }, + { + "epoch": 0.95, + "learning_rate": 1.5990500876345983e-06, + "loss": 0.8599, + "step": 37067 + }, + { + "epoch": 0.95, + "learning_rate": 1.5990279313531328e-06, + "loss": 0.8462, + "step": 37068 + }, + { + "epoch": 0.95, + "learning_rate": 1.599005774613019e-06, + "loss": 0.8213, + "step": 37069 + }, + { + "epoch": 0.95, + "learning_rate": 1.5989836174142743e-06, + "loss": 0.8555, + "step": 37070 + }, + { + "epoch": 0.95, + "learning_rate": 1.5989614597569151e-06, + "loss": 0.8359, + "step": 37071 + }, + { + "epoch": 0.95, + "learning_rate": 1.598939301640959e-06, + "loss": 0.7104, + "step": 37072 + }, + { + "epoch": 0.95, + "learning_rate": 1.5989171430664223e-06, + "loss": 1.0137, + "step": 37073 + }, + { + "epoch": 0.95, + "learning_rate": 1.5988949840333223e-06, + "loss": 0.9834, + "step": 37074 + }, + { + "epoch": 0.95, + "learning_rate": 1.598872824541676e-06, + "loss": 0.7461, + "step": 37075 + }, + { + "epoch": 0.95, + "learning_rate": 1.5988506645915005e-06, + "loss": 0.7051, + "step": 37076 + }, + { + "epoch": 0.95, + "learning_rate": 1.5988285041828125e-06, + "loss": 0.9482, + "step": 37077 + }, + { + "epoch": 0.95, + "learning_rate": 1.598806343315629e-06, + "loss": 0.832, + "step": 37078 + }, + { + "epoch": 0.95, + "learning_rate": 1.5987841819899667e-06, + "loss": 0.5952, + "step": 37079 + }, + { + "epoch": 0.95, + "learning_rate": 1.5987620202058433e-06, + "loss": 0.8564, + "step": 37080 + }, + { + "epoch": 0.95, + "learning_rate": 1.5987398579632752e-06, + "loss": 0.7583, + "step": 37081 + }, + { + "epoch": 0.95, + "learning_rate": 1.5987176952622797e-06, + "loss": 0.9424, + "step": 37082 + }, + { + "epoch": 0.95, + "learning_rate": 1.5986955321028733e-06, + "loss": 0.7251, + "step": 37083 + }, + { + "epoch": 0.95, + "learning_rate": 1.5986733684850735e-06, + "loss": 0.6357, + "step": 37084 + }, + { + "epoch": 0.95, + "learning_rate": 1.598651204408897e-06, + "loss": 0.9199, + "step": 37085 + }, + { + "epoch": 0.95, + "learning_rate": 1.5986290398743608e-06, + "loss": 0.9297, + "step": 37086 + }, + { + "epoch": 0.95, + "learning_rate": 1.5986068748814815e-06, + "loss": 0.9219, + "step": 37087 + }, + { + "epoch": 0.95, + "learning_rate": 1.5985847094302768e-06, + "loss": 0.7383, + "step": 37088 + }, + { + "epoch": 0.95, + "learning_rate": 1.5985625435207633e-06, + "loss": 0.9443, + "step": 37089 + }, + { + "epoch": 0.95, + "learning_rate": 1.598540377152958e-06, + "loss": 0.6147, + "step": 37090 + }, + { + "epoch": 0.95, + "learning_rate": 1.5985182103268779e-06, + "loss": 0.9521, + "step": 37091 + }, + { + "epoch": 0.95, + "learning_rate": 1.5984960430425399e-06, + "loss": 0.8701, + "step": 37092 + }, + { + "epoch": 0.95, + "learning_rate": 1.5984738752999606e-06, + "loss": 0.833, + "step": 37093 + }, + { + "epoch": 0.95, + "learning_rate": 1.5984517070991576e-06, + "loss": 0.8535, + "step": 37094 + }, + { + "epoch": 0.95, + "learning_rate": 1.5984295384401478e-06, + "loss": 0.918, + "step": 37095 + }, + { + "epoch": 0.95, + "learning_rate": 1.5984073693229482e-06, + "loss": 0.6934, + "step": 37096 + }, + { + "epoch": 0.95, + "learning_rate": 1.5983851997475752e-06, + "loss": 0.7241, + "step": 37097 + }, + { + "epoch": 0.95, + "learning_rate": 1.5983630297140465e-06, + "loss": 0.9395, + "step": 37098 + }, + { + "epoch": 0.95, + "learning_rate": 1.5983408592223784e-06, + "loss": 0.7456, + "step": 37099 + }, + { + "epoch": 0.95, + "learning_rate": 1.5983186882725886e-06, + "loss": 0.835, + "step": 37100 + }, + { + "epoch": 0.95, + "learning_rate": 1.5982965168646937e-06, + "loss": 0.8369, + "step": 37101 + }, + { + "epoch": 0.95, + "learning_rate": 1.5982743449987102e-06, + "loss": 0.7739, + "step": 37102 + }, + { + "epoch": 0.95, + "learning_rate": 1.5982521726746558e-06, + "loss": 0.9814, + "step": 37103 + }, + { + "epoch": 0.95, + "learning_rate": 1.598229999892547e-06, + "loss": 0.9023, + "step": 37104 + }, + { + "epoch": 0.95, + "learning_rate": 1.5982078266524013e-06, + "loss": 0.873, + "step": 37105 + }, + { + "epoch": 0.95, + "learning_rate": 1.5981856529542352e-06, + "loss": 0.8838, + "step": 37106 + }, + { + "epoch": 0.95, + "learning_rate": 1.598163478798066e-06, + "loss": 0.7344, + "step": 37107 + }, + { + "epoch": 0.95, + "learning_rate": 1.5981413041839104e-06, + "loss": 0.7852, + "step": 37108 + }, + { + "epoch": 0.95, + "learning_rate": 1.5981191291117855e-06, + "loss": 0.8066, + "step": 37109 + }, + { + "epoch": 0.95, + "learning_rate": 1.5980969535817082e-06, + "loss": 0.8682, + "step": 37110 + }, + { + "epoch": 0.95, + "learning_rate": 1.598074777593696e-06, + "loss": 0.9473, + "step": 37111 + }, + { + "epoch": 0.95, + "learning_rate": 1.598052601147765e-06, + "loss": 0.8481, + "step": 37112 + }, + { + "epoch": 0.95, + "learning_rate": 1.5980304242439328e-06, + "loss": 0.75, + "step": 37113 + }, + { + "epoch": 0.95, + "learning_rate": 1.598008246882216e-06, + "loss": 0.8418, + "step": 37114 + }, + { + "epoch": 0.95, + "learning_rate": 1.5979860690626321e-06, + "loss": 0.9307, + "step": 37115 + }, + { + "epoch": 0.95, + "learning_rate": 1.5979638907851977e-06, + "loss": 0.9287, + "step": 37116 + }, + { + "epoch": 0.95, + "learning_rate": 1.5979417120499297e-06, + "loss": 0.916, + "step": 37117 + }, + { + "epoch": 0.95, + "learning_rate": 1.5979195328568453e-06, + "loss": 0.8252, + "step": 37118 + }, + { + "epoch": 0.95, + "learning_rate": 1.5978973532059614e-06, + "loss": 1.0967, + "step": 37119 + }, + { + "epoch": 0.95, + "learning_rate": 1.5978751730972949e-06, + "loss": 0.8525, + "step": 37120 + }, + { + "epoch": 0.95, + "learning_rate": 1.5978529925308632e-06, + "loss": 0.7773, + "step": 37121 + }, + { + "epoch": 0.95, + "learning_rate": 1.5978308115066827e-06, + "loss": 0.9463, + "step": 37122 + }, + { + "epoch": 0.95, + "learning_rate": 1.5978086300247706e-06, + "loss": 0.9834, + "step": 37123 + }, + { + "epoch": 0.95, + "learning_rate": 1.5977864480851437e-06, + "loss": 0.6812, + "step": 37124 + }, + { + "epoch": 0.95, + "learning_rate": 1.5977642656878196e-06, + "loss": 0.7002, + "step": 37125 + }, + { + "epoch": 0.95, + "learning_rate": 1.5977420828328148e-06, + "loss": 0.9062, + "step": 37126 + }, + { + "epoch": 0.95, + "learning_rate": 1.5977198995201465e-06, + "loss": 0.9482, + "step": 37127 + }, + { + "epoch": 0.95, + "learning_rate": 1.5976977157498313e-06, + "loss": 0.718, + "step": 37128 + }, + { + "epoch": 0.95, + "learning_rate": 1.5976755315218865e-06, + "loss": 1.0684, + "step": 37129 + }, + { + "epoch": 0.95, + "learning_rate": 1.597653346836329e-06, + "loss": 0.8184, + "step": 37130 + }, + { + "epoch": 0.95, + "learning_rate": 1.597631161693176e-06, + "loss": 0.7246, + "step": 37131 + }, + { + "epoch": 0.95, + "learning_rate": 1.597608976092444e-06, + "loss": 0.7656, + "step": 37132 + }, + { + "epoch": 0.95, + "learning_rate": 1.5975867900341504e-06, + "loss": 0.8105, + "step": 37133 + }, + { + "epoch": 0.95, + "learning_rate": 1.5975646035183122e-06, + "loss": 0.8145, + "step": 37134 + }, + { + "epoch": 0.95, + "learning_rate": 1.5975424165449461e-06, + "loss": 0.5356, + "step": 37135 + }, + { + "epoch": 0.95, + "learning_rate": 1.5975202291140695e-06, + "loss": 0.6787, + "step": 37136 + }, + { + "epoch": 0.95, + "learning_rate": 1.5974980412256989e-06, + "loss": 0.6382, + "step": 37137 + }, + { + "epoch": 0.95, + "learning_rate": 1.5974758528798515e-06, + "loss": 0.7588, + "step": 37138 + }, + { + "epoch": 0.95, + "learning_rate": 1.5974536640765445e-06, + "loss": 0.9482, + "step": 37139 + }, + { + "epoch": 0.95, + "learning_rate": 1.5974314748157944e-06, + "loss": 0.7539, + "step": 37140 + }, + { + "epoch": 0.95, + "learning_rate": 1.5974092850976191e-06, + "loss": 0.8418, + "step": 37141 + }, + { + "epoch": 0.95, + "learning_rate": 1.5973870949220345e-06, + "loss": 1.082, + "step": 37142 + }, + { + "epoch": 0.95, + "learning_rate": 1.597364904289058e-06, + "loss": 0.8203, + "step": 37143 + }, + { + "epoch": 0.95, + "learning_rate": 1.5973427131987067e-06, + "loss": 0.8438, + "step": 37144 + }, + { + "epoch": 0.95, + "learning_rate": 1.5973205216509977e-06, + "loss": 1.0293, + "step": 37145 + }, + { + "epoch": 0.95, + "learning_rate": 1.5972983296459479e-06, + "loss": 0.5304, + "step": 37146 + }, + { + "epoch": 0.95, + "learning_rate": 1.5972761371835742e-06, + "loss": 0.9385, + "step": 37147 + }, + { + "epoch": 0.95, + "learning_rate": 1.5972539442638935e-06, + "loss": 0.9756, + "step": 37148 + }, + { + "epoch": 0.95, + "learning_rate": 1.5972317508869228e-06, + "loss": 0.8184, + "step": 37149 + }, + { + "epoch": 0.95, + "learning_rate": 1.5972095570526793e-06, + "loss": 0.6255, + "step": 37150 + }, + { + "epoch": 0.95, + "learning_rate": 1.59718736276118e-06, + "loss": 0.9795, + "step": 37151 + }, + { + "epoch": 0.95, + "learning_rate": 1.597165168012442e-06, + "loss": 0.5879, + "step": 37152 + }, + { + "epoch": 0.95, + "learning_rate": 1.5971429728064818e-06, + "loss": 0.8945, + "step": 37153 + }, + { + "epoch": 0.95, + "learning_rate": 1.5971207771433167e-06, + "loss": 0.9209, + "step": 37154 + }, + { + "epoch": 0.95, + "learning_rate": 1.5970985810229639e-06, + "loss": 0.8955, + "step": 37155 + }, + { + "epoch": 0.95, + "learning_rate": 1.5970763844454398e-06, + "loss": 0.9131, + "step": 37156 + }, + { + "epoch": 0.95, + "learning_rate": 1.597054187410762e-06, + "loss": 0.9009, + "step": 37157 + }, + { + "epoch": 0.95, + "learning_rate": 1.5970319899189473e-06, + "loss": 0.7939, + "step": 37158 + }, + { + "epoch": 0.95, + "learning_rate": 1.5970097919700126e-06, + "loss": 0.7383, + "step": 37159 + }, + { + "epoch": 0.95, + "learning_rate": 1.5969875935639748e-06, + "loss": 0.8682, + "step": 37160 + }, + { + "epoch": 0.95, + "learning_rate": 1.5969653947008515e-06, + "loss": 0.7432, + "step": 37161 + }, + { + "epoch": 0.95, + "learning_rate": 1.5969431953806587e-06, + "loss": 0.9229, + "step": 37162 + }, + { + "epoch": 0.95, + "learning_rate": 1.5969209956034141e-06, + "loss": 0.8525, + "step": 37163 + }, + { + "epoch": 0.95, + "learning_rate": 1.596898795369135e-06, + "loss": 1.0098, + "step": 37164 + }, + { + "epoch": 0.95, + "learning_rate": 1.5968765946778374e-06, + "loss": 1.001, + "step": 37165 + }, + { + "epoch": 0.95, + "learning_rate": 1.5968543935295391e-06, + "loss": 0.9043, + "step": 37166 + }, + { + "epoch": 0.95, + "learning_rate": 1.5968321919242564e-06, + "loss": 0.8594, + "step": 37167 + }, + { + "epoch": 0.95, + "learning_rate": 1.5968099898620072e-06, + "loss": 0.8125, + "step": 37168 + }, + { + "epoch": 0.95, + "learning_rate": 1.596787787342808e-06, + "loss": 0.5669, + "step": 37169 + }, + { + "epoch": 0.95, + "learning_rate": 1.5967655843666757e-06, + "loss": 1.0059, + "step": 37170 + }, + { + "epoch": 0.95, + "learning_rate": 1.5967433809336276e-06, + "loss": 0.9248, + "step": 37171 + }, + { + "epoch": 0.95, + "learning_rate": 1.5967211770436802e-06, + "loss": 0.647, + "step": 37172 + }, + { + "epoch": 0.95, + "learning_rate": 1.596698972696851e-06, + "loss": 1.083, + "step": 37173 + }, + { + "epoch": 0.95, + "learning_rate": 1.596676767893157e-06, + "loss": 0.833, + "step": 37174 + }, + { + "epoch": 0.95, + "learning_rate": 1.5966545626326146e-06, + "loss": 0.876, + "step": 37175 + }, + { + "epoch": 0.95, + "learning_rate": 1.5966323569152417e-06, + "loss": 0.8779, + "step": 37176 + }, + { + "epoch": 0.95, + "learning_rate": 1.5966101507410548e-06, + "loss": 0.8057, + "step": 37177 + }, + { + "epoch": 0.95, + "learning_rate": 1.5965879441100706e-06, + "loss": 0.8691, + "step": 37178 + }, + { + "epoch": 0.95, + "learning_rate": 1.5965657370223066e-06, + "loss": 0.75, + "step": 37179 + }, + { + "epoch": 0.95, + "learning_rate": 1.5965435294777799e-06, + "loss": 0.6716, + "step": 37180 + }, + { + "epoch": 0.95, + "learning_rate": 1.596521321476507e-06, + "loss": 0.6445, + "step": 37181 + }, + { + "epoch": 0.95, + "learning_rate": 1.5964991130185053e-06, + "loss": 0.9414, + "step": 37182 + }, + { + "epoch": 0.95, + "learning_rate": 1.5964769041037913e-06, + "loss": 1.168, + "step": 37183 + }, + { + "epoch": 0.95, + "learning_rate": 1.5964546947323827e-06, + "loss": 0.9268, + "step": 37184 + }, + { + "epoch": 0.95, + "learning_rate": 1.5964324849042964e-06, + "loss": 0.7979, + "step": 37185 + }, + { + "epoch": 0.95, + "learning_rate": 1.5964102746195488e-06, + "loss": 0.7788, + "step": 37186 + }, + { + "epoch": 0.95, + "learning_rate": 1.5963880638781573e-06, + "loss": 0.8701, + "step": 37187 + }, + { + "epoch": 0.95, + "learning_rate": 1.596365852680139e-06, + "loss": 1.1035, + "step": 37188 + }, + { + "epoch": 0.95, + "learning_rate": 1.5963436410255104e-06, + "loss": 0.5938, + "step": 37189 + }, + { + "epoch": 0.95, + "learning_rate": 1.5963214289142891e-06, + "loss": 0.9238, + "step": 37190 + }, + { + "epoch": 0.95, + "learning_rate": 1.5962992163464924e-06, + "loss": 0.9229, + "step": 37191 + }, + { + "epoch": 0.95, + "learning_rate": 1.5962770033221363e-06, + "loss": 0.9536, + "step": 37192 + }, + { + "epoch": 0.95, + "learning_rate": 1.5962547898412385e-06, + "loss": 0.9111, + "step": 37193 + }, + { + "epoch": 0.95, + "learning_rate": 1.5962325759038155e-06, + "loss": 1.0059, + "step": 37194 + }, + { + "epoch": 0.95, + "learning_rate": 1.5962103615098849e-06, + "loss": 0.8496, + "step": 37195 + }, + { + "epoch": 0.95, + "learning_rate": 1.5961881466594635e-06, + "loss": 0.7549, + "step": 37196 + }, + { + "epoch": 0.95, + "learning_rate": 1.5961659313525682e-06, + "loss": 0.8086, + "step": 37197 + }, + { + "epoch": 0.95, + "learning_rate": 1.596143715589216e-06, + "loss": 1.0557, + "step": 37198 + }, + { + "epoch": 0.95, + "learning_rate": 1.5961214993694241e-06, + "loss": 0.8398, + "step": 37199 + }, + { + "epoch": 0.95, + "learning_rate": 1.596099282693209e-06, + "loss": 0.9375, + "step": 37200 + }, + { + "epoch": 0.95, + "learning_rate": 1.5960770655605886e-06, + "loss": 0.8926, + "step": 37201 + }, + { + "epoch": 0.95, + "learning_rate": 1.5960548479715793e-06, + "loss": 0.8994, + "step": 37202 + }, + { + "epoch": 0.95, + "learning_rate": 1.5960326299261979e-06, + "loss": 0.8057, + "step": 37203 + }, + { + "epoch": 0.95, + "learning_rate": 1.5960104114244618e-06, + "loss": 0.8926, + "step": 37204 + }, + { + "epoch": 0.95, + "learning_rate": 1.595988192466388e-06, + "loss": 0.8496, + "step": 37205 + }, + { + "epoch": 0.95, + "learning_rate": 1.5959659730519936e-06, + "loss": 0.6543, + "step": 37206 + }, + { + "epoch": 0.95, + "learning_rate": 1.5959437531812954e-06, + "loss": 0.564, + "step": 37207 + }, + { + "epoch": 0.95, + "learning_rate": 1.5959215328543102e-06, + "loss": 0.999, + "step": 37208 + }, + { + "epoch": 0.95, + "learning_rate": 1.5958993120710556e-06, + "loss": 0.4927, + "step": 37209 + }, + { + "epoch": 0.95, + "learning_rate": 1.5958770908315483e-06, + "loss": 0.835, + "step": 37210 + }, + { + "epoch": 0.95, + "learning_rate": 1.5958548691358051e-06, + "loss": 0.6656, + "step": 37211 + }, + { + "epoch": 0.95, + "learning_rate": 1.5958326469838435e-06, + "loss": 0.6572, + "step": 37212 + }, + { + "epoch": 0.95, + "learning_rate": 1.59581042437568e-06, + "loss": 0.7925, + "step": 37213 + }, + { + "epoch": 0.95, + "learning_rate": 1.5957882013113317e-06, + "loss": 0.7107, + "step": 37214 + }, + { + "epoch": 0.95, + "learning_rate": 1.595765977790816e-06, + "loss": 0.7688, + "step": 37215 + }, + { + "epoch": 0.95, + "learning_rate": 1.5957437538141499e-06, + "loss": 0.9424, + "step": 37216 + }, + { + "epoch": 0.95, + "learning_rate": 1.59572152938135e-06, + "loss": 0.6423, + "step": 37217 + }, + { + "epoch": 0.95, + "learning_rate": 1.5956993044924334e-06, + "loss": 0.8887, + "step": 37218 + }, + { + "epoch": 0.95, + "learning_rate": 1.5956770791474172e-06, + "loss": 0.8086, + "step": 37219 + }, + { + "epoch": 0.95, + "learning_rate": 1.5956548533463186e-06, + "loss": 0.8682, + "step": 37220 + }, + { + "epoch": 0.95, + "learning_rate": 1.5956326270891546e-06, + "loss": 0.6792, + "step": 37221 + }, + { + "epoch": 0.95, + "learning_rate": 1.5956104003759419e-06, + "loss": 0.7715, + "step": 37222 + }, + { + "epoch": 0.95, + "learning_rate": 1.5955881732066976e-06, + "loss": 0.9561, + "step": 37223 + }, + { + "epoch": 0.95, + "learning_rate": 1.595565945581439e-06, + "loss": 0.8311, + "step": 37224 + }, + { + "epoch": 0.95, + "learning_rate": 1.5955437175001826e-06, + "loss": 0.7793, + "step": 37225 + }, + { + "epoch": 0.95, + "learning_rate": 1.5955214889629463e-06, + "loss": 0.9053, + "step": 37226 + }, + { + "epoch": 0.95, + "learning_rate": 1.5954992599697464e-06, + "loss": 0.918, + "step": 37227 + }, + { + "epoch": 0.95, + "learning_rate": 1.5954770305206e-06, + "loss": 0.8301, + "step": 37228 + }, + { + "epoch": 0.95, + "learning_rate": 1.5954548006155242e-06, + "loss": 0.917, + "step": 37229 + }, + { + "epoch": 0.95, + "learning_rate": 1.595432570254536e-06, + "loss": 0.8105, + "step": 37230 + }, + { + "epoch": 0.95, + "learning_rate": 1.5954103394376527e-06, + "loss": 0.9473, + "step": 37231 + }, + { + "epoch": 0.95, + "learning_rate": 1.595388108164891e-06, + "loss": 0.918, + "step": 37232 + }, + { + "epoch": 0.95, + "learning_rate": 1.5953658764362676e-06, + "loss": 0.7539, + "step": 37233 + }, + { + "epoch": 0.95, + "learning_rate": 1.5953436442518004e-06, + "loss": 0.9297, + "step": 37234 + }, + { + "epoch": 0.95, + "learning_rate": 1.5953214116115058e-06, + "loss": 0.8174, + "step": 37235 + }, + { + "epoch": 0.95, + "learning_rate": 1.595299178515401e-06, + "loss": 0.7363, + "step": 37236 + }, + { + "epoch": 0.95, + "learning_rate": 1.5952769449635032e-06, + "loss": 0.8145, + "step": 37237 + }, + { + "epoch": 0.95, + "learning_rate": 1.5952547109558284e-06, + "loss": 0.6501, + "step": 37238 + }, + { + "epoch": 0.95, + "learning_rate": 1.5952324764923951e-06, + "loss": 0.9141, + "step": 37239 + }, + { + "epoch": 0.95, + "learning_rate": 1.5952102415732198e-06, + "loss": 0.9619, + "step": 37240 + }, + { + "epoch": 0.95, + "learning_rate": 1.5951880061983189e-06, + "loss": 0.915, + "step": 37241 + }, + { + "epoch": 0.95, + "learning_rate": 1.5951657703677105e-06, + "loss": 0.5903, + "step": 37242 + }, + { + "epoch": 0.95, + "learning_rate": 1.5951435340814106e-06, + "loss": 0.917, + "step": 37243 + }, + { + "epoch": 0.95, + "learning_rate": 1.5951212973394369e-06, + "loss": 0.9287, + "step": 37244 + }, + { + "epoch": 0.95, + "learning_rate": 1.5950990601418058e-06, + "loss": 0.7393, + "step": 37245 + }, + { + "epoch": 0.95, + "learning_rate": 1.5950768224885351e-06, + "loss": 0.9551, + "step": 37246 + }, + { + "epoch": 0.95, + "learning_rate": 1.5950545843796412e-06, + "loss": 0.8105, + "step": 37247 + }, + { + "epoch": 0.95, + "learning_rate": 1.5950323458151416e-06, + "loss": 0.7256, + "step": 37248 + }, + { + "epoch": 0.95, + "learning_rate": 1.595010106795053e-06, + "loss": 0.8789, + "step": 37249 + }, + { + "epoch": 0.95, + "learning_rate": 1.5949878673193923e-06, + "loss": 0.8296, + "step": 37250 + }, + { + "epoch": 0.95, + "learning_rate": 1.5949656273881771e-06, + "loss": 0.7139, + "step": 37251 + }, + { + "epoch": 0.95, + "learning_rate": 1.594943387001424e-06, + "loss": 0.917, + "step": 37252 + }, + { + "epoch": 0.95, + "learning_rate": 1.5949211461591499e-06, + "loss": 0.576, + "step": 37253 + }, + { + "epoch": 0.95, + "learning_rate": 1.5948989048613722e-06, + "loss": 0.7783, + "step": 37254 + }, + { + "epoch": 0.95, + "learning_rate": 1.5948766631081076e-06, + "loss": 0.5884, + "step": 37255 + }, + { + "epoch": 0.95, + "learning_rate": 1.5948544208993735e-06, + "loss": 0.8838, + "step": 37256 + }, + { + "epoch": 0.95, + "learning_rate": 1.5948321782351865e-06, + "loss": 0.9141, + "step": 37257 + }, + { + "epoch": 0.95, + "learning_rate": 1.5948099351155642e-06, + "loss": 0.8711, + "step": 37258 + }, + { + "epoch": 0.95, + "learning_rate": 1.5947876915405227e-06, + "loss": 0.8408, + "step": 37259 + }, + { + "epoch": 0.95, + "learning_rate": 1.59476544751008e-06, + "loss": 0.6919, + "step": 37260 + }, + { + "epoch": 0.96, + "learning_rate": 1.5947432030242527e-06, + "loss": 0.9492, + "step": 37261 + }, + { + "epoch": 0.96, + "learning_rate": 1.594720958083058e-06, + "loss": 0.9912, + "step": 37262 + }, + { + "epoch": 0.96, + "learning_rate": 1.5946987126865125e-06, + "loss": 0.8164, + "step": 37263 + }, + { + "epoch": 0.96, + "learning_rate": 1.594676466834634e-06, + "loss": 0.812, + "step": 37264 + }, + { + "epoch": 0.96, + "learning_rate": 1.5946542205274386e-06, + "loss": 0.8447, + "step": 37265 + }, + { + "epoch": 0.96, + "learning_rate": 1.5946319737649442e-06, + "loss": 0.9053, + "step": 37266 + }, + { + "epoch": 0.96, + "learning_rate": 1.5946097265471675e-06, + "loss": 0.8218, + "step": 37267 + }, + { + "epoch": 0.96, + "learning_rate": 1.594587478874125e-06, + "loss": 0.9287, + "step": 37268 + }, + { + "epoch": 0.96, + "learning_rate": 1.5945652307458343e-06, + "loss": 1.0342, + "step": 37269 + }, + { + "epoch": 0.96, + "learning_rate": 1.5945429821623125e-06, + "loss": 1.0381, + "step": 37270 + }, + { + "epoch": 0.96, + "learning_rate": 1.5945207331235767e-06, + "loss": 0.7769, + "step": 37271 + }, + { + "epoch": 0.96, + "learning_rate": 1.5944984836296433e-06, + "loss": 0.6562, + "step": 37272 + }, + { + "epoch": 0.96, + "learning_rate": 1.59447623368053e-06, + "loss": 1.0039, + "step": 37273 + }, + { + "epoch": 0.96, + "learning_rate": 1.5944539832762534e-06, + "loss": 0.8252, + "step": 37274 + }, + { + "epoch": 0.96, + "learning_rate": 1.594431732416831e-06, + "loss": 0.8516, + "step": 37275 + }, + { + "epoch": 0.96, + "learning_rate": 1.5944094811022796e-06, + "loss": 0.4946, + "step": 37276 + }, + { + "epoch": 0.96, + "learning_rate": 1.5943872293326157e-06, + "loss": 1.1133, + "step": 37277 + }, + { + "epoch": 0.96, + "learning_rate": 1.5943649771078572e-06, + "loss": 0.8682, + "step": 37278 + }, + { + "epoch": 0.96, + "learning_rate": 1.5943427244280205e-06, + "loss": 0.9902, + "step": 37279 + }, + { + "epoch": 0.96, + "learning_rate": 1.5943204712931231e-06, + "loss": 0.7974, + "step": 37280 + }, + { + "epoch": 0.96, + "learning_rate": 1.5942982177031819e-06, + "loss": 0.8027, + "step": 37281 + }, + { + "epoch": 0.96, + "learning_rate": 1.5942759636582137e-06, + "loss": 0.7178, + "step": 37282 + }, + { + "epoch": 0.96, + "learning_rate": 1.5942537091582357e-06, + "loss": 0.9399, + "step": 37283 + }, + { + "epoch": 0.96, + "learning_rate": 1.5942314542032653e-06, + "loss": 1.0176, + "step": 37284 + }, + { + "epoch": 0.96, + "learning_rate": 1.5942091987933188e-06, + "loss": 0.9492, + "step": 37285 + }, + { + "epoch": 0.96, + "learning_rate": 1.5941869429284137e-06, + "loss": 0.8086, + "step": 37286 + }, + { + "epoch": 0.96, + "learning_rate": 1.5941646866085675e-06, + "loss": 0.9375, + "step": 37287 + }, + { + "epoch": 0.96, + "learning_rate": 1.594142429833796e-06, + "loss": 0.79, + "step": 37288 + }, + { + "epoch": 0.96, + "learning_rate": 1.5941201726041173e-06, + "loss": 0.7012, + "step": 37289 + }, + { + "epoch": 0.96, + "learning_rate": 1.5940979149195482e-06, + "loss": 1.0664, + "step": 37290 + }, + { + "epoch": 0.96, + "learning_rate": 1.5940756567801054e-06, + "loss": 0.9443, + "step": 37291 + }, + { + "epoch": 0.96, + "learning_rate": 1.5940533981858063e-06, + "loss": 0.9932, + "step": 37292 + }, + { + "epoch": 0.96, + "learning_rate": 1.5940311391366678e-06, + "loss": 0.8779, + "step": 37293 + }, + { + "epoch": 0.96, + "learning_rate": 1.5940088796327072e-06, + "loss": 0.8008, + "step": 37294 + }, + { + "epoch": 0.96, + "learning_rate": 1.5939866196739409e-06, + "loss": 0.8369, + "step": 37295 + }, + { + "epoch": 0.96, + "learning_rate": 1.593964359260387e-06, + "loss": 0.6633, + "step": 37296 + }, + { + "epoch": 0.96, + "learning_rate": 1.5939420983920612e-06, + "loss": 0.4458, + "step": 37297 + }, + { + "epoch": 0.96, + "learning_rate": 1.5939198370689815e-06, + "loss": 0.8174, + "step": 37298 + }, + { + "epoch": 0.96, + "learning_rate": 1.5938975752911645e-06, + "loss": 0.8379, + "step": 37299 + }, + { + "epoch": 0.96, + "learning_rate": 1.5938753130586278e-06, + "loss": 0.5981, + "step": 37300 + }, + { + "epoch": 0.96, + "learning_rate": 1.593853050371388e-06, + "loss": 0.9062, + "step": 37301 + }, + { + "epoch": 0.96, + "learning_rate": 1.5938307872294621e-06, + "loss": 0.957, + "step": 37302 + }, + { + "epoch": 0.96, + "learning_rate": 1.5938085236328674e-06, + "loss": 0.8857, + "step": 37303 + }, + { + "epoch": 0.96, + "learning_rate": 1.5937862595816208e-06, + "loss": 0.917, + "step": 37304 + }, + { + "epoch": 0.96, + "learning_rate": 1.5937639950757392e-06, + "loss": 0.6182, + "step": 37305 + }, + { + "epoch": 0.96, + "learning_rate": 1.5937417301152397e-06, + "loss": 0.9746, + "step": 37306 + }, + { + "epoch": 0.96, + "learning_rate": 1.5937194647001398e-06, + "loss": 0.7461, + "step": 37307 + }, + { + "epoch": 0.96, + "learning_rate": 1.5936971988304562e-06, + "loss": 0.9453, + "step": 37308 + }, + { + "epoch": 0.96, + "learning_rate": 1.5936749325062055e-06, + "loss": 0.7861, + "step": 37309 + }, + { + "epoch": 0.96, + "learning_rate": 1.5936526657274056e-06, + "loss": 0.9629, + "step": 37310 + }, + { + "epoch": 0.96, + "learning_rate": 1.5936303984940733e-06, + "loss": 0.7183, + "step": 37311 + }, + { + "epoch": 0.96, + "learning_rate": 1.5936081308062252e-06, + "loss": 0.8442, + "step": 37312 + }, + { + "epoch": 0.96, + "learning_rate": 1.5935858626638786e-06, + "loss": 0.9385, + "step": 37313 + }, + { + "epoch": 0.96, + "learning_rate": 1.5935635940670506e-06, + "loss": 1.0225, + "step": 37314 + }, + { + "epoch": 0.96, + "learning_rate": 1.5935413250157586e-06, + "loss": 1.042, + "step": 37315 + }, + { + "epoch": 0.96, + "learning_rate": 1.5935190555100193e-06, + "loss": 0.7207, + "step": 37316 + }, + { + "epoch": 0.96, + "learning_rate": 1.5934967855498493e-06, + "loss": 0.9736, + "step": 37317 + }, + { + "epoch": 0.96, + "learning_rate": 1.5934745151352664e-06, + "loss": 0.9844, + "step": 37318 + }, + { + "epoch": 0.96, + "learning_rate": 1.5934522442662873e-06, + "loss": 0.9561, + "step": 37319 + }, + { + "epoch": 0.96, + "learning_rate": 1.593429972942929e-06, + "loss": 0.7617, + "step": 37320 + }, + { + "epoch": 0.96, + "learning_rate": 1.5934077011652089e-06, + "loss": 0.7676, + "step": 37321 + }, + { + "epoch": 0.96, + "learning_rate": 1.5933854289331437e-06, + "loss": 0.6304, + "step": 37322 + }, + { + "epoch": 0.96, + "learning_rate": 1.5933631562467503e-06, + "loss": 0.7363, + "step": 37323 + }, + { + "epoch": 0.96, + "learning_rate": 1.5933408831060464e-06, + "loss": 0.7871, + "step": 37324 + }, + { + "epoch": 0.96, + "learning_rate": 1.5933186095110483e-06, + "loss": 0.793, + "step": 37325 + }, + { + "epoch": 0.96, + "learning_rate": 1.593296335461774e-06, + "loss": 0.5431, + "step": 37326 + }, + { + "epoch": 0.96, + "learning_rate": 1.5932740609582393e-06, + "loss": 0.9307, + "step": 37327 + }, + { + "epoch": 0.96, + "learning_rate": 1.5932517860004623e-06, + "loss": 0.5278, + "step": 37328 + }, + { + "epoch": 0.96, + "learning_rate": 1.5932295105884594e-06, + "loss": 0.7773, + "step": 37329 + }, + { + "epoch": 0.96, + "learning_rate": 1.5932072347222483e-06, + "loss": 0.5449, + "step": 37330 + }, + { + "epoch": 0.96, + "learning_rate": 1.5931849584018455e-06, + "loss": 0.9941, + "step": 37331 + }, + { + "epoch": 0.96, + "learning_rate": 1.5931626816272682e-06, + "loss": 0.6484, + "step": 37332 + }, + { + "epoch": 0.96, + "learning_rate": 1.5931404043985337e-06, + "loss": 0.6228, + "step": 37333 + }, + { + "epoch": 0.96, + "learning_rate": 1.5931181267156587e-06, + "loss": 0.9082, + "step": 37334 + }, + { + "epoch": 0.96, + "learning_rate": 1.5930958485786605e-06, + "loss": 0.8457, + "step": 37335 + }, + { + "epoch": 0.96, + "learning_rate": 1.5930735699875561e-06, + "loss": 0.9775, + "step": 37336 + }, + { + "epoch": 0.96, + "learning_rate": 1.5930512909423626e-06, + "loss": 0.8398, + "step": 37337 + }, + { + "epoch": 0.96, + "learning_rate": 1.593029011443097e-06, + "loss": 0.9014, + "step": 37338 + }, + { + "epoch": 0.96, + "learning_rate": 1.5930067314897763e-06, + "loss": 0.7773, + "step": 37339 + }, + { + "epoch": 0.96, + "learning_rate": 1.5929844510824174e-06, + "loss": 0.7656, + "step": 37340 + }, + { + "epoch": 0.96, + "learning_rate": 1.5929621702210381e-06, + "loss": 0.875, + "step": 37341 + }, + { + "epoch": 0.96, + "learning_rate": 1.5929398889056543e-06, + "loss": 0.8115, + "step": 37342 + }, + { + "epoch": 0.96, + "learning_rate": 1.592917607136284e-06, + "loss": 0.7126, + "step": 37343 + }, + { + "epoch": 0.96, + "learning_rate": 1.592895324912944e-06, + "loss": 0.8389, + "step": 37344 + }, + { + "epoch": 0.96, + "learning_rate": 1.5928730422356512e-06, + "loss": 1.0068, + "step": 37345 + }, + { + "epoch": 0.96, + "learning_rate": 1.5928507591044229e-06, + "loss": 0.8906, + "step": 37346 + }, + { + "epoch": 0.96, + "learning_rate": 1.5928284755192757e-06, + "loss": 0.7285, + "step": 37347 + }, + { + "epoch": 0.96, + "learning_rate": 1.5928061914802276e-06, + "loss": 0.6089, + "step": 37348 + }, + { + "epoch": 0.96, + "learning_rate": 1.5927839069872943e-06, + "loss": 0.8047, + "step": 37349 + }, + { + "epoch": 0.96, + "learning_rate": 1.592761622040494e-06, + "loss": 0.6064, + "step": 37350 + }, + { + "epoch": 0.96, + "learning_rate": 1.5927393366398436e-06, + "loss": 1.0625, + "step": 37351 + }, + { + "epoch": 0.96, + "learning_rate": 1.5927170507853599e-06, + "loss": 0.7812, + "step": 37352 + }, + { + "epoch": 0.96, + "learning_rate": 1.5926947644770596e-06, + "loss": 0.8623, + "step": 37353 + }, + { + "epoch": 0.96, + "learning_rate": 1.5926724777149604e-06, + "loss": 0.9648, + "step": 37354 + }, + { + "epoch": 0.96, + "learning_rate": 1.5926501904990792e-06, + "loss": 0.6694, + "step": 37355 + }, + { + "epoch": 0.96, + "learning_rate": 1.592627902829433e-06, + "loss": 1.0342, + "step": 37356 + }, + { + "epoch": 0.96, + "learning_rate": 1.5926056147060386e-06, + "loss": 0.8418, + "step": 37357 + }, + { + "epoch": 0.96, + "learning_rate": 1.5925833261289138e-06, + "loss": 0.9463, + "step": 37358 + }, + { + "epoch": 0.96, + "learning_rate": 1.5925610370980748e-06, + "loss": 1.0205, + "step": 37359 + }, + { + "epoch": 0.96, + "learning_rate": 1.5925387476135393e-06, + "loss": 0.9375, + "step": 37360 + }, + { + "epoch": 0.96, + "learning_rate": 1.592516457675324e-06, + "loss": 0.6074, + "step": 37361 + }, + { + "epoch": 0.96, + "learning_rate": 1.5924941672834461e-06, + "loss": 0.7803, + "step": 37362 + }, + { + "epoch": 0.96, + "learning_rate": 1.5924718764379229e-06, + "loss": 0.7725, + "step": 37363 + }, + { + "epoch": 0.96, + "learning_rate": 1.5924495851387709e-06, + "loss": 0.9229, + "step": 37364 + }, + { + "epoch": 0.96, + "learning_rate": 1.5924272933860077e-06, + "loss": 0.8838, + "step": 37365 + }, + { + "epoch": 0.96, + "learning_rate": 1.59240500117965e-06, + "loss": 0.7842, + "step": 37366 + }, + { + "epoch": 0.96, + "learning_rate": 1.592382708519715e-06, + "loss": 0.7183, + "step": 37367 + }, + { + "epoch": 0.96, + "learning_rate": 1.59236041540622e-06, + "loss": 0.7979, + "step": 37368 + }, + { + "epoch": 0.96, + "learning_rate": 1.5923381218391817e-06, + "loss": 0.8271, + "step": 37369 + }, + { + "epoch": 0.96, + "learning_rate": 1.5923158278186174e-06, + "loss": 0.8652, + "step": 37370 + }, + { + "epoch": 0.96, + "learning_rate": 1.5922935333445441e-06, + "loss": 0.6436, + "step": 37371 + }, + { + "epoch": 0.96, + "learning_rate": 1.592271238416979e-06, + "loss": 0.8447, + "step": 37372 + }, + { + "epoch": 0.96, + "learning_rate": 1.592248943035939e-06, + "loss": 0.8691, + "step": 37373 + }, + { + "epoch": 0.96, + "learning_rate": 1.592226647201441e-06, + "loss": 0.7832, + "step": 37374 + }, + { + "epoch": 0.96, + "learning_rate": 1.5922043509135025e-06, + "loss": 0.7915, + "step": 37375 + }, + { + "epoch": 0.96, + "learning_rate": 1.5921820541721403e-06, + "loss": 1.0547, + "step": 37376 + }, + { + "epoch": 0.96, + "learning_rate": 1.5921597569773715e-06, + "loss": 0.7063, + "step": 37377 + }, + { + "epoch": 0.96, + "learning_rate": 1.5921374593292131e-06, + "loss": 0.8809, + "step": 37378 + }, + { + "epoch": 0.96, + "learning_rate": 1.5921151612276825e-06, + "loss": 0.833, + "step": 37379 + }, + { + "epoch": 0.96, + "learning_rate": 1.5920928626727965e-06, + "loss": 0.7227, + "step": 37380 + }, + { + "epoch": 0.96, + "learning_rate": 1.5920705636645721e-06, + "loss": 0.8716, + "step": 37381 + }, + { + "epoch": 0.96, + "learning_rate": 1.5920482642030267e-06, + "loss": 0.6411, + "step": 37382 + }, + { + "epoch": 0.96, + "learning_rate": 1.5920259642881768e-06, + "loss": 0.8105, + "step": 37383 + }, + { + "epoch": 0.96, + "learning_rate": 1.5920036639200402e-06, + "loss": 0.6135, + "step": 37384 + }, + { + "epoch": 0.96, + "learning_rate": 1.5919813630986336e-06, + "loss": 0.916, + "step": 37385 + }, + { + "epoch": 0.96, + "learning_rate": 1.591959061823974e-06, + "loss": 0.645, + "step": 37386 + }, + { + "epoch": 0.96, + "learning_rate": 1.5919367600960784e-06, + "loss": 0.8789, + "step": 37387 + }, + { + "epoch": 0.96, + "learning_rate": 1.5919144579149641e-06, + "loss": 0.7617, + "step": 37388 + }, + { + "epoch": 0.96, + "learning_rate": 1.5918921552806483e-06, + "loss": 0.7744, + "step": 37389 + }, + { + "epoch": 0.96, + "learning_rate": 1.591869852193148e-06, + "loss": 0.8271, + "step": 37390 + }, + { + "epoch": 0.96, + "learning_rate": 1.59184754865248e-06, + "loss": 1.3281, + "step": 37391 + }, + { + "epoch": 0.96, + "learning_rate": 1.5918252446586613e-06, + "loss": 1.0967, + "step": 37392 + }, + { + "epoch": 0.96, + "learning_rate": 1.5918029402117093e-06, + "loss": 0.9043, + "step": 37393 + }, + { + "epoch": 0.96, + "learning_rate": 1.5917806353116411e-06, + "loss": 0.8926, + "step": 37394 + }, + { + "epoch": 0.96, + "learning_rate": 1.5917583299584738e-06, + "loss": 0.9009, + "step": 37395 + }, + { + "epoch": 0.96, + "learning_rate": 1.5917360241522243e-06, + "loss": 0.7725, + "step": 37396 + }, + { + "epoch": 0.96, + "learning_rate": 1.5917137178929096e-06, + "loss": 0.7559, + "step": 37397 + }, + { + "epoch": 0.96, + "learning_rate": 1.591691411180547e-06, + "loss": 0.8049, + "step": 37398 + }, + { + "epoch": 0.96, + "learning_rate": 1.5916691040151537e-06, + "loss": 0.7969, + "step": 37399 + }, + { + "epoch": 0.96, + "learning_rate": 1.5916467963967463e-06, + "loss": 0.8643, + "step": 37400 + }, + { + "epoch": 0.96, + "learning_rate": 1.5916244883253422e-06, + "loss": 0.7192, + "step": 37401 + }, + { + "epoch": 0.96, + "learning_rate": 1.5916021798009585e-06, + "loss": 0.6528, + "step": 37402 + }, + { + "epoch": 0.96, + "learning_rate": 1.591579870823612e-06, + "loss": 0.8115, + "step": 37403 + }, + { + "epoch": 0.96, + "learning_rate": 1.59155756139332e-06, + "loss": 0.7617, + "step": 37404 + }, + { + "epoch": 0.96, + "learning_rate": 1.5915352515101002e-06, + "loss": 0.9023, + "step": 37405 + }, + { + "epoch": 0.96, + "learning_rate": 1.5915129411739685e-06, + "loss": 0.8506, + "step": 37406 + }, + { + "epoch": 0.96, + "learning_rate": 1.5914906303849426e-06, + "loss": 0.6753, + "step": 37407 + }, + { + "epoch": 0.96, + "learning_rate": 1.5914683191430396e-06, + "loss": 0.8369, + "step": 37408 + }, + { + "epoch": 0.96, + "learning_rate": 1.5914460074482766e-06, + "loss": 1.0078, + "step": 37409 + }, + { + "epoch": 0.96, + "learning_rate": 1.5914236953006707e-06, + "loss": 0.7319, + "step": 37410 + }, + { + "epoch": 0.96, + "learning_rate": 1.5914013827002384e-06, + "loss": 0.7466, + "step": 37411 + }, + { + "epoch": 0.96, + "learning_rate": 1.5913790696469973e-06, + "loss": 0.9346, + "step": 37412 + }, + { + "epoch": 0.96, + "learning_rate": 1.5913567561409647e-06, + "loss": 0.7881, + "step": 37413 + }, + { + "epoch": 0.96, + "learning_rate": 1.5913344421821573e-06, + "loss": 0.7627, + "step": 37414 + }, + { + "epoch": 0.96, + "learning_rate": 1.5913121277705926e-06, + "loss": 0.9756, + "step": 37415 + }, + { + "epoch": 0.96, + "learning_rate": 1.591289812906287e-06, + "loss": 1.0859, + "step": 37416 + }, + { + "epoch": 0.96, + "learning_rate": 1.591267497589258e-06, + "loss": 0.9473, + "step": 37417 + }, + { + "epoch": 0.96, + "learning_rate": 1.5912451818195228e-06, + "loss": 0.834, + "step": 37418 + }, + { + "epoch": 0.96, + "learning_rate": 1.5912228655970985e-06, + "loss": 0.9121, + "step": 37419 + }, + { + "epoch": 0.96, + "learning_rate": 1.5912005489220017e-06, + "loss": 0.7969, + "step": 37420 + }, + { + "epoch": 0.96, + "learning_rate": 1.5911782317942501e-06, + "loss": 0.8232, + "step": 37421 + }, + { + "epoch": 0.96, + "learning_rate": 1.5911559142138602e-06, + "loss": 0.708, + "step": 37422 + }, + { + "epoch": 0.96, + "learning_rate": 1.5911335961808496e-06, + "loss": 0.8213, + "step": 37423 + }, + { + "epoch": 0.96, + "learning_rate": 1.5911112776952354e-06, + "loss": 0.8574, + "step": 37424 + }, + { + "epoch": 0.96, + "learning_rate": 1.5910889587570343e-06, + "loss": 0.7478, + "step": 37425 + }, + { + "epoch": 0.96, + "learning_rate": 1.5910666393662635e-06, + "loss": 0.8945, + "step": 37426 + }, + { + "epoch": 0.96, + "learning_rate": 1.5910443195229402e-06, + "loss": 1.0225, + "step": 37427 + }, + { + "epoch": 0.96, + "learning_rate": 1.5910219992270814e-06, + "loss": 0.8789, + "step": 37428 + }, + { + "epoch": 0.96, + "learning_rate": 1.5909996784787043e-06, + "loss": 0.8003, + "step": 37429 + }, + { + "epoch": 0.96, + "learning_rate": 1.590977357277826e-06, + "loss": 0.8359, + "step": 37430 + }, + { + "epoch": 0.96, + "learning_rate": 1.5909550356244633e-06, + "loss": 0.8164, + "step": 37431 + }, + { + "epoch": 0.96, + "learning_rate": 1.5909327135186335e-06, + "loss": 0.8208, + "step": 37432 + }, + { + "epoch": 0.96, + "learning_rate": 1.5909103909603538e-06, + "loss": 0.6267, + "step": 37433 + }, + { + "epoch": 0.96, + "learning_rate": 1.590888067949641e-06, + "loss": 0.8442, + "step": 37434 + }, + { + "epoch": 0.96, + "learning_rate": 1.5908657444865128e-06, + "loss": 0.853, + "step": 37435 + }, + { + "epoch": 0.96, + "learning_rate": 1.5908434205709856e-06, + "loss": 0.6709, + "step": 37436 + }, + { + "epoch": 0.96, + "learning_rate": 1.5908210962030767e-06, + "loss": 0.8506, + "step": 37437 + }, + { + "epoch": 0.96, + "learning_rate": 1.5907987713828034e-06, + "loss": 0.7417, + "step": 37438 + }, + { + "epoch": 0.96, + "learning_rate": 1.5907764461101824e-06, + "loss": 0.4043, + "step": 37439 + }, + { + "epoch": 0.96, + "learning_rate": 1.5907541203852315e-06, + "loss": 0.9072, + "step": 37440 + }, + { + "epoch": 0.96, + "learning_rate": 1.5907317942079667e-06, + "loss": 0.9307, + "step": 37441 + }, + { + "epoch": 0.96, + "learning_rate": 1.5907094675784062e-06, + "loss": 0.6919, + "step": 37442 + }, + { + "epoch": 0.96, + "learning_rate": 1.5906871404965665e-06, + "loss": 0.8467, + "step": 37443 + }, + { + "epoch": 0.96, + "learning_rate": 1.5906648129624648e-06, + "loss": 0.783, + "step": 37444 + }, + { + "epoch": 0.96, + "learning_rate": 1.5906424849761185e-06, + "loss": 0.9072, + "step": 37445 + }, + { + "epoch": 0.96, + "learning_rate": 1.5906201565375442e-06, + "loss": 0.793, + "step": 37446 + }, + { + "epoch": 0.96, + "learning_rate": 1.590597827646759e-06, + "loss": 0.793, + "step": 37447 + }, + { + "epoch": 0.96, + "learning_rate": 1.5905754983037802e-06, + "loss": 0.8848, + "step": 37448 + }, + { + "epoch": 0.96, + "learning_rate": 1.590553168508625e-06, + "loss": 0.9854, + "step": 37449 + }, + { + "epoch": 0.96, + "learning_rate": 1.5905308382613108e-06, + "loss": 0.7588, + "step": 37450 + }, + { + "epoch": 0.96, + "learning_rate": 1.5905085075618536e-06, + "loss": 1.0186, + "step": 37451 + }, + { + "epoch": 0.96, + "learning_rate": 1.5904861764102715e-06, + "loss": 0.8828, + "step": 37452 + }, + { + "epoch": 0.96, + "learning_rate": 1.5904638448065812e-06, + "loss": 0.8965, + "step": 37453 + }, + { + "epoch": 0.96, + "learning_rate": 1.5904415127508001e-06, + "loss": 0.6196, + "step": 37454 + }, + { + "epoch": 0.96, + "learning_rate": 1.590419180242945e-06, + "loss": 0.7769, + "step": 37455 + }, + { + "epoch": 0.96, + "learning_rate": 1.590396847283033e-06, + "loss": 0.9238, + "step": 37456 + }, + { + "epoch": 0.96, + "learning_rate": 1.5903745138710813e-06, + "loss": 0.8223, + "step": 37457 + }, + { + "epoch": 0.96, + "learning_rate": 1.590352180007107e-06, + "loss": 0.8613, + "step": 37458 + }, + { + "epoch": 0.96, + "learning_rate": 1.5903298456911272e-06, + "loss": 0.8926, + "step": 37459 + }, + { + "epoch": 0.96, + "learning_rate": 1.590307510923159e-06, + "loss": 0.6538, + "step": 37460 + }, + { + "epoch": 0.96, + "learning_rate": 1.5902851757032196e-06, + "loss": 1.0029, + "step": 37461 + }, + { + "epoch": 0.96, + "learning_rate": 1.5902628400313257e-06, + "loss": 0.698, + "step": 37462 + }, + { + "epoch": 0.96, + "learning_rate": 1.590240503907495e-06, + "loss": 0.9668, + "step": 37463 + }, + { + "epoch": 0.96, + "learning_rate": 1.5902181673317438e-06, + "loss": 0.7705, + "step": 37464 + }, + { + "epoch": 0.96, + "learning_rate": 1.59019583030409e-06, + "loss": 0.8857, + "step": 37465 + }, + { + "epoch": 0.96, + "learning_rate": 1.5901734928245506e-06, + "loss": 0.9766, + "step": 37466 + }, + { + "epoch": 0.96, + "learning_rate": 1.5901511548931421e-06, + "loss": 0.7988, + "step": 37467 + }, + { + "epoch": 0.96, + "learning_rate": 1.5901288165098822e-06, + "loss": 0.7637, + "step": 37468 + }, + { + "epoch": 0.96, + "learning_rate": 1.5901064776747877e-06, + "loss": 1.0781, + "step": 37469 + }, + { + "epoch": 0.96, + "learning_rate": 1.590084138387876e-06, + "loss": 0.6128, + "step": 37470 + }, + { + "epoch": 0.96, + "learning_rate": 1.590061798649164e-06, + "loss": 0.7627, + "step": 37471 + }, + { + "epoch": 0.96, + "learning_rate": 1.5900394584586688e-06, + "loss": 0.9404, + "step": 37472 + }, + { + "epoch": 0.96, + "learning_rate": 1.5900171178164072e-06, + "loss": 0.8936, + "step": 37473 + }, + { + "epoch": 0.96, + "learning_rate": 1.5899947767223968e-06, + "loss": 0.8125, + "step": 37474 + }, + { + "epoch": 0.96, + "learning_rate": 1.5899724351766545e-06, + "loss": 0.7207, + "step": 37475 + }, + { + "epoch": 0.96, + "learning_rate": 1.5899500931791976e-06, + "loss": 0.7754, + "step": 37476 + }, + { + "epoch": 0.96, + "learning_rate": 1.5899277507300428e-06, + "loss": 0.96, + "step": 37477 + }, + { + "epoch": 0.96, + "learning_rate": 1.5899054078292076e-06, + "loss": 0.8994, + "step": 37478 + }, + { + "epoch": 0.96, + "learning_rate": 1.5898830644767089e-06, + "loss": 0.9805, + "step": 37479 + }, + { + "epoch": 0.96, + "learning_rate": 1.5898607206725641e-06, + "loss": 0.6145, + "step": 37480 + }, + { + "epoch": 0.96, + "learning_rate": 1.58983837641679e-06, + "loss": 0.7803, + "step": 37481 + }, + { + "epoch": 0.96, + "learning_rate": 1.5898160317094035e-06, + "loss": 1.0791, + "step": 37482 + }, + { + "epoch": 0.96, + "learning_rate": 1.589793686550422e-06, + "loss": 0.7817, + "step": 37483 + }, + { + "epoch": 0.96, + "learning_rate": 1.5897713409398627e-06, + "loss": 0.9619, + "step": 37484 + }, + { + "epoch": 0.96, + "learning_rate": 1.5897489948777428e-06, + "loss": 0.8818, + "step": 37485 + }, + { + "epoch": 0.96, + "learning_rate": 1.589726648364079e-06, + "loss": 0.8506, + "step": 37486 + }, + { + "epoch": 0.96, + "learning_rate": 1.5897043013988886e-06, + "loss": 1.0469, + "step": 37487 + }, + { + "epoch": 0.96, + "learning_rate": 1.5896819539821888e-06, + "loss": 0.958, + "step": 37488 + }, + { + "epoch": 0.96, + "learning_rate": 1.5896596061139967e-06, + "loss": 0.5791, + "step": 37489 + }, + { + "epoch": 0.96, + "learning_rate": 1.5896372577943294e-06, + "loss": 0.9131, + "step": 37490 + }, + { + "epoch": 0.96, + "learning_rate": 1.5896149090232038e-06, + "loss": 0.7627, + "step": 37491 + }, + { + "epoch": 0.96, + "learning_rate": 1.589592559800637e-06, + "loss": 0.9307, + "step": 37492 + }, + { + "epoch": 0.96, + "learning_rate": 1.5895702101266466e-06, + "loss": 0.8838, + "step": 37493 + }, + { + "epoch": 0.96, + "learning_rate": 1.5895478600012493e-06, + "loss": 0.8701, + "step": 37494 + }, + { + "epoch": 0.96, + "learning_rate": 1.5895255094244627e-06, + "loss": 0.7363, + "step": 37495 + }, + { + "epoch": 0.96, + "learning_rate": 1.5895031583963028e-06, + "loss": 0.9912, + "step": 37496 + }, + { + "epoch": 0.96, + "learning_rate": 1.589480806916788e-06, + "loss": 0.6338, + "step": 37497 + }, + { + "epoch": 0.96, + "learning_rate": 1.5894584549859345e-06, + "loss": 0.8262, + "step": 37498 + }, + { + "epoch": 0.96, + "learning_rate": 1.5894361026037597e-06, + "loss": 0.8457, + "step": 37499 + }, + { + "epoch": 0.96, + "learning_rate": 1.5894137497702814e-06, + "loss": 0.6797, + "step": 37500 + }, + { + "epoch": 0.96, + "learning_rate": 1.5893913964855154e-06, + "loss": 0.6147, + "step": 37501 + }, + { + "epoch": 0.96, + "learning_rate": 1.5893690427494799e-06, + "loss": 0.7104, + "step": 37502 + }, + { + "epoch": 0.96, + "learning_rate": 1.5893466885621916e-06, + "loss": 0.8799, + "step": 37503 + }, + { + "epoch": 0.96, + "learning_rate": 1.5893243339236672e-06, + "loss": 0.7046, + "step": 37504 + }, + { + "epoch": 0.96, + "learning_rate": 1.5893019788339248e-06, + "loss": 0.7607, + "step": 37505 + }, + { + "epoch": 0.96, + "learning_rate": 1.589279623292981e-06, + "loss": 0.8071, + "step": 37506 + }, + { + "epoch": 0.96, + "learning_rate": 1.5892572673008524e-06, + "loss": 0.79, + "step": 37507 + }, + { + "epoch": 0.96, + "learning_rate": 1.5892349108575569e-06, + "loss": 0.9082, + "step": 37508 + }, + { + "epoch": 0.96, + "learning_rate": 1.589212553963111e-06, + "loss": 0.7695, + "step": 37509 + }, + { + "epoch": 0.96, + "learning_rate": 1.5891901966175327e-06, + "loss": 0.9092, + "step": 37510 + }, + { + "epoch": 0.96, + "learning_rate": 1.5891678388208382e-06, + "loss": 0.6772, + "step": 37511 + }, + { + "epoch": 0.96, + "learning_rate": 1.589145480573045e-06, + "loss": 0.8037, + "step": 37512 + }, + { + "epoch": 0.96, + "learning_rate": 1.5891231218741705e-06, + "loss": 0.8232, + "step": 37513 + }, + { + "epoch": 0.96, + "learning_rate": 1.589100762724231e-06, + "loss": 1.1387, + "step": 37514 + }, + { + "epoch": 0.96, + "learning_rate": 1.5890784031232446e-06, + "loss": 0.8799, + "step": 37515 + }, + { + "epoch": 0.96, + "learning_rate": 1.5890560430712277e-06, + "loss": 0.6517, + "step": 37516 + }, + { + "epoch": 0.96, + "learning_rate": 1.589033682568198e-06, + "loss": 0.7627, + "step": 37517 + }, + { + "epoch": 0.96, + "learning_rate": 1.5890113216141718e-06, + "loss": 0.8447, + "step": 37518 + }, + { + "epoch": 0.96, + "learning_rate": 1.5889889602091669e-06, + "loss": 0.7881, + "step": 37519 + }, + { + "epoch": 0.96, + "learning_rate": 1.5889665983532004e-06, + "loss": 0.8955, + "step": 37520 + }, + { + "epoch": 0.96, + "learning_rate": 1.5889442360462892e-06, + "loss": 0.875, + "step": 37521 + }, + { + "epoch": 0.96, + "learning_rate": 1.5889218732884505e-06, + "loss": 0.7871, + "step": 37522 + }, + { + "epoch": 0.96, + "learning_rate": 1.5888995100797012e-06, + "loss": 0.6084, + "step": 37523 + }, + { + "epoch": 0.96, + "learning_rate": 1.5888771464200587e-06, + "loss": 0.8721, + "step": 37524 + }, + { + "epoch": 0.96, + "learning_rate": 1.5888547823095402e-06, + "loss": 0.6357, + "step": 37525 + }, + { + "epoch": 0.96, + "learning_rate": 1.5888324177481625e-06, + "loss": 0.5649, + "step": 37526 + }, + { + "epoch": 0.96, + "learning_rate": 1.5888100527359429e-06, + "loss": 0.6914, + "step": 37527 + }, + { + "epoch": 0.96, + "learning_rate": 1.5887876872728984e-06, + "loss": 0.9443, + "step": 37528 + }, + { + "epoch": 0.96, + "learning_rate": 1.5887653213590465e-06, + "loss": 0.875, + "step": 37529 + }, + { + "epoch": 0.96, + "learning_rate": 1.588742954994404e-06, + "loss": 0.9795, + "step": 37530 + }, + { + "epoch": 0.96, + "learning_rate": 1.588720588178988e-06, + "loss": 0.52, + "step": 37531 + }, + { + "epoch": 0.96, + "learning_rate": 1.5886982209128159e-06, + "loss": 0.9033, + "step": 37532 + }, + { + "epoch": 0.96, + "learning_rate": 1.5886758531959044e-06, + "loss": 0.7383, + "step": 37533 + }, + { + "epoch": 0.96, + "learning_rate": 1.588653485028271e-06, + "loss": 0.9287, + "step": 37534 + }, + { + "epoch": 0.96, + "learning_rate": 1.5886311164099327e-06, + "loss": 0.613, + "step": 37535 + }, + { + "epoch": 0.96, + "learning_rate": 1.5886087473409066e-06, + "loss": 0.7559, + "step": 37536 + }, + { + "epoch": 0.96, + "learning_rate": 1.5885863778212098e-06, + "loss": 0.7644, + "step": 37537 + }, + { + "epoch": 0.96, + "learning_rate": 1.5885640078508595e-06, + "loss": 0.7656, + "step": 37538 + }, + { + "epoch": 0.96, + "learning_rate": 1.5885416374298729e-06, + "loss": 0.7134, + "step": 37539 + }, + { + "epoch": 0.96, + "learning_rate": 1.5885192665582673e-06, + "loss": 0.8486, + "step": 37540 + }, + { + "epoch": 0.96, + "learning_rate": 1.588496895236059e-06, + "loss": 0.7578, + "step": 37541 + }, + { + "epoch": 0.96, + "learning_rate": 1.5884745234632657e-06, + "loss": 0.9941, + "step": 37542 + }, + { + "epoch": 0.96, + "learning_rate": 1.5884521512399048e-06, + "loss": 0.9189, + "step": 37543 + }, + { + "epoch": 0.96, + "learning_rate": 1.588429778565993e-06, + "loss": 0.8682, + "step": 37544 + }, + { + "epoch": 0.96, + "learning_rate": 1.5884074054415479e-06, + "loss": 0.9189, + "step": 37545 + }, + { + "epoch": 0.96, + "learning_rate": 1.588385031866586e-06, + "loss": 0.644, + "step": 37546 + }, + { + "epoch": 0.96, + "learning_rate": 1.5883626578411248e-06, + "loss": 0.9766, + "step": 37547 + }, + { + "epoch": 0.96, + "learning_rate": 1.5883402833651811e-06, + "loss": 0.8135, + "step": 37548 + }, + { + "epoch": 0.96, + "learning_rate": 1.5883179084387727e-06, + "loss": 0.8047, + "step": 37549 + }, + { + "epoch": 0.96, + "learning_rate": 1.588295533061916e-06, + "loss": 0.7188, + "step": 37550 + }, + { + "epoch": 0.96, + "learning_rate": 1.5882731572346288e-06, + "loss": 0.7915, + "step": 37551 + }, + { + "epoch": 0.96, + "learning_rate": 1.5882507809569277e-06, + "loss": 0.7319, + "step": 37552 + }, + { + "epoch": 0.96, + "learning_rate": 1.5882284042288298e-06, + "loss": 0.9189, + "step": 37553 + }, + { + "epoch": 0.96, + "learning_rate": 1.588206027050353e-06, + "loss": 0.8315, + "step": 37554 + }, + { + "epoch": 0.96, + "learning_rate": 1.5881836494215134e-06, + "loss": 0.9824, + "step": 37555 + }, + { + "epoch": 0.96, + "learning_rate": 1.588161271342329e-06, + "loss": 0.6086, + "step": 37556 + }, + { + "epoch": 0.96, + "learning_rate": 1.5881388928128163e-06, + "loss": 0.6714, + "step": 37557 + }, + { + "epoch": 0.96, + "learning_rate": 1.588116513832993e-06, + "loss": 0.6694, + "step": 37558 + }, + { + "epoch": 0.96, + "learning_rate": 1.5880941344028753e-06, + "loss": 0.6255, + "step": 37559 + }, + { + "epoch": 0.96, + "learning_rate": 1.5880717545224816e-06, + "loss": 0.7549, + "step": 37560 + }, + { + "epoch": 0.96, + "learning_rate": 1.5880493741918282e-06, + "loss": 0.7119, + "step": 37561 + }, + { + "epoch": 0.96, + "learning_rate": 1.5880269934109322e-06, + "loss": 0.6895, + "step": 37562 + }, + { + "epoch": 0.96, + "learning_rate": 1.5880046121798114e-06, + "loss": 0.9648, + "step": 37563 + }, + { + "epoch": 0.96, + "learning_rate": 1.5879822304984823e-06, + "loss": 0.834, + "step": 37564 + }, + { + "epoch": 0.96, + "learning_rate": 1.5879598483669621e-06, + "loss": 0.9697, + "step": 37565 + }, + { + "epoch": 0.96, + "learning_rate": 1.5879374657852683e-06, + "loss": 0.8164, + "step": 37566 + }, + { + "epoch": 0.96, + "learning_rate": 1.5879150827534175e-06, + "loss": 0.9756, + "step": 37567 + }, + { + "epoch": 0.96, + "learning_rate": 1.5878926992714274e-06, + "loss": 1.0293, + "step": 37568 + }, + { + "epoch": 0.96, + "learning_rate": 1.5878703153393147e-06, + "loss": 0.749, + "step": 37569 + }, + { + "epoch": 0.96, + "learning_rate": 1.5878479309570971e-06, + "loss": 0.7764, + "step": 37570 + }, + { + "epoch": 0.96, + "learning_rate": 1.5878255461247912e-06, + "loss": 0.9814, + "step": 37571 + }, + { + "epoch": 0.96, + "learning_rate": 1.5878031608424142e-06, + "loss": 0.8037, + "step": 37572 + }, + { + "epoch": 0.96, + "learning_rate": 1.5877807751099835e-06, + "loss": 1.04, + "step": 37573 + }, + { + "epoch": 0.96, + "learning_rate": 1.587758388927516e-06, + "loss": 0.9473, + "step": 37574 + }, + { + "epoch": 0.96, + "learning_rate": 1.587736002295029e-06, + "loss": 0.8418, + "step": 37575 + }, + { + "epoch": 0.96, + "learning_rate": 1.5877136152125394e-06, + "loss": 1.0293, + "step": 37576 + }, + { + "epoch": 0.96, + "learning_rate": 1.5876912276800644e-06, + "loss": 0.9668, + "step": 37577 + }, + { + "epoch": 0.96, + "learning_rate": 1.5876688396976214e-06, + "loss": 0.916, + "step": 37578 + }, + { + "epoch": 0.96, + "learning_rate": 1.5876464512652277e-06, + "loss": 0.8408, + "step": 37579 + }, + { + "epoch": 0.96, + "learning_rate": 1.5876240623829e-06, + "loss": 0.7422, + "step": 37580 + }, + { + "epoch": 0.96, + "learning_rate": 1.5876016730506554e-06, + "loss": 0.7246, + "step": 37581 + }, + { + "epoch": 0.96, + "learning_rate": 1.5875792832685111e-06, + "loss": 0.8384, + "step": 37582 + }, + { + "epoch": 0.96, + "learning_rate": 1.5875568930364845e-06, + "loss": 0.7817, + "step": 37583 + }, + { + "epoch": 0.96, + "learning_rate": 1.5875345023545928e-06, + "loss": 1.0693, + "step": 37584 + }, + { + "epoch": 0.96, + "learning_rate": 1.587512111222853e-06, + "loss": 0.9648, + "step": 37585 + }, + { + "epoch": 0.96, + "learning_rate": 1.5874897196412818e-06, + "loss": 0.7861, + "step": 37586 + }, + { + "epoch": 0.96, + "learning_rate": 1.5874673276098968e-06, + "loss": 0.8047, + "step": 37587 + }, + { + "epoch": 0.96, + "learning_rate": 1.5874449351287152e-06, + "loss": 1.002, + "step": 37588 + }, + { + "epoch": 0.96, + "learning_rate": 1.5874225421977539e-06, + "loss": 0.7769, + "step": 37589 + }, + { + "epoch": 0.96, + "learning_rate": 1.5874001488170303e-06, + "loss": 0.8105, + "step": 37590 + }, + { + "epoch": 0.96, + "learning_rate": 1.5873777549865617e-06, + "loss": 0.7153, + "step": 37591 + }, + { + "epoch": 0.96, + "learning_rate": 1.5873553607063644e-06, + "loss": 0.8652, + "step": 37592 + }, + { + "epoch": 0.96, + "learning_rate": 1.5873329659764565e-06, + "loss": 0.9941, + "step": 37593 + }, + { + "epoch": 0.96, + "learning_rate": 1.5873105707968546e-06, + "loss": 0.7422, + "step": 37594 + }, + { + "epoch": 0.96, + "learning_rate": 1.587288175167576e-06, + "loss": 0.9287, + "step": 37595 + }, + { + "epoch": 0.96, + "learning_rate": 1.5872657790886379e-06, + "loss": 0.7324, + "step": 37596 + }, + { + "epoch": 0.96, + "learning_rate": 1.5872433825600574e-06, + "loss": 0.8262, + "step": 37597 + }, + { + "epoch": 0.96, + "learning_rate": 1.5872209855818515e-06, + "loss": 0.8066, + "step": 37598 + }, + { + "epoch": 0.96, + "learning_rate": 1.5871985881540378e-06, + "loss": 0.8223, + "step": 37599 + }, + { + "epoch": 0.96, + "learning_rate": 1.5871761902766328e-06, + "loss": 0.6763, + "step": 37600 + }, + { + "epoch": 0.96, + "learning_rate": 1.587153791949654e-06, + "loss": 0.7861, + "step": 37601 + }, + { + "epoch": 0.96, + "learning_rate": 1.5871313931731188e-06, + "loss": 0.7354, + "step": 37602 + }, + { + "epoch": 0.96, + "learning_rate": 1.587108993947044e-06, + "loss": 0.9873, + "step": 37603 + }, + { + "epoch": 0.96, + "learning_rate": 1.5870865942714466e-06, + "loss": 0.6523, + "step": 37604 + }, + { + "epoch": 0.96, + "learning_rate": 1.5870641941463446e-06, + "loss": 1.0117, + "step": 37605 + }, + { + "epoch": 0.96, + "learning_rate": 1.5870417935717537e-06, + "loss": 0.9609, + "step": 37606 + }, + { + "epoch": 0.96, + "learning_rate": 1.5870193925476924e-06, + "loss": 0.9336, + "step": 37607 + }, + { + "epoch": 0.96, + "learning_rate": 1.5869969910741774e-06, + "loss": 0.8018, + "step": 37608 + }, + { + "epoch": 0.96, + "learning_rate": 1.5869745891512257e-06, + "loss": 0.8467, + "step": 37609 + }, + { + "epoch": 0.96, + "learning_rate": 1.5869521867788544e-06, + "loss": 0.9219, + "step": 37610 + }, + { + "epoch": 0.96, + "learning_rate": 1.5869297839570809e-06, + "loss": 0.9678, + "step": 37611 + }, + { + "epoch": 0.96, + "learning_rate": 1.5869073806859223e-06, + "loss": 0.9375, + "step": 37612 + }, + { + "epoch": 0.96, + "learning_rate": 1.5868849769653956e-06, + "loss": 0.7051, + "step": 37613 + }, + { + "epoch": 0.96, + "learning_rate": 1.586862572795518e-06, + "loss": 0.8721, + "step": 37614 + }, + { + "epoch": 0.96, + "learning_rate": 1.586840168176307e-06, + "loss": 0.8701, + "step": 37615 + }, + { + "epoch": 0.96, + "learning_rate": 1.5868177631077794e-06, + "loss": 0.8535, + "step": 37616 + }, + { + "epoch": 0.96, + "learning_rate": 1.5867953575899523e-06, + "loss": 0.8027, + "step": 37617 + }, + { + "epoch": 0.96, + "learning_rate": 1.586772951622843e-06, + "loss": 0.9043, + "step": 37618 + }, + { + "epoch": 0.96, + "learning_rate": 1.5867505452064686e-06, + "loss": 0.875, + "step": 37619 + }, + { + "epoch": 0.96, + "learning_rate": 1.5867281383408463e-06, + "loss": 0.7676, + "step": 37620 + }, + { + "epoch": 0.96, + "learning_rate": 1.5867057310259932e-06, + "loss": 0.8105, + "step": 37621 + }, + { + "epoch": 0.96, + "learning_rate": 1.5866833232619265e-06, + "loss": 0.8428, + "step": 37622 + }, + { + "epoch": 0.96, + "learning_rate": 1.5866609150486637e-06, + "loss": 0.7637, + "step": 37623 + }, + { + "epoch": 0.96, + "learning_rate": 1.586638506386221e-06, + "loss": 0.957, + "step": 37624 + }, + { + "epoch": 0.96, + "learning_rate": 1.5866160972746168e-06, + "loss": 0.7773, + "step": 37625 + }, + { + "epoch": 0.96, + "learning_rate": 1.5865936877138674e-06, + "loss": 0.6777, + "step": 37626 + }, + { + "epoch": 0.96, + "learning_rate": 1.58657127770399e-06, + "loss": 0.9424, + "step": 37627 + }, + { + "epoch": 0.96, + "learning_rate": 1.586548867245002e-06, + "loss": 0.8013, + "step": 37628 + }, + { + "epoch": 0.96, + "learning_rate": 1.5865264563369205e-06, + "loss": 0.8447, + "step": 37629 + }, + { + "epoch": 0.96, + "learning_rate": 1.5865040449797628e-06, + "loss": 0.6948, + "step": 37630 + }, + { + "epoch": 0.96, + "learning_rate": 1.586481633173546e-06, + "loss": 0.8955, + "step": 37631 + }, + { + "epoch": 0.96, + "learning_rate": 1.5864592209182867e-06, + "loss": 0.9756, + "step": 37632 + }, + { + "epoch": 0.96, + "learning_rate": 1.586436808214003e-06, + "loss": 0.7529, + "step": 37633 + }, + { + "epoch": 0.96, + "learning_rate": 1.5864143950607115e-06, + "loss": 0.8276, + "step": 37634 + }, + { + "epoch": 0.96, + "learning_rate": 1.5863919814584295e-06, + "loss": 0.916, + "step": 37635 + }, + { + "epoch": 0.96, + "learning_rate": 1.586369567407174e-06, + "loss": 0.9473, + "step": 37636 + }, + { + "epoch": 0.96, + "learning_rate": 1.5863471529069623e-06, + "loss": 0.7949, + "step": 37637 + }, + { + "epoch": 0.96, + "learning_rate": 1.5863247379578115e-06, + "loss": 0.7881, + "step": 37638 + }, + { + "epoch": 0.96, + "learning_rate": 1.586302322559739e-06, + "loss": 0.8359, + "step": 37639 + }, + { + "epoch": 0.96, + "learning_rate": 1.5862799067127616e-06, + "loss": 0.959, + "step": 37640 + }, + { + "epoch": 0.96, + "learning_rate": 1.5862574904168966e-06, + "loss": 0.9463, + "step": 37641 + }, + { + "epoch": 0.96, + "learning_rate": 1.5862350736721615e-06, + "loss": 0.6367, + "step": 37642 + }, + { + "epoch": 0.96, + "learning_rate": 1.5862126564785729e-06, + "loss": 0.6289, + "step": 37643 + }, + { + "epoch": 0.96, + "learning_rate": 1.5861902388361483e-06, + "loss": 0.9014, + "step": 37644 + }, + { + "epoch": 0.96, + "learning_rate": 1.5861678207449048e-06, + "loss": 1.0215, + "step": 37645 + }, + { + "epoch": 0.96, + "learning_rate": 1.5861454022048593e-06, + "loss": 0.6162, + "step": 37646 + }, + { + "epoch": 0.96, + "learning_rate": 1.5861229832160294e-06, + "loss": 1.0273, + "step": 37647 + }, + { + "epoch": 0.96, + "learning_rate": 1.5861005637784321e-06, + "loss": 0.9844, + "step": 37648 + }, + { + "epoch": 0.96, + "learning_rate": 1.5860781438920845e-06, + "loss": 0.9873, + "step": 37649 + }, + { + "epoch": 0.96, + "learning_rate": 1.586055723557004e-06, + "loss": 0.9551, + "step": 37650 + }, + { + "epoch": 0.97, + "learning_rate": 1.5860333027732075e-06, + "loss": 0.7979, + "step": 37651 + }, + { + "epoch": 0.97, + "learning_rate": 1.5860108815407123e-06, + "loss": 0.7822, + "step": 37652 + }, + { + "epoch": 0.97, + "learning_rate": 1.5859884598595353e-06, + "loss": 0.8926, + "step": 37653 + }, + { + "epoch": 0.97, + "learning_rate": 1.585966037729694e-06, + "loss": 0.8843, + "step": 37654 + }, + { + "epoch": 0.97, + "learning_rate": 1.5859436151512056e-06, + "loss": 0.833, + "step": 37655 + }, + { + "epoch": 0.97, + "learning_rate": 1.5859211921240869e-06, + "loss": 0.6255, + "step": 37656 + }, + { + "epoch": 0.97, + "learning_rate": 1.5858987686483553e-06, + "loss": 0.8018, + "step": 37657 + }, + { + "epoch": 0.97, + "learning_rate": 1.585876344724028e-06, + "loss": 1.0098, + "step": 37658 + }, + { + "epoch": 0.97, + "learning_rate": 1.5858539203511221e-06, + "loss": 0.7842, + "step": 37659 + }, + { + "epoch": 0.97, + "learning_rate": 1.5858314955296547e-06, + "loss": 0.7605, + "step": 37660 + }, + { + "epoch": 0.97, + "learning_rate": 1.5858090702596433e-06, + "loss": 0.9473, + "step": 37661 + }, + { + "epoch": 0.97, + "learning_rate": 1.5857866445411047e-06, + "loss": 1.0928, + "step": 37662 + }, + { + "epoch": 0.97, + "learning_rate": 1.5857642183740562e-06, + "loss": 0.7812, + "step": 37663 + }, + { + "epoch": 0.97, + "learning_rate": 1.5857417917585152e-06, + "loss": 1.1113, + "step": 37664 + }, + { + "epoch": 0.97, + "learning_rate": 1.5857193646944983e-06, + "loss": 1.0527, + "step": 37665 + }, + { + "epoch": 0.97, + "learning_rate": 1.585696937182023e-06, + "loss": 0.7979, + "step": 37666 + }, + { + "epoch": 0.97, + "learning_rate": 1.5856745092211066e-06, + "loss": 0.875, + "step": 37667 + }, + { + "epoch": 0.97, + "learning_rate": 1.5856520808117662e-06, + "loss": 0.9203, + "step": 37668 + }, + { + "epoch": 0.97, + "learning_rate": 1.5856296519540191e-06, + "loss": 0.6572, + "step": 37669 + }, + { + "epoch": 0.97, + "learning_rate": 1.585607222647882e-06, + "loss": 0.6187, + "step": 37670 + }, + { + "epoch": 0.97, + "learning_rate": 1.5855847928933726e-06, + "loss": 0.7163, + "step": 37671 + }, + { + "epoch": 0.97, + "learning_rate": 1.5855623626905078e-06, + "loss": 0.7642, + "step": 37672 + }, + { + "epoch": 0.97, + "learning_rate": 1.5855399320393046e-06, + "loss": 0.8848, + "step": 37673 + }, + { + "epoch": 0.97, + "learning_rate": 1.5855175009397806e-06, + "loss": 0.8965, + "step": 37674 + }, + { + "epoch": 0.97, + "learning_rate": 1.585495069391953e-06, + "loss": 0.6675, + "step": 37675 + }, + { + "epoch": 0.97, + "learning_rate": 1.585472637395838e-06, + "loss": 0.7783, + "step": 37676 + }, + { + "epoch": 0.97, + "learning_rate": 1.5854502049514542e-06, + "loss": 0.7417, + "step": 37677 + }, + { + "epoch": 0.97, + "learning_rate": 1.5854277720588178e-06, + "loss": 0.8105, + "step": 37678 + }, + { + "epoch": 0.97, + "learning_rate": 1.5854053387179466e-06, + "loss": 0.9414, + "step": 37679 + }, + { + "epoch": 0.97, + "learning_rate": 1.585382904928857e-06, + "loss": 0.8672, + "step": 37680 + }, + { + "epoch": 0.97, + "learning_rate": 1.585360470691567e-06, + "loss": 0.8828, + "step": 37681 + }, + { + "epoch": 0.97, + "learning_rate": 1.5853380360060933e-06, + "loss": 0.9082, + "step": 37682 + }, + { + "epoch": 0.97, + "learning_rate": 1.5853156008724532e-06, + "loss": 0.6533, + "step": 37683 + }, + { + "epoch": 0.97, + "learning_rate": 1.5852931652906636e-06, + "loss": 0.8013, + "step": 37684 + }, + { + "epoch": 0.97, + "learning_rate": 1.585270729260742e-06, + "loss": 0.8916, + "step": 37685 + }, + { + "epoch": 0.97, + "learning_rate": 1.5852482927827056e-06, + "loss": 0.748, + "step": 37686 + }, + { + "epoch": 0.97, + "learning_rate": 1.5852258558565716e-06, + "loss": 1.0273, + "step": 37687 + }, + { + "epoch": 0.97, + "learning_rate": 1.585203418482357e-06, + "loss": 0.7122, + "step": 37688 + }, + { + "epoch": 0.97, + "learning_rate": 1.5851809806600791e-06, + "loss": 0.8379, + "step": 37689 + }, + { + "epoch": 0.97, + "learning_rate": 1.585158542389755e-06, + "loss": 0.5376, + "step": 37690 + }, + { + "epoch": 0.97, + "learning_rate": 1.585136103671402e-06, + "loss": 0.8071, + "step": 37691 + }, + { + "epoch": 0.97, + "learning_rate": 1.585113664505037e-06, + "loss": 0.7505, + "step": 37692 + }, + { + "epoch": 0.97, + "learning_rate": 1.5850912248906774e-06, + "loss": 0.7769, + "step": 37693 + }, + { + "epoch": 0.97, + "learning_rate": 1.5850687848283405e-06, + "loss": 1.0928, + "step": 37694 + }, + { + "epoch": 0.97, + "learning_rate": 1.5850463443180433e-06, + "loss": 0.6582, + "step": 37695 + }, + { + "epoch": 0.97, + "learning_rate": 1.585023903359803e-06, + "loss": 0.8604, + "step": 37696 + }, + { + "epoch": 0.97, + "learning_rate": 1.5850014619536367e-06, + "loss": 0.9834, + "step": 37697 + }, + { + "epoch": 0.97, + "learning_rate": 1.5849790200995617e-06, + "loss": 0.6455, + "step": 37698 + }, + { + "epoch": 0.97, + "learning_rate": 1.5849565777975952e-06, + "loss": 0.5706, + "step": 37699 + }, + { + "epoch": 0.97, + "learning_rate": 1.5849341350477544e-06, + "loss": 0.8652, + "step": 37700 + }, + { + "epoch": 0.97, + "learning_rate": 1.5849116918500562e-06, + "loss": 1.0039, + "step": 37701 + }, + { + "epoch": 0.97, + "learning_rate": 1.5848892482045182e-06, + "loss": 0.8564, + "step": 37702 + }, + { + "epoch": 0.97, + "learning_rate": 1.5848668041111575e-06, + "loss": 0.9639, + "step": 37703 + }, + { + "epoch": 0.97, + "learning_rate": 1.5848443595699913e-06, + "loss": 0.7578, + "step": 37704 + }, + { + "epoch": 0.97, + "learning_rate": 1.5848219145810364e-06, + "loss": 0.9072, + "step": 37705 + }, + { + "epoch": 0.97, + "learning_rate": 1.58479946914431e-06, + "loss": 0.6245, + "step": 37706 + }, + { + "epoch": 0.97, + "learning_rate": 1.58477702325983e-06, + "loss": 0.8818, + "step": 37707 + }, + { + "epoch": 0.97, + "learning_rate": 1.584754576927613e-06, + "loss": 1.3623, + "step": 37708 + }, + { + "epoch": 0.97, + "learning_rate": 1.584732130147676e-06, + "loss": 0.9512, + "step": 37709 + }, + { + "epoch": 0.97, + "learning_rate": 1.5847096829200368e-06, + "loss": 0.9561, + "step": 37710 + }, + { + "epoch": 0.97, + "learning_rate": 1.5846872352447123e-06, + "loss": 0.7578, + "step": 37711 + }, + { + "epoch": 0.97, + "learning_rate": 1.5846647871217194e-06, + "loss": 0.8438, + "step": 37712 + }, + { + "epoch": 0.97, + "learning_rate": 1.5846423385510757e-06, + "loss": 0.9814, + "step": 37713 + }, + { + "epoch": 0.97, + "learning_rate": 1.5846198895327984e-06, + "loss": 0.8887, + "step": 37714 + }, + { + "epoch": 0.97, + "learning_rate": 1.5845974400669047e-06, + "loss": 0.8066, + "step": 37715 + }, + { + "epoch": 0.97, + "learning_rate": 1.5845749901534112e-06, + "loss": 0.7668, + "step": 37716 + }, + { + "epoch": 0.97, + "learning_rate": 1.5845525397923355e-06, + "loss": 0.7041, + "step": 37717 + }, + { + "epoch": 0.97, + "learning_rate": 1.584530088983695e-06, + "loss": 0.7969, + "step": 37718 + }, + { + "epoch": 0.97, + "learning_rate": 1.5845076377275065e-06, + "loss": 0.9956, + "step": 37719 + }, + { + "epoch": 0.97, + "learning_rate": 1.5844851860237877e-06, + "loss": 0.6997, + "step": 37720 + }, + { + "epoch": 0.97, + "learning_rate": 1.5844627338725554e-06, + "loss": 1.0693, + "step": 37721 + }, + { + "epoch": 0.97, + "learning_rate": 1.5844402812738266e-06, + "loss": 0.696, + "step": 37722 + }, + { + "epoch": 0.97, + "learning_rate": 1.584417828227619e-06, + "loss": 0.6357, + "step": 37723 + }, + { + "epoch": 0.97, + "learning_rate": 1.5843953747339494e-06, + "loss": 0.6619, + "step": 37724 + }, + { + "epoch": 0.97, + "learning_rate": 1.5843729207928354e-06, + "loss": 0.6421, + "step": 37725 + }, + { + "epoch": 0.97, + "learning_rate": 1.5843504664042934e-06, + "loss": 0.7197, + "step": 37726 + }, + { + "epoch": 0.97, + "learning_rate": 1.5843280115683414e-06, + "loss": 0.8242, + "step": 37727 + }, + { + "epoch": 0.97, + "learning_rate": 1.5843055562849964e-06, + "loss": 0.8965, + "step": 37728 + }, + { + "epoch": 0.97, + "learning_rate": 1.5842831005542756e-06, + "loss": 0.7617, + "step": 37729 + }, + { + "epoch": 0.97, + "learning_rate": 1.584260644376196e-06, + "loss": 0.6948, + "step": 37730 + }, + { + "epoch": 0.97, + "learning_rate": 1.5842381877507744e-06, + "loss": 0.7373, + "step": 37731 + }, + { + "epoch": 0.97, + "learning_rate": 1.584215730678029e-06, + "loss": 0.8193, + "step": 37732 + }, + { + "epoch": 0.97, + "learning_rate": 1.5841932731579766e-06, + "loss": 0.7383, + "step": 37733 + }, + { + "epoch": 0.97, + "learning_rate": 1.5841708151906338e-06, + "loss": 0.6143, + "step": 37734 + }, + { + "epoch": 0.97, + "learning_rate": 1.5841483567760186e-06, + "loss": 1.0527, + "step": 37735 + }, + { + "epoch": 0.97, + "learning_rate": 1.5841258979141476e-06, + "loss": 0.8682, + "step": 37736 + }, + { + "epoch": 0.97, + "learning_rate": 1.5841034386050388e-06, + "loss": 0.8711, + "step": 37737 + }, + { + "epoch": 0.97, + "learning_rate": 1.5840809788487082e-06, + "loss": 0.6533, + "step": 37738 + }, + { + "epoch": 0.97, + "learning_rate": 1.584058518645174e-06, + "loss": 0.8613, + "step": 37739 + }, + { + "epoch": 0.97, + "learning_rate": 1.584036057994453e-06, + "loss": 0.7617, + "step": 37740 + }, + { + "epoch": 0.97, + "learning_rate": 1.5840135968965625e-06, + "loss": 0.9277, + "step": 37741 + }, + { + "epoch": 0.97, + "learning_rate": 1.5839911353515194e-06, + "loss": 0.7744, + "step": 37742 + }, + { + "epoch": 0.97, + "learning_rate": 1.5839686733593414e-06, + "loss": 0.7197, + "step": 37743 + }, + { + "epoch": 0.97, + "learning_rate": 1.5839462109200454e-06, + "loss": 0.5415, + "step": 37744 + }, + { + "epoch": 0.97, + "learning_rate": 1.5839237480336488e-06, + "loss": 0.7324, + "step": 37745 + }, + { + "epoch": 0.97, + "learning_rate": 1.5839012847001682e-06, + "loss": 0.8535, + "step": 37746 + }, + { + "epoch": 0.97, + "learning_rate": 1.5838788209196214e-06, + "loss": 0.7874, + "step": 37747 + }, + { + "epoch": 0.97, + "learning_rate": 1.5838563566920256e-06, + "loss": 0.7998, + "step": 37748 + }, + { + "epoch": 0.97, + "learning_rate": 1.583833892017398e-06, + "loss": 0.9736, + "step": 37749 + }, + { + "epoch": 0.97, + "learning_rate": 1.583811426895755e-06, + "loss": 0.7832, + "step": 37750 + }, + { + "epoch": 0.97, + "learning_rate": 1.5837889613271149e-06, + "loss": 0.7776, + "step": 37751 + }, + { + "epoch": 0.97, + "learning_rate": 1.5837664953114941e-06, + "loss": 0.8955, + "step": 37752 + }, + { + "epoch": 0.97, + "learning_rate": 1.5837440288489106e-06, + "loss": 0.7344, + "step": 37753 + }, + { + "epoch": 0.97, + "learning_rate": 1.5837215619393809e-06, + "loss": 0.6343, + "step": 37754 + }, + { + "epoch": 0.97, + "learning_rate": 1.5836990945829224e-06, + "loss": 0.9482, + "step": 37755 + }, + { + "epoch": 0.97, + "learning_rate": 1.5836766267795523e-06, + "loss": 0.813, + "step": 37756 + }, + { + "epoch": 0.97, + "learning_rate": 1.583654158529288e-06, + "loss": 0.73, + "step": 37757 + }, + { + "epoch": 0.97, + "learning_rate": 1.5836316898321464e-06, + "loss": 0.9824, + "step": 37758 + }, + { + "epoch": 0.97, + "learning_rate": 1.583609220688145e-06, + "loss": 0.8228, + "step": 37759 + }, + { + "epoch": 0.97, + "learning_rate": 1.5835867510973009e-06, + "loss": 0.7246, + "step": 37760 + }, + { + "epoch": 0.97, + "learning_rate": 1.583564281059631e-06, + "loss": 0.7568, + "step": 37761 + }, + { + "epoch": 0.97, + "learning_rate": 1.583541810575153e-06, + "loss": 0.8057, + "step": 37762 + }, + { + "epoch": 0.97, + "learning_rate": 1.5835193396438837e-06, + "loss": 1.0527, + "step": 37763 + }, + { + "epoch": 0.97, + "learning_rate": 1.5834968682658407e-06, + "loss": 1.0645, + "step": 37764 + }, + { + "epoch": 0.97, + "learning_rate": 1.5834743964410408e-06, + "loss": 0.8101, + "step": 37765 + }, + { + "epoch": 0.97, + "learning_rate": 1.5834519241695015e-06, + "loss": 0.5063, + "step": 37766 + }, + { + "epoch": 0.97, + "learning_rate": 1.5834294514512396e-06, + "loss": 0.8848, + "step": 37767 + }, + { + "epoch": 0.97, + "learning_rate": 1.5834069782862728e-06, + "loss": 0.7949, + "step": 37768 + }, + { + "epoch": 0.97, + "learning_rate": 1.5833845046746184e-06, + "loss": 0.9453, + "step": 37769 + }, + { + "epoch": 0.97, + "learning_rate": 1.583362030616293e-06, + "loss": 0.7715, + "step": 37770 + }, + { + "epoch": 0.97, + "learning_rate": 1.583339556111314e-06, + "loss": 0.8867, + "step": 37771 + }, + { + "epoch": 0.97, + "learning_rate": 1.583317081159699e-06, + "loss": 0.8652, + "step": 37772 + }, + { + "epoch": 0.97, + "learning_rate": 1.5832946057614644e-06, + "loss": 0.8291, + "step": 37773 + }, + { + "epoch": 0.97, + "learning_rate": 1.5832721299166285e-06, + "loss": 1.0166, + "step": 37774 + }, + { + "epoch": 0.97, + "learning_rate": 1.5832496536252079e-06, + "loss": 1.1689, + "step": 37775 + }, + { + "epoch": 0.97, + "learning_rate": 1.5832271768872196e-06, + "loss": 0.8594, + "step": 37776 + }, + { + "epoch": 0.97, + "learning_rate": 1.5832046997026813e-06, + "loss": 0.6323, + "step": 37777 + }, + { + "epoch": 0.97, + "learning_rate": 1.5831822220716097e-06, + "loss": 0.959, + "step": 37778 + }, + { + "epoch": 0.97, + "learning_rate": 1.5831597439940225e-06, + "loss": 0.6938, + "step": 37779 + }, + { + "epoch": 0.97, + "learning_rate": 1.583137265469937e-06, + "loss": 0.9619, + "step": 37780 + }, + { + "epoch": 0.97, + "learning_rate": 1.5831147864993697e-06, + "loss": 1.0283, + "step": 37781 + }, + { + "epoch": 0.97, + "learning_rate": 1.583092307082338e-06, + "loss": 0.7764, + "step": 37782 + }, + { + "epoch": 0.97, + "learning_rate": 1.5830698272188596e-06, + "loss": 0.8003, + "step": 37783 + }, + { + "epoch": 0.97, + "learning_rate": 1.5830473469089518e-06, + "loss": 0.7373, + "step": 37784 + }, + { + "epoch": 0.97, + "learning_rate": 1.5830248661526308e-06, + "loss": 0.7861, + "step": 37785 + }, + { + "epoch": 0.97, + "learning_rate": 1.583002384949915e-06, + "loss": 0.9023, + "step": 37786 + }, + { + "epoch": 0.97, + "learning_rate": 1.582979903300821e-06, + "loss": 0.8887, + "step": 37787 + }, + { + "epoch": 0.97, + "learning_rate": 1.5829574212053658e-06, + "loss": 0.5959, + "step": 37788 + }, + { + "epoch": 0.97, + "learning_rate": 1.5829349386635671e-06, + "loss": 0.8467, + "step": 37789 + }, + { + "epoch": 0.97, + "learning_rate": 1.5829124556754422e-06, + "loss": 0.8018, + "step": 37790 + }, + { + "epoch": 0.97, + "learning_rate": 1.5828899722410073e-06, + "loss": 0.7969, + "step": 37791 + }, + { + "epoch": 0.97, + "learning_rate": 1.5828674883602807e-06, + "loss": 0.792, + "step": 37792 + }, + { + "epoch": 0.97, + "learning_rate": 1.5828450040332796e-06, + "loss": 0.8096, + "step": 37793 + }, + { + "epoch": 0.97, + "learning_rate": 1.5828225192600209e-06, + "loss": 0.791, + "step": 37794 + }, + { + "epoch": 0.97, + "learning_rate": 1.5828000340405212e-06, + "loss": 0.7808, + "step": 37795 + }, + { + "epoch": 0.97, + "learning_rate": 1.5827775483747987e-06, + "loss": 0.8613, + "step": 37796 + }, + { + "epoch": 0.97, + "learning_rate": 1.58275506226287e-06, + "loss": 1.0361, + "step": 37797 + }, + { + "epoch": 0.97, + "learning_rate": 1.5827325757047528e-06, + "loss": 0.7891, + "step": 37798 + }, + { + "epoch": 0.97, + "learning_rate": 1.5827100887004641e-06, + "loss": 0.5698, + "step": 37799 + }, + { + "epoch": 0.97, + "learning_rate": 1.5826876012500208e-06, + "loss": 0.79, + "step": 37800 + }, + { + "epoch": 0.97, + "learning_rate": 1.5826651133534407e-06, + "loss": 0.7637, + "step": 37801 + }, + { + "epoch": 0.97, + "learning_rate": 1.5826426250107402e-06, + "loss": 0.5571, + "step": 37802 + }, + { + "epoch": 0.97, + "learning_rate": 1.5826201362219375e-06, + "loss": 0.7861, + "step": 37803 + }, + { + "epoch": 0.97, + "learning_rate": 1.5825976469870494e-06, + "loss": 0.7065, + "step": 37804 + }, + { + "epoch": 0.97, + "learning_rate": 1.582575157306093e-06, + "loss": 0.7666, + "step": 37805 + }, + { + "epoch": 0.97, + "learning_rate": 1.5825526671790855e-06, + "loss": 0.998, + "step": 37806 + }, + { + "epoch": 0.97, + "learning_rate": 1.5825301766060441e-06, + "loss": 0.6924, + "step": 37807 + }, + { + "epoch": 0.97, + "learning_rate": 1.5825076855869863e-06, + "loss": 0.8682, + "step": 37808 + }, + { + "epoch": 0.97, + "learning_rate": 1.5824851941219293e-06, + "loss": 0.538, + "step": 37809 + }, + { + "epoch": 0.97, + "learning_rate": 1.58246270221089e-06, + "loss": 0.561, + "step": 37810 + }, + { + "epoch": 0.97, + "learning_rate": 1.5824402098538856e-06, + "loss": 0.7432, + "step": 37811 + }, + { + "epoch": 0.97, + "learning_rate": 1.5824177170509337e-06, + "loss": 0.6426, + "step": 37812 + }, + { + "epoch": 0.97, + "learning_rate": 1.5823952238020513e-06, + "loss": 0.6997, + "step": 37813 + }, + { + "epoch": 0.97, + "learning_rate": 1.5823727301072558e-06, + "loss": 0.8438, + "step": 37814 + }, + { + "epoch": 0.97, + "learning_rate": 1.582350235966564e-06, + "loss": 0.9102, + "step": 37815 + }, + { + "epoch": 0.97, + "learning_rate": 1.5823277413799936e-06, + "loss": 0.9199, + "step": 37816 + }, + { + "epoch": 0.97, + "learning_rate": 1.5823052463475614e-06, + "loss": 0.8779, + "step": 37817 + }, + { + "epoch": 0.97, + "learning_rate": 1.5822827508692851e-06, + "loss": 0.8662, + "step": 37818 + }, + { + "epoch": 0.97, + "learning_rate": 1.5822602549451815e-06, + "loss": 0.7197, + "step": 37819 + }, + { + "epoch": 0.97, + "learning_rate": 1.582237758575268e-06, + "loss": 0.9209, + "step": 37820 + }, + { + "epoch": 0.97, + "learning_rate": 1.582215261759562e-06, + "loss": 0.9141, + "step": 37821 + }, + { + "epoch": 0.97, + "learning_rate": 1.5821927644980804e-06, + "loss": 0.8755, + "step": 37822 + }, + { + "epoch": 0.97, + "learning_rate": 1.5821702667908406e-06, + "loss": 0.8379, + "step": 37823 + }, + { + "epoch": 0.97, + "learning_rate": 1.58214776863786e-06, + "loss": 0.8086, + "step": 37824 + }, + { + "epoch": 0.97, + "learning_rate": 1.5821252700391554e-06, + "loss": 0.7812, + "step": 37825 + }, + { + "epoch": 0.97, + "learning_rate": 1.5821027709947442e-06, + "loss": 0.7251, + "step": 37826 + }, + { + "epoch": 0.97, + "learning_rate": 1.5820802715046438e-06, + "loss": 0.8062, + "step": 37827 + }, + { + "epoch": 0.97, + "learning_rate": 1.5820577715688712e-06, + "loss": 0.7471, + "step": 37828 + }, + { + "epoch": 0.97, + "learning_rate": 1.582035271187444e-06, + "loss": 0.7783, + "step": 37829 + }, + { + "epoch": 0.97, + "learning_rate": 1.5820127703603786e-06, + "loss": 0.7295, + "step": 37830 + }, + { + "epoch": 0.97, + "learning_rate": 1.5819902690876931e-06, + "loss": 0.877, + "step": 37831 + }, + { + "epoch": 0.97, + "learning_rate": 1.5819677673694045e-06, + "loss": 0.7363, + "step": 37832 + }, + { + "epoch": 0.97, + "learning_rate": 1.58194526520553e-06, + "loss": 0.9756, + "step": 37833 + }, + { + "epoch": 0.97, + "learning_rate": 1.5819227625960868e-06, + "loss": 0.9648, + "step": 37834 + }, + { + "epoch": 0.97, + "learning_rate": 1.5819002595410917e-06, + "loss": 0.8911, + "step": 37835 + }, + { + "epoch": 0.97, + "learning_rate": 1.5818777560405628e-06, + "loss": 0.688, + "step": 37836 + }, + { + "epoch": 0.97, + "learning_rate": 1.5818552520945165e-06, + "loss": 0.9609, + "step": 37837 + }, + { + "epoch": 0.97, + "learning_rate": 1.5818327477029706e-06, + "loss": 0.9854, + "step": 37838 + }, + { + "epoch": 0.97, + "learning_rate": 1.5818102428659418e-06, + "loss": 0.8848, + "step": 37839 + }, + { + "epoch": 0.97, + "learning_rate": 1.581787737583448e-06, + "loss": 1.0439, + "step": 37840 + }, + { + "epoch": 0.97, + "learning_rate": 1.581765231855506e-06, + "loss": 1.4229, + "step": 37841 + }, + { + "epoch": 0.97, + "learning_rate": 1.5817427256821331e-06, + "loss": 1.1377, + "step": 37842 + }, + { + "epoch": 0.97, + "learning_rate": 1.5817202190633462e-06, + "loss": 0.9199, + "step": 37843 + }, + { + "epoch": 0.97, + "learning_rate": 1.5816977119991635e-06, + "loss": 0.8936, + "step": 37844 + }, + { + "epoch": 0.97, + "learning_rate": 1.5816752044896014e-06, + "loss": 0.8975, + "step": 37845 + }, + { + "epoch": 0.97, + "learning_rate": 1.581652696534677e-06, + "loss": 0.6406, + "step": 37846 + }, + { + "epoch": 0.97, + "learning_rate": 1.581630188134408e-06, + "loss": 0.9502, + "step": 37847 + }, + { + "epoch": 0.97, + "learning_rate": 1.5816076792888118e-06, + "loss": 0.9492, + "step": 37848 + }, + { + "epoch": 0.97, + "learning_rate": 1.5815851699979055e-06, + "loss": 0.707, + "step": 37849 + }, + { + "epoch": 0.97, + "learning_rate": 1.5815626602617055e-06, + "loss": 0.7175, + "step": 37850 + }, + { + "epoch": 0.97, + "learning_rate": 1.58154015008023e-06, + "loss": 0.563, + "step": 37851 + }, + { + "epoch": 0.97, + "learning_rate": 1.581517639453496e-06, + "loss": 1.1787, + "step": 37852 + }, + { + "epoch": 0.97, + "learning_rate": 1.5814951283815207e-06, + "loss": 0.7109, + "step": 37853 + }, + { + "epoch": 0.97, + "learning_rate": 1.5814726168643215e-06, + "loss": 0.9106, + "step": 37854 + }, + { + "epoch": 0.97, + "learning_rate": 1.5814501049019153e-06, + "loss": 0.7896, + "step": 37855 + }, + { + "epoch": 0.97, + "learning_rate": 1.5814275924943195e-06, + "loss": 0.6836, + "step": 37856 + }, + { + "epoch": 0.97, + "learning_rate": 1.5814050796415511e-06, + "loss": 0.9277, + "step": 37857 + }, + { + "epoch": 0.97, + "learning_rate": 1.5813825663436278e-06, + "loss": 0.8887, + "step": 37858 + }, + { + "epoch": 0.97, + "learning_rate": 1.5813600526005666e-06, + "loss": 0.5684, + "step": 37859 + }, + { + "epoch": 0.97, + "learning_rate": 1.5813375384123848e-06, + "loss": 0.9287, + "step": 37860 + }, + { + "epoch": 0.97, + "learning_rate": 1.5813150237790996e-06, + "loss": 0.9443, + "step": 37861 + }, + { + "epoch": 0.97, + "learning_rate": 1.5812925087007278e-06, + "loss": 0.9111, + "step": 37862 + }, + { + "epoch": 0.97, + "learning_rate": 1.5812699931772873e-06, + "loss": 0.8291, + "step": 37863 + }, + { + "epoch": 0.97, + "learning_rate": 1.5812474772087953e-06, + "loss": 0.8838, + "step": 37864 + }, + { + "epoch": 0.97, + "learning_rate": 1.5812249607952686e-06, + "loss": 1.0664, + "step": 37865 + }, + { + "epoch": 0.97, + "learning_rate": 1.5812024439367247e-06, + "loss": 0.8496, + "step": 37866 + }, + { + "epoch": 0.97, + "learning_rate": 1.5811799266331809e-06, + "loss": 0.792, + "step": 37867 + }, + { + "epoch": 0.97, + "learning_rate": 1.5811574088846542e-06, + "loss": 0.8838, + "step": 37868 + }, + { + "epoch": 0.97, + "learning_rate": 1.581134890691162e-06, + "loss": 0.9717, + "step": 37869 + }, + { + "epoch": 0.97, + "learning_rate": 1.581112372052722e-06, + "loss": 0.8818, + "step": 37870 + }, + { + "epoch": 0.97, + "learning_rate": 1.5810898529693505e-06, + "loss": 0.9707, + "step": 37871 + }, + { + "epoch": 0.97, + "learning_rate": 1.581067333441065e-06, + "loss": 1.0225, + "step": 37872 + }, + { + "epoch": 0.97, + "learning_rate": 1.5810448134678834e-06, + "loss": 0.8359, + "step": 37873 + }, + { + "epoch": 0.97, + "learning_rate": 1.5810222930498225e-06, + "loss": 0.8369, + "step": 37874 + }, + { + "epoch": 0.97, + "learning_rate": 1.5809997721868995e-06, + "loss": 0.8008, + "step": 37875 + }, + { + "epoch": 0.97, + "learning_rate": 1.5809772508791315e-06, + "loss": 0.8623, + "step": 37876 + }, + { + "epoch": 0.97, + "learning_rate": 1.5809547291265361e-06, + "loss": 0.7422, + "step": 37877 + }, + { + "epoch": 0.97, + "learning_rate": 1.5809322069291305e-06, + "loss": 0.7441, + "step": 37878 + }, + { + "epoch": 0.97, + "learning_rate": 1.5809096842869315e-06, + "loss": 0.7124, + "step": 37879 + }, + { + "epoch": 0.97, + "learning_rate": 1.580887161199957e-06, + "loss": 0.8076, + "step": 37880 + }, + { + "epoch": 0.97, + "learning_rate": 1.5808646376682236e-06, + "loss": 0.7542, + "step": 37881 + }, + { + "epoch": 0.97, + "learning_rate": 1.5808421136917489e-06, + "loss": 0.8271, + "step": 37882 + }, + { + "epoch": 0.97, + "learning_rate": 1.5808195892705504e-06, + "loss": 0.9395, + "step": 37883 + }, + { + "epoch": 0.97, + "learning_rate": 1.580797064404645e-06, + "loss": 0.8013, + "step": 37884 + }, + { + "epoch": 0.97, + "learning_rate": 1.5807745390940497e-06, + "loss": 1.1436, + "step": 37885 + }, + { + "epoch": 0.97, + "learning_rate": 1.580752013338782e-06, + "loss": 0.9258, + "step": 37886 + }, + { + "epoch": 0.97, + "learning_rate": 1.5807294871388595e-06, + "loss": 0.8335, + "step": 37887 + }, + { + "epoch": 0.97, + "learning_rate": 1.5807069604942988e-06, + "loss": 0.8203, + "step": 37888 + }, + { + "epoch": 0.97, + "learning_rate": 1.5806844334051178e-06, + "loss": 1.0723, + "step": 37889 + }, + { + "epoch": 0.97, + "learning_rate": 1.5806619058713332e-06, + "loss": 0.7812, + "step": 37890 + }, + { + "epoch": 0.97, + "learning_rate": 1.5806393778929628e-06, + "loss": 0.8301, + "step": 37891 + }, + { + "epoch": 0.97, + "learning_rate": 1.5806168494700232e-06, + "loss": 0.6631, + "step": 37892 + }, + { + "epoch": 0.97, + "learning_rate": 1.5805943206025321e-06, + "loss": 0.9375, + "step": 37893 + }, + { + "epoch": 0.97, + "learning_rate": 1.5805717912905067e-06, + "loss": 0.5706, + "step": 37894 + }, + { + "epoch": 0.97, + "learning_rate": 1.5805492615339639e-06, + "loss": 0.6938, + "step": 37895 + }, + { + "epoch": 0.97, + "learning_rate": 1.5805267313329217e-06, + "loss": 0.9814, + "step": 37896 + }, + { + "epoch": 0.97, + "learning_rate": 1.5805042006873964e-06, + "loss": 1.0332, + "step": 37897 + }, + { + "epoch": 0.97, + "learning_rate": 1.5804816695974056e-06, + "loss": 0.6846, + "step": 37898 + }, + { + "epoch": 0.97, + "learning_rate": 1.5804591380629675e-06, + "loss": 0.7009, + "step": 37899 + }, + { + "epoch": 0.97, + "learning_rate": 1.5804366060840976e-06, + "loss": 0.7549, + "step": 37900 + }, + { + "epoch": 0.97, + "learning_rate": 1.5804140736608147e-06, + "loss": 0.9365, + "step": 37901 + }, + { + "epoch": 0.97, + "learning_rate": 1.5803915407931351e-06, + "loss": 0.8057, + "step": 37902 + }, + { + "epoch": 0.97, + "learning_rate": 1.5803690074810767e-06, + "loss": 0.6455, + "step": 37903 + }, + { + "epoch": 0.97, + "learning_rate": 1.5803464737246564e-06, + "loss": 0.8301, + "step": 37904 + }, + { + "epoch": 0.97, + "learning_rate": 1.5803239395238912e-06, + "loss": 0.7979, + "step": 37905 + }, + { + "epoch": 0.97, + "learning_rate": 1.5803014048787987e-06, + "loss": 0.4968, + "step": 37906 + }, + { + "epoch": 0.97, + "learning_rate": 1.5802788697893962e-06, + "loss": 0.6704, + "step": 37907 + }, + { + "epoch": 0.97, + "learning_rate": 1.5802563342557008e-06, + "loss": 0.7158, + "step": 37908 + }, + { + "epoch": 0.97, + "learning_rate": 1.58023379827773e-06, + "loss": 0.7173, + "step": 37909 + }, + { + "epoch": 0.97, + "learning_rate": 1.5802112618555005e-06, + "loss": 0.835, + "step": 37910 + }, + { + "epoch": 0.97, + "learning_rate": 1.5801887249890303e-06, + "loss": 1.1035, + "step": 37911 + }, + { + "epoch": 0.97, + "learning_rate": 1.5801661876783362e-06, + "loss": 0.7578, + "step": 37912 + }, + { + "epoch": 0.97, + "learning_rate": 1.580143649923435e-06, + "loss": 1.0156, + "step": 37913 + }, + { + "epoch": 0.97, + "learning_rate": 1.5801211117243453e-06, + "loss": 0.8916, + "step": 37914 + }, + { + "epoch": 0.97, + "learning_rate": 1.580098573081083e-06, + "loss": 0.9434, + "step": 37915 + }, + { + "epoch": 0.97, + "learning_rate": 1.5800760339936661e-06, + "loss": 0.9668, + "step": 37916 + }, + { + "epoch": 0.97, + "learning_rate": 1.5800534944621115e-06, + "loss": 0.8447, + "step": 37917 + }, + { + "epoch": 0.97, + "learning_rate": 1.5800309544864366e-06, + "loss": 0.7373, + "step": 37918 + }, + { + "epoch": 0.97, + "learning_rate": 1.5800084140666589e-06, + "loss": 0.8154, + "step": 37919 + }, + { + "epoch": 0.97, + "learning_rate": 1.5799858732027952e-06, + "loss": 0.9238, + "step": 37920 + }, + { + "epoch": 0.97, + "learning_rate": 1.5799633318948632e-06, + "loss": 0.7407, + "step": 37921 + }, + { + "epoch": 0.97, + "learning_rate": 1.5799407901428797e-06, + "loss": 0.8848, + "step": 37922 + }, + { + "epoch": 0.97, + "learning_rate": 1.5799182479468623e-06, + "loss": 0.7485, + "step": 37923 + }, + { + "epoch": 0.97, + "learning_rate": 1.5798957053068285e-06, + "loss": 0.8428, + "step": 37924 + }, + { + "epoch": 0.97, + "learning_rate": 1.5798731622227948e-06, + "loss": 0.8506, + "step": 37925 + }, + { + "epoch": 0.97, + "learning_rate": 1.579850618694779e-06, + "loss": 0.9062, + "step": 37926 + }, + { + "epoch": 0.97, + "learning_rate": 1.579828074722798e-06, + "loss": 0.7759, + "step": 37927 + }, + { + "epoch": 0.97, + "learning_rate": 1.5798055303068695e-06, + "loss": 1.1309, + "step": 37928 + }, + { + "epoch": 0.97, + "learning_rate": 1.5797829854470107e-06, + "loss": 0.8906, + "step": 37929 + }, + { + "epoch": 0.97, + "learning_rate": 1.5797604401432387e-06, + "loss": 0.9014, + "step": 37930 + }, + { + "epoch": 0.97, + "learning_rate": 1.5797378943955707e-06, + "loss": 0.6875, + "step": 37931 + }, + { + "epoch": 0.97, + "learning_rate": 1.579715348204024e-06, + "loss": 0.8574, + "step": 37932 + }, + { + "epoch": 0.97, + "learning_rate": 1.5796928015686159e-06, + "loss": 0.8848, + "step": 37933 + }, + { + "epoch": 0.97, + "learning_rate": 1.579670254489364e-06, + "loss": 0.8682, + "step": 37934 + }, + { + "epoch": 0.97, + "learning_rate": 1.579647706966285e-06, + "loss": 0.5796, + "step": 37935 + }, + { + "epoch": 0.97, + "learning_rate": 1.5796251589993963e-06, + "loss": 0.959, + "step": 37936 + }, + { + "epoch": 0.97, + "learning_rate": 1.5796026105887155e-06, + "loss": 0.7072, + "step": 37937 + }, + { + "epoch": 0.97, + "learning_rate": 1.5795800617342595e-06, + "loss": 0.7129, + "step": 37938 + }, + { + "epoch": 0.97, + "learning_rate": 1.5795575124360457e-06, + "loss": 0.7852, + "step": 37939 + }, + { + "epoch": 0.97, + "learning_rate": 1.5795349626940913e-06, + "loss": 0.9336, + "step": 37940 + }, + { + "epoch": 0.97, + "learning_rate": 1.5795124125084137e-06, + "loss": 0.7502, + "step": 37941 + }, + { + "epoch": 0.97, + "learning_rate": 1.57948986187903e-06, + "loss": 0.917, + "step": 37942 + }, + { + "epoch": 0.97, + "learning_rate": 1.5794673108059574e-06, + "loss": 0.9375, + "step": 37943 + }, + { + "epoch": 0.97, + "learning_rate": 1.579444759289214e-06, + "loss": 1.0684, + "step": 37944 + }, + { + "epoch": 0.97, + "learning_rate": 1.579422207328816e-06, + "loss": 0.7197, + "step": 37945 + }, + { + "epoch": 0.97, + "learning_rate": 1.579399654924781e-06, + "loss": 0.9473, + "step": 37946 + }, + { + "epoch": 0.97, + "learning_rate": 1.5793771020771262e-06, + "loss": 0.7568, + "step": 37947 + }, + { + "epoch": 0.97, + "learning_rate": 1.579354548785869e-06, + "loss": 0.6597, + "step": 37948 + }, + { + "epoch": 0.97, + "learning_rate": 1.5793319950510271e-06, + "loss": 0.7646, + "step": 37949 + }, + { + "epoch": 0.97, + "learning_rate": 1.579309440872617e-06, + "loss": 0.7334, + "step": 37950 + }, + { + "epoch": 0.97, + "learning_rate": 1.579286886250656e-06, + "loss": 0.4927, + "step": 37951 + }, + { + "epoch": 0.97, + "learning_rate": 1.5792643311851622e-06, + "loss": 0.9297, + "step": 37952 + }, + { + "epoch": 0.97, + "learning_rate": 1.5792417756761522e-06, + "loss": 0.9473, + "step": 37953 + }, + { + "epoch": 0.97, + "learning_rate": 1.5792192197236433e-06, + "loss": 0.7397, + "step": 37954 + }, + { + "epoch": 0.97, + "learning_rate": 1.5791966633276528e-06, + "loss": 0.7949, + "step": 37955 + }, + { + "epoch": 0.97, + "learning_rate": 1.5791741064881982e-06, + "loss": 0.7393, + "step": 37956 + }, + { + "epoch": 0.97, + "learning_rate": 1.5791515492052966e-06, + "loss": 0.4741, + "step": 37957 + }, + { + "epoch": 0.97, + "learning_rate": 1.5791289914789654e-06, + "loss": 0.6208, + "step": 37958 + }, + { + "epoch": 0.97, + "learning_rate": 1.5791064333092216e-06, + "loss": 0.7568, + "step": 37959 + }, + { + "epoch": 0.97, + "learning_rate": 1.5790838746960826e-06, + "loss": 0.6938, + "step": 37960 + }, + { + "epoch": 0.97, + "learning_rate": 1.5790613156395658e-06, + "loss": 0.7344, + "step": 37961 + }, + { + "epoch": 0.97, + "learning_rate": 1.5790387561396883e-06, + "loss": 0.8616, + "step": 37962 + }, + { + "epoch": 0.97, + "learning_rate": 1.5790161961964677e-06, + "loss": 0.7607, + "step": 37963 + }, + { + "epoch": 0.97, + "learning_rate": 1.5789936358099208e-06, + "loss": 0.748, + "step": 37964 + }, + { + "epoch": 0.97, + "learning_rate": 1.578971074980065e-06, + "loss": 0.9043, + "step": 37965 + }, + { + "epoch": 0.97, + "learning_rate": 1.5789485137069178e-06, + "loss": 0.6482, + "step": 37966 + }, + { + "epoch": 0.97, + "learning_rate": 1.578925951990496e-06, + "loss": 0.604, + "step": 37967 + }, + { + "epoch": 0.97, + "learning_rate": 1.5789033898308177e-06, + "loss": 0.8691, + "step": 37968 + }, + { + "epoch": 0.97, + "learning_rate": 1.5788808272278998e-06, + "loss": 0.8228, + "step": 37969 + }, + { + "epoch": 0.97, + "learning_rate": 1.578858264181759e-06, + "loss": 0.8467, + "step": 37970 + }, + { + "epoch": 0.97, + "learning_rate": 1.5788357006924132e-06, + "loss": 0.7686, + "step": 37971 + }, + { + "epoch": 0.97, + "learning_rate": 1.5788131367598796e-06, + "loss": 0.8662, + "step": 37972 + }, + { + "epoch": 0.97, + "learning_rate": 1.5787905723841755e-06, + "loss": 0.8408, + "step": 37973 + }, + { + "epoch": 0.97, + "learning_rate": 1.5787680075653177e-06, + "loss": 0.7524, + "step": 37974 + }, + { + "epoch": 0.97, + "learning_rate": 1.578745442303324e-06, + "loss": 0.877, + "step": 37975 + }, + { + "epoch": 0.97, + "learning_rate": 1.578722876598212e-06, + "loss": 0.8535, + "step": 37976 + }, + { + "epoch": 0.97, + "learning_rate": 1.578700310449998e-06, + "loss": 0.8623, + "step": 37977 + }, + { + "epoch": 0.97, + "learning_rate": 1.5786777438586998e-06, + "loss": 0.7051, + "step": 37978 + }, + { + "epoch": 0.97, + "learning_rate": 1.5786551768243348e-06, + "loss": 1.1504, + "step": 37979 + }, + { + "epoch": 0.97, + "learning_rate": 1.5786326093469202e-06, + "loss": 0.7715, + "step": 37980 + }, + { + "epoch": 0.97, + "learning_rate": 1.578610041426473e-06, + "loss": 0.9707, + "step": 37981 + }, + { + "epoch": 0.97, + "learning_rate": 1.5785874730630106e-06, + "loss": 0.957, + "step": 37982 + }, + { + "epoch": 0.97, + "learning_rate": 1.578564904256551e-06, + "loss": 0.9785, + "step": 37983 + }, + { + "epoch": 0.97, + "learning_rate": 1.5785423350071104e-06, + "loss": 0.623, + "step": 37984 + }, + { + "epoch": 0.97, + "learning_rate": 1.5785197653147064e-06, + "loss": 1.0781, + "step": 37985 + }, + { + "epoch": 0.97, + "learning_rate": 1.5784971951793566e-06, + "loss": 0.7056, + "step": 37986 + }, + { + "epoch": 0.97, + "learning_rate": 1.5784746246010782e-06, + "loss": 0.6624, + "step": 37987 + }, + { + "epoch": 0.97, + "learning_rate": 1.5784520535798881e-06, + "loss": 0.8916, + "step": 37988 + }, + { + "epoch": 0.97, + "learning_rate": 1.5784294821158042e-06, + "loss": 1.0273, + "step": 37989 + }, + { + "epoch": 0.97, + "learning_rate": 1.578406910208843e-06, + "loss": 1.0645, + "step": 37990 + }, + { + "epoch": 0.97, + "learning_rate": 1.5783843378590227e-06, + "loss": 0.8184, + "step": 37991 + }, + { + "epoch": 0.97, + "learning_rate": 1.5783617650663596e-06, + "loss": 0.8945, + "step": 37992 + }, + { + "epoch": 0.97, + "learning_rate": 1.5783391918308722e-06, + "loss": 0.4985, + "step": 37993 + }, + { + "epoch": 0.97, + "learning_rate": 1.5783166181525766e-06, + "loss": 0.9199, + "step": 37994 + }, + { + "epoch": 0.97, + "learning_rate": 1.5782940440314906e-06, + "loss": 0.7754, + "step": 37995 + }, + { + "epoch": 0.97, + "learning_rate": 1.5782714694676314e-06, + "loss": 1.1816, + "step": 37996 + }, + { + "epoch": 0.97, + "learning_rate": 1.5782488944610164e-06, + "loss": 0.7202, + "step": 37997 + }, + { + "epoch": 0.97, + "learning_rate": 1.5782263190116626e-06, + "loss": 0.9785, + "step": 37998 + }, + { + "epoch": 0.97, + "learning_rate": 1.5782037431195878e-06, + "loss": 0.7593, + "step": 37999 + }, + { + "epoch": 0.97, + "learning_rate": 1.578181166784809e-06, + "loss": 1.0527, + "step": 38000 + }, + { + "epoch": 0.97, + "learning_rate": 1.5781585900073433e-06, + "loss": 0.7051, + "step": 38001 + }, + { + "epoch": 0.97, + "learning_rate": 1.5781360127872082e-06, + "loss": 0.9062, + "step": 38002 + }, + { + "epoch": 0.97, + "learning_rate": 1.578113435124421e-06, + "loss": 0.8184, + "step": 38003 + }, + { + "epoch": 0.97, + "learning_rate": 1.578090857018999e-06, + "loss": 0.8645, + "step": 38004 + }, + { + "epoch": 0.97, + "learning_rate": 1.578068278470959e-06, + "loss": 0.8647, + "step": 38005 + }, + { + "epoch": 0.97, + "learning_rate": 1.5780456994803188e-06, + "loss": 0.9307, + "step": 38006 + }, + { + "epoch": 0.97, + "learning_rate": 1.5780231200470959e-06, + "loss": 0.7871, + "step": 38007 + }, + { + "epoch": 0.97, + "learning_rate": 1.5780005401713076e-06, + "loss": 0.9639, + "step": 38008 + }, + { + "epoch": 0.97, + "learning_rate": 1.5779779598529702e-06, + "loss": 0.8291, + "step": 38009 + }, + { + "epoch": 0.97, + "learning_rate": 1.577955379092102e-06, + "loss": 0.9697, + "step": 38010 + }, + { + "epoch": 0.97, + "learning_rate": 1.5779327978887195e-06, + "loss": 0.7549, + "step": 38011 + }, + { + "epoch": 0.97, + "learning_rate": 1.5779102162428405e-06, + "loss": 0.874, + "step": 38012 + }, + { + "epoch": 0.97, + "learning_rate": 1.5778876341544827e-06, + "loss": 0.634, + "step": 38013 + }, + { + "epoch": 0.97, + "learning_rate": 1.5778650516236627e-06, + "loss": 0.5605, + "step": 38014 + }, + { + "epoch": 0.97, + "learning_rate": 1.577842468650398e-06, + "loss": 0.8887, + "step": 38015 + }, + { + "epoch": 0.97, + "learning_rate": 1.5778198852347058e-06, + "loss": 0.9189, + "step": 38016 + }, + { + "epoch": 0.97, + "learning_rate": 1.5777973013766036e-06, + "loss": 0.8311, + "step": 38017 + }, + { + "epoch": 0.97, + "learning_rate": 1.5777747170761085e-06, + "loss": 0.7134, + "step": 38018 + }, + { + "epoch": 0.97, + "learning_rate": 1.5777521323332378e-06, + "loss": 0.9004, + "step": 38019 + }, + { + "epoch": 0.97, + "learning_rate": 1.5777295471480087e-06, + "loss": 0.6577, + "step": 38020 + }, + { + "epoch": 0.97, + "learning_rate": 1.577706961520439e-06, + "loss": 0.9854, + "step": 38021 + }, + { + "epoch": 0.97, + "learning_rate": 1.5776843754505454e-06, + "loss": 0.7275, + "step": 38022 + }, + { + "epoch": 0.97, + "learning_rate": 1.5776617889383457e-06, + "loss": 0.6338, + "step": 38023 + }, + { + "epoch": 0.97, + "learning_rate": 1.5776392019838567e-06, + "loss": 0.9316, + "step": 38024 + }, + { + "epoch": 0.97, + "learning_rate": 1.5776166145870962e-06, + "loss": 0.7637, + "step": 38025 + }, + { + "epoch": 0.97, + "learning_rate": 1.577594026748081e-06, + "loss": 0.8369, + "step": 38026 + }, + { + "epoch": 0.97, + "learning_rate": 1.5775714384668283e-06, + "loss": 0.9824, + "step": 38027 + }, + { + "epoch": 0.97, + "learning_rate": 1.5775488497433563e-06, + "loss": 0.6836, + "step": 38028 + }, + { + "epoch": 0.97, + "learning_rate": 1.5775262605776815e-06, + "loss": 0.9824, + "step": 38029 + }, + { + "epoch": 0.97, + "learning_rate": 1.5775036709698213e-06, + "loss": 0.8604, + "step": 38030 + }, + { + "epoch": 0.97, + "learning_rate": 1.5774810809197932e-06, + "loss": 0.7998, + "step": 38031 + }, + { + "epoch": 0.97, + "learning_rate": 1.5774584904276141e-06, + "loss": 0.8965, + "step": 38032 + }, + { + "epoch": 0.97, + "learning_rate": 1.5774358994933018e-06, + "loss": 0.6987, + "step": 38033 + }, + { + "epoch": 0.97, + "learning_rate": 1.5774133081168737e-06, + "loss": 0.6963, + "step": 38034 + }, + { + "epoch": 0.97, + "learning_rate": 1.577390716298346e-06, + "loss": 0.7129, + "step": 38035 + }, + { + "epoch": 0.97, + "learning_rate": 1.5773681240377378e-06, + "loss": 0.752, + "step": 38036 + }, + { + "epoch": 0.97, + "learning_rate": 1.5773455313350644e-06, + "loss": 0.8911, + "step": 38037 + }, + { + "epoch": 0.97, + "learning_rate": 1.5773229381903447e-06, + "loss": 1.04, + "step": 38038 + }, + { + "epoch": 0.97, + "learning_rate": 1.5773003446035951e-06, + "loss": 0.7402, + "step": 38039 + }, + { + "epoch": 0.97, + "learning_rate": 1.5772777505748333e-06, + "loss": 0.8857, + "step": 38040 + }, + { + "epoch": 0.98, + "learning_rate": 1.5772551561040763e-06, + "loss": 0.6836, + "step": 38041 + }, + { + "epoch": 0.98, + "learning_rate": 1.5772325611913417e-06, + "loss": 0.957, + "step": 38042 + }, + { + "epoch": 0.98, + "learning_rate": 1.5772099658366468e-06, + "loss": 1.0156, + "step": 38043 + }, + { + "epoch": 0.98, + "learning_rate": 1.5771873700400086e-06, + "loss": 0.7383, + "step": 38044 + }, + { + "epoch": 0.98, + "learning_rate": 1.5771647738014445e-06, + "loss": 0.7935, + "step": 38045 + }, + { + "epoch": 0.98, + "learning_rate": 1.5771421771209719e-06, + "loss": 0.7656, + "step": 38046 + }, + { + "epoch": 0.98, + "learning_rate": 1.5771195799986083e-06, + "loss": 0.9277, + "step": 38047 + }, + { + "epoch": 0.98, + "learning_rate": 1.5770969824343707e-06, + "loss": 0.9468, + "step": 38048 + }, + { + "epoch": 0.98, + "learning_rate": 1.5770743844282763e-06, + "loss": 0.8779, + "step": 38049 + }, + { + "epoch": 0.98, + "learning_rate": 1.5770517859803428e-06, + "loss": 0.6479, + "step": 38050 + }, + { + "epoch": 0.98, + "learning_rate": 1.577029187090587e-06, + "loss": 0.8184, + "step": 38051 + }, + { + "epoch": 0.98, + "learning_rate": 1.5770065877590266e-06, + "loss": 0.8574, + "step": 38052 + }, + { + "epoch": 0.98, + "learning_rate": 1.576983987985679e-06, + "loss": 0.9375, + "step": 38053 + }, + { + "epoch": 0.98, + "learning_rate": 1.5769613877705612e-06, + "loss": 0.8564, + "step": 38054 + }, + { + "epoch": 0.98, + "learning_rate": 1.5769387871136903e-06, + "loss": 0.7363, + "step": 38055 + }, + { + "epoch": 0.98, + "learning_rate": 1.5769161860150841e-06, + "loss": 0.9648, + "step": 38056 + }, + { + "epoch": 0.98, + "learning_rate": 1.5768935844747598e-06, + "loss": 0.8906, + "step": 38057 + }, + { + "epoch": 0.98, + "learning_rate": 1.5768709824927346e-06, + "loss": 0.7236, + "step": 38058 + }, + { + "epoch": 0.98, + "learning_rate": 1.5768483800690256e-06, + "loss": 0.7856, + "step": 38059 + }, + { + "epoch": 0.98, + "learning_rate": 1.5768257772036505e-06, + "loss": 0.9082, + "step": 38060 + }, + { + "epoch": 0.98, + "learning_rate": 1.5768031738966264e-06, + "loss": 0.8242, + "step": 38061 + }, + { + "epoch": 0.98, + "learning_rate": 1.5767805701479704e-06, + "loss": 0.5286, + "step": 38062 + }, + { + "epoch": 0.98, + "learning_rate": 1.5767579659577003e-06, + "loss": 0.7817, + "step": 38063 + }, + { + "epoch": 0.98, + "learning_rate": 1.5767353613258332e-06, + "loss": 0.8091, + "step": 38064 + }, + { + "epoch": 0.98, + "learning_rate": 1.5767127562523864e-06, + "loss": 0.8467, + "step": 38065 + }, + { + "epoch": 0.98, + "learning_rate": 1.5766901507373768e-06, + "loss": 0.792, + "step": 38066 + }, + { + "epoch": 0.98, + "learning_rate": 1.5766675447808222e-06, + "loss": 0.6138, + "step": 38067 + }, + { + "epoch": 0.98, + "learning_rate": 1.5766449383827401e-06, + "loss": 0.5945, + "step": 38068 + }, + { + "epoch": 0.98, + "learning_rate": 1.576622331543147e-06, + "loss": 0.6875, + "step": 38069 + }, + { + "epoch": 0.98, + "learning_rate": 1.576599724262061e-06, + "loss": 1.04, + "step": 38070 + }, + { + "epoch": 0.98, + "learning_rate": 1.576577116539499e-06, + "loss": 0.9346, + "step": 38071 + }, + { + "epoch": 0.98, + "learning_rate": 1.5765545083754783e-06, + "loss": 0.8184, + "step": 38072 + }, + { + "epoch": 0.98, + "learning_rate": 1.5765318997700167e-06, + "loss": 0.5208, + "step": 38073 + }, + { + "epoch": 0.98, + "learning_rate": 1.576509290723131e-06, + "loss": 0.8555, + "step": 38074 + }, + { + "epoch": 0.98, + "learning_rate": 1.5764866812348383e-06, + "loss": 0.6509, + "step": 38075 + }, + { + "epoch": 0.98, + "learning_rate": 1.5764640713051564e-06, + "loss": 0.8242, + "step": 38076 + }, + { + "epoch": 0.98, + "learning_rate": 1.5764414609341027e-06, + "loss": 0.959, + "step": 38077 + }, + { + "epoch": 0.98, + "learning_rate": 1.5764188501216943e-06, + "loss": 0.9062, + "step": 38078 + }, + { + "epoch": 0.98, + "learning_rate": 1.5763962388679483e-06, + "loss": 1.1338, + "step": 38079 + }, + { + "epoch": 0.98, + "learning_rate": 1.5763736271728822e-06, + "loss": 0.8721, + "step": 38080 + }, + { + "epoch": 0.98, + "learning_rate": 1.5763510150365136e-06, + "loss": 0.8457, + "step": 38081 + }, + { + "epoch": 0.98, + "learning_rate": 1.5763284024588593e-06, + "loss": 0.9717, + "step": 38082 + }, + { + "epoch": 0.98, + "learning_rate": 1.5763057894399368e-06, + "loss": 0.707, + "step": 38083 + }, + { + "epoch": 0.98, + "learning_rate": 1.5762831759797635e-06, + "loss": 0.6724, + "step": 38084 + }, + { + "epoch": 0.98, + "learning_rate": 1.5762605620783566e-06, + "loss": 1.001, + "step": 38085 + }, + { + "epoch": 0.98, + "learning_rate": 1.5762379477357334e-06, + "loss": 0.7305, + "step": 38086 + }, + { + "epoch": 0.98, + "learning_rate": 1.5762153329519115e-06, + "loss": 0.9082, + "step": 38087 + }, + { + "epoch": 0.98, + "learning_rate": 1.5761927177269078e-06, + "loss": 0.8604, + "step": 38088 + }, + { + "epoch": 0.98, + "learning_rate": 1.5761701020607401e-06, + "loss": 0.6562, + "step": 38089 + }, + { + "epoch": 0.98, + "learning_rate": 1.5761474859534254e-06, + "loss": 0.7021, + "step": 38090 + }, + { + "epoch": 0.98, + "learning_rate": 1.576124869404981e-06, + "loss": 0.8115, + "step": 38091 + }, + { + "epoch": 0.98, + "learning_rate": 1.576102252415424e-06, + "loss": 0.9863, + "step": 38092 + }, + { + "epoch": 0.98, + "learning_rate": 1.5760796349847726e-06, + "loss": 0.8506, + "step": 38093 + }, + { + "epoch": 0.98, + "learning_rate": 1.5760570171130432e-06, + "loss": 1.0623, + "step": 38094 + }, + { + "epoch": 0.98, + "learning_rate": 1.5760343988002533e-06, + "loss": 0.957, + "step": 38095 + }, + { + "epoch": 0.98, + "learning_rate": 1.5760117800464206e-06, + "loss": 0.7832, + "step": 38096 + }, + { + "epoch": 0.98, + "learning_rate": 1.575989160851562e-06, + "loss": 0.9922, + "step": 38097 + }, + { + "epoch": 0.98, + "learning_rate": 1.5759665412156951e-06, + "loss": 0.7578, + "step": 38098 + }, + { + "epoch": 0.98, + "learning_rate": 1.5759439211388367e-06, + "loss": 0.9111, + "step": 38099 + }, + { + "epoch": 0.98, + "learning_rate": 1.575921300621005e-06, + "loss": 0.7881, + "step": 38100 + }, + { + "epoch": 0.98, + "learning_rate": 1.5758986796622167e-06, + "loss": 0.9531, + "step": 38101 + }, + { + "epoch": 0.98, + "learning_rate": 1.575876058262489e-06, + "loss": 0.6968, + "step": 38102 + }, + { + "epoch": 0.98, + "learning_rate": 1.57585343642184e-06, + "loss": 0.916, + "step": 38103 + }, + { + "epoch": 0.98, + "learning_rate": 1.5758308141402862e-06, + "loss": 0.7783, + "step": 38104 + }, + { + "epoch": 0.98, + "learning_rate": 1.5758081914178454e-06, + "loss": 0.915, + "step": 38105 + }, + { + "epoch": 0.98, + "learning_rate": 1.5757855682545344e-06, + "loss": 0.9609, + "step": 38106 + }, + { + "epoch": 0.98, + "learning_rate": 1.575762944650371e-06, + "loss": 1.0146, + "step": 38107 + }, + { + "epoch": 0.98, + "learning_rate": 1.5757403206053725e-06, + "loss": 0.7324, + "step": 38108 + }, + { + "epoch": 0.98, + "learning_rate": 1.5757176961195562e-06, + "loss": 0.8574, + "step": 38109 + }, + { + "epoch": 0.98, + "learning_rate": 1.575695071192939e-06, + "loss": 1.1904, + "step": 38110 + }, + { + "epoch": 0.98, + "learning_rate": 1.5756724458255387e-06, + "loss": 0.9482, + "step": 38111 + }, + { + "epoch": 0.98, + "learning_rate": 1.5756498200173727e-06, + "loss": 0.7588, + "step": 38112 + }, + { + "epoch": 0.98, + "learning_rate": 1.575627193768458e-06, + "loss": 0.9854, + "step": 38113 + }, + { + "epoch": 0.98, + "learning_rate": 1.575604567078812e-06, + "loss": 0.9619, + "step": 38114 + }, + { + "epoch": 0.98, + "learning_rate": 1.5755819399484518e-06, + "loss": 0.9082, + "step": 38115 + }, + { + "epoch": 0.98, + "learning_rate": 1.5755593123773951e-06, + "loss": 0.8809, + "step": 38116 + }, + { + "epoch": 0.98, + "learning_rate": 1.5755366843656593e-06, + "loss": 1.0283, + "step": 38117 + }, + { + "epoch": 0.98, + "learning_rate": 1.5755140559132617e-06, + "loss": 0.7173, + "step": 38118 + }, + { + "epoch": 0.98, + "learning_rate": 1.5754914270202188e-06, + "loss": 0.6445, + "step": 38119 + }, + { + "epoch": 0.98, + "learning_rate": 1.575468797686549e-06, + "loss": 0.6992, + "step": 38120 + }, + { + "epoch": 0.98, + "learning_rate": 1.575446167912269e-06, + "loss": 0.8018, + "step": 38121 + }, + { + "epoch": 0.98, + "learning_rate": 1.5754235376973965e-06, + "loss": 0.7393, + "step": 38122 + }, + { + "epoch": 0.98, + "learning_rate": 1.5754009070419487e-06, + "loss": 0.7607, + "step": 38123 + }, + { + "epoch": 0.98, + "learning_rate": 1.5753782759459427e-06, + "loss": 0.7832, + "step": 38124 + }, + { + "epoch": 0.98, + "learning_rate": 1.575355644409396e-06, + "loss": 0.8003, + "step": 38125 + }, + { + "epoch": 0.98, + "learning_rate": 1.5753330124323263e-06, + "loss": 0.7339, + "step": 38126 + }, + { + "epoch": 0.98, + "learning_rate": 1.5753103800147502e-06, + "loss": 0.6381, + "step": 38127 + }, + { + "epoch": 0.98, + "learning_rate": 1.5752877471566857e-06, + "loss": 0.7666, + "step": 38128 + }, + { + "epoch": 0.98, + "learning_rate": 1.5752651138581494e-06, + "loss": 0.6357, + "step": 38129 + }, + { + "epoch": 0.98, + "learning_rate": 1.5752424801191592e-06, + "loss": 0.8164, + "step": 38130 + }, + { + "epoch": 0.98, + "learning_rate": 1.5752198459397325e-06, + "loss": 0.8096, + "step": 38131 + }, + { + "epoch": 0.98, + "learning_rate": 1.5751972113198861e-06, + "loss": 0.7939, + "step": 38132 + }, + { + "epoch": 0.98, + "learning_rate": 1.5751745762596381e-06, + "loss": 0.8877, + "step": 38133 + }, + { + "epoch": 0.98, + "learning_rate": 1.575151940759005e-06, + "loss": 0.9297, + "step": 38134 + }, + { + "epoch": 0.98, + "learning_rate": 1.5751293048180045e-06, + "loss": 0.8091, + "step": 38135 + }, + { + "epoch": 0.98, + "learning_rate": 1.5751066684366542e-06, + "loss": 0.6289, + "step": 38136 + }, + { + "epoch": 0.98, + "learning_rate": 1.5750840316149709e-06, + "loss": 0.6936, + "step": 38137 + }, + { + "epoch": 0.98, + "learning_rate": 1.5750613943529723e-06, + "loss": 0.8262, + "step": 38138 + }, + { + "epoch": 0.98, + "learning_rate": 1.5750387566506758e-06, + "loss": 0.9717, + "step": 38139 + }, + { + "epoch": 0.98, + "learning_rate": 1.5750161185080982e-06, + "loss": 0.6611, + "step": 38140 + }, + { + "epoch": 0.98, + "learning_rate": 1.5749934799252574e-06, + "loss": 0.73, + "step": 38141 + }, + { + "epoch": 0.98, + "learning_rate": 1.5749708409021704e-06, + "loss": 0.6538, + "step": 38142 + }, + { + "epoch": 0.98, + "learning_rate": 1.5749482014388552e-06, + "loss": 0.5938, + "step": 38143 + }, + { + "epoch": 0.98, + "learning_rate": 1.574925561535328e-06, + "loss": 0.7725, + "step": 38144 + }, + { + "epoch": 0.98, + "learning_rate": 1.574902921191607e-06, + "loss": 0.9121, + "step": 38145 + }, + { + "epoch": 0.98, + "learning_rate": 1.5748802804077093e-06, + "loss": 0.8779, + "step": 38146 + }, + { + "epoch": 0.98, + "learning_rate": 1.574857639183652e-06, + "loss": 0.7617, + "step": 38147 + }, + { + "epoch": 0.98, + "learning_rate": 1.5748349975194529e-06, + "loss": 0.9043, + "step": 38148 + }, + { + "epoch": 0.98, + "learning_rate": 1.574812355415129e-06, + "loss": 0.8291, + "step": 38149 + }, + { + "epoch": 0.98, + "learning_rate": 1.5747897128706975e-06, + "loss": 0.8145, + "step": 38150 + }, + { + "epoch": 0.98, + "learning_rate": 1.5747670698861758e-06, + "loss": 0.8027, + "step": 38151 + }, + { + "epoch": 0.98, + "learning_rate": 1.5747444264615819e-06, + "loss": 0.6875, + "step": 38152 + }, + { + "epoch": 0.98, + "learning_rate": 1.5747217825969322e-06, + "loss": 0.7749, + "step": 38153 + }, + { + "epoch": 0.98, + "learning_rate": 1.5746991382922446e-06, + "loss": 0.9678, + "step": 38154 + }, + { + "epoch": 0.98, + "learning_rate": 1.5746764935475366e-06, + "loss": 0.8198, + "step": 38155 + }, + { + "epoch": 0.98, + "learning_rate": 1.5746538483628249e-06, + "loss": 0.8066, + "step": 38156 + }, + { + "epoch": 0.98, + "learning_rate": 1.5746312027381272e-06, + "loss": 0.7705, + "step": 38157 + }, + { + "epoch": 0.98, + "learning_rate": 1.574608556673461e-06, + "loss": 0.6714, + "step": 38158 + }, + { + "epoch": 0.98, + "learning_rate": 1.574585910168843e-06, + "loss": 1.0557, + "step": 38159 + }, + { + "epoch": 0.98, + "learning_rate": 1.5745632632242913e-06, + "loss": 0.8662, + "step": 38160 + }, + { + "epoch": 0.98, + "learning_rate": 1.574540615839823e-06, + "loss": 0.8779, + "step": 38161 + }, + { + "epoch": 0.98, + "learning_rate": 1.574517968015455e-06, + "loss": 0.8379, + "step": 38162 + }, + { + "epoch": 0.98, + "learning_rate": 1.5744953197512056e-06, + "loss": 0.8965, + "step": 38163 + }, + { + "epoch": 0.98, + "learning_rate": 1.5744726710470912e-06, + "loss": 0.9824, + "step": 38164 + }, + { + "epoch": 0.98, + "learning_rate": 1.5744500219031296e-06, + "loss": 0.9453, + "step": 38165 + }, + { + "epoch": 0.98, + "learning_rate": 1.5744273723193377e-06, + "loss": 0.873, + "step": 38166 + }, + { + "epoch": 0.98, + "learning_rate": 1.5744047222957336e-06, + "loss": 1.043, + "step": 38167 + }, + { + "epoch": 0.98, + "learning_rate": 1.5743820718323342e-06, + "loss": 1.1006, + "step": 38168 + }, + { + "epoch": 0.98, + "learning_rate": 1.5743594209291567e-06, + "loss": 0.8613, + "step": 38169 + }, + { + "epoch": 0.98, + "learning_rate": 1.5743367695862184e-06, + "loss": 0.7812, + "step": 38170 + }, + { + "epoch": 0.98, + "learning_rate": 1.5743141178035371e-06, + "loss": 0.918, + "step": 38171 + }, + { + "epoch": 0.98, + "learning_rate": 1.5742914655811298e-06, + "loss": 0.7676, + "step": 38172 + }, + { + "epoch": 0.98, + "learning_rate": 1.574268812919014e-06, + "loss": 0.8501, + "step": 38173 + }, + { + "epoch": 0.98, + "learning_rate": 1.574246159817207e-06, + "loss": 0.7375, + "step": 38174 + }, + { + "epoch": 0.98, + "learning_rate": 1.574223506275726e-06, + "loss": 0.5551, + "step": 38175 + }, + { + "epoch": 0.98, + "learning_rate": 1.5742008522945883e-06, + "loss": 0.9209, + "step": 38176 + }, + { + "epoch": 0.98, + "learning_rate": 1.5741781978738118e-06, + "loss": 0.8296, + "step": 38177 + }, + { + "epoch": 0.98, + "learning_rate": 1.5741555430134135e-06, + "loss": 0.9219, + "step": 38178 + }, + { + "epoch": 0.98, + "learning_rate": 1.5741328877134104e-06, + "loss": 0.7979, + "step": 38179 + }, + { + "epoch": 0.98, + "learning_rate": 1.5741102319738203e-06, + "loss": 0.5811, + "step": 38180 + }, + { + "epoch": 0.98, + "learning_rate": 1.5740875757946603e-06, + "loss": 0.8057, + "step": 38181 + }, + { + "epoch": 0.98, + "learning_rate": 1.5740649191759476e-06, + "loss": 0.8008, + "step": 38182 + }, + { + "epoch": 0.98, + "learning_rate": 1.5740422621177004e-06, + "loss": 1.0225, + "step": 38183 + }, + { + "epoch": 0.98, + "learning_rate": 1.574019604619935e-06, + "loss": 0.71, + "step": 38184 + }, + { + "epoch": 0.98, + "learning_rate": 1.5739969466826692e-06, + "loss": 0.8608, + "step": 38185 + }, + { + "epoch": 0.98, + "learning_rate": 1.5739742883059206e-06, + "loss": 0.8154, + "step": 38186 + }, + { + "epoch": 0.98, + "learning_rate": 1.573951629489706e-06, + "loss": 0.9062, + "step": 38187 + }, + { + "epoch": 0.98, + "learning_rate": 1.5739289702340432e-06, + "loss": 0.7812, + "step": 38188 + }, + { + "epoch": 0.98, + "learning_rate": 1.5739063105389492e-06, + "loss": 0.833, + "step": 38189 + }, + { + "epoch": 0.98, + "learning_rate": 1.5738836504044418e-06, + "loss": 0.9707, + "step": 38190 + }, + { + "epoch": 0.98, + "learning_rate": 1.5738609898305377e-06, + "loss": 0.9219, + "step": 38191 + }, + { + "epoch": 0.98, + "learning_rate": 1.573838328817255e-06, + "loss": 0.874, + "step": 38192 + }, + { + "epoch": 0.98, + "learning_rate": 1.5738156673646103e-06, + "loss": 0.8262, + "step": 38193 + }, + { + "epoch": 0.98, + "learning_rate": 1.5737930054726215e-06, + "loss": 0.8447, + "step": 38194 + }, + { + "epoch": 0.98, + "learning_rate": 1.573770343141306e-06, + "loss": 0.6987, + "step": 38195 + }, + { + "epoch": 0.98, + "learning_rate": 1.5737476803706807e-06, + "loss": 1.0078, + "step": 38196 + }, + { + "epoch": 0.98, + "learning_rate": 1.5737250171607631e-06, + "loss": 0.998, + "step": 38197 + }, + { + "epoch": 0.98, + "learning_rate": 1.573702353511571e-06, + "loss": 0.7588, + "step": 38198 + }, + { + "epoch": 0.98, + "learning_rate": 1.573679689423121e-06, + "loss": 0.9219, + "step": 38199 + }, + { + "epoch": 0.98, + "learning_rate": 1.5736570248954312e-06, + "loss": 0.7739, + "step": 38200 + }, + { + "epoch": 0.98, + "learning_rate": 1.5736343599285182e-06, + "loss": 0.7881, + "step": 38201 + }, + { + "epoch": 0.98, + "learning_rate": 1.5736116945224e-06, + "loss": 0.8926, + "step": 38202 + }, + { + "epoch": 0.98, + "learning_rate": 1.5735890286770936e-06, + "loss": 0.8789, + "step": 38203 + }, + { + "epoch": 0.98, + "learning_rate": 1.5735663623926165e-06, + "loss": 1.123, + "step": 38204 + }, + { + "epoch": 0.98, + "learning_rate": 1.5735436956689858e-06, + "loss": 0.7764, + "step": 38205 + }, + { + "epoch": 0.98, + "learning_rate": 1.5735210285062194e-06, + "loss": 0.959, + "step": 38206 + }, + { + "epoch": 0.98, + "learning_rate": 1.5734983609043341e-06, + "loss": 0.7539, + "step": 38207 + }, + { + "epoch": 0.98, + "learning_rate": 1.5734756928633476e-06, + "loss": 0.5684, + "step": 38208 + }, + { + "epoch": 0.98, + "learning_rate": 1.5734530243832772e-06, + "loss": 0.8362, + "step": 38209 + }, + { + "epoch": 0.98, + "learning_rate": 1.57343035546414e-06, + "loss": 0.9053, + "step": 38210 + }, + { + "epoch": 0.98, + "learning_rate": 1.5734076861059538e-06, + "loss": 0.8086, + "step": 38211 + }, + { + "epoch": 0.98, + "learning_rate": 1.5733850163087352e-06, + "loss": 0.7712, + "step": 38212 + }, + { + "epoch": 0.98, + "learning_rate": 1.5733623460725025e-06, + "loss": 0.7217, + "step": 38213 + }, + { + "epoch": 0.98, + "learning_rate": 1.5733396753972725e-06, + "loss": 0.7058, + "step": 38214 + }, + { + "epoch": 0.98, + "learning_rate": 1.5733170042830628e-06, + "loss": 0.9385, + "step": 38215 + }, + { + "epoch": 0.98, + "learning_rate": 1.5732943327298904e-06, + "loss": 0.8208, + "step": 38216 + }, + { + "epoch": 0.98, + "learning_rate": 1.573271660737773e-06, + "loss": 0.9004, + "step": 38217 + }, + { + "epoch": 0.98, + "learning_rate": 1.5732489883067279e-06, + "loss": 1.001, + "step": 38218 + }, + { + "epoch": 0.98, + "learning_rate": 1.5732263154367724e-06, + "loss": 0.7598, + "step": 38219 + }, + { + "epoch": 0.98, + "learning_rate": 1.5732036421279237e-06, + "loss": 0.7754, + "step": 38220 + }, + { + "epoch": 0.98, + "learning_rate": 1.5731809683801994e-06, + "loss": 0.9287, + "step": 38221 + }, + { + "epoch": 0.98, + "learning_rate": 1.5731582941936168e-06, + "loss": 0.8682, + "step": 38222 + }, + { + "epoch": 0.98, + "learning_rate": 1.5731356195681933e-06, + "loss": 0.9248, + "step": 38223 + }, + { + "epoch": 0.98, + "learning_rate": 1.5731129445039462e-06, + "loss": 1.0645, + "step": 38224 + }, + { + "epoch": 0.98, + "learning_rate": 1.573090269000893e-06, + "loss": 0.9355, + "step": 38225 + }, + { + "epoch": 0.98, + "learning_rate": 1.5730675930590506e-06, + "loss": 0.9434, + "step": 38226 + }, + { + "epoch": 0.98, + "learning_rate": 1.573044916678437e-06, + "loss": 0.6611, + "step": 38227 + }, + { + "epoch": 0.98, + "learning_rate": 1.5730222398590694e-06, + "loss": 0.7656, + "step": 38228 + }, + { + "epoch": 0.98, + "learning_rate": 1.5729995626009647e-06, + "loss": 0.957, + "step": 38229 + }, + { + "epoch": 0.98, + "learning_rate": 1.5729768849041406e-06, + "loss": 0.8379, + "step": 38230 + }, + { + "epoch": 0.98, + "learning_rate": 1.5729542067686143e-06, + "loss": 0.9258, + "step": 38231 + }, + { + "epoch": 0.98, + "learning_rate": 1.5729315281944034e-06, + "loss": 0.8818, + "step": 38232 + }, + { + "epoch": 0.98, + "learning_rate": 1.5729088491815255e-06, + "loss": 1.0537, + "step": 38233 + }, + { + "epoch": 0.98, + "learning_rate": 1.5728861697299975e-06, + "loss": 1.0176, + "step": 38234 + }, + { + "epoch": 0.98, + "learning_rate": 1.5728634898398366e-06, + "loss": 0.6978, + "step": 38235 + }, + { + "epoch": 0.98, + "learning_rate": 1.5728408095110606e-06, + "loss": 0.8105, + "step": 38236 + }, + { + "epoch": 0.98, + "learning_rate": 1.572818128743687e-06, + "loss": 0.9424, + "step": 38237 + }, + { + "epoch": 0.98, + "learning_rate": 1.5727954475377328e-06, + "loss": 0.8896, + "step": 38238 + }, + { + "epoch": 0.98, + "learning_rate": 1.5727727658932153e-06, + "loss": 0.7793, + "step": 38239 + }, + { + "epoch": 0.98, + "learning_rate": 1.5727500838101522e-06, + "loss": 1.0332, + "step": 38240 + }, + { + "epoch": 0.98, + "learning_rate": 1.5727274012885606e-06, + "loss": 0.8223, + "step": 38241 + }, + { + "epoch": 0.98, + "learning_rate": 1.572704718328458e-06, + "loss": 0.9746, + "step": 38242 + }, + { + "epoch": 0.98, + "learning_rate": 1.5726820349298616e-06, + "loss": 0.6729, + "step": 38243 + }, + { + "epoch": 0.98, + "learning_rate": 1.5726593510927889e-06, + "loss": 0.8271, + "step": 38244 + }, + { + "epoch": 0.98, + "learning_rate": 1.5726366668172574e-06, + "loss": 0.8091, + "step": 38245 + }, + { + "epoch": 0.98, + "learning_rate": 1.5726139821032841e-06, + "loss": 0.875, + "step": 38246 + }, + { + "epoch": 0.98, + "learning_rate": 1.572591296950887e-06, + "loss": 0.9736, + "step": 38247 + }, + { + "epoch": 0.98, + "learning_rate": 1.572568611360083e-06, + "loss": 0.8271, + "step": 38248 + }, + { + "epoch": 0.98, + "learning_rate": 1.5725459253308892e-06, + "loss": 0.8242, + "step": 38249 + }, + { + "epoch": 0.98, + "learning_rate": 1.5725232388633235e-06, + "loss": 0.8662, + "step": 38250 + }, + { + "epoch": 0.98, + "learning_rate": 1.572500551957403e-06, + "loss": 0.7988, + "step": 38251 + }, + { + "epoch": 0.98, + "learning_rate": 1.5724778646131453e-06, + "loss": 0.9863, + "step": 38252 + }, + { + "epoch": 0.98, + "learning_rate": 1.5724551768305677e-06, + "loss": 1.0166, + "step": 38253 + }, + { + "epoch": 0.98, + "learning_rate": 1.5724324886096874e-06, + "loss": 0.7153, + "step": 38254 + }, + { + "epoch": 0.98, + "learning_rate": 1.5724097999505218e-06, + "loss": 0.6957, + "step": 38255 + }, + { + "epoch": 0.98, + "learning_rate": 1.5723871108530884e-06, + "loss": 0.5254, + "step": 38256 + }, + { + "epoch": 0.98, + "learning_rate": 1.5723644213174046e-06, + "loss": 0.9502, + "step": 38257 + }, + { + "epoch": 0.98, + "learning_rate": 1.5723417313434874e-06, + "loss": 1.0957, + "step": 38258 + }, + { + "epoch": 0.98, + "learning_rate": 1.5723190409313547e-06, + "loss": 1.1123, + "step": 38259 + }, + { + "epoch": 0.98, + "learning_rate": 1.5722963500810234e-06, + "loss": 0.8545, + "step": 38260 + }, + { + "epoch": 0.98, + "learning_rate": 1.5722736587925113e-06, + "loss": 1.0264, + "step": 38261 + }, + { + "epoch": 0.98, + "learning_rate": 1.5722509670658357e-06, + "loss": 0.9785, + "step": 38262 + }, + { + "epoch": 0.98, + "learning_rate": 1.5722282749010133e-06, + "loss": 0.6809, + "step": 38263 + }, + { + "epoch": 0.98, + "learning_rate": 1.5722055822980625e-06, + "loss": 0.6904, + "step": 38264 + }, + { + "epoch": 0.98, + "learning_rate": 1.5721828892570002e-06, + "loss": 0.7529, + "step": 38265 + }, + { + "epoch": 0.98, + "learning_rate": 1.5721601957778434e-06, + "loss": 1.0059, + "step": 38266 + }, + { + "epoch": 0.98, + "learning_rate": 1.5721375018606104e-06, + "loss": 0.8291, + "step": 38267 + }, + { + "epoch": 0.98, + "learning_rate": 1.5721148075053176e-06, + "loss": 0.835, + "step": 38268 + }, + { + "epoch": 0.98, + "learning_rate": 1.5720921127119828e-06, + "loss": 0.7852, + "step": 38269 + }, + { + "epoch": 0.98, + "learning_rate": 1.5720694174806235e-06, + "loss": 0.7812, + "step": 38270 + }, + { + "epoch": 0.98, + "learning_rate": 1.572046721811257e-06, + "loss": 0.7041, + "step": 38271 + }, + { + "epoch": 0.98, + "learning_rate": 1.5720240257039006e-06, + "loss": 0.8555, + "step": 38272 + }, + { + "epoch": 0.98, + "learning_rate": 1.5720013291585716e-06, + "loss": 0.5342, + "step": 38273 + }, + { + "epoch": 0.98, + "learning_rate": 1.5719786321752877e-06, + "loss": 0.8838, + "step": 38274 + }, + { + "epoch": 0.98, + "learning_rate": 1.5719559347540658e-06, + "loss": 0.832, + "step": 38275 + }, + { + "epoch": 0.98, + "learning_rate": 1.5719332368949236e-06, + "loss": 0.5132, + "step": 38276 + }, + { + "epoch": 0.98, + "learning_rate": 1.5719105385978787e-06, + "loss": 0.6411, + "step": 38277 + }, + { + "epoch": 0.98, + "learning_rate": 1.5718878398629478e-06, + "loss": 0.7764, + "step": 38278 + }, + { + "epoch": 0.98, + "learning_rate": 1.571865140690149e-06, + "loss": 0.8223, + "step": 38279 + }, + { + "epoch": 0.98, + "learning_rate": 1.5718424410794992e-06, + "loss": 0.9131, + "step": 38280 + }, + { + "epoch": 0.98, + "learning_rate": 1.5718197410310159e-06, + "loss": 0.7734, + "step": 38281 + }, + { + "epoch": 0.98, + "learning_rate": 1.5717970405447165e-06, + "loss": 0.6001, + "step": 38282 + }, + { + "epoch": 0.98, + "learning_rate": 1.5717743396206186e-06, + "loss": 0.9551, + "step": 38283 + }, + { + "epoch": 0.98, + "learning_rate": 1.5717516382587392e-06, + "loss": 1.166, + "step": 38284 + }, + { + "epoch": 0.98, + "learning_rate": 1.5717289364590957e-06, + "loss": 0.7588, + "step": 38285 + }, + { + "epoch": 0.98, + "learning_rate": 1.571706234221706e-06, + "loss": 0.96, + "step": 38286 + }, + { + "epoch": 0.98, + "learning_rate": 1.571683531546587e-06, + "loss": 0.8296, + "step": 38287 + }, + { + "epoch": 0.98, + "learning_rate": 1.5716608284337562e-06, + "loss": 0.8105, + "step": 38288 + }, + { + "epoch": 0.98, + "learning_rate": 1.5716381248832308e-06, + "loss": 0.7656, + "step": 38289 + }, + { + "epoch": 0.98, + "learning_rate": 1.5716154208950287e-06, + "loss": 1.0039, + "step": 38290 + }, + { + "epoch": 0.98, + "learning_rate": 1.5715927164691668e-06, + "loss": 0.7861, + "step": 38291 + }, + { + "epoch": 0.98, + "learning_rate": 1.5715700116056627e-06, + "loss": 0.6968, + "step": 38292 + }, + { + "epoch": 0.98, + "learning_rate": 1.5715473063045335e-06, + "loss": 1.0586, + "step": 38293 + }, + { + "epoch": 0.98, + "learning_rate": 1.5715246005657972e-06, + "loss": 0.624, + "step": 38294 + }, + { + "epoch": 0.98, + "learning_rate": 1.5715018943894704e-06, + "loss": 0.8286, + "step": 38295 + }, + { + "epoch": 0.98, + "learning_rate": 1.571479187775571e-06, + "loss": 0.8296, + "step": 38296 + }, + { + "epoch": 0.98, + "learning_rate": 1.5714564807241164e-06, + "loss": 0.6782, + "step": 38297 + }, + { + "epoch": 0.98, + "learning_rate": 1.5714337732351238e-06, + "loss": 0.8896, + "step": 38298 + }, + { + "epoch": 0.98, + "learning_rate": 1.5714110653086104e-06, + "loss": 0.7617, + "step": 38299 + }, + { + "epoch": 0.98, + "learning_rate": 1.571388356944594e-06, + "loss": 0.9727, + "step": 38300 + }, + { + "epoch": 0.98, + "learning_rate": 1.5713656481430916e-06, + "loss": 0.8799, + "step": 38301 + }, + { + "epoch": 0.98, + "learning_rate": 1.5713429389041215e-06, + "loss": 1.0117, + "step": 38302 + }, + { + "epoch": 0.98, + "learning_rate": 1.5713202292276997e-06, + "loss": 1.0713, + "step": 38303 + }, + { + "epoch": 0.98, + "learning_rate": 1.5712975191138445e-06, + "loss": 0.834, + "step": 38304 + }, + { + "epoch": 0.98, + "learning_rate": 1.571274808562573e-06, + "loss": 0.7949, + "step": 38305 + }, + { + "epoch": 0.98, + "learning_rate": 1.5712520975739026e-06, + "loss": 0.5737, + "step": 38306 + }, + { + "epoch": 0.98, + "learning_rate": 1.5712293861478506e-06, + "loss": 0.8936, + "step": 38307 + }, + { + "epoch": 0.98, + "learning_rate": 1.5712066742844349e-06, + "loss": 0.8916, + "step": 38308 + }, + { + "epoch": 0.98, + "learning_rate": 1.5711839619836723e-06, + "loss": 0.8779, + "step": 38309 + }, + { + "epoch": 0.98, + "learning_rate": 1.5711612492455805e-06, + "loss": 0.7656, + "step": 38310 + }, + { + "epoch": 0.98, + "learning_rate": 1.5711385360701768e-06, + "loss": 0.8818, + "step": 38311 + }, + { + "epoch": 0.98, + "learning_rate": 1.5711158224574786e-06, + "loss": 0.7412, + "step": 38312 + }, + { + "epoch": 0.98, + "learning_rate": 1.5710931084075032e-06, + "loss": 1.0312, + "step": 38313 + }, + { + "epoch": 0.98, + "learning_rate": 1.571070393920268e-06, + "loss": 0.9639, + "step": 38314 + }, + { + "epoch": 0.98, + "learning_rate": 1.5710476789957906e-06, + "loss": 1.0225, + "step": 38315 + }, + { + "epoch": 0.98, + "learning_rate": 1.571024963634088e-06, + "loss": 0.6509, + "step": 38316 + }, + { + "epoch": 0.98, + "learning_rate": 1.5710022478351782e-06, + "loss": 0.9189, + "step": 38317 + }, + { + "epoch": 0.98, + "learning_rate": 1.5709795315990779e-06, + "loss": 0.832, + "step": 38318 + }, + { + "epoch": 0.98, + "learning_rate": 1.570956814925805e-06, + "loss": 0.7861, + "step": 38319 + }, + { + "epoch": 0.98, + "learning_rate": 1.5709340978153768e-06, + "loss": 0.7061, + "step": 38320 + }, + { + "epoch": 0.98, + "learning_rate": 1.5709113802678103e-06, + "loss": 1.0, + "step": 38321 + }, + { + "epoch": 0.98, + "learning_rate": 1.5708886622831238e-06, + "loss": 0.8052, + "step": 38322 + }, + { + "epoch": 0.98, + "learning_rate": 1.5708659438613335e-06, + "loss": 0.8008, + "step": 38323 + }, + { + "epoch": 0.98, + "learning_rate": 1.5708432250024575e-06, + "loss": 1.0107, + "step": 38324 + }, + { + "epoch": 0.98, + "learning_rate": 1.5708205057065134e-06, + "loss": 0.6838, + "step": 38325 + }, + { + "epoch": 0.98, + "learning_rate": 1.570797785973518e-06, + "loss": 1.002, + "step": 38326 + }, + { + "epoch": 0.98, + "learning_rate": 1.570775065803489e-06, + "loss": 0.7273, + "step": 38327 + }, + { + "epoch": 0.98, + "learning_rate": 1.570752345196444e-06, + "loss": 0.7148, + "step": 38328 + }, + { + "epoch": 0.98, + "learning_rate": 1.5707296241524e-06, + "loss": 0.7422, + "step": 38329 + }, + { + "epoch": 0.98, + "learning_rate": 1.5707069026713743e-06, + "loss": 0.9385, + "step": 38330 + }, + { + "epoch": 0.98, + "learning_rate": 1.570684180753385e-06, + "loss": 0.9863, + "step": 38331 + }, + { + "epoch": 0.98, + "learning_rate": 1.570661458398449e-06, + "loss": 0.8223, + "step": 38332 + }, + { + "epoch": 0.98, + "learning_rate": 1.5706387356065839e-06, + "loss": 0.7622, + "step": 38333 + }, + { + "epoch": 0.98, + "learning_rate": 1.5706160123778065e-06, + "loss": 0.791, + "step": 38334 + }, + { + "epoch": 0.98, + "learning_rate": 1.570593288712135e-06, + "loss": 0.7979, + "step": 38335 + }, + { + "epoch": 0.98, + "learning_rate": 1.570570564609586e-06, + "loss": 0.6597, + "step": 38336 + }, + { + "epoch": 0.98, + "learning_rate": 1.570547840070178e-06, + "loss": 0.8115, + "step": 38337 + }, + { + "epoch": 0.98, + "learning_rate": 1.5705251150939277e-06, + "loss": 0.8945, + "step": 38338 + }, + { + "epoch": 0.98, + "learning_rate": 1.570502389680852e-06, + "loss": 0.7476, + "step": 38339 + }, + { + "epoch": 0.98, + "learning_rate": 1.5704796638309692e-06, + "loss": 0.7324, + "step": 38340 + }, + { + "epoch": 0.98, + "learning_rate": 1.5704569375442964e-06, + "loss": 0.7393, + "step": 38341 + }, + { + "epoch": 0.98, + "learning_rate": 1.570434210820851e-06, + "loss": 0.769, + "step": 38342 + }, + { + "epoch": 0.98, + "learning_rate": 1.5704114836606502e-06, + "loss": 0.6943, + "step": 38343 + }, + { + "epoch": 0.98, + "learning_rate": 1.5703887560637114e-06, + "loss": 0.79, + "step": 38344 + }, + { + "epoch": 0.98, + "learning_rate": 1.5703660280300523e-06, + "loss": 0.8711, + "step": 38345 + }, + { + "epoch": 0.98, + "learning_rate": 1.5703432995596902e-06, + "loss": 1.0479, + "step": 38346 + }, + { + "epoch": 0.98, + "learning_rate": 1.5703205706526426e-06, + "loss": 0.73, + "step": 38347 + }, + { + "epoch": 0.98, + "learning_rate": 1.5702978413089266e-06, + "loss": 0.8047, + "step": 38348 + }, + { + "epoch": 0.98, + "learning_rate": 1.5702751115285598e-06, + "loss": 1.0039, + "step": 38349 + }, + { + "epoch": 0.98, + "learning_rate": 1.5702523813115597e-06, + "loss": 1.0044, + "step": 38350 + }, + { + "epoch": 0.98, + "learning_rate": 1.5702296506579434e-06, + "loss": 0.8525, + "step": 38351 + }, + { + "epoch": 0.98, + "learning_rate": 1.5702069195677283e-06, + "loss": 0.7026, + "step": 38352 + }, + { + "epoch": 0.98, + "learning_rate": 1.5701841880409323e-06, + "loss": 0.8086, + "step": 38353 + }, + { + "epoch": 0.98, + "learning_rate": 1.5701614560775723e-06, + "loss": 0.6416, + "step": 38354 + }, + { + "epoch": 0.98, + "learning_rate": 1.570138723677666e-06, + "loss": 0.9971, + "step": 38355 + }, + { + "epoch": 0.98, + "learning_rate": 1.5701159908412308e-06, + "loss": 0.6875, + "step": 38356 + }, + { + "epoch": 0.98, + "learning_rate": 1.5700932575682837e-06, + "loss": 0.917, + "step": 38357 + }, + { + "epoch": 0.98, + "learning_rate": 1.5700705238588426e-06, + "loss": 1.0078, + "step": 38358 + }, + { + "epoch": 0.98, + "learning_rate": 1.5700477897129246e-06, + "loss": 0.7783, + "step": 38359 + }, + { + "epoch": 0.98, + "learning_rate": 1.5700250551305474e-06, + "loss": 0.708, + "step": 38360 + }, + { + "epoch": 0.98, + "learning_rate": 1.5700023201117278e-06, + "loss": 0.9551, + "step": 38361 + }, + { + "epoch": 0.98, + "learning_rate": 1.5699795846564843e-06, + "loss": 0.7583, + "step": 38362 + }, + { + "epoch": 0.98, + "learning_rate": 1.5699568487648334e-06, + "loss": 0.8159, + "step": 38363 + }, + { + "epoch": 0.98, + "learning_rate": 1.5699341124367925e-06, + "loss": 1.0186, + "step": 38364 + }, + { + "epoch": 0.98, + "learning_rate": 1.5699113756723793e-06, + "loss": 0.8984, + "step": 38365 + }, + { + "epoch": 0.98, + "learning_rate": 1.5698886384716113e-06, + "loss": 0.8662, + "step": 38366 + }, + { + "epoch": 0.98, + "learning_rate": 1.5698659008345057e-06, + "loss": 0.7686, + "step": 38367 + }, + { + "epoch": 0.98, + "learning_rate": 1.5698431627610801e-06, + "loss": 0.7871, + "step": 38368 + }, + { + "epoch": 0.98, + "learning_rate": 1.5698204242513517e-06, + "loss": 1.0469, + "step": 38369 + }, + { + "epoch": 0.98, + "learning_rate": 1.569797685305338e-06, + "loss": 0.7803, + "step": 38370 + }, + { + "epoch": 0.98, + "learning_rate": 1.5697749459230565e-06, + "loss": 0.9648, + "step": 38371 + }, + { + "epoch": 0.98, + "learning_rate": 1.5697522061045243e-06, + "loss": 0.7451, + "step": 38372 + }, + { + "epoch": 0.98, + "learning_rate": 1.5697294658497594e-06, + "loss": 1.0557, + "step": 38373 + }, + { + "epoch": 0.98, + "learning_rate": 1.5697067251587784e-06, + "loss": 0.6348, + "step": 38374 + }, + { + "epoch": 0.98, + "learning_rate": 1.5696839840315993e-06, + "loss": 0.6748, + "step": 38375 + }, + { + "epoch": 0.98, + "learning_rate": 1.5696612424682396e-06, + "loss": 0.8965, + "step": 38376 + }, + { + "epoch": 0.98, + "learning_rate": 1.5696385004687166e-06, + "loss": 0.7583, + "step": 38377 + }, + { + "epoch": 0.98, + "learning_rate": 1.5696157580330472e-06, + "loss": 0.8779, + "step": 38378 + }, + { + "epoch": 0.98, + "learning_rate": 1.5695930151612492e-06, + "loss": 0.8535, + "step": 38379 + }, + { + "epoch": 0.98, + "learning_rate": 1.5695702718533402e-06, + "loss": 0.9141, + "step": 38380 + }, + { + "epoch": 0.98, + "learning_rate": 1.5695475281093373e-06, + "loss": 1.0098, + "step": 38381 + }, + { + "epoch": 0.98, + "learning_rate": 1.5695247839292582e-06, + "loss": 0.6743, + "step": 38382 + }, + { + "epoch": 0.98, + "learning_rate": 1.5695020393131202e-06, + "loss": 0.9971, + "step": 38383 + }, + { + "epoch": 0.98, + "learning_rate": 1.5694792942609402e-06, + "loss": 0.7417, + "step": 38384 + }, + { + "epoch": 0.98, + "learning_rate": 1.5694565487727366e-06, + "loss": 0.7988, + "step": 38385 + }, + { + "epoch": 0.98, + "learning_rate": 1.569433802848526e-06, + "loss": 0.8047, + "step": 38386 + }, + { + "epoch": 0.98, + "learning_rate": 1.5694110564883266e-06, + "loss": 0.9746, + "step": 38387 + }, + { + "epoch": 0.98, + "learning_rate": 1.5693883096921549e-06, + "loss": 0.9355, + "step": 38388 + }, + { + "epoch": 0.98, + "learning_rate": 1.5693655624600289e-06, + "loss": 0.5088, + "step": 38389 + }, + { + "epoch": 0.98, + "learning_rate": 1.5693428147919657e-06, + "loss": 0.8184, + "step": 38390 + }, + { + "epoch": 0.98, + "learning_rate": 1.569320066687983e-06, + "loss": 0.9277, + "step": 38391 + }, + { + "epoch": 0.98, + "learning_rate": 1.5692973181480982e-06, + "loss": 0.5264, + "step": 38392 + }, + { + "epoch": 0.98, + "learning_rate": 1.5692745691723286e-06, + "loss": 0.8086, + "step": 38393 + }, + { + "epoch": 0.98, + "learning_rate": 1.5692518197606917e-06, + "loss": 0.8359, + "step": 38394 + }, + { + "epoch": 0.98, + "learning_rate": 1.5692290699132045e-06, + "loss": 0.9863, + "step": 38395 + }, + { + "epoch": 0.98, + "learning_rate": 1.569206319629885e-06, + "loss": 0.8828, + "step": 38396 + }, + { + "epoch": 0.98, + "learning_rate": 1.5691835689107506e-06, + "loss": 0.8701, + "step": 38397 + }, + { + "epoch": 0.98, + "learning_rate": 1.5691608177558183e-06, + "loss": 0.7808, + "step": 38398 + }, + { + "epoch": 0.98, + "learning_rate": 1.569138066165106e-06, + "loss": 0.8125, + "step": 38399 + }, + { + "epoch": 0.98, + "learning_rate": 1.5691153141386303e-06, + "loss": 0.7686, + "step": 38400 + }, + { + "epoch": 0.98, + "learning_rate": 1.5690925616764095e-06, + "loss": 0.6494, + "step": 38401 + }, + { + "epoch": 0.98, + "learning_rate": 1.5690698087784609e-06, + "loss": 1.0742, + "step": 38402 + }, + { + "epoch": 0.98, + "learning_rate": 1.5690470554448014e-06, + "loss": 0.5983, + "step": 38403 + }, + { + "epoch": 0.98, + "learning_rate": 1.5690243016754487e-06, + "loss": 0.9248, + "step": 38404 + }, + { + "epoch": 0.98, + "learning_rate": 1.5690015474704204e-06, + "loss": 0.9082, + "step": 38405 + }, + { + "epoch": 0.98, + "learning_rate": 1.5689787928297339e-06, + "loss": 0.7773, + "step": 38406 + }, + { + "epoch": 0.98, + "learning_rate": 1.5689560377534062e-06, + "loss": 0.8423, + "step": 38407 + }, + { + "epoch": 0.98, + "learning_rate": 1.5689332822414552e-06, + "loss": 0.9365, + "step": 38408 + }, + { + "epoch": 0.98, + "learning_rate": 1.568910526293898e-06, + "loss": 0.7803, + "step": 38409 + }, + { + "epoch": 0.98, + "learning_rate": 1.5688877699107524e-06, + "loss": 0.7271, + "step": 38410 + }, + { + "epoch": 0.98, + "learning_rate": 1.5688650130920354e-06, + "loss": 0.915, + "step": 38411 + }, + { + "epoch": 0.98, + "learning_rate": 1.5688422558377647e-06, + "loss": 0.998, + "step": 38412 + }, + { + "epoch": 0.98, + "learning_rate": 1.568819498147958e-06, + "loss": 1.001, + "step": 38413 + }, + { + "epoch": 0.98, + "learning_rate": 1.5687967400226318e-06, + "loss": 0.812, + "step": 38414 + }, + { + "epoch": 0.98, + "learning_rate": 1.5687739814618041e-06, + "loss": 0.9219, + "step": 38415 + }, + { + "epoch": 0.98, + "learning_rate": 1.5687512224654927e-06, + "loss": 0.8408, + "step": 38416 + }, + { + "epoch": 0.98, + "learning_rate": 1.5687284630337146e-06, + "loss": 0.7715, + "step": 38417 + }, + { + "epoch": 0.98, + "learning_rate": 1.568705703166487e-06, + "loss": 0.7324, + "step": 38418 + }, + { + "epoch": 0.98, + "learning_rate": 1.5686829428638278e-06, + "loss": 0.9561, + "step": 38419 + }, + { + "epoch": 0.98, + "learning_rate": 1.568660182125754e-06, + "loss": 0.7686, + "step": 38420 + }, + { + "epoch": 0.98, + "learning_rate": 1.5686374209522835e-06, + "loss": 0.9678, + "step": 38421 + }, + { + "epoch": 0.98, + "learning_rate": 1.5686146593434333e-06, + "loss": 0.8633, + "step": 38422 + }, + { + "epoch": 0.98, + "learning_rate": 1.568591897299221e-06, + "loss": 0.9053, + "step": 38423 + }, + { + "epoch": 0.98, + "learning_rate": 1.568569134819664e-06, + "loss": 0.7866, + "step": 38424 + }, + { + "epoch": 0.98, + "learning_rate": 1.5685463719047797e-06, + "loss": 0.7466, + "step": 38425 + }, + { + "epoch": 0.98, + "learning_rate": 1.568523608554586e-06, + "loss": 0.8428, + "step": 38426 + }, + { + "epoch": 0.98, + "learning_rate": 1.5685008447690998e-06, + "loss": 0.7251, + "step": 38427 + }, + { + "epoch": 0.98, + "learning_rate": 1.5684780805483384e-06, + "loss": 1.2061, + "step": 38428 + }, + { + "epoch": 0.98, + "learning_rate": 1.5684553158923195e-06, + "loss": 0.8682, + "step": 38429 + }, + { + "epoch": 0.98, + "learning_rate": 1.5684325508010602e-06, + "loss": 0.7432, + "step": 38430 + }, + { + "epoch": 0.99, + "learning_rate": 1.5684097852745788e-06, + "loss": 0.9199, + "step": 38431 + }, + { + "epoch": 0.99, + "learning_rate": 1.568387019312892e-06, + "loss": 0.8911, + "step": 38432 + }, + { + "epoch": 0.99, + "learning_rate": 1.5683642529160172e-06, + "loss": 0.8652, + "step": 38433 + }, + { + "epoch": 0.99, + "learning_rate": 1.5683414860839723e-06, + "loss": 0.875, + "step": 38434 + }, + { + "epoch": 0.99, + "learning_rate": 1.5683187188167744e-06, + "loss": 0.8047, + "step": 38435 + }, + { + "epoch": 0.99, + "learning_rate": 1.5682959511144408e-06, + "loss": 0.6816, + "step": 38436 + }, + { + "epoch": 0.99, + "learning_rate": 1.5682731829769896e-06, + "loss": 0.7412, + "step": 38437 + }, + { + "epoch": 0.99, + "learning_rate": 1.5682504144044373e-06, + "loss": 1.0732, + "step": 38438 + }, + { + "epoch": 0.99, + "learning_rate": 1.5682276453968018e-06, + "loss": 0.8916, + "step": 38439 + }, + { + "epoch": 0.99, + "learning_rate": 1.5682048759541005e-06, + "loss": 0.9248, + "step": 38440 + }, + { + "epoch": 0.99, + "learning_rate": 1.5681821060763509e-06, + "loss": 0.748, + "step": 38441 + }, + { + "epoch": 0.99, + "learning_rate": 1.5681593357635708e-06, + "loss": 0.7773, + "step": 38442 + }, + { + "epoch": 0.99, + "learning_rate": 1.5681365650157767e-06, + "loss": 0.8599, + "step": 38443 + }, + { + "epoch": 0.99, + "learning_rate": 1.5681137938329866e-06, + "loss": 1.085, + "step": 38444 + }, + { + "epoch": 0.99, + "learning_rate": 1.5680910222152178e-06, + "loss": 0.9639, + "step": 38445 + }, + { + "epoch": 0.99, + "learning_rate": 1.5680682501624883e-06, + "loss": 0.8867, + "step": 38446 + }, + { + "epoch": 0.99, + "learning_rate": 1.5680454776748148e-06, + "loss": 0.6777, + "step": 38447 + }, + { + "epoch": 0.99, + "learning_rate": 1.568022704752215e-06, + "loss": 0.8232, + "step": 38448 + }, + { + "epoch": 0.99, + "learning_rate": 1.5679999313947063e-06, + "loss": 1.0078, + "step": 38449 + }, + { + "epoch": 0.99, + "learning_rate": 1.5679771576023062e-06, + "loss": 0.6704, + "step": 38450 + }, + { + "epoch": 0.99, + "learning_rate": 1.567954383375032e-06, + "loss": 0.6611, + "step": 38451 + }, + { + "epoch": 0.99, + "learning_rate": 1.5679316087129016e-06, + "loss": 0.835, + "step": 38452 + }, + { + "epoch": 0.99, + "learning_rate": 1.5679088336159319e-06, + "loss": 0.6758, + "step": 38453 + }, + { + "epoch": 0.99, + "learning_rate": 1.5678860580841401e-06, + "loss": 0.9824, + "step": 38454 + }, + { + "epoch": 0.99, + "learning_rate": 1.5678632821175445e-06, + "loss": 0.7949, + "step": 38455 + }, + { + "epoch": 0.99, + "learning_rate": 1.567840505716162e-06, + "loss": 0.9229, + "step": 38456 + }, + { + "epoch": 0.99, + "learning_rate": 1.5678177288800103e-06, + "loss": 0.9492, + "step": 38457 + }, + { + "epoch": 0.99, + "learning_rate": 1.5677949516091065e-06, + "loss": 0.6704, + "step": 38458 + }, + { + "epoch": 0.99, + "learning_rate": 1.5677721739034682e-06, + "loss": 0.9639, + "step": 38459 + }, + { + "epoch": 0.99, + "learning_rate": 1.567749395763113e-06, + "loss": 0.9395, + "step": 38460 + }, + { + "epoch": 0.99, + "learning_rate": 1.567726617188058e-06, + "loss": 0.75, + "step": 38461 + }, + { + "epoch": 0.99, + "learning_rate": 1.567703838178321e-06, + "loss": 0.8057, + "step": 38462 + }, + { + "epoch": 0.99, + "learning_rate": 1.567681058733919e-06, + "loss": 0.8916, + "step": 38463 + }, + { + "epoch": 0.99, + "learning_rate": 1.56765827885487e-06, + "loss": 0.8091, + "step": 38464 + }, + { + "epoch": 0.99, + "learning_rate": 1.567635498541191e-06, + "loss": 0.7349, + "step": 38465 + }, + { + "epoch": 0.99, + "learning_rate": 1.5676127177928998e-06, + "loss": 0.8496, + "step": 38466 + }, + { + "epoch": 0.99, + "learning_rate": 1.5675899366100134e-06, + "loss": 0.8447, + "step": 38467 + }, + { + "epoch": 0.99, + "learning_rate": 1.5675671549925495e-06, + "loss": 0.877, + "step": 38468 + }, + { + "epoch": 0.99, + "learning_rate": 1.5675443729405257e-06, + "loss": 0.8203, + "step": 38469 + }, + { + "epoch": 0.99, + "learning_rate": 1.5675215904539593e-06, + "loss": 0.5381, + "step": 38470 + }, + { + "epoch": 0.99, + "learning_rate": 1.5674988075328674e-06, + "loss": 0.8047, + "step": 38471 + }, + { + "epoch": 0.99, + "learning_rate": 1.567476024177268e-06, + "loss": 0.8779, + "step": 38472 + }, + { + "epoch": 0.99, + "learning_rate": 1.5674532403871781e-06, + "loss": 0.792, + "step": 38473 + }, + { + "epoch": 0.99, + "learning_rate": 1.5674304561626155e-06, + "loss": 0.8223, + "step": 38474 + }, + { + "epoch": 0.99, + "learning_rate": 1.5674076715035975e-06, + "loss": 0.6729, + "step": 38475 + }, + { + "epoch": 0.99, + "learning_rate": 1.5673848864101417e-06, + "loss": 1.0166, + "step": 38476 + }, + { + "epoch": 0.99, + "learning_rate": 1.5673621008822653e-06, + "loss": 0.9136, + "step": 38477 + }, + { + "epoch": 0.99, + "learning_rate": 1.5673393149199857e-06, + "loss": 0.8896, + "step": 38478 + }, + { + "epoch": 0.99, + "learning_rate": 1.5673165285233205e-06, + "loss": 0.6567, + "step": 38479 + }, + { + "epoch": 0.99, + "learning_rate": 1.5672937416922869e-06, + "loss": 0.9805, + "step": 38480 + }, + { + "epoch": 0.99, + "learning_rate": 1.567270954426903e-06, + "loss": 0.9561, + "step": 38481 + }, + { + "epoch": 0.99, + "learning_rate": 1.5672481667271854e-06, + "loss": 0.9385, + "step": 38482 + }, + { + "epoch": 0.99, + "learning_rate": 1.5672253785931523e-06, + "loss": 0.9688, + "step": 38483 + }, + { + "epoch": 0.99, + "learning_rate": 1.5672025900248207e-06, + "loss": 1.0107, + "step": 38484 + }, + { + "epoch": 0.99, + "learning_rate": 1.5671798010222078e-06, + "loss": 0.8418, + "step": 38485 + }, + { + "epoch": 0.99, + "learning_rate": 1.5671570115853322e-06, + "loss": 0.7305, + "step": 38486 + }, + { + "epoch": 0.99, + "learning_rate": 1.5671342217142099e-06, + "loss": 0.9521, + "step": 38487 + }, + { + "epoch": 0.99, + "learning_rate": 1.5671114314088595e-06, + "loss": 0.792, + "step": 38488 + }, + { + "epoch": 0.99, + "learning_rate": 1.5670886406692976e-06, + "loss": 0.5576, + "step": 38489 + }, + { + "epoch": 0.99, + "learning_rate": 1.5670658494955417e-06, + "loss": 0.6206, + "step": 38490 + }, + { + "epoch": 0.99, + "learning_rate": 1.56704305788761e-06, + "loss": 0.8447, + "step": 38491 + }, + { + "epoch": 0.99, + "learning_rate": 1.5670202658455196e-06, + "loss": 1.0352, + "step": 38492 + }, + { + "epoch": 0.99, + "learning_rate": 1.5669974733692876e-06, + "loss": 0.769, + "step": 38493 + }, + { + "epoch": 0.99, + "learning_rate": 1.5669746804589316e-06, + "loss": 0.8105, + "step": 38494 + }, + { + "epoch": 0.99, + "learning_rate": 1.5669518871144694e-06, + "loss": 0.8545, + "step": 38495 + }, + { + "epoch": 0.99, + "learning_rate": 1.566929093335918e-06, + "loss": 0.8438, + "step": 38496 + }, + { + "epoch": 0.99, + "learning_rate": 1.5669062991232952e-06, + "loss": 0.791, + "step": 38497 + }, + { + "epoch": 0.99, + "learning_rate": 1.5668835044766185e-06, + "loss": 0.8018, + "step": 38498 + }, + { + "epoch": 0.99, + "learning_rate": 1.566860709395905e-06, + "loss": 0.8867, + "step": 38499 + }, + { + "epoch": 0.99, + "learning_rate": 1.5668379138811722e-06, + "loss": 0.8525, + "step": 38500 + }, + { + "epoch": 0.99, + "learning_rate": 1.5668151179324379e-06, + "loss": 0.7979, + "step": 38501 + }, + { + "epoch": 0.99, + "learning_rate": 1.5667923215497193e-06, + "loss": 0.9297, + "step": 38502 + }, + { + "epoch": 0.99, + "learning_rate": 1.5667695247330337e-06, + "loss": 0.8162, + "step": 38503 + }, + { + "epoch": 0.99, + "learning_rate": 1.566746727482399e-06, + "loss": 0.9038, + "step": 38504 + }, + { + "epoch": 0.99, + "learning_rate": 1.566723929797832e-06, + "loss": 0.8145, + "step": 38505 + }, + { + "epoch": 0.99, + "learning_rate": 1.5667011316793506e-06, + "loss": 0.8125, + "step": 38506 + }, + { + "epoch": 0.99, + "learning_rate": 1.5666783331269726e-06, + "loss": 0.791, + "step": 38507 + }, + { + "epoch": 0.99, + "learning_rate": 1.5666555341407149e-06, + "loss": 0.6934, + "step": 38508 + }, + { + "epoch": 0.99, + "learning_rate": 1.5666327347205948e-06, + "loss": 1.0039, + "step": 38509 + }, + { + "epoch": 0.99, + "learning_rate": 1.5666099348666303e-06, + "loss": 0.6226, + "step": 38510 + }, + { + "epoch": 0.99, + "learning_rate": 1.5665871345788387e-06, + "loss": 0.8145, + "step": 38511 + }, + { + "epoch": 0.99, + "learning_rate": 1.5665643338572374e-06, + "loss": 0.897, + "step": 38512 + }, + { + "epoch": 0.99, + "learning_rate": 1.5665415327018437e-06, + "loss": 0.9961, + "step": 38513 + }, + { + "epoch": 0.99, + "learning_rate": 1.566518731112675e-06, + "loss": 0.8848, + "step": 38514 + }, + { + "epoch": 0.99, + "learning_rate": 1.5664959290897492e-06, + "loss": 0.6782, + "step": 38515 + }, + { + "epoch": 0.99, + "learning_rate": 1.5664731266330837e-06, + "loss": 0.5479, + "step": 38516 + }, + { + "epoch": 0.99, + "learning_rate": 1.5664503237426955e-06, + "loss": 0.7451, + "step": 38517 + }, + { + "epoch": 0.99, + "learning_rate": 1.5664275204186024e-06, + "loss": 0.6167, + "step": 38518 + }, + { + "epoch": 0.99, + "learning_rate": 1.5664047166608218e-06, + "loss": 0.9746, + "step": 38519 + }, + { + "epoch": 0.99, + "learning_rate": 1.5663819124693714e-06, + "loss": 0.8147, + "step": 38520 + }, + { + "epoch": 0.99, + "learning_rate": 1.566359107844268e-06, + "loss": 0.96, + "step": 38521 + }, + { + "epoch": 0.99, + "learning_rate": 1.5663363027855296e-06, + "loss": 0.9385, + "step": 38522 + }, + { + "epoch": 0.99, + "learning_rate": 1.5663134972931736e-06, + "loss": 0.7959, + "step": 38523 + }, + { + "epoch": 0.99, + "learning_rate": 1.5662906913672175e-06, + "loss": 1.0303, + "step": 38524 + }, + { + "epoch": 0.99, + "learning_rate": 1.5662678850076786e-06, + "loss": 0.7432, + "step": 38525 + }, + { + "epoch": 0.99, + "learning_rate": 1.5662450782145742e-06, + "loss": 0.7871, + "step": 38526 + }, + { + "epoch": 0.99, + "learning_rate": 1.5662222709879225e-06, + "loss": 0.9814, + "step": 38527 + }, + { + "epoch": 0.99, + "learning_rate": 1.5661994633277397e-06, + "loss": 0.8848, + "step": 38528 + }, + { + "epoch": 0.99, + "learning_rate": 1.5661766552340446e-06, + "loss": 0.8477, + "step": 38529 + }, + { + "epoch": 0.99, + "learning_rate": 1.5661538467068539e-06, + "loss": 0.877, + "step": 38530 + }, + { + "epoch": 0.99, + "learning_rate": 1.5661310377461852e-06, + "loss": 0.6816, + "step": 38531 + }, + { + "epoch": 0.99, + "learning_rate": 1.5661082283520558e-06, + "loss": 0.9775, + "step": 38532 + }, + { + "epoch": 0.99, + "learning_rate": 1.5660854185244836e-06, + "loss": 0.7456, + "step": 38533 + }, + { + "epoch": 0.99, + "learning_rate": 1.5660626082634857e-06, + "loss": 0.8359, + "step": 38534 + }, + { + "epoch": 0.99, + "learning_rate": 1.5660397975690797e-06, + "loss": 0.7119, + "step": 38535 + }, + { + "epoch": 0.99, + "learning_rate": 1.5660169864412831e-06, + "loss": 0.791, + "step": 38536 + }, + { + "epoch": 0.99, + "learning_rate": 1.5659941748801136e-06, + "loss": 0.998, + "step": 38537 + }, + { + "epoch": 0.99, + "learning_rate": 1.565971362885588e-06, + "loss": 0.7549, + "step": 38538 + }, + { + "epoch": 0.99, + "learning_rate": 1.5659485504577244e-06, + "loss": 0.7295, + "step": 38539 + }, + { + "epoch": 0.99, + "learning_rate": 1.5659257375965399e-06, + "loss": 0.6475, + "step": 38540 + }, + { + "epoch": 0.99, + "learning_rate": 1.5659029243020519e-06, + "loss": 0.8608, + "step": 38541 + }, + { + "epoch": 0.99, + "learning_rate": 1.5658801105742784e-06, + "loss": 0.6169, + "step": 38542 + }, + { + "epoch": 0.99, + "learning_rate": 1.5658572964132363e-06, + "loss": 0.7083, + "step": 38543 + }, + { + "epoch": 0.99, + "learning_rate": 1.5658344818189432e-06, + "loss": 0.9756, + "step": 38544 + }, + { + "epoch": 0.99, + "learning_rate": 1.5658116667914168e-06, + "loss": 0.7803, + "step": 38545 + }, + { + "epoch": 0.99, + "learning_rate": 1.5657888513306743e-06, + "loss": 0.793, + "step": 38546 + }, + { + "epoch": 0.99, + "learning_rate": 1.5657660354367334e-06, + "loss": 0.9854, + "step": 38547 + }, + { + "epoch": 0.99, + "learning_rate": 1.5657432191096116e-06, + "loss": 1.0713, + "step": 38548 + }, + { + "epoch": 0.99, + "learning_rate": 1.565720402349326e-06, + "loss": 0.9355, + "step": 38549 + }, + { + "epoch": 0.99, + "learning_rate": 1.5656975851558944e-06, + "loss": 0.8467, + "step": 38550 + }, + { + "epoch": 0.99, + "learning_rate": 1.5656747675293343e-06, + "loss": 0.9287, + "step": 38551 + }, + { + "epoch": 0.99, + "learning_rate": 1.5656519494696628e-06, + "loss": 0.8145, + "step": 38552 + }, + { + "epoch": 0.99, + "learning_rate": 1.5656291309768976e-06, + "loss": 1.1738, + "step": 38553 + }, + { + "epoch": 0.99, + "learning_rate": 1.5656063120510563e-06, + "loss": 0.9355, + "step": 38554 + }, + { + "epoch": 0.99, + "learning_rate": 1.5655834926921565e-06, + "loss": 0.8701, + "step": 38555 + }, + { + "epoch": 0.99, + "learning_rate": 1.5655606729002151e-06, + "loss": 0.5642, + "step": 38556 + }, + { + "epoch": 0.99, + "learning_rate": 1.5655378526752498e-06, + "loss": 0.7852, + "step": 38557 + }, + { + "epoch": 0.99, + "learning_rate": 1.5655150320172786e-06, + "loss": 0.7529, + "step": 38558 + }, + { + "epoch": 0.99, + "learning_rate": 1.565492210926318e-06, + "loss": 0.6914, + "step": 38559 + }, + { + "epoch": 0.99, + "learning_rate": 1.5654693894023865e-06, + "loss": 0.8389, + "step": 38560 + }, + { + "epoch": 0.99, + "learning_rate": 1.565446567445501e-06, + "loss": 0.7822, + "step": 38561 + }, + { + "epoch": 0.99, + "learning_rate": 1.5654237450556788e-06, + "loss": 0.8389, + "step": 38562 + }, + { + "epoch": 0.99, + "learning_rate": 1.565400922232938e-06, + "loss": 0.6885, + "step": 38563 + }, + { + "epoch": 0.99, + "learning_rate": 1.565378098977295e-06, + "loss": 1.1318, + "step": 38564 + }, + { + "epoch": 0.99, + "learning_rate": 1.565355275288769e-06, + "loss": 0.8184, + "step": 38565 + }, + { + "epoch": 0.99, + "learning_rate": 1.565332451167376e-06, + "loss": 1.0, + "step": 38566 + }, + { + "epoch": 0.99, + "learning_rate": 1.5653096266131337e-06, + "loss": 0.9111, + "step": 38567 + }, + { + "epoch": 0.99, + "learning_rate": 1.56528680162606e-06, + "loss": 0.9062, + "step": 38568 + }, + { + "epoch": 0.99, + "learning_rate": 1.5652639762061721e-06, + "loss": 0.8721, + "step": 38569 + }, + { + "epoch": 0.99, + "learning_rate": 1.5652411503534876e-06, + "loss": 0.7454, + "step": 38570 + }, + { + "epoch": 0.99, + "learning_rate": 1.5652183240680242e-06, + "loss": 0.8018, + "step": 38571 + }, + { + "epoch": 0.99, + "learning_rate": 1.565195497349799e-06, + "loss": 0.9316, + "step": 38572 + }, + { + "epoch": 0.99, + "learning_rate": 1.5651726701988292e-06, + "loss": 0.7725, + "step": 38573 + }, + { + "epoch": 0.99, + "learning_rate": 1.5651498426151331e-06, + "loss": 0.8408, + "step": 38574 + }, + { + "epoch": 0.99, + "learning_rate": 1.5651270145987276e-06, + "loss": 0.9658, + "step": 38575 + }, + { + "epoch": 0.99, + "learning_rate": 1.5651041861496305e-06, + "loss": 0.6729, + "step": 38576 + }, + { + "epoch": 0.99, + "learning_rate": 1.565081357267859e-06, + "loss": 0.8584, + "step": 38577 + }, + { + "epoch": 0.99, + "learning_rate": 1.5650585279534307e-06, + "loss": 0.8115, + "step": 38578 + }, + { + "epoch": 0.99, + "learning_rate": 1.5650356982063628e-06, + "loss": 0.9619, + "step": 38579 + }, + { + "epoch": 0.99, + "learning_rate": 1.5650128680266734e-06, + "loss": 0.9727, + "step": 38580 + }, + { + "epoch": 0.99, + "learning_rate": 1.5649900374143793e-06, + "loss": 0.7705, + "step": 38581 + }, + { + "epoch": 0.99, + "learning_rate": 1.5649672063694987e-06, + "loss": 0.8799, + "step": 38582 + }, + { + "epoch": 0.99, + "learning_rate": 1.5649443748920486e-06, + "loss": 0.7278, + "step": 38583 + }, + { + "epoch": 0.99, + "learning_rate": 1.5649215429820464e-06, + "loss": 0.6978, + "step": 38584 + }, + { + "epoch": 0.99, + "learning_rate": 1.5648987106395097e-06, + "loss": 0.8701, + "step": 38585 + }, + { + "epoch": 0.99, + "learning_rate": 1.5648758778644563e-06, + "loss": 1.0361, + "step": 38586 + }, + { + "epoch": 0.99, + "learning_rate": 1.5648530446569032e-06, + "loss": 0.8779, + "step": 38587 + }, + { + "epoch": 0.99, + "learning_rate": 1.564830211016868e-06, + "loss": 0.7095, + "step": 38588 + }, + { + "epoch": 0.99, + "learning_rate": 1.5648073769443686e-06, + "loss": 0.7334, + "step": 38589 + }, + { + "epoch": 0.99, + "learning_rate": 1.564784542439422e-06, + "loss": 0.9375, + "step": 38590 + }, + { + "epoch": 0.99, + "learning_rate": 1.564761707502046e-06, + "loss": 1.0703, + "step": 38591 + }, + { + "epoch": 0.99, + "learning_rate": 1.5647388721322576e-06, + "loss": 0.4651, + "step": 38592 + }, + { + "epoch": 0.99, + "learning_rate": 1.564716036330075e-06, + "loss": 0.7324, + "step": 38593 + }, + { + "epoch": 0.99, + "learning_rate": 1.564693200095515e-06, + "loss": 1.083, + "step": 38594 + }, + { + "epoch": 0.99, + "learning_rate": 1.5646703634285953e-06, + "loss": 1.0703, + "step": 38595 + }, + { + "epoch": 0.99, + "learning_rate": 1.5646475263293337e-06, + "loss": 0.874, + "step": 38596 + }, + { + "epoch": 0.99, + "learning_rate": 1.5646246887977475e-06, + "loss": 0.8667, + "step": 38597 + }, + { + "epoch": 0.99, + "learning_rate": 1.5646018508338541e-06, + "loss": 0.9277, + "step": 38598 + }, + { + "epoch": 0.99, + "learning_rate": 1.564579012437671e-06, + "loss": 0.7305, + "step": 38599 + }, + { + "epoch": 0.99, + "learning_rate": 1.5645561736092155e-06, + "loss": 0.9014, + "step": 38600 + }, + { + "epoch": 0.99, + "learning_rate": 1.5645333343485056e-06, + "loss": 0.8291, + "step": 38601 + }, + { + "epoch": 0.99, + "learning_rate": 1.5645104946555581e-06, + "loss": 1.0498, + "step": 38602 + }, + { + "epoch": 0.99, + "learning_rate": 1.5644876545303914e-06, + "loss": 0.9238, + "step": 38603 + }, + { + "epoch": 0.99, + "learning_rate": 1.5644648139730219e-06, + "loss": 1.0674, + "step": 38604 + }, + { + "epoch": 0.99, + "learning_rate": 1.564441972983468e-06, + "loss": 0.8564, + "step": 38605 + }, + { + "epoch": 0.99, + "learning_rate": 1.5644191315617468e-06, + "loss": 0.7646, + "step": 38606 + }, + { + "epoch": 0.99, + "learning_rate": 1.5643962897078758e-06, + "loss": 0.6841, + "step": 38607 + }, + { + "epoch": 0.99, + "learning_rate": 1.5643734474218723e-06, + "loss": 0.8428, + "step": 38608 + }, + { + "epoch": 0.99, + "learning_rate": 1.5643506047037543e-06, + "loss": 0.9023, + "step": 38609 + }, + { + "epoch": 0.99, + "learning_rate": 1.5643277615535388e-06, + "loss": 0.8037, + "step": 38610 + }, + { + "epoch": 0.99, + "learning_rate": 1.5643049179712437e-06, + "loss": 0.7842, + "step": 38611 + }, + { + "epoch": 0.99, + "learning_rate": 1.5642820739568862e-06, + "loss": 0.8428, + "step": 38612 + }, + { + "epoch": 0.99, + "learning_rate": 1.5642592295104837e-06, + "loss": 0.731, + "step": 38613 + }, + { + "epoch": 0.99, + "learning_rate": 1.564236384632054e-06, + "loss": 0.8984, + "step": 38614 + }, + { + "epoch": 0.99, + "learning_rate": 1.5642135393216143e-06, + "loss": 0.8975, + "step": 38615 + }, + { + "epoch": 0.99, + "learning_rate": 1.5641906935791825e-06, + "loss": 0.7798, + "step": 38616 + }, + { + "epoch": 0.99, + "learning_rate": 1.5641678474047754e-06, + "loss": 0.7871, + "step": 38617 + }, + { + "epoch": 0.99, + "learning_rate": 1.5641450007984113e-06, + "loss": 0.7349, + "step": 38618 + }, + { + "epoch": 0.99, + "learning_rate": 1.5641221537601072e-06, + "loss": 0.8594, + "step": 38619 + }, + { + "epoch": 0.99, + "learning_rate": 1.5640993062898807e-06, + "loss": 0.9258, + "step": 38620 + }, + { + "epoch": 0.99, + "learning_rate": 1.5640764583877496e-06, + "loss": 0.9033, + "step": 38621 + }, + { + "epoch": 0.99, + "learning_rate": 1.5640536100537305e-06, + "loss": 0.5669, + "step": 38622 + }, + { + "epoch": 0.99, + "learning_rate": 1.5640307612878418e-06, + "loss": 0.7725, + "step": 38623 + }, + { + "epoch": 0.99, + "learning_rate": 1.5640079120901009e-06, + "loss": 0.7568, + "step": 38624 + }, + { + "epoch": 0.99, + "learning_rate": 1.5639850624605246e-06, + "loss": 0.4331, + "step": 38625 + }, + { + "epoch": 0.99, + "learning_rate": 1.5639622123991311e-06, + "loss": 0.876, + "step": 38626 + }, + { + "epoch": 0.99, + "learning_rate": 1.5639393619059377e-06, + "loss": 0.8037, + "step": 38627 + }, + { + "epoch": 0.99, + "learning_rate": 1.5639165109809617e-06, + "loss": 0.8423, + "step": 38628 + }, + { + "epoch": 0.99, + "learning_rate": 1.5638936596242209e-06, + "loss": 0.7329, + "step": 38629 + }, + { + "epoch": 0.99, + "learning_rate": 1.5638708078357325e-06, + "loss": 0.731, + "step": 38630 + }, + { + "epoch": 0.99, + "learning_rate": 1.5638479556155147e-06, + "loss": 0.8359, + "step": 38631 + }, + { + "epoch": 0.99, + "learning_rate": 1.5638251029635838e-06, + "loss": 0.6528, + "step": 38632 + }, + { + "epoch": 0.99, + "learning_rate": 1.5638022498799584e-06, + "loss": 0.7837, + "step": 38633 + }, + { + "epoch": 0.99, + "learning_rate": 1.563779396364655e-06, + "loss": 0.7617, + "step": 38634 + }, + { + "epoch": 0.99, + "learning_rate": 1.5637565424176921e-06, + "loss": 0.9209, + "step": 38635 + }, + { + "epoch": 0.99, + "learning_rate": 1.5637336880390867e-06, + "loss": 0.6646, + "step": 38636 + }, + { + "epoch": 0.99, + "learning_rate": 1.5637108332288562e-06, + "loss": 0.9062, + "step": 38637 + }, + { + "epoch": 0.99, + "learning_rate": 1.5636879779870183e-06, + "loss": 0.7021, + "step": 38638 + }, + { + "epoch": 0.99, + "learning_rate": 1.5636651223135903e-06, + "loss": 0.7568, + "step": 38639 + }, + { + "epoch": 0.99, + "learning_rate": 1.5636422662085899e-06, + "loss": 0.6958, + "step": 38640 + }, + { + "epoch": 0.99, + "learning_rate": 1.563619409672035e-06, + "loss": 0.9609, + "step": 38641 + }, + { + "epoch": 0.99, + "learning_rate": 1.5635965527039421e-06, + "loss": 0.8262, + "step": 38642 + }, + { + "epoch": 0.99, + "learning_rate": 1.5635736953043293e-06, + "loss": 0.8447, + "step": 38643 + }, + { + "epoch": 0.99, + "learning_rate": 1.563550837473214e-06, + "loss": 0.7207, + "step": 38644 + }, + { + "epoch": 0.99, + "learning_rate": 1.5635279792106138e-06, + "loss": 0.877, + "step": 38645 + }, + { + "epoch": 0.99, + "learning_rate": 1.5635051205165462e-06, + "loss": 0.8447, + "step": 38646 + }, + { + "epoch": 0.99, + "learning_rate": 1.5634822613910286e-06, + "loss": 0.9287, + "step": 38647 + }, + { + "epoch": 0.99, + "learning_rate": 1.5634594018340784e-06, + "loss": 0.8906, + "step": 38648 + }, + { + "epoch": 0.99, + "learning_rate": 1.5634365418457133e-06, + "loss": 0.8027, + "step": 38649 + }, + { + "epoch": 0.99, + "learning_rate": 1.563413681425951e-06, + "loss": 0.9658, + "step": 38650 + }, + { + "epoch": 0.99, + "learning_rate": 1.5633908205748085e-06, + "loss": 0.7349, + "step": 38651 + }, + { + "epoch": 0.99, + "learning_rate": 1.5633679592923037e-06, + "loss": 0.8359, + "step": 38652 + }, + { + "epoch": 0.99, + "learning_rate": 1.563345097578454e-06, + "loss": 0.7441, + "step": 38653 + }, + { + "epoch": 0.99, + "learning_rate": 1.5633222354332766e-06, + "loss": 0.9053, + "step": 38654 + }, + { + "epoch": 0.99, + "learning_rate": 1.5632993728567895e-06, + "loss": 1.0596, + "step": 38655 + }, + { + "epoch": 0.99, + "learning_rate": 1.5632765098490099e-06, + "loss": 0.9072, + "step": 38656 + }, + { + "epoch": 0.99, + "learning_rate": 1.5632536464099552e-06, + "loss": 0.9189, + "step": 38657 + }, + { + "epoch": 0.99, + "learning_rate": 1.5632307825396434e-06, + "loss": 0.7476, + "step": 38658 + }, + { + "epoch": 0.99, + "learning_rate": 1.5632079182380915e-06, + "loss": 0.751, + "step": 38659 + }, + { + "epoch": 0.99, + "learning_rate": 1.5631850535053172e-06, + "loss": 0.7214, + "step": 38660 + }, + { + "epoch": 0.99, + "learning_rate": 1.5631621883413382e-06, + "loss": 0.7881, + "step": 38661 + }, + { + "epoch": 0.99, + "learning_rate": 1.5631393227461715e-06, + "loss": 0.8369, + "step": 38662 + }, + { + "epoch": 0.99, + "learning_rate": 1.5631164567198352e-06, + "loss": 0.79, + "step": 38663 + }, + { + "epoch": 0.99, + "learning_rate": 1.5630935902623464e-06, + "loss": 0.8447, + "step": 38664 + }, + { + "epoch": 0.99, + "learning_rate": 1.5630707233737223e-06, + "loss": 0.8276, + "step": 38665 + }, + { + "epoch": 0.99, + "learning_rate": 1.5630478560539815e-06, + "loss": 0.7627, + "step": 38666 + }, + { + "epoch": 0.99, + "learning_rate": 1.5630249883031405e-06, + "loss": 0.8164, + "step": 38667 + }, + { + "epoch": 0.99, + "learning_rate": 1.5630021201212174e-06, + "loss": 0.8584, + "step": 38668 + }, + { + "epoch": 0.99, + "learning_rate": 1.5629792515082292e-06, + "loss": 0.5271, + "step": 38669 + }, + { + "epoch": 0.99, + "learning_rate": 1.5629563824641938e-06, + "loss": 0.7173, + "step": 38670 + }, + { + "epoch": 0.99, + "learning_rate": 1.5629335129891286e-06, + "loss": 0.7891, + "step": 38671 + }, + { + "epoch": 0.99, + "learning_rate": 1.562910643083051e-06, + "loss": 0.8398, + "step": 38672 + }, + { + "epoch": 0.99, + "learning_rate": 1.5628877727459785e-06, + "loss": 1.1045, + "step": 38673 + }, + { + "epoch": 0.99, + "learning_rate": 1.562864901977929e-06, + "loss": 0.7649, + "step": 38674 + }, + { + "epoch": 0.99, + "learning_rate": 1.5628420307789195e-06, + "loss": 0.9004, + "step": 38675 + }, + { + "epoch": 0.99, + "learning_rate": 1.5628191591489681e-06, + "loss": 0.5166, + "step": 38676 + }, + { + "epoch": 0.99, + "learning_rate": 1.5627962870880915e-06, + "loss": 0.8125, + "step": 38677 + }, + { + "epoch": 0.99, + "learning_rate": 1.5627734145963078e-06, + "loss": 0.7144, + "step": 38678 + }, + { + "epoch": 0.99, + "learning_rate": 1.5627505416736347e-06, + "loss": 1.0791, + "step": 38679 + }, + { + "epoch": 0.99, + "learning_rate": 1.562727668320089e-06, + "loss": 0.79, + "step": 38680 + }, + { + "epoch": 0.99, + "learning_rate": 1.5627047945356887e-06, + "loss": 0.7173, + "step": 38681 + }, + { + "epoch": 0.99, + "learning_rate": 1.5626819203204513e-06, + "loss": 0.627, + "step": 38682 + }, + { + "epoch": 0.99, + "learning_rate": 1.562659045674394e-06, + "loss": 0.7139, + "step": 38683 + }, + { + "epoch": 0.99, + "learning_rate": 1.5626361705975345e-06, + "loss": 0.6406, + "step": 38684 + }, + { + "epoch": 0.99, + "learning_rate": 1.5626132950898907e-06, + "loss": 0.7495, + "step": 38685 + }, + { + "epoch": 0.99, + "learning_rate": 1.5625904191514797e-06, + "loss": 0.6714, + "step": 38686 + }, + { + "epoch": 0.99, + "learning_rate": 1.562567542782319e-06, + "loss": 0.8164, + "step": 38687 + }, + { + "epoch": 0.99, + "learning_rate": 1.5625446659824265e-06, + "loss": 0.7549, + "step": 38688 + }, + { + "epoch": 0.99, + "learning_rate": 1.5625217887518187e-06, + "loss": 0.4487, + "step": 38689 + }, + { + "epoch": 0.99, + "learning_rate": 1.5624989110905142e-06, + "loss": 0.8867, + "step": 38690 + }, + { + "epoch": 0.99, + "learning_rate": 1.5624760329985302e-06, + "loss": 0.7119, + "step": 38691 + }, + { + "epoch": 0.99, + "learning_rate": 1.5624531544758843e-06, + "loss": 1.0234, + "step": 38692 + }, + { + "epoch": 0.99, + "learning_rate": 1.5624302755225938e-06, + "loss": 0.8887, + "step": 38693 + }, + { + "epoch": 0.99, + "learning_rate": 1.562407396138676e-06, + "loss": 0.9521, + "step": 38694 + }, + { + "epoch": 0.99, + "learning_rate": 1.562384516324149e-06, + "loss": 0.8428, + "step": 38695 + }, + { + "epoch": 0.99, + "learning_rate": 1.5623616360790301e-06, + "loss": 0.7524, + "step": 38696 + }, + { + "epoch": 0.99, + "learning_rate": 1.5623387554033367e-06, + "loss": 1.0088, + "step": 38697 + }, + { + "epoch": 0.99, + "learning_rate": 1.5623158742970863e-06, + "loss": 0.9414, + "step": 38698 + }, + { + "epoch": 0.99, + "learning_rate": 1.5622929927602964e-06, + "loss": 0.7744, + "step": 38699 + }, + { + "epoch": 0.99, + "learning_rate": 1.5622701107929847e-06, + "loss": 0.7305, + "step": 38700 + }, + { + "epoch": 0.99, + "learning_rate": 1.5622472283951689e-06, + "loss": 0.7524, + "step": 38701 + }, + { + "epoch": 0.99, + "learning_rate": 1.5622243455668657e-06, + "loss": 0.8027, + "step": 38702 + }, + { + "epoch": 0.99, + "learning_rate": 1.5622014623080937e-06, + "loss": 0.8994, + "step": 38703 + }, + { + "epoch": 0.99, + "learning_rate": 1.5621785786188694e-06, + "loss": 0.7646, + "step": 38704 + }, + { + "epoch": 0.99, + "learning_rate": 1.5621556944992112e-06, + "loss": 0.4609, + "step": 38705 + }, + { + "epoch": 0.99, + "learning_rate": 1.5621328099491361e-06, + "loss": 0.6516, + "step": 38706 + }, + { + "epoch": 0.99, + "learning_rate": 1.562109924968662e-06, + "loss": 0.6338, + "step": 38707 + }, + { + "epoch": 0.99, + "learning_rate": 1.5620870395578059e-06, + "loss": 0.8477, + "step": 38708 + }, + { + "epoch": 0.99, + "learning_rate": 1.5620641537165856e-06, + "loss": 0.8535, + "step": 38709 + }, + { + "epoch": 0.99, + "learning_rate": 1.5620412674450185e-06, + "loss": 0.8491, + "step": 38710 + }, + { + "epoch": 0.99, + "learning_rate": 1.5620183807431223e-06, + "loss": 0.9043, + "step": 38711 + }, + { + "epoch": 0.99, + "learning_rate": 1.5619954936109148e-06, + "loss": 0.8306, + "step": 38712 + }, + { + "epoch": 0.99, + "learning_rate": 1.561972606048413e-06, + "loss": 0.7793, + "step": 38713 + }, + { + "epoch": 0.99, + "learning_rate": 1.5619497180556346e-06, + "loss": 0.8682, + "step": 38714 + }, + { + "epoch": 0.99, + "learning_rate": 1.5619268296325969e-06, + "loss": 0.8091, + "step": 38715 + }, + { + "epoch": 0.99, + "learning_rate": 1.5619039407793179e-06, + "loss": 0.8018, + "step": 38716 + }, + { + "epoch": 0.99, + "learning_rate": 1.561881051495815e-06, + "loss": 0.8613, + "step": 38717 + }, + { + "epoch": 0.99, + "learning_rate": 1.5618581617821053e-06, + "loss": 0.7745, + "step": 38718 + }, + { + "epoch": 0.99, + "learning_rate": 1.5618352716382069e-06, + "loss": 0.668, + "step": 38719 + }, + { + "epoch": 0.99, + "learning_rate": 1.561812381064137e-06, + "loss": 0.6682, + "step": 38720 + }, + { + "epoch": 0.99, + "learning_rate": 1.5617894900599134e-06, + "loss": 0.7769, + "step": 38721 + }, + { + "epoch": 0.99, + "learning_rate": 1.561766598625553e-06, + "loss": 1.0215, + "step": 38722 + }, + { + "epoch": 0.99, + "learning_rate": 1.5617437067610739e-06, + "loss": 0.8613, + "step": 38723 + }, + { + "epoch": 0.99, + "learning_rate": 1.5617208144664936e-06, + "loss": 0.6887, + "step": 38724 + }, + { + "epoch": 0.99, + "learning_rate": 1.5616979217418295e-06, + "loss": 0.8271, + "step": 38725 + }, + { + "epoch": 0.99, + "learning_rate": 1.561675028587099e-06, + "loss": 0.73, + "step": 38726 + }, + { + "epoch": 0.99, + "learning_rate": 1.56165213500232e-06, + "loss": 0.7979, + "step": 38727 + }, + { + "epoch": 0.99, + "learning_rate": 1.5616292409875093e-06, + "loss": 0.8418, + "step": 38728 + }, + { + "epoch": 0.99, + "learning_rate": 1.5616063465426855e-06, + "loss": 1.0039, + "step": 38729 + }, + { + "epoch": 0.99, + "learning_rate": 1.561583451667865e-06, + "loss": 0.8164, + "step": 38730 + }, + { + "epoch": 0.99, + "learning_rate": 1.5615605563630663e-06, + "loss": 0.731, + "step": 38731 + }, + { + "epoch": 0.99, + "learning_rate": 1.5615376606283064e-06, + "loss": 0.9707, + "step": 38732 + }, + { + "epoch": 0.99, + "learning_rate": 1.561514764463603e-06, + "loss": 0.6948, + "step": 38733 + }, + { + "epoch": 0.99, + "learning_rate": 1.5614918678689733e-06, + "loss": 0.9556, + "step": 38734 + }, + { + "epoch": 0.99, + "learning_rate": 1.561468970844435e-06, + "loss": 0.9126, + "step": 38735 + }, + { + "epoch": 0.99, + "learning_rate": 1.561446073390006e-06, + "loss": 0.9297, + "step": 38736 + }, + { + "epoch": 0.99, + "learning_rate": 1.5614231755057038e-06, + "loss": 0.5698, + "step": 38737 + }, + { + "epoch": 0.99, + "learning_rate": 1.5614002771915451e-06, + "loss": 0.7041, + "step": 38738 + }, + { + "epoch": 0.99, + "learning_rate": 1.5613773784475484e-06, + "loss": 0.8086, + "step": 38739 + }, + { + "epoch": 0.99, + "learning_rate": 1.5613544792737305e-06, + "loss": 0.8301, + "step": 38740 + }, + { + "epoch": 0.99, + "learning_rate": 1.5613315796701099e-06, + "loss": 0.7183, + "step": 38741 + }, + { + "epoch": 0.99, + "learning_rate": 1.5613086796367033e-06, + "loss": 0.9199, + "step": 38742 + }, + { + "epoch": 0.99, + "learning_rate": 1.561285779173528e-06, + "loss": 0.8545, + "step": 38743 + }, + { + "epoch": 0.99, + "learning_rate": 1.5612628782806025e-06, + "loss": 0.7959, + "step": 38744 + }, + { + "epoch": 0.99, + "learning_rate": 1.5612399769579434e-06, + "loss": 0.623, + "step": 38745 + }, + { + "epoch": 0.99, + "learning_rate": 1.5612170752055694e-06, + "loss": 0.8213, + "step": 38746 + }, + { + "epoch": 0.99, + "learning_rate": 1.5611941730234966e-06, + "loss": 0.6658, + "step": 38747 + }, + { + "epoch": 0.99, + "learning_rate": 1.5611712704117435e-06, + "loss": 0.6792, + "step": 38748 + }, + { + "epoch": 0.99, + "learning_rate": 1.5611483673703272e-06, + "loss": 0.6658, + "step": 38749 + }, + { + "epoch": 0.99, + "learning_rate": 1.5611254638992653e-06, + "loss": 0.9492, + "step": 38750 + }, + { + "epoch": 0.99, + "learning_rate": 1.5611025599985759e-06, + "loss": 1.0156, + "step": 38751 + }, + { + "epoch": 0.99, + "learning_rate": 1.5610796556682755e-06, + "loss": 0.7266, + "step": 38752 + }, + { + "epoch": 0.99, + "learning_rate": 1.5610567509083827e-06, + "loss": 0.8203, + "step": 38753 + }, + { + "epoch": 0.99, + "learning_rate": 1.5610338457189142e-06, + "loss": 0.7207, + "step": 38754 + }, + { + "epoch": 0.99, + "learning_rate": 1.561010940099888e-06, + "loss": 0.5134, + "step": 38755 + }, + { + "epoch": 0.99, + "learning_rate": 1.5609880340513215e-06, + "loss": 0.8379, + "step": 38756 + }, + { + "epoch": 0.99, + "learning_rate": 1.5609651275732323e-06, + "loss": 0.7632, + "step": 38757 + }, + { + "epoch": 0.99, + "learning_rate": 1.5609422206656379e-06, + "loss": 0.833, + "step": 38758 + }, + { + "epoch": 0.99, + "learning_rate": 1.5609193133285558e-06, + "loss": 0.793, + "step": 38759 + }, + { + "epoch": 0.99, + "learning_rate": 1.5608964055620035e-06, + "loss": 0.833, + "step": 38760 + }, + { + "epoch": 0.99, + "learning_rate": 1.560873497365999e-06, + "loss": 0.957, + "step": 38761 + }, + { + "epoch": 0.99, + "learning_rate": 1.560850588740559e-06, + "loss": 0.9746, + "step": 38762 + }, + { + "epoch": 0.99, + "learning_rate": 1.5608276796857016e-06, + "loss": 0.552, + "step": 38763 + }, + { + "epoch": 0.99, + "learning_rate": 1.5608047702014444e-06, + "loss": 0.6558, + "step": 38764 + }, + { + "epoch": 0.99, + "learning_rate": 1.5607818602878044e-06, + "loss": 0.6611, + "step": 38765 + }, + { + "epoch": 0.99, + "learning_rate": 1.5607589499448e-06, + "loss": 0.9717, + "step": 38766 + }, + { + "epoch": 0.99, + "learning_rate": 1.560736039172448e-06, + "loss": 0.6641, + "step": 38767 + }, + { + "epoch": 0.99, + "learning_rate": 1.560713127970766e-06, + "loss": 0.9736, + "step": 38768 + }, + { + "epoch": 0.99, + "learning_rate": 1.5606902163397723e-06, + "loss": 0.8633, + "step": 38769 + }, + { + "epoch": 0.99, + "learning_rate": 1.5606673042794833e-06, + "loss": 0.4866, + "step": 38770 + }, + { + "epoch": 0.99, + "learning_rate": 1.5606443917899176e-06, + "loss": 0.8662, + "step": 38771 + }, + { + "epoch": 0.99, + "learning_rate": 1.5606214788710918e-06, + "loss": 0.8223, + "step": 38772 + }, + { + "epoch": 0.99, + "learning_rate": 1.5605985655230243e-06, + "loss": 0.9023, + "step": 38773 + }, + { + "epoch": 0.99, + "learning_rate": 1.560575651745732e-06, + "loss": 0.8623, + "step": 38774 + }, + { + "epoch": 0.99, + "learning_rate": 1.560552737539233e-06, + "loss": 0.7778, + "step": 38775 + }, + { + "epoch": 0.99, + "learning_rate": 1.5605298229035443e-06, + "loss": 0.7236, + "step": 38776 + }, + { + "epoch": 0.99, + "learning_rate": 1.5605069078386838e-06, + "loss": 0.812, + "step": 38777 + }, + { + "epoch": 0.99, + "learning_rate": 1.5604839923446686e-06, + "loss": 0.8145, + "step": 38778 + }, + { + "epoch": 0.99, + "learning_rate": 1.5604610764215172e-06, + "loss": 0.7432, + "step": 38779 + }, + { + "epoch": 0.99, + "learning_rate": 1.560438160069246e-06, + "loss": 0.7959, + "step": 38780 + }, + { + "epoch": 0.99, + "learning_rate": 1.5604152432878733e-06, + "loss": 0.9082, + "step": 38781 + }, + { + "epoch": 0.99, + "learning_rate": 1.5603923260774163e-06, + "loss": 0.9492, + "step": 38782 + }, + { + "epoch": 0.99, + "learning_rate": 1.5603694084378926e-06, + "loss": 0.5933, + "step": 38783 + }, + { + "epoch": 0.99, + "learning_rate": 1.56034649036932e-06, + "loss": 1.0645, + "step": 38784 + }, + { + "epoch": 0.99, + "learning_rate": 1.5603235718717159e-06, + "loss": 0.7393, + "step": 38785 + }, + { + "epoch": 0.99, + "learning_rate": 1.5603006529450977e-06, + "loss": 0.623, + "step": 38786 + }, + { + "epoch": 0.99, + "learning_rate": 1.560277733589483e-06, + "loss": 0.8682, + "step": 38787 + }, + { + "epoch": 0.99, + "learning_rate": 1.5602548138048897e-06, + "loss": 0.7444, + "step": 38788 + }, + { + "epoch": 0.99, + "learning_rate": 1.5602318935913345e-06, + "loss": 0.9355, + "step": 38789 + }, + { + "epoch": 0.99, + "learning_rate": 1.560208972948836e-06, + "loss": 0.9229, + "step": 38790 + }, + { + "epoch": 0.99, + "learning_rate": 1.560186051877411e-06, + "loss": 0.8081, + "step": 38791 + }, + { + "epoch": 0.99, + "learning_rate": 1.5601631303770772e-06, + "loss": 0.9082, + "step": 38792 + }, + { + "epoch": 0.99, + "learning_rate": 1.5601402084478526e-06, + "loss": 0.958, + "step": 38793 + }, + { + "epoch": 0.99, + "learning_rate": 1.560117286089754e-06, + "loss": 0.6753, + "step": 38794 + }, + { + "epoch": 0.99, + "learning_rate": 1.5600943633027995e-06, + "loss": 0.7676, + "step": 38795 + }, + { + "epoch": 0.99, + "learning_rate": 1.560071440087007e-06, + "loss": 1.1025, + "step": 38796 + }, + { + "epoch": 0.99, + "learning_rate": 1.560048516442393e-06, + "loss": 0.8906, + "step": 38797 + }, + { + "epoch": 0.99, + "learning_rate": 1.5600255923689756e-06, + "loss": 0.6279, + "step": 38798 + }, + { + "epoch": 0.99, + "learning_rate": 1.5600026678667723e-06, + "loss": 0.8643, + "step": 38799 + }, + { + "epoch": 0.99, + "learning_rate": 1.559979742935801e-06, + "loss": 0.6885, + "step": 38800 + }, + { + "epoch": 0.99, + "learning_rate": 1.5599568175760788e-06, + "loss": 0.9438, + "step": 38801 + }, + { + "epoch": 0.99, + "learning_rate": 1.5599338917876234e-06, + "loss": 0.958, + "step": 38802 + }, + { + "epoch": 0.99, + "learning_rate": 1.5599109655704523e-06, + "loss": 0.96, + "step": 38803 + }, + { + "epoch": 0.99, + "learning_rate": 1.5598880389245834e-06, + "loss": 0.7954, + "step": 38804 + }, + { + "epoch": 0.99, + "learning_rate": 1.5598651118500338e-06, + "loss": 0.7969, + "step": 38805 + }, + { + "epoch": 0.99, + "learning_rate": 1.5598421843468212e-06, + "loss": 0.7417, + "step": 38806 + }, + { + "epoch": 0.99, + "learning_rate": 1.559819256414963e-06, + "loss": 0.8574, + "step": 38807 + }, + { + "epoch": 0.99, + "learning_rate": 1.5597963280544772e-06, + "loss": 0.877, + "step": 38808 + }, + { + "epoch": 0.99, + "learning_rate": 1.559773399265381e-06, + "loss": 0.8281, + "step": 38809 + }, + { + "epoch": 0.99, + "learning_rate": 1.559750470047692e-06, + "loss": 0.9531, + "step": 38810 + }, + { + "epoch": 0.99, + "learning_rate": 1.559727540401428e-06, + "loss": 0.9082, + "step": 38811 + }, + { + "epoch": 0.99, + "learning_rate": 1.5597046103266064e-06, + "loss": 0.8955, + "step": 38812 + }, + { + "epoch": 0.99, + "learning_rate": 1.5596816798232447e-06, + "loss": 0.6003, + "step": 38813 + }, + { + "epoch": 0.99, + "learning_rate": 1.5596587488913602e-06, + "loss": 0.9033, + "step": 38814 + }, + { + "epoch": 0.99, + "learning_rate": 1.5596358175309707e-06, + "loss": 0.8633, + "step": 38815 + }, + { + "epoch": 0.99, + "learning_rate": 1.5596128857420944e-06, + "loss": 0.6421, + "step": 38816 + }, + { + "epoch": 0.99, + "learning_rate": 1.5595899535247474e-06, + "loss": 0.8096, + "step": 38817 + }, + { + "epoch": 0.99, + "learning_rate": 1.5595670208789486e-06, + "loss": 1.0049, + "step": 38818 + }, + { + "epoch": 0.99, + "learning_rate": 1.5595440878047148e-06, + "loss": 0.8682, + "step": 38819 + }, + { + "epoch": 0.99, + "learning_rate": 1.5595211543020642e-06, + "loss": 0.9082, + "step": 38820 + }, + { + "epoch": 1.0, + "learning_rate": 1.559498220371014e-06, + "loss": 1.0254, + "step": 38821 + }, + { + "epoch": 1.0, + "learning_rate": 1.5594752860115813e-06, + "loss": 0.8184, + "step": 38822 + }, + { + "epoch": 1.0, + "learning_rate": 1.559452351223784e-06, + "loss": 0.5039, + "step": 38823 + }, + { + "epoch": 1.0, + "learning_rate": 1.55942941600764e-06, + "loss": 0.7378, + "step": 38824 + }, + { + "epoch": 1.0, + "learning_rate": 1.5594064803631667e-06, + "loss": 0.9668, + "step": 38825 + }, + { + "epoch": 1.0, + "learning_rate": 1.5593835442903816e-06, + "loss": 0.6909, + "step": 38826 + }, + { + "epoch": 1.0, + "learning_rate": 1.5593606077893021e-06, + "loss": 0.9844, + "step": 38827 + }, + { + "epoch": 1.0, + "learning_rate": 1.559337670859946e-06, + "loss": 0.9746, + "step": 38828 + }, + { + "epoch": 1.0, + "learning_rate": 1.5593147335023308e-06, + "loss": 0.7148, + "step": 38829 + }, + { + "epoch": 1.0, + "learning_rate": 1.5592917957164739e-06, + "loss": 0.8311, + "step": 38830 + }, + { + "epoch": 1.0, + "learning_rate": 1.5592688575023933e-06, + "loss": 0.9814, + "step": 38831 + }, + { + "epoch": 1.0, + "learning_rate": 1.559245918860106e-06, + "loss": 1.0566, + "step": 38832 + }, + { + "epoch": 1.0, + "learning_rate": 1.55922297978963e-06, + "loss": 0.9863, + "step": 38833 + }, + { + "epoch": 1.0, + "learning_rate": 1.5592000402909823e-06, + "loss": 0.793, + "step": 38834 + }, + { + "epoch": 1.0, + "learning_rate": 1.559177100364181e-06, + "loss": 0.7163, + "step": 38835 + }, + { + "epoch": 1.0, + "learning_rate": 1.5591541600092439e-06, + "loss": 0.5093, + "step": 38836 + }, + { + "epoch": 1.0, + "learning_rate": 1.5591312192261875e-06, + "loss": 0.8193, + "step": 38837 + }, + { + "epoch": 1.0, + "learning_rate": 1.5591082780150306e-06, + "loss": 0.7988, + "step": 38838 + }, + { + "epoch": 1.0, + "learning_rate": 1.55908533637579e-06, + "loss": 1.0645, + "step": 38839 + }, + { + "epoch": 1.0, + "learning_rate": 1.5590623943084832e-06, + "loss": 0.9541, + "step": 38840 + }, + { + "epoch": 1.0, + "learning_rate": 1.5590394518131284e-06, + "loss": 0.8643, + "step": 38841 + }, + { + "epoch": 1.0, + "learning_rate": 1.5590165088897427e-06, + "loss": 0.8574, + "step": 38842 + }, + { + "epoch": 1.0, + "learning_rate": 1.5589935655383437e-06, + "loss": 0.8662, + "step": 38843 + }, + { + "epoch": 1.0, + "learning_rate": 1.5589706217589492e-06, + "loss": 0.75, + "step": 38844 + }, + { + "epoch": 1.0, + "learning_rate": 1.5589476775515765e-06, + "loss": 0.7969, + "step": 38845 + }, + { + "epoch": 1.0, + "learning_rate": 1.558924732916243e-06, + "loss": 0.8398, + "step": 38846 + }, + { + "epoch": 1.0, + "learning_rate": 1.5589017878529669e-06, + "loss": 0.7419, + "step": 38847 + }, + { + "epoch": 1.0, + "learning_rate": 1.5588788423617652e-06, + "loss": 0.54, + "step": 38848 + }, + { + "epoch": 1.0, + "learning_rate": 1.5588558964426557e-06, + "loss": 0.8096, + "step": 38849 + }, + { + "epoch": 1.0, + "learning_rate": 1.5588329500956562e-06, + "loss": 0.7969, + "step": 38850 + }, + { + "epoch": 1.0, + "learning_rate": 1.5588100033207834e-06, + "loss": 0.9111, + "step": 38851 + }, + { + "epoch": 1.0, + "learning_rate": 1.5587870561180561e-06, + "loss": 0.8096, + "step": 38852 + }, + { + "epoch": 1.0, + "learning_rate": 1.558764108487491e-06, + "loss": 0.6445, + "step": 38853 + }, + { + "epoch": 1.0, + "learning_rate": 1.5587411604291056e-06, + "loss": 0.8232, + "step": 38854 + }, + { + "epoch": 1.0, + "learning_rate": 1.5587182119429182e-06, + "loss": 0.7705, + "step": 38855 + }, + { + "epoch": 1.0, + "learning_rate": 1.5586952630289457e-06, + "loss": 0.575, + "step": 38856 + }, + { + "epoch": 1.0, + "learning_rate": 1.5586723136872061e-06, + "loss": 0.8975, + "step": 38857 + }, + { + "epoch": 1.0, + "learning_rate": 1.5586493639177168e-06, + "loss": 0.6479, + "step": 38858 + }, + { + "epoch": 1.0, + "learning_rate": 1.5586264137204953e-06, + "loss": 0.8877, + "step": 38859 + }, + { + "epoch": 1.0, + "learning_rate": 1.5586034630955592e-06, + "loss": 0.9238, + "step": 38860 + }, + { + "epoch": 1.0, + "learning_rate": 1.5585805120429266e-06, + "loss": 0.9971, + "step": 38861 + }, + { + "epoch": 1.0, + "learning_rate": 1.558557560562614e-06, + "loss": 0.7666, + "step": 38862 + }, + { + "epoch": 1.0, + "learning_rate": 1.5585346086546397e-06, + "loss": 0.7397, + "step": 38863 + }, + { + "epoch": 1.0, + "learning_rate": 1.5585116563190211e-06, + "loss": 0.9297, + "step": 38864 + }, + { + "epoch": 1.0, + "learning_rate": 1.558488703555776e-06, + "loss": 0.7681, + "step": 38865 + }, + { + "epoch": 1.0, + "learning_rate": 1.5584657503649217e-06, + "loss": 0.8994, + "step": 38866 + }, + { + "epoch": 1.0, + "learning_rate": 1.5584427967464757e-06, + "loss": 0.9434, + "step": 38867 + }, + { + "epoch": 1.0, + "learning_rate": 1.5584198427004558e-06, + "loss": 0.8135, + "step": 38868 + }, + { + "epoch": 1.0, + "learning_rate": 1.5583968882268796e-06, + "loss": 0.9639, + "step": 38869 + }, + { + "epoch": 1.0, + "learning_rate": 1.5583739333257646e-06, + "loss": 0.8359, + "step": 38870 + }, + { + "epoch": 1.0, + "learning_rate": 1.5583509779971282e-06, + "loss": 0.9531, + "step": 38871 + }, + { + "epoch": 1.0, + "learning_rate": 1.558328022240988e-06, + "loss": 0.7246, + "step": 38872 + }, + { + "epoch": 1.0, + "learning_rate": 1.558305066057362e-06, + "loss": 0.9238, + "step": 38873 + }, + { + "epoch": 1.0, + "learning_rate": 1.5582821094462673e-06, + "loss": 0.6797, + "step": 38874 + }, + { + "epoch": 1.0, + "learning_rate": 1.558259152407722e-06, + "loss": 0.731, + "step": 38875 + }, + { + "epoch": 1.0, + "learning_rate": 1.558236194941743e-06, + "loss": 0.8545, + "step": 38876 + }, + { + "epoch": 1.0, + "learning_rate": 1.5582132370483482e-06, + "loss": 0.916, + "step": 38877 + }, + { + "epoch": 1.0, + "learning_rate": 1.5581902787275554e-06, + "loss": 0.7898, + "step": 38878 + }, + { + "epoch": 1.0, + "learning_rate": 1.5581673199793817e-06, + "loss": 0.8613, + "step": 38879 + }, + { + "epoch": 1.0, + "learning_rate": 1.5581443608038454e-06, + "loss": 0.71, + "step": 38880 + }, + { + "epoch": 1.0, + "learning_rate": 1.5581214012009634e-06, + "loss": 0.7925, + "step": 38881 + }, + { + "epoch": 1.0, + "learning_rate": 1.5580984411707535e-06, + "loss": 0.7427, + "step": 38882 + }, + { + "epoch": 1.0, + "learning_rate": 1.5580754807132328e-06, + "loss": 0.9673, + "step": 38883 + }, + { + "epoch": 1.0, + "learning_rate": 1.5580525198284198e-06, + "loss": 1.0625, + "step": 38884 + }, + { + "epoch": 1.0, + "learning_rate": 1.5580295585163318e-06, + "loss": 0.8447, + "step": 38885 + }, + { + "epoch": 1.0, + "learning_rate": 1.5580065967769862e-06, + "loss": 0.7485, + "step": 38886 + }, + { + "epoch": 1.0, + "learning_rate": 1.5579836346104002e-06, + "loss": 0.8237, + "step": 38887 + }, + { + "epoch": 1.0, + "learning_rate": 1.5579606720165921e-06, + "loss": 0.7344, + "step": 38888 + }, + { + "epoch": 1.0, + "learning_rate": 1.5579377089955792e-06, + "loss": 0.9062, + "step": 38889 + }, + { + "epoch": 1.0, + "learning_rate": 1.5579147455473791e-06, + "loss": 0.5581, + "step": 38890 + }, + { + "epoch": 1.0, + "learning_rate": 1.557891781672009e-06, + "loss": 0.9746, + "step": 38891 + }, + { + "epoch": 1.0, + "learning_rate": 1.5578688173694872e-06, + "loss": 0.9331, + "step": 38892 + }, + { + "epoch": 1.0, + "learning_rate": 1.5578458526398305e-06, + "loss": 0.6719, + "step": 38893 + }, + { + "epoch": 1.0, + "learning_rate": 1.5578228874830572e-06, + "loss": 0.8477, + "step": 38894 + }, + { + "epoch": 1.0, + "learning_rate": 1.5577999218991847e-06, + "loss": 0.7295, + "step": 38895 + }, + { + "epoch": 1.0, + "learning_rate": 1.5577769558882302e-06, + "loss": 1.0117, + "step": 38896 + }, + { + "epoch": 1.0, + "learning_rate": 1.5577539894502114e-06, + "loss": 0.6494, + "step": 38897 + }, + { + "epoch": 1.0, + "learning_rate": 1.557731022585146e-06, + "loss": 0.7686, + "step": 38898 + }, + { + "epoch": 1.0, + "learning_rate": 1.5577080552930516e-06, + "loss": 0.5503, + "step": 38899 + }, + { + "epoch": 1.0, + "learning_rate": 1.5576850875739465e-06, + "loss": 0.7549, + "step": 38900 + }, + { + "epoch": 1.0, + "learning_rate": 1.5576621194278468e-06, + "loss": 0.6912, + "step": 38901 + }, + { + "epoch": 1.0, + "learning_rate": 1.5576391508547713e-06, + "loss": 0.626, + "step": 38902 + }, + { + "epoch": 1.0, + "learning_rate": 1.5576161818547366e-06, + "loss": 0.9219, + "step": 38903 + }, + { + "epoch": 1.0, + "learning_rate": 1.5575932124277612e-06, + "loss": 0.7236, + "step": 38904 + }, + { + "epoch": 1.0, + "learning_rate": 1.5575702425738625e-06, + "loss": 1.0332, + "step": 38905 + }, + { + "epoch": 1.0, + "learning_rate": 1.5575472722930576e-06, + "loss": 0.5837, + "step": 38906 + }, + { + "epoch": 1.0, + "learning_rate": 1.5575243015853644e-06, + "loss": 0.7754, + "step": 38907 + }, + { + "epoch": 1.0, + "learning_rate": 1.5575013304508008e-06, + "loss": 0.8252, + "step": 38908 + }, + { + "epoch": 1.0, + "learning_rate": 1.5574783588893837e-06, + "loss": 0.9248, + "step": 38909 + }, + { + "epoch": 1.0, + "learning_rate": 1.557455386901131e-06, + "loss": 0.8271, + "step": 38910 + }, + { + "epoch": 1.0, + "learning_rate": 1.5574324144860605e-06, + "loss": 0.9668, + "step": 38911 + }, + { + "epoch": 1.0, + "learning_rate": 1.55740944164419e-06, + "loss": 0.8867, + "step": 38912 + }, + { + "epoch": 1.0, + "learning_rate": 1.557386468375536e-06, + "loss": 1.0098, + "step": 38913 + }, + { + "epoch": 1.0, + "learning_rate": 1.5573634946801173e-06, + "loss": 0.6523, + "step": 38914 + }, + { + "epoch": 1.0, + "learning_rate": 1.557340520557951e-06, + "loss": 1.0098, + "step": 38915 + }, + { + "epoch": 1.0, + "learning_rate": 1.5573175460090542e-06, + "loss": 0.9346, + "step": 38916 + }, + { + "epoch": 1.0, + "learning_rate": 1.5572945710334455e-06, + "loss": 0.8887, + "step": 38917 + }, + { + "epoch": 1.0, + "learning_rate": 1.5572715956311417e-06, + "loss": 0.8252, + "step": 38918 + }, + { + "epoch": 1.0, + "learning_rate": 1.5572486198021607e-06, + "loss": 0.6855, + "step": 38919 + }, + { + "epoch": 1.0, + "learning_rate": 1.5572256435465203e-06, + "loss": 0.8628, + "step": 38920 + }, + { + "epoch": 1.0, + "learning_rate": 1.5572026668642377e-06, + "loss": 0.9092, + "step": 38921 + }, + { + "epoch": 1.0, + "learning_rate": 1.5571796897553306e-06, + "loss": 0.7983, + "step": 38922 + }, + { + "epoch": 1.0, + "learning_rate": 1.5571567122198167e-06, + "loss": 1.0938, + "step": 38923 + }, + { + "epoch": 1.0, + "learning_rate": 1.5571337342577132e-06, + "loss": 0.7959, + "step": 38924 + }, + { + "epoch": 1.0, + "learning_rate": 1.5571107558690387e-06, + "loss": 0.9697, + "step": 38925 + }, + { + "epoch": 1.0, + "learning_rate": 1.5570877770538096e-06, + "loss": 0.9141, + "step": 38926 + }, + { + "epoch": 1.0, + "learning_rate": 1.557064797812044e-06, + "loss": 0.8447, + "step": 38927 + }, + { + "epoch": 1.0, + "learning_rate": 1.5570418181437597e-06, + "loss": 0.8945, + "step": 38928 + }, + { + "epoch": 1.0, + "learning_rate": 1.557018838048974e-06, + "loss": 0.7354, + "step": 38929 + }, + { + "epoch": 1.0, + "learning_rate": 1.5569958575277045e-06, + "loss": 0.7402, + "step": 38930 + }, + { + "epoch": 1.0, + "learning_rate": 1.556972876579969e-06, + "loss": 0.9219, + "step": 38931 + }, + { + "epoch": 1.0, + "learning_rate": 1.5569498952057849e-06, + "loss": 0.8545, + "step": 38932 + }, + { + "epoch": 1.0, + "learning_rate": 1.55692691340517e-06, + "loss": 0.9346, + "step": 38933 + }, + { + "epoch": 1.0, + "learning_rate": 1.5569039311781417e-06, + "loss": 0.832, + "step": 38934 + }, + { + "epoch": 1.0, + "learning_rate": 1.5568809485247174e-06, + "loss": 0.7603, + "step": 38935 + }, + { + "epoch": 1.0, + "learning_rate": 1.5568579654449154e-06, + "loss": 1.0693, + "step": 38936 + }, + { + "epoch": 1.0, + "learning_rate": 1.5568349819387527e-06, + "loss": 0.9473, + "step": 38937 + }, + { + "epoch": 1.0, + "learning_rate": 1.556811998006247e-06, + "loss": 0.7842, + "step": 38938 + }, + { + "epoch": 1.0, + "learning_rate": 1.556789013647416e-06, + "loss": 0.6128, + "step": 38939 + }, + { + "epoch": 1.0, + "learning_rate": 1.5567660288622773e-06, + "loss": 0.8252, + "step": 38940 + }, + { + "epoch": 1.0, + "learning_rate": 1.5567430436508485e-06, + "loss": 0.7295, + "step": 38941 + }, + { + "epoch": 1.0, + "learning_rate": 1.556720058013147e-06, + "loss": 0.9277, + "step": 38942 + }, + { + "epoch": 1.0, + "learning_rate": 1.5566970719491903e-06, + "loss": 0.8887, + "step": 38943 + }, + { + "epoch": 1.0, + "learning_rate": 1.5566740854589967e-06, + "loss": 0.7471, + "step": 38944 + }, + { + "epoch": 1.0, + "learning_rate": 1.5566510985425834e-06, + "loss": 0.6475, + "step": 38945 + }, + { + "epoch": 1.0, + "learning_rate": 1.5566281111999678e-06, + "loss": 0.8242, + "step": 38946 + }, + { + "epoch": 1.0, + "learning_rate": 1.5566051234311674e-06, + "loss": 0.9287, + "step": 38947 + }, + { + "epoch": 1.0, + "learning_rate": 1.5565821352362004e-06, + "loss": 0.5776, + "step": 38948 + }, + { + "epoch": 1.0, + "learning_rate": 1.5565591466150837e-06, + "loss": 0.7651, + "step": 38949 + }, + { + "epoch": 1.0, + "learning_rate": 1.5565361575678355e-06, + "loss": 0.6772, + "step": 38950 + }, + { + "epoch": 1.0, + "learning_rate": 1.5565131680944731e-06, + "loss": 0.9268, + "step": 38951 + }, + { + "epoch": 1.0, + "learning_rate": 1.5564901781950143e-06, + "loss": 0.8066, + "step": 38952 + }, + { + "epoch": 1.0, + "learning_rate": 1.5564671878694765e-06, + "loss": 0.6235, + "step": 38953 + }, + { + "epoch": 1.0, + "learning_rate": 1.556444197117877e-06, + "loss": 0.6943, + "step": 38954 + }, + { + "epoch": 1.0, + "learning_rate": 1.556421205940234e-06, + "loss": 0.6968, + "step": 38955 + }, + { + "epoch": 1.0, + "learning_rate": 1.556398214336565e-06, + "loss": 0.7529, + "step": 38956 + }, + { + "epoch": 1.0, + "learning_rate": 1.5563752223068876e-06, + "loss": 0.6217, + "step": 38957 + }, + { + "epoch": 1.0, + "learning_rate": 1.5563522298512188e-06, + "loss": 0.845, + "step": 38958 + }, + { + "epoch": 1.0, + "learning_rate": 1.556329236969577e-06, + "loss": 0.8364, + "step": 38959 + }, + { + "epoch": 1.0, + "learning_rate": 1.5563062436619797e-06, + "loss": 0.9424, + "step": 38960 + }, + { + "epoch": 1.0, + "learning_rate": 1.5562832499284438e-06, + "loss": 0.707, + "step": 38961 + }, + { + "epoch": 1.0, + "learning_rate": 1.5562602557689877e-06, + "loss": 0.7671, + "step": 38962 + }, + { + "epoch": 1.0, + "learning_rate": 1.5562372611836285e-06, + "loss": 0.6191, + "step": 38963 + }, + { + "epoch": 1.0, + "learning_rate": 1.5562142661723842e-06, + "loss": 0.9873, + "step": 38964 + }, + { + "epoch": 1.0, + "learning_rate": 1.5561912707352722e-06, + "loss": 0.4355, + "step": 38965 + }, + { + "epoch": 1.0, + "learning_rate": 1.5561682748723102e-06, + "loss": 0.958, + "step": 38966 + }, + { + "epoch": 1.0, + "learning_rate": 1.5561452785835154e-06, + "loss": 0.8555, + "step": 38967 + }, + { + "epoch": 1.0, + "learning_rate": 1.5561222818689057e-06, + "loss": 0.5605, + "step": 38968 + }, + { + "epoch": 1.0, + "learning_rate": 1.5560992847284991e-06, + "loss": 1.0469, + "step": 38969 + }, + { + "epoch": 1.0, + "learning_rate": 1.5560762871623128e-06, + "loss": 0.8032, + "step": 38970 + }, + { + "epoch": 1.0, + "learning_rate": 1.5560532891703645e-06, + "loss": 0.6294, + "step": 38971 + }, + { + "epoch": 1.0, + "learning_rate": 1.5560302907526713e-06, + "loss": 0.7207, + "step": 38972 + }, + { + "epoch": 1.0, + "learning_rate": 1.5560072919092514e-06, + "loss": 0.8174, + "step": 38973 + }, + { + "epoch": 1.0, + "learning_rate": 1.5559842926401227e-06, + "loss": 0.7979, + "step": 38974 + }, + { + "epoch": 1.0, + "learning_rate": 1.5559612929453023e-06, + "loss": 0.7676, + "step": 38975 + }, + { + "epoch": 1.0, + "learning_rate": 1.5559382928248076e-06, + "loss": 0.8223, + "step": 38976 + }, + { + "epoch": 1.0, + "learning_rate": 1.5559152922786569e-06, + "loss": 0.915, + "step": 38977 + }, + { + "epoch": 1.0, + "learning_rate": 1.555892291306867e-06, + "loss": 0.8789, + "step": 38978 + }, + { + "epoch": 1.0, + "learning_rate": 1.5558692899094562e-06, + "loss": 1.0479, + "step": 38979 + }, + { + "epoch": 1.0, + "learning_rate": 1.5558462880864418e-06, + "loss": 0.6592, + "step": 38980 + }, + { + "epoch": 1.0, + "learning_rate": 1.5558232858378414e-06, + "loss": 0.7261, + "step": 38981 + }, + { + "epoch": 1.0, + "learning_rate": 1.5558002831636725e-06, + "loss": 0.7463, + "step": 38982 + }, + { + "epoch": 1.0, + "learning_rate": 1.5557772800639533e-06, + "loss": 0.7305, + "step": 38983 + }, + { + "epoch": 1.0, + "learning_rate": 1.5557542765387006e-06, + "loss": 0.8403, + "step": 38984 + }, + { + "epoch": 1.0, + "learning_rate": 1.5557312725879327e-06, + "loss": 0.6982, + "step": 38985 + }, + { + "epoch": 1.0, + "learning_rate": 1.5557082682116667e-06, + "loss": 0.8213, + "step": 38986 + }, + { + "epoch": 1.0, + "learning_rate": 1.5556852634099205e-06, + "loss": 0.8779, + "step": 38987 + }, + { + "epoch": 1.0, + "learning_rate": 1.5556622581827117e-06, + "loss": 0.9658, + "step": 38988 + }, + { + "epoch": 1.0, + "learning_rate": 1.5556392525300578e-06, + "loss": 0.7812, + "step": 38989 + }, + { + "epoch": 1.0, + "learning_rate": 1.5556162464519766e-06, + "loss": 1.0293, + "step": 38990 + }, + { + "epoch": 1.0, + "learning_rate": 1.5555932399484854e-06, + "loss": 0.8198, + "step": 38991 + }, + { + "epoch": 1.0, + "learning_rate": 1.5555702330196021e-06, + "loss": 0.8994, + "step": 38992 + }, + { + "epoch": 1.0, + "learning_rate": 1.5555472256653445e-06, + "loss": 0.9023, + "step": 38993 + }, + { + "epoch": 1.0, + "learning_rate": 1.5555242178857295e-06, + "loss": 0.9492, + "step": 38994 + }, + { + "epoch": 1.0, + "learning_rate": 1.5555012096807754e-06, + "loss": 0.9395, + "step": 38995 + }, + { + "epoch": 1.0, + "learning_rate": 1.5554782010504992e-06, + "loss": 0.6084, + "step": 38996 + }, + { + "epoch": 1.0, + "learning_rate": 1.5554551919949193e-06, + "loss": 0.7036, + "step": 38997 + }, + { + "epoch": 1.0, + "learning_rate": 1.5554321825140529e-06, + "loss": 0.9014, + "step": 38998 + }, + { + "epoch": 1.0, + "learning_rate": 1.5554091726079172e-06, + "loss": 0.8135, + "step": 38999 + }, + { + "epoch": 1.0, + "learning_rate": 1.5553861622765306e-06, + "loss": 0.8291, + "step": 39000 + }, + { + "epoch": 1.0, + "learning_rate": 1.5553631515199101e-06, + "loss": 1.041, + "step": 39001 + }, + { + "epoch": 1.0, + "learning_rate": 1.5553401403380738e-06, + "loss": 0.7168, + "step": 39002 + }, + { + "epoch": 1.0, + "learning_rate": 1.5553171287310392e-06, + "loss": 0.7988, + "step": 39003 + }, + { + "epoch": 1.0, + "learning_rate": 1.5552941166988234e-06, + "loss": 0.7693, + "step": 39004 + }, + { + "epoch": 1.0, + "learning_rate": 1.5552711042414446e-06, + "loss": 0.7959, + "step": 39005 + }, + { + "epoch": 1.0, + "learning_rate": 1.5552480913589205e-06, + "loss": 1.0, + "step": 39006 + }, + { + "epoch": 1.0, + "learning_rate": 1.5552250780512682e-06, + "loss": 0.7466, + "step": 39007 + }, + { + "epoch": 1.0, + "learning_rate": 1.5552020643185056e-06, + "loss": 0.8721, + "step": 39008 + }, + { + "epoch": 1.0, + "learning_rate": 1.5551790501606501e-06, + "loss": 0.877, + "step": 39009 + }, + { + "epoch": 1.0, + "learning_rate": 1.5551560355777201e-06, + "loss": 0.8867, + "step": 39010 + }, + { + "epoch": 1.0, + "learning_rate": 1.5551330205697322e-06, + "loss": 0.7402, + "step": 39011 + }, + { + "epoch": 1.0, + "learning_rate": 1.5551100051367047e-06, + "loss": 0.6943, + "step": 39012 + }, + { + "epoch": 1.0, + "learning_rate": 1.5550869892786549e-06, + "loss": 0.8711, + "step": 39013 + }, + { + "epoch": 1.0, + "learning_rate": 1.5550639729956005e-06, + "loss": 0.8037, + "step": 39014 + }, + { + "epoch": 1.0, + "learning_rate": 1.5550409562875593e-06, + "loss": 0.9434, + "step": 39015 + }, + { + "epoch": 1.0, + "learning_rate": 1.5550179391545487e-06, + "loss": 0.7852, + "step": 39016 + }, + { + "epoch": 1.0, + "learning_rate": 1.554994921596586e-06, + "loss": 0.6829, + "step": 39017 + }, + { + "epoch": 1.0, + "learning_rate": 1.5549719036136897e-06, + "loss": 0.7891, + "step": 39018 + }, + { + "epoch": 1.0, + "learning_rate": 1.5549488852058766e-06, + "loss": 0.7266, + "step": 39019 + }, + { + "epoch": 1.0, + "learning_rate": 1.554925866373165e-06, + "loss": 0.7617, + "step": 39020 + }, + { + "epoch": 1.0, + "learning_rate": 1.554902847115572e-06, + "loss": 0.709, + "step": 39021 + }, + { + "epoch": 1.0, + "learning_rate": 1.5548798274331152e-06, + "loss": 0.6033, + "step": 39022 + }, + { + "epoch": 1.0, + "learning_rate": 1.5548568073258125e-06, + "loss": 0.6326, + "step": 39023 + }, + { + "epoch": 1.0, + "learning_rate": 1.5548337867936816e-06, + "loss": 0.6895, + "step": 39024 + }, + { + "epoch": 1.0, + "learning_rate": 1.55481076583674e-06, + "loss": 0.5718, + "step": 39025 + }, + { + "epoch": 1.0, + "learning_rate": 1.5547877444550053e-06, + "loss": 0.6528, + "step": 39026 + }, + { + "epoch": 1.0, + "learning_rate": 1.554764722648495e-06, + "loss": 0.8047, + "step": 39027 + }, + { + "epoch": 1.0, + "learning_rate": 1.554741700417227e-06, + "loss": 0.7305, + "step": 39028 + }, + { + "epoch": 1.0, + "learning_rate": 1.554718677761219e-06, + "loss": 0.6897, + "step": 39029 + }, + { + "epoch": 1.0, + "learning_rate": 1.5546956546804879e-06, + "loss": 0.5771, + "step": 39030 + }, + { + "epoch": 1.0, + "learning_rate": 1.5546726311750521e-06, + "loss": 0.7178, + "step": 39031 + }, + { + "epoch": 1.0, + "learning_rate": 1.5546496072449289e-06, + "loss": 0.7852, + "step": 39032 + }, + { + "epoch": 1.0, + "learning_rate": 1.5546265828901359e-06, + "loss": 0.6973, + "step": 39033 + }, + { + "epoch": 1.0, + "learning_rate": 1.554603558110691e-06, + "loss": 0.7324, + "step": 39034 + }, + { + "epoch": 1.0, + "learning_rate": 1.554580532906612e-06, + "loss": 0.7305, + "step": 39035 + }, + { + "epoch": 1.0, + "learning_rate": 1.5545575072779158e-06, + "loss": 0.6646, + "step": 39036 + }, + { + "epoch": 1.0, + "learning_rate": 1.5545344812246204e-06, + "loss": 0.7188, + "step": 39037 + }, + { + "epoch": 1.0, + "learning_rate": 1.5545114547467436e-06, + "loss": 0.7012, + "step": 39038 + }, + { + "epoch": 1.0, + "learning_rate": 1.5544884278443027e-06, + "loss": 0.667, + "step": 39039 + }, + { + "epoch": 1.0, + "learning_rate": 1.5544654005173156e-06, + "loss": 0.7207, + "step": 39040 + }, + { + "epoch": 1.0, + "learning_rate": 1.5544423727657998e-06, + "loss": 0.7188, + "step": 39041 + }, + { + "epoch": 1.0, + "learning_rate": 1.554419344589773e-06, + "loss": 0.7803, + "step": 39042 + }, + { + "epoch": 1.0, + "learning_rate": 1.5543963159892525e-06, + "loss": 0.47, + "step": 39043 + }, + { + "epoch": 1.0, + "learning_rate": 1.5543732869642568e-06, + "loss": 0.7314, + "step": 39044 + }, + { + "epoch": 1.0, + "learning_rate": 1.5543502575148027e-06, + "loss": 0.7969, + "step": 39045 + }, + { + "epoch": 1.0, + "learning_rate": 1.554327227640908e-06, + "loss": 0.6709, + "step": 39046 + }, + { + "epoch": 1.0, + "learning_rate": 1.5543041973425905e-06, + "loss": 0.6826, + "step": 39047 + }, + { + "epoch": 1.0, + "learning_rate": 1.5542811666198678e-06, + "loss": 0.6523, + "step": 39048 + }, + { + "epoch": 1.0, + "learning_rate": 1.5542581354727576e-06, + "loss": 0.624, + "step": 39049 + }, + { + "epoch": 1.0, + "learning_rate": 1.5542351039012772e-06, + "loss": 0.9346, + "step": 39050 + }, + { + "epoch": 1.0, + "learning_rate": 1.5542120719054445e-06, + "loss": 0.4854, + "step": 39051 + }, + { + "epoch": 1.0, + "learning_rate": 1.5541890394852773e-06, + "loss": 0.5947, + "step": 39052 + }, + { + "epoch": 1.0, + "learning_rate": 1.5541660066407927e-06, + "loss": 0.4493, + "step": 39053 + }, + { + "epoch": 1.0, + "learning_rate": 1.5541429733720088e-06, + "loss": 0.6431, + "step": 39054 + }, + { + "epoch": 1.0, + "learning_rate": 1.5541199396789436e-06, + "loss": 0.6187, + "step": 39055 + }, + { + "epoch": 1.0, + "learning_rate": 1.5540969055616135e-06, + "loss": 0.6377, + "step": 39056 + }, + { + "epoch": 1.0, + "learning_rate": 1.5540738710200375e-06, + "loss": 0.6558, + "step": 39057 + }, + { + "epoch": 1.0, + "learning_rate": 1.5540508360542322e-06, + "loss": 0.6567, + "step": 39058 + }, + { + "epoch": 1.0, + "learning_rate": 1.5540278006642158e-06, + "loss": 0.7207, + "step": 39059 + }, + { + "epoch": 1.0, + "learning_rate": 1.5540047648500058e-06, + "loss": 0.7651, + "step": 39060 + }, + { + "epoch": 1.0, + "learning_rate": 1.5539817286116197e-06, + "loss": 0.6479, + "step": 39061 + }, + { + "epoch": 1.0, + "learning_rate": 1.5539586919490755e-06, + "loss": 0.5249, + "step": 39062 + }, + { + "epoch": 1.0, + "learning_rate": 1.5539356548623903e-06, + "loss": 0.3691, + "step": 39063 + }, + { + "epoch": 1.0, + "learning_rate": 1.5539126173515822e-06, + "loss": 0.7324, + "step": 39064 + }, + { + "epoch": 1.0, + "learning_rate": 1.5538895794166687e-06, + "loss": 0.4797, + "step": 39065 + }, + { + "epoch": 1.0, + "learning_rate": 1.5538665410576672e-06, + "loss": 0.6865, + "step": 39066 + }, + { + "epoch": 1.0, + "learning_rate": 1.553843502274596e-06, + "loss": 0.7236, + "step": 39067 + }, + { + "epoch": 1.0, + "learning_rate": 1.5538204630674717e-06, + "loss": 0.6904, + "step": 39068 + }, + { + "epoch": 1.0, + "learning_rate": 1.553797423436313e-06, + "loss": 0.6719, + "step": 39069 + }, + { + "epoch": 1.0, + "learning_rate": 1.5537743833811373e-06, + "loss": 0.6592, + "step": 39070 + }, + { + "epoch": 1.0, + "learning_rate": 1.5537513429019615e-06, + "loss": 0.7002, + "step": 39071 + }, + { + "epoch": 1.0, + "learning_rate": 1.5537283019988036e-06, + "loss": 0.7598, + "step": 39072 + }, + { + "epoch": 1.0, + "learning_rate": 1.5537052606716817e-06, + "loss": 0.6465, + "step": 39073 + }, + { + "epoch": 1.0, + "learning_rate": 1.5536822189206133e-06, + "loss": 0.7471, + "step": 39074 + }, + { + "epoch": 1.0, + "learning_rate": 1.553659176745616e-06, + "loss": 0.4812, + "step": 39075 + }, + { + "epoch": 1.0, + "learning_rate": 1.553636134146707e-06, + "loss": 0.5994, + "step": 39076 + }, + { + "epoch": 1.0, + "learning_rate": 1.5536130911239042e-06, + "loss": 0.8574, + "step": 39077 + }, + { + "epoch": 1.0, + "learning_rate": 1.5535900476772255e-06, + "loss": 0.8984, + "step": 39078 + }, + { + "epoch": 1.0, + "learning_rate": 1.5535670038066884e-06, + "loss": 0.7021, + "step": 39079 + }, + { + "epoch": 1.0, + "learning_rate": 1.5535439595123102e-06, + "loss": 0.6157, + "step": 39080 + }, + { + "epoch": 1.0, + "learning_rate": 1.5535209147941094e-06, + "loss": 0.6167, + "step": 39081 + }, + { + "epoch": 1.0, + "learning_rate": 1.5534978696521023e-06, + "loss": 0.7852, + "step": 39082 + }, + { + "epoch": 1.0, + "learning_rate": 1.553474824086308e-06, + "loss": 0.8096, + "step": 39083 + }, + { + "epoch": 1.0, + "learning_rate": 1.5534517780967433e-06, + "loss": 0.541, + "step": 39084 + }, + { + "epoch": 1.0, + "learning_rate": 1.553428731683426e-06, + "loss": 0.8232, + "step": 39085 + }, + { + "epoch": 1.0, + "learning_rate": 1.5534056848463738e-06, + "loss": 0.5557, + "step": 39086 + }, + { + "epoch": 1.0, + "learning_rate": 1.5533826375856043e-06, + "loss": 0.7773, + "step": 39087 + }, + { + "epoch": 1.0, + "learning_rate": 1.553359589901135e-06, + "loss": 0.5508, + "step": 39088 + }, + { + "epoch": 1.0, + "learning_rate": 1.5533365417929835e-06, + "loss": 0.6958, + "step": 39089 + }, + { + "epoch": 1.0, + "learning_rate": 1.5533134932611682e-06, + "loss": 0.6875, + "step": 39090 + }, + { + "epoch": 1.0, + "learning_rate": 1.553290444305706e-06, + "loss": 0.7876, + "step": 39091 + }, + { + "epoch": 1.0, + "learning_rate": 1.5532673949266148e-06, + "loss": 0.6143, + "step": 39092 + }, + { + "epoch": 1.0, + "learning_rate": 1.553244345123912e-06, + "loss": 0.6807, + "step": 39093 + }, + { + "epoch": 1.0, + "learning_rate": 1.5532212948976156e-06, + "loss": 0.6182, + "step": 39094 + }, + { + "epoch": 1.0, + "learning_rate": 1.5531982442477432e-06, + "loss": 0.7139, + "step": 39095 + }, + { + "epoch": 1.0, + "learning_rate": 1.553175193174312e-06, + "loss": 0.7793, + "step": 39096 + }, + { + "epoch": 1.0, + "learning_rate": 1.5531521416773404e-06, + "loss": 0.8223, + "step": 39097 + }, + { + "epoch": 1.0, + "learning_rate": 1.5531290897568453e-06, + "loss": 0.6797, + "step": 39098 + }, + { + "epoch": 1.0, + "learning_rate": 1.553106037412845e-06, + "loss": 0.7207, + "step": 39099 + }, + { + "epoch": 1.0, + "learning_rate": 1.5530829846453566e-06, + "loss": 0.7646, + "step": 39100 + }, + { + "epoch": 1.0, + "learning_rate": 1.553059931454398e-06, + "loss": 0.5913, + "step": 39101 + }, + { + "epoch": 1.0, + "learning_rate": 1.5530368778399867e-06, + "loss": 0.8516, + "step": 39102 + }, + { + "epoch": 1.0, + "learning_rate": 1.5530138238021407e-06, + "loss": 0.8389, + "step": 39103 + }, + { + "epoch": 1.0, + "learning_rate": 1.5529907693408775e-06, + "loss": 0.7383, + "step": 39104 + }, + { + "epoch": 1.0, + "learning_rate": 1.5529677144562147e-06, + "loss": 0.6475, + "step": 39105 + }, + { + "epoch": 1.0, + "learning_rate": 1.5529446591481699e-06, + "loss": 0.5557, + "step": 39106 + }, + { + "epoch": 1.0, + "learning_rate": 1.5529216034167604e-06, + "loss": 0.793, + "step": 39107 + }, + { + "epoch": 1.0, + "learning_rate": 1.5528985472620048e-06, + "loss": 0.5508, + "step": 39108 + }, + { + "epoch": 1.0, + "learning_rate": 1.5528754906839198e-06, + "loss": 0.6016, + "step": 39109 + }, + { + "epoch": 1.0, + "learning_rate": 1.552852433682524e-06, + "loss": 0.6494, + "step": 39110 + }, + { + "epoch": 1.0, + "learning_rate": 1.552829376257834e-06, + "loss": 0.6895, + "step": 39111 + }, + { + "epoch": 1.0, + "learning_rate": 1.5528063184098683e-06, + "loss": 0.5325, + "step": 39112 + }, + { + "epoch": 1.0, + "learning_rate": 1.552783260138644e-06, + "loss": 0.5776, + "step": 39113 + }, + { + "epoch": 1.0, + "learning_rate": 1.5527602014441791e-06, + "loss": 0.7842, + "step": 39114 + }, + { + "epoch": 1.0, + "learning_rate": 1.552737142326491e-06, + "loss": 0.8076, + "step": 39115 + }, + { + "epoch": 1.0, + "learning_rate": 1.5527140827855977e-06, + "loss": 0.7334, + "step": 39116 + }, + { + "epoch": 1.0, + "learning_rate": 1.5526910228215165e-06, + "loss": 0.6416, + "step": 39117 + }, + { + "epoch": 1.0, + "learning_rate": 1.5526679624342651e-06, + "loss": 0.7148, + "step": 39118 + }, + { + "epoch": 1.0, + "learning_rate": 1.5526449016238615e-06, + "loss": 0.6445, + "step": 39119 + }, + { + "epoch": 1.0, + "learning_rate": 1.552621840390323e-06, + "loss": 0.7383, + "step": 39120 + }, + { + "epoch": 1.0, + "learning_rate": 1.552598778733667e-06, + "loss": 0.7622, + "step": 39121 + }, + { + "epoch": 1.0, + "learning_rate": 1.5525757166539122e-06, + "loss": 0.4534, + "step": 39122 + }, + { + "epoch": 1.0, + "learning_rate": 1.5525526541510748e-06, + "loss": 0.7383, + "step": 39123 + }, + { + "epoch": 1.0, + "learning_rate": 1.552529591225174e-06, + "loss": 0.6885, + "step": 39124 + }, + { + "epoch": 1.0, + "learning_rate": 1.5525065278762264e-06, + "loss": 0.5137, + "step": 39125 + }, + { + "epoch": 1.0, + "learning_rate": 1.55248346410425e-06, + "loss": 0.6528, + "step": 39126 + }, + { + "epoch": 1.0, + "learning_rate": 1.5524603999092623e-06, + "loss": 0.4695, + "step": 39127 + }, + { + "epoch": 1.0, + "learning_rate": 1.5524373352912813e-06, + "loss": 0.6782, + "step": 39128 + }, + { + "epoch": 1.0, + "learning_rate": 1.552414270250324e-06, + "loss": 0.8594, + "step": 39129 + }, + { + "epoch": 1.0, + "learning_rate": 1.5523912047864087e-06, + "loss": 0.7427, + "step": 39130 + }, + { + "epoch": 1.0, + "learning_rate": 1.552368138899553e-06, + "loss": 0.562, + "step": 39131 + }, + { + "epoch": 1.0, + "learning_rate": 1.5523450725897744e-06, + "loss": 0.8223, + "step": 39132 + }, + { + "epoch": 1.0, + "learning_rate": 1.5523220058570904e-06, + "loss": 0.5339, + "step": 39133 + }, + { + "epoch": 1.0, + "learning_rate": 1.5522989387015192e-06, + "loss": 0.6919, + "step": 39134 + }, + { + "epoch": 1.0, + "learning_rate": 1.5522758711230775e-06, + "loss": 0.708, + "step": 39135 + }, + { + "epoch": 1.0, + "learning_rate": 1.552252803121784e-06, + "loss": 0.7822, + "step": 39136 + }, + { + "epoch": 1.0, + "learning_rate": 1.5522297346976557e-06, + "loss": 0.6875, + "step": 39137 + }, + { + "epoch": 1.0, + "learning_rate": 1.5522066658507106e-06, + "loss": 0.6006, + "step": 39138 + }, + { + "epoch": 1.0, + "learning_rate": 1.5521835965809663e-06, + "loss": 0.6211, + "step": 39139 + }, + { + "epoch": 1.0, + "learning_rate": 1.5521605268884405e-06, + "loss": 0.2896, + "step": 39140 + }, + { + "epoch": 1.0, + "learning_rate": 1.5521374567731503e-06, + "loss": 0.6982, + "step": 39141 + }, + { + "epoch": 1.0, + "learning_rate": 1.5521143862351146e-06, + "loss": 0.8057, + "step": 39142 + }, + { + "epoch": 1.0, + "learning_rate": 1.5520913152743496e-06, + "loss": 0.5574, + "step": 39143 + }, + { + "epoch": 1.0, + "learning_rate": 1.5520682438908741e-06, + "loss": 0.5356, + "step": 39144 + }, + { + "epoch": 1.0, + "learning_rate": 1.5520451720847053e-06, + "loss": 0.4861, + "step": 39145 + }, + { + "epoch": 1.0, + "learning_rate": 1.5520220998558604e-06, + "loss": 0.7939, + "step": 39146 + }, + { + "epoch": 1.0, + "learning_rate": 1.5519990272043582e-06, + "loss": 0.5903, + "step": 39147 + }, + { + "epoch": 1.0, + "learning_rate": 1.5519759541302154e-06, + "loss": 0.6875, + "step": 39148 + }, + { + "epoch": 1.0, + "learning_rate": 1.55195288063345e-06, + "loss": 0.8525, + "step": 39149 + }, + { + "epoch": 1.0, + "learning_rate": 1.5519298067140797e-06, + "loss": 0.8418, + "step": 39150 + }, + { + "epoch": 1.0, + "learning_rate": 1.5519067323721223e-06, + "loss": 0.6963, + "step": 39151 + }, + { + "epoch": 1.0, + "learning_rate": 1.551883657607595e-06, + "loss": 0.6501, + "step": 39152 + }, + { + "epoch": 1.0, + "learning_rate": 1.5518605824205157e-06, + "loss": 0.6533, + "step": 39153 + }, + { + "epoch": 1.0, + "learning_rate": 1.5518375068109023e-06, + "loss": 0.7803, + "step": 39154 + }, + { + "epoch": 1.0, + "learning_rate": 1.5518144307787724e-06, + "loss": 0.5542, + "step": 39155 + }, + { + "epoch": 1.0, + "learning_rate": 1.5517913543241435e-06, + "loss": 0.6465, + "step": 39156 + }, + { + "epoch": 1.0, + "learning_rate": 1.5517682774470334e-06, + "loss": 0.6675, + "step": 39157 + }, + { + "epoch": 1.0, + "learning_rate": 1.5517452001474593e-06, + "loss": 0.5483, + "step": 39158 + }, + { + "epoch": 1.0, + "learning_rate": 1.5517221224254398e-06, + "loss": 0.5811, + "step": 39159 + }, + { + "epoch": 1.0, + "learning_rate": 1.5516990442809918e-06, + "loss": 0.6963, + "step": 39160 + }, + { + "epoch": 1.0, + "learning_rate": 1.551675965714133e-06, + "loss": 0.5317, + "step": 39161 + }, + { + "epoch": 1.0, + "learning_rate": 1.5516528867248818e-06, + "loss": 0.6846, + "step": 39162 + }, + { + "epoch": 1.0, + "learning_rate": 1.5516298073132547e-06, + "loss": 0.7207, + "step": 39163 + }, + { + "epoch": 1.0, + "learning_rate": 1.5516067274792706e-06, + "loss": 0.6377, + "step": 39164 + }, + { + "epoch": 1.0, + "learning_rate": 1.5515836472229462e-06, + "loss": 0.5239, + "step": 39165 + }, + { + "epoch": 1.0, + "learning_rate": 1.5515605665442998e-06, + "loss": 0.6963, + "step": 39166 + }, + { + "epoch": 1.0, + "learning_rate": 1.5515374854433487e-06, + "loss": 0.5217, + "step": 39167 + }, + { + "epoch": 1.0, + "learning_rate": 1.5515144039201106e-06, + "loss": 0.6904, + "step": 39168 + }, + { + "epoch": 1.0, + "learning_rate": 1.5514913219746038e-06, + "loss": 0.5059, + "step": 39169 + }, + { + "epoch": 1.0, + "learning_rate": 1.551468239606845e-06, + "loss": 0.5059, + "step": 39170 + }, + { + "epoch": 1.0, + "learning_rate": 1.5514451568168525e-06, + "loss": 0.6963, + "step": 39171 + }, + { + "epoch": 1.0, + "learning_rate": 1.5514220736046437e-06, + "loss": 0.6289, + "step": 39172 + }, + { + "epoch": 1.0, + "learning_rate": 1.5513989899702361e-06, + "loss": 0.6553, + "step": 39173 + }, + { + "epoch": 1.0, + "learning_rate": 1.551375905913648e-06, + "loss": 0.6309, + "step": 39174 + }, + { + "epoch": 1.0, + "learning_rate": 1.551352821434897e-06, + "loss": 0.5806, + "step": 39175 + }, + { + "epoch": 1.0, + "learning_rate": 1.5513297365339998e-06, + "loss": 0.7197, + "step": 39176 + }, + { + "epoch": 1.0, + "learning_rate": 1.5513066512109753e-06, + "loss": 0.8525, + "step": 39177 + }, + { + "epoch": 1.0, + "learning_rate": 1.5512835654658405e-06, + "loss": 0.6685, + "step": 39178 + }, + { + "epoch": 1.0, + "learning_rate": 1.5512604792986132e-06, + "loss": 0.5864, + "step": 39179 + }, + { + "epoch": 1.0, + "learning_rate": 1.5512373927093113e-06, + "loss": 0.7119, + "step": 39180 + }, + { + "epoch": 1.0, + "learning_rate": 1.551214305697952e-06, + "loss": 0.792, + "step": 39181 + }, + { + "epoch": 1.0, + "learning_rate": 1.5511912182645531e-06, + "loss": 0.6392, + "step": 39182 + }, + { + "epoch": 1.0, + "learning_rate": 1.5511681304091329e-06, + "loss": 0.3884, + "step": 39183 + }, + { + "epoch": 1.0, + "learning_rate": 1.5511450421317083e-06, + "loss": 0.7363, + "step": 39184 + }, + { + "epoch": 1.0, + "learning_rate": 1.5511219534322972e-06, + "loss": 0.6514, + "step": 39185 + }, + { + "epoch": 1.0, + "learning_rate": 1.5510988643109176e-06, + "loss": 0.5842, + "step": 39186 + }, + { + "epoch": 1.0, + "learning_rate": 1.5510757747675868e-06, + "loss": 0.6792, + "step": 39187 + }, + { + "epoch": 1.0, + "learning_rate": 1.5510526848023227e-06, + "loss": 0.603, + "step": 39188 + }, + { + "epoch": 1.0, + "learning_rate": 1.551029594415143e-06, + "loss": 0.4663, + "step": 39189 + }, + { + "epoch": 1.0, + "learning_rate": 1.551006503606065e-06, + "loss": 0.7393, + "step": 39190 + }, + { + "epoch": 1.0, + "learning_rate": 1.5509834123751069e-06, + "loss": 0.7021, + "step": 39191 + }, + { + "epoch": 1.0, + "learning_rate": 1.5509603207222859e-06, + "loss": 0.6211, + "step": 39192 + }, + { + "epoch": 1.0, + "learning_rate": 1.5509372286476202e-06, + "loss": 0.6055, + "step": 39193 + }, + { + "epoch": 1.0, + "learning_rate": 1.550914136151127e-06, + "loss": 0.5854, + "step": 39194 + }, + { + "epoch": 1.0, + "learning_rate": 1.5508910432328244e-06, + "loss": 0.4395, + "step": 39195 + }, + { + "epoch": 1.0, + "learning_rate": 1.5508679498927295e-06, + "loss": 0.6543, + "step": 39196 + }, + { + "epoch": 1.0, + "learning_rate": 1.5508448561308604e-06, + "loss": 0.5815, + "step": 39197 + }, + { + "epoch": 1.0, + "learning_rate": 1.550821761947235e-06, + "loss": 0.7129, + "step": 39198 + }, + { + "epoch": 1.0, + "learning_rate": 1.5507986673418705e-06, + "loss": 0.7134, + "step": 39199 + }, + { + "epoch": 1.0, + "learning_rate": 1.5507755723147851e-06, + "loss": 0.7881, + "step": 39200 + }, + { + "epoch": 1.0, + "learning_rate": 1.5507524768659957e-06, + "loss": 0.6021, + "step": 39201 + }, + { + "epoch": 1.0, + "learning_rate": 1.5507293809955207e-06, + "loss": 0.574, + "step": 39202 + }, + { + "epoch": 1.0, + "learning_rate": 1.5507062847033774e-06, + "loss": 0.6777, + "step": 39203 + }, + { + "epoch": 1.0, + "learning_rate": 1.5506831879895836e-06, + "loss": 0.5696, + "step": 39204 + }, + { + "epoch": 1.0, + "learning_rate": 1.5506600908541572e-06, + "loss": 0.543, + "step": 39205 + }, + { + "epoch": 1.0, + "learning_rate": 1.5506369932971155e-06, + "loss": 0.625, + "step": 39206 + }, + { + "epoch": 1.0, + "learning_rate": 1.5506138953184765e-06, + "loss": 0.6553, + "step": 39207 + }, + { + "epoch": 1.0, + "learning_rate": 1.5505907969182577e-06, + "loss": 0.709, + "step": 39208 + }, + { + "epoch": 1.0, + "learning_rate": 1.550567698096477e-06, + "loss": 0.6855, + "step": 39209 + }, + { + "epoch": 1.0, + "learning_rate": 1.5505445988531517e-06, + "loss": 0.6265, + "step": 39210 + }, + { + "epoch": 1.0, + "learning_rate": 1.5505214991883e-06, + "loss": 0.6172, + "step": 39211 + }, + { + "epoch": 1.01, + "learning_rate": 1.5504983991019392e-06, + "loss": 0.7666, + "step": 39212 + }, + { + "epoch": 1.01, + "learning_rate": 1.5504752985940867e-06, + "loss": 0.6504, + "step": 39213 + }, + { + "epoch": 1.01, + "learning_rate": 1.5504521976647613e-06, + "loss": 0.8174, + "step": 39214 + }, + { + "epoch": 1.01, + "learning_rate": 1.5504290963139795e-06, + "loss": 0.4951, + "step": 39215 + }, + { + "epoch": 1.01, + "learning_rate": 1.5504059945417593e-06, + "loss": 0.5669, + "step": 39216 + }, + { + "epoch": 1.01, + "learning_rate": 1.5503828923481189e-06, + "loss": 0.6646, + "step": 39217 + }, + { + "epoch": 1.01, + "learning_rate": 1.5503597897330754e-06, + "loss": 0.4766, + "step": 39218 + }, + { + "epoch": 1.01, + "learning_rate": 1.5503366866966468e-06, + "loss": 0.7241, + "step": 39219 + }, + { + "epoch": 1.01, + "learning_rate": 1.5503135832388508e-06, + "loss": 0.7017, + "step": 39220 + }, + { + "epoch": 1.01, + "learning_rate": 1.5502904793597047e-06, + "loss": 0.7393, + "step": 39221 + }, + { + "epoch": 1.01, + "learning_rate": 1.5502673750592268e-06, + "loss": 0.6816, + "step": 39222 + }, + { + "epoch": 1.01, + "learning_rate": 1.5502442703374343e-06, + "loss": 0.625, + "step": 39223 + }, + { + "epoch": 1.01, + "learning_rate": 1.5502211651943452e-06, + "loss": 0.5234, + "step": 39224 + }, + { + "epoch": 1.01, + "learning_rate": 1.5501980596299768e-06, + "loss": 0.5781, + "step": 39225 + }, + { + "epoch": 1.01, + "learning_rate": 1.5501749536443472e-06, + "loss": 0.6362, + "step": 39226 + }, + { + "epoch": 1.01, + "learning_rate": 1.5501518472374739e-06, + "loss": 0.5854, + "step": 39227 + }, + { + "epoch": 1.01, + "learning_rate": 1.5501287404093747e-06, + "loss": 0.4189, + "step": 39228 + }, + { + "epoch": 1.01, + "learning_rate": 1.5501056331600672e-06, + "loss": 0.8506, + "step": 39229 + }, + { + "epoch": 1.01, + "learning_rate": 1.5500825254895692e-06, + "loss": 0.5847, + "step": 39230 + }, + { + "epoch": 1.01, + "learning_rate": 1.550059417397898e-06, + "loss": 0.5999, + "step": 39231 + }, + { + "epoch": 1.01, + "learning_rate": 1.550036308885072e-06, + "loss": 0.8389, + "step": 39232 + }, + { + "epoch": 1.01, + "learning_rate": 1.5500131999511082e-06, + "loss": 0.8057, + "step": 39233 + }, + { + "epoch": 1.01, + "learning_rate": 1.5499900905960245e-06, + "loss": 0.5537, + "step": 39234 + }, + { + "epoch": 1.01, + "learning_rate": 1.549966980819839e-06, + "loss": 0.7744, + "step": 39235 + }, + { + "epoch": 1.01, + "learning_rate": 1.5499438706225689e-06, + "loss": 0.6758, + "step": 39236 + }, + { + "epoch": 1.01, + "learning_rate": 1.549920760004232e-06, + "loss": 0.6299, + "step": 39237 + }, + { + "epoch": 1.01, + "learning_rate": 1.5498976489648463e-06, + "loss": 0.6938, + "step": 39238 + }, + { + "epoch": 1.01, + "learning_rate": 1.5498745375044291e-06, + "loss": 0.7393, + "step": 39239 + }, + { + "epoch": 1.01, + "learning_rate": 1.5498514256229983e-06, + "loss": 0.8008, + "step": 39240 + }, + { + "epoch": 1.01, + "learning_rate": 1.5498283133205713e-06, + "loss": 0.6011, + "step": 39241 + }, + { + "epoch": 1.01, + "learning_rate": 1.5498052005971663e-06, + "loss": 0.6201, + "step": 39242 + }, + { + "epoch": 1.01, + "learning_rate": 1.5497820874528004e-06, + "loss": 0.7168, + "step": 39243 + }, + { + "epoch": 1.01, + "learning_rate": 1.5497589738874922e-06, + "loss": 0.4673, + "step": 39244 + }, + { + "epoch": 1.01, + "learning_rate": 1.5497358599012586e-06, + "loss": 0.4619, + "step": 39245 + }, + { + "epoch": 1.01, + "learning_rate": 1.5497127454941174e-06, + "loss": 0.7754, + "step": 39246 + }, + { + "epoch": 1.01, + "learning_rate": 1.5496896306660864e-06, + "loss": 0.9111, + "step": 39247 + }, + { + "epoch": 1.01, + "learning_rate": 1.5496665154171836e-06, + "loss": 0.6597, + "step": 39248 + }, + { + "epoch": 1.01, + "learning_rate": 1.5496433997474263e-06, + "loss": 0.5396, + "step": 39249 + }, + { + "epoch": 1.01, + "learning_rate": 1.5496202836568323e-06, + "loss": 0.6904, + "step": 39250 + }, + { + "epoch": 1.01, + "learning_rate": 1.5495971671454192e-06, + "loss": 0.5425, + "step": 39251 + }, + { + "epoch": 1.01, + "learning_rate": 1.5495740502132048e-06, + "loss": 0.6436, + "step": 39252 + }, + { + "epoch": 1.01, + "learning_rate": 1.5495509328602067e-06, + "loss": 0.6787, + "step": 39253 + }, + { + "epoch": 1.01, + "learning_rate": 1.5495278150864433e-06, + "loss": 0.7998, + "step": 39254 + }, + { + "epoch": 1.01, + "learning_rate": 1.5495046968919315e-06, + "loss": 0.5234, + "step": 39255 + }, + { + "epoch": 1.01, + "learning_rate": 1.5494815782766889e-06, + "loss": 0.6572, + "step": 39256 + }, + { + "epoch": 1.01, + "learning_rate": 1.5494584592407337e-06, + "loss": 0.7607, + "step": 39257 + }, + { + "epoch": 1.01, + "learning_rate": 1.5494353397840833e-06, + "loss": 0.687, + "step": 39258 + }, + { + "epoch": 1.01, + "learning_rate": 1.5494122199067559e-06, + "loss": 0.7969, + "step": 39259 + }, + { + "epoch": 1.01, + "learning_rate": 1.5493890996087684e-06, + "loss": 0.5337, + "step": 39260 + }, + { + "epoch": 1.01, + "learning_rate": 1.5493659788901393e-06, + "loss": 0.4785, + "step": 39261 + }, + { + "epoch": 1.01, + "learning_rate": 1.5493428577508857e-06, + "loss": 0.7002, + "step": 39262 + }, + { + "epoch": 1.01, + "learning_rate": 1.5493197361910256e-06, + "loss": 0.6338, + "step": 39263 + }, + { + "epoch": 1.01, + "learning_rate": 1.5492966142105766e-06, + "loss": 0.7051, + "step": 39264 + }, + { + "epoch": 1.01, + "learning_rate": 1.5492734918095564e-06, + "loss": 0.646, + "step": 39265 + }, + { + "epoch": 1.01, + "learning_rate": 1.5492503689879827e-06, + "loss": 0.4814, + "step": 39266 + }, + { + "epoch": 1.01, + "learning_rate": 1.5492272457458735e-06, + "loss": 0.6641, + "step": 39267 + }, + { + "epoch": 1.01, + "learning_rate": 1.5492041220832458e-06, + "loss": 0.6729, + "step": 39268 + }, + { + "epoch": 1.01, + "learning_rate": 1.5491809980001182e-06, + "loss": 0.6758, + "step": 39269 + }, + { + "epoch": 1.01, + "learning_rate": 1.5491578734965077e-06, + "loss": 0.5273, + "step": 39270 + }, + { + "epoch": 1.01, + "learning_rate": 1.5491347485724325e-06, + "loss": 0.5884, + "step": 39271 + }, + { + "epoch": 1.01, + "learning_rate": 1.54911162322791e-06, + "loss": 0.646, + "step": 39272 + }, + { + "epoch": 1.01, + "learning_rate": 1.549088497462958e-06, + "loss": 0.5542, + "step": 39273 + }, + { + "epoch": 1.01, + "learning_rate": 1.549065371277594e-06, + "loss": 0.5679, + "step": 39274 + }, + { + "epoch": 1.01, + "learning_rate": 1.549042244671836e-06, + "loss": 0.7373, + "step": 39275 + }, + { + "epoch": 1.01, + "learning_rate": 1.5490191176457014e-06, + "loss": 0.7783, + "step": 39276 + }, + { + "epoch": 1.01, + "learning_rate": 1.5489959901992084e-06, + "loss": 0.6787, + "step": 39277 + }, + { + "epoch": 1.01, + "learning_rate": 1.5489728623323744e-06, + "loss": 0.6113, + "step": 39278 + }, + { + "epoch": 1.01, + "learning_rate": 1.5489497340452173e-06, + "loss": 0.5825, + "step": 39279 + }, + { + "epoch": 1.01, + "learning_rate": 1.5489266053377543e-06, + "loss": 0.7666, + "step": 39280 + }, + { + "epoch": 1.01, + "learning_rate": 1.5489034762100034e-06, + "loss": 0.7539, + "step": 39281 + }, + { + "epoch": 1.01, + "learning_rate": 1.5488803466619825e-06, + "loss": 0.7393, + "step": 39282 + }, + { + "epoch": 1.01, + "learning_rate": 1.548857216693709e-06, + "loss": 0.6562, + "step": 39283 + }, + { + "epoch": 1.01, + "learning_rate": 1.5488340863052009e-06, + "loss": 0.749, + "step": 39284 + }, + { + "epoch": 1.01, + "learning_rate": 1.5488109554964758e-06, + "loss": 0.7734, + "step": 39285 + }, + { + "epoch": 1.01, + "learning_rate": 1.5487878242675514e-06, + "loss": 0.6064, + "step": 39286 + }, + { + "epoch": 1.01, + "learning_rate": 1.5487646926184454e-06, + "loss": 0.6499, + "step": 39287 + }, + { + "epoch": 1.01, + "learning_rate": 1.5487415605491754e-06, + "loss": 0.7539, + "step": 39288 + }, + { + "epoch": 1.01, + "learning_rate": 1.5487184280597595e-06, + "loss": 0.5132, + "step": 39289 + }, + { + "epoch": 1.01, + "learning_rate": 1.5486952951502148e-06, + "loss": 0.6035, + "step": 39290 + }, + { + "epoch": 1.01, + "learning_rate": 1.5486721618205594e-06, + "loss": 0.6533, + "step": 39291 + }, + { + "epoch": 1.01, + "learning_rate": 1.5486490280708112e-06, + "loss": 0.625, + "step": 39292 + }, + { + "epoch": 1.01, + "learning_rate": 1.5486258939009874e-06, + "loss": 0.5879, + "step": 39293 + }, + { + "epoch": 1.01, + "learning_rate": 1.548602759311106e-06, + "loss": 0.709, + "step": 39294 + }, + { + "epoch": 1.01, + "learning_rate": 1.5485796243011847e-06, + "loss": 0.7568, + "step": 39295 + }, + { + "epoch": 1.01, + "learning_rate": 1.5485564888712412e-06, + "loss": 0.7207, + "step": 39296 + }, + { + "epoch": 1.01, + "learning_rate": 1.5485333530212932e-06, + "loss": 0.7695, + "step": 39297 + }, + { + "epoch": 1.01, + "learning_rate": 1.5485102167513583e-06, + "loss": 0.7061, + "step": 39298 + }, + { + "epoch": 1.01, + "learning_rate": 1.5484870800614548e-06, + "loss": 0.7832, + "step": 39299 + }, + { + "epoch": 1.01, + "learning_rate": 1.5484639429515997e-06, + "loss": 0.7031, + "step": 39300 + }, + { + "epoch": 1.01, + "learning_rate": 1.548440805421811e-06, + "loss": 0.5811, + "step": 39301 + }, + { + "epoch": 1.01, + "learning_rate": 1.5484176674721064e-06, + "loss": 0.5823, + "step": 39302 + }, + { + "epoch": 1.01, + "learning_rate": 1.5483945291025035e-06, + "loss": 0.6924, + "step": 39303 + }, + { + "epoch": 1.01, + "learning_rate": 1.5483713903130204e-06, + "loss": 0.4331, + "step": 39304 + }, + { + "epoch": 1.01, + "learning_rate": 1.5483482511036744e-06, + "loss": 0.4541, + "step": 39305 + }, + { + "epoch": 1.01, + "learning_rate": 1.548325111474483e-06, + "loss": 0.5225, + "step": 39306 + }, + { + "epoch": 1.01, + "learning_rate": 1.5483019714254648e-06, + "loss": 0.6797, + "step": 39307 + }, + { + "epoch": 1.01, + "learning_rate": 1.5482788309566366e-06, + "loss": 0.6582, + "step": 39308 + }, + { + "epoch": 1.01, + "learning_rate": 1.548255690068017e-06, + "loss": 0.6787, + "step": 39309 + }, + { + "epoch": 1.01, + "learning_rate": 1.548232548759623e-06, + "loss": 0.7109, + "step": 39310 + }, + { + "epoch": 1.01, + "learning_rate": 1.5482094070314721e-06, + "loss": 0.6982, + "step": 39311 + }, + { + "epoch": 1.01, + "learning_rate": 1.5481862648835828e-06, + "loss": 0.6035, + "step": 39312 + }, + { + "epoch": 1.01, + "learning_rate": 1.5481631223159726e-06, + "loss": 0.5273, + "step": 39313 + }, + { + "epoch": 1.01, + "learning_rate": 1.5481399793286589e-06, + "loss": 0.7852, + "step": 39314 + }, + { + "epoch": 1.01, + "learning_rate": 1.54811683592166e-06, + "loss": 0.8955, + "step": 39315 + }, + { + "epoch": 1.01, + "learning_rate": 1.5480936920949929e-06, + "loss": 0.5042, + "step": 39316 + }, + { + "epoch": 1.01, + "learning_rate": 1.5480705478486758e-06, + "loss": 0.5596, + "step": 39317 + }, + { + "epoch": 1.01, + "learning_rate": 1.5480474031827261e-06, + "loss": 0.7051, + "step": 39318 + }, + { + "epoch": 1.01, + "learning_rate": 1.5480242580971618e-06, + "loss": 0.6309, + "step": 39319 + }, + { + "epoch": 1.01, + "learning_rate": 1.5480011125920007e-06, + "loss": 0.686, + "step": 39320 + }, + { + "epoch": 1.01, + "learning_rate": 1.54797796666726e-06, + "loss": 0.7578, + "step": 39321 + }, + { + "epoch": 1.01, + "learning_rate": 1.547954820322958e-06, + "loss": 0.6953, + "step": 39322 + }, + { + "epoch": 1.01, + "learning_rate": 1.547931673559112e-06, + "loss": 0.7188, + "step": 39323 + }, + { + "epoch": 1.01, + "learning_rate": 1.5479085263757403e-06, + "loss": 0.6406, + "step": 39324 + }, + { + "epoch": 1.01, + "learning_rate": 1.5478853787728601e-06, + "loss": 0.52, + "step": 39325 + }, + { + "epoch": 1.01, + "learning_rate": 1.5478622307504892e-06, + "loss": 0.792, + "step": 39326 + }, + { + "epoch": 1.01, + "learning_rate": 1.5478390823086452e-06, + "loss": 0.4535, + "step": 39327 + }, + { + "epoch": 1.01, + "learning_rate": 1.547815933447346e-06, + "loss": 0.645, + "step": 39328 + }, + { + "epoch": 1.01, + "learning_rate": 1.5477927841666096e-06, + "loss": 0.5908, + "step": 39329 + }, + { + "epoch": 1.01, + "learning_rate": 1.5477696344664532e-06, + "loss": 0.4561, + "step": 39330 + }, + { + "epoch": 1.01, + "learning_rate": 1.547746484346895e-06, + "loss": 0.533, + "step": 39331 + }, + { + "epoch": 1.01, + "learning_rate": 1.5477233338079526e-06, + "loss": 0.748, + "step": 39332 + }, + { + "epoch": 1.01, + "learning_rate": 1.5477001828496431e-06, + "loss": 0.7568, + "step": 39333 + }, + { + "epoch": 1.01, + "learning_rate": 1.5476770314719854e-06, + "loss": 0.6611, + "step": 39334 + }, + { + "epoch": 1.01, + "learning_rate": 1.5476538796749962e-06, + "loss": 0.7285, + "step": 39335 + }, + { + "epoch": 1.01, + "learning_rate": 1.5476307274586937e-06, + "loss": 0.6821, + "step": 39336 + }, + { + "epoch": 1.01, + "learning_rate": 1.5476075748230955e-06, + "loss": 0.5703, + "step": 39337 + }, + { + "epoch": 1.01, + "learning_rate": 1.5475844217682192e-06, + "loss": 0.6489, + "step": 39338 + }, + { + "epoch": 1.01, + "learning_rate": 1.5475612682940828e-06, + "loss": 0.7637, + "step": 39339 + }, + { + "epoch": 1.01, + "learning_rate": 1.5475381144007042e-06, + "loss": 0.8486, + "step": 39340 + }, + { + "epoch": 1.01, + "learning_rate": 1.5475149600881006e-06, + "loss": 0.665, + "step": 39341 + }, + { + "epoch": 1.01, + "learning_rate": 1.54749180535629e-06, + "loss": 0.6729, + "step": 39342 + }, + { + "epoch": 1.01, + "learning_rate": 1.5474686502052899e-06, + "loss": 0.6392, + "step": 39343 + }, + { + "epoch": 1.01, + "learning_rate": 1.5474454946351187e-06, + "loss": 0.8301, + "step": 39344 + }, + { + "epoch": 1.01, + "learning_rate": 1.547422338645793e-06, + "loss": 0.5115, + "step": 39345 + }, + { + "epoch": 1.01, + "learning_rate": 1.5473991822373319e-06, + "loss": 0.6797, + "step": 39346 + }, + { + "epoch": 1.01, + "learning_rate": 1.547376025409752e-06, + "loss": 0.6709, + "step": 39347 + }, + { + "epoch": 1.01, + "learning_rate": 1.5473528681630711e-06, + "loss": 0.5737, + "step": 39348 + }, + { + "epoch": 1.01, + "learning_rate": 1.547329710497308e-06, + "loss": 0.4753, + "step": 39349 + }, + { + "epoch": 1.01, + "learning_rate": 1.5473065524124795e-06, + "loss": 0.7021, + "step": 39350 + }, + { + "epoch": 1.01, + "learning_rate": 1.5472833939086033e-06, + "loss": 0.4125, + "step": 39351 + }, + { + "epoch": 1.01, + "learning_rate": 1.5472602349856975e-06, + "loss": 0.6187, + "step": 39352 + }, + { + "epoch": 1.01, + "learning_rate": 1.5472370756437797e-06, + "loss": 0.5249, + "step": 39353 + }, + { + "epoch": 1.01, + "learning_rate": 1.547213915882868e-06, + "loss": 0.6328, + "step": 39354 + }, + { + "epoch": 1.01, + "learning_rate": 1.5471907557029793e-06, + "loss": 0.6367, + "step": 39355 + }, + { + "epoch": 1.01, + "learning_rate": 1.5471675951041315e-06, + "loss": 0.5332, + "step": 39356 + }, + { + "epoch": 1.01, + "learning_rate": 1.5471444340863434e-06, + "loss": 0.6357, + "step": 39357 + }, + { + "epoch": 1.01, + "learning_rate": 1.5471212726496313e-06, + "loss": 0.5791, + "step": 39358 + }, + { + "epoch": 1.01, + "learning_rate": 1.5470981107940139e-06, + "loss": 0.6606, + "step": 39359 + }, + { + "epoch": 1.01, + "learning_rate": 1.547074948519509e-06, + "loss": 0.7324, + "step": 39360 + }, + { + "epoch": 1.01, + "learning_rate": 1.5470517858261334e-06, + "loss": 0.4526, + "step": 39361 + }, + { + "epoch": 1.01, + "learning_rate": 1.5470286227139059e-06, + "loss": 0.5967, + "step": 39362 + }, + { + "epoch": 1.01, + "learning_rate": 1.5470054591828433e-06, + "loss": 0.6294, + "step": 39363 + }, + { + "epoch": 1.01, + "learning_rate": 1.546982295232964e-06, + "loss": 0.6934, + "step": 39364 + }, + { + "epoch": 1.01, + "learning_rate": 1.5469591308642853e-06, + "loss": 0.6094, + "step": 39365 + }, + { + "epoch": 1.01, + "learning_rate": 1.546935966076825e-06, + "loss": 0.6479, + "step": 39366 + }, + { + "epoch": 1.01, + "learning_rate": 1.5469128008706014e-06, + "loss": 0.625, + "step": 39367 + }, + { + "epoch": 1.01, + "learning_rate": 1.5468896352456317e-06, + "loss": 0.7441, + "step": 39368 + }, + { + "epoch": 1.01, + "learning_rate": 1.5468664692019337e-06, + "loss": 0.8271, + "step": 39369 + }, + { + "epoch": 1.01, + "learning_rate": 1.5468433027395253e-06, + "loss": 0.8135, + "step": 39370 + }, + { + "epoch": 1.01, + "learning_rate": 1.5468201358584239e-06, + "loss": 0.5721, + "step": 39371 + }, + { + "epoch": 1.01, + "learning_rate": 1.5467969685586474e-06, + "loss": 0.7031, + "step": 39372 + }, + { + "epoch": 1.01, + "learning_rate": 1.5467738008402141e-06, + "loss": 0.5121, + "step": 39373 + }, + { + "epoch": 1.01, + "learning_rate": 1.546750632703141e-06, + "loss": 0.5312, + "step": 39374 + }, + { + "epoch": 1.01, + "learning_rate": 1.5467274641474458e-06, + "loss": 0.7559, + "step": 39375 + }, + { + "epoch": 1.01, + "learning_rate": 1.5467042951731468e-06, + "loss": 0.7666, + "step": 39376 + }, + { + "epoch": 1.01, + "learning_rate": 1.5466811257802615e-06, + "loss": 0.8477, + "step": 39377 + }, + { + "epoch": 1.01, + "learning_rate": 1.5466579559688073e-06, + "loss": 0.707, + "step": 39378 + }, + { + "epoch": 1.01, + "learning_rate": 1.546634785738803e-06, + "loss": 0.5469, + "step": 39379 + }, + { + "epoch": 1.01, + "learning_rate": 1.5466116150902647e-06, + "loss": 0.6011, + "step": 39380 + }, + { + "epoch": 1.01, + "learning_rate": 1.5465884440232114e-06, + "loss": 0.7266, + "step": 39381 + }, + { + "epoch": 1.01, + "learning_rate": 1.5465652725376603e-06, + "loss": 0.5845, + "step": 39382 + }, + { + "epoch": 1.01, + "learning_rate": 1.5465421006336295e-06, + "loss": 0.7256, + "step": 39383 + }, + { + "epoch": 1.01, + "learning_rate": 1.5465189283111364e-06, + "loss": 0.6982, + "step": 39384 + }, + { + "epoch": 1.01, + "learning_rate": 1.546495755570199e-06, + "loss": 0.6875, + "step": 39385 + }, + { + "epoch": 1.01, + "learning_rate": 1.5464725824108347e-06, + "loss": 0.707, + "step": 39386 + }, + { + "epoch": 1.01, + "learning_rate": 1.5464494088330616e-06, + "loss": 0.8086, + "step": 39387 + }, + { + "epoch": 1.01, + "learning_rate": 1.5464262348368974e-06, + "loss": 0.6875, + "step": 39388 + }, + { + "epoch": 1.01, + "learning_rate": 1.5464030604223597e-06, + "loss": 0.6646, + "step": 39389 + }, + { + "epoch": 1.01, + "learning_rate": 1.5463798855894664e-06, + "loss": 0.6694, + "step": 39390 + }, + { + "epoch": 1.01, + "learning_rate": 1.546356710338235e-06, + "loss": 0.7637, + "step": 39391 + }, + { + "epoch": 1.01, + "learning_rate": 1.5463335346686834e-06, + "loss": 0.7441, + "step": 39392 + }, + { + "epoch": 1.01, + "learning_rate": 1.5463103585808296e-06, + "loss": 0.4692, + "step": 39393 + }, + { + "epoch": 1.01, + "learning_rate": 1.5462871820746907e-06, + "loss": 0.7168, + "step": 39394 + }, + { + "epoch": 1.01, + "learning_rate": 1.546264005150285e-06, + "loss": 0.7139, + "step": 39395 + }, + { + "epoch": 1.01, + "learning_rate": 1.54624082780763e-06, + "loss": 0.6104, + "step": 39396 + }, + { + "epoch": 1.01, + "learning_rate": 1.5462176500467435e-06, + "loss": 0.7578, + "step": 39397 + }, + { + "epoch": 1.01, + "learning_rate": 1.5461944718676435e-06, + "loss": 0.8701, + "step": 39398 + }, + { + "epoch": 1.01, + "learning_rate": 1.5461712932703471e-06, + "loss": 0.6885, + "step": 39399 + }, + { + "epoch": 1.01, + "learning_rate": 1.546148114254873e-06, + "loss": 0.564, + "step": 39400 + }, + { + "epoch": 1.01, + "learning_rate": 1.546124934821238e-06, + "loss": 0.6982, + "step": 39401 + }, + { + "epoch": 1.01, + "learning_rate": 1.5461017549694605e-06, + "loss": 0.5913, + "step": 39402 + }, + { + "epoch": 1.01, + "learning_rate": 1.5460785746995574e-06, + "loss": 0.7183, + "step": 39403 + }, + { + "epoch": 1.01, + "learning_rate": 1.5460553940115477e-06, + "loss": 0.7158, + "step": 39404 + }, + { + "epoch": 1.01, + "learning_rate": 1.5460322129054482e-06, + "loss": 0.6875, + "step": 39405 + }, + { + "epoch": 1.01, + "learning_rate": 1.546009031381277e-06, + "loss": 0.5244, + "step": 39406 + }, + { + "epoch": 1.01, + "learning_rate": 1.5459858494390518e-06, + "loss": 0.6699, + "step": 39407 + }, + { + "epoch": 1.01, + "learning_rate": 1.5459626670787903e-06, + "loss": 0.6465, + "step": 39408 + }, + { + "epoch": 1.01, + "learning_rate": 1.5459394843005105e-06, + "loss": 0.6865, + "step": 39409 + }, + { + "epoch": 1.01, + "learning_rate": 1.5459163011042296e-06, + "loss": 0.667, + "step": 39410 + }, + { + "epoch": 1.01, + "learning_rate": 1.5458931174899658e-06, + "loss": 0.4849, + "step": 39411 + }, + { + "epoch": 1.01, + "learning_rate": 1.545869933457737e-06, + "loss": 0.5986, + "step": 39412 + }, + { + "epoch": 1.01, + "learning_rate": 1.5458467490075604e-06, + "loss": 0.645, + "step": 39413 + }, + { + "epoch": 1.01, + "learning_rate": 1.545823564139454e-06, + "loss": 0.7344, + "step": 39414 + }, + { + "epoch": 1.01, + "learning_rate": 1.5458003788534359e-06, + "loss": 0.5801, + "step": 39415 + }, + { + "epoch": 1.01, + "learning_rate": 1.5457771931495234e-06, + "loss": 0.6963, + "step": 39416 + }, + { + "epoch": 1.01, + "learning_rate": 1.5457540070277344e-06, + "loss": 0.5781, + "step": 39417 + }, + { + "epoch": 1.01, + "learning_rate": 1.5457308204880865e-06, + "loss": 0.5322, + "step": 39418 + }, + { + "epoch": 1.01, + "learning_rate": 1.5457076335305979e-06, + "loss": 0.8262, + "step": 39419 + }, + { + "epoch": 1.01, + "learning_rate": 1.545684446155286e-06, + "loss": 0.5881, + "step": 39420 + }, + { + "epoch": 1.01, + "learning_rate": 1.5456612583621684e-06, + "loss": 0.8135, + "step": 39421 + }, + { + "epoch": 1.01, + "learning_rate": 1.545638070151263e-06, + "loss": 0.792, + "step": 39422 + }, + { + "epoch": 1.01, + "learning_rate": 1.5456148815225877e-06, + "loss": 0.6465, + "step": 39423 + }, + { + "epoch": 1.01, + "learning_rate": 1.5455916924761604e-06, + "loss": 0.8281, + "step": 39424 + }, + { + "epoch": 1.01, + "learning_rate": 1.5455685030119985e-06, + "loss": 0.6309, + "step": 39425 + }, + { + "epoch": 1.01, + "learning_rate": 1.54554531313012e-06, + "loss": 0.6885, + "step": 39426 + }, + { + "epoch": 1.01, + "learning_rate": 1.5455221228305421e-06, + "loss": 0.5161, + "step": 39427 + }, + { + "epoch": 1.01, + "learning_rate": 1.5454989321132835e-06, + "loss": 0.7617, + "step": 39428 + }, + { + "epoch": 1.01, + "learning_rate": 1.5454757409783613e-06, + "loss": 0.79, + "step": 39429 + }, + { + "epoch": 1.01, + "learning_rate": 1.5454525494257933e-06, + "loss": 0.6787, + "step": 39430 + }, + { + "epoch": 1.01, + "learning_rate": 1.5454293574555974e-06, + "loss": 0.7432, + "step": 39431 + }, + { + "epoch": 1.01, + "learning_rate": 1.5454061650677913e-06, + "loss": 0.3538, + "step": 39432 + }, + { + "epoch": 1.01, + "learning_rate": 1.5453829722623927e-06, + "loss": 0.8047, + "step": 39433 + }, + { + "epoch": 1.01, + "learning_rate": 1.54535977903942e-06, + "loss": 0.5698, + "step": 39434 + }, + { + "epoch": 1.01, + "learning_rate": 1.5453365853988895e-06, + "loss": 0.5312, + "step": 39435 + }, + { + "epoch": 1.01, + "learning_rate": 1.5453133913408205e-06, + "loss": 0.624, + "step": 39436 + }, + { + "epoch": 1.01, + "learning_rate": 1.5452901968652298e-06, + "loss": 0.708, + "step": 39437 + }, + { + "epoch": 1.01, + "learning_rate": 1.5452670019721356e-06, + "loss": 0.6343, + "step": 39438 + }, + { + "epoch": 1.01, + "learning_rate": 1.5452438066615555e-06, + "loss": 0.832, + "step": 39439 + }, + { + "epoch": 1.01, + "learning_rate": 1.5452206109335072e-06, + "loss": 0.603, + "step": 39440 + }, + { + "epoch": 1.01, + "learning_rate": 1.5451974147880087e-06, + "loss": 0.6025, + "step": 39441 + }, + { + "epoch": 1.01, + "learning_rate": 1.5451742182250777e-06, + "loss": 0.7129, + "step": 39442 + }, + { + "epoch": 1.01, + "learning_rate": 1.5451510212447319e-06, + "loss": 0.6211, + "step": 39443 + }, + { + "epoch": 1.01, + "learning_rate": 1.5451278238469888e-06, + "loss": 0.5796, + "step": 39444 + }, + { + "epoch": 1.01, + "learning_rate": 1.5451046260318665e-06, + "loss": 0.6738, + "step": 39445 + }, + { + "epoch": 1.01, + "learning_rate": 1.5450814277993824e-06, + "loss": 0.6519, + "step": 39446 + }, + { + "epoch": 1.01, + "learning_rate": 1.545058229149555e-06, + "loss": 0.6777, + "step": 39447 + }, + { + "epoch": 1.01, + "learning_rate": 1.5450350300824011e-06, + "loss": 0.6265, + "step": 39448 + }, + { + "epoch": 1.01, + "learning_rate": 1.545011830597939e-06, + "loss": 0.5249, + "step": 39449 + }, + { + "epoch": 1.01, + "learning_rate": 1.5449886306961866e-06, + "loss": 0.6992, + "step": 39450 + }, + { + "epoch": 1.01, + "learning_rate": 1.5449654303771613e-06, + "loss": 0.7129, + "step": 39451 + }, + { + "epoch": 1.01, + "learning_rate": 1.5449422296408812e-06, + "loss": 0.7363, + "step": 39452 + }, + { + "epoch": 1.01, + "learning_rate": 1.544919028487364e-06, + "loss": 0.5791, + "step": 39453 + }, + { + "epoch": 1.01, + "learning_rate": 1.544895826916627e-06, + "loss": 0.8135, + "step": 39454 + }, + { + "epoch": 1.01, + "learning_rate": 1.5448726249286884e-06, + "loss": 0.5442, + "step": 39455 + }, + { + "epoch": 1.01, + "learning_rate": 1.544849422523566e-06, + "loss": 0.7881, + "step": 39456 + }, + { + "epoch": 1.01, + "learning_rate": 1.5448262197012774e-06, + "loss": 0.624, + "step": 39457 + }, + { + "epoch": 1.01, + "learning_rate": 1.5448030164618406e-06, + "loss": 0.7163, + "step": 39458 + }, + { + "epoch": 1.01, + "learning_rate": 1.544779812805273e-06, + "loss": 0.666, + "step": 39459 + }, + { + "epoch": 1.01, + "learning_rate": 1.5447566087315927e-06, + "loss": 0.8145, + "step": 39460 + }, + { + "epoch": 1.01, + "learning_rate": 1.5447334042408168e-06, + "loss": 0.6128, + "step": 39461 + }, + { + "epoch": 1.01, + "learning_rate": 1.544710199332964e-06, + "loss": 0.8145, + "step": 39462 + }, + { + "epoch": 1.01, + "learning_rate": 1.5446869940080517e-06, + "loss": 0.3967, + "step": 39463 + }, + { + "epoch": 1.01, + "learning_rate": 1.5446637882660975e-06, + "loss": 0.8828, + "step": 39464 + }, + { + "epoch": 1.01, + "learning_rate": 1.5446405821071194e-06, + "loss": 0.7754, + "step": 39465 + }, + { + "epoch": 1.01, + "learning_rate": 1.544617375531135e-06, + "loss": 0.6655, + "step": 39466 + }, + { + "epoch": 1.01, + "learning_rate": 1.544594168538162e-06, + "loss": 0.5762, + "step": 39467 + }, + { + "epoch": 1.01, + "learning_rate": 1.5445709611282186e-06, + "loss": 0.6401, + "step": 39468 + }, + { + "epoch": 1.01, + "learning_rate": 1.544547753301322e-06, + "loss": 0.5032, + "step": 39469 + }, + { + "epoch": 1.01, + "learning_rate": 1.54452454505749e-06, + "loss": 0.6509, + "step": 39470 + }, + { + "epoch": 1.01, + "learning_rate": 1.5445013363967409e-06, + "loss": 0.7529, + "step": 39471 + }, + { + "epoch": 1.01, + "learning_rate": 1.5444781273190919e-06, + "loss": 0.6104, + "step": 39472 + }, + { + "epoch": 1.01, + "learning_rate": 1.5444549178245614e-06, + "loss": 0.7148, + "step": 39473 + }, + { + "epoch": 1.01, + "learning_rate": 1.5444317079131667e-06, + "loss": 0.6914, + "step": 39474 + }, + { + "epoch": 1.01, + "learning_rate": 1.5444084975849254e-06, + "loss": 0.7207, + "step": 39475 + }, + { + "epoch": 1.01, + "learning_rate": 1.5443852868398558e-06, + "loss": 0.832, + "step": 39476 + }, + { + "epoch": 1.01, + "learning_rate": 1.5443620756779753e-06, + "loss": 0.5659, + "step": 39477 + }, + { + "epoch": 1.01, + "learning_rate": 1.544338864099302e-06, + "loss": 0.6157, + "step": 39478 + }, + { + "epoch": 1.01, + "learning_rate": 1.5443156521038532e-06, + "loss": 0.668, + "step": 39479 + }, + { + "epoch": 1.01, + "learning_rate": 1.544292439691647e-06, + "loss": 0.5029, + "step": 39480 + }, + { + "epoch": 1.01, + "learning_rate": 1.5442692268627013e-06, + "loss": 0.6719, + "step": 39481 + }, + { + "epoch": 1.01, + "learning_rate": 1.5442460136170333e-06, + "loss": 0.7373, + "step": 39482 + }, + { + "epoch": 1.01, + "learning_rate": 1.5442227999546616e-06, + "loss": 0.7402, + "step": 39483 + }, + { + "epoch": 1.01, + "learning_rate": 1.5441995858756034e-06, + "loss": 0.6768, + "step": 39484 + }, + { + "epoch": 1.01, + "learning_rate": 1.5441763713798764e-06, + "loss": 0.6416, + "step": 39485 + }, + { + "epoch": 1.01, + "learning_rate": 1.5441531564674985e-06, + "loss": 0.3284, + "step": 39486 + }, + { + "epoch": 1.01, + "learning_rate": 1.5441299411384878e-06, + "loss": 0.7549, + "step": 39487 + }, + { + "epoch": 1.01, + "learning_rate": 1.5441067253928618e-06, + "loss": 0.6406, + "step": 39488 + }, + { + "epoch": 1.01, + "learning_rate": 1.5440835092306386e-06, + "loss": 0.7476, + "step": 39489 + }, + { + "epoch": 1.01, + "learning_rate": 1.5440602926518352e-06, + "loss": 0.7129, + "step": 39490 + }, + { + "epoch": 1.01, + "learning_rate": 1.5440370756564699e-06, + "loss": 0.4922, + "step": 39491 + }, + { + "epoch": 1.01, + "learning_rate": 1.5440138582445603e-06, + "loss": 0.5835, + "step": 39492 + }, + { + "epoch": 1.01, + "learning_rate": 1.543990640416125e-06, + "loss": 0.583, + "step": 39493 + }, + { + "epoch": 1.01, + "learning_rate": 1.5439674221711804e-06, + "loss": 0.791, + "step": 39494 + }, + { + "epoch": 1.01, + "learning_rate": 1.5439442035097452e-06, + "loss": 0.5361, + "step": 39495 + }, + { + "epoch": 1.01, + "learning_rate": 1.543920984431837e-06, + "loss": 0.5791, + "step": 39496 + }, + { + "epoch": 1.01, + "learning_rate": 1.543897764937473e-06, + "loss": 0.5669, + "step": 39497 + }, + { + "epoch": 1.01, + "learning_rate": 1.543874545026672e-06, + "loss": 0.6694, + "step": 39498 + }, + { + "epoch": 1.01, + "learning_rate": 1.5438513246994514e-06, + "loss": 0.686, + "step": 39499 + }, + { + "epoch": 1.01, + "learning_rate": 1.5438281039558283e-06, + "loss": 0.8086, + "step": 39500 + }, + { + "epoch": 1.01, + "learning_rate": 1.5438048827958214e-06, + "loss": 0.5574, + "step": 39501 + }, + { + "epoch": 1.01, + "learning_rate": 1.543781661219448e-06, + "loss": 0.7158, + "step": 39502 + }, + { + "epoch": 1.01, + "learning_rate": 1.5437584392267262e-06, + "loss": 0.5977, + "step": 39503 + }, + { + "epoch": 1.01, + "learning_rate": 1.5437352168176733e-06, + "loss": 0.5265, + "step": 39504 + }, + { + "epoch": 1.01, + "learning_rate": 1.5437119939923075e-06, + "loss": 0.6089, + "step": 39505 + }, + { + "epoch": 1.01, + "learning_rate": 1.5436887707506464e-06, + "loss": 0.8115, + "step": 39506 + }, + { + "epoch": 1.01, + "learning_rate": 1.5436655470927078e-06, + "loss": 0.6426, + "step": 39507 + }, + { + "epoch": 1.01, + "learning_rate": 1.5436423230185094e-06, + "loss": 0.749, + "step": 39508 + }, + { + "epoch": 1.01, + "learning_rate": 1.5436190985280693e-06, + "loss": 0.6494, + "step": 39509 + }, + { + "epoch": 1.01, + "learning_rate": 1.5435958736214049e-06, + "loss": 0.6074, + "step": 39510 + }, + { + "epoch": 1.01, + "learning_rate": 1.5435726482985338e-06, + "loss": 0.7124, + "step": 39511 + }, + { + "epoch": 1.01, + "learning_rate": 1.5435494225594744e-06, + "loss": 0.2881, + "step": 39512 + }, + { + "epoch": 1.01, + "learning_rate": 1.5435261964042442e-06, + "loss": 0.5088, + "step": 39513 + }, + { + "epoch": 1.01, + "learning_rate": 1.5435029698328612e-06, + "loss": 0.5981, + "step": 39514 + }, + { + "epoch": 1.01, + "learning_rate": 1.543479742845343e-06, + "loss": 0.5273, + "step": 39515 + }, + { + "epoch": 1.01, + "learning_rate": 1.543456515441707e-06, + "loss": 0.6279, + "step": 39516 + }, + { + "epoch": 1.01, + "learning_rate": 1.5434332876219713e-06, + "loss": 0.6772, + "step": 39517 + }, + { + "epoch": 1.01, + "learning_rate": 1.543410059386154e-06, + "loss": 0.7314, + "step": 39518 + }, + { + "epoch": 1.01, + "learning_rate": 1.5433868307342723e-06, + "loss": 0.6797, + "step": 39519 + }, + { + "epoch": 1.01, + "learning_rate": 1.5433636016663444e-06, + "loss": 0.6621, + "step": 39520 + }, + { + "epoch": 1.01, + "learning_rate": 1.543340372182388e-06, + "loss": 0.5708, + "step": 39521 + }, + { + "epoch": 1.01, + "learning_rate": 1.5433171422824212e-06, + "loss": 0.6982, + "step": 39522 + }, + { + "epoch": 1.01, + "learning_rate": 1.5432939119664611e-06, + "loss": 0.748, + "step": 39523 + }, + { + "epoch": 1.01, + "learning_rate": 1.5432706812345262e-06, + "loss": 0.7104, + "step": 39524 + }, + { + "epoch": 1.01, + "learning_rate": 1.5432474500866335e-06, + "loss": 0.6348, + "step": 39525 + }, + { + "epoch": 1.01, + "learning_rate": 1.5432242185228013e-06, + "loss": 0.835, + "step": 39526 + }, + { + "epoch": 1.01, + "learning_rate": 1.5432009865430473e-06, + "loss": 0.4668, + "step": 39527 + }, + { + "epoch": 1.01, + "learning_rate": 1.5431777541473893e-06, + "loss": 0.6484, + "step": 39528 + }, + { + "epoch": 1.01, + "learning_rate": 1.543154521335845e-06, + "loss": 0.5493, + "step": 39529 + }, + { + "epoch": 1.01, + "learning_rate": 1.5431312881084324e-06, + "loss": 0.4585, + "step": 39530 + }, + { + "epoch": 1.01, + "learning_rate": 1.543108054465169e-06, + "loss": 0.5552, + "step": 39531 + }, + { + "epoch": 1.01, + "learning_rate": 1.5430848204060728e-06, + "loss": 0.6245, + "step": 39532 + }, + { + "epoch": 1.01, + "learning_rate": 1.5430615859311617e-06, + "loss": 0.6475, + "step": 39533 + }, + { + "epoch": 1.01, + "learning_rate": 1.5430383510404532e-06, + "loss": 0.6284, + "step": 39534 + }, + { + "epoch": 1.01, + "learning_rate": 1.543015115733965e-06, + "loss": 0.7686, + "step": 39535 + }, + { + "epoch": 1.01, + "learning_rate": 1.5429918800117152e-06, + "loss": 0.6445, + "step": 39536 + }, + { + "epoch": 1.01, + "learning_rate": 1.5429686438737214e-06, + "loss": 0.7578, + "step": 39537 + }, + { + "epoch": 1.01, + "learning_rate": 1.5429454073200018e-06, + "loss": 0.5591, + "step": 39538 + }, + { + "epoch": 1.01, + "learning_rate": 1.5429221703505736e-06, + "loss": 0.709, + "step": 39539 + }, + { + "epoch": 1.01, + "learning_rate": 1.5428989329654552e-06, + "loss": 0.3962, + "step": 39540 + }, + { + "epoch": 1.01, + "learning_rate": 1.5428756951646635e-06, + "loss": 0.5698, + "step": 39541 + }, + { + "epoch": 1.01, + "learning_rate": 1.5428524569482174e-06, + "loss": 0.7568, + "step": 39542 + }, + { + "epoch": 1.01, + "learning_rate": 1.5428292183161338e-06, + "loss": 0.5134, + "step": 39543 + }, + { + "epoch": 1.01, + "learning_rate": 1.5428059792684307e-06, + "loss": 0.6553, + "step": 39544 + }, + { + "epoch": 1.01, + "learning_rate": 1.5427827398051262e-06, + "loss": 0.6494, + "step": 39545 + }, + { + "epoch": 1.01, + "learning_rate": 1.542759499926238e-06, + "loss": 0.4629, + "step": 39546 + }, + { + "epoch": 1.01, + "learning_rate": 1.5427362596317837e-06, + "loss": 0.6479, + "step": 39547 + }, + { + "epoch": 1.01, + "learning_rate": 1.5427130189217813e-06, + "loss": 0.6914, + "step": 39548 + }, + { + "epoch": 1.01, + "learning_rate": 1.5426897777962484e-06, + "loss": 0.6309, + "step": 39549 + }, + { + "epoch": 1.01, + "learning_rate": 1.542666536255203e-06, + "loss": 0.707, + "step": 39550 + }, + { + "epoch": 1.01, + "learning_rate": 1.5426432942986627e-06, + "loss": 0.3663, + "step": 39551 + }, + { + "epoch": 1.01, + "learning_rate": 1.5426200519266452e-06, + "loss": 0.5469, + "step": 39552 + }, + { + "epoch": 1.01, + "learning_rate": 1.542596809139169e-06, + "loss": 0.7959, + "step": 39553 + }, + { + "epoch": 1.01, + "learning_rate": 1.542573565936251e-06, + "loss": 0.6104, + "step": 39554 + }, + { + "epoch": 1.01, + "learning_rate": 1.5425503223179093e-06, + "loss": 0.5142, + "step": 39555 + }, + { + "epoch": 1.01, + "learning_rate": 1.542527078284162e-06, + "loss": 0.7065, + "step": 39556 + }, + { + "epoch": 1.01, + "learning_rate": 1.5425038338350263e-06, + "loss": 0.4905, + "step": 39557 + }, + { + "epoch": 1.01, + "learning_rate": 1.5424805889705206e-06, + "loss": 0.6855, + "step": 39558 + }, + { + "epoch": 1.01, + "learning_rate": 1.5424573436906624e-06, + "loss": 0.6602, + "step": 39559 + }, + { + "epoch": 1.01, + "learning_rate": 1.5424340979954697e-06, + "loss": 0.5728, + "step": 39560 + }, + { + "epoch": 1.01, + "learning_rate": 1.54241085188496e-06, + "loss": 0.6377, + "step": 39561 + }, + { + "epoch": 1.01, + "learning_rate": 1.5423876053591514e-06, + "loss": 0.6758, + "step": 39562 + }, + { + "epoch": 1.01, + "learning_rate": 1.5423643584180615e-06, + "loss": 0.6123, + "step": 39563 + }, + { + "epoch": 1.01, + "learning_rate": 1.5423411110617082e-06, + "loss": 0.7617, + "step": 39564 + }, + { + "epoch": 1.01, + "learning_rate": 1.5423178632901087e-06, + "loss": 0.7148, + "step": 39565 + }, + { + "epoch": 1.01, + "learning_rate": 1.542294615103282e-06, + "loss": 0.9102, + "step": 39566 + }, + { + "epoch": 1.01, + "learning_rate": 1.542271366501245e-06, + "loss": 0.6611, + "step": 39567 + }, + { + "epoch": 1.01, + "learning_rate": 1.542248117484016e-06, + "loss": 0.6592, + "step": 39568 + }, + { + "epoch": 1.01, + "learning_rate": 1.5422248680516123e-06, + "loss": 0.5201, + "step": 39569 + }, + { + "epoch": 1.01, + "learning_rate": 1.5422016182040521e-06, + "loss": 0.7017, + "step": 39570 + }, + { + "epoch": 1.01, + "learning_rate": 1.5421783679413526e-06, + "loss": 0.7246, + "step": 39571 + }, + { + "epoch": 1.01, + "learning_rate": 1.5421551172635327e-06, + "loss": 0.6123, + "step": 39572 + }, + { + "epoch": 1.01, + "learning_rate": 1.5421318661706094e-06, + "loss": 0.5952, + "step": 39573 + }, + { + "epoch": 1.01, + "learning_rate": 1.5421086146626006e-06, + "loss": 0.8311, + "step": 39574 + }, + { + "epoch": 1.01, + "learning_rate": 1.5420853627395238e-06, + "loss": 0.7393, + "step": 39575 + }, + { + "epoch": 1.01, + "learning_rate": 1.5420621104013973e-06, + "loss": 0.5383, + "step": 39576 + }, + { + "epoch": 1.01, + "learning_rate": 1.542038857648239e-06, + "loss": 0.6729, + "step": 39577 + }, + { + "epoch": 1.01, + "learning_rate": 1.5420156044800666e-06, + "loss": 0.6021, + "step": 39578 + }, + { + "epoch": 1.01, + "learning_rate": 1.5419923508968976e-06, + "loss": 0.657, + "step": 39579 + }, + { + "epoch": 1.01, + "learning_rate": 1.5419690968987497e-06, + "loss": 0.8125, + "step": 39580 + }, + { + "epoch": 1.01, + "learning_rate": 1.5419458424856413e-06, + "loss": 0.6108, + "step": 39581 + }, + { + "epoch": 1.01, + "learning_rate": 1.5419225876575897e-06, + "loss": 0.4861, + "step": 39582 + }, + { + "epoch": 1.01, + "learning_rate": 1.541899332414613e-06, + "loss": 0.6226, + "step": 39583 + }, + { + "epoch": 1.01, + "learning_rate": 1.5418760767567291e-06, + "loss": 0.5786, + "step": 39584 + }, + { + "epoch": 1.01, + "learning_rate": 1.5418528206839554e-06, + "loss": 0.7139, + "step": 39585 + }, + { + "epoch": 1.01, + "learning_rate": 1.5418295641963097e-06, + "loss": 0.6182, + "step": 39586 + }, + { + "epoch": 1.01, + "learning_rate": 1.5418063072938104e-06, + "loss": 0.8721, + "step": 39587 + }, + { + "epoch": 1.01, + "learning_rate": 1.5417830499764749e-06, + "loss": 0.5786, + "step": 39588 + }, + { + "epoch": 1.01, + "learning_rate": 1.5417597922443206e-06, + "loss": 0.561, + "step": 39589 + }, + { + "epoch": 1.01, + "learning_rate": 1.541736534097366e-06, + "loss": 0.4556, + "step": 39590 + }, + { + "epoch": 1.01, + "learning_rate": 1.5417132755356287e-06, + "loss": 0.5474, + "step": 39591 + }, + { + "epoch": 1.01, + "learning_rate": 1.5416900165591264e-06, + "loss": 0.6992, + "step": 39592 + }, + { + "epoch": 1.01, + "learning_rate": 1.541666757167877e-06, + "loss": 0.6973, + "step": 39593 + }, + { + "epoch": 1.01, + "learning_rate": 1.5416434973618983e-06, + "loss": 0.7231, + "step": 39594 + }, + { + "epoch": 1.01, + "learning_rate": 1.5416202371412078e-06, + "loss": 0.667, + "step": 39595 + }, + { + "epoch": 1.01, + "learning_rate": 1.541596976505824e-06, + "loss": 0.6196, + "step": 39596 + }, + { + "epoch": 1.01, + "learning_rate": 1.541573715455764e-06, + "loss": 0.5181, + "step": 39597 + }, + { + "epoch": 1.01, + "learning_rate": 1.5415504539910465e-06, + "loss": 0.5696, + "step": 39598 + }, + { + "epoch": 1.01, + "learning_rate": 1.5415271921116882e-06, + "loss": 0.6533, + "step": 39599 + }, + { + "epoch": 1.01, + "learning_rate": 1.5415039298177073e-06, + "loss": 0.6963, + "step": 39600 + }, + { + "epoch": 1.01, + "learning_rate": 1.5414806671091218e-06, + "loss": 0.7129, + "step": 39601 + }, + { + "epoch": 1.02, + "learning_rate": 1.5414574039859497e-06, + "loss": 0.6797, + "step": 39602 + }, + { + "epoch": 1.02, + "learning_rate": 1.5414341404482083e-06, + "loss": 0.6892, + "step": 39603 + }, + { + "epoch": 1.02, + "learning_rate": 1.5414108764959158e-06, + "loss": 0.3457, + "step": 39604 + }, + { + "epoch": 1.02, + "learning_rate": 1.5413876121290899e-06, + "loss": 0.6206, + "step": 39605 + }, + { + "epoch": 1.02, + "learning_rate": 1.5413643473477484e-06, + "loss": 0.7773, + "step": 39606 + }, + { + "epoch": 1.02, + "learning_rate": 1.5413410821519091e-06, + "loss": 0.6655, + "step": 39607 + }, + { + "epoch": 1.02, + "learning_rate": 1.54131781654159e-06, + "loss": 0.7295, + "step": 39608 + }, + { + "epoch": 1.02, + "learning_rate": 1.5412945505168084e-06, + "loss": 0.793, + "step": 39609 + }, + { + "epoch": 1.02, + "learning_rate": 1.5412712840775825e-06, + "loss": 0.6299, + "step": 39610 + }, + { + "epoch": 1.02, + "learning_rate": 1.54124801722393e-06, + "loss": 0.7197, + "step": 39611 + }, + { + "epoch": 1.02, + "learning_rate": 1.5412247499558691e-06, + "loss": 0.7334, + "step": 39612 + }, + { + "epoch": 1.02, + "learning_rate": 1.5412014822734174e-06, + "loss": 0.5918, + "step": 39613 + }, + { + "epoch": 1.02, + "learning_rate": 1.5411782141765923e-06, + "loss": 0.5825, + "step": 39614 + }, + { + "epoch": 1.02, + "learning_rate": 1.5411549456654118e-06, + "loss": 0.7209, + "step": 39615 + }, + { + "epoch": 1.02, + "learning_rate": 1.5411316767398944e-06, + "loss": 0.5947, + "step": 39616 + }, + { + "epoch": 1.02, + "learning_rate": 1.5411084074000567e-06, + "loss": 0.7441, + "step": 39617 + }, + { + "epoch": 1.02, + "learning_rate": 1.5410851376459176e-06, + "loss": 0.5308, + "step": 39618 + }, + { + "epoch": 1.02, + "learning_rate": 1.5410618674774943e-06, + "loss": 0.6836, + "step": 39619 + }, + { + "epoch": 1.02, + "learning_rate": 1.541038596894805e-06, + "loss": 0.7568, + "step": 39620 + }, + { + "epoch": 1.02, + "learning_rate": 1.5410153258978672e-06, + "loss": 0.4019, + "step": 39621 + }, + { + "epoch": 1.02, + "learning_rate": 1.5409920544866987e-06, + "loss": 0.8086, + "step": 39622 + }, + { + "epoch": 1.02, + "learning_rate": 1.5409687826613178e-06, + "loss": 0.7026, + "step": 39623 + }, + { + "epoch": 1.02, + "learning_rate": 1.5409455104217416e-06, + "loss": 0.6052, + "step": 39624 + }, + { + "epoch": 1.02, + "learning_rate": 1.5409222377679885e-06, + "loss": 0.7563, + "step": 39625 + }, + { + "epoch": 1.02, + "learning_rate": 1.5408989647000761e-06, + "loss": 0.686, + "step": 39626 + }, + { + "epoch": 1.02, + "learning_rate": 1.540875691218022e-06, + "loss": 0.6011, + "step": 39627 + }, + { + "epoch": 1.02, + "learning_rate": 1.5408524173218446e-06, + "loss": 0.6538, + "step": 39628 + }, + { + "epoch": 1.02, + "learning_rate": 1.5408291430115612e-06, + "loss": 0.6436, + "step": 39629 + }, + { + "epoch": 1.02, + "learning_rate": 1.5408058682871897e-06, + "loss": 0.6772, + "step": 39630 + }, + { + "epoch": 1.02, + "learning_rate": 1.540782593148748e-06, + "loss": 0.752, + "step": 39631 + }, + { + "epoch": 1.02, + "learning_rate": 1.5407593175962543e-06, + "loss": 0.6709, + "step": 39632 + }, + { + "epoch": 1.02, + "learning_rate": 1.540736041629726e-06, + "loss": 0.5391, + "step": 39633 + }, + { + "epoch": 1.02, + "learning_rate": 1.5407127652491807e-06, + "loss": 0.2876, + "step": 39634 + }, + { + "epoch": 1.02, + "learning_rate": 1.5406894884546366e-06, + "loss": 0.5664, + "step": 39635 + }, + { + "epoch": 1.02, + "learning_rate": 1.5406662112461114e-06, + "loss": 0.5874, + "step": 39636 + }, + { + "epoch": 1.02, + "learning_rate": 1.5406429336236228e-06, + "loss": 0.6865, + "step": 39637 + }, + { + "epoch": 1.02, + "learning_rate": 1.5406196555871892e-06, + "loss": 0.6963, + "step": 39638 + }, + { + "epoch": 1.02, + "learning_rate": 1.5405963771368278e-06, + "loss": 0.71, + "step": 39639 + }, + { + "epoch": 1.02, + "learning_rate": 1.5405730982725565e-06, + "loss": 0.5669, + "step": 39640 + }, + { + "epoch": 1.02, + "learning_rate": 1.5405498189943932e-06, + "loss": 0.478, + "step": 39641 + }, + { + "epoch": 1.02, + "learning_rate": 1.5405265393023558e-06, + "loss": 0.573, + "step": 39642 + }, + { + "epoch": 1.02, + "learning_rate": 1.5405032591964623e-06, + "loss": 0.7383, + "step": 39643 + }, + { + "epoch": 1.02, + "learning_rate": 1.5404799786767299e-06, + "loss": 0.6973, + "step": 39644 + }, + { + "epoch": 1.02, + "learning_rate": 1.5404566977431772e-06, + "loss": 0.7148, + "step": 39645 + }, + { + "epoch": 1.02, + "learning_rate": 1.5404334163958214e-06, + "loss": 0.7012, + "step": 39646 + }, + { + "epoch": 1.02, + "learning_rate": 1.5404101346346808e-06, + "loss": 0.7498, + "step": 39647 + }, + { + "epoch": 1.02, + "learning_rate": 1.5403868524597727e-06, + "loss": 0.4644, + "step": 39648 + }, + { + "epoch": 1.02, + "learning_rate": 1.5403635698711156e-06, + "loss": 0.6348, + "step": 39649 + }, + { + "epoch": 1.02, + "learning_rate": 1.5403402868687266e-06, + "loss": 0.6982, + "step": 39650 + }, + { + "epoch": 1.02, + "learning_rate": 1.5403170034526242e-06, + "loss": 0.624, + "step": 39651 + }, + { + "epoch": 1.02, + "learning_rate": 1.5402937196228255e-06, + "loss": 0.6357, + "step": 39652 + }, + { + "epoch": 1.02, + "learning_rate": 1.5402704353793493e-06, + "loss": 0.6406, + "step": 39653 + }, + { + "epoch": 1.02, + "learning_rate": 1.5402471507222125e-06, + "loss": 0.6235, + "step": 39654 + }, + { + "epoch": 1.02, + "learning_rate": 1.5402238656514337e-06, + "loss": 0.512, + "step": 39655 + }, + { + "epoch": 1.02, + "learning_rate": 1.54020058016703e-06, + "loss": 0.4663, + "step": 39656 + }, + { + "epoch": 1.02, + "learning_rate": 1.5401772942690195e-06, + "loss": 0.688, + "step": 39657 + }, + { + "epoch": 1.02, + "learning_rate": 1.5401540079574202e-06, + "loss": 0.4658, + "step": 39658 + }, + { + "epoch": 1.02, + "learning_rate": 1.54013072123225e-06, + "loss": 0.7373, + "step": 39659 + }, + { + "epoch": 1.02, + "learning_rate": 1.540107434093526e-06, + "loss": 0.9561, + "step": 39660 + }, + { + "epoch": 1.02, + "learning_rate": 1.540084146541267e-06, + "loss": 0.6328, + "step": 39661 + }, + { + "epoch": 1.02, + "learning_rate": 1.5400608585754903e-06, + "loss": 0.6094, + "step": 39662 + }, + { + "epoch": 1.02, + "learning_rate": 1.5400375701962137e-06, + "loss": 0.7441, + "step": 39663 + }, + { + "epoch": 1.02, + "learning_rate": 1.5400142814034555e-06, + "loss": 0.4259, + "step": 39664 + }, + { + "epoch": 1.02, + "learning_rate": 1.5399909921972327e-06, + "loss": 0.5227, + "step": 39665 + }, + { + "epoch": 1.02, + "learning_rate": 1.5399677025775638e-06, + "loss": 0.5308, + "step": 39666 + }, + { + "epoch": 1.02, + "learning_rate": 1.5399444125444667e-06, + "loss": 0.6973, + "step": 39667 + }, + { + "epoch": 1.02, + "learning_rate": 1.5399211220979592e-06, + "loss": 0.7041, + "step": 39668 + }, + { + "epoch": 1.02, + "learning_rate": 1.5398978312380583e-06, + "loss": 0.6187, + "step": 39669 + }, + { + "epoch": 1.02, + "learning_rate": 1.5398745399647827e-06, + "loss": 0.5796, + "step": 39670 + }, + { + "epoch": 1.02, + "learning_rate": 1.53985124827815e-06, + "loss": 0.6128, + "step": 39671 + }, + { + "epoch": 1.02, + "learning_rate": 1.539827956178178e-06, + "loss": 0.7939, + "step": 39672 + }, + { + "epoch": 1.02, + "learning_rate": 1.539804663664885e-06, + "loss": 0.6338, + "step": 39673 + }, + { + "epoch": 1.02, + "learning_rate": 1.5397813707382881e-06, + "loss": 0.6572, + "step": 39674 + }, + { + "epoch": 1.02, + "learning_rate": 1.5397580773984048e-06, + "loss": 0.5439, + "step": 39675 + }, + { + "epoch": 1.02, + "learning_rate": 1.5397347836452546e-06, + "loss": 0.6611, + "step": 39676 + }, + { + "epoch": 1.02, + "learning_rate": 1.5397114894788535e-06, + "loss": 0.5444, + "step": 39677 + }, + { + "epoch": 1.02, + "learning_rate": 1.5396881948992206e-06, + "loss": 0.5586, + "step": 39678 + }, + { + "epoch": 1.02, + "learning_rate": 1.539664899906373e-06, + "loss": 0.8662, + "step": 39679 + }, + { + "epoch": 1.02, + "learning_rate": 1.5396416045003288e-06, + "loss": 0.8799, + "step": 39680 + }, + { + "epoch": 1.02, + "learning_rate": 1.539618308681106e-06, + "loss": 0.7588, + "step": 39681 + }, + { + "epoch": 1.02, + "learning_rate": 1.5395950124487222e-06, + "loss": 0.6182, + "step": 39682 + }, + { + "epoch": 1.02, + "learning_rate": 1.5395717158031954e-06, + "loss": 0.667, + "step": 39683 + }, + { + "epoch": 1.02, + "learning_rate": 1.539548418744543e-06, + "loss": 0.6641, + "step": 39684 + }, + { + "epoch": 1.02, + "learning_rate": 1.5395251212727836e-06, + "loss": 0.9258, + "step": 39685 + }, + { + "epoch": 1.02, + "learning_rate": 1.5395018233879345e-06, + "loss": 0.6572, + "step": 39686 + }, + { + "epoch": 1.02, + "learning_rate": 1.5394785250900135e-06, + "loss": 0.3918, + "step": 39687 + }, + { + "epoch": 1.02, + "learning_rate": 1.5394552263790388e-06, + "loss": 0.8779, + "step": 39688 + }, + { + "epoch": 1.02, + "learning_rate": 1.5394319272550278e-06, + "loss": 0.8486, + "step": 39689 + }, + { + "epoch": 1.02, + "learning_rate": 1.5394086277179988e-06, + "loss": 0.4287, + "step": 39690 + }, + { + "epoch": 1.02, + "learning_rate": 1.5393853277679693e-06, + "loss": 0.7275, + "step": 39691 + }, + { + "epoch": 1.02, + "learning_rate": 1.539362027404957e-06, + "loss": 0.5767, + "step": 39692 + }, + { + "epoch": 1.02, + "learning_rate": 1.5393387266289807e-06, + "loss": 0.9229, + "step": 39693 + }, + { + "epoch": 1.02, + "learning_rate": 1.539315425440057e-06, + "loss": 0.752, + "step": 39694 + }, + { + "epoch": 1.02, + "learning_rate": 1.5392921238382047e-06, + "loss": 0.5923, + "step": 39695 + }, + { + "epoch": 1.02, + "learning_rate": 1.5392688218234406e-06, + "loss": 0.5244, + "step": 39696 + }, + { + "epoch": 1.02, + "learning_rate": 1.5392455193957834e-06, + "loss": 0.5537, + "step": 39697 + }, + { + "epoch": 1.02, + "learning_rate": 1.539222216555251e-06, + "loss": 0.6494, + "step": 39698 + }, + { + "epoch": 1.02, + "learning_rate": 1.5391989133018607e-06, + "loss": 0.7246, + "step": 39699 + }, + { + "epoch": 1.02, + "learning_rate": 1.5391756096356306e-06, + "loss": 0.7119, + "step": 39700 + }, + { + "epoch": 1.02, + "learning_rate": 1.5391523055565787e-06, + "loss": 0.6611, + "step": 39701 + }, + { + "epoch": 1.02, + "learning_rate": 1.5391290010647223e-06, + "loss": 0.7432, + "step": 39702 + }, + { + "epoch": 1.02, + "learning_rate": 1.5391056961600798e-06, + "loss": 0.646, + "step": 39703 + }, + { + "epoch": 1.02, + "learning_rate": 1.539082390842669e-06, + "loss": 0.6313, + "step": 39704 + }, + { + "epoch": 1.02, + "learning_rate": 1.5390590851125075e-06, + "loss": 0.6084, + "step": 39705 + }, + { + "epoch": 1.02, + "learning_rate": 1.5390357789696132e-06, + "loss": 0.7988, + "step": 39706 + }, + { + "epoch": 1.02, + "learning_rate": 1.5390124724140038e-06, + "loss": 0.6045, + "step": 39707 + }, + { + "epoch": 1.02, + "learning_rate": 1.538989165445698e-06, + "loss": 0.6919, + "step": 39708 + }, + { + "epoch": 1.02, + "learning_rate": 1.5389658580647123e-06, + "loss": 0.667, + "step": 39709 + }, + { + "epoch": 1.02, + "learning_rate": 1.5389425502710656e-06, + "loss": 0.4604, + "step": 39710 + }, + { + "epoch": 1.02, + "learning_rate": 1.538919242064775e-06, + "loss": 0.7236, + "step": 39711 + }, + { + "epoch": 1.02, + "learning_rate": 1.5388959334458588e-06, + "loss": 0.6602, + "step": 39712 + }, + { + "epoch": 1.02, + "learning_rate": 1.5388726244143353e-06, + "loss": 0.7939, + "step": 39713 + }, + { + "epoch": 1.02, + "learning_rate": 1.5388493149702213e-06, + "loss": 0.6421, + "step": 39714 + }, + { + "epoch": 1.02, + "learning_rate": 1.538826005113535e-06, + "loss": 0.6479, + "step": 39715 + }, + { + "epoch": 1.02, + "learning_rate": 1.538802694844295e-06, + "loss": 0.6465, + "step": 39716 + }, + { + "epoch": 1.02, + "learning_rate": 1.538779384162518e-06, + "loss": 0.6484, + "step": 39717 + }, + { + "epoch": 1.02, + "learning_rate": 1.5387560730682228e-06, + "loss": 0.6758, + "step": 39718 + }, + { + "epoch": 1.02, + "learning_rate": 1.5387327615614267e-06, + "loss": 0.4387, + "step": 39719 + }, + { + "epoch": 1.02, + "learning_rate": 1.5387094496421478e-06, + "loss": 0.666, + "step": 39720 + }, + { + "epoch": 1.02, + "learning_rate": 1.5386861373104035e-06, + "loss": 0.6787, + "step": 39721 + }, + { + "epoch": 1.02, + "learning_rate": 1.5386628245662121e-06, + "loss": 0.6953, + "step": 39722 + }, + { + "epoch": 1.02, + "learning_rate": 1.5386395114095917e-06, + "loss": 0.6475, + "step": 39723 + }, + { + "epoch": 1.02, + "learning_rate": 1.5386161978405597e-06, + "loss": 0.5549, + "step": 39724 + }, + { + "epoch": 1.02, + "learning_rate": 1.5385928838591338e-06, + "loss": 0.5291, + "step": 39725 + }, + { + "epoch": 1.02, + "learning_rate": 1.538569569465332e-06, + "loss": 0.5413, + "step": 39726 + }, + { + "epoch": 1.02, + "learning_rate": 1.5385462546591725e-06, + "loss": 0.6494, + "step": 39727 + }, + { + "epoch": 1.02, + "learning_rate": 1.5385229394406728e-06, + "loss": 0.5918, + "step": 39728 + }, + { + "epoch": 1.02, + "learning_rate": 1.538499623809851e-06, + "loss": 0.6096, + "step": 39729 + }, + { + "epoch": 1.02, + "learning_rate": 1.5384763077667244e-06, + "loss": 0.5962, + "step": 39730 + }, + { + "epoch": 1.02, + "learning_rate": 1.5384529913113115e-06, + "loss": 0.7227, + "step": 39731 + }, + { + "epoch": 1.02, + "learning_rate": 1.53842967444363e-06, + "loss": 0.5532, + "step": 39732 + }, + { + "epoch": 1.02, + "learning_rate": 1.5384063571636978e-06, + "loss": 0.8193, + "step": 39733 + }, + { + "epoch": 1.02, + "learning_rate": 1.5383830394715322e-06, + "loss": 0.627, + "step": 39734 + }, + { + "epoch": 1.02, + "learning_rate": 1.5383597213671518e-06, + "loss": 0.6807, + "step": 39735 + }, + { + "epoch": 1.02, + "learning_rate": 1.5383364028505738e-06, + "loss": 0.6279, + "step": 39736 + }, + { + "epoch": 1.02, + "learning_rate": 1.5383130839218167e-06, + "loss": 0.7295, + "step": 39737 + }, + { + "epoch": 1.02, + "learning_rate": 1.5382897645808978e-06, + "loss": 0.7871, + "step": 39738 + }, + { + "epoch": 1.02, + "learning_rate": 1.5382664448278354e-06, + "loss": 0.6826, + "step": 39739 + }, + { + "epoch": 1.02, + "learning_rate": 1.5382431246626469e-06, + "loss": 0.7676, + "step": 39740 + }, + { + "epoch": 1.02, + "learning_rate": 1.5382198040853504e-06, + "loss": 0.5527, + "step": 39741 + }, + { + "epoch": 1.02, + "learning_rate": 1.5381964830959637e-06, + "loss": 0.6162, + "step": 39742 + }, + { + "epoch": 1.02, + "learning_rate": 1.538173161694505e-06, + "loss": 0.5879, + "step": 39743 + }, + { + "epoch": 1.02, + "learning_rate": 1.5381498398809915e-06, + "loss": 0.7925, + "step": 39744 + }, + { + "epoch": 1.02, + "learning_rate": 1.5381265176554416e-06, + "loss": 0.749, + "step": 39745 + }, + { + "epoch": 1.02, + "learning_rate": 1.5381031950178728e-06, + "loss": 0.624, + "step": 39746 + }, + { + "epoch": 1.02, + "learning_rate": 1.5380798719683034e-06, + "loss": 0.4929, + "step": 39747 + }, + { + "epoch": 1.02, + "learning_rate": 1.538056548506751e-06, + "loss": 0.7021, + "step": 39748 + }, + { + "epoch": 1.02, + "learning_rate": 1.5380332246332333e-06, + "loss": 0.6641, + "step": 39749 + }, + { + "epoch": 1.02, + "learning_rate": 1.5380099003477683e-06, + "loss": 0.707, + "step": 39750 + }, + { + "epoch": 1.02, + "learning_rate": 1.5379865756503737e-06, + "loss": 0.4799, + "step": 39751 + }, + { + "epoch": 1.02, + "learning_rate": 1.5379632505410677e-06, + "loss": 0.7026, + "step": 39752 + }, + { + "epoch": 1.02, + "learning_rate": 1.537939925019868e-06, + "loss": 0.613, + "step": 39753 + }, + { + "epoch": 1.02, + "learning_rate": 1.5379165990867924e-06, + "loss": 0.7354, + "step": 39754 + }, + { + "epoch": 1.02, + "learning_rate": 1.5378932727418589e-06, + "loss": 0.6504, + "step": 39755 + }, + { + "epoch": 1.02, + "learning_rate": 1.537869945985085e-06, + "loss": 0.8359, + "step": 39756 + }, + { + "epoch": 1.02, + "learning_rate": 1.537846618816489e-06, + "loss": 0.5002, + "step": 39757 + }, + { + "epoch": 1.02, + "learning_rate": 1.5378232912360884e-06, + "loss": 0.5215, + "step": 39758 + }, + { + "epoch": 1.02, + "learning_rate": 1.5377999632439013e-06, + "loss": 0.6191, + "step": 39759 + }, + { + "epoch": 1.02, + "learning_rate": 1.5377766348399457e-06, + "loss": 0.6177, + "step": 39760 + }, + { + "epoch": 1.02, + "learning_rate": 1.5377533060242388e-06, + "loss": 0.6001, + "step": 39761 + }, + { + "epoch": 1.02, + "learning_rate": 1.5377299767967995e-06, + "loss": 0.6094, + "step": 39762 + }, + { + "epoch": 1.02, + "learning_rate": 1.5377066471576447e-06, + "loss": 0.7329, + "step": 39763 + }, + { + "epoch": 1.02, + "learning_rate": 1.537683317106793e-06, + "loss": 0.8447, + "step": 39764 + }, + { + "epoch": 1.02, + "learning_rate": 1.5376599866442615e-06, + "loss": 0.6221, + "step": 39765 + }, + { + "epoch": 1.02, + "learning_rate": 1.5376366557700686e-06, + "loss": 0.6714, + "step": 39766 + }, + { + "epoch": 1.02, + "learning_rate": 1.5376133244842322e-06, + "loss": 0.6235, + "step": 39767 + }, + { + "epoch": 1.02, + "learning_rate": 1.53758999278677e-06, + "loss": 0.5508, + "step": 39768 + }, + { + "epoch": 1.02, + "learning_rate": 1.5375666606776995e-06, + "loss": 0.7393, + "step": 39769 + }, + { + "epoch": 1.02, + "learning_rate": 1.5375433281570392e-06, + "loss": 0.7363, + "step": 39770 + }, + { + "epoch": 1.02, + "learning_rate": 1.5375199952248067e-06, + "loss": 0.6006, + "step": 39771 + }, + { + "epoch": 1.02, + "learning_rate": 1.5374966618810197e-06, + "loss": 0.7109, + "step": 39772 + }, + { + "epoch": 1.02, + "learning_rate": 1.5374733281256964e-06, + "loss": 0.5229, + "step": 39773 + }, + { + "epoch": 1.02, + "learning_rate": 1.5374499939588543e-06, + "loss": 0.5679, + "step": 39774 + }, + { + "epoch": 1.02, + "learning_rate": 1.5374266593805115e-06, + "loss": 0.7305, + "step": 39775 + }, + { + "epoch": 1.02, + "learning_rate": 1.5374033243906862e-06, + "loss": 0.7139, + "step": 39776 + }, + { + "epoch": 1.02, + "learning_rate": 1.5373799889893954e-06, + "loss": 0.666, + "step": 39777 + }, + { + "epoch": 1.02, + "learning_rate": 1.5373566531766575e-06, + "loss": 0.6182, + "step": 39778 + }, + { + "epoch": 1.02, + "learning_rate": 1.5373333169524905e-06, + "loss": 0.5557, + "step": 39779 + }, + { + "epoch": 1.02, + "learning_rate": 1.5373099803169122e-06, + "loss": 0.6694, + "step": 39780 + }, + { + "epoch": 1.02, + "learning_rate": 1.5372866432699399e-06, + "loss": 0.5957, + "step": 39781 + }, + { + "epoch": 1.02, + "learning_rate": 1.5372633058115923e-06, + "loss": 0.6777, + "step": 39782 + }, + { + "epoch": 1.02, + "learning_rate": 1.5372399679418868e-06, + "loss": 0.6182, + "step": 39783 + }, + { + "epoch": 1.02, + "learning_rate": 1.537216629660841e-06, + "loss": 0.6401, + "step": 39784 + }, + { + "epoch": 1.02, + "learning_rate": 1.5371932909684738e-06, + "loss": 0.7803, + "step": 39785 + }, + { + "epoch": 1.02, + "learning_rate": 1.537169951864802e-06, + "loss": 0.7949, + "step": 39786 + }, + { + "epoch": 1.02, + "learning_rate": 1.537146612349844e-06, + "loss": 0.6692, + "step": 39787 + }, + { + "epoch": 1.02, + "learning_rate": 1.5371232724236177e-06, + "loss": 0.6338, + "step": 39788 + }, + { + "epoch": 1.02, + "learning_rate": 1.5370999320861403e-06, + "loss": 0.7607, + "step": 39789 + }, + { + "epoch": 1.02, + "learning_rate": 1.5370765913374304e-06, + "loss": 0.7012, + "step": 39790 + }, + { + "epoch": 1.02, + "learning_rate": 1.537053250177506e-06, + "loss": 0.6396, + "step": 39791 + }, + { + "epoch": 1.02, + "learning_rate": 1.5370299086063842e-06, + "loss": 0.6001, + "step": 39792 + }, + { + "epoch": 1.02, + "learning_rate": 1.5370065666240835e-06, + "loss": 0.6641, + "step": 39793 + }, + { + "epoch": 1.02, + "learning_rate": 1.5369832242306212e-06, + "loss": 0.6865, + "step": 39794 + }, + { + "epoch": 1.02, + "learning_rate": 1.536959881426016e-06, + "loss": 0.7095, + "step": 39795 + }, + { + "epoch": 1.02, + "learning_rate": 1.536936538210285e-06, + "loss": 0.71, + "step": 39796 + }, + { + "epoch": 1.02, + "learning_rate": 1.5369131945834465e-06, + "loss": 0.5776, + "step": 39797 + }, + { + "epoch": 1.02, + "learning_rate": 1.5368898505455183e-06, + "loss": 0.4871, + "step": 39798 + }, + { + "epoch": 1.02, + "learning_rate": 1.5368665060965182e-06, + "loss": 0.7754, + "step": 39799 + }, + { + "epoch": 1.02, + "learning_rate": 1.5368431612364643e-06, + "loss": 0.8975, + "step": 39800 + }, + { + "epoch": 1.02, + "learning_rate": 1.5368198159653739e-06, + "loss": 0.6309, + "step": 39801 + }, + { + "epoch": 1.02, + "learning_rate": 1.5367964702832656e-06, + "loss": 0.688, + "step": 39802 + }, + { + "epoch": 1.02, + "learning_rate": 1.5367731241901567e-06, + "loss": 0.7295, + "step": 39803 + }, + { + "epoch": 1.02, + "learning_rate": 1.5367497776860654e-06, + "loss": 0.7134, + "step": 39804 + }, + { + "epoch": 1.02, + "learning_rate": 1.5367264307710092e-06, + "loss": 0.751, + "step": 39805 + }, + { + "epoch": 1.02, + "learning_rate": 1.5367030834450064e-06, + "loss": 0.8047, + "step": 39806 + }, + { + "epoch": 1.02, + "learning_rate": 1.5366797357080752e-06, + "loss": 0.5901, + "step": 39807 + }, + { + "epoch": 1.02, + "learning_rate": 1.5366563875602326e-06, + "loss": 0.5474, + "step": 39808 + }, + { + "epoch": 1.02, + "learning_rate": 1.5366330390014968e-06, + "loss": 0.6614, + "step": 39809 + }, + { + "epoch": 1.02, + "learning_rate": 1.5366096900318857e-06, + "loss": 0.5698, + "step": 39810 + }, + { + "epoch": 1.02, + "learning_rate": 1.5365863406514175e-06, + "loss": 0.7891, + "step": 39811 + }, + { + "epoch": 1.02, + "learning_rate": 1.53656299086011e-06, + "loss": 0.5918, + "step": 39812 + }, + { + "epoch": 1.02, + "learning_rate": 1.5365396406579803e-06, + "loss": 0.6934, + "step": 39813 + }, + { + "epoch": 1.02, + "learning_rate": 1.5365162900450472e-06, + "loss": 0.6748, + "step": 39814 + }, + { + "epoch": 1.02, + "learning_rate": 1.5364929390213282e-06, + "loss": 0.7158, + "step": 39815 + }, + { + "epoch": 1.02, + "learning_rate": 1.5364695875868413e-06, + "loss": 0.5964, + "step": 39816 + }, + { + "epoch": 1.02, + "learning_rate": 1.5364462357416042e-06, + "loss": 0.6802, + "step": 39817 + }, + { + "epoch": 1.02, + "learning_rate": 1.5364228834856348e-06, + "loss": 0.6289, + "step": 39818 + }, + { + "epoch": 1.02, + "learning_rate": 1.5363995308189513e-06, + "loss": 0.7148, + "step": 39819 + }, + { + "epoch": 1.02, + "learning_rate": 1.5363761777415709e-06, + "loss": 0.6284, + "step": 39820 + }, + { + "epoch": 1.02, + "learning_rate": 1.5363528242535125e-06, + "loss": 0.5759, + "step": 39821 + }, + { + "epoch": 1.02, + "learning_rate": 1.536329470354793e-06, + "loss": 0.6553, + "step": 39822 + }, + { + "epoch": 1.02, + "learning_rate": 1.536306116045431e-06, + "loss": 0.7607, + "step": 39823 + }, + { + "epoch": 1.02, + "learning_rate": 1.5362827613254439e-06, + "loss": 0.6028, + "step": 39824 + }, + { + "epoch": 1.02, + "learning_rate": 1.5362594061948495e-06, + "loss": 0.7529, + "step": 39825 + }, + { + "epoch": 1.02, + "learning_rate": 1.5362360506536662e-06, + "loss": 0.7109, + "step": 39826 + }, + { + "epoch": 1.02, + "learning_rate": 1.5362126947019117e-06, + "loss": 0.6807, + "step": 39827 + }, + { + "epoch": 1.02, + "learning_rate": 1.5361893383396035e-06, + "loss": 0.7119, + "step": 39828 + }, + { + "epoch": 1.02, + "learning_rate": 1.5361659815667603e-06, + "loss": 0.6089, + "step": 39829 + }, + { + "epoch": 1.02, + "learning_rate": 1.5361426243833991e-06, + "loss": 0.6367, + "step": 39830 + }, + { + "epoch": 1.02, + "learning_rate": 1.5361192667895383e-06, + "loss": 0.7227, + "step": 39831 + }, + { + "epoch": 1.02, + "learning_rate": 1.5360959087851955e-06, + "loss": 0.709, + "step": 39832 + }, + { + "epoch": 1.02, + "learning_rate": 1.5360725503703886e-06, + "loss": 0.5898, + "step": 39833 + }, + { + "epoch": 1.02, + "learning_rate": 1.5360491915451354e-06, + "loss": 0.6582, + "step": 39834 + }, + { + "epoch": 1.02, + "learning_rate": 1.5360258323094547e-06, + "loss": 0.6504, + "step": 39835 + }, + { + "epoch": 1.02, + "learning_rate": 1.5360024726633628e-06, + "loss": 0.6865, + "step": 39836 + }, + { + "epoch": 1.02, + "learning_rate": 1.535979112606879e-06, + "loss": 0.9023, + "step": 39837 + }, + { + "epoch": 1.02, + "learning_rate": 1.5359557521400209e-06, + "loss": 0.6975, + "step": 39838 + }, + { + "epoch": 1.02, + "learning_rate": 1.5359323912628058e-06, + "loss": 0.6826, + "step": 39839 + }, + { + "epoch": 1.02, + "learning_rate": 1.5359090299752517e-06, + "loss": 0.5283, + "step": 39840 + }, + { + "epoch": 1.02, + "learning_rate": 1.535885668277377e-06, + "loss": 0.5005, + "step": 39841 + }, + { + "epoch": 1.02, + "learning_rate": 1.5358623061691991e-06, + "loss": 0.7832, + "step": 39842 + }, + { + "epoch": 1.02, + "learning_rate": 1.5358389436507361e-06, + "loss": 0.5991, + "step": 39843 + }, + { + "epoch": 1.02, + "learning_rate": 1.535815580722006e-06, + "loss": 0.7559, + "step": 39844 + }, + { + "epoch": 1.02, + "learning_rate": 1.5357922173830262e-06, + "loss": 0.8691, + "step": 39845 + }, + { + "epoch": 1.02, + "learning_rate": 1.5357688536338152e-06, + "loss": 0.7656, + "step": 39846 + }, + { + "epoch": 1.02, + "learning_rate": 1.5357454894743907e-06, + "loss": 0.7383, + "step": 39847 + }, + { + "epoch": 1.02, + "learning_rate": 1.5357221249047705e-06, + "loss": 0.7637, + "step": 39848 + }, + { + "epoch": 1.02, + "learning_rate": 1.5356987599249723e-06, + "loss": 0.6816, + "step": 39849 + }, + { + "epoch": 1.02, + "learning_rate": 1.5356753945350142e-06, + "loss": 0.834, + "step": 39850 + }, + { + "epoch": 1.02, + "learning_rate": 1.5356520287349142e-06, + "loss": 0.5518, + "step": 39851 + }, + { + "epoch": 1.02, + "learning_rate": 1.5356286625246903e-06, + "loss": 0.8203, + "step": 39852 + }, + { + "epoch": 1.02, + "learning_rate": 1.53560529590436e-06, + "loss": 0.6973, + "step": 39853 + }, + { + "epoch": 1.02, + "learning_rate": 1.5355819288739413e-06, + "loss": 0.6528, + "step": 39854 + }, + { + "epoch": 1.02, + "learning_rate": 1.5355585614334518e-06, + "loss": 0.6592, + "step": 39855 + }, + { + "epoch": 1.02, + "learning_rate": 1.53553519358291e-06, + "loss": 0.6421, + "step": 39856 + }, + { + "epoch": 1.02, + "learning_rate": 1.5355118253223341e-06, + "loss": 0.7949, + "step": 39857 + }, + { + "epoch": 1.02, + "learning_rate": 1.5354884566517408e-06, + "loss": 0.5146, + "step": 39858 + }, + { + "epoch": 1.02, + "learning_rate": 1.5354650875711486e-06, + "loss": 0.7031, + "step": 39859 + }, + { + "epoch": 1.02, + "learning_rate": 1.5354417180805754e-06, + "loss": 0.8262, + "step": 39860 + }, + { + "epoch": 1.02, + "learning_rate": 1.5354183481800394e-06, + "loss": 0.8018, + "step": 39861 + }, + { + "epoch": 1.02, + "learning_rate": 1.535394977869558e-06, + "loss": 0.7148, + "step": 39862 + }, + { + "epoch": 1.02, + "learning_rate": 1.5353716071491491e-06, + "loss": 0.6504, + "step": 39863 + }, + { + "epoch": 1.02, + "learning_rate": 1.535348236018831e-06, + "loss": 0.7983, + "step": 39864 + }, + { + "epoch": 1.02, + "learning_rate": 1.5353248644786212e-06, + "loss": 0.4907, + "step": 39865 + }, + { + "epoch": 1.02, + "learning_rate": 1.5353014925285382e-06, + "loss": 0.6396, + "step": 39866 + }, + { + "epoch": 1.02, + "learning_rate": 1.5352781201685991e-06, + "loss": 0.7568, + "step": 39867 + }, + { + "epoch": 1.02, + "learning_rate": 1.535254747398822e-06, + "loss": 0.749, + "step": 39868 + }, + { + "epoch": 1.02, + "learning_rate": 1.5352313742192253e-06, + "loss": 0.5503, + "step": 39869 + }, + { + "epoch": 1.02, + "learning_rate": 1.5352080006298263e-06, + "loss": 0.6826, + "step": 39870 + }, + { + "epoch": 1.02, + "learning_rate": 1.5351846266306434e-06, + "loss": 0.7217, + "step": 39871 + }, + { + "epoch": 1.02, + "learning_rate": 1.5351612522216941e-06, + "loss": 0.5281, + "step": 39872 + }, + { + "epoch": 1.02, + "learning_rate": 1.5351378774029967e-06, + "loss": 0.751, + "step": 39873 + }, + { + "epoch": 1.02, + "learning_rate": 1.5351145021745682e-06, + "loss": 0.5488, + "step": 39874 + }, + { + "epoch": 1.02, + "learning_rate": 1.5350911265364278e-06, + "loss": 0.5591, + "step": 39875 + }, + { + "epoch": 1.02, + "learning_rate": 1.5350677504885924e-06, + "loss": 0.6875, + "step": 39876 + }, + { + "epoch": 1.02, + "learning_rate": 1.5350443740310803e-06, + "loss": 0.8057, + "step": 39877 + }, + { + "epoch": 1.02, + "learning_rate": 1.5350209971639093e-06, + "loss": 0.6504, + "step": 39878 + }, + { + "epoch": 1.02, + "learning_rate": 1.5349976198870972e-06, + "loss": 0.8184, + "step": 39879 + }, + { + "epoch": 1.02, + "learning_rate": 1.5349742422006622e-06, + "loss": 0.6992, + "step": 39880 + }, + { + "epoch": 1.02, + "learning_rate": 1.5349508641046219e-06, + "loss": 0.439, + "step": 39881 + }, + { + "epoch": 1.02, + "learning_rate": 1.5349274855989944e-06, + "loss": 0.5938, + "step": 39882 + }, + { + "epoch": 1.02, + "learning_rate": 1.5349041066837974e-06, + "loss": 0.6719, + "step": 39883 + }, + { + "epoch": 1.02, + "learning_rate": 1.5348807273590492e-06, + "loss": 0.6079, + "step": 39884 + }, + { + "epoch": 1.02, + "learning_rate": 1.5348573476247674e-06, + "loss": 0.9473, + "step": 39885 + }, + { + "epoch": 1.02, + "learning_rate": 1.5348339674809694e-06, + "loss": 0.7949, + "step": 39886 + }, + { + "epoch": 1.02, + "learning_rate": 1.5348105869276743e-06, + "loss": 0.792, + "step": 39887 + }, + { + "epoch": 1.02, + "learning_rate": 1.5347872059648988e-06, + "loss": 0.687, + "step": 39888 + }, + { + "epoch": 1.02, + "learning_rate": 1.5347638245926615e-06, + "loss": 0.7988, + "step": 39889 + }, + { + "epoch": 1.02, + "learning_rate": 1.5347404428109801e-06, + "loss": 0.4424, + "step": 39890 + }, + { + "epoch": 1.02, + "learning_rate": 1.5347170606198724e-06, + "loss": 0.709, + "step": 39891 + }, + { + "epoch": 1.02, + "learning_rate": 1.5346936780193569e-06, + "loss": 0.689, + "step": 39892 + }, + { + "epoch": 1.02, + "learning_rate": 1.5346702950094508e-06, + "loss": 0.7031, + "step": 39893 + }, + { + "epoch": 1.02, + "learning_rate": 1.534646911590172e-06, + "loss": 0.6973, + "step": 39894 + }, + { + "epoch": 1.02, + "learning_rate": 1.534623527761539e-06, + "loss": 0.5742, + "step": 39895 + }, + { + "epoch": 1.02, + "learning_rate": 1.5346001435235691e-06, + "loss": 0.6748, + "step": 39896 + }, + { + "epoch": 1.02, + "learning_rate": 1.5345767588762808e-06, + "loss": 0.6206, + "step": 39897 + }, + { + "epoch": 1.02, + "learning_rate": 1.5345533738196914e-06, + "loss": 0.6533, + "step": 39898 + }, + { + "epoch": 1.02, + "learning_rate": 1.5345299883538188e-06, + "loss": 0.6084, + "step": 39899 + }, + { + "epoch": 1.02, + "learning_rate": 1.5345066024786815e-06, + "loss": 0.7607, + "step": 39900 + }, + { + "epoch": 1.02, + "learning_rate": 1.5344832161942968e-06, + "loss": 0.5151, + "step": 39901 + }, + { + "epoch": 1.02, + "learning_rate": 1.5344598295006835e-06, + "loss": 0.6392, + "step": 39902 + }, + { + "epoch": 1.02, + "learning_rate": 1.5344364423978583e-06, + "loss": 0.6885, + "step": 39903 + }, + { + "epoch": 1.02, + "learning_rate": 1.53441305488584e-06, + "loss": 0.5474, + "step": 39904 + }, + { + "epoch": 1.02, + "learning_rate": 1.5343896669646459e-06, + "loss": 0.5845, + "step": 39905 + }, + { + "epoch": 1.02, + "learning_rate": 1.5343662786342944e-06, + "loss": 0.6343, + "step": 39906 + }, + { + "epoch": 1.02, + "learning_rate": 1.5343428898948032e-06, + "loss": 0.6787, + "step": 39907 + }, + { + "epoch": 1.02, + "learning_rate": 1.53431950074619e-06, + "loss": 0.7168, + "step": 39908 + }, + { + "epoch": 1.02, + "learning_rate": 1.5342961111884733e-06, + "loss": 0.7129, + "step": 39909 + }, + { + "epoch": 1.02, + "learning_rate": 1.5342727212216703e-06, + "loss": 0.7734, + "step": 39910 + }, + { + "epoch": 1.02, + "learning_rate": 1.5342493308457995e-06, + "loss": 0.6191, + "step": 39911 + }, + { + "epoch": 1.02, + "learning_rate": 1.5342259400608783e-06, + "loss": 0.6465, + "step": 39912 + }, + { + "epoch": 1.02, + "learning_rate": 1.5342025488669253e-06, + "loss": 0.5762, + "step": 39913 + }, + { + "epoch": 1.02, + "learning_rate": 1.5341791572639572e-06, + "loss": 0.6621, + "step": 39914 + }, + { + "epoch": 1.02, + "learning_rate": 1.5341557652519934e-06, + "loss": 0.5371, + "step": 39915 + }, + { + "epoch": 1.02, + "learning_rate": 1.5341323728310509e-06, + "loss": 0.7539, + "step": 39916 + }, + { + "epoch": 1.02, + "learning_rate": 1.534108980001148e-06, + "loss": 0.3804, + "step": 39917 + }, + { + "epoch": 1.02, + "learning_rate": 1.534085586762302e-06, + "loss": 0.5312, + "step": 39918 + }, + { + "epoch": 1.02, + "learning_rate": 1.5340621931145314e-06, + "loss": 0.792, + "step": 39919 + }, + { + "epoch": 1.02, + "learning_rate": 1.534038799057854e-06, + "loss": 0.5249, + "step": 39920 + }, + { + "epoch": 1.02, + "learning_rate": 1.5340154045922874e-06, + "loss": 0.6099, + "step": 39921 + }, + { + "epoch": 1.02, + "learning_rate": 1.53399200971785e-06, + "loss": 0.5615, + "step": 39922 + }, + { + "epoch": 1.02, + "learning_rate": 1.5339686144345594e-06, + "loss": 0.5557, + "step": 39923 + }, + { + "epoch": 1.02, + "learning_rate": 1.5339452187424334e-06, + "loss": 0.6331, + "step": 39924 + }, + { + "epoch": 1.02, + "learning_rate": 1.5339218226414902e-06, + "loss": 0.7031, + "step": 39925 + }, + { + "epoch": 1.02, + "learning_rate": 1.5338984261317478e-06, + "loss": 0.5605, + "step": 39926 + }, + { + "epoch": 1.02, + "learning_rate": 1.5338750292132238e-06, + "loss": 0.6157, + "step": 39927 + }, + { + "epoch": 1.02, + "learning_rate": 1.5338516318859366e-06, + "loss": 0.4756, + "step": 39928 + }, + { + "epoch": 1.02, + "learning_rate": 1.5338282341499032e-06, + "loss": 0.5137, + "step": 39929 + }, + { + "epoch": 1.02, + "learning_rate": 1.5338048360051423e-06, + "loss": 0.7598, + "step": 39930 + }, + { + "epoch": 1.02, + "learning_rate": 1.5337814374516716e-06, + "loss": 0.3391, + "step": 39931 + }, + { + "epoch": 1.02, + "learning_rate": 1.533758038489509e-06, + "loss": 0.5732, + "step": 39932 + }, + { + "epoch": 1.02, + "learning_rate": 1.533734639118672e-06, + "loss": 0.8906, + "step": 39933 + }, + { + "epoch": 1.02, + "learning_rate": 1.5337112393391796e-06, + "loss": 0.7627, + "step": 39934 + }, + { + "epoch": 1.02, + "learning_rate": 1.5336878391510487e-06, + "loss": 0.6836, + "step": 39935 + }, + { + "epoch": 1.02, + "learning_rate": 1.5336644385542977e-06, + "loss": 0.6807, + "step": 39936 + }, + { + "epoch": 1.02, + "learning_rate": 1.5336410375489442e-06, + "loss": 0.6533, + "step": 39937 + }, + { + "epoch": 1.02, + "learning_rate": 1.5336176361350063e-06, + "loss": 0.6245, + "step": 39938 + }, + { + "epoch": 1.02, + "learning_rate": 1.533594234312502e-06, + "loss": 0.7783, + "step": 39939 + }, + { + "epoch": 1.02, + "learning_rate": 1.533570832081449e-06, + "loss": 0.6924, + "step": 39940 + }, + { + "epoch": 1.02, + "learning_rate": 1.5335474294418655e-06, + "loss": 0.6482, + "step": 39941 + }, + { + "epoch": 1.02, + "learning_rate": 1.5335240263937697e-06, + "loss": 0.6465, + "step": 39942 + }, + { + "epoch": 1.02, + "learning_rate": 1.5335006229371784e-06, + "loss": 0.5586, + "step": 39943 + }, + { + "epoch": 1.02, + "learning_rate": 1.5334772190721103e-06, + "loss": 0.5581, + "step": 39944 + }, + { + "epoch": 1.02, + "learning_rate": 1.5334538147985833e-06, + "loss": 0.8262, + "step": 39945 + }, + { + "epoch": 1.02, + "learning_rate": 1.5334304101166153e-06, + "loss": 0.5095, + "step": 39946 + }, + { + "epoch": 1.02, + "learning_rate": 1.5334070050262243e-06, + "loss": 0.6821, + "step": 39947 + }, + { + "epoch": 1.02, + "learning_rate": 1.533383599527428e-06, + "loss": 0.6934, + "step": 39948 + }, + { + "epoch": 1.02, + "learning_rate": 1.5333601936202442e-06, + "loss": 0.5542, + "step": 39949 + }, + { + "epoch": 1.02, + "learning_rate": 1.5333367873046914e-06, + "loss": 0.7803, + "step": 39950 + }, + { + "epoch": 1.02, + "learning_rate": 1.5333133805807866e-06, + "loss": 0.623, + "step": 39951 + }, + { + "epoch": 1.02, + "learning_rate": 1.5332899734485488e-06, + "loss": 0.7168, + "step": 39952 + }, + { + "epoch": 1.02, + "learning_rate": 1.5332665659079951e-06, + "loss": 0.7676, + "step": 39953 + }, + { + "epoch": 1.02, + "learning_rate": 1.5332431579591436e-06, + "loss": 0.7676, + "step": 39954 + }, + { + "epoch": 1.02, + "learning_rate": 1.5332197496020127e-06, + "loss": 0.548, + "step": 39955 + }, + { + "epoch": 1.02, + "learning_rate": 1.5331963408366196e-06, + "loss": 0.6362, + "step": 39956 + }, + { + "epoch": 1.02, + "learning_rate": 1.5331729316629828e-06, + "loss": 0.6045, + "step": 39957 + }, + { + "epoch": 1.02, + "learning_rate": 1.53314952208112e-06, + "loss": 0.5684, + "step": 39958 + }, + { + "epoch": 1.02, + "learning_rate": 1.533126112091049e-06, + "loss": 0.6631, + "step": 39959 + }, + { + "epoch": 1.02, + "learning_rate": 1.5331027016927878e-06, + "loss": 0.7109, + "step": 39960 + }, + { + "epoch": 1.02, + "learning_rate": 1.5330792908863548e-06, + "loss": 0.5767, + "step": 39961 + }, + { + "epoch": 1.02, + "learning_rate": 1.533055879671767e-06, + "loss": 0.7832, + "step": 39962 + }, + { + "epoch": 1.02, + "learning_rate": 1.5330324680490432e-06, + "loss": 0.6934, + "step": 39963 + }, + { + "epoch": 1.02, + "learning_rate": 1.5330090560182006e-06, + "loss": 0.4683, + "step": 39964 + }, + { + "epoch": 1.02, + "learning_rate": 1.5329856435792578e-06, + "loss": 0.708, + "step": 39965 + }, + { + "epoch": 1.02, + "learning_rate": 1.532962230732232e-06, + "loss": 1.0166, + "step": 39966 + }, + { + "epoch": 1.02, + "learning_rate": 1.532938817477142e-06, + "loss": 0.624, + "step": 39967 + }, + { + "epoch": 1.02, + "learning_rate": 1.5329154038140048e-06, + "loss": 0.7012, + "step": 39968 + }, + { + "epoch": 1.02, + "learning_rate": 1.5328919897428392e-06, + "loss": 0.7021, + "step": 39969 + }, + { + "epoch": 1.02, + "learning_rate": 1.5328685752636625e-06, + "loss": 0.5493, + "step": 39970 + }, + { + "epoch": 1.02, + "learning_rate": 1.5328451603764929e-06, + "loss": 0.3893, + "step": 39971 + }, + { + "epoch": 1.02, + "learning_rate": 1.5328217450813482e-06, + "loss": 0.7178, + "step": 39972 + }, + { + "epoch": 1.02, + "learning_rate": 1.532798329378246e-06, + "loss": 0.6191, + "step": 39973 + }, + { + "epoch": 1.02, + "learning_rate": 1.5327749132672051e-06, + "loss": 0.6021, + "step": 39974 + }, + { + "epoch": 1.02, + "learning_rate": 1.532751496748243e-06, + "loss": 0.4719, + "step": 39975 + }, + { + "epoch": 1.02, + "learning_rate": 1.5327280798213774e-06, + "loss": 0.3678, + "step": 39976 + }, + { + "epoch": 1.02, + "learning_rate": 1.5327046624866265e-06, + "loss": 0.7578, + "step": 39977 + }, + { + "epoch": 1.02, + "learning_rate": 1.5326812447440082e-06, + "loss": 0.6382, + "step": 39978 + }, + { + "epoch": 1.02, + "learning_rate": 1.5326578265935402e-06, + "loss": 0.7344, + "step": 39979 + }, + { + "epoch": 1.02, + "learning_rate": 1.5326344080352404e-06, + "loss": 0.6094, + "step": 39980 + }, + { + "epoch": 1.02, + "learning_rate": 1.532610989069127e-06, + "loss": 0.5164, + "step": 39981 + }, + { + "epoch": 1.02, + "learning_rate": 1.5325875696952184e-06, + "loss": 0.6621, + "step": 39982 + }, + { + "epoch": 1.02, + "learning_rate": 1.5325641499135316e-06, + "loss": 0.6401, + "step": 39983 + }, + { + "epoch": 1.02, + "learning_rate": 1.5325407297240848e-06, + "loss": 0.5835, + "step": 39984 + }, + { + "epoch": 1.02, + "learning_rate": 1.5325173091268959e-06, + "loss": 0.6631, + "step": 39985 + }, + { + "epoch": 1.02, + "learning_rate": 1.5324938881219835e-06, + "loss": 0.6211, + "step": 39986 + }, + { + "epoch": 1.02, + "learning_rate": 1.5324704667093648e-06, + "loss": 0.666, + "step": 39987 + }, + { + "epoch": 1.02, + "learning_rate": 1.532447044889058e-06, + "loss": 0.6143, + "step": 39988 + }, + { + "epoch": 1.02, + "learning_rate": 1.5324236226610807e-06, + "loss": 0.5378, + "step": 39989 + }, + { + "epoch": 1.02, + "learning_rate": 1.5324002000254515e-06, + "loss": 0.4078, + "step": 39990 + }, + { + "epoch": 1.02, + "learning_rate": 1.5323767769821876e-06, + "loss": 0.709, + "step": 39991 + }, + { + "epoch": 1.03, + "learning_rate": 1.5323533535313076e-06, + "loss": 0.5715, + "step": 39992 + }, + { + "epoch": 1.03, + "learning_rate": 1.5323299296728287e-06, + "loss": 0.6367, + "step": 39993 + }, + { + "epoch": 1.03, + "learning_rate": 1.5323065054067697e-06, + "loss": 0.574, + "step": 39994 + }, + { + "epoch": 1.03, + "learning_rate": 1.5322830807331476e-06, + "loss": 0.5374, + "step": 39995 + }, + { + "epoch": 1.03, + "learning_rate": 1.5322596556519814e-06, + "loss": 0.5913, + "step": 39996 + }, + { + "epoch": 1.03, + "learning_rate": 1.532236230163288e-06, + "loss": 0.6362, + "step": 39997 + }, + { + "epoch": 1.03, + "learning_rate": 1.5322128042670862e-06, + "loss": 0.6562, + "step": 39998 + }, + { + "epoch": 1.03, + "learning_rate": 1.5321893779633933e-06, + "loss": 0.8408, + "step": 39999 + }, + { + "epoch": 1.03, + "learning_rate": 1.5321659512522271e-06, + "loss": 0.4163, + "step": 40000 + }, + { + "epoch": 1.03, + "learning_rate": 1.5321425241336063e-06, + "loss": 0.6865, + "step": 40001 + }, + { + "epoch": 1.03, + "learning_rate": 1.5321190966075483e-06, + "loss": 0.6602, + "step": 40002 + }, + { + "epoch": 1.03, + "learning_rate": 1.5320956686740716e-06, + "loss": 0.6118, + "step": 40003 + }, + { + "epoch": 1.03, + "learning_rate": 1.5320722403331931e-06, + "loss": 0.7441, + "step": 40004 + }, + { + "epoch": 1.03, + "learning_rate": 1.5320488115849318e-06, + "loss": 0.751, + "step": 40005 + }, + { + "epoch": 1.03, + "learning_rate": 1.5320253824293047e-06, + "loss": 0.7861, + "step": 40006 + }, + { + "epoch": 1.03, + "learning_rate": 1.5320019528663309e-06, + "loss": 0.8857, + "step": 40007 + }, + { + "epoch": 1.03, + "learning_rate": 1.5319785228960272e-06, + "loss": 0.748, + "step": 40008 + }, + { + "epoch": 1.03, + "learning_rate": 1.531955092518412e-06, + "loss": 0.8262, + "step": 40009 + }, + { + "epoch": 1.03, + "learning_rate": 1.5319316617335033e-06, + "loss": 0.605, + "step": 40010 + }, + { + "epoch": 1.03, + "learning_rate": 1.5319082305413192e-06, + "loss": 0.7568, + "step": 40011 + }, + { + "epoch": 1.03, + "learning_rate": 1.5318847989418774e-06, + "loss": 0.7148, + "step": 40012 + }, + { + "epoch": 1.03, + "learning_rate": 1.5318613669351957e-06, + "loss": 0.5557, + "step": 40013 + }, + { + "epoch": 1.03, + "learning_rate": 1.531837934521292e-06, + "loss": 0.5977, + "step": 40014 + }, + { + "epoch": 1.03, + "learning_rate": 1.5318145017001846e-06, + "loss": 0.6162, + "step": 40015 + }, + { + "epoch": 1.03, + "learning_rate": 1.5317910684718913e-06, + "loss": 0.7354, + "step": 40016 + }, + { + "epoch": 1.03, + "learning_rate": 1.5317676348364304e-06, + "loss": 0.7217, + "step": 40017 + }, + { + "epoch": 1.03, + "learning_rate": 1.531744200793819e-06, + "loss": 0.7539, + "step": 40018 + }, + { + "epoch": 1.03, + "learning_rate": 1.5317207663440758e-06, + "loss": 0.7168, + "step": 40019 + }, + { + "epoch": 1.03, + "learning_rate": 1.5316973314872183e-06, + "loss": 0.7676, + "step": 40020 + }, + { + "epoch": 1.03, + "learning_rate": 1.5316738962232648e-06, + "loss": 0.3967, + "step": 40021 + }, + { + "epoch": 1.03, + "learning_rate": 1.5316504605522328e-06, + "loss": 0.6851, + "step": 40022 + }, + { + "epoch": 1.03, + "learning_rate": 1.5316270244741405e-06, + "loss": 0.6279, + "step": 40023 + }, + { + "epoch": 1.03, + "learning_rate": 1.531603587989006e-06, + "loss": 0.749, + "step": 40024 + }, + { + "epoch": 1.03, + "learning_rate": 1.531580151096847e-06, + "loss": 0.6885, + "step": 40025 + }, + { + "epoch": 1.03, + "learning_rate": 1.5315567137976815e-06, + "loss": 0.6621, + "step": 40026 + }, + { + "epoch": 1.03, + "learning_rate": 1.5315332760915273e-06, + "loss": 0.75, + "step": 40027 + }, + { + "epoch": 1.03, + "learning_rate": 1.5315098379784028e-06, + "loss": 0.7656, + "step": 40028 + }, + { + "epoch": 1.03, + "learning_rate": 1.5314863994583257e-06, + "loss": 0.7422, + "step": 40029 + }, + { + "epoch": 1.03, + "learning_rate": 1.5314629605313139e-06, + "loss": 0.7554, + "step": 40030 + }, + { + "epoch": 1.03, + "learning_rate": 1.531439521197385e-06, + "loss": 0.7061, + "step": 40031 + }, + { + "epoch": 1.03, + "learning_rate": 1.5314160814565576e-06, + "loss": 0.5337, + "step": 40032 + }, + { + "epoch": 1.03, + "learning_rate": 1.5313926413088491e-06, + "loss": 0.6836, + "step": 40033 + }, + { + "epoch": 1.03, + "learning_rate": 1.5313692007542777e-06, + "loss": 0.5894, + "step": 40034 + }, + { + "epoch": 1.03, + "learning_rate": 1.5313457597928613e-06, + "loss": 0.6274, + "step": 40035 + }, + { + "epoch": 1.03, + "learning_rate": 1.5313223184246184e-06, + "loss": 0.5244, + "step": 40036 + }, + { + "epoch": 1.03, + "learning_rate": 1.5312988766495663e-06, + "loss": 0.7549, + "step": 40037 + }, + { + "epoch": 1.03, + "learning_rate": 1.5312754344677228e-06, + "loss": 0.6191, + "step": 40038 + }, + { + "epoch": 1.03, + "learning_rate": 1.531251991879106e-06, + "loss": 0.7412, + "step": 40039 + }, + { + "epoch": 1.03, + "learning_rate": 1.5312285488837343e-06, + "loss": 0.6274, + "step": 40040 + }, + { + "epoch": 1.03, + "learning_rate": 1.531205105481625e-06, + "loss": 0.6226, + "step": 40041 + }, + { + "epoch": 1.03, + "learning_rate": 1.5311816616727967e-06, + "loss": 0.5518, + "step": 40042 + }, + { + "epoch": 1.03, + "learning_rate": 1.5311582174572667e-06, + "loss": 0.6279, + "step": 40043 + }, + { + "epoch": 1.03, + "learning_rate": 1.5311347728350533e-06, + "loss": 0.7998, + "step": 40044 + }, + { + "epoch": 1.03, + "learning_rate": 1.5311113278061748e-06, + "loss": 0.4695, + "step": 40045 + }, + { + "epoch": 1.03, + "learning_rate": 1.5310878823706488e-06, + "loss": 0.4496, + "step": 40046 + }, + { + "epoch": 1.03, + "learning_rate": 1.531064436528493e-06, + "loss": 0.6616, + "step": 40047 + }, + { + "epoch": 1.03, + "learning_rate": 1.5310409902797255e-06, + "loss": 0.7847, + "step": 40048 + }, + { + "epoch": 1.03, + "learning_rate": 1.5310175436243643e-06, + "loss": 0.3989, + "step": 40049 + }, + { + "epoch": 1.03, + "learning_rate": 1.5309940965624276e-06, + "loss": 0.7168, + "step": 40050 + }, + { + "epoch": 1.03, + "learning_rate": 1.5309706490939332e-06, + "loss": 0.6265, + "step": 40051 + }, + { + "epoch": 1.03, + "learning_rate": 1.5309472012188986e-06, + "loss": 0.7598, + "step": 40052 + }, + { + "epoch": 1.03, + "learning_rate": 1.5309237529373423e-06, + "loss": 0.7852, + "step": 40053 + }, + { + "epoch": 1.03, + "learning_rate": 1.530900304249282e-06, + "loss": 0.8076, + "step": 40054 + }, + { + "epoch": 1.03, + "learning_rate": 1.5308768551547362e-06, + "loss": 0.6206, + "step": 40055 + }, + { + "epoch": 1.03, + "learning_rate": 1.5308534056537221e-06, + "loss": 0.5889, + "step": 40056 + }, + { + "epoch": 1.03, + "learning_rate": 1.530829955746258e-06, + "loss": 0.5874, + "step": 40057 + }, + { + "epoch": 1.03, + "learning_rate": 1.5308065054323618e-06, + "loss": 0.5835, + "step": 40058 + }, + { + "epoch": 1.03, + "learning_rate": 1.5307830547120512e-06, + "loss": 0.7793, + "step": 40059 + }, + { + "epoch": 1.03, + "learning_rate": 1.5307596035853448e-06, + "loss": 0.4873, + "step": 40060 + }, + { + "epoch": 1.03, + "learning_rate": 1.53073615205226e-06, + "loss": 0.6042, + "step": 40061 + }, + { + "epoch": 1.03, + "learning_rate": 1.530712700112815e-06, + "loss": 0.6704, + "step": 40062 + }, + { + "epoch": 1.03, + "learning_rate": 1.5306892477670274e-06, + "loss": 0.5781, + "step": 40063 + }, + { + "epoch": 1.03, + "learning_rate": 1.530665795014916e-06, + "loss": 0.709, + "step": 40064 + }, + { + "epoch": 1.03, + "learning_rate": 1.530642341856498e-06, + "loss": 0.6172, + "step": 40065 + }, + { + "epoch": 1.03, + "learning_rate": 1.5306188882917913e-06, + "loss": 0.8125, + "step": 40066 + }, + { + "epoch": 1.03, + "learning_rate": 1.5305954343208143e-06, + "loss": 0.5051, + "step": 40067 + }, + { + "epoch": 1.03, + "learning_rate": 1.5305719799435849e-06, + "loss": 0.552, + "step": 40068 + }, + { + "epoch": 1.03, + "learning_rate": 1.5305485251601207e-06, + "loss": 0.5005, + "step": 40069 + }, + { + "epoch": 1.03, + "learning_rate": 1.53052506997044e-06, + "loss": 0.7725, + "step": 40070 + }, + { + "epoch": 1.03, + "learning_rate": 1.5305016143745606e-06, + "loss": 0.6914, + "step": 40071 + }, + { + "epoch": 1.03, + "learning_rate": 1.5304781583725007e-06, + "loss": 0.4951, + "step": 40072 + }, + { + "epoch": 1.03, + "learning_rate": 1.5304547019642777e-06, + "loss": 0.6904, + "step": 40073 + }, + { + "epoch": 1.03, + "learning_rate": 1.5304312451499102e-06, + "loss": 0.6763, + "step": 40074 + }, + { + "epoch": 1.03, + "learning_rate": 1.5304077879294158e-06, + "loss": 0.7197, + "step": 40075 + }, + { + "epoch": 1.03, + "learning_rate": 1.5303843303028127e-06, + "loss": 0.6592, + "step": 40076 + }, + { + "epoch": 1.03, + "learning_rate": 1.5303608722701183e-06, + "loss": 0.5654, + "step": 40077 + }, + { + "epoch": 1.03, + "learning_rate": 1.5303374138313515e-06, + "loss": 0.7197, + "step": 40078 + }, + { + "epoch": 1.03, + "learning_rate": 1.530313954986529e-06, + "loss": 0.8125, + "step": 40079 + }, + { + "epoch": 1.03, + "learning_rate": 1.53029049573567e-06, + "loss": 0.7539, + "step": 40080 + }, + { + "epoch": 1.03, + "learning_rate": 1.5302670360787921e-06, + "loss": 0.7021, + "step": 40081 + }, + { + "epoch": 1.03, + "learning_rate": 1.530243576015913e-06, + "loss": 0.7354, + "step": 40082 + }, + { + "epoch": 1.03, + "learning_rate": 1.5302201155470505e-06, + "loss": 0.7627, + "step": 40083 + }, + { + "epoch": 1.03, + "learning_rate": 1.530196654672223e-06, + "loss": 0.7998, + "step": 40084 + }, + { + "epoch": 1.03, + "learning_rate": 1.5301731933914483e-06, + "loss": 0.6699, + "step": 40085 + }, + { + "epoch": 1.03, + "learning_rate": 1.5301497317047444e-06, + "loss": 0.7012, + "step": 40086 + }, + { + "epoch": 1.03, + "learning_rate": 1.5301262696121294e-06, + "loss": 0.6523, + "step": 40087 + }, + { + "epoch": 1.03, + "learning_rate": 1.5301028071136207e-06, + "loss": 0.5261, + "step": 40088 + }, + { + "epoch": 1.03, + "learning_rate": 1.5300793442092368e-06, + "loss": 0.5742, + "step": 40089 + }, + { + "epoch": 1.03, + "learning_rate": 1.5300558808989957e-06, + "loss": 0.6553, + "step": 40090 + }, + { + "epoch": 1.03, + "learning_rate": 1.530032417182915e-06, + "loss": 0.4331, + "step": 40091 + }, + { + "epoch": 1.03, + "learning_rate": 1.530008953061013e-06, + "loss": 0.323, + "step": 40092 + }, + { + "epoch": 1.03, + "learning_rate": 1.5299854885333075e-06, + "loss": 0.6792, + "step": 40093 + }, + { + "epoch": 1.03, + "learning_rate": 1.5299620235998164e-06, + "loss": 0.8057, + "step": 40094 + }, + { + "epoch": 1.03, + "learning_rate": 1.5299385582605578e-06, + "loss": 0.5281, + "step": 40095 + }, + { + "epoch": 1.03, + "learning_rate": 1.5299150925155494e-06, + "loss": 0.5332, + "step": 40096 + }, + { + "epoch": 1.03, + "learning_rate": 1.5298916263648098e-06, + "loss": 0.6755, + "step": 40097 + }, + { + "epoch": 1.03, + "learning_rate": 1.5298681598083561e-06, + "loss": 0.5093, + "step": 40098 + }, + { + "epoch": 1.03, + "learning_rate": 1.529844692846207e-06, + "loss": 0.7188, + "step": 40099 + }, + { + "epoch": 1.03, + "learning_rate": 1.52982122547838e-06, + "loss": 0.6885, + "step": 40100 + }, + { + "epoch": 1.03, + "learning_rate": 1.5297977577048936e-06, + "loss": 0.8369, + "step": 40101 + }, + { + "epoch": 1.03, + "learning_rate": 1.5297742895257647e-06, + "loss": 0.5625, + "step": 40102 + }, + { + "epoch": 1.03, + "learning_rate": 1.5297508209410128e-06, + "loss": 0.5566, + "step": 40103 + }, + { + "epoch": 1.03, + "learning_rate": 1.5297273519506547e-06, + "loss": 0.5703, + "step": 40104 + }, + { + "epoch": 1.03, + "learning_rate": 1.5297038825547086e-06, + "loss": 0.6631, + "step": 40105 + }, + { + "epoch": 1.03, + "learning_rate": 1.5296804127531927e-06, + "loss": 0.7656, + "step": 40106 + }, + { + "epoch": 1.03, + "learning_rate": 1.5296569425461247e-06, + "loss": 0.6313, + "step": 40107 + }, + { + "epoch": 1.03, + "learning_rate": 1.5296334719335232e-06, + "loss": 0.6567, + "step": 40108 + }, + { + "epoch": 1.03, + "learning_rate": 1.5296100009154054e-06, + "loss": 0.5757, + "step": 40109 + }, + { + "epoch": 1.03, + "learning_rate": 1.5295865294917895e-06, + "loss": 0.5737, + "step": 40110 + }, + { + "epoch": 1.03, + "learning_rate": 1.5295630576626937e-06, + "loss": 0.7334, + "step": 40111 + }, + { + "epoch": 1.03, + "learning_rate": 1.5295395854281358e-06, + "loss": 0.835, + "step": 40112 + }, + { + "epoch": 1.03, + "learning_rate": 1.5295161127881336e-06, + "loss": 0.6582, + "step": 40113 + }, + { + "epoch": 1.03, + "learning_rate": 1.5294926397427052e-06, + "loss": 0.6304, + "step": 40114 + }, + { + "epoch": 1.03, + "learning_rate": 1.5294691662918688e-06, + "loss": 0.5928, + "step": 40115 + }, + { + "epoch": 1.03, + "learning_rate": 1.5294456924356425e-06, + "loss": 0.5762, + "step": 40116 + }, + { + "epoch": 1.03, + "learning_rate": 1.5294222181740437e-06, + "loss": 0.7495, + "step": 40117 + }, + { + "epoch": 1.03, + "learning_rate": 1.5293987435070908e-06, + "loss": 0.5037, + "step": 40118 + }, + { + "epoch": 1.03, + "learning_rate": 1.5293752684348013e-06, + "loss": 0.8096, + "step": 40119 + }, + { + "epoch": 1.03, + "learning_rate": 1.5293517929571938e-06, + "loss": 0.5322, + "step": 40120 + }, + { + "epoch": 1.03, + "learning_rate": 1.5293283170742859e-06, + "loss": 0.647, + "step": 40121 + }, + { + "epoch": 1.03, + "learning_rate": 1.5293048407860956e-06, + "loss": 0.5542, + "step": 40122 + }, + { + "epoch": 1.03, + "learning_rate": 1.529281364092641e-06, + "loss": 0.7148, + "step": 40123 + }, + { + "epoch": 1.03, + "learning_rate": 1.5292578869939398e-06, + "loss": 0.7383, + "step": 40124 + }, + { + "epoch": 1.03, + "learning_rate": 1.52923440949001e-06, + "loss": 0.8379, + "step": 40125 + }, + { + "epoch": 1.03, + "learning_rate": 1.5292109315808703e-06, + "loss": 0.6348, + "step": 40126 + }, + { + "epoch": 1.03, + "learning_rate": 1.5291874532665378e-06, + "loss": 0.7217, + "step": 40127 + }, + { + "epoch": 1.03, + "learning_rate": 1.5291639745470311e-06, + "loss": 0.6802, + "step": 40128 + }, + { + "epoch": 1.03, + "learning_rate": 1.5291404954223674e-06, + "loss": 0.6924, + "step": 40129 + }, + { + "epoch": 1.03, + "learning_rate": 1.5291170158925657e-06, + "loss": 0.5718, + "step": 40130 + }, + { + "epoch": 1.03, + "learning_rate": 1.5290935359576432e-06, + "loss": 0.6719, + "step": 40131 + }, + { + "epoch": 1.03, + "learning_rate": 1.5290700556176177e-06, + "loss": 0.7363, + "step": 40132 + }, + { + "epoch": 1.03, + "learning_rate": 1.529046574872508e-06, + "loss": 0.6514, + "step": 40133 + }, + { + "epoch": 1.03, + "learning_rate": 1.5290230937223316e-06, + "loss": 0.5811, + "step": 40134 + }, + { + "epoch": 1.03, + "learning_rate": 1.5289996121671064e-06, + "loss": 0.6733, + "step": 40135 + }, + { + "epoch": 1.03, + "learning_rate": 1.5289761302068506e-06, + "loss": 0.6104, + "step": 40136 + }, + { + "epoch": 1.03, + "learning_rate": 1.5289526478415825e-06, + "loss": 0.6777, + "step": 40137 + }, + { + "epoch": 1.03, + "learning_rate": 1.528929165071319e-06, + "loss": 0.6885, + "step": 40138 + }, + { + "epoch": 1.03, + "learning_rate": 1.5289056818960792e-06, + "loss": 0.5776, + "step": 40139 + }, + { + "epoch": 1.03, + "learning_rate": 1.5288821983158803e-06, + "loss": 0.8545, + "step": 40140 + }, + { + "epoch": 1.03, + "learning_rate": 1.5288587143307412e-06, + "loss": 0.457, + "step": 40141 + }, + { + "epoch": 1.03, + "learning_rate": 1.5288352299406789e-06, + "loss": 0.6465, + "step": 40142 + }, + { + "epoch": 1.03, + "learning_rate": 1.528811745145712e-06, + "loss": 0.6455, + "step": 40143 + }, + { + "epoch": 1.03, + "learning_rate": 1.5287882599458577e-06, + "loss": 0.7646, + "step": 40144 + }, + { + "epoch": 1.03, + "learning_rate": 1.528764774341135e-06, + "loss": 0.6675, + "step": 40145 + }, + { + "epoch": 1.03, + "learning_rate": 1.5287412883315617e-06, + "loss": 0.6582, + "step": 40146 + }, + { + "epoch": 1.03, + "learning_rate": 1.5287178019171552e-06, + "loss": 0.5874, + "step": 40147 + }, + { + "epoch": 1.03, + "learning_rate": 1.5286943150979334e-06, + "loss": 0.6685, + "step": 40148 + }, + { + "epoch": 1.03, + "learning_rate": 1.528670827873915e-06, + "loss": 0.6104, + "step": 40149 + }, + { + "epoch": 1.03, + "learning_rate": 1.5286473402451176e-06, + "loss": 0.7251, + "step": 40150 + }, + { + "epoch": 1.03, + "learning_rate": 1.5286238522115596e-06, + "loss": 0.7666, + "step": 40151 + }, + { + "epoch": 1.03, + "learning_rate": 1.5286003637732585e-06, + "loss": 0.6807, + "step": 40152 + }, + { + "epoch": 1.03, + "learning_rate": 1.528576874930232e-06, + "loss": 0.5703, + "step": 40153 + }, + { + "epoch": 1.03, + "learning_rate": 1.5285533856824988e-06, + "loss": 0.6128, + "step": 40154 + }, + { + "epoch": 1.03, + "learning_rate": 1.5285298960300765e-06, + "loss": 0.6221, + "step": 40155 + }, + { + "epoch": 1.03, + "learning_rate": 1.5285064059729833e-06, + "loss": 0.8599, + "step": 40156 + }, + { + "epoch": 1.03, + "learning_rate": 1.528482915511237e-06, + "loss": 0.8066, + "step": 40157 + }, + { + "epoch": 1.03, + "learning_rate": 1.5284594246448555e-06, + "loss": 0.5361, + "step": 40158 + }, + { + "epoch": 1.03, + "learning_rate": 1.5284359333738567e-06, + "loss": 0.7178, + "step": 40159 + }, + { + "epoch": 1.03, + "learning_rate": 1.5284124416982592e-06, + "loss": 0.6611, + "step": 40160 + }, + { + "epoch": 1.03, + "learning_rate": 1.5283889496180807e-06, + "loss": 0.606, + "step": 40161 + }, + { + "epoch": 1.03, + "learning_rate": 1.5283654571333387e-06, + "loss": 0.9414, + "step": 40162 + }, + { + "epoch": 1.03, + "learning_rate": 1.5283419642440518e-06, + "loss": 0.5947, + "step": 40163 + }, + { + "epoch": 1.03, + "learning_rate": 1.5283184709502375e-06, + "loss": 0.4712, + "step": 40164 + }, + { + "epoch": 1.03, + "learning_rate": 1.5282949772519143e-06, + "loss": 0.7412, + "step": 40165 + }, + { + "epoch": 1.03, + "learning_rate": 1.5282714831490999e-06, + "loss": 0.5288, + "step": 40166 + }, + { + "epoch": 1.03, + "learning_rate": 1.5282479886418122e-06, + "loss": 0.5126, + "step": 40167 + }, + { + "epoch": 1.03, + "learning_rate": 1.5282244937300694e-06, + "loss": 0.6416, + "step": 40168 + }, + { + "epoch": 1.03, + "learning_rate": 1.5282009984138894e-06, + "loss": 0.5874, + "step": 40169 + }, + { + "epoch": 1.03, + "learning_rate": 1.5281775026932899e-06, + "loss": 0.6611, + "step": 40170 + }, + { + "epoch": 1.03, + "learning_rate": 1.5281540065682897e-06, + "loss": 0.54, + "step": 40171 + }, + { + "epoch": 1.03, + "learning_rate": 1.5281305100389059e-06, + "loss": 0.709, + "step": 40172 + }, + { + "epoch": 1.03, + "learning_rate": 1.5281070131051568e-06, + "loss": 0.8408, + "step": 40173 + }, + { + "epoch": 1.03, + "learning_rate": 1.5280835157670606e-06, + "loss": 0.6865, + "step": 40174 + }, + { + "epoch": 1.03, + "learning_rate": 1.528060018024635e-06, + "loss": 0.6738, + "step": 40175 + }, + { + "epoch": 1.03, + "learning_rate": 1.5280365198778982e-06, + "loss": 0.3823, + "step": 40176 + }, + { + "epoch": 1.03, + "learning_rate": 1.5280130213268682e-06, + "loss": 0.7544, + "step": 40177 + }, + { + "epoch": 1.03, + "learning_rate": 1.5279895223715628e-06, + "loss": 0.5664, + "step": 40178 + }, + { + "epoch": 1.03, + "learning_rate": 1.5279660230120005e-06, + "loss": 0.6162, + "step": 40179 + }, + { + "epoch": 1.03, + "learning_rate": 1.5279425232481982e-06, + "loss": 0.6191, + "step": 40180 + }, + { + "epoch": 1.03, + "learning_rate": 1.5279190230801754e-06, + "loss": 0.5186, + "step": 40181 + }, + { + "epoch": 1.03, + "learning_rate": 1.5278955225079484e-06, + "loss": 0.8008, + "step": 40182 + }, + { + "epoch": 1.03, + "learning_rate": 1.5278720215315363e-06, + "loss": 0.5017, + "step": 40183 + }, + { + "epoch": 1.03, + "learning_rate": 1.527848520150957e-06, + "loss": 0.7334, + "step": 40184 + }, + { + "epoch": 1.03, + "learning_rate": 1.5278250183662284e-06, + "loss": 0.5752, + "step": 40185 + }, + { + "epoch": 1.03, + "learning_rate": 1.5278015161773687e-06, + "loss": 0.6768, + "step": 40186 + }, + { + "epoch": 1.03, + "learning_rate": 1.5277780135843953e-06, + "loss": 0.7422, + "step": 40187 + }, + { + "epoch": 1.03, + "learning_rate": 1.5277545105873269e-06, + "loss": 0.5889, + "step": 40188 + }, + { + "epoch": 1.03, + "learning_rate": 1.5277310071861807e-06, + "loss": 0.6367, + "step": 40189 + }, + { + "epoch": 1.03, + "learning_rate": 1.5277075033809753e-06, + "loss": 0.7256, + "step": 40190 + }, + { + "epoch": 1.03, + "learning_rate": 1.5276839991717288e-06, + "loss": 0.7124, + "step": 40191 + }, + { + "epoch": 1.03, + "learning_rate": 1.5276604945584586e-06, + "loss": 0.6123, + "step": 40192 + }, + { + "epoch": 1.03, + "learning_rate": 1.527636989541183e-06, + "loss": 0.7227, + "step": 40193 + }, + { + "epoch": 1.03, + "learning_rate": 1.52761348411992e-06, + "loss": 0.6694, + "step": 40194 + }, + { + "epoch": 1.03, + "learning_rate": 1.5275899782946877e-06, + "loss": 0.5752, + "step": 40195 + }, + { + "epoch": 1.03, + "learning_rate": 1.5275664720655042e-06, + "loss": 0.6543, + "step": 40196 + }, + { + "epoch": 1.03, + "learning_rate": 1.5275429654323871e-06, + "loss": 0.6265, + "step": 40197 + }, + { + "epoch": 1.03, + "learning_rate": 1.5275194583953548e-06, + "loss": 0.5386, + "step": 40198 + }, + { + "epoch": 1.03, + "learning_rate": 1.527495950954425e-06, + "loss": 0.6895, + "step": 40199 + }, + { + "epoch": 1.03, + "learning_rate": 1.5274724431096155e-06, + "loss": 0.5701, + "step": 40200 + }, + { + "epoch": 1.03, + "learning_rate": 1.5274489348609449e-06, + "loss": 0.5483, + "step": 40201 + }, + { + "epoch": 1.03, + "learning_rate": 1.527425426208431e-06, + "loss": 0.644, + "step": 40202 + }, + { + "epoch": 1.03, + "learning_rate": 1.5274019171520914e-06, + "loss": 0.5747, + "step": 40203 + }, + { + "epoch": 1.03, + "learning_rate": 1.5273784076919447e-06, + "loss": 0.6504, + "step": 40204 + }, + { + "epoch": 1.03, + "learning_rate": 1.5273548978280081e-06, + "loss": 0.7119, + "step": 40205 + }, + { + "epoch": 1.03, + "learning_rate": 1.5273313875603009e-06, + "loss": 0.6074, + "step": 40206 + }, + { + "epoch": 1.03, + "learning_rate": 1.5273078768888397e-06, + "loss": 0.6978, + "step": 40207 + }, + { + "epoch": 1.03, + "learning_rate": 1.5272843658136437e-06, + "loss": 0.5632, + "step": 40208 + }, + { + "epoch": 1.03, + "learning_rate": 1.5272608543347297e-06, + "loss": 0.542, + "step": 40209 + }, + { + "epoch": 1.03, + "learning_rate": 1.5272373424521162e-06, + "loss": 0.7427, + "step": 40210 + }, + { + "epoch": 1.03, + "learning_rate": 1.5272138301658219e-06, + "loss": 0.6611, + "step": 40211 + }, + { + "epoch": 1.03, + "learning_rate": 1.527190317475864e-06, + "loss": 0.7188, + "step": 40212 + }, + { + "epoch": 1.03, + "learning_rate": 1.5271668043822605e-06, + "loss": 0.7275, + "step": 40213 + }, + { + "epoch": 1.03, + "learning_rate": 1.5271432908850299e-06, + "loss": 0.7222, + "step": 40214 + }, + { + "epoch": 1.03, + "learning_rate": 1.5271197769841897e-06, + "loss": 0.6519, + "step": 40215 + }, + { + "epoch": 1.03, + "learning_rate": 1.527096262679758e-06, + "loss": 0.5625, + "step": 40216 + }, + { + "epoch": 1.03, + "learning_rate": 1.5270727479717533e-06, + "loss": 0.5977, + "step": 40217 + }, + { + "epoch": 1.03, + "learning_rate": 1.5270492328601931e-06, + "loss": 0.7637, + "step": 40218 + }, + { + "epoch": 1.03, + "learning_rate": 1.5270257173450956e-06, + "loss": 0.5923, + "step": 40219 + }, + { + "epoch": 1.03, + "learning_rate": 1.5270022014264785e-06, + "loss": 0.6992, + "step": 40220 + }, + { + "epoch": 1.03, + "learning_rate": 1.5269786851043604e-06, + "loss": 0.6003, + "step": 40221 + }, + { + "epoch": 1.03, + "learning_rate": 1.5269551683787586e-06, + "loss": 0.7041, + "step": 40222 + }, + { + "epoch": 1.03, + "learning_rate": 1.5269316512496916e-06, + "loss": 0.6816, + "step": 40223 + }, + { + "epoch": 1.03, + "learning_rate": 1.5269081337171772e-06, + "loss": 0.7109, + "step": 40224 + }, + { + "epoch": 1.03, + "learning_rate": 1.5268846157812337e-06, + "loss": 0.5659, + "step": 40225 + }, + { + "epoch": 1.03, + "learning_rate": 1.5268610974418788e-06, + "loss": 0.5107, + "step": 40226 + }, + { + "epoch": 1.03, + "learning_rate": 1.5268375786991303e-06, + "loss": 0.8135, + "step": 40227 + }, + { + "epoch": 1.03, + "learning_rate": 1.5268140595530069e-06, + "loss": 0.7715, + "step": 40228 + }, + { + "epoch": 1.03, + "learning_rate": 1.526790540003526e-06, + "loss": 0.5854, + "step": 40229 + }, + { + "epoch": 1.03, + "learning_rate": 1.5267670200507055e-06, + "loss": 0.7969, + "step": 40230 + }, + { + "epoch": 1.03, + "learning_rate": 1.5267434996945643e-06, + "loss": 0.8135, + "step": 40231 + }, + { + "epoch": 1.03, + "learning_rate": 1.5267199789351195e-06, + "loss": 0.7178, + "step": 40232 + }, + { + "epoch": 1.03, + "learning_rate": 1.5266964577723895e-06, + "loss": 0.7544, + "step": 40233 + }, + { + "epoch": 1.03, + "learning_rate": 1.5266729362063919e-06, + "loss": 0.6104, + "step": 40234 + }, + { + "epoch": 1.03, + "learning_rate": 1.5266494142371455e-06, + "loss": 0.4678, + "step": 40235 + }, + { + "epoch": 1.03, + "learning_rate": 1.5266258918646677e-06, + "loss": 0.7207, + "step": 40236 + }, + { + "epoch": 1.03, + "learning_rate": 1.5266023690889767e-06, + "loss": 0.5845, + "step": 40237 + }, + { + "epoch": 1.03, + "learning_rate": 1.5265788459100905e-06, + "loss": 0.5396, + "step": 40238 + }, + { + "epoch": 1.03, + "learning_rate": 1.526555322328027e-06, + "loss": 0.7246, + "step": 40239 + }, + { + "epoch": 1.03, + "learning_rate": 1.5265317983428042e-06, + "loss": 0.4397, + "step": 40240 + }, + { + "epoch": 1.03, + "learning_rate": 1.5265082739544405e-06, + "loss": 0.3918, + "step": 40241 + }, + { + "epoch": 1.03, + "learning_rate": 1.5264847491629536e-06, + "loss": 0.6133, + "step": 40242 + }, + { + "epoch": 1.03, + "learning_rate": 1.5264612239683615e-06, + "loss": 0.7148, + "step": 40243 + }, + { + "epoch": 1.03, + "learning_rate": 1.5264376983706822e-06, + "loss": 0.541, + "step": 40244 + }, + { + "epoch": 1.03, + "learning_rate": 1.5264141723699337e-06, + "loss": 0.6196, + "step": 40245 + }, + { + "epoch": 1.03, + "learning_rate": 1.526390645966134e-06, + "loss": 0.7207, + "step": 40246 + }, + { + "epoch": 1.03, + "learning_rate": 1.5263671191593012e-06, + "loss": 0.6348, + "step": 40247 + }, + { + "epoch": 1.03, + "learning_rate": 1.5263435919494536e-06, + "loss": 0.7075, + "step": 40248 + }, + { + "epoch": 1.03, + "learning_rate": 1.5263200643366086e-06, + "loss": 0.7871, + "step": 40249 + }, + { + "epoch": 1.03, + "learning_rate": 1.5262965363207845e-06, + "loss": 0.666, + "step": 40250 + }, + { + "epoch": 1.03, + "learning_rate": 1.5262730079019996e-06, + "loss": 0.4595, + "step": 40251 + }, + { + "epoch": 1.03, + "learning_rate": 1.5262494790802715e-06, + "loss": 0.7446, + "step": 40252 + }, + { + "epoch": 1.03, + "learning_rate": 1.5262259498556182e-06, + "loss": 0.4453, + "step": 40253 + }, + { + "epoch": 1.03, + "learning_rate": 1.5262024202280583e-06, + "loss": 0.5679, + "step": 40254 + }, + { + "epoch": 1.03, + "learning_rate": 1.5261788901976092e-06, + "loss": 0.5522, + "step": 40255 + }, + { + "epoch": 1.03, + "learning_rate": 1.5261553597642891e-06, + "loss": 0.7969, + "step": 40256 + }, + { + "epoch": 1.03, + "learning_rate": 1.5261318289281162e-06, + "loss": 0.7344, + "step": 40257 + }, + { + "epoch": 1.03, + "learning_rate": 1.5261082976891081e-06, + "loss": 0.6357, + "step": 40258 + }, + { + "epoch": 1.03, + "learning_rate": 1.5260847660472832e-06, + "loss": 0.7212, + "step": 40259 + }, + { + "epoch": 1.03, + "learning_rate": 1.5260612340026593e-06, + "loss": 0.6001, + "step": 40260 + }, + { + "epoch": 1.03, + "learning_rate": 1.5260377015552546e-06, + "loss": 0.5586, + "step": 40261 + }, + { + "epoch": 1.03, + "learning_rate": 1.5260141687050872e-06, + "loss": 0.6738, + "step": 40262 + }, + { + "epoch": 1.03, + "learning_rate": 1.5259906354521745e-06, + "loss": 0.7373, + "step": 40263 + }, + { + "epoch": 1.03, + "learning_rate": 1.5259671017965352e-06, + "loss": 0.5457, + "step": 40264 + }, + { + "epoch": 1.03, + "learning_rate": 1.525943567738187e-06, + "loss": 0.5225, + "step": 40265 + }, + { + "epoch": 1.03, + "learning_rate": 1.5259200332771477e-06, + "loss": 0.6738, + "step": 40266 + }, + { + "epoch": 1.03, + "learning_rate": 1.5258964984134362e-06, + "loss": 0.603, + "step": 40267 + }, + { + "epoch": 1.03, + "learning_rate": 1.5258729631470696e-06, + "loss": 0.7588, + "step": 40268 + }, + { + "epoch": 1.03, + "learning_rate": 1.5258494274780664e-06, + "loss": 0.5657, + "step": 40269 + }, + { + "epoch": 1.03, + "learning_rate": 1.5258258914064444e-06, + "loss": 0.6143, + "step": 40270 + }, + { + "epoch": 1.03, + "learning_rate": 1.525802354932222e-06, + "loss": 0.6338, + "step": 40271 + }, + { + "epoch": 1.03, + "learning_rate": 1.5257788180554164e-06, + "loss": 0.5596, + "step": 40272 + }, + { + "epoch": 1.03, + "learning_rate": 1.5257552807760463e-06, + "loss": 0.5576, + "step": 40273 + }, + { + "epoch": 1.03, + "learning_rate": 1.5257317430941294e-06, + "loss": 0.5352, + "step": 40274 + }, + { + "epoch": 1.03, + "learning_rate": 1.5257082050096842e-06, + "loss": 0.7744, + "step": 40275 + }, + { + "epoch": 1.03, + "learning_rate": 1.5256846665227283e-06, + "loss": 0.5674, + "step": 40276 + }, + { + "epoch": 1.03, + "learning_rate": 1.5256611276332797e-06, + "loss": 0.7041, + "step": 40277 + }, + { + "epoch": 1.03, + "learning_rate": 1.5256375883413566e-06, + "loss": 0.4795, + "step": 40278 + }, + { + "epoch": 1.03, + "learning_rate": 1.525614048646977e-06, + "loss": 0.5117, + "step": 40279 + }, + { + "epoch": 1.03, + "learning_rate": 1.525590508550159e-06, + "loss": 0.5342, + "step": 40280 + }, + { + "epoch": 1.03, + "learning_rate": 1.5255669680509207e-06, + "loss": 0.7861, + "step": 40281 + }, + { + "epoch": 1.03, + "learning_rate": 1.5255434271492795e-06, + "loss": 0.6157, + "step": 40282 + }, + { + "epoch": 1.03, + "learning_rate": 1.525519885845254e-06, + "loss": 0.7637, + "step": 40283 + }, + { + "epoch": 1.03, + "learning_rate": 1.5254963441388623e-06, + "loss": 0.5264, + "step": 40284 + }, + { + "epoch": 1.03, + "learning_rate": 1.525472802030122e-06, + "loss": 0.7969, + "step": 40285 + }, + { + "epoch": 1.03, + "learning_rate": 1.525449259519051e-06, + "loss": 0.6885, + "step": 40286 + }, + { + "epoch": 1.03, + "learning_rate": 1.5254257166056683e-06, + "loss": 0.6055, + "step": 40287 + }, + { + "epoch": 1.03, + "learning_rate": 1.5254021732899908e-06, + "loss": 0.5337, + "step": 40288 + }, + { + "epoch": 1.03, + "learning_rate": 1.5253786295720373e-06, + "loss": 0.5103, + "step": 40289 + }, + { + "epoch": 1.03, + "learning_rate": 1.5253550854518254e-06, + "loss": 0.6118, + "step": 40290 + }, + { + "epoch": 1.03, + "learning_rate": 1.5253315409293735e-06, + "loss": 0.6953, + "step": 40291 + }, + { + "epoch": 1.03, + "learning_rate": 1.5253079960046994e-06, + "loss": 0.6436, + "step": 40292 + }, + { + "epoch": 1.03, + "learning_rate": 1.525284450677821e-06, + "loss": 0.5806, + "step": 40293 + }, + { + "epoch": 1.03, + "learning_rate": 1.5252609049487562e-06, + "loss": 0.6138, + "step": 40294 + }, + { + "epoch": 1.03, + "learning_rate": 1.5252373588175234e-06, + "loss": 0.54, + "step": 40295 + }, + { + "epoch": 1.03, + "learning_rate": 1.5252138122841407e-06, + "loss": 0.7461, + "step": 40296 + }, + { + "epoch": 1.03, + "learning_rate": 1.5251902653486258e-06, + "loss": 0.6733, + "step": 40297 + }, + { + "epoch": 1.03, + "learning_rate": 1.5251667180109968e-06, + "loss": 0.6885, + "step": 40298 + }, + { + "epoch": 1.03, + "learning_rate": 1.5251431702712717e-06, + "loss": 0.7227, + "step": 40299 + }, + { + "epoch": 1.03, + "learning_rate": 1.5251196221294688e-06, + "loss": 0.7637, + "step": 40300 + }, + { + "epoch": 1.03, + "learning_rate": 1.5250960735856062e-06, + "loss": 0.7246, + "step": 40301 + }, + { + "epoch": 1.03, + "learning_rate": 1.5250725246397016e-06, + "loss": 0.5972, + "step": 40302 + }, + { + "epoch": 1.03, + "learning_rate": 1.5250489752917725e-06, + "loss": 0.6389, + "step": 40303 + }, + { + "epoch": 1.03, + "learning_rate": 1.5250254255418383e-06, + "loss": 0.5925, + "step": 40304 + }, + { + "epoch": 1.03, + "learning_rate": 1.5250018753899157e-06, + "loss": 0.7173, + "step": 40305 + }, + { + "epoch": 1.03, + "learning_rate": 1.5249783248360238e-06, + "loss": 0.8154, + "step": 40306 + }, + { + "epoch": 1.03, + "learning_rate": 1.5249547738801798e-06, + "loss": 0.6221, + "step": 40307 + }, + { + "epoch": 1.03, + "learning_rate": 1.5249312225224022e-06, + "loss": 0.751, + "step": 40308 + }, + { + "epoch": 1.03, + "learning_rate": 1.5249076707627086e-06, + "loss": 0.6816, + "step": 40309 + }, + { + "epoch": 1.03, + "learning_rate": 1.5248841186011179e-06, + "loss": 0.5701, + "step": 40310 + }, + { + "epoch": 1.03, + "learning_rate": 1.5248605660376473e-06, + "loss": 0.71, + "step": 40311 + }, + { + "epoch": 1.03, + "learning_rate": 1.524837013072315e-06, + "loss": 0.7207, + "step": 40312 + }, + { + "epoch": 1.03, + "learning_rate": 1.5248134597051393e-06, + "loss": 0.7822, + "step": 40313 + }, + { + "epoch": 1.03, + "learning_rate": 1.5247899059361378e-06, + "loss": 0.6758, + "step": 40314 + }, + { + "epoch": 1.03, + "learning_rate": 1.5247663517653288e-06, + "loss": 0.7402, + "step": 40315 + }, + { + "epoch": 1.03, + "learning_rate": 1.5247427971927306e-06, + "loss": 0.6343, + "step": 40316 + }, + { + "epoch": 1.03, + "learning_rate": 1.524719242218361e-06, + "loss": 0.7012, + "step": 40317 + }, + { + "epoch": 1.03, + "learning_rate": 1.5246956868422377e-06, + "loss": 0.7842, + "step": 40318 + }, + { + "epoch": 1.03, + "learning_rate": 1.5246721310643792e-06, + "loss": 0.4756, + "step": 40319 + }, + { + "epoch": 1.03, + "learning_rate": 1.5246485748848032e-06, + "loss": 0.79, + "step": 40320 + }, + { + "epoch": 1.03, + "learning_rate": 1.5246250183035282e-06, + "loss": 0.7021, + "step": 40321 + }, + { + "epoch": 1.03, + "learning_rate": 1.524601461320572e-06, + "loss": 0.4829, + "step": 40322 + }, + { + "epoch": 1.03, + "learning_rate": 1.5245779039359523e-06, + "loss": 0.8398, + "step": 40323 + }, + { + "epoch": 1.03, + "learning_rate": 1.5245543461496874e-06, + "loss": 0.668, + "step": 40324 + }, + { + "epoch": 1.03, + "learning_rate": 1.5245307879617957e-06, + "loss": 0.4725, + "step": 40325 + }, + { + "epoch": 1.03, + "learning_rate": 1.5245072293722947e-06, + "loss": 0.6436, + "step": 40326 + }, + { + "epoch": 1.03, + "learning_rate": 1.5244836703812025e-06, + "loss": 0.6104, + "step": 40327 + }, + { + "epoch": 1.03, + "learning_rate": 1.5244601109885373e-06, + "loss": 0.5908, + "step": 40328 + }, + { + "epoch": 1.03, + "learning_rate": 1.5244365511943173e-06, + "loss": 0.6895, + "step": 40329 + }, + { + "epoch": 1.03, + "learning_rate": 1.5244129909985604e-06, + "loss": 0.6528, + "step": 40330 + }, + { + "epoch": 1.03, + "learning_rate": 1.5243894304012841e-06, + "loss": 0.5469, + "step": 40331 + }, + { + "epoch": 1.03, + "learning_rate": 1.5243658694025074e-06, + "loss": 0.5938, + "step": 40332 + }, + { + "epoch": 1.03, + "learning_rate": 1.5243423080022475e-06, + "loss": 0.71, + "step": 40333 + }, + { + "epoch": 1.03, + "learning_rate": 1.5243187462005232e-06, + "loss": 0.6094, + "step": 40334 + }, + { + "epoch": 1.03, + "learning_rate": 1.5242951839973518e-06, + "loss": 0.4534, + "step": 40335 + }, + { + "epoch": 1.03, + "learning_rate": 1.524271621392752e-06, + "loss": 0.5657, + "step": 40336 + }, + { + "epoch": 1.03, + "learning_rate": 1.5242480583867415e-06, + "loss": 0.5425, + "step": 40337 + }, + { + "epoch": 1.03, + "learning_rate": 1.524224494979338e-06, + "loss": 0.7715, + "step": 40338 + }, + { + "epoch": 1.03, + "learning_rate": 1.52420093117056e-06, + "loss": 0.5151, + "step": 40339 + }, + { + "epoch": 1.03, + "learning_rate": 1.524177366960426e-06, + "loss": 0.4988, + "step": 40340 + }, + { + "epoch": 1.03, + "learning_rate": 1.524153802348953e-06, + "loss": 0.5723, + "step": 40341 + }, + { + "epoch": 1.03, + "learning_rate": 1.5241302373361597e-06, + "loss": 0.7637, + "step": 40342 + }, + { + "epoch": 1.03, + "learning_rate": 1.5241066719220639e-06, + "loss": 0.7871, + "step": 40343 + }, + { + "epoch": 1.03, + "learning_rate": 1.5240831061066837e-06, + "loss": 0.7754, + "step": 40344 + }, + { + "epoch": 1.03, + "learning_rate": 1.5240595398900373e-06, + "loss": 0.8291, + "step": 40345 + }, + { + "epoch": 1.03, + "learning_rate": 1.5240359732721425e-06, + "loss": 0.5913, + "step": 40346 + }, + { + "epoch": 1.03, + "learning_rate": 1.5240124062530173e-06, + "loss": 0.6699, + "step": 40347 + }, + { + "epoch": 1.03, + "learning_rate": 1.5239888388326803e-06, + "loss": 0.5947, + "step": 40348 + }, + { + "epoch": 1.03, + "learning_rate": 1.5239652710111485e-06, + "loss": 0.5684, + "step": 40349 + }, + { + "epoch": 1.03, + "learning_rate": 1.5239417027884411e-06, + "loss": 0.8799, + "step": 40350 + }, + { + "epoch": 1.03, + "learning_rate": 1.5239181341645754e-06, + "loss": 0.7676, + "step": 40351 + }, + { + "epoch": 1.03, + "learning_rate": 1.52389456513957e-06, + "loss": 0.541, + "step": 40352 + }, + { + "epoch": 1.03, + "learning_rate": 1.5238709957134424e-06, + "loss": 0.6797, + "step": 40353 + }, + { + "epoch": 1.03, + "learning_rate": 1.5238474258862107e-06, + "loss": 0.5947, + "step": 40354 + }, + { + "epoch": 1.03, + "learning_rate": 1.5238238556578934e-06, + "loss": 0.5814, + "step": 40355 + }, + { + "epoch": 1.03, + "learning_rate": 1.523800285028508e-06, + "loss": 0.6206, + "step": 40356 + }, + { + "epoch": 1.03, + "learning_rate": 1.5237767139980732e-06, + "loss": 0.5498, + "step": 40357 + }, + { + "epoch": 1.03, + "learning_rate": 1.5237531425666062e-06, + "loss": 0.6699, + "step": 40358 + }, + { + "epoch": 1.03, + "learning_rate": 1.5237295707341256e-06, + "loss": 0.4746, + "step": 40359 + }, + { + "epoch": 1.03, + "learning_rate": 1.5237059985006495e-06, + "loss": 0.6567, + "step": 40360 + }, + { + "epoch": 1.03, + "learning_rate": 1.523682425866196e-06, + "loss": 0.6768, + "step": 40361 + }, + { + "epoch": 1.03, + "learning_rate": 1.5236588528307826e-06, + "loss": 0.6885, + "step": 40362 + }, + { + "epoch": 1.03, + "learning_rate": 1.5236352793944275e-06, + "loss": 0.6006, + "step": 40363 + }, + { + "epoch": 1.03, + "learning_rate": 1.5236117055571494e-06, + "loss": 0.6377, + "step": 40364 + }, + { + "epoch": 1.03, + "learning_rate": 1.5235881313189659e-06, + "loss": 0.5483, + "step": 40365 + }, + { + "epoch": 1.03, + "learning_rate": 1.5235645566798948e-06, + "loss": 0.8823, + "step": 40366 + }, + { + "epoch": 1.03, + "learning_rate": 1.5235409816399544e-06, + "loss": 0.6074, + "step": 40367 + }, + { + "epoch": 1.03, + "learning_rate": 1.5235174061991628e-06, + "loss": 0.7422, + "step": 40368 + }, + { + "epoch": 1.03, + "learning_rate": 1.523493830357538e-06, + "loss": 0.4232, + "step": 40369 + }, + { + "epoch": 1.03, + "learning_rate": 1.5234702541150978e-06, + "loss": 0.7109, + "step": 40370 + }, + { + "epoch": 1.03, + "learning_rate": 1.523446677471861e-06, + "loss": 0.6235, + "step": 40371 + }, + { + "epoch": 1.03, + "learning_rate": 1.5234231004278449e-06, + "loss": 0.7852, + "step": 40372 + }, + { + "epoch": 1.03, + "learning_rate": 1.5233995229830678e-06, + "loss": 0.6987, + "step": 40373 + }, + { + "epoch": 1.03, + "learning_rate": 1.5233759451375473e-06, + "loss": 0.4094, + "step": 40374 + }, + { + "epoch": 1.03, + "learning_rate": 1.5233523668913026e-06, + "loss": 0.5972, + "step": 40375 + }, + { + "epoch": 1.03, + "learning_rate": 1.523328788244351e-06, + "loss": 0.7012, + "step": 40376 + }, + { + "epoch": 1.03, + "learning_rate": 1.5233052091967103e-06, + "loss": 0.5234, + "step": 40377 + }, + { + "epoch": 1.03, + "learning_rate": 1.523281629748399e-06, + "loss": 0.644, + "step": 40378 + }, + { + "epoch": 1.03, + "learning_rate": 1.5232580498994347e-06, + "loss": 0.6631, + "step": 40379 + }, + { + "epoch": 1.03, + "learning_rate": 1.5232344696498363e-06, + "loss": 0.6074, + "step": 40380 + }, + { + "epoch": 1.03, + "learning_rate": 1.523210888999621e-06, + "loss": 0.4011, + "step": 40381 + }, + { + "epoch": 1.04, + "learning_rate": 1.5231873079488074e-06, + "loss": 0.5046, + "step": 40382 + }, + { + "epoch": 1.04, + "learning_rate": 1.5231637264974131e-06, + "loss": 0.6401, + "step": 40383 + }, + { + "epoch": 1.04, + "learning_rate": 1.5231401446454567e-06, + "loss": 0.7139, + "step": 40384 + }, + { + "epoch": 1.04, + "learning_rate": 1.5231165623929555e-06, + "loss": 0.5261, + "step": 40385 + }, + { + "epoch": 1.04, + "learning_rate": 1.5230929797399283e-06, + "loss": 0.6899, + "step": 40386 + }, + { + "epoch": 1.04, + "learning_rate": 1.5230693966863925e-06, + "loss": 0.6279, + "step": 40387 + }, + { + "epoch": 1.04, + "learning_rate": 1.5230458132323669e-06, + "loss": 0.6777, + "step": 40388 + }, + { + "epoch": 1.04, + "learning_rate": 1.5230222293778692e-06, + "loss": 0.627, + "step": 40389 + }, + { + "epoch": 1.04, + "learning_rate": 1.5229986451229175e-06, + "loss": 0.5352, + "step": 40390 + }, + { + "epoch": 1.04, + "learning_rate": 1.5229750604675294e-06, + "loss": 0.7959, + "step": 40391 + }, + { + "epoch": 1.04, + "learning_rate": 1.5229514754117236e-06, + "loss": 0.6255, + "step": 40392 + }, + { + "epoch": 1.04, + "learning_rate": 1.5229278899555179e-06, + "loss": 0.6455, + "step": 40393 + }, + { + "epoch": 1.04, + "learning_rate": 1.5229043040989303e-06, + "loss": 0.6836, + "step": 40394 + }, + { + "epoch": 1.04, + "learning_rate": 1.522880717841979e-06, + "loss": 0.6016, + "step": 40395 + }, + { + "epoch": 1.04, + "learning_rate": 1.5228571311846817e-06, + "loss": 0.6416, + "step": 40396 + }, + { + "epoch": 1.04, + "learning_rate": 1.522833544127057e-06, + "loss": 0.5962, + "step": 40397 + }, + { + "epoch": 1.04, + "learning_rate": 1.5228099566691225e-06, + "loss": 0.6313, + "step": 40398 + }, + { + "epoch": 1.04, + "learning_rate": 1.5227863688108966e-06, + "loss": 0.7266, + "step": 40399 + }, + { + "epoch": 1.04, + "learning_rate": 1.5227627805523973e-06, + "loss": 0.6001, + "step": 40400 + }, + { + "epoch": 1.04, + "learning_rate": 1.5227391918936424e-06, + "loss": 0.5508, + "step": 40401 + }, + { + "epoch": 1.04, + "learning_rate": 1.52271560283465e-06, + "loss": 0.8496, + "step": 40402 + }, + { + "epoch": 1.04, + "learning_rate": 1.5226920133754387e-06, + "loss": 0.7344, + "step": 40403 + }, + { + "epoch": 1.04, + "learning_rate": 1.5226684235160258e-06, + "loss": 0.79, + "step": 40404 + }, + { + "epoch": 1.04, + "learning_rate": 1.52264483325643e-06, + "loss": 0.7139, + "step": 40405 + }, + { + "epoch": 1.04, + "learning_rate": 1.5226212425966689e-06, + "loss": 0.626, + "step": 40406 + }, + { + "epoch": 1.04, + "learning_rate": 1.522597651536761e-06, + "loss": 0.8154, + "step": 40407 + }, + { + "epoch": 1.04, + "learning_rate": 1.5225740600767238e-06, + "loss": 0.6572, + "step": 40408 + }, + { + "epoch": 1.04, + "learning_rate": 1.5225504682165759e-06, + "loss": 0.6587, + "step": 40409 + }, + { + "epoch": 1.04, + "learning_rate": 1.522526875956335e-06, + "loss": 0.5928, + "step": 40410 + }, + { + "epoch": 1.04, + "learning_rate": 1.5225032832960194e-06, + "loss": 0.6729, + "step": 40411 + }, + { + "epoch": 1.04, + "learning_rate": 1.522479690235647e-06, + "loss": 0.604, + "step": 40412 + }, + { + "epoch": 1.04, + "learning_rate": 1.5224560967752357e-06, + "loss": 0.5864, + "step": 40413 + }, + { + "epoch": 1.04, + "learning_rate": 1.5224325029148042e-06, + "loss": 0.709, + "step": 40414 + }, + { + "epoch": 1.04, + "learning_rate": 1.5224089086543702e-06, + "loss": 0.5889, + "step": 40415 + }, + { + "epoch": 1.04, + "learning_rate": 1.522385313993951e-06, + "loss": 0.6445, + "step": 40416 + }, + { + "epoch": 1.04, + "learning_rate": 1.5223617189335661e-06, + "loss": 0.7227, + "step": 40417 + }, + { + "epoch": 1.04, + "learning_rate": 1.5223381234732324e-06, + "loss": 0.7354, + "step": 40418 + }, + { + "epoch": 1.04, + "learning_rate": 1.522314527612969e-06, + "loss": 0.5986, + "step": 40419 + }, + { + "epoch": 1.04, + "learning_rate": 1.5222909313527929e-06, + "loss": 0.6914, + "step": 40420 + }, + { + "epoch": 1.04, + "learning_rate": 1.5222673346927227e-06, + "loss": 0.752, + "step": 40421 + }, + { + "epoch": 1.04, + "learning_rate": 1.5222437376327766e-06, + "loss": 0.5867, + "step": 40422 + }, + { + "epoch": 1.04, + "learning_rate": 1.5222201401729722e-06, + "loss": 0.793, + "step": 40423 + }, + { + "epoch": 1.04, + "learning_rate": 1.522196542313328e-06, + "loss": 0.5144, + "step": 40424 + }, + { + "epoch": 1.04, + "learning_rate": 1.5221729440538619e-06, + "loss": 0.583, + "step": 40425 + }, + { + "epoch": 1.04, + "learning_rate": 1.5221493453945922e-06, + "loss": 0.6421, + "step": 40426 + }, + { + "epoch": 1.04, + "learning_rate": 1.5221257463355364e-06, + "loss": 0.748, + "step": 40427 + }, + { + "epoch": 1.04, + "learning_rate": 1.5221021468767131e-06, + "loss": 0.6304, + "step": 40428 + }, + { + "epoch": 1.04, + "learning_rate": 1.52207854701814e-06, + "loss": 0.6172, + "step": 40429 + }, + { + "epoch": 1.04, + "learning_rate": 1.522054946759836e-06, + "loss": 0.6213, + "step": 40430 + }, + { + "epoch": 1.04, + "learning_rate": 1.522031346101818e-06, + "loss": 0.5044, + "step": 40431 + }, + { + "epoch": 1.04, + "learning_rate": 1.5220077450441044e-06, + "loss": 0.7559, + "step": 40432 + }, + { + "epoch": 1.04, + "learning_rate": 1.5219841435867139e-06, + "loss": 0.6606, + "step": 40433 + }, + { + "epoch": 1.04, + "learning_rate": 1.5219605417296642e-06, + "loss": 0.8555, + "step": 40434 + }, + { + "epoch": 1.04, + "learning_rate": 1.5219369394729729e-06, + "loss": 0.8516, + "step": 40435 + }, + { + "epoch": 1.04, + "learning_rate": 1.521913336816659e-06, + "loss": 0.6143, + "step": 40436 + }, + { + "epoch": 1.04, + "learning_rate": 1.5218897337607395e-06, + "loss": 0.4189, + "step": 40437 + }, + { + "epoch": 1.04, + "learning_rate": 1.5218661303052334e-06, + "loss": 0.7725, + "step": 40438 + }, + { + "epoch": 1.04, + "learning_rate": 1.521842526450158e-06, + "loss": 0.6233, + "step": 40439 + }, + { + "epoch": 1.04, + "learning_rate": 1.5218189221955323e-06, + "loss": 0.5842, + "step": 40440 + }, + { + "epoch": 1.04, + "learning_rate": 1.5217953175413735e-06, + "loss": 0.7676, + "step": 40441 + }, + { + "epoch": 1.04, + "learning_rate": 1.5217717124877e-06, + "loss": 0.7979, + "step": 40442 + }, + { + "epoch": 1.04, + "learning_rate": 1.5217481070345302e-06, + "loss": 0.6738, + "step": 40443 + }, + { + "epoch": 1.04, + "learning_rate": 1.5217245011818815e-06, + "loss": 0.7178, + "step": 40444 + }, + { + "epoch": 1.04, + "learning_rate": 1.5217008949297726e-06, + "loss": 0.7837, + "step": 40445 + }, + { + "epoch": 1.04, + "learning_rate": 1.5216772882782213e-06, + "loss": 0.5835, + "step": 40446 + }, + { + "epoch": 1.04, + "learning_rate": 1.5216536812272456e-06, + "loss": 0.6338, + "step": 40447 + }, + { + "epoch": 1.04, + "learning_rate": 1.5216300737768638e-06, + "loss": 0.7324, + "step": 40448 + }, + { + "epoch": 1.04, + "learning_rate": 1.5216064659270935e-06, + "loss": 0.6895, + "step": 40449 + }, + { + "epoch": 1.04, + "learning_rate": 1.5215828576779535e-06, + "loss": 0.8125, + "step": 40450 + }, + { + "epoch": 1.04, + "learning_rate": 1.5215592490294613e-06, + "loss": 0.7451, + "step": 40451 + }, + { + "epoch": 1.04, + "learning_rate": 1.5215356399816351e-06, + "loss": 0.6187, + "step": 40452 + }, + { + "epoch": 1.04, + "learning_rate": 1.521512030534493e-06, + "loss": 0.6387, + "step": 40453 + }, + { + "epoch": 1.04, + "learning_rate": 1.5214884206880534e-06, + "loss": 0.5664, + "step": 40454 + }, + { + "epoch": 1.04, + "learning_rate": 1.521464810442334e-06, + "loss": 0.603, + "step": 40455 + }, + { + "epoch": 1.04, + "learning_rate": 1.5214411997973528e-06, + "loss": 0.7222, + "step": 40456 + }, + { + "epoch": 1.04, + "learning_rate": 1.5214175887531283e-06, + "loss": 0.5889, + "step": 40457 + }, + { + "epoch": 1.04, + "learning_rate": 1.521393977309678e-06, + "loss": 0.5972, + "step": 40458 + }, + { + "epoch": 1.04, + "learning_rate": 1.5213703654670206e-06, + "loss": 0.6072, + "step": 40459 + }, + { + "epoch": 1.04, + "learning_rate": 1.5213467532251738e-06, + "loss": 0.7725, + "step": 40460 + }, + { + "epoch": 1.04, + "learning_rate": 1.5213231405841559e-06, + "loss": 0.668, + "step": 40461 + }, + { + "epoch": 1.04, + "learning_rate": 1.5212995275439843e-06, + "loss": 0.584, + "step": 40462 + }, + { + "epoch": 1.04, + "learning_rate": 1.5212759141046783e-06, + "loss": 0.6094, + "step": 40463 + }, + { + "epoch": 1.04, + "learning_rate": 1.521252300266255e-06, + "loss": 0.5981, + "step": 40464 + }, + { + "epoch": 1.04, + "learning_rate": 1.5212286860287326e-06, + "loss": 0.7305, + "step": 40465 + }, + { + "epoch": 1.04, + "learning_rate": 1.5212050713921297e-06, + "loss": 0.8506, + "step": 40466 + }, + { + "epoch": 1.04, + "learning_rate": 1.5211814563564639e-06, + "loss": 0.8486, + "step": 40467 + }, + { + "epoch": 1.04, + "learning_rate": 1.5211578409217534e-06, + "loss": 0.7109, + "step": 40468 + }, + { + "epoch": 1.04, + "learning_rate": 1.5211342250880161e-06, + "loss": 0.8027, + "step": 40469 + }, + { + "epoch": 1.04, + "learning_rate": 1.5211106088552708e-06, + "loss": 0.6729, + "step": 40470 + }, + { + "epoch": 1.04, + "learning_rate": 1.5210869922235347e-06, + "loss": 0.5884, + "step": 40471 + }, + { + "epoch": 1.04, + "learning_rate": 1.5210633751928264e-06, + "loss": 0.6777, + "step": 40472 + }, + { + "epoch": 1.04, + "learning_rate": 1.5210397577631636e-06, + "loss": 0.4399, + "step": 40473 + }, + { + "epoch": 1.04, + "learning_rate": 1.5210161399345646e-06, + "loss": 0.7061, + "step": 40474 + }, + { + "epoch": 1.04, + "learning_rate": 1.5209925217070478e-06, + "loss": 0.748, + "step": 40475 + }, + { + "epoch": 1.04, + "learning_rate": 1.520968903080631e-06, + "loss": 0.5837, + "step": 40476 + }, + { + "epoch": 1.04, + "learning_rate": 1.5209452840553319e-06, + "loss": 0.6499, + "step": 40477 + }, + { + "epoch": 1.04, + "learning_rate": 1.5209216646311693e-06, + "loss": 0.6855, + "step": 40478 + }, + { + "epoch": 1.04, + "learning_rate": 1.5208980448081607e-06, + "loss": 0.5562, + "step": 40479 + }, + { + "epoch": 1.04, + "learning_rate": 1.5208744245863248e-06, + "loss": 0.6074, + "step": 40480 + }, + { + "epoch": 1.04, + "learning_rate": 1.5208508039656788e-06, + "loss": 0.7148, + "step": 40481 + }, + { + "epoch": 1.04, + "learning_rate": 1.5208271829462417e-06, + "loss": 0.6978, + "step": 40482 + }, + { + "epoch": 1.04, + "learning_rate": 1.5208035615280308e-06, + "loss": 0.6479, + "step": 40483 + }, + { + "epoch": 1.04, + "learning_rate": 1.5207799397110648e-06, + "loss": 0.71, + "step": 40484 + }, + { + "epoch": 1.04, + "learning_rate": 1.5207563174953615e-06, + "loss": 0.6284, + "step": 40485 + }, + { + "epoch": 1.04, + "learning_rate": 1.5207326948809392e-06, + "loss": 0.5625, + "step": 40486 + }, + { + "epoch": 1.04, + "learning_rate": 1.5207090718678154e-06, + "loss": 0.6055, + "step": 40487 + }, + { + "epoch": 1.04, + "learning_rate": 1.520685448456009e-06, + "loss": 0.7305, + "step": 40488 + }, + { + "epoch": 1.04, + "learning_rate": 1.5206618246455375e-06, + "loss": 0.5854, + "step": 40489 + }, + { + "epoch": 1.04, + "learning_rate": 1.5206382004364193e-06, + "loss": 0.6509, + "step": 40490 + }, + { + "epoch": 1.04, + "learning_rate": 1.5206145758286724e-06, + "loss": 0.386, + "step": 40491 + }, + { + "epoch": 1.04, + "learning_rate": 1.5205909508223145e-06, + "loss": 0.7158, + "step": 40492 + }, + { + "epoch": 1.04, + "learning_rate": 1.5205673254173643e-06, + "loss": 0.8535, + "step": 40493 + }, + { + "epoch": 1.04, + "learning_rate": 1.5205436996138396e-06, + "loss": 0.5479, + "step": 40494 + }, + { + "epoch": 1.04, + "learning_rate": 1.5205200734117588e-06, + "loss": 0.7324, + "step": 40495 + }, + { + "epoch": 1.04, + "learning_rate": 1.5204964468111392e-06, + "loss": 0.563, + "step": 40496 + }, + { + "epoch": 1.04, + "learning_rate": 1.5204728198119997e-06, + "loss": 0.585, + "step": 40497 + }, + { + "epoch": 1.04, + "learning_rate": 1.5204491924143582e-06, + "loss": 0.6235, + "step": 40498 + }, + { + "epoch": 1.04, + "learning_rate": 1.5204255646182325e-06, + "loss": 0.6855, + "step": 40499 + }, + { + "epoch": 1.04, + "learning_rate": 1.520401936423641e-06, + "loss": 0.6653, + "step": 40500 + }, + { + "epoch": 1.04, + "learning_rate": 1.5203783078306018e-06, + "loss": 0.543, + "step": 40501 + }, + { + "epoch": 1.04, + "learning_rate": 1.5203546788391325e-06, + "loss": 0.5723, + "step": 40502 + }, + { + "epoch": 1.04, + "learning_rate": 1.5203310494492518e-06, + "loss": 0.5845, + "step": 40503 + }, + { + "epoch": 1.04, + "learning_rate": 1.5203074196609773e-06, + "loss": 0.7695, + "step": 40504 + }, + { + "epoch": 1.04, + "learning_rate": 1.5202837894743277e-06, + "loss": 0.6367, + "step": 40505 + }, + { + "epoch": 1.04, + "learning_rate": 1.5202601588893202e-06, + "loss": 0.7603, + "step": 40506 + }, + { + "epoch": 1.04, + "learning_rate": 1.5202365279059739e-06, + "loss": 0.8838, + "step": 40507 + }, + { + "epoch": 1.04, + "learning_rate": 1.5202128965243062e-06, + "loss": 0.4742, + "step": 40508 + }, + { + "epoch": 1.04, + "learning_rate": 1.5201892647443356e-06, + "loss": 0.7246, + "step": 40509 + }, + { + "epoch": 1.04, + "learning_rate": 1.5201656325660797e-06, + "loss": 0.8027, + "step": 40510 + }, + { + "epoch": 1.04, + "learning_rate": 1.520141999989557e-06, + "loss": 0.6396, + "step": 40511 + }, + { + "epoch": 1.04, + "learning_rate": 1.5201183670147855e-06, + "loss": 0.5498, + "step": 40512 + }, + { + "epoch": 1.04, + "learning_rate": 1.520094733641783e-06, + "loss": 0.7988, + "step": 40513 + }, + { + "epoch": 1.04, + "learning_rate": 1.5200710998705683e-06, + "loss": 0.708, + "step": 40514 + }, + { + "epoch": 1.04, + "learning_rate": 1.5200474657011592e-06, + "loss": 0.4792, + "step": 40515 + }, + { + "epoch": 1.04, + "learning_rate": 1.5200238311335733e-06, + "loss": 0.6484, + "step": 40516 + }, + { + "epoch": 1.04, + "learning_rate": 1.5200001961678291e-06, + "loss": 0.6699, + "step": 40517 + }, + { + "epoch": 1.04, + "learning_rate": 1.5199765608039447e-06, + "loss": 0.6582, + "step": 40518 + }, + { + "epoch": 1.04, + "learning_rate": 1.5199529250419384e-06, + "loss": 0.7158, + "step": 40519 + }, + { + "epoch": 1.04, + "learning_rate": 1.519929288881828e-06, + "loss": 0.4893, + "step": 40520 + }, + { + "epoch": 1.04, + "learning_rate": 1.5199056523236314e-06, + "loss": 0.6567, + "step": 40521 + }, + { + "epoch": 1.04, + "learning_rate": 1.519882015367367e-06, + "loss": 0.5781, + "step": 40522 + }, + { + "epoch": 1.04, + "learning_rate": 1.519858378013053e-06, + "loss": 0.7354, + "step": 40523 + }, + { + "epoch": 1.04, + "learning_rate": 1.5198347402607073e-06, + "loss": 0.5266, + "step": 40524 + }, + { + "epoch": 1.04, + "learning_rate": 1.519811102110348e-06, + "loss": 0.6797, + "step": 40525 + }, + { + "epoch": 1.04, + "learning_rate": 1.5197874635619932e-06, + "loss": 0.6914, + "step": 40526 + }, + { + "epoch": 1.04, + "learning_rate": 1.5197638246156607e-06, + "loss": 0.792, + "step": 40527 + }, + { + "epoch": 1.04, + "learning_rate": 1.5197401852713695e-06, + "loss": 0.5337, + "step": 40528 + }, + { + "epoch": 1.04, + "learning_rate": 1.5197165455291368e-06, + "loss": 0.6191, + "step": 40529 + }, + { + "epoch": 1.04, + "learning_rate": 1.5196929053889813e-06, + "loss": 0.6255, + "step": 40530 + }, + { + "epoch": 1.04, + "learning_rate": 1.5196692648509205e-06, + "loss": 0.4441, + "step": 40531 + }, + { + "epoch": 1.04, + "learning_rate": 1.5196456239149733e-06, + "loss": 0.6846, + "step": 40532 + }, + { + "epoch": 1.04, + "learning_rate": 1.519621982581157e-06, + "loss": 0.8418, + "step": 40533 + }, + { + "epoch": 1.04, + "learning_rate": 1.5195983408494901e-06, + "loss": 0.6123, + "step": 40534 + }, + { + "epoch": 1.04, + "learning_rate": 1.5195746987199909e-06, + "loss": 0.7637, + "step": 40535 + }, + { + "epoch": 1.04, + "learning_rate": 1.519551056192677e-06, + "loss": 0.6226, + "step": 40536 + }, + { + "epoch": 1.04, + "learning_rate": 1.5195274132675667e-06, + "loss": 0.8047, + "step": 40537 + }, + { + "epoch": 1.04, + "learning_rate": 1.519503769944678e-06, + "loss": 0.5977, + "step": 40538 + }, + { + "epoch": 1.04, + "learning_rate": 1.5194801262240296e-06, + "loss": 0.729, + "step": 40539 + }, + { + "epoch": 1.04, + "learning_rate": 1.519456482105639e-06, + "loss": 0.7217, + "step": 40540 + }, + { + "epoch": 1.04, + "learning_rate": 1.5194328375895244e-06, + "loss": 0.7568, + "step": 40541 + }, + { + "epoch": 1.04, + "learning_rate": 1.5194091926757037e-06, + "loss": 0.8535, + "step": 40542 + }, + { + "epoch": 1.04, + "learning_rate": 1.5193855473641954e-06, + "loss": 0.6567, + "step": 40543 + }, + { + "epoch": 1.04, + "learning_rate": 1.5193619016550175e-06, + "loss": 0.5603, + "step": 40544 + }, + { + "epoch": 1.04, + "learning_rate": 1.5193382555481887e-06, + "loss": 0.7842, + "step": 40545 + }, + { + "epoch": 1.04, + "learning_rate": 1.5193146090437257e-06, + "loss": 0.6572, + "step": 40546 + }, + { + "epoch": 1.04, + "learning_rate": 1.5192909621416477e-06, + "loss": 0.6709, + "step": 40547 + }, + { + "epoch": 1.04, + "learning_rate": 1.5192673148419722e-06, + "loss": 0.6309, + "step": 40548 + }, + { + "epoch": 1.04, + "learning_rate": 1.519243667144718e-06, + "loss": 0.6934, + "step": 40549 + }, + { + "epoch": 1.04, + "learning_rate": 1.5192200190499024e-06, + "loss": 0.6299, + "step": 40550 + }, + { + "epoch": 1.04, + "learning_rate": 1.5191963705575442e-06, + "loss": 0.6904, + "step": 40551 + }, + { + "epoch": 1.04, + "learning_rate": 1.5191727216676608e-06, + "loss": 0.5981, + "step": 40552 + }, + { + "epoch": 1.04, + "learning_rate": 1.5191490723802711e-06, + "loss": 0.5366, + "step": 40553 + }, + { + "epoch": 1.04, + "learning_rate": 1.5191254226953928e-06, + "loss": 0.8164, + "step": 40554 + }, + { + "epoch": 1.04, + "learning_rate": 1.5191017726130442e-06, + "loss": 0.6646, + "step": 40555 + }, + { + "epoch": 1.04, + "learning_rate": 1.519078122133243e-06, + "loss": 0.4154, + "step": 40556 + }, + { + "epoch": 1.04, + "learning_rate": 1.5190544712560073e-06, + "loss": 0.7529, + "step": 40557 + }, + { + "epoch": 1.04, + "learning_rate": 1.519030819981356e-06, + "loss": 0.8037, + "step": 40558 + }, + { + "epoch": 1.04, + "learning_rate": 1.5190071683093063e-06, + "loss": 0.7627, + "step": 40559 + }, + { + "epoch": 1.04, + "learning_rate": 1.5189835162398769e-06, + "loss": 0.5725, + "step": 40560 + }, + { + "epoch": 1.04, + "learning_rate": 1.5189598637730855e-06, + "loss": 0.4363, + "step": 40561 + }, + { + "epoch": 1.04, + "learning_rate": 1.5189362109089502e-06, + "loss": 0.7212, + "step": 40562 + }, + { + "epoch": 1.04, + "learning_rate": 1.5189125576474897e-06, + "loss": 0.8066, + "step": 40563 + }, + { + "epoch": 1.04, + "learning_rate": 1.5188889039887215e-06, + "loss": 0.5254, + "step": 40564 + }, + { + "epoch": 1.04, + "learning_rate": 1.5188652499326642e-06, + "loss": 0.6772, + "step": 40565 + }, + { + "epoch": 1.04, + "learning_rate": 1.5188415954793355e-06, + "loss": 0.7446, + "step": 40566 + }, + { + "epoch": 1.04, + "learning_rate": 1.5188179406287534e-06, + "loss": 0.6738, + "step": 40567 + }, + { + "epoch": 1.04, + "learning_rate": 1.5187942853809364e-06, + "loss": 0.5142, + "step": 40568 + }, + { + "epoch": 1.04, + "learning_rate": 1.5187706297359025e-06, + "loss": 0.5776, + "step": 40569 + }, + { + "epoch": 1.04, + "learning_rate": 1.51874697369367e-06, + "loss": 0.5347, + "step": 40570 + }, + { + "epoch": 1.04, + "learning_rate": 1.5187233172542564e-06, + "loss": 0.584, + "step": 40571 + }, + { + "epoch": 1.04, + "learning_rate": 1.5186996604176804e-06, + "loss": 0.7168, + "step": 40572 + }, + { + "epoch": 1.04, + "learning_rate": 1.51867600318396e-06, + "loss": 0.6387, + "step": 40573 + }, + { + "epoch": 1.04, + "learning_rate": 1.5186523455531131e-06, + "loss": 0.7197, + "step": 40574 + }, + { + "epoch": 1.04, + "learning_rate": 1.5186286875251582e-06, + "loss": 0.7529, + "step": 40575 + }, + { + "epoch": 1.04, + "learning_rate": 1.5186050291001126e-06, + "loss": 0.7148, + "step": 40576 + }, + { + "epoch": 1.04, + "learning_rate": 1.5185813702779955e-06, + "loss": 0.6631, + "step": 40577 + }, + { + "epoch": 1.04, + "learning_rate": 1.5185577110588243e-06, + "loss": 0.5537, + "step": 40578 + }, + { + "epoch": 1.04, + "learning_rate": 1.5185340514426172e-06, + "loss": 0.6113, + "step": 40579 + }, + { + "epoch": 1.04, + "learning_rate": 1.5185103914293926e-06, + "loss": 0.5679, + "step": 40580 + }, + { + "epoch": 1.04, + "learning_rate": 1.5184867310191686e-06, + "loss": 0.7261, + "step": 40581 + }, + { + "epoch": 1.04, + "learning_rate": 1.5184630702119628e-06, + "loss": 0.7031, + "step": 40582 + }, + { + "epoch": 1.04, + "learning_rate": 1.5184394090077936e-06, + "loss": 0.6582, + "step": 40583 + }, + { + "epoch": 1.04, + "learning_rate": 1.5184157474066794e-06, + "loss": 0.6929, + "step": 40584 + }, + { + "epoch": 1.04, + "learning_rate": 1.5183920854086383e-06, + "loss": 0.7725, + "step": 40585 + }, + { + "epoch": 1.04, + "learning_rate": 1.518368423013688e-06, + "loss": 0.709, + "step": 40586 + }, + { + "epoch": 1.04, + "learning_rate": 1.518344760221847e-06, + "loss": 0.7246, + "step": 40587 + }, + { + "epoch": 1.04, + "learning_rate": 1.5183210970331329e-06, + "loss": 0.8008, + "step": 40588 + }, + { + "epoch": 1.04, + "learning_rate": 1.5182974334475644e-06, + "loss": 0.5173, + "step": 40589 + }, + { + "epoch": 1.04, + "learning_rate": 1.5182737694651593e-06, + "loss": 0.6841, + "step": 40590 + }, + { + "epoch": 1.04, + "learning_rate": 1.518250105085936e-06, + "loss": 0.958, + "step": 40591 + }, + { + "epoch": 1.04, + "learning_rate": 1.5182264403099121e-06, + "loss": 0.7412, + "step": 40592 + }, + { + "epoch": 1.04, + "learning_rate": 1.5182027751371062e-06, + "loss": 0.5449, + "step": 40593 + }, + { + "epoch": 1.04, + "learning_rate": 1.5181791095675363e-06, + "loss": 0.5693, + "step": 40594 + }, + { + "epoch": 1.04, + "learning_rate": 1.5181554436012208e-06, + "loss": 0.4109, + "step": 40595 + }, + { + "epoch": 1.04, + "learning_rate": 1.5181317772381767e-06, + "loss": 0.8389, + "step": 40596 + }, + { + "epoch": 1.04, + "learning_rate": 1.5181081104784234e-06, + "loss": 0.6709, + "step": 40597 + }, + { + "epoch": 1.04, + "learning_rate": 1.5180844433219785e-06, + "loss": 0.5879, + "step": 40598 + }, + { + "epoch": 1.04, + "learning_rate": 1.5180607757688603e-06, + "loss": 0.5242, + "step": 40599 + }, + { + "epoch": 1.04, + "learning_rate": 1.5180371078190867e-06, + "loss": 0.5996, + "step": 40600 + }, + { + "epoch": 1.04, + "learning_rate": 1.5180134394726758e-06, + "loss": 0.7129, + "step": 40601 + }, + { + "epoch": 1.04, + "learning_rate": 1.517989770729646e-06, + "loss": 0.6602, + "step": 40602 + }, + { + "epoch": 1.04, + "learning_rate": 1.5179661015900149e-06, + "loss": 0.8359, + "step": 40603 + }, + { + "epoch": 1.04, + "learning_rate": 1.5179424320538015e-06, + "loss": 0.5215, + "step": 40604 + }, + { + "epoch": 1.04, + "learning_rate": 1.517918762121023e-06, + "loss": 0.8633, + "step": 40605 + }, + { + "epoch": 1.04, + "learning_rate": 1.5178950917916984e-06, + "loss": 0.6104, + "step": 40606 + }, + { + "epoch": 1.04, + "learning_rate": 1.5178714210658448e-06, + "loss": 0.7324, + "step": 40607 + }, + { + "epoch": 1.04, + "learning_rate": 1.517847749943481e-06, + "loss": 0.6309, + "step": 40608 + }, + { + "epoch": 1.04, + "learning_rate": 1.517824078424625e-06, + "loss": 0.5833, + "step": 40609 + }, + { + "epoch": 1.04, + "learning_rate": 1.5178004065092952e-06, + "loss": 0.6011, + "step": 40610 + }, + { + "epoch": 1.04, + "learning_rate": 1.517776734197509e-06, + "loss": 0.7578, + "step": 40611 + }, + { + "epoch": 1.04, + "learning_rate": 1.517753061489285e-06, + "loss": 0.5625, + "step": 40612 + }, + { + "epoch": 1.04, + "learning_rate": 1.5177293883846414e-06, + "loss": 0.6104, + "step": 40613 + }, + { + "epoch": 1.04, + "learning_rate": 1.5177057148835965e-06, + "loss": 0.5913, + "step": 40614 + }, + { + "epoch": 1.04, + "learning_rate": 1.517682040986168e-06, + "loss": 0.6514, + "step": 40615 + }, + { + "epoch": 1.04, + "learning_rate": 1.517658366692374e-06, + "loss": 0.4094, + "step": 40616 + }, + { + "epoch": 1.04, + "learning_rate": 1.5176346920022327e-06, + "loss": 0.5706, + "step": 40617 + }, + { + "epoch": 1.04, + "learning_rate": 1.5176110169157625e-06, + "loss": 0.4463, + "step": 40618 + }, + { + "epoch": 1.04, + "learning_rate": 1.5175873414329817e-06, + "loss": 0.873, + "step": 40619 + }, + { + "epoch": 1.04, + "learning_rate": 1.5175636655539076e-06, + "loss": 0.5612, + "step": 40620 + }, + { + "epoch": 1.04, + "learning_rate": 1.5175399892785588e-06, + "loss": 0.5791, + "step": 40621 + }, + { + "epoch": 1.04, + "learning_rate": 1.5175163126069533e-06, + "loss": 0.6953, + "step": 40622 + }, + { + "epoch": 1.04, + "learning_rate": 1.5174926355391095e-06, + "loss": 0.5542, + "step": 40623 + }, + { + "epoch": 1.04, + "learning_rate": 1.5174689580750456e-06, + "loss": 0.666, + "step": 40624 + }, + { + "epoch": 1.04, + "learning_rate": 1.5174452802147794e-06, + "loss": 0.7822, + "step": 40625 + }, + { + "epoch": 1.04, + "learning_rate": 1.517421601958329e-06, + "loss": 0.7017, + "step": 40626 + }, + { + "epoch": 1.04, + "learning_rate": 1.5173979233057129e-06, + "loss": 0.4827, + "step": 40627 + }, + { + "epoch": 1.04, + "learning_rate": 1.5173742442569485e-06, + "loss": 0.6201, + "step": 40628 + }, + { + "epoch": 1.04, + "learning_rate": 1.5173505648120553e-06, + "loss": 0.7764, + "step": 40629 + }, + { + "epoch": 1.04, + "learning_rate": 1.51732688497105e-06, + "loss": 0.7295, + "step": 40630 + }, + { + "epoch": 1.04, + "learning_rate": 1.5173032047339513e-06, + "loss": 0.4941, + "step": 40631 + }, + { + "epoch": 1.04, + "learning_rate": 1.5172795241007771e-06, + "loss": 0.6138, + "step": 40632 + }, + { + "epoch": 1.04, + "learning_rate": 1.5172558430715462e-06, + "loss": 0.6318, + "step": 40633 + }, + { + "epoch": 1.04, + "learning_rate": 1.5172321616462761e-06, + "loss": 0.707, + "step": 40634 + }, + { + "epoch": 1.04, + "learning_rate": 1.5172084798249853e-06, + "loss": 0.6091, + "step": 40635 + }, + { + "epoch": 1.04, + "learning_rate": 1.5171847976076918e-06, + "loss": 0.6162, + "step": 40636 + }, + { + "epoch": 1.04, + "learning_rate": 1.5171611149944133e-06, + "loss": 0.4878, + "step": 40637 + }, + { + "epoch": 1.04, + "learning_rate": 1.5171374319851683e-06, + "loss": 0.6738, + "step": 40638 + }, + { + "epoch": 1.04, + "learning_rate": 1.5171137485799753e-06, + "loss": 0.6689, + "step": 40639 + }, + { + "epoch": 1.04, + "learning_rate": 1.517090064778852e-06, + "loss": 0.6592, + "step": 40640 + }, + { + "epoch": 1.04, + "learning_rate": 1.5170663805818164e-06, + "loss": 0.6792, + "step": 40641 + }, + { + "epoch": 1.04, + "learning_rate": 1.5170426959888868e-06, + "loss": 0.5596, + "step": 40642 + }, + { + "epoch": 1.04, + "learning_rate": 1.5170190110000818e-06, + "loss": 0.6206, + "step": 40643 + }, + { + "epoch": 1.04, + "learning_rate": 1.516995325615419e-06, + "loss": 0.6875, + "step": 40644 + }, + { + "epoch": 1.04, + "learning_rate": 1.5169716398349163e-06, + "loss": 0.5596, + "step": 40645 + }, + { + "epoch": 1.04, + "learning_rate": 1.5169479536585925e-06, + "loss": 0.635, + "step": 40646 + }, + { + "epoch": 1.04, + "learning_rate": 1.5169242670864652e-06, + "loss": 0.7812, + "step": 40647 + }, + { + "epoch": 1.04, + "learning_rate": 1.5169005801185529e-06, + "loss": 0.6138, + "step": 40648 + }, + { + "epoch": 1.04, + "learning_rate": 1.5168768927548737e-06, + "loss": 0.6475, + "step": 40649 + }, + { + "epoch": 1.04, + "learning_rate": 1.5168532049954455e-06, + "loss": 0.8105, + "step": 40650 + }, + { + "epoch": 1.04, + "learning_rate": 1.5168295168402865e-06, + "loss": 0.7295, + "step": 40651 + }, + { + "epoch": 1.04, + "learning_rate": 1.5168058282894148e-06, + "loss": 0.6816, + "step": 40652 + }, + { + "epoch": 1.04, + "learning_rate": 1.5167821393428488e-06, + "loss": 0.5415, + "step": 40653 + }, + { + "epoch": 1.04, + "learning_rate": 1.5167584500006068e-06, + "loss": 0.7202, + "step": 40654 + }, + { + "epoch": 1.04, + "learning_rate": 1.5167347602627061e-06, + "loss": 0.7695, + "step": 40655 + }, + { + "epoch": 1.04, + "learning_rate": 1.516711070129166e-06, + "loss": 0.5864, + "step": 40656 + }, + { + "epoch": 1.04, + "learning_rate": 1.516687379600003e-06, + "loss": 0.7266, + "step": 40657 + }, + { + "epoch": 1.04, + "learning_rate": 1.516663688675237e-06, + "loss": 0.6562, + "step": 40658 + }, + { + "epoch": 1.04, + "learning_rate": 1.5166399973548854e-06, + "loss": 0.5327, + "step": 40659 + }, + { + "epoch": 1.04, + "learning_rate": 1.516616305638966e-06, + "loss": 0.6802, + "step": 40660 + }, + { + "epoch": 1.04, + "learning_rate": 1.5165926135274974e-06, + "loss": 0.5801, + "step": 40661 + }, + { + "epoch": 1.04, + "learning_rate": 1.5165689210204976e-06, + "loss": 0.6855, + "step": 40662 + }, + { + "epoch": 1.04, + "learning_rate": 1.5165452281179842e-06, + "loss": 0.6265, + "step": 40663 + }, + { + "epoch": 1.04, + "learning_rate": 1.5165215348199764e-06, + "loss": 0.6411, + "step": 40664 + }, + { + "epoch": 1.04, + "learning_rate": 1.5164978411264918e-06, + "loss": 0.6924, + "step": 40665 + }, + { + "epoch": 1.04, + "learning_rate": 1.5164741470375485e-06, + "loss": 0.6748, + "step": 40666 + }, + { + "epoch": 1.04, + "learning_rate": 1.5164504525531645e-06, + "loss": 0.603, + "step": 40667 + }, + { + "epoch": 1.04, + "learning_rate": 1.5164267576733586e-06, + "loss": 0.5645, + "step": 40668 + }, + { + "epoch": 1.04, + "learning_rate": 1.5164030623981484e-06, + "loss": 0.6924, + "step": 40669 + }, + { + "epoch": 1.04, + "learning_rate": 1.5163793667275514e-06, + "loss": 0.6157, + "step": 40670 + }, + { + "epoch": 1.04, + "learning_rate": 1.5163556706615873e-06, + "loss": 0.6704, + "step": 40671 + }, + { + "epoch": 1.04, + "learning_rate": 1.5163319742002728e-06, + "loss": 0.468, + "step": 40672 + }, + { + "epoch": 1.04, + "learning_rate": 1.5163082773436271e-06, + "loss": 0.6323, + "step": 40673 + }, + { + "epoch": 1.04, + "learning_rate": 1.5162845800916678e-06, + "loss": 0.3464, + "step": 40674 + }, + { + "epoch": 1.04, + "learning_rate": 1.516260882444413e-06, + "loss": 0.7324, + "step": 40675 + }, + { + "epoch": 1.04, + "learning_rate": 1.516237184401881e-06, + "loss": 0.6392, + "step": 40676 + }, + { + "epoch": 1.04, + "learning_rate": 1.5162134859640898e-06, + "loss": 0.5283, + "step": 40677 + }, + { + "epoch": 1.04, + "learning_rate": 1.516189787131058e-06, + "loss": 0.7129, + "step": 40678 + }, + { + "epoch": 1.04, + "learning_rate": 1.5161660879028034e-06, + "loss": 0.7451, + "step": 40679 + }, + { + "epoch": 1.04, + "learning_rate": 1.5161423882793436e-06, + "loss": 0.7393, + "step": 40680 + }, + { + "epoch": 1.04, + "learning_rate": 1.5161186882606977e-06, + "loss": 0.7754, + "step": 40681 + }, + { + "epoch": 1.04, + "learning_rate": 1.5160949878468836e-06, + "loss": 0.5835, + "step": 40682 + }, + { + "epoch": 1.04, + "learning_rate": 1.5160712870379192e-06, + "loss": 0.7178, + "step": 40683 + }, + { + "epoch": 1.04, + "learning_rate": 1.5160475858338227e-06, + "loss": 0.501, + "step": 40684 + }, + { + "epoch": 1.04, + "learning_rate": 1.5160238842346122e-06, + "loss": 0.7383, + "step": 40685 + }, + { + "epoch": 1.04, + "learning_rate": 1.5160001822403062e-06, + "loss": 0.6548, + "step": 40686 + }, + { + "epoch": 1.04, + "learning_rate": 1.5159764798509222e-06, + "loss": 0.7207, + "step": 40687 + }, + { + "epoch": 1.04, + "learning_rate": 1.515952777066479e-06, + "loss": 0.7793, + "step": 40688 + }, + { + "epoch": 1.04, + "learning_rate": 1.5159290738869946e-06, + "loss": 0.6846, + "step": 40689 + }, + { + "epoch": 1.04, + "learning_rate": 1.515905370312487e-06, + "loss": 0.834, + "step": 40690 + }, + { + "epoch": 1.04, + "learning_rate": 1.515881666342974e-06, + "loss": 0.6602, + "step": 40691 + }, + { + "epoch": 1.04, + "learning_rate": 1.5158579619784743e-06, + "loss": 0.6035, + "step": 40692 + }, + { + "epoch": 1.04, + "learning_rate": 1.515834257219006e-06, + "loss": 0.6626, + "step": 40693 + }, + { + "epoch": 1.04, + "learning_rate": 1.5158105520645874e-06, + "loss": 0.5815, + "step": 40694 + }, + { + "epoch": 1.04, + "learning_rate": 1.5157868465152358e-06, + "loss": 0.7373, + "step": 40695 + }, + { + "epoch": 1.04, + "learning_rate": 1.5157631405709702e-06, + "loss": 0.7004, + "step": 40696 + }, + { + "epoch": 1.04, + "learning_rate": 1.5157394342318084e-06, + "loss": 0.4197, + "step": 40697 + }, + { + "epoch": 1.04, + "learning_rate": 1.5157157274977688e-06, + "loss": 0.6709, + "step": 40698 + }, + { + "epoch": 1.04, + "learning_rate": 1.5156920203688693e-06, + "loss": 0.5474, + "step": 40699 + }, + { + "epoch": 1.04, + "learning_rate": 1.5156683128451282e-06, + "loss": 0.7676, + "step": 40700 + }, + { + "epoch": 1.04, + "learning_rate": 1.5156446049265634e-06, + "loss": 0.4626, + "step": 40701 + }, + { + "epoch": 1.04, + "learning_rate": 1.5156208966131933e-06, + "loss": 0.8271, + "step": 40702 + }, + { + "epoch": 1.04, + "learning_rate": 1.515597187905036e-06, + "loss": 0.6494, + "step": 40703 + }, + { + "epoch": 1.04, + "learning_rate": 1.5155734788021098e-06, + "loss": 0.5923, + "step": 40704 + }, + { + "epoch": 1.04, + "learning_rate": 1.5155497693044325e-06, + "loss": 0.4388, + "step": 40705 + }, + { + "epoch": 1.04, + "learning_rate": 1.5155260594120226e-06, + "loss": 0.6855, + "step": 40706 + }, + { + "epoch": 1.04, + "learning_rate": 1.5155023491248978e-06, + "loss": 0.6699, + "step": 40707 + }, + { + "epoch": 1.04, + "learning_rate": 1.515478638443077e-06, + "loss": 0.8887, + "step": 40708 + }, + { + "epoch": 1.04, + "learning_rate": 1.5154549273665774e-06, + "loss": 0.7793, + "step": 40709 + }, + { + "epoch": 1.04, + "learning_rate": 1.515431215895418e-06, + "loss": 0.6221, + "step": 40710 + }, + { + "epoch": 1.04, + "learning_rate": 1.5154075040296165e-06, + "loss": 0.6196, + "step": 40711 + }, + { + "epoch": 1.04, + "learning_rate": 1.5153837917691911e-06, + "loss": 0.6865, + "step": 40712 + }, + { + "epoch": 1.04, + "learning_rate": 1.5153600791141604e-06, + "loss": 0.77, + "step": 40713 + }, + { + "epoch": 1.04, + "learning_rate": 1.5153363660645417e-06, + "loss": 0.6646, + "step": 40714 + }, + { + "epoch": 1.04, + "learning_rate": 1.5153126526203539e-06, + "loss": 0.6078, + "step": 40715 + }, + { + "epoch": 1.04, + "learning_rate": 1.515288938781615e-06, + "loss": 0.6172, + "step": 40716 + }, + { + "epoch": 1.04, + "learning_rate": 1.5152652245483428e-06, + "loss": 0.6327, + "step": 40717 + }, + { + "epoch": 1.04, + "learning_rate": 1.5152415099205559e-06, + "loss": 0.6963, + "step": 40718 + }, + { + "epoch": 1.04, + "learning_rate": 1.5152177948982724e-06, + "loss": 0.5182, + "step": 40719 + }, + { + "epoch": 1.04, + "learning_rate": 1.51519407948151e-06, + "loss": 0.5972, + "step": 40720 + }, + { + "epoch": 1.04, + "learning_rate": 1.5151703636702873e-06, + "loss": 0.7148, + "step": 40721 + }, + { + "epoch": 1.04, + "learning_rate": 1.5151466474646224e-06, + "loss": 0.7803, + "step": 40722 + }, + { + "epoch": 1.04, + "learning_rate": 1.5151229308645331e-06, + "loss": 0.4995, + "step": 40723 + }, + { + "epoch": 1.04, + "learning_rate": 1.5150992138700383e-06, + "loss": 0.5889, + "step": 40724 + }, + { + "epoch": 1.04, + "learning_rate": 1.5150754964811555e-06, + "loss": 0.6587, + "step": 40725 + }, + { + "epoch": 1.04, + "learning_rate": 1.5150517786979032e-06, + "loss": 0.5825, + "step": 40726 + }, + { + "epoch": 1.04, + "learning_rate": 1.5150280605202993e-06, + "loss": 0.6348, + "step": 40727 + }, + { + "epoch": 1.04, + "learning_rate": 1.515004341948362e-06, + "loss": 0.7324, + "step": 40728 + }, + { + "epoch": 1.04, + "learning_rate": 1.5149806229821098e-06, + "loss": 0.6611, + "step": 40729 + }, + { + "epoch": 1.04, + "learning_rate": 1.5149569036215603e-06, + "loss": 0.7686, + "step": 40730 + }, + { + "epoch": 1.04, + "learning_rate": 1.5149331838667325e-06, + "loss": 0.7441, + "step": 40731 + }, + { + "epoch": 1.04, + "learning_rate": 1.5149094637176436e-06, + "loss": 0.6758, + "step": 40732 + }, + { + "epoch": 1.04, + "learning_rate": 1.5148857431743123e-06, + "loss": 0.6953, + "step": 40733 + }, + { + "epoch": 1.04, + "learning_rate": 1.5148620222367567e-06, + "loss": 0.3719, + "step": 40734 + }, + { + "epoch": 1.04, + "learning_rate": 1.5148383009049947e-06, + "loss": 0.7607, + "step": 40735 + }, + { + "epoch": 1.04, + "learning_rate": 1.514814579179045e-06, + "loss": 0.7256, + "step": 40736 + }, + { + "epoch": 1.04, + "learning_rate": 1.5147908570589252e-06, + "loss": 0.6411, + "step": 40737 + }, + { + "epoch": 1.04, + "learning_rate": 1.514767134544654e-06, + "loss": 0.5889, + "step": 40738 + }, + { + "epoch": 1.04, + "learning_rate": 1.5147434116362491e-06, + "loss": 0.6079, + "step": 40739 + }, + { + "epoch": 1.04, + "learning_rate": 1.514719688333729e-06, + "loss": 0.5657, + "step": 40740 + }, + { + "epoch": 1.04, + "learning_rate": 1.5146959646371116e-06, + "loss": 0.5122, + "step": 40741 + }, + { + "epoch": 1.04, + "learning_rate": 1.5146722405464152e-06, + "loss": 0.5728, + "step": 40742 + }, + { + "epoch": 1.04, + "learning_rate": 1.5146485160616575e-06, + "loss": 0.6924, + "step": 40743 + }, + { + "epoch": 1.04, + "learning_rate": 1.5146247911828578e-06, + "loss": 0.709, + "step": 40744 + }, + { + "epoch": 1.04, + "learning_rate": 1.514601065910033e-06, + "loss": 0.707, + "step": 40745 + }, + { + "epoch": 1.04, + "learning_rate": 1.514577340243202e-06, + "loss": 0.6709, + "step": 40746 + }, + { + "epoch": 1.04, + "learning_rate": 1.5145536141823829e-06, + "loss": 0.6875, + "step": 40747 + }, + { + "epoch": 1.04, + "learning_rate": 1.5145298877275936e-06, + "loss": 0.5759, + "step": 40748 + }, + { + "epoch": 1.04, + "learning_rate": 1.5145061608788528e-06, + "loss": 0.6621, + "step": 40749 + }, + { + "epoch": 1.04, + "learning_rate": 1.514482433636178e-06, + "loss": 0.4368, + "step": 40750 + }, + { + "epoch": 1.04, + "learning_rate": 1.5144587059995875e-06, + "loss": 0.8232, + "step": 40751 + }, + { + "epoch": 1.04, + "learning_rate": 1.5144349779691e-06, + "loss": 0.6914, + "step": 40752 + }, + { + "epoch": 1.04, + "learning_rate": 1.5144112495447327e-06, + "loss": 0.4951, + "step": 40753 + }, + { + "epoch": 1.04, + "learning_rate": 1.514387520726505e-06, + "loss": 0.6914, + "step": 40754 + }, + { + "epoch": 1.04, + "learning_rate": 1.5143637915144343e-06, + "loss": 0.5701, + "step": 40755 + }, + { + "epoch": 1.04, + "learning_rate": 1.5143400619085386e-06, + "loss": 0.541, + "step": 40756 + }, + { + "epoch": 1.04, + "learning_rate": 1.5143163319088364e-06, + "loss": 0.7432, + "step": 40757 + }, + { + "epoch": 1.04, + "learning_rate": 1.514292601515346e-06, + "loss": 0.7446, + "step": 40758 + }, + { + "epoch": 1.04, + "learning_rate": 1.5142688707280856e-06, + "loss": 0.7686, + "step": 40759 + }, + { + "epoch": 1.04, + "learning_rate": 1.5142451395470727e-06, + "loss": 0.6787, + "step": 40760 + }, + { + "epoch": 1.04, + "learning_rate": 1.5142214079723262e-06, + "loss": 0.6958, + "step": 40761 + }, + { + "epoch": 1.04, + "learning_rate": 1.514197676003864e-06, + "loss": 0.5496, + "step": 40762 + }, + { + "epoch": 1.04, + "learning_rate": 1.5141739436417042e-06, + "loss": 0.5255, + "step": 40763 + }, + { + "epoch": 1.04, + "learning_rate": 1.5141502108858652e-06, + "loss": 0.623, + "step": 40764 + }, + { + "epoch": 1.04, + "learning_rate": 1.5141264777363652e-06, + "loss": 0.6895, + "step": 40765 + }, + { + "epoch": 1.04, + "learning_rate": 1.5141027441932214e-06, + "loss": 0.7529, + "step": 40766 + }, + { + "epoch": 1.04, + "learning_rate": 1.5140790102564535e-06, + "loss": 0.7666, + "step": 40767 + }, + { + "epoch": 1.04, + "learning_rate": 1.5140552759260788e-06, + "loss": 0.6069, + "step": 40768 + }, + { + "epoch": 1.04, + "learning_rate": 1.5140315412021156e-06, + "loss": 0.6924, + "step": 40769 + }, + { + "epoch": 1.04, + "learning_rate": 1.514007806084582e-06, + "loss": 0.7178, + "step": 40770 + }, + { + "epoch": 1.04, + "learning_rate": 1.5139840705734966e-06, + "loss": 0.6953, + "step": 40771 + }, + { + "epoch": 1.05, + "learning_rate": 1.5139603346688764e-06, + "loss": 0.4707, + "step": 40772 + }, + { + "epoch": 1.05, + "learning_rate": 1.5139365983707412e-06, + "loss": 0.7373, + "step": 40773 + }, + { + "epoch": 1.05, + "learning_rate": 1.5139128616791084e-06, + "loss": 0.7305, + "step": 40774 + }, + { + "epoch": 1.05, + "learning_rate": 1.5138891245939958e-06, + "loss": 0.5679, + "step": 40775 + }, + { + "epoch": 1.05, + "learning_rate": 1.513865387115422e-06, + "loss": 0.7998, + "step": 40776 + }, + { + "epoch": 1.05, + "learning_rate": 1.5138416492434049e-06, + "loss": 0.5615, + "step": 40777 + }, + { + "epoch": 1.05, + "learning_rate": 1.5138179109779633e-06, + "loss": 0.6079, + "step": 40778 + }, + { + "epoch": 1.05, + "learning_rate": 1.5137941723191146e-06, + "loss": 0.6279, + "step": 40779 + }, + { + "epoch": 1.05, + "learning_rate": 1.5137704332668774e-06, + "loss": 0.4638, + "step": 40780 + }, + { + "epoch": 1.05, + "learning_rate": 1.5137466938212699e-06, + "loss": 0.4717, + "step": 40781 + }, + { + "epoch": 1.05, + "learning_rate": 1.51372295398231e-06, + "loss": 0.5195, + "step": 40782 + }, + { + "epoch": 1.05, + "learning_rate": 1.5136992137500161e-06, + "loss": 0.6592, + "step": 40783 + }, + { + "epoch": 1.05, + "learning_rate": 1.5136754731244068e-06, + "loss": 0.6914, + "step": 40784 + }, + { + "epoch": 1.05, + "learning_rate": 1.513651732105499e-06, + "loss": 0.7231, + "step": 40785 + }, + { + "epoch": 1.05, + "learning_rate": 1.5136279906933125e-06, + "loss": 0.5596, + "step": 40786 + }, + { + "epoch": 1.05, + "learning_rate": 1.513604248887864e-06, + "loss": 0.8047, + "step": 40787 + }, + { + "epoch": 1.05, + "learning_rate": 1.513580506689173e-06, + "loss": 0.647, + "step": 40788 + }, + { + "epoch": 1.05, + "learning_rate": 1.5135567640972564e-06, + "loss": 0.7881, + "step": 40789 + }, + { + "epoch": 1.05, + "learning_rate": 1.5135330211121336e-06, + "loss": 0.5747, + "step": 40790 + }, + { + "epoch": 1.05, + "learning_rate": 1.5135092777338216e-06, + "loss": 0.5747, + "step": 40791 + }, + { + "epoch": 1.05, + "learning_rate": 1.5134855339623393e-06, + "loss": 0.5957, + "step": 40792 + }, + { + "epoch": 1.05, + "learning_rate": 1.513461789797705e-06, + "loss": 0.7725, + "step": 40793 + }, + { + "epoch": 1.05, + "learning_rate": 1.5134380452399365e-06, + "loss": 0.6299, + "step": 40794 + }, + { + "epoch": 1.05, + "learning_rate": 1.5134143002890519e-06, + "loss": 0.6719, + "step": 40795 + }, + { + "epoch": 1.05, + "learning_rate": 1.5133905549450698e-06, + "loss": 0.5684, + "step": 40796 + }, + { + "epoch": 1.05, + "learning_rate": 1.5133668092080082e-06, + "loss": 0.5737, + "step": 40797 + }, + { + "epoch": 1.05, + "learning_rate": 1.513343063077885e-06, + "loss": 0.6768, + "step": 40798 + }, + { + "epoch": 1.05, + "learning_rate": 1.5133193165547187e-06, + "loss": 0.6709, + "step": 40799 + }, + { + "epoch": 1.05, + "learning_rate": 1.5132955696385272e-06, + "loss": 0.4805, + "step": 40800 + }, + { + "epoch": 1.05, + "learning_rate": 1.5132718223293292e-06, + "loss": 0.792, + "step": 40801 + }, + { + "epoch": 1.05, + "learning_rate": 1.5132480746271426e-06, + "loss": 0.8477, + "step": 40802 + }, + { + "epoch": 1.05, + "learning_rate": 1.5132243265319855e-06, + "loss": 0.6421, + "step": 40803 + }, + { + "epoch": 1.05, + "learning_rate": 1.513200578043876e-06, + "loss": 0.6592, + "step": 40804 + }, + { + "epoch": 1.05, + "learning_rate": 1.5131768291628326e-06, + "loss": 0.7969, + "step": 40805 + }, + { + "epoch": 1.05, + "learning_rate": 1.513153079888873e-06, + "loss": 0.3901, + "step": 40806 + }, + { + "epoch": 1.05, + "learning_rate": 1.513129330222016e-06, + "loss": 0.7324, + "step": 40807 + }, + { + "epoch": 1.05, + "learning_rate": 1.5131055801622791e-06, + "loss": 0.7148, + "step": 40808 + }, + { + "epoch": 1.05, + "learning_rate": 1.5130818297096815e-06, + "loss": 0.5369, + "step": 40809 + }, + { + "epoch": 1.05, + "learning_rate": 1.51305807886424e-06, + "loss": 0.561, + "step": 40810 + }, + { + "epoch": 1.05, + "learning_rate": 1.5130343276259741e-06, + "loss": 0.6865, + "step": 40811 + }, + { + "epoch": 1.05, + "learning_rate": 1.513010575994901e-06, + "loss": 0.5791, + "step": 40812 + }, + { + "epoch": 1.05, + "learning_rate": 1.5129868239710395e-06, + "loss": 0.7871, + "step": 40813 + }, + { + "epoch": 1.05, + "learning_rate": 1.5129630715544076e-06, + "loss": 0.4775, + "step": 40814 + }, + { + "epoch": 1.05, + "learning_rate": 1.5129393187450233e-06, + "loss": 0.6206, + "step": 40815 + }, + { + "epoch": 1.05, + "learning_rate": 1.512915565542905e-06, + "loss": 0.5046, + "step": 40816 + }, + { + "epoch": 1.05, + "learning_rate": 1.5128918119480706e-06, + "loss": 0.7822, + "step": 40817 + }, + { + "epoch": 1.05, + "learning_rate": 1.5128680579605388e-06, + "loss": 0.7441, + "step": 40818 + }, + { + "epoch": 1.05, + "learning_rate": 1.5128443035803277e-06, + "loss": 0.5386, + "step": 40819 + }, + { + "epoch": 1.05, + "learning_rate": 1.512820548807455e-06, + "loss": 0.6382, + "step": 40820 + }, + { + "epoch": 1.05, + "learning_rate": 1.5127967936419394e-06, + "loss": 0.6226, + "step": 40821 + }, + { + "epoch": 1.05, + "learning_rate": 1.5127730380837986e-06, + "loss": 0.6172, + "step": 40822 + }, + { + "epoch": 1.05, + "learning_rate": 1.5127492821330515e-06, + "loss": 0.7178, + "step": 40823 + }, + { + "epoch": 1.05, + "learning_rate": 1.5127255257897154e-06, + "loss": 0.7383, + "step": 40824 + }, + { + "epoch": 1.05, + "learning_rate": 1.512701769053809e-06, + "loss": 0.6294, + "step": 40825 + }, + { + "epoch": 1.05, + "learning_rate": 1.5126780119253506e-06, + "loss": 0.6162, + "step": 40826 + }, + { + "epoch": 1.05, + "learning_rate": 1.5126542544043579e-06, + "loss": 0.6016, + "step": 40827 + }, + { + "epoch": 1.05, + "learning_rate": 1.5126304964908499e-06, + "loss": 0.6851, + "step": 40828 + }, + { + "epoch": 1.05, + "learning_rate": 1.5126067381848442e-06, + "loss": 0.7578, + "step": 40829 + }, + { + "epoch": 1.05, + "learning_rate": 1.512582979486359e-06, + "loss": 0.6421, + "step": 40830 + }, + { + "epoch": 1.05, + "learning_rate": 1.5125592203954124e-06, + "loss": 0.6396, + "step": 40831 + }, + { + "epoch": 1.05, + "learning_rate": 1.5125354609120228e-06, + "loss": 0.7324, + "step": 40832 + }, + { + "epoch": 1.05, + "learning_rate": 1.5125117010362084e-06, + "loss": 0.7939, + "step": 40833 + }, + { + "epoch": 1.05, + "learning_rate": 1.5124879407679876e-06, + "loss": 0.5444, + "step": 40834 + }, + { + "epoch": 1.05, + "learning_rate": 1.5124641801073784e-06, + "loss": 0.6562, + "step": 40835 + }, + { + "epoch": 1.05, + "learning_rate": 1.5124404190543985e-06, + "loss": 0.7451, + "step": 40836 + }, + { + "epoch": 1.05, + "learning_rate": 1.5124166576090668e-06, + "loss": 0.7666, + "step": 40837 + }, + { + "epoch": 1.05, + "learning_rate": 1.5123928957714012e-06, + "loss": 0.5361, + "step": 40838 + }, + { + "epoch": 1.05, + "learning_rate": 1.51236913354142e-06, + "loss": 0.5386, + "step": 40839 + }, + { + "epoch": 1.05, + "learning_rate": 1.5123453709191412e-06, + "loss": 0.7012, + "step": 40840 + }, + { + "epoch": 1.05, + "learning_rate": 1.5123216079045832e-06, + "loss": 0.6143, + "step": 40841 + }, + { + "epoch": 1.05, + "learning_rate": 1.512297844497764e-06, + "loss": 0.6479, + "step": 40842 + }, + { + "epoch": 1.05, + "learning_rate": 1.5122740806987015e-06, + "loss": 0.6621, + "step": 40843 + }, + { + "epoch": 1.05, + "learning_rate": 1.5122503165074148e-06, + "loss": 0.5811, + "step": 40844 + }, + { + "epoch": 1.05, + "learning_rate": 1.5122265519239217e-06, + "loss": 0.752, + "step": 40845 + }, + { + "epoch": 1.05, + "learning_rate": 1.5122027869482399e-06, + "loss": 0.6162, + "step": 40846 + }, + { + "epoch": 1.05, + "learning_rate": 1.5121790215803882e-06, + "loss": 0.6821, + "step": 40847 + }, + { + "epoch": 1.05, + "learning_rate": 1.5121552558203848e-06, + "loss": 0.6709, + "step": 40848 + }, + { + "epoch": 1.05, + "learning_rate": 1.5121314896682472e-06, + "loss": 0.7061, + "step": 40849 + }, + { + "epoch": 1.05, + "learning_rate": 1.5121077231239942e-06, + "loss": 0.6328, + "step": 40850 + }, + { + "epoch": 1.05, + "learning_rate": 1.5120839561876442e-06, + "loss": 0.6553, + "step": 40851 + }, + { + "epoch": 1.05, + "learning_rate": 1.5120601888592144e-06, + "loss": 0.6445, + "step": 40852 + }, + { + "epoch": 1.05, + "learning_rate": 1.5120364211387243e-06, + "loss": 0.5884, + "step": 40853 + }, + { + "epoch": 1.05, + "learning_rate": 1.5120126530261913e-06, + "loss": 0.6309, + "step": 40854 + }, + { + "epoch": 1.05, + "learning_rate": 1.5119888845216338e-06, + "loss": 0.4473, + "step": 40855 + }, + { + "epoch": 1.05, + "learning_rate": 1.5119651156250695e-06, + "loss": 0.7188, + "step": 40856 + }, + { + "epoch": 1.05, + "learning_rate": 1.5119413463365174e-06, + "loss": 0.4597, + "step": 40857 + }, + { + "epoch": 1.05, + "learning_rate": 1.5119175766559954e-06, + "loss": 0.6655, + "step": 40858 + }, + { + "epoch": 1.05, + "learning_rate": 1.5118938065835217e-06, + "loss": 0.5879, + "step": 40859 + }, + { + "epoch": 1.05, + "learning_rate": 1.511870036119114e-06, + "loss": 0.584, + "step": 40860 + }, + { + "epoch": 1.05, + "learning_rate": 1.5118462652627914e-06, + "loss": 0.7256, + "step": 40861 + }, + { + "epoch": 1.05, + "learning_rate": 1.5118224940145714e-06, + "loss": 0.5811, + "step": 40862 + }, + { + "epoch": 1.05, + "learning_rate": 1.5117987223744727e-06, + "loss": 0.6885, + "step": 40863 + }, + { + "epoch": 1.05, + "learning_rate": 1.5117749503425133e-06, + "loss": 0.4565, + "step": 40864 + }, + { + "epoch": 1.05, + "learning_rate": 1.511751177918711e-06, + "loss": 0.5044, + "step": 40865 + }, + { + "epoch": 1.05, + "learning_rate": 1.5117274051030844e-06, + "loss": 0.6406, + "step": 40866 + }, + { + "epoch": 1.05, + "learning_rate": 1.511703631895652e-06, + "loss": 0.8564, + "step": 40867 + }, + { + "epoch": 1.05, + "learning_rate": 1.511679858296431e-06, + "loss": 0.7773, + "step": 40868 + }, + { + "epoch": 1.05, + "learning_rate": 1.5116560843054411e-06, + "loss": 0.5156, + "step": 40869 + }, + { + "epoch": 1.05, + "learning_rate": 1.5116323099226993e-06, + "loss": 0.7432, + "step": 40870 + }, + { + "epoch": 1.05, + "learning_rate": 1.511608535148224e-06, + "loss": 0.7021, + "step": 40871 + }, + { + "epoch": 1.05, + "learning_rate": 1.5115847599820336e-06, + "loss": 0.5596, + "step": 40872 + }, + { + "epoch": 1.05, + "learning_rate": 1.5115609844241464e-06, + "loss": 0.6697, + "step": 40873 + }, + { + "epoch": 1.05, + "learning_rate": 1.5115372084745808e-06, + "loss": 0.7168, + "step": 40874 + }, + { + "epoch": 1.05, + "learning_rate": 1.511513432133354e-06, + "loss": 0.6973, + "step": 40875 + }, + { + "epoch": 1.05, + "learning_rate": 1.5114896554004856e-06, + "loss": 0.8262, + "step": 40876 + }, + { + "epoch": 1.05, + "learning_rate": 1.5114658782759923e-06, + "loss": 0.6636, + "step": 40877 + }, + { + "epoch": 1.05, + "learning_rate": 1.5114421007598937e-06, + "loss": 0.7002, + "step": 40878 + }, + { + "epoch": 1.05, + "learning_rate": 1.511418322852207e-06, + "loss": 0.7998, + "step": 40879 + }, + { + "epoch": 1.05, + "learning_rate": 1.5113945445529513e-06, + "loss": 0.5688, + "step": 40880 + }, + { + "epoch": 1.05, + "learning_rate": 1.5113707658621438e-06, + "loss": 0.5159, + "step": 40881 + }, + { + "epoch": 1.05, + "learning_rate": 1.5113469867798037e-06, + "loss": 0.6943, + "step": 40882 + }, + { + "epoch": 1.05, + "learning_rate": 1.5113232073059481e-06, + "loss": 0.7061, + "step": 40883 + }, + { + "epoch": 1.05, + "learning_rate": 1.5112994274405964e-06, + "loss": 0.7158, + "step": 40884 + }, + { + "epoch": 1.05, + "learning_rate": 1.511275647183766e-06, + "loss": 0.6406, + "step": 40885 + }, + { + "epoch": 1.05, + "learning_rate": 1.5112518665354755e-06, + "loss": 0.6514, + "step": 40886 + }, + { + "epoch": 1.05, + "learning_rate": 1.5112280854957427e-06, + "loss": 0.6455, + "step": 40887 + }, + { + "epoch": 1.05, + "learning_rate": 1.511204304064586e-06, + "loss": 0.6699, + "step": 40888 + }, + { + "epoch": 1.05, + "learning_rate": 1.511180522242024e-06, + "loss": 0.7832, + "step": 40889 + }, + { + "epoch": 1.05, + "learning_rate": 1.5111567400280745e-06, + "loss": 0.5317, + "step": 40890 + }, + { + "epoch": 1.05, + "learning_rate": 1.5111329574227557e-06, + "loss": 0.5142, + "step": 40891 + }, + { + "epoch": 1.05, + "learning_rate": 1.5111091744260858e-06, + "loss": 0.6909, + "step": 40892 + }, + { + "epoch": 1.05, + "learning_rate": 1.511085391038083e-06, + "loss": 0.6367, + "step": 40893 + }, + { + "epoch": 1.05, + "learning_rate": 1.511061607258766e-06, + "loss": 0.6299, + "step": 40894 + }, + { + "epoch": 1.05, + "learning_rate": 1.5110378230881527e-06, + "loss": 0.8652, + "step": 40895 + }, + { + "epoch": 1.05, + "learning_rate": 1.5110140385262608e-06, + "loss": 0.6416, + "step": 40896 + }, + { + "epoch": 1.05, + "learning_rate": 1.5109902535731092e-06, + "loss": 0.5952, + "step": 40897 + }, + { + "epoch": 1.05, + "learning_rate": 1.5109664682287158e-06, + "loss": 0.6885, + "step": 40898 + }, + { + "epoch": 1.05, + "learning_rate": 1.5109426824930992e-06, + "loss": 0.6753, + "step": 40899 + }, + { + "epoch": 1.05, + "learning_rate": 1.510918896366277e-06, + "loss": 0.4346, + "step": 40900 + }, + { + "epoch": 1.05, + "learning_rate": 1.5108951098482674e-06, + "loss": 0.7061, + "step": 40901 + }, + { + "epoch": 1.05, + "learning_rate": 1.510871322939089e-06, + "loss": 0.7559, + "step": 40902 + }, + { + "epoch": 1.05, + "learning_rate": 1.5108475356387604e-06, + "loss": 0.5374, + "step": 40903 + }, + { + "epoch": 1.05, + "learning_rate": 1.5108237479472988e-06, + "loss": 0.6313, + "step": 40904 + }, + { + "epoch": 1.05, + "learning_rate": 1.5107999598647234e-06, + "loss": 0.6934, + "step": 40905 + }, + { + "epoch": 1.05, + "learning_rate": 1.5107761713910517e-06, + "loss": 0.6035, + "step": 40906 + }, + { + "epoch": 1.05, + "learning_rate": 1.5107523825263023e-06, + "loss": 0.525, + "step": 40907 + }, + { + "epoch": 1.05, + "learning_rate": 1.510728593270493e-06, + "loss": 0.5938, + "step": 40908 + }, + { + "epoch": 1.05, + "learning_rate": 1.5107048036236426e-06, + "loss": 0.7026, + "step": 40909 + }, + { + "epoch": 1.05, + "learning_rate": 1.5106810135857689e-06, + "loss": 0.6121, + "step": 40910 + }, + { + "epoch": 1.05, + "learning_rate": 1.5106572231568901e-06, + "loss": 0.709, + "step": 40911 + }, + { + "epoch": 1.05, + "learning_rate": 1.5106334323370246e-06, + "loss": 0.7432, + "step": 40912 + }, + { + "epoch": 1.05, + "learning_rate": 1.5106096411261909e-06, + "loss": 0.5933, + "step": 40913 + }, + { + "epoch": 1.05, + "learning_rate": 1.5105858495244066e-06, + "loss": 0.6885, + "step": 40914 + }, + { + "epoch": 1.05, + "learning_rate": 1.5105620575316899e-06, + "loss": 0.3085, + "step": 40915 + }, + { + "epoch": 1.05, + "learning_rate": 1.5105382651480599e-06, + "loss": 0.7354, + "step": 40916 + }, + { + "epoch": 1.05, + "learning_rate": 1.5105144723735337e-06, + "loss": 0.6348, + "step": 40917 + }, + { + "epoch": 1.05, + "learning_rate": 1.5104906792081305e-06, + "loss": 0.4229, + "step": 40918 + }, + { + "epoch": 1.05, + "learning_rate": 1.5104668856518677e-06, + "loss": 0.6953, + "step": 40919 + }, + { + "epoch": 1.05, + "learning_rate": 1.5104430917047641e-06, + "loss": 0.8242, + "step": 40920 + }, + { + "epoch": 1.05, + "learning_rate": 1.5104192973668375e-06, + "loss": 0.603, + "step": 40921 + }, + { + "epoch": 1.05, + "learning_rate": 1.5103955026381065e-06, + "loss": 0.5562, + "step": 40922 + }, + { + "epoch": 1.05, + "learning_rate": 1.510371707518589e-06, + "loss": 0.7109, + "step": 40923 + }, + { + "epoch": 1.05, + "learning_rate": 1.5103479120083034e-06, + "loss": 0.6758, + "step": 40924 + }, + { + "epoch": 1.05, + "learning_rate": 1.510324116107268e-06, + "loss": 0.6587, + "step": 40925 + }, + { + "epoch": 1.05, + "learning_rate": 1.5103003198155006e-06, + "loss": 0.6479, + "step": 40926 + }, + { + "epoch": 1.05, + "learning_rate": 1.5102765231330196e-06, + "loss": 0.5708, + "step": 40927 + }, + { + "epoch": 1.05, + "learning_rate": 1.5102527260598442e-06, + "loss": 0.5444, + "step": 40928 + }, + { + "epoch": 1.05, + "learning_rate": 1.5102289285959909e-06, + "loss": 0.8262, + "step": 40929 + }, + { + "epoch": 1.05, + "learning_rate": 1.510205130741479e-06, + "loss": 0.7402, + "step": 40930 + }, + { + "epoch": 1.05, + "learning_rate": 1.5101813324963264e-06, + "loss": 0.708, + "step": 40931 + }, + { + "epoch": 1.05, + "learning_rate": 1.5101575338605518e-06, + "loss": 0.5061, + "step": 40932 + }, + { + "epoch": 1.05, + "learning_rate": 1.5101337348341728e-06, + "loss": 0.4609, + "step": 40933 + }, + { + "epoch": 1.05, + "learning_rate": 1.5101099354172074e-06, + "loss": 0.5884, + "step": 40934 + }, + { + "epoch": 1.05, + "learning_rate": 1.5100861356096748e-06, + "loss": 0.6357, + "step": 40935 + }, + { + "epoch": 1.05, + "learning_rate": 1.5100623354115926e-06, + "loss": 0.7207, + "step": 40936 + }, + { + "epoch": 1.05, + "learning_rate": 1.510038534822979e-06, + "loss": 0.6924, + "step": 40937 + }, + { + "epoch": 1.05, + "learning_rate": 1.5100147338438527e-06, + "loss": 0.4478, + "step": 40938 + }, + { + "epoch": 1.05, + "learning_rate": 1.5099909324742312e-06, + "loss": 0.4559, + "step": 40939 + }, + { + "epoch": 1.05, + "learning_rate": 1.5099671307141332e-06, + "loss": 0.6191, + "step": 40940 + }, + { + "epoch": 1.05, + "learning_rate": 1.509943328563577e-06, + "loss": 0.6895, + "step": 40941 + }, + { + "epoch": 1.05, + "learning_rate": 1.5099195260225802e-06, + "loss": 0.5986, + "step": 40942 + }, + { + "epoch": 1.05, + "learning_rate": 1.5098957230911621e-06, + "loss": 0.6091, + "step": 40943 + }, + { + "epoch": 1.05, + "learning_rate": 1.5098719197693397e-06, + "loss": 0.623, + "step": 40944 + }, + { + "epoch": 1.05, + "learning_rate": 1.5098481160571321e-06, + "loss": 0.7773, + "step": 40945 + }, + { + "epoch": 1.05, + "learning_rate": 1.5098243119545573e-06, + "loss": 0.7256, + "step": 40946 + }, + { + "epoch": 1.05, + "learning_rate": 1.5098005074616333e-06, + "loss": 0.5786, + "step": 40947 + }, + { + "epoch": 1.05, + "learning_rate": 1.5097767025783786e-06, + "loss": 0.6924, + "step": 40948 + }, + { + "epoch": 1.05, + "learning_rate": 1.5097528973048114e-06, + "loss": 0.6831, + "step": 40949 + }, + { + "epoch": 1.05, + "learning_rate": 1.5097290916409495e-06, + "loss": 0.7363, + "step": 40950 + }, + { + "epoch": 1.05, + "learning_rate": 1.5097052855868119e-06, + "loss": 0.6333, + "step": 40951 + }, + { + "epoch": 1.05, + "learning_rate": 1.5096814791424159e-06, + "loss": 0.4749, + "step": 40952 + }, + { + "epoch": 1.05, + "learning_rate": 1.5096576723077808e-06, + "loss": 0.6616, + "step": 40953 + }, + { + "epoch": 1.05, + "learning_rate": 1.509633865082924e-06, + "loss": 0.6309, + "step": 40954 + }, + { + "epoch": 1.05, + "learning_rate": 1.5096100574678636e-06, + "loss": 0.7285, + "step": 40955 + }, + { + "epoch": 1.05, + "learning_rate": 1.5095862494626188e-06, + "loss": 0.5886, + "step": 40956 + }, + { + "epoch": 1.05, + "learning_rate": 1.509562441067207e-06, + "loss": 0.8682, + "step": 40957 + }, + { + "epoch": 1.05, + "learning_rate": 1.5095386322816468e-06, + "loss": 0.6372, + "step": 40958 + }, + { + "epoch": 1.05, + "learning_rate": 1.509514823105956e-06, + "loss": 0.7188, + "step": 40959 + }, + { + "epoch": 1.05, + "learning_rate": 1.5094910135401536e-06, + "loss": 0.5601, + "step": 40960 + }, + { + "epoch": 1.05, + "learning_rate": 1.509467203584257e-06, + "loss": 0.7085, + "step": 40961 + }, + { + "epoch": 1.05, + "learning_rate": 1.5094433932382846e-06, + "loss": 0.7344, + "step": 40962 + }, + { + "epoch": 1.05, + "learning_rate": 1.5094195825022552e-06, + "loss": 0.5518, + "step": 40963 + }, + { + "epoch": 1.05, + "learning_rate": 1.5093957713761865e-06, + "loss": 0.8359, + "step": 40964 + }, + { + "epoch": 1.05, + "learning_rate": 1.5093719598600969e-06, + "loss": 0.627, + "step": 40965 + }, + { + "epoch": 1.05, + "learning_rate": 1.5093481479540047e-06, + "loss": 0.5254, + "step": 40966 + }, + { + "epoch": 1.05, + "learning_rate": 1.5093243356579277e-06, + "loss": 0.6274, + "step": 40967 + }, + { + "epoch": 1.05, + "learning_rate": 1.5093005229718848e-06, + "loss": 0.5671, + "step": 40968 + }, + { + "epoch": 1.05, + "learning_rate": 1.5092767098958938e-06, + "loss": 0.5879, + "step": 40969 + }, + { + "epoch": 1.05, + "learning_rate": 1.5092528964299733e-06, + "loss": 0.437, + "step": 40970 + }, + { + "epoch": 1.05, + "learning_rate": 1.5092290825741409e-06, + "loss": 0.7026, + "step": 40971 + }, + { + "epoch": 1.05, + "learning_rate": 1.5092052683284156e-06, + "loss": 0.613, + "step": 40972 + }, + { + "epoch": 1.05, + "learning_rate": 1.509181453692815e-06, + "loss": 0.7168, + "step": 40973 + }, + { + "epoch": 1.05, + "learning_rate": 1.5091576386673577e-06, + "loss": 0.4756, + "step": 40974 + }, + { + "epoch": 1.05, + "learning_rate": 1.5091338232520614e-06, + "loss": 0.6602, + "step": 40975 + }, + { + "epoch": 1.05, + "learning_rate": 1.5091100074469448e-06, + "loss": 0.709, + "step": 40976 + }, + { + "epoch": 1.05, + "learning_rate": 1.5090861912520265e-06, + "loss": 0.623, + "step": 40977 + }, + { + "epoch": 1.05, + "learning_rate": 1.509062374667324e-06, + "loss": 0.7412, + "step": 40978 + }, + { + "epoch": 1.05, + "learning_rate": 1.509038557692856e-06, + "loss": 0.7334, + "step": 40979 + }, + { + "epoch": 1.05, + "learning_rate": 1.5090147403286407e-06, + "loss": 0.6323, + "step": 40980 + }, + { + "epoch": 1.05, + "learning_rate": 1.508990922574696e-06, + "loss": 0.6504, + "step": 40981 + }, + { + "epoch": 1.05, + "learning_rate": 1.5089671044310404e-06, + "loss": 0.7188, + "step": 40982 + }, + { + "epoch": 1.05, + "learning_rate": 1.508943285897692e-06, + "loss": 0.5151, + "step": 40983 + }, + { + "epoch": 1.05, + "learning_rate": 1.5089194669746691e-06, + "loss": 0.4414, + "step": 40984 + }, + { + "epoch": 1.05, + "learning_rate": 1.5088956476619906e-06, + "loss": 0.5049, + "step": 40985 + }, + { + "epoch": 1.05, + "learning_rate": 1.5088718279596733e-06, + "loss": 0.3945, + "step": 40986 + }, + { + "epoch": 1.05, + "learning_rate": 1.5088480078677366e-06, + "loss": 0.6167, + "step": 40987 + }, + { + "epoch": 1.05, + "learning_rate": 1.5088241873861981e-06, + "loss": 0.6914, + "step": 40988 + }, + { + "epoch": 1.05, + "learning_rate": 1.5088003665150768e-06, + "loss": 0.426, + "step": 40989 + }, + { + "epoch": 1.05, + "learning_rate": 1.50877654525439e-06, + "loss": 0.7471, + "step": 40990 + }, + { + "epoch": 1.05, + "learning_rate": 1.5087527236041568e-06, + "loss": 0.6914, + "step": 40991 + }, + { + "epoch": 1.05, + "learning_rate": 1.5087289015643947e-06, + "loss": 0.4526, + "step": 40992 + }, + { + "epoch": 1.05, + "learning_rate": 1.5087050791351227e-06, + "loss": 0.7583, + "step": 40993 + }, + { + "epoch": 1.05, + "learning_rate": 1.508681256316358e-06, + "loss": 0.4849, + "step": 40994 + }, + { + "epoch": 1.05, + "learning_rate": 1.5086574331081199e-06, + "loss": 0.8027, + "step": 40995 + }, + { + "epoch": 1.05, + "learning_rate": 1.5086336095104258e-06, + "loss": 0.7261, + "step": 40996 + }, + { + "epoch": 1.05, + "learning_rate": 1.5086097855232947e-06, + "loss": 0.6133, + "step": 40997 + }, + { + "epoch": 1.05, + "learning_rate": 1.5085859611467445e-06, + "loss": 0.6973, + "step": 40998 + }, + { + "epoch": 1.05, + "learning_rate": 1.508562136380793e-06, + "loss": 0.6592, + "step": 40999 + }, + { + "epoch": 1.05, + "learning_rate": 1.5085383112254592e-06, + "loss": 0.7031, + "step": 41000 + }, + { + "epoch": 1.05, + "learning_rate": 1.508514485680761e-06, + "loss": 0.5732, + "step": 41001 + }, + { + "epoch": 1.05, + "learning_rate": 1.5084906597467164e-06, + "loss": 0.7803, + "step": 41002 + }, + { + "epoch": 1.05, + "learning_rate": 1.5084668334233442e-06, + "loss": 0.5349, + "step": 41003 + }, + { + "epoch": 1.05, + "learning_rate": 1.508443006710662e-06, + "loss": 0.7617, + "step": 41004 + }, + { + "epoch": 1.05, + "learning_rate": 1.5084191796086887e-06, + "loss": 0.5884, + "step": 41005 + }, + { + "epoch": 1.05, + "learning_rate": 1.5083953521174419e-06, + "loss": 0.6914, + "step": 41006 + }, + { + "epoch": 1.05, + "learning_rate": 1.5083715242369404e-06, + "loss": 0.665, + "step": 41007 + }, + { + "epoch": 1.05, + "learning_rate": 1.508347695967202e-06, + "loss": 0.8057, + "step": 41008 + }, + { + "epoch": 1.05, + "learning_rate": 1.5083238673082456e-06, + "loss": 0.7939, + "step": 41009 + }, + { + "epoch": 1.05, + "learning_rate": 1.5083000382600886e-06, + "loss": 0.8203, + "step": 41010 + }, + { + "epoch": 1.05, + "learning_rate": 1.5082762088227493e-06, + "loss": 0.8223, + "step": 41011 + }, + { + "epoch": 1.05, + "learning_rate": 1.508252378996247e-06, + "loss": 0.6567, + "step": 41012 + }, + { + "epoch": 1.05, + "learning_rate": 1.5082285487805985e-06, + "loss": 0.6528, + "step": 41013 + }, + { + "epoch": 1.05, + "learning_rate": 1.5082047181758233e-06, + "loss": 0.7461, + "step": 41014 + }, + { + "epoch": 1.05, + "learning_rate": 1.508180887181939e-06, + "loss": 0.6787, + "step": 41015 + }, + { + "epoch": 1.05, + "learning_rate": 1.5081570557989638e-06, + "loss": 0.6924, + "step": 41016 + }, + { + "epoch": 1.05, + "learning_rate": 1.508133224026916e-06, + "loss": 0.6035, + "step": 41017 + }, + { + "epoch": 1.05, + "learning_rate": 1.5081093918658145e-06, + "loss": 0.6855, + "step": 41018 + }, + { + "epoch": 1.05, + "learning_rate": 1.5080855593156767e-06, + "loss": 0.667, + "step": 41019 + }, + { + "epoch": 1.05, + "learning_rate": 1.5080617263765213e-06, + "loss": 0.6904, + "step": 41020 + }, + { + "epoch": 1.05, + "learning_rate": 1.508037893048366e-06, + "loss": 0.6279, + "step": 41021 + }, + { + "epoch": 1.05, + "learning_rate": 1.5080140593312298e-06, + "loss": 0.7021, + "step": 41022 + }, + { + "epoch": 1.05, + "learning_rate": 1.5079902252251304e-06, + "loss": 0.7041, + "step": 41023 + }, + { + "epoch": 1.05, + "learning_rate": 1.5079663907300861e-06, + "loss": 0.7202, + "step": 41024 + }, + { + "epoch": 1.05, + "learning_rate": 1.5079425558461157e-06, + "loss": 0.5457, + "step": 41025 + }, + { + "epoch": 1.05, + "learning_rate": 1.5079187205732367e-06, + "loss": 0.6621, + "step": 41026 + }, + { + "epoch": 1.05, + "learning_rate": 1.5078948849114679e-06, + "loss": 0.601, + "step": 41027 + }, + { + "epoch": 1.05, + "learning_rate": 1.5078710488608273e-06, + "loss": 0.5752, + "step": 41028 + }, + { + "epoch": 1.05, + "learning_rate": 1.5078472124213332e-06, + "loss": 0.8096, + "step": 41029 + }, + { + "epoch": 1.05, + "learning_rate": 1.5078233755930037e-06, + "loss": 0.6265, + "step": 41030 + }, + { + "epoch": 1.05, + "learning_rate": 1.5077995383758575e-06, + "loss": 0.5765, + "step": 41031 + }, + { + "epoch": 1.05, + "learning_rate": 1.5077757007699118e-06, + "loss": 0.6812, + "step": 41032 + }, + { + "epoch": 1.05, + "learning_rate": 1.5077518627751866e-06, + "loss": 0.6875, + "step": 41033 + }, + { + "epoch": 1.05, + "learning_rate": 1.5077280243916985e-06, + "loss": 0.5818, + "step": 41034 + }, + { + "epoch": 1.05, + "learning_rate": 1.5077041856194668e-06, + "loss": 0.6365, + "step": 41035 + }, + { + "epoch": 1.05, + "learning_rate": 1.5076803464585091e-06, + "loss": 0.6299, + "step": 41036 + }, + { + "epoch": 1.05, + "learning_rate": 1.5076565069088439e-06, + "loss": 0.5894, + "step": 41037 + }, + { + "epoch": 1.05, + "learning_rate": 1.5076326669704896e-06, + "loss": 0.5615, + "step": 41038 + }, + { + "epoch": 1.05, + "learning_rate": 1.507608826643464e-06, + "loss": 0.6113, + "step": 41039 + }, + { + "epoch": 1.05, + "learning_rate": 1.507584985927786e-06, + "loss": 0.8296, + "step": 41040 + }, + { + "epoch": 1.05, + "learning_rate": 1.5075611448234732e-06, + "loss": 0.7061, + "step": 41041 + }, + { + "epoch": 1.05, + "learning_rate": 1.5075373033305443e-06, + "loss": 0.7676, + "step": 41042 + }, + { + "epoch": 1.05, + "learning_rate": 1.5075134614490174e-06, + "loss": 0.6885, + "step": 41043 + }, + { + "epoch": 1.05, + "learning_rate": 1.5074896191789108e-06, + "loss": 0.9189, + "step": 41044 + }, + { + "epoch": 1.05, + "learning_rate": 1.5074657765202429e-06, + "loss": 0.5974, + "step": 41045 + }, + { + "epoch": 1.05, + "learning_rate": 1.5074419334730318e-06, + "loss": 0.8115, + "step": 41046 + }, + { + "epoch": 1.05, + "learning_rate": 1.5074180900372954e-06, + "loss": 0.5282, + "step": 41047 + }, + { + "epoch": 1.05, + "learning_rate": 1.5073942462130528e-06, + "loss": 0.7754, + "step": 41048 + }, + { + "epoch": 1.05, + "learning_rate": 1.5073704020003212e-06, + "loss": 0.6499, + "step": 41049 + }, + { + "epoch": 1.05, + "learning_rate": 1.5073465573991198e-06, + "loss": 0.7393, + "step": 41050 + }, + { + "epoch": 1.05, + "learning_rate": 1.5073227124094663e-06, + "loss": 0.7319, + "step": 41051 + }, + { + "epoch": 1.05, + "learning_rate": 1.5072988670313792e-06, + "loss": 0.5659, + "step": 41052 + }, + { + "epoch": 1.05, + "learning_rate": 1.5072750212648766e-06, + "loss": 0.5674, + "step": 41053 + }, + { + "epoch": 1.05, + "learning_rate": 1.507251175109977e-06, + "loss": 0.5842, + "step": 41054 + }, + { + "epoch": 1.05, + "learning_rate": 1.507227328566698e-06, + "loss": 0.5361, + "step": 41055 + }, + { + "epoch": 1.05, + "learning_rate": 1.507203481635059e-06, + "loss": 0.613, + "step": 41056 + }, + { + "epoch": 1.05, + "learning_rate": 1.5071796343150774e-06, + "loss": 0.7017, + "step": 41057 + }, + { + "epoch": 1.05, + "learning_rate": 1.5071557866067717e-06, + "loss": 0.344, + "step": 41058 + }, + { + "epoch": 1.05, + "learning_rate": 1.5071319385101599e-06, + "loss": 0.5216, + "step": 41059 + }, + { + "epoch": 1.05, + "learning_rate": 1.507108090025261e-06, + "loss": 0.7227, + "step": 41060 + }, + { + "epoch": 1.05, + "learning_rate": 1.5070842411520922e-06, + "loss": 0.6914, + "step": 41061 + }, + { + "epoch": 1.05, + "learning_rate": 1.5070603918906727e-06, + "loss": 0.7686, + "step": 41062 + }, + { + "epoch": 1.05, + "learning_rate": 1.5070365422410202e-06, + "loss": 0.8623, + "step": 41063 + }, + { + "epoch": 1.05, + "learning_rate": 1.5070126922031532e-06, + "loss": 0.7178, + "step": 41064 + }, + { + "epoch": 1.05, + "learning_rate": 1.5069888417770898e-06, + "loss": 0.7744, + "step": 41065 + }, + { + "epoch": 1.05, + "learning_rate": 1.5069649909628484e-06, + "loss": 0.7402, + "step": 41066 + }, + { + "epoch": 1.05, + "learning_rate": 1.506941139760447e-06, + "loss": 0.6787, + "step": 41067 + }, + { + "epoch": 1.05, + "learning_rate": 1.5069172881699044e-06, + "loss": 0.7744, + "step": 41068 + }, + { + "epoch": 1.05, + "learning_rate": 1.5068934361912385e-06, + "loss": 0.7178, + "step": 41069 + }, + { + "epoch": 1.05, + "learning_rate": 1.5068695838244674e-06, + "loss": 0.5957, + "step": 41070 + }, + { + "epoch": 1.05, + "learning_rate": 1.50684573106961e-06, + "loss": 0.5835, + "step": 41071 + }, + { + "epoch": 1.05, + "learning_rate": 1.5068218779266834e-06, + "loss": 0.6294, + "step": 41072 + }, + { + "epoch": 1.05, + "learning_rate": 1.5067980243957075e-06, + "loss": 0.5151, + "step": 41073 + }, + { + "epoch": 1.05, + "learning_rate": 1.506774170476699e-06, + "loss": 0.6719, + "step": 41074 + }, + { + "epoch": 1.05, + "learning_rate": 1.506750316169677e-06, + "loss": 0.6025, + "step": 41075 + }, + { + "epoch": 1.05, + "learning_rate": 1.5067264614746593e-06, + "loss": 0.6689, + "step": 41076 + }, + { + "epoch": 1.05, + "learning_rate": 1.5067026063916651e-06, + "loss": 0.5641, + "step": 41077 + }, + { + "epoch": 1.05, + "learning_rate": 1.5066787509207116e-06, + "loss": 0.7139, + "step": 41078 + }, + { + "epoch": 1.05, + "learning_rate": 1.5066548950618174e-06, + "loss": 0.6836, + "step": 41079 + }, + { + "epoch": 1.05, + "learning_rate": 1.506631038815001e-06, + "loss": 0.6929, + "step": 41080 + }, + { + "epoch": 1.05, + "learning_rate": 1.5066071821802803e-06, + "loss": 0.791, + "step": 41081 + }, + { + "epoch": 1.05, + "learning_rate": 1.506583325157674e-06, + "loss": 0.5227, + "step": 41082 + }, + { + "epoch": 1.05, + "learning_rate": 1.5065594677472003e-06, + "loss": 0.5596, + "step": 41083 + }, + { + "epoch": 1.05, + "learning_rate": 1.506535609948877e-06, + "loss": 0.6992, + "step": 41084 + }, + { + "epoch": 1.05, + "learning_rate": 1.5065117517627227e-06, + "loss": 0.7266, + "step": 41085 + }, + { + "epoch": 1.05, + "learning_rate": 1.5064878931887557e-06, + "loss": 0.6738, + "step": 41086 + }, + { + "epoch": 1.05, + "learning_rate": 1.5064640342269943e-06, + "loss": 0.6514, + "step": 41087 + }, + { + "epoch": 1.05, + "learning_rate": 1.5064401748774566e-06, + "loss": 0.7661, + "step": 41088 + }, + { + "epoch": 1.05, + "learning_rate": 1.5064163151401608e-06, + "loss": 0.5529, + "step": 41089 + }, + { + "epoch": 1.05, + "learning_rate": 1.5063924550151254e-06, + "loss": 0.6592, + "step": 41090 + }, + { + "epoch": 1.05, + "learning_rate": 1.5063685945023688e-06, + "loss": 0.7432, + "step": 41091 + }, + { + "epoch": 1.05, + "learning_rate": 1.5063447336019089e-06, + "loss": 0.397, + "step": 41092 + }, + { + "epoch": 1.05, + "learning_rate": 1.506320872313764e-06, + "loss": 0.749, + "step": 41093 + }, + { + "epoch": 1.05, + "learning_rate": 1.5062970106379526e-06, + "loss": 0.6235, + "step": 41094 + }, + { + "epoch": 1.05, + "learning_rate": 1.5062731485744928e-06, + "loss": 0.5415, + "step": 41095 + }, + { + "epoch": 1.05, + "learning_rate": 1.506249286123403e-06, + "loss": 0.7402, + "step": 41096 + }, + { + "epoch": 1.05, + "learning_rate": 1.5062254232847016e-06, + "loss": 0.5063, + "step": 41097 + }, + { + "epoch": 1.05, + "learning_rate": 1.5062015600584065e-06, + "loss": 0.5596, + "step": 41098 + }, + { + "epoch": 1.05, + "learning_rate": 1.506177696444536e-06, + "loss": 0.4576, + "step": 41099 + }, + { + "epoch": 1.05, + "learning_rate": 1.5061538324431087e-06, + "loss": 0.7334, + "step": 41100 + }, + { + "epoch": 1.05, + "learning_rate": 1.5061299680541427e-06, + "loss": 0.4922, + "step": 41101 + }, + { + "epoch": 1.05, + "learning_rate": 1.506106103277656e-06, + "loss": 0.6636, + "step": 41102 + }, + { + "epoch": 1.05, + "learning_rate": 1.5060822381136674e-06, + "loss": 0.6533, + "step": 41103 + }, + { + "epoch": 1.05, + "learning_rate": 1.5060583725621947e-06, + "loss": 0.6541, + "step": 41104 + }, + { + "epoch": 1.05, + "learning_rate": 1.5060345066232562e-06, + "loss": 0.5908, + "step": 41105 + }, + { + "epoch": 1.05, + "learning_rate": 1.5060106402968708e-06, + "loss": 0.6211, + "step": 41106 + }, + { + "epoch": 1.05, + "learning_rate": 1.505986773583056e-06, + "loss": 0.6226, + "step": 41107 + }, + { + "epoch": 1.05, + "learning_rate": 1.5059629064818306e-06, + "loss": 0.583, + "step": 41108 + }, + { + "epoch": 1.05, + "learning_rate": 1.5059390389932126e-06, + "loss": 0.7959, + "step": 41109 + }, + { + "epoch": 1.05, + "learning_rate": 1.5059151711172204e-06, + "loss": 0.5872, + "step": 41110 + }, + { + "epoch": 1.05, + "learning_rate": 1.5058913028538722e-06, + "loss": 0.4971, + "step": 41111 + }, + { + "epoch": 1.05, + "learning_rate": 1.5058674342031861e-06, + "loss": 0.7251, + "step": 41112 + }, + { + "epoch": 1.05, + "learning_rate": 1.5058435651651807e-06, + "loss": 0.6055, + "step": 41113 + }, + { + "epoch": 1.05, + "learning_rate": 1.5058196957398742e-06, + "loss": 0.7344, + "step": 41114 + }, + { + "epoch": 1.05, + "learning_rate": 1.5057958259272847e-06, + "loss": 0.6372, + "step": 41115 + }, + { + "epoch": 1.05, + "learning_rate": 1.5057719557274307e-06, + "loss": 0.7246, + "step": 41116 + }, + { + "epoch": 1.05, + "learning_rate": 1.5057480851403304e-06, + "loss": 0.7324, + "step": 41117 + }, + { + "epoch": 1.05, + "learning_rate": 1.5057242141660017e-06, + "loss": 0.4961, + "step": 41118 + }, + { + "epoch": 1.05, + "learning_rate": 1.5057003428044636e-06, + "loss": 0.6113, + "step": 41119 + }, + { + "epoch": 1.05, + "learning_rate": 1.5056764710557336e-06, + "loss": 0.6631, + "step": 41120 + }, + { + "epoch": 1.05, + "learning_rate": 1.505652598919831e-06, + "loss": 0.7827, + "step": 41121 + }, + { + "epoch": 1.05, + "learning_rate": 1.5056287263967732e-06, + "loss": 0.4956, + "step": 41122 + }, + { + "epoch": 1.05, + "learning_rate": 1.5056048534865787e-06, + "loss": 0.5742, + "step": 41123 + }, + { + "epoch": 1.05, + "learning_rate": 1.5055809801892656e-06, + "loss": 0.4404, + "step": 41124 + }, + { + "epoch": 1.05, + "learning_rate": 1.5055571065048527e-06, + "loss": 0.7598, + "step": 41125 + }, + { + "epoch": 1.05, + "learning_rate": 1.5055332324333576e-06, + "loss": 0.5356, + "step": 41126 + }, + { + "epoch": 1.05, + "learning_rate": 1.5055093579747994e-06, + "loss": 0.6729, + "step": 41127 + }, + { + "epoch": 1.05, + "learning_rate": 1.5054854831291956e-06, + "loss": 0.7168, + "step": 41128 + }, + { + "epoch": 1.05, + "learning_rate": 1.5054616078965649e-06, + "loss": 0.8115, + "step": 41129 + }, + { + "epoch": 1.05, + "learning_rate": 1.5054377322769254e-06, + "loss": 0.6992, + "step": 41130 + }, + { + "epoch": 1.05, + "learning_rate": 1.5054138562702957e-06, + "loss": 0.7529, + "step": 41131 + }, + { + "epoch": 1.05, + "learning_rate": 1.5053899798766935e-06, + "loss": 0.6138, + "step": 41132 + }, + { + "epoch": 1.05, + "learning_rate": 1.5053661030961378e-06, + "loss": 0.875, + "step": 41133 + }, + { + "epoch": 1.05, + "learning_rate": 1.5053422259286467e-06, + "loss": 0.5342, + "step": 41134 + }, + { + "epoch": 1.05, + "learning_rate": 1.5053183483742374e-06, + "loss": 0.7412, + "step": 41135 + }, + { + "epoch": 1.05, + "learning_rate": 1.50529447043293e-06, + "loss": 0.5659, + "step": 41136 + }, + { + "epoch": 1.05, + "learning_rate": 1.5052705921047414e-06, + "loss": 0.7783, + "step": 41137 + }, + { + "epoch": 1.05, + "learning_rate": 1.5052467133896904e-06, + "loss": 0.6328, + "step": 41138 + }, + { + "epoch": 1.05, + "learning_rate": 1.5052228342877954e-06, + "loss": 0.6709, + "step": 41139 + }, + { + "epoch": 1.05, + "learning_rate": 1.5051989547990742e-06, + "loss": 0.7178, + "step": 41140 + }, + { + "epoch": 1.05, + "learning_rate": 1.5051750749235454e-06, + "loss": 0.4744, + "step": 41141 + }, + { + "epoch": 1.05, + "learning_rate": 1.5051511946612276e-06, + "loss": 0.6133, + "step": 41142 + }, + { + "epoch": 1.05, + "learning_rate": 1.5051273140121388e-06, + "loss": 0.5653, + "step": 41143 + }, + { + "epoch": 1.05, + "learning_rate": 1.5051034329762971e-06, + "loss": 0.6482, + "step": 41144 + }, + { + "epoch": 1.05, + "learning_rate": 1.5050795515537205e-06, + "loss": 0.6748, + "step": 41145 + }, + { + "epoch": 1.05, + "learning_rate": 1.505055669744428e-06, + "loss": 0.623, + "step": 41146 + }, + { + "epoch": 1.05, + "learning_rate": 1.5050317875484377e-06, + "loss": 0.8301, + "step": 41147 + }, + { + "epoch": 1.05, + "learning_rate": 1.505007904965768e-06, + "loss": 0.4917, + "step": 41148 + }, + { + "epoch": 1.05, + "learning_rate": 1.5049840219964366e-06, + "loss": 0.6416, + "step": 41149 + }, + { + "epoch": 1.05, + "learning_rate": 1.5049601386404622e-06, + "loss": 0.7949, + "step": 41150 + }, + { + "epoch": 1.05, + "learning_rate": 1.504936254897863e-06, + "loss": 0.6855, + "step": 41151 + }, + { + "epoch": 1.05, + "learning_rate": 1.5049123707686576e-06, + "loss": 0.6709, + "step": 41152 + }, + { + "epoch": 1.05, + "learning_rate": 1.5048884862528638e-06, + "loss": 0.7217, + "step": 41153 + }, + { + "epoch": 1.05, + "learning_rate": 1.5048646013505003e-06, + "loss": 0.6562, + "step": 41154 + }, + { + "epoch": 1.05, + "learning_rate": 1.5048407160615849e-06, + "loss": 0.75, + "step": 41155 + }, + { + "epoch": 1.05, + "learning_rate": 1.5048168303861363e-06, + "loss": 0.5427, + "step": 41156 + }, + { + "epoch": 1.05, + "learning_rate": 1.5047929443241726e-06, + "loss": 0.6992, + "step": 41157 + }, + { + "epoch": 1.05, + "learning_rate": 1.5047690578757123e-06, + "loss": 0.9092, + "step": 41158 + }, + { + "epoch": 1.05, + "learning_rate": 1.5047451710407734e-06, + "loss": 0.6426, + "step": 41159 + }, + { + "epoch": 1.05, + "learning_rate": 1.5047212838193743e-06, + "loss": 0.7197, + "step": 41160 + }, + { + "epoch": 1.05, + "learning_rate": 1.5046973962115334e-06, + "loss": 0.6943, + "step": 41161 + }, + { + "epoch": 1.06, + "learning_rate": 1.504673508217269e-06, + "loss": 0.7139, + "step": 41162 + }, + { + "epoch": 1.06, + "learning_rate": 1.5046496198365995e-06, + "loss": 0.5835, + "step": 41163 + }, + { + "epoch": 1.06, + "learning_rate": 1.5046257310695425e-06, + "loss": 0.6274, + "step": 41164 + }, + { + "epoch": 1.06, + "learning_rate": 1.5046018419161173e-06, + "loss": 0.6758, + "step": 41165 + }, + { + "epoch": 1.06, + "learning_rate": 1.5045779523763412e-06, + "loss": 0.7734, + "step": 41166 + }, + { + "epoch": 1.06, + "learning_rate": 1.5045540624502331e-06, + "loss": 0.6982, + "step": 41167 + }, + { + "epoch": 1.06, + "learning_rate": 1.5045301721378113e-06, + "loss": 0.7363, + "step": 41168 + }, + { + "epoch": 1.06, + "learning_rate": 1.5045062814390938e-06, + "loss": 0.6807, + "step": 41169 + }, + { + "epoch": 1.06, + "learning_rate": 1.504482390354099e-06, + "loss": 0.6348, + "step": 41170 + }, + { + "epoch": 1.06, + "learning_rate": 1.5044584988828453e-06, + "loss": 0.5718, + "step": 41171 + }, + { + "epoch": 1.06, + "learning_rate": 1.5044346070253509e-06, + "loss": 0.6914, + "step": 41172 + }, + { + "epoch": 1.06, + "learning_rate": 1.5044107147816342e-06, + "loss": 0.5442, + "step": 41173 + }, + { + "epoch": 1.06, + "learning_rate": 1.5043868221517136e-06, + "loss": 0.6724, + "step": 41174 + }, + { + "epoch": 1.06, + "learning_rate": 1.5043629291356068e-06, + "loss": 0.7373, + "step": 41175 + }, + { + "epoch": 1.06, + "learning_rate": 1.5043390357333325e-06, + "loss": 0.6865, + "step": 41176 + }, + { + "epoch": 1.06, + "learning_rate": 1.5043151419449092e-06, + "loss": 0.583, + "step": 41177 + }, + { + "epoch": 1.06, + "learning_rate": 1.5042912477703551e-06, + "loss": 0.7676, + "step": 41178 + }, + { + "epoch": 1.06, + "learning_rate": 1.504267353209688e-06, + "loss": 0.4966, + "step": 41179 + }, + { + "epoch": 1.06, + "learning_rate": 1.5042434582629269e-06, + "loss": 0.77, + "step": 41180 + }, + { + "epoch": 1.06, + "learning_rate": 1.5042195629300898e-06, + "loss": 0.5913, + "step": 41181 + }, + { + "epoch": 1.06, + "learning_rate": 1.5041956672111945e-06, + "loss": 0.668, + "step": 41182 + }, + { + "epoch": 1.06, + "learning_rate": 1.5041717711062602e-06, + "loss": 0.6387, + "step": 41183 + }, + { + "epoch": 1.06, + "learning_rate": 1.5041478746153046e-06, + "loss": 0.7275, + "step": 41184 + }, + { + "epoch": 1.06, + "learning_rate": 1.504123977738346e-06, + "loss": 0.4414, + "step": 41185 + }, + { + "epoch": 1.06, + "learning_rate": 1.5041000804754034e-06, + "loss": 0.5537, + "step": 41186 + }, + { + "epoch": 1.06, + "learning_rate": 1.504076182826494e-06, + "loss": 0.6816, + "step": 41187 + }, + { + "epoch": 1.06, + "learning_rate": 1.504052284791637e-06, + "loss": 0.7139, + "step": 41188 + }, + { + "epoch": 1.06, + "learning_rate": 1.5040283863708503e-06, + "loss": 0.562, + "step": 41189 + }, + { + "epoch": 1.06, + "learning_rate": 1.5040044875641519e-06, + "loss": 0.6792, + "step": 41190 + }, + { + "epoch": 1.06, + "learning_rate": 1.5039805883715605e-06, + "loss": 0.6069, + "step": 41191 + }, + { + "epoch": 1.06, + "learning_rate": 1.5039566887930947e-06, + "loss": 0.6992, + "step": 41192 + }, + { + "epoch": 1.06, + "learning_rate": 1.5039327888287722e-06, + "loss": 0.6738, + "step": 41193 + }, + { + "epoch": 1.06, + "learning_rate": 1.5039088884786117e-06, + "loss": 0.5554, + "step": 41194 + }, + { + "epoch": 1.06, + "learning_rate": 1.5038849877426312e-06, + "loss": 0.6074, + "step": 41195 + }, + { + "epoch": 1.06, + "learning_rate": 1.5038610866208493e-06, + "loss": 0.624, + "step": 41196 + }, + { + "epoch": 1.06, + "learning_rate": 1.5038371851132837e-06, + "loss": 0.6572, + "step": 41197 + }, + { + "epoch": 1.06, + "learning_rate": 1.5038132832199536e-06, + "loss": 0.7598, + "step": 41198 + }, + { + "epoch": 1.06, + "learning_rate": 1.5037893809408763e-06, + "loss": 0.7549, + "step": 41199 + }, + { + "epoch": 1.06, + "learning_rate": 1.5037654782760712e-06, + "loss": 0.6069, + "step": 41200 + }, + { + "epoch": 1.06, + "learning_rate": 1.5037415752255558e-06, + "loss": 0.5508, + "step": 41201 + }, + { + "epoch": 1.06, + "learning_rate": 1.5037176717893485e-06, + "loss": 0.6436, + "step": 41202 + }, + { + "epoch": 1.06, + "learning_rate": 1.5036937679674682e-06, + "loss": 0.459, + "step": 41203 + }, + { + "epoch": 1.06, + "learning_rate": 1.5036698637599323e-06, + "loss": 0.748, + "step": 41204 + }, + { + "epoch": 1.06, + "learning_rate": 1.5036459591667597e-06, + "loss": 0.603, + "step": 41205 + }, + { + "epoch": 1.06, + "learning_rate": 1.5036220541879683e-06, + "loss": 0.7891, + "step": 41206 + }, + { + "epoch": 1.06, + "learning_rate": 1.5035981488235769e-06, + "loss": 0.6174, + "step": 41207 + }, + { + "epoch": 1.06, + "learning_rate": 1.5035742430736037e-06, + "loss": 0.6646, + "step": 41208 + }, + { + "epoch": 1.06, + "learning_rate": 1.503550336938067e-06, + "loss": 0.8125, + "step": 41209 + }, + { + "epoch": 1.06, + "learning_rate": 1.5035264304169842e-06, + "loss": 0.6533, + "step": 41210 + }, + { + "epoch": 1.06, + "learning_rate": 1.5035025235103749e-06, + "loss": 0.6313, + "step": 41211 + }, + { + "epoch": 1.06, + "learning_rate": 1.503478616218257e-06, + "loss": 0.6875, + "step": 41212 + }, + { + "epoch": 1.06, + "learning_rate": 1.5034547085406483e-06, + "loss": 0.7607, + "step": 41213 + }, + { + "epoch": 1.06, + "learning_rate": 1.5034308004775676e-06, + "loss": 0.752, + "step": 41214 + }, + { + "epoch": 1.06, + "learning_rate": 1.5034068920290332e-06, + "loss": 0.5107, + "step": 41215 + }, + { + "epoch": 1.06, + "learning_rate": 1.503382983195063e-06, + "loss": 0.5435, + "step": 41216 + }, + { + "epoch": 1.06, + "learning_rate": 1.503359073975676e-06, + "loss": 0.6284, + "step": 41217 + }, + { + "epoch": 1.06, + "learning_rate": 1.50333516437089e-06, + "loss": 0.6455, + "step": 41218 + }, + { + "epoch": 1.06, + "learning_rate": 1.5033112543807231e-06, + "loss": 0.7295, + "step": 41219 + }, + { + "epoch": 1.06, + "learning_rate": 1.5032873440051943e-06, + "loss": 0.5996, + "step": 41220 + }, + { + "epoch": 1.06, + "learning_rate": 1.5032634332443212e-06, + "loss": 0.7402, + "step": 41221 + }, + { + "epoch": 1.06, + "learning_rate": 1.5032395220981227e-06, + "loss": 0.6685, + "step": 41222 + }, + { + "epoch": 1.06, + "learning_rate": 1.5032156105666167e-06, + "loss": 0.5669, + "step": 41223 + }, + { + "epoch": 1.06, + "learning_rate": 1.5031916986498217e-06, + "loss": 0.6196, + "step": 41224 + }, + { + "epoch": 1.06, + "learning_rate": 1.5031677863477556e-06, + "loss": 0.5254, + "step": 41225 + }, + { + "epoch": 1.06, + "learning_rate": 1.5031438736604376e-06, + "loss": 0.8623, + "step": 41226 + }, + { + "epoch": 1.06, + "learning_rate": 1.5031199605878852e-06, + "loss": 0.6689, + "step": 41227 + }, + { + "epoch": 1.06, + "learning_rate": 1.5030960471301172e-06, + "loss": 0.7119, + "step": 41228 + }, + { + "epoch": 1.06, + "learning_rate": 1.5030721332871515e-06, + "loss": 0.5323, + "step": 41229 + }, + { + "epoch": 1.06, + "learning_rate": 1.5030482190590066e-06, + "loss": 0.7119, + "step": 41230 + }, + { + "epoch": 1.06, + "learning_rate": 1.5030243044457008e-06, + "loss": 0.7725, + "step": 41231 + }, + { + "epoch": 1.06, + "learning_rate": 1.5030003894472528e-06, + "loss": 0.6846, + "step": 41232 + }, + { + "epoch": 1.06, + "learning_rate": 1.50297647406368e-06, + "loss": 0.8213, + "step": 41233 + }, + { + "epoch": 1.06, + "learning_rate": 1.5029525582950014e-06, + "loss": 0.5723, + "step": 41234 + }, + { + "epoch": 1.06, + "learning_rate": 1.502928642141235e-06, + "loss": 0.7178, + "step": 41235 + }, + { + "epoch": 1.06, + "learning_rate": 1.5029047256023994e-06, + "loss": 0.5952, + "step": 41236 + }, + { + "epoch": 1.06, + "learning_rate": 1.5028808086785129e-06, + "loss": 0.7764, + "step": 41237 + }, + { + "epoch": 1.06, + "learning_rate": 1.5028568913695936e-06, + "loss": 0.7119, + "step": 41238 + }, + { + "epoch": 1.06, + "learning_rate": 1.5028329736756597e-06, + "loss": 0.6299, + "step": 41239 + }, + { + "epoch": 1.06, + "learning_rate": 1.5028090555967302e-06, + "loss": 0.6201, + "step": 41240 + }, + { + "epoch": 1.06, + "learning_rate": 1.5027851371328226e-06, + "loss": 0.5515, + "step": 41241 + }, + { + "epoch": 1.06, + "learning_rate": 1.5027612182839555e-06, + "loss": 0.5957, + "step": 41242 + }, + { + "epoch": 1.06, + "learning_rate": 1.5027372990501474e-06, + "loss": 0.6748, + "step": 41243 + }, + { + "epoch": 1.06, + "learning_rate": 1.5027133794314165e-06, + "loss": 0.6309, + "step": 41244 + }, + { + "epoch": 1.06, + "learning_rate": 1.5026894594277809e-06, + "loss": 0.5625, + "step": 41245 + }, + { + "epoch": 1.06, + "learning_rate": 1.5026655390392592e-06, + "loss": 0.7441, + "step": 41246 + }, + { + "epoch": 1.06, + "learning_rate": 1.5026416182658697e-06, + "loss": 0.6948, + "step": 41247 + }, + { + "epoch": 1.06, + "learning_rate": 1.5026176971076303e-06, + "loss": 0.7061, + "step": 41248 + }, + { + "epoch": 1.06, + "learning_rate": 1.50259377556456e-06, + "loss": 0.7627, + "step": 41249 + }, + { + "epoch": 1.06, + "learning_rate": 1.5025698536366764e-06, + "loss": 0.749, + "step": 41250 + }, + { + "epoch": 1.06, + "learning_rate": 1.5025459313239982e-06, + "loss": 0.6504, + "step": 41251 + }, + { + "epoch": 1.06, + "learning_rate": 1.5025220086265441e-06, + "loss": 0.5811, + "step": 41252 + }, + { + "epoch": 1.06, + "learning_rate": 1.502498085544332e-06, + "loss": 0.6221, + "step": 41253 + }, + { + "epoch": 1.06, + "learning_rate": 1.5024741620773797e-06, + "loss": 0.708, + "step": 41254 + }, + { + "epoch": 1.06, + "learning_rate": 1.5024502382257065e-06, + "loss": 0.605, + "step": 41255 + }, + { + "epoch": 1.06, + "learning_rate": 1.5024263139893299e-06, + "loss": 0.6211, + "step": 41256 + }, + { + "epoch": 1.06, + "learning_rate": 1.502402389368269e-06, + "loss": 0.6792, + "step": 41257 + }, + { + "epoch": 1.06, + "learning_rate": 1.5023784643625413e-06, + "loss": 0.6108, + "step": 41258 + }, + { + "epoch": 1.06, + "learning_rate": 1.5023545389721658e-06, + "loss": 0.5796, + "step": 41259 + }, + { + "epoch": 1.06, + "learning_rate": 1.5023306131971602e-06, + "loss": 0.7656, + "step": 41260 + }, + { + "epoch": 1.06, + "learning_rate": 1.5023066870375437e-06, + "loss": 0.7334, + "step": 41261 + }, + { + "epoch": 1.06, + "learning_rate": 1.5022827604933335e-06, + "loss": 0.5796, + "step": 41262 + }, + { + "epoch": 1.06, + "learning_rate": 1.5022588335645488e-06, + "loss": 0.7134, + "step": 41263 + }, + { + "epoch": 1.06, + "learning_rate": 1.5022349062512075e-06, + "loss": 0.7969, + "step": 41264 + }, + { + "epoch": 1.06, + "learning_rate": 1.5022109785533279e-06, + "loss": 0.6436, + "step": 41265 + }, + { + "epoch": 1.06, + "learning_rate": 1.5021870504709283e-06, + "loss": 0.7969, + "step": 41266 + }, + { + "epoch": 1.06, + "learning_rate": 1.5021631220040277e-06, + "loss": 0.5903, + "step": 41267 + }, + { + "epoch": 1.06, + "learning_rate": 1.5021391931526438e-06, + "loss": 0.5469, + "step": 41268 + }, + { + "epoch": 1.06, + "learning_rate": 1.5021152639167943e-06, + "loss": 0.7568, + "step": 41269 + }, + { + "epoch": 1.06, + "learning_rate": 1.502091334296499e-06, + "loss": 0.6758, + "step": 41270 + }, + { + "epoch": 1.06, + "learning_rate": 1.5020674042917754e-06, + "loss": 0.6689, + "step": 41271 + }, + { + "epoch": 1.06, + "learning_rate": 1.5020434739026417e-06, + "loss": 0.835, + "step": 41272 + }, + { + "epoch": 1.06, + "learning_rate": 1.5020195431291162e-06, + "loss": 0.6128, + "step": 41273 + }, + { + "epoch": 1.06, + "learning_rate": 1.5019956119712175e-06, + "loss": 0.4376, + "step": 41274 + }, + { + "epoch": 1.06, + "learning_rate": 1.501971680428964e-06, + "loss": 0.6807, + "step": 41275 + }, + { + "epoch": 1.06, + "learning_rate": 1.501947748502374e-06, + "loss": 0.7158, + "step": 41276 + }, + { + "epoch": 1.06, + "learning_rate": 1.5019238161914656e-06, + "loss": 0.4878, + "step": 41277 + }, + { + "epoch": 1.06, + "learning_rate": 1.501899883496257e-06, + "loss": 0.6108, + "step": 41278 + }, + { + "epoch": 1.06, + "learning_rate": 1.5018759504167667e-06, + "loss": 0.6221, + "step": 41279 + }, + { + "epoch": 1.06, + "learning_rate": 1.5018520169530133e-06, + "loss": 0.7578, + "step": 41280 + }, + { + "epoch": 1.06, + "learning_rate": 1.5018280831050148e-06, + "loss": 0.7949, + "step": 41281 + }, + { + "epoch": 1.06, + "learning_rate": 1.50180414887279e-06, + "loss": 0.6133, + "step": 41282 + }, + { + "epoch": 1.06, + "learning_rate": 1.5017802142563562e-06, + "loss": 0.7227, + "step": 41283 + }, + { + "epoch": 1.06, + "learning_rate": 1.5017562792557327e-06, + "loss": 0.7012, + "step": 41284 + }, + { + "epoch": 1.06, + "learning_rate": 1.5017323438709371e-06, + "loss": 0.7227, + "step": 41285 + }, + { + "epoch": 1.06, + "learning_rate": 1.5017084081019884e-06, + "loss": 0.6523, + "step": 41286 + }, + { + "epoch": 1.06, + "learning_rate": 1.5016844719489048e-06, + "loss": 0.7334, + "step": 41287 + }, + { + "epoch": 1.06, + "learning_rate": 1.5016605354117044e-06, + "loss": 0.7881, + "step": 41288 + }, + { + "epoch": 1.06, + "learning_rate": 1.5016365984904053e-06, + "loss": 0.8613, + "step": 41289 + }, + { + "epoch": 1.06, + "learning_rate": 1.5016126611850263e-06, + "loss": 0.6885, + "step": 41290 + }, + { + "epoch": 1.06, + "learning_rate": 1.5015887234955854e-06, + "loss": 0.7578, + "step": 41291 + }, + { + "epoch": 1.06, + "learning_rate": 1.5015647854221017e-06, + "loss": 0.5039, + "step": 41292 + }, + { + "epoch": 1.06, + "learning_rate": 1.5015408469645925e-06, + "loss": 0.3525, + "step": 41293 + }, + { + "epoch": 1.06, + "learning_rate": 1.5015169081230763e-06, + "loss": 0.8584, + "step": 41294 + }, + { + "epoch": 1.06, + "learning_rate": 1.5014929688975719e-06, + "loss": 0.4824, + "step": 41295 + }, + { + "epoch": 1.06, + "learning_rate": 1.5014690292880974e-06, + "loss": 0.7549, + "step": 41296 + }, + { + "epoch": 1.06, + "learning_rate": 1.501445089294671e-06, + "loss": 0.6924, + "step": 41297 + }, + { + "epoch": 1.06, + "learning_rate": 1.5014211489173115e-06, + "loss": 0.7773, + "step": 41298 + }, + { + "epoch": 1.06, + "learning_rate": 1.5013972081560366e-06, + "loss": 0.7852, + "step": 41299 + }, + { + "epoch": 1.06, + "learning_rate": 1.5013732670108647e-06, + "loss": 0.665, + "step": 41300 + }, + { + "epoch": 1.06, + "learning_rate": 1.5013493254818146e-06, + "loss": 0.5952, + "step": 41301 + }, + { + "epoch": 1.06, + "learning_rate": 1.5013253835689046e-06, + "loss": 0.6846, + "step": 41302 + }, + { + "epoch": 1.06, + "learning_rate": 1.5013014412721525e-06, + "loss": 0.6582, + "step": 41303 + }, + { + "epoch": 1.06, + "learning_rate": 1.5012774985915767e-06, + "loss": 0.7529, + "step": 41304 + }, + { + "epoch": 1.06, + "learning_rate": 1.5012535555271964e-06, + "loss": 0.4633, + "step": 41305 + }, + { + "epoch": 1.06, + "learning_rate": 1.5012296120790286e-06, + "loss": 0.8984, + "step": 41306 + }, + { + "epoch": 1.06, + "learning_rate": 1.501205668247093e-06, + "loss": 0.8154, + "step": 41307 + }, + { + "epoch": 1.06, + "learning_rate": 1.5011817240314068e-06, + "loss": 0.6567, + "step": 41308 + }, + { + "epoch": 1.06, + "learning_rate": 1.501157779431989e-06, + "loss": 0.8584, + "step": 41309 + }, + { + "epoch": 1.06, + "learning_rate": 1.5011338344488578e-06, + "loss": 0.6528, + "step": 41310 + }, + { + "epoch": 1.06, + "learning_rate": 1.5011098890820312e-06, + "loss": 0.6016, + "step": 41311 + }, + { + "epoch": 1.06, + "learning_rate": 1.5010859433315281e-06, + "loss": 0.665, + "step": 41312 + }, + { + "epoch": 1.06, + "learning_rate": 1.5010619971973663e-06, + "loss": 0.5742, + "step": 41313 + }, + { + "epoch": 1.06, + "learning_rate": 1.5010380506795644e-06, + "loss": 0.7334, + "step": 41314 + }, + { + "epoch": 1.06, + "learning_rate": 1.5010141037781407e-06, + "loss": 0.6289, + "step": 41315 + }, + { + "epoch": 1.06, + "learning_rate": 1.5009901564931138e-06, + "loss": 0.6396, + "step": 41316 + }, + { + "epoch": 1.06, + "learning_rate": 1.5009662088245016e-06, + "loss": 0.564, + "step": 41317 + }, + { + "epoch": 1.06, + "learning_rate": 1.5009422607723226e-06, + "loss": 0.5542, + "step": 41318 + }, + { + "epoch": 1.06, + "learning_rate": 1.5009183123365948e-06, + "loss": 0.6333, + "step": 41319 + }, + { + "epoch": 1.06, + "learning_rate": 1.5008943635173375e-06, + "loss": 0.748, + "step": 41320 + }, + { + "epoch": 1.06, + "learning_rate": 1.5008704143145679e-06, + "loss": 0.522, + "step": 41321 + }, + { + "epoch": 1.06, + "learning_rate": 1.5008464647283055e-06, + "loss": 0.5845, + "step": 41322 + }, + { + "epoch": 1.06, + "learning_rate": 1.5008225147585674e-06, + "loss": 0.6436, + "step": 41323 + }, + { + "epoch": 1.06, + "learning_rate": 1.5007985644053726e-06, + "loss": 0.4241, + "step": 41324 + }, + { + "epoch": 1.06, + "learning_rate": 1.5007746136687395e-06, + "loss": 0.625, + "step": 41325 + }, + { + "epoch": 1.06, + "learning_rate": 1.5007506625486864e-06, + "loss": 0.7871, + "step": 41326 + }, + { + "epoch": 1.06, + "learning_rate": 1.5007267110452312e-06, + "loss": 0.4075, + "step": 41327 + }, + { + "epoch": 1.06, + "learning_rate": 1.5007027591583929e-06, + "loss": 0.5542, + "step": 41328 + }, + { + "epoch": 1.06, + "learning_rate": 1.5006788068881893e-06, + "loss": 0.6816, + "step": 41329 + }, + { + "epoch": 1.06, + "learning_rate": 1.5006548542346394e-06, + "loss": 0.7373, + "step": 41330 + }, + { + "epoch": 1.06, + "learning_rate": 1.5006309011977604e-06, + "loss": 0.5786, + "step": 41331 + }, + { + "epoch": 1.06, + "learning_rate": 1.5006069477775718e-06, + "loss": 0.6445, + "step": 41332 + }, + { + "epoch": 1.06, + "learning_rate": 1.5005829939740914e-06, + "loss": 0.5735, + "step": 41333 + }, + { + "epoch": 1.06, + "learning_rate": 1.5005590397873377e-06, + "loss": 0.668, + "step": 41334 + }, + { + "epoch": 1.06, + "learning_rate": 1.500535085217329e-06, + "loss": 0.5762, + "step": 41335 + }, + { + "epoch": 1.06, + "learning_rate": 1.5005111302640833e-06, + "loss": 0.4728, + "step": 41336 + }, + { + "epoch": 1.06, + "learning_rate": 1.5004871749276196e-06, + "loss": 0.7871, + "step": 41337 + }, + { + "epoch": 1.06, + "learning_rate": 1.5004632192079556e-06, + "loss": 0.519, + "step": 41338 + }, + { + "epoch": 1.06, + "learning_rate": 1.50043926310511e-06, + "loss": 0.6426, + "step": 41339 + }, + { + "epoch": 1.06, + "learning_rate": 1.500415306619101e-06, + "loss": 0.6953, + "step": 41340 + }, + { + "epoch": 1.06, + "learning_rate": 1.5003913497499472e-06, + "loss": 0.5585, + "step": 41341 + }, + { + "epoch": 1.06, + "learning_rate": 1.5003673924976665e-06, + "loss": 0.7734, + "step": 41342 + }, + { + "epoch": 1.06, + "learning_rate": 1.500343434862278e-06, + "loss": 0.8047, + "step": 41343 + }, + { + "epoch": 1.06, + "learning_rate": 1.5003194768437987e-06, + "loss": 0.7891, + "step": 41344 + }, + { + "epoch": 1.06, + "learning_rate": 1.5002955184422485e-06, + "loss": 0.5605, + "step": 41345 + }, + { + "epoch": 1.06, + "learning_rate": 1.5002715596576448e-06, + "loss": 0.6387, + "step": 41346 + }, + { + "epoch": 1.06, + "learning_rate": 1.5002476004900064e-06, + "loss": 0.6338, + "step": 41347 + }, + { + "epoch": 1.06, + "learning_rate": 1.500223640939351e-06, + "loss": 0.6821, + "step": 41348 + }, + { + "epoch": 1.06, + "learning_rate": 1.5001996810056974e-06, + "loss": 0.5094, + "step": 41349 + }, + { + "epoch": 1.06, + "learning_rate": 1.500175720689064e-06, + "loss": 0.7051, + "step": 41350 + }, + { + "epoch": 1.06, + "learning_rate": 1.5001517599894692e-06, + "loss": 0.749, + "step": 41351 + }, + { + "epoch": 1.06, + "learning_rate": 1.5001277989069312e-06, + "loss": 0.4705, + "step": 41352 + }, + { + "epoch": 1.06, + "learning_rate": 1.5001038374414684e-06, + "loss": 0.582, + "step": 41353 + }, + { + "epoch": 1.06, + "learning_rate": 1.5000798755930986e-06, + "loss": 0.7393, + "step": 41354 + }, + { + "epoch": 1.06, + "learning_rate": 1.500055913361841e-06, + "loss": 0.6465, + "step": 41355 + }, + { + "epoch": 1.06, + "learning_rate": 1.5000319507477134e-06, + "loss": 0.4669, + "step": 41356 + }, + { + "epoch": 1.06, + "learning_rate": 1.5000079877507345e-06, + "loss": 0.7236, + "step": 41357 + }, + { + "epoch": 1.06, + "learning_rate": 1.4999840243709226e-06, + "loss": 0.6362, + "step": 41358 + }, + { + "epoch": 1.06, + "learning_rate": 1.4999600606082957e-06, + "loss": 0.8145, + "step": 41359 + }, + { + "epoch": 1.06, + "learning_rate": 1.4999360964628723e-06, + "loss": 0.7061, + "step": 41360 + }, + { + "epoch": 1.06, + "learning_rate": 1.499912131934671e-06, + "loss": 0.6924, + "step": 41361 + }, + { + "epoch": 1.06, + "learning_rate": 1.49988816702371e-06, + "loss": 0.5386, + "step": 41362 + }, + { + "epoch": 1.06, + "learning_rate": 1.4998642017300074e-06, + "loss": 0.5039, + "step": 41363 + }, + { + "epoch": 1.06, + "learning_rate": 1.4998402360535821e-06, + "loss": 0.5682, + "step": 41364 + }, + { + "epoch": 1.06, + "learning_rate": 1.4998162699944517e-06, + "loss": 0.6338, + "step": 41365 + }, + { + "epoch": 1.06, + "learning_rate": 1.4997923035526352e-06, + "loss": 0.6885, + "step": 41366 + }, + { + "epoch": 1.06, + "learning_rate": 1.4997683367281505e-06, + "loss": 0.6064, + "step": 41367 + }, + { + "epoch": 1.06, + "learning_rate": 1.4997443695210167e-06, + "loss": 0.6265, + "step": 41368 + }, + { + "epoch": 1.06, + "learning_rate": 1.4997204019312511e-06, + "loss": 0.6276, + "step": 41369 + }, + { + "epoch": 1.06, + "learning_rate": 1.4996964339588727e-06, + "loss": 0.7065, + "step": 41370 + }, + { + "epoch": 1.06, + "learning_rate": 1.4996724656038997e-06, + "loss": 0.7197, + "step": 41371 + }, + { + "epoch": 1.06, + "learning_rate": 1.4996484968663508e-06, + "loss": 0.7026, + "step": 41372 + }, + { + "epoch": 1.06, + "learning_rate": 1.4996245277462434e-06, + "loss": 0.5566, + "step": 41373 + }, + { + "epoch": 1.06, + "learning_rate": 1.4996005582435968e-06, + "loss": 0.708, + "step": 41374 + }, + { + "epoch": 1.06, + "learning_rate": 1.499576588358429e-06, + "loss": 0.4985, + "step": 41375 + }, + { + "epoch": 1.06, + "learning_rate": 1.4995526180907586e-06, + "loss": 0.6699, + "step": 41376 + }, + { + "epoch": 1.06, + "learning_rate": 1.4995286474406035e-06, + "loss": 0.6191, + "step": 41377 + }, + { + "epoch": 1.06, + "learning_rate": 1.4995046764079821e-06, + "loss": 0.6265, + "step": 41378 + }, + { + "epoch": 1.06, + "learning_rate": 1.4994807049929133e-06, + "loss": 0.5952, + "step": 41379 + }, + { + "epoch": 1.06, + "learning_rate": 1.499456733195415e-06, + "loss": 0.6895, + "step": 41380 + }, + { + "epoch": 1.06, + "learning_rate": 1.4994327610155055e-06, + "loss": 0.582, + "step": 41381 + }, + { + "epoch": 1.06, + "learning_rate": 1.4994087884532034e-06, + "loss": 0.7285, + "step": 41382 + }, + { + "epoch": 1.06, + "learning_rate": 1.4993848155085269e-06, + "loss": 0.7217, + "step": 41383 + }, + { + "epoch": 1.06, + "learning_rate": 1.4993608421814944e-06, + "loss": 0.6021, + "step": 41384 + }, + { + "epoch": 1.06, + "learning_rate": 1.4993368684721244e-06, + "loss": 0.7363, + "step": 41385 + }, + { + "epoch": 1.06, + "learning_rate": 1.4993128943804349e-06, + "loss": 0.6895, + "step": 41386 + }, + { + "epoch": 1.06, + "learning_rate": 1.4992889199064448e-06, + "loss": 0.5649, + "step": 41387 + }, + { + "epoch": 1.06, + "learning_rate": 1.499264945050172e-06, + "loss": 0.625, + "step": 41388 + }, + { + "epoch": 1.06, + "learning_rate": 1.4992409698116348e-06, + "loss": 0.7744, + "step": 41389 + }, + { + "epoch": 1.06, + "learning_rate": 1.499216994190852e-06, + "loss": 0.6541, + "step": 41390 + }, + { + "epoch": 1.06, + "learning_rate": 1.4991930181878417e-06, + "loss": 0.4128, + "step": 41391 + }, + { + "epoch": 1.06, + "learning_rate": 1.499169041802622e-06, + "loss": 0.6143, + "step": 41392 + }, + { + "epoch": 1.06, + "learning_rate": 1.4991450650352119e-06, + "loss": 0.562, + "step": 41393 + }, + { + "epoch": 1.06, + "learning_rate": 1.4991210878856288e-06, + "loss": 0.7256, + "step": 41394 + }, + { + "epoch": 1.06, + "learning_rate": 1.4990971103538921e-06, + "loss": 0.7676, + "step": 41395 + }, + { + "epoch": 1.06, + "learning_rate": 1.4990731324400193e-06, + "loss": 0.686, + "step": 41396 + }, + { + "epoch": 1.06, + "learning_rate": 1.4990491541440299e-06, + "loss": 0.5718, + "step": 41397 + }, + { + "epoch": 1.06, + "learning_rate": 1.4990251754659409e-06, + "loss": 0.6562, + "step": 41398 + }, + { + "epoch": 1.06, + "learning_rate": 1.4990011964057714e-06, + "loss": 0.5648, + "step": 41399 + }, + { + "epoch": 1.06, + "learning_rate": 1.4989772169635395e-06, + "loss": 0.7812, + "step": 41400 + }, + { + "epoch": 1.06, + "learning_rate": 1.498953237139264e-06, + "loss": 0.6455, + "step": 41401 + }, + { + "epoch": 1.06, + "learning_rate": 1.4989292569329625e-06, + "loss": 0.6865, + "step": 41402 + }, + { + "epoch": 1.06, + "learning_rate": 1.498905276344654e-06, + "loss": 0.5457, + "step": 41403 + }, + { + "epoch": 1.06, + "learning_rate": 1.4988812953743568e-06, + "loss": 0.6084, + "step": 41404 + }, + { + "epoch": 1.06, + "learning_rate": 1.498857314022089e-06, + "loss": 0.6807, + "step": 41405 + }, + { + "epoch": 1.06, + "learning_rate": 1.4988333322878692e-06, + "loss": 0.5271, + "step": 41406 + }, + { + "epoch": 1.06, + "learning_rate": 1.4988093501717156e-06, + "loss": 0.6641, + "step": 41407 + }, + { + "epoch": 1.06, + "learning_rate": 1.498785367673647e-06, + "loss": 0.8018, + "step": 41408 + }, + { + "epoch": 1.06, + "learning_rate": 1.4987613847936807e-06, + "loss": 0.6895, + "step": 41409 + }, + { + "epoch": 1.06, + "learning_rate": 1.4987374015318359e-06, + "loss": 0.3518, + "step": 41410 + }, + { + "epoch": 1.06, + "learning_rate": 1.4987134178881312e-06, + "loss": 0.7314, + "step": 41411 + }, + { + "epoch": 1.06, + "learning_rate": 1.4986894338625843e-06, + "loss": 0.6821, + "step": 41412 + }, + { + "epoch": 1.06, + "learning_rate": 1.4986654494552138e-06, + "loss": 0.7949, + "step": 41413 + }, + { + "epoch": 1.06, + "learning_rate": 1.498641464666038e-06, + "loss": 0.623, + "step": 41414 + }, + { + "epoch": 1.06, + "learning_rate": 1.4986174794950754e-06, + "loss": 0.7124, + "step": 41415 + }, + { + "epoch": 1.06, + "learning_rate": 1.4985934939423446e-06, + "loss": 0.8145, + "step": 41416 + }, + { + "epoch": 1.06, + "learning_rate": 1.4985695080078635e-06, + "loss": 0.6704, + "step": 41417 + }, + { + "epoch": 1.06, + "learning_rate": 1.4985455216916509e-06, + "loss": 0.8018, + "step": 41418 + }, + { + "epoch": 1.06, + "learning_rate": 1.4985215349937246e-06, + "loss": 0.6021, + "step": 41419 + }, + { + "epoch": 1.06, + "learning_rate": 1.4984975479141034e-06, + "loss": 0.5583, + "step": 41420 + }, + { + "epoch": 1.06, + "learning_rate": 1.4984735604528053e-06, + "loss": 0.501, + "step": 41421 + }, + { + "epoch": 1.06, + "learning_rate": 1.498449572609849e-06, + "loss": 0.6636, + "step": 41422 + }, + { + "epoch": 1.06, + "learning_rate": 1.4984255843852532e-06, + "loss": 0.5757, + "step": 41423 + }, + { + "epoch": 1.06, + "learning_rate": 1.4984015957790358e-06, + "loss": 0.8193, + "step": 41424 + }, + { + "epoch": 1.06, + "learning_rate": 1.4983776067912145e-06, + "loss": 0.604, + "step": 41425 + }, + { + "epoch": 1.06, + "learning_rate": 1.498353617421809e-06, + "loss": 0.5515, + "step": 41426 + }, + { + "epoch": 1.06, + "learning_rate": 1.498329627670837e-06, + "loss": 0.8125, + "step": 41427 + }, + { + "epoch": 1.06, + "learning_rate": 1.4983056375383167e-06, + "loss": 0.7617, + "step": 41428 + }, + { + "epoch": 1.06, + "learning_rate": 1.498281647024267e-06, + "loss": 0.4036, + "step": 41429 + }, + { + "epoch": 1.06, + "learning_rate": 1.4982576561287056e-06, + "loss": 0.7412, + "step": 41430 + }, + { + "epoch": 1.06, + "learning_rate": 1.4982336648516514e-06, + "loss": 0.6196, + "step": 41431 + }, + { + "epoch": 1.06, + "learning_rate": 1.4982096731931226e-06, + "loss": 0.6362, + "step": 41432 + }, + { + "epoch": 1.06, + "learning_rate": 1.4981856811531378e-06, + "loss": 0.6621, + "step": 41433 + }, + { + "epoch": 1.06, + "learning_rate": 1.4981616887317148e-06, + "loss": 0.7285, + "step": 41434 + }, + { + "epoch": 1.06, + "learning_rate": 1.4981376959288724e-06, + "loss": 0.8096, + "step": 41435 + }, + { + "epoch": 1.06, + "learning_rate": 1.4981137027446286e-06, + "loss": 0.8066, + "step": 41436 + }, + { + "epoch": 1.06, + "learning_rate": 1.4980897091790026e-06, + "loss": 0.6064, + "step": 41437 + }, + { + "epoch": 1.06, + "learning_rate": 1.4980657152320118e-06, + "loss": 0.7178, + "step": 41438 + }, + { + "epoch": 1.06, + "learning_rate": 1.4980417209036751e-06, + "loss": 0.7451, + "step": 41439 + }, + { + "epoch": 1.06, + "learning_rate": 1.4980177261940106e-06, + "loss": 0.604, + "step": 41440 + }, + { + "epoch": 1.06, + "learning_rate": 1.497993731103037e-06, + "loss": 0.5498, + "step": 41441 + }, + { + "epoch": 1.06, + "learning_rate": 1.4979697356307726e-06, + "loss": 0.5134, + "step": 41442 + }, + { + "epoch": 1.06, + "learning_rate": 1.4979457397772354e-06, + "loss": 0.4766, + "step": 41443 + }, + { + "epoch": 1.06, + "learning_rate": 1.4979217435424442e-06, + "loss": 0.6294, + "step": 41444 + }, + { + "epoch": 1.06, + "learning_rate": 1.497897746926417e-06, + "loss": 0.655, + "step": 41445 + }, + { + "epoch": 1.06, + "learning_rate": 1.4978737499291727e-06, + "loss": 0.7773, + "step": 41446 + }, + { + "epoch": 1.06, + "learning_rate": 1.497849752550729e-06, + "loss": 0.5762, + "step": 41447 + }, + { + "epoch": 1.06, + "learning_rate": 1.4978257547911054e-06, + "loss": 0.5662, + "step": 41448 + }, + { + "epoch": 1.06, + "learning_rate": 1.4978017566503188e-06, + "loss": 0.6509, + "step": 41449 + }, + { + "epoch": 1.06, + "learning_rate": 1.4977777581283887e-06, + "loss": 0.5474, + "step": 41450 + }, + { + "epoch": 1.06, + "learning_rate": 1.4977537592253327e-06, + "loss": 0.5825, + "step": 41451 + }, + { + "epoch": 1.06, + "learning_rate": 1.4977297599411696e-06, + "loss": 0.6924, + "step": 41452 + }, + { + "epoch": 1.06, + "learning_rate": 1.4977057602759178e-06, + "loss": 0.6797, + "step": 41453 + }, + { + "epoch": 1.06, + "learning_rate": 1.4976817602295957e-06, + "loss": 0.6675, + "step": 41454 + }, + { + "epoch": 1.06, + "learning_rate": 1.4976577598022214e-06, + "loss": 0.6094, + "step": 41455 + }, + { + "epoch": 1.06, + "learning_rate": 1.4976337589938133e-06, + "loss": 0.7627, + "step": 41456 + }, + { + "epoch": 1.06, + "learning_rate": 1.4976097578043901e-06, + "loss": 0.5693, + "step": 41457 + }, + { + "epoch": 1.06, + "learning_rate": 1.49758575623397e-06, + "loss": 0.3447, + "step": 41458 + }, + { + "epoch": 1.06, + "learning_rate": 1.497561754282571e-06, + "loss": 0.6089, + "step": 41459 + }, + { + "epoch": 1.06, + "learning_rate": 1.4975377519502127e-06, + "loss": 0.5181, + "step": 41460 + }, + { + "epoch": 1.06, + "learning_rate": 1.4975137492369116e-06, + "loss": 0.7373, + "step": 41461 + }, + { + "epoch": 1.06, + "learning_rate": 1.4974897461426881e-06, + "loss": 0.6055, + "step": 41462 + }, + { + "epoch": 1.06, + "learning_rate": 1.497465742667559e-06, + "loss": 0.6631, + "step": 41463 + }, + { + "epoch": 1.06, + "learning_rate": 1.4974417388115432e-06, + "loss": 0.6172, + "step": 41464 + }, + { + "epoch": 1.06, + "learning_rate": 1.4974177345746593e-06, + "loss": 0.6699, + "step": 41465 + }, + { + "epoch": 1.06, + "learning_rate": 1.4973937299569252e-06, + "loss": 0.7393, + "step": 41466 + }, + { + "epoch": 1.06, + "learning_rate": 1.49736972495836e-06, + "loss": 0.6675, + "step": 41467 + }, + { + "epoch": 1.06, + "learning_rate": 1.4973457195789815e-06, + "loss": 0.7803, + "step": 41468 + }, + { + "epoch": 1.06, + "learning_rate": 1.4973217138188083e-06, + "loss": 0.6973, + "step": 41469 + }, + { + "epoch": 1.06, + "learning_rate": 1.4972977076778588e-06, + "loss": 0.7549, + "step": 41470 + }, + { + "epoch": 1.06, + "learning_rate": 1.4972737011561512e-06, + "loss": 0.6377, + "step": 41471 + }, + { + "epoch": 1.06, + "learning_rate": 1.497249694253704e-06, + "loss": 0.667, + "step": 41472 + }, + { + "epoch": 1.06, + "learning_rate": 1.4972256869705357e-06, + "loss": 0.6982, + "step": 41473 + }, + { + "epoch": 1.06, + "learning_rate": 1.4972016793066641e-06, + "loss": 0.5723, + "step": 41474 + }, + { + "epoch": 1.06, + "learning_rate": 1.4971776712621087e-06, + "loss": 0.5896, + "step": 41475 + }, + { + "epoch": 1.06, + "learning_rate": 1.4971536628368866e-06, + "loss": 0.5933, + "step": 41476 + }, + { + "epoch": 1.06, + "learning_rate": 1.4971296540310175e-06, + "loss": 0.5605, + "step": 41477 + }, + { + "epoch": 1.06, + "learning_rate": 1.4971056448445185e-06, + "loss": 0.5103, + "step": 41478 + }, + { + "epoch": 1.06, + "learning_rate": 1.497081635277409e-06, + "loss": 0.4292, + "step": 41479 + }, + { + "epoch": 1.06, + "learning_rate": 1.4970576253297065e-06, + "loss": 0.5977, + "step": 41480 + }, + { + "epoch": 1.06, + "learning_rate": 1.49703361500143e-06, + "loss": 0.501, + "step": 41481 + }, + { + "epoch": 1.06, + "learning_rate": 1.497009604292598e-06, + "loss": 0.6548, + "step": 41482 + }, + { + "epoch": 1.06, + "learning_rate": 1.4969855932032282e-06, + "loss": 0.7197, + "step": 41483 + }, + { + "epoch": 1.06, + "learning_rate": 1.4969615817333394e-06, + "loss": 0.7988, + "step": 41484 + }, + { + "epoch": 1.06, + "learning_rate": 1.4969375698829501e-06, + "loss": 0.6826, + "step": 41485 + }, + { + "epoch": 1.06, + "learning_rate": 1.4969135576520783e-06, + "loss": 0.5371, + "step": 41486 + }, + { + "epoch": 1.06, + "learning_rate": 1.4968895450407432e-06, + "loss": 0.6899, + "step": 41487 + }, + { + "epoch": 1.06, + "learning_rate": 1.4968655320489622e-06, + "loss": 0.7256, + "step": 41488 + }, + { + "epoch": 1.06, + "learning_rate": 1.4968415186767542e-06, + "loss": 0.6211, + "step": 41489 + }, + { + "epoch": 1.06, + "learning_rate": 1.4968175049241377e-06, + "loss": 0.6128, + "step": 41490 + }, + { + "epoch": 1.06, + "learning_rate": 1.4967934907911306e-06, + "loss": 0.5215, + "step": 41491 + }, + { + "epoch": 1.06, + "learning_rate": 1.4967694762777517e-06, + "loss": 0.6553, + "step": 41492 + }, + { + "epoch": 1.06, + "learning_rate": 1.4967454613840192e-06, + "loss": 0.6057, + "step": 41493 + }, + { + "epoch": 1.06, + "learning_rate": 1.4967214461099515e-06, + "loss": 0.96, + "step": 41494 + }, + { + "epoch": 1.06, + "learning_rate": 1.496697430455567e-06, + "loss": 0.7305, + "step": 41495 + }, + { + "epoch": 1.06, + "learning_rate": 1.4966734144208842e-06, + "loss": 0.645, + "step": 41496 + }, + { + "epoch": 1.06, + "learning_rate": 1.4966493980059216e-06, + "loss": 0.7461, + "step": 41497 + }, + { + "epoch": 1.06, + "learning_rate": 1.496625381210697e-06, + "loss": 0.4624, + "step": 41498 + }, + { + "epoch": 1.06, + "learning_rate": 1.4966013640352294e-06, + "loss": 0.7798, + "step": 41499 + }, + { + "epoch": 1.06, + "learning_rate": 1.496577346479537e-06, + "loss": 0.7295, + "step": 41500 + }, + { + "epoch": 1.06, + "learning_rate": 1.4965533285436381e-06, + "loss": 0.709, + "step": 41501 + }, + { + "epoch": 1.06, + "learning_rate": 1.4965293102275514e-06, + "loss": 0.6772, + "step": 41502 + }, + { + "epoch": 1.06, + "learning_rate": 1.4965052915312947e-06, + "loss": 0.6729, + "step": 41503 + }, + { + "epoch": 1.06, + "learning_rate": 1.4964812724548868e-06, + "loss": 0.7812, + "step": 41504 + }, + { + "epoch": 1.06, + "learning_rate": 1.496457252998346e-06, + "loss": 0.7383, + "step": 41505 + }, + { + "epoch": 1.06, + "learning_rate": 1.496433233161691e-06, + "loss": 0.7031, + "step": 41506 + }, + { + "epoch": 1.06, + "learning_rate": 1.4964092129449393e-06, + "loss": 0.7173, + "step": 41507 + }, + { + "epoch": 1.06, + "learning_rate": 1.4963851923481103e-06, + "loss": 0.3887, + "step": 41508 + }, + { + "epoch": 1.06, + "learning_rate": 1.4963611713712218e-06, + "loss": 0.6064, + "step": 41509 + }, + { + "epoch": 1.06, + "learning_rate": 1.4963371500142925e-06, + "loss": 0.5459, + "step": 41510 + }, + { + "epoch": 1.06, + "learning_rate": 1.496313128277341e-06, + "loss": 0.6689, + "step": 41511 + }, + { + "epoch": 1.06, + "learning_rate": 1.496289106160385e-06, + "loss": 0.7134, + "step": 41512 + }, + { + "epoch": 1.06, + "learning_rate": 1.496265083663443e-06, + "loss": 0.6172, + "step": 41513 + }, + { + "epoch": 1.06, + "learning_rate": 1.4962410607865339e-06, + "loss": 0.7109, + "step": 41514 + }, + { + "epoch": 1.06, + "learning_rate": 1.4962170375296758e-06, + "loss": 0.6411, + "step": 41515 + }, + { + "epoch": 1.06, + "learning_rate": 1.4961930138928874e-06, + "loss": 0.7661, + "step": 41516 + }, + { + "epoch": 1.06, + "learning_rate": 1.4961689898761866e-06, + "loss": 0.7378, + "step": 41517 + }, + { + "epoch": 1.06, + "learning_rate": 1.4961449654795919e-06, + "loss": 0.6108, + "step": 41518 + }, + { + "epoch": 1.06, + "learning_rate": 1.496120940703122e-06, + "loss": 0.7139, + "step": 41519 + }, + { + "epoch": 1.06, + "learning_rate": 1.4960969155467948e-06, + "loss": 0.8672, + "step": 41520 + }, + { + "epoch": 1.06, + "learning_rate": 1.4960728900106297e-06, + "loss": 0.7334, + "step": 41521 + }, + { + "epoch": 1.06, + "learning_rate": 1.4960488640946438e-06, + "loss": 0.5369, + "step": 41522 + }, + { + "epoch": 1.06, + "learning_rate": 1.4960248377988562e-06, + "loss": 0.8369, + "step": 41523 + }, + { + "epoch": 1.06, + "learning_rate": 1.496000811123285e-06, + "loss": 0.7314, + "step": 41524 + }, + { + "epoch": 1.06, + "learning_rate": 1.4959767840679492e-06, + "loss": 0.5894, + "step": 41525 + }, + { + "epoch": 1.06, + "learning_rate": 1.4959527566328667e-06, + "loss": 0.512, + "step": 41526 + }, + { + "epoch": 1.06, + "learning_rate": 1.495928728818056e-06, + "loss": 0.6709, + "step": 41527 + }, + { + "epoch": 1.06, + "learning_rate": 1.495904700623535e-06, + "loss": 0.7456, + "step": 41528 + }, + { + "epoch": 1.06, + "learning_rate": 1.495880672049323e-06, + "loss": 0.6768, + "step": 41529 + }, + { + "epoch": 1.06, + "learning_rate": 1.495856643095438e-06, + "loss": 0.7627, + "step": 41530 + }, + { + "epoch": 1.06, + "learning_rate": 1.4958326137618985e-06, + "loss": 0.7021, + "step": 41531 + }, + { + "epoch": 1.06, + "learning_rate": 1.4958085840487225e-06, + "loss": 0.6216, + "step": 41532 + }, + { + "epoch": 1.06, + "learning_rate": 1.4957845539559287e-06, + "loss": 0.7168, + "step": 41533 + }, + { + "epoch": 1.06, + "learning_rate": 1.4957605234835353e-06, + "loss": 0.7832, + "step": 41534 + }, + { + "epoch": 1.06, + "learning_rate": 1.495736492631561e-06, + "loss": 0.5513, + "step": 41535 + }, + { + "epoch": 1.06, + "learning_rate": 1.4957124614000241e-06, + "loss": 0.6201, + "step": 41536 + }, + { + "epoch": 1.06, + "learning_rate": 1.495688429788943e-06, + "loss": 0.709, + "step": 41537 + }, + { + "epoch": 1.06, + "learning_rate": 1.495664397798336e-06, + "loss": 0.7275, + "step": 41538 + }, + { + "epoch": 1.06, + "learning_rate": 1.4956403654282214e-06, + "loss": 0.7002, + "step": 41539 + }, + { + "epoch": 1.06, + "learning_rate": 1.4956163326786179e-06, + "loss": 0.58, + "step": 41540 + }, + { + "epoch": 1.06, + "learning_rate": 1.495592299549544e-06, + "loss": 0.793, + "step": 41541 + }, + { + "epoch": 1.06, + "learning_rate": 1.4955682660410176e-06, + "loss": 0.5601, + "step": 41542 + }, + { + "epoch": 1.06, + "learning_rate": 1.4955442321530574e-06, + "loss": 0.521, + "step": 41543 + }, + { + "epoch": 1.06, + "learning_rate": 1.495520197885682e-06, + "loss": 0.7471, + "step": 41544 + }, + { + "epoch": 1.06, + "learning_rate": 1.495496163238909e-06, + "loss": 0.665, + "step": 41545 + }, + { + "epoch": 1.06, + "learning_rate": 1.495472128212758e-06, + "loss": 0.7505, + "step": 41546 + }, + { + "epoch": 1.06, + "learning_rate": 1.4954480928072464e-06, + "loss": 0.7783, + "step": 41547 + }, + { + "epoch": 1.06, + "learning_rate": 1.4954240570223933e-06, + "loss": 0.6064, + "step": 41548 + }, + { + "epoch": 1.06, + "learning_rate": 1.4954000208582163e-06, + "loss": 0.489, + "step": 41549 + }, + { + "epoch": 1.06, + "learning_rate": 1.4953759843147346e-06, + "loss": 0.7744, + "step": 41550 + }, + { + "epoch": 1.06, + "learning_rate": 1.4953519473919664e-06, + "loss": 0.6934, + "step": 41551 + }, + { + "epoch": 1.06, + "learning_rate": 1.4953279100899298e-06, + "loss": 0.707, + "step": 41552 + }, + { + "epoch": 1.07, + "learning_rate": 1.4953038724086434e-06, + "loss": 0.6084, + "step": 41553 + }, + { + "epoch": 1.07, + "learning_rate": 1.4952798343481257e-06, + "loss": 0.5947, + "step": 41554 + }, + { + "epoch": 1.07, + "learning_rate": 1.4952557959083947e-06, + "loss": 0.6348, + "step": 41555 + }, + { + "epoch": 1.07, + "learning_rate": 1.4952317570894695e-06, + "loss": 0.7354, + "step": 41556 + }, + { + "epoch": 1.07, + "learning_rate": 1.4952077178913677e-06, + "loss": 0.5366, + "step": 41557 + }, + { + "epoch": 1.07, + "learning_rate": 1.4951836783141086e-06, + "loss": 0.6416, + "step": 41558 + }, + { + "epoch": 1.07, + "learning_rate": 1.4951596383577099e-06, + "loss": 0.5903, + "step": 41559 + }, + { + "epoch": 1.07, + "learning_rate": 1.4951355980221902e-06, + "loss": 0.7217, + "step": 41560 + }, + { + "epoch": 1.07, + "learning_rate": 1.495111557307568e-06, + "loss": 0.52, + "step": 41561 + }, + { + "epoch": 1.07, + "learning_rate": 1.4950875162138615e-06, + "loss": 0.7007, + "step": 41562 + }, + { + "epoch": 1.07, + "learning_rate": 1.4950634747410896e-06, + "loss": 0.7432, + "step": 41563 + }, + { + "epoch": 1.07, + "learning_rate": 1.49503943288927e-06, + "loss": 0.7285, + "step": 41564 + }, + { + "epoch": 1.07, + "learning_rate": 1.4950153906584216e-06, + "loss": 0.7256, + "step": 41565 + }, + { + "epoch": 1.07, + "learning_rate": 1.4949913480485628e-06, + "loss": 0.73, + "step": 41566 + }, + { + "epoch": 1.07, + "learning_rate": 1.4949673050597116e-06, + "loss": 0.6494, + "step": 41567 + }, + { + "epoch": 1.07, + "learning_rate": 1.494943261691887e-06, + "loss": 0.6782, + "step": 41568 + }, + { + "epoch": 1.07, + "learning_rate": 1.4949192179451069e-06, + "loss": 0.5757, + "step": 41569 + }, + { + "epoch": 1.07, + "learning_rate": 1.4948951738193899e-06, + "loss": 0.748, + "step": 41570 + }, + { + "epoch": 1.07, + "learning_rate": 1.4948711293147548e-06, + "loss": 0.7539, + "step": 41571 + }, + { + "epoch": 1.07, + "learning_rate": 1.4948470844312192e-06, + "loss": 0.6777, + "step": 41572 + }, + { + "epoch": 1.07, + "learning_rate": 1.494823039168802e-06, + "loss": 0.5796, + "step": 41573 + }, + { + "epoch": 1.07, + "learning_rate": 1.4947989935275214e-06, + "loss": 0.603, + "step": 41574 + }, + { + "epoch": 1.07, + "learning_rate": 1.4947749475073964e-06, + "loss": 0.6826, + "step": 41575 + }, + { + "epoch": 1.07, + "learning_rate": 1.4947509011084447e-06, + "loss": 0.6638, + "step": 41576 + }, + { + "epoch": 1.07, + "learning_rate": 1.4947268543306851e-06, + "loss": 0.5757, + "step": 41577 + }, + { + "epoch": 1.07, + "learning_rate": 1.4947028071741358e-06, + "loss": 0.5508, + "step": 41578 + }, + { + "epoch": 1.07, + "learning_rate": 1.4946787596388153e-06, + "loss": 0.6494, + "step": 41579 + }, + { + "epoch": 1.07, + "learning_rate": 1.494654711724742e-06, + "loss": 0.6353, + "step": 41580 + }, + { + "epoch": 1.07, + "learning_rate": 1.4946306634319343e-06, + "loss": 0.6689, + "step": 41581 + }, + { + "epoch": 1.07, + "learning_rate": 1.4946066147604108e-06, + "loss": 0.3774, + "step": 41582 + }, + { + "epoch": 1.07, + "learning_rate": 1.4945825657101895e-06, + "loss": 0.7549, + "step": 41583 + }, + { + "epoch": 1.07, + "learning_rate": 1.4945585162812894e-06, + "loss": 0.585, + "step": 41584 + }, + { + "epoch": 1.07, + "learning_rate": 1.4945344664737283e-06, + "loss": 0.6392, + "step": 41585 + }, + { + "epoch": 1.07, + "learning_rate": 1.4945104162875253e-06, + "loss": 0.6904, + "step": 41586 + }, + { + "epoch": 1.07, + "learning_rate": 1.494486365722698e-06, + "loss": 0.5527, + "step": 41587 + }, + { + "epoch": 1.07, + "learning_rate": 1.4944623147792656e-06, + "loss": 0.7002, + "step": 41588 + }, + { + "epoch": 1.07, + "learning_rate": 1.4944382634572458e-06, + "loss": 0.5947, + "step": 41589 + }, + { + "epoch": 1.07, + "learning_rate": 1.4944142117566573e-06, + "loss": 0.6309, + "step": 41590 + }, + { + "epoch": 1.07, + "learning_rate": 1.494390159677519e-06, + "loss": 0.6426, + "step": 41591 + }, + { + "epoch": 1.07, + "learning_rate": 1.4943661072198487e-06, + "loss": 0.6748, + "step": 41592 + }, + { + "epoch": 1.07, + "learning_rate": 1.494342054383665e-06, + "loss": 0.8389, + "step": 41593 + }, + { + "epoch": 1.07, + "learning_rate": 1.4943180011689863e-06, + "loss": 0.6797, + "step": 41594 + }, + { + "epoch": 1.07, + "learning_rate": 1.4942939475758308e-06, + "loss": 0.5854, + "step": 41595 + }, + { + "epoch": 1.07, + "learning_rate": 1.4942698936042176e-06, + "loss": 0.7588, + "step": 41596 + }, + { + "epoch": 1.07, + "learning_rate": 1.494245839254164e-06, + "loss": 0.6553, + "step": 41597 + }, + { + "epoch": 1.07, + "learning_rate": 1.4942217845256897e-06, + "loss": 0.875, + "step": 41598 + }, + { + "epoch": 1.07, + "learning_rate": 1.4941977294188122e-06, + "loss": 0.6904, + "step": 41599 + }, + { + "epoch": 1.07, + "learning_rate": 1.4941736739335505e-06, + "loss": 0.7324, + "step": 41600 + }, + { + "epoch": 1.07, + "learning_rate": 1.4941496180699226e-06, + "loss": 0.5, + "step": 41601 + }, + { + "epoch": 1.07, + "learning_rate": 1.4941255618279469e-06, + "loss": 0.6338, + "step": 41602 + }, + { + "epoch": 1.07, + "learning_rate": 1.4941015052076422e-06, + "loss": 0.7441, + "step": 41603 + }, + { + "epoch": 1.07, + "learning_rate": 1.4940774482090265e-06, + "loss": 0.6875, + "step": 41604 + }, + { + "epoch": 1.07, + "learning_rate": 1.4940533908321187e-06, + "loss": 0.6538, + "step": 41605 + }, + { + "epoch": 1.07, + "learning_rate": 1.4940293330769366e-06, + "loss": 0.7275, + "step": 41606 + }, + { + "epoch": 1.07, + "learning_rate": 1.4940052749434993e-06, + "loss": 0.7148, + "step": 41607 + }, + { + "epoch": 1.07, + "learning_rate": 1.4939812164318247e-06, + "loss": 0.7646, + "step": 41608 + }, + { + "epoch": 1.07, + "learning_rate": 1.4939571575419314e-06, + "loss": 0.5688, + "step": 41609 + }, + { + "epoch": 1.07, + "learning_rate": 1.4939330982738377e-06, + "loss": 0.6279, + "step": 41610 + }, + { + "epoch": 1.07, + "learning_rate": 1.4939090386275624e-06, + "loss": 0.7559, + "step": 41611 + }, + { + "epoch": 1.07, + "learning_rate": 1.4938849786031234e-06, + "loss": 0.5771, + "step": 41612 + }, + { + "epoch": 1.07, + "learning_rate": 1.4938609182005394e-06, + "loss": 0.5469, + "step": 41613 + }, + { + "epoch": 1.07, + "learning_rate": 1.4938368574198289e-06, + "loss": 0.7598, + "step": 41614 + }, + { + "epoch": 1.07, + "learning_rate": 1.4938127962610103e-06, + "loss": 0.645, + "step": 41615 + }, + { + "epoch": 1.07, + "learning_rate": 1.4937887347241018e-06, + "loss": 0.479, + "step": 41616 + }, + { + "epoch": 1.07, + "learning_rate": 1.4937646728091223e-06, + "loss": 0.7031, + "step": 41617 + }, + { + "epoch": 1.07, + "learning_rate": 1.4937406105160895e-06, + "loss": 0.6528, + "step": 41618 + }, + { + "epoch": 1.07, + "learning_rate": 1.4937165478450223e-06, + "loss": 0.4648, + "step": 41619 + }, + { + "epoch": 1.07, + "learning_rate": 1.493692484795939e-06, + "loss": 0.7773, + "step": 41620 + }, + { + "epoch": 1.07, + "learning_rate": 1.4936684213688584e-06, + "loss": 0.8271, + "step": 41621 + }, + { + "epoch": 1.07, + "learning_rate": 1.4936443575637983e-06, + "loss": 0.6289, + "step": 41622 + }, + { + "epoch": 1.07, + "learning_rate": 1.4936202933807773e-06, + "loss": 0.7412, + "step": 41623 + }, + { + "epoch": 1.07, + "learning_rate": 1.493596228819814e-06, + "loss": 0.4797, + "step": 41624 + }, + { + "epoch": 1.07, + "learning_rate": 1.4935721638809269e-06, + "loss": 0.5742, + "step": 41625 + }, + { + "epoch": 1.07, + "learning_rate": 1.4935480985641345e-06, + "loss": 0.7959, + "step": 41626 + }, + { + "epoch": 1.07, + "learning_rate": 1.4935240328694544e-06, + "loss": 0.6431, + "step": 41627 + }, + { + "epoch": 1.07, + "learning_rate": 1.4934999667969062e-06, + "loss": 0.4561, + "step": 41628 + }, + { + "epoch": 1.07, + "learning_rate": 1.4934759003465074e-06, + "loss": 0.624, + "step": 41629 + }, + { + "epoch": 1.07, + "learning_rate": 1.493451833518277e-06, + "loss": 0.7939, + "step": 41630 + }, + { + "epoch": 1.07, + "learning_rate": 1.4934277663122332e-06, + "loss": 0.7793, + "step": 41631 + }, + { + "epoch": 1.07, + "learning_rate": 1.4934036987283946e-06, + "loss": 0.5767, + "step": 41632 + }, + { + "epoch": 1.07, + "learning_rate": 1.493379630766779e-06, + "loss": 0.6611, + "step": 41633 + }, + { + "epoch": 1.07, + "learning_rate": 1.493355562427406e-06, + "loss": 0.5885, + "step": 41634 + }, + { + "epoch": 1.07, + "learning_rate": 1.4933314937102926e-06, + "loss": 0.707, + "step": 41635 + }, + { + "epoch": 1.07, + "learning_rate": 1.4933074246154586e-06, + "loss": 0.666, + "step": 41636 + }, + { + "epoch": 1.07, + "learning_rate": 1.4932833551429214e-06, + "loss": 0.6382, + "step": 41637 + }, + { + "epoch": 1.07, + "learning_rate": 1.4932592852927e-06, + "loss": 0.8574, + "step": 41638 + }, + { + "epoch": 1.07, + "learning_rate": 1.4932352150648125e-06, + "loss": 0.7119, + "step": 41639 + }, + { + "epoch": 1.07, + "learning_rate": 1.4932111444592775e-06, + "loss": 0.7021, + "step": 41640 + }, + { + "epoch": 1.07, + "learning_rate": 1.4931870734761134e-06, + "loss": 0.584, + "step": 41641 + }, + { + "epoch": 1.07, + "learning_rate": 1.4931630021153388e-06, + "loss": 0.6205, + "step": 41642 + }, + { + "epoch": 1.07, + "learning_rate": 1.4931389303769717e-06, + "loss": 0.667, + "step": 41643 + }, + { + "epoch": 1.07, + "learning_rate": 1.4931148582610308e-06, + "loss": 0.7144, + "step": 41644 + }, + { + "epoch": 1.07, + "learning_rate": 1.4930907857675345e-06, + "loss": 0.7754, + "step": 41645 + }, + { + "epoch": 1.07, + "learning_rate": 1.4930667128965015e-06, + "loss": 0.5442, + "step": 41646 + }, + { + "epoch": 1.07, + "learning_rate": 1.49304263964795e-06, + "loss": 0.7764, + "step": 41647 + }, + { + "epoch": 1.07, + "learning_rate": 1.4930185660218983e-06, + "loss": 0.7461, + "step": 41648 + }, + { + "epoch": 1.07, + "learning_rate": 1.492994492018365e-06, + "loss": 0.5488, + "step": 41649 + }, + { + "epoch": 1.07, + "learning_rate": 1.4929704176373685e-06, + "loss": 0.5464, + "step": 41650 + }, + { + "epoch": 1.07, + "learning_rate": 1.4929463428789272e-06, + "loss": 0.4419, + "step": 41651 + }, + { + "epoch": 1.07, + "learning_rate": 1.4929222677430596e-06, + "loss": 0.6641, + "step": 41652 + }, + { + "epoch": 1.07, + "learning_rate": 1.492898192229784e-06, + "loss": 0.636, + "step": 41653 + }, + { + "epoch": 1.07, + "learning_rate": 1.4928741163391188e-06, + "loss": 0.4785, + "step": 41654 + }, + { + "epoch": 1.07, + "learning_rate": 1.4928500400710828e-06, + "loss": 0.7109, + "step": 41655 + }, + { + "epoch": 1.07, + "learning_rate": 1.4928259634256942e-06, + "loss": 0.5408, + "step": 41656 + }, + { + "epoch": 1.07, + "learning_rate": 1.4928018864029713e-06, + "loss": 0.6299, + "step": 41657 + }, + { + "epoch": 1.07, + "learning_rate": 1.4927778090029324e-06, + "loss": 0.646, + "step": 41658 + }, + { + "epoch": 1.07, + "learning_rate": 1.4927537312255967e-06, + "loss": 0.7236, + "step": 41659 + }, + { + "epoch": 1.07, + "learning_rate": 1.4927296530709816e-06, + "loss": 0.8037, + "step": 41660 + }, + { + "epoch": 1.07, + "learning_rate": 1.4927055745391066e-06, + "loss": 0.4487, + "step": 41661 + }, + { + "epoch": 1.07, + "learning_rate": 1.492681495629989e-06, + "loss": 0.5522, + "step": 41662 + }, + { + "epoch": 1.07, + "learning_rate": 1.4926574163436485e-06, + "loss": 0.5688, + "step": 41663 + }, + { + "epoch": 1.07, + "learning_rate": 1.4926333366801024e-06, + "loss": 0.7656, + "step": 41664 + }, + { + "epoch": 1.07, + "learning_rate": 1.4926092566393697e-06, + "loss": 0.6318, + "step": 41665 + }, + { + "epoch": 1.07, + "learning_rate": 1.492585176221469e-06, + "loss": 0.7471, + "step": 41666 + }, + { + "epoch": 1.07, + "learning_rate": 1.4925610954264181e-06, + "loss": 0.6748, + "step": 41667 + }, + { + "epoch": 1.07, + "learning_rate": 1.492537014254236e-06, + "loss": 0.5645, + "step": 41668 + }, + { + "epoch": 1.07, + "learning_rate": 1.4925129327049409e-06, + "loss": 0.8018, + "step": 41669 + }, + { + "epoch": 1.07, + "learning_rate": 1.4924888507785513e-06, + "loss": 0.8936, + "step": 41670 + }, + { + "epoch": 1.07, + "learning_rate": 1.4924647684750857e-06, + "loss": 0.8926, + "step": 41671 + }, + { + "epoch": 1.07, + "learning_rate": 1.4924406857945624e-06, + "loss": 0.6758, + "step": 41672 + }, + { + "epoch": 1.07, + "learning_rate": 1.4924166027369997e-06, + "loss": 0.6958, + "step": 41673 + }, + { + "epoch": 1.07, + "learning_rate": 1.4923925193024168e-06, + "loss": 0.6289, + "step": 41674 + }, + { + "epoch": 1.07, + "learning_rate": 1.492368435490831e-06, + "loss": 0.6816, + "step": 41675 + }, + { + "epoch": 1.07, + "learning_rate": 1.492344351302262e-06, + "loss": 0.6323, + "step": 41676 + }, + { + "epoch": 1.07, + "learning_rate": 1.492320266736727e-06, + "loss": 0.6172, + "step": 41677 + }, + { + "epoch": 1.07, + "learning_rate": 1.4922961817942451e-06, + "loss": 0.6885, + "step": 41678 + }, + { + "epoch": 1.07, + "learning_rate": 1.4922720964748345e-06, + "loss": 0.8594, + "step": 41679 + }, + { + "epoch": 1.07, + "learning_rate": 1.4922480107785143e-06, + "loss": 0.79, + "step": 41680 + }, + { + "epoch": 1.07, + "learning_rate": 1.4922239247053022e-06, + "loss": 0.7051, + "step": 41681 + }, + { + "epoch": 1.07, + "learning_rate": 1.492199838255217e-06, + "loss": 0.6504, + "step": 41682 + }, + { + "epoch": 1.07, + "learning_rate": 1.4921757514282765e-06, + "loss": 0.6978, + "step": 41683 + }, + { + "epoch": 1.07, + "learning_rate": 1.4921516642245002e-06, + "loss": 0.5483, + "step": 41684 + }, + { + "epoch": 1.07, + "learning_rate": 1.4921275766439057e-06, + "loss": 0.7158, + "step": 41685 + }, + { + "epoch": 1.07, + "learning_rate": 1.492103488686512e-06, + "loss": 0.5518, + "step": 41686 + }, + { + "epoch": 1.07, + "learning_rate": 1.492079400352337e-06, + "loss": 0.4708, + "step": 41687 + }, + { + "epoch": 1.07, + "learning_rate": 1.4920553116413997e-06, + "loss": 0.5195, + "step": 41688 + }, + { + "epoch": 1.07, + "learning_rate": 1.492031222553718e-06, + "loss": 0.6548, + "step": 41689 + }, + { + "epoch": 1.07, + "learning_rate": 1.4920071330893107e-06, + "loss": 0.5996, + "step": 41690 + }, + { + "epoch": 1.07, + "learning_rate": 1.4919830432481964e-06, + "loss": 0.6167, + "step": 41691 + }, + { + "epoch": 1.07, + "learning_rate": 1.491958953030393e-06, + "loss": 0.6445, + "step": 41692 + }, + { + "epoch": 1.07, + "learning_rate": 1.4919348624359195e-06, + "loss": 0.5537, + "step": 41693 + }, + { + "epoch": 1.07, + "learning_rate": 1.4919107714647937e-06, + "loss": 0.7063, + "step": 41694 + }, + { + "epoch": 1.07, + "learning_rate": 1.4918866801170346e-06, + "loss": 0.6523, + "step": 41695 + }, + { + "epoch": 1.07, + "learning_rate": 1.4918625883926608e-06, + "loss": 0.5083, + "step": 41696 + }, + { + "epoch": 1.07, + "learning_rate": 1.4918384962916903e-06, + "loss": 0.3982, + "step": 41697 + }, + { + "epoch": 1.07, + "learning_rate": 1.4918144038141413e-06, + "loss": 0.7842, + "step": 41698 + }, + { + "epoch": 1.07, + "learning_rate": 1.4917903109600331e-06, + "loss": 0.8232, + "step": 41699 + }, + { + "epoch": 1.07, + "learning_rate": 1.4917662177293835e-06, + "loss": 0.665, + "step": 41700 + }, + { + "epoch": 1.07, + "learning_rate": 1.4917421241222114e-06, + "loss": 0.6094, + "step": 41701 + }, + { + "epoch": 1.07, + "learning_rate": 1.4917180301385344e-06, + "loss": 0.7148, + "step": 41702 + }, + { + "epoch": 1.07, + "learning_rate": 1.491693935778372e-06, + "loss": 0.7246, + "step": 41703 + }, + { + "epoch": 1.07, + "learning_rate": 1.4916698410417418e-06, + "loss": 0.6582, + "step": 41704 + }, + { + "epoch": 1.07, + "learning_rate": 1.4916457459286629e-06, + "loss": 0.6943, + "step": 41705 + }, + { + "epoch": 1.07, + "learning_rate": 1.4916216504391531e-06, + "loss": 0.7539, + "step": 41706 + }, + { + "epoch": 1.07, + "learning_rate": 1.4915975545732317e-06, + "loss": 0.5225, + "step": 41707 + }, + { + "epoch": 1.07, + "learning_rate": 1.4915734583309164e-06, + "loss": 0.7275, + "step": 41708 + }, + { + "epoch": 1.07, + "learning_rate": 1.4915493617122258e-06, + "loss": 0.6611, + "step": 41709 + }, + { + "epoch": 1.07, + "learning_rate": 1.4915252647171785e-06, + "loss": 0.665, + "step": 41710 + }, + { + "epoch": 1.07, + "learning_rate": 1.491501167345793e-06, + "loss": 0.7246, + "step": 41711 + }, + { + "epoch": 1.07, + "learning_rate": 1.4914770695980876e-06, + "loss": 0.519, + "step": 41712 + }, + { + "epoch": 1.07, + "learning_rate": 1.491452971474081e-06, + "loss": 0.5977, + "step": 41713 + }, + { + "epoch": 1.07, + "learning_rate": 1.4914288729737912e-06, + "loss": 0.5356, + "step": 41714 + }, + { + "epoch": 1.07, + "learning_rate": 1.491404774097237e-06, + "loss": 0.5596, + "step": 41715 + }, + { + "epoch": 1.07, + "learning_rate": 1.4913806748444368e-06, + "loss": 0.8066, + "step": 41716 + }, + { + "epoch": 1.07, + "learning_rate": 1.4913565752154087e-06, + "loss": 0.5991, + "step": 41717 + }, + { + "epoch": 1.07, + "learning_rate": 1.491332475210172e-06, + "loss": 0.6074, + "step": 41718 + }, + { + "epoch": 1.07, + "learning_rate": 1.4913083748287441e-06, + "loss": 0.4719, + "step": 41719 + }, + { + "epoch": 1.07, + "learning_rate": 1.4912842740711441e-06, + "loss": 0.5559, + "step": 41720 + }, + { + "epoch": 1.07, + "learning_rate": 1.4912601729373906e-06, + "loss": 0.5442, + "step": 41721 + }, + { + "epoch": 1.07, + "learning_rate": 1.4912360714275019e-06, + "loss": 0.5618, + "step": 41722 + }, + { + "epoch": 1.07, + "learning_rate": 1.4912119695414958e-06, + "loss": 0.7275, + "step": 41723 + }, + { + "epoch": 1.07, + "learning_rate": 1.4911878672793916e-06, + "loss": 0.7773, + "step": 41724 + }, + { + "epoch": 1.07, + "learning_rate": 1.4911637646412072e-06, + "loss": 0.9468, + "step": 41725 + }, + { + "epoch": 1.07, + "learning_rate": 1.4911396616269615e-06, + "loss": 0.6167, + "step": 41726 + }, + { + "epoch": 1.07, + "learning_rate": 1.4911155582366728e-06, + "loss": 0.5669, + "step": 41727 + }, + { + "epoch": 1.07, + "learning_rate": 1.4910914544703594e-06, + "loss": 0.6309, + "step": 41728 + }, + { + "epoch": 1.07, + "learning_rate": 1.4910673503280395e-06, + "loss": 0.7197, + "step": 41729 + }, + { + "epoch": 1.07, + "learning_rate": 1.4910432458097324e-06, + "loss": 0.5957, + "step": 41730 + }, + { + "epoch": 1.07, + "learning_rate": 1.491019140915456e-06, + "loss": 0.6953, + "step": 41731 + }, + { + "epoch": 1.07, + "learning_rate": 1.4909950356452287e-06, + "loss": 0.6338, + "step": 41732 + }, + { + "epoch": 1.07, + "learning_rate": 1.4909709299990691e-06, + "loss": 0.791, + "step": 41733 + }, + { + "epoch": 1.07, + "learning_rate": 1.4909468239769959e-06, + "loss": 0.7412, + "step": 41734 + }, + { + "epoch": 1.07, + "learning_rate": 1.4909227175790266e-06, + "loss": 0.626, + "step": 41735 + }, + { + "epoch": 1.07, + "learning_rate": 1.490898610805181e-06, + "loss": 0.6621, + "step": 41736 + }, + { + "epoch": 1.07, + "learning_rate": 1.4908745036554766e-06, + "loss": 0.7148, + "step": 41737 + }, + { + "epoch": 1.07, + "learning_rate": 1.4908503961299324e-06, + "loss": 0.6089, + "step": 41738 + }, + { + "epoch": 1.07, + "learning_rate": 1.4908262882285664e-06, + "loss": 0.6401, + "step": 41739 + }, + { + "epoch": 1.07, + "learning_rate": 1.4908021799513975e-06, + "loss": 0.6309, + "step": 41740 + }, + { + "epoch": 1.07, + "learning_rate": 1.4907780712984438e-06, + "loss": 0.6626, + "step": 41741 + }, + { + "epoch": 1.07, + "learning_rate": 1.490753962269724e-06, + "loss": 0.5771, + "step": 41742 + }, + { + "epoch": 1.07, + "learning_rate": 1.490729852865256e-06, + "loss": 0.7539, + "step": 41743 + }, + { + "epoch": 1.07, + "learning_rate": 1.4907057430850592e-06, + "loss": 0.873, + "step": 41744 + }, + { + "epoch": 1.07, + "learning_rate": 1.4906816329291514e-06, + "loss": 0.5703, + "step": 41745 + }, + { + "epoch": 1.07, + "learning_rate": 1.4906575223975516e-06, + "loss": 0.7861, + "step": 41746 + }, + { + "epoch": 1.07, + "learning_rate": 1.4906334114902774e-06, + "loss": 0.6172, + "step": 41747 + }, + { + "epoch": 1.07, + "learning_rate": 1.4906093002073478e-06, + "loss": 0.4729, + "step": 41748 + }, + { + "epoch": 1.07, + "learning_rate": 1.4905851885487814e-06, + "loss": 0.7178, + "step": 41749 + }, + { + "epoch": 1.07, + "learning_rate": 1.4905610765145965e-06, + "loss": 0.665, + "step": 41750 + }, + { + "epoch": 1.07, + "learning_rate": 1.4905369641048116e-06, + "loss": 0.7197, + "step": 41751 + }, + { + "epoch": 1.07, + "learning_rate": 1.4905128513194448e-06, + "loss": 0.6836, + "step": 41752 + }, + { + "epoch": 1.07, + "learning_rate": 1.4904887381585152e-06, + "loss": 0.7153, + "step": 41753 + }, + { + "epoch": 1.07, + "learning_rate": 1.4904646246220404e-06, + "loss": 0.7803, + "step": 41754 + }, + { + "epoch": 1.07, + "learning_rate": 1.49044051071004e-06, + "loss": 0.751, + "step": 41755 + }, + { + "epoch": 1.07, + "learning_rate": 1.4904163964225315e-06, + "loss": 0.6709, + "step": 41756 + }, + { + "epoch": 1.07, + "learning_rate": 1.490392281759534e-06, + "loss": 0.5449, + "step": 41757 + }, + { + "epoch": 1.07, + "learning_rate": 1.4903681667210653e-06, + "loss": 0.5425, + "step": 41758 + }, + { + "epoch": 1.07, + "learning_rate": 1.4903440513071445e-06, + "loss": 0.5708, + "step": 41759 + }, + { + "epoch": 1.07, + "learning_rate": 1.4903199355177895e-06, + "loss": 0.5353, + "step": 41760 + }, + { + "epoch": 1.07, + "learning_rate": 1.4902958193530195e-06, + "loss": 0.7461, + "step": 41761 + }, + { + "epoch": 1.07, + "learning_rate": 1.4902717028128524e-06, + "loss": 0.8672, + "step": 41762 + }, + { + "epoch": 1.07, + "learning_rate": 1.4902475858973068e-06, + "loss": 0.7686, + "step": 41763 + }, + { + "epoch": 1.07, + "learning_rate": 1.490223468606401e-06, + "loss": 0.7188, + "step": 41764 + }, + { + "epoch": 1.07, + "learning_rate": 1.4901993509401535e-06, + "loss": 0.438, + "step": 41765 + }, + { + "epoch": 1.07, + "learning_rate": 1.4901752328985835e-06, + "loss": 0.5953, + "step": 41766 + }, + { + "epoch": 1.07, + "learning_rate": 1.4901511144817085e-06, + "loss": 0.6382, + "step": 41767 + }, + { + "epoch": 1.07, + "learning_rate": 1.4901269956895472e-06, + "loss": 0.5697, + "step": 41768 + }, + { + "epoch": 1.07, + "learning_rate": 1.4901028765221183e-06, + "loss": 0.5781, + "step": 41769 + }, + { + "epoch": 1.07, + "learning_rate": 1.4900787569794402e-06, + "loss": 0.4413, + "step": 41770 + }, + { + "epoch": 1.07, + "learning_rate": 1.4900546370615315e-06, + "loss": 0.7471, + "step": 41771 + }, + { + "epoch": 1.07, + "learning_rate": 1.4900305167684104e-06, + "loss": 0.7373, + "step": 41772 + }, + { + "epoch": 1.07, + "learning_rate": 1.4900063961000952e-06, + "loss": 0.6924, + "step": 41773 + }, + { + "epoch": 1.07, + "learning_rate": 1.489982275056605e-06, + "loss": 0.5596, + "step": 41774 + }, + { + "epoch": 1.07, + "learning_rate": 1.4899581536379575e-06, + "loss": 0.7139, + "step": 41775 + }, + { + "epoch": 1.07, + "learning_rate": 1.489934031844172e-06, + "loss": 0.5732, + "step": 41776 + }, + { + "epoch": 1.07, + "learning_rate": 1.4899099096752663e-06, + "loss": 0.5972, + "step": 41777 + }, + { + "epoch": 1.07, + "learning_rate": 1.4898857871312591e-06, + "loss": 0.7578, + "step": 41778 + }, + { + "epoch": 1.07, + "learning_rate": 1.4898616642121688e-06, + "loss": 0.748, + "step": 41779 + }, + { + "epoch": 1.07, + "learning_rate": 1.4898375409180142e-06, + "loss": 0.6963, + "step": 41780 + }, + { + "epoch": 1.07, + "learning_rate": 1.4898134172488136e-06, + "loss": 0.688, + "step": 41781 + }, + { + "epoch": 1.07, + "learning_rate": 1.4897892932045849e-06, + "loss": 0.7236, + "step": 41782 + }, + { + "epoch": 1.07, + "learning_rate": 1.4897651687853473e-06, + "loss": 0.627, + "step": 41783 + }, + { + "epoch": 1.07, + "learning_rate": 1.4897410439911192e-06, + "loss": 0.6582, + "step": 41784 + }, + { + "epoch": 1.07, + "learning_rate": 1.4897169188219185e-06, + "loss": 0.5158, + "step": 41785 + }, + { + "epoch": 1.07, + "learning_rate": 1.4896927932777645e-06, + "loss": 0.6021, + "step": 41786 + }, + { + "epoch": 1.07, + "learning_rate": 1.489668667358675e-06, + "loss": 0.4599, + "step": 41787 + }, + { + "epoch": 1.07, + "learning_rate": 1.4896445410646688e-06, + "loss": 0.8564, + "step": 41788 + }, + { + "epoch": 1.07, + "learning_rate": 1.4896204143957645e-06, + "loss": 0.708, + "step": 41789 + }, + { + "epoch": 1.07, + "learning_rate": 1.48959628735198e-06, + "loss": 0.7676, + "step": 41790 + }, + { + "epoch": 1.07, + "learning_rate": 1.4895721599333344e-06, + "loss": 0.5881, + "step": 41791 + }, + { + "epoch": 1.07, + "learning_rate": 1.4895480321398456e-06, + "loss": 0.6777, + "step": 41792 + }, + { + "epoch": 1.07, + "learning_rate": 1.489523903971533e-06, + "loss": 0.7793, + "step": 41793 + }, + { + "epoch": 1.07, + "learning_rate": 1.4894997754284138e-06, + "loss": 0.6895, + "step": 41794 + }, + { + "epoch": 1.07, + "learning_rate": 1.4894756465105074e-06, + "loss": 0.7148, + "step": 41795 + }, + { + "epoch": 1.07, + "learning_rate": 1.489451517217832e-06, + "loss": 0.8672, + "step": 41796 + }, + { + "epoch": 1.07, + "learning_rate": 1.489427387550406e-06, + "loss": 0.6826, + "step": 41797 + }, + { + "epoch": 1.07, + "learning_rate": 1.489403257508248e-06, + "loss": 0.5647, + "step": 41798 + }, + { + "epoch": 1.07, + "learning_rate": 1.4893791270913765e-06, + "loss": 0.5542, + "step": 41799 + }, + { + "epoch": 1.07, + "learning_rate": 1.4893549962998097e-06, + "loss": 0.4858, + "step": 41800 + }, + { + "epoch": 1.07, + "learning_rate": 1.4893308651335662e-06, + "loss": 0.6943, + "step": 41801 + }, + { + "epoch": 1.07, + "learning_rate": 1.489306733592665e-06, + "loss": 0.4407, + "step": 41802 + }, + { + "epoch": 1.07, + "learning_rate": 1.489282601677124e-06, + "loss": 0.2802, + "step": 41803 + }, + { + "epoch": 1.07, + "learning_rate": 1.4892584693869616e-06, + "loss": 0.7139, + "step": 41804 + }, + { + "epoch": 1.07, + "learning_rate": 1.4892343367221967e-06, + "loss": 0.6733, + "step": 41805 + }, + { + "epoch": 1.07, + "learning_rate": 1.4892102036828476e-06, + "loss": 0.751, + "step": 41806 + }, + { + "epoch": 1.07, + "learning_rate": 1.4891860702689325e-06, + "loss": 0.4595, + "step": 41807 + }, + { + "epoch": 1.07, + "learning_rate": 1.4891619364804702e-06, + "loss": 0.7134, + "step": 41808 + }, + { + "epoch": 1.07, + "learning_rate": 1.489137802317479e-06, + "loss": 0.6738, + "step": 41809 + }, + { + "epoch": 1.07, + "learning_rate": 1.4891136677799778e-06, + "loss": 0.7979, + "step": 41810 + }, + { + "epoch": 1.07, + "learning_rate": 1.4890895328679845e-06, + "loss": 0.7471, + "step": 41811 + }, + { + "epoch": 1.07, + "learning_rate": 1.489065397581518e-06, + "loss": 0.6904, + "step": 41812 + }, + { + "epoch": 1.07, + "learning_rate": 1.4890412619205964e-06, + "loss": 0.584, + "step": 41813 + }, + { + "epoch": 1.07, + "learning_rate": 1.4890171258852384e-06, + "loss": 0.835, + "step": 41814 + }, + { + "epoch": 1.07, + "learning_rate": 1.4889929894754626e-06, + "loss": 0.7681, + "step": 41815 + }, + { + "epoch": 1.07, + "learning_rate": 1.4889688526912875e-06, + "loss": 0.7705, + "step": 41816 + }, + { + "epoch": 1.07, + "learning_rate": 1.4889447155327311e-06, + "loss": 0.5972, + "step": 41817 + }, + { + "epoch": 1.07, + "learning_rate": 1.4889205779998123e-06, + "loss": 0.7344, + "step": 41818 + }, + { + "epoch": 1.07, + "learning_rate": 1.4888964400925494e-06, + "loss": 0.5732, + "step": 41819 + }, + { + "epoch": 1.07, + "learning_rate": 1.4888723018109615e-06, + "loss": 0.625, + "step": 41820 + }, + { + "epoch": 1.07, + "learning_rate": 1.488848163155066e-06, + "loss": 0.3882, + "step": 41821 + }, + { + "epoch": 1.07, + "learning_rate": 1.4888240241248822e-06, + "loss": 0.6313, + "step": 41822 + }, + { + "epoch": 1.07, + "learning_rate": 1.4887998847204282e-06, + "loss": 0.7354, + "step": 41823 + }, + { + "epoch": 1.07, + "learning_rate": 1.4887757449417227e-06, + "loss": 0.6567, + "step": 41824 + }, + { + "epoch": 1.07, + "learning_rate": 1.488751604788784e-06, + "loss": 0.6836, + "step": 41825 + }, + { + "epoch": 1.07, + "learning_rate": 1.4887274642616308e-06, + "loss": 0.7373, + "step": 41826 + }, + { + "epoch": 1.07, + "learning_rate": 1.4887033233602814e-06, + "loss": 0.7246, + "step": 41827 + }, + { + "epoch": 1.07, + "learning_rate": 1.4886791820847542e-06, + "loss": 0.8145, + "step": 41828 + }, + { + "epoch": 1.07, + "learning_rate": 1.4886550404350679e-06, + "loss": 0.6016, + "step": 41829 + }, + { + "epoch": 1.07, + "learning_rate": 1.488630898411241e-06, + "loss": 0.71, + "step": 41830 + }, + { + "epoch": 1.07, + "learning_rate": 1.4886067560132918e-06, + "loss": 0.8369, + "step": 41831 + }, + { + "epoch": 1.07, + "learning_rate": 1.4885826132412388e-06, + "loss": 0.7285, + "step": 41832 + }, + { + "epoch": 1.07, + "learning_rate": 1.4885584700951008e-06, + "loss": 0.7383, + "step": 41833 + }, + { + "epoch": 1.07, + "learning_rate": 1.4885343265748957e-06, + "loss": 0.5518, + "step": 41834 + }, + { + "epoch": 1.07, + "learning_rate": 1.4885101826806428e-06, + "loss": 0.6016, + "step": 41835 + }, + { + "epoch": 1.07, + "learning_rate": 1.4884860384123596e-06, + "loss": 0.7139, + "step": 41836 + }, + { + "epoch": 1.07, + "learning_rate": 1.4884618937700656e-06, + "loss": 0.7754, + "step": 41837 + }, + { + "epoch": 1.07, + "learning_rate": 1.4884377487537782e-06, + "loss": 0.707, + "step": 41838 + }, + { + "epoch": 1.07, + "learning_rate": 1.4884136033635168e-06, + "loss": 0.7881, + "step": 41839 + }, + { + "epoch": 1.07, + "learning_rate": 1.4883894575993e-06, + "loss": 0.3092, + "step": 41840 + }, + { + "epoch": 1.07, + "learning_rate": 1.4883653114611451e-06, + "loss": 0.7646, + "step": 41841 + }, + { + "epoch": 1.07, + "learning_rate": 1.4883411649490717e-06, + "loss": 0.6406, + "step": 41842 + }, + { + "epoch": 1.07, + "learning_rate": 1.488317018063098e-06, + "loss": 0.584, + "step": 41843 + }, + { + "epoch": 1.07, + "learning_rate": 1.4882928708032422e-06, + "loss": 0.7314, + "step": 41844 + }, + { + "epoch": 1.07, + "learning_rate": 1.488268723169523e-06, + "loss": 0.749, + "step": 41845 + }, + { + "epoch": 1.07, + "learning_rate": 1.488244575161959e-06, + "loss": 0.5767, + "step": 41846 + }, + { + "epoch": 1.07, + "learning_rate": 1.4882204267805688e-06, + "loss": 0.5923, + "step": 41847 + }, + { + "epoch": 1.07, + "learning_rate": 1.4881962780253702e-06, + "loss": 0.7012, + "step": 41848 + }, + { + "epoch": 1.07, + "learning_rate": 1.4881721288963825e-06, + "loss": 0.6514, + "step": 41849 + }, + { + "epoch": 1.07, + "learning_rate": 1.4881479793936235e-06, + "loss": 0.6177, + "step": 41850 + }, + { + "epoch": 1.07, + "learning_rate": 1.4881238295171123e-06, + "loss": 0.665, + "step": 41851 + }, + { + "epoch": 1.07, + "learning_rate": 1.4880996792668673e-06, + "loss": 0.6943, + "step": 41852 + }, + { + "epoch": 1.07, + "learning_rate": 1.4880755286429062e-06, + "loss": 0.5811, + "step": 41853 + }, + { + "epoch": 1.07, + "learning_rate": 1.4880513776452488e-06, + "loss": 0.8086, + "step": 41854 + }, + { + "epoch": 1.07, + "learning_rate": 1.4880272262739127e-06, + "loss": 0.5933, + "step": 41855 + }, + { + "epoch": 1.07, + "learning_rate": 1.4880030745289165e-06, + "loss": 0.6777, + "step": 41856 + }, + { + "epoch": 1.07, + "learning_rate": 1.4879789224102788e-06, + "loss": 0.5605, + "step": 41857 + }, + { + "epoch": 1.07, + "learning_rate": 1.487954769918018e-06, + "loss": 0.7393, + "step": 41858 + }, + { + "epoch": 1.07, + "learning_rate": 1.4879306170521526e-06, + "loss": 0.5464, + "step": 41859 + }, + { + "epoch": 1.07, + "learning_rate": 1.4879064638127017e-06, + "loss": 0.5249, + "step": 41860 + }, + { + "epoch": 1.07, + "learning_rate": 1.4878823101996827e-06, + "loss": 0.6099, + "step": 41861 + }, + { + "epoch": 1.07, + "learning_rate": 1.487858156213115e-06, + "loss": 0.6611, + "step": 41862 + }, + { + "epoch": 1.07, + "learning_rate": 1.4878340018530161e-06, + "loss": 0.7842, + "step": 41863 + }, + { + "epoch": 1.07, + "learning_rate": 1.4878098471194058e-06, + "loss": 0.6885, + "step": 41864 + }, + { + "epoch": 1.07, + "learning_rate": 1.4877856920123018e-06, + "loss": 0.7197, + "step": 41865 + }, + { + "epoch": 1.07, + "learning_rate": 1.4877615365317228e-06, + "loss": 0.4634, + "step": 41866 + }, + { + "epoch": 1.07, + "learning_rate": 1.487737380677687e-06, + "loss": 0.5483, + "step": 41867 + }, + { + "epoch": 1.07, + "learning_rate": 1.4877132244502131e-06, + "loss": 0.625, + "step": 41868 + }, + { + "epoch": 1.07, + "learning_rate": 1.4876890678493195e-06, + "loss": 0.6201, + "step": 41869 + }, + { + "epoch": 1.07, + "learning_rate": 1.4876649108750252e-06, + "loss": 0.709, + "step": 41870 + }, + { + "epoch": 1.07, + "learning_rate": 1.4876407535273482e-06, + "loss": 0.6133, + "step": 41871 + }, + { + "epoch": 1.07, + "learning_rate": 1.4876165958063067e-06, + "loss": 0.7041, + "step": 41872 + }, + { + "epoch": 1.07, + "learning_rate": 1.48759243771192e-06, + "loss": 0.6362, + "step": 41873 + }, + { + "epoch": 1.07, + "learning_rate": 1.487568279244206e-06, + "loss": 0.751, + "step": 41874 + }, + { + "epoch": 1.07, + "learning_rate": 1.4875441204031838e-06, + "loss": 0.5938, + "step": 41875 + }, + { + "epoch": 1.07, + "learning_rate": 1.4875199611888708e-06, + "loss": 0.6616, + "step": 41876 + }, + { + "epoch": 1.07, + "learning_rate": 1.4874958016012865e-06, + "loss": 0.6821, + "step": 41877 + }, + { + "epoch": 1.07, + "learning_rate": 1.4874716416404493e-06, + "loss": 0.7148, + "step": 41878 + }, + { + "epoch": 1.07, + "learning_rate": 1.4874474813063772e-06, + "loss": 0.8066, + "step": 41879 + }, + { + "epoch": 1.07, + "learning_rate": 1.487423320599089e-06, + "loss": 0.6899, + "step": 41880 + }, + { + "epoch": 1.07, + "learning_rate": 1.4873991595186035e-06, + "loss": 0.5864, + "step": 41881 + }, + { + "epoch": 1.07, + "learning_rate": 1.4873749980649385e-06, + "loss": 0.7178, + "step": 41882 + }, + { + "epoch": 1.07, + "learning_rate": 1.4873508362381131e-06, + "loss": 0.6277, + "step": 41883 + }, + { + "epoch": 1.07, + "learning_rate": 1.4873266740381454e-06, + "loss": 0.6597, + "step": 41884 + }, + { + "epoch": 1.07, + "learning_rate": 1.4873025114650544e-06, + "loss": 0.7637, + "step": 41885 + }, + { + "epoch": 1.07, + "learning_rate": 1.4872783485188578e-06, + "loss": 0.5664, + "step": 41886 + }, + { + "epoch": 1.07, + "learning_rate": 1.4872541851995748e-06, + "loss": 0.5452, + "step": 41887 + }, + { + "epoch": 1.07, + "learning_rate": 1.4872300215072235e-06, + "loss": 0.6904, + "step": 41888 + }, + { + "epoch": 1.07, + "learning_rate": 1.4872058574418229e-06, + "loss": 0.3972, + "step": 41889 + }, + { + "epoch": 1.07, + "learning_rate": 1.4871816930033912e-06, + "loss": 0.6895, + "step": 41890 + }, + { + "epoch": 1.07, + "learning_rate": 1.4871575281919464e-06, + "loss": 0.4902, + "step": 41891 + }, + { + "epoch": 1.07, + "learning_rate": 1.487133363007508e-06, + "loss": 0.5049, + "step": 41892 + }, + { + "epoch": 1.07, + "learning_rate": 1.4871091974500938e-06, + "loss": 0.7354, + "step": 41893 + }, + { + "epoch": 1.07, + "learning_rate": 1.4870850315197224e-06, + "loss": 0.4302, + "step": 41894 + }, + { + "epoch": 1.07, + "learning_rate": 1.4870608652164122e-06, + "loss": 0.7803, + "step": 41895 + }, + { + "epoch": 1.07, + "learning_rate": 1.4870366985401824e-06, + "loss": 0.5481, + "step": 41896 + }, + { + "epoch": 1.07, + "learning_rate": 1.4870125314910506e-06, + "loss": 0.6328, + "step": 41897 + }, + { + "epoch": 1.07, + "learning_rate": 1.486988364069036e-06, + "loss": 0.6509, + "step": 41898 + }, + { + "epoch": 1.07, + "learning_rate": 1.4869641962741565e-06, + "loss": 0.6309, + "step": 41899 + }, + { + "epoch": 1.07, + "learning_rate": 1.486940028106431e-06, + "loss": 0.7998, + "step": 41900 + }, + { + "epoch": 1.07, + "learning_rate": 1.4869158595658779e-06, + "loss": 0.6553, + "step": 41901 + }, + { + "epoch": 1.07, + "learning_rate": 1.4868916906525157e-06, + "loss": 0.4331, + "step": 41902 + }, + { + "epoch": 1.07, + "learning_rate": 1.486867521366363e-06, + "loss": 0.8115, + "step": 41903 + }, + { + "epoch": 1.07, + "learning_rate": 1.4868433517074382e-06, + "loss": 0.5479, + "step": 41904 + }, + { + "epoch": 1.07, + "learning_rate": 1.4868191816757598e-06, + "loss": 0.6699, + "step": 41905 + }, + { + "epoch": 1.07, + "learning_rate": 1.4867950112713465e-06, + "loss": 0.5781, + "step": 41906 + }, + { + "epoch": 1.07, + "learning_rate": 1.4867708404942164e-06, + "loss": 0.708, + "step": 41907 + }, + { + "epoch": 1.07, + "learning_rate": 1.4867466693443884e-06, + "loss": 0.7036, + "step": 41908 + }, + { + "epoch": 1.07, + "learning_rate": 1.4867224978218808e-06, + "loss": 0.6748, + "step": 41909 + }, + { + "epoch": 1.07, + "learning_rate": 1.4866983259267123e-06, + "loss": 0.7891, + "step": 41910 + }, + { + "epoch": 1.07, + "learning_rate": 1.486674153658901e-06, + "loss": 0.5693, + "step": 41911 + }, + { + "epoch": 1.07, + "learning_rate": 1.486649981018466e-06, + "loss": 0.7119, + "step": 41912 + }, + { + "epoch": 1.07, + "learning_rate": 1.4866258080054254e-06, + "loss": 0.7773, + "step": 41913 + }, + { + "epoch": 1.07, + "learning_rate": 1.4866016346197976e-06, + "loss": 0.7324, + "step": 41914 + }, + { + "epoch": 1.07, + "learning_rate": 1.4865774608616013e-06, + "loss": 0.6567, + "step": 41915 + }, + { + "epoch": 1.07, + "learning_rate": 1.4865532867308552e-06, + "loss": 0.7095, + "step": 41916 + }, + { + "epoch": 1.07, + "learning_rate": 1.4865291122275777e-06, + "loss": 0.623, + "step": 41917 + }, + { + "epoch": 1.07, + "learning_rate": 1.4865049373517869e-06, + "loss": 0.6055, + "step": 41918 + }, + { + "epoch": 1.07, + "learning_rate": 1.4864807621035019e-06, + "loss": 0.6709, + "step": 41919 + }, + { + "epoch": 1.07, + "learning_rate": 1.4864565864827407e-06, + "loss": 0.8232, + "step": 41920 + }, + { + "epoch": 1.07, + "learning_rate": 1.4864324104895225e-06, + "loss": 0.6414, + "step": 41921 + }, + { + "epoch": 1.07, + "learning_rate": 1.4864082341238649e-06, + "loss": 0.707, + "step": 41922 + }, + { + "epoch": 1.07, + "learning_rate": 1.486384057385787e-06, + "loss": 0.5718, + "step": 41923 + }, + { + "epoch": 1.07, + "learning_rate": 1.4863598802753073e-06, + "loss": 0.8096, + "step": 41924 + }, + { + "epoch": 1.07, + "learning_rate": 1.4863357027924444e-06, + "loss": 0.6094, + "step": 41925 + }, + { + "epoch": 1.07, + "learning_rate": 1.4863115249372163e-06, + "loss": 0.6895, + "step": 41926 + }, + { + "epoch": 1.07, + "learning_rate": 1.4862873467096418e-06, + "loss": 0.5781, + "step": 41927 + }, + { + "epoch": 1.07, + "learning_rate": 1.4862631681097396e-06, + "loss": 0.6777, + "step": 41928 + }, + { + "epoch": 1.07, + "learning_rate": 1.486238989137528e-06, + "loss": 0.5205, + "step": 41929 + }, + { + "epoch": 1.07, + "learning_rate": 1.4862148097930256e-06, + "loss": 0.7627, + "step": 41930 + }, + { + "epoch": 1.07, + "learning_rate": 1.4861906300762507e-06, + "loss": 0.7305, + "step": 41931 + }, + { + "epoch": 1.07, + "learning_rate": 1.4861664499872222e-06, + "loss": 0.7354, + "step": 41932 + }, + { + "epoch": 1.07, + "learning_rate": 1.4861422695259585e-06, + "loss": 0.5077, + "step": 41933 + }, + { + "epoch": 1.07, + "learning_rate": 1.4861180886924776e-06, + "loss": 0.7119, + "step": 41934 + }, + { + "epoch": 1.07, + "learning_rate": 1.4860939074867988e-06, + "loss": 0.8135, + "step": 41935 + }, + { + "epoch": 1.07, + "learning_rate": 1.48606972590894e-06, + "loss": 0.6768, + "step": 41936 + }, + { + "epoch": 1.07, + "learning_rate": 1.4860455439589203e-06, + "loss": 0.7373, + "step": 41937 + }, + { + "epoch": 1.07, + "learning_rate": 1.4860213616367576e-06, + "loss": 0.6255, + "step": 41938 + }, + { + "epoch": 1.07, + "learning_rate": 1.4859971789424709e-06, + "loss": 0.6875, + "step": 41939 + }, + { + "epoch": 1.07, + "learning_rate": 1.4859729958760784e-06, + "loss": 0.6504, + "step": 41940 + }, + { + "epoch": 1.07, + "learning_rate": 1.4859488124375985e-06, + "loss": 0.6162, + "step": 41941 + }, + { + "epoch": 1.07, + "learning_rate": 1.4859246286270502e-06, + "loss": 0.7881, + "step": 41942 + }, + { + "epoch": 1.08, + "learning_rate": 1.4859004444444515e-06, + "loss": 0.6006, + "step": 41943 + }, + { + "epoch": 1.08, + "learning_rate": 1.4858762598898214e-06, + "loss": 0.583, + "step": 41944 + }, + { + "epoch": 1.08, + "learning_rate": 1.4858520749631781e-06, + "loss": 0.4937, + "step": 41945 + }, + { + "epoch": 1.08, + "learning_rate": 1.4858278896645404e-06, + "loss": 0.7861, + "step": 41946 + }, + { + "epoch": 1.08, + "learning_rate": 1.4858037039939265e-06, + "loss": 0.7056, + "step": 41947 + }, + { + "epoch": 1.08, + "learning_rate": 1.485779517951355e-06, + "loss": 0.6709, + "step": 41948 + }, + { + "epoch": 1.08, + "learning_rate": 1.4857553315368443e-06, + "loss": 0.6367, + "step": 41949 + }, + { + "epoch": 1.08, + "learning_rate": 1.4857311447504135e-06, + "loss": 0.769, + "step": 41950 + }, + { + "epoch": 1.08, + "learning_rate": 1.4857069575920804e-06, + "loss": 0.4055, + "step": 41951 + }, + { + "epoch": 1.08, + "learning_rate": 1.4856827700618639e-06, + "loss": 0.582, + "step": 41952 + }, + { + "epoch": 1.08, + "learning_rate": 1.4856585821597823e-06, + "loss": 0.5582, + "step": 41953 + }, + { + "epoch": 1.08, + "learning_rate": 1.4856343938858545e-06, + "loss": 0.7192, + "step": 41954 + }, + { + "epoch": 1.08, + "learning_rate": 1.4856102052400986e-06, + "loss": 0.6763, + "step": 41955 + }, + { + "epoch": 1.08, + "learning_rate": 1.4855860162225332e-06, + "loss": 0.6709, + "step": 41956 + }, + { + "epoch": 1.08, + "learning_rate": 1.485561826833177e-06, + "loss": 0.7031, + "step": 41957 + }, + { + "epoch": 1.08, + "learning_rate": 1.4855376370720487e-06, + "loss": 0.6807, + "step": 41958 + }, + { + "epoch": 1.08, + "learning_rate": 1.485513446939166e-06, + "loss": 0.5718, + "step": 41959 + }, + { + "epoch": 1.08, + "learning_rate": 1.4854892564345484e-06, + "loss": 0.7236, + "step": 41960 + }, + { + "epoch": 1.08, + "learning_rate": 1.485465065558214e-06, + "loss": 0.8721, + "step": 41961 + }, + { + "epoch": 1.08, + "learning_rate": 1.4854408743101812e-06, + "loss": 0.6895, + "step": 41962 + }, + { + "epoch": 1.08, + "learning_rate": 1.4854166826904688e-06, + "loss": 0.6514, + "step": 41963 + }, + { + "epoch": 1.08, + "learning_rate": 1.485392490699095e-06, + "loss": 0.7373, + "step": 41964 + }, + { + "epoch": 1.08, + "learning_rate": 1.4853682983360787e-06, + "loss": 0.563, + "step": 41965 + }, + { + "epoch": 1.08, + "learning_rate": 1.4853441056014376e-06, + "loss": 0.6455, + "step": 41966 + }, + { + "epoch": 1.08, + "learning_rate": 1.4853199124951916e-06, + "loss": 0.4392, + "step": 41967 + }, + { + "epoch": 1.08, + "learning_rate": 1.4852957190173578e-06, + "loss": 0.5444, + "step": 41968 + }, + { + "epoch": 1.08, + "learning_rate": 1.485271525167956e-06, + "loss": 0.5957, + "step": 41969 + }, + { + "epoch": 1.08, + "learning_rate": 1.4852473309470037e-06, + "loss": 0.625, + "step": 41970 + }, + { + "epoch": 1.08, + "learning_rate": 1.4852231363545202e-06, + "loss": 0.7441, + "step": 41971 + }, + { + "epoch": 1.08, + "learning_rate": 1.4851989413905233e-06, + "loss": 0.6733, + "step": 41972 + }, + { + "epoch": 1.08, + "learning_rate": 1.4851747460550322e-06, + "loss": 0.5386, + "step": 41973 + }, + { + "epoch": 1.08, + "learning_rate": 1.4851505503480646e-06, + "loss": 0.7373, + "step": 41974 + }, + { + "epoch": 1.08, + "learning_rate": 1.4851263542696399e-06, + "loss": 0.8125, + "step": 41975 + }, + { + "epoch": 1.08, + "learning_rate": 1.4851021578197761e-06, + "loss": 0.5791, + "step": 41976 + }, + { + "epoch": 1.08, + "learning_rate": 1.4850779609984923e-06, + "loss": 0.4792, + "step": 41977 + }, + { + "epoch": 1.08, + "learning_rate": 1.485053763805806e-06, + "loss": 0.7393, + "step": 41978 + }, + { + "epoch": 1.08, + "learning_rate": 1.4850295662417367e-06, + "loss": 0.6597, + "step": 41979 + }, + { + "epoch": 1.08, + "learning_rate": 1.4850053683063023e-06, + "loss": 0.5229, + "step": 41980 + }, + { + "epoch": 1.08, + "learning_rate": 1.484981169999522e-06, + "loss": 0.5625, + "step": 41981 + }, + { + "epoch": 1.08, + "learning_rate": 1.4849569713214137e-06, + "loss": 0.6738, + "step": 41982 + }, + { + "epoch": 1.08, + "learning_rate": 1.4849327722719963e-06, + "loss": 0.7969, + "step": 41983 + }, + { + "epoch": 1.08, + "learning_rate": 1.4849085728512877e-06, + "loss": 0.6299, + "step": 41984 + }, + { + "epoch": 1.08, + "learning_rate": 1.4848843730593073e-06, + "loss": 0.5039, + "step": 41985 + }, + { + "epoch": 1.08, + "learning_rate": 1.4848601728960733e-06, + "loss": 0.6055, + "step": 41986 + }, + { + "epoch": 1.08, + "learning_rate": 1.4848359723616037e-06, + "loss": 0.5308, + "step": 41987 + }, + { + "epoch": 1.08, + "learning_rate": 1.4848117714559178e-06, + "loss": 0.916, + "step": 41988 + }, + { + "epoch": 1.08, + "learning_rate": 1.4847875701790337e-06, + "loss": 0.7119, + "step": 41989 + }, + { + "epoch": 1.08, + "learning_rate": 1.4847633685309707e-06, + "loss": 0.4678, + "step": 41990 + }, + { + "epoch": 1.08, + "learning_rate": 1.484739166511746e-06, + "loss": 0.6589, + "step": 41991 + }, + { + "epoch": 1.08, + "learning_rate": 1.484714964121379e-06, + "loss": 0.6626, + "step": 41992 + }, + { + "epoch": 1.08, + "learning_rate": 1.4846907613598876e-06, + "loss": 0.5366, + "step": 41993 + }, + { + "epoch": 1.08, + "learning_rate": 1.4846665582272913e-06, + "loss": 0.8652, + "step": 41994 + }, + { + "epoch": 1.08, + "learning_rate": 1.484642354723608e-06, + "loss": 0.5137, + "step": 41995 + }, + { + "epoch": 1.08, + "learning_rate": 1.4846181508488565e-06, + "loss": 0.8223, + "step": 41996 + }, + { + "epoch": 1.08, + "learning_rate": 1.4845939466030548e-06, + "loss": 0.6245, + "step": 41997 + }, + { + "epoch": 1.08, + "learning_rate": 1.484569741986222e-06, + "loss": 0.561, + "step": 41998 + }, + { + "epoch": 1.08, + "learning_rate": 1.484545536998376e-06, + "loss": 0.4436, + "step": 41999 + }, + { + "epoch": 1.08, + "learning_rate": 1.4845213316395367e-06, + "loss": 0.7236, + "step": 42000 + }, + { + "epoch": 1.08, + "learning_rate": 1.484497125909721e-06, + "loss": 0.6636, + "step": 42001 + }, + { + "epoch": 1.08, + "learning_rate": 1.4844729198089483e-06, + "loss": 0.7354, + "step": 42002 + }, + { + "epoch": 1.08, + "learning_rate": 1.4844487133372368e-06, + "loss": 0.6479, + "step": 42003 + }, + { + "epoch": 1.08, + "learning_rate": 1.4844245064946055e-06, + "loss": 0.7495, + "step": 42004 + }, + { + "epoch": 1.08, + "learning_rate": 1.4844002992810725e-06, + "loss": 0.6724, + "step": 42005 + }, + { + "epoch": 1.08, + "learning_rate": 1.4843760916966561e-06, + "loss": 0.6689, + "step": 42006 + }, + { + "epoch": 1.08, + "learning_rate": 1.4843518837413757e-06, + "loss": 0.8955, + "step": 42007 + }, + { + "epoch": 1.08, + "learning_rate": 1.484327675415249e-06, + "loss": 0.7998, + "step": 42008 + }, + { + "epoch": 1.08, + "learning_rate": 1.4843034667182952e-06, + "loss": 0.6401, + "step": 42009 + }, + { + "epoch": 1.08, + "learning_rate": 1.4842792576505323e-06, + "loss": 0.7734, + "step": 42010 + }, + { + "epoch": 1.08, + "learning_rate": 1.484255048211979e-06, + "loss": 0.7725, + "step": 42011 + }, + { + "epoch": 1.08, + "learning_rate": 1.484230838402654e-06, + "loss": 0.5476, + "step": 42012 + }, + { + "epoch": 1.08, + "learning_rate": 1.4842066282225755e-06, + "loss": 0.751, + "step": 42013 + }, + { + "epoch": 1.08, + "learning_rate": 1.4841824176717625e-06, + "loss": 0.8242, + "step": 42014 + }, + { + "epoch": 1.08, + "learning_rate": 1.4841582067502333e-06, + "loss": 0.752, + "step": 42015 + }, + { + "epoch": 1.08, + "learning_rate": 1.4841339954580063e-06, + "loss": 0.6924, + "step": 42016 + }, + { + "epoch": 1.08, + "learning_rate": 1.4841097837951002e-06, + "loss": 0.6143, + "step": 42017 + }, + { + "epoch": 1.08, + "learning_rate": 1.4840855717615334e-06, + "loss": 0.7041, + "step": 42018 + }, + { + "epoch": 1.08, + "learning_rate": 1.4840613593573245e-06, + "loss": 0.6943, + "step": 42019 + }, + { + "epoch": 1.08, + "learning_rate": 1.4840371465824925e-06, + "loss": 0.5537, + "step": 42020 + }, + { + "epoch": 1.08, + "learning_rate": 1.484012933437055e-06, + "loss": 0.5405, + "step": 42021 + }, + { + "epoch": 1.08, + "learning_rate": 1.4839887199210312e-06, + "loss": 0.6116, + "step": 42022 + }, + { + "epoch": 1.08, + "learning_rate": 1.4839645060344396e-06, + "loss": 0.6309, + "step": 42023 + }, + { + "epoch": 1.08, + "learning_rate": 1.4839402917772985e-06, + "loss": 0.6709, + "step": 42024 + }, + { + "epoch": 1.08, + "learning_rate": 1.4839160771496268e-06, + "loss": 0.6973, + "step": 42025 + }, + { + "epoch": 1.08, + "learning_rate": 1.4838918621514427e-06, + "loss": 0.6455, + "step": 42026 + }, + { + "epoch": 1.08, + "learning_rate": 1.4838676467827648e-06, + "loss": 0.6475, + "step": 42027 + }, + { + "epoch": 1.08, + "learning_rate": 1.4838434310436116e-06, + "loss": 0.708, + "step": 42028 + }, + { + "epoch": 1.08, + "learning_rate": 1.483819214934002e-06, + "loss": 0.4229, + "step": 42029 + }, + { + "epoch": 1.08, + "learning_rate": 1.4837949984539541e-06, + "loss": 0.5586, + "step": 42030 + }, + { + "epoch": 1.08, + "learning_rate": 1.4837707816034865e-06, + "loss": 0.6401, + "step": 42031 + }, + { + "epoch": 1.08, + "learning_rate": 1.483746564382618e-06, + "loss": 0.5293, + "step": 42032 + }, + { + "epoch": 1.08, + "learning_rate": 1.4837223467913668e-06, + "loss": 0.7139, + "step": 42033 + }, + { + "epoch": 1.08, + "learning_rate": 1.4836981288297519e-06, + "loss": 0.6265, + "step": 42034 + }, + { + "epoch": 1.08, + "learning_rate": 1.4836739104977916e-06, + "loss": 0.6833, + "step": 42035 + }, + { + "epoch": 1.08, + "learning_rate": 1.4836496917955044e-06, + "loss": 0.6328, + "step": 42036 + }, + { + "epoch": 1.08, + "learning_rate": 1.4836254727229087e-06, + "loss": 0.6831, + "step": 42037 + }, + { + "epoch": 1.08, + "learning_rate": 1.4836012532800232e-06, + "loss": 0.5681, + "step": 42038 + }, + { + "epoch": 1.08, + "learning_rate": 1.4835770334668664e-06, + "loss": 0.5815, + "step": 42039 + }, + { + "epoch": 1.08, + "learning_rate": 1.4835528132834576e-06, + "loss": 0.6621, + "step": 42040 + }, + { + "epoch": 1.08, + "learning_rate": 1.4835285927298138e-06, + "loss": 0.5713, + "step": 42041 + }, + { + "epoch": 1.08, + "learning_rate": 1.4835043718059548e-06, + "loss": 0.5444, + "step": 42042 + }, + { + "epoch": 1.08, + "learning_rate": 1.4834801505118985e-06, + "loss": 0.6719, + "step": 42043 + }, + { + "epoch": 1.08, + "learning_rate": 1.483455928847664e-06, + "loss": 0.4604, + "step": 42044 + }, + { + "epoch": 1.08, + "learning_rate": 1.4834317068132692e-06, + "loss": 0.6011, + "step": 42045 + }, + { + "epoch": 1.08, + "learning_rate": 1.4834074844087335e-06, + "loss": 0.7402, + "step": 42046 + }, + { + "epoch": 1.08, + "learning_rate": 1.4833832616340743e-06, + "loss": 0.6909, + "step": 42047 + }, + { + "epoch": 1.08, + "learning_rate": 1.4833590384893112e-06, + "loss": 0.6289, + "step": 42048 + }, + { + "epoch": 1.08, + "learning_rate": 1.4833348149744618e-06, + "loss": 0.5894, + "step": 42049 + }, + { + "epoch": 1.08, + "learning_rate": 1.4833105910895456e-06, + "loss": 0.7314, + "step": 42050 + }, + { + "epoch": 1.08, + "learning_rate": 1.4832863668345804e-06, + "loss": 0.5645, + "step": 42051 + }, + { + "epoch": 1.08, + "learning_rate": 1.4832621422095853e-06, + "loss": 0.7578, + "step": 42052 + }, + { + "epoch": 1.08, + "learning_rate": 1.4832379172145785e-06, + "loss": 0.7197, + "step": 42053 + }, + { + "epoch": 1.08, + "learning_rate": 1.4832136918495785e-06, + "loss": 0.554, + "step": 42054 + }, + { + "epoch": 1.08, + "learning_rate": 1.4831894661146046e-06, + "loss": 0.4246, + "step": 42055 + }, + { + "epoch": 1.08, + "learning_rate": 1.483165240009674e-06, + "loss": 0.7476, + "step": 42056 + }, + { + "epoch": 1.08, + "learning_rate": 1.4831410135348063e-06, + "loss": 0.7568, + "step": 42057 + }, + { + "epoch": 1.08, + "learning_rate": 1.4831167866900197e-06, + "loss": 0.7168, + "step": 42058 + }, + { + "epoch": 1.08, + "learning_rate": 1.483092559475333e-06, + "loss": 0.7422, + "step": 42059 + }, + { + "epoch": 1.08, + "learning_rate": 1.4830683318907644e-06, + "loss": 0.7275, + "step": 42060 + }, + { + "epoch": 1.08, + "learning_rate": 1.4830441039363327e-06, + "loss": 0.7871, + "step": 42061 + }, + { + "epoch": 1.08, + "learning_rate": 1.4830198756120559e-06, + "loss": 0.6201, + "step": 42062 + }, + { + "epoch": 1.08, + "learning_rate": 1.4829956469179534e-06, + "loss": 0.5591, + "step": 42063 + }, + { + "epoch": 1.08, + "learning_rate": 1.4829714178540432e-06, + "loss": 0.5518, + "step": 42064 + }, + { + "epoch": 1.08, + "learning_rate": 1.4829471884203442e-06, + "loss": 0.5908, + "step": 42065 + }, + { + "epoch": 1.08, + "learning_rate": 1.4829229586168743e-06, + "loss": 0.7529, + "step": 42066 + }, + { + "epoch": 1.08, + "learning_rate": 1.4828987284436528e-06, + "loss": 0.6689, + "step": 42067 + }, + { + "epoch": 1.08, + "learning_rate": 1.4828744979006977e-06, + "loss": 0.7168, + "step": 42068 + }, + { + "epoch": 1.08, + "learning_rate": 1.4828502669880284e-06, + "loss": 0.7227, + "step": 42069 + }, + { + "epoch": 1.08, + "learning_rate": 1.4828260357056624e-06, + "loss": 0.707, + "step": 42070 + }, + { + "epoch": 1.08, + "learning_rate": 1.4828018040536185e-06, + "loss": 0.6108, + "step": 42071 + }, + { + "epoch": 1.08, + "learning_rate": 1.482777572031916e-06, + "loss": 0.479, + "step": 42072 + }, + { + "epoch": 1.08, + "learning_rate": 1.4827533396405727e-06, + "loss": 0.5481, + "step": 42073 + }, + { + "epoch": 1.08, + "learning_rate": 1.482729106879607e-06, + "loss": 0.6455, + "step": 42074 + }, + { + "epoch": 1.08, + "learning_rate": 1.4827048737490382e-06, + "loss": 0.6067, + "step": 42075 + }, + { + "epoch": 1.08, + "learning_rate": 1.4826806402488844e-06, + "loss": 0.668, + "step": 42076 + }, + { + "epoch": 1.08, + "learning_rate": 1.4826564063791642e-06, + "loss": 0.6167, + "step": 42077 + }, + { + "epoch": 1.08, + "learning_rate": 1.4826321721398962e-06, + "loss": 0.5781, + "step": 42078 + }, + { + "epoch": 1.08, + "learning_rate": 1.4826079375310989e-06, + "loss": 0.7344, + "step": 42079 + }, + { + "epoch": 1.08, + "learning_rate": 1.4825837025527912e-06, + "loss": 0.7158, + "step": 42080 + }, + { + "epoch": 1.08, + "learning_rate": 1.4825594672049911e-06, + "loss": 0.5781, + "step": 42081 + }, + { + "epoch": 1.08, + "learning_rate": 1.4825352314877173e-06, + "loss": 0.6982, + "step": 42082 + }, + { + "epoch": 1.08, + "learning_rate": 1.4825109954009885e-06, + "loss": 0.7451, + "step": 42083 + }, + { + "epoch": 1.08, + "learning_rate": 1.4824867589448234e-06, + "loss": 0.6123, + "step": 42084 + }, + { + "epoch": 1.08, + "learning_rate": 1.4824625221192402e-06, + "loss": 0.5974, + "step": 42085 + }, + { + "epoch": 1.08, + "learning_rate": 1.4824382849242575e-06, + "loss": 0.6653, + "step": 42086 + }, + { + "epoch": 1.08, + "learning_rate": 1.4824140473598944e-06, + "loss": 0.8574, + "step": 42087 + }, + { + "epoch": 1.08, + "learning_rate": 1.4823898094261687e-06, + "loss": 0.7417, + "step": 42088 + }, + { + "epoch": 1.08, + "learning_rate": 1.4823655711230994e-06, + "loss": 0.7031, + "step": 42089 + }, + { + "epoch": 1.08, + "learning_rate": 1.482341332450705e-06, + "loss": 0.603, + "step": 42090 + }, + { + "epoch": 1.08, + "learning_rate": 1.482317093409004e-06, + "loss": 0.6875, + "step": 42091 + }, + { + "epoch": 1.08, + "learning_rate": 1.482292853998015e-06, + "loss": 0.6572, + "step": 42092 + }, + { + "epoch": 1.08, + "learning_rate": 1.4822686142177566e-06, + "loss": 0.6924, + "step": 42093 + }, + { + "epoch": 1.08, + "learning_rate": 1.4822443740682471e-06, + "loss": 0.6221, + "step": 42094 + }, + { + "epoch": 1.08, + "learning_rate": 1.4822201335495055e-06, + "loss": 0.5801, + "step": 42095 + }, + { + "epoch": 1.08, + "learning_rate": 1.4821958926615498e-06, + "loss": 0.6938, + "step": 42096 + }, + { + "epoch": 1.08, + "learning_rate": 1.482171651404399e-06, + "loss": 0.6038, + "step": 42097 + }, + { + "epoch": 1.08, + "learning_rate": 1.4821474097780714e-06, + "loss": 0.5703, + "step": 42098 + }, + { + "epoch": 1.08, + "learning_rate": 1.4821231677825863e-06, + "loss": 0.6289, + "step": 42099 + }, + { + "epoch": 1.08, + "learning_rate": 1.4820989254179612e-06, + "loss": 0.6636, + "step": 42100 + }, + { + "epoch": 1.08, + "learning_rate": 1.4820746826842152e-06, + "loss": 0.6084, + "step": 42101 + }, + { + "epoch": 1.08, + "learning_rate": 1.4820504395813666e-06, + "loss": 0.5149, + "step": 42102 + }, + { + "epoch": 1.08, + "learning_rate": 1.4820261961094342e-06, + "loss": 0.5894, + "step": 42103 + }, + { + "epoch": 1.08, + "learning_rate": 1.4820019522684369e-06, + "loss": 0.7715, + "step": 42104 + }, + { + "epoch": 1.08, + "learning_rate": 1.4819777080583925e-06, + "loss": 0.792, + "step": 42105 + }, + { + "epoch": 1.08, + "learning_rate": 1.48195346347932e-06, + "loss": 0.709, + "step": 42106 + }, + { + "epoch": 1.08, + "learning_rate": 1.481929218531238e-06, + "loss": 0.6616, + "step": 42107 + }, + { + "epoch": 1.08, + "learning_rate": 1.4819049732141645e-06, + "loss": 0.6865, + "step": 42108 + }, + { + "epoch": 1.08, + "learning_rate": 1.4818807275281193e-06, + "loss": 0.7334, + "step": 42109 + }, + { + "epoch": 1.08, + "learning_rate": 1.4818564814731195e-06, + "loss": 0.6108, + "step": 42110 + }, + { + "epoch": 1.08, + "learning_rate": 1.4818322350491848e-06, + "loss": 0.6292, + "step": 42111 + }, + { + "epoch": 1.08, + "learning_rate": 1.481807988256333e-06, + "loss": 0.7207, + "step": 42112 + }, + { + "epoch": 1.08, + "learning_rate": 1.481783741094583e-06, + "loss": 0.6963, + "step": 42113 + }, + { + "epoch": 1.08, + "learning_rate": 1.4817594935639538e-06, + "loss": 0.5156, + "step": 42114 + }, + { + "epoch": 1.08, + "learning_rate": 1.481735245664463e-06, + "loss": 0.7393, + "step": 42115 + }, + { + "epoch": 1.08, + "learning_rate": 1.4817109973961297e-06, + "loss": 0.6328, + "step": 42116 + }, + { + "epoch": 1.08, + "learning_rate": 1.4816867487589728e-06, + "loss": 0.5444, + "step": 42117 + }, + { + "epoch": 1.08, + "learning_rate": 1.4816624997530101e-06, + "loss": 0.791, + "step": 42118 + }, + { + "epoch": 1.08, + "learning_rate": 1.4816382503782607e-06, + "loss": 0.75, + "step": 42119 + }, + { + "epoch": 1.08, + "learning_rate": 1.4816140006347433e-06, + "loss": 0.6306, + "step": 42120 + }, + { + "epoch": 1.08, + "learning_rate": 1.4815897505224758e-06, + "loss": 0.5361, + "step": 42121 + }, + { + "epoch": 1.08, + "learning_rate": 1.4815655000414772e-06, + "loss": 0.8086, + "step": 42122 + }, + { + "epoch": 1.08, + "learning_rate": 1.4815412491917663e-06, + "loss": 0.5166, + "step": 42123 + }, + { + "epoch": 1.08, + "learning_rate": 1.4815169979733614e-06, + "loss": 0.6865, + "step": 42124 + }, + { + "epoch": 1.08, + "learning_rate": 1.481492746386281e-06, + "loss": 0.7354, + "step": 42125 + }, + { + "epoch": 1.08, + "learning_rate": 1.4814684944305437e-06, + "loss": 0.5967, + "step": 42126 + }, + { + "epoch": 1.08, + "learning_rate": 1.4814442421061678e-06, + "loss": 0.6152, + "step": 42127 + }, + { + "epoch": 1.08, + "learning_rate": 1.4814199894131726e-06, + "loss": 0.6069, + "step": 42128 + }, + { + "epoch": 1.08, + "learning_rate": 1.4813957363515764e-06, + "loss": 0.4907, + "step": 42129 + }, + { + "epoch": 1.08, + "learning_rate": 1.4813714829213974e-06, + "loss": 0.5889, + "step": 42130 + }, + { + "epoch": 1.08, + "learning_rate": 1.4813472291226542e-06, + "loss": 0.7461, + "step": 42131 + }, + { + "epoch": 1.08, + "learning_rate": 1.481322974955366e-06, + "loss": 0.6357, + "step": 42132 + }, + { + "epoch": 1.08, + "learning_rate": 1.4812987204195504e-06, + "loss": 0.4663, + "step": 42133 + }, + { + "epoch": 1.08, + "learning_rate": 1.4812744655152268e-06, + "loss": 0.5537, + "step": 42134 + }, + { + "epoch": 1.08, + "learning_rate": 1.4812502102424136e-06, + "loss": 0.5271, + "step": 42135 + }, + { + "epoch": 1.08, + "learning_rate": 1.481225954601129e-06, + "loss": 0.6387, + "step": 42136 + }, + { + "epoch": 1.08, + "learning_rate": 1.4812016985913918e-06, + "loss": 0.6602, + "step": 42137 + }, + { + "epoch": 1.08, + "learning_rate": 1.4811774422132209e-06, + "loss": 0.6885, + "step": 42138 + }, + { + "epoch": 1.08, + "learning_rate": 1.4811531854666343e-06, + "loss": 0.6309, + "step": 42139 + }, + { + "epoch": 1.08, + "learning_rate": 1.4811289283516506e-06, + "loss": 0.605, + "step": 42140 + }, + { + "epoch": 1.08, + "learning_rate": 1.4811046708682891e-06, + "loss": 0.7559, + "step": 42141 + }, + { + "epoch": 1.08, + "learning_rate": 1.4810804130165674e-06, + "loss": 0.7227, + "step": 42142 + }, + { + "epoch": 1.08, + "learning_rate": 1.481056154796505e-06, + "loss": 0.9766, + "step": 42143 + }, + { + "epoch": 1.08, + "learning_rate": 1.4810318962081198e-06, + "loss": 0.9121, + "step": 42144 + }, + { + "epoch": 1.08, + "learning_rate": 1.4810076372514307e-06, + "loss": 0.6533, + "step": 42145 + }, + { + "epoch": 1.08, + "learning_rate": 1.480983377926456e-06, + "loss": 0.6104, + "step": 42146 + }, + { + "epoch": 1.08, + "learning_rate": 1.4809591182332147e-06, + "loss": 0.4158, + "step": 42147 + }, + { + "epoch": 1.08, + "learning_rate": 1.4809348581717246e-06, + "loss": 0.6418, + "step": 42148 + }, + { + "epoch": 1.08, + "learning_rate": 1.4809105977420054e-06, + "loss": 0.489, + "step": 42149 + }, + { + "epoch": 1.08, + "learning_rate": 1.4808863369440746e-06, + "loss": 0.4556, + "step": 42150 + }, + { + "epoch": 1.08, + "learning_rate": 1.4808620757779515e-06, + "loss": 0.7446, + "step": 42151 + }, + { + "epoch": 1.08, + "learning_rate": 1.4808378142436543e-06, + "loss": 0.7021, + "step": 42152 + }, + { + "epoch": 1.08, + "learning_rate": 1.4808135523412017e-06, + "loss": 0.5723, + "step": 42153 + }, + { + "epoch": 1.08, + "learning_rate": 1.4807892900706125e-06, + "loss": 0.6263, + "step": 42154 + }, + { + "epoch": 1.08, + "learning_rate": 1.480765027431905e-06, + "loss": 0.7573, + "step": 42155 + }, + { + "epoch": 1.08, + "learning_rate": 1.4807407644250976e-06, + "loss": 0.8369, + "step": 42156 + }, + { + "epoch": 1.08, + "learning_rate": 1.4807165010502093e-06, + "loss": 0.7119, + "step": 42157 + }, + { + "epoch": 1.08, + "learning_rate": 1.4806922373072582e-06, + "loss": 0.6121, + "step": 42158 + }, + { + "epoch": 1.08, + "learning_rate": 1.4806679731962635e-06, + "loss": 0.6416, + "step": 42159 + }, + { + "epoch": 1.08, + "learning_rate": 1.4806437087172432e-06, + "loss": 0.5149, + "step": 42160 + }, + { + "epoch": 1.08, + "learning_rate": 1.480619443870216e-06, + "loss": 0.6069, + "step": 42161 + }, + { + "epoch": 1.08, + "learning_rate": 1.4805951786552009e-06, + "loss": 0.7236, + "step": 42162 + }, + { + "epoch": 1.08, + "learning_rate": 1.4805709130722162e-06, + "loss": 0.5801, + "step": 42163 + }, + { + "epoch": 1.08, + "learning_rate": 1.4805466471212803e-06, + "loss": 0.4141, + "step": 42164 + }, + { + "epoch": 1.08, + "learning_rate": 1.4805223808024118e-06, + "loss": 0.7627, + "step": 42165 + }, + { + "epoch": 1.08, + "learning_rate": 1.4804981141156297e-06, + "loss": 0.6885, + "step": 42166 + }, + { + "epoch": 1.08, + "learning_rate": 1.4804738470609518e-06, + "loss": 0.7578, + "step": 42167 + }, + { + "epoch": 1.08, + "learning_rate": 1.4804495796383975e-06, + "loss": 0.6084, + "step": 42168 + }, + { + "epoch": 1.08, + "learning_rate": 1.4804253118479853e-06, + "loss": 0.6445, + "step": 42169 + }, + { + "epoch": 1.08, + "learning_rate": 1.4804010436897331e-06, + "loss": 0.6973, + "step": 42170 + }, + { + "epoch": 1.08, + "learning_rate": 1.48037677516366e-06, + "loss": 0.7373, + "step": 42171 + }, + { + "epoch": 1.08, + "learning_rate": 1.4803525062697846e-06, + "loss": 0.7144, + "step": 42172 + }, + { + "epoch": 1.08, + "learning_rate": 1.4803282370081255e-06, + "loss": 0.6367, + "step": 42173 + }, + { + "epoch": 1.08, + "learning_rate": 1.480303967378701e-06, + "loss": 0.6143, + "step": 42174 + }, + { + "epoch": 1.08, + "learning_rate": 1.4802796973815297e-06, + "loss": 0.5984, + "step": 42175 + }, + { + "epoch": 1.08, + "learning_rate": 1.4802554270166305e-06, + "loss": 0.8105, + "step": 42176 + }, + { + "epoch": 1.08, + "learning_rate": 1.4802311562840218e-06, + "loss": 0.7783, + "step": 42177 + }, + { + "epoch": 1.08, + "learning_rate": 1.4802068851837222e-06, + "loss": 0.436, + "step": 42178 + }, + { + "epoch": 1.08, + "learning_rate": 1.4801826137157502e-06, + "loss": 0.5981, + "step": 42179 + }, + { + "epoch": 1.08, + "learning_rate": 1.4801583418801244e-06, + "loss": 0.6348, + "step": 42180 + }, + { + "epoch": 1.08, + "learning_rate": 1.4801340696768634e-06, + "loss": 0.6411, + "step": 42181 + }, + { + "epoch": 1.08, + "learning_rate": 1.4801097971059862e-06, + "loss": 0.6855, + "step": 42182 + }, + { + "epoch": 1.08, + "learning_rate": 1.4800855241675105e-06, + "loss": 0.7129, + "step": 42183 + }, + { + "epoch": 1.08, + "learning_rate": 1.4800612508614557e-06, + "loss": 0.6025, + "step": 42184 + }, + { + "epoch": 1.08, + "learning_rate": 1.4800369771878401e-06, + "loss": 0.5432, + "step": 42185 + }, + { + "epoch": 1.08, + "learning_rate": 1.480012703146682e-06, + "loss": 0.501, + "step": 42186 + }, + { + "epoch": 1.08, + "learning_rate": 1.4799884287380005e-06, + "loss": 0.6289, + "step": 42187 + }, + { + "epoch": 1.08, + "learning_rate": 1.4799641539618134e-06, + "loss": 0.708, + "step": 42188 + }, + { + "epoch": 1.08, + "learning_rate": 1.4799398788181407e-06, + "loss": 0.7578, + "step": 42189 + }, + { + "epoch": 1.08, + "learning_rate": 1.4799156033069994e-06, + "loss": 0.7422, + "step": 42190 + }, + { + "epoch": 1.08, + "learning_rate": 1.4798913274284091e-06, + "loss": 0.6006, + "step": 42191 + }, + { + "epoch": 1.08, + "learning_rate": 1.4798670511823878e-06, + "loss": 0.7617, + "step": 42192 + }, + { + "epoch": 1.08, + "learning_rate": 1.4798427745689547e-06, + "loss": 0.6133, + "step": 42193 + }, + { + "epoch": 1.08, + "learning_rate": 1.479818497588128e-06, + "loss": 0.8047, + "step": 42194 + }, + { + "epoch": 1.08, + "learning_rate": 1.4797942202399263e-06, + "loss": 0.6924, + "step": 42195 + }, + { + "epoch": 1.08, + "learning_rate": 1.479769942524368e-06, + "loss": 0.6318, + "step": 42196 + }, + { + "epoch": 1.08, + "learning_rate": 1.4797456644414723e-06, + "loss": 0.7358, + "step": 42197 + }, + { + "epoch": 1.08, + "learning_rate": 1.4797213859912572e-06, + "loss": 0.5391, + "step": 42198 + }, + { + "epoch": 1.08, + "learning_rate": 1.4796971071737417e-06, + "loss": 0.8091, + "step": 42199 + }, + { + "epoch": 1.08, + "learning_rate": 1.4796728279889438e-06, + "loss": 0.5557, + "step": 42200 + }, + { + "epoch": 1.08, + "learning_rate": 1.4796485484368826e-06, + "loss": 0.6768, + "step": 42201 + }, + { + "epoch": 1.08, + "learning_rate": 1.4796242685175767e-06, + "loss": 0.6514, + "step": 42202 + }, + { + "epoch": 1.08, + "learning_rate": 1.4795999882310443e-06, + "loss": 0.5515, + "step": 42203 + }, + { + "epoch": 1.08, + "learning_rate": 1.4795757075773045e-06, + "loss": 0.6561, + "step": 42204 + }, + { + "epoch": 1.08, + "learning_rate": 1.4795514265563755e-06, + "loss": 0.6416, + "step": 42205 + }, + { + "epoch": 1.08, + "learning_rate": 1.479527145168276e-06, + "loss": 0.7686, + "step": 42206 + }, + { + "epoch": 1.08, + "learning_rate": 1.4795028634130246e-06, + "loss": 0.6458, + "step": 42207 + }, + { + "epoch": 1.08, + "learning_rate": 1.47947858129064e-06, + "loss": 0.6138, + "step": 42208 + }, + { + "epoch": 1.08, + "learning_rate": 1.479454298801141e-06, + "loss": 0.7588, + "step": 42209 + }, + { + "epoch": 1.08, + "learning_rate": 1.4794300159445454e-06, + "loss": 0.6748, + "step": 42210 + }, + { + "epoch": 1.08, + "learning_rate": 1.4794057327208725e-06, + "loss": 0.8027, + "step": 42211 + }, + { + "epoch": 1.08, + "learning_rate": 1.4793814491301406e-06, + "loss": 0.509, + "step": 42212 + }, + { + "epoch": 1.08, + "learning_rate": 1.4793571651723682e-06, + "loss": 0.7773, + "step": 42213 + }, + { + "epoch": 1.08, + "learning_rate": 1.4793328808475746e-06, + "loss": 0.6958, + "step": 42214 + }, + { + "epoch": 1.08, + "learning_rate": 1.4793085961557774e-06, + "loss": 0.6196, + "step": 42215 + }, + { + "epoch": 1.08, + "learning_rate": 1.4792843110969958e-06, + "loss": 0.5088, + "step": 42216 + }, + { + "epoch": 1.08, + "learning_rate": 1.4792600256712479e-06, + "loss": 0.5864, + "step": 42217 + }, + { + "epoch": 1.08, + "learning_rate": 1.479235739878553e-06, + "loss": 0.645, + "step": 42218 + }, + { + "epoch": 1.08, + "learning_rate": 1.4792114537189293e-06, + "loss": 0.6924, + "step": 42219 + }, + { + "epoch": 1.08, + "learning_rate": 1.4791871671923956e-06, + "loss": 0.7002, + "step": 42220 + }, + { + "epoch": 1.08, + "learning_rate": 1.47916288029897e-06, + "loss": 0.6084, + "step": 42221 + }, + { + "epoch": 1.08, + "learning_rate": 1.4791385930386716e-06, + "loss": 0.6772, + "step": 42222 + }, + { + "epoch": 1.08, + "learning_rate": 1.4791143054115185e-06, + "loss": 0.5947, + "step": 42223 + }, + { + "epoch": 1.08, + "learning_rate": 1.47909001741753e-06, + "loss": 0.7065, + "step": 42224 + }, + { + "epoch": 1.08, + "learning_rate": 1.4790657290567241e-06, + "loss": 0.6245, + "step": 42225 + }, + { + "epoch": 1.08, + "learning_rate": 1.4790414403291199e-06, + "loss": 0.5791, + "step": 42226 + }, + { + "epoch": 1.08, + "learning_rate": 1.479017151234735e-06, + "loss": 0.5742, + "step": 42227 + }, + { + "epoch": 1.08, + "learning_rate": 1.4789928617735895e-06, + "loss": 0.6465, + "step": 42228 + }, + { + "epoch": 1.08, + "learning_rate": 1.4789685719457008e-06, + "loss": 0.6157, + "step": 42229 + }, + { + "epoch": 1.08, + "learning_rate": 1.4789442817510878e-06, + "loss": 0.3962, + "step": 42230 + }, + { + "epoch": 1.08, + "learning_rate": 1.4789199911897692e-06, + "loss": 0.5757, + "step": 42231 + }, + { + "epoch": 1.08, + "learning_rate": 1.4788957002617637e-06, + "loss": 0.7656, + "step": 42232 + }, + { + "epoch": 1.08, + "learning_rate": 1.4788714089670897e-06, + "loss": 0.7231, + "step": 42233 + }, + { + "epoch": 1.08, + "learning_rate": 1.478847117305766e-06, + "loss": 0.7266, + "step": 42234 + }, + { + "epoch": 1.08, + "learning_rate": 1.478822825277811e-06, + "loss": 0.707, + "step": 42235 + }, + { + "epoch": 1.08, + "learning_rate": 1.4787985328832433e-06, + "loss": 0.6895, + "step": 42236 + }, + { + "epoch": 1.08, + "learning_rate": 1.4787742401220817e-06, + "loss": 0.5552, + "step": 42237 + }, + { + "epoch": 1.08, + "learning_rate": 1.4787499469943447e-06, + "loss": 0.5625, + "step": 42238 + }, + { + "epoch": 1.08, + "learning_rate": 1.4787256535000509e-06, + "loss": 0.7339, + "step": 42239 + }, + { + "epoch": 1.08, + "learning_rate": 1.4787013596392188e-06, + "loss": 0.6396, + "step": 42240 + }, + { + "epoch": 1.08, + "learning_rate": 1.4786770654118673e-06, + "loss": 0.6509, + "step": 42241 + }, + { + "epoch": 1.08, + "learning_rate": 1.4786527708180144e-06, + "loss": 0.6045, + "step": 42242 + }, + { + "epoch": 1.08, + "learning_rate": 1.4786284758576793e-06, + "loss": 0.6523, + "step": 42243 + }, + { + "epoch": 1.08, + "learning_rate": 1.4786041805308803e-06, + "loss": 0.6611, + "step": 42244 + }, + { + "epoch": 1.08, + "learning_rate": 1.4785798848376364e-06, + "loss": 0.9355, + "step": 42245 + }, + { + "epoch": 1.08, + "learning_rate": 1.4785555887779652e-06, + "loss": 0.486, + "step": 42246 + }, + { + "epoch": 1.08, + "learning_rate": 1.4785312923518866e-06, + "loss": 0.5337, + "step": 42247 + }, + { + "epoch": 1.08, + "learning_rate": 1.4785069955594182e-06, + "loss": 0.6396, + "step": 42248 + }, + { + "epoch": 1.08, + "learning_rate": 1.4784826984005793e-06, + "loss": 0.6846, + "step": 42249 + }, + { + "epoch": 1.08, + "learning_rate": 1.4784584008753882e-06, + "loss": 0.6602, + "step": 42250 + }, + { + "epoch": 1.08, + "learning_rate": 1.4784341029838632e-06, + "loss": 0.625, + "step": 42251 + }, + { + "epoch": 1.08, + "learning_rate": 1.4784098047260236e-06, + "loss": 0.6836, + "step": 42252 + }, + { + "epoch": 1.08, + "learning_rate": 1.4783855061018873e-06, + "loss": 0.5625, + "step": 42253 + }, + { + "epoch": 1.08, + "learning_rate": 1.4783612071114734e-06, + "loss": 0.5382, + "step": 42254 + }, + { + "epoch": 1.08, + "learning_rate": 1.4783369077548002e-06, + "loss": 0.6465, + "step": 42255 + }, + { + "epoch": 1.08, + "learning_rate": 1.4783126080318864e-06, + "loss": 0.792, + "step": 42256 + }, + { + "epoch": 1.08, + "learning_rate": 1.4782883079427508e-06, + "loss": 0.7354, + "step": 42257 + }, + { + "epoch": 1.08, + "learning_rate": 1.4782640074874119e-06, + "loss": 0.6758, + "step": 42258 + }, + { + "epoch": 1.08, + "learning_rate": 1.4782397066658879e-06, + "loss": 0.7383, + "step": 42259 + }, + { + "epoch": 1.08, + "learning_rate": 1.4782154054781981e-06, + "loss": 0.7515, + "step": 42260 + }, + { + "epoch": 1.08, + "learning_rate": 1.4781911039243604e-06, + "loss": 0.6494, + "step": 42261 + }, + { + "epoch": 1.08, + "learning_rate": 1.478166802004394e-06, + "loss": 0.5547, + "step": 42262 + }, + { + "epoch": 1.08, + "learning_rate": 1.478142499718317e-06, + "loss": 0.526, + "step": 42263 + }, + { + "epoch": 1.08, + "learning_rate": 1.4781181970661487e-06, + "loss": 0.6289, + "step": 42264 + }, + { + "epoch": 1.08, + "learning_rate": 1.478093894047907e-06, + "loss": 0.5952, + "step": 42265 + }, + { + "epoch": 1.08, + "learning_rate": 1.4780695906636108e-06, + "loss": 0.7935, + "step": 42266 + }, + { + "epoch": 1.08, + "learning_rate": 1.4780452869132786e-06, + "loss": 0.5791, + "step": 42267 + }, + { + "epoch": 1.08, + "learning_rate": 1.4780209827969294e-06, + "loss": 0.8789, + "step": 42268 + }, + { + "epoch": 1.08, + "learning_rate": 1.4779966783145814e-06, + "loss": 0.6328, + "step": 42269 + }, + { + "epoch": 1.08, + "learning_rate": 1.4779723734662534e-06, + "loss": 0.4565, + "step": 42270 + }, + { + "epoch": 1.08, + "learning_rate": 1.4779480682519637e-06, + "loss": 0.5232, + "step": 42271 + }, + { + "epoch": 1.08, + "learning_rate": 1.4779237626717313e-06, + "loss": 0.6069, + "step": 42272 + }, + { + "epoch": 1.08, + "learning_rate": 1.4778994567255746e-06, + "loss": 0.6611, + "step": 42273 + }, + { + "epoch": 1.08, + "learning_rate": 1.4778751504135123e-06, + "loss": 0.6162, + "step": 42274 + }, + { + "epoch": 1.08, + "learning_rate": 1.4778508437355627e-06, + "loss": 0.7686, + "step": 42275 + }, + { + "epoch": 1.08, + "learning_rate": 1.477826536691745e-06, + "loss": 0.5908, + "step": 42276 + }, + { + "epoch": 1.08, + "learning_rate": 1.4778022292820776e-06, + "loss": 0.6821, + "step": 42277 + }, + { + "epoch": 1.08, + "learning_rate": 1.4777779215065786e-06, + "loss": 0.6011, + "step": 42278 + }, + { + "epoch": 1.08, + "learning_rate": 1.4777536133652675e-06, + "loss": 0.6509, + "step": 42279 + }, + { + "epoch": 1.08, + "learning_rate": 1.477729304858162e-06, + "loss": 0.627, + "step": 42280 + }, + { + "epoch": 1.08, + "learning_rate": 1.4777049959852815e-06, + "loss": 0.3833, + "step": 42281 + }, + { + "epoch": 1.08, + "learning_rate": 1.4776806867466437e-06, + "loss": 0.748, + "step": 42282 + }, + { + "epoch": 1.08, + "learning_rate": 1.4776563771422682e-06, + "loss": 0.4172, + "step": 42283 + }, + { + "epoch": 1.08, + "learning_rate": 1.4776320671721732e-06, + "loss": 0.6353, + "step": 42284 + }, + { + "epoch": 1.08, + "learning_rate": 1.477607756836377e-06, + "loss": 0.665, + "step": 42285 + }, + { + "epoch": 1.08, + "learning_rate": 1.4775834461348988e-06, + "loss": 0.6631, + "step": 42286 + }, + { + "epoch": 1.08, + "learning_rate": 1.4775591350677569e-06, + "loss": 0.7471, + "step": 42287 + }, + { + "epoch": 1.08, + "learning_rate": 1.4775348236349696e-06, + "loss": 0.7344, + "step": 42288 + }, + { + "epoch": 1.08, + "learning_rate": 1.4775105118365564e-06, + "loss": 0.564, + "step": 42289 + }, + { + "epoch": 1.08, + "learning_rate": 1.4774861996725347e-06, + "loss": 0.7979, + "step": 42290 + }, + { + "epoch": 1.08, + "learning_rate": 1.4774618871429243e-06, + "loss": 0.4644, + "step": 42291 + }, + { + "epoch": 1.08, + "learning_rate": 1.4774375742477427e-06, + "loss": 0.5474, + "step": 42292 + }, + { + "epoch": 1.08, + "learning_rate": 1.4774132609870097e-06, + "loss": 0.7402, + "step": 42293 + }, + { + "epoch": 1.08, + "learning_rate": 1.4773889473607431e-06, + "loss": 0.6724, + "step": 42294 + }, + { + "epoch": 1.08, + "learning_rate": 1.4773646333689616e-06, + "loss": 0.5525, + "step": 42295 + }, + { + "epoch": 1.08, + "learning_rate": 1.4773403190116842e-06, + "loss": 0.4722, + "step": 42296 + }, + { + "epoch": 1.08, + "learning_rate": 1.477316004288929e-06, + "loss": 0.6006, + "step": 42297 + }, + { + "epoch": 1.08, + "learning_rate": 1.477291689200715e-06, + "loss": 0.6958, + "step": 42298 + }, + { + "epoch": 1.08, + "learning_rate": 1.477267373747061e-06, + "loss": 0.6489, + "step": 42299 + }, + { + "epoch": 1.08, + "learning_rate": 1.4772430579279852e-06, + "loss": 0.6504, + "step": 42300 + }, + { + "epoch": 1.08, + "learning_rate": 1.4772187417435057e-06, + "loss": 0.5977, + "step": 42301 + }, + { + "epoch": 1.08, + "learning_rate": 1.4771944251936423e-06, + "loss": 0.6855, + "step": 42302 + }, + { + "epoch": 1.08, + "learning_rate": 1.477170108278413e-06, + "loss": 0.5869, + "step": 42303 + }, + { + "epoch": 1.08, + "learning_rate": 1.4771457909978367e-06, + "loss": 0.7305, + "step": 42304 + }, + { + "epoch": 1.08, + "learning_rate": 1.4771214733519315e-06, + "loss": 0.5654, + "step": 42305 + }, + { + "epoch": 1.08, + "learning_rate": 1.4770971553407166e-06, + "loss": 0.709, + "step": 42306 + }, + { + "epoch": 1.08, + "learning_rate": 1.47707283696421e-06, + "loss": 0.7949, + "step": 42307 + }, + { + "epoch": 1.08, + "learning_rate": 1.4770485182224309e-06, + "loss": 0.6401, + "step": 42308 + }, + { + "epoch": 1.08, + "learning_rate": 1.4770241991153975e-06, + "loss": 0.6533, + "step": 42309 + }, + { + "epoch": 1.08, + "learning_rate": 1.476999879643129e-06, + "loss": 0.48, + "step": 42310 + }, + { + "epoch": 1.08, + "learning_rate": 1.476975559805643e-06, + "loss": 0.3845, + "step": 42311 + }, + { + "epoch": 1.08, + "learning_rate": 1.4769512396029594e-06, + "loss": 0.5918, + "step": 42312 + }, + { + "epoch": 1.08, + "learning_rate": 1.4769269190350957e-06, + "loss": 0.6382, + "step": 42313 + }, + { + "epoch": 1.08, + "learning_rate": 1.4769025981020712e-06, + "loss": 0.5212, + "step": 42314 + }, + { + "epoch": 1.08, + "learning_rate": 1.4768782768039043e-06, + "loss": 0.6714, + "step": 42315 + }, + { + "epoch": 1.08, + "learning_rate": 1.4768539551406136e-06, + "loss": 0.542, + "step": 42316 + }, + { + "epoch": 1.08, + "learning_rate": 1.4768296331122177e-06, + "loss": 0.6621, + "step": 42317 + }, + { + "epoch": 1.08, + "learning_rate": 1.4768053107187352e-06, + "loss": 0.7266, + "step": 42318 + }, + { + "epoch": 1.08, + "learning_rate": 1.476780987960185e-06, + "loss": 0.5415, + "step": 42319 + }, + { + "epoch": 1.08, + "learning_rate": 1.4767566648365856e-06, + "loss": 0.6289, + "step": 42320 + }, + { + "epoch": 1.08, + "learning_rate": 1.4767323413479553e-06, + "loss": 0.7852, + "step": 42321 + }, + { + "epoch": 1.08, + "learning_rate": 1.476708017494313e-06, + "loss": 0.5659, + "step": 42322 + }, + { + "epoch": 1.08, + "learning_rate": 1.4766836932756773e-06, + "loss": 0.4863, + "step": 42323 + }, + { + "epoch": 1.08, + "learning_rate": 1.4766593686920668e-06, + "loss": 0.6152, + "step": 42324 + }, + { + "epoch": 1.08, + "learning_rate": 1.4766350437435003e-06, + "loss": 0.5269, + "step": 42325 + }, + { + "epoch": 1.08, + "learning_rate": 1.4766107184299962e-06, + "loss": 0.6895, + "step": 42326 + }, + { + "epoch": 1.08, + "learning_rate": 1.4765863927515731e-06, + "loss": 0.6621, + "step": 42327 + }, + { + "epoch": 1.08, + "learning_rate": 1.4765620667082494e-06, + "loss": 0.7109, + "step": 42328 + }, + { + "epoch": 1.08, + "learning_rate": 1.4765377403000448e-06, + "loss": 0.667, + "step": 42329 + }, + { + "epoch": 1.08, + "learning_rate": 1.4765134135269767e-06, + "loss": 0.7686, + "step": 42330 + }, + { + "epoch": 1.08, + "learning_rate": 1.4764890863890642e-06, + "loss": 0.5378, + "step": 42331 + }, + { + "epoch": 1.08, + "learning_rate": 1.476464758886326e-06, + "loss": 0.5464, + "step": 42332 + }, + { + "epoch": 1.09, + "learning_rate": 1.4764404310187806e-06, + "loss": 0.5884, + "step": 42333 + }, + { + "epoch": 1.09, + "learning_rate": 1.4764161027864467e-06, + "loss": 0.6719, + "step": 42334 + }, + { + "epoch": 1.09, + "learning_rate": 1.476391774189343e-06, + "loss": 0.7222, + "step": 42335 + }, + { + "epoch": 1.09, + "learning_rate": 1.4763674452274878e-06, + "loss": 0.5112, + "step": 42336 + }, + { + "epoch": 1.09, + "learning_rate": 1.4763431159009002e-06, + "loss": 0.6421, + "step": 42337 + }, + { + "epoch": 1.09, + "learning_rate": 1.476318786209598e-06, + "loss": 0.7637, + "step": 42338 + }, + { + "epoch": 1.09, + "learning_rate": 1.4762944561536011e-06, + "loss": 0.6309, + "step": 42339 + }, + { + "epoch": 1.09, + "learning_rate": 1.4762701257329271e-06, + "loss": 0.6816, + "step": 42340 + }, + { + "epoch": 1.09, + "learning_rate": 1.4762457949475949e-06, + "loss": 0.5789, + "step": 42341 + }, + { + "epoch": 1.09, + "learning_rate": 1.4762214637976236e-06, + "loss": 0.5991, + "step": 42342 + }, + { + "epoch": 1.09, + "learning_rate": 1.476197132283031e-06, + "loss": 0.7051, + "step": 42343 + }, + { + "epoch": 1.09, + "learning_rate": 1.4761728004038365e-06, + "loss": 0.4785, + "step": 42344 + }, + { + "epoch": 1.09, + "learning_rate": 1.476148468160058e-06, + "loss": 0.7314, + "step": 42345 + }, + { + "epoch": 1.09, + "learning_rate": 1.4761241355517146e-06, + "loss": 0.7969, + "step": 42346 + }, + { + "epoch": 1.09, + "learning_rate": 1.476099802578825e-06, + "loss": 0.4631, + "step": 42347 + }, + { + "epoch": 1.09, + "learning_rate": 1.4760754692414078e-06, + "loss": 0.5002, + "step": 42348 + }, + { + "epoch": 1.09, + "learning_rate": 1.476051135539481e-06, + "loss": 0.6191, + "step": 42349 + }, + { + "epoch": 1.09, + "learning_rate": 1.4760268014730644e-06, + "loss": 0.5791, + "step": 42350 + }, + { + "epoch": 1.09, + "learning_rate": 1.4760024670421753e-06, + "loss": 0.7725, + "step": 42351 + }, + { + "epoch": 1.09, + "learning_rate": 1.4759781322468335e-06, + "loss": 0.7402, + "step": 42352 + }, + { + "epoch": 1.09, + "learning_rate": 1.4759537970870567e-06, + "loss": 0.6763, + "step": 42353 + }, + { + "epoch": 1.09, + "learning_rate": 1.4759294615628646e-06, + "loss": 0.7036, + "step": 42354 + }, + { + "epoch": 1.09, + "learning_rate": 1.4759051256742744e-06, + "loss": 0.6787, + "step": 42355 + }, + { + "epoch": 1.09, + "learning_rate": 1.4758807894213061e-06, + "loss": 0.7197, + "step": 42356 + }, + { + "epoch": 1.09, + "learning_rate": 1.4758564528039776e-06, + "loss": 0.5933, + "step": 42357 + }, + { + "epoch": 1.09, + "learning_rate": 1.4758321158223077e-06, + "loss": 0.5381, + "step": 42358 + }, + { + "epoch": 1.09, + "learning_rate": 1.475807778476315e-06, + "loss": 0.5295, + "step": 42359 + }, + { + "epoch": 1.09, + "learning_rate": 1.4757834407660183e-06, + "loss": 0.4236, + "step": 42360 + }, + { + "epoch": 1.09, + "learning_rate": 1.4757591026914357e-06, + "loss": 0.8574, + "step": 42361 + }, + { + "epoch": 1.09, + "learning_rate": 1.4757347642525867e-06, + "loss": 0.708, + "step": 42362 + }, + { + "epoch": 1.09, + "learning_rate": 1.4757104254494892e-06, + "loss": 0.5554, + "step": 42363 + }, + { + "epoch": 1.09, + "learning_rate": 1.4756860862821624e-06, + "loss": 0.6968, + "step": 42364 + }, + { + "epoch": 1.09, + "learning_rate": 1.4756617467506243e-06, + "loss": 0.7163, + "step": 42365 + }, + { + "epoch": 1.09, + "learning_rate": 1.475637406854894e-06, + "loss": 0.5918, + "step": 42366 + }, + { + "epoch": 1.09, + "learning_rate": 1.47561306659499e-06, + "loss": 0.6621, + "step": 42367 + }, + { + "epoch": 1.09, + "learning_rate": 1.4755887259709305e-06, + "loss": 0.5522, + "step": 42368 + }, + { + "epoch": 1.09, + "learning_rate": 1.4755643849827355e-06, + "loss": 0.6299, + "step": 42369 + }, + { + "epoch": 1.09, + "learning_rate": 1.475540043630422e-06, + "loss": 0.6787, + "step": 42370 + }, + { + "epoch": 1.09, + "learning_rate": 1.4755157019140097e-06, + "loss": 0.7236, + "step": 42371 + }, + { + "epoch": 1.09, + "learning_rate": 1.4754913598335166e-06, + "loss": 0.6821, + "step": 42372 + }, + { + "epoch": 1.09, + "learning_rate": 1.4754670173889618e-06, + "loss": 0.5908, + "step": 42373 + }, + { + "epoch": 1.09, + "learning_rate": 1.4754426745803638e-06, + "loss": 0.5, + "step": 42374 + }, + { + "epoch": 1.09, + "learning_rate": 1.4754183314077413e-06, + "loss": 0.6699, + "step": 42375 + }, + { + "epoch": 1.09, + "learning_rate": 1.4753939878711126e-06, + "loss": 0.4185, + "step": 42376 + }, + { + "epoch": 1.09, + "learning_rate": 1.4753696439704969e-06, + "loss": 0.6963, + "step": 42377 + }, + { + "epoch": 1.09, + "learning_rate": 1.4753452997059122e-06, + "loss": 0.8369, + "step": 42378 + }, + { + "epoch": 1.09, + "learning_rate": 1.4753209550773777e-06, + "loss": 0.4895, + "step": 42379 + }, + { + "epoch": 1.09, + "learning_rate": 1.4752966100849115e-06, + "loss": 0.7178, + "step": 42380 + }, + { + "epoch": 1.09, + "learning_rate": 1.4752722647285329e-06, + "loss": 0.6489, + "step": 42381 + }, + { + "epoch": 1.09, + "learning_rate": 1.4752479190082598e-06, + "loss": 0.7295, + "step": 42382 + }, + { + "epoch": 1.09, + "learning_rate": 1.4752235729241115e-06, + "loss": 0.5669, + "step": 42383 + }, + { + "epoch": 1.09, + "learning_rate": 1.4751992264761064e-06, + "loss": 0.749, + "step": 42384 + }, + { + "epoch": 1.09, + "learning_rate": 1.4751748796642628e-06, + "loss": 0.7627, + "step": 42385 + }, + { + "epoch": 1.09, + "learning_rate": 1.4751505324886e-06, + "loss": 0.7891, + "step": 42386 + }, + { + "epoch": 1.09, + "learning_rate": 1.475126184949136e-06, + "loss": 0.5298, + "step": 42387 + }, + { + "epoch": 1.09, + "learning_rate": 1.4751018370458898e-06, + "loss": 0.6641, + "step": 42388 + }, + { + "epoch": 1.09, + "learning_rate": 1.4750774887788802e-06, + "loss": 0.7734, + "step": 42389 + }, + { + "epoch": 1.09, + "learning_rate": 1.4750531401481254e-06, + "loss": 0.6299, + "step": 42390 + }, + { + "epoch": 1.09, + "learning_rate": 1.4750287911536444e-06, + "loss": 0.7412, + "step": 42391 + }, + { + "epoch": 1.09, + "learning_rate": 1.4750044417954554e-06, + "loss": 0.6377, + "step": 42392 + }, + { + "epoch": 1.09, + "learning_rate": 1.4749800920735776e-06, + "loss": 0.7549, + "step": 42393 + }, + { + "epoch": 1.09, + "learning_rate": 1.4749557419880293e-06, + "loss": 0.7773, + "step": 42394 + }, + { + "epoch": 1.09, + "learning_rate": 1.4749313915388291e-06, + "loss": 0.6475, + "step": 42395 + }, + { + "epoch": 1.09, + "learning_rate": 1.474907040725996e-06, + "loss": 0.5576, + "step": 42396 + }, + { + "epoch": 1.09, + "learning_rate": 1.4748826895495482e-06, + "loss": 0.6265, + "step": 42397 + }, + { + "epoch": 1.09, + "learning_rate": 1.4748583380095049e-06, + "loss": 0.6172, + "step": 42398 + }, + { + "epoch": 1.09, + "learning_rate": 1.474833986105884e-06, + "loss": 0.6689, + "step": 42399 + }, + { + "epoch": 1.09, + "learning_rate": 1.474809633838705e-06, + "loss": 0.626, + "step": 42400 + }, + { + "epoch": 1.09, + "learning_rate": 1.4747852812079855e-06, + "loss": 0.7744, + "step": 42401 + }, + { + "epoch": 1.09, + "learning_rate": 1.4747609282137451e-06, + "loss": 0.606, + "step": 42402 + }, + { + "epoch": 1.09, + "learning_rate": 1.4747365748560023e-06, + "loss": 0.79, + "step": 42403 + }, + { + "epoch": 1.09, + "learning_rate": 1.474712221134775e-06, + "loss": 0.6328, + "step": 42404 + }, + { + "epoch": 1.09, + "learning_rate": 1.474687867050083e-06, + "loss": 0.6875, + "step": 42405 + }, + { + "epoch": 1.09, + "learning_rate": 1.474663512601944e-06, + "loss": 0.8184, + "step": 42406 + }, + { + "epoch": 1.09, + "learning_rate": 1.4746391577903767e-06, + "loss": 0.6001, + "step": 42407 + }, + { + "epoch": 1.09, + "learning_rate": 1.4746148026154003e-06, + "loss": 0.5586, + "step": 42408 + }, + { + "epoch": 1.09, + "learning_rate": 1.4745904470770334e-06, + "loss": 0.8447, + "step": 42409 + }, + { + "epoch": 1.09, + "learning_rate": 1.474566091175294e-06, + "loss": 0.6499, + "step": 42410 + }, + { + "epoch": 1.09, + "learning_rate": 1.4745417349102015e-06, + "loss": 0.8096, + "step": 42411 + }, + { + "epoch": 1.09, + "learning_rate": 1.474517378281774e-06, + "loss": 0.6855, + "step": 42412 + }, + { + "epoch": 1.09, + "learning_rate": 1.4744930212900307e-06, + "loss": 0.5942, + "step": 42413 + }, + { + "epoch": 1.09, + "learning_rate": 1.4744686639349894e-06, + "loss": 0.6377, + "step": 42414 + }, + { + "epoch": 1.09, + "learning_rate": 1.4744443062166693e-06, + "loss": 0.6777, + "step": 42415 + }, + { + "epoch": 1.09, + "learning_rate": 1.4744199481350892e-06, + "loss": 0.5728, + "step": 42416 + }, + { + "epoch": 1.09, + "learning_rate": 1.4743955896902675e-06, + "loss": 0.5243, + "step": 42417 + }, + { + "epoch": 1.09, + "learning_rate": 1.4743712308822232e-06, + "loss": 0.646, + "step": 42418 + }, + { + "epoch": 1.09, + "learning_rate": 1.4743468717109746e-06, + "loss": 0.6357, + "step": 42419 + }, + { + "epoch": 1.09, + "learning_rate": 1.4743225121765402e-06, + "loss": 0.5752, + "step": 42420 + }, + { + "epoch": 1.09, + "learning_rate": 1.4742981522789388e-06, + "loss": 0.5176, + "step": 42421 + }, + { + "epoch": 1.09, + "learning_rate": 1.4742737920181892e-06, + "loss": 0.5011, + "step": 42422 + }, + { + "epoch": 1.09, + "learning_rate": 1.4742494313943102e-06, + "loss": 0.7144, + "step": 42423 + }, + { + "epoch": 1.09, + "learning_rate": 1.4742250704073198e-06, + "loss": 0.75, + "step": 42424 + }, + { + "epoch": 1.09, + "learning_rate": 1.4742007090572375e-06, + "loss": 0.5737, + "step": 42425 + }, + { + "epoch": 1.09, + "learning_rate": 1.474176347344081e-06, + "loss": 0.6875, + "step": 42426 + }, + { + "epoch": 1.09, + "learning_rate": 1.47415198526787e-06, + "loss": 0.6748, + "step": 42427 + }, + { + "epoch": 1.09, + "learning_rate": 1.4741276228286223e-06, + "loss": 0.8887, + "step": 42428 + }, + { + "epoch": 1.09, + "learning_rate": 1.4741032600263567e-06, + "loss": 0.6147, + "step": 42429 + }, + { + "epoch": 1.09, + "learning_rate": 1.4740788968610925e-06, + "loss": 0.627, + "step": 42430 + }, + { + "epoch": 1.09, + "learning_rate": 1.4740545333328477e-06, + "loss": 0.8496, + "step": 42431 + }, + { + "epoch": 1.09, + "learning_rate": 1.4740301694416411e-06, + "loss": 0.6787, + "step": 42432 + }, + { + "epoch": 1.09, + "learning_rate": 1.4740058051874916e-06, + "loss": 0.6094, + "step": 42433 + }, + { + "epoch": 1.09, + "learning_rate": 1.4739814405704174e-06, + "loss": 0.8516, + "step": 42434 + }, + { + "epoch": 1.09, + "learning_rate": 1.4739570755904373e-06, + "loss": 0.7852, + "step": 42435 + }, + { + "epoch": 1.09, + "learning_rate": 1.4739327102475704e-06, + "loss": 0.7178, + "step": 42436 + }, + { + "epoch": 1.09, + "learning_rate": 1.4739083445418347e-06, + "loss": 0.6611, + "step": 42437 + }, + { + "epoch": 1.09, + "learning_rate": 1.4738839784732497e-06, + "loss": 0.6357, + "step": 42438 + }, + { + "epoch": 1.09, + "learning_rate": 1.4738596120418329e-06, + "loss": 0.6504, + "step": 42439 + }, + { + "epoch": 1.09, + "learning_rate": 1.4738352452476039e-06, + "loss": 0.5635, + "step": 42440 + }, + { + "epoch": 1.09, + "learning_rate": 1.473810878090581e-06, + "loss": 0.6184, + "step": 42441 + }, + { + "epoch": 1.09, + "learning_rate": 1.473786510570783e-06, + "loss": 0.603, + "step": 42442 + }, + { + "epoch": 1.09, + "learning_rate": 1.4737621426882283e-06, + "loss": 0.6851, + "step": 42443 + }, + { + "epoch": 1.09, + "learning_rate": 1.4737377744429357e-06, + "loss": 0.4866, + "step": 42444 + }, + { + "epoch": 1.09, + "learning_rate": 1.473713405834924e-06, + "loss": 0.5554, + "step": 42445 + }, + { + "epoch": 1.09, + "learning_rate": 1.4736890368642116e-06, + "loss": 0.6816, + "step": 42446 + }, + { + "epoch": 1.09, + "learning_rate": 1.4736646675308171e-06, + "loss": 0.7007, + "step": 42447 + }, + { + "epoch": 1.09, + "learning_rate": 1.4736402978347598e-06, + "loss": 0.6924, + "step": 42448 + }, + { + "epoch": 1.09, + "learning_rate": 1.4736159277760578e-06, + "loss": 0.6304, + "step": 42449 + }, + { + "epoch": 1.09, + "learning_rate": 1.4735915573547297e-06, + "loss": 0.5864, + "step": 42450 + }, + { + "epoch": 1.09, + "learning_rate": 1.473567186570794e-06, + "loss": 0.6943, + "step": 42451 + }, + { + "epoch": 1.09, + "learning_rate": 1.4735428154242705e-06, + "loss": 0.4619, + "step": 42452 + }, + { + "epoch": 1.09, + "learning_rate": 1.4735184439151764e-06, + "loss": 0.7803, + "step": 42453 + }, + { + "epoch": 1.09, + "learning_rate": 1.4734940720435312e-06, + "loss": 0.6621, + "step": 42454 + }, + { + "epoch": 1.09, + "learning_rate": 1.4734696998093532e-06, + "loss": 0.7061, + "step": 42455 + }, + { + "epoch": 1.09, + "learning_rate": 1.4734453272126615e-06, + "loss": 0.6602, + "step": 42456 + }, + { + "epoch": 1.09, + "learning_rate": 1.4734209542534743e-06, + "loss": 0.665, + "step": 42457 + }, + { + "epoch": 1.09, + "learning_rate": 1.4733965809318106e-06, + "loss": 0.6719, + "step": 42458 + }, + { + "epoch": 1.09, + "learning_rate": 1.4733722072476888e-06, + "loss": 0.6543, + "step": 42459 + }, + { + "epoch": 1.09, + "learning_rate": 1.4733478332011275e-06, + "loss": 0.6113, + "step": 42460 + }, + { + "epoch": 1.09, + "learning_rate": 1.4733234587921458e-06, + "loss": 0.4686, + "step": 42461 + }, + { + "epoch": 1.09, + "learning_rate": 1.4732990840207618e-06, + "loss": 0.5649, + "step": 42462 + }, + { + "epoch": 1.09, + "learning_rate": 1.473274708886995e-06, + "loss": 0.7148, + "step": 42463 + }, + { + "epoch": 1.09, + "learning_rate": 1.473250333390863e-06, + "loss": 0.4263, + "step": 42464 + }, + { + "epoch": 1.09, + "learning_rate": 1.4732259575323852e-06, + "loss": 0.8359, + "step": 42465 + }, + { + "epoch": 1.09, + "learning_rate": 1.4732015813115796e-06, + "loss": 0.7832, + "step": 42466 + }, + { + "epoch": 1.09, + "learning_rate": 1.473177204728466e-06, + "loss": 0.6196, + "step": 42467 + }, + { + "epoch": 1.09, + "learning_rate": 1.473152827783062e-06, + "loss": 0.4861, + "step": 42468 + }, + { + "epoch": 1.09, + "learning_rate": 1.4731284504753869e-06, + "loss": 0.5991, + "step": 42469 + }, + { + "epoch": 1.09, + "learning_rate": 1.4731040728054587e-06, + "loss": 0.6294, + "step": 42470 + }, + { + "epoch": 1.09, + "learning_rate": 1.4730796947732968e-06, + "loss": 0.8447, + "step": 42471 + }, + { + "epoch": 1.09, + "learning_rate": 1.4730553163789192e-06, + "loss": 0.426, + "step": 42472 + }, + { + "epoch": 1.09, + "learning_rate": 1.4730309376223452e-06, + "loss": 0.6646, + "step": 42473 + }, + { + "epoch": 1.09, + "learning_rate": 1.473006558503593e-06, + "loss": 0.5962, + "step": 42474 + }, + { + "epoch": 1.09, + "learning_rate": 1.4729821790226816e-06, + "loss": 0.9072, + "step": 42475 + }, + { + "epoch": 1.09, + "learning_rate": 1.472957799179629e-06, + "loss": 0.7275, + "step": 42476 + }, + { + "epoch": 1.09, + "learning_rate": 1.4729334189744549e-06, + "loss": 0.7354, + "step": 42477 + }, + { + "epoch": 1.09, + "learning_rate": 1.4729090384071773e-06, + "loss": 0.6396, + "step": 42478 + }, + { + "epoch": 1.09, + "learning_rate": 1.472884657477815e-06, + "loss": 0.6436, + "step": 42479 + }, + { + "epoch": 1.09, + "learning_rate": 1.4728602761863867e-06, + "loss": 0.6362, + "step": 42480 + }, + { + "epoch": 1.09, + "learning_rate": 1.4728358945329107e-06, + "loss": 0.7295, + "step": 42481 + }, + { + "epoch": 1.09, + "learning_rate": 1.4728115125174064e-06, + "loss": 0.6914, + "step": 42482 + }, + { + "epoch": 1.09, + "learning_rate": 1.472787130139892e-06, + "loss": 0.6777, + "step": 42483 + }, + { + "epoch": 1.09, + "learning_rate": 1.472762747400386e-06, + "loss": 0.646, + "step": 42484 + }, + { + "epoch": 1.09, + "learning_rate": 1.4727383642989075e-06, + "loss": 0.6138, + "step": 42485 + }, + { + "epoch": 1.09, + "learning_rate": 1.472713980835475e-06, + "loss": 0.8223, + "step": 42486 + }, + { + "epoch": 1.09, + "learning_rate": 1.472689597010107e-06, + "loss": 0.699, + "step": 42487 + }, + { + "epoch": 1.09, + "learning_rate": 1.4726652128228225e-06, + "loss": 0.5913, + "step": 42488 + }, + { + "epoch": 1.09, + "learning_rate": 1.4726408282736395e-06, + "loss": 0.6914, + "step": 42489 + }, + { + "epoch": 1.09, + "learning_rate": 1.4726164433625777e-06, + "loss": 0.7041, + "step": 42490 + }, + { + "epoch": 1.09, + "learning_rate": 1.472592058089655e-06, + "loss": 0.7305, + "step": 42491 + }, + { + "epoch": 1.09, + "learning_rate": 1.4725676724548903e-06, + "loss": 0.4193, + "step": 42492 + }, + { + "epoch": 1.09, + "learning_rate": 1.4725432864583022e-06, + "loss": 0.6123, + "step": 42493 + }, + { + "epoch": 1.09, + "learning_rate": 1.4725189000999095e-06, + "loss": 0.6904, + "step": 42494 + }, + { + "epoch": 1.09, + "learning_rate": 1.4724945133797308e-06, + "loss": 0.7021, + "step": 42495 + }, + { + "epoch": 1.09, + "learning_rate": 1.472470126297785e-06, + "loss": 0.4614, + "step": 42496 + }, + { + "epoch": 1.09, + "learning_rate": 1.47244573885409e-06, + "loss": 0.749, + "step": 42497 + }, + { + "epoch": 1.09, + "learning_rate": 1.4724213510486656e-06, + "loss": 0.6338, + "step": 42498 + }, + { + "epoch": 1.09, + "learning_rate": 1.4723969628815295e-06, + "loss": 0.3422, + "step": 42499 + }, + { + "epoch": 1.09, + "learning_rate": 1.4723725743527008e-06, + "loss": 0.5723, + "step": 42500 + }, + { + "epoch": 1.09, + "learning_rate": 1.4723481854621984e-06, + "loss": 0.5537, + "step": 42501 + }, + { + "epoch": 1.09, + "learning_rate": 1.4723237962100405e-06, + "loss": 0.5674, + "step": 42502 + }, + { + "epoch": 1.09, + "learning_rate": 1.4722994065962464e-06, + "loss": 0.5908, + "step": 42503 + }, + { + "epoch": 1.09, + "learning_rate": 1.4722750166208337e-06, + "loss": 0.6416, + "step": 42504 + }, + { + "epoch": 1.09, + "learning_rate": 1.4722506262838224e-06, + "loss": 0.6113, + "step": 42505 + }, + { + "epoch": 1.09, + "learning_rate": 1.47222623558523e-06, + "loss": 0.6855, + "step": 42506 + }, + { + "epoch": 1.09, + "learning_rate": 1.4722018445250757e-06, + "loss": 0.6719, + "step": 42507 + }, + { + "epoch": 1.09, + "learning_rate": 1.4721774531033784e-06, + "loss": 0.5283, + "step": 42508 + }, + { + "epoch": 1.09, + "learning_rate": 1.4721530613201566e-06, + "loss": 0.5308, + "step": 42509 + }, + { + "epoch": 1.09, + "learning_rate": 1.4721286691754283e-06, + "loss": 0.6597, + "step": 42510 + }, + { + "epoch": 1.09, + "learning_rate": 1.4721042766692135e-06, + "loss": 0.6416, + "step": 42511 + }, + { + "epoch": 1.09, + "learning_rate": 1.4720798838015297e-06, + "loss": 0.5972, + "step": 42512 + }, + { + "epoch": 1.09, + "learning_rate": 1.4720554905723964e-06, + "loss": 0.6445, + "step": 42513 + }, + { + "epoch": 1.09, + "learning_rate": 1.4720310969818319e-06, + "loss": 0.751, + "step": 42514 + }, + { + "epoch": 1.09, + "learning_rate": 1.4720067030298549e-06, + "loss": 0.6533, + "step": 42515 + }, + { + "epoch": 1.09, + "learning_rate": 1.4719823087164838e-06, + "loss": 0.6406, + "step": 42516 + }, + { + "epoch": 1.09, + "learning_rate": 1.4719579140417376e-06, + "loss": 0.5649, + "step": 42517 + }, + { + "epoch": 1.09, + "learning_rate": 1.4719335190056353e-06, + "loss": 0.7363, + "step": 42518 + }, + { + "epoch": 1.09, + "learning_rate": 1.4719091236081946e-06, + "loss": 0.6729, + "step": 42519 + }, + { + "epoch": 1.09, + "learning_rate": 1.4718847278494351e-06, + "loss": 0.7148, + "step": 42520 + }, + { + "epoch": 1.09, + "learning_rate": 1.471860331729375e-06, + "loss": 0.6758, + "step": 42521 + }, + { + "epoch": 1.09, + "learning_rate": 1.4718359352480333e-06, + "loss": 0.6553, + "step": 42522 + }, + { + "epoch": 1.09, + "learning_rate": 1.471811538405429e-06, + "loss": 0.6191, + "step": 42523 + }, + { + "epoch": 1.09, + "learning_rate": 1.4717871412015797e-06, + "loss": 0.7725, + "step": 42524 + }, + { + "epoch": 1.09, + "learning_rate": 1.4717627436365045e-06, + "loss": 0.6768, + "step": 42525 + }, + { + "epoch": 1.09, + "learning_rate": 1.4717383457102226e-06, + "loss": 0.6675, + "step": 42526 + }, + { + "epoch": 1.09, + "learning_rate": 1.4717139474227521e-06, + "loss": 0.5093, + "step": 42527 + }, + { + "epoch": 1.09, + "learning_rate": 1.4716895487741125e-06, + "loss": 0.5569, + "step": 42528 + }, + { + "epoch": 1.09, + "learning_rate": 1.4716651497643214e-06, + "loss": 0.4795, + "step": 42529 + }, + { + "epoch": 1.09, + "learning_rate": 1.4716407503933981e-06, + "loss": 0.769, + "step": 42530 + }, + { + "epoch": 1.09, + "learning_rate": 1.471616350661361e-06, + "loss": 0.6392, + "step": 42531 + }, + { + "epoch": 1.09, + "learning_rate": 1.4715919505682293e-06, + "loss": 0.6172, + "step": 42532 + }, + { + "epoch": 1.09, + "learning_rate": 1.4715675501140213e-06, + "loss": 0.7476, + "step": 42533 + }, + { + "epoch": 1.09, + "learning_rate": 1.4715431492987552e-06, + "loss": 0.7686, + "step": 42534 + }, + { + "epoch": 1.09, + "learning_rate": 1.4715187481224507e-06, + "loss": 0.6489, + "step": 42535 + }, + { + "epoch": 1.09, + "learning_rate": 1.4714943465851257e-06, + "loss": 0.5303, + "step": 42536 + }, + { + "epoch": 1.09, + "learning_rate": 1.4714699446867993e-06, + "loss": 0.6406, + "step": 42537 + }, + { + "epoch": 1.09, + "learning_rate": 1.4714455424274902e-06, + "loss": 0.5889, + "step": 42538 + }, + { + "epoch": 1.09, + "learning_rate": 1.4714211398072168e-06, + "loss": 0.6914, + "step": 42539 + }, + { + "epoch": 1.09, + "learning_rate": 1.4713967368259978e-06, + "loss": 0.6997, + "step": 42540 + }, + { + "epoch": 1.09, + "learning_rate": 1.4713723334838516e-06, + "loss": 0.7236, + "step": 42541 + }, + { + "epoch": 1.09, + "learning_rate": 1.471347929780798e-06, + "loss": 0.7061, + "step": 42542 + }, + { + "epoch": 1.09, + "learning_rate": 1.4713235257168549e-06, + "loss": 0.2991, + "step": 42543 + }, + { + "epoch": 1.09, + "learning_rate": 1.4712991212920405e-06, + "loss": 0.5244, + "step": 42544 + }, + { + "epoch": 1.09, + "learning_rate": 1.4712747165063743e-06, + "loss": 0.5596, + "step": 42545 + }, + { + "epoch": 1.09, + "learning_rate": 1.471250311359875e-06, + "loss": 0.5991, + "step": 42546 + }, + { + "epoch": 1.09, + "learning_rate": 1.4712259058525607e-06, + "loss": 0.7188, + "step": 42547 + }, + { + "epoch": 1.09, + "learning_rate": 1.4712014999844505e-06, + "loss": 0.8076, + "step": 42548 + }, + { + "epoch": 1.09, + "learning_rate": 1.471177093755563e-06, + "loss": 0.7529, + "step": 42549 + }, + { + "epoch": 1.09, + "learning_rate": 1.4711526871659168e-06, + "loss": 0.6719, + "step": 42550 + }, + { + "epoch": 1.09, + "learning_rate": 1.4711282802155308e-06, + "loss": 0.9199, + "step": 42551 + }, + { + "epoch": 1.09, + "learning_rate": 1.471103872904423e-06, + "loss": 0.55, + "step": 42552 + }, + { + "epoch": 1.09, + "learning_rate": 1.4710794652326136e-06, + "loss": 0.5576, + "step": 42553 + }, + { + "epoch": 1.09, + "learning_rate": 1.4710550572001195e-06, + "loss": 0.7324, + "step": 42554 + }, + { + "epoch": 1.09, + "learning_rate": 1.4710306488069606e-06, + "loss": 0.7666, + "step": 42555 + }, + { + "epoch": 1.09, + "learning_rate": 1.4710062400531549e-06, + "loss": 0.5645, + "step": 42556 + }, + { + "epoch": 1.09, + "learning_rate": 1.4709818309387214e-06, + "loss": 0.5645, + "step": 42557 + }, + { + "epoch": 1.09, + "learning_rate": 1.4709574214636792e-06, + "loss": 0.5435, + "step": 42558 + }, + { + "epoch": 1.09, + "learning_rate": 1.4709330116280463e-06, + "loss": 0.7344, + "step": 42559 + }, + { + "epoch": 1.09, + "learning_rate": 1.4709086014318413e-06, + "loss": 0.5947, + "step": 42560 + }, + { + "epoch": 1.09, + "learning_rate": 1.4708841908750837e-06, + "loss": 0.7393, + "step": 42561 + }, + { + "epoch": 1.09, + "learning_rate": 1.4708597799577915e-06, + "loss": 0.5801, + "step": 42562 + }, + { + "epoch": 1.09, + "learning_rate": 1.4708353686799838e-06, + "loss": 0.3936, + "step": 42563 + }, + { + "epoch": 1.09, + "learning_rate": 1.470810957041679e-06, + "loss": 0.6338, + "step": 42564 + }, + { + "epoch": 1.09, + "learning_rate": 1.4707865450428956e-06, + "loss": 0.5845, + "step": 42565 + }, + { + "epoch": 1.09, + "learning_rate": 1.470762132683653e-06, + "loss": 0.5449, + "step": 42566 + }, + { + "epoch": 1.09, + "learning_rate": 1.4707377199639693e-06, + "loss": 0.542, + "step": 42567 + }, + { + "epoch": 1.09, + "learning_rate": 1.4707133068838636e-06, + "loss": 0.5957, + "step": 42568 + }, + { + "epoch": 1.09, + "learning_rate": 1.4706888934433542e-06, + "loss": 0.6299, + "step": 42569 + }, + { + "epoch": 1.09, + "learning_rate": 1.4706644796424598e-06, + "loss": 0.6504, + "step": 42570 + }, + { + "epoch": 1.09, + "learning_rate": 1.4706400654811995e-06, + "loss": 0.7568, + "step": 42571 + }, + { + "epoch": 1.09, + "learning_rate": 1.4706156509595915e-06, + "loss": 0.708, + "step": 42572 + }, + { + "epoch": 1.09, + "learning_rate": 1.4705912360776548e-06, + "loss": 0.509, + "step": 42573 + }, + { + "epoch": 1.09, + "learning_rate": 1.4705668208354083e-06, + "loss": 0.6455, + "step": 42574 + }, + { + "epoch": 1.09, + "learning_rate": 1.4705424052328702e-06, + "loss": 0.6182, + "step": 42575 + }, + { + "epoch": 1.09, + "learning_rate": 1.4705179892700594e-06, + "loss": 0.7666, + "step": 42576 + }, + { + "epoch": 1.09, + "learning_rate": 1.4704935729469948e-06, + "loss": 0.5767, + "step": 42577 + }, + { + "epoch": 1.09, + "learning_rate": 1.4704691562636948e-06, + "loss": 0.6045, + "step": 42578 + }, + { + "epoch": 1.09, + "learning_rate": 1.470444739220178e-06, + "loss": 0.5737, + "step": 42579 + }, + { + "epoch": 1.09, + "learning_rate": 1.4704203218164636e-06, + "loss": 0.3473, + "step": 42580 + }, + { + "epoch": 1.09, + "learning_rate": 1.4703959040525697e-06, + "loss": 0.7314, + "step": 42581 + }, + { + "epoch": 1.09, + "learning_rate": 1.4703714859285158e-06, + "loss": 0.7881, + "step": 42582 + }, + { + "epoch": 1.09, + "learning_rate": 1.4703470674443195e-06, + "loss": 0.7441, + "step": 42583 + }, + { + "epoch": 1.09, + "learning_rate": 1.4703226486000002e-06, + "loss": 0.6719, + "step": 42584 + }, + { + "epoch": 1.09, + "learning_rate": 1.4702982293955766e-06, + "loss": 0.9395, + "step": 42585 + }, + { + "epoch": 1.09, + "learning_rate": 1.4702738098310671e-06, + "loss": 0.7627, + "step": 42586 + }, + { + "epoch": 1.09, + "learning_rate": 1.4702493899064907e-06, + "loss": 0.6523, + "step": 42587 + }, + { + "epoch": 1.09, + "learning_rate": 1.4702249696218664e-06, + "loss": 0.8301, + "step": 42588 + }, + { + "epoch": 1.09, + "learning_rate": 1.4702005489772117e-06, + "loss": 0.5208, + "step": 42589 + }, + { + "epoch": 1.09, + "learning_rate": 1.4701761279725463e-06, + "loss": 0.7793, + "step": 42590 + }, + { + "epoch": 1.09, + "learning_rate": 1.470151706607889e-06, + "loss": 0.752, + "step": 42591 + }, + { + "epoch": 1.09, + "learning_rate": 1.4701272848832576e-06, + "loss": 0.5269, + "step": 42592 + }, + { + "epoch": 1.09, + "learning_rate": 1.470102862798672e-06, + "loss": 0.6094, + "step": 42593 + }, + { + "epoch": 1.09, + "learning_rate": 1.4700784403541498e-06, + "loss": 0.6838, + "step": 42594 + }, + { + "epoch": 1.09, + "learning_rate": 1.4700540175497103e-06, + "loss": 0.4852, + "step": 42595 + }, + { + "epoch": 1.09, + "learning_rate": 1.4700295943853717e-06, + "loss": 0.5752, + "step": 42596 + }, + { + "epoch": 1.09, + "learning_rate": 1.4700051708611536e-06, + "loss": 0.5361, + "step": 42597 + }, + { + "epoch": 1.09, + "learning_rate": 1.469980746977074e-06, + "loss": 0.5928, + "step": 42598 + }, + { + "epoch": 1.09, + "learning_rate": 1.4699563227331518e-06, + "loss": 0.6367, + "step": 42599 + }, + { + "epoch": 1.09, + "learning_rate": 1.4699318981294052e-06, + "loss": 0.6211, + "step": 42600 + }, + { + "epoch": 1.09, + "learning_rate": 1.4699074731658541e-06, + "loss": 0.6211, + "step": 42601 + }, + { + "epoch": 1.09, + "learning_rate": 1.4698830478425156e-06, + "loss": 0.7388, + "step": 42602 + }, + { + "epoch": 1.09, + "learning_rate": 1.46985862215941e-06, + "loss": 0.6738, + "step": 42603 + }, + { + "epoch": 1.09, + "learning_rate": 1.469834196116555e-06, + "loss": 0.5503, + "step": 42604 + }, + { + "epoch": 1.09, + "learning_rate": 1.4698097697139694e-06, + "loss": 0.6191, + "step": 42605 + }, + { + "epoch": 1.09, + "learning_rate": 1.4697853429516723e-06, + "loss": 0.8223, + "step": 42606 + }, + { + "epoch": 1.09, + "learning_rate": 1.469760915829682e-06, + "loss": 0.606, + "step": 42607 + }, + { + "epoch": 1.09, + "learning_rate": 1.4697364883480174e-06, + "loss": 0.5356, + "step": 42608 + }, + { + "epoch": 1.09, + "learning_rate": 1.469712060506697e-06, + "loss": 0.8896, + "step": 42609 + }, + { + "epoch": 1.09, + "learning_rate": 1.4696876323057398e-06, + "loss": 0.6387, + "step": 42610 + }, + { + "epoch": 1.09, + "learning_rate": 1.4696632037451644e-06, + "loss": 0.6245, + "step": 42611 + }, + { + "epoch": 1.09, + "learning_rate": 1.4696387748249897e-06, + "loss": 0.6882, + "step": 42612 + }, + { + "epoch": 1.09, + "learning_rate": 1.4696143455452342e-06, + "loss": 0.6221, + "step": 42613 + }, + { + "epoch": 1.09, + "learning_rate": 1.4695899159059162e-06, + "loss": 0.6589, + "step": 42614 + }, + { + "epoch": 1.09, + "learning_rate": 1.4695654859070547e-06, + "loss": 0.748, + "step": 42615 + }, + { + "epoch": 1.09, + "learning_rate": 1.4695410555486692e-06, + "loss": 0.8232, + "step": 42616 + }, + { + "epoch": 1.09, + "learning_rate": 1.469516624830777e-06, + "loss": 0.4525, + "step": 42617 + }, + { + "epoch": 1.09, + "learning_rate": 1.469492193753398e-06, + "loss": 0.6021, + "step": 42618 + }, + { + "epoch": 1.09, + "learning_rate": 1.4694677623165502e-06, + "loss": 0.5413, + "step": 42619 + }, + { + "epoch": 1.09, + "learning_rate": 1.4694433305202524e-06, + "loss": 0.6904, + "step": 42620 + }, + { + "epoch": 1.09, + "learning_rate": 1.4694188983645234e-06, + "loss": 0.4419, + "step": 42621 + }, + { + "epoch": 1.09, + "learning_rate": 1.4693944658493822e-06, + "loss": 0.7441, + "step": 42622 + }, + { + "epoch": 1.09, + "learning_rate": 1.4693700329748472e-06, + "loss": 0.7295, + "step": 42623 + }, + { + "epoch": 1.09, + "learning_rate": 1.4693455997409372e-06, + "loss": 0.6348, + "step": 42624 + }, + { + "epoch": 1.09, + "learning_rate": 1.4693211661476706e-06, + "loss": 0.6431, + "step": 42625 + }, + { + "epoch": 1.09, + "learning_rate": 1.4692967321950665e-06, + "loss": 0.6416, + "step": 42626 + }, + { + "epoch": 1.09, + "learning_rate": 1.4692722978831433e-06, + "loss": 0.5781, + "step": 42627 + }, + { + "epoch": 1.09, + "learning_rate": 1.4692478632119202e-06, + "loss": 0.7256, + "step": 42628 + }, + { + "epoch": 1.09, + "learning_rate": 1.4692234281814155e-06, + "loss": 0.5469, + "step": 42629 + }, + { + "epoch": 1.09, + "learning_rate": 1.4691989927916478e-06, + "loss": 0.6963, + "step": 42630 + }, + { + "epoch": 1.09, + "learning_rate": 1.4691745570426362e-06, + "loss": 0.751, + "step": 42631 + }, + { + "epoch": 1.09, + "learning_rate": 1.469150120934399e-06, + "loss": 0.7793, + "step": 42632 + }, + { + "epoch": 1.09, + "learning_rate": 1.4691256844669555e-06, + "loss": 0.6587, + "step": 42633 + }, + { + "epoch": 1.09, + "learning_rate": 1.4691012476403235e-06, + "loss": 0.4192, + "step": 42634 + }, + { + "epoch": 1.09, + "learning_rate": 1.4690768104545227e-06, + "loss": 0.6133, + "step": 42635 + }, + { + "epoch": 1.09, + "learning_rate": 1.4690523729095712e-06, + "loss": 0.457, + "step": 42636 + }, + { + "epoch": 1.09, + "learning_rate": 1.4690279350054878e-06, + "loss": 0.6528, + "step": 42637 + }, + { + "epoch": 1.09, + "learning_rate": 1.4690034967422916e-06, + "loss": 0.4824, + "step": 42638 + }, + { + "epoch": 1.09, + "learning_rate": 1.4689790581200007e-06, + "loss": 0.7891, + "step": 42639 + }, + { + "epoch": 1.09, + "learning_rate": 1.468954619138634e-06, + "loss": 0.5083, + "step": 42640 + }, + { + "epoch": 1.09, + "learning_rate": 1.4689301797982103e-06, + "loss": 0.4224, + "step": 42641 + }, + { + "epoch": 1.09, + "learning_rate": 1.4689057400987485e-06, + "loss": 0.7412, + "step": 42642 + }, + { + "epoch": 1.09, + "learning_rate": 1.4688813000402673e-06, + "loss": 0.6445, + "step": 42643 + }, + { + "epoch": 1.09, + "learning_rate": 1.4688568596227851e-06, + "loss": 0.8594, + "step": 42644 + }, + { + "epoch": 1.09, + "learning_rate": 1.4688324188463207e-06, + "loss": 0.5498, + "step": 42645 + }, + { + "epoch": 1.09, + "learning_rate": 1.4688079777108926e-06, + "loss": 0.7495, + "step": 42646 + }, + { + "epoch": 1.09, + "learning_rate": 1.4687835362165203e-06, + "loss": 0.7153, + "step": 42647 + }, + { + "epoch": 1.09, + "learning_rate": 1.4687590943632218e-06, + "loss": 0.6101, + "step": 42648 + }, + { + "epoch": 1.09, + "learning_rate": 1.468734652151016e-06, + "loss": 0.7275, + "step": 42649 + }, + { + "epoch": 1.09, + "learning_rate": 1.4687102095799216e-06, + "loss": 0.6201, + "step": 42650 + }, + { + "epoch": 1.09, + "learning_rate": 1.4686857666499574e-06, + "loss": 0.5278, + "step": 42651 + }, + { + "epoch": 1.09, + "learning_rate": 1.4686613233611418e-06, + "loss": 0.7715, + "step": 42652 + }, + { + "epoch": 1.09, + "learning_rate": 1.468636879713494e-06, + "loss": 0.7759, + "step": 42653 + }, + { + "epoch": 1.09, + "learning_rate": 1.4686124357070327e-06, + "loss": 0.751, + "step": 42654 + }, + { + "epoch": 1.09, + "learning_rate": 1.468587991341776e-06, + "loss": 0.3052, + "step": 42655 + }, + { + "epoch": 1.09, + "learning_rate": 1.4685635466177434e-06, + "loss": 0.7744, + "step": 42656 + }, + { + "epoch": 1.09, + "learning_rate": 1.4685391015349528e-06, + "loss": 0.6411, + "step": 42657 + }, + { + "epoch": 1.09, + "learning_rate": 1.468514656093424e-06, + "loss": 0.6221, + "step": 42658 + }, + { + "epoch": 1.09, + "learning_rate": 1.4684902102931745e-06, + "loss": 0.7148, + "step": 42659 + }, + { + "epoch": 1.09, + "learning_rate": 1.4684657641342237e-06, + "loss": 0.6572, + "step": 42660 + }, + { + "epoch": 1.09, + "learning_rate": 1.4684413176165903e-06, + "loss": 0.4521, + "step": 42661 + }, + { + "epoch": 1.09, + "learning_rate": 1.4684168707402928e-06, + "loss": 0.4071, + "step": 42662 + }, + { + "epoch": 1.09, + "learning_rate": 1.4683924235053502e-06, + "loss": 0.5024, + "step": 42663 + }, + { + "epoch": 1.09, + "learning_rate": 1.4683679759117812e-06, + "loss": 0.6445, + "step": 42664 + }, + { + "epoch": 1.09, + "learning_rate": 1.4683435279596039e-06, + "loss": 0.6807, + "step": 42665 + }, + { + "epoch": 1.09, + "learning_rate": 1.4683190796488379e-06, + "loss": 0.719, + "step": 42666 + }, + { + "epoch": 1.09, + "learning_rate": 1.4682946309795013e-06, + "loss": 0.6719, + "step": 42667 + }, + { + "epoch": 1.09, + "learning_rate": 1.4682701819516133e-06, + "loss": 0.5898, + "step": 42668 + }, + { + "epoch": 1.09, + "learning_rate": 1.4682457325651921e-06, + "loss": 0.7217, + "step": 42669 + }, + { + "epoch": 1.09, + "learning_rate": 1.4682212828202566e-06, + "loss": 0.7354, + "step": 42670 + }, + { + "epoch": 1.09, + "learning_rate": 1.4681968327168257e-06, + "loss": 0.7373, + "step": 42671 + }, + { + "epoch": 1.09, + "learning_rate": 1.4681723822549181e-06, + "loss": 0.6162, + "step": 42672 + }, + { + "epoch": 1.09, + "learning_rate": 1.4681479314345526e-06, + "loss": 0.7012, + "step": 42673 + }, + { + "epoch": 1.09, + "learning_rate": 1.4681234802557474e-06, + "loss": 0.7886, + "step": 42674 + }, + { + "epoch": 1.09, + "learning_rate": 1.4680990287185218e-06, + "loss": 0.7881, + "step": 42675 + }, + { + "epoch": 1.09, + "learning_rate": 1.468074576822894e-06, + "loss": 0.5938, + "step": 42676 + }, + { + "epoch": 1.09, + "learning_rate": 1.4680501245688833e-06, + "loss": 0.7383, + "step": 42677 + }, + { + "epoch": 1.09, + "learning_rate": 1.4680256719565082e-06, + "loss": 0.5376, + "step": 42678 + }, + { + "epoch": 1.09, + "learning_rate": 1.4680012189857873e-06, + "loss": 0.6548, + "step": 42679 + }, + { + "epoch": 1.09, + "learning_rate": 1.467976765656739e-06, + "loss": 0.6758, + "step": 42680 + }, + { + "epoch": 1.09, + "learning_rate": 1.467952311969383e-06, + "loss": 0.7856, + "step": 42681 + }, + { + "epoch": 1.09, + "learning_rate": 1.4679278579237368e-06, + "loss": 0.6575, + "step": 42682 + }, + { + "epoch": 1.09, + "learning_rate": 1.4679034035198206e-06, + "loss": 0.7432, + "step": 42683 + }, + { + "epoch": 1.09, + "learning_rate": 1.4678789487576515e-06, + "loss": 0.5918, + "step": 42684 + }, + { + "epoch": 1.09, + "learning_rate": 1.4678544936372495e-06, + "loss": 0.668, + "step": 42685 + }, + { + "epoch": 1.09, + "learning_rate": 1.4678300381586324e-06, + "loss": 0.7012, + "step": 42686 + }, + { + "epoch": 1.09, + "learning_rate": 1.4678055823218197e-06, + "loss": 0.6777, + "step": 42687 + }, + { + "epoch": 1.09, + "learning_rate": 1.4677811261268295e-06, + "loss": 0.665, + "step": 42688 + }, + { + "epoch": 1.09, + "learning_rate": 1.4677566695736812e-06, + "loss": 0.6421, + "step": 42689 + }, + { + "epoch": 1.09, + "learning_rate": 1.4677322126623928e-06, + "loss": 0.6084, + "step": 42690 + }, + { + "epoch": 1.09, + "learning_rate": 1.4677077553929835e-06, + "loss": 0.5723, + "step": 42691 + }, + { + "epoch": 1.09, + "learning_rate": 1.4676832977654717e-06, + "loss": 0.6807, + "step": 42692 + }, + { + "epoch": 1.09, + "learning_rate": 1.4676588397798766e-06, + "loss": 0.5913, + "step": 42693 + }, + { + "epoch": 1.09, + "learning_rate": 1.4676343814362163e-06, + "loss": 0.5547, + "step": 42694 + }, + { + "epoch": 1.09, + "learning_rate": 1.46760992273451e-06, + "loss": 0.5386, + "step": 42695 + }, + { + "epoch": 1.09, + "learning_rate": 1.4675854636747761e-06, + "loss": 0.563, + "step": 42696 + }, + { + "epoch": 1.09, + "learning_rate": 1.467561004257034e-06, + "loss": 0.6265, + "step": 42697 + }, + { + "epoch": 1.09, + "learning_rate": 1.4675365444813014e-06, + "loss": 0.6758, + "step": 42698 + }, + { + "epoch": 1.09, + "learning_rate": 1.467512084347598e-06, + "loss": 0.8301, + "step": 42699 + }, + { + "epoch": 1.09, + "learning_rate": 1.4674876238559416e-06, + "loss": 0.7305, + "step": 42700 + }, + { + "epoch": 1.09, + "learning_rate": 1.4674631630063517e-06, + "loss": 0.3906, + "step": 42701 + }, + { + "epoch": 1.09, + "learning_rate": 1.467438701798847e-06, + "loss": 0.7383, + "step": 42702 + }, + { + "epoch": 1.09, + "learning_rate": 1.4674142402334458e-06, + "loss": 0.5132, + "step": 42703 + }, + { + "epoch": 1.09, + "learning_rate": 1.4673897783101668e-06, + "loss": 0.5647, + "step": 42704 + }, + { + "epoch": 1.09, + "learning_rate": 1.467365316029029e-06, + "loss": 0.5293, + "step": 42705 + }, + { + "epoch": 1.09, + "learning_rate": 1.467340853390051e-06, + "loss": 0.8896, + "step": 42706 + }, + { + "epoch": 1.09, + "learning_rate": 1.4673163903932518e-06, + "loss": 0.4717, + "step": 42707 + }, + { + "epoch": 1.09, + "learning_rate": 1.46729192703865e-06, + "loss": 0.5479, + "step": 42708 + }, + { + "epoch": 1.09, + "learning_rate": 1.4672674633262641e-06, + "loss": 0.6699, + "step": 42709 + }, + { + "epoch": 1.09, + "learning_rate": 1.467242999256113e-06, + "loss": 0.7725, + "step": 42710 + }, + { + "epoch": 1.09, + "learning_rate": 1.4672185348282153e-06, + "loss": 0.6758, + "step": 42711 + }, + { + "epoch": 1.09, + "learning_rate": 1.4671940700425905e-06, + "loss": 0.7021, + "step": 42712 + }, + { + "epoch": 1.09, + "learning_rate": 1.4671696048992559e-06, + "loss": 0.5923, + "step": 42713 + }, + { + "epoch": 1.09, + "learning_rate": 1.4671451393982315e-06, + "loss": 0.562, + "step": 42714 + }, + { + "epoch": 1.09, + "learning_rate": 1.4671206735395352e-06, + "loss": 0.5356, + "step": 42715 + }, + { + "epoch": 1.09, + "learning_rate": 1.4670962073231863e-06, + "loss": 0.3748, + "step": 42716 + }, + { + "epoch": 1.09, + "learning_rate": 1.4670717407492033e-06, + "loss": 0.5991, + "step": 42717 + }, + { + "epoch": 1.09, + "learning_rate": 1.4670472738176044e-06, + "loss": 0.6226, + "step": 42718 + }, + { + "epoch": 1.09, + "learning_rate": 1.4670228065284097e-06, + "loss": 0.6128, + "step": 42719 + }, + { + "epoch": 1.09, + "learning_rate": 1.4669983388816368e-06, + "loss": 0.7305, + "step": 42720 + }, + { + "epoch": 1.09, + "learning_rate": 1.4669738708773046e-06, + "loss": 0.5967, + "step": 42721 + }, + { + "epoch": 1.09, + "learning_rate": 1.4669494025154322e-06, + "loss": 0.8164, + "step": 42722 + }, + { + "epoch": 1.1, + "learning_rate": 1.466924933796038e-06, + "loss": 0.4971, + "step": 42723 + }, + { + "epoch": 1.1, + "learning_rate": 1.4669004647191408e-06, + "loss": 0.7485, + "step": 42724 + }, + { + "epoch": 1.1, + "learning_rate": 1.4668759952847593e-06, + "loss": 0.9453, + "step": 42725 + }, + { + "epoch": 1.1, + "learning_rate": 1.4668515254929123e-06, + "loss": 0.4524, + "step": 42726 + }, + { + "epoch": 1.1, + "learning_rate": 1.4668270553436191e-06, + "loss": 0.5347, + "step": 42727 + }, + { + "epoch": 1.1, + "learning_rate": 1.4668025848368975e-06, + "loss": 0.5759, + "step": 42728 + }, + { + "epoch": 1.1, + "learning_rate": 1.4667781139727665e-06, + "loss": 0.7046, + "step": 42729 + }, + { + "epoch": 1.1, + "learning_rate": 1.466753642751245e-06, + "loss": 0.7705, + "step": 42730 + }, + { + "epoch": 1.1, + "learning_rate": 1.4667291711723516e-06, + "loss": 0.7412, + "step": 42731 + }, + { + "epoch": 1.1, + "learning_rate": 1.4667046992361056e-06, + "loss": 0.5195, + "step": 42732 + }, + { + "epoch": 1.1, + "learning_rate": 1.4666802269425248e-06, + "loss": 0.6943, + "step": 42733 + }, + { + "epoch": 1.1, + "learning_rate": 1.4666557542916287e-06, + "loss": 0.7852, + "step": 42734 + }, + { + "epoch": 1.1, + "learning_rate": 1.4666312812834356e-06, + "loss": 0.5444, + "step": 42735 + }, + { + "epoch": 1.1, + "learning_rate": 1.4666068079179642e-06, + "loss": 0.6523, + "step": 42736 + }, + { + "epoch": 1.1, + "learning_rate": 1.4665823341952338e-06, + "loss": 0.4487, + "step": 42737 + }, + { + "epoch": 1.1, + "learning_rate": 1.4665578601152629e-06, + "loss": 0.7168, + "step": 42738 + }, + { + "epoch": 1.1, + "learning_rate": 1.4665333856780697e-06, + "loss": 0.6436, + "step": 42739 + }, + { + "epoch": 1.1, + "learning_rate": 1.4665089108836735e-06, + "loss": 0.7607, + "step": 42740 + }, + { + "epoch": 1.1, + "learning_rate": 1.4664844357320927e-06, + "loss": 0.6226, + "step": 42741 + }, + { + "epoch": 1.1, + "learning_rate": 1.4664599602233466e-06, + "loss": 0.8262, + "step": 42742 + }, + { + "epoch": 1.1, + "learning_rate": 1.4664354843574528e-06, + "loss": 0.6729, + "step": 42743 + }, + { + "epoch": 1.1, + "learning_rate": 1.4664110081344317e-06, + "loss": 0.7344, + "step": 42744 + }, + { + "epoch": 1.1, + "learning_rate": 1.4663865315543005e-06, + "loss": 0.5496, + "step": 42745 + }, + { + "epoch": 1.1, + "learning_rate": 1.466362054617079e-06, + "loss": 0.6152, + "step": 42746 + }, + { + "epoch": 1.1, + "learning_rate": 1.4663375773227853e-06, + "loss": 0.7588, + "step": 42747 + }, + { + "epoch": 1.1, + "learning_rate": 1.4663130996714384e-06, + "loss": 0.8438, + "step": 42748 + }, + { + "epoch": 1.1, + "learning_rate": 1.4662886216630567e-06, + "loss": 0.5176, + "step": 42749 + }, + { + "epoch": 1.1, + "learning_rate": 1.4662641432976598e-06, + "loss": 0.6987, + "step": 42750 + }, + { + "epoch": 1.1, + "learning_rate": 1.4662396645752653e-06, + "loss": 0.5643, + "step": 42751 + }, + { + "epoch": 1.1, + "learning_rate": 1.4662151854958933e-06, + "loss": 0.791, + "step": 42752 + }, + { + "epoch": 1.1, + "learning_rate": 1.466190706059561e-06, + "loss": 0.548, + "step": 42753 + }, + { + "epoch": 1.1, + "learning_rate": 1.4661662262662884e-06, + "loss": 0.5142, + "step": 42754 + }, + { + "epoch": 1.1, + "learning_rate": 1.4661417461160933e-06, + "loss": 0.7363, + "step": 42755 + }, + { + "epoch": 1.1, + "learning_rate": 1.4661172656089954e-06, + "loss": 0.6479, + "step": 42756 + }, + { + "epoch": 1.1, + "learning_rate": 1.4660927847450126e-06, + "loss": 0.7666, + "step": 42757 + }, + { + "epoch": 1.1, + "learning_rate": 1.4660683035241642e-06, + "loss": 0.6191, + "step": 42758 + }, + { + "epoch": 1.1, + "learning_rate": 1.4660438219464685e-06, + "loss": 0.6738, + "step": 42759 + }, + { + "epoch": 1.1, + "learning_rate": 1.4660193400119447e-06, + "loss": 0.6973, + "step": 42760 + }, + { + "epoch": 1.1, + "learning_rate": 1.465994857720611e-06, + "loss": 0.8506, + "step": 42761 + }, + { + "epoch": 1.1, + "learning_rate": 1.465970375072487e-06, + "loss": 0.7969, + "step": 42762 + }, + { + "epoch": 1.1, + "learning_rate": 1.4659458920675907e-06, + "loss": 0.4927, + "step": 42763 + }, + { + "epoch": 1.1, + "learning_rate": 1.465921408705941e-06, + "loss": 0.5603, + "step": 42764 + }, + { + "epoch": 1.1, + "learning_rate": 1.4658969249875566e-06, + "loss": 0.6924, + "step": 42765 + }, + { + "epoch": 1.1, + "learning_rate": 1.4658724409124563e-06, + "loss": 0.6777, + "step": 42766 + }, + { + "epoch": 1.1, + "learning_rate": 1.4658479564806591e-06, + "loss": 0.5757, + "step": 42767 + }, + { + "epoch": 1.1, + "learning_rate": 1.4658234716921834e-06, + "loss": 0.603, + "step": 42768 + }, + { + "epoch": 1.1, + "learning_rate": 1.4657989865470481e-06, + "loss": 0.6328, + "step": 42769 + }, + { + "epoch": 1.1, + "learning_rate": 1.4657745010452717e-06, + "loss": 0.7705, + "step": 42770 + }, + { + "epoch": 1.1, + "learning_rate": 1.4657500151868735e-06, + "loss": 0.8018, + "step": 42771 + }, + { + "epoch": 1.1, + "learning_rate": 1.465725528971872e-06, + "loss": 0.6455, + "step": 42772 + }, + { + "epoch": 1.1, + "learning_rate": 1.465701042400286e-06, + "loss": 0.6631, + "step": 42773 + }, + { + "epoch": 1.1, + "learning_rate": 1.4656765554721338e-06, + "loss": 0.6396, + "step": 42774 + }, + { + "epoch": 1.1, + "learning_rate": 1.4656520681874344e-06, + "loss": 0.6768, + "step": 42775 + }, + { + "epoch": 1.1, + "learning_rate": 1.4656275805462065e-06, + "loss": 0.7461, + "step": 42776 + }, + { + "epoch": 1.1, + "learning_rate": 1.4656030925484697e-06, + "loss": 0.6342, + "step": 42777 + }, + { + "epoch": 1.1, + "learning_rate": 1.4655786041942415e-06, + "loss": 0.6558, + "step": 42778 + }, + { + "epoch": 1.1, + "learning_rate": 1.4655541154835413e-06, + "loss": 0.66, + "step": 42779 + }, + { + "epoch": 1.1, + "learning_rate": 1.4655296264163875e-06, + "loss": 0.6655, + "step": 42780 + }, + { + "epoch": 1.1, + "learning_rate": 1.465505136992799e-06, + "loss": 0.7168, + "step": 42781 + }, + { + "epoch": 1.1, + "learning_rate": 1.4654806472127952e-06, + "loss": 0.5083, + "step": 42782 + }, + { + "epoch": 1.1, + "learning_rate": 1.465456157076394e-06, + "loss": 0.8008, + "step": 42783 + }, + { + "epoch": 1.1, + "learning_rate": 1.4654316665836142e-06, + "loss": 0.8652, + "step": 42784 + }, + { + "epoch": 1.1, + "learning_rate": 1.4654071757344748e-06, + "loss": 0.665, + "step": 42785 + }, + { + "epoch": 1.1, + "learning_rate": 1.4653826845289948e-06, + "loss": 0.5708, + "step": 42786 + }, + { + "epoch": 1.1, + "learning_rate": 1.4653581929671926e-06, + "loss": 0.6377, + "step": 42787 + }, + { + "epoch": 1.1, + "learning_rate": 1.465333701049087e-06, + "loss": 0.6992, + "step": 42788 + }, + { + "epoch": 1.1, + "learning_rate": 1.4653092087746965e-06, + "loss": 0.4055, + "step": 42789 + }, + { + "epoch": 1.1, + "learning_rate": 1.4652847161440405e-06, + "loss": 0.7065, + "step": 42790 + }, + { + "epoch": 1.1, + "learning_rate": 1.4652602231571369e-06, + "loss": 0.8213, + "step": 42791 + }, + { + "epoch": 1.1, + "learning_rate": 1.4652357298140057e-06, + "loss": 0.7607, + "step": 42792 + }, + { + "epoch": 1.1, + "learning_rate": 1.4652112361146642e-06, + "loss": 0.7119, + "step": 42793 + }, + { + "epoch": 1.1, + "learning_rate": 1.4651867420591324e-06, + "loss": 0.6411, + "step": 42794 + }, + { + "epoch": 1.1, + "learning_rate": 1.4651622476474279e-06, + "loss": 0.6582, + "step": 42795 + }, + { + "epoch": 1.1, + "learning_rate": 1.4651377528795706e-06, + "loss": 0.7012, + "step": 42796 + }, + { + "epoch": 1.1, + "learning_rate": 1.4651132577555785e-06, + "loss": 0.5624, + "step": 42797 + }, + { + "epoch": 1.1, + "learning_rate": 1.4650887622754706e-06, + "loss": 0.3966, + "step": 42798 + }, + { + "epoch": 1.1, + "learning_rate": 1.4650642664392655e-06, + "loss": 0.623, + "step": 42799 + }, + { + "epoch": 1.1, + "learning_rate": 1.4650397702469821e-06, + "loss": 0.5547, + "step": 42800 + }, + { + "epoch": 1.1, + "learning_rate": 1.465015273698639e-06, + "loss": 0.5732, + "step": 42801 + }, + { + "epoch": 1.1, + "learning_rate": 1.4649907767942558e-06, + "loss": 0.4348, + "step": 42802 + }, + { + "epoch": 1.1, + "learning_rate": 1.4649662795338498e-06, + "loss": 0.6602, + "step": 42803 + }, + { + "epoch": 1.1, + "learning_rate": 1.4649417819174409e-06, + "loss": 0.6152, + "step": 42804 + }, + { + "epoch": 1.1, + "learning_rate": 1.464917283945047e-06, + "loss": 0.7104, + "step": 42805 + }, + { + "epoch": 1.1, + "learning_rate": 1.4648927856166878e-06, + "loss": 0.623, + "step": 42806 + }, + { + "epoch": 1.1, + "learning_rate": 1.4648682869323814e-06, + "loss": 0.6567, + "step": 42807 + }, + { + "epoch": 1.1, + "learning_rate": 1.4648437878921464e-06, + "loss": 0.7949, + "step": 42808 + }, + { + "epoch": 1.1, + "learning_rate": 1.4648192884960022e-06, + "loss": 0.5835, + "step": 42809 + }, + { + "epoch": 1.1, + "learning_rate": 1.4647947887439671e-06, + "loss": 0.6694, + "step": 42810 + }, + { + "epoch": 1.1, + "learning_rate": 1.4647702886360603e-06, + "loss": 0.6841, + "step": 42811 + }, + { + "epoch": 1.1, + "learning_rate": 1.4647457881723e-06, + "loss": 0.6357, + "step": 42812 + }, + { + "epoch": 1.1, + "learning_rate": 1.4647212873527055e-06, + "loss": 0.7002, + "step": 42813 + }, + { + "epoch": 1.1, + "learning_rate": 1.464696786177295e-06, + "loss": 0.5874, + "step": 42814 + }, + { + "epoch": 1.1, + "learning_rate": 1.4646722846460877e-06, + "loss": 0.748, + "step": 42815 + }, + { + "epoch": 1.1, + "learning_rate": 1.4646477827591019e-06, + "loss": 0.8037, + "step": 42816 + }, + { + "epoch": 1.1, + "learning_rate": 1.4646232805163573e-06, + "loss": 0.5713, + "step": 42817 + }, + { + "epoch": 1.1, + "learning_rate": 1.4645987779178712e-06, + "loss": 0.5967, + "step": 42818 + }, + { + "epoch": 1.1, + "learning_rate": 1.4645742749636637e-06, + "loss": 0.5522, + "step": 42819 + }, + { + "epoch": 1.1, + "learning_rate": 1.4645497716537527e-06, + "loss": 0.478, + "step": 42820 + }, + { + "epoch": 1.1, + "learning_rate": 1.4645252679881577e-06, + "loss": 0.5962, + "step": 42821 + }, + { + "epoch": 1.1, + "learning_rate": 1.4645007639668968e-06, + "loss": 0.7734, + "step": 42822 + }, + { + "epoch": 1.1, + "learning_rate": 1.4644762595899892e-06, + "loss": 0.7744, + "step": 42823 + }, + { + "epoch": 1.1, + "learning_rate": 1.4644517548574534e-06, + "loss": 0.6914, + "step": 42824 + }, + { + "epoch": 1.1, + "learning_rate": 1.4644272497693081e-06, + "loss": 0.668, + "step": 42825 + }, + { + "epoch": 1.1, + "learning_rate": 1.4644027443255725e-06, + "loss": 0.5439, + "step": 42826 + }, + { + "epoch": 1.1, + "learning_rate": 1.464378238526265e-06, + "loss": 0.5918, + "step": 42827 + }, + { + "epoch": 1.1, + "learning_rate": 1.464353732371404e-06, + "loss": 0.6504, + "step": 42828 + }, + { + "epoch": 1.1, + "learning_rate": 1.4643292258610091e-06, + "loss": 0.5562, + "step": 42829 + }, + { + "epoch": 1.1, + "learning_rate": 1.4643047189950988e-06, + "loss": 0.708, + "step": 42830 + }, + { + "epoch": 1.1, + "learning_rate": 1.4642802117736913e-06, + "loss": 0.666, + "step": 42831 + }, + { + "epoch": 1.1, + "learning_rate": 1.4642557041968061e-06, + "loss": 0.5688, + "step": 42832 + }, + { + "epoch": 1.1, + "learning_rate": 1.4642311962644617e-06, + "loss": 0.6792, + "step": 42833 + }, + { + "epoch": 1.1, + "learning_rate": 1.4642066879766765e-06, + "loss": 0.7969, + "step": 42834 + }, + { + "epoch": 1.1, + "learning_rate": 1.4641821793334698e-06, + "loss": 0.7935, + "step": 42835 + }, + { + "epoch": 1.1, + "learning_rate": 1.4641576703348602e-06, + "loss": 0.6709, + "step": 42836 + }, + { + "epoch": 1.1, + "learning_rate": 1.4641331609808662e-06, + "loss": 0.7676, + "step": 42837 + }, + { + "epoch": 1.1, + "learning_rate": 1.4641086512715073e-06, + "loss": 0.5276, + "step": 42838 + }, + { + "epoch": 1.1, + "learning_rate": 1.464084141206801e-06, + "loss": 0.5996, + "step": 42839 + }, + { + "epoch": 1.1, + "learning_rate": 1.4640596307867674e-06, + "loss": 0.6826, + "step": 42840 + }, + { + "epoch": 1.1, + "learning_rate": 1.4640351200114244e-06, + "loss": 0.7227, + "step": 42841 + }, + { + "epoch": 1.1, + "learning_rate": 1.4640106088807913e-06, + "loss": 0.7461, + "step": 42842 + }, + { + "epoch": 1.1, + "learning_rate": 1.463986097394886e-06, + "loss": 0.6558, + "step": 42843 + }, + { + "epoch": 1.1, + "learning_rate": 1.4639615855537287e-06, + "loss": 0.6792, + "step": 42844 + }, + { + "epoch": 1.1, + "learning_rate": 1.4639370733573367e-06, + "loss": 0.4608, + "step": 42845 + }, + { + "epoch": 1.1, + "learning_rate": 1.4639125608057296e-06, + "loss": 0.6958, + "step": 42846 + }, + { + "epoch": 1.1, + "learning_rate": 1.4638880478989262e-06, + "loss": 0.6826, + "step": 42847 + }, + { + "epoch": 1.1, + "learning_rate": 1.463863534636945e-06, + "loss": 0.8281, + "step": 42848 + }, + { + "epoch": 1.1, + "learning_rate": 1.4638390210198045e-06, + "loss": 0.6768, + "step": 42849 + }, + { + "epoch": 1.1, + "learning_rate": 1.4638145070475241e-06, + "loss": 0.6152, + "step": 42850 + }, + { + "epoch": 1.1, + "learning_rate": 1.463789992720122e-06, + "loss": 0.7881, + "step": 42851 + }, + { + "epoch": 1.1, + "learning_rate": 1.4637654780376174e-06, + "loss": 0.6074, + "step": 42852 + }, + { + "epoch": 1.1, + "learning_rate": 1.4637409630000291e-06, + "loss": 0.6875, + "step": 42853 + }, + { + "epoch": 1.1, + "learning_rate": 1.4637164476073753e-06, + "loss": 0.7451, + "step": 42854 + }, + { + "epoch": 1.1, + "learning_rate": 1.4636919318596755e-06, + "loss": 0.75, + "step": 42855 + }, + { + "epoch": 1.1, + "learning_rate": 1.463667415756948e-06, + "loss": 0.4863, + "step": 42856 + }, + { + "epoch": 1.1, + "learning_rate": 1.4636428992992116e-06, + "loss": 0.5736, + "step": 42857 + }, + { + "epoch": 1.1, + "learning_rate": 1.463618382486485e-06, + "loss": 0.3523, + "step": 42858 + }, + { + "epoch": 1.1, + "learning_rate": 1.4635938653187871e-06, + "loss": 0.582, + "step": 42859 + }, + { + "epoch": 1.1, + "learning_rate": 1.4635693477961368e-06, + "loss": 0.5579, + "step": 42860 + }, + { + "epoch": 1.1, + "learning_rate": 1.463544829918553e-06, + "loss": 0.6228, + "step": 42861 + }, + { + "epoch": 1.1, + "learning_rate": 1.4635203116860543e-06, + "loss": 0.5052, + "step": 42862 + }, + { + "epoch": 1.1, + "learning_rate": 1.463495793098659e-06, + "loss": 0.6396, + "step": 42863 + }, + { + "epoch": 1.1, + "learning_rate": 1.4634712741563862e-06, + "loss": 0.6477, + "step": 42864 + }, + { + "epoch": 1.1, + "learning_rate": 1.4634467548592552e-06, + "loss": 0.7402, + "step": 42865 + }, + { + "epoch": 1.1, + "learning_rate": 1.4634222352072841e-06, + "loss": 0.6963, + "step": 42866 + }, + { + "epoch": 1.1, + "learning_rate": 1.4633977152004922e-06, + "loss": 0.8154, + "step": 42867 + }, + { + "epoch": 1.1, + "learning_rate": 1.4633731948388974e-06, + "loss": 0.5996, + "step": 42868 + }, + { + "epoch": 1.1, + "learning_rate": 1.4633486741225193e-06, + "loss": 0.7041, + "step": 42869 + }, + { + "epoch": 1.1, + "learning_rate": 1.4633241530513764e-06, + "loss": 0.6729, + "step": 42870 + }, + { + "epoch": 1.1, + "learning_rate": 1.4632996316254877e-06, + "loss": 0.709, + "step": 42871 + }, + { + "epoch": 1.1, + "learning_rate": 1.4632751098448718e-06, + "loss": 0.6709, + "step": 42872 + }, + { + "epoch": 1.1, + "learning_rate": 1.4632505877095473e-06, + "loss": 0.7163, + "step": 42873 + }, + { + "epoch": 1.1, + "learning_rate": 1.4632260652195332e-06, + "loss": 0.583, + "step": 42874 + }, + { + "epoch": 1.1, + "learning_rate": 1.463201542374848e-06, + "loss": 0.5049, + "step": 42875 + }, + { + "epoch": 1.1, + "learning_rate": 1.463177019175511e-06, + "loss": 0.7642, + "step": 42876 + }, + { + "epoch": 1.1, + "learning_rate": 1.4631524956215405e-06, + "loss": 0.5513, + "step": 42877 + }, + { + "epoch": 1.1, + "learning_rate": 1.4631279717129554e-06, + "loss": 0.6562, + "step": 42878 + }, + { + "epoch": 1.1, + "learning_rate": 1.4631034474497744e-06, + "loss": 0.4863, + "step": 42879 + }, + { + "epoch": 1.1, + "learning_rate": 1.4630789228320163e-06, + "loss": 0.6177, + "step": 42880 + }, + { + "epoch": 1.1, + "learning_rate": 1.4630543978597004e-06, + "loss": 0.6035, + "step": 42881 + }, + { + "epoch": 1.1, + "learning_rate": 1.4630298725328449e-06, + "loss": 0.7002, + "step": 42882 + }, + { + "epoch": 1.1, + "learning_rate": 1.4630053468514686e-06, + "loss": 0.3999, + "step": 42883 + }, + { + "epoch": 1.1, + "learning_rate": 1.4629808208155903e-06, + "loss": 0.6045, + "step": 42884 + }, + { + "epoch": 1.1, + "learning_rate": 1.462956294425229e-06, + "loss": 0.5986, + "step": 42885 + }, + { + "epoch": 1.1, + "learning_rate": 1.4629317676804033e-06, + "loss": 0.5093, + "step": 42886 + }, + { + "epoch": 1.1, + "learning_rate": 1.4629072405811322e-06, + "loss": 0.5981, + "step": 42887 + }, + { + "epoch": 1.1, + "learning_rate": 1.462882713127434e-06, + "loss": 0.7227, + "step": 42888 + }, + { + "epoch": 1.1, + "learning_rate": 1.462858185319328e-06, + "loss": 0.7988, + "step": 42889 + }, + { + "epoch": 1.1, + "learning_rate": 1.4628336571568328e-06, + "loss": 0.5225, + "step": 42890 + }, + { + "epoch": 1.1, + "learning_rate": 1.4628091286399671e-06, + "loss": 0.593, + "step": 42891 + }, + { + "epoch": 1.1, + "learning_rate": 1.4627845997687499e-06, + "loss": 0.6501, + "step": 42892 + }, + { + "epoch": 1.1, + "learning_rate": 1.4627600705431995e-06, + "loss": 0.5986, + "step": 42893 + }, + { + "epoch": 1.1, + "learning_rate": 1.4627355409633354e-06, + "loss": 0.6943, + "step": 42894 + }, + { + "epoch": 1.1, + "learning_rate": 1.4627110110291754e-06, + "loss": 0.7607, + "step": 42895 + }, + { + "epoch": 1.1, + "learning_rate": 1.462686480740739e-06, + "loss": 0.6162, + "step": 42896 + }, + { + "epoch": 1.1, + "learning_rate": 1.4626619500980454e-06, + "loss": 0.7646, + "step": 42897 + }, + { + "epoch": 1.1, + "learning_rate": 1.462637419101112e-06, + "loss": 0.7378, + "step": 42898 + }, + { + "epoch": 1.1, + "learning_rate": 1.4626128877499588e-06, + "loss": 0.5435, + "step": 42899 + }, + { + "epoch": 1.1, + "learning_rate": 1.4625883560446042e-06, + "loss": 0.6748, + "step": 42900 + }, + { + "epoch": 1.1, + "learning_rate": 1.462563823985067e-06, + "loss": 0.75, + "step": 42901 + }, + { + "epoch": 1.1, + "learning_rate": 1.4625392915713662e-06, + "loss": 0.6963, + "step": 42902 + }, + { + "epoch": 1.1, + "learning_rate": 1.46251475880352e-06, + "loss": 0.6333, + "step": 42903 + }, + { + "epoch": 1.1, + "learning_rate": 1.4624902256815475e-06, + "loss": 0.8789, + "step": 42904 + }, + { + "epoch": 1.1, + "learning_rate": 1.4624656922054674e-06, + "loss": 0.626, + "step": 42905 + }, + { + "epoch": 1.1, + "learning_rate": 1.4624411583752987e-06, + "loss": 0.7754, + "step": 42906 + }, + { + "epoch": 1.1, + "learning_rate": 1.4624166241910603e-06, + "loss": 0.5952, + "step": 42907 + }, + { + "epoch": 1.1, + "learning_rate": 1.4623920896527703e-06, + "loss": 0.698, + "step": 42908 + }, + { + "epoch": 1.1, + "learning_rate": 1.4623675547604486e-06, + "loss": 0.7305, + "step": 42909 + }, + { + "epoch": 1.1, + "learning_rate": 1.4623430195141126e-06, + "loss": 0.749, + "step": 42910 + }, + { + "epoch": 1.1, + "learning_rate": 1.4623184839137823e-06, + "loss": 0.6294, + "step": 42911 + }, + { + "epoch": 1.1, + "learning_rate": 1.4622939479594759e-06, + "loss": 0.6533, + "step": 42912 + }, + { + "epoch": 1.1, + "learning_rate": 1.4622694116512121e-06, + "loss": 0.5737, + "step": 42913 + }, + { + "epoch": 1.1, + "learning_rate": 1.46224487498901e-06, + "loss": 0.7393, + "step": 42914 + }, + { + "epoch": 1.1, + "learning_rate": 1.4622203379728884e-06, + "loss": 0.6895, + "step": 42915 + }, + { + "epoch": 1.1, + "learning_rate": 1.4621958006028657e-06, + "loss": 0.5347, + "step": 42916 + }, + { + "epoch": 1.1, + "learning_rate": 1.462171262878961e-06, + "loss": 0.5554, + "step": 42917 + }, + { + "epoch": 1.1, + "learning_rate": 1.462146724801193e-06, + "loss": 0.833, + "step": 42918 + }, + { + "epoch": 1.1, + "learning_rate": 1.4621221863695805e-06, + "loss": 0.668, + "step": 42919 + }, + { + "epoch": 1.1, + "learning_rate": 1.4620976475841423e-06, + "loss": 0.6226, + "step": 42920 + }, + { + "epoch": 1.1, + "learning_rate": 1.462073108444897e-06, + "loss": 0.6138, + "step": 42921 + }, + { + "epoch": 1.1, + "learning_rate": 1.462048568951864e-06, + "loss": 0.8682, + "step": 42922 + }, + { + "epoch": 1.1, + "learning_rate": 1.4620240291050615e-06, + "loss": 0.6895, + "step": 42923 + }, + { + "epoch": 1.1, + "learning_rate": 1.4619994889045081e-06, + "loss": 0.6223, + "step": 42924 + }, + { + "epoch": 1.1, + "learning_rate": 1.4619749483502233e-06, + "loss": 0.5752, + "step": 42925 + }, + { + "epoch": 1.1, + "learning_rate": 1.4619504074422252e-06, + "loss": 0.8066, + "step": 42926 + }, + { + "epoch": 1.1, + "learning_rate": 1.4619258661805334e-06, + "loss": 0.6147, + "step": 42927 + }, + { + "epoch": 1.1, + "learning_rate": 1.4619013245651659e-06, + "loss": 0.752, + "step": 42928 + }, + { + "epoch": 1.1, + "learning_rate": 1.4618767825961418e-06, + "loss": 0.7969, + "step": 42929 + }, + { + "epoch": 1.1, + "learning_rate": 1.46185224027348e-06, + "loss": 0.8291, + "step": 42930 + }, + { + "epoch": 1.1, + "learning_rate": 1.4618276975971988e-06, + "loss": 0.6577, + "step": 42931 + }, + { + "epoch": 1.1, + "learning_rate": 1.461803154567318e-06, + "loss": 0.6089, + "step": 42932 + }, + { + "epoch": 1.1, + "learning_rate": 1.4617786111838552e-06, + "loss": 0.7529, + "step": 42933 + }, + { + "epoch": 1.1, + "learning_rate": 1.46175406744683e-06, + "loss": 0.6572, + "step": 42934 + }, + { + "epoch": 1.1, + "learning_rate": 1.461729523356261e-06, + "loss": 0.8398, + "step": 42935 + }, + { + "epoch": 1.1, + "learning_rate": 1.461704978912167e-06, + "loss": 0.6216, + "step": 42936 + }, + { + "epoch": 1.1, + "learning_rate": 1.4616804341145664e-06, + "loss": 0.5586, + "step": 42937 + }, + { + "epoch": 1.1, + "learning_rate": 1.4616558889634788e-06, + "loss": 0.6094, + "step": 42938 + }, + { + "epoch": 1.1, + "learning_rate": 1.4616313434589218e-06, + "loss": 0.7065, + "step": 42939 + }, + { + "epoch": 1.1, + "learning_rate": 1.4616067976009153e-06, + "loss": 0.7773, + "step": 42940 + }, + { + "epoch": 1.1, + "learning_rate": 1.4615822513894778e-06, + "loss": 0.4971, + "step": 42941 + }, + { + "epoch": 1.1, + "learning_rate": 1.4615577048246279e-06, + "loss": 0.6948, + "step": 42942 + }, + { + "epoch": 1.1, + "learning_rate": 1.4615331579063845e-06, + "loss": 0.6523, + "step": 42943 + }, + { + "epoch": 1.1, + "learning_rate": 1.4615086106347663e-06, + "loss": 0.626, + "step": 42944 + }, + { + "epoch": 1.1, + "learning_rate": 1.4614840630097923e-06, + "loss": 0.6826, + "step": 42945 + }, + { + "epoch": 1.1, + "learning_rate": 1.4614595150314811e-06, + "loss": 0.7588, + "step": 42946 + }, + { + "epoch": 1.1, + "learning_rate": 1.4614349666998518e-06, + "loss": 0.5205, + "step": 42947 + }, + { + "epoch": 1.1, + "learning_rate": 1.4614104180149228e-06, + "loss": 0.6621, + "step": 42948 + }, + { + "epoch": 1.1, + "learning_rate": 1.461385868976713e-06, + "loss": 0.6694, + "step": 42949 + }, + { + "epoch": 1.1, + "learning_rate": 1.461361319585241e-06, + "loss": 0.873, + "step": 42950 + }, + { + "epoch": 1.1, + "learning_rate": 1.4613367698405262e-06, + "loss": 0.5923, + "step": 42951 + }, + { + "epoch": 1.1, + "learning_rate": 1.461312219742587e-06, + "loss": 0.6431, + "step": 42952 + }, + { + "epoch": 1.1, + "learning_rate": 1.4612876692914424e-06, + "loss": 0.6401, + "step": 42953 + }, + { + "epoch": 1.1, + "learning_rate": 1.4612631184871108e-06, + "loss": 0.6411, + "step": 42954 + }, + { + "epoch": 1.1, + "learning_rate": 1.4612385673296113e-06, + "loss": 0.644, + "step": 42955 + }, + { + "epoch": 1.1, + "learning_rate": 1.4612140158189625e-06, + "loss": 0.7891, + "step": 42956 + }, + { + "epoch": 1.1, + "learning_rate": 1.4611894639551837e-06, + "loss": 0.584, + "step": 42957 + }, + { + "epoch": 1.1, + "learning_rate": 1.461164911738293e-06, + "loss": 0.6211, + "step": 42958 + }, + { + "epoch": 1.1, + "learning_rate": 1.4611403591683095e-06, + "loss": 0.6152, + "step": 42959 + }, + { + "epoch": 1.1, + "learning_rate": 1.4611158062452523e-06, + "loss": 0.4648, + "step": 42960 + }, + { + "epoch": 1.1, + "learning_rate": 1.4610912529691396e-06, + "loss": 0.6365, + "step": 42961 + }, + { + "epoch": 1.1, + "learning_rate": 1.4610666993399909e-06, + "loss": 0.6523, + "step": 42962 + }, + { + "epoch": 1.1, + "learning_rate": 1.4610421453578244e-06, + "loss": 0.7334, + "step": 42963 + }, + { + "epoch": 1.1, + "learning_rate": 1.4610175910226592e-06, + "loss": 0.7031, + "step": 42964 + }, + { + "epoch": 1.1, + "learning_rate": 1.4609930363345143e-06, + "loss": 0.604, + "step": 42965 + }, + { + "epoch": 1.1, + "learning_rate": 1.4609684812934075e-06, + "loss": 0.8154, + "step": 42966 + }, + { + "epoch": 1.1, + "learning_rate": 1.460943925899359e-06, + "loss": 0.542, + "step": 42967 + }, + { + "epoch": 1.1, + "learning_rate": 1.4609193701523868e-06, + "loss": 0.7856, + "step": 42968 + }, + { + "epoch": 1.1, + "learning_rate": 1.4608948140525096e-06, + "loss": 0.603, + "step": 42969 + }, + { + "epoch": 1.1, + "learning_rate": 1.4608702575997466e-06, + "loss": 0.623, + "step": 42970 + }, + { + "epoch": 1.1, + "learning_rate": 1.4608457007941165e-06, + "loss": 0.7607, + "step": 42971 + }, + { + "epoch": 1.1, + "learning_rate": 1.4608211436356379e-06, + "loss": 0.6685, + "step": 42972 + }, + { + "epoch": 1.1, + "learning_rate": 1.4607965861243296e-06, + "loss": 0.6562, + "step": 42973 + }, + { + "epoch": 1.1, + "learning_rate": 1.4607720282602109e-06, + "loss": 0.6161, + "step": 42974 + }, + { + "epoch": 1.1, + "learning_rate": 1.4607474700433e-06, + "loss": 0.8242, + "step": 42975 + }, + { + "epoch": 1.1, + "learning_rate": 1.4607229114736162e-06, + "loss": 0.7109, + "step": 42976 + }, + { + "epoch": 1.1, + "learning_rate": 1.4606983525511779e-06, + "loss": 0.5647, + "step": 42977 + }, + { + "epoch": 1.1, + "learning_rate": 1.4606737932760037e-06, + "loss": 0.7012, + "step": 42978 + }, + { + "epoch": 1.1, + "learning_rate": 1.4606492336481134e-06, + "loss": 0.6953, + "step": 42979 + }, + { + "epoch": 1.1, + "learning_rate": 1.4606246736675247e-06, + "loss": 0.6836, + "step": 42980 + }, + { + "epoch": 1.1, + "learning_rate": 1.460600113334257e-06, + "loss": 0.5184, + "step": 42981 + }, + { + "epoch": 1.1, + "learning_rate": 1.4605755526483293e-06, + "loss": 0.665, + "step": 42982 + }, + { + "epoch": 1.1, + "learning_rate": 1.4605509916097596e-06, + "loss": 0.75, + "step": 42983 + }, + { + "epoch": 1.1, + "learning_rate": 1.460526430218567e-06, + "loss": 0.6992, + "step": 42984 + }, + { + "epoch": 1.1, + "learning_rate": 1.460501868474771e-06, + "loss": 0.5952, + "step": 42985 + }, + { + "epoch": 1.1, + "learning_rate": 1.4604773063783898e-06, + "loss": 0.6777, + "step": 42986 + }, + { + "epoch": 1.1, + "learning_rate": 1.4604527439294423e-06, + "loss": 0.6858, + "step": 42987 + }, + { + "epoch": 1.1, + "learning_rate": 1.4604281811279472e-06, + "loss": 0.6719, + "step": 42988 + }, + { + "epoch": 1.1, + "learning_rate": 1.4604036179739235e-06, + "loss": 0.7656, + "step": 42989 + }, + { + "epoch": 1.1, + "learning_rate": 1.4603790544673895e-06, + "loss": 0.6099, + "step": 42990 + }, + { + "epoch": 1.1, + "learning_rate": 1.4603544906083652e-06, + "loss": 0.7812, + "step": 42991 + }, + { + "epoch": 1.1, + "learning_rate": 1.4603299263968681e-06, + "loss": 0.7061, + "step": 42992 + }, + { + "epoch": 1.1, + "learning_rate": 1.4603053618329177e-06, + "loss": 0.5762, + "step": 42993 + }, + { + "epoch": 1.1, + "learning_rate": 1.4602807969165325e-06, + "loss": 0.7285, + "step": 42994 + }, + { + "epoch": 1.1, + "learning_rate": 1.4602562316477316e-06, + "loss": 0.7061, + "step": 42995 + }, + { + "epoch": 1.1, + "learning_rate": 1.4602316660265336e-06, + "loss": 0.5737, + "step": 42996 + }, + { + "epoch": 1.1, + "learning_rate": 1.4602071000529575e-06, + "loss": 0.71, + "step": 42997 + }, + { + "epoch": 1.1, + "learning_rate": 1.4601825337270218e-06, + "loss": 0.6694, + "step": 42998 + }, + { + "epoch": 1.1, + "learning_rate": 1.4601579670487456e-06, + "loss": 0.6992, + "step": 42999 + }, + { + "epoch": 1.1, + "learning_rate": 1.4601334000181475e-06, + "loss": 0.4534, + "step": 43000 + }, + { + "epoch": 1.1, + "learning_rate": 1.4601088326352468e-06, + "loss": 0.6143, + "step": 43001 + }, + { + "epoch": 1.1, + "learning_rate": 1.4600842649000615e-06, + "loss": 0.8281, + "step": 43002 + }, + { + "epoch": 1.1, + "learning_rate": 1.4600596968126111e-06, + "loss": 0.6846, + "step": 43003 + }, + { + "epoch": 1.1, + "learning_rate": 1.460035128372914e-06, + "loss": 0.6304, + "step": 43004 + }, + { + "epoch": 1.1, + "learning_rate": 1.460010559580989e-06, + "loss": 0.6611, + "step": 43005 + }, + { + "epoch": 1.1, + "learning_rate": 1.4599859904368555e-06, + "loss": 0.6499, + "step": 43006 + }, + { + "epoch": 1.1, + "learning_rate": 1.4599614209405312e-06, + "loss": 0.4458, + "step": 43007 + }, + { + "epoch": 1.1, + "learning_rate": 1.4599368510920362e-06, + "loss": 0.6099, + "step": 43008 + }, + { + "epoch": 1.1, + "learning_rate": 1.4599122808913885e-06, + "loss": 0.6519, + "step": 43009 + }, + { + "epoch": 1.1, + "learning_rate": 1.4598877103386072e-06, + "loss": 0.4739, + "step": 43010 + }, + { + "epoch": 1.1, + "learning_rate": 1.459863139433711e-06, + "loss": 0.5663, + "step": 43011 + }, + { + "epoch": 1.1, + "learning_rate": 1.4598385681767187e-06, + "loss": 0.606, + "step": 43012 + }, + { + "epoch": 1.1, + "learning_rate": 1.4598139965676488e-06, + "loss": 0.7012, + "step": 43013 + }, + { + "epoch": 1.1, + "learning_rate": 1.459789424606521e-06, + "loss": 0.6152, + "step": 43014 + }, + { + "epoch": 1.1, + "learning_rate": 1.4597648522933533e-06, + "loss": 0.6201, + "step": 43015 + }, + { + "epoch": 1.1, + "learning_rate": 1.459740279628165e-06, + "loss": 0.6689, + "step": 43016 + }, + { + "epoch": 1.1, + "learning_rate": 1.4597157066109746e-06, + "loss": 0.7852, + "step": 43017 + }, + { + "epoch": 1.1, + "learning_rate": 1.459691133241801e-06, + "loss": 0.6313, + "step": 43018 + }, + { + "epoch": 1.1, + "learning_rate": 1.459666559520663e-06, + "loss": 0.874, + "step": 43019 + }, + { + "epoch": 1.1, + "learning_rate": 1.4596419854475795e-06, + "loss": 0.6953, + "step": 43020 + }, + { + "epoch": 1.1, + "learning_rate": 1.4596174110225691e-06, + "loss": 0.751, + "step": 43021 + }, + { + "epoch": 1.1, + "learning_rate": 1.459592836245651e-06, + "loss": 0.7803, + "step": 43022 + }, + { + "epoch": 1.1, + "learning_rate": 1.4595682611168439e-06, + "loss": 0.7852, + "step": 43023 + }, + { + "epoch": 1.1, + "learning_rate": 1.4595436856361664e-06, + "loss": 0.7178, + "step": 43024 + }, + { + "epoch": 1.1, + "learning_rate": 1.459519109803637e-06, + "loss": 0.6963, + "step": 43025 + }, + { + "epoch": 1.1, + "learning_rate": 1.4594945336192757e-06, + "loss": 0.543, + "step": 43026 + }, + { + "epoch": 1.1, + "learning_rate": 1.4594699570831002e-06, + "loss": 0.7139, + "step": 43027 + }, + { + "epoch": 1.1, + "learning_rate": 1.4594453801951297e-06, + "loss": 0.791, + "step": 43028 + }, + { + "epoch": 1.1, + "learning_rate": 1.4594208029553827e-06, + "loss": 0.5742, + "step": 43029 + }, + { + "epoch": 1.1, + "learning_rate": 1.4593962253638787e-06, + "loss": 0.709, + "step": 43030 + }, + { + "epoch": 1.1, + "learning_rate": 1.459371647420636e-06, + "loss": 0.7734, + "step": 43031 + }, + { + "epoch": 1.1, + "learning_rate": 1.4593470691256735e-06, + "loss": 0.4727, + "step": 43032 + }, + { + "epoch": 1.1, + "learning_rate": 1.4593224904790103e-06, + "loss": 0.5889, + "step": 43033 + }, + { + "epoch": 1.1, + "learning_rate": 1.4592979114806644e-06, + "loss": 0.5042, + "step": 43034 + }, + { + "epoch": 1.1, + "learning_rate": 1.4592733321306559e-06, + "loss": 0.5967, + "step": 43035 + }, + { + "epoch": 1.1, + "learning_rate": 1.4592487524290027e-06, + "loss": 0.6807, + "step": 43036 + }, + { + "epoch": 1.1, + "learning_rate": 1.4592241723757239e-06, + "loss": 0.5337, + "step": 43037 + }, + { + "epoch": 1.1, + "learning_rate": 1.459199591970838e-06, + "loss": 0.6445, + "step": 43038 + }, + { + "epoch": 1.1, + "learning_rate": 1.4591750112143644e-06, + "loss": 0.7861, + "step": 43039 + }, + { + "epoch": 1.1, + "learning_rate": 1.4591504301063214e-06, + "loss": 0.7695, + "step": 43040 + }, + { + "epoch": 1.1, + "learning_rate": 1.4591258486467284e-06, + "loss": 0.7007, + "step": 43041 + }, + { + "epoch": 1.1, + "learning_rate": 1.4591012668356034e-06, + "loss": 0.5815, + "step": 43042 + }, + { + "epoch": 1.1, + "learning_rate": 1.4590766846729658e-06, + "loss": 0.6904, + "step": 43043 + }, + { + "epoch": 1.1, + "learning_rate": 1.4590521021588342e-06, + "loss": 0.7881, + "step": 43044 + }, + { + "epoch": 1.1, + "learning_rate": 1.4590275192932277e-06, + "loss": 0.7158, + "step": 43045 + }, + { + "epoch": 1.1, + "learning_rate": 1.4590029360761648e-06, + "loss": 0.5063, + "step": 43046 + }, + { + "epoch": 1.1, + "learning_rate": 1.4589783525076647e-06, + "loss": 0.6572, + "step": 43047 + }, + { + "epoch": 1.1, + "learning_rate": 1.4589537685877457e-06, + "loss": 0.6992, + "step": 43048 + }, + { + "epoch": 1.1, + "learning_rate": 1.458929184316427e-06, + "loss": 0.6777, + "step": 43049 + }, + { + "epoch": 1.1, + "learning_rate": 1.4589045996937272e-06, + "loss": 0.7075, + "step": 43050 + }, + { + "epoch": 1.1, + "learning_rate": 1.4588800147196655e-06, + "loss": 0.6484, + "step": 43051 + }, + { + "epoch": 1.1, + "learning_rate": 1.4588554293942603e-06, + "loss": 0.751, + "step": 43052 + }, + { + "epoch": 1.1, + "learning_rate": 1.4588308437175308e-06, + "loss": 0.709, + "step": 43053 + }, + { + "epoch": 1.1, + "learning_rate": 1.4588062576894952e-06, + "loss": 0.5879, + "step": 43054 + }, + { + "epoch": 1.1, + "learning_rate": 1.4587816713101733e-06, + "loss": 0.6943, + "step": 43055 + }, + { + "epoch": 1.1, + "learning_rate": 1.4587570845795832e-06, + "loss": 0.71, + "step": 43056 + }, + { + "epoch": 1.1, + "learning_rate": 1.4587324974977436e-06, + "loss": 0.5811, + "step": 43057 + }, + { + "epoch": 1.1, + "learning_rate": 1.4587079100646737e-06, + "loss": 0.4819, + "step": 43058 + }, + { + "epoch": 1.1, + "learning_rate": 1.4586833222803922e-06, + "loss": 0.7686, + "step": 43059 + }, + { + "epoch": 1.1, + "learning_rate": 1.4586587341449184e-06, + "loss": 0.6475, + "step": 43060 + }, + { + "epoch": 1.1, + "learning_rate": 1.4586341456582702e-06, + "loss": 0.7363, + "step": 43061 + }, + { + "epoch": 1.1, + "learning_rate": 1.4586095568204673e-06, + "loss": 0.6943, + "step": 43062 + }, + { + "epoch": 1.1, + "learning_rate": 1.4585849676315277e-06, + "loss": 0.6538, + "step": 43063 + }, + { + "epoch": 1.1, + "learning_rate": 1.4585603780914712e-06, + "loss": 0.6211, + "step": 43064 + }, + { + "epoch": 1.1, + "learning_rate": 1.4585357882003158e-06, + "loss": 0.6689, + "step": 43065 + }, + { + "epoch": 1.1, + "learning_rate": 1.4585111979580808e-06, + "loss": 0.7393, + "step": 43066 + }, + { + "epoch": 1.1, + "learning_rate": 1.4584866073647848e-06, + "loss": 0.6396, + "step": 43067 + }, + { + "epoch": 1.1, + "learning_rate": 1.4584620164204466e-06, + "loss": 0.5938, + "step": 43068 + }, + { + "epoch": 1.1, + "learning_rate": 1.458437425125085e-06, + "loss": 0.511, + "step": 43069 + }, + { + "epoch": 1.1, + "learning_rate": 1.458412833478719e-06, + "loss": 0.5962, + "step": 43070 + }, + { + "epoch": 1.1, + "learning_rate": 1.4583882414813677e-06, + "loss": 0.6938, + "step": 43071 + }, + { + "epoch": 1.1, + "learning_rate": 1.4583636491330492e-06, + "loss": 0.5347, + "step": 43072 + }, + { + "epoch": 1.1, + "learning_rate": 1.458339056433783e-06, + "loss": 0.8008, + "step": 43073 + }, + { + "epoch": 1.1, + "learning_rate": 1.4583144633835875e-06, + "loss": 0.6494, + "step": 43074 + }, + { + "epoch": 1.1, + "learning_rate": 1.4582898699824816e-06, + "loss": 0.8926, + "step": 43075 + }, + { + "epoch": 1.1, + "learning_rate": 1.4582652762304846e-06, + "loss": 0.5312, + "step": 43076 + }, + { + "epoch": 1.1, + "learning_rate": 1.4582406821276147e-06, + "loss": 0.459, + "step": 43077 + }, + { + "epoch": 1.1, + "learning_rate": 1.458216087673891e-06, + "loss": 0.6294, + "step": 43078 + }, + { + "epoch": 1.1, + "learning_rate": 1.4581914928693323e-06, + "loss": 0.6475, + "step": 43079 + }, + { + "epoch": 1.1, + "learning_rate": 1.4581668977139572e-06, + "loss": 0.7036, + "step": 43080 + }, + { + "epoch": 1.1, + "learning_rate": 1.4581423022077854e-06, + "loss": 0.7656, + "step": 43081 + }, + { + "epoch": 1.1, + "learning_rate": 1.4581177063508346e-06, + "loss": 0.5913, + "step": 43082 + }, + { + "epoch": 1.1, + "learning_rate": 1.4580931101431243e-06, + "loss": 0.6807, + "step": 43083 + }, + { + "epoch": 1.1, + "learning_rate": 1.458068513584673e-06, + "loss": 0.6182, + "step": 43084 + }, + { + "epoch": 1.1, + "learning_rate": 1.4580439166754998e-06, + "loss": 0.6494, + "step": 43085 + }, + { + "epoch": 1.1, + "learning_rate": 1.4580193194156235e-06, + "loss": 0.7256, + "step": 43086 + }, + { + "epoch": 1.1, + "learning_rate": 1.457994721805063e-06, + "loss": 0.7422, + "step": 43087 + }, + { + "epoch": 1.1, + "learning_rate": 1.4579701238438369e-06, + "loss": 0.7842, + "step": 43088 + }, + { + "epoch": 1.1, + "learning_rate": 1.457945525531964e-06, + "loss": 0.4829, + "step": 43089 + }, + { + "epoch": 1.1, + "learning_rate": 1.4579209268694632e-06, + "loss": 0.75, + "step": 43090 + }, + { + "epoch": 1.1, + "learning_rate": 1.4578963278563539e-06, + "loss": 0.5791, + "step": 43091 + }, + { + "epoch": 1.1, + "learning_rate": 1.4578717284926538e-06, + "loss": 0.7383, + "step": 43092 + }, + { + "epoch": 1.1, + "learning_rate": 1.4578471287783827e-06, + "loss": 0.5801, + "step": 43093 + }, + { + "epoch": 1.1, + "learning_rate": 1.457822528713559e-06, + "loss": 0.4785, + "step": 43094 + }, + { + "epoch": 1.1, + "learning_rate": 1.457797928298202e-06, + "loss": 0.48, + "step": 43095 + }, + { + "epoch": 1.1, + "learning_rate": 1.4577733275323297e-06, + "loss": 0.458, + "step": 43096 + }, + { + "epoch": 1.1, + "learning_rate": 1.4577487264159613e-06, + "loss": 0.5933, + "step": 43097 + }, + { + "epoch": 1.1, + "learning_rate": 1.4577241249491162e-06, + "loss": 0.7227, + "step": 43098 + }, + { + "epoch": 1.1, + "learning_rate": 1.4576995231318128e-06, + "loss": 0.6533, + "step": 43099 + }, + { + "epoch": 1.1, + "learning_rate": 1.4576749209640695e-06, + "loss": 0.7588, + "step": 43100 + }, + { + "epoch": 1.1, + "learning_rate": 1.457650318445906e-06, + "loss": 0.6812, + "step": 43101 + }, + { + "epoch": 1.1, + "learning_rate": 1.4576257155773404e-06, + "loss": 0.5466, + "step": 43102 + }, + { + "epoch": 1.1, + "learning_rate": 1.4576011123583917e-06, + "loss": 0.7236, + "step": 43103 + }, + { + "epoch": 1.1, + "learning_rate": 1.4575765087890793e-06, + "loss": 0.6274, + "step": 43104 + }, + { + "epoch": 1.1, + "learning_rate": 1.4575519048694211e-06, + "loss": 0.5586, + "step": 43105 + }, + { + "epoch": 1.1, + "learning_rate": 1.4575273005994371e-06, + "loss": 0.7549, + "step": 43106 + }, + { + "epoch": 1.1, + "learning_rate": 1.457502695979145e-06, + "loss": 0.6724, + "step": 43107 + }, + { + "epoch": 1.1, + "learning_rate": 1.4574780910085642e-06, + "loss": 0.623, + "step": 43108 + }, + { + "epoch": 1.1, + "learning_rate": 1.4574534856877136e-06, + "loss": 0.7314, + "step": 43109 + }, + { + "epoch": 1.1, + "learning_rate": 1.4574288800166118e-06, + "loss": 0.7949, + "step": 43110 + }, + { + "epoch": 1.1, + "learning_rate": 1.4574042739952779e-06, + "loss": 0.751, + "step": 43111 + }, + { + "epoch": 1.1, + "learning_rate": 1.4573796676237303e-06, + "loss": 0.5382, + "step": 43112 + }, + { + "epoch": 1.11, + "learning_rate": 1.4573550609019883e-06, + "loss": 0.5798, + "step": 43113 + }, + { + "epoch": 1.11, + "learning_rate": 1.4573304538300705e-06, + "loss": 0.7441, + "step": 43114 + }, + { + "epoch": 1.11, + "learning_rate": 1.4573058464079957e-06, + "loss": 0.4563, + "step": 43115 + }, + { + "epoch": 1.11, + "learning_rate": 1.457281238635783e-06, + "loss": 0.772, + "step": 43116 + }, + { + "epoch": 1.11, + "learning_rate": 1.457256630513451e-06, + "loss": 0.623, + "step": 43117 + }, + { + "epoch": 1.11, + "learning_rate": 1.4572320220410187e-06, + "loss": 0.6914, + "step": 43118 + }, + { + "epoch": 1.11, + "learning_rate": 1.4572074132185047e-06, + "loss": 0.5283, + "step": 43119 + }, + { + "epoch": 1.11, + "learning_rate": 1.4571828040459281e-06, + "loss": 0.5957, + "step": 43120 + }, + { + "epoch": 1.11, + "learning_rate": 1.4571581945233077e-06, + "loss": 0.6548, + "step": 43121 + }, + { + "epoch": 1.11, + "learning_rate": 1.4571335846506622e-06, + "loss": 0.7578, + "step": 43122 + }, + { + "epoch": 1.11, + "learning_rate": 1.457108974428011e-06, + "loss": 0.6758, + "step": 43123 + }, + { + "epoch": 1.11, + "learning_rate": 1.457084363855372e-06, + "loss": 0.6674, + "step": 43124 + }, + { + "epoch": 1.11, + "learning_rate": 1.4570597529327644e-06, + "loss": 0.6865, + "step": 43125 + }, + { + "epoch": 1.11, + "learning_rate": 1.4570351416602074e-06, + "loss": 0.4265, + "step": 43126 + }, + { + "epoch": 1.11, + "learning_rate": 1.4570105300377197e-06, + "loss": 0.6914, + "step": 43127 + }, + { + "epoch": 1.11, + "learning_rate": 1.4569859180653197e-06, + "loss": 0.7485, + "step": 43128 + }, + { + "epoch": 1.11, + "learning_rate": 1.456961305743027e-06, + "loss": 0.6289, + "step": 43129 + }, + { + "epoch": 1.11, + "learning_rate": 1.4569366930708596e-06, + "loss": 0.6514, + "step": 43130 + }, + { + "epoch": 1.11, + "learning_rate": 1.4569120800488373e-06, + "loss": 0.749, + "step": 43131 + }, + { + "epoch": 1.11, + "learning_rate": 1.4568874666769782e-06, + "loss": 0.6318, + "step": 43132 + }, + { + "epoch": 1.11, + "learning_rate": 1.4568628529553012e-06, + "loss": 0.6299, + "step": 43133 + }, + { + "epoch": 1.11, + "learning_rate": 1.4568382388838255e-06, + "loss": 0.6787, + "step": 43134 + }, + { + "epoch": 1.11, + "learning_rate": 1.4568136244625698e-06, + "loss": 0.4829, + "step": 43135 + }, + { + "epoch": 1.11, + "learning_rate": 1.4567890096915529e-06, + "loss": 0.4071, + "step": 43136 + }, + { + "epoch": 1.11, + "learning_rate": 1.4567643945707935e-06, + "loss": 0.7344, + "step": 43137 + }, + { + "epoch": 1.11, + "learning_rate": 1.4567397791003107e-06, + "loss": 0.5967, + "step": 43138 + }, + { + "epoch": 1.11, + "learning_rate": 1.4567151632801233e-06, + "loss": 0.8242, + "step": 43139 + }, + { + "epoch": 1.11, + "learning_rate": 1.4566905471102499e-06, + "loss": 0.6172, + "step": 43140 + }, + { + "epoch": 1.11, + "learning_rate": 1.4566659305907098e-06, + "loss": 0.6445, + "step": 43141 + }, + { + "epoch": 1.11, + "learning_rate": 1.4566413137215215e-06, + "loss": 0.7373, + "step": 43142 + }, + { + "epoch": 1.11, + "learning_rate": 1.4566166965027038e-06, + "loss": 0.7061, + "step": 43143 + }, + { + "epoch": 1.11, + "learning_rate": 1.456592078934276e-06, + "loss": 0.5913, + "step": 43144 + }, + { + "epoch": 1.11, + "learning_rate": 1.4565674610162564e-06, + "loss": 0.4614, + "step": 43145 + }, + { + "epoch": 1.11, + "learning_rate": 1.4565428427486644e-06, + "loss": 0.4019, + "step": 43146 + }, + { + "epoch": 1.11, + "learning_rate": 1.4565182241315182e-06, + "loss": 0.6191, + "step": 43147 + }, + { + "epoch": 1.11, + "learning_rate": 1.4564936051648372e-06, + "loss": 0.6357, + "step": 43148 + }, + { + "epoch": 1.11, + "learning_rate": 1.4564689858486395e-06, + "loss": 0.752, + "step": 43149 + }, + { + "epoch": 1.11, + "learning_rate": 1.456444366182945e-06, + "loss": 0.6299, + "step": 43150 + }, + { + "epoch": 1.11, + "learning_rate": 1.456419746167772e-06, + "loss": 0.6309, + "step": 43151 + }, + { + "epoch": 1.11, + "learning_rate": 1.4563951258031394e-06, + "loss": 0.6836, + "step": 43152 + }, + { + "epoch": 1.11, + "learning_rate": 1.456370505089066e-06, + "loss": 0.7842, + "step": 43153 + }, + { + "epoch": 1.11, + "learning_rate": 1.4563458840255706e-06, + "loss": 0.6138, + "step": 43154 + }, + { + "epoch": 1.11, + "learning_rate": 1.4563212626126723e-06, + "loss": 0.8066, + "step": 43155 + }, + { + "epoch": 1.11, + "learning_rate": 1.4562966408503898e-06, + "loss": 0.8438, + "step": 43156 + }, + { + "epoch": 1.11, + "learning_rate": 1.4562720187387418e-06, + "loss": 0.6641, + "step": 43157 + }, + { + "epoch": 1.11, + "learning_rate": 1.4562473962777473e-06, + "loss": 0.6797, + "step": 43158 + }, + { + "epoch": 1.11, + "learning_rate": 1.456222773467425e-06, + "loss": 0.6504, + "step": 43159 + }, + { + "epoch": 1.11, + "learning_rate": 1.4561981503077942e-06, + "loss": 0.7109, + "step": 43160 + }, + { + "epoch": 1.11, + "learning_rate": 1.4561735267988734e-06, + "loss": 0.561, + "step": 43161 + }, + { + "epoch": 1.11, + "learning_rate": 1.4561489029406814e-06, + "loss": 0.7607, + "step": 43162 + }, + { + "epoch": 1.11, + "learning_rate": 1.4561242787332374e-06, + "loss": 0.5938, + "step": 43163 + }, + { + "epoch": 1.11, + "learning_rate": 1.4560996541765595e-06, + "loss": 0.6777, + "step": 43164 + }, + { + "epoch": 1.11, + "learning_rate": 1.4560750292706673e-06, + "loss": 0.6572, + "step": 43165 + }, + { + "epoch": 1.11, + "learning_rate": 1.4560504040155797e-06, + "loss": 0.5825, + "step": 43166 + }, + { + "epoch": 1.11, + "learning_rate": 1.456025778411315e-06, + "loss": 0.4756, + "step": 43167 + }, + { + "epoch": 1.11, + "learning_rate": 1.4560011524578923e-06, + "loss": 0.8066, + "step": 43168 + }, + { + "epoch": 1.11, + "learning_rate": 1.4559765261553307e-06, + "loss": 0.562, + "step": 43169 + }, + { + "epoch": 1.11, + "learning_rate": 1.4559518995036486e-06, + "loss": 0.5105, + "step": 43170 + }, + { + "epoch": 1.11, + "learning_rate": 1.4559272725028656e-06, + "loss": 0.6265, + "step": 43171 + }, + { + "epoch": 1.11, + "learning_rate": 1.4559026451529994e-06, + "loss": 0.6069, + "step": 43172 + }, + { + "epoch": 1.11, + "learning_rate": 1.45587801745407e-06, + "loss": 0.7051, + "step": 43173 + }, + { + "epoch": 1.11, + "learning_rate": 1.4558533894060955e-06, + "loss": 0.6323, + "step": 43174 + }, + { + "epoch": 1.11, + "learning_rate": 1.455828761009095e-06, + "loss": 0.7422, + "step": 43175 + }, + { + "epoch": 1.11, + "learning_rate": 1.4558041322630874e-06, + "loss": 1.04, + "step": 43176 + }, + { + "epoch": 1.11, + "learning_rate": 1.4557795031680918e-06, + "loss": 0.6719, + "step": 43177 + }, + { + "epoch": 1.11, + "learning_rate": 1.4557548737241263e-06, + "loss": 0.7256, + "step": 43178 + }, + { + "epoch": 1.11, + "learning_rate": 1.4557302439312107e-06, + "loss": 0.6152, + "step": 43179 + }, + { + "epoch": 1.11, + "learning_rate": 1.4557056137893632e-06, + "loss": 0.5073, + "step": 43180 + }, + { + "epoch": 1.11, + "learning_rate": 1.455680983298603e-06, + "loss": 0.4922, + "step": 43181 + }, + { + "epoch": 1.11, + "learning_rate": 1.4556563524589484e-06, + "loss": 0.7432, + "step": 43182 + }, + { + "epoch": 1.11, + "learning_rate": 1.4556317212704191e-06, + "loss": 0.79, + "step": 43183 + }, + { + "epoch": 1.11, + "learning_rate": 1.4556070897330334e-06, + "loss": 0.5591, + "step": 43184 + }, + { + "epoch": 1.11, + "learning_rate": 1.4555824578468103e-06, + "loss": 0.7285, + "step": 43185 + }, + { + "epoch": 1.11, + "learning_rate": 1.4555578256117688e-06, + "loss": 0.7188, + "step": 43186 + }, + { + "epoch": 1.11, + "learning_rate": 1.4555331930279276e-06, + "loss": 0.7285, + "step": 43187 + }, + { + "epoch": 1.11, + "learning_rate": 1.4555085600953054e-06, + "loss": 0.457, + "step": 43188 + }, + { + "epoch": 1.11, + "learning_rate": 1.4554839268139214e-06, + "loss": 0.7666, + "step": 43189 + }, + { + "epoch": 1.11, + "learning_rate": 1.4554592931837942e-06, + "loss": 0.6948, + "step": 43190 + }, + { + "epoch": 1.11, + "learning_rate": 1.455434659204943e-06, + "loss": 0.71, + "step": 43191 + }, + { + "epoch": 1.11, + "learning_rate": 1.4554100248773862e-06, + "loss": 0.6064, + "step": 43192 + }, + { + "epoch": 1.11, + "learning_rate": 1.4553853902011426e-06, + "loss": 0.5933, + "step": 43193 + }, + { + "epoch": 1.11, + "learning_rate": 1.4553607551762319e-06, + "loss": 0.5388, + "step": 43194 + }, + { + "epoch": 1.11, + "learning_rate": 1.4553361198026718e-06, + "loss": 0.5454, + "step": 43195 + }, + { + "epoch": 1.11, + "learning_rate": 1.4553114840804825e-06, + "loss": 0.665, + "step": 43196 + }, + { + "epoch": 1.11, + "learning_rate": 1.4552868480096816e-06, + "loss": 0.7144, + "step": 43197 + }, + { + "epoch": 1.11, + "learning_rate": 1.4552622115902889e-06, + "loss": 0.7695, + "step": 43198 + }, + { + "epoch": 1.11, + "learning_rate": 1.4552375748223224e-06, + "loss": 0.6426, + "step": 43199 + }, + { + "epoch": 1.11, + "learning_rate": 1.4552129377058017e-06, + "loss": 0.54, + "step": 43200 + }, + { + "epoch": 1.11, + "learning_rate": 1.4551883002407454e-06, + "loss": 0.502, + "step": 43201 + }, + { + "epoch": 1.11, + "learning_rate": 1.4551636624271724e-06, + "loss": 0.7178, + "step": 43202 + }, + { + "epoch": 1.11, + "learning_rate": 1.4551390242651011e-06, + "loss": 0.6816, + "step": 43203 + }, + { + "epoch": 1.11, + "learning_rate": 1.4551143857545514e-06, + "loss": 0.7109, + "step": 43204 + }, + { + "epoch": 1.11, + "learning_rate": 1.455089746895541e-06, + "loss": 0.6025, + "step": 43205 + }, + { + "epoch": 1.11, + "learning_rate": 1.4550651076880898e-06, + "loss": 0.7783, + "step": 43206 + }, + { + "epoch": 1.11, + "learning_rate": 1.4550404681322158e-06, + "loss": 0.666, + "step": 43207 + }, + { + "epoch": 1.11, + "learning_rate": 1.4550158282279381e-06, + "loss": 0.749, + "step": 43208 + }, + { + "epoch": 1.11, + "learning_rate": 1.4549911879752758e-06, + "loss": 0.7168, + "step": 43209 + }, + { + "epoch": 1.11, + "learning_rate": 1.454966547374248e-06, + "loss": 0.6919, + "step": 43210 + }, + { + "epoch": 1.11, + "learning_rate": 1.4549419064248732e-06, + "loss": 0.792, + "step": 43211 + }, + { + "epoch": 1.11, + "learning_rate": 1.45491726512717e-06, + "loss": 0.6562, + "step": 43212 + }, + { + "epoch": 1.11, + "learning_rate": 1.4548926234811576e-06, + "loss": 0.7192, + "step": 43213 + }, + { + "epoch": 1.11, + "learning_rate": 1.4548679814868549e-06, + "loss": 0.7275, + "step": 43214 + }, + { + "epoch": 1.11, + "learning_rate": 1.4548433391442806e-06, + "loss": 0.5225, + "step": 43215 + }, + { + "epoch": 1.11, + "learning_rate": 1.4548186964534539e-06, + "loss": 0.5889, + "step": 43216 + }, + { + "epoch": 1.11, + "learning_rate": 1.4547940534143935e-06, + "loss": 0.6982, + "step": 43217 + }, + { + "epoch": 1.11, + "learning_rate": 1.454769410027118e-06, + "loss": 0.7266, + "step": 43218 + }, + { + "epoch": 1.11, + "learning_rate": 1.4547447662916466e-06, + "loss": 0.6357, + "step": 43219 + }, + { + "epoch": 1.11, + "learning_rate": 1.4547201222079976e-06, + "loss": 0.623, + "step": 43220 + }, + { + "epoch": 1.11, + "learning_rate": 1.4546954777761912e-06, + "loss": 0.6309, + "step": 43221 + }, + { + "epoch": 1.11, + "learning_rate": 1.4546708329962445e-06, + "loss": 0.6162, + "step": 43222 + }, + { + "epoch": 1.11, + "learning_rate": 1.4546461878681778e-06, + "loss": 0.5232, + "step": 43223 + }, + { + "epoch": 1.11, + "learning_rate": 1.454621542392009e-06, + "loss": 0.7393, + "step": 43224 + }, + { + "epoch": 1.11, + "learning_rate": 1.4545968965677577e-06, + "loss": 0.593, + "step": 43225 + }, + { + "epoch": 1.11, + "learning_rate": 1.4545722503954426e-06, + "loss": 0.6167, + "step": 43226 + }, + { + "epoch": 1.11, + "learning_rate": 1.4545476038750822e-06, + "loss": 0.7412, + "step": 43227 + }, + { + "epoch": 1.11, + "learning_rate": 1.4545229570066955e-06, + "loss": 0.6689, + "step": 43228 + }, + { + "epoch": 1.11, + "learning_rate": 1.4544983097903013e-06, + "loss": 0.5774, + "step": 43229 + }, + { + "epoch": 1.11, + "learning_rate": 1.4544736622259191e-06, + "loss": 0.6411, + "step": 43230 + }, + { + "epoch": 1.11, + "learning_rate": 1.454449014313567e-06, + "loss": 0.7441, + "step": 43231 + }, + { + "epoch": 1.11, + "learning_rate": 1.4544243660532645e-06, + "loss": 0.5542, + "step": 43232 + }, + { + "epoch": 1.11, + "learning_rate": 1.4543997174450298e-06, + "loss": 0.6768, + "step": 43233 + }, + { + "epoch": 1.11, + "learning_rate": 1.4543750684888822e-06, + "loss": 0.5493, + "step": 43234 + }, + { + "epoch": 1.11, + "learning_rate": 1.4543504191848408e-06, + "loss": 0.7158, + "step": 43235 + }, + { + "epoch": 1.11, + "learning_rate": 1.454325769532924e-06, + "loss": 0.8149, + "step": 43236 + }, + { + "epoch": 1.11, + "learning_rate": 1.4543011195331506e-06, + "loss": 0.7222, + "step": 43237 + }, + { + "epoch": 1.11, + "learning_rate": 1.4542764691855403e-06, + "loss": 0.5701, + "step": 43238 + }, + { + "epoch": 1.11, + "learning_rate": 1.454251818490111e-06, + "loss": 0.7832, + "step": 43239 + }, + { + "epoch": 1.11, + "learning_rate": 1.454227167446882e-06, + "loss": 0.3538, + "step": 43240 + }, + { + "epoch": 1.11, + "learning_rate": 1.4542025160558722e-06, + "loss": 0.6855, + "step": 43241 + }, + { + "epoch": 1.11, + "learning_rate": 1.4541778643171003e-06, + "loss": 0.7676, + "step": 43242 + }, + { + "epoch": 1.11, + "learning_rate": 1.4541532122305853e-06, + "loss": 0.7471, + "step": 43243 + }, + { + "epoch": 1.11, + "learning_rate": 1.4541285597963462e-06, + "loss": 0.7251, + "step": 43244 + }, + { + "epoch": 1.11, + "learning_rate": 1.4541039070144017e-06, + "loss": 0.6606, + "step": 43245 + }, + { + "epoch": 1.11, + "learning_rate": 1.4540792538847708e-06, + "loss": 0.5488, + "step": 43246 + }, + { + "epoch": 1.11, + "learning_rate": 1.454054600407472e-06, + "loss": 0.603, + "step": 43247 + }, + { + "epoch": 1.11, + "learning_rate": 1.4540299465825249e-06, + "loss": 0.623, + "step": 43248 + }, + { + "epoch": 1.11, + "learning_rate": 1.4540052924099475e-06, + "loss": 0.4971, + "step": 43249 + }, + { + "epoch": 1.11, + "learning_rate": 1.4539806378897595e-06, + "loss": 0.8608, + "step": 43250 + }, + { + "epoch": 1.11, + "learning_rate": 1.453955983021979e-06, + "loss": 0.6143, + "step": 43251 + }, + { + "epoch": 1.11, + "learning_rate": 1.4539313278066257e-06, + "loss": 0.6807, + "step": 43252 + }, + { + "epoch": 1.11, + "learning_rate": 1.4539066722437179e-06, + "loss": 0.6846, + "step": 43253 + }, + { + "epoch": 1.11, + "learning_rate": 1.4538820163332746e-06, + "loss": 0.5742, + "step": 43254 + }, + { + "epoch": 1.11, + "learning_rate": 1.4538573600753147e-06, + "loss": 0.6836, + "step": 43255 + }, + { + "epoch": 1.11, + "learning_rate": 1.453832703469857e-06, + "loss": 0.5028, + "step": 43256 + }, + { + "epoch": 1.11, + "learning_rate": 1.4538080465169206e-06, + "loss": 0.3142, + "step": 43257 + }, + { + "epoch": 1.11, + "learning_rate": 1.453783389216524e-06, + "loss": 0.6328, + "step": 43258 + }, + { + "epoch": 1.11, + "learning_rate": 1.4537587315686866e-06, + "loss": 0.5645, + "step": 43259 + }, + { + "epoch": 1.11, + "learning_rate": 1.4537340735734269e-06, + "loss": 0.6602, + "step": 43260 + }, + { + "epoch": 1.11, + "learning_rate": 1.4537094152307643e-06, + "loss": 0.5444, + "step": 43261 + }, + { + "epoch": 1.11, + "learning_rate": 1.4536847565407167e-06, + "loss": 0.7305, + "step": 43262 + }, + { + "epoch": 1.11, + "learning_rate": 1.4536600975033037e-06, + "loss": 0.5551, + "step": 43263 + }, + { + "epoch": 1.11, + "learning_rate": 1.453635438118544e-06, + "loss": 0.8408, + "step": 43264 + }, + { + "epoch": 1.11, + "learning_rate": 1.4536107783864565e-06, + "loss": 0.6982, + "step": 43265 + }, + { + "epoch": 1.11, + "learning_rate": 1.4535861183070604e-06, + "loss": 0.5776, + "step": 43266 + }, + { + "epoch": 1.11, + "learning_rate": 1.4535614578803739e-06, + "loss": 0.7129, + "step": 43267 + }, + { + "epoch": 1.11, + "learning_rate": 1.4535367971064162e-06, + "loss": 0.7339, + "step": 43268 + }, + { + "epoch": 1.11, + "learning_rate": 1.4535121359852065e-06, + "loss": 0.6294, + "step": 43269 + }, + { + "epoch": 1.11, + "learning_rate": 1.4534874745167632e-06, + "loss": 0.5767, + "step": 43270 + }, + { + "epoch": 1.11, + "learning_rate": 1.4534628127011056e-06, + "loss": 0.8213, + "step": 43271 + }, + { + "epoch": 1.11, + "learning_rate": 1.4534381505382522e-06, + "loss": 0.6562, + "step": 43272 + }, + { + "epoch": 1.11, + "learning_rate": 1.4534134880282222e-06, + "loss": 0.7168, + "step": 43273 + }, + { + "epoch": 1.11, + "learning_rate": 1.453388825171034e-06, + "loss": 0.7744, + "step": 43274 + }, + { + "epoch": 1.11, + "learning_rate": 1.453364161966707e-06, + "loss": 0.6836, + "step": 43275 + }, + { + "epoch": 1.11, + "learning_rate": 1.4533394984152603e-06, + "loss": 0.4434, + "step": 43276 + }, + { + "epoch": 1.11, + "learning_rate": 1.4533148345167119e-06, + "loss": 0.5762, + "step": 43277 + }, + { + "epoch": 1.11, + "learning_rate": 1.4532901702710815e-06, + "loss": 0.4429, + "step": 43278 + }, + { + "epoch": 1.11, + "learning_rate": 1.4532655056783877e-06, + "loss": 0.5566, + "step": 43279 + }, + { + "epoch": 1.11, + "learning_rate": 1.4532408407386492e-06, + "loss": 0.6465, + "step": 43280 + }, + { + "epoch": 1.11, + "learning_rate": 1.4532161754518847e-06, + "loss": 0.6465, + "step": 43281 + }, + { + "epoch": 1.11, + "learning_rate": 1.4531915098181137e-06, + "loss": 0.6758, + "step": 43282 + }, + { + "epoch": 1.11, + "learning_rate": 1.4531668438373548e-06, + "loss": 0.4976, + "step": 43283 + }, + { + "epoch": 1.11, + "learning_rate": 1.4531421775096268e-06, + "loss": 0.4596, + "step": 43284 + }, + { + "epoch": 1.11, + "learning_rate": 1.4531175108349489e-06, + "loss": 0.584, + "step": 43285 + }, + { + "epoch": 1.11, + "learning_rate": 1.4530928438133398e-06, + "loss": 0.7754, + "step": 43286 + }, + { + "epoch": 1.11, + "learning_rate": 1.4530681764448177e-06, + "loss": 0.4597, + "step": 43287 + }, + { + "epoch": 1.11, + "learning_rate": 1.453043508729403e-06, + "loss": 0.8428, + "step": 43288 + }, + { + "epoch": 1.11, + "learning_rate": 1.453018840667113e-06, + "loss": 0.6709, + "step": 43289 + }, + { + "epoch": 1.11, + "learning_rate": 1.4529941722579678e-06, + "loss": 0.4946, + "step": 43290 + }, + { + "epoch": 1.11, + "learning_rate": 1.4529695035019855e-06, + "loss": 0.6177, + "step": 43291 + }, + { + "epoch": 1.11, + "learning_rate": 1.4529448343991856e-06, + "loss": 0.5996, + "step": 43292 + }, + { + "epoch": 1.11, + "learning_rate": 1.4529201649495862e-06, + "loss": 0.6147, + "step": 43293 + }, + { + "epoch": 1.11, + "learning_rate": 1.452895495153207e-06, + "loss": 0.5522, + "step": 43294 + }, + { + "epoch": 1.11, + "learning_rate": 1.4528708250100666e-06, + "loss": 0.6899, + "step": 43295 + }, + { + "epoch": 1.11, + "learning_rate": 1.4528461545201833e-06, + "loss": 0.4421, + "step": 43296 + }, + { + "epoch": 1.11, + "learning_rate": 1.4528214836835772e-06, + "loss": 0.6377, + "step": 43297 + }, + { + "epoch": 1.11, + "learning_rate": 1.4527968125002663e-06, + "loss": 0.8203, + "step": 43298 + }, + { + "epoch": 1.11, + "learning_rate": 1.4527721409702693e-06, + "loss": 0.6318, + "step": 43299 + }, + { + "epoch": 1.11, + "learning_rate": 1.4527474690936058e-06, + "loss": 0.6309, + "step": 43300 + }, + { + "epoch": 1.11, + "learning_rate": 1.4527227968702946e-06, + "loss": 0.7427, + "step": 43301 + }, + { + "epoch": 1.11, + "learning_rate": 1.452698124300354e-06, + "loss": 0.6265, + "step": 43302 + }, + { + "epoch": 1.11, + "learning_rate": 1.4526734513838036e-06, + "loss": 0.4612, + "step": 43303 + }, + { + "epoch": 1.11, + "learning_rate": 1.4526487781206615e-06, + "loss": 0.6353, + "step": 43304 + }, + { + "epoch": 1.11, + "learning_rate": 1.4526241045109475e-06, + "loss": 0.8379, + "step": 43305 + }, + { + "epoch": 1.11, + "learning_rate": 1.4525994305546799e-06, + "loss": 0.7275, + "step": 43306 + }, + { + "epoch": 1.11, + "learning_rate": 1.4525747562518777e-06, + "loss": 0.5474, + "step": 43307 + }, + { + "epoch": 1.11, + "learning_rate": 1.4525500816025595e-06, + "loss": 0.7803, + "step": 43308 + }, + { + "epoch": 1.11, + "learning_rate": 1.4525254066067448e-06, + "loss": 0.6309, + "step": 43309 + }, + { + "epoch": 1.11, + "learning_rate": 1.4525007312644524e-06, + "loss": 0.6533, + "step": 43310 + }, + { + "epoch": 1.11, + "learning_rate": 1.452476055575701e-06, + "loss": 0.5112, + "step": 43311 + }, + { + "epoch": 1.11, + "learning_rate": 1.452451379540509e-06, + "loss": 0.834, + "step": 43312 + }, + { + "epoch": 1.11, + "learning_rate": 1.4524267031588962e-06, + "loss": 0.6592, + "step": 43313 + }, + { + "epoch": 1.11, + "learning_rate": 1.4524020264308808e-06, + "loss": 0.7012, + "step": 43314 + }, + { + "epoch": 1.11, + "learning_rate": 1.4523773493564824e-06, + "loss": 0.665, + "step": 43315 + }, + { + "epoch": 1.11, + "learning_rate": 1.452352671935719e-06, + "loss": 0.7871, + "step": 43316 + }, + { + "epoch": 1.11, + "learning_rate": 1.4523279941686103e-06, + "loss": 0.6274, + "step": 43317 + }, + { + "epoch": 1.11, + "learning_rate": 1.4523033160551745e-06, + "loss": 0.6475, + "step": 43318 + }, + { + "epoch": 1.11, + "learning_rate": 1.4522786375954313e-06, + "loss": 0.8066, + "step": 43319 + }, + { + "epoch": 1.11, + "learning_rate": 1.4522539587893986e-06, + "loss": 0.6162, + "step": 43320 + }, + { + "epoch": 1.11, + "learning_rate": 1.4522292796370963e-06, + "loss": 0.4448, + "step": 43321 + }, + { + "epoch": 1.11, + "learning_rate": 1.4522046001385426e-06, + "loss": 0.6885, + "step": 43322 + }, + { + "epoch": 1.11, + "learning_rate": 1.4521799202937566e-06, + "loss": 0.7354, + "step": 43323 + }, + { + "epoch": 1.11, + "learning_rate": 1.4521552401027575e-06, + "loss": 0.6709, + "step": 43324 + }, + { + "epoch": 1.11, + "learning_rate": 1.4521305595655637e-06, + "loss": 0.5547, + "step": 43325 + }, + { + "epoch": 1.11, + "learning_rate": 1.4521058786821944e-06, + "loss": 0.7305, + "step": 43326 + }, + { + "epoch": 1.11, + "learning_rate": 1.4520811974526683e-06, + "loss": 0.6826, + "step": 43327 + }, + { + "epoch": 1.11, + "learning_rate": 1.4520565158770045e-06, + "loss": 0.6152, + "step": 43328 + }, + { + "epoch": 1.11, + "learning_rate": 1.4520318339552217e-06, + "loss": 0.6523, + "step": 43329 + }, + { + "epoch": 1.11, + "learning_rate": 1.4520071516873393e-06, + "loss": 0.9326, + "step": 43330 + }, + { + "epoch": 1.11, + "learning_rate": 1.4519824690733756e-06, + "loss": 0.6494, + "step": 43331 + }, + { + "epoch": 1.11, + "learning_rate": 1.4519577861133495e-06, + "loss": 0.5127, + "step": 43332 + }, + { + "epoch": 1.11, + "learning_rate": 1.45193310280728e-06, + "loss": 0.6572, + "step": 43333 + }, + { + "epoch": 1.11, + "learning_rate": 1.4519084191551866e-06, + "loss": 0.7256, + "step": 43334 + }, + { + "epoch": 1.11, + "learning_rate": 1.4518837351570873e-06, + "loss": 0.8135, + "step": 43335 + }, + { + "epoch": 1.11, + "learning_rate": 1.4518590508130018e-06, + "loss": 0.8115, + "step": 43336 + }, + { + "epoch": 1.11, + "learning_rate": 1.4518343661229483e-06, + "loss": 0.6084, + "step": 43337 + }, + { + "epoch": 1.11, + "learning_rate": 1.4518096810869461e-06, + "loss": 0.8896, + "step": 43338 + }, + { + "epoch": 1.11, + "learning_rate": 1.4517849957050136e-06, + "loss": 0.707, + "step": 43339 + }, + { + "epoch": 1.11, + "learning_rate": 1.4517603099771706e-06, + "loss": 0.7549, + "step": 43340 + }, + { + "epoch": 1.11, + "learning_rate": 1.4517356239034356e-06, + "loss": 0.6204, + "step": 43341 + }, + { + "epoch": 1.11, + "learning_rate": 1.4517109374838273e-06, + "loss": 0.7012, + "step": 43342 + }, + { + "epoch": 1.11, + "learning_rate": 1.4516862507183643e-06, + "loss": 0.6045, + "step": 43343 + }, + { + "epoch": 1.11, + "learning_rate": 1.4516615636070662e-06, + "loss": 0.6577, + "step": 43344 + }, + { + "epoch": 1.11, + "learning_rate": 1.4516368761499517e-06, + "loss": 0.6348, + "step": 43345 + }, + { + "epoch": 1.11, + "learning_rate": 1.4516121883470393e-06, + "loss": 0.48, + "step": 43346 + }, + { + "epoch": 1.11, + "learning_rate": 1.4515875001983484e-06, + "loss": 0.6934, + "step": 43347 + }, + { + "epoch": 1.11, + "learning_rate": 1.4515628117038976e-06, + "loss": 0.5889, + "step": 43348 + }, + { + "epoch": 1.11, + "learning_rate": 1.451538122863706e-06, + "loss": 0.752, + "step": 43349 + }, + { + "epoch": 1.11, + "learning_rate": 1.4515134336777925e-06, + "loss": 0.6475, + "step": 43350 + }, + { + "epoch": 1.11, + "learning_rate": 1.4514887441461761e-06, + "loss": 0.6201, + "step": 43351 + }, + { + "epoch": 1.11, + "learning_rate": 1.4514640542688752e-06, + "loss": 0.6772, + "step": 43352 + }, + { + "epoch": 1.11, + "learning_rate": 1.4514393640459092e-06, + "loss": 0.564, + "step": 43353 + }, + { + "epoch": 1.11, + "learning_rate": 1.4514146734772967e-06, + "loss": 0.4103, + "step": 43354 + }, + { + "epoch": 1.11, + "learning_rate": 1.4513899825630572e-06, + "loss": 0.5125, + "step": 43355 + }, + { + "epoch": 1.11, + "learning_rate": 1.4513652913032085e-06, + "loss": 0.6445, + "step": 43356 + }, + { + "epoch": 1.11, + "learning_rate": 1.4513405996977705e-06, + "loss": 0.5894, + "step": 43357 + }, + { + "epoch": 1.11, + "learning_rate": 1.4513159077467616e-06, + "loss": 0.5415, + "step": 43358 + }, + { + "epoch": 1.11, + "learning_rate": 1.451291215450201e-06, + "loss": 0.6855, + "step": 43359 + }, + { + "epoch": 1.11, + "learning_rate": 1.4512665228081074e-06, + "loss": 0.561, + "step": 43360 + }, + { + "epoch": 1.11, + "learning_rate": 1.4512418298204998e-06, + "loss": 0.7285, + "step": 43361 + }, + { + "epoch": 1.11, + "learning_rate": 1.451217136487397e-06, + "loss": 0.6841, + "step": 43362 + }, + { + "epoch": 1.11, + "learning_rate": 1.4511924428088183e-06, + "loss": 0.6982, + "step": 43363 + }, + { + "epoch": 1.11, + "learning_rate": 1.4511677487847818e-06, + "loss": 0.6279, + "step": 43364 + }, + { + "epoch": 1.11, + "learning_rate": 1.4511430544153071e-06, + "loss": 0.7139, + "step": 43365 + }, + { + "epoch": 1.11, + "learning_rate": 1.451118359700413e-06, + "loss": 0.4182, + "step": 43366 + }, + { + "epoch": 1.11, + "learning_rate": 1.4510936646401181e-06, + "loss": 0.5615, + "step": 43367 + }, + { + "epoch": 1.11, + "learning_rate": 1.4510689692344417e-06, + "loss": 0.6211, + "step": 43368 + }, + { + "epoch": 1.11, + "learning_rate": 1.4510442734834027e-06, + "loss": 0.488, + "step": 43369 + }, + { + "epoch": 1.11, + "learning_rate": 1.4510195773870197e-06, + "loss": 0.6943, + "step": 43370 + }, + { + "epoch": 1.11, + "learning_rate": 1.4509948809453117e-06, + "loss": 0.6865, + "step": 43371 + }, + { + "epoch": 1.11, + "learning_rate": 1.4509701841582978e-06, + "loss": 0.7734, + "step": 43372 + }, + { + "epoch": 1.11, + "learning_rate": 1.4509454870259964e-06, + "loss": 0.5435, + "step": 43373 + }, + { + "epoch": 1.11, + "learning_rate": 1.450920789548427e-06, + "loss": 0.4783, + "step": 43374 + }, + { + "epoch": 1.11, + "learning_rate": 1.4508960917256083e-06, + "loss": 0.7017, + "step": 43375 + }, + { + "epoch": 1.11, + "learning_rate": 1.450871393557559e-06, + "loss": 0.7036, + "step": 43376 + }, + { + "epoch": 1.11, + "learning_rate": 1.4508466950442986e-06, + "loss": 0.668, + "step": 43377 + }, + { + "epoch": 1.11, + "learning_rate": 1.4508219961858455e-06, + "loss": 0.5732, + "step": 43378 + }, + { + "epoch": 1.11, + "learning_rate": 1.4507972969822184e-06, + "loss": 0.665, + "step": 43379 + }, + { + "epoch": 1.11, + "learning_rate": 1.450772597433437e-06, + "loss": 0.8369, + "step": 43380 + }, + { + "epoch": 1.11, + "learning_rate": 1.4507478975395193e-06, + "loss": 0.6123, + "step": 43381 + }, + { + "epoch": 1.11, + "learning_rate": 1.4507231973004853e-06, + "loss": 0.6523, + "step": 43382 + }, + { + "epoch": 1.11, + "learning_rate": 1.4506984967163525e-06, + "loss": 0.5049, + "step": 43383 + }, + { + "epoch": 1.11, + "learning_rate": 1.450673795787141e-06, + "loss": 0.668, + "step": 43384 + }, + { + "epoch": 1.11, + "learning_rate": 1.4506490945128693e-06, + "loss": 0.4988, + "step": 43385 + }, + { + "epoch": 1.11, + "learning_rate": 1.4506243928935561e-06, + "loss": 0.7881, + "step": 43386 + }, + { + "epoch": 1.11, + "learning_rate": 1.4505996909292208e-06, + "loss": 0.5918, + "step": 43387 + }, + { + "epoch": 1.11, + "learning_rate": 1.4505749886198818e-06, + "loss": 0.7256, + "step": 43388 + }, + { + "epoch": 1.11, + "learning_rate": 1.4505502859655584e-06, + "loss": 0.5239, + "step": 43389 + }, + { + "epoch": 1.11, + "learning_rate": 1.4505255829662693e-06, + "loss": 0.4097, + "step": 43390 + }, + { + "epoch": 1.11, + "learning_rate": 1.4505008796220335e-06, + "loss": 0.5283, + "step": 43391 + }, + { + "epoch": 1.11, + "learning_rate": 1.4504761759328698e-06, + "loss": 0.6973, + "step": 43392 + }, + { + "epoch": 1.11, + "learning_rate": 1.4504514718987974e-06, + "loss": 0.7949, + "step": 43393 + }, + { + "epoch": 1.11, + "learning_rate": 1.4504267675198346e-06, + "loss": 0.6406, + "step": 43394 + }, + { + "epoch": 1.11, + "learning_rate": 1.4504020627960013e-06, + "loss": 0.563, + "step": 43395 + }, + { + "epoch": 1.11, + "learning_rate": 1.4503773577273155e-06, + "loss": 0.6934, + "step": 43396 + }, + { + "epoch": 1.11, + "learning_rate": 1.4503526523137968e-06, + "loss": 0.6326, + "step": 43397 + }, + { + "epoch": 1.11, + "learning_rate": 1.4503279465554635e-06, + "loss": 0.5283, + "step": 43398 + }, + { + "epoch": 1.11, + "learning_rate": 1.4503032404523347e-06, + "loss": 0.791, + "step": 43399 + }, + { + "epoch": 1.11, + "learning_rate": 1.4502785340044297e-06, + "loss": 0.6326, + "step": 43400 + }, + { + "epoch": 1.11, + "learning_rate": 1.450253827211767e-06, + "loss": 0.4858, + "step": 43401 + }, + { + "epoch": 1.11, + "learning_rate": 1.4502291200743655e-06, + "loss": 0.7495, + "step": 43402 + }, + { + "epoch": 1.11, + "learning_rate": 1.4502044125922446e-06, + "loss": 0.4309, + "step": 43403 + }, + { + "epoch": 1.11, + "learning_rate": 1.4501797047654223e-06, + "loss": 0.7988, + "step": 43404 + }, + { + "epoch": 1.11, + "learning_rate": 1.4501549965939189e-06, + "loss": 0.645, + "step": 43405 + }, + { + "epoch": 1.11, + "learning_rate": 1.450130288077752e-06, + "loss": 0.4819, + "step": 43406 + }, + { + "epoch": 1.11, + "learning_rate": 1.4501055792169411e-06, + "loss": 0.5322, + "step": 43407 + }, + { + "epoch": 1.11, + "learning_rate": 1.450080870011505e-06, + "loss": 0.5029, + "step": 43408 + }, + { + "epoch": 1.11, + "learning_rate": 1.4500561604614628e-06, + "loss": 0.7432, + "step": 43409 + }, + { + "epoch": 1.11, + "learning_rate": 1.4500314505668332e-06, + "loss": 0.6709, + "step": 43410 + }, + { + "epoch": 1.11, + "learning_rate": 1.4500067403276353e-06, + "loss": 0.5615, + "step": 43411 + }, + { + "epoch": 1.11, + "learning_rate": 1.4499820297438879e-06, + "loss": 0.6313, + "step": 43412 + }, + { + "epoch": 1.11, + "learning_rate": 1.4499573188156098e-06, + "loss": 0.6172, + "step": 43413 + }, + { + "epoch": 1.11, + "learning_rate": 1.44993260754282e-06, + "loss": 0.6216, + "step": 43414 + }, + { + "epoch": 1.11, + "learning_rate": 1.449907895925538e-06, + "loss": 0.6006, + "step": 43415 + }, + { + "epoch": 1.11, + "learning_rate": 1.449883183963782e-06, + "loss": 0.6299, + "step": 43416 + }, + { + "epoch": 1.11, + "learning_rate": 1.449858471657571e-06, + "loss": 0.5493, + "step": 43417 + }, + { + "epoch": 1.11, + "learning_rate": 1.4498337590069241e-06, + "loss": 0.6494, + "step": 43418 + }, + { + "epoch": 1.11, + "learning_rate": 1.4498090460118602e-06, + "loss": 0.835, + "step": 43419 + }, + { + "epoch": 1.11, + "learning_rate": 1.4497843326723983e-06, + "loss": 0.6909, + "step": 43420 + }, + { + "epoch": 1.11, + "learning_rate": 1.449759618988557e-06, + "loss": 0.8105, + "step": 43421 + }, + { + "epoch": 1.11, + "learning_rate": 1.4497349049603556e-06, + "loss": 0.8662, + "step": 43422 + }, + { + "epoch": 1.11, + "learning_rate": 1.4497101905878127e-06, + "loss": 0.7393, + "step": 43423 + }, + { + "epoch": 1.11, + "learning_rate": 1.4496854758709477e-06, + "loss": 0.6147, + "step": 43424 + }, + { + "epoch": 1.11, + "learning_rate": 1.4496607608097788e-06, + "loss": 0.4421, + "step": 43425 + }, + { + "epoch": 1.11, + "learning_rate": 1.4496360454043255e-06, + "loss": 0.6807, + "step": 43426 + }, + { + "epoch": 1.11, + "learning_rate": 1.4496113296546067e-06, + "loss": 0.6689, + "step": 43427 + }, + { + "epoch": 1.11, + "learning_rate": 1.4495866135606408e-06, + "loss": 0.7148, + "step": 43428 + }, + { + "epoch": 1.11, + "learning_rate": 1.4495618971224475e-06, + "loss": 0.6709, + "step": 43429 + }, + { + "epoch": 1.11, + "learning_rate": 1.4495371803400452e-06, + "loss": 0.5698, + "step": 43430 + }, + { + "epoch": 1.11, + "learning_rate": 1.449512463213453e-06, + "loss": 0.5945, + "step": 43431 + }, + { + "epoch": 1.11, + "learning_rate": 1.4494877457426897e-06, + "loss": 0.4497, + "step": 43432 + }, + { + "epoch": 1.11, + "learning_rate": 1.4494630279277741e-06, + "loss": 0.6753, + "step": 43433 + }, + { + "epoch": 1.11, + "learning_rate": 1.4494383097687258e-06, + "loss": 0.7441, + "step": 43434 + }, + { + "epoch": 1.11, + "learning_rate": 1.449413591265563e-06, + "loss": 0.8945, + "step": 43435 + }, + { + "epoch": 1.11, + "learning_rate": 1.4493888724183046e-06, + "loss": 0.6406, + "step": 43436 + }, + { + "epoch": 1.11, + "learning_rate": 1.4493641532269702e-06, + "loss": 0.7051, + "step": 43437 + }, + { + "epoch": 1.11, + "learning_rate": 1.449339433691578e-06, + "loss": 0.6104, + "step": 43438 + }, + { + "epoch": 1.11, + "learning_rate": 1.4493147138121476e-06, + "loss": 0.5122, + "step": 43439 + }, + { + "epoch": 1.11, + "learning_rate": 1.4492899935886975e-06, + "loss": 0.4868, + "step": 43440 + }, + { + "epoch": 1.11, + "learning_rate": 1.4492652730212467e-06, + "loss": 0.626, + "step": 43441 + }, + { + "epoch": 1.11, + "learning_rate": 1.449240552109814e-06, + "loss": 0.5557, + "step": 43442 + }, + { + "epoch": 1.11, + "learning_rate": 1.4492158308544187e-06, + "loss": 0.6353, + "step": 43443 + }, + { + "epoch": 1.11, + "learning_rate": 1.449191109255079e-06, + "loss": 0.6633, + "step": 43444 + }, + { + "epoch": 1.11, + "learning_rate": 1.449166387311815e-06, + "loss": 0.5557, + "step": 43445 + }, + { + "epoch": 1.11, + "learning_rate": 1.4491416650246447e-06, + "loss": 0.4902, + "step": 43446 + }, + { + "epoch": 1.11, + "learning_rate": 1.4491169423935873e-06, + "loss": 0.6797, + "step": 43447 + }, + { + "epoch": 1.11, + "learning_rate": 1.4490922194186611e-06, + "loss": 0.7559, + "step": 43448 + }, + { + "epoch": 1.11, + "learning_rate": 1.4490674960998864e-06, + "loss": 0.6323, + "step": 43449 + }, + { + "epoch": 1.11, + "learning_rate": 1.4490427724372811e-06, + "loss": 0.6729, + "step": 43450 + }, + { + "epoch": 1.11, + "learning_rate": 1.4490180484308645e-06, + "loss": 0.7188, + "step": 43451 + }, + { + "epoch": 1.11, + "learning_rate": 1.4489933240806553e-06, + "loss": 0.6616, + "step": 43452 + }, + { + "epoch": 1.11, + "learning_rate": 1.4489685993866728e-06, + "loss": 0.6445, + "step": 43453 + }, + { + "epoch": 1.11, + "learning_rate": 1.4489438743489354e-06, + "loss": 0.6865, + "step": 43454 + }, + { + "epoch": 1.11, + "learning_rate": 1.4489191489674624e-06, + "loss": 0.6572, + "step": 43455 + }, + { + "epoch": 1.11, + "learning_rate": 1.4488944232422726e-06, + "loss": 0.3762, + "step": 43456 + }, + { + "epoch": 1.11, + "learning_rate": 1.448869697173385e-06, + "loss": 0.7476, + "step": 43457 + }, + { + "epoch": 1.11, + "learning_rate": 1.4488449707608186e-06, + "loss": 0.7705, + "step": 43458 + }, + { + "epoch": 1.11, + "learning_rate": 1.448820244004592e-06, + "loss": 0.7217, + "step": 43459 + }, + { + "epoch": 1.11, + "learning_rate": 1.4487955169047248e-06, + "loss": 0.7734, + "step": 43460 + }, + { + "epoch": 1.11, + "learning_rate": 1.448770789461235e-06, + "loss": 0.644, + "step": 43461 + }, + { + "epoch": 1.11, + "learning_rate": 1.4487460616741424e-06, + "loss": 0.542, + "step": 43462 + }, + { + "epoch": 1.11, + "learning_rate": 1.4487213335434654e-06, + "loss": 0.6729, + "step": 43463 + }, + { + "epoch": 1.11, + "learning_rate": 1.4486966050692234e-06, + "loss": 0.6228, + "step": 43464 + }, + { + "epoch": 1.11, + "learning_rate": 1.4486718762514348e-06, + "loss": 0.75, + "step": 43465 + }, + { + "epoch": 1.11, + "learning_rate": 1.448647147090119e-06, + "loss": 0.5933, + "step": 43466 + }, + { + "epoch": 1.11, + "learning_rate": 1.4486224175852941e-06, + "loss": 0.7422, + "step": 43467 + }, + { + "epoch": 1.11, + "learning_rate": 1.4485976877369802e-06, + "loss": 0.7227, + "step": 43468 + }, + { + "epoch": 1.11, + "learning_rate": 1.4485729575451955e-06, + "loss": 0.562, + "step": 43469 + }, + { + "epoch": 1.11, + "learning_rate": 1.4485482270099593e-06, + "loss": 0.7861, + "step": 43470 + }, + { + "epoch": 1.11, + "learning_rate": 1.4485234961312902e-06, + "loss": 0.7056, + "step": 43471 + }, + { + "epoch": 1.11, + "learning_rate": 1.4484987649092072e-06, + "loss": 0.561, + "step": 43472 + }, + { + "epoch": 1.11, + "learning_rate": 1.4484740333437295e-06, + "loss": 0.7715, + "step": 43473 + }, + { + "epoch": 1.11, + "learning_rate": 1.4484493014348758e-06, + "loss": 0.6997, + "step": 43474 + }, + { + "epoch": 1.11, + "learning_rate": 1.448424569182665e-06, + "loss": 0.5601, + "step": 43475 + }, + { + "epoch": 1.11, + "learning_rate": 1.4483998365871162e-06, + "loss": 0.6611, + "step": 43476 + }, + { + "epoch": 1.11, + "learning_rate": 1.448375103648248e-06, + "loss": 0.7051, + "step": 43477 + }, + { + "epoch": 1.11, + "learning_rate": 1.44835037036608e-06, + "loss": 0.6997, + "step": 43478 + }, + { + "epoch": 1.11, + "learning_rate": 1.4483256367406304e-06, + "loss": 0.6504, + "step": 43479 + }, + { + "epoch": 1.11, + "learning_rate": 1.4483009027719188e-06, + "loss": 0.605, + "step": 43480 + }, + { + "epoch": 1.11, + "learning_rate": 1.4482761684599638e-06, + "loss": 0.668, + "step": 43481 + }, + { + "epoch": 1.11, + "learning_rate": 1.448251433804784e-06, + "loss": 0.5635, + "step": 43482 + }, + { + "epoch": 1.11, + "learning_rate": 1.448226698806399e-06, + "loss": 0.7461, + "step": 43483 + }, + { + "epoch": 1.11, + "learning_rate": 1.4482019634648273e-06, + "loss": 0.5959, + "step": 43484 + }, + { + "epoch": 1.11, + "learning_rate": 1.4481772277800882e-06, + "loss": 0.75, + "step": 43485 + }, + { + "epoch": 1.11, + "learning_rate": 1.4481524917522e-06, + "loss": 0.624, + "step": 43486 + }, + { + "epoch": 1.11, + "learning_rate": 1.4481277553811823e-06, + "loss": 0.5664, + "step": 43487 + }, + { + "epoch": 1.11, + "learning_rate": 1.4481030186670536e-06, + "loss": 0.6787, + "step": 43488 + }, + { + "epoch": 1.11, + "learning_rate": 1.448078281609833e-06, + "loss": 0.6401, + "step": 43489 + }, + { + "epoch": 1.11, + "learning_rate": 1.4480535442095398e-06, + "loss": 0.458, + "step": 43490 + }, + { + "epoch": 1.11, + "learning_rate": 1.4480288064661926e-06, + "loss": 0.4121, + "step": 43491 + }, + { + "epoch": 1.11, + "learning_rate": 1.44800406837981e-06, + "loss": 0.5654, + "step": 43492 + }, + { + "epoch": 1.11, + "learning_rate": 1.4479793299504114e-06, + "loss": 0.6475, + "step": 43493 + }, + { + "epoch": 1.11, + "learning_rate": 1.4479545911780155e-06, + "loss": 0.6006, + "step": 43494 + }, + { + "epoch": 1.11, + "learning_rate": 1.447929852062642e-06, + "loss": 0.7861, + "step": 43495 + }, + { + "epoch": 1.11, + "learning_rate": 1.4479051126043085e-06, + "loss": 0.6982, + "step": 43496 + }, + { + "epoch": 1.11, + "learning_rate": 1.4478803728030352e-06, + "loss": 0.6494, + "step": 43497 + }, + { + "epoch": 1.11, + "learning_rate": 1.4478556326588397e-06, + "loss": 0.7617, + "step": 43498 + }, + { + "epoch": 1.11, + "learning_rate": 1.4478308921717425e-06, + "loss": 0.4883, + "step": 43499 + }, + { + "epoch": 1.11, + "learning_rate": 1.4478061513417614e-06, + "loss": 0.6582, + "step": 43500 + }, + { + "epoch": 1.11, + "learning_rate": 1.4477814101689156e-06, + "loss": 0.5845, + "step": 43501 + }, + { + "epoch": 1.11, + "learning_rate": 1.4477566686532245e-06, + "loss": 0.563, + "step": 43502 + }, + { + "epoch": 1.12, + "learning_rate": 1.4477319267947065e-06, + "loss": 0.6445, + "step": 43503 + }, + { + "epoch": 1.12, + "learning_rate": 1.447707184593381e-06, + "loss": 0.5485, + "step": 43504 + }, + { + "epoch": 1.12, + "learning_rate": 1.4476824420492666e-06, + "loss": 0.4941, + "step": 43505 + }, + { + "epoch": 1.12, + "learning_rate": 1.4476576991623822e-06, + "loss": 0.6069, + "step": 43506 + }, + { + "epoch": 1.12, + "learning_rate": 1.4476329559327469e-06, + "loss": 0.6885, + "step": 43507 + }, + { + "epoch": 1.12, + "learning_rate": 1.4476082123603798e-06, + "loss": 0.5491, + "step": 43508 + }, + { + "epoch": 1.12, + "learning_rate": 1.4475834684452995e-06, + "loss": 0.7739, + "step": 43509 + }, + { + "epoch": 1.12, + "learning_rate": 1.4475587241875254e-06, + "loss": 0.5957, + "step": 43510 + }, + { + "epoch": 1.12, + "learning_rate": 1.4475339795870758e-06, + "loss": 0.6938, + "step": 43511 + }, + { + "epoch": 1.12, + "learning_rate": 1.44750923464397e-06, + "loss": 0.5322, + "step": 43512 + }, + { + "epoch": 1.12, + "learning_rate": 1.4474844893582272e-06, + "loss": 0.4863, + "step": 43513 + }, + { + "epoch": 1.12, + "learning_rate": 1.447459743729866e-06, + "loss": 0.7295, + "step": 43514 + }, + { + "epoch": 1.12, + "learning_rate": 1.4474349977589056e-06, + "loss": 0.7695, + "step": 43515 + }, + { + "epoch": 1.12, + "learning_rate": 1.4474102514453645e-06, + "loss": 0.6938, + "step": 43516 + }, + { + "epoch": 1.12, + "learning_rate": 1.447385504789262e-06, + "loss": 0.7627, + "step": 43517 + }, + { + "epoch": 1.12, + "learning_rate": 1.4473607577906173e-06, + "loss": 0.6431, + "step": 43518 + }, + { + "epoch": 1.12, + "learning_rate": 1.4473360104494487e-06, + "loss": 0.6543, + "step": 43519 + }, + { + "epoch": 1.12, + "learning_rate": 1.4473112627657757e-06, + "loss": 0.6904, + "step": 43520 + }, + { + "epoch": 1.12, + "learning_rate": 1.447286514739617e-06, + "loss": 0.6924, + "step": 43521 + }, + { + "epoch": 1.12, + "learning_rate": 1.4472617663709916e-06, + "loss": 0.3418, + "step": 43522 + }, + { + "epoch": 1.12, + "learning_rate": 1.4472370176599183e-06, + "loss": 0.6885, + "step": 43523 + }, + { + "epoch": 1.12, + "learning_rate": 1.447212268606416e-06, + "loss": 0.5415, + "step": 43524 + }, + { + "epoch": 1.12, + "learning_rate": 1.4471875192105042e-06, + "loss": 0.5796, + "step": 43525 + }, + { + "epoch": 1.12, + "learning_rate": 1.4471627694722012e-06, + "loss": 0.6655, + "step": 43526 + }, + { + "epoch": 1.12, + "learning_rate": 1.4471380193915266e-06, + "loss": 0.7383, + "step": 43527 + }, + { + "epoch": 1.12, + "learning_rate": 1.4471132689684987e-06, + "loss": 0.6279, + "step": 43528 + }, + { + "epoch": 1.12, + "learning_rate": 1.4470885182031367e-06, + "loss": 0.6021, + "step": 43529 + }, + { + "epoch": 1.12, + "learning_rate": 1.4470637670954598e-06, + "loss": 0.5139, + "step": 43530 + }, + { + "epoch": 1.12, + "learning_rate": 1.4470390156454866e-06, + "loss": 0.6504, + "step": 43531 + }, + { + "epoch": 1.12, + "learning_rate": 1.447014263853236e-06, + "loss": 0.5454, + "step": 43532 + }, + { + "epoch": 1.12, + "learning_rate": 1.4469895117187274e-06, + "loss": 0.8311, + "step": 43533 + }, + { + "epoch": 1.12, + "learning_rate": 1.4469647592419794e-06, + "loss": 0.707, + "step": 43534 + }, + { + "epoch": 1.12, + "learning_rate": 1.4469400064230111e-06, + "loss": 0.7612, + "step": 43535 + }, + { + "epoch": 1.12, + "learning_rate": 1.4469152532618414e-06, + "loss": 0.7559, + "step": 43536 + }, + { + "epoch": 1.12, + "learning_rate": 1.446890499758489e-06, + "loss": 0.6147, + "step": 43537 + }, + { + "epoch": 1.12, + "learning_rate": 1.4468657459129732e-06, + "loss": 0.6543, + "step": 43538 + }, + { + "epoch": 1.12, + "learning_rate": 1.4468409917253128e-06, + "loss": 0.5835, + "step": 43539 + }, + { + "epoch": 1.12, + "learning_rate": 1.446816237195527e-06, + "loss": 0.7617, + "step": 43540 + }, + { + "epoch": 1.12, + "learning_rate": 1.4467914823236346e-06, + "loss": 0.7295, + "step": 43541 + }, + { + "epoch": 1.12, + "learning_rate": 1.446766727109654e-06, + "loss": 0.5854, + "step": 43542 + }, + { + "epoch": 1.12, + "learning_rate": 1.4467419715536054e-06, + "loss": 0.5977, + "step": 43543 + }, + { + "epoch": 1.12, + "learning_rate": 1.4467172156555062e-06, + "loss": 0.322, + "step": 43544 + }, + { + "epoch": 1.12, + "learning_rate": 1.4466924594153768e-06, + "loss": 0.7471, + "step": 43545 + }, + { + "epoch": 1.12, + "learning_rate": 1.4466677028332354e-06, + "loss": 0.8486, + "step": 43546 + }, + { + "epoch": 1.12, + "learning_rate": 1.446642945909101e-06, + "loss": 0.7031, + "step": 43547 + }, + { + "epoch": 1.12, + "learning_rate": 1.4466181886429926e-06, + "loss": 0.7334, + "step": 43548 + }, + { + "epoch": 1.12, + "learning_rate": 1.446593431034929e-06, + "loss": 0.6621, + "step": 43549 + }, + { + "epoch": 1.12, + "learning_rate": 1.4465686730849301e-06, + "loss": 0.749, + "step": 43550 + }, + { + "epoch": 1.12, + "learning_rate": 1.446543914793013e-06, + "loss": 0.625, + "step": 43551 + }, + { + "epoch": 1.12, + "learning_rate": 1.4465191561591986e-06, + "loss": 0.5874, + "step": 43552 + }, + { + "epoch": 1.12, + "learning_rate": 1.4464943971835045e-06, + "loss": 0.488, + "step": 43553 + }, + { + "epoch": 1.12, + "learning_rate": 1.4464696378659507e-06, + "loss": 0.7305, + "step": 43554 + }, + { + "epoch": 1.12, + "learning_rate": 1.4464448782065553e-06, + "loss": 0.667, + "step": 43555 + }, + { + "epoch": 1.12, + "learning_rate": 1.4464201182053377e-06, + "loss": 0.7646, + "step": 43556 + }, + { + "epoch": 1.12, + "learning_rate": 1.4463953578623164e-06, + "loss": 0.5659, + "step": 43557 + }, + { + "epoch": 1.12, + "learning_rate": 1.446370597177511e-06, + "loss": 0.583, + "step": 43558 + }, + { + "epoch": 1.12, + "learning_rate": 1.44634583615094e-06, + "loss": 0.583, + "step": 43559 + }, + { + "epoch": 1.12, + "learning_rate": 1.446321074782623e-06, + "loss": 0.707, + "step": 43560 + }, + { + "epoch": 1.12, + "learning_rate": 1.4462963130725781e-06, + "loss": 0.6138, + "step": 43561 + }, + { + "epoch": 1.12, + "learning_rate": 1.4462715510208246e-06, + "loss": 0.6196, + "step": 43562 + }, + { + "epoch": 1.12, + "learning_rate": 1.4462467886273815e-06, + "loss": 0.6191, + "step": 43563 + }, + { + "epoch": 1.12, + "learning_rate": 1.4462220258922677e-06, + "loss": 0.5869, + "step": 43564 + }, + { + "epoch": 1.12, + "learning_rate": 1.4461972628155024e-06, + "loss": 0.5791, + "step": 43565 + }, + { + "epoch": 1.12, + "learning_rate": 1.446172499397104e-06, + "loss": 0.5874, + "step": 43566 + }, + { + "epoch": 1.12, + "learning_rate": 1.4461477356370923e-06, + "loss": 0.6841, + "step": 43567 + }, + { + "epoch": 1.12, + "learning_rate": 1.4461229715354858e-06, + "loss": 0.834, + "step": 43568 + }, + { + "epoch": 1.12, + "learning_rate": 1.4460982070923028e-06, + "loss": 0.6001, + "step": 43569 + }, + { + "epoch": 1.12, + "learning_rate": 1.4460734423075636e-06, + "loss": 0.6128, + "step": 43570 + }, + { + "epoch": 1.12, + "learning_rate": 1.4460486771812863e-06, + "loss": 0.748, + "step": 43571 + }, + { + "epoch": 1.12, + "learning_rate": 1.4460239117134898e-06, + "loss": 0.7891, + "step": 43572 + }, + { + "epoch": 1.12, + "learning_rate": 1.4459991459041937e-06, + "loss": 0.8091, + "step": 43573 + }, + { + "epoch": 1.12, + "learning_rate": 1.4459743797534162e-06, + "loss": 0.5488, + "step": 43574 + }, + { + "epoch": 1.12, + "learning_rate": 1.445949613261177e-06, + "loss": 0.5884, + "step": 43575 + }, + { + "epoch": 1.12, + "learning_rate": 1.4459248464274943e-06, + "loss": 0.7002, + "step": 43576 + }, + { + "epoch": 1.12, + "learning_rate": 1.4459000792523876e-06, + "loss": 0.709, + "step": 43577 + }, + { + "epoch": 1.12, + "learning_rate": 1.4458753117358757e-06, + "loss": 0.5532, + "step": 43578 + }, + { + "epoch": 1.12, + "learning_rate": 1.4458505438779779e-06, + "loss": 0.8389, + "step": 43579 + }, + { + "epoch": 1.12, + "learning_rate": 1.4458257756787125e-06, + "loss": 0.6206, + "step": 43580 + }, + { + "epoch": 1.12, + "learning_rate": 1.445801007138099e-06, + "loss": 0.7861, + "step": 43581 + }, + { + "epoch": 1.12, + "learning_rate": 1.4457762382561557e-06, + "loss": 0.7812, + "step": 43582 + }, + { + "epoch": 1.12, + "learning_rate": 1.4457514690329022e-06, + "loss": 0.5543, + "step": 43583 + }, + { + "epoch": 1.12, + "learning_rate": 1.4457266994683575e-06, + "loss": 0.6426, + "step": 43584 + }, + { + "epoch": 1.12, + "learning_rate": 1.4457019295625403e-06, + "loss": 0.5845, + "step": 43585 + }, + { + "epoch": 1.12, + "learning_rate": 1.4456771593154696e-06, + "loss": 0.7422, + "step": 43586 + }, + { + "epoch": 1.12, + "learning_rate": 1.4456523887271645e-06, + "loss": 0.748, + "step": 43587 + }, + { + "epoch": 1.12, + "learning_rate": 1.4456276177976436e-06, + "loss": 0.6665, + "step": 43588 + }, + { + "epoch": 1.12, + "learning_rate": 1.4456028465269264e-06, + "loss": 0.5874, + "step": 43589 + }, + { + "epoch": 1.12, + "learning_rate": 1.4455780749150315e-06, + "loss": 0.6079, + "step": 43590 + }, + { + "epoch": 1.12, + "learning_rate": 1.445553302961978e-06, + "loss": 0.8584, + "step": 43591 + }, + { + "epoch": 1.12, + "learning_rate": 1.4455285306677846e-06, + "loss": 0.6221, + "step": 43592 + }, + { + "epoch": 1.12, + "learning_rate": 1.4455037580324704e-06, + "loss": 0.7627, + "step": 43593 + }, + { + "epoch": 1.12, + "learning_rate": 1.4454789850560552e-06, + "loss": 0.5264, + "step": 43594 + }, + { + "epoch": 1.12, + "learning_rate": 1.4454542117385566e-06, + "loss": 0.6729, + "step": 43595 + }, + { + "epoch": 1.12, + "learning_rate": 1.4454294380799942e-06, + "loss": 0.7354, + "step": 43596 + }, + { + "epoch": 1.12, + "learning_rate": 1.445404664080387e-06, + "loss": 0.6333, + "step": 43597 + }, + { + "epoch": 1.12, + "learning_rate": 1.4453798897397543e-06, + "loss": 0.6953, + "step": 43598 + }, + { + "epoch": 1.12, + "learning_rate": 1.4453551150581142e-06, + "loss": 0.667, + "step": 43599 + }, + { + "epoch": 1.12, + "learning_rate": 1.4453303400354866e-06, + "loss": 0.6602, + "step": 43600 + }, + { + "epoch": 1.12, + "learning_rate": 1.4453055646718896e-06, + "loss": 0.6611, + "step": 43601 + }, + { + "epoch": 1.12, + "learning_rate": 1.445280788967343e-06, + "loss": 0.7578, + "step": 43602 + }, + { + "epoch": 1.12, + "learning_rate": 1.445256012921865e-06, + "loss": 0.7109, + "step": 43603 + }, + { + "epoch": 1.12, + "learning_rate": 1.4452312365354753e-06, + "loss": 0.6436, + "step": 43604 + }, + { + "epoch": 1.12, + "learning_rate": 1.4452064598081924e-06, + "loss": 0.7241, + "step": 43605 + }, + { + "epoch": 1.12, + "learning_rate": 1.4451816827400353e-06, + "loss": 0.6631, + "step": 43606 + }, + { + "epoch": 1.12, + "learning_rate": 1.445156905331023e-06, + "loss": 0.6797, + "step": 43607 + }, + { + "epoch": 1.12, + "learning_rate": 1.4451321275811748e-06, + "loss": 0.6963, + "step": 43608 + }, + { + "epoch": 1.12, + "learning_rate": 1.445107349490509e-06, + "loss": 0.687, + "step": 43609 + }, + { + "epoch": 1.12, + "learning_rate": 1.4450825710590453e-06, + "loss": 0.5273, + "step": 43610 + }, + { + "epoch": 1.12, + "learning_rate": 1.4450577922868021e-06, + "loss": 0.5474, + "step": 43611 + }, + { + "epoch": 1.12, + "learning_rate": 1.4450330131737988e-06, + "loss": 0.5068, + "step": 43612 + }, + { + "epoch": 1.12, + "learning_rate": 1.445008233720054e-06, + "loss": 0.6182, + "step": 43613 + }, + { + "epoch": 1.12, + "learning_rate": 1.4449834539255871e-06, + "loss": 0.5635, + "step": 43614 + }, + { + "epoch": 1.12, + "learning_rate": 1.4449586737904169e-06, + "loss": 0.626, + "step": 43615 + }, + { + "epoch": 1.12, + "learning_rate": 1.444933893314562e-06, + "loss": 0.4861, + "step": 43616 + }, + { + "epoch": 1.12, + "learning_rate": 1.4449091124980418e-06, + "loss": 0.7656, + "step": 43617 + }, + { + "epoch": 1.12, + "learning_rate": 1.444884331340875e-06, + "loss": 0.5908, + "step": 43618 + }, + { + "epoch": 1.12, + "learning_rate": 1.4448595498430812e-06, + "loss": 0.6099, + "step": 43619 + }, + { + "epoch": 1.12, + "learning_rate": 1.4448347680046784e-06, + "loss": 0.6367, + "step": 43620 + }, + { + "epoch": 1.12, + "learning_rate": 1.444809985825686e-06, + "loss": 0.5488, + "step": 43621 + }, + { + "epoch": 1.12, + "learning_rate": 1.4447852033061233e-06, + "loss": 0.6436, + "step": 43622 + }, + { + "epoch": 1.12, + "learning_rate": 1.4447604204460091e-06, + "loss": 0.6992, + "step": 43623 + }, + { + "epoch": 1.12, + "learning_rate": 1.4447356372453623e-06, + "loss": 0.5459, + "step": 43624 + }, + { + "epoch": 1.12, + "learning_rate": 1.4447108537042018e-06, + "loss": 0.6772, + "step": 43625 + }, + { + "epoch": 1.12, + "learning_rate": 1.4446860698225466e-06, + "loss": 0.6729, + "step": 43626 + }, + { + "epoch": 1.12, + "learning_rate": 1.4446612856004157e-06, + "loss": 0.7012, + "step": 43627 + }, + { + "epoch": 1.12, + "learning_rate": 1.4446365010378281e-06, + "loss": 0.6191, + "step": 43628 + }, + { + "epoch": 1.12, + "learning_rate": 1.4446117161348028e-06, + "loss": 0.6436, + "step": 43629 + }, + { + "epoch": 1.12, + "learning_rate": 1.4445869308913587e-06, + "loss": 0.6172, + "step": 43630 + }, + { + "epoch": 1.12, + "learning_rate": 1.4445621453075152e-06, + "loss": 0.6279, + "step": 43631 + }, + { + "epoch": 1.12, + "learning_rate": 1.4445373593832904e-06, + "loss": 0.6289, + "step": 43632 + }, + { + "epoch": 1.12, + "learning_rate": 1.444512573118704e-06, + "loss": 0.6499, + "step": 43633 + }, + { + "epoch": 1.12, + "learning_rate": 1.444487786513775e-06, + "loss": 0.668, + "step": 43634 + }, + { + "epoch": 1.12, + "learning_rate": 1.4444629995685216e-06, + "loss": 0.4231, + "step": 43635 + }, + { + "epoch": 1.12, + "learning_rate": 1.4444382122829636e-06, + "loss": 0.4988, + "step": 43636 + }, + { + "epoch": 1.12, + "learning_rate": 1.4444134246571196e-06, + "loss": 0.6426, + "step": 43637 + }, + { + "epoch": 1.12, + "learning_rate": 1.444388636691009e-06, + "loss": 0.6006, + "step": 43638 + }, + { + "epoch": 1.12, + "learning_rate": 1.4443638483846504e-06, + "loss": 0.7773, + "step": 43639 + }, + { + "epoch": 1.12, + "learning_rate": 1.4443390597380628e-06, + "loss": 0.5815, + "step": 43640 + }, + { + "epoch": 1.12, + "learning_rate": 1.4443142707512648e-06, + "loss": 0.5688, + "step": 43641 + }, + { + "epoch": 1.12, + "learning_rate": 1.444289481424276e-06, + "loss": 0.7065, + "step": 43642 + }, + { + "epoch": 1.12, + "learning_rate": 1.4442646917571153e-06, + "loss": 0.499, + "step": 43643 + }, + { + "epoch": 1.12, + "learning_rate": 1.4442399017498017e-06, + "loss": 0.8125, + "step": 43644 + }, + { + "epoch": 1.12, + "learning_rate": 1.4442151114023537e-06, + "loss": 0.6455, + "step": 43645 + }, + { + "epoch": 1.12, + "learning_rate": 1.4441903207147907e-06, + "loss": 0.5664, + "step": 43646 + }, + { + "epoch": 1.12, + "learning_rate": 1.4441655296871316e-06, + "loss": 0.6084, + "step": 43647 + }, + { + "epoch": 1.12, + "learning_rate": 1.4441407383193956e-06, + "loss": 0.5842, + "step": 43648 + }, + { + "epoch": 1.12, + "learning_rate": 1.4441159466116013e-06, + "loss": 0.3658, + "step": 43649 + }, + { + "epoch": 1.12, + "learning_rate": 1.4440911545637677e-06, + "loss": 0.2881, + "step": 43650 + }, + { + "epoch": 1.12, + "learning_rate": 1.4440663621759142e-06, + "loss": 0.5967, + "step": 43651 + }, + { + "epoch": 1.12, + "learning_rate": 1.4440415694480592e-06, + "loss": 0.5098, + "step": 43652 + }, + { + "epoch": 1.12, + "learning_rate": 1.4440167763802222e-06, + "loss": 0.6729, + "step": 43653 + }, + { + "epoch": 1.12, + "learning_rate": 1.4439919829724218e-06, + "loss": 0.5118, + "step": 43654 + }, + { + "epoch": 1.12, + "learning_rate": 1.4439671892246773e-06, + "loss": 0.4617, + "step": 43655 + }, + { + "epoch": 1.12, + "learning_rate": 1.4439423951370076e-06, + "loss": 0.7739, + "step": 43656 + }, + { + "epoch": 1.12, + "learning_rate": 1.4439176007094313e-06, + "loss": 0.7188, + "step": 43657 + }, + { + "epoch": 1.12, + "learning_rate": 1.443892805941968e-06, + "loss": 0.4492, + "step": 43658 + }, + { + "epoch": 1.12, + "learning_rate": 1.4438680108346367e-06, + "loss": 0.6173, + "step": 43659 + }, + { + "epoch": 1.12, + "learning_rate": 1.4438432153874553e-06, + "loss": 0.5, + "step": 43660 + }, + { + "epoch": 1.12, + "learning_rate": 1.4438184196004441e-06, + "loss": 0.5708, + "step": 43661 + }, + { + "epoch": 1.12, + "learning_rate": 1.4437936234736213e-06, + "loss": 0.7227, + "step": 43662 + }, + { + "epoch": 1.12, + "learning_rate": 1.4437688270070064e-06, + "loss": 0.8242, + "step": 43663 + }, + { + "epoch": 1.12, + "learning_rate": 1.443744030200618e-06, + "loss": 0.7451, + "step": 43664 + }, + { + "epoch": 1.12, + "learning_rate": 1.443719233054475e-06, + "loss": 0.79, + "step": 43665 + }, + { + "epoch": 1.12, + "learning_rate": 1.4436944355685968e-06, + "loss": 0.5947, + "step": 43666 + }, + { + "epoch": 1.12, + "learning_rate": 1.443669637743002e-06, + "loss": 0.5615, + "step": 43667 + }, + { + "epoch": 1.12, + "learning_rate": 1.4436448395777099e-06, + "loss": 0.7441, + "step": 43668 + }, + { + "epoch": 1.12, + "learning_rate": 1.4436200410727396e-06, + "loss": 0.6289, + "step": 43669 + }, + { + "epoch": 1.12, + "learning_rate": 1.4435952422281093e-06, + "loss": 0.5898, + "step": 43670 + }, + { + "epoch": 1.12, + "learning_rate": 1.4435704430438387e-06, + "loss": 0.7207, + "step": 43671 + }, + { + "epoch": 1.12, + "learning_rate": 1.4435456435199464e-06, + "loss": 0.6548, + "step": 43672 + }, + { + "epoch": 1.12, + "learning_rate": 1.4435208436564522e-06, + "loss": 0.5913, + "step": 43673 + }, + { + "epoch": 1.12, + "learning_rate": 1.4434960434533741e-06, + "loss": 0.6328, + "step": 43674 + }, + { + "epoch": 1.12, + "learning_rate": 1.4434712429107316e-06, + "loss": 0.6138, + "step": 43675 + }, + { + "epoch": 1.12, + "learning_rate": 1.4434464420285432e-06, + "loss": 0.7188, + "step": 43676 + }, + { + "epoch": 1.12, + "learning_rate": 1.4434216408068287e-06, + "loss": 0.4454, + "step": 43677 + }, + { + "epoch": 1.12, + "learning_rate": 1.4433968392456064e-06, + "loss": 0.7695, + "step": 43678 + }, + { + "epoch": 1.12, + "learning_rate": 1.4433720373448956e-06, + "loss": 0.6914, + "step": 43679 + }, + { + "epoch": 1.12, + "learning_rate": 1.4433472351047154e-06, + "loss": 0.6479, + "step": 43680 + }, + { + "epoch": 1.12, + "learning_rate": 1.443322432525084e-06, + "loss": 0.4321, + "step": 43681 + }, + { + "epoch": 1.12, + "learning_rate": 1.4432976296060218e-06, + "loss": 0.6099, + "step": 43682 + }, + { + "epoch": 1.12, + "learning_rate": 1.4432728263475462e-06, + "loss": 0.791, + "step": 43683 + }, + { + "epoch": 1.12, + "learning_rate": 1.4432480227496777e-06, + "loss": 0.6406, + "step": 43684 + }, + { + "epoch": 1.12, + "learning_rate": 1.443223218812434e-06, + "loss": 0.6068, + "step": 43685 + }, + { + "epoch": 1.12, + "learning_rate": 1.4431984145358351e-06, + "loss": 0.7256, + "step": 43686 + }, + { + "epoch": 1.12, + "learning_rate": 1.4431736099198993e-06, + "loss": 0.4917, + "step": 43687 + }, + { + "epoch": 1.12, + "learning_rate": 1.4431488049646458e-06, + "loss": 0.8232, + "step": 43688 + }, + { + "epoch": 1.12, + "learning_rate": 1.4431239996700938e-06, + "loss": 0.6553, + "step": 43689 + }, + { + "epoch": 1.12, + "learning_rate": 1.4430991940362622e-06, + "loss": 0.627, + "step": 43690 + }, + { + "epoch": 1.12, + "learning_rate": 1.4430743880631697e-06, + "loss": 0.6294, + "step": 43691 + }, + { + "epoch": 1.12, + "learning_rate": 1.4430495817508356e-06, + "loss": 0.6221, + "step": 43692 + }, + { + "epoch": 1.12, + "learning_rate": 1.4430247750992788e-06, + "loss": 0.4822, + "step": 43693 + }, + { + "epoch": 1.12, + "learning_rate": 1.4429999681085186e-06, + "loss": 0.7012, + "step": 43694 + }, + { + "epoch": 1.12, + "learning_rate": 1.442975160778573e-06, + "loss": 0.667, + "step": 43695 + }, + { + "epoch": 1.12, + "learning_rate": 1.4429503531094625e-06, + "loss": 0.7354, + "step": 43696 + }, + { + "epoch": 1.12, + "learning_rate": 1.4429255451012048e-06, + "loss": 0.6055, + "step": 43697 + }, + { + "epoch": 1.12, + "learning_rate": 1.4429007367538194e-06, + "loss": 0.5664, + "step": 43698 + }, + { + "epoch": 1.12, + "learning_rate": 1.4428759280673255e-06, + "loss": 0.7051, + "step": 43699 + }, + { + "epoch": 1.12, + "learning_rate": 1.4428511190417414e-06, + "loss": 0.5581, + "step": 43700 + }, + { + "epoch": 1.12, + "learning_rate": 1.442826309677087e-06, + "loss": 0.6206, + "step": 43701 + }, + { + "epoch": 1.12, + "learning_rate": 1.4428014999733808e-06, + "loss": 0.7607, + "step": 43702 + }, + { + "epoch": 1.12, + "learning_rate": 1.4427766899306417e-06, + "loss": 0.7157, + "step": 43703 + }, + { + "epoch": 1.12, + "learning_rate": 1.4427518795488888e-06, + "loss": 0.666, + "step": 43704 + }, + { + "epoch": 1.12, + "learning_rate": 1.4427270688281415e-06, + "loss": 0.6284, + "step": 43705 + }, + { + "epoch": 1.12, + "learning_rate": 1.4427022577684181e-06, + "loss": 0.6631, + "step": 43706 + }, + { + "epoch": 1.12, + "learning_rate": 1.442677446369738e-06, + "loss": 0.6162, + "step": 43707 + }, + { + "epoch": 1.12, + "learning_rate": 1.44265263463212e-06, + "loss": 0.6689, + "step": 43708 + }, + { + "epoch": 1.12, + "learning_rate": 1.4426278225555836e-06, + "loss": 0.6069, + "step": 43709 + }, + { + "epoch": 1.12, + "learning_rate": 1.4426030101401472e-06, + "loss": 0.7344, + "step": 43710 + }, + { + "epoch": 1.12, + "learning_rate": 1.44257819738583e-06, + "loss": 0.7959, + "step": 43711 + }, + { + "epoch": 1.12, + "learning_rate": 1.442553384292651e-06, + "loss": 0.7305, + "step": 43712 + }, + { + "epoch": 1.12, + "learning_rate": 1.4425285708606293e-06, + "loss": 0.6797, + "step": 43713 + }, + { + "epoch": 1.12, + "learning_rate": 1.442503757089784e-06, + "loss": 0.4652, + "step": 43714 + }, + { + "epoch": 1.12, + "learning_rate": 1.4424789429801338e-06, + "loss": 0.5029, + "step": 43715 + }, + { + "epoch": 1.12, + "learning_rate": 1.4424541285316976e-06, + "loss": 0.7988, + "step": 43716 + }, + { + "epoch": 1.12, + "learning_rate": 1.442429313744495e-06, + "loss": 0.7192, + "step": 43717 + }, + { + "epoch": 1.12, + "learning_rate": 1.4424044986185443e-06, + "loss": 0.6982, + "step": 43718 + }, + { + "epoch": 1.12, + "learning_rate": 1.4423796831538648e-06, + "loss": 0.666, + "step": 43719 + }, + { + "epoch": 1.12, + "learning_rate": 1.4423548673504758e-06, + "loss": 0.5835, + "step": 43720 + }, + { + "epoch": 1.12, + "learning_rate": 1.4423300512083957e-06, + "loss": 0.7422, + "step": 43721 + }, + { + "epoch": 1.12, + "learning_rate": 1.4423052347276442e-06, + "loss": 0.6523, + "step": 43722 + }, + { + "epoch": 1.12, + "learning_rate": 1.4422804179082395e-06, + "loss": 0.7139, + "step": 43723 + }, + { + "epoch": 1.12, + "learning_rate": 1.4422556007502014e-06, + "loss": 0.6592, + "step": 43724 + }, + { + "epoch": 1.12, + "learning_rate": 1.442230783253548e-06, + "loss": 0.6685, + "step": 43725 + }, + { + "epoch": 1.12, + "learning_rate": 1.4422059654182995e-06, + "loss": 0.7793, + "step": 43726 + }, + { + "epoch": 1.12, + "learning_rate": 1.4421811472444737e-06, + "loss": 0.7422, + "step": 43727 + }, + { + "epoch": 1.12, + "learning_rate": 1.44215632873209e-06, + "loss": 0.6797, + "step": 43728 + }, + { + "epoch": 1.12, + "learning_rate": 1.4421315098811681e-06, + "loss": 0.6562, + "step": 43729 + }, + { + "epoch": 1.12, + "learning_rate": 1.4421066906917263e-06, + "loss": 0.5293, + "step": 43730 + }, + { + "epoch": 1.12, + "learning_rate": 1.4420818711637835e-06, + "loss": 0.4006, + "step": 43731 + }, + { + "epoch": 1.12, + "learning_rate": 1.442057051297359e-06, + "loss": 0.5669, + "step": 43732 + }, + { + "epoch": 1.12, + "learning_rate": 1.4420322310924717e-06, + "loss": 0.6504, + "step": 43733 + }, + { + "epoch": 1.12, + "learning_rate": 1.442007410549141e-06, + "loss": 0.7051, + "step": 43734 + }, + { + "epoch": 1.12, + "learning_rate": 1.4419825896673853e-06, + "loss": 0.8555, + "step": 43735 + }, + { + "epoch": 1.12, + "learning_rate": 1.4419577684472237e-06, + "loss": 0.5437, + "step": 43736 + }, + { + "epoch": 1.12, + "learning_rate": 1.4419329468886754e-06, + "loss": 0.6348, + "step": 43737 + }, + { + "epoch": 1.12, + "learning_rate": 1.4419081249917595e-06, + "loss": 0.6277, + "step": 43738 + }, + { + "epoch": 1.12, + "learning_rate": 1.441883302756495e-06, + "loss": 0.6685, + "step": 43739 + }, + { + "epoch": 1.12, + "learning_rate": 1.4418584801829005e-06, + "loss": 0.6846, + "step": 43740 + }, + { + "epoch": 1.12, + "learning_rate": 1.4418336572709952e-06, + "loss": 0.7031, + "step": 43741 + }, + { + "epoch": 1.12, + "learning_rate": 1.4418088340207987e-06, + "loss": 0.6067, + "step": 43742 + }, + { + "epoch": 1.12, + "learning_rate": 1.441784010432329e-06, + "loss": 0.8193, + "step": 43743 + }, + { + "epoch": 1.12, + "learning_rate": 1.4417591865056057e-06, + "loss": 0.5859, + "step": 43744 + }, + { + "epoch": 1.12, + "learning_rate": 1.441734362240648e-06, + "loss": 0.7305, + "step": 43745 + }, + { + "epoch": 1.12, + "learning_rate": 1.4417095376374741e-06, + "loss": 0.637, + "step": 43746 + }, + { + "epoch": 1.12, + "learning_rate": 1.4416847126961039e-06, + "loss": 0.6699, + "step": 43747 + }, + { + "epoch": 1.12, + "learning_rate": 1.441659887416556e-06, + "loss": 0.5869, + "step": 43748 + }, + { + "epoch": 1.12, + "learning_rate": 1.4416350617988494e-06, + "loss": 0.7363, + "step": 43749 + }, + { + "epoch": 1.12, + "learning_rate": 1.4416102358430028e-06, + "loss": 0.7734, + "step": 43750 + }, + { + "epoch": 1.12, + "learning_rate": 1.4415854095490362e-06, + "loss": 0.6113, + "step": 43751 + }, + { + "epoch": 1.12, + "learning_rate": 1.4415605829169672e-06, + "loss": 0.3911, + "step": 43752 + }, + { + "epoch": 1.12, + "learning_rate": 1.441535755946816e-06, + "loss": 0.5938, + "step": 43753 + }, + { + "epoch": 1.12, + "learning_rate": 1.4415109286386011e-06, + "loss": 0.4639, + "step": 43754 + }, + { + "epoch": 1.12, + "learning_rate": 1.4414861009923417e-06, + "loss": 0.6904, + "step": 43755 + }, + { + "epoch": 1.12, + "learning_rate": 1.4414612730080567e-06, + "loss": 0.6338, + "step": 43756 + }, + { + "epoch": 1.12, + "learning_rate": 1.441436444685765e-06, + "loss": 0.4238, + "step": 43757 + }, + { + "epoch": 1.12, + "learning_rate": 1.4414116160254856e-06, + "loss": 0.7363, + "step": 43758 + }, + { + "epoch": 1.12, + "learning_rate": 1.441386787027238e-06, + "loss": 0.6855, + "step": 43759 + }, + { + "epoch": 1.12, + "learning_rate": 1.4413619576910402e-06, + "loss": 0.6187, + "step": 43760 + }, + { + "epoch": 1.12, + "learning_rate": 1.4413371280169124e-06, + "loss": 0.7695, + "step": 43761 + }, + { + "epoch": 1.12, + "learning_rate": 1.4413122980048728e-06, + "loss": 0.625, + "step": 43762 + }, + { + "epoch": 1.12, + "learning_rate": 1.441287467654941e-06, + "loss": 0.6279, + "step": 43763 + }, + { + "epoch": 1.12, + "learning_rate": 1.4412626369671353e-06, + "loss": 0.7598, + "step": 43764 + }, + { + "epoch": 1.12, + "learning_rate": 1.441237805941475e-06, + "loss": 0.7666, + "step": 43765 + }, + { + "epoch": 1.12, + "learning_rate": 1.4412129745779796e-06, + "loss": 0.6675, + "step": 43766 + }, + { + "epoch": 1.12, + "learning_rate": 1.4411881428766675e-06, + "loss": 0.7607, + "step": 43767 + }, + { + "epoch": 1.12, + "learning_rate": 1.4411633108375578e-06, + "loss": 0.6499, + "step": 43768 + }, + { + "epoch": 1.12, + "learning_rate": 1.4411384784606698e-06, + "loss": 0.4534, + "step": 43769 + }, + { + "epoch": 1.12, + "learning_rate": 1.4411136457460225e-06, + "loss": 0.6631, + "step": 43770 + }, + { + "epoch": 1.12, + "learning_rate": 1.4410888126936341e-06, + "loss": 0.6895, + "step": 43771 + }, + { + "epoch": 1.12, + "learning_rate": 1.441063979303525e-06, + "loss": 0.5791, + "step": 43772 + }, + { + "epoch": 1.12, + "learning_rate": 1.4410391455757131e-06, + "loss": 0.51, + "step": 43773 + }, + { + "epoch": 1.12, + "learning_rate": 1.4410143115102185e-06, + "loss": 0.5608, + "step": 43774 + }, + { + "epoch": 1.12, + "learning_rate": 1.4409894771070587e-06, + "loss": 0.6592, + "step": 43775 + }, + { + "epoch": 1.12, + "learning_rate": 1.440964642366254e-06, + "loss": 0.6743, + "step": 43776 + }, + { + "epoch": 1.12, + "learning_rate": 1.4409398072878226e-06, + "loss": 0.5508, + "step": 43777 + }, + { + "epoch": 1.12, + "learning_rate": 1.4409149718717841e-06, + "loss": 0.665, + "step": 43778 + }, + { + "epoch": 1.12, + "learning_rate": 1.4408901361181571e-06, + "loss": 0.7637, + "step": 43779 + }, + { + "epoch": 1.12, + "learning_rate": 1.440865300026961e-06, + "loss": 0.6587, + "step": 43780 + }, + { + "epoch": 1.12, + "learning_rate": 1.4408404635982144e-06, + "loss": 0.6782, + "step": 43781 + }, + { + "epoch": 1.12, + "learning_rate": 1.4408156268319367e-06, + "loss": 0.3733, + "step": 43782 + }, + { + "epoch": 1.12, + "learning_rate": 1.4407907897281466e-06, + "loss": 0.5415, + "step": 43783 + }, + { + "epoch": 1.12, + "learning_rate": 1.4407659522868636e-06, + "loss": 0.625, + "step": 43784 + }, + { + "epoch": 1.12, + "learning_rate": 1.4407411145081061e-06, + "loss": 0.7153, + "step": 43785 + }, + { + "epoch": 1.12, + "learning_rate": 1.4407162763918933e-06, + "loss": 0.5588, + "step": 43786 + }, + { + "epoch": 1.12, + "learning_rate": 1.4406914379382444e-06, + "loss": 0.8379, + "step": 43787 + }, + { + "epoch": 1.12, + "learning_rate": 1.4406665991471784e-06, + "loss": 0.5264, + "step": 43788 + }, + { + "epoch": 1.12, + "learning_rate": 1.4406417600187144e-06, + "loss": 0.6099, + "step": 43789 + }, + { + "epoch": 1.12, + "learning_rate": 1.4406169205528709e-06, + "loss": 0.75, + "step": 43790 + }, + { + "epoch": 1.12, + "learning_rate": 1.4405920807496674e-06, + "loss": 0.6255, + "step": 43791 + }, + { + "epoch": 1.12, + "learning_rate": 1.440567240609123e-06, + "loss": 0.7344, + "step": 43792 + }, + { + "epoch": 1.12, + "learning_rate": 1.4405424001312563e-06, + "loss": 0.5596, + "step": 43793 + }, + { + "epoch": 1.12, + "learning_rate": 1.4405175593160867e-06, + "loss": 0.5928, + "step": 43794 + }, + { + "epoch": 1.12, + "learning_rate": 1.440492718163633e-06, + "loss": 0.7832, + "step": 43795 + }, + { + "epoch": 1.12, + "learning_rate": 1.4404678766739142e-06, + "loss": 0.7217, + "step": 43796 + }, + { + "epoch": 1.12, + "learning_rate": 1.4404430348469496e-06, + "loss": 0.6836, + "step": 43797 + }, + { + "epoch": 1.12, + "learning_rate": 1.4404181926827576e-06, + "loss": 0.6472, + "step": 43798 + }, + { + "epoch": 1.12, + "learning_rate": 1.4403933501813582e-06, + "loss": 0.582, + "step": 43799 + }, + { + "epoch": 1.12, + "learning_rate": 1.4403685073427697e-06, + "loss": 0.7412, + "step": 43800 + }, + { + "epoch": 1.12, + "learning_rate": 1.440343664167011e-06, + "loss": 0.5474, + "step": 43801 + }, + { + "epoch": 1.12, + "learning_rate": 1.4403188206541016e-06, + "loss": 0.7158, + "step": 43802 + }, + { + "epoch": 1.12, + "learning_rate": 1.4402939768040604e-06, + "loss": 0.5518, + "step": 43803 + }, + { + "epoch": 1.12, + "learning_rate": 1.4402691326169062e-06, + "loss": 0.8018, + "step": 43804 + }, + { + "epoch": 1.12, + "learning_rate": 1.4402442880926583e-06, + "loss": 0.5437, + "step": 43805 + }, + { + "epoch": 1.12, + "learning_rate": 1.4402194432313354e-06, + "loss": 0.6982, + "step": 43806 + }, + { + "epoch": 1.12, + "learning_rate": 1.4401945980329569e-06, + "loss": 0.6061, + "step": 43807 + }, + { + "epoch": 1.12, + "learning_rate": 1.4401697524975414e-06, + "loss": 0.6479, + "step": 43808 + }, + { + "epoch": 1.12, + "learning_rate": 1.4401449066251084e-06, + "loss": 0.7935, + "step": 43809 + }, + { + "epoch": 1.12, + "learning_rate": 1.4401200604156767e-06, + "loss": 0.7188, + "step": 43810 + }, + { + "epoch": 1.12, + "learning_rate": 1.4400952138692653e-06, + "loss": 0.6909, + "step": 43811 + }, + { + "epoch": 1.12, + "learning_rate": 1.4400703669858928e-06, + "loss": 0.4805, + "step": 43812 + }, + { + "epoch": 1.12, + "learning_rate": 1.4400455197655791e-06, + "loss": 0.5132, + "step": 43813 + }, + { + "epoch": 1.12, + "learning_rate": 1.4400206722083428e-06, + "loss": 0.5547, + "step": 43814 + }, + { + "epoch": 1.12, + "learning_rate": 1.4399958243142027e-06, + "loss": 0.6709, + "step": 43815 + }, + { + "epoch": 1.12, + "learning_rate": 1.4399709760831781e-06, + "loss": 0.749, + "step": 43816 + }, + { + "epoch": 1.12, + "learning_rate": 1.439946127515288e-06, + "loss": 0.7085, + "step": 43817 + }, + { + "epoch": 1.12, + "learning_rate": 1.4399212786105514e-06, + "loss": 0.6016, + "step": 43818 + }, + { + "epoch": 1.12, + "learning_rate": 1.4398964293689873e-06, + "loss": 0.708, + "step": 43819 + }, + { + "epoch": 1.12, + "learning_rate": 1.4398715797906147e-06, + "loss": 0.6172, + "step": 43820 + }, + { + "epoch": 1.12, + "learning_rate": 1.4398467298754526e-06, + "loss": 0.5625, + "step": 43821 + }, + { + "epoch": 1.12, + "learning_rate": 1.43982187962352e-06, + "loss": 0.6479, + "step": 43822 + }, + { + "epoch": 1.12, + "learning_rate": 1.439797029034836e-06, + "loss": 0.6694, + "step": 43823 + }, + { + "epoch": 1.12, + "learning_rate": 1.4397721781094202e-06, + "loss": 0.6729, + "step": 43824 + }, + { + "epoch": 1.12, + "learning_rate": 1.4397473268472903e-06, + "loss": 0.6709, + "step": 43825 + }, + { + "epoch": 1.12, + "learning_rate": 1.4397224752484666e-06, + "loss": 0.6729, + "step": 43826 + }, + { + "epoch": 1.12, + "learning_rate": 1.4396976233129674e-06, + "loss": 0.6782, + "step": 43827 + }, + { + "epoch": 1.12, + "learning_rate": 1.439672771040812e-06, + "loss": 0.5425, + "step": 43828 + }, + { + "epoch": 1.12, + "learning_rate": 1.4396479184320193e-06, + "loss": 0.542, + "step": 43829 + }, + { + "epoch": 1.12, + "learning_rate": 1.4396230654866086e-06, + "loss": 0.5144, + "step": 43830 + }, + { + "epoch": 1.12, + "learning_rate": 1.4395982122045985e-06, + "loss": 0.6699, + "step": 43831 + }, + { + "epoch": 1.12, + "learning_rate": 1.4395733585860086e-06, + "loss": 0.7148, + "step": 43832 + }, + { + "epoch": 1.12, + "learning_rate": 1.4395485046308571e-06, + "loss": 0.5571, + "step": 43833 + }, + { + "epoch": 1.12, + "learning_rate": 1.4395236503391638e-06, + "loss": 0.6709, + "step": 43834 + }, + { + "epoch": 1.12, + "learning_rate": 1.4394987957109477e-06, + "loss": 0.6807, + "step": 43835 + }, + { + "epoch": 1.12, + "learning_rate": 1.439473940746227e-06, + "loss": 0.6709, + "step": 43836 + }, + { + "epoch": 1.12, + "learning_rate": 1.4394490854450216e-06, + "loss": 0.8389, + "step": 43837 + }, + { + "epoch": 1.12, + "learning_rate": 1.4394242298073503e-06, + "loss": 0.7002, + "step": 43838 + }, + { + "epoch": 1.12, + "learning_rate": 1.4393993738332321e-06, + "loss": 0.7324, + "step": 43839 + }, + { + "epoch": 1.12, + "learning_rate": 1.439374517522686e-06, + "loss": 0.5957, + "step": 43840 + }, + { + "epoch": 1.12, + "learning_rate": 1.439349660875731e-06, + "loss": 0.5425, + "step": 43841 + }, + { + "epoch": 1.12, + "learning_rate": 1.439324803892386e-06, + "loss": 0.8438, + "step": 43842 + }, + { + "epoch": 1.12, + "learning_rate": 1.4392999465726704e-06, + "loss": 0.5474, + "step": 43843 + }, + { + "epoch": 1.12, + "learning_rate": 1.439275088916603e-06, + "loss": 0.9287, + "step": 43844 + }, + { + "epoch": 1.12, + "learning_rate": 1.439250230924203e-06, + "loss": 0.7588, + "step": 43845 + }, + { + "epoch": 1.12, + "learning_rate": 1.439225372595489e-06, + "loss": 0.5232, + "step": 43846 + }, + { + "epoch": 1.12, + "learning_rate": 1.4392005139304803e-06, + "loss": 0.6895, + "step": 43847 + }, + { + "epoch": 1.12, + "learning_rate": 1.4391756549291963e-06, + "loss": 0.6631, + "step": 43848 + }, + { + "epoch": 1.12, + "learning_rate": 1.4391507955916557e-06, + "loss": 0.7246, + "step": 43849 + }, + { + "epoch": 1.12, + "learning_rate": 1.4391259359178772e-06, + "loss": 0.7549, + "step": 43850 + }, + { + "epoch": 1.12, + "learning_rate": 1.4391010759078803e-06, + "loss": 0.7539, + "step": 43851 + }, + { + "epoch": 1.12, + "learning_rate": 1.4390762155616838e-06, + "loss": 0.7334, + "step": 43852 + }, + { + "epoch": 1.12, + "learning_rate": 1.439051354879307e-06, + "loss": 0.792, + "step": 43853 + }, + { + "epoch": 1.12, + "learning_rate": 1.4390264938607688e-06, + "loss": 0.7432, + "step": 43854 + }, + { + "epoch": 1.12, + "learning_rate": 1.439001632506088e-06, + "loss": 0.6973, + "step": 43855 + }, + { + "epoch": 1.12, + "learning_rate": 1.4389767708152837e-06, + "loss": 0.5479, + "step": 43856 + }, + { + "epoch": 1.12, + "learning_rate": 1.4389519087883754e-06, + "loss": 0.583, + "step": 43857 + }, + { + "epoch": 1.12, + "learning_rate": 1.4389270464253818e-06, + "loss": 0.6206, + "step": 43858 + }, + { + "epoch": 1.12, + "learning_rate": 1.4389021837263217e-06, + "loss": 0.6787, + "step": 43859 + }, + { + "epoch": 1.12, + "learning_rate": 1.4388773206912149e-06, + "loss": 0.6699, + "step": 43860 + }, + { + "epoch": 1.12, + "learning_rate": 1.4388524573200793e-06, + "loss": 0.626, + "step": 43861 + }, + { + "epoch": 1.12, + "learning_rate": 1.4388275936129348e-06, + "loss": 0.5544, + "step": 43862 + }, + { + "epoch": 1.12, + "learning_rate": 1.4388027295698003e-06, + "loss": 0.4041, + "step": 43863 + }, + { + "epoch": 1.12, + "learning_rate": 1.4387778651906948e-06, + "loss": 0.5547, + "step": 43864 + }, + { + "epoch": 1.12, + "learning_rate": 1.438753000475637e-06, + "loss": 0.7349, + "step": 43865 + }, + { + "epoch": 1.12, + "learning_rate": 1.4387281354246464e-06, + "loss": 0.6567, + "step": 43866 + }, + { + "epoch": 1.12, + "learning_rate": 1.4387032700377416e-06, + "loss": 0.7012, + "step": 43867 + }, + { + "epoch": 1.12, + "learning_rate": 1.4386784043149418e-06, + "loss": 0.668, + "step": 43868 + }, + { + "epoch": 1.12, + "learning_rate": 1.4386535382562665e-06, + "loss": 0.6499, + "step": 43869 + }, + { + "epoch": 1.12, + "learning_rate": 1.4386286718617343e-06, + "loss": 0.8408, + "step": 43870 + }, + { + "epoch": 1.12, + "learning_rate": 1.438603805131364e-06, + "loss": 0.6123, + "step": 43871 + }, + { + "epoch": 1.12, + "learning_rate": 1.438578938065175e-06, + "loss": 0.6914, + "step": 43872 + }, + { + "epoch": 1.12, + "learning_rate": 1.4385540706631867e-06, + "loss": 0.7529, + "step": 43873 + }, + { + "epoch": 1.12, + "learning_rate": 1.4385292029254173e-06, + "loss": 0.8809, + "step": 43874 + }, + { + "epoch": 1.12, + "learning_rate": 1.4385043348518862e-06, + "loss": 0.6641, + "step": 43875 + }, + { + "epoch": 1.12, + "learning_rate": 1.4384794664426127e-06, + "loss": 0.4795, + "step": 43876 + }, + { + "epoch": 1.12, + "learning_rate": 1.4384545976976155e-06, + "loss": 0.5559, + "step": 43877 + }, + { + "epoch": 1.12, + "learning_rate": 1.4384297286169141e-06, + "loss": 0.4841, + "step": 43878 + }, + { + "epoch": 1.12, + "learning_rate": 1.4384048592005268e-06, + "loss": 0.4594, + "step": 43879 + }, + { + "epoch": 1.12, + "learning_rate": 1.4383799894484732e-06, + "loss": 0.8701, + "step": 43880 + }, + { + "epoch": 1.12, + "learning_rate": 1.438355119360772e-06, + "loss": 0.8125, + "step": 43881 + }, + { + "epoch": 1.12, + "learning_rate": 1.4383302489374428e-06, + "loss": 0.7012, + "step": 43882 + }, + { + "epoch": 1.12, + "learning_rate": 1.4383053781785044e-06, + "loss": 0.5688, + "step": 43883 + }, + { + "epoch": 1.12, + "learning_rate": 1.4382805070839755e-06, + "loss": 0.7842, + "step": 43884 + }, + { + "epoch": 1.12, + "learning_rate": 1.438255635653875e-06, + "loss": 0.7988, + "step": 43885 + }, + { + "epoch": 1.12, + "learning_rate": 1.4382307638882228e-06, + "loss": 0.6953, + "step": 43886 + }, + { + "epoch": 1.12, + "learning_rate": 1.4382058917870373e-06, + "loss": 0.6807, + "step": 43887 + }, + { + "epoch": 1.12, + "learning_rate": 1.4381810193503378e-06, + "loss": 0.5415, + "step": 43888 + }, + { + "epoch": 1.12, + "learning_rate": 1.4381561465781432e-06, + "loss": 0.6233, + "step": 43889 + }, + { + "epoch": 1.12, + "learning_rate": 1.4381312734704723e-06, + "loss": 0.5354, + "step": 43890 + }, + { + "epoch": 1.12, + "learning_rate": 1.438106400027345e-06, + "loss": 0.6284, + "step": 43891 + }, + { + "epoch": 1.12, + "learning_rate": 1.438081526248779e-06, + "loss": 0.519, + "step": 43892 + }, + { + "epoch": 1.12, + "learning_rate": 1.438056652134795e-06, + "loss": 0.7188, + "step": 43893 + }, + { + "epoch": 1.13, + "learning_rate": 1.4380317776854106e-06, + "loss": 0.6211, + "step": 43894 + }, + { + "epoch": 1.13, + "learning_rate": 1.4380069029006454e-06, + "loss": 0.5021, + "step": 43895 + }, + { + "epoch": 1.13, + "learning_rate": 1.4379820277805186e-06, + "loss": 0.5933, + "step": 43896 + }, + { + "epoch": 1.13, + "learning_rate": 1.4379571523250491e-06, + "loss": 0.7646, + "step": 43897 + }, + { + "epoch": 1.13, + "learning_rate": 1.4379322765342559e-06, + "loss": 0.4951, + "step": 43898 + }, + { + "epoch": 1.13, + "learning_rate": 1.4379074004081583e-06, + "loss": 0.411, + "step": 43899 + }, + { + "epoch": 1.13, + "learning_rate": 1.437882523946775e-06, + "loss": 0.5957, + "step": 43900 + }, + { + "epoch": 1.13, + "learning_rate": 1.437857647150125e-06, + "loss": 0.7314, + "step": 43901 + }, + { + "epoch": 1.13, + "learning_rate": 1.4378327700182276e-06, + "loss": 0.6992, + "step": 43902 + }, + { + "epoch": 1.13, + "learning_rate": 1.437807892551102e-06, + "loss": 0.6348, + "step": 43903 + }, + { + "epoch": 1.13, + "learning_rate": 1.4377830147487668e-06, + "loss": 0.6802, + "step": 43904 + }, + { + "epoch": 1.13, + "learning_rate": 1.4377581366112412e-06, + "loss": 0.5403, + "step": 43905 + }, + { + "epoch": 1.13, + "learning_rate": 1.4377332581385447e-06, + "loss": 0.7441, + "step": 43906 + }, + { + "epoch": 1.13, + "learning_rate": 1.4377083793306955e-06, + "loss": 0.5757, + "step": 43907 + }, + { + "epoch": 1.13, + "learning_rate": 1.4376835001877136e-06, + "loss": 0.6582, + "step": 43908 + }, + { + "epoch": 1.13, + "learning_rate": 1.4376586207096174e-06, + "loss": 0.5825, + "step": 43909 + }, + { + "epoch": 1.13, + "learning_rate": 1.437633740896426e-06, + "loss": 0.5947, + "step": 43910 + }, + { + "epoch": 1.13, + "learning_rate": 1.4376088607481585e-06, + "loss": 0.8027, + "step": 43911 + }, + { + "epoch": 1.13, + "learning_rate": 1.437583980264834e-06, + "loss": 0.3591, + "step": 43912 + }, + { + "epoch": 1.13, + "learning_rate": 1.437559099446472e-06, + "loss": 0.7422, + "step": 43913 + }, + { + "epoch": 1.13, + "learning_rate": 1.437534218293091e-06, + "loss": 0.5415, + "step": 43914 + }, + { + "epoch": 1.13, + "learning_rate": 1.4375093368047097e-06, + "loss": 0.5908, + "step": 43915 + }, + { + "epoch": 1.13, + "learning_rate": 1.4374844549813482e-06, + "loss": 0.5405, + "step": 43916 + }, + { + "epoch": 1.13, + "learning_rate": 1.4374595728230243e-06, + "loss": 0.5605, + "step": 43917 + }, + { + "epoch": 1.13, + "learning_rate": 1.4374346903297584e-06, + "loss": 0.5283, + "step": 43918 + }, + { + "epoch": 1.13, + "learning_rate": 1.4374098075015685e-06, + "loss": 0.6421, + "step": 43919 + }, + { + "epoch": 1.13, + "learning_rate": 1.437384924338474e-06, + "loss": 0.6455, + "step": 43920 + }, + { + "epoch": 1.13, + "learning_rate": 1.437360040840494e-06, + "loss": 0.4819, + "step": 43921 + }, + { + "epoch": 1.13, + "learning_rate": 1.4373351570076478e-06, + "loss": 0.6138, + "step": 43922 + }, + { + "epoch": 1.13, + "learning_rate": 1.437310272839954e-06, + "loss": 0.5288, + "step": 43923 + }, + { + "epoch": 1.13, + "learning_rate": 1.4372853883374316e-06, + "loss": 0.5938, + "step": 43924 + }, + { + "epoch": 1.13, + "learning_rate": 1.4372605035001005e-06, + "loss": 0.6572, + "step": 43925 + }, + { + "epoch": 1.13, + "learning_rate": 1.4372356183279784e-06, + "loss": 0.6826, + "step": 43926 + }, + { + "epoch": 1.13, + "learning_rate": 1.4372107328210853e-06, + "loss": 0.6064, + "step": 43927 + }, + { + "epoch": 1.13, + "learning_rate": 1.4371858469794404e-06, + "loss": 0.6714, + "step": 43928 + }, + { + "epoch": 1.13, + "learning_rate": 1.4371609608030624e-06, + "loss": 0.6147, + "step": 43929 + }, + { + "epoch": 1.13, + "learning_rate": 1.4371360742919699e-06, + "loss": 0.5889, + "step": 43930 + }, + { + "epoch": 1.13, + "learning_rate": 1.4371111874461829e-06, + "loss": 0.751, + "step": 43931 + }, + { + "epoch": 1.13, + "learning_rate": 1.4370863002657191e-06, + "loss": 0.6338, + "step": 43932 + }, + { + "epoch": 1.13, + "learning_rate": 1.4370614127505995e-06, + "loss": 0.7842, + "step": 43933 + }, + { + "epoch": 1.13, + "learning_rate": 1.4370365249008415e-06, + "loss": 0.5171, + "step": 43934 + }, + { + "epoch": 1.13, + "learning_rate": 1.4370116367164648e-06, + "loss": 0.4404, + "step": 43935 + }, + { + "epoch": 1.13, + "learning_rate": 1.4369867481974884e-06, + "loss": 0.5359, + "step": 43936 + }, + { + "epoch": 1.13, + "learning_rate": 1.4369618593439312e-06, + "loss": 0.7363, + "step": 43937 + }, + { + "epoch": 1.13, + "learning_rate": 1.4369369701558128e-06, + "loss": 0.4412, + "step": 43938 + }, + { + "epoch": 1.13, + "learning_rate": 1.4369120806331516e-06, + "loss": 0.6606, + "step": 43939 + }, + { + "epoch": 1.13, + "learning_rate": 1.4368871907759667e-06, + "loss": 0.6738, + "step": 43940 + }, + { + "epoch": 1.13, + "learning_rate": 1.4368623005842776e-06, + "loss": 0.7041, + "step": 43941 + }, + { + "epoch": 1.13, + "learning_rate": 1.4368374100581032e-06, + "loss": 0.7676, + "step": 43942 + }, + { + "epoch": 1.13, + "learning_rate": 1.4368125191974622e-06, + "loss": 0.7129, + "step": 43943 + }, + { + "epoch": 1.13, + "learning_rate": 1.4367876280023742e-06, + "loss": 0.5952, + "step": 43944 + }, + { + "epoch": 1.13, + "learning_rate": 1.4367627364728581e-06, + "loss": 0.6543, + "step": 43945 + }, + { + "epoch": 1.13, + "learning_rate": 1.4367378446089324e-06, + "loss": 0.6826, + "step": 43946 + }, + { + "epoch": 1.13, + "learning_rate": 1.436712952410617e-06, + "loss": 0.6914, + "step": 43947 + }, + { + "epoch": 1.13, + "learning_rate": 1.4366880598779305e-06, + "loss": 0.5537, + "step": 43948 + }, + { + "epoch": 1.13, + "learning_rate": 1.436663167010892e-06, + "loss": 0.8682, + "step": 43949 + }, + { + "epoch": 1.13, + "learning_rate": 1.4366382738095206e-06, + "loss": 0.627, + "step": 43950 + }, + { + "epoch": 1.13, + "learning_rate": 1.4366133802738351e-06, + "loss": 0.6343, + "step": 43951 + }, + { + "epoch": 1.13, + "learning_rate": 1.436588486403855e-06, + "loss": 0.5044, + "step": 43952 + }, + { + "epoch": 1.13, + "learning_rate": 1.4365635921995993e-06, + "loss": 0.7295, + "step": 43953 + }, + { + "epoch": 1.13, + "learning_rate": 1.436538697661087e-06, + "loss": 0.5986, + "step": 43954 + }, + { + "epoch": 1.13, + "learning_rate": 1.4365138027883368e-06, + "loss": 0.7266, + "step": 43955 + }, + { + "epoch": 1.13, + "learning_rate": 1.4364889075813683e-06, + "loss": 0.8623, + "step": 43956 + }, + { + "epoch": 1.13, + "learning_rate": 1.4364640120402e-06, + "loss": 0.5146, + "step": 43957 + }, + { + "epoch": 1.13, + "learning_rate": 1.4364391161648516e-06, + "loss": 0.6055, + "step": 43958 + }, + { + "epoch": 1.13, + "learning_rate": 1.4364142199553417e-06, + "loss": 0.4651, + "step": 43959 + }, + { + "epoch": 1.13, + "learning_rate": 1.4363893234116894e-06, + "loss": 0.626, + "step": 43960 + }, + { + "epoch": 1.13, + "learning_rate": 1.4363644265339141e-06, + "loss": 0.5974, + "step": 43961 + }, + { + "epoch": 1.13, + "learning_rate": 1.4363395293220344e-06, + "loss": 0.6719, + "step": 43962 + }, + { + "epoch": 1.13, + "learning_rate": 1.43631463177607e-06, + "loss": 0.666, + "step": 43963 + }, + { + "epoch": 1.13, + "learning_rate": 1.4362897338960391e-06, + "loss": 0.7959, + "step": 43964 + }, + { + "epoch": 1.13, + "learning_rate": 1.4362648356819614e-06, + "loss": 0.5149, + "step": 43965 + }, + { + "epoch": 1.13, + "learning_rate": 1.4362399371338556e-06, + "loss": 0.6104, + "step": 43966 + }, + { + "epoch": 1.13, + "learning_rate": 1.4362150382517408e-06, + "loss": 0.4878, + "step": 43967 + }, + { + "epoch": 1.13, + "learning_rate": 1.4361901390356366e-06, + "loss": 0.6348, + "step": 43968 + }, + { + "epoch": 1.13, + "learning_rate": 1.4361652394855618e-06, + "loss": 0.6045, + "step": 43969 + }, + { + "epoch": 1.13, + "learning_rate": 1.4361403396015349e-06, + "loss": 0.7002, + "step": 43970 + }, + { + "epoch": 1.13, + "learning_rate": 1.4361154393835756e-06, + "loss": 0.3394, + "step": 43971 + }, + { + "epoch": 1.13, + "learning_rate": 1.4360905388317024e-06, + "loss": 0.6045, + "step": 43972 + }, + { + "epoch": 1.13, + "learning_rate": 1.4360656379459353e-06, + "loss": 0.7441, + "step": 43973 + }, + { + "epoch": 1.13, + "learning_rate": 1.4360407367262925e-06, + "loss": 0.8057, + "step": 43974 + }, + { + "epoch": 1.13, + "learning_rate": 1.4360158351727933e-06, + "loss": 0.7422, + "step": 43975 + }, + { + "epoch": 1.13, + "learning_rate": 1.435990933285457e-06, + "loss": 0.6343, + "step": 43976 + }, + { + "epoch": 1.13, + "learning_rate": 1.4359660310643023e-06, + "loss": 0.5942, + "step": 43977 + }, + { + "epoch": 1.13, + "learning_rate": 1.4359411285093486e-06, + "loss": 0.5869, + "step": 43978 + }, + { + "epoch": 1.13, + "learning_rate": 1.435916225620615e-06, + "loss": 0.6396, + "step": 43979 + }, + { + "epoch": 1.13, + "learning_rate": 1.4358913223981198e-06, + "loss": 0.583, + "step": 43980 + }, + { + "epoch": 1.13, + "learning_rate": 1.4358664188418832e-06, + "loss": 0.5044, + "step": 43981 + }, + { + "epoch": 1.13, + "learning_rate": 1.4358415149519235e-06, + "loss": 0.876, + "step": 43982 + }, + { + "epoch": 1.13, + "learning_rate": 1.4358166107282603e-06, + "loss": 0.7988, + "step": 43983 + }, + { + "epoch": 1.13, + "learning_rate": 1.435791706170912e-06, + "loss": 0.8213, + "step": 43984 + }, + { + "epoch": 1.13, + "learning_rate": 1.435766801279898e-06, + "loss": 0.688, + "step": 43985 + }, + { + "epoch": 1.13, + "learning_rate": 1.4357418960552376e-06, + "loss": 0.7148, + "step": 43986 + }, + { + "epoch": 1.13, + "learning_rate": 1.4357169904969494e-06, + "loss": 0.7256, + "step": 43987 + }, + { + "epoch": 1.13, + "learning_rate": 1.4356920846050532e-06, + "loss": 0.7319, + "step": 43988 + }, + { + "epoch": 1.13, + "learning_rate": 1.4356671783795671e-06, + "loss": 0.7549, + "step": 43989 + }, + { + "epoch": 1.13, + "learning_rate": 1.435642271820511e-06, + "loss": 0.4607, + "step": 43990 + }, + { + "epoch": 1.13, + "learning_rate": 1.4356173649279038e-06, + "loss": 0.5918, + "step": 43991 + }, + { + "epoch": 1.13, + "learning_rate": 1.435592457701764e-06, + "loss": 0.5488, + "step": 43992 + }, + { + "epoch": 1.13, + "learning_rate": 1.4355675501421113e-06, + "loss": 0.6143, + "step": 43993 + }, + { + "epoch": 1.13, + "learning_rate": 1.4355426422489645e-06, + "loss": 0.6128, + "step": 43994 + }, + { + "epoch": 1.13, + "learning_rate": 1.4355177340223426e-06, + "loss": 0.7012, + "step": 43995 + }, + { + "epoch": 1.13, + "learning_rate": 1.435492825462265e-06, + "loss": 0.5085, + "step": 43996 + }, + { + "epoch": 1.13, + "learning_rate": 1.4354679165687504e-06, + "loss": 0.6543, + "step": 43997 + }, + { + "epoch": 1.13, + "learning_rate": 1.4354430073418183e-06, + "loss": 0.6229, + "step": 43998 + }, + { + "epoch": 1.13, + "learning_rate": 1.4354180977814872e-06, + "loss": 0.6577, + "step": 43999 + }, + { + "epoch": 1.13, + "learning_rate": 1.4353931878877767e-06, + "loss": 0.6982, + "step": 44000 + }, + { + "epoch": 1.13, + "learning_rate": 1.4353682776607055e-06, + "loss": 0.8232, + "step": 44001 + }, + { + "epoch": 1.13, + "learning_rate": 1.435343367100293e-06, + "loss": 0.6748, + "step": 44002 + }, + { + "epoch": 1.13, + "learning_rate": 1.4353184562065582e-06, + "loss": 0.7129, + "step": 44003 + }, + { + "epoch": 1.13, + "learning_rate": 1.4352935449795198e-06, + "loss": 0.6094, + "step": 44004 + }, + { + "epoch": 1.13, + "learning_rate": 1.4352686334191973e-06, + "loss": 0.5919, + "step": 44005 + }, + { + "epoch": 1.13, + "learning_rate": 1.4352437215256095e-06, + "loss": 0.6787, + "step": 44006 + }, + { + "epoch": 1.13, + "learning_rate": 1.4352188092987756e-06, + "loss": 0.6611, + "step": 44007 + }, + { + "epoch": 1.13, + "learning_rate": 1.435193896738715e-06, + "loss": 0.6768, + "step": 44008 + }, + { + "epoch": 1.13, + "learning_rate": 1.435168983845446e-06, + "loss": 0.6895, + "step": 44009 + }, + { + "epoch": 1.13, + "learning_rate": 1.4351440706189884e-06, + "loss": 0.7578, + "step": 44010 + }, + { + "epoch": 1.13, + "learning_rate": 1.4351191570593607e-06, + "loss": 0.6313, + "step": 44011 + }, + { + "epoch": 1.13, + "learning_rate": 1.4350942431665824e-06, + "loss": 0.6118, + "step": 44012 + }, + { + "epoch": 1.13, + "learning_rate": 1.4350693289406726e-06, + "loss": 0.5435, + "step": 44013 + }, + { + "epoch": 1.13, + "learning_rate": 1.43504441438165e-06, + "loss": 0.6455, + "step": 44014 + }, + { + "epoch": 1.13, + "learning_rate": 1.4350194994895341e-06, + "loss": 0.6055, + "step": 44015 + }, + { + "epoch": 1.13, + "learning_rate": 1.4349945842643436e-06, + "loss": 0.7119, + "step": 44016 + }, + { + "epoch": 1.13, + "learning_rate": 1.434969668706098e-06, + "loss": 0.7793, + "step": 44017 + }, + { + "epoch": 1.13, + "learning_rate": 1.434944752814816e-06, + "loss": 0.792, + "step": 44018 + }, + { + "epoch": 1.13, + "learning_rate": 1.4349198365905166e-06, + "loss": 0.4829, + "step": 44019 + }, + { + "epoch": 1.13, + "learning_rate": 1.4348949200332192e-06, + "loss": 0.7441, + "step": 44020 + }, + { + "epoch": 1.13, + "learning_rate": 1.4348700031429429e-06, + "loss": 0.835, + "step": 44021 + }, + { + "epoch": 1.13, + "learning_rate": 1.4348450859197062e-06, + "loss": 0.7471, + "step": 44022 + }, + { + "epoch": 1.13, + "learning_rate": 1.4348201683635295e-06, + "loss": 0.8716, + "step": 44023 + }, + { + "epoch": 1.13, + "learning_rate": 1.4347952504744303e-06, + "loss": 0.7568, + "step": 44024 + }, + { + "epoch": 1.13, + "learning_rate": 1.4347703322524285e-06, + "loss": 0.6826, + "step": 44025 + }, + { + "epoch": 1.13, + "learning_rate": 1.4347454136975427e-06, + "loss": 0.585, + "step": 44026 + }, + { + "epoch": 1.13, + "learning_rate": 1.434720494809793e-06, + "loss": 0.6729, + "step": 44027 + }, + { + "epoch": 1.13, + "learning_rate": 1.4346955755891973e-06, + "loss": 0.4553, + "step": 44028 + }, + { + "epoch": 1.13, + "learning_rate": 1.4346706560357756e-06, + "loss": 0.7861, + "step": 44029 + }, + { + "epoch": 1.13, + "learning_rate": 1.434645736149546e-06, + "loss": 0.7578, + "step": 44030 + }, + { + "epoch": 1.13, + "learning_rate": 1.4346208159305286e-06, + "loss": 0.7402, + "step": 44031 + }, + { + "epoch": 1.13, + "learning_rate": 1.434595895378742e-06, + "loss": 0.6006, + "step": 44032 + }, + { + "epoch": 1.13, + "learning_rate": 1.4345709744942051e-06, + "loss": 0.4878, + "step": 44033 + }, + { + "epoch": 1.13, + "learning_rate": 1.4345460532769375e-06, + "loss": 0.7412, + "step": 44034 + }, + { + "epoch": 1.13, + "learning_rate": 1.4345211317269579e-06, + "loss": 0.6465, + "step": 44035 + }, + { + "epoch": 1.13, + "learning_rate": 1.434496209844285e-06, + "loss": 0.6377, + "step": 44036 + }, + { + "epoch": 1.13, + "learning_rate": 1.4344712876289386e-06, + "loss": 0.6836, + "step": 44037 + }, + { + "epoch": 1.13, + "learning_rate": 1.4344463650809377e-06, + "loss": 0.7607, + "step": 44038 + }, + { + "epoch": 1.13, + "learning_rate": 1.4344214422003009e-06, + "loss": 0.6416, + "step": 44039 + }, + { + "epoch": 1.13, + "learning_rate": 1.434396518987048e-06, + "loss": 0.7559, + "step": 44040 + }, + { + "epoch": 1.13, + "learning_rate": 1.4343715954411972e-06, + "loss": 0.6792, + "step": 44041 + }, + { + "epoch": 1.13, + "learning_rate": 1.434346671562768e-06, + "loss": 0.7427, + "step": 44042 + }, + { + "epoch": 1.13, + "learning_rate": 1.4343217473517802e-06, + "loss": 0.5381, + "step": 44043 + }, + { + "epoch": 1.13, + "learning_rate": 1.4342968228082516e-06, + "loss": 0.418, + "step": 44044 + }, + { + "epoch": 1.13, + "learning_rate": 1.434271897932202e-06, + "loss": 0.6445, + "step": 44045 + }, + { + "epoch": 1.13, + "learning_rate": 1.4342469727236506e-06, + "loss": 0.5198, + "step": 44046 + }, + { + "epoch": 1.13, + "learning_rate": 1.4342220471826159e-06, + "loss": 0.7783, + "step": 44047 + }, + { + "epoch": 1.13, + "learning_rate": 1.4341971213091177e-06, + "loss": 0.5786, + "step": 44048 + }, + { + "epoch": 1.13, + "learning_rate": 1.4341721951031745e-06, + "loss": 0.7451, + "step": 44049 + }, + { + "epoch": 1.13, + "learning_rate": 1.4341472685648057e-06, + "loss": 0.7173, + "step": 44050 + }, + { + "epoch": 1.13, + "learning_rate": 1.4341223416940302e-06, + "loss": 0.4885, + "step": 44051 + }, + { + "epoch": 1.13, + "learning_rate": 1.4340974144908673e-06, + "loss": 0.7339, + "step": 44052 + }, + { + "epoch": 1.13, + "learning_rate": 1.434072486955336e-06, + "loss": 0.7539, + "step": 44053 + }, + { + "epoch": 1.13, + "learning_rate": 1.4340475590874555e-06, + "loss": 0.6323, + "step": 44054 + }, + { + "epoch": 1.13, + "learning_rate": 1.4340226308872442e-06, + "loss": 0.624, + "step": 44055 + }, + { + "epoch": 1.13, + "learning_rate": 1.4339977023547222e-06, + "loss": 0.709, + "step": 44056 + }, + { + "epoch": 1.13, + "learning_rate": 1.433972773489908e-06, + "loss": 0.5669, + "step": 44057 + }, + { + "epoch": 1.13, + "learning_rate": 1.4339478442928208e-06, + "loss": 0.5742, + "step": 44058 + }, + { + "epoch": 1.13, + "learning_rate": 1.4339229147634798e-06, + "loss": 0.6367, + "step": 44059 + }, + { + "epoch": 1.13, + "learning_rate": 1.4338979849019036e-06, + "loss": 0.6655, + "step": 44060 + }, + { + "epoch": 1.13, + "learning_rate": 1.433873054708112e-06, + "loss": 0.52, + "step": 44061 + }, + { + "epoch": 1.13, + "learning_rate": 1.4338481241821233e-06, + "loss": 0.5085, + "step": 44062 + }, + { + "epoch": 1.13, + "learning_rate": 1.433823193323958e-06, + "loss": 0.5037, + "step": 44063 + }, + { + "epoch": 1.13, + "learning_rate": 1.4337982621336334e-06, + "loss": 0.3794, + "step": 44064 + }, + { + "epoch": 1.13, + "learning_rate": 1.4337733306111696e-06, + "loss": 0.6201, + "step": 44065 + }, + { + "epoch": 1.13, + "learning_rate": 1.4337483987565854e-06, + "loss": 0.4041, + "step": 44066 + }, + { + "epoch": 1.13, + "learning_rate": 1.4337234665699002e-06, + "loss": 0.8418, + "step": 44067 + }, + { + "epoch": 1.13, + "learning_rate": 1.433698534051133e-06, + "loss": 0.7197, + "step": 44068 + }, + { + "epoch": 1.13, + "learning_rate": 1.4336736012003025e-06, + "loss": 0.584, + "step": 44069 + }, + { + "epoch": 1.13, + "learning_rate": 1.4336486680174282e-06, + "loss": 0.811, + "step": 44070 + }, + { + "epoch": 1.13, + "learning_rate": 1.433623734502529e-06, + "loss": 0.583, + "step": 44071 + }, + { + "epoch": 1.13, + "learning_rate": 1.4335988006556238e-06, + "loss": 0.3262, + "step": 44072 + }, + { + "epoch": 1.13, + "learning_rate": 1.4335738664767328e-06, + "loss": 0.6445, + "step": 44073 + }, + { + "epoch": 1.13, + "learning_rate": 1.4335489319658734e-06, + "loss": 0.5625, + "step": 44074 + }, + { + "epoch": 1.13, + "learning_rate": 1.4335239971230659e-06, + "loss": 0.6206, + "step": 44075 + }, + { + "epoch": 1.13, + "learning_rate": 1.4334990619483288e-06, + "loss": 0.4939, + "step": 44076 + }, + { + "epoch": 1.13, + "learning_rate": 1.4334741264416814e-06, + "loss": 0.6514, + "step": 44077 + }, + { + "epoch": 1.13, + "learning_rate": 1.433449190603143e-06, + "loss": 0.6025, + "step": 44078 + }, + { + "epoch": 1.13, + "learning_rate": 1.4334242544327322e-06, + "loss": 0.7266, + "step": 44079 + }, + { + "epoch": 1.13, + "learning_rate": 1.4333993179304685e-06, + "loss": 0.7617, + "step": 44080 + }, + { + "epoch": 1.13, + "learning_rate": 1.433374381096371e-06, + "loss": 0.5259, + "step": 44081 + }, + { + "epoch": 1.13, + "learning_rate": 1.4333494439304583e-06, + "loss": 0.6567, + "step": 44082 + }, + { + "epoch": 1.13, + "learning_rate": 1.4333245064327503e-06, + "loss": 0.7783, + "step": 44083 + }, + { + "epoch": 1.13, + "learning_rate": 1.4332995686032654e-06, + "loss": 0.7787, + "step": 44084 + }, + { + "epoch": 1.13, + "learning_rate": 1.4332746304420229e-06, + "loss": 0.6958, + "step": 44085 + }, + { + "epoch": 1.13, + "learning_rate": 1.433249691949042e-06, + "loss": 0.7295, + "step": 44086 + }, + { + "epoch": 1.13, + "learning_rate": 1.4332247531243417e-06, + "loss": 0.7451, + "step": 44087 + }, + { + "epoch": 1.13, + "learning_rate": 1.4331998139679416e-06, + "loss": 0.5317, + "step": 44088 + }, + { + "epoch": 1.13, + "learning_rate": 1.4331748744798596e-06, + "loss": 0.5057, + "step": 44089 + }, + { + "epoch": 1.13, + "learning_rate": 1.433149934660116e-06, + "loss": 0.6514, + "step": 44090 + }, + { + "epoch": 1.13, + "learning_rate": 1.4331249945087292e-06, + "loss": 0.8447, + "step": 44091 + }, + { + "epoch": 1.13, + "learning_rate": 1.4331000540257185e-06, + "loss": 0.6553, + "step": 44092 + }, + { + "epoch": 1.13, + "learning_rate": 1.4330751132111032e-06, + "loss": 0.6987, + "step": 44093 + }, + { + "epoch": 1.13, + "learning_rate": 1.4330501720649022e-06, + "loss": 0.5635, + "step": 44094 + }, + { + "epoch": 1.13, + "learning_rate": 1.4330252305871341e-06, + "loss": 0.6123, + "step": 44095 + }, + { + "epoch": 1.13, + "learning_rate": 1.433000288777819e-06, + "loss": 0.7109, + "step": 44096 + }, + { + "epoch": 1.13, + "learning_rate": 1.4329753466369751e-06, + "loss": 0.6855, + "step": 44097 + }, + { + "epoch": 1.13, + "learning_rate": 1.4329504041646225e-06, + "loss": 0.7168, + "step": 44098 + }, + { + "epoch": 1.13, + "learning_rate": 1.4329254613607793e-06, + "loss": 0.6079, + "step": 44099 + }, + { + "epoch": 1.13, + "learning_rate": 1.432900518225465e-06, + "loss": 0.5303, + "step": 44100 + }, + { + "epoch": 1.13, + "learning_rate": 1.4328755747586984e-06, + "loss": 0.6382, + "step": 44101 + }, + { + "epoch": 1.13, + "learning_rate": 1.4328506309604993e-06, + "loss": 0.8174, + "step": 44102 + }, + { + "epoch": 1.13, + "learning_rate": 1.4328256868308862e-06, + "loss": 0.7383, + "step": 44103 + }, + { + "epoch": 1.13, + "learning_rate": 1.4328007423698783e-06, + "loss": 0.6455, + "step": 44104 + }, + { + "epoch": 1.13, + "learning_rate": 1.432775797577495e-06, + "loss": 0.8096, + "step": 44105 + }, + { + "epoch": 1.13, + "learning_rate": 1.4327508524537548e-06, + "loss": 0.8574, + "step": 44106 + }, + { + "epoch": 1.13, + "learning_rate": 1.4327259069986775e-06, + "loss": 0.7061, + "step": 44107 + }, + { + "epoch": 1.13, + "learning_rate": 1.4327009612122818e-06, + "loss": 0.709, + "step": 44108 + }, + { + "epoch": 1.13, + "learning_rate": 1.4326760150945869e-06, + "loss": 0.7979, + "step": 44109 + }, + { + "epoch": 1.13, + "learning_rate": 1.4326510686456117e-06, + "loss": 0.7607, + "step": 44110 + }, + { + "epoch": 1.13, + "learning_rate": 1.4326261218653757e-06, + "loss": 0.6523, + "step": 44111 + }, + { + "epoch": 1.13, + "learning_rate": 1.4326011747538975e-06, + "loss": 0.7422, + "step": 44112 + }, + { + "epoch": 1.13, + "learning_rate": 1.432576227311197e-06, + "loss": 0.6992, + "step": 44113 + }, + { + "epoch": 1.13, + "learning_rate": 1.432551279537292e-06, + "loss": 0.6387, + "step": 44114 + }, + { + "epoch": 1.13, + "learning_rate": 1.4325263314322032e-06, + "loss": 0.5723, + "step": 44115 + }, + { + "epoch": 1.13, + "learning_rate": 1.432501382995948e-06, + "loss": 0.6377, + "step": 44116 + }, + { + "epoch": 1.13, + "learning_rate": 1.4324764342285472e-06, + "loss": 0.6631, + "step": 44117 + }, + { + "epoch": 1.13, + "learning_rate": 1.4324514851300186e-06, + "loss": 0.7148, + "step": 44118 + }, + { + "epoch": 1.13, + "learning_rate": 1.432426535700382e-06, + "loss": 0.7998, + "step": 44119 + }, + { + "epoch": 1.13, + "learning_rate": 1.432401585939656e-06, + "loss": 0.6577, + "step": 44120 + }, + { + "epoch": 1.13, + "learning_rate": 1.4323766358478602e-06, + "loss": 0.7285, + "step": 44121 + }, + { + "epoch": 1.13, + "learning_rate": 1.4323516854250132e-06, + "loss": 0.7617, + "step": 44122 + }, + { + "epoch": 1.13, + "learning_rate": 1.432326734671135e-06, + "loss": 0.5635, + "step": 44123 + }, + { + "epoch": 1.13, + "learning_rate": 1.4323017835862436e-06, + "loss": 0.5353, + "step": 44124 + }, + { + "epoch": 1.13, + "learning_rate": 1.432276832170359e-06, + "loss": 0.7354, + "step": 44125 + }, + { + "epoch": 1.13, + "learning_rate": 1.4322518804234993e-06, + "loss": 0.627, + "step": 44126 + }, + { + "epoch": 1.13, + "learning_rate": 1.4322269283456846e-06, + "loss": 0.8125, + "step": 44127 + }, + { + "epoch": 1.13, + "learning_rate": 1.432201975936934e-06, + "loss": 0.6621, + "step": 44128 + }, + { + "epoch": 1.13, + "learning_rate": 1.4321770231972655e-06, + "loss": 0.4941, + "step": 44129 + }, + { + "epoch": 1.13, + "learning_rate": 1.4321520701266994e-06, + "loss": 0.834, + "step": 44130 + }, + { + "epoch": 1.13, + "learning_rate": 1.4321271167252537e-06, + "loss": 0.7529, + "step": 44131 + }, + { + "epoch": 1.13, + "learning_rate": 1.4321021629929488e-06, + "loss": 0.5182, + "step": 44132 + }, + { + "epoch": 1.13, + "learning_rate": 1.432077208929803e-06, + "loss": 0.6698, + "step": 44133 + }, + { + "epoch": 1.13, + "learning_rate": 1.4320522545358356e-06, + "loss": 0.793, + "step": 44134 + }, + { + "epoch": 1.13, + "learning_rate": 1.4320272998110654e-06, + "loss": 0.6748, + "step": 44135 + }, + { + "epoch": 1.13, + "learning_rate": 1.4320023447555121e-06, + "loss": 0.6738, + "step": 44136 + }, + { + "epoch": 1.13, + "learning_rate": 1.431977389369194e-06, + "loss": 0.5967, + "step": 44137 + }, + { + "epoch": 1.13, + "learning_rate": 1.4319524336521315e-06, + "loss": 0.5518, + "step": 44138 + }, + { + "epoch": 1.13, + "learning_rate": 1.431927477604342e-06, + "loss": 0.5586, + "step": 44139 + }, + { + "epoch": 1.13, + "learning_rate": 1.4319025212258458e-06, + "loss": 0.6465, + "step": 44140 + }, + { + "epoch": 1.13, + "learning_rate": 1.4318775645166617e-06, + "loss": 0.6133, + "step": 44141 + }, + { + "epoch": 1.13, + "learning_rate": 1.431852607476809e-06, + "loss": 0.6689, + "step": 44142 + }, + { + "epoch": 1.13, + "learning_rate": 1.4318276501063062e-06, + "loss": 0.6001, + "step": 44143 + }, + { + "epoch": 1.13, + "learning_rate": 1.4318026924051734e-06, + "loss": 0.5176, + "step": 44144 + }, + { + "epoch": 1.13, + "learning_rate": 1.4317777343734286e-06, + "loss": 0.6455, + "step": 44145 + }, + { + "epoch": 1.13, + "learning_rate": 1.4317527760110917e-06, + "loss": 0.6987, + "step": 44146 + }, + { + "epoch": 1.13, + "learning_rate": 1.4317278173181814e-06, + "loss": 0.6777, + "step": 44147 + }, + { + "epoch": 1.13, + "learning_rate": 1.431702858294717e-06, + "loss": 0.6479, + "step": 44148 + }, + { + "epoch": 1.13, + "learning_rate": 1.4316778989407176e-06, + "loss": 0.6328, + "step": 44149 + }, + { + "epoch": 1.13, + "learning_rate": 1.4316529392562023e-06, + "loss": 0.7148, + "step": 44150 + }, + { + "epoch": 1.13, + "learning_rate": 1.4316279792411902e-06, + "loss": 0.6675, + "step": 44151 + }, + { + "epoch": 1.13, + "learning_rate": 1.4316030188957004e-06, + "loss": 0.7754, + "step": 44152 + }, + { + "epoch": 1.13, + "learning_rate": 1.4315780582197521e-06, + "loss": 0.5217, + "step": 44153 + }, + { + "epoch": 1.13, + "learning_rate": 1.4315530972133642e-06, + "loss": 0.6138, + "step": 44154 + }, + { + "epoch": 1.13, + "learning_rate": 1.4315281358765561e-06, + "loss": 0.5688, + "step": 44155 + }, + { + "epoch": 1.13, + "learning_rate": 1.4315031742093464e-06, + "loss": 0.5968, + "step": 44156 + }, + { + "epoch": 1.13, + "learning_rate": 1.431478212211755e-06, + "loss": 0.6475, + "step": 44157 + }, + { + "epoch": 1.13, + "learning_rate": 1.4314532498838004e-06, + "loss": 0.605, + "step": 44158 + }, + { + "epoch": 1.13, + "learning_rate": 1.431428287225502e-06, + "loss": 0.5669, + "step": 44159 + }, + { + "epoch": 1.13, + "learning_rate": 1.4314033242368784e-06, + "loss": 0.7412, + "step": 44160 + }, + { + "epoch": 1.13, + "learning_rate": 1.4313783609179493e-06, + "loss": 0.5176, + "step": 44161 + }, + { + "epoch": 1.13, + "learning_rate": 1.4313533972687337e-06, + "loss": 0.7646, + "step": 44162 + }, + { + "epoch": 1.13, + "learning_rate": 1.4313284332892508e-06, + "loss": 0.9551, + "step": 44163 + }, + { + "epoch": 1.13, + "learning_rate": 1.4313034689795193e-06, + "loss": 0.697, + "step": 44164 + }, + { + "epoch": 1.13, + "learning_rate": 1.4312785043395587e-06, + "loss": 0.5043, + "step": 44165 + }, + { + "epoch": 1.13, + "learning_rate": 1.4312535393693876e-06, + "loss": 0.6445, + "step": 44166 + }, + { + "epoch": 1.13, + "learning_rate": 1.431228574069026e-06, + "loss": 0.6807, + "step": 44167 + }, + { + "epoch": 1.13, + "learning_rate": 1.4312036084384923e-06, + "loss": 0.2842, + "step": 44168 + }, + { + "epoch": 1.13, + "learning_rate": 1.4311786424778058e-06, + "loss": 0.5378, + "step": 44169 + }, + { + "epoch": 1.13, + "learning_rate": 1.4311536761869857e-06, + "loss": 0.5957, + "step": 44170 + }, + { + "epoch": 1.13, + "learning_rate": 1.4311287095660512e-06, + "loss": 0.7461, + "step": 44171 + }, + { + "epoch": 1.13, + "learning_rate": 1.4311037426150213e-06, + "loss": 0.6143, + "step": 44172 + }, + { + "epoch": 1.13, + "learning_rate": 1.4310787753339147e-06, + "loss": 0.707, + "step": 44173 + }, + { + "epoch": 1.13, + "learning_rate": 1.4310538077227512e-06, + "loss": 0.7783, + "step": 44174 + }, + { + "epoch": 1.13, + "learning_rate": 1.4310288397815493e-06, + "loss": 0.7217, + "step": 44175 + }, + { + "epoch": 1.13, + "learning_rate": 1.4310038715103288e-06, + "loss": 0.7002, + "step": 44176 + }, + { + "epoch": 1.13, + "learning_rate": 1.4309789029091085e-06, + "loss": 0.5928, + "step": 44177 + }, + { + "epoch": 1.13, + "learning_rate": 1.4309539339779072e-06, + "loss": 0.8125, + "step": 44178 + }, + { + "epoch": 1.13, + "learning_rate": 1.4309289647167442e-06, + "loss": 0.6064, + "step": 44179 + }, + { + "epoch": 1.13, + "learning_rate": 1.430903995125639e-06, + "loss": 0.5884, + "step": 44180 + }, + { + "epoch": 1.13, + "learning_rate": 1.43087902520461e-06, + "loss": 0.5439, + "step": 44181 + }, + { + "epoch": 1.13, + "learning_rate": 1.4308540549536775e-06, + "loss": 0.666, + "step": 44182 + }, + { + "epoch": 1.13, + "learning_rate": 1.4308290843728592e-06, + "loss": 0.6826, + "step": 44183 + }, + { + "epoch": 1.13, + "learning_rate": 1.4308041134621752e-06, + "loss": 0.7305, + "step": 44184 + }, + { + "epoch": 1.13, + "learning_rate": 1.430779142221644e-06, + "loss": 0.7041, + "step": 44185 + }, + { + "epoch": 1.13, + "learning_rate": 1.4307541706512854e-06, + "loss": 0.6328, + "step": 44186 + }, + { + "epoch": 1.13, + "learning_rate": 1.4307291987511179e-06, + "loss": 0.5923, + "step": 44187 + }, + { + "epoch": 1.13, + "learning_rate": 1.430704226521161e-06, + "loss": 0.6182, + "step": 44188 + }, + { + "epoch": 1.13, + "learning_rate": 1.4306792539614334e-06, + "loss": 0.6797, + "step": 44189 + }, + { + "epoch": 1.13, + "learning_rate": 1.4306542810719546e-06, + "loss": 0.7627, + "step": 44190 + }, + { + "epoch": 1.13, + "learning_rate": 1.4306293078527437e-06, + "loss": 0.499, + "step": 44191 + }, + { + "epoch": 1.13, + "learning_rate": 1.4306043343038199e-06, + "loss": 0.624, + "step": 44192 + }, + { + "epoch": 1.13, + "learning_rate": 1.4305793604252019e-06, + "loss": 0.6646, + "step": 44193 + }, + { + "epoch": 1.13, + "learning_rate": 1.4305543862169089e-06, + "loss": 0.5522, + "step": 44194 + }, + { + "epoch": 1.13, + "learning_rate": 1.4305294116789608e-06, + "loss": 0.4971, + "step": 44195 + }, + { + "epoch": 1.13, + "learning_rate": 1.4305044368113757e-06, + "loss": 0.7207, + "step": 44196 + }, + { + "epoch": 1.13, + "learning_rate": 1.4304794616141735e-06, + "loss": 0.6177, + "step": 44197 + }, + { + "epoch": 1.13, + "learning_rate": 1.4304544860873727e-06, + "loss": 0.6543, + "step": 44198 + }, + { + "epoch": 1.13, + "learning_rate": 1.4304295102309927e-06, + "loss": 0.7178, + "step": 44199 + }, + { + "epoch": 1.13, + "learning_rate": 1.4304045340450524e-06, + "loss": 0.5107, + "step": 44200 + }, + { + "epoch": 1.13, + "learning_rate": 1.4303795575295713e-06, + "loss": 0.7275, + "step": 44201 + }, + { + "epoch": 1.13, + "learning_rate": 1.4303545806845687e-06, + "loss": 0.6523, + "step": 44202 + }, + { + "epoch": 1.13, + "learning_rate": 1.4303296035100631e-06, + "loss": 0.7314, + "step": 44203 + }, + { + "epoch": 1.13, + "learning_rate": 1.4303046260060738e-06, + "loss": 0.5933, + "step": 44204 + }, + { + "epoch": 1.13, + "learning_rate": 1.4302796481726202e-06, + "loss": 0.6821, + "step": 44205 + }, + { + "epoch": 1.13, + "learning_rate": 1.4302546700097212e-06, + "loss": 0.7188, + "step": 44206 + }, + { + "epoch": 1.13, + "learning_rate": 1.4302296915173962e-06, + "loss": 0.7734, + "step": 44207 + }, + { + "epoch": 1.13, + "learning_rate": 1.4302047126956637e-06, + "loss": 0.5981, + "step": 44208 + }, + { + "epoch": 1.13, + "learning_rate": 1.4301797335445437e-06, + "loss": 0.5488, + "step": 44209 + }, + { + "epoch": 1.13, + "learning_rate": 1.4301547540640544e-06, + "loss": 0.6611, + "step": 44210 + }, + { + "epoch": 1.13, + "learning_rate": 1.4301297742542156e-06, + "loss": 0.709, + "step": 44211 + }, + { + "epoch": 1.13, + "learning_rate": 1.4301047941150465e-06, + "loss": 0.8447, + "step": 44212 + }, + { + "epoch": 1.13, + "learning_rate": 1.4300798136465653e-06, + "loss": 0.6807, + "step": 44213 + }, + { + "epoch": 1.13, + "learning_rate": 1.4300548328487922e-06, + "loss": 0.7197, + "step": 44214 + }, + { + "epoch": 1.13, + "learning_rate": 1.4300298517217458e-06, + "loss": 0.731, + "step": 44215 + }, + { + "epoch": 1.13, + "learning_rate": 1.4300048702654453e-06, + "loss": 0.7051, + "step": 44216 + }, + { + "epoch": 1.13, + "learning_rate": 1.42997988847991e-06, + "loss": 0.5603, + "step": 44217 + }, + { + "epoch": 1.13, + "learning_rate": 1.4299549063651586e-06, + "loss": 0.5225, + "step": 44218 + }, + { + "epoch": 1.13, + "learning_rate": 1.4299299239212105e-06, + "loss": 0.6768, + "step": 44219 + }, + { + "epoch": 1.13, + "learning_rate": 1.429904941148085e-06, + "loss": 0.5557, + "step": 44220 + }, + { + "epoch": 1.13, + "learning_rate": 1.4298799580458008e-06, + "loss": 0.624, + "step": 44221 + }, + { + "epoch": 1.13, + "learning_rate": 1.4298549746143778e-06, + "loss": 0.5713, + "step": 44222 + }, + { + "epoch": 1.13, + "learning_rate": 1.429829990853834e-06, + "loss": 0.7598, + "step": 44223 + }, + { + "epoch": 1.13, + "learning_rate": 1.4298050067641895e-06, + "loss": 0.6982, + "step": 44224 + }, + { + "epoch": 1.13, + "learning_rate": 1.429780022345463e-06, + "loss": 0.6621, + "step": 44225 + }, + { + "epoch": 1.13, + "learning_rate": 1.4297550375976738e-06, + "loss": 0.6108, + "step": 44226 + }, + { + "epoch": 1.13, + "learning_rate": 1.4297300525208406e-06, + "loss": 0.5669, + "step": 44227 + }, + { + "epoch": 1.13, + "learning_rate": 1.4297050671149834e-06, + "loss": 0.574, + "step": 44228 + }, + { + "epoch": 1.13, + "learning_rate": 1.4296800813801201e-06, + "loss": 0.6611, + "step": 44229 + }, + { + "epoch": 1.13, + "learning_rate": 1.4296550953162712e-06, + "loss": 0.5063, + "step": 44230 + }, + { + "epoch": 1.13, + "learning_rate": 1.4296301089234546e-06, + "loss": 0.5537, + "step": 44231 + }, + { + "epoch": 1.13, + "learning_rate": 1.4296051222016902e-06, + "loss": 0.6982, + "step": 44232 + }, + { + "epoch": 1.13, + "learning_rate": 1.429580135150997e-06, + "loss": 0.834, + "step": 44233 + }, + { + "epoch": 1.13, + "learning_rate": 1.429555147771394e-06, + "loss": 0.605, + "step": 44234 + }, + { + "epoch": 1.13, + "learning_rate": 1.4295301600629004e-06, + "loss": 0.625, + "step": 44235 + }, + { + "epoch": 1.13, + "learning_rate": 1.4295051720255352e-06, + "loss": 0.793, + "step": 44236 + }, + { + "epoch": 1.13, + "learning_rate": 1.4294801836593178e-06, + "loss": 0.6089, + "step": 44237 + }, + { + "epoch": 1.13, + "learning_rate": 1.429455194964267e-06, + "loss": 0.5757, + "step": 44238 + }, + { + "epoch": 1.13, + "learning_rate": 1.4294302059404022e-06, + "loss": 0.5209, + "step": 44239 + }, + { + "epoch": 1.13, + "learning_rate": 1.4294052165877423e-06, + "loss": 0.4795, + "step": 44240 + }, + { + "epoch": 1.13, + "learning_rate": 1.4293802269063067e-06, + "loss": 0.7451, + "step": 44241 + }, + { + "epoch": 1.13, + "learning_rate": 1.4293552368961143e-06, + "loss": 0.7881, + "step": 44242 + }, + { + "epoch": 1.13, + "learning_rate": 1.4293302465571847e-06, + "loss": 0.7373, + "step": 44243 + }, + { + "epoch": 1.13, + "learning_rate": 1.4293052558895361e-06, + "loss": 0.5981, + "step": 44244 + }, + { + "epoch": 1.13, + "learning_rate": 1.4292802648931886e-06, + "loss": 0.7222, + "step": 44245 + }, + { + "epoch": 1.13, + "learning_rate": 1.429255273568161e-06, + "loss": 0.4907, + "step": 44246 + }, + { + "epoch": 1.13, + "learning_rate": 1.429230281914472e-06, + "loss": 0.5269, + "step": 44247 + }, + { + "epoch": 1.13, + "learning_rate": 1.4292052899321414e-06, + "loss": 0.5947, + "step": 44248 + }, + { + "epoch": 1.13, + "learning_rate": 1.4291802976211881e-06, + "loss": 0.7393, + "step": 44249 + }, + { + "epoch": 1.13, + "learning_rate": 1.429155304981631e-06, + "loss": 0.7656, + "step": 44250 + }, + { + "epoch": 1.13, + "learning_rate": 1.4291303120134895e-06, + "loss": 0.6465, + "step": 44251 + }, + { + "epoch": 1.13, + "learning_rate": 1.4291053187167826e-06, + "loss": 0.7012, + "step": 44252 + }, + { + "epoch": 1.13, + "learning_rate": 1.4290803250915296e-06, + "loss": 0.5879, + "step": 44253 + }, + { + "epoch": 1.13, + "learning_rate": 1.4290553311377492e-06, + "loss": 0.7578, + "step": 44254 + }, + { + "epoch": 1.13, + "learning_rate": 1.4290303368554613e-06, + "loss": 0.6455, + "step": 44255 + }, + { + "epoch": 1.13, + "learning_rate": 1.4290053422446842e-06, + "loss": 0.6646, + "step": 44256 + }, + { + "epoch": 1.13, + "learning_rate": 1.4289803473054375e-06, + "loss": 0.6165, + "step": 44257 + }, + { + "epoch": 1.13, + "learning_rate": 1.4289553520377406e-06, + "loss": 0.4331, + "step": 44258 + }, + { + "epoch": 1.13, + "learning_rate": 1.428930356441612e-06, + "loss": 0.54, + "step": 44259 + }, + { + "epoch": 1.13, + "learning_rate": 1.4289053605170714e-06, + "loss": 0.5234, + "step": 44260 + }, + { + "epoch": 1.13, + "learning_rate": 1.4288803642641374e-06, + "loss": 0.5591, + "step": 44261 + }, + { + "epoch": 1.13, + "learning_rate": 1.4288553676828297e-06, + "loss": 0.479, + "step": 44262 + }, + { + "epoch": 1.13, + "learning_rate": 1.4288303707731668e-06, + "loss": 0.4382, + "step": 44263 + }, + { + "epoch": 1.13, + "learning_rate": 1.4288053735351686e-06, + "loss": 0.5406, + "step": 44264 + }, + { + "epoch": 1.13, + "learning_rate": 1.4287803759688535e-06, + "loss": 0.5291, + "step": 44265 + }, + { + "epoch": 1.13, + "learning_rate": 1.4287553780742415e-06, + "loss": 0.7832, + "step": 44266 + }, + { + "epoch": 1.13, + "learning_rate": 1.4287303798513507e-06, + "loss": 0.4524, + "step": 44267 + }, + { + "epoch": 1.13, + "learning_rate": 1.428705381300201e-06, + "loss": 0.8389, + "step": 44268 + }, + { + "epoch": 1.13, + "learning_rate": 1.4286803824208112e-06, + "loss": 0.4666, + "step": 44269 + }, + { + "epoch": 1.13, + "learning_rate": 1.4286553832132008e-06, + "loss": 0.627, + "step": 44270 + }, + { + "epoch": 1.13, + "learning_rate": 1.428630383677388e-06, + "loss": 0.6946, + "step": 44271 + }, + { + "epoch": 1.13, + "learning_rate": 1.4286053838133936e-06, + "loss": 0.792, + "step": 44272 + }, + { + "epoch": 1.13, + "learning_rate": 1.428580383621235e-06, + "loss": 0.5703, + "step": 44273 + }, + { + "epoch": 1.13, + "learning_rate": 1.4285553831009325e-06, + "loss": 0.5352, + "step": 44274 + }, + { + "epoch": 1.13, + "learning_rate": 1.4285303822525046e-06, + "loss": 0.6104, + "step": 44275 + }, + { + "epoch": 1.13, + "learning_rate": 1.428505381075971e-06, + "loss": 0.6709, + "step": 44276 + }, + { + "epoch": 1.13, + "learning_rate": 1.4284803795713502e-06, + "loss": 0.7056, + "step": 44277 + }, + { + "epoch": 1.13, + "learning_rate": 1.4284553777386618e-06, + "loss": 0.6367, + "step": 44278 + }, + { + "epoch": 1.13, + "learning_rate": 1.4284303755779248e-06, + "loss": 0.6094, + "step": 44279 + }, + { + "epoch": 1.13, + "learning_rate": 1.4284053730891583e-06, + "loss": 0.7402, + "step": 44280 + }, + { + "epoch": 1.13, + "learning_rate": 1.4283803702723816e-06, + "loss": 0.6523, + "step": 44281 + }, + { + "epoch": 1.13, + "learning_rate": 1.428355367127614e-06, + "loss": 0.6729, + "step": 44282 + }, + { + "epoch": 1.13, + "learning_rate": 1.428330363654874e-06, + "loss": 0.5771, + "step": 44283 + }, + { + "epoch": 1.14, + "learning_rate": 1.428305359854181e-06, + "loss": 0.8066, + "step": 44284 + }, + { + "epoch": 1.14, + "learning_rate": 1.4282803557255548e-06, + "loss": 0.5801, + "step": 44285 + }, + { + "epoch": 1.14, + "learning_rate": 1.4282553512690137e-06, + "loss": 0.6294, + "step": 44286 + }, + { + "epoch": 1.14, + "learning_rate": 1.4282303464845775e-06, + "loss": 0.644, + "step": 44287 + }, + { + "epoch": 1.14, + "learning_rate": 1.4282053413722646e-06, + "loss": 0.7744, + "step": 44288 + }, + { + "epoch": 1.14, + "learning_rate": 1.4281803359320948e-06, + "loss": 0.5835, + "step": 44289 + }, + { + "epoch": 1.14, + "learning_rate": 1.4281553301640867e-06, + "loss": 0.7656, + "step": 44290 + }, + { + "epoch": 1.14, + "learning_rate": 1.42813032406826e-06, + "loss": 0.6602, + "step": 44291 + }, + { + "epoch": 1.14, + "learning_rate": 1.4281053176446336e-06, + "loss": 0.7793, + "step": 44292 + }, + { + "epoch": 1.14, + "learning_rate": 1.4280803108932266e-06, + "loss": 0.6028, + "step": 44293 + }, + { + "epoch": 1.14, + "learning_rate": 1.4280553038140583e-06, + "loss": 0.834, + "step": 44294 + }, + { + "epoch": 1.14, + "learning_rate": 1.4280302964071475e-06, + "loss": 0.5098, + "step": 44295 + }, + { + "epoch": 1.14, + "learning_rate": 1.4280052886725137e-06, + "loss": 0.6533, + "step": 44296 + }, + { + "epoch": 1.14, + "learning_rate": 1.4279802806101762e-06, + "loss": 0.6523, + "step": 44297 + }, + { + "epoch": 1.14, + "learning_rate": 1.4279552722201535e-06, + "loss": 0.8213, + "step": 44298 + }, + { + "epoch": 1.14, + "learning_rate": 1.4279302635024656e-06, + "loss": 0.4563, + "step": 44299 + }, + { + "epoch": 1.14, + "learning_rate": 1.4279052544571305e-06, + "loss": 0.5405, + "step": 44300 + }, + { + "epoch": 1.14, + "learning_rate": 1.4278802450841685e-06, + "loss": 0.5757, + "step": 44301 + }, + { + "epoch": 1.14, + "learning_rate": 1.427855235383598e-06, + "loss": 0.6758, + "step": 44302 + }, + { + "epoch": 1.14, + "learning_rate": 1.4278302253554385e-06, + "loss": 0.4941, + "step": 44303 + }, + { + "epoch": 1.14, + "learning_rate": 1.4278052149997093e-06, + "loss": 0.4082, + "step": 44304 + }, + { + "epoch": 1.14, + "learning_rate": 1.427780204316429e-06, + "loss": 0.5508, + "step": 44305 + }, + { + "epoch": 1.14, + "learning_rate": 1.4277551933056172e-06, + "loss": 0.9014, + "step": 44306 + }, + { + "epoch": 1.14, + "learning_rate": 1.4277301819672928e-06, + "loss": 0.6611, + "step": 44307 + }, + { + "epoch": 1.14, + "learning_rate": 1.4277051703014754e-06, + "loss": 0.7183, + "step": 44308 + }, + { + "epoch": 1.14, + "learning_rate": 1.4276801583081835e-06, + "loss": 0.6128, + "step": 44309 + }, + { + "epoch": 1.14, + "learning_rate": 1.4276551459874366e-06, + "loss": 0.5083, + "step": 44310 + }, + { + "epoch": 1.14, + "learning_rate": 1.4276301333392537e-06, + "loss": 0.6167, + "step": 44311 + }, + { + "epoch": 1.14, + "learning_rate": 1.4276051203636548e-06, + "loss": 0.5935, + "step": 44312 + }, + { + "epoch": 1.14, + "learning_rate": 1.4275801070606576e-06, + "loss": 0.4456, + "step": 44313 + }, + { + "epoch": 1.14, + "learning_rate": 1.427555093430282e-06, + "loss": 0.5576, + "step": 44314 + }, + { + "epoch": 1.14, + "learning_rate": 1.4275300794725472e-06, + "loss": 0.6602, + "step": 44315 + }, + { + "epoch": 1.14, + "learning_rate": 1.4275050651874725e-06, + "loss": 0.7266, + "step": 44316 + }, + { + "epoch": 1.14, + "learning_rate": 1.4274800505750769e-06, + "loss": 0.7021, + "step": 44317 + }, + { + "epoch": 1.14, + "learning_rate": 1.4274550356353793e-06, + "loss": 0.6328, + "step": 44318 + }, + { + "epoch": 1.14, + "learning_rate": 1.4274300203683987e-06, + "loss": 0.6147, + "step": 44319 + }, + { + "epoch": 1.14, + "learning_rate": 1.4274050047741551e-06, + "loss": 0.5063, + "step": 44320 + }, + { + "epoch": 1.14, + "learning_rate": 1.4273799888526665e-06, + "loss": 0.7852, + "step": 44321 + }, + { + "epoch": 1.14, + "learning_rate": 1.4273549726039534e-06, + "loss": 0.707, + "step": 44322 + }, + { + "epoch": 1.14, + "learning_rate": 1.427329956028034e-06, + "loss": 0.8604, + "step": 44323 + }, + { + "epoch": 1.14, + "learning_rate": 1.4273049391249277e-06, + "loss": 0.6592, + "step": 44324 + }, + { + "epoch": 1.14, + "learning_rate": 1.4272799218946533e-06, + "loss": 0.6592, + "step": 44325 + }, + { + "epoch": 1.14, + "learning_rate": 1.427254904337231e-06, + "loss": 0.6279, + "step": 44326 + }, + { + "epoch": 1.14, + "learning_rate": 1.4272298864526788e-06, + "loss": 0.7197, + "step": 44327 + }, + { + "epoch": 1.14, + "learning_rate": 1.4272048682410164e-06, + "loss": 0.728, + "step": 44328 + }, + { + "epoch": 1.14, + "learning_rate": 1.4271798497022629e-06, + "loss": 0.6396, + "step": 44329 + }, + { + "epoch": 1.14, + "learning_rate": 1.4271548308364373e-06, + "loss": 0.603, + "step": 44330 + }, + { + "epoch": 1.14, + "learning_rate": 1.427129811643559e-06, + "loss": 0.6145, + "step": 44331 + }, + { + "epoch": 1.14, + "learning_rate": 1.4271047921236472e-06, + "loss": 0.3169, + "step": 44332 + }, + { + "epoch": 1.14, + "learning_rate": 1.4270797722767208e-06, + "loss": 0.749, + "step": 44333 + }, + { + "epoch": 1.14, + "learning_rate": 1.427054752102799e-06, + "loss": 0.6484, + "step": 44334 + }, + { + "epoch": 1.14, + "learning_rate": 1.427029731601901e-06, + "loss": 0.7871, + "step": 44335 + }, + { + "epoch": 1.14, + "learning_rate": 1.427004710774046e-06, + "loss": 0.4808, + "step": 44336 + }, + { + "epoch": 1.14, + "learning_rate": 1.4269796896192533e-06, + "loss": 0.7134, + "step": 44337 + }, + { + "epoch": 1.14, + "learning_rate": 1.4269546681375416e-06, + "loss": 0.6797, + "step": 44338 + }, + { + "epoch": 1.14, + "learning_rate": 1.4269296463289304e-06, + "loss": 0.4907, + "step": 44339 + }, + { + "epoch": 1.14, + "learning_rate": 1.426904624193439e-06, + "loss": 0.7153, + "step": 44340 + }, + { + "epoch": 1.14, + "learning_rate": 1.426879601731086e-06, + "loss": 0.6611, + "step": 44341 + }, + { + "epoch": 1.14, + "learning_rate": 1.4268545789418914e-06, + "loss": 0.6855, + "step": 44342 + }, + { + "epoch": 1.14, + "learning_rate": 1.4268295558258734e-06, + "loss": 0.8154, + "step": 44343 + }, + { + "epoch": 1.14, + "learning_rate": 1.4268045323830518e-06, + "loss": 0.7305, + "step": 44344 + }, + { + "epoch": 1.14, + "learning_rate": 1.4267795086134459e-06, + "loss": 0.7969, + "step": 44345 + }, + { + "epoch": 1.14, + "learning_rate": 1.4267544845170741e-06, + "loss": 0.8291, + "step": 44346 + }, + { + "epoch": 1.14, + "learning_rate": 1.426729460093956e-06, + "loss": 0.8408, + "step": 44347 + }, + { + "epoch": 1.14, + "learning_rate": 1.426704435344111e-06, + "loss": 0.7334, + "step": 44348 + }, + { + "epoch": 1.14, + "learning_rate": 1.4266794102675581e-06, + "loss": 0.606, + "step": 44349 + }, + { + "epoch": 1.14, + "learning_rate": 1.4266543848643164e-06, + "loss": 0.6943, + "step": 44350 + }, + { + "epoch": 1.14, + "learning_rate": 1.426629359134405e-06, + "loss": 0.626, + "step": 44351 + }, + { + "epoch": 1.14, + "learning_rate": 1.4266043330778431e-06, + "loss": 0.7139, + "step": 44352 + }, + { + "epoch": 1.14, + "learning_rate": 1.4265793066946497e-06, + "loss": 0.5408, + "step": 44353 + }, + { + "epoch": 1.14, + "learning_rate": 1.4265542799848444e-06, + "loss": 0.6455, + "step": 44354 + }, + { + "epoch": 1.14, + "learning_rate": 1.426529252948446e-06, + "loss": 0.5405, + "step": 44355 + }, + { + "epoch": 1.14, + "learning_rate": 1.4265042255854738e-06, + "loss": 0.5854, + "step": 44356 + }, + { + "epoch": 1.14, + "learning_rate": 1.4264791978959468e-06, + "loss": 0.509, + "step": 44357 + }, + { + "epoch": 1.14, + "learning_rate": 1.4264541698798844e-06, + "loss": 0.6328, + "step": 44358 + }, + { + "epoch": 1.14, + "learning_rate": 1.4264291415373056e-06, + "loss": 0.5903, + "step": 44359 + }, + { + "epoch": 1.14, + "learning_rate": 1.4264041128682296e-06, + "loss": 0.5137, + "step": 44360 + }, + { + "epoch": 1.14, + "learning_rate": 1.4263790838726754e-06, + "loss": 0.709, + "step": 44361 + }, + { + "epoch": 1.14, + "learning_rate": 1.426354054550663e-06, + "loss": 0.7246, + "step": 44362 + }, + { + "epoch": 1.14, + "learning_rate": 1.4263290249022104e-06, + "loss": 0.6616, + "step": 44363 + }, + { + "epoch": 1.14, + "learning_rate": 1.4263039949273373e-06, + "loss": 0.7065, + "step": 44364 + }, + { + "epoch": 1.14, + "learning_rate": 1.4262789646260627e-06, + "loss": 0.4616, + "step": 44365 + }, + { + "epoch": 1.14, + "learning_rate": 1.426253933998406e-06, + "loss": 0.7568, + "step": 44366 + }, + { + "epoch": 1.14, + "learning_rate": 1.4262289030443866e-06, + "loss": 0.7295, + "step": 44367 + }, + { + "epoch": 1.14, + "learning_rate": 1.426203871764023e-06, + "loss": 0.4946, + "step": 44368 + }, + { + "epoch": 1.14, + "learning_rate": 1.4261788401573348e-06, + "loss": 0.6875, + "step": 44369 + }, + { + "epoch": 1.14, + "learning_rate": 1.4261538082243409e-06, + "loss": 0.6367, + "step": 44370 + }, + { + "epoch": 1.14, + "learning_rate": 1.4261287759650607e-06, + "loss": 0.6006, + "step": 44371 + }, + { + "epoch": 1.14, + "learning_rate": 1.4261037433795132e-06, + "loss": 0.5771, + "step": 44372 + }, + { + "epoch": 1.14, + "learning_rate": 1.4260787104677179e-06, + "loss": 0.449, + "step": 44373 + }, + { + "epoch": 1.14, + "learning_rate": 1.4260536772296935e-06, + "loss": 0.7656, + "step": 44374 + }, + { + "epoch": 1.14, + "learning_rate": 1.4260286436654596e-06, + "loss": 0.6729, + "step": 44375 + }, + { + "epoch": 1.14, + "learning_rate": 1.426003609775035e-06, + "loss": 0.6484, + "step": 44376 + }, + { + "epoch": 1.14, + "learning_rate": 1.4259785755584392e-06, + "loss": 0.5574, + "step": 44377 + }, + { + "epoch": 1.14, + "learning_rate": 1.4259535410156908e-06, + "loss": 0.7373, + "step": 44378 + }, + { + "epoch": 1.14, + "learning_rate": 1.42592850614681e-06, + "loss": 0.8604, + "step": 44379 + }, + { + "epoch": 1.14, + "learning_rate": 1.4259034709518146e-06, + "loss": 0.7627, + "step": 44380 + }, + { + "epoch": 1.14, + "learning_rate": 1.425878435430725e-06, + "loss": 0.751, + "step": 44381 + }, + { + "epoch": 1.14, + "learning_rate": 1.4258533995835596e-06, + "loss": 0.707, + "step": 44382 + }, + { + "epoch": 1.14, + "learning_rate": 1.4258283634103382e-06, + "loss": 0.5405, + "step": 44383 + }, + { + "epoch": 1.14, + "learning_rate": 1.4258033269110792e-06, + "loss": 0.6279, + "step": 44384 + }, + { + "epoch": 1.14, + "learning_rate": 1.425778290085802e-06, + "loss": 0.4811, + "step": 44385 + }, + { + "epoch": 1.14, + "learning_rate": 1.4257532529345264e-06, + "loss": 0.7725, + "step": 44386 + }, + { + "epoch": 1.14, + "learning_rate": 1.425728215457271e-06, + "loss": 0.7432, + "step": 44387 + }, + { + "epoch": 1.14, + "learning_rate": 1.425703177654055e-06, + "loss": 0.6035, + "step": 44388 + }, + { + "epoch": 1.14, + "learning_rate": 1.4256781395248978e-06, + "loss": 0.8525, + "step": 44389 + }, + { + "epoch": 1.14, + "learning_rate": 1.4256531010698184e-06, + "loss": 0.5005, + "step": 44390 + }, + { + "epoch": 1.14, + "learning_rate": 1.425628062288836e-06, + "loss": 0.6436, + "step": 44391 + }, + { + "epoch": 1.14, + "learning_rate": 1.4256030231819696e-06, + "loss": 0.7959, + "step": 44392 + }, + { + "epoch": 1.14, + "learning_rate": 1.4255779837492386e-06, + "loss": 0.7383, + "step": 44393 + }, + { + "epoch": 1.14, + "learning_rate": 1.4255529439906622e-06, + "loss": 0.6914, + "step": 44394 + }, + { + "epoch": 1.14, + "learning_rate": 1.425527903906259e-06, + "loss": 0.5504, + "step": 44395 + }, + { + "epoch": 1.14, + "learning_rate": 1.425502863496049e-06, + "loss": 0.5854, + "step": 44396 + }, + { + "epoch": 1.14, + "learning_rate": 1.4254778227600515e-06, + "loss": 0.6582, + "step": 44397 + }, + { + "epoch": 1.14, + "learning_rate": 1.4254527816982847e-06, + "loss": 0.6875, + "step": 44398 + }, + { + "epoch": 1.14, + "learning_rate": 1.4254277403107681e-06, + "loss": 0.5049, + "step": 44399 + }, + { + "epoch": 1.14, + "learning_rate": 1.4254026985975214e-06, + "loss": 0.7227, + "step": 44400 + }, + { + "epoch": 1.14, + "learning_rate": 1.4253776565585632e-06, + "loss": 0.5518, + "step": 44401 + }, + { + "epoch": 1.14, + "learning_rate": 1.4253526141939132e-06, + "loss": 0.5903, + "step": 44402 + }, + { + "epoch": 1.14, + "learning_rate": 1.42532757150359e-06, + "loss": 0.468, + "step": 44403 + }, + { + "epoch": 1.14, + "learning_rate": 1.425302528487613e-06, + "loss": 0.4937, + "step": 44404 + }, + { + "epoch": 1.14, + "learning_rate": 1.4252774851460015e-06, + "loss": 0.5916, + "step": 44405 + }, + { + "epoch": 1.14, + "learning_rate": 1.4252524414787745e-06, + "loss": 0.7202, + "step": 44406 + }, + { + "epoch": 1.14, + "learning_rate": 1.4252273974859514e-06, + "loss": 0.7451, + "step": 44407 + }, + { + "epoch": 1.14, + "learning_rate": 1.4252023531675513e-06, + "loss": 0.666, + "step": 44408 + }, + { + "epoch": 1.14, + "learning_rate": 1.425177308523593e-06, + "loss": 0.6367, + "step": 44409 + }, + { + "epoch": 1.14, + "learning_rate": 1.4251522635540962e-06, + "loss": 0.7295, + "step": 44410 + }, + { + "epoch": 1.14, + "learning_rate": 1.4251272182590796e-06, + "loss": 0.5283, + "step": 44411 + }, + { + "epoch": 1.14, + "learning_rate": 1.425102172638563e-06, + "loss": 0.4761, + "step": 44412 + }, + { + "epoch": 1.14, + "learning_rate": 1.4250771266925652e-06, + "loss": 0.6443, + "step": 44413 + }, + { + "epoch": 1.14, + "learning_rate": 1.4250520804211053e-06, + "loss": 0.7588, + "step": 44414 + }, + { + "epoch": 1.14, + "learning_rate": 1.4250270338242023e-06, + "loss": 0.6826, + "step": 44415 + }, + { + "epoch": 1.14, + "learning_rate": 1.425001986901876e-06, + "loss": 0.6943, + "step": 44416 + }, + { + "epoch": 1.14, + "learning_rate": 1.4249769396541451e-06, + "loss": 0.7827, + "step": 44417 + }, + { + "epoch": 1.14, + "learning_rate": 1.4249518920810285e-06, + "loss": 0.9541, + "step": 44418 + }, + { + "epoch": 1.14, + "learning_rate": 1.4249268441825465e-06, + "loss": 0.5547, + "step": 44419 + }, + { + "epoch": 1.14, + "learning_rate": 1.4249017959587172e-06, + "loss": 0.7129, + "step": 44420 + }, + { + "epoch": 1.14, + "learning_rate": 1.42487674740956e-06, + "loss": 0.4912, + "step": 44421 + }, + { + "epoch": 1.14, + "learning_rate": 1.4248516985350945e-06, + "loss": 0.6284, + "step": 44422 + }, + { + "epoch": 1.14, + "learning_rate": 1.4248266493353396e-06, + "loss": 0.6611, + "step": 44423 + }, + { + "epoch": 1.14, + "learning_rate": 1.424801599810314e-06, + "loss": 0.5986, + "step": 44424 + }, + { + "epoch": 1.14, + "learning_rate": 1.4247765499600378e-06, + "loss": 0.7285, + "step": 44425 + }, + { + "epoch": 1.14, + "learning_rate": 1.4247514997845294e-06, + "loss": 0.6416, + "step": 44426 + }, + { + "epoch": 1.14, + "learning_rate": 1.4247264492838088e-06, + "loss": 0.6816, + "step": 44427 + }, + { + "epoch": 1.14, + "learning_rate": 1.4247013984578942e-06, + "loss": 0.7793, + "step": 44428 + }, + { + "epoch": 1.14, + "learning_rate": 1.4246763473068055e-06, + "loss": 0.6934, + "step": 44429 + }, + { + "epoch": 1.14, + "learning_rate": 1.4246512958305615e-06, + "loss": 0.6348, + "step": 44430 + }, + { + "epoch": 1.14, + "learning_rate": 1.4246262440291816e-06, + "loss": 0.7109, + "step": 44431 + }, + { + "epoch": 1.14, + "learning_rate": 1.424601191902685e-06, + "loss": 0.7578, + "step": 44432 + }, + { + "epoch": 1.14, + "learning_rate": 1.4245761394510908e-06, + "loss": 0.75, + "step": 44433 + }, + { + "epoch": 1.14, + "learning_rate": 1.424551086674418e-06, + "loss": 0.5503, + "step": 44434 + }, + { + "epoch": 1.14, + "learning_rate": 1.4245260335726861e-06, + "loss": 0.6016, + "step": 44435 + }, + { + "epoch": 1.14, + "learning_rate": 1.424500980145914e-06, + "loss": 0.4985, + "step": 44436 + }, + { + "epoch": 1.14, + "learning_rate": 1.424475926394121e-06, + "loss": 0.5508, + "step": 44437 + }, + { + "epoch": 1.14, + "learning_rate": 1.4244508723173267e-06, + "loss": 0.6689, + "step": 44438 + }, + { + "epoch": 1.14, + "learning_rate": 1.4244258179155495e-06, + "loss": 0.5837, + "step": 44439 + }, + { + "epoch": 1.14, + "learning_rate": 1.4244007631888091e-06, + "loss": 0.6958, + "step": 44440 + }, + { + "epoch": 1.14, + "learning_rate": 1.4243757081371245e-06, + "loss": 0.6274, + "step": 44441 + }, + { + "epoch": 1.14, + "learning_rate": 1.4243506527605149e-06, + "loss": 0.5225, + "step": 44442 + }, + { + "epoch": 1.14, + "learning_rate": 1.4243255970589995e-06, + "loss": 0.624, + "step": 44443 + }, + { + "epoch": 1.14, + "learning_rate": 1.4243005410325977e-06, + "loss": 0.4739, + "step": 44444 + }, + { + "epoch": 1.14, + "learning_rate": 1.4242754846813282e-06, + "loss": 0.6191, + "step": 44445 + }, + { + "epoch": 1.14, + "learning_rate": 1.4242504280052108e-06, + "loss": 0.6353, + "step": 44446 + }, + { + "epoch": 1.14, + "learning_rate": 1.4242253710042643e-06, + "loss": 0.4824, + "step": 44447 + }, + { + "epoch": 1.14, + "learning_rate": 1.4242003136785077e-06, + "loss": 0.709, + "step": 44448 + }, + { + "epoch": 1.14, + "learning_rate": 1.4241752560279604e-06, + "loss": 0.6777, + "step": 44449 + }, + { + "epoch": 1.14, + "learning_rate": 1.4241501980526419e-06, + "loss": 0.7051, + "step": 44450 + }, + { + "epoch": 1.14, + "learning_rate": 1.4241251397525709e-06, + "loss": 0.5513, + "step": 44451 + }, + { + "epoch": 1.14, + "learning_rate": 1.424100081127767e-06, + "loss": 0.5205, + "step": 44452 + }, + { + "epoch": 1.14, + "learning_rate": 1.4240750221782486e-06, + "loss": 0.6855, + "step": 44453 + }, + { + "epoch": 1.14, + "learning_rate": 1.4240499629040362e-06, + "loss": 0.6807, + "step": 44454 + }, + { + "epoch": 1.14, + "learning_rate": 1.4240249033051477e-06, + "loss": 0.7163, + "step": 44455 + }, + { + "epoch": 1.14, + "learning_rate": 1.423999843381603e-06, + "loss": 0.7754, + "step": 44456 + }, + { + "epoch": 1.14, + "learning_rate": 1.4239747831334212e-06, + "loss": 0.6152, + "step": 44457 + }, + { + "epoch": 1.14, + "learning_rate": 1.4239497225606214e-06, + "loss": 0.6543, + "step": 44458 + }, + { + "epoch": 1.14, + "learning_rate": 1.4239246616632228e-06, + "loss": 0.6235, + "step": 44459 + }, + { + "epoch": 1.14, + "learning_rate": 1.4238996004412445e-06, + "loss": 0.7246, + "step": 44460 + }, + { + "epoch": 1.14, + "learning_rate": 1.4238745388947054e-06, + "loss": 0.6924, + "step": 44461 + }, + { + "epoch": 1.14, + "learning_rate": 1.4238494770236255e-06, + "loss": 0.7148, + "step": 44462 + }, + { + "epoch": 1.14, + "learning_rate": 1.4238244148280237e-06, + "loss": 0.584, + "step": 44463 + }, + { + "epoch": 1.14, + "learning_rate": 1.4237993523079185e-06, + "loss": 0.748, + "step": 44464 + }, + { + "epoch": 1.14, + "learning_rate": 1.4237742894633302e-06, + "loss": 0.4231, + "step": 44465 + }, + { + "epoch": 1.14, + "learning_rate": 1.4237492262942771e-06, + "loss": 0.6357, + "step": 44466 + }, + { + "epoch": 1.14, + "learning_rate": 1.423724162800779e-06, + "loss": 0.5603, + "step": 44467 + }, + { + "epoch": 1.14, + "learning_rate": 1.4236990989828544e-06, + "loss": 0.7598, + "step": 44468 + }, + { + "epoch": 1.14, + "learning_rate": 1.423674034840523e-06, + "loss": 0.7832, + "step": 44469 + }, + { + "epoch": 1.14, + "learning_rate": 1.4236489703738039e-06, + "loss": 0.7998, + "step": 44470 + }, + { + "epoch": 1.14, + "learning_rate": 1.4236239055827163e-06, + "loss": 0.6465, + "step": 44471 + }, + { + "epoch": 1.14, + "learning_rate": 1.4235988404672793e-06, + "loss": 0.7637, + "step": 44472 + }, + { + "epoch": 1.14, + "learning_rate": 1.4235737750275123e-06, + "loss": 0.6569, + "step": 44473 + }, + { + "epoch": 1.14, + "learning_rate": 1.423548709263434e-06, + "loss": 0.6396, + "step": 44474 + }, + { + "epoch": 1.14, + "learning_rate": 1.423523643175064e-06, + "loss": 0.7305, + "step": 44475 + }, + { + "epoch": 1.14, + "learning_rate": 1.4234985767624217e-06, + "loss": 0.5957, + "step": 44476 + }, + { + "epoch": 1.14, + "learning_rate": 1.423473510025526e-06, + "loss": 0.79, + "step": 44477 + }, + { + "epoch": 1.14, + "learning_rate": 1.4234484429643959e-06, + "loss": 0.4849, + "step": 44478 + }, + { + "epoch": 1.14, + "learning_rate": 1.423423375579051e-06, + "loss": 0.7661, + "step": 44479 + }, + { + "epoch": 1.14, + "learning_rate": 1.42339830786951e-06, + "loss": 0.8301, + "step": 44480 + }, + { + "epoch": 1.14, + "learning_rate": 1.4233732398357924e-06, + "loss": 0.4739, + "step": 44481 + }, + { + "epoch": 1.14, + "learning_rate": 1.4233481714779177e-06, + "loss": 0.6763, + "step": 44482 + }, + { + "epoch": 1.14, + "learning_rate": 1.4233231027959045e-06, + "loss": 0.5913, + "step": 44483 + }, + { + "epoch": 1.14, + "learning_rate": 1.4232980337897724e-06, + "loss": 0.6191, + "step": 44484 + }, + { + "epoch": 1.14, + "learning_rate": 1.4232729644595403e-06, + "loss": 0.7607, + "step": 44485 + }, + { + "epoch": 1.14, + "learning_rate": 1.4232478948052277e-06, + "loss": 0.7183, + "step": 44486 + }, + { + "epoch": 1.14, + "learning_rate": 1.4232228248268536e-06, + "loss": 0.7529, + "step": 44487 + }, + { + "epoch": 1.14, + "learning_rate": 1.4231977545244374e-06, + "loss": 0.6904, + "step": 44488 + }, + { + "epoch": 1.14, + "learning_rate": 1.4231726838979978e-06, + "loss": 0.5615, + "step": 44489 + }, + { + "epoch": 1.14, + "learning_rate": 1.4231476129475547e-06, + "loss": 0.5455, + "step": 44490 + }, + { + "epoch": 1.14, + "learning_rate": 1.4231225416731268e-06, + "loss": 0.374, + "step": 44491 + }, + { + "epoch": 1.14, + "learning_rate": 1.4230974700747334e-06, + "loss": 0.7588, + "step": 44492 + }, + { + "epoch": 1.14, + "learning_rate": 1.4230723981523935e-06, + "loss": 0.5371, + "step": 44493 + }, + { + "epoch": 1.14, + "learning_rate": 1.4230473259061268e-06, + "loss": 0.79, + "step": 44494 + }, + { + "epoch": 1.14, + "learning_rate": 1.4230222533359522e-06, + "loss": 0.7871, + "step": 44495 + }, + { + "epoch": 1.14, + "learning_rate": 1.422997180441889e-06, + "loss": 0.5591, + "step": 44496 + }, + { + "epoch": 1.14, + "learning_rate": 1.422972107223956e-06, + "loss": 0.6074, + "step": 44497 + }, + { + "epoch": 1.14, + "learning_rate": 1.422947033682173e-06, + "loss": 0.6777, + "step": 44498 + }, + { + "epoch": 1.14, + "learning_rate": 1.4229219598165585e-06, + "loss": 0.6426, + "step": 44499 + }, + { + "epoch": 1.14, + "learning_rate": 1.4228968856271324e-06, + "loss": 0.749, + "step": 44500 + }, + { + "epoch": 1.14, + "learning_rate": 1.4228718111139137e-06, + "loss": 0.6953, + "step": 44501 + }, + { + "epoch": 1.14, + "learning_rate": 1.4228467362769212e-06, + "loss": 0.52, + "step": 44502 + }, + { + "epoch": 1.14, + "learning_rate": 1.4228216611161745e-06, + "loss": 0.6134, + "step": 44503 + }, + { + "epoch": 1.14, + "learning_rate": 1.422796585631693e-06, + "loss": 0.7144, + "step": 44504 + }, + { + "epoch": 1.14, + "learning_rate": 1.4227715098234952e-06, + "loss": 0.7822, + "step": 44505 + }, + { + "epoch": 1.14, + "learning_rate": 1.4227464336916008e-06, + "loss": 0.4243, + "step": 44506 + }, + { + "epoch": 1.14, + "learning_rate": 1.4227213572360294e-06, + "loss": 0.6592, + "step": 44507 + }, + { + "epoch": 1.14, + "learning_rate": 1.4226962804567987e-06, + "loss": 0.5779, + "step": 44508 + }, + { + "epoch": 1.14, + "learning_rate": 1.4226712033539297e-06, + "loss": 0.5117, + "step": 44509 + }, + { + "epoch": 1.14, + "learning_rate": 1.4226461259274402e-06, + "loss": 0.751, + "step": 44510 + }, + { + "epoch": 1.14, + "learning_rate": 1.4226210481773508e-06, + "loss": 0.6104, + "step": 44511 + }, + { + "epoch": 1.14, + "learning_rate": 1.422595970103679e-06, + "loss": 0.6714, + "step": 44512 + }, + { + "epoch": 1.14, + "learning_rate": 1.4225708917064457e-06, + "loss": 0.5098, + "step": 44513 + }, + { + "epoch": 1.14, + "learning_rate": 1.4225458129856686e-06, + "loss": 0.627, + "step": 44514 + }, + { + "epoch": 1.14, + "learning_rate": 1.4225207339413681e-06, + "loss": 0.7393, + "step": 44515 + }, + { + "epoch": 1.14, + "learning_rate": 1.4224956545735627e-06, + "loss": 0.542, + "step": 44516 + }, + { + "epoch": 1.14, + "learning_rate": 1.4224705748822718e-06, + "loss": 0.748, + "step": 44517 + }, + { + "epoch": 1.14, + "learning_rate": 1.4224454948675146e-06, + "loss": 0.6504, + "step": 44518 + }, + { + "epoch": 1.14, + "learning_rate": 1.4224204145293103e-06, + "loss": 0.646, + "step": 44519 + }, + { + "epoch": 1.14, + "learning_rate": 1.4223953338676781e-06, + "loss": 0.7959, + "step": 44520 + }, + { + "epoch": 1.14, + "learning_rate": 1.4223702528826376e-06, + "loss": 0.7617, + "step": 44521 + }, + { + "epoch": 1.14, + "learning_rate": 1.4223451715742072e-06, + "loss": 0.5753, + "step": 44522 + }, + { + "epoch": 1.14, + "learning_rate": 1.4223200899424066e-06, + "loss": 0.5669, + "step": 44523 + }, + { + "epoch": 1.14, + "learning_rate": 1.422295007987255e-06, + "loss": 0.8174, + "step": 44524 + }, + { + "epoch": 1.14, + "learning_rate": 1.4222699257087713e-06, + "loss": 0.7314, + "step": 44525 + }, + { + "epoch": 1.14, + "learning_rate": 1.422244843106975e-06, + "loss": 0.5649, + "step": 44526 + }, + { + "epoch": 1.14, + "learning_rate": 1.4222197601818853e-06, + "loss": 0.5718, + "step": 44527 + }, + { + "epoch": 1.14, + "learning_rate": 1.4221946769335214e-06, + "loss": 0.8105, + "step": 44528 + }, + { + "epoch": 1.14, + "learning_rate": 1.4221695933619025e-06, + "loss": 0.7471, + "step": 44529 + }, + { + "epoch": 1.14, + "learning_rate": 1.4221445094670477e-06, + "loss": 0.7061, + "step": 44530 + }, + { + "epoch": 1.14, + "learning_rate": 1.4221194252489764e-06, + "loss": 0.6924, + "step": 44531 + }, + { + "epoch": 1.14, + "learning_rate": 1.4220943407077074e-06, + "loss": 0.6885, + "step": 44532 + }, + { + "epoch": 1.14, + "learning_rate": 1.4220692558432601e-06, + "loss": 0.6099, + "step": 44533 + }, + { + "epoch": 1.14, + "learning_rate": 1.4220441706556541e-06, + "loss": 0.7246, + "step": 44534 + }, + { + "epoch": 1.14, + "learning_rate": 1.4220190851449078e-06, + "loss": 0.6162, + "step": 44535 + }, + { + "epoch": 1.14, + "learning_rate": 1.4219939993110418e-06, + "loss": 0.7402, + "step": 44536 + }, + { + "epoch": 1.14, + "learning_rate": 1.4219689131540735e-06, + "loss": 0.6587, + "step": 44537 + }, + { + "epoch": 1.14, + "learning_rate": 1.4219438266740236e-06, + "loss": 0.5862, + "step": 44538 + }, + { + "epoch": 1.14, + "learning_rate": 1.42191873987091e-06, + "loss": 0.6865, + "step": 44539 + }, + { + "epoch": 1.14, + "learning_rate": 1.4218936527447534e-06, + "loss": 0.5752, + "step": 44540 + }, + { + "epoch": 1.14, + "learning_rate": 1.421868565295572e-06, + "loss": 0.7109, + "step": 44541 + }, + { + "epoch": 1.14, + "learning_rate": 1.4218434775233852e-06, + "loss": 0.7812, + "step": 44542 + }, + { + "epoch": 1.14, + "learning_rate": 1.4218183894282118e-06, + "loss": 0.5386, + "step": 44543 + }, + { + "epoch": 1.14, + "learning_rate": 1.421793301010072e-06, + "loss": 0.6191, + "step": 44544 + }, + { + "epoch": 1.14, + "learning_rate": 1.4217682122689842e-06, + "loss": 0.6636, + "step": 44545 + }, + { + "epoch": 1.14, + "learning_rate": 1.4217431232049681e-06, + "loss": 0.6533, + "step": 44546 + }, + { + "epoch": 1.14, + "learning_rate": 1.4217180338180426e-06, + "loss": 0.665, + "step": 44547 + }, + { + "epoch": 1.14, + "learning_rate": 1.4216929441082268e-06, + "loss": 0.6143, + "step": 44548 + }, + { + "epoch": 1.14, + "learning_rate": 1.4216678540755402e-06, + "loss": 0.3352, + "step": 44549 + }, + { + "epoch": 1.14, + "learning_rate": 1.4216427637200022e-06, + "loss": 0.5474, + "step": 44550 + }, + { + "epoch": 1.14, + "learning_rate": 1.4216176730416316e-06, + "loss": 0.7061, + "step": 44551 + }, + { + "epoch": 1.14, + "learning_rate": 1.4215925820404474e-06, + "loss": 0.6836, + "step": 44552 + }, + { + "epoch": 1.14, + "learning_rate": 1.4215674907164695e-06, + "loss": 0.6787, + "step": 44553 + }, + { + "epoch": 1.14, + "learning_rate": 1.4215423990697163e-06, + "loss": 0.4646, + "step": 44554 + }, + { + "epoch": 1.14, + "learning_rate": 1.421517307100208e-06, + "loss": 0.667, + "step": 44555 + }, + { + "epoch": 1.14, + "learning_rate": 1.4214922148079631e-06, + "loss": 0.6191, + "step": 44556 + }, + { + "epoch": 1.14, + "learning_rate": 1.421467122193001e-06, + "loss": 0.5786, + "step": 44557 + }, + { + "epoch": 1.14, + "learning_rate": 1.4214420292553406e-06, + "loss": 0.5615, + "step": 44558 + }, + { + "epoch": 1.14, + "learning_rate": 1.421416935995002e-06, + "loss": 0.6362, + "step": 44559 + }, + { + "epoch": 1.14, + "learning_rate": 1.4213918424120033e-06, + "loss": 0.6152, + "step": 44560 + }, + { + "epoch": 1.14, + "learning_rate": 1.4213667485063647e-06, + "loss": 0.7095, + "step": 44561 + }, + { + "epoch": 1.14, + "learning_rate": 1.4213416542781044e-06, + "loss": 0.7021, + "step": 44562 + }, + { + "epoch": 1.14, + "learning_rate": 1.4213165597272427e-06, + "loss": 0.5376, + "step": 44563 + }, + { + "epoch": 1.14, + "learning_rate": 1.421291464853798e-06, + "loss": 0.6279, + "step": 44564 + }, + { + "epoch": 1.14, + "learning_rate": 1.4212663696577898e-06, + "loss": 0.5603, + "step": 44565 + }, + { + "epoch": 1.14, + "learning_rate": 1.4212412741392377e-06, + "loss": 0.7402, + "step": 44566 + }, + { + "epoch": 1.14, + "learning_rate": 1.42121617829816e-06, + "loss": 0.6265, + "step": 44567 + }, + { + "epoch": 1.14, + "learning_rate": 1.4211910821345767e-06, + "loss": 0.6445, + "step": 44568 + }, + { + "epoch": 1.14, + "learning_rate": 1.4211659856485066e-06, + "loss": 0.8271, + "step": 44569 + }, + { + "epoch": 1.14, + "learning_rate": 1.421140888839969e-06, + "loss": 0.4941, + "step": 44570 + }, + { + "epoch": 1.14, + "learning_rate": 1.4211157917089836e-06, + "loss": 0.8398, + "step": 44571 + }, + { + "epoch": 1.14, + "learning_rate": 1.4210906942555689e-06, + "loss": 0.6562, + "step": 44572 + }, + { + "epoch": 1.14, + "learning_rate": 1.4210655964797442e-06, + "loss": 0.7424, + "step": 44573 + }, + { + "epoch": 1.14, + "learning_rate": 1.4210404983815295e-06, + "loss": 0.5317, + "step": 44574 + }, + { + "epoch": 1.14, + "learning_rate": 1.4210153999609429e-06, + "loss": 0.5747, + "step": 44575 + }, + { + "epoch": 1.14, + "learning_rate": 1.4209903012180046e-06, + "loss": 0.6748, + "step": 44576 + }, + { + "epoch": 1.14, + "learning_rate": 1.4209652021527332e-06, + "loss": 0.6035, + "step": 44577 + }, + { + "epoch": 1.14, + "learning_rate": 1.4209401027651482e-06, + "loss": 0.5112, + "step": 44578 + }, + { + "epoch": 1.14, + "learning_rate": 1.4209150030552684e-06, + "loss": 0.5354, + "step": 44579 + }, + { + "epoch": 1.14, + "learning_rate": 1.4208899030231135e-06, + "loss": 0.5981, + "step": 44580 + }, + { + "epoch": 1.14, + "learning_rate": 1.420864802668703e-06, + "loss": 0.7578, + "step": 44581 + }, + { + "epoch": 1.14, + "learning_rate": 1.4208397019920553e-06, + "loss": 0.5298, + "step": 44582 + }, + { + "epoch": 1.14, + "learning_rate": 1.4208146009931898e-06, + "loss": 0.5747, + "step": 44583 + }, + { + "epoch": 1.14, + "learning_rate": 1.420789499672126e-06, + "loss": 0.5809, + "step": 44584 + }, + { + "epoch": 1.14, + "learning_rate": 1.420764398028883e-06, + "loss": 0.7148, + "step": 44585 + }, + { + "epoch": 1.14, + "learning_rate": 1.4207392960634805e-06, + "loss": 0.5696, + "step": 44586 + }, + { + "epoch": 1.14, + "learning_rate": 1.4207141937759367e-06, + "loss": 0.5629, + "step": 44587 + }, + { + "epoch": 1.14, + "learning_rate": 1.4206890911662719e-06, + "loss": 0.7031, + "step": 44588 + }, + { + "epoch": 1.14, + "learning_rate": 1.4206639882345045e-06, + "loss": 0.5737, + "step": 44589 + }, + { + "epoch": 1.14, + "learning_rate": 1.420638884980654e-06, + "loss": 0.6147, + "step": 44590 + }, + { + "epoch": 1.14, + "learning_rate": 1.4206137814047396e-06, + "loss": 0.5303, + "step": 44591 + }, + { + "epoch": 1.14, + "learning_rate": 1.4205886775067806e-06, + "loss": 0.6279, + "step": 44592 + }, + { + "epoch": 1.14, + "learning_rate": 1.4205635732867964e-06, + "loss": 0.5967, + "step": 44593 + }, + { + "epoch": 1.14, + "learning_rate": 1.4205384687448058e-06, + "loss": 0.542, + "step": 44594 + }, + { + "epoch": 1.14, + "learning_rate": 1.4205133638808282e-06, + "loss": 0.7979, + "step": 44595 + }, + { + "epoch": 1.14, + "learning_rate": 1.420488258694883e-06, + "loss": 0.6235, + "step": 44596 + }, + { + "epoch": 1.14, + "learning_rate": 1.4204631531869896e-06, + "loss": 0.6074, + "step": 44597 + }, + { + "epoch": 1.14, + "learning_rate": 1.4204380473571663e-06, + "loss": 0.6743, + "step": 44598 + }, + { + "epoch": 1.14, + "learning_rate": 1.420412941205433e-06, + "loss": 0.7324, + "step": 44599 + }, + { + "epoch": 1.14, + "learning_rate": 1.4203878347318088e-06, + "loss": 0.8203, + "step": 44600 + }, + { + "epoch": 1.14, + "learning_rate": 1.4203627279363136e-06, + "loss": 0.5957, + "step": 44601 + }, + { + "epoch": 1.14, + "learning_rate": 1.4203376208189655e-06, + "loss": 0.6279, + "step": 44602 + }, + { + "epoch": 1.14, + "learning_rate": 1.4203125133797841e-06, + "loss": 0.834, + "step": 44603 + }, + { + "epoch": 1.14, + "learning_rate": 1.4202874056187888e-06, + "loss": 0.6611, + "step": 44604 + }, + { + "epoch": 1.14, + "learning_rate": 1.420262297535999e-06, + "loss": 0.7021, + "step": 44605 + }, + { + "epoch": 1.14, + "learning_rate": 1.4202371891314336e-06, + "loss": 0.7041, + "step": 44606 + }, + { + "epoch": 1.14, + "learning_rate": 1.4202120804051119e-06, + "loss": 0.5972, + "step": 44607 + }, + { + "epoch": 1.14, + "learning_rate": 1.4201869713570528e-06, + "loss": 0.7627, + "step": 44608 + }, + { + "epoch": 1.14, + "learning_rate": 1.4201618619872762e-06, + "loss": 0.7002, + "step": 44609 + }, + { + "epoch": 1.14, + "learning_rate": 1.4201367522958007e-06, + "loss": 0.6865, + "step": 44610 + }, + { + "epoch": 1.14, + "learning_rate": 1.4201116422826465e-06, + "loss": 0.7041, + "step": 44611 + }, + { + "epoch": 1.14, + "learning_rate": 1.4200865319478315e-06, + "loss": 0.7686, + "step": 44612 + }, + { + "epoch": 1.14, + "learning_rate": 1.4200614212913756e-06, + "loss": 0.8037, + "step": 44613 + }, + { + "epoch": 1.14, + "learning_rate": 1.420036310313298e-06, + "loss": 0.8721, + "step": 44614 + }, + { + "epoch": 1.14, + "learning_rate": 1.4200111990136182e-06, + "loss": 0.627, + "step": 44615 + }, + { + "epoch": 1.14, + "learning_rate": 1.4199860873923548e-06, + "loss": 0.8135, + "step": 44616 + }, + { + "epoch": 1.14, + "learning_rate": 1.4199609754495273e-06, + "loss": 0.6494, + "step": 44617 + }, + { + "epoch": 1.14, + "learning_rate": 1.4199358631851554e-06, + "loss": 0.6201, + "step": 44618 + }, + { + "epoch": 1.14, + "learning_rate": 1.4199107505992576e-06, + "loss": 0.6992, + "step": 44619 + }, + { + "epoch": 1.14, + "learning_rate": 1.4198856376918536e-06, + "loss": 0.5649, + "step": 44620 + }, + { + "epoch": 1.14, + "learning_rate": 1.4198605244629625e-06, + "loss": 0.7324, + "step": 44621 + }, + { + "epoch": 1.14, + "learning_rate": 1.4198354109126033e-06, + "loss": 0.6914, + "step": 44622 + }, + { + "epoch": 1.14, + "learning_rate": 1.4198102970407956e-06, + "loss": 0.5962, + "step": 44623 + }, + { + "epoch": 1.14, + "learning_rate": 1.4197851828475585e-06, + "loss": 0.6113, + "step": 44624 + }, + { + "epoch": 1.14, + "learning_rate": 1.419760068332911e-06, + "loss": 0.6406, + "step": 44625 + }, + { + "epoch": 1.14, + "learning_rate": 1.4197349534968727e-06, + "loss": 0.7227, + "step": 44626 + }, + { + "epoch": 1.14, + "learning_rate": 1.4197098383394625e-06, + "loss": 0.6709, + "step": 44627 + }, + { + "epoch": 1.14, + "learning_rate": 1.4196847228607e-06, + "loss": 0.543, + "step": 44628 + }, + { + "epoch": 1.14, + "learning_rate": 1.419659607060604e-06, + "loss": 0.562, + "step": 44629 + }, + { + "epoch": 1.14, + "learning_rate": 1.419634490939194e-06, + "loss": 0.5542, + "step": 44630 + }, + { + "epoch": 1.14, + "learning_rate": 1.4196093744964893e-06, + "loss": 0.4481, + "step": 44631 + }, + { + "epoch": 1.14, + "learning_rate": 1.4195842577325087e-06, + "loss": 0.5962, + "step": 44632 + }, + { + "epoch": 1.14, + "learning_rate": 1.4195591406472718e-06, + "loss": 0.7314, + "step": 44633 + }, + { + "epoch": 1.14, + "learning_rate": 1.419534023240798e-06, + "loss": 0.6763, + "step": 44634 + }, + { + "epoch": 1.14, + "learning_rate": 1.419508905513106e-06, + "loss": 0.7231, + "step": 44635 + }, + { + "epoch": 1.14, + "learning_rate": 1.4194837874642154e-06, + "loss": 0.6592, + "step": 44636 + }, + { + "epoch": 1.14, + "learning_rate": 1.4194586690941454e-06, + "loss": 0.5723, + "step": 44637 + }, + { + "epoch": 1.14, + "learning_rate": 1.4194335504029152e-06, + "loss": 0.6133, + "step": 44638 + }, + { + "epoch": 1.14, + "learning_rate": 1.419408431390544e-06, + "loss": 0.5598, + "step": 44639 + }, + { + "epoch": 1.14, + "learning_rate": 1.419383312057051e-06, + "loss": 0.959, + "step": 44640 + }, + { + "epoch": 1.14, + "learning_rate": 1.4193581924024555e-06, + "loss": 0.6006, + "step": 44641 + }, + { + "epoch": 1.14, + "learning_rate": 1.419333072426777e-06, + "loss": 0.6426, + "step": 44642 + }, + { + "epoch": 1.14, + "learning_rate": 1.4193079521300341e-06, + "loss": 0.5337, + "step": 44643 + }, + { + "epoch": 1.14, + "learning_rate": 1.4192828315122463e-06, + "loss": 0.6582, + "step": 44644 + }, + { + "epoch": 1.14, + "learning_rate": 1.419257710573433e-06, + "loss": 0.7725, + "step": 44645 + }, + { + "epoch": 1.14, + "learning_rate": 1.4192325893136136e-06, + "loss": 0.6133, + "step": 44646 + }, + { + "epoch": 1.14, + "learning_rate": 1.419207467732807e-06, + "loss": 0.8711, + "step": 44647 + }, + { + "epoch": 1.14, + "learning_rate": 1.4191823458310324e-06, + "loss": 0.6768, + "step": 44648 + }, + { + "epoch": 1.14, + "learning_rate": 1.419157223608309e-06, + "loss": 0.5649, + "step": 44649 + }, + { + "epoch": 1.14, + "learning_rate": 1.4191321010646563e-06, + "loss": 0.3986, + "step": 44650 + }, + { + "epoch": 1.14, + "learning_rate": 1.419106978200094e-06, + "loss": 0.5996, + "step": 44651 + }, + { + "epoch": 1.14, + "learning_rate": 1.41908185501464e-06, + "loss": 0.7461, + "step": 44652 + }, + { + "epoch": 1.14, + "learning_rate": 1.4190567315083146e-06, + "loss": 0.6172, + "step": 44653 + }, + { + "epoch": 1.14, + "learning_rate": 1.4190316076811365e-06, + "loss": 0.6108, + "step": 44654 + }, + { + "epoch": 1.14, + "learning_rate": 1.4190064835331255e-06, + "loss": 0.6787, + "step": 44655 + }, + { + "epoch": 1.14, + "learning_rate": 1.4189813590643005e-06, + "loss": 0.606, + "step": 44656 + }, + { + "epoch": 1.14, + "learning_rate": 1.4189562342746807e-06, + "loss": 0.7129, + "step": 44657 + }, + { + "epoch": 1.14, + "learning_rate": 1.418931109164285e-06, + "loss": 0.5579, + "step": 44658 + }, + { + "epoch": 1.14, + "learning_rate": 1.4189059837331331e-06, + "loss": 0.5898, + "step": 44659 + }, + { + "epoch": 1.14, + "learning_rate": 1.4188808579812443e-06, + "loss": 0.7324, + "step": 44660 + }, + { + "epoch": 1.14, + "learning_rate": 1.4188557319086378e-06, + "loss": 0.3969, + "step": 44661 + }, + { + "epoch": 1.14, + "learning_rate": 1.4188306055153328e-06, + "loss": 0.5024, + "step": 44662 + }, + { + "epoch": 1.14, + "learning_rate": 1.418805478801348e-06, + "loss": 0.5162, + "step": 44663 + }, + { + "epoch": 1.14, + "learning_rate": 1.4187803517667036e-06, + "loss": 0.6646, + "step": 44664 + }, + { + "epoch": 1.14, + "learning_rate": 1.418755224411418e-06, + "loss": 0.5327, + "step": 44665 + }, + { + "epoch": 1.14, + "learning_rate": 1.418730096735511e-06, + "loss": 0.8945, + "step": 44666 + }, + { + "epoch": 1.14, + "learning_rate": 1.4187049687390016e-06, + "loss": 0.7676, + "step": 44667 + }, + { + "epoch": 1.14, + "learning_rate": 1.4186798404219092e-06, + "loss": 0.7295, + "step": 44668 + }, + { + "epoch": 1.14, + "learning_rate": 1.4186547117842524e-06, + "loss": 0.4385, + "step": 44669 + }, + { + "epoch": 1.14, + "learning_rate": 1.4186295828260515e-06, + "loss": 0.6653, + "step": 44670 + }, + { + "epoch": 1.14, + "learning_rate": 1.4186044535473248e-06, + "loss": 0.6177, + "step": 44671 + }, + { + "epoch": 1.14, + "learning_rate": 1.4185793239480922e-06, + "loss": 0.6709, + "step": 44672 + }, + { + "epoch": 1.14, + "learning_rate": 1.4185541940283723e-06, + "loss": 0.6489, + "step": 44673 + }, + { + "epoch": 1.15, + "learning_rate": 1.4185290637881848e-06, + "loss": 0.6094, + "step": 44674 + }, + { + "epoch": 1.15, + "learning_rate": 1.418503933227549e-06, + "loss": 0.3733, + "step": 44675 + }, + { + "epoch": 1.15, + "learning_rate": 1.4184788023464841e-06, + "loss": 0.7129, + "step": 44676 + }, + { + "epoch": 1.15, + "learning_rate": 1.4184536711450089e-06, + "loss": 0.6226, + "step": 44677 + }, + { + "epoch": 1.15, + "learning_rate": 1.4184285396231432e-06, + "loss": 0.6582, + "step": 44678 + }, + { + "epoch": 1.15, + "learning_rate": 1.4184034077809057e-06, + "loss": 0.749, + "step": 44679 + }, + { + "epoch": 1.15, + "learning_rate": 1.4183782756183162e-06, + "loss": 0.4324, + "step": 44680 + }, + { + "epoch": 1.15, + "learning_rate": 1.418353143135394e-06, + "loss": 0.7012, + "step": 44681 + }, + { + "epoch": 1.15, + "learning_rate": 1.4183280103321574e-06, + "loss": 0.8408, + "step": 44682 + }, + { + "epoch": 1.15, + "learning_rate": 1.4183028772086265e-06, + "loss": 0.6084, + "step": 44683 + }, + { + "epoch": 1.15, + "learning_rate": 1.4182777437648207e-06, + "loss": 0.4895, + "step": 44684 + }, + { + "epoch": 1.15, + "learning_rate": 1.4182526100007582e-06, + "loss": 0.6836, + "step": 44685 + }, + { + "epoch": 1.15, + "learning_rate": 1.4182274759164594e-06, + "loss": 0.4919, + "step": 44686 + }, + { + "epoch": 1.15, + "learning_rate": 1.4182023415119429e-06, + "loss": 0.6812, + "step": 44687 + }, + { + "epoch": 1.15, + "learning_rate": 1.418177206787228e-06, + "loss": 0.7188, + "step": 44688 + }, + { + "epoch": 1.15, + "learning_rate": 1.418152071742334e-06, + "loss": 0.3073, + "step": 44689 + }, + { + "epoch": 1.15, + "learning_rate": 1.4181269363772802e-06, + "loss": 0.6865, + "step": 44690 + }, + { + "epoch": 1.15, + "learning_rate": 1.4181018006920865e-06, + "loss": 0.4351, + "step": 44691 + }, + { + "epoch": 1.15, + "learning_rate": 1.4180766646867706e-06, + "loss": 0.689, + "step": 44692 + }, + { + "epoch": 1.15, + "learning_rate": 1.418051528361353e-06, + "loss": 0.6738, + "step": 44693 + }, + { + "epoch": 1.15, + "learning_rate": 1.4180263917158525e-06, + "loss": 0.5063, + "step": 44694 + }, + { + "epoch": 1.15, + "learning_rate": 1.4180012547502884e-06, + "loss": 0.6191, + "step": 44695 + }, + { + "epoch": 1.15, + "learning_rate": 1.41797611746468e-06, + "loss": 0.3837, + "step": 44696 + }, + { + "epoch": 1.15, + "learning_rate": 1.4179509798590468e-06, + "loss": 0.665, + "step": 44697 + }, + { + "epoch": 1.15, + "learning_rate": 1.4179258419334073e-06, + "loss": 0.5234, + "step": 44698 + }, + { + "epoch": 1.15, + "learning_rate": 1.4179007036877813e-06, + "loss": 0.6641, + "step": 44699 + }, + { + "epoch": 1.15, + "learning_rate": 1.4178755651221879e-06, + "loss": 0.6089, + "step": 44700 + }, + { + "epoch": 1.15, + "learning_rate": 1.4178504262366468e-06, + "loss": 0.5596, + "step": 44701 + }, + { + "epoch": 1.15, + "learning_rate": 1.4178252870311765e-06, + "loss": 0.7793, + "step": 44702 + }, + { + "epoch": 1.15, + "learning_rate": 1.4178001475057966e-06, + "loss": 0.5172, + "step": 44703 + }, + { + "epoch": 1.15, + "learning_rate": 1.4177750076605261e-06, + "loss": 0.668, + "step": 44704 + }, + { + "epoch": 1.15, + "learning_rate": 1.417749867495385e-06, + "loss": 0.8926, + "step": 44705 + }, + { + "epoch": 1.15, + "learning_rate": 1.4177247270103918e-06, + "loss": 0.3403, + "step": 44706 + }, + { + "epoch": 1.15, + "learning_rate": 1.4176995862055658e-06, + "loss": 0.7158, + "step": 44707 + }, + { + "epoch": 1.15, + "learning_rate": 1.4176744450809265e-06, + "loss": 0.6428, + "step": 44708 + }, + { + "epoch": 1.15, + "learning_rate": 1.4176493036364932e-06, + "loss": 0.6963, + "step": 44709 + }, + { + "epoch": 1.15, + "learning_rate": 1.417624161872285e-06, + "loss": 0.6953, + "step": 44710 + }, + { + "epoch": 1.15, + "learning_rate": 1.4175990197883214e-06, + "loss": 0.749, + "step": 44711 + }, + { + "epoch": 1.15, + "learning_rate": 1.4175738773846213e-06, + "loss": 0.6914, + "step": 44712 + }, + { + "epoch": 1.15, + "learning_rate": 1.4175487346612038e-06, + "loss": 0.7041, + "step": 44713 + }, + { + "epoch": 1.15, + "learning_rate": 1.4175235916180887e-06, + "loss": 0.8408, + "step": 44714 + }, + { + "epoch": 1.15, + "learning_rate": 1.417498448255295e-06, + "loss": 0.7178, + "step": 44715 + }, + { + "epoch": 1.15, + "learning_rate": 1.417473304572842e-06, + "loss": 0.4995, + "step": 44716 + }, + { + "epoch": 1.15, + "learning_rate": 1.4174481605707488e-06, + "loss": 0.5476, + "step": 44717 + }, + { + "epoch": 1.15, + "learning_rate": 1.4174230162490345e-06, + "loss": 0.791, + "step": 44718 + }, + { + "epoch": 1.15, + "learning_rate": 1.4173978716077186e-06, + "loss": 0.6143, + "step": 44719 + }, + { + "epoch": 1.15, + "learning_rate": 1.4173727266468208e-06, + "loss": 0.6704, + "step": 44720 + }, + { + "epoch": 1.15, + "learning_rate": 1.4173475813663596e-06, + "loss": 0.6313, + "step": 44721 + }, + { + "epoch": 1.15, + "learning_rate": 1.4173224357663547e-06, + "loss": 0.6709, + "step": 44722 + }, + { + "epoch": 1.15, + "learning_rate": 1.417297289846825e-06, + "loss": 0.6313, + "step": 44723 + }, + { + "epoch": 1.15, + "learning_rate": 1.41727214360779e-06, + "loss": 0.6514, + "step": 44724 + }, + { + "epoch": 1.15, + "learning_rate": 1.4172469970492688e-06, + "loss": 0.8662, + "step": 44725 + }, + { + "epoch": 1.15, + "learning_rate": 1.4172218501712809e-06, + "loss": 0.7529, + "step": 44726 + }, + { + "epoch": 1.15, + "learning_rate": 1.4171967029738455e-06, + "loss": 0.6509, + "step": 44727 + }, + { + "epoch": 1.15, + "learning_rate": 1.4171715554569815e-06, + "loss": 0.8652, + "step": 44728 + }, + { + "epoch": 1.15, + "learning_rate": 1.4171464076207088e-06, + "loss": 0.5933, + "step": 44729 + }, + { + "epoch": 1.15, + "learning_rate": 1.4171212594650462e-06, + "loss": 0.6069, + "step": 44730 + }, + { + "epoch": 1.15, + "learning_rate": 1.4170961109900128e-06, + "loss": 0.6465, + "step": 44731 + }, + { + "epoch": 1.15, + "learning_rate": 1.417070962195628e-06, + "loss": 0.6816, + "step": 44732 + }, + { + "epoch": 1.15, + "learning_rate": 1.4170458130819115e-06, + "loss": 0.6929, + "step": 44733 + }, + { + "epoch": 1.15, + "learning_rate": 1.4170206636488817e-06, + "loss": 0.6875, + "step": 44734 + }, + { + "epoch": 1.15, + "learning_rate": 1.4169955138965588e-06, + "loss": 0.7617, + "step": 44735 + }, + { + "epoch": 1.15, + "learning_rate": 1.4169703638249617e-06, + "loss": 0.7578, + "step": 44736 + }, + { + "epoch": 1.15, + "learning_rate": 1.4169452134341094e-06, + "loss": 0.6797, + "step": 44737 + }, + { + "epoch": 1.15, + "learning_rate": 1.416920062724021e-06, + "loss": 0.7148, + "step": 44738 + }, + { + "epoch": 1.15, + "learning_rate": 1.4168949116947165e-06, + "loss": 0.8213, + "step": 44739 + }, + { + "epoch": 1.15, + "learning_rate": 1.4168697603462145e-06, + "loss": 0.625, + "step": 44740 + }, + { + "epoch": 1.15, + "learning_rate": 1.4168446086785348e-06, + "loss": 0.6387, + "step": 44741 + }, + { + "epoch": 1.15, + "learning_rate": 1.416819456691696e-06, + "loss": 0.7354, + "step": 44742 + }, + { + "epoch": 1.15, + "learning_rate": 1.4167943043857179e-06, + "loss": 0.7793, + "step": 44743 + }, + { + "epoch": 1.15, + "learning_rate": 1.4167691517606192e-06, + "loss": 0.5833, + "step": 44744 + }, + { + "epoch": 1.15, + "learning_rate": 1.41674399881642e-06, + "loss": 0.6631, + "step": 44745 + }, + { + "epoch": 1.15, + "learning_rate": 1.416718845553139e-06, + "loss": 0.8682, + "step": 44746 + }, + { + "epoch": 1.15, + "learning_rate": 1.4166936919707955e-06, + "loss": 0.6611, + "step": 44747 + }, + { + "epoch": 1.15, + "learning_rate": 1.4166685380694086e-06, + "loss": 0.5615, + "step": 44748 + }, + { + "epoch": 1.15, + "learning_rate": 1.416643383848998e-06, + "loss": 0.4495, + "step": 44749 + }, + { + "epoch": 1.15, + "learning_rate": 1.4166182293095826e-06, + "loss": 0.6064, + "step": 44750 + }, + { + "epoch": 1.15, + "learning_rate": 1.4165930744511818e-06, + "loss": 0.7969, + "step": 44751 + }, + { + "epoch": 1.15, + "learning_rate": 1.416567919273815e-06, + "loss": 0.9141, + "step": 44752 + }, + { + "epoch": 1.15, + "learning_rate": 1.416542763777501e-06, + "loss": 0.7734, + "step": 44753 + }, + { + "epoch": 1.15, + "learning_rate": 1.4165176079622594e-06, + "loss": 0.6074, + "step": 44754 + }, + { + "epoch": 1.15, + "learning_rate": 1.4164924518281093e-06, + "loss": 0.4822, + "step": 44755 + }, + { + "epoch": 1.15, + "learning_rate": 1.4164672953750708e-06, + "loss": 0.7344, + "step": 44756 + }, + { + "epoch": 1.15, + "learning_rate": 1.4164421386031616e-06, + "loss": 0.7026, + "step": 44757 + }, + { + "epoch": 1.15, + "learning_rate": 1.4164169815124024e-06, + "loss": 0.6143, + "step": 44758 + }, + { + "epoch": 1.15, + "learning_rate": 1.4163918241028115e-06, + "loss": 0.6406, + "step": 44759 + }, + { + "epoch": 1.15, + "learning_rate": 1.416366666374409e-06, + "loss": 0.5439, + "step": 44760 + }, + { + "epoch": 1.15, + "learning_rate": 1.416341508327213e-06, + "loss": 0.6865, + "step": 44761 + }, + { + "epoch": 1.15, + "learning_rate": 1.416316349961244e-06, + "loss": 0.6855, + "step": 44762 + }, + { + "epoch": 1.15, + "learning_rate": 1.41629119127652e-06, + "loss": 0.7334, + "step": 44763 + }, + { + "epoch": 1.15, + "learning_rate": 1.4162660322730617e-06, + "loss": 0.6689, + "step": 44764 + }, + { + "epoch": 1.15, + "learning_rate": 1.4162408729508874e-06, + "loss": 0.708, + "step": 44765 + }, + { + "epoch": 1.15, + "learning_rate": 1.4162157133100168e-06, + "loss": 0.7151, + "step": 44766 + }, + { + "epoch": 1.15, + "learning_rate": 1.4161905533504686e-06, + "loss": 0.5715, + "step": 44767 + }, + { + "epoch": 1.15, + "learning_rate": 1.4161653930722625e-06, + "loss": 0.7061, + "step": 44768 + }, + { + "epoch": 1.15, + "learning_rate": 1.416140232475418e-06, + "loss": 0.6318, + "step": 44769 + }, + { + "epoch": 1.15, + "learning_rate": 1.4161150715599538e-06, + "loss": 0.5518, + "step": 44770 + }, + { + "epoch": 1.15, + "learning_rate": 1.4160899103258897e-06, + "loss": 0.5361, + "step": 44771 + }, + { + "epoch": 1.15, + "learning_rate": 1.4160647487732442e-06, + "loss": 0.5317, + "step": 44772 + }, + { + "epoch": 1.15, + "learning_rate": 1.4160395869020375e-06, + "loss": 0.6533, + "step": 44773 + }, + { + "epoch": 1.15, + "learning_rate": 1.416014424712288e-06, + "loss": 0.7178, + "step": 44774 + }, + { + "epoch": 1.15, + "learning_rate": 1.415989262204016e-06, + "loss": 0.5835, + "step": 44775 + }, + { + "epoch": 1.15, + "learning_rate": 1.4159640993772394e-06, + "loss": 0.5697, + "step": 44776 + }, + { + "epoch": 1.15, + "learning_rate": 1.4159389362319787e-06, + "loss": 0.6821, + "step": 44777 + }, + { + "epoch": 1.15, + "learning_rate": 1.4159137727682526e-06, + "loss": 0.5605, + "step": 44778 + }, + { + "epoch": 1.15, + "learning_rate": 1.4158886089860804e-06, + "loss": 0.7793, + "step": 44779 + }, + { + "epoch": 1.15, + "learning_rate": 1.4158634448854815e-06, + "loss": 0.501, + "step": 44780 + }, + { + "epoch": 1.15, + "learning_rate": 1.415838280466475e-06, + "loss": 0.5723, + "step": 44781 + }, + { + "epoch": 1.15, + "learning_rate": 1.4158131157290803e-06, + "loss": 0.6226, + "step": 44782 + }, + { + "epoch": 1.15, + "learning_rate": 1.4157879506733166e-06, + "loss": 0.7715, + "step": 44783 + }, + { + "epoch": 1.15, + "learning_rate": 1.4157627852992028e-06, + "loss": 0.6025, + "step": 44784 + }, + { + "epoch": 1.15, + "learning_rate": 1.4157376196067594e-06, + "loss": 0.6602, + "step": 44785 + }, + { + "epoch": 1.15, + "learning_rate": 1.4157124535960044e-06, + "loss": 0.749, + "step": 44786 + }, + { + "epoch": 1.15, + "learning_rate": 1.4156872872669575e-06, + "loss": 0.3882, + "step": 44787 + }, + { + "epoch": 1.15, + "learning_rate": 1.4156621206196375e-06, + "loss": 0.6631, + "step": 44788 + }, + { + "epoch": 1.15, + "learning_rate": 1.4156369536540646e-06, + "loss": 0.606, + "step": 44789 + }, + { + "epoch": 1.15, + "learning_rate": 1.4156117863702576e-06, + "loss": 0.7324, + "step": 44790 + }, + { + "epoch": 1.15, + "learning_rate": 1.4155866187682358e-06, + "loss": 0.6973, + "step": 44791 + }, + { + "epoch": 1.15, + "learning_rate": 1.4155614508480182e-06, + "loss": 0.6738, + "step": 44792 + }, + { + "epoch": 1.15, + "learning_rate": 1.4155362826096244e-06, + "loss": 0.6904, + "step": 44793 + }, + { + "epoch": 1.15, + "learning_rate": 1.4155111140530735e-06, + "loss": 0.7354, + "step": 44794 + }, + { + "epoch": 1.15, + "learning_rate": 1.415485945178385e-06, + "loss": 0.6372, + "step": 44795 + }, + { + "epoch": 1.15, + "learning_rate": 1.4154607759855778e-06, + "loss": 0.8086, + "step": 44796 + }, + { + "epoch": 1.15, + "learning_rate": 1.4154356064746718e-06, + "loss": 0.7168, + "step": 44797 + }, + { + "epoch": 1.15, + "learning_rate": 1.4154104366456854e-06, + "loss": 0.7656, + "step": 44798 + }, + { + "epoch": 1.15, + "learning_rate": 1.4153852664986385e-06, + "loss": 0.8057, + "step": 44799 + }, + { + "epoch": 1.15, + "learning_rate": 1.4153600960335505e-06, + "loss": 0.6802, + "step": 44800 + }, + { + "epoch": 1.15, + "learning_rate": 1.4153349252504399e-06, + "loss": 0.7695, + "step": 44801 + }, + { + "epoch": 1.15, + "learning_rate": 1.4153097541493267e-06, + "loss": 0.6758, + "step": 44802 + }, + { + "epoch": 1.15, + "learning_rate": 1.4152845827302299e-06, + "loss": 0.5994, + "step": 44803 + }, + { + "epoch": 1.15, + "learning_rate": 1.4152594109931685e-06, + "loss": 0.606, + "step": 44804 + }, + { + "epoch": 1.15, + "learning_rate": 1.4152342389381626e-06, + "loss": 0.5669, + "step": 44805 + }, + { + "epoch": 1.15, + "learning_rate": 1.4152090665652307e-06, + "loss": 0.7529, + "step": 44806 + }, + { + "epoch": 1.15, + "learning_rate": 1.415183893874392e-06, + "loss": 0.6333, + "step": 44807 + }, + { + "epoch": 1.15, + "learning_rate": 1.4151587208656666e-06, + "loss": 0.6719, + "step": 44808 + }, + { + "epoch": 1.15, + "learning_rate": 1.4151335475390728e-06, + "loss": 0.5396, + "step": 44809 + }, + { + "epoch": 1.15, + "learning_rate": 1.4151083738946307e-06, + "loss": 0.6763, + "step": 44810 + }, + { + "epoch": 1.15, + "learning_rate": 1.4150831999323592e-06, + "loss": 0.6016, + "step": 44811 + }, + { + "epoch": 1.15, + "learning_rate": 1.4150580256522773e-06, + "loss": 0.6423, + "step": 44812 + }, + { + "epoch": 1.15, + "learning_rate": 1.4150328510544048e-06, + "loss": 0.519, + "step": 44813 + }, + { + "epoch": 1.15, + "learning_rate": 1.4150076761387606e-06, + "loss": 0.5471, + "step": 44814 + }, + { + "epoch": 1.15, + "learning_rate": 1.414982500905364e-06, + "loss": 0.6836, + "step": 44815 + }, + { + "epoch": 1.15, + "learning_rate": 1.4149573253542344e-06, + "loss": 0.4561, + "step": 44816 + }, + { + "epoch": 1.15, + "learning_rate": 1.4149321494853912e-06, + "loss": 0.6196, + "step": 44817 + }, + { + "epoch": 1.15, + "learning_rate": 1.4149069732988535e-06, + "loss": 0.5215, + "step": 44818 + }, + { + "epoch": 1.15, + "learning_rate": 1.4148817967946404e-06, + "loss": 0.6406, + "step": 44819 + }, + { + "epoch": 1.15, + "learning_rate": 1.4148566199727719e-06, + "loss": 0.6455, + "step": 44820 + }, + { + "epoch": 1.15, + "learning_rate": 1.4148314428332665e-06, + "loss": 0.6038, + "step": 44821 + }, + { + "epoch": 1.15, + "learning_rate": 1.4148062653761434e-06, + "loss": 0.707, + "step": 44822 + }, + { + "epoch": 1.15, + "learning_rate": 1.4147810876014225e-06, + "loss": 0.7695, + "step": 44823 + }, + { + "epoch": 1.15, + "learning_rate": 1.4147559095091227e-06, + "loss": 0.6279, + "step": 44824 + }, + { + "epoch": 1.15, + "learning_rate": 1.4147307310992638e-06, + "loss": 0.8379, + "step": 44825 + }, + { + "epoch": 1.15, + "learning_rate": 1.414705552371864e-06, + "loss": 0.7559, + "step": 44826 + }, + { + "epoch": 1.15, + "learning_rate": 1.4146803733269437e-06, + "loss": 0.5786, + "step": 44827 + }, + { + "epoch": 1.15, + "learning_rate": 1.4146551939645215e-06, + "loss": 0.6577, + "step": 44828 + }, + { + "epoch": 1.15, + "learning_rate": 1.4146300142846168e-06, + "loss": 0.6104, + "step": 44829 + }, + { + "epoch": 1.15, + "learning_rate": 1.4146048342872491e-06, + "loss": 0.6387, + "step": 44830 + }, + { + "epoch": 1.15, + "learning_rate": 1.4145796539724376e-06, + "loss": 0.6475, + "step": 44831 + }, + { + "epoch": 1.15, + "learning_rate": 1.4145544733402016e-06, + "loss": 0.7305, + "step": 44832 + }, + { + "epoch": 1.15, + "learning_rate": 1.41452929239056e-06, + "loss": 0.7246, + "step": 44833 + }, + { + "epoch": 1.15, + "learning_rate": 1.4145041111235325e-06, + "loss": 0.418, + "step": 44834 + }, + { + "epoch": 1.15, + "learning_rate": 1.4144789295391385e-06, + "loss": 0.447, + "step": 44835 + }, + { + "epoch": 1.15, + "learning_rate": 1.4144537476373967e-06, + "loss": 0.6475, + "step": 44836 + }, + { + "epoch": 1.15, + "learning_rate": 1.414428565418327e-06, + "loss": 0.5347, + "step": 44837 + }, + { + "epoch": 1.15, + "learning_rate": 1.4144033828819482e-06, + "loss": 0.6025, + "step": 44838 + }, + { + "epoch": 1.15, + "learning_rate": 1.4143782000282798e-06, + "loss": 0.4529, + "step": 44839 + }, + { + "epoch": 1.15, + "learning_rate": 1.4143530168573411e-06, + "loss": 0.6343, + "step": 44840 + }, + { + "epoch": 1.15, + "learning_rate": 1.4143278333691514e-06, + "loss": 0.6143, + "step": 44841 + }, + { + "epoch": 1.15, + "learning_rate": 1.41430264956373e-06, + "loss": 0.5972, + "step": 44842 + }, + { + "epoch": 1.15, + "learning_rate": 1.4142774654410958e-06, + "loss": 0.5928, + "step": 44843 + }, + { + "epoch": 1.15, + "learning_rate": 1.4142522810012686e-06, + "loss": 0.7119, + "step": 44844 + }, + { + "epoch": 1.15, + "learning_rate": 1.4142270962442676e-06, + "loss": 0.6992, + "step": 44845 + }, + { + "epoch": 1.15, + "learning_rate": 1.4142019111701117e-06, + "loss": 0.8701, + "step": 44846 + }, + { + "epoch": 1.15, + "learning_rate": 1.4141767257788206e-06, + "loss": 0.709, + "step": 44847 + }, + { + "epoch": 1.15, + "learning_rate": 1.4141515400704136e-06, + "loss": 0.4609, + "step": 44848 + }, + { + "epoch": 1.15, + "learning_rate": 1.4141263540449093e-06, + "loss": 0.6179, + "step": 44849 + }, + { + "epoch": 1.15, + "learning_rate": 1.414101167702328e-06, + "loss": 0.6387, + "step": 44850 + }, + { + "epoch": 1.15, + "learning_rate": 1.4140759810426883e-06, + "loss": 0.7266, + "step": 44851 + }, + { + "epoch": 1.15, + "learning_rate": 1.4140507940660097e-06, + "loss": 0.6436, + "step": 44852 + }, + { + "epoch": 1.15, + "learning_rate": 1.4140256067723112e-06, + "loss": 0.6084, + "step": 44853 + }, + { + "epoch": 1.15, + "learning_rate": 1.4140004191616127e-06, + "loss": 0.5122, + "step": 44854 + }, + { + "epoch": 1.15, + "learning_rate": 1.413975231233933e-06, + "loss": 0.7461, + "step": 44855 + }, + { + "epoch": 1.15, + "learning_rate": 1.4139500429892915e-06, + "loss": 0.521, + "step": 44856 + }, + { + "epoch": 1.15, + "learning_rate": 1.4139248544277073e-06, + "loss": 0.6025, + "step": 44857 + }, + { + "epoch": 1.15, + "learning_rate": 1.4138996655492e-06, + "loss": 0.7109, + "step": 44858 + }, + { + "epoch": 1.15, + "learning_rate": 1.4138744763537884e-06, + "loss": 0.5225, + "step": 44859 + }, + { + "epoch": 1.15, + "learning_rate": 1.4138492868414927e-06, + "loss": 0.6436, + "step": 44860 + }, + { + "epoch": 1.15, + "learning_rate": 1.4138240970123315e-06, + "loss": 0.6074, + "step": 44861 + }, + { + "epoch": 1.15, + "learning_rate": 1.4137989068663239e-06, + "loss": 0.5435, + "step": 44862 + }, + { + "epoch": 1.15, + "learning_rate": 1.4137737164034897e-06, + "loss": 0.5798, + "step": 44863 + }, + { + "epoch": 1.15, + "learning_rate": 1.413748525623848e-06, + "loss": 0.6836, + "step": 44864 + }, + { + "epoch": 1.15, + "learning_rate": 1.4137233345274185e-06, + "loss": 0.6445, + "step": 44865 + }, + { + "epoch": 1.15, + "learning_rate": 1.4136981431142195e-06, + "loss": 0.4985, + "step": 44866 + }, + { + "epoch": 1.15, + "learning_rate": 1.413672951384271e-06, + "loss": 0.603, + "step": 44867 + }, + { + "epoch": 1.15, + "learning_rate": 1.4136477593375922e-06, + "loss": 0.5757, + "step": 44868 + }, + { + "epoch": 1.15, + "learning_rate": 1.4136225669742023e-06, + "loss": 0.5835, + "step": 44869 + }, + { + "epoch": 1.15, + "learning_rate": 1.4135973742941207e-06, + "loss": 0.6582, + "step": 44870 + }, + { + "epoch": 1.15, + "learning_rate": 1.4135721812973667e-06, + "loss": 0.7266, + "step": 44871 + }, + { + "epoch": 1.15, + "learning_rate": 1.413546987983959e-06, + "loss": 0.562, + "step": 44872 + }, + { + "epoch": 1.15, + "learning_rate": 1.4135217943539179e-06, + "loss": 0.6924, + "step": 44873 + }, + { + "epoch": 1.15, + "learning_rate": 1.4134966004072618e-06, + "loss": 0.5381, + "step": 44874 + }, + { + "epoch": 1.15, + "learning_rate": 1.4134714061440108e-06, + "loss": 0.6934, + "step": 44875 + }, + { + "epoch": 1.15, + "learning_rate": 1.4134462115641834e-06, + "loss": 0.6934, + "step": 44876 + }, + { + "epoch": 1.15, + "learning_rate": 1.4134210166677994e-06, + "loss": 0.646, + "step": 44877 + }, + { + "epoch": 1.15, + "learning_rate": 1.4133958214548777e-06, + "loss": 0.5903, + "step": 44878 + }, + { + "epoch": 1.15, + "learning_rate": 1.413370625925438e-06, + "loss": 0.6948, + "step": 44879 + }, + { + "epoch": 1.15, + "learning_rate": 1.4133454300794995e-06, + "loss": 0.6272, + "step": 44880 + }, + { + "epoch": 1.15, + "learning_rate": 1.4133202339170814e-06, + "loss": 0.7607, + "step": 44881 + }, + { + "epoch": 1.15, + "learning_rate": 1.413295037438203e-06, + "loss": 0.7949, + "step": 44882 + }, + { + "epoch": 1.15, + "learning_rate": 1.4132698406428836e-06, + "loss": 0.4907, + "step": 44883 + }, + { + "epoch": 1.15, + "learning_rate": 1.4132446435311423e-06, + "loss": 0.7646, + "step": 44884 + }, + { + "epoch": 1.15, + "learning_rate": 1.4132194461029987e-06, + "loss": 0.6804, + "step": 44885 + }, + { + "epoch": 1.15, + "learning_rate": 1.4131942483584721e-06, + "loss": 0.6172, + "step": 44886 + }, + { + "epoch": 1.15, + "learning_rate": 1.4131690502975816e-06, + "loss": 0.6387, + "step": 44887 + }, + { + "epoch": 1.15, + "learning_rate": 1.4131438519203464e-06, + "loss": 0.6758, + "step": 44888 + }, + { + "epoch": 1.15, + "learning_rate": 1.4131186532267857e-06, + "loss": 0.6489, + "step": 44889 + }, + { + "epoch": 1.15, + "learning_rate": 1.4130934542169199e-06, + "loss": 0.5928, + "step": 44890 + }, + { + "epoch": 1.15, + "learning_rate": 1.4130682548907669e-06, + "loss": 0.6812, + "step": 44891 + }, + { + "epoch": 1.15, + "learning_rate": 1.4130430552483465e-06, + "loss": 0.668, + "step": 44892 + }, + { + "epoch": 1.15, + "learning_rate": 1.413017855289678e-06, + "loss": 0.6514, + "step": 44893 + }, + { + "epoch": 1.15, + "learning_rate": 1.4129926550147807e-06, + "loss": 0.5815, + "step": 44894 + }, + { + "epoch": 1.15, + "learning_rate": 1.4129674544236742e-06, + "loss": 0.8105, + "step": 44895 + }, + { + "epoch": 1.15, + "learning_rate": 1.4129422535163772e-06, + "loss": 0.5151, + "step": 44896 + }, + { + "epoch": 1.15, + "learning_rate": 1.4129170522929094e-06, + "loss": 0.5864, + "step": 44897 + }, + { + "epoch": 1.15, + "learning_rate": 1.4128918507532903e-06, + "loss": 0.7764, + "step": 44898 + }, + { + "epoch": 1.15, + "learning_rate": 1.4128666488975385e-06, + "loss": 0.7812, + "step": 44899 + }, + { + "epoch": 1.15, + "learning_rate": 1.412841446725674e-06, + "loss": 0.585, + "step": 44900 + }, + { + "epoch": 1.15, + "learning_rate": 1.4128162442377157e-06, + "loss": 0.6689, + "step": 44901 + }, + { + "epoch": 1.15, + "learning_rate": 1.4127910414336828e-06, + "loss": 0.752, + "step": 44902 + }, + { + "epoch": 1.15, + "learning_rate": 1.4127658383135947e-06, + "loss": 0.7695, + "step": 44903 + }, + { + "epoch": 1.15, + "learning_rate": 1.412740634877471e-06, + "loss": 0.5869, + "step": 44904 + }, + { + "epoch": 1.15, + "learning_rate": 1.4127154311253308e-06, + "loss": 0.8359, + "step": 44905 + }, + { + "epoch": 1.15, + "learning_rate": 1.4126902270571932e-06, + "loss": 0.6348, + "step": 44906 + }, + { + "epoch": 1.15, + "learning_rate": 1.4126650226730776e-06, + "loss": 0.4883, + "step": 44907 + }, + { + "epoch": 1.15, + "learning_rate": 1.4126398179730034e-06, + "loss": 0.6826, + "step": 44908 + }, + { + "epoch": 1.15, + "learning_rate": 1.4126146129569902e-06, + "loss": 0.6758, + "step": 44909 + }, + { + "epoch": 1.15, + "learning_rate": 1.4125894076250568e-06, + "loss": 0.6885, + "step": 44910 + }, + { + "epoch": 1.15, + "learning_rate": 1.4125642019772226e-06, + "loss": 0.7012, + "step": 44911 + }, + { + "epoch": 1.15, + "learning_rate": 1.412538996013507e-06, + "loss": 0.605, + "step": 44912 + }, + { + "epoch": 1.15, + "learning_rate": 1.4125137897339292e-06, + "loss": 0.5356, + "step": 44913 + }, + { + "epoch": 1.15, + "learning_rate": 1.4124885831385085e-06, + "loss": 0.5957, + "step": 44914 + }, + { + "epoch": 1.15, + "learning_rate": 1.4124633762272646e-06, + "loss": 0.5806, + "step": 44915 + }, + { + "epoch": 1.15, + "learning_rate": 1.4124381690002163e-06, + "loss": 0.6846, + "step": 44916 + }, + { + "epoch": 1.15, + "learning_rate": 1.4124129614573827e-06, + "loss": 0.7397, + "step": 44917 + }, + { + "epoch": 1.15, + "learning_rate": 1.4123877535987839e-06, + "loss": 0.6572, + "step": 44918 + }, + { + "epoch": 1.15, + "learning_rate": 1.4123625454244385e-06, + "loss": 0.6577, + "step": 44919 + }, + { + "epoch": 1.15, + "learning_rate": 1.4123373369343662e-06, + "loss": 0.6489, + "step": 44920 + }, + { + "epoch": 1.15, + "learning_rate": 1.4123121281285863e-06, + "loss": 0.6836, + "step": 44921 + }, + { + "epoch": 1.15, + "learning_rate": 1.4122869190071175e-06, + "loss": 0.5425, + "step": 44922 + }, + { + "epoch": 1.15, + "learning_rate": 1.41226170956998e-06, + "loss": 0.728, + "step": 44923 + }, + { + "epoch": 1.15, + "learning_rate": 1.4122364998171924e-06, + "loss": 0.6113, + "step": 44924 + }, + { + "epoch": 1.15, + "learning_rate": 1.4122112897487744e-06, + "loss": 0.5396, + "step": 44925 + }, + { + "epoch": 1.15, + "learning_rate": 1.412186079364745e-06, + "loss": 0.7715, + "step": 44926 + }, + { + "epoch": 1.15, + "learning_rate": 1.412160868665124e-06, + "loss": 0.6055, + "step": 44927 + }, + { + "epoch": 1.15, + "learning_rate": 1.4121356576499301e-06, + "loss": 0.7568, + "step": 44928 + }, + { + "epoch": 1.15, + "learning_rate": 1.4121104463191832e-06, + "loss": 0.7598, + "step": 44929 + }, + { + "epoch": 1.15, + "learning_rate": 1.412085234672902e-06, + "loss": 0.6138, + "step": 44930 + }, + { + "epoch": 1.15, + "learning_rate": 1.412060022711106e-06, + "loss": 0.623, + "step": 44931 + }, + { + "epoch": 1.15, + "learning_rate": 1.4120348104338148e-06, + "loss": 0.7607, + "step": 44932 + }, + { + "epoch": 1.15, + "learning_rate": 1.4120095978410471e-06, + "loss": 0.4796, + "step": 44933 + }, + { + "epoch": 1.15, + "learning_rate": 1.411984384932823e-06, + "loss": 0.5295, + "step": 44934 + }, + { + "epoch": 1.15, + "learning_rate": 1.4119591717091614e-06, + "loss": 0.7773, + "step": 44935 + }, + { + "epoch": 1.15, + "learning_rate": 1.4119339581700818e-06, + "loss": 0.5801, + "step": 44936 + }, + { + "epoch": 1.15, + "learning_rate": 1.4119087443156027e-06, + "loss": 0.5203, + "step": 44937 + }, + { + "epoch": 1.15, + "learning_rate": 1.4118835301457443e-06, + "loss": 0.6309, + "step": 44938 + }, + { + "epoch": 1.15, + "learning_rate": 1.4118583156605257e-06, + "loss": 0.7578, + "step": 44939 + }, + { + "epoch": 1.15, + "learning_rate": 1.4118331008599663e-06, + "loss": 0.7061, + "step": 44940 + }, + { + "epoch": 1.15, + "learning_rate": 1.4118078857440849e-06, + "loss": 0.6953, + "step": 44941 + }, + { + "epoch": 1.15, + "learning_rate": 1.4117826703129012e-06, + "loss": 0.7441, + "step": 44942 + }, + { + "epoch": 1.15, + "learning_rate": 1.4117574545664344e-06, + "loss": 0.6304, + "step": 44943 + }, + { + "epoch": 1.15, + "learning_rate": 1.4117322385047042e-06, + "loss": 0.6494, + "step": 44944 + }, + { + "epoch": 1.15, + "learning_rate": 1.4117070221277292e-06, + "loss": 0.646, + "step": 44945 + }, + { + "epoch": 1.15, + "learning_rate": 1.4116818054355292e-06, + "loss": 0.7266, + "step": 44946 + }, + { + "epoch": 1.15, + "learning_rate": 1.4116565884281233e-06, + "loss": 0.7422, + "step": 44947 + }, + { + "epoch": 1.15, + "learning_rate": 1.411631371105531e-06, + "loss": 0.6694, + "step": 44948 + }, + { + "epoch": 1.15, + "learning_rate": 1.4116061534677711e-06, + "loss": 0.7627, + "step": 44949 + }, + { + "epoch": 1.15, + "learning_rate": 1.4115809355148638e-06, + "loss": 0.5083, + "step": 44950 + }, + { + "epoch": 1.15, + "learning_rate": 1.4115557172468275e-06, + "loss": 0.7646, + "step": 44951 + }, + { + "epoch": 1.15, + "learning_rate": 1.4115304986636823e-06, + "loss": 0.5598, + "step": 44952 + }, + { + "epoch": 1.15, + "learning_rate": 1.4115052797654467e-06, + "loss": 0.647, + "step": 44953 + }, + { + "epoch": 1.15, + "learning_rate": 1.4114800605521408e-06, + "loss": 0.6875, + "step": 44954 + }, + { + "epoch": 1.15, + "learning_rate": 1.4114548410237833e-06, + "loss": 0.6279, + "step": 44955 + }, + { + "epoch": 1.15, + "learning_rate": 1.411429621180394e-06, + "loss": 0.5518, + "step": 44956 + }, + { + "epoch": 1.15, + "learning_rate": 1.4114044010219917e-06, + "loss": 0.8145, + "step": 44957 + }, + { + "epoch": 1.15, + "learning_rate": 1.411379180548596e-06, + "loss": 0.6182, + "step": 44958 + }, + { + "epoch": 1.15, + "learning_rate": 1.4113539597602264e-06, + "loss": 0.5605, + "step": 44959 + }, + { + "epoch": 1.15, + "learning_rate": 1.411328738656902e-06, + "loss": 0.7637, + "step": 44960 + }, + { + "epoch": 1.15, + "learning_rate": 1.4113035172386419e-06, + "loss": 0.6934, + "step": 44961 + }, + { + "epoch": 1.15, + "learning_rate": 1.4112782955054653e-06, + "loss": 0.6816, + "step": 44962 + }, + { + "epoch": 1.15, + "learning_rate": 1.4112530734573924e-06, + "loss": 0.7354, + "step": 44963 + }, + { + "epoch": 1.15, + "learning_rate": 1.4112278510944415e-06, + "loss": 0.6572, + "step": 44964 + }, + { + "epoch": 1.15, + "learning_rate": 1.4112026284166328e-06, + "loss": 0.5806, + "step": 44965 + }, + { + "epoch": 1.15, + "learning_rate": 1.4111774054239847e-06, + "loss": 0.5698, + "step": 44966 + }, + { + "epoch": 1.15, + "learning_rate": 1.4111521821165173e-06, + "loss": 0.5557, + "step": 44967 + }, + { + "epoch": 1.15, + "learning_rate": 1.4111269584942491e-06, + "loss": 0.7109, + "step": 44968 + }, + { + "epoch": 1.15, + "learning_rate": 1.4111017345572006e-06, + "loss": 0.5967, + "step": 44969 + }, + { + "epoch": 1.15, + "learning_rate": 1.41107651030539e-06, + "loss": 0.5447, + "step": 44970 + }, + { + "epoch": 1.15, + "learning_rate": 1.411051285738837e-06, + "loss": 0.7158, + "step": 44971 + }, + { + "epoch": 1.15, + "learning_rate": 1.4110260608575607e-06, + "loss": 0.8164, + "step": 44972 + }, + { + "epoch": 1.15, + "learning_rate": 1.4110008356615813e-06, + "loss": 0.7266, + "step": 44973 + }, + { + "epoch": 1.15, + "learning_rate": 1.4109756101509169e-06, + "loss": 0.6113, + "step": 44974 + }, + { + "epoch": 1.15, + "learning_rate": 1.4109503843255875e-06, + "loss": 0.5991, + "step": 44975 + }, + { + "epoch": 1.15, + "learning_rate": 1.4109251581856123e-06, + "loss": 0.5947, + "step": 44976 + }, + { + "epoch": 1.15, + "learning_rate": 1.4108999317310106e-06, + "loss": 0.8076, + "step": 44977 + }, + { + "epoch": 1.15, + "learning_rate": 1.410874704961802e-06, + "loss": 0.6582, + "step": 44978 + }, + { + "epoch": 1.15, + "learning_rate": 1.4108494778780048e-06, + "loss": 0.665, + "step": 44979 + }, + { + "epoch": 1.15, + "learning_rate": 1.41082425047964e-06, + "loss": 0.5928, + "step": 44980 + }, + { + "epoch": 1.15, + "learning_rate": 1.4107990227667255e-06, + "loss": 0.5574, + "step": 44981 + }, + { + "epoch": 1.15, + "learning_rate": 1.410773794739281e-06, + "loss": 0.6929, + "step": 44982 + }, + { + "epoch": 1.15, + "learning_rate": 1.4107485663973257e-06, + "loss": 0.5396, + "step": 44983 + }, + { + "epoch": 1.15, + "learning_rate": 1.4107233377408796e-06, + "loss": 0.7217, + "step": 44984 + }, + { + "epoch": 1.15, + "learning_rate": 1.4106981087699614e-06, + "loss": 0.6221, + "step": 44985 + }, + { + "epoch": 1.15, + "learning_rate": 1.4106728794845904e-06, + "loss": 0.7617, + "step": 44986 + }, + { + "epoch": 1.15, + "learning_rate": 1.410647649884786e-06, + "loss": 0.7256, + "step": 44987 + }, + { + "epoch": 1.15, + "learning_rate": 1.4106224199705678e-06, + "loss": 0.5981, + "step": 44988 + }, + { + "epoch": 1.15, + "learning_rate": 1.4105971897419547e-06, + "loss": 0.7051, + "step": 44989 + }, + { + "epoch": 1.15, + "learning_rate": 1.4105719591989665e-06, + "loss": 0.6011, + "step": 44990 + }, + { + "epoch": 1.15, + "learning_rate": 1.410546728341622e-06, + "loss": 0.5747, + "step": 44991 + }, + { + "epoch": 1.15, + "learning_rate": 1.4105214971699407e-06, + "loss": 0.6455, + "step": 44992 + }, + { + "epoch": 1.15, + "learning_rate": 1.4104962656839418e-06, + "loss": 0.7563, + "step": 44993 + }, + { + "epoch": 1.15, + "learning_rate": 1.4104710338836452e-06, + "loss": 0.6841, + "step": 44994 + }, + { + "epoch": 1.15, + "learning_rate": 1.4104458017690696e-06, + "loss": 0.7246, + "step": 44995 + }, + { + "epoch": 1.15, + "learning_rate": 1.4104205693402346e-06, + "loss": 0.5278, + "step": 44996 + }, + { + "epoch": 1.15, + "learning_rate": 1.4103953365971592e-06, + "loss": 0.5007, + "step": 44997 + }, + { + "epoch": 1.15, + "learning_rate": 1.4103701035398632e-06, + "loss": 0.6885, + "step": 44998 + }, + { + "epoch": 1.15, + "learning_rate": 1.4103448701683656e-06, + "loss": 0.6797, + "step": 44999 + }, + { + "epoch": 1.15, + "learning_rate": 1.410319636482686e-06, + "loss": 0.6338, + "step": 45000 + }, + { + "epoch": 1.15, + "learning_rate": 1.4102944024828434e-06, + "loss": 0.6562, + "step": 45001 + }, + { + "epoch": 1.15, + "learning_rate": 1.410269168168857e-06, + "loss": 0.5942, + "step": 45002 + }, + { + "epoch": 1.15, + "learning_rate": 1.4102439335407466e-06, + "loss": 0.6252, + "step": 45003 + }, + { + "epoch": 1.15, + "learning_rate": 1.410218698598531e-06, + "loss": 0.7583, + "step": 45004 + }, + { + "epoch": 1.15, + "learning_rate": 1.4101934633422303e-06, + "loss": 0.5679, + "step": 45005 + }, + { + "epoch": 1.15, + "learning_rate": 1.410168227771863e-06, + "loss": 0.6484, + "step": 45006 + }, + { + "epoch": 1.15, + "learning_rate": 1.410142991887449e-06, + "loss": 0.5605, + "step": 45007 + }, + { + "epoch": 1.15, + "learning_rate": 1.4101177556890069e-06, + "loss": 0.6035, + "step": 45008 + }, + { + "epoch": 1.15, + "learning_rate": 1.410092519176557e-06, + "loss": 0.5923, + "step": 45009 + }, + { + "epoch": 1.15, + "learning_rate": 1.4100672823501179e-06, + "loss": 0.7168, + "step": 45010 + }, + { + "epoch": 1.15, + "learning_rate": 1.410042045209709e-06, + "loss": 0.6016, + "step": 45011 + }, + { + "epoch": 1.15, + "learning_rate": 1.4100168077553498e-06, + "loss": 0.4954, + "step": 45012 + }, + { + "epoch": 1.15, + "learning_rate": 1.4099915699870598e-06, + "loss": 0.5942, + "step": 45013 + }, + { + "epoch": 1.15, + "learning_rate": 1.4099663319048578e-06, + "loss": 0.5781, + "step": 45014 + }, + { + "epoch": 1.15, + "learning_rate": 1.4099410935087637e-06, + "loss": 0.6719, + "step": 45015 + }, + { + "epoch": 1.15, + "learning_rate": 1.4099158547987965e-06, + "loss": 0.7363, + "step": 45016 + }, + { + "epoch": 1.15, + "learning_rate": 1.4098906157749756e-06, + "loss": 0.6924, + "step": 45017 + }, + { + "epoch": 1.15, + "learning_rate": 1.4098653764373204e-06, + "loss": 0.6357, + "step": 45018 + }, + { + "epoch": 1.15, + "learning_rate": 1.4098401367858496e-06, + "loss": 0.6235, + "step": 45019 + }, + { + "epoch": 1.15, + "learning_rate": 1.4098148968205836e-06, + "loss": 0.6738, + "step": 45020 + }, + { + "epoch": 1.15, + "learning_rate": 1.409789656541541e-06, + "loss": 0.6016, + "step": 45021 + }, + { + "epoch": 1.15, + "learning_rate": 1.4097644159487415e-06, + "loss": 0.5259, + "step": 45022 + }, + { + "epoch": 1.15, + "learning_rate": 1.4097391750422038e-06, + "loss": 0.4688, + "step": 45023 + }, + { + "epoch": 1.15, + "learning_rate": 1.409713933821948e-06, + "loss": 0.833, + "step": 45024 + }, + { + "epoch": 1.15, + "learning_rate": 1.409688692287993e-06, + "loss": 0.6904, + "step": 45025 + }, + { + "epoch": 1.15, + "learning_rate": 1.4096634504403582e-06, + "loss": 0.6914, + "step": 45026 + }, + { + "epoch": 1.15, + "learning_rate": 1.4096382082790628e-06, + "loss": 0.6416, + "step": 45027 + }, + { + "epoch": 1.15, + "learning_rate": 1.4096129658041262e-06, + "loss": 0.7256, + "step": 45028 + }, + { + "epoch": 1.15, + "learning_rate": 1.4095877230155679e-06, + "loss": 0.6528, + "step": 45029 + }, + { + "epoch": 1.15, + "learning_rate": 1.4095624799134075e-06, + "loss": 0.5918, + "step": 45030 + }, + { + "epoch": 1.15, + "learning_rate": 1.4095372364976634e-06, + "loss": 0.6865, + "step": 45031 + }, + { + "epoch": 1.15, + "learning_rate": 1.4095119927683558e-06, + "loss": 0.4747, + "step": 45032 + }, + { + "epoch": 1.15, + "learning_rate": 1.4094867487255036e-06, + "loss": 0.7725, + "step": 45033 + }, + { + "epoch": 1.15, + "learning_rate": 1.409461504369126e-06, + "loss": 0.4197, + "step": 45034 + }, + { + "epoch": 1.15, + "learning_rate": 1.4094362596992428e-06, + "loss": 0.6289, + "step": 45035 + }, + { + "epoch": 1.15, + "learning_rate": 1.4094110147158732e-06, + "loss": 0.5137, + "step": 45036 + }, + { + "epoch": 1.15, + "learning_rate": 1.409385769419036e-06, + "loss": 0.5521, + "step": 45037 + }, + { + "epoch": 1.15, + "learning_rate": 1.4093605238087514e-06, + "loss": 0.562, + "step": 45038 + }, + { + "epoch": 1.15, + "learning_rate": 1.4093352778850378e-06, + "loss": 0.4897, + "step": 45039 + }, + { + "epoch": 1.15, + "learning_rate": 1.4093100316479155e-06, + "loss": 0.3964, + "step": 45040 + }, + { + "epoch": 1.15, + "learning_rate": 1.409284785097403e-06, + "loss": 0.6313, + "step": 45041 + }, + { + "epoch": 1.15, + "learning_rate": 1.40925953823352e-06, + "loss": 0.7183, + "step": 45042 + }, + { + "epoch": 1.15, + "learning_rate": 1.4092342910562857e-06, + "loss": 0.533, + "step": 45043 + }, + { + "epoch": 1.15, + "learning_rate": 1.4092090435657196e-06, + "loss": 0.6636, + "step": 45044 + }, + { + "epoch": 1.15, + "learning_rate": 1.4091837957618413e-06, + "loss": 0.748, + "step": 45045 + }, + { + "epoch": 1.15, + "learning_rate": 1.4091585476446694e-06, + "loss": 0.7842, + "step": 45046 + }, + { + "epoch": 1.15, + "learning_rate": 1.4091332992142237e-06, + "loss": 0.5273, + "step": 45047 + }, + { + "epoch": 1.15, + "learning_rate": 1.4091080504705236e-06, + "loss": 0.8467, + "step": 45048 + }, + { + "epoch": 1.15, + "learning_rate": 1.409082801413588e-06, + "loss": 0.5986, + "step": 45049 + }, + { + "epoch": 1.15, + "learning_rate": 1.4090575520434366e-06, + "loss": 0.7549, + "step": 45050 + }, + { + "epoch": 1.15, + "learning_rate": 1.4090323023600888e-06, + "loss": 0.7793, + "step": 45051 + }, + { + "epoch": 1.15, + "learning_rate": 1.4090070523635636e-06, + "loss": 0.667, + "step": 45052 + }, + { + "epoch": 1.15, + "learning_rate": 1.4089818020538804e-06, + "loss": 0.71, + "step": 45053 + }, + { + "epoch": 1.15, + "learning_rate": 1.408956551431059e-06, + "loss": 0.6108, + "step": 45054 + }, + { + "epoch": 1.15, + "learning_rate": 1.4089313004951183e-06, + "loss": 0.4354, + "step": 45055 + }, + { + "epoch": 1.15, + "learning_rate": 1.4089060492460775e-06, + "loss": 0.7607, + "step": 45056 + }, + { + "epoch": 1.15, + "learning_rate": 1.4088807976839561e-06, + "loss": 0.54, + "step": 45057 + }, + { + "epoch": 1.15, + "learning_rate": 1.4088555458087735e-06, + "loss": 0.6904, + "step": 45058 + }, + { + "epoch": 1.15, + "learning_rate": 1.408830293620549e-06, + "loss": 0.7412, + "step": 45059 + }, + { + "epoch": 1.15, + "learning_rate": 1.4088050411193022e-06, + "loss": 0.6089, + "step": 45060 + }, + { + "epoch": 1.15, + "learning_rate": 1.4087797883050518e-06, + "loss": 0.5427, + "step": 45061 + }, + { + "epoch": 1.15, + "learning_rate": 1.408754535177818e-06, + "loss": 0.7285, + "step": 45062 + }, + { + "epoch": 1.15, + "learning_rate": 1.4087292817376193e-06, + "loss": 0.751, + "step": 45063 + }, + { + "epoch": 1.16, + "learning_rate": 1.4087040279844755e-06, + "loss": 0.6296, + "step": 45064 + }, + { + "epoch": 1.16, + "learning_rate": 1.4086787739184058e-06, + "loss": 0.7568, + "step": 45065 + }, + { + "epoch": 1.16, + "learning_rate": 1.4086535195394296e-06, + "loss": 0.6543, + "step": 45066 + }, + { + "epoch": 1.16, + "learning_rate": 1.4086282648475657e-06, + "loss": 0.8018, + "step": 45067 + }, + { + "epoch": 1.16, + "learning_rate": 1.4086030098428346e-06, + "loss": 0.7119, + "step": 45068 + }, + { + "epoch": 1.16, + "learning_rate": 1.4085777545252548e-06, + "loss": 0.7744, + "step": 45069 + }, + { + "epoch": 1.16, + "learning_rate": 1.4085524988948456e-06, + "loss": 0.5093, + "step": 45070 + }, + { + "epoch": 1.16, + "learning_rate": 1.4085272429516266e-06, + "loss": 0.6274, + "step": 45071 + }, + { + "epoch": 1.16, + "learning_rate": 1.4085019866956173e-06, + "loss": 0.7041, + "step": 45072 + }, + { + "epoch": 1.16, + "learning_rate": 1.4084767301268366e-06, + "loss": 0.6558, + "step": 45073 + }, + { + "epoch": 1.16, + "learning_rate": 1.4084514732453041e-06, + "loss": 0.7148, + "step": 45074 + }, + { + "epoch": 1.16, + "learning_rate": 1.4084262160510392e-06, + "loss": 0.7314, + "step": 45075 + }, + { + "epoch": 1.16, + "learning_rate": 1.408400958544061e-06, + "loss": 0.5225, + "step": 45076 + }, + { + "epoch": 1.16, + "learning_rate": 1.4083757007243886e-06, + "loss": 0.6602, + "step": 45077 + }, + { + "epoch": 1.16, + "learning_rate": 1.4083504425920423e-06, + "loss": 0.7168, + "step": 45078 + }, + { + "epoch": 1.16, + "learning_rate": 1.4083251841470407e-06, + "loss": 0.6443, + "step": 45079 + }, + { + "epoch": 1.16, + "learning_rate": 1.4082999253894033e-06, + "loss": 0.6348, + "step": 45080 + }, + { + "epoch": 1.16, + "learning_rate": 1.4082746663191492e-06, + "loss": 0.7334, + "step": 45081 + }, + { + "epoch": 1.16, + "learning_rate": 1.408249406936298e-06, + "loss": 0.666, + "step": 45082 + }, + { + "epoch": 1.16, + "learning_rate": 1.408224147240869e-06, + "loss": 0.6304, + "step": 45083 + }, + { + "epoch": 1.16, + "learning_rate": 1.4081988872328816e-06, + "loss": 0.5162, + "step": 45084 + }, + { + "epoch": 1.16, + "learning_rate": 1.4081736269123552e-06, + "loss": 0.6514, + "step": 45085 + }, + { + "epoch": 1.16, + "learning_rate": 1.4081483662793087e-06, + "loss": 0.6206, + "step": 45086 + }, + { + "epoch": 1.16, + "learning_rate": 1.408123105333762e-06, + "loss": 0.623, + "step": 45087 + }, + { + "epoch": 1.16, + "learning_rate": 1.4080978440757342e-06, + "loss": 0.6392, + "step": 45088 + }, + { + "epoch": 1.16, + "learning_rate": 1.4080725825052448e-06, + "loss": 0.6096, + "step": 45089 + }, + { + "epoch": 1.16, + "learning_rate": 1.4080473206223128e-06, + "loss": 0.6729, + "step": 45090 + }, + { + "epoch": 1.16, + "learning_rate": 1.4080220584269578e-06, + "loss": 0.7305, + "step": 45091 + }, + { + "epoch": 1.16, + "learning_rate": 1.407996795919199e-06, + "loss": 0.6318, + "step": 45092 + }, + { + "epoch": 1.16, + "learning_rate": 1.4079715330990557e-06, + "loss": 0.4385, + "step": 45093 + }, + { + "epoch": 1.16, + "learning_rate": 1.4079462699665477e-06, + "loss": 0.5986, + "step": 45094 + }, + { + "epoch": 1.16, + "learning_rate": 1.4079210065216938e-06, + "loss": 0.7402, + "step": 45095 + }, + { + "epoch": 1.16, + "learning_rate": 1.4078957427645132e-06, + "loss": 0.7148, + "step": 45096 + }, + { + "epoch": 1.16, + "learning_rate": 1.4078704786950263e-06, + "loss": 0.5693, + "step": 45097 + }, + { + "epoch": 1.16, + "learning_rate": 1.407845214313251e-06, + "loss": 0.7041, + "step": 45098 + }, + { + "epoch": 1.16, + "learning_rate": 1.4078199496192081e-06, + "loss": 0.7949, + "step": 45099 + }, + { + "epoch": 1.16, + "learning_rate": 1.4077946846129157e-06, + "loss": 0.6934, + "step": 45100 + }, + { + "epoch": 1.16, + "learning_rate": 1.407769419294394e-06, + "loss": 0.8213, + "step": 45101 + }, + { + "epoch": 1.16, + "learning_rate": 1.4077441536636614e-06, + "loss": 0.6963, + "step": 45102 + }, + { + "epoch": 1.16, + "learning_rate": 1.4077188877207385e-06, + "loss": 0.7139, + "step": 45103 + }, + { + "epoch": 1.16, + "learning_rate": 1.4076936214656438e-06, + "loss": 0.5791, + "step": 45104 + }, + { + "epoch": 1.16, + "learning_rate": 1.4076683548983965e-06, + "loss": 0.748, + "step": 45105 + }, + { + "epoch": 1.16, + "learning_rate": 1.4076430880190166e-06, + "loss": 0.5645, + "step": 45106 + }, + { + "epoch": 1.16, + "learning_rate": 1.4076178208275234e-06, + "loss": 0.5383, + "step": 45107 + }, + { + "epoch": 1.16, + "learning_rate": 1.4075925533239355e-06, + "loss": 0.5645, + "step": 45108 + }, + { + "epoch": 1.16, + "learning_rate": 1.407567285508273e-06, + "loss": 0.6084, + "step": 45109 + }, + { + "epoch": 1.16, + "learning_rate": 1.4075420173805549e-06, + "loss": 0.4785, + "step": 45110 + }, + { + "epoch": 1.16, + "learning_rate": 1.4075167489408004e-06, + "loss": 0.7051, + "step": 45111 + }, + { + "epoch": 1.16, + "learning_rate": 1.4074914801890293e-06, + "loss": 0.7529, + "step": 45112 + }, + { + "epoch": 1.16, + "learning_rate": 1.4074662111252607e-06, + "loss": 0.3707, + "step": 45113 + }, + { + "epoch": 1.16, + "learning_rate": 1.407440941749514e-06, + "loss": 0.6689, + "step": 45114 + }, + { + "epoch": 1.16, + "learning_rate": 1.4074156720618082e-06, + "loss": 0.7178, + "step": 45115 + }, + { + "epoch": 1.16, + "learning_rate": 1.4073904020621635e-06, + "loss": 0.6914, + "step": 45116 + }, + { + "epoch": 1.16, + "learning_rate": 1.4073651317505981e-06, + "loss": 0.624, + "step": 45117 + }, + { + "epoch": 1.16, + "learning_rate": 1.4073398611271324e-06, + "loss": 0.5703, + "step": 45118 + }, + { + "epoch": 1.16, + "learning_rate": 1.407314590191785e-06, + "loss": 0.6777, + "step": 45119 + }, + { + "epoch": 1.16, + "learning_rate": 1.4072893189445758e-06, + "loss": 0.7119, + "step": 45120 + }, + { + "epoch": 1.16, + "learning_rate": 1.4072640473855236e-06, + "loss": 0.7861, + "step": 45121 + }, + { + "epoch": 1.16, + "learning_rate": 1.4072387755146483e-06, + "loss": 0.7949, + "step": 45122 + }, + { + "epoch": 1.16, + "learning_rate": 1.407213503331969e-06, + "loss": 0.6846, + "step": 45123 + }, + { + "epoch": 1.16, + "learning_rate": 1.4071882308375052e-06, + "loss": 0.7373, + "step": 45124 + }, + { + "epoch": 1.16, + "learning_rate": 1.4071629580312756e-06, + "loss": 0.7109, + "step": 45125 + }, + { + "epoch": 1.16, + "learning_rate": 1.4071376849133003e-06, + "loss": 0.4751, + "step": 45126 + }, + { + "epoch": 1.16, + "learning_rate": 1.4071124114835983e-06, + "loss": 0.7168, + "step": 45127 + }, + { + "epoch": 1.16, + "learning_rate": 1.4070871377421894e-06, + "loss": 0.6377, + "step": 45128 + }, + { + "epoch": 1.16, + "learning_rate": 1.4070618636890923e-06, + "loss": 0.562, + "step": 45129 + }, + { + "epoch": 1.16, + "learning_rate": 1.4070365893243265e-06, + "loss": 0.7607, + "step": 45130 + }, + { + "epoch": 1.16, + "learning_rate": 1.4070113146479116e-06, + "loss": 0.6611, + "step": 45131 + }, + { + "epoch": 1.16, + "learning_rate": 1.406986039659867e-06, + "loss": 0.4856, + "step": 45132 + }, + { + "epoch": 1.16, + "learning_rate": 1.4069607643602118e-06, + "loss": 0.707, + "step": 45133 + }, + { + "epoch": 1.16, + "learning_rate": 1.4069354887489656e-06, + "loss": 0.5532, + "step": 45134 + }, + { + "epoch": 1.16, + "learning_rate": 1.4069102128261477e-06, + "loss": 0.6504, + "step": 45135 + }, + { + "epoch": 1.16, + "learning_rate": 1.4068849365917768e-06, + "loss": 0.6426, + "step": 45136 + }, + { + "epoch": 1.16, + "learning_rate": 1.4068596600458732e-06, + "loss": 0.5996, + "step": 45137 + }, + { + "epoch": 1.16, + "learning_rate": 1.4068343831884559e-06, + "loss": 0.6348, + "step": 45138 + }, + { + "epoch": 1.16, + "learning_rate": 1.4068091060195445e-06, + "loss": 0.3792, + "step": 45139 + }, + { + "epoch": 1.16, + "learning_rate": 1.4067838285391575e-06, + "loss": 0.7827, + "step": 45140 + }, + { + "epoch": 1.16, + "learning_rate": 1.4067585507473152e-06, + "loss": 0.4424, + "step": 45141 + }, + { + "epoch": 1.16, + "learning_rate": 1.4067332726440362e-06, + "loss": 0.604, + "step": 45142 + }, + { + "epoch": 1.16, + "learning_rate": 1.4067079942293405e-06, + "loss": 0.5859, + "step": 45143 + }, + { + "epoch": 1.16, + "learning_rate": 1.4066827155032472e-06, + "loss": 0.6279, + "step": 45144 + }, + { + "epoch": 1.16, + "learning_rate": 1.4066574364657758e-06, + "loss": 0.7188, + "step": 45145 + }, + { + "epoch": 1.16, + "learning_rate": 1.4066321571169453e-06, + "loss": 0.5034, + "step": 45146 + }, + { + "epoch": 1.16, + "learning_rate": 1.4066068774567753e-06, + "loss": 0.6729, + "step": 45147 + }, + { + "epoch": 1.16, + "learning_rate": 1.4065815974852847e-06, + "loss": 0.563, + "step": 45148 + }, + { + "epoch": 1.16, + "learning_rate": 1.4065563172024939e-06, + "loss": 0.5864, + "step": 45149 + }, + { + "epoch": 1.16, + "learning_rate": 1.4065310366084214e-06, + "loss": 0.7646, + "step": 45150 + }, + { + "epoch": 1.16, + "learning_rate": 1.4065057557030867e-06, + "loss": 0.5017, + "step": 45151 + }, + { + "epoch": 1.16, + "learning_rate": 1.4064804744865094e-06, + "loss": 0.5679, + "step": 45152 + }, + { + "epoch": 1.16, + "learning_rate": 1.4064551929587086e-06, + "loss": 0.7285, + "step": 45153 + }, + { + "epoch": 1.16, + "learning_rate": 1.4064299111197035e-06, + "loss": 0.5767, + "step": 45154 + }, + { + "epoch": 1.16, + "learning_rate": 1.406404628969514e-06, + "loss": 0.4088, + "step": 45155 + }, + { + "epoch": 1.16, + "learning_rate": 1.406379346508159e-06, + "loss": 0.7183, + "step": 45156 + }, + { + "epoch": 1.16, + "learning_rate": 1.406354063735658e-06, + "loss": 0.4924, + "step": 45157 + }, + { + "epoch": 1.16, + "learning_rate": 1.4063287806520305e-06, + "loss": 0.5747, + "step": 45158 + }, + { + "epoch": 1.16, + "learning_rate": 1.4063034972572959e-06, + "loss": 0.7393, + "step": 45159 + }, + { + "epoch": 1.16, + "learning_rate": 1.4062782135514733e-06, + "loss": 0.7305, + "step": 45160 + }, + { + "epoch": 1.16, + "learning_rate": 1.406252929534582e-06, + "loss": 0.7881, + "step": 45161 + }, + { + "epoch": 1.16, + "learning_rate": 1.4062276452066415e-06, + "loss": 0.6602, + "step": 45162 + }, + { + "epoch": 1.16, + "learning_rate": 1.4062023605676712e-06, + "loss": 0.6914, + "step": 45163 + }, + { + "epoch": 1.16, + "learning_rate": 1.4061770756176907e-06, + "loss": 0.668, + "step": 45164 + }, + { + "epoch": 1.16, + "learning_rate": 1.4061517903567186e-06, + "loss": 0.5327, + "step": 45165 + }, + { + "epoch": 1.16, + "learning_rate": 1.4061265047847752e-06, + "loss": 0.8604, + "step": 45166 + }, + { + "epoch": 1.16, + "learning_rate": 1.4061012189018791e-06, + "loss": 0.6328, + "step": 45167 + }, + { + "epoch": 1.16, + "learning_rate": 1.4060759327080502e-06, + "loss": 0.5225, + "step": 45168 + }, + { + "epoch": 1.16, + "learning_rate": 1.4060506462033075e-06, + "loss": 0.7139, + "step": 45169 + }, + { + "epoch": 1.16, + "learning_rate": 1.4060253593876706e-06, + "loss": 0.707, + "step": 45170 + }, + { + "epoch": 1.16, + "learning_rate": 1.4060000722611585e-06, + "loss": 0.3513, + "step": 45171 + }, + { + "epoch": 1.16, + "learning_rate": 1.405974784823791e-06, + "loss": 0.5635, + "step": 45172 + }, + { + "epoch": 1.16, + "learning_rate": 1.4059494970755871e-06, + "loss": 0.6558, + "step": 45173 + }, + { + "epoch": 1.16, + "learning_rate": 1.4059242090165667e-06, + "loss": 0.53, + "step": 45174 + }, + { + "epoch": 1.16, + "learning_rate": 1.4058989206467487e-06, + "loss": 0.7705, + "step": 45175 + }, + { + "epoch": 1.16, + "learning_rate": 1.4058736319661524e-06, + "loss": 0.6323, + "step": 45176 + }, + { + "epoch": 1.16, + "learning_rate": 1.4058483429747973e-06, + "loss": 0.6875, + "step": 45177 + }, + { + "epoch": 1.16, + "learning_rate": 1.4058230536727028e-06, + "loss": 0.6357, + "step": 45178 + }, + { + "epoch": 1.16, + "learning_rate": 1.4057977640598883e-06, + "loss": 0.6191, + "step": 45179 + }, + { + "epoch": 1.16, + "learning_rate": 1.4057724741363732e-06, + "loss": 0.6963, + "step": 45180 + }, + { + "epoch": 1.16, + "learning_rate": 1.4057471839021768e-06, + "loss": 0.7812, + "step": 45181 + }, + { + "epoch": 1.16, + "learning_rate": 1.4057218933573182e-06, + "loss": 0.6533, + "step": 45182 + }, + { + "epoch": 1.16, + "learning_rate": 1.4056966025018172e-06, + "loss": 0.4683, + "step": 45183 + }, + { + "epoch": 1.16, + "learning_rate": 1.4056713113356929e-06, + "loss": 0.6475, + "step": 45184 + }, + { + "epoch": 1.16, + "learning_rate": 1.4056460198589648e-06, + "loss": 0.7354, + "step": 45185 + }, + { + "epoch": 1.16, + "learning_rate": 1.4056207280716522e-06, + "loss": 0.5444, + "step": 45186 + }, + { + "epoch": 1.16, + "learning_rate": 1.4055954359737743e-06, + "loss": 0.6143, + "step": 45187 + }, + { + "epoch": 1.16, + "learning_rate": 1.4055701435653504e-06, + "loss": 0.5815, + "step": 45188 + }, + { + "epoch": 1.16, + "learning_rate": 1.4055448508464006e-06, + "loss": 0.5795, + "step": 45189 + }, + { + "epoch": 1.16, + "learning_rate": 1.4055195578169436e-06, + "loss": 0.5981, + "step": 45190 + }, + { + "epoch": 1.16, + "learning_rate": 1.4054942644769989e-06, + "loss": 0.4917, + "step": 45191 + }, + { + "epoch": 1.16, + "learning_rate": 1.4054689708265856e-06, + "loss": 0.6514, + "step": 45192 + }, + { + "epoch": 1.16, + "learning_rate": 1.4054436768657237e-06, + "loss": 0.5356, + "step": 45193 + }, + { + "epoch": 1.16, + "learning_rate": 1.4054183825944324e-06, + "loss": 0.7822, + "step": 45194 + }, + { + "epoch": 1.16, + "learning_rate": 1.4053930880127305e-06, + "loss": 0.7656, + "step": 45195 + }, + { + "epoch": 1.16, + "learning_rate": 1.405367793120638e-06, + "loss": 0.8301, + "step": 45196 + }, + { + "epoch": 1.16, + "learning_rate": 1.4053424979181738e-06, + "loss": 0.8926, + "step": 45197 + }, + { + "epoch": 1.16, + "learning_rate": 1.4053172024053574e-06, + "loss": 0.6118, + "step": 45198 + }, + { + "epoch": 1.16, + "learning_rate": 1.4052919065822085e-06, + "loss": 0.5137, + "step": 45199 + }, + { + "epoch": 1.16, + "learning_rate": 1.4052666104487463e-06, + "loss": 0.6904, + "step": 45200 + }, + { + "epoch": 1.16, + "learning_rate": 1.4052413140049897e-06, + "loss": 0.6777, + "step": 45201 + }, + { + "epoch": 1.16, + "learning_rate": 1.4052160172509588e-06, + "loss": 0.6699, + "step": 45202 + }, + { + "epoch": 1.16, + "learning_rate": 1.4051907201866724e-06, + "loss": 0.585, + "step": 45203 + }, + { + "epoch": 1.16, + "learning_rate": 1.4051654228121505e-06, + "loss": 0.6409, + "step": 45204 + }, + { + "epoch": 1.16, + "learning_rate": 1.4051401251274118e-06, + "loss": 0.5038, + "step": 45205 + }, + { + "epoch": 1.16, + "learning_rate": 1.405114827132476e-06, + "loss": 0.6602, + "step": 45206 + }, + { + "epoch": 1.16, + "learning_rate": 1.4050895288273621e-06, + "loss": 0.5537, + "step": 45207 + }, + { + "epoch": 1.16, + "learning_rate": 1.40506423021209e-06, + "loss": 0.6465, + "step": 45208 + }, + { + "epoch": 1.16, + "learning_rate": 1.4050389312866791e-06, + "loss": 0.5903, + "step": 45209 + }, + { + "epoch": 1.16, + "learning_rate": 1.4050136320511483e-06, + "loss": 0.8564, + "step": 45210 + }, + { + "epoch": 1.16, + "learning_rate": 1.404988332505517e-06, + "loss": 0.5503, + "step": 45211 + }, + { + "epoch": 1.16, + "learning_rate": 1.404963032649805e-06, + "loss": 0.7163, + "step": 45212 + }, + { + "epoch": 1.16, + "learning_rate": 1.404937732484031e-06, + "loss": 0.623, + "step": 45213 + }, + { + "epoch": 1.16, + "learning_rate": 1.4049124320082152e-06, + "loss": 0.7578, + "step": 45214 + }, + { + "epoch": 1.16, + "learning_rate": 1.4048871312223767e-06, + "loss": 0.4048, + "step": 45215 + }, + { + "epoch": 1.16, + "learning_rate": 1.4048618301265348e-06, + "loss": 0.6484, + "step": 45216 + }, + { + "epoch": 1.16, + "learning_rate": 1.4048365287207082e-06, + "loss": 0.6265, + "step": 45217 + }, + { + "epoch": 1.16, + "learning_rate": 1.4048112270049175e-06, + "loss": 0.7324, + "step": 45218 + }, + { + "epoch": 1.16, + "learning_rate": 1.4047859249791812e-06, + "loss": 0.7363, + "step": 45219 + }, + { + "epoch": 1.16, + "learning_rate": 1.4047606226435186e-06, + "loss": 0.8291, + "step": 45220 + }, + { + "epoch": 1.16, + "learning_rate": 1.4047353199979498e-06, + "loss": 0.6982, + "step": 45221 + }, + { + "epoch": 1.16, + "learning_rate": 1.4047100170424936e-06, + "loss": 0.6196, + "step": 45222 + }, + { + "epoch": 1.16, + "learning_rate": 1.4046847137771699e-06, + "loss": 0.8574, + "step": 45223 + }, + { + "epoch": 1.16, + "learning_rate": 1.4046594102019975e-06, + "loss": 0.6138, + "step": 45224 + }, + { + "epoch": 1.16, + "learning_rate": 1.404634106316996e-06, + "loss": 0.7188, + "step": 45225 + }, + { + "epoch": 1.16, + "learning_rate": 1.4046088021221847e-06, + "loss": 0.3544, + "step": 45226 + }, + { + "epoch": 1.16, + "learning_rate": 1.404583497617583e-06, + "loss": 0.5675, + "step": 45227 + }, + { + "epoch": 1.16, + "learning_rate": 1.4045581928032105e-06, + "loss": 0.5605, + "step": 45228 + }, + { + "epoch": 1.16, + "learning_rate": 1.4045328876790863e-06, + "loss": 0.6763, + "step": 45229 + }, + { + "epoch": 1.16, + "learning_rate": 1.4045075822452298e-06, + "loss": 0.7412, + "step": 45230 + }, + { + "epoch": 1.16, + "learning_rate": 1.4044822765016607e-06, + "loss": 0.3661, + "step": 45231 + }, + { + "epoch": 1.16, + "learning_rate": 1.4044569704483977e-06, + "loss": 0.6484, + "step": 45232 + }, + { + "epoch": 1.16, + "learning_rate": 1.404431664085461e-06, + "loss": 0.606, + "step": 45233 + }, + { + "epoch": 1.16, + "learning_rate": 1.4044063574128692e-06, + "loss": 0.5452, + "step": 45234 + }, + { + "epoch": 1.16, + "learning_rate": 1.4043810504306425e-06, + "loss": 0.6543, + "step": 45235 + }, + { + "epoch": 1.16, + "learning_rate": 1.4043557431387996e-06, + "loss": 0.5464, + "step": 45236 + }, + { + "epoch": 1.16, + "learning_rate": 1.40433043553736e-06, + "loss": 0.5933, + "step": 45237 + }, + { + "epoch": 1.16, + "learning_rate": 1.404305127626343e-06, + "loss": 0.7139, + "step": 45238 + }, + { + "epoch": 1.16, + "learning_rate": 1.4042798194057686e-06, + "loss": 0.582, + "step": 45239 + }, + { + "epoch": 1.16, + "learning_rate": 1.4042545108756557e-06, + "loss": 0.6855, + "step": 45240 + }, + { + "epoch": 1.16, + "learning_rate": 1.4042292020360233e-06, + "loss": 0.8262, + "step": 45241 + }, + { + "epoch": 1.16, + "learning_rate": 1.4042038928868915e-06, + "loss": 0.6797, + "step": 45242 + }, + { + "epoch": 1.16, + "learning_rate": 1.4041785834282793e-06, + "loss": 0.5569, + "step": 45243 + }, + { + "epoch": 1.16, + "learning_rate": 1.4041532736602061e-06, + "loss": 0.7246, + "step": 45244 + }, + { + "epoch": 1.16, + "learning_rate": 1.4041279635826915e-06, + "loss": 0.7295, + "step": 45245 + }, + { + "epoch": 1.16, + "learning_rate": 1.4041026531957544e-06, + "loss": 0.7275, + "step": 45246 + }, + { + "epoch": 1.16, + "learning_rate": 1.4040773424994147e-06, + "loss": 0.5103, + "step": 45247 + }, + { + "epoch": 1.16, + "learning_rate": 1.4040520314936914e-06, + "loss": 0.6621, + "step": 45248 + }, + { + "epoch": 1.16, + "learning_rate": 1.4040267201786043e-06, + "loss": 0.6899, + "step": 45249 + }, + { + "epoch": 1.16, + "learning_rate": 1.4040014085541724e-06, + "loss": 0.6143, + "step": 45250 + }, + { + "epoch": 1.16, + "learning_rate": 1.4039760966204151e-06, + "loss": 0.6914, + "step": 45251 + }, + { + "epoch": 1.16, + "learning_rate": 1.403950784377352e-06, + "loss": 0.5613, + "step": 45252 + }, + { + "epoch": 1.16, + "learning_rate": 1.4039254718250022e-06, + "loss": 0.6074, + "step": 45253 + }, + { + "epoch": 1.16, + "learning_rate": 1.4039001589633854e-06, + "loss": 0.7197, + "step": 45254 + }, + { + "epoch": 1.16, + "learning_rate": 1.4038748457925206e-06, + "loss": 0.7793, + "step": 45255 + }, + { + "epoch": 1.16, + "learning_rate": 1.4038495323124278e-06, + "loss": 0.5576, + "step": 45256 + }, + { + "epoch": 1.16, + "learning_rate": 1.4038242185231254e-06, + "loss": 0.5693, + "step": 45257 + }, + { + "epoch": 1.16, + "learning_rate": 1.403798904424634e-06, + "loss": 0.6357, + "step": 45258 + }, + { + "epoch": 1.16, + "learning_rate": 1.4037735900169721e-06, + "loss": 0.8887, + "step": 45259 + }, + { + "epoch": 1.16, + "learning_rate": 1.4037482753001594e-06, + "loss": 0.6411, + "step": 45260 + }, + { + "epoch": 1.16, + "learning_rate": 1.403722960274215e-06, + "loss": 0.5966, + "step": 45261 + }, + { + "epoch": 1.16, + "learning_rate": 1.4036976449391585e-06, + "loss": 0.6064, + "step": 45262 + }, + { + "epoch": 1.16, + "learning_rate": 1.4036723292950092e-06, + "loss": 0.6787, + "step": 45263 + }, + { + "epoch": 1.16, + "learning_rate": 1.4036470133417869e-06, + "loss": 0.7339, + "step": 45264 + }, + { + "epoch": 1.16, + "learning_rate": 1.4036216970795104e-06, + "loss": 0.6992, + "step": 45265 + }, + { + "epoch": 1.16, + "learning_rate": 1.4035963805081992e-06, + "loss": 0.8965, + "step": 45266 + }, + { + "epoch": 1.16, + "learning_rate": 1.403571063627873e-06, + "loss": 0.4575, + "step": 45267 + }, + { + "epoch": 1.16, + "learning_rate": 1.403545746438551e-06, + "loss": 0.5488, + "step": 45268 + }, + { + "epoch": 1.16, + "learning_rate": 1.4035204289402527e-06, + "loss": 0.5938, + "step": 45269 + }, + { + "epoch": 1.16, + "learning_rate": 1.403495111132997e-06, + "loss": 0.6157, + "step": 45270 + }, + { + "epoch": 1.16, + "learning_rate": 1.403469793016804e-06, + "loss": 0.626, + "step": 45271 + }, + { + "epoch": 1.16, + "learning_rate": 1.4034444745916925e-06, + "loss": 0.792, + "step": 45272 + }, + { + "epoch": 1.16, + "learning_rate": 1.4034191558576822e-06, + "loss": 0.71, + "step": 45273 + }, + { + "epoch": 1.16, + "learning_rate": 1.4033938368147926e-06, + "loss": 0.7251, + "step": 45274 + }, + { + "epoch": 1.16, + "learning_rate": 1.4033685174630427e-06, + "loss": 0.6611, + "step": 45275 + }, + { + "epoch": 1.16, + "learning_rate": 1.4033431978024522e-06, + "loss": 0.5198, + "step": 45276 + }, + { + "epoch": 1.16, + "learning_rate": 1.40331787783304e-06, + "loss": 0.6714, + "step": 45277 + }, + { + "epoch": 1.16, + "learning_rate": 1.403292557554826e-06, + "loss": 0.8408, + "step": 45278 + }, + { + "epoch": 1.16, + "learning_rate": 1.4032672369678297e-06, + "loss": 0.6211, + "step": 45279 + }, + { + "epoch": 1.16, + "learning_rate": 1.4032419160720702e-06, + "loss": 0.6221, + "step": 45280 + }, + { + "epoch": 1.16, + "learning_rate": 1.4032165948675667e-06, + "loss": 0.7305, + "step": 45281 + }, + { + "epoch": 1.16, + "learning_rate": 1.4031912733543388e-06, + "loss": 0.5921, + "step": 45282 + }, + { + "epoch": 1.16, + "learning_rate": 1.403165951532406e-06, + "loss": 0.835, + "step": 45283 + }, + { + "epoch": 1.16, + "learning_rate": 1.4031406294017874e-06, + "loss": 0.4893, + "step": 45284 + }, + { + "epoch": 1.16, + "learning_rate": 1.4031153069625026e-06, + "loss": 0.3792, + "step": 45285 + }, + { + "epoch": 1.16, + "learning_rate": 1.4030899842145709e-06, + "loss": 0.752, + "step": 45286 + }, + { + "epoch": 1.16, + "learning_rate": 1.4030646611580119e-06, + "loss": 0.5669, + "step": 45287 + }, + { + "epoch": 1.16, + "learning_rate": 1.4030393377928447e-06, + "loss": 0.6318, + "step": 45288 + }, + { + "epoch": 1.16, + "learning_rate": 1.403014014119089e-06, + "loss": 0.6602, + "step": 45289 + }, + { + "epoch": 1.16, + "learning_rate": 1.4029886901367638e-06, + "loss": 0.7217, + "step": 45290 + }, + { + "epoch": 1.16, + "learning_rate": 1.4029633658458885e-06, + "loss": 0.4653, + "step": 45291 + }, + { + "epoch": 1.16, + "learning_rate": 1.4029380412464832e-06, + "loss": 0.5088, + "step": 45292 + }, + { + "epoch": 1.16, + "learning_rate": 1.4029127163385664e-06, + "loss": 0.5913, + "step": 45293 + }, + { + "epoch": 1.16, + "learning_rate": 1.402887391122158e-06, + "loss": 0.5613, + "step": 45294 + }, + { + "epoch": 1.16, + "learning_rate": 1.4028620655972771e-06, + "loss": 0.4177, + "step": 45295 + }, + { + "epoch": 1.16, + "learning_rate": 1.4028367397639436e-06, + "loss": 0.6738, + "step": 45296 + }, + { + "epoch": 1.16, + "learning_rate": 1.4028114136221761e-06, + "loss": 0.6406, + "step": 45297 + }, + { + "epoch": 1.16, + "learning_rate": 1.4027860871719945e-06, + "loss": 0.6221, + "step": 45298 + }, + { + "epoch": 1.16, + "learning_rate": 1.4027607604134185e-06, + "loss": 0.7676, + "step": 45299 + }, + { + "epoch": 1.16, + "learning_rate": 1.4027354333464668e-06, + "loss": 0.689, + "step": 45300 + }, + { + "epoch": 1.16, + "learning_rate": 1.4027101059711591e-06, + "loss": 0.5161, + "step": 45301 + }, + { + "epoch": 1.16, + "learning_rate": 1.4026847782875147e-06, + "loss": 0.7314, + "step": 45302 + }, + { + "epoch": 1.16, + "learning_rate": 1.402659450295553e-06, + "loss": 0.6143, + "step": 45303 + }, + { + "epoch": 1.16, + "learning_rate": 1.4026341219952937e-06, + "loss": 0.5442, + "step": 45304 + }, + { + "epoch": 1.16, + "learning_rate": 1.402608793386756e-06, + "loss": 0.6416, + "step": 45305 + }, + { + "epoch": 1.16, + "learning_rate": 1.4025834644699592e-06, + "loss": 0.8262, + "step": 45306 + }, + { + "epoch": 1.16, + "learning_rate": 1.4025581352449227e-06, + "loss": 0.5027, + "step": 45307 + }, + { + "epoch": 1.16, + "learning_rate": 1.402532805711666e-06, + "loss": 0.6865, + "step": 45308 + }, + { + "epoch": 1.16, + "learning_rate": 1.4025074758702084e-06, + "loss": 0.6406, + "step": 45309 + }, + { + "epoch": 1.16, + "learning_rate": 1.4024821457205693e-06, + "loss": 0.5742, + "step": 45310 + }, + { + "epoch": 1.16, + "learning_rate": 1.4024568152627683e-06, + "loss": 0.7705, + "step": 45311 + }, + { + "epoch": 1.16, + "learning_rate": 1.4024314844968244e-06, + "loss": 0.7168, + "step": 45312 + }, + { + "epoch": 1.16, + "learning_rate": 1.4024061534227574e-06, + "loss": 0.5674, + "step": 45313 + }, + { + "epoch": 1.16, + "learning_rate": 1.4023808220405866e-06, + "loss": 0.6196, + "step": 45314 + }, + { + "epoch": 1.16, + "learning_rate": 1.4023554903503311e-06, + "loss": 0.7212, + "step": 45315 + }, + { + "epoch": 1.16, + "learning_rate": 1.4023301583520104e-06, + "loss": 0.6001, + "step": 45316 + }, + { + "epoch": 1.16, + "learning_rate": 1.4023048260456443e-06, + "loss": 0.6875, + "step": 45317 + }, + { + "epoch": 1.16, + "learning_rate": 1.4022794934312513e-06, + "loss": 0.7148, + "step": 45318 + }, + { + "epoch": 1.16, + "learning_rate": 1.4022541605088523e-06, + "loss": 0.6611, + "step": 45319 + }, + { + "epoch": 1.16, + "learning_rate": 1.4022288272784652e-06, + "loss": 0.7041, + "step": 45320 + }, + { + "epoch": 1.16, + "learning_rate": 1.4022034937401102e-06, + "loss": 0.7275, + "step": 45321 + }, + { + "epoch": 1.16, + "learning_rate": 1.4021781598938063e-06, + "loss": 0.7637, + "step": 45322 + }, + { + "epoch": 1.16, + "learning_rate": 1.4021528257395732e-06, + "loss": 0.8198, + "step": 45323 + }, + { + "epoch": 1.16, + "learning_rate": 1.4021274912774302e-06, + "loss": 0.6016, + "step": 45324 + }, + { + "epoch": 1.16, + "learning_rate": 1.4021021565073965e-06, + "loss": 0.667, + "step": 45325 + }, + { + "epoch": 1.16, + "learning_rate": 1.4020768214294916e-06, + "loss": 0.6934, + "step": 45326 + }, + { + "epoch": 1.16, + "learning_rate": 1.4020514860437351e-06, + "loss": 0.5918, + "step": 45327 + }, + { + "epoch": 1.16, + "learning_rate": 1.4020261503501463e-06, + "loss": 0.6895, + "step": 45328 + }, + { + "epoch": 1.16, + "learning_rate": 1.4020008143487445e-06, + "loss": 0.6387, + "step": 45329 + }, + { + "epoch": 1.16, + "learning_rate": 1.4019754780395493e-06, + "loss": 0.4182, + "step": 45330 + }, + { + "epoch": 1.16, + "learning_rate": 1.4019501414225798e-06, + "loss": 0.7314, + "step": 45331 + }, + { + "epoch": 1.16, + "learning_rate": 1.4019248044978557e-06, + "loss": 0.6846, + "step": 45332 + }, + { + "epoch": 1.16, + "learning_rate": 1.4018994672653963e-06, + "loss": 0.6763, + "step": 45333 + }, + { + "epoch": 1.16, + "learning_rate": 1.4018741297252209e-06, + "loss": 0.7021, + "step": 45334 + }, + { + "epoch": 1.16, + "learning_rate": 1.4018487918773488e-06, + "loss": 0.5869, + "step": 45335 + }, + { + "epoch": 1.16, + "learning_rate": 1.4018234537217997e-06, + "loss": 0.7432, + "step": 45336 + }, + { + "epoch": 1.16, + "learning_rate": 1.4017981152585927e-06, + "loss": 0.749, + "step": 45337 + }, + { + "epoch": 1.16, + "learning_rate": 1.4017727764877474e-06, + "loss": 0.6782, + "step": 45338 + }, + { + "epoch": 1.16, + "learning_rate": 1.4017474374092832e-06, + "loss": 0.626, + "step": 45339 + }, + { + "epoch": 1.16, + "learning_rate": 1.4017220980232197e-06, + "loss": 0.5068, + "step": 45340 + }, + { + "epoch": 1.16, + "learning_rate": 1.4016967583295758e-06, + "loss": 0.5497, + "step": 45341 + }, + { + "epoch": 1.16, + "learning_rate": 1.4016714183283713e-06, + "loss": 0.5142, + "step": 45342 + }, + { + "epoch": 1.16, + "learning_rate": 1.401646078019625e-06, + "loss": 0.5654, + "step": 45343 + }, + { + "epoch": 1.16, + "learning_rate": 1.4016207374033575e-06, + "loss": 0.8232, + "step": 45344 + }, + { + "epoch": 1.16, + "learning_rate": 1.401595396479587e-06, + "loss": 0.707, + "step": 45345 + }, + { + "epoch": 1.16, + "learning_rate": 1.4015700552483335e-06, + "loss": 0.564, + "step": 45346 + }, + { + "epoch": 1.16, + "learning_rate": 1.4015447137096162e-06, + "loss": 0.6514, + "step": 45347 + }, + { + "epoch": 1.16, + "learning_rate": 1.401519371863455e-06, + "loss": 0.4707, + "step": 45348 + }, + { + "epoch": 1.16, + "learning_rate": 1.4014940297098683e-06, + "loss": 0.5083, + "step": 45349 + }, + { + "epoch": 1.16, + "learning_rate": 1.4014686872488763e-06, + "loss": 0.6079, + "step": 45350 + }, + { + "epoch": 1.16, + "learning_rate": 1.4014433444804982e-06, + "loss": 0.668, + "step": 45351 + }, + { + "epoch": 1.16, + "learning_rate": 1.4014180014047534e-06, + "loss": 0.6008, + "step": 45352 + }, + { + "epoch": 1.16, + "learning_rate": 1.4013926580216613e-06, + "loss": 0.5908, + "step": 45353 + }, + { + "epoch": 1.16, + "learning_rate": 1.4013673143312412e-06, + "loss": 0.6289, + "step": 45354 + }, + { + "epoch": 1.16, + "learning_rate": 1.4013419703335127e-06, + "loss": 0.6348, + "step": 45355 + }, + { + "epoch": 1.16, + "learning_rate": 1.401316626028495e-06, + "loss": 0.8374, + "step": 45356 + }, + { + "epoch": 1.16, + "learning_rate": 1.4012912814162077e-06, + "loss": 0.6042, + "step": 45357 + }, + { + "epoch": 1.16, + "learning_rate": 1.4012659364966702e-06, + "loss": 0.6001, + "step": 45358 + }, + { + "epoch": 1.16, + "learning_rate": 1.4012405912699017e-06, + "loss": 0.5889, + "step": 45359 + }, + { + "epoch": 1.16, + "learning_rate": 1.4012152457359217e-06, + "loss": 0.6768, + "step": 45360 + }, + { + "epoch": 1.16, + "learning_rate": 1.4011898998947498e-06, + "loss": 0.7119, + "step": 45361 + }, + { + "epoch": 1.16, + "learning_rate": 1.4011645537464049e-06, + "loss": 0.5259, + "step": 45362 + }, + { + "epoch": 1.16, + "learning_rate": 1.4011392072909072e-06, + "loss": 0.5181, + "step": 45363 + }, + { + "epoch": 1.16, + "learning_rate": 1.4011138605282753e-06, + "loss": 0.8818, + "step": 45364 + }, + { + "epoch": 1.16, + "learning_rate": 1.4010885134585294e-06, + "loss": 0.6318, + "step": 45365 + }, + { + "epoch": 1.16, + "learning_rate": 1.4010631660816879e-06, + "loss": 0.7715, + "step": 45366 + }, + { + "epoch": 1.16, + "learning_rate": 1.401037818397771e-06, + "loss": 0.5645, + "step": 45367 + }, + { + "epoch": 1.16, + "learning_rate": 1.401012470406798e-06, + "loss": 0.4395, + "step": 45368 + }, + { + "epoch": 1.16, + "learning_rate": 1.4009871221087881e-06, + "loss": 0.6846, + "step": 45369 + }, + { + "epoch": 1.16, + "learning_rate": 1.400961773503761e-06, + "loss": 0.6816, + "step": 45370 + }, + { + "epoch": 1.16, + "learning_rate": 1.4009364245917357e-06, + "loss": 0.5776, + "step": 45371 + }, + { + "epoch": 1.16, + "learning_rate": 1.4009110753727316e-06, + "loss": 0.5942, + "step": 45372 + }, + { + "epoch": 1.16, + "learning_rate": 1.4008857258467685e-06, + "loss": 0.5654, + "step": 45373 + }, + { + "epoch": 1.16, + "learning_rate": 1.400860376013866e-06, + "loss": 0.6538, + "step": 45374 + }, + { + "epoch": 1.16, + "learning_rate": 1.4008350258740426e-06, + "loss": 0.8242, + "step": 45375 + }, + { + "epoch": 1.16, + "learning_rate": 1.4008096754273186e-06, + "loss": 0.728, + "step": 45376 + }, + { + "epoch": 1.16, + "learning_rate": 1.4007843246737127e-06, + "loss": 0.5078, + "step": 45377 + }, + { + "epoch": 1.16, + "learning_rate": 1.4007589736132452e-06, + "loss": 0.6055, + "step": 45378 + }, + { + "epoch": 1.16, + "learning_rate": 1.4007336222459345e-06, + "loss": 0.7529, + "step": 45379 + }, + { + "epoch": 1.16, + "learning_rate": 1.4007082705718007e-06, + "loss": 0.6602, + "step": 45380 + }, + { + "epoch": 1.16, + "learning_rate": 1.4006829185908631e-06, + "loss": 0.7295, + "step": 45381 + }, + { + "epoch": 1.16, + "learning_rate": 1.4006575663031408e-06, + "loss": 0.8618, + "step": 45382 + }, + { + "epoch": 1.16, + "learning_rate": 1.4006322137086536e-06, + "loss": 0.7139, + "step": 45383 + }, + { + "epoch": 1.16, + "learning_rate": 1.400606860807421e-06, + "loss": 0.8281, + "step": 45384 + }, + { + "epoch": 1.16, + "learning_rate": 1.4005815075994614e-06, + "loss": 0.5752, + "step": 45385 + }, + { + "epoch": 1.16, + "learning_rate": 1.4005561540847954e-06, + "loss": 0.6621, + "step": 45386 + }, + { + "epoch": 1.16, + "learning_rate": 1.400530800263442e-06, + "loss": 0.6533, + "step": 45387 + }, + { + "epoch": 1.16, + "learning_rate": 1.4005054461354207e-06, + "loss": 0.6982, + "step": 45388 + }, + { + "epoch": 1.16, + "learning_rate": 1.4004800917007504e-06, + "loss": 0.7339, + "step": 45389 + }, + { + "epoch": 1.16, + "learning_rate": 1.4004547369594513e-06, + "loss": 0.5654, + "step": 45390 + }, + { + "epoch": 1.16, + "learning_rate": 1.400429381911542e-06, + "loss": 0.5038, + "step": 45391 + }, + { + "epoch": 1.16, + "learning_rate": 1.4004040265570427e-06, + "loss": 0.75, + "step": 45392 + }, + { + "epoch": 1.16, + "learning_rate": 1.4003786708959725e-06, + "loss": 0.5137, + "step": 45393 + }, + { + "epoch": 1.16, + "learning_rate": 1.4003533149283505e-06, + "loss": 0.6592, + "step": 45394 + }, + { + "epoch": 1.16, + "learning_rate": 1.4003279586541963e-06, + "loss": 0.5684, + "step": 45395 + }, + { + "epoch": 1.16, + "learning_rate": 1.4003026020735297e-06, + "loss": 0.7148, + "step": 45396 + }, + { + "epoch": 1.16, + "learning_rate": 1.4002772451863696e-06, + "loss": 0.604, + "step": 45397 + }, + { + "epoch": 1.16, + "learning_rate": 1.4002518879927356e-06, + "loss": 0.7568, + "step": 45398 + }, + { + "epoch": 1.16, + "learning_rate": 1.4002265304926475e-06, + "loss": 0.835, + "step": 45399 + }, + { + "epoch": 1.16, + "learning_rate": 1.4002011726861238e-06, + "loss": 0.6655, + "step": 45400 + }, + { + "epoch": 1.16, + "learning_rate": 1.4001758145731848e-06, + "loss": 0.7051, + "step": 45401 + }, + { + "epoch": 1.16, + "learning_rate": 1.4001504561538494e-06, + "loss": 0.5015, + "step": 45402 + }, + { + "epoch": 1.16, + "learning_rate": 1.4001250974281375e-06, + "loss": 0.8047, + "step": 45403 + }, + { + "epoch": 1.16, + "learning_rate": 1.400099738396068e-06, + "loss": 0.833, + "step": 45404 + }, + { + "epoch": 1.16, + "learning_rate": 1.4000743790576606e-06, + "loss": 0.5393, + "step": 45405 + }, + { + "epoch": 1.16, + "learning_rate": 1.4000490194129345e-06, + "loss": 0.4946, + "step": 45406 + }, + { + "epoch": 1.16, + "learning_rate": 1.4000236594619092e-06, + "loss": 0.7363, + "step": 45407 + }, + { + "epoch": 1.16, + "learning_rate": 1.3999982992046044e-06, + "loss": 0.7266, + "step": 45408 + }, + { + "epoch": 1.16, + "learning_rate": 1.3999729386410394e-06, + "loss": 0.5439, + "step": 45409 + }, + { + "epoch": 1.16, + "learning_rate": 1.399947577771233e-06, + "loss": 0.7627, + "step": 45410 + }, + { + "epoch": 1.16, + "learning_rate": 1.3999222165952059e-06, + "loss": 0.7783, + "step": 45411 + }, + { + "epoch": 1.16, + "learning_rate": 1.399896855112976e-06, + "loss": 0.6367, + "step": 45412 + }, + { + "epoch": 1.16, + "learning_rate": 1.399871493324564e-06, + "loss": 0.6191, + "step": 45413 + }, + { + "epoch": 1.16, + "learning_rate": 1.3998461312299884e-06, + "loss": 0.7041, + "step": 45414 + }, + { + "epoch": 1.16, + "learning_rate": 1.399820768829269e-06, + "loss": 0.9307, + "step": 45415 + }, + { + "epoch": 1.16, + "learning_rate": 1.3997954061224255e-06, + "loss": 0.6865, + "step": 45416 + }, + { + "epoch": 1.16, + "learning_rate": 1.399770043109477e-06, + "loss": 0.5117, + "step": 45417 + }, + { + "epoch": 1.16, + "learning_rate": 1.3997446797904428e-06, + "loss": 0.7393, + "step": 45418 + }, + { + "epoch": 1.16, + "learning_rate": 1.3997193161653424e-06, + "loss": 0.749, + "step": 45419 + }, + { + "epoch": 1.16, + "learning_rate": 1.3996939522341957e-06, + "loss": 0.7324, + "step": 45420 + }, + { + "epoch": 1.16, + "learning_rate": 1.3996685879970213e-06, + "loss": 0.7715, + "step": 45421 + }, + { + "epoch": 1.16, + "learning_rate": 1.3996432234538393e-06, + "loss": 0.8594, + "step": 45422 + }, + { + "epoch": 1.16, + "learning_rate": 1.3996178586046688e-06, + "loss": 0.6787, + "step": 45423 + }, + { + "epoch": 1.16, + "learning_rate": 1.3995924934495294e-06, + "loss": 0.7744, + "step": 45424 + }, + { + "epoch": 1.16, + "learning_rate": 1.39956712798844e-06, + "loss": 0.6172, + "step": 45425 + }, + { + "epoch": 1.16, + "learning_rate": 1.3995417622214207e-06, + "loss": 0.667, + "step": 45426 + }, + { + "epoch": 1.16, + "learning_rate": 1.3995163961484907e-06, + "loss": 0.6514, + "step": 45427 + }, + { + "epoch": 1.16, + "learning_rate": 1.3994910297696697e-06, + "loss": 0.75, + "step": 45428 + }, + { + "epoch": 1.16, + "learning_rate": 1.399465663084976e-06, + "loss": 0.6206, + "step": 45429 + }, + { + "epoch": 1.16, + "learning_rate": 1.3994402960944304e-06, + "loss": 0.4434, + "step": 45430 + }, + { + "epoch": 1.16, + "learning_rate": 1.3994149287980512e-06, + "loss": 0.7627, + "step": 45431 + }, + { + "epoch": 1.16, + "learning_rate": 1.3993895611958588e-06, + "loss": 0.4473, + "step": 45432 + }, + { + "epoch": 1.16, + "learning_rate": 1.3993641932878721e-06, + "loss": 0.6416, + "step": 45433 + }, + { + "epoch": 1.16, + "learning_rate": 1.3993388250741107e-06, + "loss": 0.6035, + "step": 45434 + }, + { + "epoch": 1.16, + "learning_rate": 1.3993134565545938e-06, + "loss": 0.7129, + "step": 45435 + }, + { + "epoch": 1.16, + "learning_rate": 1.3992880877293407e-06, + "loss": 0.686, + "step": 45436 + }, + { + "epoch": 1.16, + "learning_rate": 1.3992627185983711e-06, + "loss": 0.2832, + "step": 45437 + }, + { + "epoch": 1.16, + "learning_rate": 1.3992373491617047e-06, + "loss": 0.5327, + "step": 45438 + }, + { + "epoch": 1.16, + "learning_rate": 1.3992119794193607e-06, + "loss": 0.7656, + "step": 45439 + }, + { + "epoch": 1.16, + "learning_rate": 1.3991866093713582e-06, + "loss": 0.5737, + "step": 45440 + }, + { + "epoch": 1.16, + "learning_rate": 1.399161239017717e-06, + "loss": 0.5122, + "step": 45441 + }, + { + "epoch": 1.16, + "learning_rate": 1.3991358683584563e-06, + "loss": 0.6401, + "step": 45442 + }, + { + "epoch": 1.16, + "learning_rate": 1.3991104973935956e-06, + "loss": 0.6602, + "step": 45443 + }, + { + "epoch": 1.16, + "learning_rate": 1.3990851261231545e-06, + "loss": 0.6736, + "step": 45444 + }, + { + "epoch": 1.16, + "learning_rate": 1.3990597545471521e-06, + "loss": 0.6362, + "step": 45445 + }, + { + "epoch": 1.16, + "learning_rate": 1.3990343826656079e-06, + "loss": 0.7412, + "step": 45446 + }, + { + "epoch": 1.16, + "learning_rate": 1.3990090104785416e-06, + "loss": 0.6104, + "step": 45447 + }, + { + "epoch": 1.16, + "learning_rate": 1.3989836379859723e-06, + "loss": 0.6582, + "step": 45448 + }, + { + "epoch": 1.16, + "learning_rate": 1.39895826518792e-06, + "loss": 0.5195, + "step": 45449 + }, + { + "epoch": 1.16, + "learning_rate": 1.398932892084403e-06, + "loss": 0.835, + "step": 45450 + }, + { + "epoch": 1.16, + "learning_rate": 1.398907518675442e-06, + "loss": 0.7568, + "step": 45451 + }, + { + "epoch": 1.16, + "learning_rate": 1.3988821449610555e-06, + "loss": 0.6665, + "step": 45452 + }, + { + "epoch": 1.16, + "learning_rate": 1.3988567709412638e-06, + "loss": 0.6704, + "step": 45453 + }, + { + "epoch": 1.17, + "learning_rate": 1.3988313966160852e-06, + "loss": 0.5801, + "step": 45454 + }, + { + "epoch": 1.17, + "learning_rate": 1.3988060219855402e-06, + "loss": 0.6377, + "step": 45455 + }, + { + "epoch": 1.17, + "learning_rate": 1.3987806470496474e-06, + "loss": 0.5771, + "step": 45456 + }, + { + "epoch": 1.17, + "learning_rate": 1.3987552718084268e-06, + "loss": 0.3979, + "step": 45457 + }, + { + "epoch": 1.17, + "learning_rate": 1.3987298962618976e-06, + "loss": 0.4705, + "step": 45458 + }, + { + "epoch": 1.17, + "learning_rate": 1.3987045204100793e-06, + "loss": 0.7441, + "step": 45459 + }, + { + "epoch": 1.17, + "learning_rate": 1.3986791442529914e-06, + "loss": 0.4351, + "step": 45460 + }, + { + "epoch": 1.17, + "learning_rate": 1.398653767790653e-06, + "loss": 0.5762, + "step": 45461 + }, + { + "epoch": 1.17, + "learning_rate": 1.3986283910230836e-06, + "loss": 0.5601, + "step": 45462 + }, + { + "epoch": 1.17, + "learning_rate": 1.3986030139503028e-06, + "loss": 0.7373, + "step": 45463 + }, + { + "epoch": 1.17, + "learning_rate": 1.3985776365723302e-06, + "loss": 0.6396, + "step": 45464 + }, + { + "epoch": 1.17, + "learning_rate": 1.398552258889185e-06, + "loss": 0.5781, + "step": 45465 + }, + { + "epoch": 1.17, + "learning_rate": 1.3985268809008866e-06, + "loss": 0.6587, + "step": 45466 + }, + { + "epoch": 1.17, + "learning_rate": 1.3985015026074545e-06, + "loss": 0.6934, + "step": 45467 + }, + { + "epoch": 1.17, + "learning_rate": 1.3984761240089085e-06, + "loss": 0.7412, + "step": 45468 + }, + { + "epoch": 1.17, + "learning_rate": 1.398450745105267e-06, + "loss": 0.749, + "step": 45469 + }, + { + "epoch": 1.17, + "learning_rate": 1.3984253658965503e-06, + "loss": 0.8057, + "step": 45470 + }, + { + "epoch": 1.17, + "learning_rate": 1.3983999863827778e-06, + "loss": 0.749, + "step": 45471 + }, + { + "epoch": 1.17, + "learning_rate": 1.3983746065639688e-06, + "loss": 0.6812, + "step": 45472 + }, + { + "epoch": 1.17, + "learning_rate": 1.3983492264401423e-06, + "loss": 0.5708, + "step": 45473 + }, + { + "epoch": 1.17, + "learning_rate": 1.3983238460113186e-06, + "loss": 0.6489, + "step": 45474 + }, + { + "epoch": 1.17, + "learning_rate": 1.3982984652775162e-06, + "loss": 0.5903, + "step": 45475 + }, + { + "epoch": 1.17, + "learning_rate": 1.3982730842387553e-06, + "loss": 0.5493, + "step": 45476 + }, + { + "epoch": 1.17, + "learning_rate": 1.3982477028950547e-06, + "loss": 0.5894, + "step": 45477 + }, + { + "epoch": 1.17, + "learning_rate": 1.3982223212464345e-06, + "loss": 0.5923, + "step": 45478 + }, + { + "epoch": 1.17, + "learning_rate": 1.3981969392929135e-06, + "loss": 0.6973, + "step": 45479 + }, + { + "epoch": 1.17, + "learning_rate": 1.3981715570345118e-06, + "loss": 0.7852, + "step": 45480 + }, + { + "epoch": 1.17, + "learning_rate": 1.3981461744712478e-06, + "loss": 0.7383, + "step": 45481 + }, + { + "epoch": 1.17, + "learning_rate": 1.398120791603142e-06, + "loss": 0.5811, + "step": 45482 + }, + { + "epoch": 1.17, + "learning_rate": 1.3980954084302136e-06, + "loss": 0.6396, + "step": 45483 + }, + { + "epoch": 1.17, + "learning_rate": 1.3980700249524815e-06, + "loss": 0.5488, + "step": 45484 + }, + { + "epoch": 1.17, + "learning_rate": 1.3980446411699655e-06, + "loss": 0.6699, + "step": 45485 + }, + { + "epoch": 1.17, + "learning_rate": 1.3980192570826853e-06, + "loss": 0.5737, + "step": 45486 + }, + { + "epoch": 1.17, + "learning_rate": 1.3979938726906597e-06, + "loss": 0.707, + "step": 45487 + }, + { + "epoch": 1.17, + "learning_rate": 1.3979684879939088e-06, + "loss": 0.6162, + "step": 45488 + }, + { + "epoch": 1.17, + "learning_rate": 1.3979431029924518e-06, + "loss": 0.7041, + "step": 45489 + }, + { + "epoch": 1.17, + "learning_rate": 1.3979177176863078e-06, + "loss": 0.6104, + "step": 45490 + }, + { + "epoch": 1.17, + "learning_rate": 1.3978923320754966e-06, + "loss": 0.7061, + "step": 45491 + }, + { + "epoch": 1.17, + "learning_rate": 1.3978669461600373e-06, + "loss": 0.7134, + "step": 45492 + }, + { + "epoch": 1.17, + "learning_rate": 1.39784155993995e-06, + "loss": 0.7969, + "step": 45493 + }, + { + "epoch": 1.17, + "learning_rate": 1.3978161734152533e-06, + "loss": 0.5679, + "step": 45494 + }, + { + "epoch": 1.17, + "learning_rate": 1.3977907865859675e-06, + "loss": 0.5698, + "step": 45495 + }, + { + "epoch": 1.17, + "learning_rate": 1.397765399452111e-06, + "loss": 0.7842, + "step": 45496 + }, + { + "epoch": 1.17, + "learning_rate": 1.3977400120137044e-06, + "loss": 0.647, + "step": 45497 + }, + { + "epoch": 1.17, + "learning_rate": 1.3977146242707662e-06, + "loss": 0.7314, + "step": 45498 + }, + { + "epoch": 1.17, + "learning_rate": 1.3976892362233163e-06, + "loss": 0.5522, + "step": 45499 + }, + { + "epoch": 1.17, + "learning_rate": 1.397663847871374e-06, + "loss": 0.7236, + "step": 45500 + }, + { + "epoch": 1.17, + "learning_rate": 1.397638459214959e-06, + "loss": 0.7393, + "step": 45501 + }, + { + "epoch": 1.17, + "learning_rate": 1.3976130702540903e-06, + "loss": 0.623, + "step": 45502 + }, + { + "epoch": 1.17, + "learning_rate": 1.3975876809887877e-06, + "loss": 0.5688, + "step": 45503 + }, + { + "epoch": 1.17, + "learning_rate": 1.3975622914190703e-06, + "loss": 0.7334, + "step": 45504 + }, + { + "epoch": 1.17, + "learning_rate": 1.3975369015449578e-06, + "loss": 0.5999, + "step": 45505 + }, + { + "epoch": 1.17, + "learning_rate": 1.3975115113664695e-06, + "loss": 0.6343, + "step": 45506 + }, + { + "epoch": 1.17, + "learning_rate": 1.397486120883625e-06, + "loss": 0.6025, + "step": 45507 + }, + { + "epoch": 1.17, + "learning_rate": 1.3974607300964438e-06, + "loss": 0.6685, + "step": 45508 + }, + { + "epoch": 1.17, + "learning_rate": 1.397435339004945e-06, + "loss": 0.541, + "step": 45509 + }, + { + "epoch": 1.17, + "learning_rate": 1.3974099476091483e-06, + "loss": 0.5566, + "step": 45510 + }, + { + "epoch": 1.17, + "learning_rate": 1.397384555909073e-06, + "loss": 0.6494, + "step": 45511 + }, + { + "epoch": 1.17, + "learning_rate": 1.3973591639047387e-06, + "loss": 0.4639, + "step": 45512 + }, + { + "epoch": 1.17, + "learning_rate": 1.3973337715961648e-06, + "loss": 0.7168, + "step": 45513 + }, + { + "epoch": 1.17, + "learning_rate": 1.3973083789833706e-06, + "loss": 0.6831, + "step": 45514 + }, + { + "epoch": 1.17, + "learning_rate": 1.3972829860663757e-06, + "loss": 0.707, + "step": 45515 + }, + { + "epoch": 1.17, + "learning_rate": 1.3972575928451996e-06, + "loss": 0.7188, + "step": 45516 + }, + { + "epoch": 1.17, + "learning_rate": 1.3972321993198612e-06, + "loss": 0.7285, + "step": 45517 + }, + { + "epoch": 1.17, + "learning_rate": 1.3972068054903812e-06, + "loss": 0.7876, + "step": 45518 + }, + { + "epoch": 1.17, + "learning_rate": 1.3971814113567772e-06, + "loss": 0.5796, + "step": 45519 + }, + { + "epoch": 1.17, + "learning_rate": 1.3971560169190704e-06, + "loss": 0.6526, + "step": 45520 + }, + { + "epoch": 1.17, + "learning_rate": 1.3971306221772792e-06, + "loss": 0.6499, + "step": 45521 + }, + { + "epoch": 1.17, + "learning_rate": 1.3971052271314235e-06, + "loss": 0.6519, + "step": 45522 + }, + { + "epoch": 1.17, + "learning_rate": 1.3970798317815225e-06, + "loss": 0.5947, + "step": 45523 + }, + { + "epoch": 1.17, + "learning_rate": 1.3970544361275956e-06, + "loss": 0.5757, + "step": 45524 + }, + { + "epoch": 1.17, + "learning_rate": 1.3970290401696624e-06, + "loss": 0.5381, + "step": 45525 + }, + { + "epoch": 1.17, + "learning_rate": 1.3970036439077425e-06, + "loss": 0.6729, + "step": 45526 + }, + { + "epoch": 1.17, + "learning_rate": 1.396978247341855e-06, + "loss": 0.7334, + "step": 45527 + }, + { + "epoch": 1.17, + "learning_rate": 1.3969528504720197e-06, + "loss": 0.7197, + "step": 45528 + }, + { + "epoch": 1.17, + "learning_rate": 1.3969274532982556e-06, + "loss": 0.5708, + "step": 45529 + }, + { + "epoch": 1.17, + "learning_rate": 1.3969020558205827e-06, + "loss": 0.5249, + "step": 45530 + }, + { + "epoch": 1.17, + "learning_rate": 1.3968766580390198e-06, + "loss": 0.6172, + "step": 45531 + }, + { + "epoch": 1.17, + "learning_rate": 1.396851259953587e-06, + "loss": 0.6758, + "step": 45532 + }, + { + "epoch": 1.17, + "learning_rate": 1.3968258615643031e-06, + "loss": 0.6865, + "step": 45533 + }, + { + "epoch": 1.17, + "learning_rate": 1.3968004628711883e-06, + "loss": 0.582, + "step": 45534 + }, + { + "epoch": 1.17, + "learning_rate": 1.3967750638742612e-06, + "loss": 0.594, + "step": 45535 + }, + { + "epoch": 1.17, + "learning_rate": 1.396749664573542e-06, + "loss": 0.6875, + "step": 45536 + }, + { + "epoch": 1.17, + "learning_rate": 1.3967242649690496e-06, + "loss": 0.5432, + "step": 45537 + }, + { + "epoch": 1.17, + "learning_rate": 1.396698865060804e-06, + "loss": 0.5913, + "step": 45538 + }, + { + "epoch": 1.17, + "learning_rate": 1.396673464848824e-06, + "loss": 0.6382, + "step": 45539 + }, + { + "epoch": 1.17, + "learning_rate": 1.3966480643331296e-06, + "loss": 0.4805, + "step": 45540 + }, + { + "epoch": 1.17, + "learning_rate": 1.3966226635137397e-06, + "loss": 0.7119, + "step": 45541 + }, + { + "epoch": 1.17, + "learning_rate": 1.3965972623906744e-06, + "loss": 0.4362, + "step": 45542 + }, + { + "epoch": 1.17, + "learning_rate": 1.3965718609639528e-06, + "loss": 0.7529, + "step": 45543 + }, + { + "epoch": 1.17, + "learning_rate": 1.396546459233594e-06, + "loss": 0.7773, + "step": 45544 + }, + { + "epoch": 1.17, + "learning_rate": 1.3965210571996183e-06, + "loss": 0.6218, + "step": 45545 + }, + { + "epoch": 1.17, + "learning_rate": 1.396495654862044e-06, + "loss": 0.6855, + "step": 45546 + }, + { + "epoch": 1.17, + "learning_rate": 1.3964702522208918e-06, + "loss": 0.6858, + "step": 45547 + }, + { + "epoch": 1.17, + "learning_rate": 1.3964448492761804e-06, + "loss": 0.4717, + "step": 45548 + }, + { + "epoch": 1.17, + "learning_rate": 1.3964194460279295e-06, + "loss": 0.5479, + "step": 45549 + }, + { + "epoch": 1.17, + "learning_rate": 1.3963940424761582e-06, + "loss": 0.6626, + "step": 45550 + }, + { + "epoch": 1.17, + "learning_rate": 1.3963686386208864e-06, + "loss": 0.6016, + "step": 45551 + }, + { + "epoch": 1.17, + "learning_rate": 1.3963432344621331e-06, + "loss": 0.5146, + "step": 45552 + }, + { + "epoch": 1.17, + "learning_rate": 1.3963178299999182e-06, + "loss": 0.5493, + "step": 45553 + }, + { + "epoch": 1.17, + "learning_rate": 1.3962924252342612e-06, + "loss": 0.6099, + "step": 45554 + }, + { + "epoch": 1.17, + "learning_rate": 1.396267020165181e-06, + "loss": 0.6226, + "step": 45555 + }, + { + "epoch": 1.17, + "learning_rate": 1.3962416147926975e-06, + "loss": 0.7207, + "step": 45556 + }, + { + "epoch": 1.17, + "learning_rate": 1.3962162091168299e-06, + "loss": 0.5981, + "step": 45557 + }, + { + "epoch": 1.17, + "learning_rate": 1.396190803137598e-06, + "loss": 0.6287, + "step": 45558 + }, + { + "epoch": 1.17, + "learning_rate": 1.3961653968550206e-06, + "loss": 0.6816, + "step": 45559 + }, + { + "epoch": 1.17, + "learning_rate": 1.396139990269118e-06, + "loss": 0.6379, + "step": 45560 + }, + { + "epoch": 1.17, + "learning_rate": 1.396114583379909e-06, + "loss": 0.7109, + "step": 45561 + }, + { + "epoch": 1.17, + "learning_rate": 1.3960891761874134e-06, + "loss": 0.6367, + "step": 45562 + }, + { + "epoch": 1.17, + "learning_rate": 1.3960637686916506e-06, + "loss": 0.5977, + "step": 45563 + }, + { + "epoch": 1.17, + "learning_rate": 1.3960383608926398e-06, + "loss": 0.6758, + "step": 45564 + }, + { + "epoch": 1.17, + "learning_rate": 1.3960129527904006e-06, + "loss": 0.5906, + "step": 45565 + }, + { + "epoch": 1.17, + "learning_rate": 1.3959875443849525e-06, + "loss": 0.6167, + "step": 45566 + }, + { + "epoch": 1.17, + "learning_rate": 1.395962135676315e-06, + "loss": 0.5981, + "step": 45567 + }, + { + "epoch": 1.17, + "learning_rate": 1.3959367266645076e-06, + "loss": 0.6675, + "step": 45568 + }, + { + "epoch": 1.17, + "learning_rate": 1.3959113173495497e-06, + "loss": 0.8135, + "step": 45569 + }, + { + "epoch": 1.17, + "learning_rate": 1.3958859077314605e-06, + "loss": 0.6934, + "step": 45570 + }, + { + "epoch": 1.17, + "learning_rate": 1.3958604978102594e-06, + "loss": 0.6353, + "step": 45571 + }, + { + "epoch": 1.17, + "learning_rate": 1.3958350875859668e-06, + "loss": 0.6323, + "step": 45572 + }, + { + "epoch": 1.17, + "learning_rate": 1.395809677058601e-06, + "loss": 0.7031, + "step": 45573 + }, + { + "epoch": 1.17, + "learning_rate": 1.395784266228182e-06, + "loss": 0.4314, + "step": 45574 + }, + { + "epoch": 1.17, + "learning_rate": 1.3957588550947292e-06, + "loss": 0.3771, + "step": 45575 + }, + { + "epoch": 1.17, + "learning_rate": 1.3957334436582625e-06, + "loss": 0.6445, + "step": 45576 + }, + { + "epoch": 1.17, + "learning_rate": 1.3957080319188002e-06, + "loss": 0.5264, + "step": 45577 + }, + { + "epoch": 1.17, + "learning_rate": 1.3956826198763627e-06, + "loss": 0.6797, + "step": 45578 + }, + { + "epoch": 1.17, + "learning_rate": 1.3956572075309693e-06, + "loss": 0.6162, + "step": 45579 + }, + { + "epoch": 1.17, + "learning_rate": 1.3956317948826392e-06, + "loss": 0.6904, + "step": 45580 + }, + { + "epoch": 1.17, + "learning_rate": 1.3956063819313921e-06, + "loss": 0.582, + "step": 45581 + }, + { + "epoch": 1.17, + "learning_rate": 1.3955809686772475e-06, + "loss": 0.6836, + "step": 45582 + }, + { + "epoch": 1.17, + "learning_rate": 1.395555555120225e-06, + "loss": 0.7188, + "step": 45583 + }, + { + "epoch": 1.17, + "learning_rate": 1.3955301412603434e-06, + "loss": 0.6211, + "step": 45584 + }, + { + "epoch": 1.17, + "learning_rate": 1.3955047270976226e-06, + "loss": 0.5752, + "step": 45585 + }, + { + "epoch": 1.17, + "learning_rate": 1.3954793126320818e-06, + "loss": 0.728, + "step": 45586 + }, + { + "epoch": 1.17, + "learning_rate": 1.3954538978637409e-06, + "loss": 0.627, + "step": 45587 + }, + { + "epoch": 1.17, + "learning_rate": 1.3954284827926195e-06, + "loss": 0.5918, + "step": 45588 + }, + { + "epoch": 1.17, + "learning_rate": 1.3954030674187363e-06, + "loss": 0.6104, + "step": 45589 + }, + { + "epoch": 1.17, + "learning_rate": 1.395377651742111e-06, + "loss": 0.6631, + "step": 45590 + }, + { + "epoch": 1.17, + "learning_rate": 1.3953522357627636e-06, + "loss": 0.6123, + "step": 45591 + }, + { + "epoch": 1.17, + "learning_rate": 1.3953268194807128e-06, + "loss": 0.5737, + "step": 45592 + }, + { + "epoch": 1.17, + "learning_rate": 1.395301402895979e-06, + "loss": 0.79, + "step": 45593 + }, + { + "epoch": 1.17, + "learning_rate": 1.3952759860085804e-06, + "loss": 0.6846, + "step": 45594 + }, + { + "epoch": 1.17, + "learning_rate": 1.3952505688185375e-06, + "loss": 0.7246, + "step": 45595 + }, + { + "epoch": 1.17, + "learning_rate": 1.3952251513258693e-06, + "loss": 0.6768, + "step": 45596 + }, + { + "epoch": 1.17, + "learning_rate": 1.3951997335305956e-06, + "loss": 0.6357, + "step": 45597 + }, + { + "epoch": 1.17, + "learning_rate": 1.3951743154327355e-06, + "loss": 0.3943, + "step": 45598 + }, + { + "epoch": 1.17, + "learning_rate": 1.3951488970323084e-06, + "loss": 0.752, + "step": 45599 + }, + { + "epoch": 1.17, + "learning_rate": 1.3951234783293343e-06, + "loss": 0.5776, + "step": 45600 + }, + { + "epoch": 1.17, + "learning_rate": 1.395098059323832e-06, + "loss": 0.6084, + "step": 45601 + }, + { + "epoch": 1.17, + "learning_rate": 1.3950726400158216e-06, + "loss": 0.5137, + "step": 45602 + }, + { + "epoch": 1.17, + "learning_rate": 1.3950472204053222e-06, + "loss": 0.5991, + "step": 45603 + }, + { + "epoch": 1.17, + "learning_rate": 1.395021800492353e-06, + "loss": 0.5083, + "step": 45604 + }, + { + "epoch": 1.17, + "learning_rate": 1.394996380276934e-06, + "loss": 0.7578, + "step": 45605 + }, + { + "epoch": 1.17, + "learning_rate": 1.3949709597590844e-06, + "loss": 0.481, + "step": 45606 + }, + { + "epoch": 1.17, + "learning_rate": 1.3949455389388236e-06, + "loss": 0.585, + "step": 45607 + }, + { + "epoch": 1.17, + "learning_rate": 1.3949201178161715e-06, + "loss": 0.6475, + "step": 45608 + }, + { + "epoch": 1.17, + "learning_rate": 1.394894696391147e-06, + "loss": 0.6406, + "step": 45609 + }, + { + "epoch": 1.17, + "learning_rate": 1.3948692746637699e-06, + "loss": 0.7236, + "step": 45610 + }, + { + "epoch": 1.17, + "learning_rate": 1.3948438526340592e-06, + "loss": 0.6816, + "step": 45611 + }, + { + "epoch": 1.17, + "learning_rate": 1.394818430302035e-06, + "loss": 0.7441, + "step": 45612 + }, + { + "epoch": 1.17, + "learning_rate": 1.3947930076677166e-06, + "loss": 0.5759, + "step": 45613 + }, + { + "epoch": 1.17, + "learning_rate": 1.3947675847311232e-06, + "loss": 0.4761, + "step": 45614 + }, + { + "epoch": 1.17, + "learning_rate": 1.394742161492274e-06, + "loss": 0.7148, + "step": 45615 + }, + { + "epoch": 1.17, + "learning_rate": 1.3947167379511894e-06, + "loss": 0.7959, + "step": 45616 + }, + { + "epoch": 1.17, + "learning_rate": 1.3946913141078883e-06, + "loss": 0.6812, + "step": 45617 + }, + { + "epoch": 1.17, + "learning_rate": 1.39466588996239e-06, + "loss": 0.373, + "step": 45618 + }, + { + "epoch": 1.17, + "learning_rate": 1.3946404655147143e-06, + "loss": 0.6699, + "step": 45619 + }, + { + "epoch": 1.17, + "learning_rate": 1.3946150407648806e-06, + "loss": 0.5039, + "step": 45620 + }, + { + "epoch": 1.17, + "learning_rate": 1.3945896157129083e-06, + "loss": 0.7812, + "step": 45621 + }, + { + "epoch": 1.17, + "learning_rate": 1.3945641903588168e-06, + "loss": 0.6165, + "step": 45622 + }, + { + "epoch": 1.17, + "learning_rate": 1.3945387647026259e-06, + "loss": 0.5657, + "step": 45623 + }, + { + "epoch": 1.17, + "learning_rate": 1.3945133387443542e-06, + "loss": 0.5245, + "step": 45624 + }, + { + "epoch": 1.17, + "learning_rate": 1.3944879124840223e-06, + "loss": 0.6968, + "step": 45625 + }, + { + "epoch": 1.17, + "learning_rate": 1.3944624859216488e-06, + "loss": 0.7178, + "step": 45626 + }, + { + "epoch": 1.17, + "learning_rate": 1.394437059057254e-06, + "loss": 0.4956, + "step": 45627 + }, + { + "epoch": 1.17, + "learning_rate": 1.3944116318908566e-06, + "loss": 0.585, + "step": 45628 + }, + { + "epoch": 1.17, + "learning_rate": 1.3943862044224764e-06, + "loss": 0.5464, + "step": 45629 + }, + { + "epoch": 1.17, + "learning_rate": 1.3943607766521325e-06, + "loss": 0.6084, + "step": 45630 + }, + { + "epoch": 1.17, + "learning_rate": 1.3943353485798451e-06, + "loss": 0.6545, + "step": 45631 + }, + { + "epoch": 1.17, + "learning_rate": 1.3943099202056328e-06, + "loss": 0.5825, + "step": 45632 + }, + { + "epoch": 1.17, + "learning_rate": 1.3942844915295162e-06, + "loss": 0.606, + "step": 45633 + }, + { + "epoch": 1.17, + "learning_rate": 1.3942590625515136e-06, + "loss": 0.6572, + "step": 45634 + }, + { + "epoch": 1.17, + "learning_rate": 1.3942336332716452e-06, + "loss": 0.6289, + "step": 45635 + }, + { + "epoch": 1.17, + "learning_rate": 1.3942082036899299e-06, + "loss": 0.6157, + "step": 45636 + }, + { + "epoch": 1.17, + "learning_rate": 1.3941827738063879e-06, + "loss": 0.6675, + "step": 45637 + }, + { + "epoch": 1.17, + "learning_rate": 1.394157343621038e-06, + "loss": 0.5254, + "step": 45638 + }, + { + "epoch": 1.17, + "learning_rate": 1.3941319131339002e-06, + "loss": 0.7812, + "step": 45639 + }, + { + "epoch": 1.17, + "learning_rate": 1.3941064823449933e-06, + "loss": 0.5996, + "step": 45640 + }, + { + "epoch": 1.17, + "learning_rate": 1.3940810512543374e-06, + "loss": 0.5757, + "step": 45641 + }, + { + "epoch": 1.17, + "learning_rate": 1.3940556198619517e-06, + "loss": 0.5713, + "step": 45642 + }, + { + "epoch": 1.17, + "learning_rate": 1.394030188167856e-06, + "loss": 0.748, + "step": 45643 + }, + { + "epoch": 1.17, + "learning_rate": 1.3940047561720695e-06, + "loss": 0.5156, + "step": 45644 + }, + { + "epoch": 1.17, + "learning_rate": 1.3939793238746115e-06, + "loss": 0.7461, + "step": 45645 + }, + { + "epoch": 1.17, + "learning_rate": 1.3939538912755015e-06, + "loss": 0.7061, + "step": 45646 + }, + { + "epoch": 1.17, + "learning_rate": 1.3939284583747594e-06, + "loss": 0.5596, + "step": 45647 + }, + { + "epoch": 1.17, + "learning_rate": 1.3939030251724044e-06, + "loss": 0.4932, + "step": 45648 + }, + { + "epoch": 1.17, + "learning_rate": 1.3938775916684556e-06, + "loss": 0.5269, + "step": 45649 + }, + { + "epoch": 1.17, + "learning_rate": 1.3938521578629331e-06, + "loss": 0.5435, + "step": 45650 + }, + { + "epoch": 1.17, + "learning_rate": 1.393826723755856e-06, + "loss": 0.6289, + "step": 45651 + }, + { + "epoch": 1.17, + "learning_rate": 1.3938012893472441e-06, + "loss": 0.6455, + "step": 45652 + }, + { + "epoch": 1.17, + "learning_rate": 1.3937758546371166e-06, + "loss": 0.4929, + "step": 45653 + }, + { + "epoch": 1.17, + "learning_rate": 1.393750419625493e-06, + "loss": 0.7153, + "step": 45654 + }, + { + "epoch": 1.17, + "learning_rate": 1.3937249843123926e-06, + "loss": 0.5046, + "step": 45655 + }, + { + "epoch": 1.17, + "learning_rate": 1.3936995486978354e-06, + "loss": 0.6387, + "step": 45656 + }, + { + "epoch": 1.17, + "learning_rate": 1.3936741127818406e-06, + "loss": 0.6172, + "step": 45657 + }, + { + "epoch": 1.17, + "learning_rate": 1.3936486765644272e-06, + "loss": 0.6021, + "step": 45658 + }, + { + "epoch": 1.17, + "learning_rate": 1.3936232400456154e-06, + "loss": 0.6704, + "step": 45659 + }, + { + "epoch": 1.17, + "learning_rate": 1.3935978032254245e-06, + "loss": 0.7036, + "step": 45660 + }, + { + "epoch": 1.17, + "learning_rate": 1.3935723661038734e-06, + "loss": 0.8088, + "step": 45661 + }, + { + "epoch": 1.17, + "learning_rate": 1.3935469286809824e-06, + "loss": 0.6973, + "step": 45662 + }, + { + "epoch": 1.17, + "learning_rate": 1.3935214909567708e-06, + "loss": 0.5098, + "step": 45663 + }, + { + "epoch": 1.17, + "learning_rate": 1.3934960529312574e-06, + "loss": 0.751, + "step": 45664 + }, + { + "epoch": 1.17, + "learning_rate": 1.3934706146044626e-06, + "loss": 0.6465, + "step": 45665 + }, + { + "epoch": 1.17, + "learning_rate": 1.3934451759764053e-06, + "loss": 0.627, + "step": 45666 + }, + { + "epoch": 1.17, + "learning_rate": 1.393419737047105e-06, + "loss": 0.6021, + "step": 45667 + }, + { + "epoch": 1.17, + "learning_rate": 1.3933942978165813e-06, + "loss": 0.3449, + "step": 45668 + }, + { + "epoch": 1.17, + "learning_rate": 1.3933688582848538e-06, + "loss": 0.7666, + "step": 45669 + }, + { + "epoch": 1.17, + "learning_rate": 1.3933434184519416e-06, + "loss": 0.5762, + "step": 45670 + }, + { + "epoch": 1.17, + "learning_rate": 1.3933179783178648e-06, + "loss": 0.6899, + "step": 45671 + }, + { + "epoch": 1.17, + "learning_rate": 1.3932925378826424e-06, + "loss": 0.4536, + "step": 45672 + }, + { + "epoch": 1.17, + "learning_rate": 1.3932670971462939e-06, + "loss": 0.7441, + "step": 45673 + }, + { + "epoch": 1.17, + "learning_rate": 1.3932416561088388e-06, + "loss": 0.6201, + "step": 45674 + }, + { + "epoch": 1.17, + "learning_rate": 1.3932162147702969e-06, + "loss": 0.6538, + "step": 45675 + }, + { + "epoch": 1.17, + "learning_rate": 1.3931907731306872e-06, + "loss": 0.458, + "step": 45676 + }, + { + "epoch": 1.17, + "learning_rate": 1.3931653311900295e-06, + "loss": 0.7207, + "step": 45677 + }, + { + "epoch": 1.17, + "learning_rate": 1.393139888948343e-06, + "loss": 0.5552, + "step": 45678 + }, + { + "epoch": 1.17, + "learning_rate": 1.3931144464056476e-06, + "loss": 0.4907, + "step": 45679 + }, + { + "epoch": 1.17, + "learning_rate": 1.3930890035619624e-06, + "loss": 0.6094, + "step": 45680 + }, + { + "epoch": 1.17, + "learning_rate": 1.393063560417307e-06, + "loss": 0.6934, + "step": 45681 + }, + { + "epoch": 1.17, + "learning_rate": 1.3930381169717012e-06, + "loss": 0.5713, + "step": 45682 + }, + { + "epoch": 1.17, + "learning_rate": 1.3930126732251642e-06, + "loss": 0.7246, + "step": 45683 + }, + { + "epoch": 1.17, + "learning_rate": 1.392987229177715e-06, + "loss": 0.592, + "step": 45684 + }, + { + "epoch": 1.17, + "learning_rate": 1.3929617848293737e-06, + "loss": 0.707, + "step": 45685 + }, + { + "epoch": 1.17, + "learning_rate": 1.3929363401801596e-06, + "loss": 0.7827, + "step": 45686 + }, + { + "epoch": 1.17, + "learning_rate": 1.3929108952300925e-06, + "loss": 0.6016, + "step": 45687 + }, + { + "epoch": 1.17, + "learning_rate": 1.3928854499791916e-06, + "loss": 0.7642, + "step": 45688 + }, + { + "epoch": 1.17, + "learning_rate": 1.392860004427476e-06, + "loss": 0.541, + "step": 45689 + }, + { + "epoch": 1.17, + "learning_rate": 1.392834558574966e-06, + "loss": 0.7266, + "step": 45690 + }, + { + "epoch": 1.17, + "learning_rate": 1.3928091124216802e-06, + "loss": 0.6479, + "step": 45691 + }, + { + "epoch": 1.17, + "learning_rate": 1.3927836659676388e-06, + "loss": 0.6299, + "step": 45692 + }, + { + "epoch": 1.17, + "learning_rate": 1.3927582192128608e-06, + "loss": 0.6001, + "step": 45693 + }, + { + "epoch": 1.17, + "learning_rate": 1.3927327721573661e-06, + "loss": 0.8467, + "step": 45694 + }, + { + "epoch": 1.17, + "learning_rate": 1.3927073248011739e-06, + "loss": 0.624, + "step": 45695 + }, + { + "epoch": 1.17, + "learning_rate": 1.392681877144304e-06, + "loss": 0.6758, + "step": 45696 + }, + { + "epoch": 1.17, + "learning_rate": 1.3926564291867753e-06, + "loss": 0.5371, + "step": 45697 + }, + { + "epoch": 1.17, + "learning_rate": 1.3926309809286077e-06, + "loss": 0.8203, + "step": 45698 + }, + { + "epoch": 1.17, + "learning_rate": 1.3926055323698205e-06, + "loss": 0.6484, + "step": 45699 + }, + { + "epoch": 1.17, + "learning_rate": 1.3925800835104336e-06, + "loss": 0.5555, + "step": 45700 + }, + { + "epoch": 1.17, + "learning_rate": 1.392554634350466e-06, + "loss": 0.5771, + "step": 45701 + }, + { + "epoch": 1.17, + "learning_rate": 1.3925291848899375e-06, + "loss": 0.6494, + "step": 45702 + }, + { + "epoch": 1.17, + "learning_rate": 1.392503735128867e-06, + "loss": 0.5718, + "step": 45703 + }, + { + "epoch": 1.17, + "learning_rate": 1.392478285067275e-06, + "loss": 0.7744, + "step": 45704 + }, + { + "epoch": 1.17, + "learning_rate": 1.3924528347051801e-06, + "loss": 0.6592, + "step": 45705 + }, + { + "epoch": 1.17, + "learning_rate": 1.3924273840426022e-06, + "loss": 0.6567, + "step": 45706 + }, + { + "epoch": 1.17, + "learning_rate": 1.3924019330795609e-06, + "loss": 0.7129, + "step": 45707 + }, + { + "epoch": 1.17, + "learning_rate": 1.392376481816075e-06, + "loss": 0.748, + "step": 45708 + }, + { + "epoch": 1.17, + "learning_rate": 1.392351030252165e-06, + "loss": 0.6035, + "step": 45709 + }, + { + "epoch": 1.17, + "learning_rate": 1.3923255783878496e-06, + "loss": 0.7773, + "step": 45710 + }, + { + "epoch": 1.17, + "learning_rate": 1.3923001262231483e-06, + "loss": 0.6738, + "step": 45711 + }, + { + "epoch": 1.17, + "learning_rate": 1.3922746737580813e-06, + "loss": 0.6875, + "step": 45712 + }, + { + "epoch": 1.17, + "learning_rate": 1.3922492209926676e-06, + "loss": 0.7275, + "step": 45713 + }, + { + "epoch": 1.17, + "learning_rate": 1.3922237679269263e-06, + "loss": 0.749, + "step": 45714 + }, + { + "epoch": 1.17, + "learning_rate": 1.3921983145608775e-06, + "loss": 0.5508, + "step": 45715 + }, + { + "epoch": 1.17, + "learning_rate": 1.3921728608945405e-06, + "loss": 0.6582, + "step": 45716 + }, + { + "epoch": 1.17, + "learning_rate": 1.392147406927935e-06, + "loss": 0.7988, + "step": 45717 + }, + { + "epoch": 1.17, + "learning_rate": 1.39212195266108e-06, + "loss": 0.6836, + "step": 45718 + }, + { + "epoch": 1.17, + "learning_rate": 1.3920964980939952e-06, + "loss": 0.6792, + "step": 45719 + }, + { + "epoch": 1.17, + "learning_rate": 1.3920710432267e-06, + "loss": 0.7344, + "step": 45720 + }, + { + "epoch": 1.17, + "learning_rate": 1.3920455880592143e-06, + "loss": 0.752, + "step": 45721 + }, + { + "epoch": 1.17, + "learning_rate": 1.3920201325915576e-06, + "loss": 0.8096, + "step": 45722 + }, + { + "epoch": 1.17, + "learning_rate": 1.3919946768237488e-06, + "loss": 0.7588, + "step": 45723 + }, + { + "epoch": 1.17, + "learning_rate": 1.3919692207558074e-06, + "loss": 0.3494, + "step": 45724 + }, + { + "epoch": 1.17, + "learning_rate": 1.3919437643877536e-06, + "loss": 0.6479, + "step": 45725 + }, + { + "epoch": 1.17, + "learning_rate": 1.3919183077196061e-06, + "loss": 0.3804, + "step": 45726 + }, + { + "epoch": 1.17, + "learning_rate": 1.3918928507513852e-06, + "loss": 0.7812, + "step": 45727 + }, + { + "epoch": 1.17, + "learning_rate": 1.39186739348311e-06, + "loss": 0.5781, + "step": 45728 + }, + { + "epoch": 1.17, + "learning_rate": 1.3918419359147997e-06, + "loss": 0.7666, + "step": 45729 + }, + { + "epoch": 1.17, + "learning_rate": 1.3918164780464737e-06, + "loss": 0.4678, + "step": 45730 + }, + { + "epoch": 1.17, + "learning_rate": 1.3917910198781526e-06, + "loss": 0.4873, + "step": 45731 + }, + { + "epoch": 1.17, + "learning_rate": 1.391765561409855e-06, + "loss": 0.7617, + "step": 45732 + }, + { + "epoch": 1.17, + "learning_rate": 1.3917401026416e-06, + "loss": 0.6826, + "step": 45733 + }, + { + "epoch": 1.17, + "learning_rate": 1.3917146435734079e-06, + "loss": 0.6924, + "step": 45734 + }, + { + "epoch": 1.17, + "learning_rate": 1.3916891842052978e-06, + "loss": 0.5142, + "step": 45735 + }, + { + "epoch": 1.17, + "learning_rate": 1.3916637245372896e-06, + "loss": 0.7129, + "step": 45736 + }, + { + "epoch": 1.17, + "learning_rate": 1.3916382645694023e-06, + "loss": 0.6797, + "step": 45737 + }, + { + "epoch": 1.17, + "learning_rate": 1.3916128043016558e-06, + "loss": 0.363, + "step": 45738 + }, + { + "epoch": 1.17, + "learning_rate": 1.391587343734069e-06, + "loss": 0.6475, + "step": 45739 + }, + { + "epoch": 1.17, + "learning_rate": 1.391561882866662e-06, + "loss": 0.5591, + "step": 45740 + }, + { + "epoch": 1.17, + "learning_rate": 1.3915364216994538e-06, + "loss": 0.5767, + "step": 45741 + }, + { + "epoch": 1.17, + "learning_rate": 1.3915109602324647e-06, + "loss": 0.6431, + "step": 45742 + }, + { + "epoch": 1.17, + "learning_rate": 1.3914854984657132e-06, + "loss": 0.6064, + "step": 45743 + }, + { + "epoch": 1.17, + "learning_rate": 1.3914600363992196e-06, + "loss": 0.6699, + "step": 45744 + }, + { + "epoch": 1.17, + "learning_rate": 1.3914345740330027e-06, + "loss": 0.4727, + "step": 45745 + }, + { + "epoch": 1.17, + "learning_rate": 1.3914091113670825e-06, + "loss": 0.7207, + "step": 45746 + }, + { + "epoch": 1.17, + "learning_rate": 1.3913836484014785e-06, + "loss": 0.5217, + "step": 45747 + }, + { + "epoch": 1.17, + "learning_rate": 1.3913581851362099e-06, + "loss": 0.7148, + "step": 45748 + }, + { + "epoch": 1.17, + "learning_rate": 1.3913327215712961e-06, + "loss": 0.6729, + "step": 45749 + }, + { + "epoch": 1.17, + "learning_rate": 1.391307257706757e-06, + "loss": 0.8076, + "step": 45750 + }, + { + "epoch": 1.17, + "learning_rate": 1.3912817935426119e-06, + "loss": 0.5205, + "step": 45751 + }, + { + "epoch": 1.17, + "learning_rate": 1.3912563290788806e-06, + "loss": 0.7393, + "step": 45752 + }, + { + "epoch": 1.17, + "learning_rate": 1.391230864315582e-06, + "loss": 0.6055, + "step": 45753 + }, + { + "epoch": 1.17, + "learning_rate": 1.391205399252736e-06, + "loss": 0.7236, + "step": 45754 + }, + { + "epoch": 1.17, + "learning_rate": 1.3911799338903621e-06, + "loss": 0.8398, + "step": 45755 + }, + { + "epoch": 1.17, + "learning_rate": 1.3911544682284796e-06, + "loss": 0.6003, + "step": 45756 + }, + { + "epoch": 1.17, + "learning_rate": 1.3911290022671085e-06, + "loss": 0.5625, + "step": 45757 + }, + { + "epoch": 1.17, + "learning_rate": 1.3911035360062672e-06, + "loss": 0.8428, + "step": 45758 + }, + { + "epoch": 1.17, + "learning_rate": 1.3910780694459765e-06, + "loss": 0.915, + "step": 45759 + }, + { + "epoch": 1.17, + "learning_rate": 1.391052602586255e-06, + "loss": 0.6621, + "step": 45760 + }, + { + "epoch": 1.17, + "learning_rate": 1.3910271354271227e-06, + "loss": 0.5728, + "step": 45761 + }, + { + "epoch": 1.17, + "learning_rate": 1.3910016679685988e-06, + "loss": 0.7197, + "step": 45762 + }, + { + "epoch": 1.17, + "learning_rate": 1.3909762002107028e-06, + "loss": 0.5767, + "step": 45763 + }, + { + "epoch": 1.17, + "learning_rate": 1.3909507321534543e-06, + "loss": 0.6802, + "step": 45764 + }, + { + "epoch": 1.17, + "learning_rate": 1.3909252637968729e-06, + "loss": 0.6973, + "step": 45765 + }, + { + "epoch": 1.17, + "learning_rate": 1.390899795140978e-06, + "loss": 0.7266, + "step": 45766 + }, + { + "epoch": 1.17, + "learning_rate": 1.3908743261857894e-06, + "loss": 0.6035, + "step": 45767 + }, + { + "epoch": 1.17, + "learning_rate": 1.390848856931326e-06, + "loss": 0.5737, + "step": 45768 + }, + { + "epoch": 1.17, + "learning_rate": 1.3908233873776074e-06, + "loss": 0.541, + "step": 45769 + }, + { + "epoch": 1.17, + "learning_rate": 1.3907979175246533e-06, + "loss": 0.6689, + "step": 45770 + }, + { + "epoch": 1.17, + "learning_rate": 1.3907724473724836e-06, + "loss": 0.7012, + "step": 45771 + }, + { + "epoch": 1.17, + "learning_rate": 1.3907469769211172e-06, + "loss": 0.6172, + "step": 45772 + }, + { + "epoch": 1.17, + "learning_rate": 1.390721506170574e-06, + "loss": 0.3445, + "step": 45773 + }, + { + "epoch": 1.17, + "learning_rate": 1.3906960351208729e-06, + "loss": 0.7969, + "step": 45774 + }, + { + "epoch": 1.17, + "learning_rate": 1.3906705637720342e-06, + "loss": 0.8486, + "step": 45775 + }, + { + "epoch": 1.17, + "learning_rate": 1.3906450921240767e-06, + "loss": 0.5977, + "step": 45776 + }, + { + "epoch": 1.17, + "learning_rate": 1.3906196201770205e-06, + "loss": 0.5845, + "step": 45777 + }, + { + "epoch": 1.17, + "learning_rate": 1.3905941479308847e-06, + "loss": 0.7227, + "step": 45778 + }, + { + "epoch": 1.17, + "learning_rate": 1.3905686753856887e-06, + "loss": 0.6357, + "step": 45779 + }, + { + "epoch": 1.17, + "learning_rate": 1.3905432025414526e-06, + "loss": 0.5752, + "step": 45780 + }, + { + "epoch": 1.17, + "learning_rate": 1.3905177293981952e-06, + "loss": 0.5935, + "step": 45781 + }, + { + "epoch": 1.17, + "learning_rate": 1.3904922559559366e-06, + "loss": 0.6016, + "step": 45782 + }, + { + "epoch": 1.17, + "learning_rate": 1.3904667822146958e-06, + "loss": 0.5352, + "step": 45783 + }, + { + "epoch": 1.17, + "learning_rate": 1.3904413081744928e-06, + "loss": 0.7598, + "step": 45784 + }, + { + "epoch": 1.17, + "learning_rate": 1.3904158338353464e-06, + "loss": 0.5986, + "step": 45785 + }, + { + "epoch": 1.17, + "learning_rate": 1.3903903591972773e-06, + "loss": 0.4248, + "step": 45786 + }, + { + "epoch": 1.17, + "learning_rate": 1.3903648842603035e-06, + "loss": 0.6797, + "step": 45787 + }, + { + "epoch": 1.17, + "learning_rate": 1.3903394090244458e-06, + "loss": 0.6924, + "step": 45788 + }, + { + "epoch": 1.17, + "learning_rate": 1.3903139334897228e-06, + "loss": 0.6846, + "step": 45789 + }, + { + "epoch": 1.17, + "learning_rate": 1.3902884576561547e-06, + "loss": 0.7695, + "step": 45790 + }, + { + "epoch": 1.17, + "learning_rate": 1.39026298152376e-06, + "loss": 0.5356, + "step": 45791 + }, + { + "epoch": 1.17, + "learning_rate": 1.3902375050925596e-06, + "loss": 0.7061, + "step": 45792 + }, + { + "epoch": 1.17, + "learning_rate": 1.390212028362572e-06, + "loss": 0.6709, + "step": 45793 + }, + { + "epoch": 1.17, + "learning_rate": 1.390186551333817e-06, + "loss": 0.5413, + "step": 45794 + }, + { + "epoch": 1.17, + "learning_rate": 1.390161074006314e-06, + "loss": 0.551, + "step": 45795 + }, + { + "epoch": 1.17, + "learning_rate": 1.390135596380083e-06, + "loss": 0.6084, + "step": 45796 + }, + { + "epoch": 1.17, + "learning_rate": 1.3901101184551429e-06, + "loss": 0.6943, + "step": 45797 + }, + { + "epoch": 1.17, + "learning_rate": 1.3900846402315132e-06, + "loss": 0.8203, + "step": 45798 + }, + { + "epoch": 1.17, + "learning_rate": 1.390059161709214e-06, + "loss": 0.6787, + "step": 45799 + }, + { + "epoch": 1.17, + "learning_rate": 1.390033682888264e-06, + "loss": 0.7559, + "step": 45800 + }, + { + "epoch": 1.17, + "learning_rate": 1.3900082037686833e-06, + "loss": 0.7217, + "step": 45801 + }, + { + "epoch": 1.17, + "learning_rate": 1.3899827243504913e-06, + "loss": 0.4277, + "step": 45802 + }, + { + "epoch": 1.17, + "learning_rate": 1.3899572446337079e-06, + "loss": 0.7021, + "step": 45803 + }, + { + "epoch": 1.17, + "learning_rate": 1.3899317646183515e-06, + "loss": 0.6221, + "step": 45804 + }, + { + "epoch": 1.17, + "learning_rate": 1.3899062843044424e-06, + "loss": 0.6729, + "step": 45805 + }, + { + "epoch": 1.17, + "learning_rate": 1.389880803692e-06, + "loss": 0.6099, + "step": 45806 + }, + { + "epoch": 1.17, + "learning_rate": 1.3898553227810444e-06, + "loss": 0.5547, + "step": 45807 + }, + { + "epoch": 1.17, + "learning_rate": 1.3898298415715937e-06, + "loss": 0.8008, + "step": 45808 + }, + { + "epoch": 1.17, + "learning_rate": 1.3898043600636687e-06, + "loss": 0.749, + "step": 45809 + }, + { + "epoch": 1.17, + "learning_rate": 1.389778878257288e-06, + "loss": 0.4429, + "step": 45810 + }, + { + "epoch": 1.17, + "learning_rate": 1.3897533961524718e-06, + "loss": 0.5859, + "step": 45811 + }, + { + "epoch": 1.17, + "learning_rate": 1.3897279137492395e-06, + "loss": 0.5083, + "step": 45812 + }, + { + "epoch": 1.17, + "learning_rate": 1.3897024310476103e-06, + "loss": 0.4363, + "step": 45813 + }, + { + "epoch": 1.17, + "learning_rate": 1.3896769480476037e-06, + "loss": 0.5625, + "step": 45814 + }, + { + "epoch": 1.17, + "learning_rate": 1.3896514647492397e-06, + "loss": 0.627, + "step": 45815 + }, + { + "epoch": 1.17, + "learning_rate": 1.389625981152537e-06, + "loss": 0.6353, + "step": 45816 + }, + { + "epoch": 1.17, + "learning_rate": 1.3896004972575162e-06, + "loss": 0.6973, + "step": 45817 + }, + { + "epoch": 1.17, + "learning_rate": 1.3895750130641959e-06, + "loss": 0.6816, + "step": 45818 + }, + { + "epoch": 1.17, + "learning_rate": 1.389549528572596e-06, + "loss": 0.6128, + "step": 45819 + }, + { + "epoch": 1.17, + "learning_rate": 1.3895240437827358e-06, + "loss": 0.5715, + "step": 45820 + }, + { + "epoch": 1.17, + "learning_rate": 1.389498558694635e-06, + "loss": 0.6519, + "step": 45821 + }, + { + "epoch": 1.17, + "learning_rate": 1.3894730733083133e-06, + "loss": 0.5312, + "step": 45822 + }, + { + "epoch": 1.17, + "learning_rate": 1.3894475876237897e-06, + "loss": 0.7266, + "step": 45823 + }, + { + "epoch": 1.17, + "learning_rate": 1.389422101641084e-06, + "loss": 0.7637, + "step": 45824 + }, + { + "epoch": 1.17, + "learning_rate": 1.3893966153602157e-06, + "loss": 0.6074, + "step": 45825 + }, + { + "epoch": 1.17, + "learning_rate": 1.3893711287812046e-06, + "loss": 0.5728, + "step": 45826 + }, + { + "epoch": 1.17, + "learning_rate": 1.3893456419040699e-06, + "loss": 0.5391, + "step": 45827 + }, + { + "epoch": 1.17, + "learning_rate": 1.3893201547288308e-06, + "loss": 0.5376, + "step": 45828 + }, + { + "epoch": 1.17, + "learning_rate": 1.3892946672555073e-06, + "loss": 0.8647, + "step": 45829 + }, + { + "epoch": 1.17, + "learning_rate": 1.389269179484119e-06, + "loss": 0.605, + "step": 45830 + }, + { + "epoch": 1.17, + "learning_rate": 1.3892436914146848e-06, + "loss": 0.667, + "step": 45831 + }, + { + "epoch": 1.17, + "learning_rate": 1.389218203047225e-06, + "loss": 0.6621, + "step": 45832 + }, + { + "epoch": 1.17, + "learning_rate": 1.3891927143817586e-06, + "loss": 0.4666, + "step": 45833 + }, + { + "epoch": 1.17, + "learning_rate": 1.389167225418305e-06, + "loss": 0.6484, + "step": 45834 + }, + { + "epoch": 1.17, + "learning_rate": 1.389141736156884e-06, + "loss": 0.5615, + "step": 45835 + }, + { + "epoch": 1.17, + "learning_rate": 1.3891162465975153e-06, + "loss": 0.7305, + "step": 45836 + }, + { + "epoch": 1.17, + "learning_rate": 1.3890907567402182e-06, + "loss": 0.6763, + "step": 45837 + }, + { + "epoch": 1.17, + "learning_rate": 1.389065266585012e-06, + "loss": 0.6177, + "step": 45838 + }, + { + "epoch": 1.17, + "learning_rate": 1.3890397761319163e-06, + "loss": 0.5869, + "step": 45839 + }, + { + "epoch": 1.17, + "learning_rate": 1.389014285380951e-06, + "loss": 0.6528, + "step": 45840 + }, + { + "epoch": 1.17, + "learning_rate": 1.388988794332135e-06, + "loss": 0.5129, + "step": 45841 + }, + { + "epoch": 1.17, + "learning_rate": 1.3889633029854886e-06, + "loss": 0.6519, + "step": 45842 + }, + { + "epoch": 1.17, + "learning_rate": 1.388937811341031e-06, + "loss": 0.624, + "step": 45843 + }, + { + "epoch": 1.18, + "learning_rate": 1.3889123193987808e-06, + "loss": 0.6426, + "step": 45844 + }, + { + "epoch": 1.18, + "learning_rate": 1.388886827158759e-06, + "loss": 0.5225, + "step": 45845 + }, + { + "epoch": 1.18, + "learning_rate": 1.3888613346209843e-06, + "loss": 0.6326, + "step": 45846 + }, + { + "epoch": 1.18, + "learning_rate": 1.3888358417854764e-06, + "loss": 0.5713, + "step": 45847 + }, + { + "epoch": 1.18, + "learning_rate": 1.3888103486522545e-06, + "loss": 0.8242, + "step": 45848 + }, + { + "epoch": 1.18, + "learning_rate": 1.3887848552213388e-06, + "loss": 0.7998, + "step": 45849 + }, + { + "epoch": 1.18, + "learning_rate": 1.3887593614927479e-06, + "loss": 0.561, + "step": 45850 + }, + { + "epoch": 1.18, + "learning_rate": 1.3887338674665024e-06, + "loss": 0.6626, + "step": 45851 + }, + { + "epoch": 1.18, + "learning_rate": 1.388708373142621e-06, + "loss": 0.5645, + "step": 45852 + }, + { + "epoch": 1.18, + "learning_rate": 1.3886828785211235e-06, + "loss": 0.4171, + "step": 45853 + }, + { + "epoch": 1.18, + "learning_rate": 1.3886573836020291e-06, + "loss": 0.5039, + "step": 45854 + }, + { + "epoch": 1.18, + "learning_rate": 1.3886318883853578e-06, + "loss": 0.4299, + "step": 45855 + }, + { + "epoch": 1.18, + "learning_rate": 1.3886063928711292e-06, + "loss": 0.6221, + "step": 45856 + }, + { + "epoch": 1.18, + "learning_rate": 1.3885808970593624e-06, + "loss": 0.7383, + "step": 45857 + }, + { + "epoch": 1.18, + "learning_rate": 1.3885554009500768e-06, + "loss": 0.6611, + "step": 45858 + }, + { + "epoch": 1.18, + "learning_rate": 1.3885299045432926e-06, + "loss": 0.4666, + "step": 45859 + }, + { + "epoch": 1.18, + "learning_rate": 1.3885044078390286e-06, + "loss": 0.7031, + "step": 45860 + }, + { + "epoch": 1.18, + "learning_rate": 1.3884789108373046e-06, + "loss": 0.6504, + "step": 45861 + }, + { + "epoch": 1.18, + "learning_rate": 1.3884534135381408e-06, + "loss": 0.5596, + "step": 45862 + }, + { + "epoch": 1.18, + "learning_rate": 1.3884279159415555e-06, + "loss": 0.6543, + "step": 45863 + }, + { + "epoch": 1.18, + "learning_rate": 1.388402418047569e-06, + "loss": 0.6309, + "step": 45864 + }, + { + "epoch": 1.18, + "learning_rate": 1.3883769198562005e-06, + "loss": 0.6016, + "step": 45865 + }, + { + "epoch": 1.18, + "learning_rate": 1.3883514213674693e-06, + "loss": 0.573, + "step": 45866 + }, + { + "epoch": 1.18, + "learning_rate": 1.388325922581396e-06, + "loss": 0.5493, + "step": 45867 + }, + { + "epoch": 1.18, + "learning_rate": 1.388300423497999e-06, + "loss": 0.454, + "step": 45868 + }, + { + "epoch": 1.18, + "learning_rate": 1.3882749241172982e-06, + "loss": 0.8516, + "step": 45869 + }, + { + "epoch": 1.18, + "learning_rate": 1.3882494244393132e-06, + "loss": 0.5156, + "step": 45870 + }, + { + "epoch": 1.18, + "learning_rate": 1.3882239244640634e-06, + "loss": 0.5239, + "step": 45871 + }, + { + "epoch": 1.18, + "learning_rate": 1.3881984241915687e-06, + "loss": 0.7295, + "step": 45872 + }, + { + "epoch": 1.18, + "learning_rate": 1.388172923621848e-06, + "loss": 0.7505, + "step": 45873 + }, + { + "epoch": 1.18, + "learning_rate": 1.3881474227549215e-06, + "loss": 0.6543, + "step": 45874 + }, + { + "epoch": 1.18, + "learning_rate": 1.388121921590808e-06, + "loss": 0.709, + "step": 45875 + }, + { + "epoch": 1.18, + "learning_rate": 1.3880964201295275e-06, + "loss": 0.6309, + "step": 45876 + }, + { + "epoch": 1.18, + "learning_rate": 1.3880709183710994e-06, + "loss": 0.6836, + "step": 45877 + }, + { + "epoch": 1.18, + "learning_rate": 1.3880454163155434e-06, + "loss": 0.6289, + "step": 45878 + }, + { + "epoch": 1.18, + "learning_rate": 1.3880199139628785e-06, + "loss": 0.5742, + "step": 45879 + }, + { + "epoch": 1.18, + "learning_rate": 1.387994411313125e-06, + "loss": 0.6755, + "step": 45880 + }, + { + "epoch": 1.18, + "learning_rate": 1.3879689083663015e-06, + "loss": 0.9258, + "step": 45881 + }, + { + "epoch": 1.18, + "learning_rate": 1.3879434051224288e-06, + "loss": 0.5415, + "step": 45882 + }, + { + "epoch": 1.18, + "learning_rate": 1.3879179015815253e-06, + "loss": 0.7402, + "step": 45883 + }, + { + "epoch": 1.18, + "learning_rate": 1.3878923977436108e-06, + "loss": 0.7686, + "step": 45884 + }, + { + "epoch": 1.18, + "learning_rate": 1.3878668936087047e-06, + "loss": 0.5693, + "step": 45885 + }, + { + "epoch": 1.18, + "learning_rate": 1.3878413891768272e-06, + "loss": 0.7627, + "step": 45886 + }, + { + "epoch": 1.18, + "learning_rate": 1.3878158844479973e-06, + "loss": 0.5869, + "step": 45887 + }, + { + "epoch": 1.18, + "learning_rate": 1.3877903794222343e-06, + "loss": 0.5422, + "step": 45888 + }, + { + "epoch": 1.18, + "learning_rate": 1.3877648740995585e-06, + "loss": 0.4636, + "step": 45889 + }, + { + "epoch": 1.18, + "learning_rate": 1.3877393684799885e-06, + "loss": 0.6172, + "step": 45890 + }, + { + "epoch": 1.18, + "learning_rate": 1.3877138625635447e-06, + "loss": 0.666, + "step": 45891 + }, + { + "epoch": 1.18, + "learning_rate": 1.3876883563502462e-06, + "loss": 0.7217, + "step": 45892 + }, + { + "epoch": 1.18, + "learning_rate": 1.3876628498401124e-06, + "loss": 0.7188, + "step": 45893 + }, + { + "epoch": 1.18, + "learning_rate": 1.387637343033163e-06, + "loss": 0.8701, + "step": 45894 + }, + { + "epoch": 1.18, + "learning_rate": 1.3876118359294174e-06, + "loss": 0.5825, + "step": 45895 + }, + { + "epoch": 1.18, + "learning_rate": 1.3875863285288952e-06, + "loss": 0.6763, + "step": 45896 + }, + { + "epoch": 1.18, + "learning_rate": 1.3875608208316163e-06, + "loss": 0.5469, + "step": 45897 + }, + { + "epoch": 1.18, + "learning_rate": 1.3875353128375998e-06, + "loss": 0.6455, + "step": 45898 + }, + { + "epoch": 1.18, + "learning_rate": 1.3875098045468653e-06, + "loss": 0.5049, + "step": 45899 + }, + { + "epoch": 1.18, + "learning_rate": 1.387484295959432e-06, + "loss": 0.5204, + "step": 45900 + }, + { + "epoch": 1.18, + "learning_rate": 1.38745878707532e-06, + "loss": 0.6533, + "step": 45901 + }, + { + "epoch": 1.18, + "learning_rate": 1.387433277894549e-06, + "loss": 0.6611, + "step": 45902 + }, + { + "epoch": 1.18, + "learning_rate": 1.387407768417138e-06, + "loss": 0.6265, + "step": 45903 + }, + { + "epoch": 1.18, + "learning_rate": 1.3873822586431062e-06, + "loss": 0.6357, + "step": 45904 + }, + { + "epoch": 1.18, + "learning_rate": 1.3873567485724743e-06, + "loss": 0.6689, + "step": 45905 + }, + { + "epoch": 1.18, + "learning_rate": 1.3873312382052605e-06, + "loss": 0.7085, + "step": 45906 + }, + { + "epoch": 1.18, + "learning_rate": 1.3873057275414855e-06, + "loss": 0.5869, + "step": 45907 + }, + { + "epoch": 1.18, + "learning_rate": 1.3872802165811682e-06, + "loss": 0.749, + "step": 45908 + }, + { + "epoch": 1.18, + "learning_rate": 1.3872547053243282e-06, + "loss": 0.6548, + "step": 45909 + }, + { + "epoch": 1.18, + "learning_rate": 1.3872291937709848e-06, + "loss": 0.7383, + "step": 45910 + }, + { + "epoch": 1.18, + "learning_rate": 1.387203681921158e-06, + "loss": 0.6729, + "step": 45911 + }, + { + "epoch": 1.18, + "learning_rate": 1.3871781697748674e-06, + "loss": 0.791, + "step": 45912 + }, + { + "epoch": 1.18, + "learning_rate": 1.387152657332132e-06, + "loss": 0.5637, + "step": 45913 + }, + { + "epoch": 1.18, + "learning_rate": 1.3871271445929718e-06, + "loss": 0.6401, + "step": 45914 + }, + { + "epoch": 1.18, + "learning_rate": 1.3871016315574058e-06, + "loss": 0.6436, + "step": 45915 + }, + { + "epoch": 1.18, + "learning_rate": 1.3870761182254541e-06, + "loss": 0.7109, + "step": 45916 + }, + { + "epoch": 1.18, + "learning_rate": 1.3870506045971362e-06, + "loss": 0.8037, + "step": 45917 + }, + { + "epoch": 1.18, + "learning_rate": 1.3870250906724713e-06, + "loss": 0.7246, + "step": 45918 + }, + { + "epoch": 1.18, + "learning_rate": 1.386999576451479e-06, + "loss": 0.7598, + "step": 45919 + }, + { + "epoch": 1.18, + "learning_rate": 1.386974061934179e-06, + "loss": 0.6509, + "step": 45920 + }, + { + "epoch": 1.18, + "learning_rate": 1.3869485471205906e-06, + "loss": 0.7754, + "step": 45921 + }, + { + "epoch": 1.18, + "learning_rate": 1.386923032010734e-06, + "loss": 0.6895, + "step": 45922 + }, + { + "epoch": 1.18, + "learning_rate": 1.3868975166046275e-06, + "loss": 0.5659, + "step": 45923 + }, + { + "epoch": 1.18, + "learning_rate": 1.3868720009022918e-06, + "loss": 0.7441, + "step": 45924 + }, + { + "epoch": 1.18, + "learning_rate": 1.3868464849037457e-06, + "loss": 0.3533, + "step": 45925 + }, + { + "epoch": 1.18, + "learning_rate": 1.3868209686090093e-06, + "loss": 0.8779, + "step": 45926 + }, + { + "epoch": 1.18, + "learning_rate": 1.386795452018102e-06, + "loss": 0.6685, + "step": 45927 + }, + { + "epoch": 1.18, + "learning_rate": 1.386769935131043e-06, + "loss": 0.6689, + "step": 45928 + }, + { + "epoch": 1.18, + "learning_rate": 1.386744417947852e-06, + "loss": 0.7871, + "step": 45929 + }, + { + "epoch": 1.18, + "learning_rate": 1.3867189004685487e-06, + "loss": 0.5449, + "step": 45930 + }, + { + "epoch": 1.18, + "learning_rate": 1.3866933826931524e-06, + "loss": 0.7754, + "step": 45931 + }, + { + "epoch": 1.18, + "learning_rate": 1.3866678646216827e-06, + "loss": 0.6021, + "step": 45932 + }, + { + "epoch": 1.18, + "learning_rate": 1.3866423462541595e-06, + "loss": 0.7256, + "step": 45933 + }, + { + "epoch": 1.18, + "learning_rate": 1.386616827590602e-06, + "loss": 0.626, + "step": 45934 + }, + { + "epoch": 1.18, + "learning_rate": 1.3865913086310294e-06, + "loss": 0.5591, + "step": 45935 + }, + { + "epoch": 1.18, + "learning_rate": 1.3865657893754618e-06, + "loss": 0.7354, + "step": 45936 + }, + { + "epoch": 1.18, + "learning_rate": 1.3865402698239187e-06, + "loss": 0.7549, + "step": 45937 + }, + { + "epoch": 1.18, + "learning_rate": 1.3865147499764194e-06, + "loss": 0.7773, + "step": 45938 + }, + { + "epoch": 1.18, + "learning_rate": 1.3864892298329834e-06, + "loss": 0.9307, + "step": 45939 + }, + { + "epoch": 1.18, + "learning_rate": 1.3864637093936303e-06, + "loss": 0.5386, + "step": 45940 + }, + { + "epoch": 1.18, + "learning_rate": 1.3864381886583803e-06, + "loss": 0.6245, + "step": 45941 + }, + { + "epoch": 1.18, + "learning_rate": 1.3864126676272517e-06, + "loss": 0.6982, + "step": 45942 + }, + { + "epoch": 1.18, + "learning_rate": 1.386387146300265e-06, + "loss": 0.5601, + "step": 45943 + }, + { + "epoch": 1.18, + "learning_rate": 1.3863616246774393e-06, + "loss": 0.5659, + "step": 45944 + }, + { + "epoch": 1.18, + "learning_rate": 1.3863361027587944e-06, + "loss": 0.7256, + "step": 45945 + }, + { + "epoch": 1.18, + "learning_rate": 1.3863105805443496e-06, + "loss": 0.627, + "step": 45946 + }, + { + "epoch": 1.18, + "learning_rate": 1.3862850580341246e-06, + "loss": 0.4199, + "step": 45947 + }, + { + "epoch": 1.18, + "learning_rate": 1.3862595352281388e-06, + "loss": 0.6929, + "step": 45948 + }, + { + "epoch": 1.18, + "learning_rate": 1.386234012126412e-06, + "loss": 0.5891, + "step": 45949 + }, + { + "epoch": 1.18, + "learning_rate": 1.3862084887289634e-06, + "loss": 0.5669, + "step": 45950 + }, + { + "epoch": 1.18, + "learning_rate": 1.3861829650358129e-06, + "loss": 0.6465, + "step": 45951 + }, + { + "epoch": 1.18, + "learning_rate": 1.3861574410469797e-06, + "loss": 0.5771, + "step": 45952 + }, + { + "epoch": 1.18, + "learning_rate": 1.3861319167624837e-06, + "loss": 0.5784, + "step": 45953 + }, + { + "epoch": 1.18, + "learning_rate": 1.386106392182344e-06, + "loss": 0.5991, + "step": 45954 + }, + { + "epoch": 1.18, + "learning_rate": 1.3860808673065805e-06, + "loss": 0.5588, + "step": 45955 + }, + { + "epoch": 1.18, + "learning_rate": 1.3860553421352127e-06, + "loss": 0.7285, + "step": 45956 + }, + { + "epoch": 1.18, + "learning_rate": 1.3860298166682598e-06, + "loss": 0.7018, + "step": 45957 + }, + { + "epoch": 1.18, + "learning_rate": 1.386004290905742e-06, + "loss": 0.6812, + "step": 45958 + }, + { + "epoch": 1.18, + "learning_rate": 1.3859787648476782e-06, + "loss": 0.6553, + "step": 45959 + }, + { + "epoch": 1.18, + "learning_rate": 1.3859532384940882e-06, + "loss": 0.7363, + "step": 45960 + }, + { + "epoch": 1.18, + "learning_rate": 1.3859277118449918e-06, + "loss": 0.5803, + "step": 45961 + }, + { + "epoch": 1.18, + "learning_rate": 1.385902184900408e-06, + "loss": 0.6748, + "step": 45962 + }, + { + "epoch": 1.18, + "learning_rate": 1.385876657660357e-06, + "loss": 0.7852, + "step": 45963 + }, + { + "epoch": 1.18, + "learning_rate": 1.3858511301248576e-06, + "loss": 0.5786, + "step": 45964 + }, + { + "epoch": 1.18, + "learning_rate": 1.3858256022939298e-06, + "loss": 0.5791, + "step": 45965 + }, + { + "epoch": 1.18, + "learning_rate": 1.3858000741675935e-06, + "loss": 0.6338, + "step": 45966 + }, + { + "epoch": 1.18, + "learning_rate": 1.3857745457458672e-06, + "loss": 0.7773, + "step": 45967 + }, + { + "epoch": 1.18, + "learning_rate": 1.3857490170287716e-06, + "loss": 0.5581, + "step": 45968 + }, + { + "epoch": 1.18, + "learning_rate": 1.3857234880163253e-06, + "loss": 0.5811, + "step": 45969 + }, + { + "epoch": 1.18, + "learning_rate": 1.3856979587085485e-06, + "loss": 0.5059, + "step": 45970 + }, + { + "epoch": 1.18, + "learning_rate": 1.3856724291054604e-06, + "loss": 0.748, + "step": 45971 + }, + { + "epoch": 1.18, + "learning_rate": 1.3856468992070808e-06, + "loss": 0.5146, + "step": 45972 + }, + { + "epoch": 1.18, + "learning_rate": 1.385621369013429e-06, + "loss": 0.6333, + "step": 45973 + }, + { + "epoch": 1.18, + "learning_rate": 1.3855958385245248e-06, + "loss": 0.6675, + "step": 45974 + }, + { + "epoch": 1.18, + "learning_rate": 1.3855703077403874e-06, + "loss": 0.6934, + "step": 45975 + }, + { + "epoch": 1.18, + "learning_rate": 1.3855447766610365e-06, + "loss": 0.6162, + "step": 45976 + }, + { + "epoch": 1.18, + "learning_rate": 1.385519245286492e-06, + "loss": 0.7188, + "step": 45977 + }, + { + "epoch": 1.18, + "learning_rate": 1.3854937136167726e-06, + "loss": 0.6543, + "step": 45978 + }, + { + "epoch": 1.18, + "learning_rate": 1.3854681816518988e-06, + "loss": 0.7695, + "step": 45979 + }, + { + "epoch": 1.18, + "learning_rate": 1.3854426493918897e-06, + "loss": 0.7822, + "step": 45980 + }, + { + "epoch": 1.18, + "learning_rate": 1.385417116836765e-06, + "loss": 0.8047, + "step": 45981 + }, + { + "epoch": 1.18, + "learning_rate": 1.3853915839865437e-06, + "loss": 0.6846, + "step": 45982 + }, + { + "epoch": 1.18, + "learning_rate": 1.3853660508412462e-06, + "loss": 0.7295, + "step": 45983 + }, + { + "epoch": 1.18, + "learning_rate": 1.3853405174008914e-06, + "loss": 0.6299, + "step": 45984 + }, + { + "epoch": 1.18, + "learning_rate": 1.3853149836654993e-06, + "loss": 0.6714, + "step": 45985 + }, + { + "epoch": 1.18, + "learning_rate": 1.385289449635089e-06, + "loss": 0.3748, + "step": 45986 + }, + { + "epoch": 1.18, + "learning_rate": 1.3852639153096805e-06, + "loss": 0.7773, + "step": 45987 + }, + { + "epoch": 1.18, + "learning_rate": 1.3852383806892932e-06, + "loss": 0.7715, + "step": 45988 + }, + { + "epoch": 1.18, + "learning_rate": 1.3852128457739463e-06, + "loss": 0.5566, + "step": 45989 + }, + { + "epoch": 1.18, + "learning_rate": 1.3851873105636598e-06, + "loss": 0.7041, + "step": 45990 + }, + { + "epoch": 1.18, + "learning_rate": 1.3851617750584531e-06, + "loss": 0.6016, + "step": 45991 + }, + { + "epoch": 1.18, + "learning_rate": 1.3851362392583456e-06, + "loss": 0.6318, + "step": 45992 + }, + { + "epoch": 1.18, + "learning_rate": 1.3851107031633571e-06, + "loss": 0.45, + "step": 45993 + }, + { + "epoch": 1.18, + "learning_rate": 1.3850851667735072e-06, + "loss": 0.6797, + "step": 45994 + }, + { + "epoch": 1.18, + "learning_rate": 1.385059630088815e-06, + "loss": 0.7256, + "step": 45995 + }, + { + "epoch": 1.18, + "learning_rate": 1.3850340931093005e-06, + "loss": 0.5879, + "step": 45996 + }, + { + "epoch": 1.18, + "learning_rate": 1.385008555834983e-06, + "loss": 0.7422, + "step": 45997 + }, + { + "epoch": 1.18, + "learning_rate": 1.384983018265882e-06, + "loss": 0.7666, + "step": 45998 + }, + { + "epoch": 1.18, + "learning_rate": 1.3849574804020177e-06, + "loss": 0.4695, + "step": 45999 + }, + { + "epoch": 1.18, + "learning_rate": 1.3849319422434088e-06, + "loss": 0.6826, + "step": 46000 + }, + { + "epoch": 1.18, + "learning_rate": 1.3849064037900754e-06, + "loss": 0.6602, + "step": 46001 + }, + { + "epoch": 1.18, + "learning_rate": 1.3848808650420368e-06, + "loss": 0.8262, + "step": 46002 + }, + { + "epoch": 1.18, + "learning_rate": 1.3848553259993122e-06, + "loss": 0.5532, + "step": 46003 + }, + { + "epoch": 1.18, + "learning_rate": 1.384829786661922e-06, + "loss": 0.6797, + "step": 46004 + }, + { + "epoch": 1.18, + "learning_rate": 1.3848042470298853e-06, + "loss": 0.6797, + "step": 46005 + }, + { + "epoch": 1.18, + "learning_rate": 1.384778707103222e-06, + "loss": 0.6602, + "step": 46006 + }, + { + "epoch": 1.18, + "learning_rate": 1.3847531668819508e-06, + "loss": 0.748, + "step": 46007 + }, + { + "epoch": 1.18, + "learning_rate": 1.384727626366092e-06, + "loss": 0.6499, + "step": 46008 + }, + { + "epoch": 1.18, + "learning_rate": 1.3847020855556647e-06, + "loss": 0.563, + "step": 46009 + }, + { + "epoch": 1.18, + "learning_rate": 1.3846765444506892e-06, + "loss": 0.4871, + "step": 46010 + }, + { + "epoch": 1.18, + "learning_rate": 1.3846510030511842e-06, + "loss": 0.625, + "step": 46011 + }, + { + "epoch": 1.18, + "learning_rate": 1.38462546135717e-06, + "loss": 0.5859, + "step": 46012 + }, + { + "epoch": 1.18, + "learning_rate": 1.3845999193686652e-06, + "loss": 0.752, + "step": 46013 + }, + { + "epoch": 1.18, + "learning_rate": 1.3845743770856903e-06, + "loss": 0.5894, + "step": 46014 + }, + { + "epoch": 1.18, + "learning_rate": 1.3845488345082642e-06, + "loss": 0.6846, + "step": 46015 + }, + { + "epoch": 1.18, + "learning_rate": 1.3845232916364071e-06, + "loss": 0.6929, + "step": 46016 + }, + { + "epoch": 1.18, + "learning_rate": 1.384497748470138e-06, + "loss": 0.6221, + "step": 46017 + }, + { + "epoch": 1.18, + "learning_rate": 1.3844722050094765e-06, + "loss": 0.6787, + "step": 46018 + }, + { + "epoch": 1.18, + "learning_rate": 1.3844466612544426e-06, + "loss": 0.3318, + "step": 46019 + }, + { + "epoch": 1.18, + "learning_rate": 1.3844211172050555e-06, + "loss": 0.7002, + "step": 46020 + }, + { + "epoch": 1.18, + "learning_rate": 1.3843955728613347e-06, + "loss": 0.6953, + "step": 46021 + }, + { + "epoch": 1.18, + "learning_rate": 1.3843700282232999e-06, + "loss": 0.6895, + "step": 46022 + }, + { + "epoch": 1.18, + "learning_rate": 1.3843444832909708e-06, + "loss": 0.6797, + "step": 46023 + }, + { + "epoch": 1.18, + "learning_rate": 1.3843189380643666e-06, + "loss": 0.6992, + "step": 46024 + }, + { + "epoch": 1.18, + "learning_rate": 1.3842933925435071e-06, + "loss": 0.7603, + "step": 46025 + }, + { + "epoch": 1.18, + "learning_rate": 1.3842678467284122e-06, + "loss": 0.7144, + "step": 46026 + }, + { + "epoch": 1.18, + "learning_rate": 1.3842423006191006e-06, + "loss": 0.46, + "step": 46027 + }, + { + "epoch": 1.18, + "learning_rate": 1.3842167542155926e-06, + "loss": 0.4443, + "step": 46028 + }, + { + "epoch": 1.18, + "learning_rate": 1.3841912075179073e-06, + "loss": 0.541, + "step": 46029 + }, + { + "epoch": 1.18, + "learning_rate": 1.3841656605260644e-06, + "loss": 0.6582, + "step": 46030 + }, + { + "epoch": 1.18, + "learning_rate": 1.384140113240084e-06, + "loss": 0.6064, + "step": 46031 + }, + { + "epoch": 1.18, + "learning_rate": 1.3841145656599848e-06, + "loss": 0.6514, + "step": 46032 + }, + { + "epoch": 1.18, + "learning_rate": 1.3840890177857868e-06, + "loss": 0.6016, + "step": 46033 + }, + { + "epoch": 1.18, + "learning_rate": 1.3840634696175092e-06, + "loss": 0.7529, + "step": 46034 + }, + { + "epoch": 1.18, + "learning_rate": 1.3840379211551722e-06, + "loss": 0.5181, + "step": 46035 + }, + { + "epoch": 1.18, + "learning_rate": 1.3840123723987952e-06, + "loss": 0.5381, + "step": 46036 + }, + { + "epoch": 1.18, + "learning_rate": 1.3839868233483975e-06, + "loss": 0.566, + "step": 46037 + }, + { + "epoch": 1.18, + "learning_rate": 1.3839612740039983e-06, + "loss": 0.7134, + "step": 46038 + }, + { + "epoch": 1.18, + "learning_rate": 1.3839357243656182e-06, + "loss": 0.4961, + "step": 46039 + }, + { + "epoch": 1.18, + "learning_rate": 1.3839101744332758e-06, + "loss": 0.5344, + "step": 46040 + }, + { + "epoch": 1.18, + "learning_rate": 1.383884624206991e-06, + "loss": 0.7656, + "step": 46041 + }, + { + "epoch": 1.18, + "learning_rate": 1.3838590736867837e-06, + "loss": 0.7559, + "step": 46042 + }, + { + "epoch": 1.18, + "learning_rate": 1.3838335228726729e-06, + "loss": 0.6748, + "step": 46043 + }, + { + "epoch": 1.18, + "learning_rate": 1.3838079717646785e-06, + "loss": 0.6621, + "step": 46044 + }, + { + "epoch": 1.18, + "learning_rate": 1.38378242036282e-06, + "loss": 0.7261, + "step": 46045 + }, + { + "epoch": 1.18, + "learning_rate": 1.3837568686671168e-06, + "loss": 0.5962, + "step": 46046 + }, + { + "epoch": 1.18, + "learning_rate": 1.3837313166775887e-06, + "loss": 0.6523, + "step": 46047 + }, + { + "epoch": 1.18, + "learning_rate": 1.3837057643942554e-06, + "loss": 0.5171, + "step": 46048 + }, + { + "epoch": 1.18, + "learning_rate": 1.3836802118171357e-06, + "loss": 0.5742, + "step": 46049 + }, + { + "epoch": 1.18, + "learning_rate": 1.3836546589462504e-06, + "loss": 0.5635, + "step": 46050 + }, + { + "epoch": 1.18, + "learning_rate": 1.383629105781618e-06, + "loss": 0.7354, + "step": 46051 + }, + { + "epoch": 1.18, + "learning_rate": 1.3836035523232586e-06, + "loss": 0.7393, + "step": 46052 + }, + { + "epoch": 1.18, + "learning_rate": 1.3835779985711914e-06, + "loss": 0.5771, + "step": 46053 + }, + { + "epoch": 1.18, + "learning_rate": 1.383552444525436e-06, + "loss": 0.7158, + "step": 46054 + }, + { + "epoch": 1.18, + "learning_rate": 1.3835268901860121e-06, + "loss": 0.5796, + "step": 46055 + }, + { + "epoch": 1.18, + "learning_rate": 1.38350133555294e-06, + "loss": 0.8086, + "step": 46056 + }, + { + "epoch": 1.18, + "learning_rate": 1.3834757806262381e-06, + "loss": 0.5513, + "step": 46057 + }, + { + "epoch": 1.18, + "learning_rate": 1.3834502254059263e-06, + "loss": 0.832, + "step": 46058 + }, + { + "epoch": 1.18, + "learning_rate": 1.3834246698920241e-06, + "loss": 0.5542, + "step": 46059 + }, + { + "epoch": 1.18, + "learning_rate": 1.3833991140845518e-06, + "loss": 0.5254, + "step": 46060 + }, + { + "epoch": 1.18, + "learning_rate": 1.3833735579835284e-06, + "loss": 0.6699, + "step": 46061 + }, + { + "epoch": 1.18, + "learning_rate": 1.3833480015889733e-06, + "loss": 0.6035, + "step": 46062 + }, + { + "epoch": 1.18, + "learning_rate": 1.3833224449009062e-06, + "loss": 0.5776, + "step": 46063 + }, + { + "epoch": 1.18, + "learning_rate": 1.3832968879193469e-06, + "loss": 0.5693, + "step": 46064 + }, + { + "epoch": 1.18, + "learning_rate": 1.3832713306443144e-06, + "loss": 0.5378, + "step": 46065 + }, + { + "epoch": 1.18, + "learning_rate": 1.3832457730758292e-06, + "loss": 0.7881, + "step": 46066 + }, + { + "epoch": 1.18, + "learning_rate": 1.38322021521391e-06, + "loss": 0.666, + "step": 46067 + }, + { + "epoch": 1.18, + "learning_rate": 1.383194657058577e-06, + "loss": 0.8047, + "step": 46068 + }, + { + "epoch": 1.18, + "learning_rate": 1.3831690986098492e-06, + "loss": 0.7412, + "step": 46069 + }, + { + "epoch": 1.18, + "learning_rate": 1.3831435398677463e-06, + "loss": 0.6523, + "step": 46070 + }, + { + "epoch": 1.18, + "learning_rate": 1.3831179808322886e-06, + "loss": 0.7568, + "step": 46071 + }, + { + "epoch": 1.18, + "learning_rate": 1.3830924215034945e-06, + "loss": 0.8223, + "step": 46072 + }, + { + "epoch": 1.18, + "learning_rate": 1.3830668618813843e-06, + "loss": 0.6797, + "step": 46073 + }, + { + "epoch": 1.18, + "learning_rate": 1.3830413019659775e-06, + "loss": 0.6514, + "step": 46074 + }, + { + "epoch": 1.18, + "learning_rate": 1.3830157417572934e-06, + "loss": 0.5938, + "step": 46075 + }, + { + "epoch": 1.18, + "learning_rate": 1.3829901812553518e-06, + "loss": 0.3806, + "step": 46076 + }, + { + "epoch": 1.18, + "learning_rate": 1.3829646204601726e-06, + "loss": 0.6475, + "step": 46077 + }, + { + "epoch": 1.18, + "learning_rate": 1.3829390593717747e-06, + "loss": 0.4324, + "step": 46078 + }, + { + "epoch": 1.18, + "learning_rate": 1.382913497990178e-06, + "loss": 0.5596, + "step": 46079 + }, + { + "epoch": 1.18, + "learning_rate": 1.382887936315402e-06, + "loss": 0.6494, + "step": 46080 + }, + { + "epoch": 1.18, + "learning_rate": 1.3828623743474665e-06, + "loss": 0.7422, + "step": 46081 + }, + { + "epoch": 1.18, + "learning_rate": 1.3828368120863906e-06, + "loss": 0.7549, + "step": 46082 + }, + { + "epoch": 1.18, + "learning_rate": 1.3828112495321944e-06, + "loss": 0.769, + "step": 46083 + }, + { + "epoch": 1.18, + "learning_rate": 1.382785686684897e-06, + "loss": 0.6084, + "step": 46084 + }, + { + "epoch": 1.18, + "learning_rate": 1.3827601235445183e-06, + "loss": 0.7031, + "step": 46085 + }, + { + "epoch": 1.18, + "learning_rate": 1.3827345601110781e-06, + "loss": 0.7598, + "step": 46086 + }, + { + "epoch": 1.18, + "learning_rate": 1.382708996384595e-06, + "loss": 0.6953, + "step": 46087 + }, + { + "epoch": 1.18, + "learning_rate": 1.3826834323650898e-06, + "loss": 0.6621, + "step": 46088 + }, + { + "epoch": 1.18, + "learning_rate": 1.3826578680525812e-06, + "loss": 0.5112, + "step": 46089 + }, + { + "epoch": 1.18, + "learning_rate": 1.382632303447089e-06, + "loss": 0.8457, + "step": 46090 + }, + { + "epoch": 1.18, + "learning_rate": 1.3826067385486332e-06, + "loss": 0.7251, + "step": 46091 + }, + { + "epoch": 1.18, + "learning_rate": 1.3825811733572329e-06, + "loss": 0.6045, + "step": 46092 + }, + { + "epoch": 1.18, + "learning_rate": 1.3825556078729074e-06, + "loss": 0.6602, + "step": 46093 + }, + { + "epoch": 1.18, + "learning_rate": 1.3825300420956768e-06, + "loss": 0.792, + "step": 46094 + }, + { + "epoch": 1.18, + "learning_rate": 1.3825044760255607e-06, + "loss": 0.7168, + "step": 46095 + }, + { + "epoch": 1.18, + "learning_rate": 1.3824789096625788e-06, + "loss": 0.6646, + "step": 46096 + }, + { + "epoch": 1.18, + "learning_rate": 1.38245334300675e-06, + "loss": 0.5419, + "step": 46097 + }, + { + "epoch": 1.18, + "learning_rate": 1.3824277760580942e-06, + "loss": 0.6763, + "step": 46098 + }, + { + "epoch": 1.18, + "learning_rate": 1.3824022088166309e-06, + "loss": 0.5781, + "step": 46099 + }, + { + "epoch": 1.18, + "learning_rate": 1.3823766412823802e-06, + "loss": 0.4438, + "step": 46100 + }, + { + "epoch": 1.18, + "learning_rate": 1.3823510734553615e-06, + "loss": 0.5898, + "step": 46101 + }, + { + "epoch": 1.18, + "learning_rate": 1.3823255053355938e-06, + "loss": 0.5049, + "step": 46102 + }, + { + "epoch": 1.18, + "learning_rate": 1.3822999369230968e-06, + "loss": 0.6494, + "step": 46103 + }, + { + "epoch": 1.18, + "learning_rate": 1.3822743682178906e-06, + "loss": 0.5463, + "step": 46104 + }, + { + "epoch": 1.18, + "learning_rate": 1.3822487992199943e-06, + "loss": 0.583, + "step": 46105 + }, + { + "epoch": 1.18, + "learning_rate": 1.382223229929428e-06, + "loss": 0.6885, + "step": 46106 + }, + { + "epoch": 1.18, + "learning_rate": 1.3821976603462108e-06, + "loss": 0.7207, + "step": 46107 + }, + { + "epoch": 1.18, + "learning_rate": 1.3821720904703623e-06, + "loss": 0.667, + "step": 46108 + }, + { + "epoch": 1.18, + "learning_rate": 1.3821465203019025e-06, + "loss": 0.6147, + "step": 46109 + }, + { + "epoch": 1.18, + "learning_rate": 1.3821209498408504e-06, + "loss": 0.6255, + "step": 46110 + }, + { + "epoch": 1.18, + "learning_rate": 1.3820953790872261e-06, + "loss": 0.5923, + "step": 46111 + }, + { + "epoch": 1.18, + "learning_rate": 1.3820698080410487e-06, + "loss": 0.4932, + "step": 46112 + }, + { + "epoch": 1.18, + "learning_rate": 1.3820442367023381e-06, + "loss": 0.6426, + "step": 46113 + }, + { + "epoch": 1.18, + "learning_rate": 1.3820186650711136e-06, + "loss": 0.646, + "step": 46114 + }, + { + "epoch": 1.18, + "learning_rate": 1.3819930931473953e-06, + "loss": 0.5297, + "step": 46115 + }, + { + "epoch": 1.18, + "learning_rate": 1.3819675209312026e-06, + "loss": 0.7041, + "step": 46116 + }, + { + "epoch": 1.18, + "learning_rate": 1.3819419484225544e-06, + "loss": 0.6709, + "step": 46117 + }, + { + "epoch": 1.18, + "learning_rate": 1.381916375621471e-06, + "loss": 0.665, + "step": 46118 + }, + { + "epoch": 1.18, + "learning_rate": 1.381890802527972e-06, + "loss": 0.4744, + "step": 46119 + }, + { + "epoch": 1.18, + "learning_rate": 1.3818652291420767e-06, + "loss": 0.6279, + "step": 46120 + }, + { + "epoch": 1.18, + "learning_rate": 1.3818396554638048e-06, + "loss": 0.7002, + "step": 46121 + }, + { + "epoch": 1.18, + "learning_rate": 1.3818140814931756e-06, + "loss": 0.5981, + "step": 46122 + }, + { + "epoch": 1.18, + "learning_rate": 1.3817885072302091e-06, + "loss": 0.666, + "step": 46123 + }, + { + "epoch": 1.18, + "learning_rate": 1.3817629326749246e-06, + "loss": 0.7021, + "step": 46124 + }, + { + "epoch": 1.18, + "learning_rate": 1.381737357827342e-06, + "loss": 0.5532, + "step": 46125 + }, + { + "epoch": 1.18, + "learning_rate": 1.3817117826874803e-06, + "loss": 0.7119, + "step": 46126 + }, + { + "epoch": 1.18, + "learning_rate": 1.3816862072553598e-06, + "loss": 0.6831, + "step": 46127 + }, + { + "epoch": 1.18, + "learning_rate": 1.3816606315309993e-06, + "loss": 0.4307, + "step": 46128 + }, + { + "epoch": 1.18, + "learning_rate": 1.3816350555144192e-06, + "loss": 0.3828, + "step": 46129 + }, + { + "epoch": 1.18, + "learning_rate": 1.3816094792056382e-06, + "loss": 0.4521, + "step": 46130 + }, + { + "epoch": 1.18, + "learning_rate": 1.381583902604677e-06, + "loss": 0.6528, + "step": 46131 + }, + { + "epoch": 1.18, + "learning_rate": 1.3815583257115542e-06, + "loss": 0.8389, + "step": 46132 + }, + { + "epoch": 1.18, + "learning_rate": 1.3815327485262898e-06, + "loss": 0.7021, + "step": 46133 + }, + { + "epoch": 1.18, + "learning_rate": 1.3815071710489033e-06, + "loss": 0.6245, + "step": 46134 + }, + { + "epoch": 1.18, + "learning_rate": 1.3814815932794144e-06, + "loss": 0.7192, + "step": 46135 + }, + { + "epoch": 1.18, + "learning_rate": 1.3814560152178425e-06, + "loss": 0.6797, + "step": 46136 + }, + { + "epoch": 1.18, + "learning_rate": 1.3814304368642069e-06, + "loss": 0.6084, + "step": 46137 + }, + { + "epoch": 1.18, + "learning_rate": 1.381404858218528e-06, + "loss": 0.8994, + "step": 46138 + }, + { + "epoch": 1.18, + "learning_rate": 1.3813792792808248e-06, + "loss": 0.7773, + "step": 46139 + }, + { + "epoch": 1.18, + "learning_rate": 1.3813537000511172e-06, + "loss": 0.4563, + "step": 46140 + }, + { + "epoch": 1.18, + "learning_rate": 1.3813281205294246e-06, + "loss": 0.6416, + "step": 46141 + }, + { + "epoch": 1.18, + "learning_rate": 1.3813025407157663e-06, + "loss": 0.5757, + "step": 46142 + }, + { + "epoch": 1.18, + "learning_rate": 1.3812769606101622e-06, + "loss": 0.8057, + "step": 46143 + }, + { + "epoch": 1.18, + "learning_rate": 1.3812513802126322e-06, + "loss": 0.7344, + "step": 46144 + }, + { + "epoch": 1.18, + "learning_rate": 1.3812257995231952e-06, + "loss": 0.6924, + "step": 46145 + }, + { + "epoch": 1.18, + "learning_rate": 1.3812002185418715e-06, + "loss": 0.6953, + "step": 46146 + }, + { + "epoch": 1.18, + "learning_rate": 1.3811746372686801e-06, + "loss": 0.3853, + "step": 46147 + }, + { + "epoch": 1.18, + "learning_rate": 1.3811490557036406e-06, + "loss": 0.5433, + "step": 46148 + }, + { + "epoch": 1.18, + "learning_rate": 1.381123473846773e-06, + "loss": 0.6855, + "step": 46149 + }, + { + "epoch": 1.18, + "learning_rate": 1.3810978916980969e-06, + "loss": 0.5131, + "step": 46150 + }, + { + "epoch": 1.18, + "learning_rate": 1.3810723092576315e-06, + "loss": 0.5811, + "step": 46151 + }, + { + "epoch": 1.18, + "learning_rate": 1.3810467265253964e-06, + "loss": 0.6719, + "step": 46152 + }, + { + "epoch": 1.18, + "learning_rate": 1.3810211435014115e-06, + "loss": 0.6396, + "step": 46153 + }, + { + "epoch": 1.18, + "learning_rate": 1.3809955601856963e-06, + "loss": 0.686, + "step": 46154 + }, + { + "epoch": 1.18, + "learning_rate": 1.38096997657827e-06, + "loss": 0.6733, + "step": 46155 + }, + { + "epoch": 1.18, + "learning_rate": 1.3809443926791526e-06, + "loss": 0.7852, + "step": 46156 + }, + { + "epoch": 1.18, + "learning_rate": 1.3809188084883639e-06, + "loss": 0.7671, + "step": 46157 + }, + { + "epoch": 1.18, + "learning_rate": 1.3808932240059228e-06, + "loss": 0.5449, + "step": 46158 + }, + { + "epoch": 1.18, + "learning_rate": 1.3808676392318494e-06, + "loss": 0.4705, + "step": 46159 + }, + { + "epoch": 1.18, + "learning_rate": 1.3808420541661631e-06, + "loss": 0.7256, + "step": 46160 + }, + { + "epoch": 1.18, + "learning_rate": 1.380816468808884e-06, + "loss": 0.6177, + "step": 46161 + }, + { + "epoch": 1.18, + "learning_rate": 1.3807908831600308e-06, + "loss": 0.6042, + "step": 46162 + }, + { + "epoch": 1.18, + "learning_rate": 1.3807652972196238e-06, + "loss": 0.5913, + "step": 46163 + }, + { + "epoch": 1.18, + "learning_rate": 1.380739710987682e-06, + "loss": 0.6636, + "step": 46164 + }, + { + "epoch": 1.18, + "learning_rate": 1.3807141244642255e-06, + "loss": 0.7358, + "step": 46165 + }, + { + "epoch": 1.18, + "learning_rate": 1.3806885376492736e-06, + "loss": 0.6484, + "step": 46166 + }, + { + "epoch": 1.18, + "learning_rate": 1.3806629505428463e-06, + "loss": 0.6279, + "step": 46167 + }, + { + "epoch": 1.18, + "learning_rate": 1.3806373631449626e-06, + "loss": 0.6118, + "step": 46168 + }, + { + "epoch": 1.18, + "learning_rate": 1.3806117754556423e-06, + "loss": 0.748, + "step": 46169 + }, + { + "epoch": 1.18, + "learning_rate": 1.3805861874749053e-06, + "loss": 0.6318, + "step": 46170 + }, + { + "epoch": 1.18, + "learning_rate": 1.3805605992027709e-06, + "loss": 0.6943, + "step": 46171 + }, + { + "epoch": 1.18, + "learning_rate": 1.3805350106392586e-06, + "loss": 0.6851, + "step": 46172 + }, + { + "epoch": 1.18, + "learning_rate": 1.3805094217843882e-06, + "loss": 0.6216, + "step": 46173 + }, + { + "epoch": 1.18, + "learning_rate": 1.3804838326381791e-06, + "loss": 0.6318, + "step": 46174 + }, + { + "epoch": 1.18, + "learning_rate": 1.3804582432006513e-06, + "loss": 0.585, + "step": 46175 + }, + { + "epoch": 1.18, + "learning_rate": 1.380432653471824e-06, + "loss": 0.6108, + "step": 46176 + }, + { + "epoch": 1.18, + "learning_rate": 1.3804070634517168e-06, + "loss": 0.7344, + "step": 46177 + }, + { + "epoch": 1.18, + "learning_rate": 1.3803814731403495e-06, + "loss": 0.5537, + "step": 46178 + }, + { + "epoch": 1.18, + "learning_rate": 1.3803558825377416e-06, + "loss": 0.5952, + "step": 46179 + }, + { + "epoch": 1.18, + "learning_rate": 1.3803302916439128e-06, + "loss": 0.6484, + "step": 46180 + }, + { + "epoch": 1.18, + "learning_rate": 1.3803047004588827e-06, + "loss": 0.7231, + "step": 46181 + }, + { + "epoch": 1.18, + "learning_rate": 1.3802791089826704e-06, + "loss": 0.7549, + "step": 46182 + }, + { + "epoch": 1.18, + "learning_rate": 1.380253517215296e-06, + "loss": 0.6416, + "step": 46183 + }, + { + "epoch": 1.18, + "learning_rate": 1.380227925156779e-06, + "loss": 0.4795, + "step": 46184 + }, + { + "epoch": 1.18, + "learning_rate": 1.3802023328071389e-06, + "loss": 0.6587, + "step": 46185 + }, + { + "epoch": 1.18, + "learning_rate": 1.3801767401663956e-06, + "loss": 0.6021, + "step": 46186 + }, + { + "epoch": 1.18, + "learning_rate": 1.3801511472345683e-06, + "loss": 0.7129, + "step": 46187 + }, + { + "epoch": 1.18, + "learning_rate": 1.3801255540116764e-06, + "loss": 0.6396, + "step": 46188 + }, + { + "epoch": 1.18, + "learning_rate": 1.3800999604977403e-06, + "loss": 0.6709, + "step": 46189 + }, + { + "epoch": 1.18, + "learning_rate": 1.380074366692779e-06, + "loss": 0.4937, + "step": 46190 + }, + { + "epoch": 1.18, + "learning_rate": 1.3800487725968122e-06, + "loss": 0.7441, + "step": 46191 + }, + { + "epoch": 1.18, + "learning_rate": 1.3800231782098598e-06, + "loss": 0.6104, + "step": 46192 + }, + { + "epoch": 1.18, + "learning_rate": 1.3799975835319407e-06, + "loss": 0.7114, + "step": 46193 + }, + { + "epoch": 1.18, + "learning_rate": 1.3799719885630753e-06, + "loss": 0.6311, + "step": 46194 + }, + { + "epoch": 1.18, + "learning_rate": 1.3799463933032822e-06, + "loss": 0.5425, + "step": 46195 + }, + { + "epoch": 1.18, + "learning_rate": 1.3799207977525825e-06, + "loss": 0.6934, + "step": 46196 + }, + { + "epoch": 1.18, + "learning_rate": 1.3798952019109945e-06, + "loss": 0.6875, + "step": 46197 + }, + { + "epoch": 1.18, + "learning_rate": 1.379869605778538e-06, + "loss": 0.593, + "step": 46198 + }, + { + "epoch": 1.18, + "learning_rate": 1.379844009355233e-06, + "loss": 0.5986, + "step": 46199 + }, + { + "epoch": 1.18, + "learning_rate": 1.3798184126410987e-06, + "loss": 0.6099, + "step": 46200 + }, + { + "epoch": 1.18, + "learning_rate": 1.3797928156361552e-06, + "loss": 0.4824, + "step": 46201 + }, + { + "epoch": 1.18, + "learning_rate": 1.3797672183404217e-06, + "loss": 0.7959, + "step": 46202 + }, + { + "epoch": 1.18, + "learning_rate": 1.3797416207539179e-06, + "loss": 0.748, + "step": 46203 + }, + { + "epoch": 1.18, + "learning_rate": 1.3797160228766634e-06, + "loss": 0.7295, + "step": 46204 + }, + { + "epoch": 1.18, + "learning_rate": 1.3796904247086776e-06, + "loss": 0.5879, + "step": 46205 + }, + { + "epoch": 1.18, + "learning_rate": 1.3796648262499808e-06, + "loss": 0.6167, + "step": 46206 + }, + { + "epoch": 1.18, + "learning_rate": 1.3796392275005918e-06, + "loss": 0.6797, + "step": 46207 + }, + { + "epoch": 1.18, + "learning_rate": 1.37961362846053e-06, + "loss": 0.6211, + "step": 46208 + }, + { + "epoch": 1.18, + "learning_rate": 1.3795880291298162e-06, + "loss": 0.7129, + "step": 46209 + }, + { + "epoch": 1.18, + "learning_rate": 1.379562429508469e-06, + "loss": 0.4956, + "step": 46210 + }, + { + "epoch": 1.18, + "learning_rate": 1.379536829596509e-06, + "loss": 0.7686, + "step": 46211 + }, + { + "epoch": 1.18, + "learning_rate": 1.3795112293939542e-06, + "loss": 0.7852, + "step": 46212 + }, + { + "epoch": 1.18, + "learning_rate": 1.3794856289008255e-06, + "loss": 0.5259, + "step": 46213 + }, + { + "epoch": 1.18, + "learning_rate": 1.3794600281171418e-06, + "loss": 0.6953, + "step": 46214 + }, + { + "epoch": 1.18, + "learning_rate": 1.3794344270429235e-06, + "loss": 0.7017, + "step": 46215 + }, + { + "epoch": 1.18, + "learning_rate": 1.3794088256781892e-06, + "loss": 0.6621, + "step": 46216 + }, + { + "epoch": 1.18, + "learning_rate": 1.3793832240229595e-06, + "loss": 0.6934, + "step": 46217 + }, + { + "epoch": 1.18, + "learning_rate": 1.3793576220772529e-06, + "loss": 0.8701, + "step": 46218 + }, + { + "epoch": 1.18, + "learning_rate": 1.37933201984109e-06, + "loss": 0.686, + "step": 46219 + }, + { + "epoch": 1.18, + "learning_rate": 1.37930641731449e-06, + "loss": 0.6577, + "step": 46220 + }, + { + "epoch": 1.18, + "learning_rate": 1.3792808144974725e-06, + "loss": 0.6582, + "step": 46221 + }, + { + "epoch": 1.18, + "learning_rate": 1.3792552113900571e-06, + "loss": 0.6797, + "step": 46222 + }, + { + "epoch": 1.18, + "learning_rate": 1.3792296079922633e-06, + "loss": 0.7402, + "step": 46223 + }, + { + "epoch": 1.18, + "learning_rate": 1.379204004304111e-06, + "loss": 0.5576, + "step": 46224 + }, + { + "epoch": 1.18, + "learning_rate": 1.3791784003256196e-06, + "loss": 0.6328, + "step": 46225 + }, + { + "epoch": 1.18, + "learning_rate": 1.3791527960568087e-06, + "loss": 0.833, + "step": 46226 + }, + { + "epoch": 1.18, + "learning_rate": 1.379127191497698e-06, + "loss": 0.7759, + "step": 46227 + }, + { + "epoch": 1.18, + "learning_rate": 1.379101586648307e-06, + "loss": 0.7017, + "step": 46228 + }, + { + "epoch": 1.18, + "learning_rate": 1.3790759815086552e-06, + "loss": 0.5684, + "step": 46229 + }, + { + "epoch": 1.18, + "learning_rate": 1.3790503760787627e-06, + "loss": 0.5352, + "step": 46230 + }, + { + "epoch": 1.18, + "learning_rate": 1.3790247703586487e-06, + "loss": 0.5864, + "step": 46231 + }, + { + "epoch": 1.18, + "learning_rate": 1.3789991643483325e-06, + "loss": 0.7158, + "step": 46232 + }, + { + "epoch": 1.18, + "learning_rate": 1.3789735580478343e-06, + "loss": 0.5815, + "step": 46233 + }, + { + "epoch": 1.19, + "learning_rate": 1.3789479514571736e-06, + "loss": 0.626, + "step": 46234 + }, + { + "epoch": 1.19, + "learning_rate": 1.3789223445763695e-06, + "loss": 0.7549, + "step": 46235 + }, + { + "epoch": 1.19, + "learning_rate": 1.3788967374054424e-06, + "loss": 0.7686, + "step": 46236 + }, + { + "epoch": 1.19, + "learning_rate": 1.3788711299444113e-06, + "loss": 0.603, + "step": 46237 + }, + { + "epoch": 1.19, + "learning_rate": 1.3788455221932959e-06, + "loss": 0.6265, + "step": 46238 + }, + { + "epoch": 1.19, + "learning_rate": 1.378819914152116e-06, + "loss": 0.6689, + "step": 46239 + }, + { + "epoch": 1.19, + "learning_rate": 1.3787943058208912e-06, + "loss": 0.4475, + "step": 46240 + }, + { + "epoch": 1.19, + "learning_rate": 1.378768697199641e-06, + "loss": 0.6807, + "step": 46241 + }, + { + "epoch": 1.19, + "learning_rate": 1.3787430882883851e-06, + "loss": 0.7783, + "step": 46242 + }, + { + "epoch": 1.19, + "learning_rate": 1.3787174790871428e-06, + "loss": 0.668, + "step": 46243 + }, + { + "epoch": 1.19, + "learning_rate": 1.378691869595934e-06, + "loss": 0.6362, + "step": 46244 + }, + { + "epoch": 1.19, + "learning_rate": 1.3786662598147783e-06, + "loss": 0.687, + "step": 46245 + }, + { + "epoch": 1.19, + "learning_rate": 1.3786406497436951e-06, + "loss": 0.5752, + "step": 46246 + }, + { + "epoch": 1.19, + "learning_rate": 1.3786150393827044e-06, + "loss": 0.6992, + "step": 46247 + }, + { + "epoch": 1.19, + "learning_rate": 1.3785894287318255e-06, + "loss": 0.4724, + "step": 46248 + }, + { + "epoch": 1.19, + "learning_rate": 1.378563817791078e-06, + "loss": 0.6177, + "step": 46249 + }, + { + "epoch": 1.19, + "learning_rate": 1.3785382065604816e-06, + "loss": 0.5898, + "step": 46250 + }, + { + "epoch": 1.19, + "learning_rate": 1.378512595040056e-06, + "loss": 0.8047, + "step": 46251 + }, + { + "epoch": 1.19, + "learning_rate": 1.3784869832298205e-06, + "loss": 0.6655, + "step": 46252 + }, + { + "epoch": 1.19, + "learning_rate": 1.3784613711297953e-06, + "loss": 0.666, + "step": 46253 + }, + { + "epoch": 1.19, + "learning_rate": 1.378435758739999e-06, + "loss": 0.5156, + "step": 46254 + }, + { + "epoch": 1.19, + "learning_rate": 1.3784101460604527e-06, + "loss": 0.7432, + "step": 46255 + }, + { + "epoch": 1.19, + "learning_rate": 1.3783845330911745e-06, + "loss": 0.5151, + "step": 46256 + }, + { + "epoch": 1.19, + "learning_rate": 1.378358919832185e-06, + "loss": 0.6177, + "step": 46257 + }, + { + "epoch": 1.19, + "learning_rate": 1.378333306283503e-06, + "loss": 0.6431, + "step": 46258 + }, + { + "epoch": 1.19, + "learning_rate": 1.378307692445149e-06, + "loss": 0.6523, + "step": 46259 + }, + { + "epoch": 1.19, + "learning_rate": 1.3782820783171423e-06, + "loss": 0.583, + "step": 46260 + }, + { + "epoch": 1.19, + "learning_rate": 1.3782564638995021e-06, + "loss": 0.6079, + "step": 46261 + }, + { + "epoch": 1.19, + "learning_rate": 1.3782308491922485e-06, + "loss": 0.5913, + "step": 46262 + }, + { + "epoch": 1.19, + "learning_rate": 1.3782052341954009e-06, + "loss": 0.6006, + "step": 46263 + }, + { + "epoch": 1.19, + "learning_rate": 1.3781796189089788e-06, + "loss": 0.5684, + "step": 46264 + }, + { + "epoch": 1.19, + "learning_rate": 1.3781540033330022e-06, + "loss": 0.5913, + "step": 46265 + }, + { + "epoch": 1.19, + "learning_rate": 1.3781283874674903e-06, + "loss": 0.7725, + "step": 46266 + }, + { + "epoch": 1.19, + "learning_rate": 1.3781027713124628e-06, + "loss": 0.6865, + "step": 46267 + }, + { + "epoch": 1.19, + "learning_rate": 1.3780771548679395e-06, + "loss": 0.6553, + "step": 46268 + }, + { + "epoch": 1.19, + "learning_rate": 1.3780515381339402e-06, + "loss": 0.479, + "step": 46269 + }, + { + "epoch": 1.19, + "learning_rate": 1.3780259211104839e-06, + "loss": 0.6538, + "step": 46270 + }, + { + "epoch": 1.19, + "learning_rate": 1.3780003037975903e-06, + "loss": 0.7021, + "step": 46271 + }, + { + "epoch": 1.19, + "learning_rate": 1.3779746861952797e-06, + "loss": 0.4985, + "step": 46272 + }, + { + "epoch": 1.19, + "learning_rate": 1.3779490683035708e-06, + "loss": 0.665, + "step": 46273 + }, + { + "epoch": 1.19, + "learning_rate": 1.377923450122484e-06, + "loss": 0.6455, + "step": 46274 + }, + { + "epoch": 1.19, + "learning_rate": 1.3778978316520386e-06, + "loss": 0.6382, + "step": 46275 + }, + { + "epoch": 1.19, + "learning_rate": 1.3778722128922545e-06, + "loss": 0.5172, + "step": 46276 + }, + { + "epoch": 1.19, + "learning_rate": 1.3778465938431505e-06, + "loss": 0.6484, + "step": 46277 + }, + { + "epoch": 1.19, + "learning_rate": 1.377820974504747e-06, + "loss": 0.584, + "step": 46278 + }, + { + "epoch": 1.19, + "learning_rate": 1.377795354877063e-06, + "loss": 0.6033, + "step": 46279 + }, + { + "epoch": 1.19, + "learning_rate": 1.377769734960119e-06, + "loss": 0.5352, + "step": 46280 + }, + { + "epoch": 1.19, + "learning_rate": 1.3777441147539338e-06, + "loss": 0.667, + "step": 46281 + }, + { + "epoch": 1.19, + "learning_rate": 1.377718494258527e-06, + "loss": 0.5796, + "step": 46282 + }, + { + "epoch": 1.19, + "learning_rate": 1.377692873473919e-06, + "loss": 0.5571, + "step": 46283 + }, + { + "epoch": 1.19, + "learning_rate": 1.377667252400129e-06, + "loss": 0.7285, + "step": 46284 + }, + { + "epoch": 1.19, + "learning_rate": 1.3776416310371762e-06, + "loss": 0.5615, + "step": 46285 + }, + { + "epoch": 1.19, + "learning_rate": 1.3776160093850808e-06, + "loss": 0.749, + "step": 46286 + }, + { + "epoch": 1.19, + "learning_rate": 1.377590387443862e-06, + "loss": 0.7324, + "step": 46287 + }, + { + "epoch": 1.19, + "learning_rate": 1.3775647652135397e-06, + "loss": 0.7773, + "step": 46288 + }, + { + "epoch": 1.19, + "learning_rate": 1.3775391426941332e-06, + "loss": 0.5967, + "step": 46289 + }, + { + "epoch": 1.19, + "learning_rate": 1.3775135198856625e-06, + "loss": 0.667, + "step": 46290 + }, + { + "epoch": 1.19, + "learning_rate": 1.377487896788147e-06, + "loss": 0.625, + "step": 46291 + }, + { + "epoch": 1.19, + "learning_rate": 1.3774622734016067e-06, + "loss": 0.6436, + "step": 46292 + }, + { + "epoch": 1.19, + "learning_rate": 1.3774366497260605e-06, + "loss": 0.7148, + "step": 46293 + }, + { + "epoch": 1.19, + "learning_rate": 1.3774110257615286e-06, + "loss": 0.834, + "step": 46294 + }, + { + "epoch": 1.19, + "learning_rate": 1.3773854015080307e-06, + "loss": 0.5376, + "step": 46295 + }, + { + "epoch": 1.19, + "learning_rate": 1.3773597769655855e-06, + "loss": 0.585, + "step": 46296 + }, + { + "epoch": 1.19, + "learning_rate": 1.3773341521342138e-06, + "loss": 0.6597, + "step": 46297 + }, + { + "epoch": 1.19, + "learning_rate": 1.3773085270139344e-06, + "loss": 0.7354, + "step": 46298 + }, + { + "epoch": 1.19, + "learning_rate": 1.3772829016047674e-06, + "loss": 0.3857, + "step": 46299 + }, + { + "epoch": 1.19, + "learning_rate": 1.3772572759067323e-06, + "loss": 0.9062, + "step": 46300 + }, + { + "epoch": 1.19, + "learning_rate": 1.3772316499198484e-06, + "loss": 0.5396, + "step": 46301 + }, + { + "epoch": 1.19, + "learning_rate": 1.3772060236441356e-06, + "loss": 0.4641, + "step": 46302 + }, + { + "epoch": 1.19, + "learning_rate": 1.3771803970796135e-06, + "loss": 0.7031, + "step": 46303 + }, + { + "epoch": 1.19, + "learning_rate": 1.3771547702263018e-06, + "loss": 0.7852, + "step": 46304 + }, + { + "epoch": 1.19, + "learning_rate": 1.3771291430842203e-06, + "loss": 0.4868, + "step": 46305 + }, + { + "epoch": 1.19, + "learning_rate": 1.377103515653388e-06, + "loss": 0.6357, + "step": 46306 + }, + { + "epoch": 1.19, + "learning_rate": 1.3770778879338249e-06, + "loss": 0.6533, + "step": 46307 + }, + { + "epoch": 1.19, + "learning_rate": 1.3770522599255504e-06, + "loss": 0.6621, + "step": 46308 + }, + { + "epoch": 1.19, + "learning_rate": 1.377026631628585e-06, + "loss": 0.5723, + "step": 46309 + }, + { + "epoch": 1.19, + "learning_rate": 1.3770010030429472e-06, + "loss": 0.6641, + "step": 46310 + }, + { + "epoch": 1.19, + "learning_rate": 1.3769753741686567e-06, + "loss": 0.5914, + "step": 46311 + }, + { + "epoch": 1.19, + "learning_rate": 1.3769497450057338e-06, + "loss": 0.5479, + "step": 46312 + }, + { + "epoch": 1.19, + "learning_rate": 1.376924115554198e-06, + "loss": 0.4705, + "step": 46313 + }, + { + "epoch": 1.19, + "learning_rate": 1.3768984858140686e-06, + "loss": 0.71, + "step": 46314 + }, + { + "epoch": 1.19, + "learning_rate": 1.3768728557853653e-06, + "loss": 0.6177, + "step": 46315 + }, + { + "epoch": 1.19, + "learning_rate": 1.376847225468108e-06, + "loss": 0.6709, + "step": 46316 + }, + { + "epoch": 1.19, + "learning_rate": 1.3768215948623158e-06, + "loss": 0.613, + "step": 46317 + }, + { + "epoch": 1.19, + "learning_rate": 1.376795963968009e-06, + "loss": 0.8154, + "step": 46318 + }, + { + "epoch": 1.19, + "learning_rate": 1.3767703327852066e-06, + "loss": 0.666, + "step": 46319 + }, + { + "epoch": 1.19, + "learning_rate": 1.3767447013139286e-06, + "loss": 0.8779, + "step": 46320 + }, + { + "epoch": 1.19, + "learning_rate": 1.3767190695541943e-06, + "loss": 0.6494, + "step": 46321 + }, + { + "epoch": 1.19, + "learning_rate": 1.3766934375060237e-06, + "loss": 0.7793, + "step": 46322 + }, + { + "epoch": 1.19, + "learning_rate": 1.3766678051694363e-06, + "loss": 0.3867, + "step": 46323 + }, + { + "epoch": 1.19, + "learning_rate": 1.3766421725444516e-06, + "loss": 0.6082, + "step": 46324 + }, + { + "epoch": 1.19, + "learning_rate": 1.3766165396310894e-06, + "loss": 0.4414, + "step": 46325 + }, + { + "epoch": 1.19, + "learning_rate": 1.376590906429369e-06, + "loss": 0.7344, + "step": 46326 + }, + { + "epoch": 1.19, + "learning_rate": 1.3765652729393105e-06, + "loss": 0.5479, + "step": 46327 + }, + { + "epoch": 1.19, + "learning_rate": 1.3765396391609333e-06, + "loss": 0.6938, + "step": 46328 + }, + { + "epoch": 1.19, + "learning_rate": 1.3765140050942567e-06, + "loss": 0.7188, + "step": 46329 + }, + { + "epoch": 1.19, + "learning_rate": 1.376488370739301e-06, + "loss": 0.499, + "step": 46330 + }, + { + "epoch": 1.19, + "learning_rate": 1.3764627360960853e-06, + "loss": 0.5615, + "step": 46331 + }, + { + "epoch": 1.19, + "learning_rate": 1.3764371011646294e-06, + "loss": 0.6074, + "step": 46332 + }, + { + "epoch": 1.19, + "learning_rate": 1.3764114659449528e-06, + "loss": 0.5171, + "step": 46333 + }, + { + "epoch": 1.19, + "learning_rate": 1.3763858304370755e-06, + "loss": 0.4863, + "step": 46334 + }, + { + "epoch": 1.19, + "learning_rate": 1.3763601946410168e-06, + "loss": 0.708, + "step": 46335 + }, + { + "epoch": 1.19, + "learning_rate": 1.3763345585567963e-06, + "loss": 0.5132, + "step": 46336 + }, + { + "epoch": 1.19, + "learning_rate": 1.3763089221844338e-06, + "loss": 0.6309, + "step": 46337 + }, + { + "epoch": 1.19, + "learning_rate": 1.3762832855239486e-06, + "loss": 0.564, + "step": 46338 + }, + { + "epoch": 1.19, + "learning_rate": 1.376257648575361e-06, + "loss": 0.6611, + "step": 46339 + }, + { + "epoch": 1.19, + "learning_rate": 1.37623201133869e-06, + "loss": 0.464, + "step": 46340 + }, + { + "epoch": 1.19, + "learning_rate": 1.3762063738139554e-06, + "loss": 0.6709, + "step": 46341 + }, + { + "epoch": 1.19, + "learning_rate": 1.376180736001177e-06, + "loss": 0.5986, + "step": 46342 + }, + { + "epoch": 1.19, + "learning_rate": 1.3761550979003743e-06, + "loss": 0.7373, + "step": 46343 + }, + { + "epoch": 1.19, + "learning_rate": 1.376129459511567e-06, + "loss": 0.7666, + "step": 46344 + }, + { + "epoch": 1.19, + "learning_rate": 1.3761038208347748e-06, + "loss": 0.7964, + "step": 46345 + }, + { + "epoch": 1.19, + "learning_rate": 1.376078181870017e-06, + "loss": 0.665, + "step": 46346 + }, + { + "epoch": 1.19, + "learning_rate": 1.3760525426173132e-06, + "loss": 0.7969, + "step": 46347 + }, + { + "epoch": 1.19, + "learning_rate": 1.3760269030766835e-06, + "loss": 0.7539, + "step": 46348 + }, + { + "epoch": 1.19, + "learning_rate": 1.3760012632481473e-06, + "loss": 0.6567, + "step": 46349 + }, + { + "epoch": 1.19, + "learning_rate": 1.3759756231317242e-06, + "loss": 0.6602, + "step": 46350 + }, + { + "epoch": 1.19, + "learning_rate": 1.3759499827274339e-06, + "loss": 0.7217, + "step": 46351 + }, + { + "epoch": 1.19, + "learning_rate": 1.3759243420352959e-06, + "loss": 0.6357, + "step": 46352 + }, + { + "epoch": 1.19, + "learning_rate": 1.37589870105533e-06, + "loss": 0.7148, + "step": 46353 + }, + { + "epoch": 1.19, + "learning_rate": 1.3758730597875556e-06, + "loss": 0.3622, + "step": 46354 + }, + { + "epoch": 1.19, + "learning_rate": 1.3758474182319927e-06, + "loss": 0.8242, + "step": 46355 + }, + { + "epoch": 1.19, + "learning_rate": 1.3758217763886607e-06, + "loss": 0.5908, + "step": 46356 + }, + { + "epoch": 1.19, + "learning_rate": 1.3757961342575789e-06, + "loss": 0.5151, + "step": 46357 + }, + { + "epoch": 1.19, + "learning_rate": 1.3757704918387676e-06, + "loss": 0.5889, + "step": 46358 + }, + { + "epoch": 1.19, + "learning_rate": 1.3757448491322462e-06, + "loss": 0.7725, + "step": 46359 + }, + { + "epoch": 1.19, + "learning_rate": 1.375719206138034e-06, + "loss": 0.5466, + "step": 46360 + }, + { + "epoch": 1.19, + "learning_rate": 1.3756935628561508e-06, + "loss": 0.8428, + "step": 46361 + }, + { + "epoch": 1.19, + "learning_rate": 1.3756679192866165e-06, + "loss": 0.8096, + "step": 46362 + }, + { + "epoch": 1.19, + "learning_rate": 1.3756422754294503e-06, + "loss": 0.6909, + "step": 46363 + }, + { + "epoch": 1.19, + "learning_rate": 1.3756166312846724e-06, + "loss": 0.6143, + "step": 46364 + }, + { + "epoch": 1.19, + "learning_rate": 1.375590986852302e-06, + "loss": 0.667, + "step": 46365 + }, + { + "epoch": 1.19, + "learning_rate": 1.3755653421323591e-06, + "loss": 0.6484, + "step": 46366 + }, + { + "epoch": 1.19, + "learning_rate": 1.3755396971248627e-06, + "loss": 0.7412, + "step": 46367 + }, + { + "epoch": 1.19, + "learning_rate": 1.3755140518298331e-06, + "loss": 0.4711, + "step": 46368 + }, + { + "epoch": 1.19, + "learning_rate": 1.3754884062472894e-06, + "loss": 0.6543, + "step": 46369 + }, + { + "epoch": 1.19, + "learning_rate": 1.375462760377252e-06, + "loss": 0.6279, + "step": 46370 + }, + { + "epoch": 1.19, + "learning_rate": 1.3754371142197394e-06, + "loss": 0.7305, + "step": 46371 + }, + { + "epoch": 1.19, + "learning_rate": 1.3754114677747721e-06, + "loss": 0.5688, + "step": 46372 + }, + { + "epoch": 1.19, + "learning_rate": 1.3753858210423693e-06, + "loss": 0.6875, + "step": 46373 + }, + { + "epoch": 1.19, + "learning_rate": 1.3753601740225514e-06, + "loss": 0.6836, + "step": 46374 + }, + { + "epoch": 1.19, + "learning_rate": 1.3753345267153372e-06, + "loss": 0.6699, + "step": 46375 + }, + { + "epoch": 1.19, + "learning_rate": 1.3753088791207466e-06, + "loss": 0.6748, + "step": 46376 + }, + { + "epoch": 1.19, + "learning_rate": 1.375283231238799e-06, + "loss": 0.7227, + "step": 46377 + }, + { + "epoch": 1.19, + "learning_rate": 1.3752575830695145e-06, + "loss": 0.667, + "step": 46378 + }, + { + "epoch": 1.19, + "learning_rate": 1.3752319346129124e-06, + "loss": 0.6716, + "step": 46379 + }, + { + "epoch": 1.19, + "learning_rate": 1.3752062858690126e-06, + "loss": 0.6538, + "step": 46380 + }, + { + "epoch": 1.19, + "learning_rate": 1.3751806368378346e-06, + "loss": 0.5703, + "step": 46381 + }, + { + "epoch": 1.19, + "learning_rate": 1.375154987519398e-06, + "loss": 0.6641, + "step": 46382 + }, + { + "epoch": 1.19, + "learning_rate": 1.3751293379137226e-06, + "loss": 0.8145, + "step": 46383 + }, + { + "epoch": 1.19, + "learning_rate": 1.3751036880208275e-06, + "loss": 0.7168, + "step": 46384 + }, + { + "epoch": 1.19, + "learning_rate": 1.3750780378407334e-06, + "loss": 0.584, + "step": 46385 + }, + { + "epoch": 1.19, + "learning_rate": 1.3750523873734587e-06, + "loss": 0.5604, + "step": 46386 + }, + { + "epoch": 1.19, + "learning_rate": 1.375026736619024e-06, + "loss": 0.7227, + "step": 46387 + }, + { + "epoch": 1.19, + "learning_rate": 1.3750010855774484e-06, + "loss": 0.5801, + "step": 46388 + }, + { + "epoch": 1.19, + "learning_rate": 1.3749754342487516e-06, + "loss": 0.7168, + "step": 46389 + }, + { + "epoch": 1.19, + "learning_rate": 1.3749497826329538e-06, + "loss": 0.7129, + "step": 46390 + }, + { + "epoch": 1.19, + "learning_rate": 1.3749241307300738e-06, + "loss": 0.5906, + "step": 46391 + }, + { + "epoch": 1.19, + "learning_rate": 1.3748984785401317e-06, + "loss": 0.4727, + "step": 46392 + }, + { + "epoch": 1.19, + "learning_rate": 1.374872826063147e-06, + "loss": 0.749, + "step": 46393 + }, + { + "epoch": 1.19, + "learning_rate": 1.3748471732991393e-06, + "loss": 0.5818, + "step": 46394 + }, + { + "epoch": 1.19, + "learning_rate": 1.374821520248129e-06, + "loss": 0.6768, + "step": 46395 + }, + { + "epoch": 1.19, + "learning_rate": 1.3747958669101346e-06, + "loss": 0.5884, + "step": 46396 + }, + { + "epoch": 1.19, + "learning_rate": 1.3747702132851763e-06, + "loss": 0.7678, + "step": 46397 + }, + { + "epoch": 1.19, + "learning_rate": 1.3747445593732736e-06, + "loss": 0.6084, + "step": 46398 + }, + { + "epoch": 1.19, + "learning_rate": 1.3747189051744462e-06, + "loss": 0.668, + "step": 46399 + }, + { + "epoch": 1.19, + "learning_rate": 1.374693250688714e-06, + "loss": 0.7153, + "step": 46400 + }, + { + "epoch": 1.19, + "learning_rate": 1.3746675959160962e-06, + "loss": 0.6963, + "step": 46401 + }, + { + "epoch": 1.19, + "learning_rate": 1.3746419408566127e-06, + "loss": 0.6079, + "step": 46402 + }, + { + "epoch": 1.19, + "learning_rate": 1.3746162855102832e-06, + "loss": 0.6523, + "step": 46403 + }, + { + "epoch": 1.19, + "learning_rate": 1.3745906298771273e-06, + "loss": 0.7139, + "step": 46404 + }, + { + "epoch": 1.19, + "learning_rate": 1.3745649739571642e-06, + "loss": 0.7705, + "step": 46405 + }, + { + "epoch": 1.19, + "learning_rate": 1.3745393177504144e-06, + "loss": 0.7446, + "step": 46406 + }, + { + "epoch": 1.19, + "learning_rate": 1.3745136612568967e-06, + "loss": 0.6611, + "step": 46407 + }, + { + "epoch": 1.19, + "learning_rate": 1.3744880044766314e-06, + "loss": 0.6255, + "step": 46408 + }, + { + "epoch": 1.19, + "learning_rate": 1.3744623474096374e-06, + "loss": 0.6079, + "step": 46409 + }, + { + "epoch": 1.19, + "learning_rate": 1.3744366900559353e-06, + "loss": 0.6572, + "step": 46410 + }, + { + "epoch": 1.19, + "learning_rate": 1.3744110324155441e-06, + "loss": 0.5571, + "step": 46411 + }, + { + "epoch": 1.19, + "learning_rate": 1.3743853744884835e-06, + "loss": 0.5903, + "step": 46412 + }, + { + "epoch": 1.19, + "learning_rate": 1.3743597162747732e-06, + "loss": 0.6968, + "step": 46413 + }, + { + "epoch": 1.19, + "learning_rate": 1.3743340577744328e-06, + "loss": 0.5469, + "step": 46414 + }, + { + "epoch": 1.19, + "learning_rate": 1.3743083989874823e-06, + "loss": 0.7842, + "step": 46415 + }, + { + "epoch": 1.19, + "learning_rate": 1.3742827399139412e-06, + "loss": 0.6177, + "step": 46416 + }, + { + "epoch": 1.19, + "learning_rate": 1.3742570805538285e-06, + "loss": 0.4458, + "step": 46417 + }, + { + "epoch": 1.19, + "learning_rate": 1.3742314209071646e-06, + "loss": 0.6348, + "step": 46418 + }, + { + "epoch": 1.19, + "learning_rate": 1.3742057609739687e-06, + "loss": 0.6875, + "step": 46419 + }, + { + "epoch": 1.19, + "learning_rate": 1.374180100754261e-06, + "loss": 0.7915, + "step": 46420 + }, + { + "epoch": 1.19, + "learning_rate": 1.3741544402480606e-06, + "loss": 0.8682, + "step": 46421 + }, + { + "epoch": 1.19, + "learning_rate": 1.3741287794553878e-06, + "loss": 0.5703, + "step": 46422 + }, + { + "epoch": 1.19, + "learning_rate": 1.3741031183762611e-06, + "loss": 0.6357, + "step": 46423 + }, + { + "epoch": 1.19, + "learning_rate": 1.3740774570107012e-06, + "loss": 0.708, + "step": 46424 + }, + { + "epoch": 1.19, + "learning_rate": 1.3740517953587274e-06, + "loss": 0.6885, + "step": 46425 + }, + { + "epoch": 1.19, + "learning_rate": 1.3740261334203593e-06, + "loss": 0.5391, + "step": 46426 + }, + { + "epoch": 1.19, + "learning_rate": 1.3740004711956166e-06, + "loss": 0.5996, + "step": 46427 + }, + { + "epoch": 1.19, + "learning_rate": 1.3739748086845189e-06, + "loss": 0.4547, + "step": 46428 + }, + { + "epoch": 1.19, + "learning_rate": 1.373949145887086e-06, + "loss": 0.6958, + "step": 46429 + }, + { + "epoch": 1.19, + "learning_rate": 1.3739234828033372e-06, + "loss": 0.7354, + "step": 46430 + }, + { + "epoch": 1.19, + "learning_rate": 1.3738978194332926e-06, + "loss": 0.6592, + "step": 46431 + }, + { + "epoch": 1.19, + "learning_rate": 1.3738721557769715e-06, + "loss": 0.5762, + "step": 46432 + }, + { + "epoch": 1.19, + "learning_rate": 1.3738464918343938e-06, + "loss": 0.7656, + "step": 46433 + }, + { + "epoch": 1.19, + "learning_rate": 1.373820827605579e-06, + "loss": 0.6304, + "step": 46434 + }, + { + "epoch": 1.19, + "learning_rate": 1.373795163090547e-06, + "loss": 0.6333, + "step": 46435 + }, + { + "epoch": 1.19, + "learning_rate": 1.3737694982893166e-06, + "loss": 0.7476, + "step": 46436 + }, + { + "epoch": 1.19, + "learning_rate": 1.3737438332019085e-06, + "loss": 0.7368, + "step": 46437 + }, + { + "epoch": 1.19, + "learning_rate": 1.373718167828342e-06, + "loss": 0.582, + "step": 46438 + }, + { + "epoch": 1.19, + "learning_rate": 1.3736925021686366e-06, + "loss": 0.9189, + "step": 46439 + }, + { + "epoch": 1.19, + "learning_rate": 1.3736668362228119e-06, + "loss": 0.6172, + "step": 46440 + }, + { + "epoch": 1.19, + "learning_rate": 1.373641169990888e-06, + "loss": 0.6675, + "step": 46441 + }, + { + "epoch": 1.19, + "learning_rate": 1.3736155034728838e-06, + "loss": 0.5894, + "step": 46442 + }, + { + "epoch": 1.19, + "learning_rate": 1.3735898366688196e-06, + "loss": 0.5884, + "step": 46443 + }, + { + "epoch": 1.19, + "learning_rate": 1.3735641695787147e-06, + "loss": 0.5874, + "step": 46444 + }, + { + "epoch": 1.19, + "learning_rate": 1.373538502202589e-06, + "loss": 0.564, + "step": 46445 + }, + { + "epoch": 1.19, + "learning_rate": 1.3735128345404623e-06, + "loss": 0.7559, + "step": 46446 + }, + { + "epoch": 1.19, + "learning_rate": 1.3734871665923537e-06, + "loss": 0.563, + "step": 46447 + }, + { + "epoch": 1.19, + "learning_rate": 1.3734614983582832e-06, + "loss": 0.6323, + "step": 46448 + }, + { + "epoch": 1.19, + "learning_rate": 1.3734358298382707e-06, + "loss": 0.707, + "step": 46449 + }, + { + "epoch": 1.19, + "learning_rate": 1.3734101610323352e-06, + "loss": 0.8271, + "step": 46450 + }, + { + "epoch": 1.19, + "learning_rate": 1.373384491940497e-06, + "loss": 0.6416, + "step": 46451 + }, + { + "epoch": 1.19, + "learning_rate": 1.3733588225627752e-06, + "loss": 0.7939, + "step": 46452 + }, + { + "epoch": 1.19, + "learning_rate": 1.3733331528991897e-06, + "loss": 0.54, + "step": 46453 + }, + { + "epoch": 1.19, + "learning_rate": 1.3733074829497601e-06, + "loss": 0.5542, + "step": 46454 + }, + { + "epoch": 1.19, + "learning_rate": 1.3732818127145065e-06, + "loss": 0.7197, + "step": 46455 + }, + { + "epoch": 1.19, + "learning_rate": 1.3732561421934481e-06, + "loss": 0.6523, + "step": 46456 + }, + { + "epoch": 1.19, + "learning_rate": 1.3732304713866044e-06, + "loss": 0.5643, + "step": 46457 + }, + { + "epoch": 1.19, + "learning_rate": 1.3732048002939953e-06, + "loss": 0.6064, + "step": 46458 + }, + { + "epoch": 1.19, + "learning_rate": 1.3731791289156404e-06, + "loss": 0.7812, + "step": 46459 + }, + { + "epoch": 1.19, + "learning_rate": 1.37315345725156e-06, + "loss": 0.71, + "step": 46460 + }, + { + "epoch": 1.19, + "learning_rate": 1.3731277853017723e-06, + "loss": 0.6846, + "step": 46461 + }, + { + "epoch": 1.19, + "learning_rate": 1.3731021130662983e-06, + "loss": 0.8594, + "step": 46462 + }, + { + "epoch": 1.19, + "learning_rate": 1.3730764405451569e-06, + "loss": 0.7471, + "step": 46463 + }, + { + "epoch": 1.19, + "learning_rate": 1.3730507677383684e-06, + "loss": 0.4617, + "step": 46464 + }, + { + "epoch": 1.19, + "learning_rate": 1.3730250946459518e-06, + "loss": 0.6162, + "step": 46465 + }, + { + "epoch": 1.19, + "learning_rate": 1.372999421267927e-06, + "loss": 0.6816, + "step": 46466 + }, + { + "epoch": 1.19, + "learning_rate": 1.372973747604314e-06, + "loss": 0.5654, + "step": 46467 + }, + { + "epoch": 1.19, + "learning_rate": 1.372948073655132e-06, + "loss": 0.6235, + "step": 46468 + }, + { + "epoch": 1.19, + "learning_rate": 1.3729223994204007e-06, + "loss": 0.5713, + "step": 46469 + }, + { + "epoch": 1.19, + "learning_rate": 1.3728967249001398e-06, + "loss": 0.6167, + "step": 46470 + }, + { + "epoch": 1.19, + "learning_rate": 1.3728710500943695e-06, + "loss": 0.646, + "step": 46471 + }, + { + "epoch": 1.19, + "learning_rate": 1.3728453750031084e-06, + "loss": 0.7607, + "step": 46472 + }, + { + "epoch": 1.19, + "learning_rate": 1.372819699626377e-06, + "loss": 0.7393, + "step": 46473 + }, + { + "epoch": 1.19, + "learning_rate": 1.3727940239641944e-06, + "loss": 0.6182, + "step": 46474 + }, + { + "epoch": 1.19, + "learning_rate": 1.3727683480165813e-06, + "loss": 0.5801, + "step": 46475 + }, + { + "epoch": 1.19, + "learning_rate": 1.372742671783556e-06, + "loss": 0.6743, + "step": 46476 + }, + { + "epoch": 1.19, + "learning_rate": 1.372716995265139e-06, + "loss": 0.6294, + "step": 46477 + }, + { + "epoch": 1.19, + "learning_rate": 1.3726913184613493e-06, + "loss": 0.6953, + "step": 46478 + }, + { + "epoch": 1.19, + "learning_rate": 1.3726656413722074e-06, + "loss": 0.5188, + "step": 46479 + }, + { + "epoch": 1.19, + "learning_rate": 1.3726399639977326e-06, + "loss": 0.7549, + "step": 46480 + }, + { + "epoch": 1.19, + "learning_rate": 1.3726142863379447e-06, + "loss": 0.6953, + "step": 46481 + }, + { + "epoch": 1.19, + "learning_rate": 1.3725886083928625e-06, + "loss": 0.7788, + "step": 46482 + }, + { + "epoch": 1.19, + "learning_rate": 1.372562930162507e-06, + "loss": 0.6875, + "step": 46483 + }, + { + "epoch": 1.19, + "learning_rate": 1.3725372516468968e-06, + "loss": 0.4331, + "step": 46484 + }, + { + "epoch": 1.19, + "learning_rate": 1.3725115728460523e-06, + "loss": 0.6855, + "step": 46485 + }, + { + "epoch": 1.19, + "learning_rate": 1.3724858937599924e-06, + "loss": 0.6938, + "step": 46486 + }, + { + "epoch": 1.19, + "learning_rate": 1.3724602143887376e-06, + "loss": 0.4797, + "step": 46487 + }, + { + "epoch": 1.19, + "learning_rate": 1.3724345347323067e-06, + "loss": 0.6475, + "step": 46488 + }, + { + "epoch": 1.19, + "learning_rate": 1.37240885479072e-06, + "loss": 0.7217, + "step": 46489 + }, + { + "epoch": 1.19, + "learning_rate": 1.372383174563997e-06, + "loss": 0.5977, + "step": 46490 + }, + { + "epoch": 1.19, + "learning_rate": 1.3723574940521575e-06, + "loss": 0.7227, + "step": 46491 + }, + { + "epoch": 1.19, + "learning_rate": 1.3723318132552206e-06, + "loss": 0.5747, + "step": 46492 + }, + { + "epoch": 1.19, + "learning_rate": 1.3723061321732066e-06, + "loss": 0.5688, + "step": 46493 + }, + { + "epoch": 1.19, + "learning_rate": 1.372280450806135e-06, + "loss": 0.6855, + "step": 46494 + }, + { + "epoch": 1.19, + "learning_rate": 1.3722547691540252e-06, + "loss": 0.5981, + "step": 46495 + }, + { + "epoch": 1.19, + "learning_rate": 1.372229087216897e-06, + "loss": 0.6494, + "step": 46496 + }, + { + "epoch": 1.19, + "learning_rate": 1.3722034049947701e-06, + "loss": 0.7354, + "step": 46497 + }, + { + "epoch": 1.19, + "learning_rate": 1.3721777224876642e-06, + "loss": 0.6455, + "step": 46498 + }, + { + "epoch": 1.19, + "learning_rate": 1.372152039695599e-06, + "loss": 0.7773, + "step": 46499 + }, + { + "epoch": 1.19, + "learning_rate": 1.3721263566185944e-06, + "loss": 0.6455, + "step": 46500 + }, + { + "epoch": 1.19, + "learning_rate": 1.3721006732566692e-06, + "loss": 0.7065, + "step": 46501 + }, + { + "epoch": 1.19, + "learning_rate": 1.372074989609844e-06, + "loss": 0.6807, + "step": 46502 + }, + { + "epoch": 1.19, + "learning_rate": 1.372049305678138e-06, + "loss": 0.7764, + "step": 46503 + }, + { + "epoch": 1.19, + "learning_rate": 1.3720236214615709e-06, + "loss": 0.7627, + "step": 46504 + }, + { + "epoch": 1.19, + "learning_rate": 1.3719979369601623e-06, + "loss": 0.875, + "step": 46505 + }, + { + "epoch": 1.19, + "learning_rate": 1.3719722521739324e-06, + "loss": 0.6396, + "step": 46506 + }, + { + "epoch": 1.19, + "learning_rate": 1.3719465671028999e-06, + "loss": 0.4226, + "step": 46507 + }, + { + "epoch": 1.19, + "learning_rate": 1.3719208817470854e-06, + "loss": 0.6357, + "step": 46508 + }, + { + "epoch": 1.19, + "learning_rate": 1.3718951961065077e-06, + "loss": 0.6753, + "step": 46509 + }, + { + "epoch": 1.19, + "learning_rate": 1.3718695101811874e-06, + "loss": 0.624, + "step": 46510 + }, + { + "epoch": 1.19, + "learning_rate": 1.3718438239711438e-06, + "loss": 0.6318, + "step": 46511 + }, + { + "epoch": 1.19, + "learning_rate": 1.3718181374763965e-06, + "loss": 0.8262, + "step": 46512 + }, + { + "epoch": 1.19, + "learning_rate": 1.3717924506969646e-06, + "loss": 0.647, + "step": 46513 + }, + { + "epoch": 1.19, + "learning_rate": 1.3717667636328689e-06, + "loss": 0.6626, + "step": 46514 + }, + { + "epoch": 1.19, + "learning_rate": 1.3717410762841282e-06, + "loss": 0.7109, + "step": 46515 + }, + { + "epoch": 1.19, + "learning_rate": 1.3717153886507623e-06, + "loss": 0.5303, + "step": 46516 + }, + { + "epoch": 1.19, + "learning_rate": 1.3716897007327911e-06, + "loss": 0.7295, + "step": 46517 + }, + { + "epoch": 1.19, + "learning_rate": 1.3716640125302344e-06, + "loss": 0.748, + "step": 46518 + }, + { + "epoch": 1.19, + "learning_rate": 1.3716383240431117e-06, + "loss": 0.6255, + "step": 46519 + }, + { + "epoch": 1.19, + "learning_rate": 1.3716126352714426e-06, + "loss": 0.4932, + "step": 46520 + }, + { + "epoch": 1.19, + "learning_rate": 1.3715869462152467e-06, + "loss": 0.5425, + "step": 46521 + }, + { + "epoch": 1.19, + "learning_rate": 1.3715612568745435e-06, + "loss": 0.7266, + "step": 46522 + }, + { + "epoch": 1.19, + "learning_rate": 1.3715355672493534e-06, + "loss": 0.8799, + "step": 46523 + }, + { + "epoch": 1.19, + "learning_rate": 1.3715098773396952e-06, + "loss": 0.6323, + "step": 46524 + }, + { + "epoch": 1.19, + "learning_rate": 1.3714841871455893e-06, + "loss": 0.5298, + "step": 46525 + }, + { + "epoch": 1.19, + "learning_rate": 1.3714584966670549e-06, + "loss": 0.584, + "step": 46526 + }, + { + "epoch": 1.19, + "learning_rate": 1.3714328059041117e-06, + "loss": 0.5024, + "step": 46527 + }, + { + "epoch": 1.19, + "learning_rate": 1.3714071148567794e-06, + "loss": 0.7393, + "step": 46528 + }, + { + "epoch": 1.19, + "learning_rate": 1.371381423525078e-06, + "loss": 0.6655, + "step": 46529 + }, + { + "epoch": 1.19, + "learning_rate": 1.371355731909027e-06, + "loss": 0.6807, + "step": 46530 + }, + { + "epoch": 1.19, + "learning_rate": 1.371330040008646e-06, + "loss": 0.6074, + "step": 46531 + }, + { + "epoch": 1.19, + "learning_rate": 1.3713043478239542e-06, + "loss": 0.4897, + "step": 46532 + }, + { + "epoch": 1.19, + "learning_rate": 1.371278655354972e-06, + "loss": 0.7061, + "step": 46533 + }, + { + "epoch": 1.19, + "learning_rate": 1.3712529626017188e-06, + "loss": 0.728, + "step": 46534 + }, + { + "epoch": 1.19, + "learning_rate": 1.3712272695642144e-06, + "loss": 0.6699, + "step": 46535 + }, + { + "epoch": 1.19, + "learning_rate": 1.3712015762424783e-06, + "loss": 0.668, + "step": 46536 + }, + { + "epoch": 1.19, + "learning_rate": 1.37117588263653e-06, + "loss": 0.5786, + "step": 46537 + }, + { + "epoch": 1.19, + "learning_rate": 1.3711501887463896e-06, + "loss": 0.4648, + "step": 46538 + }, + { + "epoch": 1.19, + "learning_rate": 1.3711244945720765e-06, + "loss": 0.623, + "step": 46539 + }, + { + "epoch": 1.19, + "learning_rate": 1.3710988001136108e-06, + "loss": 0.8164, + "step": 46540 + }, + { + "epoch": 1.19, + "learning_rate": 1.3710731053710113e-06, + "loss": 0.7285, + "step": 46541 + }, + { + "epoch": 1.19, + "learning_rate": 1.3710474103442985e-06, + "loss": 0.687, + "step": 46542 + }, + { + "epoch": 1.19, + "learning_rate": 1.3710217150334912e-06, + "loss": 0.5708, + "step": 46543 + }, + { + "epoch": 1.19, + "learning_rate": 1.3709960194386105e-06, + "loss": 0.4312, + "step": 46544 + }, + { + "epoch": 1.19, + "learning_rate": 1.3709703235596748e-06, + "loss": 0.6567, + "step": 46545 + }, + { + "epoch": 1.19, + "learning_rate": 1.370944627396704e-06, + "loss": 0.6494, + "step": 46546 + }, + { + "epoch": 1.19, + "learning_rate": 1.370918930949718e-06, + "loss": 0.646, + "step": 46547 + }, + { + "epoch": 1.19, + "learning_rate": 1.3708932342187366e-06, + "loss": 0.6377, + "step": 46548 + }, + { + "epoch": 1.19, + "learning_rate": 1.3708675372037791e-06, + "loss": 0.6167, + "step": 46549 + }, + { + "epoch": 1.19, + "learning_rate": 1.3708418399048657e-06, + "loss": 0.5125, + "step": 46550 + }, + { + "epoch": 1.19, + "learning_rate": 1.3708161423220154e-06, + "loss": 0.4064, + "step": 46551 + }, + { + "epoch": 1.19, + "learning_rate": 1.3707904444552488e-06, + "loss": 0.5664, + "step": 46552 + }, + { + "epoch": 1.19, + "learning_rate": 1.3707647463045845e-06, + "loss": 0.6987, + "step": 46553 + }, + { + "epoch": 1.19, + "learning_rate": 1.3707390478700427e-06, + "loss": 0.6074, + "step": 46554 + }, + { + "epoch": 1.19, + "learning_rate": 1.3707133491516431e-06, + "loss": 0.5466, + "step": 46555 + }, + { + "epoch": 1.19, + "learning_rate": 1.3706876501494053e-06, + "loss": 0.6279, + "step": 46556 + }, + { + "epoch": 1.19, + "learning_rate": 1.3706619508633492e-06, + "loss": 0.6221, + "step": 46557 + }, + { + "epoch": 1.19, + "learning_rate": 1.3706362512934943e-06, + "loss": 0.709, + "step": 46558 + }, + { + "epoch": 1.19, + "learning_rate": 1.3706105514398603e-06, + "loss": 0.7383, + "step": 46559 + }, + { + "epoch": 1.19, + "learning_rate": 1.3705848513024664e-06, + "loss": 0.7314, + "step": 46560 + }, + { + "epoch": 1.19, + "learning_rate": 1.3705591508813332e-06, + "loss": 0.6689, + "step": 46561 + }, + { + "epoch": 1.19, + "learning_rate": 1.3705334501764796e-06, + "loss": 0.5898, + "step": 46562 + }, + { + "epoch": 1.19, + "learning_rate": 1.3705077491879258e-06, + "loss": 0.4801, + "step": 46563 + }, + { + "epoch": 1.19, + "learning_rate": 1.3704820479156911e-06, + "loss": 0.5811, + "step": 46564 + }, + { + "epoch": 1.19, + "learning_rate": 1.3704563463597953e-06, + "loss": 0.5554, + "step": 46565 + }, + { + "epoch": 1.19, + "learning_rate": 1.3704306445202583e-06, + "loss": 0.4849, + "step": 46566 + }, + { + "epoch": 1.19, + "learning_rate": 1.3704049423970994e-06, + "loss": 0.9092, + "step": 46567 + }, + { + "epoch": 1.19, + "learning_rate": 1.3703792399903384e-06, + "loss": 0.6519, + "step": 46568 + }, + { + "epoch": 1.19, + "learning_rate": 1.3703535372999955e-06, + "loss": 0.3479, + "step": 46569 + }, + { + "epoch": 1.19, + "learning_rate": 1.3703278343260895e-06, + "loss": 0.4893, + "step": 46570 + }, + { + "epoch": 1.19, + "learning_rate": 1.3703021310686406e-06, + "loss": 0.6362, + "step": 46571 + }, + { + "epoch": 1.19, + "learning_rate": 1.3702764275276685e-06, + "loss": 0.6494, + "step": 46572 + }, + { + "epoch": 1.19, + "learning_rate": 1.3702507237031925e-06, + "loss": 0.6406, + "step": 46573 + }, + { + "epoch": 1.19, + "learning_rate": 1.3702250195952328e-06, + "loss": 0.4285, + "step": 46574 + }, + { + "epoch": 1.19, + "learning_rate": 1.3701993152038088e-06, + "loss": 0.9062, + "step": 46575 + }, + { + "epoch": 1.19, + "learning_rate": 1.3701736105289401e-06, + "loss": 0.8184, + "step": 46576 + }, + { + "epoch": 1.19, + "learning_rate": 1.3701479055706466e-06, + "loss": 0.707, + "step": 46577 + }, + { + "epoch": 1.19, + "learning_rate": 1.3701222003289474e-06, + "loss": 0.6328, + "step": 46578 + }, + { + "epoch": 1.19, + "learning_rate": 1.3700964948038633e-06, + "loss": 0.8262, + "step": 46579 + }, + { + "epoch": 1.19, + "learning_rate": 1.3700707889954131e-06, + "loss": 0.5933, + "step": 46580 + }, + { + "epoch": 1.19, + "learning_rate": 1.3700450829036165e-06, + "loss": 0.605, + "step": 46581 + }, + { + "epoch": 1.19, + "learning_rate": 1.3700193765284937e-06, + "loss": 0.7646, + "step": 46582 + }, + { + "epoch": 1.19, + "learning_rate": 1.3699936698700638e-06, + "loss": 0.708, + "step": 46583 + }, + { + "epoch": 1.19, + "learning_rate": 1.369967962928347e-06, + "loss": 0.6313, + "step": 46584 + }, + { + "epoch": 1.19, + "learning_rate": 1.369942255703363e-06, + "loss": 0.6631, + "step": 46585 + }, + { + "epoch": 1.19, + "learning_rate": 1.3699165481951307e-06, + "loss": 0.7222, + "step": 46586 + }, + { + "epoch": 1.19, + "learning_rate": 1.3698908404036705e-06, + "loss": 0.4873, + "step": 46587 + }, + { + "epoch": 1.19, + "learning_rate": 1.3698651323290017e-06, + "loss": 0.4934, + "step": 46588 + }, + { + "epoch": 1.19, + "learning_rate": 1.3698394239711446e-06, + "loss": 0.7725, + "step": 46589 + }, + { + "epoch": 1.19, + "learning_rate": 1.3698137153301183e-06, + "loss": 0.6089, + "step": 46590 + }, + { + "epoch": 1.19, + "learning_rate": 1.3697880064059423e-06, + "loss": 0.6973, + "step": 46591 + }, + { + "epoch": 1.19, + "learning_rate": 1.3697622971986372e-06, + "loss": 0.6885, + "step": 46592 + }, + { + "epoch": 1.19, + "learning_rate": 1.3697365877082217e-06, + "loss": 0.7598, + "step": 46593 + }, + { + "epoch": 1.19, + "learning_rate": 1.3697108779347163e-06, + "loss": 0.3716, + "step": 46594 + }, + { + "epoch": 1.19, + "learning_rate": 1.3696851678781397e-06, + "loss": 0.7646, + "step": 46595 + }, + { + "epoch": 1.19, + "learning_rate": 1.3696594575385126e-06, + "loss": 0.7314, + "step": 46596 + }, + { + "epoch": 1.19, + "learning_rate": 1.369633746915854e-06, + "loss": 0.5815, + "step": 46597 + }, + { + "epoch": 1.19, + "learning_rate": 1.3696080360101838e-06, + "loss": 0.7178, + "step": 46598 + }, + { + "epoch": 1.19, + "learning_rate": 1.3695823248215218e-06, + "loss": 0.6089, + "step": 46599 + }, + { + "epoch": 1.19, + "learning_rate": 1.3695566133498877e-06, + "loss": 0.5283, + "step": 46600 + }, + { + "epoch": 1.19, + "learning_rate": 1.3695309015953013e-06, + "loss": 0.9424, + "step": 46601 + }, + { + "epoch": 1.19, + "learning_rate": 1.3695051895577816e-06, + "loss": 0.4424, + "step": 46602 + }, + { + "epoch": 1.19, + "learning_rate": 1.369479477237349e-06, + "loss": 0.8486, + "step": 46603 + }, + { + "epoch": 1.19, + "learning_rate": 1.369453764634023e-06, + "loss": 0.6855, + "step": 46604 + }, + { + "epoch": 1.19, + "learning_rate": 1.3694280517478233e-06, + "loss": 0.6934, + "step": 46605 + }, + { + "epoch": 1.19, + "learning_rate": 1.3694023385787693e-06, + "loss": 0.7383, + "step": 46606 + }, + { + "epoch": 1.19, + "learning_rate": 1.369376625126881e-06, + "loss": 0.6768, + "step": 46607 + }, + { + "epoch": 1.19, + "learning_rate": 1.369350911392178e-06, + "loss": 0.6089, + "step": 46608 + }, + { + "epoch": 1.19, + "learning_rate": 1.3693251973746801e-06, + "loss": 0.5654, + "step": 46609 + }, + { + "epoch": 1.19, + "learning_rate": 1.3692994830744069e-06, + "loss": 0.7324, + "step": 46610 + }, + { + "epoch": 1.19, + "learning_rate": 1.369273768491378e-06, + "loss": 0.6128, + "step": 46611 + }, + { + "epoch": 1.19, + "learning_rate": 1.3692480536256131e-06, + "loss": 0.6895, + "step": 46612 + }, + { + "epoch": 1.19, + "learning_rate": 1.369222338477132e-06, + "loss": 0.6377, + "step": 46613 + }, + { + "epoch": 1.19, + "learning_rate": 1.3691966230459544e-06, + "loss": 0.5249, + "step": 46614 + }, + { + "epoch": 1.19, + "learning_rate": 1.3691709073320998e-06, + "loss": 0.6807, + "step": 46615 + }, + { + "epoch": 1.19, + "learning_rate": 1.3691451913355878e-06, + "loss": 0.7402, + "step": 46616 + }, + { + "epoch": 1.19, + "learning_rate": 1.3691194750564388e-06, + "loss": 0.6494, + "step": 46617 + }, + { + "epoch": 1.19, + "learning_rate": 1.3690937584946716e-06, + "loss": 0.6841, + "step": 46618 + }, + { + "epoch": 1.19, + "learning_rate": 1.3690680416503067e-06, + "loss": 0.793, + "step": 46619 + }, + { + "epoch": 1.19, + "learning_rate": 1.369042324523363e-06, + "loss": 0.5338, + "step": 46620 + }, + { + "epoch": 1.19, + "learning_rate": 1.3690166071138606e-06, + "loss": 0.7852, + "step": 46621 + }, + { + "epoch": 1.19, + "learning_rate": 1.368990889421819e-06, + "loss": 0.6216, + "step": 46622 + }, + { + "epoch": 1.19, + "learning_rate": 1.3689651714472583e-06, + "loss": 0.7168, + "step": 46623 + }, + { + "epoch": 1.19, + "learning_rate": 1.3689394531901979e-06, + "loss": 0.6338, + "step": 46624 + }, + { + "epoch": 1.2, + "learning_rate": 1.3689137346506575e-06, + "loss": 0.7969, + "step": 46625 + }, + { + "epoch": 1.2, + "learning_rate": 1.368888015828657e-06, + "loss": 0.5879, + "step": 46626 + }, + { + "epoch": 1.2, + "learning_rate": 1.3688622967242155e-06, + "loss": 0.5059, + "step": 46627 + }, + { + "epoch": 1.2, + "learning_rate": 1.3688365773373533e-06, + "loss": 0.5491, + "step": 46628 + }, + { + "epoch": 1.2, + "learning_rate": 1.36881085766809e-06, + "loss": 0.6509, + "step": 46629 + }, + { + "epoch": 1.2, + "learning_rate": 1.3687851377164451e-06, + "loss": 0.8428, + "step": 46630 + }, + { + "epoch": 1.2, + "learning_rate": 1.3687594174824384e-06, + "loss": 0.8594, + "step": 46631 + }, + { + "epoch": 1.2, + "learning_rate": 1.3687336969660893e-06, + "loss": 0.5383, + "step": 46632 + }, + { + "epoch": 1.2, + "learning_rate": 1.368707976167418e-06, + "loss": 0.8096, + "step": 46633 + }, + { + "epoch": 1.2, + "learning_rate": 1.3686822550864444e-06, + "loss": 0.647, + "step": 46634 + }, + { + "epoch": 1.2, + "learning_rate": 1.368656533723187e-06, + "loss": 0.7598, + "step": 46635 + }, + { + "epoch": 1.2, + "learning_rate": 1.3686308120776669e-06, + "loss": 0.6328, + "step": 46636 + }, + { + "epoch": 1.2, + "learning_rate": 1.3686050901499028e-06, + "loss": 0.707, + "step": 46637 + }, + { + "epoch": 1.2, + "learning_rate": 1.3685793679399145e-06, + "loss": 0.7725, + "step": 46638 + }, + { + "epoch": 1.2, + "learning_rate": 1.3685536454477221e-06, + "loss": 0.6309, + "step": 46639 + }, + { + "epoch": 1.2, + "learning_rate": 1.3685279226733454e-06, + "loss": 0.6963, + "step": 46640 + }, + { + "epoch": 1.2, + "learning_rate": 1.3685021996168034e-06, + "loss": 0.7168, + "step": 46641 + }, + { + "epoch": 1.2, + "learning_rate": 1.3684764762781164e-06, + "loss": 0.5991, + "step": 46642 + }, + { + "epoch": 1.2, + "learning_rate": 1.368450752657304e-06, + "loss": 0.4997, + "step": 46643 + }, + { + "epoch": 1.2, + "learning_rate": 1.3684250287543858e-06, + "loss": 0.7412, + "step": 46644 + }, + { + "epoch": 1.2, + "learning_rate": 1.3683993045693814e-06, + "loss": 0.6299, + "step": 46645 + }, + { + "epoch": 1.2, + "learning_rate": 1.3683735801023103e-06, + "loss": 0.5947, + "step": 46646 + }, + { + "epoch": 1.2, + "learning_rate": 1.368347855353193e-06, + "loss": 0.5562, + "step": 46647 + }, + { + "epoch": 1.2, + "learning_rate": 1.3683221303220484e-06, + "loss": 0.6565, + "step": 46648 + }, + { + "epoch": 1.2, + "learning_rate": 1.3682964050088967e-06, + "loss": 0.8281, + "step": 46649 + }, + { + "epoch": 1.2, + "learning_rate": 1.368270679413757e-06, + "loss": 0.5488, + "step": 46650 + }, + { + "epoch": 1.2, + "learning_rate": 1.3682449535366498e-06, + "loss": 0.7266, + "step": 46651 + }, + { + "epoch": 1.2, + "learning_rate": 1.3682192273775938e-06, + "loss": 0.6169, + "step": 46652 + }, + { + "epoch": 1.2, + "learning_rate": 1.3681935009366099e-06, + "loss": 0.522, + "step": 46653 + }, + { + "epoch": 1.2, + "learning_rate": 1.368167774213717e-06, + "loss": 0.572, + "step": 46654 + }, + { + "epoch": 1.2, + "learning_rate": 1.368142047208935e-06, + "loss": 0.5627, + "step": 46655 + }, + { + "epoch": 1.2, + "learning_rate": 1.3681163199222832e-06, + "loss": 0.6562, + "step": 46656 + }, + { + "epoch": 1.2, + "learning_rate": 1.368090592353782e-06, + "loss": 0.5376, + "step": 46657 + }, + { + "epoch": 1.2, + "learning_rate": 1.3680648645034504e-06, + "loss": 0.6362, + "step": 46658 + }, + { + "epoch": 1.2, + "learning_rate": 1.3680391363713091e-06, + "loss": 0.6504, + "step": 46659 + }, + { + "epoch": 1.2, + "learning_rate": 1.3680134079573767e-06, + "loss": 0.6772, + "step": 46660 + }, + { + "epoch": 1.2, + "learning_rate": 1.3679876792616734e-06, + "loss": 0.7275, + "step": 46661 + }, + { + "epoch": 1.2, + "learning_rate": 1.3679619502842186e-06, + "loss": 0.6328, + "step": 46662 + }, + { + "epoch": 1.2, + "learning_rate": 1.3679362210250326e-06, + "loss": 0.6699, + "step": 46663 + }, + { + "epoch": 1.2, + "learning_rate": 1.367910491484135e-06, + "loss": 0.7627, + "step": 46664 + }, + { + "epoch": 1.2, + "learning_rate": 1.367884761661545e-06, + "loss": 0.7236, + "step": 46665 + }, + { + "epoch": 1.2, + "learning_rate": 1.3678590315572822e-06, + "loss": 0.6709, + "step": 46666 + }, + { + "epoch": 1.2, + "learning_rate": 1.3678333011713669e-06, + "loss": 0.6187, + "step": 46667 + }, + { + "epoch": 1.2, + "learning_rate": 1.3678075705038186e-06, + "loss": 0.6855, + "step": 46668 + }, + { + "epoch": 1.2, + "learning_rate": 1.367781839554657e-06, + "loss": 0.6709, + "step": 46669 + }, + { + "epoch": 1.2, + "learning_rate": 1.3677561083239017e-06, + "loss": 0.665, + "step": 46670 + }, + { + "epoch": 1.2, + "learning_rate": 1.3677303768115725e-06, + "loss": 0.5366, + "step": 46671 + }, + { + "epoch": 1.2, + "learning_rate": 1.367704645017689e-06, + "loss": 0.5684, + "step": 46672 + }, + { + "epoch": 1.2, + "learning_rate": 1.3676789129422708e-06, + "loss": 0.7637, + "step": 46673 + }, + { + "epoch": 1.2, + "learning_rate": 1.3676531805853381e-06, + "loss": 0.521, + "step": 46674 + }, + { + "epoch": 1.2, + "learning_rate": 1.3676274479469102e-06, + "loss": 0.7729, + "step": 46675 + }, + { + "epoch": 1.2, + "learning_rate": 1.3676017150270068e-06, + "loss": 0.7012, + "step": 46676 + }, + { + "epoch": 1.2, + "learning_rate": 1.3675759818256473e-06, + "loss": 0.7041, + "step": 46677 + }, + { + "epoch": 1.2, + "learning_rate": 1.3675502483428525e-06, + "loss": 0.6621, + "step": 46678 + }, + { + "epoch": 1.2, + "learning_rate": 1.3675245145786408e-06, + "loss": 0.627, + "step": 46679 + }, + { + "epoch": 1.2, + "learning_rate": 1.3674987805330328e-06, + "loss": 0.7227, + "step": 46680 + }, + { + "epoch": 1.2, + "learning_rate": 1.3674730462060478e-06, + "loss": 0.6294, + "step": 46681 + }, + { + "epoch": 1.2, + "learning_rate": 1.3674473115977056e-06, + "loss": 0.6201, + "step": 46682 + }, + { + "epoch": 1.2, + "learning_rate": 1.3674215767080257e-06, + "loss": 0.6389, + "step": 46683 + }, + { + "epoch": 1.2, + "learning_rate": 1.3673958415370283e-06, + "loss": 0.7715, + "step": 46684 + }, + { + "epoch": 1.2, + "learning_rate": 1.3673701060847325e-06, + "loss": 0.5518, + "step": 46685 + }, + { + "epoch": 1.2, + "learning_rate": 1.3673443703511585e-06, + "loss": 0.7598, + "step": 46686 + }, + { + "epoch": 1.2, + "learning_rate": 1.3673186343363257e-06, + "loss": 0.7275, + "step": 46687 + }, + { + "epoch": 1.2, + "learning_rate": 1.367292898040254e-06, + "loss": 0.5459, + "step": 46688 + }, + { + "epoch": 1.2, + "learning_rate": 1.367267161462963e-06, + "loss": 0.6187, + "step": 46689 + }, + { + "epoch": 1.2, + "learning_rate": 1.3672414246044723e-06, + "loss": 0.6924, + "step": 46690 + }, + { + "epoch": 1.2, + "learning_rate": 1.3672156874648018e-06, + "loss": 0.6299, + "step": 46691 + }, + { + "epoch": 1.2, + "learning_rate": 1.3671899500439712e-06, + "loss": 0.8027, + "step": 46692 + }, + { + "epoch": 1.2, + "learning_rate": 1.367164212342e-06, + "loss": 0.6377, + "step": 46693 + }, + { + "epoch": 1.2, + "learning_rate": 1.367138474358908e-06, + "loss": 0.5796, + "step": 46694 + }, + { + "epoch": 1.2, + "learning_rate": 1.3671127360947153e-06, + "loss": 0.6475, + "step": 46695 + }, + { + "epoch": 1.2, + "learning_rate": 1.3670869975494408e-06, + "loss": 0.709, + "step": 46696 + }, + { + "epoch": 1.2, + "learning_rate": 1.3670612587231051e-06, + "loss": 0.7471, + "step": 46697 + }, + { + "epoch": 1.2, + "learning_rate": 1.367035519615727e-06, + "loss": 0.7358, + "step": 46698 + }, + { + "epoch": 1.2, + "learning_rate": 1.3670097802273272e-06, + "loss": 0.7656, + "step": 46699 + }, + { + "epoch": 1.2, + "learning_rate": 1.3669840405579244e-06, + "loss": 0.7119, + "step": 46700 + }, + { + "epoch": 1.2, + "learning_rate": 1.3669583006075394e-06, + "loss": 0.5219, + "step": 46701 + }, + { + "epoch": 1.2, + "learning_rate": 1.3669325603761908e-06, + "loss": 0.6265, + "step": 46702 + }, + { + "epoch": 1.2, + "learning_rate": 1.366906819863899e-06, + "loss": 0.6655, + "step": 46703 + }, + { + "epoch": 1.2, + "learning_rate": 1.3668810790706835e-06, + "loss": 0.3828, + "step": 46704 + }, + { + "epoch": 1.2, + "learning_rate": 1.3668553379965642e-06, + "loss": 0.7061, + "step": 46705 + }, + { + "epoch": 1.2, + "learning_rate": 1.36682959664156e-06, + "loss": 0.7061, + "step": 46706 + }, + { + "epoch": 1.2, + "learning_rate": 1.366803855005692e-06, + "loss": 0.439, + "step": 46707 + }, + { + "epoch": 1.2, + "learning_rate": 1.3667781130889786e-06, + "loss": 0.7505, + "step": 46708 + }, + { + "epoch": 1.2, + "learning_rate": 1.3667523708914406e-06, + "loss": 0.6689, + "step": 46709 + }, + { + "epoch": 1.2, + "learning_rate": 1.3667266284130967e-06, + "loss": 0.708, + "step": 46710 + }, + { + "epoch": 1.2, + "learning_rate": 1.3667008856539671e-06, + "loss": 0.6545, + "step": 46711 + }, + { + "epoch": 1.2, + "learning_rate": 1.3666751426140716e-06, + "loss": 0.6636, + "step": 46712 + }, + { + "epoch": 1.2, + "learning_rate": 1.3666493992934301e-06, + "loss": 0.749, + "step": 46713 + }, + { + "epoch": 1.2, + "learning_rate": 1.3666236556920616e-06, + "loss": 0.6077, + "step": 46714 + }, + { + "epoch": 1.2, + "learning_rate": 1.3665979118099864e-06, + "loss": 0.6021, + "step": 46715 + }, + { + "epoch": 1.2, + "learning_rate": 1.3665721676472241e-06, + "loss": 0.5234, + "step": 46716 + }, + { + "epoch": 1.2, + "learning_rate": 1.3665464232037941e-06, + "loss": 0.585, + "step": 46717 + }, + { + "epoch": 1.2, + "learning_rate": 1.3665206784797165e-06, + "loss": 0.5115, + "step": 46718 + }, + { + "epoch": 1.2, + "learning_rate": 1.366494933475011e-06, + "loss": 0.6328, + "step": 46719 + }, + { + "epoch": 1.2, + "learning_rate": 1.3664691881896973e-06, + "loss": 0.6339, + "step": 46720 + }, + { + "epoch": 1.2, + "learning_rate": 1.3664434426237944e-06, + "loss": 0.4727, + "step": 46721 + }, + { + "epoch": 1.2, + "learning_rate": 1.3664176967773232e-06, + "loss": 0.5259, + "step": 46722 + }, + { + "epoch": 1.2, + "learning_rate": 1.3663919506503025e-06, + "loss": 0.4097, + "step": 46723 + }, + { + "epoch": 1.2, + "learning_rate": 1.3663662042427526e-06, + "loss": 0.708, + "step": 46724 + }, + { + "epoch": 1.2, + "learning_rate": 1.3663404575546927e-06, + "loss": 0.6729, + "step": 46725 + }, + { + "epoch": 1.2, + "learning_rate": 1.3663147105861427e-06, + "loss": 0.436, + "step": 46726 + }, + { + "epoch": 1.2, + "learning_rate": 1.3662889633371223e-06, + "loss": 0.8047, + "step": 46727 + }, + { + "epoch": 1.2, + "learning_rate": 1.3662632158076517e-06, + "loss": 0.5044, + "step": 46728 + }, + { + "epoch": 1.2, + "learning_rate": 1.3662374679977502e-06, + "loss": 0.5986, + "step": 46729 + }, + { + "epoch": 1.2, + "learning_rate": 1.3662117199074372e-06, + "loss": 0.7764, + "step": 46730 + }, + { + "epoch": 1.2, + "learning_rate": 1.3661859715367328e-06, + "loss": 0.6113, + "step": 46731 + }, + { + "epoch": 1.2, + "learning_rate": 1.3661602228856567e-06, + "loss": 0.7119, + "step": 46732 + }, + { + "epoch": 1.2, + "learning_rate": 1.3661344739542285e-06, + "loss": 0.7549, + "step": 46733 + }, + { + "epoch": 1.2, + "learning_rate": 1.3661087247424678e-06, + "loss": 0.7695, + "step": 46734 + }, + { + "epoch": 1.2, + "learning_rate": 1.366082975250395e-06, + "loss": 0.5557, + "step": 46735 + }, + { + "epoch": 1.2, + "learning_rate": 1.3660572254780286e-06, + "loss": 0.6621, + "step": 46736 + }, + { + "epoch": 1.2, + "learning_rate": 1.3660314754253893e-06, + "loss": 0.6943, + "step": 46737 + }, + { + "epoch": 1.2, + "learning_rate": 1.3660057250924969e-06, + "loss": 0.7568, + "step": 46738 + }, + { + "epoch": 1.2, + "learning_rate": 1.3659799744793704e-06, + "loss": 0.7588, + "step": 46739 + }, + { + "epoch": 1.2, + "learning_rate": 1.3659542235860297e-06, + "loss": 0.6123, + "step": 46740 + }, + { + "epoch": 1.2, + "learning_rate": 1.3659284724124952e-06, + "loss": 0.7676, + "step": 46741 + }, + { + "epoch": 1.2, + "learning_rate": 1.3659027209587854e-06, + "loss": 0.5859, + "step": 46742 + }, + { + "epoch": 1.2, + "learning_rate": 1.3658769692249213e-06, + "loss": 0.6709, + "step": 46743 + }, + { + "epoch": 1.2, + "learning_rate": 1.3658512172109219e-06, + "loss": 0.7363, + "step": 46744 + }, + { + "epoch": 1.2, + "learning_rate": 1.3658254649168068e-06, + "loss": 0.7207, + "step": 46745 + }, + { + "epoch": 1.2, + "learning_rate": 1.3657997123425962e-06, + "loss": 0.6128, + "step": 46746 + }, + { + "epoch": 1.2, + "learning_rate": 1.3657739594883096e-06, + "loss": 0.6465, + "step": 46747 + }, + { + "epoch": 1.2, + "learning_rate": 1.3657482063539662e-06, + "loss": 0.5767, + "step": 46748 + }, + { + "epoch": 1.2, + "learning_rate": 1.365722452939587e-06, + "loss": 0.5449, + "step": 46749 + }, + { + "epoch": 1.2, + "learning_rate": 1.3656966992451903e-06, + "loss": 0.5967, + "step": 46750 + }, + { + "epoch": 1.2, + "learning_rate": 1.365670945270797e-06, + "loss": 0.6099, + "step": 46751 + }, + { + "epoch": 1.2, + "learning_rate": 1.3656451910164257e-06, + "loss": 0.5615, + "step": 46752 + }, + { + "epoch": 1.2, + "learning_rate": 1.3656194364820972e-06, + "loss": 0.5693, + "step": 46753 + }, + { + "epoch": 1.2, + "learning_rate": 1.3655936816678304e-06, + "loss": 0.6504, + "step": 46754 + }, + { + "epoch": 1.2, + "learning_rate": 1.3655679265736455e-06, + "loss": 0.6157, + "step": 46755 + }, + { + "epoch": 1.2, + "learning_rate": 1.3655421711995619e-06, + "loss": 0.6279, + "step": 46756 + }, + { + "epoch": 1.2, + "learning_rate": 1.3655164155455996e-06, + "loss": 0.7109, + "step": 46757 + }, + { + "epoch": 1.2, + "learning_rate": 1.3654906596117778e-06, + "loss": 0.6602, + "step": 46758 + }, + { + "epoch": 1.2, + "learning_rate": 1.365464903398117e-06, + "loss": 0.6299, + "step": 46759 + }, + { + "epoch": 1.2, + "learning_rate": 1.3654391469046367e-06, + "loss": 0.5801, + "step": 46760 + }, + { + "epoch": 1.2, + "learning_rate": 1.3654133901313557e-06, + "loss": 0.5645, + "step": 46761 + }, + { + "epoch": 1.2, + "learning_rate": 1.365387633078295e-06, + "loss": 0.6489, + "step": 46762 + }, + { + "epoch": 1.2, + "learning_rate": 1.3653618757454739e-06, + "loss": 0.7139, + "step": 46763 + }, + { + "epoch": 1.2, + "learning_rate": 1.3653361181329122e-06, + "loss": 0.7197, + "step": 46764 + }, + { + "epoch": 1.2, + "learning_rate": 1.365310360240629e-06, + "loss": 0.6177, + "step": 46765 + }, + { + "epoch": 1.2, + "learning_rate": 1.3652846020686445e-06, + "loss": 0.9541, + "step": 46766 + }, + { + "epoch": 1.2, + "learning_rate": 1.3652588436169783e-06, + "loss": 0.4197, + "step": 46767 + }, + { + "epoch": 1.2, + "learning_rate": 1.3652330848856505e-06, + "loss": 0.6912, + "step": 46768 + }, + { + "epoch": 1.2, + "learning_rate": 1.3652073258746804e-06, + "loss": 0.7207, + "step": 46769 + }, + { + "epoch": 1.2, + "learning_rate": 1.3651815665840878e-06, + "loss": 0.6514, + "step": 46770 + }, + { + "epoch": 1.2, + "learning_rate": 1.3651558070138921e-06, + "loss": 0.666, + "step": 46771 + }, + { + "epoch": 1.2, + "learning_rate": 1.365130047164114e-06, + "loss": 0.5088, + "step": 46772 + }, + { + "epoch": 1.2, + "learning_rate": 1.3651042870347722e-06, + "loss": 0.6636, + "step": 46773 + }, + { + "epoch": 1.2, + "learning_rate": 1.3650785266258874e-06, + "loss": 0.7295, + "step": 46774 + }, + { + "epoch": 1.2, + "learning_rate": 1.3650527659374782e-06, + "loss": 0.6528, + "step": 46775 + }, + { + "epoch": 1.2, + "learning_rate": 1.365027004969565e-06, + "loss": 0.604, + "step": 46776 + }, + { + "epoch": 1.2, + "learning_rate": 1.3650012437221672e-06, + "loss": 0.576, + "step": 46777 + }, + { + "epoch": 1.2, + "learning_rate": 1.3649754821953053e-06, + "loss": 0.6089, + "step": 46778 + }, + { + "epoch": 1.2, + "learning_rate": 1.364949720388998e-06, + "loss": 0.7129, + "step": 46779 + }, + { + "epoch": 1.2, + "learning_rate": 1.3649239583032655e-06, + "loss": 0.6147, + "step": 46780 + }, + { + "epoch": 1.2, + "learning_rate": 1.3648981959381277e-06, + "loss": 0.791, + "step": 46781 + }, + { + "epoch": 1.2, + "learning_rate": 1.3648724332936042e-06, + "loss": 0.791, + "step": 46782 + }, + { + "epoch": 1.2, + "learning_rate": 1.3648466703697144e-06, + "loss": 0.5728, + "step": 46783 + }, + { + "epoch": 1.2, + "learning_rate": 1.3648209071664782e-06, + "loss": 0.752, + "step": 46784 + }, + { + "epoch": 1.2, + "learning_rate": 1.364795143683916e-06, + "loss": 0.7148, + "step": 46785 + }, + { + "epoch": 1.2, + "learning_rate": 1.364769379922046e-06, + "loss": 0.7109, + "step": 46786 + }, + { + "epoch": 1.2, + "learning_rate": 1.3647436158808897e-06, + "loss": 0.8301, + "step": 46787 + }, + { + "epoch": 1.2, + "learning_rate": 1.3647178515604653e-06, + "loss": 0.625, + "step": 46788 + }, + { + "epoch": 1.2, + "learning_rate": 1.3646920869607938e-06, + "loss": 0.7188, + "step": 46789 + }, + { + "epoch": 1.2, + "learning_rate": 1.3646663220818942e-06, + "loss": 0.6704, + "step": 46790 + }, + { + "epoch": 1.2, + "learning_rate": 1.3646405569237862e-06, + "loss": 0.8359, + "step": 46791 + }, + { + "epoch": 1.2, + "learning_rate": 1.3646147914864896e-06, + "loss": 0.7075, + "step": 46792 + }, + { + "epoch": 1.2, + "learning_rate": 1.3645890257700244e-06, + "loss": 0.6934, + "step": 46793 + }, + { + "epoch": 1.2, + "learning_rate": 1.3645632597744103e-06, + "loss": 0.6387, + "step": 46794 + }, + { + "epoch": 1.2, + "learning_rate": 1.3645374934996668e-06, + "loss": 0.7222, + "step": 46795 + }, + { + "epoch": 1.2, + "learning_rate": 1.3645117269458135e-06, + "loss": 0.6108, + "step": 46796 + }, + { + "epoch": 1.2, + "learning_rate": 1.3644859601128704e-06, + "loss": 0.6338, + "step": 46797 + }, + { + "epoch": 1.2, + "learning_rate": 1.364460193000857e-06, + "loss": 0.7402, + "step": 46798 + }, + { + "epoch": 1.2, + "learning_rate": 1.3644344256097937e-06, + "loss": 0.7793, + "step": 46799 + }, + { + "epoch": 1.2, + "learning_rate": 1.3644086579396994e-06, + "loss": 0.6265, + "step": 46800 + }, + { + "epoch": 1.2, + "learning_rate": 1.3643828899905941e-06, + "loss": 0.6504, + "step": 46801 + }, + { + "epoch": 1.2, + "learning_rate": 1.3643571217624974e-06, + "loss": 0.6719, + "step": 46802 + }, + { + "epoch": 1.2, + "learning_rate": 1.3643313532554297e-06, + "loss": 0.5928, + "step": 46803 + }, + { + "epoch": 1.2, + "learning_rate": 1.36430558446941e-06, + "loss": 0.6504, + "step": 46804 + }, + { + "epoch": 1.2, + "learning_rate": 1.3642798154044582e-06, + "loss": 0.5654, + "step": 46805 + }, + { + "epoch": 1.2, + "learning_rate": 1.364254046060594e-06, + "loss": 0.6245, + "step": 46806 + }, + { + "epoch": 1.2, + "learning_rate": 1.3642282764378371e-06, + "loss": 0.6802, + "step": 46807 + }, + { + "epoch": 1.2, + "learning_rate": 1.3642025065362078e-06, + "loss": 0.5396, + "step": 46808 + }, + { + "epoch": 1.2, + "learning_rate": 1.3641767363557254e-06, + "loss": 0.6318, + "step": 46809 + }, + { + "epoch": 1.2, + "learning_rate": 1.3641509658964094e-06, + "loss": 0.6104, + "step": 46810 + }, + { + "epoch": 1.2, + "learning_rate": 1.3641251951582798e-06, + "loss": 0.4448, + "step": 46811 + }, + { + "epoch": 1.2, + "learning_rate": 1.364099424141356e-06, + "loss": 0.3718, + "step": 46812 + }, + { + "epoch": 1.2, + "learning_rate": 1.3640736528456581e-06, + "loss": 0.645, + "step": 46813 + }, + { + "epoch": 1.2, + "learning_rate": 1.3640478812712063e-06, + "loss": 0.5898, + "step": 46814 + }, + { + "epoch": 1.2, + "learning_rate": 1.3640221094180193e-06, + "loss": 0.6924, + "step": 46815 + }, + { + "epoch": 1.2, + "learning_rate": 1.3639963372861175e-06, + "loss": 0.6274, + "step": 46816 + }, + { + "epoch": 1.2, + "learning_rate": 1.3639705648755203e-06, + "loss": 0.4985, + "step": 46817 + }, + { + "epoch": 1.2, + "learning_rate": 1.3639447921862476e-06, + "loss": 0.5876, + "step": 46818 + }, + { + "epoch": 1.2, + "learning_rate": 1.363919019218319e-06, + "loss": 0.6943, + "step": 46819 + }, + { + "epoch": 1.2, + "learning_rate": 1.3638932459717547e-06, + "loss": 0.6953, + "step": 46820 + }, + { + "epoch": 1.2, + "learning_rate": 1.3638674724465737e-06, + "loss": 0.7061, + "step": 46821 + }, + { + "epoch": 1.2, + "learning_rate": 1.3638416986427964e-06, + "loss": 0.7285, + "step": 46822 + }, + { + "epoch": 1.2, + "learning_rate": 1.3638159245604416e-06, + "loss": 0.5811, + "step": 46823 + }, + { + "epoch": 1.2, + "learning_rate": 1.3637901501995303e-06, + "loss": 0.5562, + "step": 46824 + }, + { + "epoch": 1.2, + "learning_rate": 1.3637643755600817e-06, + "loss": 0.6602, + "step": 46825 + }, + { + "epoch": 1.2, + "learning_rate": 1.363738600642115e-06, + "loss": 0.5479, + "step": 46826 + }, + { + "epoch": 1.2, + "learning_rate": 1.3637128254456507e-06, + "loss": 0.5669, + "step": 46827 + }, + { + "epoch": 1.2, + "learning_rate": 1.3636870499707081e-06, + "loss": 0.6118, + "step": 46828 + }, + { + "epoch": 1.2, + "learning_rate": 1.363661274217307e-06, + "loss": 0.626, + "step": 46829 + }, + { + "epoch": 1.2, + "learning_rate": 1.3636354981854672e-06, + "loss": 0.5923, + "step": 46830 + }, + { + "epoch": 1.2, + "learning_rate": 1.3636097218752086e-06, + "loss": 0.7354, + "step": 46831 + }, + { + "epoch": 1.2, + "learning_rate": 1.3635839452865505e-06, + "loss": 0.6763, + "step": 46832 + }, + { + "epoch": 1.2, + "learning_rate": 1.3635581684195132e-06, + "loss": 0.6533, + "step": 46833 + }, + { + "epoch": 1.2, + "learning_rate": 1.3635323912741158e-06, + "loss": 0.8633, + "step": 46834 + }, + { + "epoch": 1.2, + "learning_rate": 1.3635066138503786e-06, + "loss": 0.7139, + "step": 46835 + }, + { + "epoch": 1.2, + "learning_rate": 1.3634808361483209e-06, + "loss": 0.5557, + "step": 46836 + }, + { + "epoch": 1.2, + "learning_rate": 1.3634550581679628e-06, + "loss": 0.7437, + "step": 46837 + }, + { + "epoch": 1.2, + "learning_rate": 1.3634292799093237e-06, + "loss": 0.8486, + "step": 46838 + }, + { + "epoch": 1.2, + "learning_rate": 1.3634035013724237e-06, + "loss": 0.6641, + "step": 46839 + }, + { + "epoch": 1.2, + "learning_rate": 1.3633777225572823e-06, + "loss": 0.4103, + "step": 46840 + }, + { + "epoch": 1.2, + "learning_rate": 1.363351943463919e-06, + "loss": 0.751, + "step": 46841 + }, + { + "epoch": 1.2, + "learning_rate": 1.363326164092354e-06, + "loss": 0.7246, + "step": 46842 + }, + { + "epoch": 1.2, + "learning_rate": 1.363300384442607e-06, + "loss": 0.8174, + "step": 46843 + }, + { + "epoch": 1.2, + "learning_rate": 1.3632746045146976e-06, + "loss": 0.5508, + "step": 46844 + }, + { + "epoch": 1.2, + "learning_rate": 1.3632488243086455e-06, + "loss": 0.6362, + "step": 46845 + }, + { + "epoch": 1.2, + "learning_rate": 1.3632230438244703e-06, + "loss": 0.532, + "step": 46846 + }, + { + "epoch": 1.2, + "learning_rate": 1.3631972630621922e-06, + "loss": 0.5852, + "step": 46847 + }, + { + "epoch": 1.2, + "learning_rate": 1.3631714820218308e-06, + "loss": 0.7285, + "step": 46848 + }, + { + "epoch": 1.2, + "learning_rate": 1.363145700703405e-06, + "loss": 0.627, + "step": 46849 + }, + { + "epoch": 1.2, + "learning_rate": 1.3631199191069359e-06, + "loss": 0.5933, + "step": 46850 + }, + { + "epoch": 1.2, + "learning_rate": 1.363094137232442e-06, + "loss": 0.6777, + "step": 46851 + }, + { + "epoch": 1.2, + "learning_rate": 1.3630683550799442e-06, + "loss": 0.6523, + "step": 46852 + }, + { + "epoch": 1.2, + "learning_rate": 1.3630425726494614e-06, + "loss": 0.5942, + "step": 46853 + }, + { + "epoch": 1.2, + "learning_rate": 1.3630167899410137e-06, + "loss": 0.7329, + "step": 46854 + }, + { + "epoch": 1.2, + "learning_rate": 1.3629910069546204e-06, + "loss": 0.7393, + "step": 46855 + }, + { + "epoch": 1.2, + "learning_rate": 1.362965223690302e-06, + "loss": 0.6484, + "step": 46856 + }, + { + "epoch": 1.2, + "learning_rate": 1.3629394401480773e-06, + "loss": 0.6719, + "step": 46857 + }, + { + "epoch": 1.2, + "learning_rate": 1.3629136563279672e-06, + "loss": 0.667, + "step": 46858 + }, + { + "epoch": 1.2, + "learning_rate": 1.3628878722299904e-06, + "loss": 0.584, + "step": 46859 + }, + { + "epoch": 1.2, + "learning_rate": 1.3628620878541672e-06, + "loss": 0.6504, + "step": 46860 + }, + { + "epoch": 1.2, + "learning_rate": 1.362836303200517e-06, + "loss": 0.5942, + "step": 46861 + }, + { + "epoch": 1.2, + "learning_rate": 1.36281051826906e-06, + "loss": 0.6016, + "step": 46862 + }, + { + "epoch": 1.2, + "learning_rate": 1.3627847330598154e-06, + "loss": 0.7119, + "step": 46863 + }, + { + "epoch": 1.2, + "learning_rate": 1.3627589475728034e-06, + "loss": 0.791, + "step": 46864 + }, + { + "epoch": 1.2, + "learning_rate": 1.3627331618080434e-06, + "loss": 0.5581, + "step": 46865 + }, + { + "epoch": 1.2, + "learning_rate": 1.3627073757655554e-06, + "loss": 0.6006, + "step": 46866 + }, + { + "epoch": 1.2, + "learning_rate": 1.362681589445359e-06, + "loss": 0.5942, + "step": 46867 + }, + { + "epoch": 1.2, + "learning_rate": 1.362655802847474e-06, + "loss": 0.707, + "step": 46868 + }, + { + "epoch": 1.2, + "learning_rate": 1.36263001597192e-06, + "loss": 0.7217, + "step": 46869 + }, + { + "epoch": 1.2, + "learning_rate": 1.362604228818717e-06, + "loss": 0.6836, + "step": 46870 + }, + { + "epoch": 1.2, + "learning_rate": 1.3625784413878845e-06, + "loss": 0.7319, + "step": 46871 + }, + { + "epoch": 1.2, + "learning_rate": 1.3625526536794426e-06, + "loss": 0.7637, + "step": 46872 + }, + { + "epoch": 1.2, + "learning_rate": 1.3625268656934108e-06, + "loss": 0.6904, + "step": 46873 + }, + { + "epoch": 1.2, + "learning_rate": 1.3625010774298085e-06, + "loss": 0.6865, + "step": 46874 + }, + { + "epoch": 1.2, + "learning_rate": 1.3624752888886562e-06, + "loss": 0.8066, + "step": 46875 + }, + { + "epoch": 1.2, + "learning_rate": 1.3624495000699728e-06, + "loss": 0.6611, + "step": 46876 + }, + { + "epoch": 1.2, + "learning_rate": 1.3624237109737788e-06, + "loss": 0.7305, + "step": 46877 + }, + { + "epoch": 1.2, + "learning_rate": 1.3623979216000937e-06, + "loss": 0.6821, + "step": 46878 + }, + { + "epoch": 1.2, + "learning_rate": 1.362372131948937e-06, + "loss": 0.5469, + "step": 46879 + }, + { + "epoch": 1.2, + "learning_rate": 1.3623463420203284e-06, + "loss": 0.792, + "step": 46880 + }, + { + "epoch": 1.2, + "learning_rate": 1.3623205518142883e-06, + "loss": 0.6904, + "step": 46881 + }, + { + "epoch": 1.2, + "learning_rate": 1.3622947613308358e-06, + "loss": 0.6797, + "step": 46882 + }, + { + "epoch": 1.2, + "learning_rate": 1.362268970569991e-06, + "loss": 0.772, + "step": 46883 + }, + { + "epoch": 1.2, + "learning_rate": 1.3622431795317733e-06, + "loss": 0.6465, + "step": 46884 + }, + { + "epoch": 1.2, + "learning_rate": 1.3622173882162029e-06, + "loss": 0.5469, + "step": 46885 + }, + { + "epoch": 1.2, + "learning_rate": 1.3621915966232988e-06, + "loss": 0.7476, + "step": 46886 + }, + { + "epoch": 1.2, + "learning_rate": 1.362165804753082e-06, + "loss": 0.7334, + "step": 46887 + }, + { + "epoch": 1.2, + "learning_rate": 1.362140012605571e-06, + "loss": 0.6631, + "step": 46888 + }, + { + "epoch": 1.2, + "learning_rate": 1.362114220180786e-06, + "loss": 0.6714, + "step": 46889 + }, + { + "epoch": 1.2, + "learning_rate": 1.362088427478747e-06, + "loss": 0.7295, + "step": 46890 + }, + { + "epoch": 1.2, + "learning_rate": 1.3620626344994738e-06, + "loss": 0.6694, + "step": 46891 + }, + { + "epoch": 1.2, + "learning_rate": 1.3620368412429853e-06, + "loss": 0.7129, + "step": 46892 + }, + { + "epoch": 1.2, + "learning_rate": 1.362011047709302e-06, + "loss": 0.7061, + "step": 46893 + }, + { + "epoch": 1.2, + "learning_rate": 1.3619852538984438e-06, + "loss": 0.5574, + "step": 46894 + }, + { + "epoch": 1.2, + "learning_rate": 1.3619594598104297e-06, + "loss": 0.6304, + "step": 46895 + }, + { + "epoch": 1.2, + "learning_rate": 1.3619336654452802e-06, + "loss": 0.5562, + "step": 46896 + }, + { + "epoch": 1.2, + "learning_rate": 1.3619078708030146e-06, + "loss": 0.7402, + "step": 46897 + }, + { + "epoch": 1.2, + "learning_rate": 1.361882075883653e-06, + "loss": 0.6025, + "step": 46898 + }, + { + "epoch": 1.2, + "learning_rate": 1.3618562806872146e-06, + "loss": 0.6553, + "step": 46899 + }, + { + "epoch": 1.2, + "learning_rate": 1.3618304852137197e-06, + "loss": 0.7783, + "step": 46900 + }, + { + "epoch": 1.2, + "learning_rate": 1.3618046894631877e-06, + "loss": 0.6948, + "step": 46901 + }, + { + "epoch": 1.2, + "learning_rate": 1.3617788934356386e-06, + "loss": 0.5688, + "step": 46902 + }, + { + "epoch": 1.2, + "learning_rate": 1.3617530971310922e-06, + "loss": 0.5547, + "step": 46903 + }, + { + "epoch": 1.2, + "learning_rate": 1.361727300549568e-06, + "loss": 0.7344, + "step": 46904 + }, + { + "epoch": 1.2, + "learning_rate": 1.3617015036910856e-06, + "loss": 0.4812, + "step": 46905 + }, + { + "epoch": 1.2, + "learning_rate": 1.361675706555665e-06, + "loss": 0.7012, + "step": 46906 + }, + { + "epoch": 1.2, + "learning_rate": 1.361649909143326e-06, + "loss": 0.6345, + "step": 46907 + }, + { + "epoch": 1.2, + "learning_rate": 1.3616241114540886e-06, + "loss": 0.6333, + "step": 46908 + }, + { + "epoch": 1.2, + "learning_rate": 1.3615983134879718e-06, + "loss": 0.6357, + "step": 46909 + }, + { + "epoch": 1.2, + "learning_rate": 1.3615725152449962e-06, + "loss": 0.7002, + "step": 46910 + }, + { + "epoch": 1.2, + "learning_rate": 1.3615467167251805e-06, + "loss": 0.6689, + "step": 46911 + }, + { + "epoch": 1.2, + "learning_rate": 1.3615209179285459e-06, + "loss": 0.6602, + "step": 46912 + }, + { + "epoch": 1.2, + "learning_rate": 1.3614951188551112e-06, + "loss": 0.668, + "step": 46913 + }, + { + "epoch": 1.2, + "learning_rate": 1.3614693195048958e-06, + "loss": 0.667, + "step": 46914 + }, + { + "epoch": 1.2, + "learning_rate": 1.3614435198779204e-06, + "loss": 0.7075, + "step": 46915 + }, + { + "epoch": 1.2, + "learning_rate": 1.3614177199742042e-06, + "loss": 0.5098, + "step": 46916 + }, + { + "epoch": 1.2, + "learning_rate": 1.3613919197937669e-06, + "loss": 0.6638, + "step": 46917 + }, + { + "epoch": 1.2, + "learning_rate": 1.361366119336629e-06, + "loss": 0.575, + "step": 46918 + }, + { + "epoch": 1.2, + "learning_rate": 1.361340318602809e-06, + "loss": 0.6538, + "step": 46919 + }, + { + "epoch": 1.2, + "learning_rate": 1.3613145175923274e-06, + "loss": 0.666, + "step": 46920 + }, + { + "epoch": 1.2, + "learning_rate": 1.3612887163052043e-06, + "loss": 0.7324, + "step": 46921 + }, + { + "epoch": 1.2, + "learning_rate": 1.3612629147414587e-06, + "loss": 0.4885, + "step": 46922 + }, + { + "epoch": 1.2, + "learning_rate": 1.361237112901111e-06, + "loss": 0.488, + "step": 46923 + }, + { + "epoch": 1.2, + "learning_rate": 1.3612113107841805e-06, + "loss": 0.7188, + "step": 46924 + }, + { + "epoch": 1.2, + "learning_rate": 1.361185508390687e-06, + "loss": 0.4207, + "step": 46925 + }, + { + "epoch": 1.2, + "learning_rate": 1.3611597057206504e-06, + "loss": 0.6123, + "step": 46926 + }, + { + "epoch": 1.2, + "learning_rate": 1.3611339027740904e-06, + "loss": 0.8213, + "step": 46927 + }, + { + "epoch": 1.2, + "learning_rate": 1.3611080995510271e-06, + "loss": 0.6035, + "step": 46928 + }, + { + "epoch": 1.2, + "learning_rate": 1.3610822960514796e-06, + "loss": 0.6914, + "step": 46929 + }, + { + "epoch": 1.2, + "learning_rate": 1.361056492275468e-06, + "loss": 0.5552, + "step": 46930 + }, + { + "epoch": 1.2, + "learning_rate": 1.3610306882230122e-06, + "loss": 0.6323, + "step": 46931 + }, + { + "epoch": 1.2, + "learning_rate": 1.3610048838941316e-06, + "loss": 0.6562, + "step": 46932 + }, + { + "epoch": 1.2, + "learning_rate": 1.3609790792888465e-06, + "loss": 0.7246, + "step": 46933 + }, + { + "epoch": 1.2, + "learning_rate": 1.3609532744071758e-06, + "loss": 0.6978, + "step": 46934 + }, + { + "epoch": 1.2, + "learning_rate": 1.3609274692491403e-06, + "loss": 0.5278, + "step": 46935 + }, + { + "epoch": 1.2, + "learning_rate": 1.3609016638147588e-06, + "loss": 0.6846, + "step": 46936 + }, + { + "epoch": 1.2, + "learning_rate": 1.360875858104052e-06, + "loss": 0.7021, + "step": 46937 + }, + { + "epoch": 1.2, + "learning_rate": 1.3608500521170388e-06, + "loss": 0.4946, + "step": 46938 + }, + { + "epoch": 1.2, + "learning_rate": 1.360824245853739e-06, + "loss": 0.6367, + "step": 46939 + }, + { + "epoch": 1.2, + "learning_rate": 1.3607984393141733e-06, + "loss": 0.6372, + "step": 46940 + }, + { + "epoch": 1.2, + "learning_rate": 1.3607726324983603e-06, + "loss": 0.5531, + "step": 46941 + }, + { + "epoch": 1.2, + "learning_rate": 1.3607468254063207e-06, + "loss": 0.6709, + "step": 46942 + }, + { + "epoch": 1.2, + "learning_rate": 1.3607210180380737e-06, + "loss": 0.6621, + "step": 46943 + }, + { + "epoch": 1.2, + "learning_rate": 1.3606952103936392e-06, + "loss": 0.6455, + "step": 46944 + }, + { + "epoch": 1.2, + "learning_rate": 1.360669402473037e-06, + "loss": 0.7725, + "step": 46945 + }, + { + "epoch": 1.2, + "learning_rate": 1.3606435942762868e-06, + "loss": 0.6943, + "step": 46946 + }, + { + "epoch": 1.2, + "learning_rate": 1.360617785803408e-06, + "loss": 0.7188, + "step": 46947 + }, + { + "epoch": 1.2, + "learning_rate": 1.3605919770544214e-06, + "loss": 0.7578, + "step": 46948 + }, + { + "epoch": 1.2, + "learning_rate": 1.360566168029346e-06, + "loss": 0.624, + "step": 46949 + }, + { + "epoch": 1.2, + "learning_rate": 1.3605403587282012e-06, + "loss": 0.6367, + "step": 46950 + }, + { + "epoch": 1.2, + "learning_rate": 1.3605145491510074e-06, + "loss": 0.5203, + "step": 46951 + }, + { + "epoch": 1.2, + "learning_rate": 1.3604887392977844e-06, + "loss": 0.8994, + "step": 46952 + }, + { + "epoch": 1.2, + "learning_rate": 1.3604629291685518e-06, + "loss": 0.6436, + "step": 46953 + }, + { + "epoch": 1.2, + "learning_rate": 1.360437118763329e-06, + "loss": 0.6846, + "step": 46954 + }, + { + "epoch": 1.2, + "learning_rate": 1.360411308082136e-06, + "loss": 0.6514, + "step": 46955 + }, + { + "epoch": 1.2, + "learning_rate": 1.360385497124993e-06, + "loss": 0.7546, + "step": 46956 + }, + { + "epoch": 1.2, + "learning_rate": 1.360359685891919e-06, + "loss": 0.647, + "step": 46957 + }, + { + "epoch": 1.2, + "learning_rate": 1.3603338743829345e-06, + "loss": 0.5474, + "step": 46958 + }, + { + "epoch": 1.2, + "learning_rate": 1.360308062598059e-06, + "loss": 0.6582, + "step": 46959 + }, + { + "epoch": 1.2, + "learning_rate": 1.3602822505373117e-06, + "loss": 0.6787, + "step": 46960 + }, + { + "epoch": 1.2, + "learning_rate": 1.3602564382007132e-06, + "loss": 0.6343, + "step": 46961 + }, + { + "epoch": 1.2, + "learning_rate": 1.360230625588283e-06, + "loss": 0.6445, + "step": 46962 + }, + { + "epoch": 1.2, + "learning_rate": 1.3602048127000405e-06, + "loss": 0.7959, + "step": 46963 + }, + { + "epoch": 1.2, + "learning_rate": 1.3601789995360057e-06, + "loss": 0.626, + "step": 46964 + }, + { + "epoch": 1.2, + "learning_rate": 1.3601531860961987e-06, + "loss": 0.6055, + "step": 46965 + }, + { + "epoch": 1.2, + "learning_rate": 1.3601273723806387e-06, + "loss": 0.4773, + "step": 46966 + }, + { + "epoch": 1.2, + "learning_rate": 1.360101558389346e-06, + "loss": 0.5835, + "step": 46967 + }, + { + "epoch": 1.2, + "learning_rate": 1.3600757441223402e-06, + "loss": 0.7969, + "step": 46968 + }, + { + "epoch": 1.2, + "learning_rate": 1.3600499295796406e-06, + "loss": 0.625, + "step": 46969 + }, + { + "epoch": 1.2, + "learning_rate": 1.3600241147612672e-06, + "loss": 0.6694, + "step": 46970 + }, + { + "epoch": 1.2, + "learning_rate": 1.3599982996672404e-06, + "loss": 0.6919, + "step": 46971 + }, + { + "epoch": 1.2, + "learning_rate": 1.3599724842975788e-06, + "loss": 0.5168, + "step": 46972 + }, + { + "epoch": 1.2, + "learning_rate": 1.3599466686523037e-06, + "loss": 0.7607, + "step": 46973 + }, + { + "epoch": 1.2, + "learning_rate": 1.3599208527314332e-06, + "loss": 0.6914, + "step": 46974 + }, + { + "epoch": 1.2, + "learning_rate": 1.3598950365349882e-06, + "loss": 0.7266, + "step": 46975 + }, + { + "epoch": 1.2, + "learning_rate": 1.359869220062988e-06, + "loss": 0.5884, + "step": 46976 + }, + { + "epoch": 1.2, + "learning_rate": 1.3598434033154527e-06, + "loss": 0.5507, + "step": 46977 + }, + { + "epoch": 1.2, + "learning_rate": 1.3598175862924016e-06, + "loss": 0.5356, + "step": 46978 + }, + { + "epoch": 1.2, + "learning_rate": 1.3597917689938548e-06, + "loss": 0.6768, + "step": 46979 + }, + { + "epoch": 1.2, + "learning_rate": 1.3597659514198318e-06, + "loss": 0.6074, + "step": 46980 + }, + { + "epoch": 1.2, + "learning_rate": 1.359740133570353e-06, + "loss": 0.6445, + "step": 46981 + }, + { + "epoch": 1.2, + "learning_rate": 1.3597143154454373e-06, + "loss": 0.5713, + "step": 46982 + }, + { + "epoch": 1.2, + "learning_rate": 1.3596884970451053e-06, + "loss": 0.6763, + "step": 46983 + }, + { + "epoch": 1.2, + "learning_rate": 1.3596626783693758e-06, + "loss": 0.5283, + "step": 46984 + }, + { + "epoch": 1.2, + "learning_rate": 1.3596368594182694e-06, + "loss": 0.7803, + "step": 46985 + }, + { + "epoch": 1.2, + "learning_rate": 1.3596110401918058e-06, + "loss": 0.7588, + "step": 46986 + }, + { + "epoch": 1.2, + "learning_rate": 1.3595852206900043e-06, + "loss": 0.676, + "step": 46987 + }, + { + "epoch": 1.2, + "learning_rate": 1.3595594009128853e-06, + "loss": 0.7227, + "step": 46988 + }, + { + "epoch": 1.2, + "learning_rate": 1.3595335808604679e-06, + "loss": 0.6377, + "step": 46989 + }, + { + "epoch": 1.2, + "learning_rate": 1.3595077605327721e-06, + "loss": 0.4775, + "step": 46990 + }, + { + "epoch": 1.2, + "learning_rate": 1.3594819399298176e-06, + "loss": 0.8164, + "step": 46991 + }, + { + "epoch": 1.2, + "learning_rate": 1.3594561190516248e-06, + "loss": 0.7246, + "step": 46992 + }, + { + "epoch": 1.2, + "learning_rate": 1.3594302978982128e-06, + "loss": 0.6123, + "step": 46993 + }, + { + "epoch": 1.2, + "learning_rate": 1.3594044764696016e-06, + "loss": 0.6929, + "step": 46994 + }, + { + "epoch": 1.2, + "learning_rate": 1.3593786547658107e-06, + "loss": 0.5942, + "step": 46995 + }, + { + "epoch": 1.2, + "learning_rate": 1.3593528327868602e-06, + "loss": 0.8545, + "step": 46996 + }, + { + "epoch": 1.2, + "learning_rate": 1.3593270105327695e-06, + "loss": 0.5234, + "step": 46997 + }, + { + "epoch": 1.2, + "learning_rate": 1.3593011880035592e-06, + "loss": 0.4441, + "step": 46998 + }, + { + "epoch": 1.2, + "learning_rate": 1.359275365199248e-06, + "loss": 0.7852, + "step": 46999 + }, + { + "epoch": 1.2, + "learning_rate": 1.3592495421198562e-06, + "loss": 0.7559, + "step": 47000 + }, + { + "epoch": 1.2, + "learning_rate": 1.3592237187654036e-06, + "loss": 0.6914, + "step": 47001 + }, + { + "epoch": 1.2, + "learning_rate": 1.3591978951359102e-06, + "loss": 0.7178, + "step": 47002 + }, + { + "epoch": 1.2, + "learning_rate": 1.3591720712313955e-06, + "loss": 0.7744, + "step": 47003 + }, + { + "epoch": 1.2, + "learning_rate": 1.3591462470518788e-06, + "loss": 0.6797, + "step": 47004 + }, + { + "epoch": 1.2, + "learning_rate": 1.3591204225973804e-06, + "loss": 0.6289, + "step": 47005 + }, + { + "epoch": 1.2, + "learning_rate": 1.3590945978679202e-06, + "loss": 0.6753, + "step": 47006 + }, + { + "epoch": 1.2, + "learning_rate": 1.3590687728635177e-06, + "loss": 0.6997, + "step": 47007 + }, + { + "epoch": 1.2, + "learning_rate": 1.359042947584193e-06, + "loss": 0.6108, + "step": 47008 + }, + { + "epoch": 1.2, + "learning_rate": 1.3590171220299656e-06, + "loss": 0.563, + "step": 47009 + }, + { + "epoch": 1.2, + "learning_rate": 1.358991296200855e-06, + "loss": 0.6289, + "step": 47010 + }, + { + "epoch": 1.2, + "learning_rate": 1.3589654700968814e-06, + "loss": 0.6914, + "step": 47011 + }, + { + "epoch": 1.2, + "learning_rate": 1.3589396437180645e-06, + "loss": 0.833, + "step": 47012 + }, + { + "epoch": 1.2, + "learning_rate": 1.3589138170644241e-06, + "loss": 0.5352, + "step": 47013 + }, + { + "epoch": 1.2, + "learning_rate": 1.3588879901359796e-06, + "loss": 0.5586, + "step": 47014 + }, + { + "epoch": 1.21, + "learning_rate": 1.3588621629327514e-06, + "loss": 0.708, + "step": 47015 + }, + { + "epoch": 1.21, + "learning_rate": 1.3588363354547584e-06, + "loss": 0.5698, + "step": 47016 + }, + { + "epoch": 1.21, + "learning_rate": 1.3588105077020215e-06, + "loss": 0.6875, + "step": 47017 + }, + { + "epoch": 1.21, + "learning_rate": 1.3587846796745597e-06, + "loss": 0.5615, + "step": 47018 + }, + { + "epoch": 1.21, + "learning_rate": 1.358758851372393e-06, + "loss": 0.7754, + "step": 47019 + }, + { + "epoch": 1.21, + "learning_rate": 1.3587330227955411e-06, + "loss": 0.6763, + "step": 47020 + }, + { + "epoch": 1.21, + "learning_rate": 1.3587071939440237e-06, + "loss": 0.5547, + "step": 47021 + }, + { + "epoch": 1.21, + "learning_rate": 1.3586813648178609e-06, + "loss": 0.6724, + "step": 47022 + }, + { + "epoch": 1.21, + "learning_rate": 1.3586555354170722e-06, + "loss": 0.7588, + "step": 47023 + }, + { + "epoch": 1.21, + "learning_rate": 1.3586297057416776e-06, + "loss": 0.7246, + "step": 47024 + }, + { + "epoch": 1.21, + "learning_rate": 1.3586038757916965e-06, + "loss": 0.5735, + "step": 47025 + }, + { + "epoch": 1.21, + "learning_rate": 1.3585780455671488e-06, + "loss": 0.4934, + "step": 47026 + }, + { + "epoch": 1.21, + "learning_rate": 1.3585522150680546e-06, + "loss": 0.7471, + "step": 47027 + }, + { + "epoch": 1.21, + "learning_rate": 1.3585263842944335e-06, + "loss": 0.6387, + "step": 47028 + }, + { + "epoch": 1.21, + "learning_rate": 1.3585005532463049e-06, + "loss": 0.4403, + "step": 47029 + }, + { + "epoch": 1.21, + "learning_rate": 1.3584747219236893e-06, + "loss": 0.7129, + "step": 47030 + }, + { + "epoch": 1.21, + "learning_rate": 1.3584488903266058e-06, + "loss": 0.6177, + "step": 47031 + }, + { + "epoch": 1.21, + "learning_rate": 1.3584230584550746e-06, + "loss": 0.7197, + "step": 47032 + }, + { + "epoch": 1.21, + "learning_rate": 1.3583972263091154e-06, + "loss": 0.5186, + "step": 47033 + }, + { + "epoch": 1.21, + "learning_rate": 1.358371393888748e-06, + "loss": 0.4417, + "step": 47034 + }, + { + "epoch": 1.21, + "learning_rate": 1.3583455611939917e-06, + "loss": 0.7139, + "step": 47035 + }, + { + "epoch": 1.21, + "learning_rate": 1.358319728224867e-06, + "loss": 0.6826, + "step": 47036 + }, + { + "epoch": 1.21, + "learning_rate": 1.3582938949813934e-06, + "loss": 0.7314, + "step": 47037 + }, + { + "epoch": 1.21, + "learning_rate": 1.358268061463591e-06, + "loss": 0.5228, + "step": 47038 + }, + { + "epoch": 1.21, + "learning_rate": 1.3582422276714783e-06, + "loss": 0.749, + "step": 47039 + }, + { + "epoch": 1.21, + "learning_rate": 1.3582163936050765e-06, + "loss": 0.6084, + "step": 47040 + }, + { + "epoch": 1.21, + "learning_rate": 1.3581905592644046e-06, + "loss": 0.5762, + "step": 47041 + }, + { + "epoch": 1.21, + "learning_rate": 1.3581647246494832e-06, + "loss": 0.5703, + "step": 47042 + }, + { + "epoch": 1.21, + "learning_rate": 1.3581388897603312e-06, + "loss": 0.6533, + "step": 47043 + }, + { + "epoch": 1.21, + "learning_rate": 1.358113054596969e-06, + "loss": 0.4531, + "step": 47044 + }, + { + "epoch": 1.21, + "learning_rate": 1.3580872191594157e-06, + "loss": 0.7227, + "step": 47045 + }, + { + "epoch": 1.21, + "learning_rate": 1.3580613834476916e-06, + "loss": 0.6797, + "step": 47046 + }, + { + "epoch": 1.21, + "learning_rate": 1.3580355474618164e-06, + "loss": 0.665, + "step": 47047 + }, + { + "epoch": 1.21, + "learning_rate": 1.3580097112018098e-06, + "loss": 0.6621, + "step": 47048 + }, + { + "epoch": 1.21, + "learning_rate": 1.3579838746676916e-06, + "loss": 0.564, + "step": 47049 + }, + { + "epoch": 1.21, + "learning_rate": 1.3579580378594817e-06, + "loss": 0.3911, + "step": 47050 + }, + { + "epoch": 1.21, + "learning_rate": 1.3579322007771998e-06, + "loss": 0.749, + "step": 47051 + }, + { + "epoch": 1.21, + "learning_rate": 1.3579063634208655e-06, + "loss": 0.5708, + "step": 47052 + }, + { + "epoch": 1.21, + "learning_rate": 1.3578805257904994e-06, + "loss": 0.5405, + "step": 47053 + }, + { + "epoch": 1.21, + "learning_rate": 1.3578546878861197e-06, + "loss": 0.7578, + "step": 47054 + }, + { + "epoch": 1.21, + "learning_rate": 1.3578288497077478e-06, + "loss": 0.6025, + "step": 47055 + }, + { + "epoch": 1.21, + "learning_rate": 1.3578030112554024e-06, + "loss": 0.7285, + "step": 47056 + }, + { + "epoch": 1.21, + "learning_rate": 1.357777172529104e-06, + "loss": 0.6709, + "step": 47057 + }, + { + "epoch": 1.21, + "learning_rate": 1.357751333528872e-06, + "loss": 0.5142, + "step": 47058 + }, + { + "epoch": 1.21, + "learning_rate": 1.357725494254726e-06, + "loss": 0.6396, + "step": 47059 + }, + { + "epoch": 1.21, + "learning_rate": 1.357699654706686e-06, + "loss": 0.7383, + "step": 47060 + }, + { + "epoch": 1.21, + "learning_rate": 1.357673814884772e-06, + "loss": 0.791, + "step": 47061 + }, + { + "epoch": 1.21, + "learning_rate": 1.3576479747890037e-06, + "loss": 0.6689, + "step": 47062 + }, + { + "epoch": 1.21, + "learning_rate": 1.357622134419401e-06, + "loss": 0.7861, + "step": 47063 + }, + { + "epoch": 1.21, + "learning_rate": 1.3575962937759831e-06, + "loss": 0.5149, + "step": 47064 + }, + { + "epoch": 1.21, + "learning_rate": 1.3575704528587704e-06, + "loss": 0.5942, + "step": 47065 + }, + { + "epoch": 1.21, + "learning_rate": 1.357544611667782e-06, + "loss": 0.5305, + "step": 47066 + }, + { + "epoch": 1.21, + "learning_rate": 1.3575187702030387e-06, + "loss": 0.6553, + "step": 47067 + }, + { + "epoch": 1.21, + "learning_rate": 1.3574929284645596e-06, + "loss": 0.6816, + "step": 47068 + }, + { + "epoch": 1.21, + "learning_rate": 1.357467086452364e-06, + "loss": 0.499, + "step": 47069 + }, + { + "epoch": 1.21, + "learning_rate": 1.357441244166473e-06, + "loss": 0.6504, + "step": 47070 + }, + { + "epoch": 1.21, + "learning_rate": 1.3574154016069054e-06, + "loss": 0.5835, + "step": 47071 + }, + { + "epoch": 1.21, + "learning_rate": 1.3573895587736813e-06, + "loss": 0.5366, + "step": 47072 + }, + { + "epoch": 1.21, + "learning_rate": 1.3573637156668202e-06, + "loss": 0.7588, + "step": 47073 + }, + { + "epoch": 1.21, + "learning_rate": 1.3573378722863427e-06, + "loss": 0.6016, + "step": 47074 + }, + { + "epoch": 1.21, + "learning_rate": 1.3573120286322674e-06, + "loss": 0.7598, + "step": 47075 + }, + { + "epoch": 1.21, + "learning_rate": 1.3572861847046151e-06, + "loss": 0.7607, + "step": 47076 + }, + { + "epoch": 1.21, + "learning_rate": 1.357260340503405e-06, + "loss": 0.6802, + "step": 47077 + }, + { + "epoch": 1.21, + "learning_rate": 1.3572344960286575e-06, + "loss": 0.7129, + "step": 47078 + }, + { + "epoch": 1.21, + "learning_rate": 1.3572086512803915e-06, + "loss": 0.6479, + "step": 47079 + }, + { + "epoch": 1.21, + "learning_rate": 1.3571828062586275e-06, + "loss": 0.5781, + "step": 47080 + }, + { + "epoch": 1.21, + "learning_rate": 1.3571569609633846e-06, + "loss": 0.5933, + "step": 47081 + }, + { + "epoch": 1.21, + "learning_rate": 1.3571311153946837e-06, + "loss": 0.5835, + "step": 47082 + }, + { + "epoch": 1.21, + "learning_rate": 1.3571052695525436e-06, + "loss": 0.6704, + "step": 47083 + }, + { + "epoch": 1.21, + "learning_rate": 1.3570794234369844e-06, + "loss": 0.6543, + "step": 47084 + }, + { + "epoch": 1.21, + "learning_rate": 1.3570535770480259e-06, + "loss": 0.4556, + "step": 47085 + }, + { + "epoch": 1.21, + "learning_rate": 1.357027730385688e-06, + "loss": 0.5669, + "step": 47086 + }, + { + "epoch": 1.21, + "learning_rate": 1.3570018834499903e-06, + "loss": 0.6123, + "step": 47087 + }, + { + "epoch": 1.21, + "learning_rate": 1.356976036240953e-06, + "loss": 0.4368, + "step": 47088 + }, + { + "epoch": 1.21, + "learning_rate": 1.3569501887585951e-06, + "loss": 0.4926, + "step": 47089 + }, + { + "epoch": 1.21, + "learning_rate": 1.356924341002937e-06, + "loss": 0.6777, + "step": 47090 + }, + { + "epoch": 1.21, + "learning_rate": 1.3568984929739982e-06, + "loss": 0.4597, + "step": 47091 + }, + { + "epoch": 1.21, + "learning_rate": 1.356872644671799e-06, + "loss": 0.7173, + "step": 47092 + }, + { + "epoch": 1.21, + "learning_rate": 1.3568467960963585e-06, + "loss": 0.6299, + "step": 47093 + }, + { + "epoch": 1.21, + "learning_rate": 1.3568209472476967e-06, + "loss": 0.7354, + "step": 47094 + }, + { + "epoch": 1.21, + "learning_rate": 1.356795098125834e-06, + "loss": 0.6982, + "step": 47095 + }, + { + "epoch": 1.21, + "learning_rate": 1.3567692487307892e-06, + "loss": 0.6631, + "step": 47096 + }, + { + "epoch": 1.21, + "learning_rate": 1.3567433990625829e-06, + "loss": 0.6069, + "step": 47097 + }, + { + "epoch": 1.21, + "learning_rate": 1.3567175491212347e-06, + "loss": 0.707, + "step": 47098 + }, + { + "epoch": 1.21, + "learning_rate": 1.356691698906764e-06, + "loss": 0.4517, + "step": 47099 + }, + { + "epoch": 1.21, + "learning_rate": 1.356665848419191e-06, + "loss": 0.7822, + "step": 47100 + }, + { + "epoch": 1.21, + "learning_rate": 1.3566399976585353e-06, + "loss": 0.6501, + "step": 47101 + }, + { + "epoch": 1.21, + "learning_rate": 1.3566141466248167e-06, + "loss": 0.4916, + "step": 47102 + }, + { + "epoch": 1.21, + "learning_rate": 1.3565882953180552e-06, + "loss": 0.5762, + "step": 47103 + }, + { + "epoch": 1.21, + "learning_rate": 1.3565624437382704e-06, + "loss": 0.6338, + "step": 47104 + }, + { + "epoch": 1.21, + "learning_rate": 1.356536591885482e-06, + "loss": 0.5742, + "step": 47105 + }, + { + "epoch": 1.21, + "learning_rate": 1.35651073975971e-06, + "loss": 0.4518, + "step": 47106 + }, + { + "epoch": 1.21, + "learning_rate": 1.356484887360974e-06, + "loss": 0.6797, + "step": 47107 + }, + { + "epoch": 1.21, + "learning_rate": 1.3564590346892941e-06, + "loss": 0.5532, + "step": 47108 + }, + { + "epoch": 1.21, + "learning_rate": 1.35643318174469e-06, + "loss": 0.7734, + "step": 47109 + }, + { + "epoch": 1.21, + "learning_rate": 1.3564073285271812e-06, + "loss": 0.6006, + "step": 47110 + }, + { + "epoch": 1.21, + "learning_rate": 1.3563814750367878e-06, + "loss": 0.6431, + "step": 47111 + }, + { + "epoch": 1.21, + "learning_rate": 1.3563556212735293e-06, + "loss": 0.5144, + "step": 47112 + }, + { + "epoch": 1.21, + "learning_rate": 1.3563297672374258e-06, + "loss": 0.6514, + "step": 47113 + }, + { + "epoch": 1.21, + "learning_rate": 1.3563039129284972e-06, + "loss": 0.4938, + "step": 47114 + }, + { + "epoch": 1.21, + "learning_rate": 1.3562780583467629e-06, + "loss": 0.7632, + "step": 47115 + }, + { + "epoch": 1.21, + "learning_rate": 1.3562522034922426e-06, + "loss": 0.7183, + "step": 47116 + }, + { + "epoch": 1.21, + "learning_rate": 1.3562263483649567e-06, + "loss": 0.6318, + "step": 47117 + }, + { + "epoch": 1.21, + "learning_rate": 1.3562004929649246e-06, + "loss": 0.5854, + "step": 47118 + }, + { + "epoch": 1.21, + "learning_rate": 1.356174637292166e-06, + "loss": 0.7598, + "step": 47119 + }, + { + "epoch": 1.21, + "learning_rate": 1.3561487813467012e-06, + "loss": 0.6855, + "step": 47120 + }, + { + "epoch": 1.21, + "learning_rate": 1.3561229251285494e-06, + "loss": 0.5201, + "step": 47121 + }, + { + "epoch": 1.21, + "learning_rate": 1.3560970686377307e-06, + "loss": 0.877, + "step": 47122 + }, + { + "epoch": 1.21, + "learning_rate": 1.356071211874265e-06, + "loss": 0.6904, + "step": 47123 + }, + { + "epoch": 1.21, + "learning_rate": 1.356045354838172e-06, + "loss": 0.5317, + "step": 47124 + }, + { + "epoch": 1.21, + "learning_rate": 1.3560194975294709e-06, + "loss": 0.7197, + "step": 47125 + }, + { + "epoch": 1.21, + "learning_rate": 1.3559936399481826e-06, + "loss": 0.6113, + "step": 47126 + }, + { + "epoch": 1.21, + "learning_rate": 1.355967782094326e-06, + "loss": 0.7014, + "step": 47127 + }, + { + "epoch": 1.21, + "learning_rate": 1.3559419239679214e-06, + "loss": 0.5869, + "step": 47128 + }, + { + "epoch": 1.21, + "learning_rate": 1.3559160655689886e-06, + "loss": 0.7949, + "step": 47129 + }, + { + "epoch": 1.21, + "learning_rate": 1.3558902068975469e-06, + "loss": 0.5298, + "step": 47130 + }, + { + "epoch": 1.21, + "learning_rate": 1.3558643479536165e-06, + "loss": 0.6025, + "step": 47131 + }, + { + "epoch": 1.21, + "learning_rate": 1.3558384887372173e-06, + "loss": 0.8848, + "step": 47132 + }, + { + "epoch": 1.21, + "learning_rate": 1.3558126292483687e-06, + "loss": 0.6729, + "step": 47133 + }, + { + "epoch": 1.21, + "learning_rate": 1.355786769487091e-06, + "loss": 0.7168, + "step": 47134 + }, + { + "epoch": 1.21, + "learning_rate": 1.3557609094534036e-06, + "loss": 0.4663, + "step": 47135 + }, + { + "epoch": 1.21, + "learning_rate": 1.3557350491473263e-06, + "loss": 0.6304, + "step": 47136 + }, + { + "epoch": 1.21, + "learning_rate": 1.3557091885688795e-06, + "loss": 0.6113, + "step": 47137 + }, + { + "epoch": 1.21, + "learning_rate": 1.355683327718082e-06, + "loss": 0.7637, + "step": 47138 + }, + { + "epoch": 1.21, + "learning_rate": 1.3556574665949543e-06, + "loss": 0.5059, + "step": 47139 + }, + { + "epoch": 1.21, + "learning_rate": 1.3556316051995158e-06, + "loss": 0.7104, + "step": 47140 + }, + { + "epoch": 1.21, + "learning_rate": 1.355605743531787e-06, + "loss": 0.7949, + "step": 47141 + }, + { + "epoch": 1.21, + "learning_rate": 1.355579881591787e-06, + "loss": 0.6782, + "step": 47142 + }, + { + "epoch": 1.21, + "learning_rate": 1.355554019379536e-06, + "loss": 0.5762, + "step": 47143 + }, + { + "epoch": 1.21, + "learning_rate": 1.3555281568950532e-06, + "loss": 0.6724, + "step": 47144 + }, + { + "epoch": 1.21, + "learning_rate": 1.355502294138359e-06, + "loss": 0.5684, + "step": 47145 + }, + { + "epoch": 1.21, + "learning_rate": 1.3554764311094732e-06, + "loss": 0.5034, + "step": 47146 + }, + { + "epoch": 1.21, + "learning_rate": 1.3554505678084156e-06, + "loss": 0.7827, + "step": 47147 + }, + { + "epoch": 1.21, + "learning_rate": 1.3554247042352056e-06, + "loss": 0.6899, + "step": 47148 + }, + { + "epoch": 1.21, + "learning_rate": 1.3553988403898634e-06, + "loss": 0.667, + "step": 47149 + }, + { + "epoch": 1.21, + "learning_rate": 1.3553729762724083e-06, + "loss": 0.5884, + "step": 47150 + }, + { + "epoch": 1.21, + "learning_rate": 1.3553471118828608e-06, + "loss": 0.6592, + "step": 47151 + }, + { + "epoch": 1.21, + "learning_rate": 1.3553212472212402e-06, + "loss": 0.5728, + "step": 47152 + }, + { + "epoch": 1.21, + "learning_rate": 1.3552953822875668e-06, + "loss": 0.717, + "step": 47153 + }, + { + "epoch": 1.21, + "learning_rate": 1.3552695170818596e-06, + "loss": 0.6602, + "step": 47154 + }, + { + "epoch": 1.21, + "learning_rate": 1.3552436516041393e-06, + "loss": 0.6284, + "step": 47155 + }, + { + "epoch": 1.21, + "learning_rate": 1.3552177858544248e-06, + "loss": 0.624, + "step": 47156 + }, + { + "epoch": 1.21, + "learning_rate": 1.3551919198327367e-06, + "loss": 0.6191, + "step": 47157 + }, + { + "epoch": 1.21, + "learning_rate": 1.3551660535390943e-06, + "loss": 0.6372, + "step": 47158 + }, + { + "epoch": 1.21, + "learning_rate": 1.3551401869735174e-06, + "loss": 0.572, + "step": 47159 + }, + { + "epoch": 1.21, + "learning_rate": 1.3551143201360265e-06, + "loss": 0.6362, + "step": 47160 + }, + { + "epoch": 1.21, + "learning_rate": 1.3550884530266403e-06, + "loss": 0.7012, + "step": 47161 + }, + { + "epoch": 1.21, + "learning_rate": 1.3550625856453799e-06, + "loss": 0.8115, + "step": 47162 + }, + { + "epoch": 1.21, + "learning_rate": 1.355036717992264e-06, + "loss": 0.5994, + "step": 47163 + }, + { + "epoch": 1.21, + "learning_rate": 1.3550108500673128e-06, + "loss": 0.5446, + "step": 47164 + }, + { + "epoch": 1.21, + "learning_rate": 1.3549849818705461e-06, + "loss": 0.8359, + "step": 47165 + }, + { + "epoch": 1.21, + "learning_rate": 1.3549591134019838e-06, + "loss": 0.6768, + "step": 47166 + }, + { + "epoch": 1.21, + "learning_rate": 1.3549332446616454e-06, + "loss": 0.5354, + "step": 47167 + }, + { + "epoch": 1.21, + "learning_rate": 1.3549073756495516e-06, + "loss": 0.7168, + "step": 47168 + }, + { + "epoch": 1.21, + "learning_rate": 1.3548815063657209e-06, + "loss": 0.6348, + "step": 47169 + }, + { + "epoch": 1.21, + "learning_rate": 1.354855636810174e-06, + "loss": 0.5312, + "step": 47170 + }, + { + "epoch": 1.21, + "learning_rate": 1.35482976698293e-06, + "loss": 0.6328, + "step": 47171 + }, + { + "epoch": 1.21, + "learning_rate": 1.35480389688401e-06, + "loss": 0.4346, + "step": 47172 + }, + { + "epoch": 1.21, + "learning_rate": 1.3547780265134322e-06, + "loss": 0.5049, + "step": 47173 + }, + { + "epoch": 1.21, + "learning_rate": 1.3547521558712176e-06, + "loss": 0.7158, + "step": 47174 + }, + { + "epoch": 1.21, + "learning_rate": 1.3547262849573854e-06, + "loss": 0.5918, + "step": 47175 + }, + { + "epoch": 1.21, + "learning_rate": 1.3547004137719558e-06, + "loss": 0.7061, + "step": 47176 + }, + { + "epoch": 1.21, + "learning_rate": 1.3546745423149483e-06, + "loss": 0.7954, + "step": 47177 + }, + { + "epoch": 1.21, + "learning_rate": 1.354648670586383e-06, + "loss": 0.8486, + "step": 47178 + }, + { + "epoch": 1.21, + "learning_rate": 1.354622798586279e-06, + "loss": 0.5283, + "step": 47179 + }, + { + "epoch": 1.21, + "learning_rate": 1.354596926314657e-06, + "loss": 0.707, + "step": 47180 + }, + { + "epoch": 1.21, + "learning_rate": 1.3545710537715365e-06, + "loss": 0.7617, + "step": 47181 + }, + { + "epoch": 1.21, + "learning_rate": 1.354545180956937e-06, + "loss": 0.6519, + "step": 47182 + }, + { + "epoch": 1.21, + "learning_rate": 1.3545193078708788e-06, + "loss": 0.7793, + "step": 47183 + }, + { + "epoch": 1.21, + "learning_rate": 1.3544934345133812e-06, + "loss": 0.6724, + "step": 47184 + }, + { + "epoch": 1.21, + "learning_rate": 1.3544675608844646e-06, + "loss": 0.7119, + "step": 47185 + }, + { + "epoch": 1.21, + "learning_rate": 1.3544416869841482e-06, + "loss": 0.6621, + "step": 47186 + }, + { + "epoch": 1.21, + "learning_rate": 1.3544158128124523e-06, + "loss": 0.8545, + "step": 47187 + }, + { + "epoch": 1.21, + "learning_rate": 1.3543899383693964e-06, + "loss": 0.6514, + "step": 47188 + }, + { + "epoch": 1.21, + "learning_rate": 1.3543640636550005e-06, + "loss": 0.7559, + "step": 47189 + }, + { + "epoch": 1.21, + "learning_rate": 1.3543381886692843e-06, + "loss": 0.5964, + "step": 47190 + }, + { + "epoch": 1.21, + "learning_rate": 1.3543123134122676e-06, + "loss": 0.7861, + "step": 47191 + }, + { + "epoch": 1.21, + "learning_rate": 1.3542864378839703e-06, + "loss": 0.6895, + "step": 47192 + }, + { + "epoch": 1.21, + "learning_rate": 1.3542605620844123e-06, + "loss": 0.543, + "step": 47193 + }, + { + "epoch": 1.21, + "learning_rate": 1.3542346860136128e-06, + "loss": 0.668, + "step": 47194 + }, + { + "epoch": 1.21, + "learning_rate": 1.3542088096715925e-06, + "loss": 0.6455, + "step": 47195 + }, + { + "epoch": 1.21, + "learning_rate": 1.3541829330583706e-06, + "loss": 0.6616, + "step": 47196 + }, + { + "epoch": 1.21, + "learning_rate": 1.3541570561739674e-06, + "loss": 0.6904, + "step": 47197 + }, + { + "epoch": 1.21, + "learning_rate": 1.3541311790184022e-06, + "loss": 0.752, + "step": 47198 + }, + { + "epoch": 1.21, + "learning_rate": 1.3541053015916952e-06, + "loss": 0.7402, + "step": 47199 + }, + { + "epoch": 1.21, + "learning_rate": 1.3540794238938657e-06, + "loss": 0.5176, + "step": 47200 + }, + { + "epoch": 1.21, + "learning_rate": 1.3540535459249342e-06, + "loss": 0.6074, + "step": 47201 + }, + { + "epoch": 1.21, + "learning_rate": 1.3540276676849201e-06, + "loss": 0.709, + "step": 47202 + }, + { + "epoch": 1.21, + "learning_rate": 1.3540017891738432e-06, + "loss": 0.5273, + "step": 47203 + }, + { + "epoch": 1.21, + "learning_rate": 1.3539759103917235e-06, + "loss": 0.6289, + "step": 47204 + }, + { + "epoch": 1.21, + "learning_rate": 1.3539500313385809e-06, + "loss": 0.563, + "step": 47205 + }, + { + "epoch": 1.21, + "learning_rate": 1.3539241520144347e-06, + "loss": 0.6895, + "step": 47206 + }, + { + "epoch": 1.21, + "learning_rate": 1.3538982724193054e-06, + "loss": 0.6802, + "step": 47207 + }, + { + "epoch": 1.21, + "learning_rate": 1.3538723925532121e-06, + "loss": 0.6357, + "step": 47208 + }, + { + "epoch": 1.21, + "learning_rate": 1.353846512416175e-06, + "loss": 0.5571, + "step": 47209 + }, + { + "epoch": 1.21, + "learning_rate": 1.3538206320082143e-06, + "loss": 0.6602, + "step": 47210 + }, + { + "epoch": 1.21, + "learning_rate": 1.3537947513293488e-06, + "loss": 0.5371, + "step": 47211 + }, + { + "epoch": 1.21, + "learning_rate": 1.3537688703795995e-06, + "loss": 0.5542, + "step": 47212 + }, + { + "epoch": 1.21, + "learning_rate": 1.3537429891589854e-06, + "loss": 0.6514, + "step": 47213 + }, + { + "epoch": 1.21, + "learning_rate": 1.3537171076675267e-06, + "loss": 0.7207, + "step": 47214 + }, + { + "epoch": 1.21, + "learning_rate": 1.3536912259052426e-06, + "loss": 0.6494, + "step": 47215 + }, + { + "epoch": 1.21, + "learning_rate": 1.3536653438721538e-06, + "loss": 0.3652, + "step": 47216 + }, + { + "epoch": 1.21, + "learning_rate": 1.3536394615682799e-06, + "loss": 0.749, + "step": 47217 + }, + { + "epoch": 1.21, + "learning_rate": 1.3536135789936403e-06, + "loss": 0.561, + "step": 47218 + }, + { + "epoch": 1.21, + "learning_rate": 1.3535876961482548e-06, + "loss": 0.6006, + "step": 47219 + }, + { + "epoch": 1.21, + "learning_rate": 1.3535618130321438e-06, + "loss": 0.5864, + "step": 47220 + }, + { + "epoch": 1.21, + "learning_rate": 1.3535359296453265e-06, + "loss": 0.5703, + "step": 47221 + }, + { + "epoch": 1.21, + "learning_rate": 1.3535100459878233e-06, + "loss": 0.5713, + "step": 47222 + }, + { + "epoch": 1.21, + "learning_rate": 1.3534841620596535e-06, + "loss": 0.6387, + "step": 47223 + }, + { + "epoch": 1.21, + "learning_rate": 1.3534582778608372e-06, + "loss": 0.7402, + "step": 47224 + }, + { + "epoch": 1.21, + "learning_rate": 1.3534323933913944e-06, + "loss": 0.5723, + "step": 47225 + }, + { + "epoch": 1.21, + "learning_rate": 1.3534065086513441e-06, + "loss": 0.75, + "step": 47226 + }, + { + "epoch": 1.21, + "learning_rate": 1.353380623640707e-06, + "loss": 0.7485, + "step": 47227 + }, + { + "epoch": 1.21, + "learning_rate": 1.3533547383595026e-06, + "loss": 0.5532, + "step": 47228 + }, + { + "epoch": 1.21, + "learning_rate": 1.3533288528077508e-06, + "loss": 0.6465, + "step": 47229 + }, + { + "epoch": 1.21, + "learning_rate": 1.3533029669854712e-06, + "loss": 0.8955, + "step": 47230 + }, + { + "epoch": 1.21, + "learning_rate": 1.353277080892684e-06, + "loss": 0.7007, + "step": 47231 + }, + { + "epoch": 1.21, + "learning_rate": 1.3532511945294085e-06, + "loss": 0.7949, + "step": 47232 + }, + { + "epoch": 1.21, + "learning_rate": 1.353225307895665e-06, + "loss": 0.6753, + "step": 47233 + }, + { + "epoch": 1.21, + "learning_rate": 1.3531994209914729e-06, + "loss": 0.6504, + "step": 47234 + }, + { + "epoch": 1.21, + "learning_rate": 1.3531735338168524e-06, + "loss": 0.6768, + "step": 47235 + }, + { + "epoch": 1.21, + "learning_rate": 1.353147646371823e-06, + "loss": 0.6909, + "step": 47236 + }, + { + "epoch": 1.21, + "learning_rate": 1.3531217586564052e-06, + "loss": 0.646, + "step": 47237 + }, + { + "epoch": 1.21, + "learning_rate": 1.3530958706706176e-06, + "loss": 0.5923, + "step": 47238 + }, + { + "epoch": 1.21, + "learning_rate": 1.3530699824144814e-06, + "loss": 0.5652, + "step": 47239 + }, + { + "epoch": 1.21, + "learning_rate": 1.3530440938880151e-06, + "loss": 0.6357, + "step": 47240 + }, + { + "epoch": 1.21, + "learning_rate": 1.3530182050912395e-06, + "loss": 0.6489, + "step": 47241 + }, + { + "epoch": 1.21, + "learning_rate": 1.3529923160241742e-06, + "loss": 0.6719, + "step": 47242 + }, + { + "epoch": 1.21, + "learning_rate": 1.352966426686839e-06, + "loss": 0.5923, + "step": 47243 + }, + { + "epoch": 1.21, + "learning_rate": 1.3529405370792533e-06, + "loss": 0.8174, + "step": 47244 + }, + { + "epoch": 1.21, + "learning_rate": 1.3529146472014374e-06, + "loss": 0.5869, + "step": 47245 + }, + { + "epoch": 1.21, + "learning_rate": 1.352888757053411e-06, + "loss": 0.7305, + "step": 47246 + }, + { + "epoch": 1.21, + "learning_rate": 1.3528628666351938e-06, + "loss": 0.6963, + "step": 47247 + }, + { + "epoch": 1.21, + "learning_rate": 1.352836975946806e-06, + "loss": 0.4856, + "step": 47248 + }, + { + "epoch": 1.21, + "learning_rate": 1.3528110849882665e-06, + "loss": 0.4458, + "step": 47249 + }, + { + "epoch": 1.21, + "learning_rate": 1.3527851937595964e-06, + "loss": 0.6621, + "step": 47250 + }, + { + "epoch": 1.21, + "learning_rate": 1.3527593022608147e-06, + "loss": 0.4629, + "step": 47251 + }, + { + "epoch": 1.21, + "learning_rate": 1.3527334104919418e-06, + "loss": 0.4685, + "step": 47252 + }, + { + "epoch": 1.21, + "learning_rate": 1.3527075184529965e-06, + "loss": 0.6494, + "step": 47253 + }, + { + "epoch": 1.21, + "learning_rate": 1.3526816261439997e-06, + "loss": 0.6387, + "step": 47254 + }, + { + "epoch": 1.21, + "learning_rate": 1.3526557335649704e-06, + "loss": 0.6055, + "step": 47255 + }, + { + "epoch": 1.21, + "learning_rate": 1.3526298407159294e-06, + "loss": 0.479, + "step": 47256 + }, + { + "epoch": 1.21, + "learning_rate": 1.3526039475968956e-06, + "loss": 0.5815, + "step": 47257 + }, + { + "epoch": 1.21, + "learning_rate": 1.3525780542078892e-06, + "loss": 0.5942, + "step": 47258 + }, + { + "epoch": 1.21, + "learning_rate": 1.35255216054893e-06, + "loss": 0.7637, + "step": 47259 + }, + { + "epoch": 1.21, + "learning_rate": 1.3525262666200378e-06, + "loss": 0.5747, + "step": 47260 + }, + { + "epoch": 1.21, + "learning_rate": 1.3525003724212323e-06, + "loss": 0.5918, + "step": 47261 + }, + { + "epoch": 1.21, + "learning_rate": 1.3524744779525339e-06, + "loss": 0.7207, + "step": 47262 + }, + { + "epoch": 1.21, + "learning_rate": 1.3524485832139617e-06, + "loss": 0.5685, + "step": 47263 + }, + { + "epoch": 1.21, + "learning_rate": 1.3524226882055358e-06, + "loss": 0.7217, + "step": 47264 + }, + { + "epoch": 1.21, + "learning_rate": 1.3523967929272762e-06, + "loss": 0.646, + "step": 47265 + }, + { + "epoch": 1.21, + "learning_rate": 1.3523708973792024e-06, + "loss": 0.5083, + "step": 47266 + }, + { + "epoch": 1.21, + "learning_rate": 1.3523450015613347e-06, + "loss": 0.7285, + "step": 47267 + }, + { + "epoch": 1.21, + "learning_rate": 1.3523191054736925e-06, + "loss": 0.5603, + "step": 47268 + }, + { + "epoch": 1.21, + "learning_rate": 1.3522932091162955e-06, + "loss": 0.7046, + "step": 47269 + }, + { + "epoch": 1.21, + "learning_rate": 1.3522673124891642e-06, + "loss": 0.572, + "step": 47270 + }, + { + "epoch": 1.21, + "learning_rate": 1.3522414155923176e-06, + "loss": 0.6309, + "step": 47271 + }, + { + "epoch": 1.21, + "learning_rate": 1.3522155184257763e-06, + "loss": 0.605, + "step": 47272 + }, + { + "epoch": 1.21, + "learning_rate": 1.3521896209895596e-06, + "loss": 0.5378, + "step": 47273 + }, + { + "epoch": 1.21, + "learning_rate": 1.3521637232836874e-06, + "loss": 0.7617, + "step": 47274 + }, + { + "epoch": 1.21, + "learning_rate": 1.3521378253081796e-06, + "loss": 0.6455, + "step": 47275 + }, + { + "epoch": 1.21, + "learning_rate": 1.3521119270630564e-06, + "loss": 0.6436, + "step": 47276 + }, + { + "epoch": 1.21, + "learning_rate": 1.3520860285483372e-06, + "loss": 0.8193, + "step": 47277 + }, + { + "epoch": 1.21, + "learning_rate": 1.3520601297640418e-06, + "loss": 0.6816, + "step": 47278 + }, + { + "epoch": 1.21, + "learning_rate": 1.3520342307101901e-06, + "loss": 0.7188, + "step": 47279 + }, + { + "epoch": 1.21, + "learning_rate": 1.3520083313868018e-06, + "loss": 0.5571, + "step": 47280 + }, + { + "epoch": 1.21, + "learning_rate": 1.3519824317938973e-06, + "loss": 0.626, + "step": 47281 + }, + { + "epoch": 1.21, + "learning_rate": 1.351956531931496e-06, + "loss": 0.752, + "step": 47282 + }, + { + "epoch": 1.21, + "learning_rate": 1.3519306317996177e-06, + "loss": 0.7803, + "step": 47283 + }, + { + "epoch": 1.21, + "learning_rate": 1.3519047313982821e-06, + "loss": 0.7246, + "step": 47284 + }, + { + "epoch": 1.21, + "learning_rate": 1.3518788307275096e-06, + "loss": 0.606, + "step": 47285 + }, + { + "epoch": 1.21, + "learning_rate": 1.3518529297873192e-06, + "loss": 0.5508, + "step": 47286 + }, + { + "epoch": 1.21, + "learning_rate": 1.3518270285777317e-06, + "loss": 0.5342, + "step": 47287 + }, + { + "epoch": 1.21, + "learning_rate": 1.3518011270987658e-06, + "loss": 0.6479, + "step": 47288 + }, + { + "epoch": 1.21, + "learning_rate": 1.3517752253504427e-06, + "loss": 0.6943, + "step": 47289 + }, + { + "epoch": 1.21, + "learning_rate": 1.3517493233327808e-06, + "loss": 0.7441, + "step": 47290 + }, + { + "epoch": 1.21, + "learning_rate": 1.3517234210458008e-06, + "loss": 0.6367, + "step": 47291 + }, + { + "epoch": 1.21, + "learning_rate": 1.3516975184895226e-06, + "loss": 0.7412, + "step": 47292 + }, + { + "epoch": 1.21, + "learning_rate": 1.3516716156639656e-06, + "loss": 0.6914, + "step": 47293 + }, + { + "epoch": 1.21, + "learning_rate": 1.3516457125691497e-06, + "loss": 0.5273, + "step": 47294 + }, + { + "epoch": 1.21, + "learning_rate": 1.3516198092050951e-06, + "loss": 0.7217, + "step": 47295 + }, + { + "epoch": 1.21, + "learning_rate": 1.3515939055718213e-06, + "loss": 0.6841, + "step": 47296 + }, + { + "epoch": 1.21, + "learning_rate": 1.3515680016693483e-06, + "loss": 0.6958, + "step": 47297 + }, + { + "epoch": 1.21, + "learning_rate": 1.3515420974976956e-06, + "loss": 0.7178, + "step": 47298 + }, + { + "epoch": 1.21, + "learning_rate": 1.3515161930568834e-06, + "loss": 0.5942, + "step": 47299 + }, + { + "epoch": 1.21, + "learning_rate": 1.3514902883469314e-06, + "loss": 0.5842, + "step": 47300 + }, + { + "epoch": 1.21, + "learning_rate": 1.3514643833678594e-06, + "loss": 0.5293, + "step": 47301 + }, + { + "epoch": 1.21, + "learning_rate": 1.3514384781196878e-06, + "loss": 0.6846, + "step": 47302 + }, + { + "epoch": 1.21, + "learning_rate": 1.3514125726024352e-06, + "loss": 0.5327, + "step": 47303 + }, + { + "epoch": 1.21, + "learning_rate": 1.3513866668161224e-06, + "loss": 0.6719, + "step": 47304 + }, + { + "epoch": 1.21, + "learning_rate": 1.3513607607607688e-06, + "loss": 0.6758, + "step": 47305 + }, + { + "epoch": 1.21, + "learning_rate": 1.3513348544363949e-06, + "loss": 0.9121, + "step": 47306 + }, + { + "epoch": 1.21, + "learning_rate": 1.3513089478430197e-06, + "loss": 0.8076, + "step": 47307 + }, + { + "epoch": 1.21, + "learning_rate": 1.3512830409806638e-06, + "loss": 0.7549, + "step": 47308 + }, + { + "epoch": 1.21, + "learning_rate": 1.3512571338493461e-06, + "loss": 0.6963, + "step": 47309 + }, + { + "epoch": 1.21, + "learning_rate": 1.3512312264490872e-06, + "loss": 0.7178, + "step": 47310 + }, + { + "epoch": 1.21, + "learning_rate": 1.3512053187799065e-06, + "loss": 0.708, + "step": 47311 + }, + { + "epoch": 1.21, + "learning_rate": 1.3511794108418243e-06, + "loss": 0.5747, + "step": 47312 + }, + { + "epoch": 1.21, + "learning_rate": 1.3511535026348603e-06, + "loss": 0.7798, + "step": 47313 + }, + { + "epoch": 1.21, + "learning_rate": 1.3511275941590338e-06, + "loss": 0.6265, + "step": 47314 + }, + { + "epoch": 1.21, + "learning_rate": 1.351101685414365e-06, + "loss": 0.6758, + "step": 47315 + }, + { + "epoch": 1.21, + "learning_rate": 1.3510757764008745e-06, + "loss": 0.8125, + "step": 47316 + }, + { + "epoch": 1.21, + "learning_rate": 1.3510498671185808e-06, + "loss": 0.5757, + "step": 47317 + }, + { + "epoch": 1.21, + "learning_rate": 1.3510239575675045e-06, + "loss": 0.6353, + "step": 47318 + }, + { + "epoch": 1.21, + "learning_rate": 1.3509980477476653e-06, + "loss": 0.8291, + "step": 47319 + }, + { + "epoch": 1.21, + "learning_rate": 1.3509721376590828e-06, + "loss": 0.6719, + "step": 47320 + }, + { + "epoch": 1.21, + "learning_rate": 1.3509462273017772e-06, + "loss": 0.7861, + "step": 47321 + }, + { + "epoch": 1.21, + "learning_rate": 1.3509203166757685e-06, + "loss": 0.7109, + "step": 47322 + }, + { + "epoch": 1.21, + "learning_rate": 1.3508944057810762e-06, + "loss": 0.6245, + "step": 47323 + }, + { + "epoch": 1.21, + "learning_rate": 1.35086849461772e-06, + "loss": 0.7705, + "step": 47324 + }, + { + "epoch": 1.21, + "learning_rate": 1.35084258318572e-06, + "loss": 0.6025, + "step": 47325 + }, + { + "epoch": 1.21, + "learning_rate": 1.3508166714850958e-06, + "loss": 0.6895, + "step": 47326 + }, + { + "epoch": 1.21, + "learning_rate": 1.350790759515868e-06, + "loss": 0.7148, + "step": 47327 + }, + { + "epoch": 1.21, + "learning_rate": 1.350764847278055e-06, + "loss": 0.4709, + "step": 47328 + }, + { + "epoch": 1.21, + "learning_rate": 1.350738934771678e-06, + "loss": 0.6016, + "step": 47329 + }, + { + "epoch": 1.21, + "learning_rate": 1.3507130219967561e-06, + "loss": 0.6846, + "step": 47330 + }, + { + "epoch": 1.21, + "learning_rate": 1.3506871089533096e-06, + "loss": 0.8291, + "step": 47331 + }, + { + "epoch": 1.21, + "learning_rate": 1.350661195641358e-06, + "loss": 0.8213, + "step": 47332 + }, + { + "epoch": 1.21, + "learning_rate": 1.3506352820609213e-06, + "loss": 0.5308, + "step": 47333 + }, + { + "epoch": 1.21, + "learning_rate": 1.350609368212019e-06, + "loss": 0.6787, + "step": 47334 + }, + { + "epoch": 1.21, + "learning_rate": 1.3505834540946718e-06, + "loss": 0.5518, + "step": 47335 + }, + { + "epoch": 1.21, + "learning_rate": 1.3505575397088982e-06, + "loss": 0.8291, + "step": 47336 + }, + { + "epoch": 1.21, + "learning_rate": 1.3505316250547195e-06, + "loss": 0.8252, + "step": 47337 + }, + { + "epoch": 1.21, + "learning_rate": 1.3505057101321545e-06, + "loss": 0.7979, + "step": 47338 + }, + { + "epoch": 1.21, + "learning_rate": 1.3504797949412234e-06, + "loss": 0.7139, + "step": 47339 + }, + { + "epoch": 1.21, + "learning_rate": 1.3504538794819462e-06, + "loss": 0.6094, + "step": 47340 + }, + { + "epoch": 1.21, + "learning_rate": 1.3504279637543425e-06, + "loss": 0.6362, + "step": 47341 + }, + { + "epoch": 1.21, + "learning_rate": 1.3504020477584322e-06, + "loss": 0.7725, + "step": 47342 + }, + { + "epoch": 1.21, + "learning_rate": 1.350376131494235e-06, + "loss": 0.6641, + "step": 47343 + }, + { + "epoch": 1.21, + "learning_rate": 1.3503502149617712e-06, + "loss": 0.605, + "step": 47344 + }, + { + "epoch": 1.21, + "learning_rate": 1.35032429816106e-06, + "loss": 0.7783, + "step": 47345 + }, + { + "epoch": 1.21, + "learning_rate": 1.350298381092122e-06, + "loss": 0.8047, + "step": 47346 + }, + { + "epoch": 1.21, + "learning_rate": 1.3502724637549765e-06, + "loss": 0.6421, + "step": 47347 + }, + { + "epoch": 1.21, + "learning_rate": 1.3502465461496435e-06, + "loss": 0.6572, + "step": 47348 + }, + { + "epoch": 1.21, + "learning_rate": 1.3502206282761426e-06, + "loss": 0.6982, + "step": 47349 + }, + { + "epoch": 1.21, + "learning_rate": 1.350194710134494e-06, + "loss": 0.6909, + "step": 47350 + }, + { + "epoch": 1.21, + "learning_rate": 1.3501687917247173e-06, + "loss": 0.4829, + "step": 47351 + }, + { + "epoch": 1.21, + "learning_rate": 1.3501428730468329e-06, + "loss": 0.6855, + "step": 47352 + }, + { + "epoch": 1.21, + "learning_rate": 1.35011695410086e-06, + "loss": 0.5479, + "step": 47353 + }, + { + "epoch": 1.21, + "learning_rate": 1.3500910348868184e-06, + "loss": 0.5417, + "step": 47354 + }, + { + "epoch": 1.21, + "learning_rate": 1.3500651154047282e-06, + "loss": 0.6025, + "step": 47355 + }, + { + "epoch": 1.21, + "learning_rate": 1.3500391956546095e-06, + "loss": 0.7939, + "step": 47356 + }, + { + "epoch": 1.21, + "learning_rate": 1.350013275636482e-06, + "loss": 0.6924, + "step": 47357 + }, + { + "epoch": 1.21, + "learning_rate": 1.3499873553503652e-06, + "loss": 0.6489, + "step": 47358 + }, + { + "epoch": 1.21, + "learning_rate": 1.3499614347962788e-06, + "loss": 0.7266, + "step": 47359 + }, + { + "epoch": 1.21, + "learning_rate": 1.3499355139742437e-06, + "loss": 0.7314, + "step": 47360 + }, + { + "epoch": 1.21, + "learning_rate": 1.3499095928842785e-06, + "loss": 0.6699, + "step": 47361 + }, + { + "epoch": 1.21, + "learning_rate": 1.349883671526404e-06, + "loss": 0.6802, + "step": 47362 + }, + { + "epoch": 1.21, + "learning_rate": 1.3498577499006397e-06, + "loss": 0.667, + "step": 47363 + }, + { + "epoch": 1.21, + "learning_rate": 1.349831828007005e-06, + "loss": 0.6292, + "step": 47364 + }, + { + "epoch": 1.21, + "learning_rate": 1.3498059058455205e-06, + "loss": 0.5076, + "step": 47365 + }, + { + "epoch": 1.21, + "learning_rate": 1.3497799834162054e-06, + "loss": 0.5469, + "step": 47366 + }, + { + "epoch": 1.21, + "learning_rate": 1.3497540607190803e-06, + "loss": 0.5933, + "step": 47367 + }, + { + "epoch": 1.21, + "learning_rate": 1.3497281377541643e-06, + "loss": 0.6216, + "step": 47368 + }, + { + "epoch": 1.21, + "learning_rate": 1.3497022145214777e-06, + "loss": 0.5342, + "step": 47369 + }, + { + "epoch": 1.21, + "learning_rate": 1.3496762910210397e-06, + "loss": 0.6436, + "step": 47370 + }, + { + "epoch": 1.21, + "learning_rate": 1.3496503672528711e-06, + "loss": 0.7422, + "step": 47371 + }, + { + "epoch": 1.21, + "learning_rate": 1.3496244432169914e-06, + "loss": 0.7178, + "step": 47372 + }, + { + "epoch": 1.21, + "learning_rate": 1.3495985189134203e-06, + "loss": 0.4924, + "step": 47373 + }, + { + "epoch": 1.21, + "learning_rate": 1.3495725943421775e-06, + "loss": 0.6548, + "step": 47374 + }, + { + "epoch": 1.21, + "learning_rate": 1.3495466695032828e-06, + "loss": 0.6497, + "step": 47375 + }, + { + "epoch": 1.21, + "learning_rate": 1.3495207443967566e-06, + "loss": 0.6973, + "step": 47376 + }, + { + "epoch": 1.21, + "learning_rate": 1.3494948190226184e-06, + "loss": 0.7842, + "step": 47377 + }, + { + "epoch": 1.21, + "learning_rate": 1.3494688933808881e-06, + "loss": 0.6509, + "step": 47378 + }, + { + "epoch": 1.21, + "learning_rate": 1.3494429674715857e-06, + "loss": 0.585, + "step": 47379 + }, + { + "epoch": 1.21, + "learning_rate": 1.3494170412947307e-06, + "loss": 0.6729, + "step": 47380 + }, + { + "epoch": 1.21, + "learning_rate": 1.3493911148503433e-06, + "loss": 0.77, + "step": 47381 + }, + { + "epoch": 1.21, + "learning_rate": 1.349365188138443e-06, + "loss": 0.6904, + "step": 47382 + }, + { + "epoch": 1.21, + "learning_rate": 1.3493392611590497e-06, + "loss": 0.751, + "step": 47383 + }, + { + "epoch": 1.21, + "learning_rate": 1.3493133339121837e-06, + "loss": 0.6572, + "step": 47384 + }, + { + "epoch": 1.21, + "learning_rate": 1.349287406397864e-06, + "loss": 0.6416, + "step": 47385 + }, + { + "epoch": 1.21, + "learning_rate": 1.3492614786161116e-06, + "loss": 0.7417, + "step": 47386 + }, + { + "epoch": 1.21, + "learning_rate": 1.3492355505669458e-06, + "loss": 0.6621, + "step": 47387 + }, + { + "epoch": 1.21, + "learning_rate": 1.3492096222503862e-06, + "loss": 0.6787, + "step": 47388 + }, + { + "epoch": 1.21, + "learning_rate": 1.3491836936664527e-06, + "loss": 0.7705, + "step": 47389 + }, + { + "epoch": 1.21, + "learning_rate": 1.3491577648151653e-06, + "loss": 0.4617, + "step": 47390 + }, + { + "epoch": 1.21, + "learning_rate": 1.3491318356965437e-06, + "loss": 0.5, + "step": 47391 + }, + { + "epoch": 1.21, + "learning_rate": 1.3491059063106086e-06, + "loss": 0.5928, + "step": 47392 + }, + { + "epoch": 1.21, + "learning_rate": 1.3490799766573786e-06, + "loss": 0.7061, + "step": 47393 + }, + { + "epoch": 1.21, + "learning_rate": 1.3490540467368743e-06, + "loss": 0.561, + "step": 47394 + }, + { + "epoch": 1.21, + "learning_rate": 1.3490281165491152e-06, + "loss": 0.4934, + "step": 47395 + }, + { + "epoch": 1.21, + "learning_rate": 1.3490021860941215e-06, + "loss": 0.7354, + "step": 47396 + }, + { + "epoch": 1.21, + "learning_rate": 1.3489762553719128e-06, + "loss": 0.8457, + "step": 47397 + }, + { + "epoch": 1.21, + "learning_rate": 1.3489503243825092e-06, + "loss": 0.6133, + "step": 47398 + }, + { + "epoch": 1.21, + "learning_rate": 1.34892439312593e-06, + "loss": 0.6494, + "step": 47399 + }, + { + "epoch": 1.21, + "learning_rate": 1.3488984616021957e-06, + "loss": 0.7666, + "step": 47400 + }, + { + "epoch": 1.21, + "learning_rate": 1.3488725298113257e-06, + "loss": 0.7129, + "step": 47401 + }, + { + "epoch": 1.21, + "learning_rate": 1.3488465977533404e-06, + "loss": 0.5168, + "step": 47402 + }, + { + "epoch": 1.21, + "learning_rate": 1.348820665428259e-06, + "loss": 0.8516, + "step": 47403 + }, + { + "epoch": 1.21, + "learning_rate": 1.3487947328361018e-06, + "loss": 0.7012, + "step": 47404 + }, + { + "epoch": 1.22, + "learning_rate": 1.3487687999768885e-06, + "loss": 0.5303, + "step": 47405 + }, + { + "epoch": 1.22, + "learning_rate": 1.348742866850639e-06, + "loss": 0.7852, + "step": 47406 + }, + { + "epoch": 1.22, + "learning_rate": 1.3487169334573728e-06, + "loss": 0.7607, + "step": 47407 + }, + { + "epoch": 1.22, + "learning_rate": 1.3486909997971103e-06, + "loss": 0.6943, + "step": 47408 + }, + { + "epoch": 1.22, + "learning_rate": 1.3486650658698712e-06, + "loss": 0.5093, + "step": 47409 + }, + { + "epoch": 1.22, + "learning_rate": 1.348639131675675e-06, + "loss": 0.7402, + "step": 47410 + }, + { + "epoch": 1.22, + "learning_rate": 1.3486131972145422e-06, + "loss": 0.7354, + "step": 47411 + }, + { + "epoch": 1.22, + "learning_rate": 1.3485872624864922e-06, + "loss": 0.54, + "step": 47412 + }, + { + "epoch": 1.22, + "learning_rate": 1.3485613274915452e-06, + "loss": 0.7012, + "step": 47413 + }, + { + "epoch": 1.22, + "learning_rate": 1.3485353922297204e-06, + "loss": 0.7158, + "step": 47414 + }, + { + "epoch": 1.22, + "learning_rate": 1.3485094567010384e-06, + "loss": 0.6182, + "step": 47415 + }, + { + "epoch": 1.22, + "learning_rate": 1.3484835209055185e-06, + "loss": 0.6958, + "step": 47416 + }, + { + "epoch": 1.22, + "learning_rate": 1.3484575848431812e-06, + "loss": 0.6206, + "step": 47417 + }, + { + "epoch": 1.22, + "learning_rate": 1.3484316485140451e-06, + "loss": 0.7178, + "step": 47418 + }, + { + "epoch": 1.22, + "learning_rate": 1.3484057119181318e-06, + "loss": 0.6689, + "step": 47419 + }, + { + "epoch": 1.22, + "learning_rate": 1.3483797750554598e-06, + "loss": 0.5825, + "step": 47420 + }, + { + "epoch": 1.22, + "learning_rate": 1.3483538379260497e-06, + "loss": 0.4431, + "step": 47421 + }, + { + "epoch": 1.22, + "learning_rate": 1.3483279005299208e-06, + "loss": 0.6543, + "step": 47422 + }, + { + "epoch": 1.22, + "learning_rate": 1.3483019628670932e-06, + "loss": 0.645, + "step": 47423 + }, + { + "epoch": 1.22, + "learning_rate": 1.348276024937587e-06, + "loss": 0.7305, + "step": 47424 + }, + { + "epoch": 1.22, + "learning_rate": 1.348250086741422e-06, + "loss": 0.7383, + "step": 47425 + }, + { + "epoch": 1.22, + "learning_rate": 1.3482241482786177e-06, + "loss": 0.5647, + "step": 47426 + }, + { + "epoch": 1.22, + "learning_rate": 1.3481982095491942e-06, + "loss": 0.5081, + "step": 47427 + }, + { + "epoch": 1.22, + "learning_rate": 1.3481722705531712e-06, + "loss": 0.7222, + "step": 47428 + }, + { + "epoch": 1.22, + "learning_rate": 1.348146331290569e-06, + "loss": 0.5591, + "step": 47429 + }, + { + "epoch": 1.22, + "learning_rate": 1.348120391761407e-06, + "loss": 0.7471, + "step": 47430 + }, + { + "epoch": 1.22, + "learning_rate": 1.3480944519657054e-06, + "loss": 0.6846, + "step": 47431 + }, + { + "epoch": 1.22, + "learning_rate": 1.3480685119034835e-06, + "loss": 0.6313, + "step": 47432 + }, + { + "epoch": 1.22, + "learning_rate": 1.3480425715747618e-06, + "loss": 0.6963, + "step": 47433 + }, + { + "epoch": 1.22, + "learning_rate": 1.34801663097956e-06, + "loss": 0.6992, + "step": 47434 + }, + { + "epoch": 1.22, + "learning_rate": 1.3479906901178976e-06, + "loss": 0.3842, + "step": 47435 + }, + { + "epoch": 1.22, + "learning_rate": 1.3479647489897951e-06, + "loss": 0.6831, + "step": 47436 + }, + { + "epoch": 1.22, + "learning_rate": 1.3479388075952716e-06, + "loss": 0.7061, + "step": 47437 + }, + { + "epoch": 1.22, + "learning_rate": 1.3479128659343477e-06, + "loss": 0.7363, + "step": 47438 + }, + { + "epoch": 1.22, + "learning_rate": 1.3478869240070425e-06, + "loss": 0.6582, + "step": 47439 + }, + { + "epoch": 1.22, + "learning_rate": 1.3478609818133766e-06, + "loss": 0.79, + "step": 47440 + }, + { + "epoch": 1.22, + "learning_rate": 1.3478350393533694e-06, + "loss": 0.7803, + "step": 47441 + }, + { + "epoch": 1.22, + "learning_rate": 1.3478090966270411e-06, + "loss": 0.4846, + "step": 47442 + }, + { + "epoch": 1.22, + "learning_rate": 1.3477831536344112e-06, + "loss": 0.6958, + "step": 47443 + }, + { + "epoch": 1.22, + "learning_rate": 1.3477572103754997e-06, + "loss": 0.7529, + "step": 47444 + }, + { + "epoch": 1.22, + "learning_rate": 1.3477312668503266e-06, + "loss": 0.7246, + "step": 47445 + }, + { + "epoch": 1.22, + "learning_rate": 1.3477053230589117e-06, + "loss": 0.7002, + "step": 47446 + }, + { + "epoch": 1.22, + "learning_rate": 1.3476793790012749e-06, + "loss": 0.5586, + "step": 47447 + }, + { + "epoch": 1.22, + "learning_rate": 1.3476534346774357e-06, + "loss": 0.6602, + "step": 47448 + }, + { + "epoch": 1.22, + "learning_rate": 1.3476274900874142e-06, + "loss": 0.6519, + "step": 47449 + }, + { + "epoch": 1.22, + "learning_rate": 1.3476015452312307e-06, + "loss": 0.7324, + "step": 47450 + }, + { + "epoch": 1.22, + "learning_rate": 1.3475756001089045e-06, + "loss": 0.5347, + "step": 47451 + }, + { + "epoch": 1.22, + "learning_rate": 1.3475496547204554e-06, + "loss": 0.709, + "step": 47452 + }, + { + "epoch": 1.22, + "learning_rate": 1.347523709065904e-06, + "loss": 0.479, + "step": 47453 + }, + { + "epoch": 1.22, + "learning_rate": 1.3474977631452692e-06, + "loss": 0.6533, + "step": 47454 + }, + { + "epoch": 1.22, + "learning_rate": 1.3474718169585716e-06, + "loss": 0.5874, + "step": 47455 + }, + { + "epoch": 1.22, + "learning_rate": 1.3474458705058307e-06, + "loss": 0.5566, + "step": 47456 + }, + { + "epoch": 1.22, + "learning_rate": 1.3474199237870668e-06, + "loss": 0.5864, + "step": 47457 + }, + { + "epoch": 1.22, + "learning_rate": 1.3473939768022988e-06, + "loss": 0.5188, + "step": 47458 + }, + { + "epoch": 1.22, + "learning_rate": 1.3473680295515478e-06, + "loss": 0.6523, + "step": 47459 + }, + { + "epoch": 1.22, + "learning_rate": 1.3473420820348327e-06, + "loss": 0.6963, + "step": 47460 + }, + { + "epoch": 1.22, + "learning_rate": 1.347316134252174e-06, + "loss": 0.8037, + "step": 47461 + }, + { + "epoch": 1.22, + "learning_rate": 1.3472901862035913e-06, + "loss": 0.6313, + "step": 47462 + }, + { + "epoch": 1.22, + "learning_rate": 1.3472642378891044e-06, + "loss": 0.502, + "step": 47463 + }, + { + "epoch": 1.22, + "learning_rate": 1.3472382893087328e-06, + "loss": 0.8955, + "step": 47464 + }, + { + "epoch": 1.22, + "learning_rate": 1.3472123404624972e-06, + "loss": 0.7524, + "step": 47465 + }, + { + "epoch": 1.22, + "learning_rate": 1.3471863913504174e-06, + "loss": 0.667, + "step": 47466 + }, + { + "epoch": 1.22, + "learning_rate": 1.3471604419725126e-06, + "loss": 0.793, + "step": 47467 + }, + { + "epoch": 1.22, + "learning_rate": 1.3471344923288031e-06, + "loss": 0.5996, + "step": 47468 + }, + { + "epoch": 1.22, + "learning_rate": 1.3471085424193085e-06, + "loss": 0.5537, + "step": 47469 + }, + { + "epoch": 1.22, + "learning_rate": 1.3470825922440488e-06, + "loss": 0.7134, + "step": 47470 + }, + { + "epoch": 1.22, + "learning_rate": 1.3470566418030443e-06, + "loss": 0.6914, + "step": 47471 + }, + { + "epoch": 1.22, + "learning_rate": 1.3470306910963142e-06, + "loss": 0.5293, + "step": 47472 + }, + { + "epoch": 1.22, + "learning_rate": 1.3470047401238786e-06, + "loss": 0.6631, + "step": 47473 + }, + { + "epoch": 1.22, + "learning_rate": 1.3469787888857575e-06, + "loss": 0.5215, + "step": 47474 + }, + { + "epoch": 1.22, + "learning_rate": 1.3469528373819707e-06, + "loss": 0.6709, + "step": 47475 + }, + { + "epoch": 1.22, + "learning_rate": 1.3469268856125384e-06, + "loss": 0.5007, + "step": 47476 + }, + { + "epoch": 1.22, + "learning_rate": 1.3469009335774798e-06, + "loss": 0.6182, + "step": 47477 + }, + { + "epoch": 1.22, + "learning_rate": 1.3468749812768152e-06, + "loss": 0.7656, + "step": 47478 + }, + { + "epoch": 1.22, + "learning_rate": 1.3468490287105642e-06, + "loss": 0.6235, + "step": 47479 + }, + { + "epoch": 1.22, + "learning_rate": 1.346823075878747e-06, + "loss": 0.5405, + "step": 47480 + }, + { + "epoch": 1.22, + "learning_rate": 1.3467971227813836e-06, + "loss": 0.4829, + "step": 47481 + }, + { + "epoch": 1.22, + "learning_rate": 1.3467711694184932e-06, + "loss": 0.5459, + "step": 47482 + }, + { + "epoch": 1.22, + "learning_rate": 1.346745215790096e-06, + "loss": 0.6582, + "step": 47483 + }, + { + "epoch": 1.22, + "learning_rate": 1.3467192618962122e-06, + "loss": 0.7383, + "step": 47484 + }, + { + "epoch": 1.22, + "learning_rate": 1.3466933077368612e-06, + "loss": 0.5869, + "step": 47485 + }, + { + "epoch": 1.22, + "learning_rate": 1.3466673533120635e-06, + "loss": 0.5957, + "step": 47486 + }, + { + "epoch": 1.22, + "learning_rate": 1.3466413986218382e-06, + "loss": 0.5154, + "step": 47487 + }, + { + "epoch": 1.22, + "learning_rate": 1.3466154436662053e-06, + "loss": 0.8252, + "step": 47488 + }, + { + "epoch": 1.22, + "learning_rate": 1.346589488445185e-06, + "loss": 0.5625, + "step": 47489 + }, + { + "epoch": 1.22, + "learning_rate": 1.3465635329587973e-06, + "loss": 0.5713, + "step": 47490 + }, + { + "epoch": 1.22, + "learning_rate": 1.3465375772070616e-06, + "loss": 0.6357, + "step": 47491 + }, + { + "epoch": 1.22, + "learning_rate": 1.3465116211899982e-06, + "loss": 0.6089, + "step": 47492 + }, + { + "epoch": 1.22, + "learning_rate": 1.3464856649076267e-06, + "loss": 0.627, + "step": 47493 + }, + { + "epoch": 1.22, + "learning_rate": 1.3464597083599673e-06, + "loss": 0.5679, + "step": 47494 + }, + { + "epoch": 1.22, + "learning_rate": 1.3464337515470392e-06, + "loss": 0.584, + "step": 47495 + }, + { + "epoch": 1.22, + "learning_rate": 1.346407794468863e-06, + "loss": 0.646, + "step": 47496 + }, + { + "epoch": 1.22, + "learning_rate": 1.3463818371254583e-06, + "loss": 0.5332, + "step": 47497 + }, + { + "epoch": 1.22, + "learning_rate": 1.3463558795168448e-06, + "loss": 0.5571, + "step": 47498 + }, + { + "epoch": 1.22, + "learning_rate": 1.3463299216430426e-06, + "loss": 0.5625, + "step": 47499 + }, + { + "epoch": 1.22, + "learning_rate": 1.3463039635040714e-06, + "loss": 0.6455, + "step": 47500 + }, + { + "epoch": 1.22, + "learning_rate": 1.3462780050999514e-06, + "loss": 0.9385, + "step": 47501 + }, + { + "epoch": 1.22, + "learning_rate": 1.346252046430702e-06, + "loss": 0.5225, + "step": 47502 + }, + { + "epoch": 1.22, + "learning_rate": 1.3462260874963435e-06, + "loss": 0.686, + "step": 47503 + }, + { + "epoch": 1.22, + "learning_rate": 1.3462001282968956e-06, + "loss": 0.562, + "step": 47504 + }, + { + "epoch": 1.22, + "learning_rate": 1.3461741688323782e-06, + "loss": 0.6069, + "step": 47505 + }, + { + "epoch": 1.22, + "learning_rate": 1.3461482091028111e-06, + "loss": 0.4933, + "step": 47506 + }, + { + "epoch": 1.22, + "learning_rate": 1.3461222491082142e-06, + "loss": 0.6074, + "step": 47507 + }, + { + "epoch": 1.22, + "learning_rate": 1.3460962888486074e-06, + "loss": 0.8037, + "step": 47508 + }, + { + "epoch": 1.22, + "learning_rate": 1.3460703283240107e-06, + "loss": 0.583, + "step": 47509 + }, + { + "epoch": 1.22, + "learning_rate": 1.3460443675344437e-06, + "loss": 0.583, + "step": 47510 + }, + { + "epoch": 1.22, + "learning_rate": 1.3460184064799267e-06, + "loss": 0.8223, + "step": 47511 + }, + { + "epoch": 1.22, + "learning_rate": 1.345992445160479e-06, + "loss": 0.7114, + "step": 47512 + }, + { + "epoch": 1.22, + "learning_rate": 1.345966483576121e-06, + "loss": 0.5825, + "step": 47513 + }, + { + "epoch": 1.22, + "learning_rate": 1.3459405217268722e-06, + "loss": 0.6875, + "step": 47514 + }, + { + "epoch": 1.22, + "learning_rate": 1.3459145596127528e-06, + "loss": 0.7275, + "step": 47515 + }, + { + "epoch": 1.22, + "learning_rate": 1.3458885972337825e-06, + "loss": 0.7109, + "step": 47516 + }, + { + "epoch": 1.22, + "learning_rate": 1.345862634589981e-06, + "loss": 0.6162, + "step": 47517 + }, + { + "epoch": 1.22, + "learning_rate": 1.3458366716813688e-06, + "loss": 0.5308, + "step": 47518 + }, + { + "epoch": 1.22, + "learning_rate": 1.3458107085079648e-06, + "loss": 0.5967, + "step": 47519 + }, + { + "epoch": 1.22, + "learning_rate": 1.34578474506979e-06, + "loss": 0.8008, + "step": 47520 + }, + { + "epoch": 1.22, + "learning_rate": 1.3457587813668637e-06, + "loss": 0.7539, + "step": 47521 + }, + { + "epoch": 1.22, + "learning_rate": 1.3457328173992056e-06, + "loss": 0.6118, + "step": 47522 + }, + { + "epoch": 1.22, + "learning_rate": 1.3457068531668357e-06, + "loss": 0.7168, + "step": 47523 + }, + { + "epoch": 1.22, + "learning_rate": 1.345680888669774e-06, + "loss": 0.5405, + "step": 47524 + }, + { + "epoch": 1.22, + "learning_rate": 1.3456549239080402e-06, + "loss": 0.6267, + "step": 47525 + }, + { + "epoch": 1.22, + "learning_rate": 1.3456289588816547e-06, + "loss": 0.6157, + "step": 47526 + }, + { + "epoch": 1.22, + "learning_rate": 1.3456029935906365e-06, + "loss": 0.4988, + "step": 47527 + }, + { + "epoch": 1.22, + "learning_rate": 1.3455770280350066e-06, + "loss": 0.668, + "step": 47528 + }, + { + "epoch": 1.22, + "learning_rate": 1.3455510622147836e-06, + "loss": 0.5237, + "step": 47529 + }, + { + "epoch": 1.22, + "learning_rate": 1.3455250961299885e-06, + "loss": 0.312, + "step": 47530 + }, + { + "epoch": 1.22, + "learning_rate": 1.3454991297806406e-06, + "loss": 0.6851, + "step": 47531 + }, + { + "epoch": 1.22, + "learning_rate": 1.34547316316676e-06, + "loss": 0.7217, + "step": 47532 + }, + { + "epoch": 1.22, + "learning_rate": 1.3454471962883662e-06, + "loss": 0.6978, + "step": 47533 + }, + { + "epoch": 1.22, + "learning_rate": 1.3454212291454797e-06, + "loss": 0.7363, + "step": 47534 + }, + { + "epoch": 1.22, + "learning_rate": 1.3453952617381197e-06, + "loss": 0.7441, + "step": 47535 + }, + { + "epoch": 1.22, + "learning_rate": 1.3453692940663067e-06, + "loss": 0.5156, + "step": 47536 + }, + { + "epoch": 1.22, + "learning_rate": 1.3453433261300603e-06, + "loss": 0.5654, + "step": 47537 + }, + { + "epoch": 1.22, + "learning_rate": 1.3453173579294004e-06, + "loss": 0.5342, + "step": 47538 + }, + { + "epoch": 1.22, + "learning_rate": 1.3452913894643465e-06, + "loss": 0.5679, + "step": 47539 + }, + { + "epoch": 1.22, + "learning_rate": 1.3452654207349192e-06, + "loss": 0.7109, + "step": 47540 + }, + { + "epoch": 1.22, + "learning_rate": 1.3452394517411383e-06, + "loss": 0.5972, + "step": 47541 + }, + { + "epoch": 1.22, + "learning_rate": 1.3452134824830231e-06, + "loss": 0.7207, + "step": 47542 + }, + { + "epoch": 1.22, + "learning_rate": 1.3451875129605937e-06, + "loss": 0.7559, + "step": 47543 + }, + { + "epoch": 1.22, + "learning_rate": 1.34516154317387e-06, + "loss": 0.707, + "step": 47544 + }, + { + "epoch": 1.22, + "learning_rate": 1.3451355731228723e-06, + "loss": 0.4878, + "step": 47545 + }, + { + "epoch": 1.22, + "learning_rate": 1.3451096028076202e-06, + "loss": 0.6099, + "step": 47546 + }, + { + "epoch": 1.22, + "learning_rate": 1.3450836322281337e-06, + "loss": 0.5679, + "step": 47547 + }, + { + "epoch": 1.22, + "learning_rate": 1.345057661384432e-06, + "loss": 0.436, + "step": 47548 + }, + { + "epoch": 1.22, + "learning_rate": 1.3450316902765357e-06, + "loss": 0.7344, + "step": 47549 + }, + { + "epoch": 1.22, + "learning_rate": 1.3450057189044644e-06, + "loss": 0.7188, + "step": 47550 + }, + { + "epoch": 1.22, + "learning_rate": 1.3449797472682388e-06, + "loss": 0.666, + "step": 47551 + }, + { + "epoch": 1.22, + "learning_rate": 1.3449537753678772e-06, + "loss": 0.6406, + "step": 47552 + }, + { + "epoch": 1.22, + "learning_rate": 1.3449278032034008e-06, + "loss": 0.6956, + "step": 47553 + }, + { + "epoch": 1.22, + "learning_rate": 1.3449018307748288e-06, + "loss": 0.7803, + "step": 47554 + }, + { + "epoch": 1.22, + "learning_rate": 1.3448758580821814e-06, + "loss": 0.6191, + "step": 47555 + }, + { + "epoch": 1.22, + "learning_rate": 1.3448498851254786e-06, + "loss": 0.7021, + "step": 47556 + }, + { + "epoch": 1.22, + "learning_rate": 1.34482391190474e-06, + "loss": 0.6118, + "step": 47557 + }, + { + "epoch": 1.22, + "learning_rate": 1.3447979384199854e-06, + "loss": 0.6572, + "step": 47558 + }, + { + "epoch": 1.22, + "learning_rate": 1.344771964671235e-06, + "loss": 0.5342, + "step": 47559 + }, + { + "epoch": 1.22, + "learning_rate": 1.3447459906585086e-06, + "loss": 0.6274, + "step": 47560 + }, + { + "epoch": 1.22, + "learning_rate": 1.344720016381826e-06, + "loss": 0.6694, + "step": 47561 + }, + { + "epoch": 1.22, + "learning_rate": 1.3446940418412072e-06, + "loss": 0.6133, + "step": 47562 + }, + { + "epoch": 1.22, + "learning_rate": 1.3446680670366718e-06, + "loss": 0.6807, + "step": 47563 + }, + { + "epoch": 1.22, + "learning_rate": 1.34464209196824e-06, + "loss": 0.6001, + "step": 47564 + }, + { + "epoch": 1.22, + "learning_rate": 1.3446161166359318e-06, + "loss": 0.5615, + "step": 47565 + }, + { + "epoch": 1.22, + "learning_rate": 1.344590141039767e-06, + "loss": 0.6494, + "step": 47566 + }, + { + "epoch": 1.22, + "learning_rate": 1.344564165179765e-06, + "loss": 0.6357, + "step": 47567 + }, + { + "epoch": 1.22, + "learning_rate": 1.3445381890559463e-06, + "loss": 0.6963, + "step": 47568 + }, + { + "epoch": 1.22, + "learning_rate": 1.3445122126683304e-06, + "loss": 0.5884, + "step": 47569 + }, + { + "epoch": 1.22, + "learning_rate": 1.3444862360169373e-06, + "loss": 0.6133, + "step": 47570 + }, + { + "epoch": 1.22, + "learning_rate": 1.344460259101787e-06, + "loss": 0.627, + "step": 47571 + }, + { + "epoch": 1.22, + "learning_rate": 1.3444342819228995e-06, + "loss": 0.6982, + "step": 47572 + }, + { + "epoch": 1.22, + "learning_rate": 1.3444083044802942e-06, + "loss": 0.7334, + "step": 47573 + }, + { + "epoch": 1.22, + "learning_rate": 1.3443823267739916e-06, + "loss": 0.7324, + "step": 47574 + }, + { + "epoch": 1.22, + "learning_rate": 1.344356348804011e-06, + "loss": 0.6968, + "step": 47575 + }, + { + "epoch": 1.22, + "learning_rate": 1.3443303705703728e-06, + "loss": 0.6184, + "step": 47576 + }, + { + "epoch": 1.22, + "learning_rate": 1.3443043920730964e-06, + "loss": 0.5089, + "step": 47577 + }, + { + "epoch": 1.22, + "learning_rate": 1.3442784133122023e-06, + "loss": 0.5269, + "step": 47578 + }, + { + "epoch": 1.22, + "learning_rate": 1.3442524342877098e-06, + "loss": 0.7402, + "step": 47579 + }, + { + "epoch": 1.22, + "learning_rate": 1.344226454999639e-06, + "loss": 0.6934, + "step": 47580 + }, + { + "epoch": 1.22, + "learning_rate": 1.3442004754480102e-06, + "loss": 0.5771, + "step": 47581 + }, + { + "epoch": 1.22, + "learning_rate": 1.3441744956328426e-06, + "loss": 0.6812, + "step": 47582 + }, + { + "epoch": 1.22, + "learning_rate": 1.3441485155541566e-06, + "loss": 0.5767, + "step": 47583 + }, + { + "epoch": 1.22, + "learning_rate": 1.3441225352119718e-06, + "loss": 0.6836, + "step": 47584 + }, + { + "epoch": 1.22, + "learning_rate": 1.344096554606308e-06, + "loss": 0.5659, + "step": 47585 + }, + { + "epoch": 1.22, + "learning_rate": 1.3440705737371855e-06, + "loss": 0.6375, + "step": 47586 + }, + { + "epoch": 1.22, + "learning_rate": 1.3440445926046241e-06, + "loss": 0.5491, + "step": 47587 + }, + { + "epoch": 1.22, + "learning_rate": 1.3440186112086433e-06, + "loss": 0.7349, + "step": 47588 + }, + { + "epoch": 1.22, + "learning_rate": 1.3439926295492636e-06, + "loss": 0.5776, + "step": 47589 + }, + { + "epoch": 1.22, + "learning_rate": 1.343966647626504e-06, + "loss": 0.6504, + "step": 47590 + }, + { + "epoch": 1.22, + "learning_rate": 1.3439406654403857e-06, + "loss": 0.6406, + "step": 47591 + }, + { + "epoch": 1.22, + "learning_rate": 1.3439146829909276e-06, + "loss": 0.7329, + "step": 47592 + }, + { + "epoch": 1.22, + "learning_rate": 1.3438887002781496e-06, + "loss": 0.7695, + "step": 47593 + }, + { + "epoch": 1.22, + "learning_rate": 1.3438627173020718e-06, + "loss": 0.6089, + "step": 47594 + }, + { + "epoch": 1.22, + "learning_rate": 1.3438367340627143e-06, + "loss": 0.728, + "step": 47595 + }, + { + "epoch": 1.22, + "learning_rate": 1.3438107505600971e-06, + "loss": 0.7656, + "step": 47596 + }, + { + "epoch": 1.22, + "learning_rate": 1.3437847667942395e-06, + "loss": 0.7144, + "step": 47597 + }, + { + "epoch": 1.22, + "learning_rate": 1.3437587827651614e-06, + "loss": 0.6992, + "step": 47598 + }, + { + "epoch": 1.22, + "learning_rate": 1.3437327984728834e-06, + "loss": 0.5791, + "step": 47599 + }, + { + "epoch": 1.22, + "learning_rate": 1.343706813917425e-06, + "loss": 0.6855, + "step": 47600 + }, + { + "epoch": 1.22, + "learning_rate": 1.3436808290988061e-06, + "loss": 0.5059, + "step": 47601 + }, + { + "epoch": 1.22, + "learning_rate": 1.3436548440170466e-06, + "loss": 0.6821, + "step": 47602 + }, + { + "epoch": 1.22, + "learning_rate": 1.3436288586721664e-06, + "loss": 0.7002, + "step": 47603 + }, + { + "epoch": 1.22, + "learning_rate": 1.343602873064185e-06, + "loss": 0.7021, + "step": 47604 + }, + { + "epoch": 1.22, + "learning_rate": 1.3435768871931231e-06, + "loss": 0.5928, + "step": 47605 + }, + { + "epoch": 1.22, + "learning_rate": 1.3435509010590003e-06, + "loss": 0.7227, + "step": 47606 + }, + { + "epoch": 1.22, + "learning_rate": 1.3435249146618359e-06, + "loss": 0.666, + "step": 47607 + }, + { + "epoch": 1.22, + "learning_rate": 1.3434989280016505e-06, + "loss": 0.5293, + "step": 47608 + }, + { + "epoch": 1.22, + "learning_rate": 1.3434729410784638e-06, + "loss": 0.5815, + "step": 47609 + }, + { + "epoch": 1.22, + "learning_rate": 1.3434469538922955e-06, + "loss": 0.6631, + "step": 47610 + }, + { + "epoch": 1.22, + "learning_rate": 1.343420966443166e-06, + "loss": 0.6748, + "step": 47611 + }, + { + "epoch": 1.22, + "learning_rate": 1.3433949787310946e-06, + "loss": 0.7412, + "step": 47612 + }, + { + "epoch": 1.22, + "learning_rate": 1.3433689907561015e-06, + "loss": 0.5986, + "step": 47613 + }, + { + "epoch": 1.22, + "learning_rate": 1.3433430025182063e-06, + "loss": 0.6611, + "step": 47614 + }, + { + "epoch": 1.22, + "learning_rate": 1.3433170140174294e-06, + "loss": 0.7656, + "step": 47615 + }, + { + "epoch": 1.22, + "learning_rate": 1.3432910252537908e-06, + "loss": 0.6069, + "step": 47616 + }, + { + "epoch": 1.22, + "learning_rate": 1.3432650362273095e-06, + "loss": 0.6758, + "step": 47617 + }, + { + "epoch": 1.22, + "learning_rate": 1.343239046938006e-06, + "loss": 0.6387, + "step": 47618 + }, + { + "epoch": 1.22, + "learning_rate": 1.3432130573859003e-06, + "loss": 0.7314, + "step": 47619 + }, + { + "epoch": 1.22, + "learning_rate": 1.3431870675710121e-06, + "loss": 0.5708, + "step": 47620 + }, + { + "epoch": 1.22, + "learning_rate": 1.3431610774933618e-06, + "loss": 0.8008, + "step": 47621 + }, + { + "epoch": 1.22, + "learning_rate": 1.3431350871529682e-06, + "loss": 0.7729, + "step": 47622 + }, + { + "epoch": 1.22, + "learning_rate": 1.343109096549852e-06, + "loss": 0.625, + "step": 47623 + }, + { + "epoch": 1.22, + "learning_rate": 1.343083105684033e-06, + "loss": 0.5093, + "step": 47624 + }, + { + "epoch": 1.22, + "learning_rate": 1.343057114555531e-06, + "loss": 0.9043, + "step": 47625 + }, + { + "epoch": 1.22, + "learning_rate": 1.3430311231643661e-06, + "loss": 0.7188, + "step": 47626 + }, + { + "epoch": 1.22, + "learning_rate": 1.343005131510558e-06, + "loss": 0.6406, + "step": 47627 + }, + { + "epoch": 1.22, + "learning_rate": 1.3429791395941266e-06, + "loss": 0.5864, + "step": 47628 + }, + { + "epoch": 1.22, + "learning_rate": 1.3429531474150918e-06, + "loss": 0.5857, + "step": 47629 + }, + { + "epoch": 1.22, + "learning_rate": 1.3429271549734733e-06, + "loss": 0.7012, + "step": 47630 + }, + { + "epoch": 1.22, + "learning_rate": 1.3429011622692915e-06, + "loss": 0.5464, + "step": 47631 + }, + { + "epoch": 1.22, + "learning_rate": 1.342875169302566e-06, + "loss": 0.5054, + "step": 47632 + }, + { + "epoch": 1.22, + "learning_rate": 1.342849176073317e-06, + "loss": 0.6738, + "step": 47633 + }, + { + "epoch": 1.22, + "learning_rate": 1.3428231825815636e-06, + "loss": 0.6279, + "step": 47634 + }, + { + "epoch": 1.22, + "learning_rate": 1.3427971888273268e-06, + "loss": 0.6416, + "step": 47635 + }, + { + "epoch": 1.22, + "learning_rate": 1.3427711948106258e-06, + "loss": 0.7554, + "step": 47636 + }, + { + "epoch": 1.22, + "learning_rate": 1.3427452005314805e-06, + "loss": 0.834, + "step": 47637 + }, + { + "epoch": 1.22, + "learning_rate": 1.342719205989911e-06, + "loss": 0.7627, + "step": 47638 + }, + { + "epoch": 1.22, + "learning_rate": 1.3426932111859372e-06, + "loss": 0.5801, + "step": 47639 + }, + { + "epoch": 1.22, + "learning_rate": 1.3426672161195792e-06, + "loss": 0.6758, + "step": 47640 + }, + { + "epoch": 1.22, + "learning_rate": 1.3426412207908565e-06, + "loss": 0.6602, + "step": 47641 + }, + { + "epoch": 1.22, + "learning_rate": 1.3426152251997892e-06, + "loss": 0.5342, + "step": 47642 + }, + { + "epoch": 1.22, + "learning_rate": 1.342589229346397e-06, + "loss": 0.5525, + "step": 47643 + }, + { + "epoch": 1.22, + "learning_rate": 1.3425632332307e-06, + "loss": 0.5334, + "step": 47644 + }, + { + "epoch": 1.22, + "learning_rate": 1.3425372368527183e-06, + "loss": 0.6313, + "step": 47645 + }, + { + "epoch": 1.22, + "learning_rate": 1.3425112402124714e-06, + "loss": 0.5317, + "step": 47646 + }, + { + "epoch": 1.22, + "learning_rate": 1.3424852433099795e-06, + "loss": 0.7529, + "step": 47647 + }, + { + "epoch": 1.22, + "learning_rate": 1.3424592461452622e-06, + "loss": 0.8477, + "step": 47648 + }, + { + "epoch": 1.22, + "learning_rate": 1.3424332487183398e-06, + "loss": 0.644, + "step": 47649 + }, + { + "epoch": 1.22, + "learning_rate": 1.342407251029232e-06, + "loss": 0.5557, + "step": 47650 + }, + { + "epoch": 1.22, + "learning_rate": 1.3423812530779585e-06, + "loss": 0.6484, + "step": 47651 + }, + { + "epoch": 1.22, + "learning_rate": 1.3423552548645398e-06, + "loss": 0.7148, + "step": 47652 + }, + { + "epoch": 1.22, + "learning_rate": 1.342329256388995e-06, + "loss": 0.5259, + "step": 47653 + }, + { + "epoch": 1.22, + "learning_rate": 1.342303257651345e-06, + "loss": 0.5342, + "step": 47654 + }, + { + "epoch": 1.22, + "learning_rate": 1.3422772586516084e-06, + "loss": 0.5923, + "step": 47655 + }, + { + "epoch": 1.22, + "learning_rate": 1.3422512593898066e-06, + "loss": 0.7227, + "step": 47656 + }, + { + "epoch": 1.22, + "learning_rate": 1.3422252598659583e-06, + "loss": 0.6006, + "step": 47657 + }, + { + "epoch": 1.22, + "learning_rate": 1.342199260080084e-06, + "loss": 0.4448, + "step": 47658 + }, + { + "epoch": 1.22, + "learning_rate": 1.3421732600322032e-06, + "loss": 0.7148, + "step": 47659 + }, + { + "epoch": 1.22, + "learning_rate": 1.3421472597223362e-06, + "loss": 0.5291, + "step": 47660 + }, + { + "epoch": 1.22, + "learning_rate": 1.342121259150503e-06, + "loss": 0.6943, + "step": 47661 + }, + { + "epoch": 1.22, + "learning_rate": 1.3420952583167232e-06, + "loss": 0.71, + "step": 47662 + }, + { + "epoch": 1.22, + "learning_rate": 1.3420692572210163e-06, + "loss": 0.8076, + "step": 47663 + }, + { + "epoch": 1.22, + "learning_rate": 1.3420432558634035e-06, + "loss": 0.4449, + "step": 47664 + }, + { + "epoch": 1.22, + "learning_rate": 1.3420172542439033e-06, + "loss": 0.6392, + "step": 47665 + }, + { + "epoch": 1.22, + "learning_rate": 1.3419912523625365e-06, + "loss": 0.5742, + "step": 47666 + }, + { + "epoch": 1.22, + "learning_rate": 1.3419652502193226e-06, + "loss": 0.7617, + "step": 47667 + }, + { + "epoch": 1.22, + "learning_rate": 1.3419392478142818e-06, + "loss": 0.6548, + "step": 47668 + }, + { + "epoch": 1.22, + "learning_rate": 1.3419132451474336e-06, + "loss": 0.7246, + "step": 47669 + }, + { + "epoch": 1.22, + "learning_rate": 1.341887242218798e-06, + "loss": 0.6997, + "step": 47670 + }, + { + "epoch": 1.22, + "learning_rate": 1.3418612390283956e-06, + "loss": 0.8535, + "step": 47671 + }, + { + "epoch": 1.22, + "learning_rate": 1.3418352355762454e-06, + "loss": 0.4897, + "step": 47672 + }, + { + "epoch": 1.22, + "learning_rate": 1.341809231862368e-06, + "loss": 0.6572, + "step": 47673 + }, + { + "epoch": 1.22, + "learning_rate": 1.3417832278867828e-06, + "loss": 0.5825, + "step": 47674 + }, + { + "epoch": 1.22, + "learning_rate": 1.3417572236495097e-06, + "loss": 0.8179, + "step": 47675 + }, + { + "epoch": 1.22, + "learning_rate": 1.341731219150569e-06, + "loss": 0.6787, + "step": 47676 + }, + { + "epoch": 1.22, + "learning_rate": 1.3417052143899804e-06, + "loss": 0.7236, + "step": 47677 + }, + { + "epoch": 1.22, + "learning_rate": 1.3416792093677636e-06, + "loss": 0.5474, + "step": 47678 + }, + { + "epoch": 1.22, + "learning_rate": 1.341653204083939e-06, + "loss": 0.7578, + "step": 47679 + }, + { + "epoch": 1.22, + "learning_rate": 1.3416271985385262e-06, + "loss": 0.5967, + "step": 47680 + }, + { + "epoch": 1.22, + "learning_rate": 1.3416011927315454e-06, + "loss": 0.728, + "step": 47681 + }, + { + "epoch": 1.22, + "learning_rate": 1.3415751866630159e-06, + "loss": 0.7568, + "step": 47682 + }, + { + "epoch": 1.22, + "learning_rate": 1.3415491803329582e-06, + "loss": 0.6021, + "step": 47683 + }, + { + "epoch": 1.22, + "learning_rate": 1.3415231737413917e-06, + "loss": 0.668, + "step": 47684 + }, + { + "epoch": 1.22, + "learning_rate": 1.341497166888337e-06, + "loss": 0.6111, + "step": 47685 + }, + { + "epoch": 1.22, + "learning_rate": 1.3414711597738136e-06, + "loss": 0.7959, + "step": 47686 + }, + { + "epoch": 1.22, + "learning_rate": 1.341445152397841e-06, + "loss": 0.7217, + "step": 47687 + }, + { + "epoch": 1.22, + "learning_rate": 1.3414191447604399e-06, + "loss": 0.752, + "step": 47688 + }, + { + "epoch": 1.22, + "learning_rate": 1.3413931368616297e-06, + "loss": 0.8281, + "step": 47689 + }, + { + "epoch": 1.22, + "learning_rate": 1.3413671287014305e-06, + "loss": 0.5454, + "step": 47690 + }, + { + "epoch": 1.22, + "learning_rate": 1.3413411202798625e-06, + "loss": 0.6475, + "step": 47691 + }, + { + "epoch": 1.22, + "learning_rate": 1.341315111596945e-06, + "loss": 0.6047, + "step": 47692 + }, + { + "epoch": 1.22, + "learning_rate": 1.3412891026526984e-06, + "loss": 0.7559, + "step": 47693 + }, + { + "epoch": 1.22, + "learning_rate": 1.3412630934471422e-06, + "loss": 0.7744, + "step": 47694 + }, + { + "epoch": 1.22, + "learning_rate": 1.3412370839802968e-06, + "loss": 0.6208, + "step": 47695 + }, + { + "epoch": 1.22, + "learning_rate": 1.3412110742521815e-06, + "loss": 0.7451, + "step": 47696 + }, + { + "epoch": 1.22, + "learning_rate": 1.3411850642628165e-06, + "loss": 0.519, + "step": 47697 + }, + { + "epoch": 1.22, + "learning_rate": 1.3411590540122224e-06, + "loss": 0.4883, + "step": 47698 + }, + { + "epoch": 1.22, + "learning_rate": 1.341133043500418e-06, + "loss": 0.5957, + "step": 47699 + }, + { + "epoch": 1.22, + "learning_rate": 1.341107032727424e-06, + "loss": 0.7236, + "step": 47700 + }, + { + "epoch": 1.22, + "learning_rate": 1.3410810216932597e-06, + "loss": 0.7139, + "step": 47701 + }, + { + "epoch": 1.22, + "learning_rate": 1.3410550103979456e-06, + "loss": 0.8838, + "step": 47702 + }, + { + "epoch": 1.22, + "learning_rate": 1.3410289988415013e-06, + "loss": 0.2537, + "step": 47703 + }, + { + "epoch": 1.22, + "learning_rate": 1.3410029870239468e-06, + "loss": 0.6123, + "step": 47704 + }, + { + "epoch": 1.22, + "learning_rate": 1.340976974945302e-06, + "loss": 0.6182, + "step": 47705 + }, + { + "epoch": 1.22, + "learning_rate": 1.340950962605587e-06, + "loss": 0.6626, + "step": 47706 + }, + { + "epoch": 1.22, + "learning_rate": 1.3409249500048211e-06, + "loss": 0.6377, + "step": 47707 + }, + { + "epoch": 1.22, + "learning_rate": 1.340898937143025e-06, + "loss": 0.623, + "step": 47708 + }, + { + "epoch": 1.22, + "learning_rate": 1.3408729240202178e-06, + "loss": 0.6689, + "step": 47709 + }, + { + "epoch": 1.22, + "learning_rate": 1.3408469106364202e-06, + "loss": 0.6865, + "step": 47710 + }, + { + "epoch": 1.22, + "learning_rate": 1.3408208969916519e-06, + "loss": 0.7842, + "step": 47711 + }, + { + "epoch": 1.22, + "learning_rate": 1.3407948830859327e-06, + "loss": 0.6289, + "step": 47712 + }, + { + "epoch": 1.22, + "learning_rate": 1.3407688689192822e-06, + "loss": 0.6724, + "step": 47713 + }, + { + "epoch": 1.22, + "learning_rate": 1.340742854491721e-06, + "loss": 0.4648, + "step": 47714 + }, + { + "epoch": 1.22, + "learning_rate": 1.3407168398032684e-06, + "loss": 0.6606, + "step": 47715 + }, + { + "epoch": 1.22, + "learning_rate": 1.3406908248539446e-06, + "loss": 0.6611, + "step": 47716 + }, + { + "epoch": 1.22, + "learning_rate": 1.3406648096437699e-06, + "loss": 0.5879, + "step": 47717 + }, + { + "epoch": 1.22, + "learning_rate": 1.3406387941727632e-06, + "loss": 0.5698, + "step": 47718 + }, + { + "epoch": 1.22, + "learning_rate": 1.3406127784409456e-06, + "loss": 0.5986, + "step": 47719 + }, + { + "epoch": 1.22, + "learning_rate": 1.340586762448336e-06, + "loss": 0.877, + "step": 47720 + }, + { + "epoch": 1.22, + "learning_rate": 1.340560746194955e-06, + "loss": 0.7017, + "step": 47721 + }, + { + "epoch": 1.22, + "learning_rate": 1.3405347296808222e-06, + "loss": 0.6875, + "step": 47722 + }, + { + "epoch": 1.22, + "learning_rate": 1.340508712905958e-06, + "loss": 0.6699, + "step": 47723 + }, + { + "epoch": 1.22, + "learning_rate": 1.3404826958703813e-06, + "loss": 0.6611, + "step": 47724 + }, + { + "epoch": 1.22, + "learning_rate": 1.3404566785741133e-06, + "loss": 0.645, + "step": 47725 + }, + { + "epoch": 1.22, + "learning_rate": 1.340430661017173e-06, + "loss": 0.4539, + "step": 47726 + }, + { + "epoch": 1.22, + "learning_rate": 1.3404046431995806e-06, + "loss": 0.6646, + "step": 47727 + }, + { + "epoch": 1.22, + "learning_rate": 1.3403786251213559e-06, + "loss": 0.5815, + "step": 47728 + }, + { + "epoch": 1.22, + "learning_rate": 1.340352606782519e-06, + "loss": 0.6943, + "step": 47729 + }, + { + "epoch": 1.22, + "learning_rate": 1.3403265881830898e-06, + "loss": 0.7637, + "step": 47730 + }, + { + "epoch": 1.22, + "learning_rate": 1.3403005693230882e-06, + "loss": 0.6714, + "step": 47731 + }, + { + "epoch": 1.22, + "learning_rate": 1.340274550202534e-06, + "loss": 0.6318, + "step": 47732 + }, + { + "epoch": 1.22, + "learning_rate": 1.3402485308214472e-06, + "loss": 0.6216, + "step": 47733 + }, + { + "epoch": 1.22, + "learning_rate": 1.3402225111798477e-06, + "loss": 0.7744, + "step": 47734 + }, + { + "epoch": 1.22, + "learning_rate": 1.3401964912777556e-06, + "loss": 0.6172, + "step": 47735 + }, + { + "epoch": 1.22, + "learning_rate": 1.3401704711151908e-06, + "loss": 0.5933, + "step": 47736 + }, + { + "epoch": 1.22, + "learning_rate": 1.3401444506921733e-06, + "loss": 0.6289, + "step": 47737 + }, + { + "epoch": 1.22, + "learning_rate": 1.3401184300087224e-06, + "loss": 0.8311, + "step": 47738 + }, + { + "epoch": 1.22, + "learning_rate": 1.3400924090648586e-06, + "loss": 0.6553, + "step": 47739 + }, + { + "epoch": 1.22, + "learning_rate": 1.3400663878606016e-06, + "loss": 0.7178, + "step": 47740 + }, + { + "epoch": 1.22, + "learning_rate": 1.3400403663959714e-06, + "loss": 0.6294, + "step": 47741 + }, + { + "epoch": 1.22, + "learning_rate": 1.3400143446709882e-06, + "loss": 0.5378, + "step": 47742 + }, + { + "epoch": 1.22, + "learning_rate": 1.3399883226856711e-06, + "loss": 0.6885, + "step": 47743 + }, + { + "epoch": 1.22, + "learning_rate": 1.3399623004400412e-06, + "loss": 0.6785, + "step": 47744 + }, + { + "epoch": 1.22, + "learning_rate": 1.3399362779341175e-06, + "loss": 0.4929, + "step": 47745 + }, + { + "epoch": 1.22, + "learning_rate": 1.3399102551679202e-06, + "loss": 0.6641, + "step": 47746 + }, + { + "epoch": 1.22, + "learning_rate": 1.3398842321414692e-06, + "loss": 0.6865, + "step": 47747 + }, + { + "epoch": 1.22, + "learning_rate": 1.3398582088547847e-06, + "loss": 0.709, + "step": 47748 + }, + { + "epoch": 1.22, + "learning_rate": 1.339832185307886e-06, + "loss": 0.7686, + "step": 47749 + }, + { + "epoch": 1.22, + "learning_rate": 1.3398061615007941e-06, + "loss": 0.6821, + "step": 47750 + }, + { + "epoch": 1.22, + "learning_rate": 1.3397801374335277e-06, + "loss": 0.5898, + "step": 47751 + }, + { + "epoch": 1.22, + "learning_rate": 1.3397541131061073e-06, + "loss": 0.6846, + "step": 47752 + }, + { + "epoch": 1.22, + "learning_rate": 1.3397280885185528e-06, + "loss": 0.6475, + "step": 47753 + }, + { + "epoch": 1.22, + "learning_rate": 1.3397020636708844e-06, + "loss": 0.6616, + "step": 47754 + }, + { + "epoch": 1.22, + "learning_rate": 1.3396760385631217e-06, + "loss": 0.7393, + "step": 47755 + }, + { + "epoch": 1.22, + "learning_rate": 1.3396500131952846e-06, + "loss": 0.6953, + "step": 47756 + }, + { + "epoch": 1.22, + "learning_rate": 1.3396239875673928e-06, + "loss": 0.8008, + "step": 47757 + }, + { + "epoch": 1.22, + "learning_rate": 1.3395979616794667e-06, + "loss": 0.5342, + "step": 47758 + }, + { + "epoch": 1.22, + "learning_rate": 1.3395719355315263e-06, + "loss": 0.636, + "step": 47759 + }, + { + "epoch": 1.22, + "learning_rate": 1.339545909123591e-06, + "loss": 0.6372, + "step": 47760 + }, + { + "epoch": 1.22, + "learning_rate": 1.3395198824556812e-06, + "loss": 0.6172, + "step": 47761 + }, + { + "epoch": 1.22, + "learning_rate": 1.3394938555278166e-06, + "loss": 0.6509, + "step": 47762 + }, + { + "epoch": 1.22, + "learning_rate": 1.3394678283400168e-06, + "loss": 0.5488, + "step": 47763 + }, + { + "epoch": 1.22, + "learning_rate": 1.3394418008923027e-06, + "loss": 0.6865, + "step": 47764 + }, + { + "epoch": 1.22, + "learning_rate": 1.3394157731846934e-06, + "loss": 0.8228, + "step": 47765 + }, + { + "epoch": 1.22, + "learning_rate": 1.339389745217209e-06, + "loss": 0.6182, + "step": 47766 + }, + { + "epoch": 1.22, + "learning_rate": 1.3393637169898695e-06, + "loss": 0.5708, + "step": 47767 + }, + { + "epoch": 1.22, + "learning_rate": 1.3393376885026945e-06, + "loss": 0.6543, + "step": 47768 + }, + { + "epoch": 1.22, + "learning_rate": 1.3393116597557047e-06, + "loss": 0.7314, + "step": 47769 + }, + { + "epoch": 1.22, + "learning_rate": 1.3392856307489196e-06, + "loss": 0.5785, + "step": 47770 + }, + { + "epoch": 1.22, + "learning_rate": 1.3392596014823587e-06, + "loss": 0.6763, + "step": 47771 + }, + { + "epoch": 1.22, + "learning_rate": 1.3392335719560424e-06, + "loss": 0.833, + "step": 47772 + }, + { + "epoch": 1.22, + "learning_rate": 1.3392075421699907e-06, + "loss": 0.6377, + "step": 47773 + }, + { + "epoch": 1.22, + "learning_rate": 1.3391815121242232e-06, + "loss": 0.5469, + "step": 47774 + }, + { + "epoch": 1.22, + "learning_rate": 1.3391554818187605e-06, + "loss": 0.6685, + "step": 47775 + }, + { + "epoch": 1.22, + "learning_rate": 1.3391294512536216e-06, + "loss": 0.6206, + "step": 47776 + }, + { + "epoch": 1.22, + "learning_rate": 1.3391034204288269e-06, + "loss": 0.6123, + "step": 47777 + }, + { + "epoch": 1.22, + "learning_rate": 1.3390773893443962e-06, + "loss": 0.7246, + "step": 47778 + }, + { + "epoch": 1.22, + "learning_rate": 1.3390513580003498e-06, + "loss": 0.5771, + "step": 47779 + }, + { + "epoch": 1.22, + "learning_rate": 1.3390253263967072e-06, + "loss": 0.8062, + "step": 47780 + }, + { + "epoch": 1.22, + "learning_rate": 1.3389992945334887e-06, + "loss": 0.604, + "step": 47781 + }, + { + "epoch": 1.22, + "learning_rate": 1.3389732624107138e-06, + "loss": 0.5923, + "step": 47782 + }, + { + "epoch": 1.22, + "learning_rate": 1.3389472300284027e-06, + "loss": 0.7383, + "step": 47783 + }, + { + "epoch": 1.22, + "learning_rate": 1.3389211973865752e-06, + "loss": 0.7803, + "step": 47784 + }, + { + "epoch": 1.22, + "learning_rate": 1.3388951644852514e-06, + "loss": 0.6768, + "step": 47785 + }, + { + "epoch": 1.22, + "learning_rate": 1.3388691313244515e-06, + "loss": 0.625, + "step": 47786 + }, + { + "epoch": 1.22, + "learning_rate": 1.3388430979041947e-06, + "loss": 0.6768, + "step": 47787 + }, + { + "epoch": 1.22, + "learning_rate": 1.3388170642245013e-06, + "loss": 0.7646, + "step": 47788 + }, + { + "epoch": 1.22, + "learning_rate": 1.3387910302853913e-06, + "loss": 0.8066, + "step": 47789 + }, + { + "epoch": 1.22, + "learning_rate": 1.338764996086885e-06, + "loss": 0.6299, + "step": 47790 + }, + { + "epoch": 1.22, + "learning_rate": 1.3387389616290016e-06, + "loss": 0.6318, + "step": 47791 + }, + { + "epoch": 1.22, + "learning_rate": 1.3387129269117612e-06, + "loss": 0.7783, + "step": 47792 + }, + { + "epoch": 1.22, + "learning_rate": 1.3386868919351839e-06, + "loss": 0.6475, + "step": 47793 + }, + { + "epoch": 1.22, + "learning_rate": 1.33866085669929e-06, + "loss": 0.5759, + "step": 47794 + }, + { + "epoch": 1.23, + "learning_rate": 1.3386348212040987e-06, + "loss": 0.7578, + "step": 47795 + }, + { + "epoch": 1.23, + "learning_rate": 1.3386087854496305e-06, + "loss": 0.6504, + "step": 47796 + }, + { + "epoch": 1.23, + "learning_rate": 1.3385827494359047e-06, + "loss": 0.6108, + "step": 47797 + }, + { + "epoch": 1.23, + "learning_rate": 1.338556713162942e-06, + "loss": 0.7148, + "step": 47798 + }, + { + "epoch": 1.23, + "learning_rate": 1.338530676630762e-06, + "loss": 0.6206, + "step": 47799 + }, + { + "epoch": 1.23, + "learning_rate": 1.3385046398393848e-06, + "loss": 0.5034, + "step": 47800 + }, + { + "epoch": 1.23, + "learning_rate": 1.3384786027888298e-06, + "loss": 0.6201, + "step": 47801 + }, + { + "epoch": 1.23, + "learning_rate": 1.3384525654791174e-06, + "loss": 0.7188, + "step": 47802 + }, + { + "epoch": 1.23, + "learning_rate": 1.3384265279102675e-06, + "loss": 0.5347, + "step": 47803 + }, + { + "epoch": 1.23, + "learning_rate": 1.3384004900823e-06, + "loss": 0.5781, + "step": 47804 + }, + { + "epoch": 1.23, + "learning_rate": 1.3383744519952346e-06, + "loss": 0.6724, + "step": 47805 + }, + { + "epoch": 1.23, + "learning_rate": 1.3383484136490916e-06, + "loss": 0.5522, + "step": 47806 + }, + { + "epoch": 1.23, + "learning_rate": 1.3383223750438908e-06, + "loss": 0.7529, + "step": 47807 + }, + { + "epoch": 1.23, + "learning_rate": 1.3382963361796519e-06, + "loss": 0.7588, + "step": 47808 + }, + { + "epoch": 1.23, + "learning_rate": 1.3382702970563953e-06, + "loss": 0.7715, + "step": 47809 + }, + { + "epoch": 1.23, + "learning_rate": 1.3382442576741407e-06, + "loss": 0.6562, + "step": 47810 + }, + { + "epoch": 1.23, + "learning_rate": 1.338218218032908e-06, + "loss": 0.646, + "step": 47811 + }, + { + "epoch": 1.23, + "learning_rate": 1.338192178132717e-06, + "loss": 0.8008, + "step": 47812 + }, + { + "epoch": 1.23, + "learning_rate": 1.338166137973588e-06, + "loss": 0.5906, + "step": 47813 + }, + { + "epoch": 1.23, + "learning_rate": 1.3381400975555406e-06, + "loss": 0.7383, + "step": 47814 + }, + { + "epoch": 1.23, + "learning_rate": 1.3381140568785952e-06, + "loss": 0.707, + "step": 47815 + }, + { + "epoch": 1.23, + "learning_rate": 1.338088015942771e-06, + "loss": 0.5522, + "step": 47816 + }, + { + "epoch": 1.23, + "learning_rate": 1.3380619747480883e-06, + "loss": 0.5986, + "step": 47817 + }, + { + "epoch": 1.23, + "learning_rate": 1.3380359332945673e-06, + "loss": 0.604, + "step": 47818 + }, + { + "epoch": 1.23, + "learning_rate": 1.3380098915822277e-06, + "loss": 0.7432, + "step": 47819 + }, + { + "epoch": 1.23, + "learning_rate": 1.3379838496110895e-06, + "loss": 0.6296, + "step": 47820 + }, + { + "epoch": 1.23, + "learning_rate": 1.3379578073811728e-06, + "loss": 0.7471, + "step": 47821 + }, + { + "epoch": 1.23, + "learning_rate": 1.3379317648924968e-06, + "loss": 0.6396, + "step": 47822 + }, + { + "epoch": 1.23, + "learning_rate": 1.3379057221450825e-06, + "loss": 0.4263, + "step": 47823 + }, + { + "epoch": 1.23, + "learning_rate": 1.337879679138949e-06, + "loss": 0.5232, + "step": 47824 + }, + { + "epoch": 1.23, + "learning_rate": 1.3378536358741168e-06, + "loss": 0.6504, + "step": 47825 + }, + { + "epoch": 1.23, + "learning_rate": 1.3378275923506054e-06, + "loss": 0.7153, + "step": 47826 + }, + { + "epoch": 1.23, + "learning_rate": 1.3378015485684354e-06, + "loss": 0.5132, + "step": 47827 + }, + { + "epoch": 1.23, + "learning_rate": 1.3377755045276255e-06, + "loss": 0.6807, + "step": 47828 + }, + { + "epoch": 1.23, + "learning_rate": 1.337749460228197e-06, + "loss": 0.6973, + "step": 47829 + }, + { + "epoch": 1.23, + "learning_rate": 1.3377234156701693e-06, + "loss": 0.4907, + "step": 47830 + }, + { + "epoch": 1.23, + "learning_rate": 1.337697370853562e-06, + "loss": 0.6616, + "step": 47831 + }, + { + "epoch": 1.23, + "learning_rate": 1.3376713257783955e-06, + "loss": 0.748, + "step": 47832 + }, + { + "epoch": 1.23, + "learning_rate": 1.3376452804446894e-06, + "loss": 0.5129, + "step": 47833 + }, + { + "epoch": 1.23, + "learning_rate": 1.3376192348524641e-06, + "loss": 0.7119, + "step": 47834 + }, + { + "epoch": 1.23, + "learning_rate": 1.3375931890017393e-06, + "loss": 0.708, + "step": 47835 + }, + { + "epoch": 1.23, + "learning_rate": 1.3375671428925349e-06, + "loss": 0.6221, + "step": 47836 + }, + { + "epoch": 1.23, + "learning_rate": 1.3375410965248706e-06, + "loss": 0.6533, + "step": 47837 + }, + { + "epoch": 1.23, + "learning_rate": 1.337515049898767e-06, + "loss": 0.6533, + "step": 47838 + }, + { + "epoch": 1.23, + "learning_rate": 1.3374890030142432e-06, + "loss": 0.7876, + "step": 47839 + }, + { + "epoch": 1.23, + "learning_rate": 1.33746295587132e-06, + "loss": 0.6914, + "step": 47840 + }, + { + "epoch": 1.23, + "learning_rate": 1.3374369084700166e-06, + "loss": 0.7705, + "step": 47841 + }, + { + "epoch": 1.23, + "learning_rate": 1.3374108608103536e-06, + "loss": 0.5605, + "step": 47842 + }, + { + "epoch": 1.23, + "learning_rate": 1.3373848128923501e-06, + "loss": 0.7139, + "step": 47843 + }, + { + "epoch": 1.23, + "learning_rate": 1.3373587647160273e-06, + "loss": 0.7754, + "step": 47844 + }, + { + "epoch": 1.23, + "learning_rate": 1.3373327162814038e-06, + "loss": 0.5366, + "step": 47845 + }, + { + "epoch": 1.23, + "learning_rate": 1.3373066675885005e-06, + "loss": 0.6177, + "step": 47846 + }, + { + "epoch": 1.23, + "learning_rate": 1.3372806186373367e-06, + "loss": 0.8486, + "step": 47847 + }, + { + "epoch": 1.23, + "learning_rate": 1.3372545694279328e-06, + "loss": 0.7109, + "step": 47848 + }, + { + "epoch": 1.23, + "learning_rate": 1.3372285199603087e-06, + "loss": 0.5869, + "step": 47849 + }, + { + "epoch": 1.23, + "learning_rate": 1.3372024702344839e-06, + "loss": 0.6489, + "step": 47850 + }, + { + "epoch": 1.23, + "learning_rate": 1.337176420250479e-06, + "loss": 0.8379, + "step": 47851 + }, + { + "epoch": 1.23, + "learning_rate": 1.3371503700083133e-06, + "loss": 0.6455, + "step": 47852 + }, + { + "epoch": 1.23, + "learning_rate": 1.3371243195080073e-06, + "loss": 0.7842, + "step": 47853 + }, + { + "epoch": 1.23, + "learning_rate": 1.337098268749581e-06, + "loss": 0.5139, + "step": 47854 + }, + { + "epoch": 1.23, + "learning_rate": 1.3370722177330536e-06, + "loss": 0.7227, + "step": 47855 + }, + { + "epoch": 1.23, + "learning_rate": 1.3370461664584456e-06, + "loss": 0.4407, + "step": 47856 + }, + { + "epoch": 1.23, + "learning_rate": 1.3370201149257767e-06, + "loss": 0.5625, + "step": 47857 + }, + { + "epoch": 1.23, + "learning_rate": 1.336994063135067e-06, + "loss": 0.5251, + "step": 47858 + }, + { + "epoch": 1.23, + "learning_rate": 1.3369680110863368e-06, + "loss": 0.6138, + "step": 47859 + }, + { + "epoch": 1.23, + "learning_rate": 1.3369419587796055e-06, + "loss": 0.752, + "step": 47860 + }, + { + "epoch": 1.23, + "learning_rate": 1.3369159062148933e-06, + "loss": 0.7461, + "step": 47861 + }, + { + "epoch": 1.23, + "learning_rate": 1.3368898533922199e-06, + "loss": 0.6758, + "step": 47862 + }, + { + "epoch": 1.23, + "learning_rate": 1.3368638003116057e-06, + "loss": 0.6768, + "step": 47863 + }, + { + "epoch": 1.23, + "learning_rate": 1.3368377469730702e-06, + "loss": 0.6431, + "step": 47864 + }, + { + "epoch": 1.23, + "learning_rate": 1.3368116933766339e-06, + "loss": 0.7227, + "step": 47865 + }, + { + "epoch": 1.23, + "learning_rate": 1.3367856395223158e-06, + "loss": 0.666, + "step": 47866 + }, + { + "epoch": 1.23, + "learning_rate": 1.3367595854101366e-06, + "loss": 0.834, + "step": 47867 + }, + { + "epoch": 1.23, + "learning_rate": 1.336733531040116e-06, + "loss": 0.6475, + "step": 47868 + }, + { + "epoch": 1.23, + "learning_rate": 1.336707476412274e-06, + "loss": 0.7957, + "step": 47869 + }, + { + "epoch": 1.23, + "learning_rate": 1.336681421526631e-06, + "loss": 0.6465, + "step": 47870 + }, + { + "epoch": 1.23, + "learning_rate": 1.3366553663832063e-06, + "loss": 0.6123, + "step": 47871 + }, + { + "epoch": 1.23, + "learning_rate": 1.3366293109820198e-06, + "loss": 0.46, + "step": 47872 + }, + { + "epoch": 1.23, + "learning_rate": 1.336603255323092e-06, + "loss": 0.7617, + "step": 47873 + }, + { + "epoch": 1.23, + "learning_rate": 1.3365771994064422e-06, + "loss": 0.5649, + "step": 47874 + }, + { + "epoch": 1.23, + "learning_rate": 1.336551143232091e-06, + "loss": 0.8428, + "step": 47875 + }, + { + "epoch": 1.23, + "learning_rate": 1.3365250868000582e-06, + "loss": 0.6265, + "step": 47876 + }, + { + "epoch": 1.23, + "learning_rate": 1.3364990301103634e-06, + "loss": 0.7168, + "step": 47877 + }, + { + "epoch": 1.23, + "learning_rate": 1.3364729731630269e-06, + "loss": 0.6084, + "step": 47878 + }, + { + "epoch": 1.23, + "learning_rate": 1.3364469159580682e-06, + "loss": 0.79, + "step": 47879 + }, + { + "epoch": 1.23, + "learning_rate": 1.336420858495508e-06, + "loss": 0.6514, + "step": 47880 + }, + { + "epoch": 1.23, + "learning_rate": 1.3363948007753655e-06, + "loss": 0.6855, + "step": 47881 + }, + { + "epoch": 1.23, + "learning_rate": 1.3363687427976612e-06, + "loss": 0.6479, + "step": 47882 + }, + { + "epoch": 1.23, + "learning_rate": 1.3363426845624147e-06, + "loss": 0.6281, + "step": 47883 + }, + { + "epoch": 1.23, + "learning_rate": 1.3363166260696462e-06, + "loss": 0.5923, + "step": 47884 + }, + { + "epoch": 1.23, + "learning_rate": 1.3362905673193755e-06, + "loss": 0.9531, + "step": 47885 + }, + { + "epoch": 1.23, + "learning_rate": 1.3362645083116224e-06, + "loss": 0.7344, + "step": 47886 + }, + { + "epoch": 1.23, + "learning_rate": 1.3362384490464069e-06, + "loss": 0.6401, + "step": 47887 + }, + { + "epoch": 1.23, + "learning_rate": 1.3362123895237494e-06, + "loss": 0.6982, + "step": 47888 + }, + { + "epoch": 1.23, + "learning_rate": 1.3361863297436694e-06, + "loss": 0.7588, + "step": 47889 + }, + { + "epoch": 1.23, + "learning_rate": 1.336160269706187e-06, + "loss": 0.7295, + "step": 47890 + }, + { + "epoch": 1.23, + "learning_rate": 1.336134209411322e-06, + "loss": 0.7285, + "step": 47891 + }, + { + "epoch": 1.23, + "learning_rate": 1.3361081488590948e-06, + "loss": 0.5039, + "step": 47892 + }, + { + "epoch": 1.23, + "learning_rate": 1.3360820880495248e-06, + "loss": 0.6147, + "step": 47893 + }, + { + "epoch": 1.23, + "learning_rate": 1.3360560269826325e-06, + "loss": 0.8154, + "step": 47894 + }, + { + "epoch": 1.23, + "learning_rate": 1.3360299656584372e-06, + "loss": 0.7168, + "step": 47895 + }, + { + "epoch": 1.23, + "learning_rate": 1.3360039040769593e-06, + "loss": 0.5345, + "step": 47896 + }, + { + "epoch": 1.23, + "learning_rate": 1.3359778422382188e-06, + "loss": 0.6426, + "step": 47897 + }, + { + "epoch": 1.23, + "learning_rate": 1.3359517801422352e-06, + "loss": 0.4607, + "step": 47898 + }, + { + "epoch": 1.23, + "learning_rate": 1.335925717789029e-06, + "loss": 0.7705, + "step": 47899 + }, + { + "epoch": 1.23, + "learning_rate": 1.33589965517862e-06, + "loss": 0.8408, + "step": 47900 + }, + { + "epoch": 1.23, + "learning_rate": 1.335873592311028e-06, + "loss": 0.2503, + "step": 47901 + }, + { + "epoch": 1.23, + "learning_rate": 1.335847529186273e-06, + "loss": 0.5664, + "step": 47902 + }, + { + "epoch": 1.23, + "learning_rate": 1.3358214658043751e-06, + "loss": 0.7061, + "step": 47903 + }, + { + "epoch": 1.23, + "learning_rate": 1.335795402165354e-06, + "loss": 0.6738, + "step": 47904 + }, + { + "epoch": 1.23, + "learning_rate": 1.3357693382692302e-06, + "loss": 0.8096, + "step": 47905 + }, + { + "epoch": 1.23, + "learning_rate": 1.3357432741160226e-06, + "loss": 0.7402, + "step": 47906 + }, + { + "epoch": 1.23, + "learning_rate": 1.3357172097057521e-06, + "loss": 0.6748, + "step": 47907 + }, + { + "epoch": 1.23, + "learning_rate": 1.3356911450384383e-06, + "loss": 0.7554, + "step": 47908 + }, + { + "epoch": 1.23, + "learning_rate": 1.3356650801141014e-06, + "loss": 0.6729, + "step": 47909 + }, + { + "epoch": 1.23, + "learning_rate": 1.3356390149327612e-06, + "loss": 0.5745, + "step": 47910 + }, + { + "epoch": 1.23, + "learning_rate": 1.3356129494944377e-06, + "loss": 0.6904, + "step": 47911 + }, + { + "epoch": 1.23, + "learning_rate": 1.3355868837991503e-06, + "loss": 0.6489, + "step": 47912 + }, + { + "epoch": 1.23, + "learning_rate": 1.33556081784692e-06, + "loss": 0.6699, + "step": 47913 + }, + { + "epoch": 1.23, + "learning_rate": 1.3355347516377658e-06, + "loss": 0.6787, + "step": 47914 + }, + { + "epoch": 1.23, + "learning_rate": 1.3355086851717084e-06, + "loss": 0.646, + "step": 47915 + }, + { + "epoch": 1.23, + "learning_rate": 1.3354826184487674e-06, + "loss": 0.71, + "step": 47916 + }, + { + "epoch": 1.23, + "learning_rate": 1.3354565514689625e-06, + "loss": 0.7031, + "step": 47917 + }, + { + "epoch": 1.23, + "learning_rate": 1.3354304842323142e-06, + "loss": 0.7036, + "step": 47918 + }, + { + "epoch": 1.23, + "learning_rate": 1.3354044167388424e-06, + "loss": 0.7109, + "step": 47919 + }, + { + "epoch": 1.23, + "learning_rate": 1.3353783489885664e-06, + "loss": 0.6836, + "step": 47920 + }, + { + "epoch": 1.23, + "learning_rate": 1.3353522809815067e-06, + "loss": 0.7544, + "step": 47921 + }, + { + "epoch": 1.23, + "learning_rate": 1.3353262127176833e-06, + "loss": 0.6299, + "step": 47922 + }, + { + "epoch": 1.23, + "learning_rate": 1.335300144197116e-06, + "loss": 0.7324, + "step": 47923 + }, + { + "epoch": 1.23, + "learning_rate": 1.335274075419825e-06, + "loss": 0.6479, + "step": 47924 + }, + { + "epoch": 1.23, + "learning_rate": 1.3352480063858299e-06, + "loss": 0.5059, + "step": 47925 + }, + { + "epoch": 1.23, + "learning_rate": 1.3352219370951508e-06, + "loss": 0.6582, + "step": 47926 + }, + { + "epoch": 1.23, + "learning_rate": 1.3351958675478074e-06, + "loss": 0.7197, + "step": 47927 + }, + { + "epoch": 1.23, + "learning_rate": 1.3351697977438203e-06, + "loss": 0.7354, + "step": 47928 + }, + { + "epoch": 1.23, + "learning_rate": 1.335143727683209e-06, + "loss": 0.5642, + "step": 47929 + }, + { + "epoch": 1.23, + "learning_rate": 1.335117657365994e-06, + "loss": 0.5176, + "step": 47930 + }, + { + "epoch": 1.23, + "learning_rate": 1.335091586792194e-06, + "loss": 0.7197, + "step": 47931 + }, + { + "epoch": 1.23, + "learning_rate": 1.3350655159618304e-06, + "loss": 0.5596, + "step": 47932 + }, + { + "epoch": 1.23, + "learning_rate": 1.335039444874922e-06, + "loss": 0.7314, + "step": 47933 + }, + { + "epoch": 1.23, + "learning_rate": 1.3350133735314897e-06, + "loss": 0.5508, + "step": 47934 + }, + { + "epoch": 1.23, + "learning_rate": 1.3349873019315532e-06, + "loss": 0.5557, + "step": 47935 + }, + { + "epoch": 1.23, + "learning_rate": 1.3349612300751321e-06, + "loss": 0.7422, + "step": 47936 + }, + { + "epoch": 1.23, + "learning_rate": 1.3349351579622464e-06, + "loss": 0.5918, + "step": 47937 + }, + { + "epoch": 1.23, + "learning_rate": 1.3349090855929167e-06, + "loss": 0.6704, + "step": 47938 + }, + { + "epoch": 1.23, + "learning_rate": 1.334883012967162e-06, + "loss": 0.7134, + "step": 47939 + }, + { + "epoch": 1.23, + "learning_rate": 1.334856940085003e-06, + "loss": 0.7002, + "step": 47940 + }, + { + "epoch": 1.23, + "learning_rate": 1.3348308669464596e-06, + "loss": 0.4358, + "step": 47941 + }, + { + "epoch": 1.23, + "learning_rate": 1.3348047935515513e-06, + "loss": 0.7207, + "step": 47942 + }, + { + "epoch": 1.23, + "learning_rate": 1.3347787199002987e-06, + "loss": 0.8242, + "step": 47943 + }, + { + "epoch": 1.23, + "learning_rate": 1.334752645992721e-06, + "loss": 0.4603, + "step": 47944 + }, + { + "epoch": 1.23, + "learning_rate": 1.3347265718288391e-06, + "loss": 0.668, + "step": 47945 + }, + { + "epoch": 1.23, + "learning_rate": 1.3347004974086721e-06, + "loss": 0.4412, + "step": 47946 + }, + { + "epoch": 1.23, + "learning_rate": 1.3346744227322404e-06, + "loss": 0.752, + "step": 47947 + }, + { + "epoch": 1.23, + "learning_rate": 1.3346483477995638e-06, + "loss": 0.5725, + "step": 47948 + }, + { + "epoch": 1.23, + "learning_rate": 1.3346222726106627e-06, + "loss": 0.6738, + "step": 47949 + }, + { + "epoch": 1.23, + "learning_rate": 1.3345961971655564e-06, + "loss": 0.6133, + "step": 47950 + }, + { + "epoch": 1.23, + "learning_rate": 1.3345701214642654e-06, + "loss": 0.4146, + "step": 47951 + }, + { + "epoch": 1.23, + "learning_rate": 1.3345440455068091e-06, + "loss": 0.5581, + "step": 47952 + }, + { + "epoch": 1.23, + "learning_rate": 1.334517969293208e-06, + "loss": 0.7559, + "step": 47953 + }, + { + "epoch": 1.23, + "learning_rate": 1.334491892823482e-06, + "loss": 0.7061, + "step": 47954 + }, + { + "epoch": 1.23, + "learning_rate": 1.334465816097651e-06, + "loss": 0.6157, + "step": 47955 + }, + { + "epoch": 1.23, + "learning_rate": 1.3344397391157345e-06, + "loss": 0.7104, + "step": 47956 + }, + { + "epoch": 1.23, + "learning_rate": 1.3344136618777531e-06, + "loss": 0.7559, + "step": 47957 + }, + { + "epoch": 1.23, + "learning_rate": 1.3343875843837262e-06, + "loss": 0.5698, + "step": 47958 + }, + { + "epoch": 1.23, + "learning_rate": 1.3343615066336747e-06, + "loss": 0.6421, + "step": 47959 + }, + { + "epoch": 1.23, + "learning_rate": 1.3343354286276176e-06, + "loss": 0.6299, + "step": 47960 + }, + { + "epoch": 1.23, + "learning_rate": 1.3343093503655753e-06, + "loss": 0.6934, + "step": 47961 + }, + { + "epoch": 1.23, + "learning_rate": 1.3342832718475677e-06, + "loss": 0.6768, + "step": 47962 + }, + { + "epoch": 1.23, + "learning_rate": 1.334257193073615e-06, + "loss": 0.7373, + "step": 47963 + }, + { + "epoch": 1.23, + "learning_rate": 1.3342311140437366e-06, + "loss": 0.5352, + "step": 47964 + }, + { + "epoch": 1.23, + "learning_rate": 1.3342050347579527e-06, + "loss": 0.6611, + "step": 47965 + }, + { + "epoch": 1.23, + "learning_rate": 1.3341789552162838e-06, + "loss": 0.708, + "step": 47966 + }, + { + "epoch": 1.23, + "learning_rate": 1.3341528754187493e-06, + "loss": 0.5266, + "step": 47967 + }, + { + "epoch": 1.23, + "learning_rate": 1.3341267953653691e-06, + "loss": 0.4386, + "step": 47968 + }, + { + "epoch": 1.23, + "learning_rate": 1.3341007150561634e-06, + "loss": 0.7085, + "step": 47969 + }, + { + "epoch": 1.23, + "learning_rate": 1.3340746344911526e-06, + "loss": 0.6914, + "step": 47970 + }, + { + "epoch": 1.23, + "learning_rate": 1.3340485536703557e-06, + "loss": 0.7383, + "step": 47971 + }, + { + "epoch": 1.23, + "learning_rate": 1.3340224725937934e-06, + "loss": 0.7295, + "step": 47972 + }, + { + "epoch": 1.23, + "learning_rate": 1.3339963912614854e-06, + "loss": 0.5806, + "step": 47973 + }, + { + "epoch": 1.23, + "learning_rate": 1.3339703096734518e-06, + "loss": 0.6689, + "step": 47974 + }, + { + "epoch": 1.23, + "learning_rate": 1.3339442278297127e-06, + "loss": 0.5256, + "step": 47975 + }, + { + "epoch": 1.23, + "learning_rate": 1.3339181457302876e-06, + "loss": 0.4756, + "step": 47976 + }, + { + "epoch": 1.23, + "learning_rate": 1.3338920633751964e-06, + "loss": 0.6543, + "step": 47977 + }, + { + "epoch": 1.23, + "learning_rate": 1.3338659807644598e-06, + "loss": 0.4434, + "step": 47978 + }, + { + "epoch": 1.23, + "learning_rate": 1.3338398978980972e-06, + "loss": 0.7314, + "step": 47979 + }, + { + "epoch": 1.23, + "learning_rate": 1.333813814776129e-06, + "loss": 0.6084, + "step": 47980 + }, + { + "epoch": 1.23, + "learning_rate": 1.3337877313985746e-06, + "loss": 0.5676, + "step": 47981 + }, + { + "epoch": 1.23, + "learning_rate": 1.3337616477654545e-06, + "loss": 0.7803, + "step": 47982 + }, + { + "epoch": 1.23, + "learning_rate": 1.3337355638767881e-06, + "loss": 0.5623, + "step": 47983 + }, + { + "epoch": 1.23, + "learning_rate": 1.3337094797325963e-06, + "loss": 0.6294, + "step": 47984 + }, + { + "epoch": 1.23, + "learning_rate": 1.3336833953328984e-06, + "loss": 0.71, + "step": 47985 + }, + { + "epoch": 1.23, + "learning_rate": 1.333657310677714e-06, + "loss": 0.7119, + "step": 47986 + }, + { + "epoch": 1.23, + "learning_rate": 1.3336312257670638e-06, + "loss": 0.6455, + "step": 47987 + }, + { + "epoch": 1.23, + "learning_rate": 1.3336051406009674e-06, + "loss": 0.6582, + "step": 47988 + }, + { + "epoch": 1.23, + "learning_rate": 1.333579055179445e-06, + "loss": 0.4951, + "step": 47989 + }, + { + "epoch": 1.23, + "learning_rate": 1.3335529695025165e-06, + "loss": 0.532, + "step": 47990 + }, + { + "epoch": 1.23, + "learning_rate": 1.3335268835702019e-06, + "loss": 0.6807, + "step": 47991 + }, + { + "epoch": 1.23, + "learning_rate": 1.333500797382521e-06, + "loss": 0.5803, + "step": 47992 + }, + { + "epoch": 1.23, + "learning_rate": 1.3334747109394938e-06, + "loss": 0.6719, + "step": 47993 + }, + { + "epoch": 1.23, + "learning_rate": 1.3334486242411403e-06, + "loss": 0.5967, + "step": 47994 + }, + { + "epoch": 1.23, + "learning_rate": 1.3334225372874808e-06, + "loss": 0.5586, + "step": 47995 + }, + { + "epoch": 1.23, + "learning_rate": 1.3333964500785348e-06, + "loss": 0.6719, + "step": 47996 + }, + { + "epoch": 1.23, + "learning_rate": 1.3333703626143224e-06, + "loss": 0.4644, + "step": 47997 + }, + { + "epoch": 1.23, + "learning_rate": 1.3333442748948637e-06, + "loss": 0.7168, + "step": 47998 + }, + { + "epoch": 1.23, + "learning_rate": 1.3333181869201786e-06, + "loss": 0.6025, + "step": 47999 + }, + { + "epoch": 1.23, + "learning_rate": 1.3332920986902873e-06, + "loss": 0.4795, + "step": 48000 + }, + { + "epoch": 1.23, + "learning_rate": 1.3332660102052096e-06, + "loss": 0.4429, + "step": 48001 + }, + { + "epoch": 1.23, + "learning_rate": 1.333239921464965e-06, + "loss": 0.5771, + "step": 48002 + }, + { + "epoch": 1.23, + "learning_rate": 1.3332138324695743e-06, + "loss": 0.5076, + "step": 48003 + }, + { + "epoch": 1.23, + "learning_rate": 1.3331877432190568e-06, + "loss": 0.6621, + "step": 48004 + }, + { + "epoch": 1.23, + "learning_rate": 1.333161653713433e-06, + "loss": 0.645, + "step": 48005 + }, + { + "epoch": 1.23, + "learning_rate": 1.3331355639527227e-06, + "loss": 0.5466, + "step": 48006 + }, + { + "epoch": 1.23, + "learning_rate": 1.3331094739369454e-06, + "loss": 0.7637, + "step": 48007 + }, + { + "epoch": 1.23, + "learning_rate": 1.3330833836661217e-06, + "loss": 0.5864, + "step": 48008 + }, + { + "epoch": 1.23, + "learning_rate": 1.3330572931402718e-06, + "loss": 0.7305, + "step": 48009 + }, + { + "epoch": 1.23, + "learning_rate": 1.3330312023594148e-06, + "loss": 0.5913, + "step": 48010 + }, + { + "epoch": 1.23, + "learning_rate": 1.333005111323571e-06, + "loss": 0.7734, + "step": 48011 + }, + { + "epoch": 1.23, + "learning_rate": 1.3329790200327608e-06, + "loss": 0.5488, + "step": 48012 + }, + { + "epoch": 1.23, + "learning_rate": 1.3329529284870036e-06, + "loss": 0.6289, + "step": 48013 + }, + { + "epoch": 1.23, + "learning_rate": 1.3329268366863202e-06, + "loss": 0.8311, + "step": 48014 + }, + { + "epoch": 1.23, + "learning_rate": 1.3329007446307295e-06, + "loss": 0.4629, + "step": 48015 + }, + { + "epoch": 1.23, + "learning_rate": 1.332874652320252e-06, + "loss": 0.7031, + "step": 48016 + }, + { + "epoch": 1.23, + "learning_rate": 1.332848559754908e-06, + "loss": 0.3967, + "step": 48017 + }, + { + "epoch": 1.23, + "learning_rate": 1.332822466934717e-06, + "loss": 0.6509, + "step": 48018 + }, + { + "epoch": 1.23, + "learning_rate": 1.3327963738596993e-06, + "loss": 0.5166, + "step": 48019 + }, + { + "epoch": 1.23, + "learning_rate": 1.3327702805298743e-06, + "loss": 0.728, + "step": 48020 + }, + { + "epoch": 1.23, + "learning_rate": 1.3327441869452627e-06, + "loss": 0.5691, + "step": 48021 + }, + { + "epoch": 1.23, + "learning_rate": 1.332718093105884e-06, + "loss": 0.7295, + "step": 48022 + }, + { + "epoch": 1.23, + "learning_rate": 1.3326919990117586e-06, + "loss": 0.7031, + "step": 48023 + }, + { + "epoch": 1.23, + "learning_rate": 1.3326659046629064e-06, + "loss": 0.6914, + "step": 48024 + }, + { + "epoch": 1.23, + "learning_rate": 1.3326398100593469e-06, + "loss": 0.6143, + "step": 48025 + }, + { + "epoch": 1.23, + "learning_rate": 1.3326137152011003e-06, + "loss": 0.5919, + "step": 48026 + }, + { + "epoch": 1.23, + "learning_rate": 1.3325876200881867e-06, + "loss": 0.8198, + "step": 48027 + }, + { + "epoch": 1.23, + "learning_rate": 1.3325615247206263e-06, + "loss": 0.6597, + "step": 48028 + }, + { + "epoch": 1.23, + "learning_rate": 1.3325354290984388e-06, + "loss": 0.7588, + "step": 48029 + }, + { + "epoch": 1.23, + "learning_rate": 1.332509333221644e-06, + "loss": 0.75, + "step": 48030 + }, + { + "epoch": 1.23, + "learning_rate": 1.3324832370902624e-06, + "loss": 0.5684, + "step": 48031 + }, + { + "epoch": 1.23, + "learning_rate": 1.3324571407043133e-06, + "loss": 0.6973, + "step": 48032 + }, + { + "epoch": 1.23, + "learning_rate": 1.332431044063817e-06, + "loss": 0.5669, + "step": 48033 + }, + { + "epoch": 1.23, + "learning_rate": 1.332404947168794e-06, + "loss": 0.48, + "step": 48034 + }, + { + "epoch": 1.23, + "learning_rate": 1.3323788500192637e-06, + "loss": 0.6597, + "step": 48035 + }, + { + "epoch": 1.23, + "learning_rate": 1.3323527526152458e-06, + "loss": 0.5735, + "step": 48036 + }, + { + "epoch": 1.23, + "learning_rate": 1.332326654956761e-06, + "loss": 0.5488, + "step": 48037 + }, + { + "epoch": 1.23, + "learning_rate": 1.3323005570438288e-06, + "loss": 0.7461, + "step": 48038 + }, + { + "epoch": 1.23, + "learning_rate": 1.33227445887647e-06, + "loss": 0.5083, + "step": 48039 + }, + { + "epoch": 1.23, + "learning_rate": 1.332248360454703e-06, + "loss": 0.6807, + "step": 48040 + }, + { + "epoch": 1.23, + "learning_rate": 1.3322222617785492e-06, + "loss": 0.6025, + "step": 48041 + }, + { + "epoch": 1.23, + "learning_rate": 1.3321961628480278e-06, + "loss": 0.6602, + "step": 48042 + }, + { + "epoch": 1.23, + "learning_rate": 1.332170063663159e-06, + "loss": 0.7266, + "step": 48043 + }, + { + "epoch": 1.23, + "learning_rate": 1.3321439642239635e-06, + "loss": 0.7539, + "step": 48044 + }, + { + "epoch": 1.23, + "learning_rate": 1.3321178645304602e-06, + "loss": 0.5908, + "step": 48045 + }, + { + "epoch": 1.23, + "learning_rate": 1.3320917645826694e-06, + "loss": 0.5146, + "step": 48046 + }, + { + "epoch": 1.23, + "learning_rate": 1.3320656643806116e-06, + "loss": 0.6064, + "step": 48047 + }, + { + "epoch": 1.23, + "learning_rate": 1.332039563924306e-06, + "loss": 0.7002, + "step": 48048 + }, + { + "epoch": 1.23, + "learning_rate": 1.3320134632137733e-06, + "loss": 0.7163, + "step": 48049 + }, + { + "epoch": 1.23, + "learning_rate": 1.331987362249033e-06, + "loss": 0.6626, + "step": 48050 + }, + { + "epoch": 1.23, + "learning_rate": 1.3319612610301051e-06, + "loss": 0.5933, + "step": 48051 + }, + { + "epoch": 1.23, + "learning_rate": 1.3319351595570098e-06, + "loss": 0.5098, + "step": 48052 + }, + { + "epoch": 1.23, + "learning_rate": 1.331909057829767e-06, + "loss": 0.4561, + "step": 48053 + }, + { + "epoch": 1.23, + "learning_rate": 1.331882955848397e-06, + "loss": 0.5938, + "step": 48054 + }, + { + "epoch": 1.23, + "learning_rate": 1.3318568536129192e-06, + "loss": 0.6001, + "step": 48055 + }, + { + "epoch": 1.23, + "learning_rate": 1.331830751123354e-06, + "loss": 0.5532, + "step": 48056 + }, + { + "epoch": 1.23, + "learning_rate": 1.3318046483797209e-06, + "loss": 0.7676, + "step": 48057 + }, + { + "epoch": 1.23, + "learning_rate": 1.3317785453820408e-06, + "loss": 0.5425, + "step": 48058 + }, + { + "epoch": 1.23, + "learning_rate": 1.3317524421303327e-06, + "loss": 0.751, + "step": 48059 + }, + { + "epoch": 1.23, + "learning_rate": 1.3317263386246173e-06, + "loss": 0.748, + "step": 48060 + }, + { + "epoch": 1.23, + "learning_rate": 1.331700234864914e-06, + "loss": 0.5284, + "step": 48061 + }, + { + "epoch": 1.23, + "learning_rate": 1.3316741308512434e-06, + "loss": 0.4646, + "step": 48062 + }, + { + "epoch": 1.23, + "learning_rate": 1.3316480265836248e-06, + "loss": 0.7266, + "step": 48063 + }, + { + "epoch": 1.23, + "learning_rate": 1.331621922062079e-06, + "loss": 0.7188, + "step": 48064 + }, + { + "epoch": 1.23, + "learning_rate": 1.331595817286625e-06, + "loss": 0.6621, + "step": 48065 + }, + { + "epoch": 1.23, + "learning_rate": 1.3315697122572838e-06, + "loss": 0.6992, + "step": 48066 + }, + { + "epoch": 1.23, + "learning_rate": 1.3315436069740746e-06, + "loss": 0.6069, + "step": 48067 + }, + { + "epoch": 1.23, + "learning_rate": 1.331517501437018e-06, + "loss": 0.6133, + "step": 48068 + }, + { + "epoch": 1.23, + "learning_rate": 1.3314913956461336e-06, + "loss": 0.6157, + "step": 48069 + }, + { + "epoch": 1.23, + "learning_rate": 1.3314652896014413e-06, + "loss": 0.7144, + "step": 48070 + }, + { + "epoch": 1.23, + "learning_rate": 1.3314391833029613e-06, + "loss": 0.7168, + "step": 48071 + }, + { + "epoch": 1.23, + "learning_rate": 1.3314130767507137e-06, + "loss": 0.7197, + "step": 48072 + }, + { + "epoch": 1.23, + "learning_rate": 1.3313869699447182e-06, + "loss": 0.707, + "step": 48073 + }, + { + "epoch": 1.23, + "learning_rate": 1.331360862884995e-06, + "loss": 0.6167, + "step": 48074 + }, + { + "epoch": 1.23, + "learning_rate": 1.3313347555715641e-06, + "loss": 0.7002, + "step": 48075 + }, + { + "epoch": 1.23, + "learning_rate": 1.3313086480044453e-06, + "loss": 0.6831, + "step": 48076 + }, + { + "epoch": 1.23, + "learning_rate": 1.331282540183659e-06, + "loss": 0.6807, + "step": 48077 + }, + { + "epoch": 1.23, + "learning_rate": 1.3312564321092243e-06, + "loss": 0.7285, + "step": 48078 + }, + { + "epoch": 1.23, + "learning_rate": 1.3312303237811624e-06, + "loss": 0.8096, + "step": 48079 + }, + { + "epoch": 1.23, + "learning_rate": 1.3312042151994924e-06, + "loss": 0.6128, + "step": 48080 + }, + { + "epoch": 1.23, + "learning_rate": 1.3311781063642346e-06, + "loss": 0.8462, + "step": 48081 + }, + { + "epoch": 1.23, + "learning_rate": 1.3311519972754086e-06, + "loss": 0.6616, + "step": 48082 + }, + { + "epoch": 1.23, + "learning_rate": 1.3311258879330352e-06, + "loss": 0.7598, + "step": 48083 + }, + { + "epoch": 1.23, + "learning_rate": 1.3310997783371338e-06, + "loss": 0.6855, + "step": 48084 + }, + { + "epoch": 1.23, + "learning_rate": 1.3310736684877246e-06, + "loss": 0.833, + "step": 48085 + }, + { + "epoch": 1.23, + "learning_rate": 1.3310475583848276e-06, + "loss": 0.7085, + "step": 48086 + }, + { + "epoch": 1.23, + "learning_rate": 1.3310214480284626e-06, + "loss": 0.6396, + "step": 48087 + }, + { + "epoch": 1.23, + "learning_rate": 1.3309953374186494e-06, + "loss": 0.6299, + "step": 48088 + }, + { + "epoch": 1.23, + "learning_rate": 1.3309692265554086e-06, + "loss": 0.6226, + "step": 48089 + }, + { + "epoch": 1.23, + "learning_rate": 1.3309431154387597e-06, + "loss": 0.6465, + "step": 48090 + }, + { + "epoch": 1.23, + "learning_rate": 1.3309170040687233e-06, + "loss": 0.6406, + "step": 48091 + }, + { + "epoch": 1.23, + "learning_rate": 1.3308908924453183e-06, + "loss": 0.7041, + "step": 48092 + }, + { + "epoch": 1.23, + "learning_rate": 1.3308647805685658e-06, + "loss": 0.8477, + "step": 48093 + }, + { + "epoch": 1.23, + "learning_rate": 1.3308386684384854e-06, + "loss": 0.5391, + "step": 48094 + }, + { + "epoch": 1.23, + "learning_rate": 1.3308125560550966e-06, + "loss": 0.7979, + "step": 48095 + }, + { + "epoch": 1.23, + "learning_rate": 1.3307864434184204e-06, + "loss": 0.4949, + "step": 48096 + }, + { + "epoch": 1.23, + "learning_rate": 1.3307603305284758e-06, + "loss": 0.8525, + "step": 48097 + }, + { + "epoch": 1.23, + "learning_rate": 1.3307342173852833e-06, + "loss": 0.5361, + "step": 48098 + }, + { + "epoch": 1.23, + "learning_rate": 1.330708103988863e-06, + "loss": 0.5391, + "step": 48099 + }, + { + "epoch": 1.23, + "learning_rate": 1.3306819903392347e-06, + "loss": 0.6396, + "step": 48100 + }, + { + "epoch": 1.23, + "learning_rate": 1.3306558764364181e-06, + "loss": 0.5918, + "step": 48101 + }, + { + "epoch": 1.23, + "learning_rate": 1.330629762280434e-06, + "loss": 0.7002, + "step": 48102 + }, + { + "epoch": 1.23, + "learning_rate": 1.3306036478713015e-06, + "loss": 0.5566, + "step": 48103 + }, + { + "epoch": 1.23, + "learning_rate": 1.330577533209041e-06, + "loss": 0.5786, + "step": 48104 + }, + { + "epoch": 1.23, + "learning_rate": 1.3305514182936729e-06, + "loss": 0.455, + "step": 48105 + }, + { + "epoch": 1.23, + "learning_rate": 1.3305253031252165e-06, + "loss": 0.5171, + "step": 48106 + }, + { + "epoch": 1.23, + "learning_rate": 1.3304991877036918e-06, + "loss": 0.6328, + "step": 48107 + }, + { + "epoch": 1.23, + "learning_rate": 1.3304730720291192e-06, + "loss": 0.6396, + "step": 48108 + }, + { + "epoch": 1.23, + "learning_rate": 1.330446956101519e-06, + "loss": 0.6523, + "step": 48109 + }, + { + "epoch": 1.23, + "learning_rate": 1.3304208399209104e-06, + "loss": 0.6748, + "step": 48110 + }, + { + "epoch": 1.23, + "learning_rate": 1.3303947234873135e-06, + "loss": 0.6787, + "step": 48111 + }, + { + "epoch": 1.23, + "learning_rate": 1.3303686068007492e-06, + "loss": 0.6914, + "step": 48112 + }, + { + "epoch": 1.23, + "learning_rate": 1.3303424898612363e-06, + "loss": 0.5142, + "step": 48113 + }, + { + "epoch": 1.23, + "learning_rate": 1.3303163726687955e-06, + "loss": 0.5137, + "step": 48114 + }, + { + "epoch": 1.23, + "learning_rate": 1.3302902552234468e-06, + "loss": 0.7422, + "step": 48115 + }, + { + "epoch": 1.23, + "learning_rate": 1.33026413752521e-06, + "loss": 0.5513, + "step": 48116 + }, + { + "epoch": 1.23, + "learning_rate": 1.330238019574105e-06, + "loss": 0.5874, + "step": 48117 + }, + { + "epoch": 1.23, + "learning_rate": 1.330211901370152e-06, + "loss": 0.7559, + "step": 48118 + }, + { + "epoch": 1.23, + "learning_rate": 1.330185782913371e-06, + "loss": 0.6226, + "step": 48119 + }, + { + "epoch": 1.23, + "learning_rate": 1.3301596642037815e-06, + "loss": 0.6934, + "step": 48120 + }, + { + "epoch": 1.23, + "learning_rate": 1.3301335452414044e-06, + "loss": 0.5776, + "step": 48121 + }, + { + "epoch": 1.23, + "learning_rate": 1.330107426026259e-06, + "loss": 0.7578, + "step": 48122 + }, + { + "epoch": 1.23, + "learning_rate": 1.3300813065583655e-06, + "loss": 0.7998, + "step": 48123 + }, + { + "epoch": 1.23, + "learning_rate": 1.3300551868377442e-06, + "loss": 0.7529, + "step": 48124 + }, + { + "epoch": 1.23, + "learning_rate": 1.3300290668644147e-06, + "loss": 0.9248, + "step": 48125 + }, + { + "epoch": 1.23, + "learning_rate": 1.3300029466383972e-06, + "loss": 0.6821, + "step": 48126 + }, + { + "epoch": 1.23, + "learning_rate": 1.3299768261597114e-06, + "loss": 0.5786, + "step": 48127 + }, + { + "epoch": 1.23, + "learning_rate": 1.3299507054283776e-06, + "loss": 0.5952, + "step": 48128 + }, + { + "epoch": 1.23, + "learning_rate": 1.329924584444416e-06, + "loss": 0.752, + "step": 48129 + }, + { + "epoch": 1.23, + "learning_rate": 1.3298984632078458e-06, + "loss": 0.5386, + "step": 48130 + }, + { + "epoch": 1.23, + "learning_rate": 1.3298723417186879e-06, + "loss": 0.6479, + "step": 48131 + }, + { + "epoch": 1.23, + "learning_rate": 1.3298462199769615e-06, + "loss": 0.6382, + "step": 48132 + }, + { + "epoch": 1.23, + "learning_rate": 1.3298200979826875e-06, + "loss": 0.6196, + "step": 48133 + }, + { + "epoch": 1.23, + "learning_rate": 1.329793975735885e-06, + "loss": 0.6133, + "step": 48134 + }, + { + "epoch": 1.23, + "learning_rate": 1.3297678532365747e-06, + "loss": 0.7002, + "step": 48135 + }, + { + "epoch": 1.23, + "learning_rate": 1.3297417304847761e-06, + "loss": 0.7852, + "step": 48136 + }, + { + "epoch": 1.23, + "learning_rate": 1.3297156074805099e-06, + "loss": 0.6099, + "step": 48137 + }, + { + "epoch": 1.23, + "learning_rate": 1.3296894842237951e-06, + "loss": 0.6885, + "step": 48138 + }, + { + "epoch": 1.23, + "learning_rate": 1.3296633607146523e-06, + "loss": 0.6562, + "step": 48139 + }, + { + "epoch": 1.23, + "learning_rate": 1.3296372369531017e-06, + "loss": 0.6211, + "step": 48140 + }, + { + "epoch": 1.23, + "learning_rate": 1.3296111129391628e-06, + "loss": 0.6509, + "step": 48141 + }, + { + "epoch": 1.23, + "learning_rate": 1.3295849886728558e-06, + "loss": 0.6758, + "step": 48142 + }, + { + "epoch": 1.23, + "learning_rate": 1.329558864154201e-06, + "loss": 0.668, + "step": 48143 + }, + { + "epoch": 1.23, + "learning_rate": 1.329532739383218e-06, + "loss": 0.9385, + "step": 48144 + }, + { + "epoch": 1.23, + "learning_rate": 1.3295066143599267e-06, + "loss": 0.6709, + "step": 48145 + }, + { + "epoch": 1.23, + "learning_rate": 1.3294804890843475e-06, + "loss": 0.5469, + "step": 48146 + }, + { + "epoch": 1.23, + "learning_rate": 1.3294543635565e-06, + "loss": 0.7373, + "step": 48147 + }, + { + "epoch": 1.23, + "learning_rate": 1.329428237776405e-06, + "loss": 0.6929, + "step": 48148 + }, + { + "epoch": 1.23, + "learning_rate": 1.3294021117440817e-06, + "loss": 0.7236, + "step": 48149 + }, + { + "epoch": 1.23, + "learning_rate": 1.3293759854595503e-06, + "loss": 0.6504, + "step": 48150 + }, + { + "epoch": 1.23, + "learning_rate": 1.3293498589228307e-06, + "loss": 0.7764, + "step": 48151 + }, + { + "epoch": 1.23, + "learning_rate": 1.3293237321339433e-06, + "loss": 0.573, + "step": 48152 + }, + { + "epoch": 1.23, + "learning_rate": 1.3292976050929077e-06, + "loss": 0.6416, + "step": 48153 + }, + { + "epoch": 1.23, + "learning_rate": 1.3292714777997443e-06, + "loss": 0.5337, + "step": 48154 + }, + { + "epoch": 1.23, + "learning_rate": 1.3292453502544725e-06, + "loss": 0.5669, + "step": 48155 + }, + { + "epoch": 1.23, + "learning_rate": 1.329219222457113e-06, + "loss": 0.9121, + "step": 48156 + }, + { + "epoch": 1.23, + "learning_rate": 1.3291930944076853e-06, + "loss": 0.7354, + "step": 48157 + }, + { + "epoch": 1.23, + "learning_rate": 1.3291669661062094e-06, + "loss": 0.6602, + "step": 48158 + }, + { + "epoch": 1.23, + "learning_rate": 1.329140837552706e-06, + "loss": 0.5757, + "step": 48159 + }, + { + "epoch": 1.23, + "learning_rate": 1.3291147087471943e-06, + "loss": 0.5754, + "step": 48160 + }, + { + "epoch": 1.23, + "learning_rate": 1.3290885796896945e-06, + "loss": 0.6436, + "step": 48161 + }, + { + "epoch": 1.23, + "learning_rate": 1.3290624503802268e-06, + "loss": 0.6055, + "step": 48162 + }, + { + "epoch": 1.23, + "learning_rate": 1.329036320818811e-06, + "loss": 0.7207, + "step": 48163 + }, + { + "epoch": 1.23, + "learning_rate": 1.3290101910054677e-06, + "loss": 0.6611, + "step": 48164 + }, + { + "epoch": 1.23, + "learning_rate": 1.328984060940216e-06, + "loss": 0.8027, + "step": 48165 + }, + { + "epoch": 1.23, + "learning_rate": 1.3289579306230763e-06, + "loss": 0.9043, + "step": 48166 + }, + { + "epoch": 1.23, + "learning_rate": 1.3289318000540687e-06, + "loss": 0.7578, + "step": 48167 + }, + { + "epoch": 1.23, + "learning_rate": 1.328905669233213e-06, + "loss": 0.5898, + "step": 48168 + }, + { + "epoch": 1.23, + "learning_rate": 1.32887953816053e-06, + "loss": 0.6445, + "step": 48169 + }, + { + "epoch": 1.23, + "learning_rate": 1.3288534068360383e-06, + "loss": 0.6523, + "step": 48170 + }, + { + "epoch": 1.23, + "learning_rate": 1.3288272752597592e-06, + "loss": 0.6279, + "step": 48171 + }, + { + "epoch": 1.23, + "learning_rate": 1.3288011434317116e-06, + "loss": 0.5586, + "step": 48172 + }, + { + "epoch": 1.23, + "learning_rate": 1.3287750113519168e-06, + "loss": 0.7559, + "step": 48173 + }, + { + "epoch": 1.23, + "learning_rate": 1.3287488790203936e-06, + "loss": 0.6582, + "step": 48174 + }, + { + "epoch": 1.23, + "learning_rate": 1.3287227464371626e-06, + "loss": 0.5737, + "step": 48175 + }, + { + "epoch": 1.23, + "learning_rate": 1.3286966136022438e-06, + "loss": 0.5557, + "step": 48176 + }, + { + "epoch": 1.23, + "learning_rate": 1.328670480515657e-06, + "loss": 0.6484, + "step": 48177 + }, + { + "epoch": 1.23, + "learning_rate": 1.3286443471774222e-06, + "loss": 0.5081, + "step": 48178 + }, + { + "epoch": 1.23, + "learning_rate": 1.32861821358756e-06, + "loss": 0.7275, + "step": 48179 + }, + { + "epoch": 1.23, + "learning_rate": 1.3285920797460897e-06, + "loss": 0.5913, + "step": 48180 + }, + { + "epoch": 1.23, + "learning_rate": 1.3285659456530314e-06, + "loss": 0.4437, + "step": 48181 + }, + { + "epoch": 1.23, + "learning_rate": 1.3285398113084053e-06, + "loss": 0.4731, + "step": 48182 + }, + { + "epoch": 1.23, + "learning_rate": 1.3285136767122316e-06, + "loss": 0.5879, + "step": 48183 + }, + { + "epoch": 1.23, + "learning_rate": 1.3284875418645298e-06, + "loss": 0.6123, + "step": 48184 + }, + { + "epoch": 1.24, + "learning_rate": 1.3284614067653204e-06, + "loss": 0.4252, + "step": 48185 + }, + { + "epoch": 1.24, + "learning_rate": 1.328435271414623e-06, + "loss": 0.6641, + "step": 48186 + }, + { + "epoch": 1.24, + "learning_rate": 1.328409135812458e-06, + "loss": 0.6045, + "step": 48187 + }, + { + "epoch": 1.24, + "learning_rate": 1.328382999958845e-06, + "loss": 0.4954, + "step": 48188 + }, + { + "epoch": 1.24, + "learning_rate": 1.3283568638538045e-06, + "loss": 0.5015, + "step": 48189 + }, + { + "epoch": 1.24, + "learning_rate": 1.3283307274973564e-06, + "loss": 0.5273, + "step": 48190 + }, + { + "epoch": 1.24, + "learning_rate": 1.32830459088952e-06, + "loss": 0.6113, + "step": 48191 + }, + { + "epoch": 1.24, + "learning_rate": 1.3282784540303162e-06, + "loss": 0.7637, + "step": 48192 + }, + { + "epoch": 1.24, + "learning_rate": 1.3282523169197646e-06, + "loss": 0.6875, + "step": 48193 + }, + { + "epoch": 1.24, + "learning_rate": 1.3282261795578858e-06, + "loss": 0.6436, + "step": 48194 + }, + { + "epoch": 1.24, + "learning_rate": 1.3282000419446987e-06, + "loss": 0.7827, + "step": 48195 + }, + { + "epoch": 1.24, + "learning_rate": 1.328173904080224e-06, + "loss": 0.5181, + "step": 48196 + }, + { + "epoch": 1.24, + "learning_rate": 1.3281477659644815e-06, + "loss": 0.8447, + "step": 48197 + }, + { + "epoch": 1.24, + "learning_rate": 1.3281216275974916e-06, + "loss": 0.7158, + "step": 48198 + }, + { + "epoch": 1.24, + "learning_rate": 1.3280954889792743e-06, + "loss": 0.4353, + "step": 48199 + }, + { + "epoch": 1.24, + "learning_rate": 1.328069350109849e-06, + "loss": 0.6104, + "step": 48200 + }, + { + "epoch": 1.24, + "learning_rate": 1.328043210989236e-06, + "loss": 0.6245, + "step": 48201 + }, + { + "epoch": 1.24, + "learning_rate": 1.3280170716174557e-06, + "loss": 0.7559, + "step": 48202 + }, + { + "epoch": 1.24, + "learning_rate": 1.3279909319945275e-06, + "loss": 0.626, + "step": 48203 + }, + { + "epoch": 1.24, + "learning_rate": 1.3279647921204722e-06, + "loss": 0.5037, + "step": 48204 + }, + { + "epoch": 1.24, + "learning_rate": 1.3279386519953088e-06, + "loss": 0.7402, + "step": 48205 + }, + { + "epoch": 1.24, + "learning_rate": 1.3279125116190583e-06, + "loss": 0.7773, + "step": 48206 + }, + { + "epoch": 1.24, + "learning_rate": 1.3278863709917398e-06, + "loss": 0.6421, + "step": 48207 + }, + { + "epoch": 1.24, + "learning_rate": 1.327860230113374e-06, + "loss": 0.6489, + "step": 48208 + }, + { + "epoch": 1.24, + "learning_rate": 1.327834088983981e-06, + "loss": 0.441, + "step": 48209 + }, + { + "epoch": 1.24, + "learning_rate": 1.32780794760358e-06, + "loss": 0.6885, + "step": 48210 + }, + { + "epoch": 1.24, + "learning_rate": 1.327781805972192e-06, + "loss": 0.5615, + "step": 48211 + }, + { + "epoch": 1.24, + "learning_rate": 1.3277556640898362e-06, + "loss": 0.5322, + "step": 48212 + }, + { + "epoch": 1.24, + "learning_rate": 1.327729521956533e-06, + "loss": 0.5513, + "step": 48213 + }, + { + "epoch": 1.24, + "learning_rate": 1.3277033795723026e-06, + "loss": 0.6296, + "step": 48214 + }, + { + "epoch": 1.24, + "learning_rate": 1.3276772369371647e-06, + "loss": 0.6758, + "step": 48215 + }, + { + "epoch": 1.24, + "learning_rate": 1.3276510940511392e-06, + "loss": 0.7109, + "step": 48216 + }, + { + "epoch": 1.24, + "learning_rate": 1.3276249509142466e-06, + "loss": 0.7412, + "step": 48217 + }, + { + "epoch": 1.24, + "learning_rate": 1.3275988075265064e-06, + "loss": 0.6582, + "step": 48218 + }, + { + "epoch": 1.24, + "learning_rate": 1.3275726638879392e-06, + "loss": 0.5535, + "step": 48219 + }, + { + "epoch": 1.24, + "learning_rate": 1.3275465199985643e-06, + "loss": 0.7275, + "step": 48220 + }, + { + "epoch": 1.24, + "learning_rate": 1.3275203758584024e-06, + "loss": 0.7178, + "step": 48221 + }, + { + "epoch": 1.24, + "learning_rate": 1.327494231467473e-06, + "loss": 0.5657, + "step": 48222 + }, + { + "epoch": 1.24, + "learning_rate": 1.3274680868257962e-06, + "loss": 0.7383, + "step": 48223 + }, + { + "epoch": 1.24, + "learning_rate": 1.3274419419333924e-06, + "loss": 0.7268, + "step": 48224 + }, + { + "epoch": 1.24, + "learning_rate": 1.3274157967902812e-06, + "loss": 0.543, + "step": 48225 + }, + { + "epoch": 1.24, + "learning_rate": 1.3273896513964828e-06, + "loss": 0.6401, + "step": 48226 + }, + { + "epoch": 1.24, + "learning_rate": 1.3273635057520173e-06, + "loss": 0.6821, + "step": 48227 + }, + { + "epoch": 1.24, + "learning_rate": 1.3273373598569043e-06, + "loss": 0.8086, + "step": 48228 + }, + { + "epoch": 1.24, + "learning_rate": 1.3273112137111645e-06, + "loss": 0.481, + "step": 48229 + }, + { + "epoch": 1.24, + "learning_rate": 1.3272850673148177e-06, + "loss": 0.6294, + "step": 48230 + }, + { + "epoch": 1.24, + "learning_rate": 1.3272589206678832e-06, + "loss": 0.7085, + "step": 48231 + }, + { + "epoch": 1.24, + "learning_rate": 1.3272327737703821e-06, + "loss": 0.8604, + "step": 48232 + }, + { + "epoch": 1.24, + "learning_rate": 1.3272066266223338e-06, + "loss": 0.5605, + "step": 48233 + }, + { + "epoch": 1.24, + "learning_rate": 1.3271804792237584e-06, + "loss": 0.627, + "step": 48234 + }, + { + "epoch": 1.24, + "learning_rate": 1.3271543315746759e-06, + "loss": 0.5566, + "step": 48235 + }, + { + "epoch": 1.24, + "learning_rate": 1.3271281836751062e-06, + "loss": 0.606, + "step": 48236 + }, + { + "epoch": 1.24, + "learning_rate": 1.3271020355250696e-06, + "loss": 0.5962, + "step": 48237 + }, + { + "epoch": 1.24, + "learning_rate": 1.3270758871245861e-06, + "loss": 0.6948, + "step": 48238 + }, + { + "epoch": 1.24, + "learning_rate": 1.3270497384736758e-06, + "loss": 0.6426, + "step": 48239 + }, + { + "epoch": 1.24, + "learning_rate": 1.3270235895723585e-06, + "loss": 0.6011, + "step": 48240 + }, + { + "epoch": 1.24, + "learning_rate": 1.3269974404206541e-06, + "loss": 0.6484, + "step": 48241 + }, + { + "epoch": 1.24, + "learning_rate": 1.326971291018583e-06, + "loss": 0.7314, + "step": 48242 + }, + { + "epoch": 1.24, + "learning_rate": 1.3269451413661646e-06, + "loss": 0.5327, + "step": 48243 + }, + { + "epoch": 1.24, + "learning_rate": 1.3269189914634197e-06, + "loss": 0.5972, + "step": 48244 + }, + { + "epoch": 1.24, + "learning_rate": 1.326892841310368e-06, + "loss": 0.6768, + "step": 48245 + }, + { + "epoch": 1.24, + "learning_rate": 1.3268666909070292e-06, + "loss": 0.5625, + "step": 48246 + }, + { + "epoch": 1.24, + "learning_rate": 1.3268405402534236e-06, + "loss": 0.561, + "step": 48247 + }, + { + "epoch": 1.24, + "learning_rate": 1.3268143893495713e-06, + "loss": 0.6328, + "step": 48248 + }, + { + "epoch": 1.24, + "learning_rate": 1.3267882381954927e-06, + "loss": 0.7422, + "step": 48249 + }, + { + "epoch": 1.24, + "learning_rate": 1.326762086791207e-06, + "loss": 0.4951, + "step": 48250 + }, + { + "epoch": 1.24, + "learning_rate": 1.3267359351367344e-06, + "loss": 0.5393, + "step": 48251 + }, + { + "epoch": 1.24, + "learning_rate": 1.3267097832320952e-06, + "loss": 0.4546, + "step": 48252 + }, + { + "epoch": 1.24, + "learning_rate": 1.3266836310773095e-06, + "loss": 0.7686, + "step": 48253 + }, + { + "epoch": 1.24, + "learning_rate": 1.3266574786723973e-06, + "loss": 0.3999, + "step": 48254 + }, + { + "epoch": 1.24, + "learning_rate": 1.3266313260173782e-06, + "loss": 0.665, + "step": 48255 + }, + { + "epoch": 1.24, + "learning_rate": 1.3266051731122725e-06, + "loss": 0.6357, + "step": 48256 + }, + { + "epoch": 1.24, + "learning_rate": 1.3265790199571006e-06, + "loss": 0.6616, + "step": 48257 + }, + { + "epoch": 1.24, + "learning_rate": 1.3265528665518816e-06, + "loss": 0.8867, + "step": 48258 + }, + { + "epoch": 1.24, + "learning_rate": 1.3265267128966367e-06, + "loss": 0.4722, + "step": 48259 + }, + { + "epoch": 1.24, + "learning_rate": 1.326500558991385e-06, + "loss": 0.5122, + "step": 48260 + }, + { + "epoch": 1.24, + "learning_rate": 1.3264744048361467e-06, + "loss": 0.7158, + "step": 48261 + }, + { + "epoch": 1.24, + "learning_rate": 1.326448250430942e-06, + "loss": 0.6514, + "step": 48262 + }, + { + "epoch": 1.24, + "learning_rate": 1.326422095775791e-06, + "loss": 0.6484, + "step": 48263 + }, + { + "epoch": 1.24, + "learning_rate": 1.3263959408707137e-06, + "loss": 0.5796, + "step": 48264 + }, + { + "epoch": 1.24, + "learning_rate": 1.32636978571573e-06, + "loss": 0.6221, + "step": 48265 + }, + { + "epoch": 1.24, + "learning_rate": 1.32634363031086e-06, + "loss": 0.5092, + "step": 48266 + }, + { + "epoch": 1.24, + "learning_rate": 1.3263174746561233e-06, + "loss": 0.592, + "step": 48267 + }, + { + "epoch": 1.24, + "learning_rate": 1.3262913187515405e-06, + "loss": 0.8154, + "step": 48268 + }, + { + "epoch": 1.24, + "learning_rate": 1.326265162597132e-06, + "loss": 0.6426, + "step": 48269 + }, + { + "epoch": 1.24, + "learning_rate": 1.3262390061929166e-06, + "loss": 0.5088, + "step": 48270 + }, + { + "epoch": 1.24, + "learning_rate": 1.3262128495389154e-06, + "loss": 0.7793, + "step": 48271 + }, + { + "epoch": 1.24, + "learning_rate": 1.3261866926351476e-06, + "loss": 0.7681, + "step": 48272 + }, + { + "epoch": 1.24, + "learning_rate": 1.326160535481634e-06, + "loss": 0.7529, + "step": 48273 + }, + { + "epoch": 1.24, + "learning_rate": 1.326134378078394e-06, + "loss": 0.5874, + "step": 48274 + }, + { + "epoch": 1.24, + "learning_rate": 1.3261082204254482e-06, + "loss": 0.6489, + "step": 48275 + }, + { + "epoch": 1.24, + "learning_rate": 1.326082062522816e-06, + "loss": 0.8223, + "step": 48276 + }, + { + "epoch": 1.24, + "learning_rate": 1.3260559043705183e-06, + "loss": 0.7295, + "step": 48277 + }, + { + "epoch": 1.24, + "learning_rate": 1.3260297459685738e-06, + "loss": 0.6953, + "step": 48278 + }, + { + "epoch": 1.24, + "learning_rate": 1.3260035873170039e-06, + "loss": 0.7393, + "step": 48279 + }, + { + "epoch": 1.24, + "learning_rate": 1.325977428415828e-06, + "loss": 0.7432, + "step": 48280 + }, + { + "epoch": 1.24, + "learning_rate": 1.3259512692650659e-06, + "loss": 0.6699, + "step": 48281 + }, + { + "epoch": 1.24, + "learning_rate": 1.3259251098647378e-06, + "loss": 0.6992, + "step": 48282 + }, + { + "epoch": 1.24, + "learning_rate": 1.3258989502148642e-06, + "loss": 0.6611, + "step": 48283 + }, + { + "epoch": 1.24, + "learning_rate": 1.325872790315465e-06, + "loss": 0.6631, + "step": 48284 + }, + { + "epoch": 1.24, + "learning_rate": 1.3258466301665593e-06, + "loss": 0.4667, + "step": 48285 + }, + { + "epoch": 1.24, + "learning_rate": 1.3258204697681684e-06, + "loss": 0.7104, + "step": 48286 + }, + { + "epoch": 1.24, + "learning_rate": 1.3257943091203112e-06, + "loss": 0.8486, + "step": 48287 + }, + { + "epoch": 1.24, + "learning_rate": 1.3257681482230087e-06, + "loss": 0.623, + "step": 48288 + }, + { + "epoch": 1.24, + "learning_rate": 1.3257419870762804e-06, + "loss": 0.4692, + "step": 48289 + }, + { + "epoch": 1.24, + "learning_rate": 1.3257158256801467e-06, + "loss": 0.7573, + "step": 48290 + }, + { + "epoch": 1.24, + "learning_rate": 1.325689664034627e-06, + "loss": 0.707, + "step": 48291 + }, + { + "epoch": 1.24, + "learning_rate": 1.3256635021397418e-06, + "loss": 0.6104, + "step": 48292 + }, + { + "epoch": 1.24, + "learning_rate": 1.3256373399955107e-06, + "loss": 0.5054, + "step": 48293 + }, + { + "epoch": 1.24, + "learning_rate": 1.3256111776019548e-06, + "loss": 0.5364, + "step": 48294 + }, + { + "epoch": 1.24, + "learning_rate": 1.3255850149590928e-06, + "loss": 0.4692, + "step": 48295 + }, + { + "epoch": 1.24, + "learning_rate": 1.3255588520669453e-06, + "loss": 0.6807, + "step": 48296 + }, + { + "epoch": 1.24, + "learning_rate": 1.3255326889255324e-06, + "loss": 0.6299, + "step": 48297 + }, + { + "epoch": 1.24, + "learning_rate": 1.3255065255348745e-06, + "loss": 0.8086, + "step": 48298 + }, + { + "epoch": 1.24, + "learning_rate": 1.325480361894991e-06, + "loss": 0.6675, + "step": 48299 + }, + { + "epoch": 1.24, + "learning_rate": 1.325454198005902e-06, + "loss": 0.5801, + "step": 48300 + }, + { + "epoch": 1.24, + "learning_rate": 1.325428033867628e-06, + "loss": 0.4958, + "step": 48301 + }, + { + "epoch": 1.24, + "learning_rate": 1.3254018694801882e-06, + "loss": 0.6426, + "step": 48302 + }, + { + "epoch": 1.24, + "learning_rate": 1.3253757048436035e-06, + "loss": 0.6621, + "step": 48303 + }, + { + "epoch": 1.24, + "learning_rate": 1.3253495399578937e-06, + "loss": 0.6367, + "step": 48304 + }, + { + "epoch": 1.24, + "learning_rate": 1.3253233748230788e-06, + "loss": 0.8623, + "step": 48305 + }, + { + "epoch": 1.24, + "learning_rate": 1.3252972094391783e-06, + "loss": 0.5547, + "step": 48306 + }, + { + "epoch": 1.24, + "learning_rate": 1.3252710438062129e-06, + "loss": 0.4512, + "step": 48307 + }, + { + "epoch": 1.24, + "learning_rate": 1.3252448779242026e-06, + "loss": 0.6621, + "step": 48308 + }, + { + "epoch": 1.24, + "learning_rate": 1.325218711793167e-06, + "loss": 0.6719, + "step": 48309 + }, + { + "epoch": 1.24, + "learning_rate": 1.3251925454131265e-06, + "loss": 0.5635, + "step": 48310 + }, + { + "epoch": 1.24, + "learning_rate": 1.325166378784101e-06, + "loss": 0.4644, + "step": 48311 + }, + { + "epoch": 1.24, + "learning_rate": 1.3251402119061104e-06, + "loss": 0.5212, + "step": 48312 + }, + { + "epoch": 1.24, + "learning_rate": 1.3251140447791754e-06, + "loss": 0.7178, + "step": 48313 + }, + { + "epoch": 1.24, + "learning_rate": 1.325087877403315e-06, + "loss": 0.6001, + "step": 48314 + }, + { + "epoch": 1.24, + "learning_rate": 1.3250617097785498e-06, + "loss": 0.5017, + "step": 48315 + }, + { + "epoch": 1.24, + "learning_rate": 1.3250355419049e-06, + "loss": 0.6875, + "step": 48316 + }, + { + "epoch": 1.24, + "learning_rate": 1.3250093737823853e-06, + "loss": 0.6992, + "step": 48317 + }, + { + "epoch": 1.24, + "learning_rate": 1.3249832054110259e-06, + "loss": 0.7754, + "step": 48318 + }, + { + "epoch": 1.24, + "learning_rate": 1.3249570367908419e-06, + "loss": 0.6719, + "step": 48319 + }, + { + "epoch": 1.24, + "learning_rate": 1.3249308679218531e-06, + "loss": 0.6343, + "step": 48320 + }, + { + "epoch": 1.24, + "learning_rate": 1.3249046988040796e-06, + "loss": 0.5771, + "step": 48321 + }, + { + "epoch": 1.24, + "learning_rate": 1.3248785294375418e-06, + "loss": 0.8311, + "step": 48322 + }, + { + "epoch": 1.24, + "learning_rate": 1.3248523598222592e-06, + "loss": 0.7983, + "step": 48323 + }, + { + "epoch": 1.24, + "learning_rate": 1.3248261899582522e-06, + "loss": 0.606, + "step": 48324 + }, + { + "epoch": 1.24, + "learning_rate": 1.3248000198455407e-06, + "loss": 0.7227, + "step": 48325 + }, + { + "epoch": 1.24, + "learning_rate": 1.3247738494841447e-06, + "loss": 0.6416, + "step": 48326 + }, + { + "epoch": 1.24, + "learning_rate": 1.3247476788740844e-06, + "loss": 0.7231, + "step": 48327 + }, + { + "epoch": 1.24, + "learning_rate": 1.3247215080153797e-06, + "loss": 0.6211, + "step": 48328 + }, + { + "epoch": 1.24, + "learning_rate": 1.3246953369080507e-06, + "loss": 0.4946, + "step": 48329 + }, + { + "epoch": 1.24, + "learning_rate": 1.3246691655521173e-06, + "loss": 0.5518, + "step": 48330 + }, + { + "epoch": 1.24, + "learning_rate": 1.3246429939475997e-06, + "loss": 0.708, + "step": 48331 + }, + { + "epoch": 1.24, + "learning_rate": 1.3246168220945179e-06, + "loss": 0.7256, + "step": 48332 + }, + { + "epoch": 1.24, + "learning_rate": 1.324590649992892e-06, + "loss": 0.3894, + "step": 48333 + }, + { + "epoch": 1.24, + "learning_rate": 1.3245644776427421e-06, + "loss": 0.5703, + "step": 48334 + }, + { + "epoch": 1.24, + "learning_rate": 1.3245383050440878e-06, + "loss": 0.5269, + "step": 48335 + }, + { + "epoch": 1.24, + "learning_rate": 1.3245121321969495e-06, + "loss": 0.5371, + "step": 48336 + }, + { + "epoch": 1.24, + "learning_rate": 1.324485959101347e-06, + "loss": 0.4856, + "step": 48337 + }, + { + "epoch": 1.24, + "learning_rate": 1.324459785757301e-06, + "loss": 0.708, + "step": 48338 + }, + { + "epoch": 1.24, + "learning_rate": 1.3244336121648306e-06, + "loss": 0.542, + "step": 48339 + }, + { + "epoch": 1.24, + "learning_rate": 1.3244074383239567e-06, + "loss": 0.7168, + "step": 48340 + }, + { + "epoch": 1.24, + "learning_rate": 1.3243812642346988e-06, + "loss": 0.6709, + "step": 48341 + }, + { + "epoch": 1.24, + "learning_rate": 1.324355089897077e-06, + "loss": 0.6382, + "step": 48342 + }, + { + "epoch": 1.24, + "learning_rate": 1.3243289153111115e-06, + "loss": 0.6455, + "step": 48343 + }, + { + "epoch": 1.24, + "learning_rate": 1.324302740476822e-06, + "loss": 0.6958, + "step": 48344 + }, + { + "epoch": 1.24, + "learning_rate": 1.3242765653942292e-06, + "loss": 0.4833, + "step": 48345 + }, + { + "epoch": 1.24, + "learning_rate": 1.3242503900633523e-06, + "loss": 0.666, + "step": 48346 + }, + { + "epoch": 1.24, + "learning_rate": 1.3242242144842122e-06, + "loss": 0.6011, + "step": 48347 + }, + { + "epoch": 1.24, + "learning_rate": 1.3241980386568284e-06, + "loss": 0.5591, + "step": 48348 + }, + { + "epoch": 1.24, + "learning_rate": 1.324171862581221e-06, + "loss": 0.606, + "step": 48349 + }, + { + "epoch": 1.24, + "learning_rate": 1.32414568625741e-06, + "loss": 0.6694, + "step": 48350 + }, + { + "epoch": 1.24, + "learning_rate": 1.3241195096854158e-06, + "loss": 0.6968, + "step": 48351 + }, + { + "epoch": 1.24, + "learning_rate": 1.3240933328652578e-06, + "loss": 0.5645, + "step": 48352 + }, + { + "epoch": 1.24, + "learning_rate": 1.3240671557969573e-06, + "loss": 0.4745, + "step": 48353 + }, + { + "epoch": 1.24, + "learning_rate": 1.3240409784805327e-06, + "loss": 0.6875, + "step": 48354 + }, + { + "epoch": 1.24, + "learning_rate": 1.324014800916005e-06, + "loss": 0.6455, + "step": 48355 + }, + { + "epoch": 1.24, + "learning_rate": 1.323988623103394e-06, + "loss": 0.4712, + "step": 48356 + }, + { + "epoch": 1.24, + "learning_rate": 1.32396244504272e-06, + "loss": 0.5073, + "step": 48357 + }, + { + "epoch": 1.24, + "learning_rate": 1.323936266734003e-06, + "loss": 0.7178, + "step": 48358 + }, + { + "epoch": 1.24, + "learning_rate": 1.3239100881772627e-06, + "loss": 0.7314, + "step": 48359 + }, + { + "epoch": 1.24, + "learning_rate": 1.323883909372519e-06, + "loss": 0.647, + "step": 48360 + }, + { + "epoch": 1.24, + "learning_rate": 1.323857730319793e-06, + "loss": 0.5396, + "step": 48361 + }, + { + "epoch": 1.24, + "learning_rate": 1.3238315510191033e-06, + "loss": 0.8525, + "step": 48362 + }, + { + "epoch": 1.24, + "learning_rate": 1.323805371470471e-06, + "loss": 0.472, + "step": 48363 + }, + { + "epoch": 1.24, + "learning_rate": 1.3237791916739159e-06, + "loss": 0.6597, + "step": 48364 + }, + { + "epoch": 1.24, + "learning_rate": 1.3237530116294578e-06, + "loss": 0.6396, + "step": 48365 + }, + { + "epoch": 1.24, + "learning_rate": 1.323726831337117e-06, + "loss": 0.7256, + "step": 48366 + }, + { + "epoch": 1.24, + "learning_rate": 1.3237006507969133e-06, + "loss": 0.5425, + "step": 48367 + }, + { + "epoch": 1.24, + "learning_rate": 1.3236744700088674e-06, + "loss": 0.7246, + "step": 48368 + }, + { + "epoch": 1.24, + "learning_rate": 1.3236482889729981e-06, + "loss": 0.5762, + "step": 48369 + }, + { + "epoch": 1.24, + "learning_rate": 1.3236221076893266e-06, + "loss": 0.6768, + "step": 48370 + }, + { + "epoch": 1.24, + "learning_rate": 1.3235959261578725e-06, + "loss": 0.5464, + "step": 48371 + }, + { + "epoch": 1.24, + "learning_rate": 1.3235697443786558e-06, + "loss": 0.5959, + "step": 48372 + }, + { + "epoch": 1.24, + "learning_rate": 1.3235435623516967e-06, + "loss": 0.7119, + "step": 48373 + }, + { + "epoch": 1.24, + "learning_rate": 1.3235173800770153e-06, + "loss": 0.479, + "step": 48374 + }, + { + "epoch": 1.24, + "learning_rate": 1.3234911975546313e-06, + "loss": 0.665, + "step": 48375 + }, + { + "epoch": 1.24, + "learning_rate": 1.323465014784565e-06, + "loss": 0.7578, + "step": 48376 + }, + { + "epoch": 1.24, + "learning_rate": 1.3234388317668361e-06, + "loss": 0.7017, + "step": 48377 + }, + { + "epoch": 1.24, + "learning_rate": 1.3234126485014656e-06, + "loss": 0.6294, + "step": 48378 + }, + { + "epoch": 1.24, + "learning_rate": 1.3233864649884728e-06, + "loss": 0.4189, + "step": 48379 + }, + { + "epoch": 1.24, + "learning_rate": 1.3233602812278774e-06, + "loss": 0.5696, + "step": 48380 + }, + { + "epoch": 1.24, + "learning_rate": 1.3233340972197002e-06, + "loss": 0.5552, + "step": 48381 + }, + { + "epoch": 1.24, + "learning_rate": 1.323307912963961e-06, + "loss": 0.6228, + "step": 48382 + }, + { + "epoch": 1.24, + "learning_rate": 1.3232817284606797e-06, + "loss": 0.7559, + "step": 48383 + }, + { + "epoch": 1.24, + "learning_rate": 1.3232555437098764e-06, + "loss": 0.7529, + "step": 48384 + }, + { + "epoch": 1.24, + "learning_rate": 1.3232293587115713e-06, + "loss": 0.7881, + "step": 48385 + }, + { + "epoch": 1.24, + "learning_rate": 1.3232031734657843e-06, + "loss": 0.7158, + "step": 48386 + }, + { + "epoch": 1.24, + "learning_rate": 1.3231769879725354e-06, + "loss": 0.6504, + "step": 48387 + }, + { + "epoch": 1.24, + "learning_rate": 1.323150802231845e-06, + "loss": 0.7197, + "step": 48388 + }, + { + "epoch": 1.24, + "learning_rate": 1.3231246162437327e-06, + "loss": 0.6021, + "step": 48389 + }, + { + "epoch": 1.24, + "learning_rate": 1.3230984300082187e-06, + "loss": 0.5129, + "step": 48390 + }, + { + "epoch": 1.24, + "learning_rate": 1.323072243525323e-06, + "loss": 0.6787, + "step": 48391 + }, + { + "epoch": 1.24, + "learning_rate": 1.3230460567950656e-06, + "loss": 0.6357, + "step": 48392 + }, + { + "epoch": 1.24, + "learning_rate": 1.3230198698174673e-06, + "loss": 0.6416, + "step": 48393 + }, + { + "epoch": 1.24, + "learning_rate": 1.3229936825925472e-06, + "loss": 0.5806, + "step": 48394 + }, + { + "epoch": 1.24, + "learning_rate": 1.3229674951203257e-06, + "loss": 0.7246, + "step": 48395 + }, + { + "epoch": 1.24, + "learning_rate": 1.3229413074008227e-06, + "loss": 0.6162, + "step": 48396 + }, + { + "epoch": 1.24, + "learning_rate": 1.3229151194340586e-06, + "loss": 0.6438, + "step": 48397 + }, + { + "epoch": 1.24, + "learning_rate": 1.3228889312200533e-06, + "loss": 0.6904, + "step": 48398 + }, + { + "epoch": 1.24, + "learning_rate": 1.3228627427588266e-06, + "loss": 0.6318, + "step": 48399 + }, + { + "epoch": 1.24, + "learning_rate": 1.3228365540503988e-06, + "loss": 0.5708, + "step": 48400 + }, + { + "epoch": 1.24, + "learning_rate": 1.3228103650947898e-06, + "loss": 0.5649, + "step": 48401 + }, + { + "epoch": 1.24, + "learning_rate": 1.3227841758920197e-06, + "loss": 0.7754, + "step": 48402 + }, + { + "epoch": 1.24, + "learning_rate": 1.322757986442109e-06, + "loss": 0.7695, + "step": 48403 + }, + { + "epoch": 1.24, + "learning_rate": 1.322731796745077e-06, + "loss": 0.5765, + "step": 48404 + }, + { + "epoch": 1.24, + "learning_rate": 1.3227056068009443e-06, + "loss": 0.5244, + "step": 48405 + }, + { + "epoch": 1.24, + "learning_rate": 1.3226794166097307e-06, + "loss": 0.6885, + "step": 48406 + }, + { + "epoch": 1.24, + "learning_rate": 1.322653226171456e-06, + "loss": 0.708, + "step": 48407 + }, + { + "epoch": 1.24, + "learning_rate": 1.322627035486141e-06, + "loss": 0.5552, + "step": 48408 + }, + { + "epoch": 1.24, + "learning_rate": 1.3226008445538051e-06, + "loss": 0.6787, + "step": 48409 + }, + { + "epoch": 1.24, + "learning_rate": 1.3225746533744685e-06, + "loss": 0.6504, + "step": 48410 + }, + { + "epoch": 1.24, + "learning_rate": 1.3225484619481513e-06, + "loss": 0.6533, + "step": 48411 + }, + { + "epoch": 1.24, + "learning_rate": 1.3225222702748738e-06, + "loss": 0.7085, + "step": 48412 + }, + { + "epoch": 1.24, + "learning_rate": 1.3224960783546557e-06, + "loss": 0.5872, + "step": 48413 + }, + { + "epoch": 1.24, + "learning_rate": 1.3224698861875175e-06, + "loss": 0.5591, + "step": 48414 + }, + { + "epoch": 1.24, + "learning_rate": 1.3224436937734783e-06, + "loss": 0.6484, + "step": 48415 + }, + { + "epoch": 1.24, + "learning_rate": 1.3224175011125593e-06, + "loss": 0.6035, + "step": 48416 + }, + { + "epoch": 1.24, + "learning_rate": 1.3223913082047798e-06, + "loss": 0.6768, + "step": 48417 + }, + { + "epoch": 1.24, + "learning_rate": 1.3223651150501605e-06, + "loss": 0.7158, + "step": 48418 + }, + { + "epoch": 1.24, + "learning_rate": 1.3223389216487204e-06, + "loss": 0.5535, + "step": 48419 + }, + { + "epoch": 1.24, + "learning_rate": 1.3223127280004807e-06, + "loss": 0.7656, + "step": 48420 + }, + { + "epoch": 1.24, + "learning_rate": 1.3222865341054606e-06, + "loss": 0.7832, + "step": 48421 + }, + { + "epoch": 1.24, + "learning_rate": 1.3222603399636807e-06, + "loss": 0.7324, + "step": 48422 + }, + { + "epoch": 1.24, + "learning_rate": 1.322234145575161e-06, + "loss": 0.5796, + "step": 48423 + }, + { + "epoch": 1.24, + "learning_rate": 1.3222079509399216e-06, + "loss": 0.6982, + "step": 48424 + }, + { + "epoch": 1.24, + "learning_rate": 1.3221817560579819e-06, + "loss": 0.7686, + "step": 48425 + }, + { + "epoch": 1.24, + "learning_rate": 1.3221555609293626e-06, + "loss": 0.5298, + "step": 48426 + }, + { + "epoch": 1.24, + "learning_rate": 1.3221293655540836e-06, + "loss": 0.6533, + "step": 48427 + }, + { + "epoch": 1.24, + "learning_rate": 1.322103169932165e-06, + "loss": 0.6548, + "step": 48428 + }, + { + "epoch": 1.24, + "learning_rate": 1.322076974063627e-06, + "loss": 0.6714, + "step": 48429 + }, + { + "epoch": 1.24, + "learning_rate": 1.3220507779484894e-06, + "loss": 0.5193, + "step": 48430 + }, + { + "epoch": 1.24, + "learning_rate": 1.3220245815867718e-06, + "loss": 0.6294, + "step": 48431 + }, + { + "epoch": 1.24, + "learning_rate": 1.3219983849784955e-06, + "loss": 0.6465, + "step": 48432 + }, + { + "epoch": 1.24, + "learning_rate": 1.3219721881236796e-06, + "loss": 0.6445, + "step": 48433 + }, + { + "epoch": 1.24, + "learning_rate": 1.321945991022344e-06, + "loss": 0.5669, + "step": 48434 + }, + { + "epoch": 1.24, + "learning_rate": 1.3219197936745096e-06, + "loss": 0.6187, + "step": 48435 + }, + { + "epoch": 1.24, + "learning_rate": 1.321893596080196e-06, + "loss": 0.6899, + "step": 48436 + }, + { + "epoch": 1.24, + "learning_rate": 1.3218673982394233e-06, + "loss": 0.5508, + "step": 48437 + }, + { + "epoch": 1.24, + "learning_rate": 1.3218412001522116e-06, + "loss": 0.6191, + "step": 48438 + }, + { + "epoch": 1.24, + "learning_rate": 1.3218150018185806e-06, + "loss": 0.835, + "step": 48439 + }, + { + "epoch": 1.24, + "learning_rate": 1.3217888032385507e-06, + "loss": 0.8096, + "step": 48440 + }, + { + "epoch": 1.24, + "learning_rate": 1.321762604412142e-06, + "loss": 0.5991, + "step": 48441 + }, + { + "epoch": 1.24, + "learning_rate": 1.3217364053393743e-06, + "loss": 0.5051, + "step": 48442 + }, + { + "epoch": 1.24, + "learning_rate": 1.3217102060202682e-06, + "loss": 0.4775, + "step": 48443 + }, + { + "epoch": 1.24, + "learning_rate": 1.3216840064548431e-06, + "loss": 0.9229, + "step": 48444 + }, + { + "epoch": 1.24, + "learning_rate": 1.3216578066431195e-06, + "loss": 0.7295, + "step": 48445 + }, + { + "epoch": 1.24, + "learning_rate": 1.321631606585117e-06, + "loss": 0.5776, + "step": 48446 + }, + { + "epoch": 1.24, + "learning_rate": 1.3216054062808563e-06, + "loss": 0.5718, + "step": 48447 + }, + { + "epoch": 1.24, + "learning_rate": 1.321579205730357e-06, + "loss": 0.7222, + "step": 48448 + }, + { + "epoch": 1.24, + "learning_rate": 1.3215530049336395e-06, + "loss": 0.3511, + "step": 48449 + }, + { + "epoch": 1.24, + "learning_rate": 1.3215268038907232e-06, + "loss": 0.5806, + "step": 48450 + }, + { + "epoch": 1.24, + "learning_rate": 1.3215006026016291e-06, + "loss": 0.5093, + "step": 48451 + }, + { + "epoch": 1.24, + "learning_rate": 1.3214744010663762e-06, + "loss": 0.4346, + "step": 48452 + }, + { + "epoch": 1.24, + "learning_rate": 1.3214481992849857e-06, + "loss": 0.5269, + "step": 48453 + }, + { + "epoch": 1.24, + "learning_rate": 1.3214219972574769e-06, + "loss": 0.6104, + "step": 48454 + }, + { + "epoch": 1.24, + "learning_rate": 1.3213957949838698e-06, + "loss": 0.6387, + "step": 48455 + }, + { + "epoch": 1.24, + "learning_rate": 1.321369592464185e-06, + "loss": 0.5781, + "step": 48456 + }, + { + "epoch": 1.24, + "learning_rate": 1.3213433896984425e-06, + "loss": 0.6064, + "step": 48457 + }, + { + "epoch": 1.24, + "learning_rate": 1.321317186686662e-06, + "loss": 0.7773, + "step": 48458 + }, + { + "epoch": 1.24, + "learning_rate": 1.3212909834288633e-06, + "loss": 0.7236, + "step": 48459 + }, + { + "epoch": 1.24, + "learning_rate": 1.3212647799250671e-06, + "loss": 0.6533, + "step": 48460 + }, + { + "epoch": 1.24, + "learning_rate": 1.3212385761752934e-06, + "loss": 0.5194, + "step": 48461 + }, + { + "epoch": 1.24, + "learning_rate": 1.3212123721795618e-06, + "loss": 0.7764, + "step": 48462 + }, + { + "epoch": 1.24, + "learning_rate": 1.3211861679378927e-06, + "loss": 0.5518, + "step": 48463 + }, + { + "epoch": 1.24, + "learning_rate": 1.3211599634503065e-06, + "loss": 0.7319, + "step": 48464 + }, + { + "epoch": 1.24, + "learning_rate": 1.3211337587168226e-06, + "loss": 0.605, + "step": 48465 + }, + { + "epoch": 1.24, + "learning_rate": 1.3211075537374613e-06, + "loss": 0.7793, + "step": 48466 + }, + { + "epoch": 1.24, + "learning_rate": 1.3210813485122428e-06, + "loss": 0.7124, + "step": 48467 + }, + { + "epoch": 1.24, + "learning_rate": 1.3210551430411871e-06, + "loss": 0.752, + "step": 48468 + }, + { + "epoch": 1.24, + "learning_rate": 1.3210289373243143e-06, + "loss": 0.7109, + "step": 48469 + }, + { + "epoch": 1.24, + "learning_rate": 1.3210027313616443e-06, + "loss": 0.7358, + "step": 48470 + }, + { + "epoch": 1.24, + "learning_rate": 1.320976525153197e-06, + "loss": 0.6245, + "step": 48471 + }, + { + "epoch": 1.24, + "learning_rate": 1.320950318698993e-06, + "loss": 0.6699, + "step": 48472 + }, + { + "epoch": 1.24, + "learning_rate": 1.3209241119990523e-06, + "loss": 0.5859, + "step": 48473 + }, + { + "epoch": 1.24, + "learning_rate": 1.3208979050533945e-06, + "loss": 0.7715, + "step": 48474 + }, + { + "epoch": 1.24, + "learning_rate": 1.32087169786204e-06, + "loss": 0.6274, + "step": 48475 + }, + { + "epoch": 1.24, + "learning_rate": 1.320845490425009e-06, + "loss": 0.6782, + "step": 48476 + }, + { + "epoch": 1.24, + "learning_rate": 1.3208192827423208e-06, + "loss": 0.7773, + "step": 48477 + }, + { + "epoch": 1.24, + "learning_rate": 1.3207930748139963e-06, + "loss": 0.3983, + "step": 48478 + }, + { + "epoch": 1.24, + "learning_rate": 1.3207668666400556e-06, + "loss": 0.6187, + "step": 48479 + }, + { + "epoch": 1.24, + "learning_rate": 1.320740658220518e-06, + "loss": 0.7334, + "step": 48480 + }, + { + "epoch": 1.24, + "learning_rate": 1.3207144495554045e-06, + "loss": 0.6699, + "step": 48481 + }, + { + "epoch": 1.24, + "learning_rate": 1.3206882406447342e-06, + "loss": 0.6353, + "step": 48482 + }, + { + "epoch": 1.24, + "learning_rate": 1.320662031488528e-06, + "loss": 0.7812, + "step": 48483 + }, + { + "epoch": 1.24, + "learning_rate": 1.3206358220868057e-06, + "loss": 0.6699, + "step": 48484 + }, + { + "epoch": 1.24, + "learning_rate": 1.320609612439587e-06, + "loss": 0.7051, + "step": 48485 + }, + { + "epoch": 1.24, + "learning_rate": 1.3205834025468924e-06, + "loss": 0.7754, + "step": 48486 + }, + { + "epoch": 1.24, + "learning_rate": 1.3205571924087417e-06, + "loss": 0.6523, + "step": 48487 + }, + { + "epoch": 1.24, + "learning_rate": 1.3205309820251552e-06, + "loss": 0.7627, + "step": 48488 + }, + { + "epoch": 1.24, + "learning_rate": 1.3205047713961532e-06, + "loss": 0.665, + "step": 48489 + }, + { + "epoch": 1.24, + "learning_rate": 1.320478560521755e-06, + "loss": 0.6338, + "step": 48490 + }, + { + "epoch": 1.24, + "learning_rate": 1.3204523494019812e-06, + "loss": 0.7061, + "step": 48491 + }, + { + "epoch": 1.24, + "learning_rate": 1.3204261380368515e-06, + "loss": 0.6719, + "step": 48492 + }, + { + "epoch": 1.24, + "learning_rate": 1.320399926426387e-06, + "loss": 0.8164, + "step": 48493 + }, + { + "epoch": 1.24, + "learning_rate": 1.3203737145706063e-06, + "loss": 0.7603, + "step": 48494 + }, + { + "epoch": 1.24, + "learning_rate": 1.3203475024695305e-06, + "loss": 0.709, + "step": 48495 + }, + { + "epoch": 1.24, + "learning_rate": 1.3203212901231792e-06, + "loss": 0.7051, + "step": 48496 + }, + { + "epoch": 1.24, + "learning_rate": 1.3202950775315726e-06, + "loss": 0.6372, + "step": 48497 + }, + { + "epoch": 1.24, + "learning_rate": 1.3202688646947311e-06, + "loss": 0.6895, + "step": 48498 + }, + { + "epoch": 1.24, + "learning_rate": 1.3202426516126739e-06, + "loss": 0.6855, + "step": 48499 + }, + { + "epoch": 1.24, + "learning_rate": 1.3202164382854221e-06, + "loss": 0.4741, + "step": 48500 + }, + { + "epoch": 1.24, + "learning_rate": 1.320190224712995e-06, + "loss": 0.7725, + "step": 48501 + }, + { + "epoch": 1.24, + "learning_rate": 1.3201640108954133e-06, + "loss": 0.6514, + "step": 48502 + }, + { + "epoch": 1.24, + "learning_rate": 1.3201377968326965e-06, + "loss": 0.6826, + "step": 48503 + }, + { + "epoch": 1.24, + "learning_rate": 1.320111582524865e-06, + "loss": 0.4556, + "step": 48504 + }, + { + "epoch": 1.24, + "learning_rate": 1.3200853679719388e-06, + "loss": 0.748, + "step": 48505 + }, + { + "epoch": 1.24, + "learning_rate": 1.3200591531739378e-06, + "loss": 0.5835, + "step": 48506 + }, + { + "epoch": 1.24, + "learning_rate": 1.3200329381308822e-06, + "loss": 0.793, + "step": 48507 + }, + { + "epoch": 1.24, + "learning_rate": 1.3200067228427924e-06, + "loss": 0.75, + "step": 48508 + }, + { + "epoch": 1.24, + "learning_rate": 1.319980507309688e-06, + "loss": 0.6953, + "step": 48509 + }, + { + "epoch": 1.24, + "learning_rate": 1.3199542915315892e-06, + "loss": 0.7119, + "step": 48510 + }, + { + "epoch": 1.24, + "learning_rate": 1.319928075508516e-06, + "loss": 0.7119, + "step": 48511 + }, + { + "epoch": 1.24, + "learning_rate": 1.3199018592404887e-06, + "loss": 0.7173, + "step": 48512 + }, + { + "epoch": 1.24, + "learning_rate": 1.3198756427275274e-06, + "loss": 0.7295, + "step": 48513 + }, + { + "epoch": 1.24, + "learning_rate": 1.319849425969652e-06, + "loss": 0.6816, + "step": 48514 + }, + { + "epoch": 1.24, + "learning_rate": 1.3198232089668824e-06, + "loss": 0.5649, + "step": 48515 + }, + { + "epoch": 1.24, + "learning_rate": 1.3197969917192388e-06, + "loss": 0.665, + "step": 48516 + }, + { + "epoch": 1.24, + "learning_rate": 1.3197707742267415e-06, + "loss": 0.7559, + "step": 48517 + }, + { + "epoch": 1.24, + "learning_rate": 1.3197445564894104e-06, + "loss": 0.6514, + "step": 48518 + }, + { + "epoch": 1.24, + "learning_rate": 1.3197183385072659e-06, + "loss": 0.7285, + "step": 48519 + }, + { + "epoch": 1.24, + "learning_rate": 1.3196921202803275e-06, + "loss": 0.6621, + "step": 48520 + }, + { + "epoch": 1.24, + "learning_rate": 1.3196659018086155e-06, + "loss": 0.5938, + "step": 48521 + }, + { + "epoch": 1.24, + "learning_rate": 1.31963968309215e-06, + "loss": 0.6553, + "step": 48522 + }, + { + "epoch": 1.24, + "learning_rate": 1.3196134641309513e-06, + "loss": 0.7207, + "step": 48523 + }, + { + "epoch": 1.24, + "learning_rate": 1.319587244925039e-06, + "loss": 0.5845, + "step": 48524 + }, + { + "epoch": 1.24, + "learning_rate": 1.3195610254744335e-06, + "loss": 0.5977, + "step": 48525 + }, + { + "epoch": 1.24, + "learning_rate": 1.3195348057791549e-06, + "loss": 0.6221, + "step": 48526 + }, + { + "epoch": 1.24, + "learning_rate": 1.3195085858392232e-06, + "loss": 0.4696, + "step": 48527 + }, + { + "epoch": 1.24, + "learning_rate": 1.3194823656546585e-06, + "loss": 0.4653, + "step": 48528 + }, + { + "epoch": 1.24, + "learning_rate": 1.3194561452254809e-06, + "loss": 0.5582, + "step": 48529 + }, + { + "epoch": 1.24, + "learning_rate": 1.3194299245517102e-06, + "loss": 0.7393, + "step": 48530 + }, + { + "epoch": 1.24, + "learning_rate": 1.319403703633367e-06, + "loss": 0.7998, + "step": 48531 + }, + { + "epoch": 1.24, + "learning_rate": 1.3193774824704703e-06, + "loss": 0.5552, + "step": 48532 + }, + { + "epoch": 1.24, + "learning_rate": 1.319351261063042e-06, + "loss": 0.7617, + "step": 48533 + }, + { + "epoch": 1.24, + "learning_rate": 1.3193250394111006e-06, + "loss": 0.6738, + "step": 48534 + }, + { + "epoch": 1.24, + "learning_rate": 1.3192988175146668e-06, + "loss": 0.7163, + "step": 48535 + }, + { + "epoch": 1.24, + "learning_rate": 1.3192725953737603e-06, + "loss": 0.5396, + "step": 48536 + }, + { + "epoch": 1.24, + "learning_rate": 1.3192463729884018e-06, + "loss": 0.6719, + "step": 48537 + }, + { + "epoch": 1.24, + "learning_rate": 1.319220150358611e-06, + "loss": 0.449, + "step": 48538 + }, + { + "epoch": 1.24, + "learning_rate": 1.3191939274844079e-06, + "loss": 0.6128, + "step": 48539 + }, + { + "epoch": 1.24, + "learning_rate": 1.3191677043658125e-06, + "loss": 0.7339, + "step": 48540 + }, + { + "epoch": 1.24, + "learning_rate": 1.3191414810028454e-06, + "loss": 0.6484, + "step": 48541 + }, + { + "epoch": 1.24, + "learning_rate": 1.3191152573955262e-06, + "loss": 0.6313, + "step": 48542 + }, + { + "epoch": 1.24, + "learning_rate": 1.3190890335438751e-06, + "loss": 0.8506, + "step": 48543 + }, + { + "epoch": 1.24, + "learning_rate": 1.3190628094479124e-06, + "loss": 0.6797, + "step": 48544 + }, + { + "epoch": 1.24, + "learning_rate": 1.3190365851076575e-06, + "loss": 0.5576, + "step": 48545 + }, + { + "epoch": 1.24, + "learning_rate": 1.3190103605231312e-06, + "loss": 0.7466, + "step": 48546 + }, + { + "epoch": 1.24, + "learning_rate": 1.3189841356943537e-06, + "loss": 0.7539, + "step": 48547 + }, + { + "epoch": 1.24, + "learning_rate": 1.3189579106213444e-06, + "loss": 0.8506, + "step": 48548 + }, + { + "epoch": 1.24, + "learning_rate": 1.3189316853041236e-06, + "loss": 0.6465, + "step": 48549 + }, + { + "epoch": 1.24, + "learning_rate": 1.3189054597427115e-06, + "loss": 0.6743, + "step": 48550 + }, + { + "epoch": 1.24, + "learning_rate": 1.3188792339371282e-06, + "loss": 0.5601, + "step": 48551 + }, + { + "epoch": 1.24, + "learning_rate": 1.318853007887394e-06, + "loss": 0.6748, + "step": 48552 + }, + { + "epoch": 1.24, + "learning_rate": 1.3188267815935283e-06, + "loss": 0.7344, + "step": 48553 + }, + { + "epoch": 1.24, + "learning_rate": 1.3188005550555518e-06, + "loss": 0.4763, + "step": 48554 + }, + { + "epoch": 1.24, + "learning_rate": 1.3187743282734843e-06, + "loss": 0.8262, + "step": 48555 + }, + { + "epoch": 1.24, + "learning_rate": 1.318748101247346e-06, + "loss": 0.7842, + "step": 48556 + }, + { + "epoch": 1.24, + "learning_rate": 1.318721873977157e-06, + "loss": 0.5503, + "step": 48557 + }, + { + "epoch": 1.24, + "learning_rate": 1.3186956464629372e-06, + "loss": 0.6436, + "step": 48558 + }, + { + "epoch": 1.24, + "learning_rate": 1.3186694187047068e-06, + "loss": 0.6377, + "step": 48559 + }, + { + "epoch": 1.24, + "learning_rate": 1.318643190702486e-06, + "loss": 0.5073, + "step": 48560 + }, + { + "epoch": 1.24, + "learning_rate": 1.3186169624562946e-06, + "loss": 0.7734, + "step": 48561 + }, + { + "epoch": 1.24, + "learning_rate": 1.318590733966153e-06, + "loss": 0.6025, + "step": 48562 + }, + { + "epoch": 1.24, + "learning_rate": 1.3185645052320812e-06, + "loss": 0.7598, + "step": 48563 + }, + { + "epoch": 1.24, + "learning_rate": 1.3185382762540988e-06, + "loss": 0.667, + "step": 48564 + }, + { + "epoch": 1.24, + "learning_rate": 1.3185120470322266e-06, + "loss": 0.7246, + "step": 48565 + }, + { + "epoch": 1.24, + "learning_rate": 1.3184858175664845e-06, + "loss": 0.5588, + "step": 48566 + }, + { + "epoch": 1.24, + "learning_rate": 1.318459587856892e-06, + "loss": 0.4885, + "step": 48567 + }, + { + "epoch": 1.24, + "learning_rate": 1.31843335790347e-06, + "loss": 0.7402, + "step": 48568 + }, + { + "epoch": 1.24, + "learning_rate": 1.3184071277062384e-06, + "loss": 0.5933, + "step": 48569 + }, + { + "epoch": 1.24, + "learning_rate": 1.3183808972652166e-06, + "loss": 0.5811, + "step": 48570 + }, + { + "epoch": 1.24, + "learning_rate": 1.3183546665804255e-06, + "loss": 0.6421, + "step": 48571 + }, + { + "epoch": 1.24, + "learning_rate": 1.3183284356518847e-06, + "loss": 0.5625, + "step": 48572 + }, + { + "epoch": 1.24, + "learning_rate": 1.3183022044796145e-06, + "loss": 0.7373, + "step": 48573 + }, + { + "epoch": 1.24, + "learning_rate": 1.318275973063635e-06, + "loss": 0.6772, + "step": 48574 + }, + { + "epoch": 1.25, + "learning_rate": 1.3182497414039664e-06, + "loss": 0.6758, + "step": 48575 + }, + { + "epoch": 1.25, + "learning_rate": 1.3182235095006282e-06, + "loss": 0.6113, + "step": 48576 + }, + { + "epoch": 1.25, + "learning_rate": 1.3181972773536412e-06, + "loss": 0.5178, + "step": 48577 + }, + { + "epoch": 1.25, + "learning_rate": 1.3181710449630251e-06, + "loss": 0.6729, + "step": 48578 + }, + { + "epoch": 1.25, + "learning_rate": 1.3181448123288003e-06, + "loss": 0.6973, + "step": 48579 + }, + { + "epoch": 1.25, + "learning_rate": 1.3181185794509858e-06, + "loss": 0.6128, + "step": 48580 + }, + { + "epoch": 1.25, + "learning_rate": 1.3180923463296035e-06, + "loss": 0.792, + "step": 48581 + }, + { + "epoch": 1.25, + "learning_rate": 1.3180661129646719e-06, + "loss": 0.6553, + "step": 48582 + }, + { + "epoch": 1.25, + "learning_rate": 1.3180398793562121e-06, + "loss": 0.6206, + "step": 48583 + }, + { + "epoch": 1.25, + "learning_rate": 1.3180136455042436e-06, + "loss": 0.6475, + "step": 48584 + }, + { + "epoch": 1.25, + "learning_rate": 1.3179874114087869e-06, + "loss": 0.6821, + "step": 48585 + }, + { + "epoch": 1.25, + "learning_rate": 1.3179611770698614e-06, + "loss": 0.7632, + "step": 48586 + }, + { + "epoch": 1.25, + "learning_rate": 1.317934942487488e-06, + "loss": 0.665, + "step": 48587 + }, + { + "epoch": 1.25, + "learning_rate": 1.3179087076616863e-06, + "loss": 0.6709, + "step": 48588 + }, + { + "epoch": 1.25, + "learning_rate": 1.3178824725924763e-06, + "loss": 0.5054, + "step": 48589 + }, + { + "epoch": 1.25, + "learning_rate": 1.3178562372798786e-06, + "loss": 0.6367, + "step": 48590 + }, + { + "epoch": 1.25, + "learning_rate": 1.317830001723913e-06, + "loss": 0.7012, + "step": 48591 + }, + { + "epoch": 1.25, + "learning_rate": 1.3178037659245997e-06, + "loss": 0.6904, + "step": 48592 + }, + { + "epoch": 1.25, + "learning_rate": 1.3177775298819587e-06, + "loss": 0.4622, + "step": 48593 + }, + { + "epoch": 1.25, + "learning_rate": 1.3177512935960098e-06, + "loss": 0.6406, + "step": 48594 + }, + { + "epoch": 1.25, + "learning_rate": 1.3177250570667734e-06, + "loss": 0.7959, + "step": 48595 + }, + { + "epoch": 1.25, + "learning_rate": 1.3176988202942695e-06, + "loss": 0.5688, + "step": 48596 + }, + { + "epoch": 1.25, + "learning_rate": 1.317672583278518e-06, + "loss": 0.6982, + "step": 48597 + }, + { + "epoch": 1.25, + "learning_rate": 1.3176463460195399e-06, + "loss": 0.6582, + "step": 48598 + }, + { + "epoch": 1.25, + "learning_rate": 1.317620108517354e-06, + "loss": 0.6162, + "step": 48599 + }, + { + "epoch": 1.25, + "learning_rate": 1.317593870771981e-06, + "loss": 0.7451, + "step": 48600 + }, + { + "epoch": 1.25, + "learning_rate": 1.317567632783441e-06, + "loss": 0.4327, + "step": 48601 + }, + { + "epoch": 1.25, + "learning_rate": 1.3175413945517546e-06, + "loss": 0.5898, + "step": 48602 + }, + { + "epoch": 1.25, + "learning_rate": 1.3175151560769409e-06, + "loss": 0.6484, + "step": 48603 + }, + { + "epoch": 1.25, + "learning_rate": 1.3174889173590206e-06, + "loss": 0.6724, + "step": 48604 + }, + { + "epoch": 1.25, + "learning_rate": 1.3174626783980134e-06, + "loss": 0.5508, + "step": 48605 + }, + { + "epoch": 1.25, + "learning_rate": 1.3174364391939399e-06, + "loss": 0.6621, + "step": 48606 + }, + { + "epoch": 1.25, + "learning_rate": 1.3174101997468198e-06, + "loss": 0.6738, + "step": 48607 + }, + { + "epoch": 1.25, + "learning_rate": 1.3173839600566732e-06, + "loss": 0.6406, + "step": 48608 + }, + { + "epoch": 1.25, + "learning_rate": 1.3173577201235205e-06, + "loss": 0.6895, + "step": 48609 + }, + { + "epoch": 1.25, + "learning_rate": 1.3173314799473814e-06, + "loss": 0.7354, + "step": 48610 + }, + { + "epoch": 1.25, + "learning_rate": 1.317305239528276e-06, + "loss": 0.5493, + "step": 48611 + }, + { + "epoch": 1.25, + "learning_rate": 1.317278998866225e-06, + "loss": 0.6299, + "step": 48612 + }, + { + "epoch": 1.25, + "learning_rate": 1.3172527579612478e-06, + "loss": 0.6724, + "step": 48613 + }, + { + "epoch": 1.25, + "learning_rate": 1.3172265168133648e-06, + "loss": 0.8135, + "step": 48614 + }, + { + "epoch": 1.25, + "learning_rate": 1.317200275422596e-06, + "loss": 0.5236, + "step": 48615 + }, + { + "epoch": 1.25, + "learning_rate": 1.3171740337889616e-06, + "loss": 0.5723, + "step": 48616 + }, + { + "epoch": 1.25, + "learning_rate": 1.3171477919124818e-06, + "loss": 0.6943, + "step": 48617 + }, + { + "epoch": 1.25, + "learning_rate": 1.3171215497931762e-06, + "loss": 0.509, + "step": 48618 + }, + { + "epoch": 1.25, + "learning_rate": 1.3170953074310655e-06, + "loss": 0.8379, + "step": 48619 + }, + { + "epoch": 1.25, + "learning_rate": 1.3170690648261693e-06, + "loss": 0.6867, + "step": 48620 + }, + { + "epoch": 1.25, + "learning_rate": 1.317042821978508e-06, + "loss": 0.418, + "step": 48621 + }, + { + "epoch": 1.25, + "learning_rate": 1.3170165788881016e-06, + "loss": 0.625, + "step": 48622 + }, + { + "epoch": 1.25, + "learning_rate": 1.31699033555497e-06, + "loss": 0.6073, + "step": 48623 + }, + { + "epoch": 1.25, + "learning_rate": 1.3169640919791336e-06, + "loss": 0.667, + "step": 48624 + }, + { + "epoch": 1.25, + "learning_rate": 1.3169378481606124e-06, + "loss": 0.5664, + "step": 48625 + }, + { + "epoch": 1.25, + "learning_rate": 1.3169116040994264e-06, + "loss": 0.6743, + "step": 48626 + }, + { + "epoch": 1.25, + "learning_rate": 1.316885359795596e-06, + "loss": 0.7402, + "step": 48627 + }, + { + "epoch": 1.25, + "learning_rate": 1.3168591152491406e-06, + "loss": 0.6836, + "step": 48628 + }, + { + "epoch": 1.25, + "learning_rate": 1.316832870460081e-06, + "loss": 0.8105, + "step": 48629 + }, + { + "epoch": 1.25, + "learning_rate": 1.3168066254284371e-06, + "loss": 0.2849, + "step": 48630 + }, + { + "epoch": 1.25, + "learning_rate": 1.316780380154229e-06, + "loss": 0.7207, + "step": 48631 + }, + { + "epoch": 1.25, + "learning_rate": 1.3167541346374767e-06, + "loss": 0.6943, + "step": 48632 + }, + { + "epoch": 1.25, + "learning_rate": 1.3167278888782e-06, + "loss": 0.6855, + "step": 48633 + }, + { + "epoch": 1.25, + "learning_rate": 1.3167016428764195e-06, + "loss": 0.6458, + "step": 48634 + }, + { + "epoch": 1.25, + "learning_rate": 1.316675396632155e-06, + "loss": 0.75, + "step": 48635 + }, + { + "epoch": 1.25, + "learning_rate": 1.3166491501454269e-06, + "loss": 0.5869, + "step": 48636 + }, + { + "epoch": 1.25, + "learning_rate": 1.3166229034162553e-06, + "loss": 0.7295, + "step": 48637 + }, + { + "epoch": 1.25, + "learning_rate": 1.3165966564446599e-06, + "loss": 0.6597, + "step": 48638 + }, + { + "epoch": 1.25, + "learning_rate": 1.3165704092306606e-06, + "loss": 0.7061, + "step": 48639 + }, + { + "epoch": 1.25, + "learning_rate": 1.3165441617742783e-06, + "loss": 0.5977, + "step": 48640 + }, + { + "epoch": 1.25, + "learning_rate": 1.3165179140755327e-06, + "loss": 0.6826, + "step": 48641 + }, + { + "epoch": 1.25, + "learning_rate": 1.316491666134444e-06, + "loss": 0.7402, + "step": 48642 + }, + { + "epoch": 1.25, + "learning_rate": 1.316465417951032e-06, + "loss": 0.752, + "step": 48643 + }, + { + "epoch": 1.25, + "learning_rate": 1.316439169525317e-06, + "loss": 0.4702, + "step": 48644 + }, + { + "epoch": 1.25, + "learning_rate": 1.316412920857319e-06, + "loss": 0.6562, + "step": 48645 + }, + { + "epoch": 1.25, + "learning_rate": 1.3163866719470583e-06, + "loss": 0.6357, + "step": 48646 + }, + { + "epoch": 1.25, + "learning_rate": 1.3163604227945548e-06, + "loss": 0.5603, + "step": 48647 + }, + { + "epoch": 1.25, + "learning_rate": 1.3163341733998288e-06, + "loss": 0.5505, + "step": 48648 + }, + { + "epoch": 1.25, + "learning_rate": 1.3163079237629e-06, + "loss": 0.5532, + "step": 48649 + }, + { + "epoch": 1.25, + "learning_rate": 1.316281673883789e-06, + "loss": 0.5981, + "step": 48650 + }, + { + "epoch": 1.25, + "learning_rate": 1.3162554237625153e-06, + "loss": 0.5757, + "step": 48651 + }, + { + "epoch": 1.25, + "learning_rate": 1.3162291733990997e-06, + "loss": 0.7031, + "step": 48652 + }, + { + "epoch": 1.25, + "learning_rate": 1.316202922793562e-06, + "loss": 0.7793, + "step": 48653 + }, + { + "epoch": 1.25, + "learning_rate": 1.316176671945922e-06, + "loss": 0.6963, + "step": 48654 + }, + { + "epoch": 1.25, + "learning_rate": 1.3161504208562005e-06, + "loss": 0.5942, + "step": 48655 + }, + { + "epoch": 1.25, + "learning_rate": 1.316124169524417e-06, + "loss": 0.585, + "step": 48656 + }, + { + "epoch": 1.25, + "learning_rate": 1.3160979179505918e-06, + "loss": 0.7568, + "step": 48657 + }, + { + "epoch": 1.25, + "learning_rate": 1.3160716661347446e-06, + "loss": 0.7559, + "step": 48658 + }, + { + "epoch": 1.25, + "learning_rate": 1.3160454140768962e-06, + "loss": 0.541, + "step": 48659 + }, + { + "epoch": 1.25, + "learning_rate": 1.3160191617770663e-06, + "loss": 0.5762, + "step": 48660 + }, + { + "epoch": 1.25, + "learning_rate": 1.3159929092352748e-06, + "loss": 0.7334, + "step": 48661 + }, + { + "epoch": 1.25, + "learning_rate": 1.3159666564515424e-06, + "loss": 0.7559, + "step": 48662 + }, + { + "epoch": 1.25, + "learning_rate": 1.3159404034258887e-06, + "loss": 0.5828, + "step": 48663 + }, + { + "epoch": 1.25, + "learning_rate": 1.315914150158334e-06, + "loss": 0.749, + "step": 48664 + }, + { + "epoch": 1.25, + "learning_rate": 1.3158878966488983e-06, + "loss": 0.7051, + "step": 48665 + }, + { + "epoch": 1.25, + "learning_rate": 1.3158616428976016e-06, + "loss": 0.6191, + "step": 48666 + }, + { + "epoch": 1.25, + "learning_rate": 1.3158353889044648e-06, + "loss": 0.7012, + "step": 48667 + }, + { + "epoch": 1.25, + "learning_rate": 1.3158091346695066e-06, + "loss": 0.7998, + "step": 48668 + }, + { + "epoch": 1.25, + "learning_rate": 1.3157828801927484e-06, + "loss": 0.4409, + "step": 48669 + }, + { + "epoch": 1.25, + "learning_rate": 1.3157566254742093e-06, + "loss": 0.6904, + "step": 48670 + }, + { + "epoch": 1.25, + "learning_rate": 1.3157303705139101e-06, + "loss": 0.4756, + "step": 48671 + }, + { + "epoch": 1.25, + "learning_rate": 1.315704115311871e-06, + "loss": 0.5881, + "step": 48672 + }, + { + "epoch": 1.25, + "learning_rate": 1.3156778598681116e-06, + "loss": 0.6328, + "step": 48673 + }, + { + "epoch": 1.25, + "learning_rate": 1.3156516041826518e-06, + "loss": 0.6182, + "step": 48674 + }, + { + "epoch": 1.25, + "learning_rate": 1.3156253482555124e-06, + "loss": 0.6152, + "step": 48675 + }, + { + "epoch": 1.25, + "learning_rate": 1.3155990920867131e-06, + "loss": 0.4816, + "step": 48676 + }, + { + "epoch": 1.25, + "learning_rate": 1.315572835676274e-06, + "loss": 0.6377, + "step": 48677 + }, + { + "epoch": 1.25, + "learning_rate": 1.3155465790242154e-06, + "loss": 0.5483, + "step": 48678 + }, + { + "epoch": 1.25, + "learning_rate": 1.3155203221305574e-06, + "loss": 0.7764, + "step": 48679 + }, + { + "epoch": 1.25, + "learning_rate": 1.3154940649953198e-06, + "loss": 0.7422, + "step": 48680 + }, + { + "epoch": 1.25, + "learning_rate": 1.315467807618523e-06, + "loss": 0.5481, + "step": 48681 + }, + { + "epoch": 1.25, + "learning_rate": 1.3154415500001873e-06, + "loss": 0.5801, + "step": 48682 + }, + { + "epoch": 1.25, + "learning_rate": 1.3154152921403321e-06, + "loss": 0.6335, + "step": 48683 + }, + { + "epoch": 1.25, + "learning_rate": 1.3153890340389779e-06, + "loss": 0.5703, + "step": 48684 + }, + { + "epoch": 1.25, + "learning_rate": 1.315362775696145e-06, + "loss": 0.4458, + "step": 48685 + }, + { + "epoch": 1.25, + "learning_rate": 1.3153365171118532e-06, + "loss": 0.7178, + "step": 48686 + }, + { + "epoch": 1.25, + "learning_rate": 1.315310258286123e-06, + "loss": 0.5352, + "step": 48687 + }, + { + "epoch": 1.25, + "learning_rate": 1.315283999218974e-06, + "loss": 0.6406, + "step": 48688 + }, + { + "epoch": 1.25, + "learning_rate": 1.3152577399104264e-06, + "loss": 0.5762, + "step": 48689 + }, + { + "epoch": 1.25, + "learning_rate": 1.3152314803605006e-06, + "loss": 0.6289, + "step": 48690 + }, + { + "epoch": 1.25, + "learning_rate": 1.3152052205692163e-06, + "loss": 0.5122, + "step": 48691 + }, + { + "epoch": 1.25, + "learning_rate": 1.3151789605365946e-06, + "loss": 0.7705, + "step": 48692 + }, + { + "epoch": 1.25, + "learning_rate": 1.3151527002626544e-06, + "loss": 0.7383, + "step": 48693 + }, + { + "epoch": 1.25, + "learning_rate": 1.315126439747416e-06, + "loss": 0.5715, + "step": 48694 + }, + { + "epoch": 1.25, + "learning_rate": 1.3151001789909e-06, + "loss": 0.8496, + "step": 48695 + }, + { + "epoch": 1.25, + "learning_rate": 1.3150739179931263e-06, + "loss": 0.4954, + "step": 48696 + }, + { + "epoch": 1.25, + "learning_rate": 1.3150476567541151e-06, + "loss": 0.623, + "step": 48697 + }, + { + "epoch": 1.25, + "learning_rate": 1.3150213952738863e-06, + "loss": 0.6206, + "step": 48698 + }, + { + "epoch": 1.25, + "learning_rate": 1.31499513355246e-06, + "loss": 0.5952, + "step": 48699 + }, + { + "epoch": 1.25, + "learning_rate": 1.3149688715898565e-06, + "loss": 0.6211, + "step": 48700 + }, + { + "epoch": 1.25, + "learning_rate": 1.3149426093860958e-06, + "loss": 0.6074, + "step": 48701 + }, + { + "epoch": 1.25, + "learning_rate": 1.3149163469411981e-06, + "loss": 0.566, + "step": 48702 + }, + { + "epoch": 1.25, + "learning_rate": 1.3148900842551834e-06, + "loss": 0.6865, + "step": 48703 + }, + { + "epoch": 1.25, + "learning_rate": 1.3148638213280716e-06, + "loss": 0.7217, + "step": 48704 + }, + { + "epoch": 1.25, + "learning_rate": 1.3148375581598834e-06, + "loss": 0.8154, + "step": 48705 + }, + { + "epoch": 1.25, + "learning_rate": 1.3148112947506383e-06, + "loss": 0.4521, + "step": 48706 + }, + { + "epoch": 1.25, + "learning_rate": 1.3147850311003572e-06, + "loss": 0.5483, + "step": 48707 + }, + { + "epoch": 1.25, + "learning_rate": 1.3147587672090593e-06, + "loss": 0.7236, + "step": 48708 + }, + { + "epoch": 1.25, + "learning_rate": 1.3147325030767648e-06, + "loss": 0.4595, + "step": 48709 + }, + { + "epoch": 1.25, + "learning_rate": 1.3147062387034944e-06, + "loss": 0.707, + "step": 48710 + }, + { + "epoch": 1.25, + "learning_rate": 1.3146799740892678e-06, + "loss": 0.6182, + "step": 48711 + }, + { + "epoch": 1.25, + "learning_rate": 1.3146537092341055e-06, + "loss": 0.5332, + "step": 48712 + }, + { + "epoch": 1.25, + "learning_rate": 1.3146274441380269e-06, + "loss": 0.603, + "step": 48713 + }, + { + "epoch": 1.25, + "learning_rate": 1.3146011788010527e-06, + "loss": 0.7656, + "step": 48714 + }, + { + "epoch": 1.25, + "learning_rate": 1.314574913223203e-06, + "loss": 0.645, + "step": 48715 + }, + { + "epoch": 1.25, + "learning_rate": 1.3145486474044972e-06, + "loss": 0.7871, + "step": 48716 + }, + { + "epoch": 1.25, + "learning_rate": 1.3145223813449568e-06, + "loss": 0.6416, + "step": 48717 + }, + { + "epoch": 1.25, + "learning_rate": 1.3144961150446006e-06, + "loss": 0.7178, + "step": 48718 + }, + { + "epoch": 1.25, + "learning_rate": 1.3144698485034492e-06, + "loss": 0.647, + "step": 48719 + }, + { + "epoch": 1.25, + "learning_rate": 1.3144435817215227e-06, + "loss": 0.5206, + "step": 48720 + }, + { + "epoch": 1.25, + "learning_rate": 1.3144173146988413e-06, + "loss": 0.5869, + "step": 48721 + }, + { + "epoch": 1.25, + "learning_rate": 1.314391047435425e-06, + "loss": 0.5557, + "step": 48722 + }, + { + "epoch": 1.25, + "learning_rate": 1.3143647799312938e-06, + "loss": 0.7041, + "step": 48723 + }, + { + "epoch": 1.25, + "learning_rate": 1.3143385121864682e-06, + "loss": 0.8066, + "step": 48724 + }, + { + "epoch": 1.25, + "learning_rate": 1.3143122442009677e-06, + "loss": 0.5337, + "step": 48725 + }, + { + "epoch": 1.25, + "learning_rate": 1.314285975974813e-06, + "loss": 0.5942, + "step": 48726 + }, + { + "epoch": 1.25, + "learning_rate": 1.314259707508024e-06, + "loss": 0.5349, + "step": 48727 + }, + { + "epoch": 1.25, + "learning_rate": 1.3142334388006208e-06, + "loss": 0.7188, + "step": 48728 + }, + { + "epoch": 1.25, + "learning_rate": 1.3142071698526233e-06, + "loss": 0.6406, + "step": 48729 + }, + { + "epoch": 1.25, + "learning_rate": 1.314180900664052e-06, + "loss": 0.4556, + "step": 48730 + }, + { + "epoch": 1.25, + "learning_rate": 1.3141546312349268e-06, + "loss": 0.6562, + "step": 48731 + }, + { + "epoch": 1.25, + "learning_rate": 1.314128361565268e-06, + "loss": 0.5859, + "step": 48732 + }, + { + "epoch": 1.25, + "learning_rate": 1.3141020916550954e-06, + "loss": 0.6519, + "step": 48733 + }, + { + "epoch": 1.25, + "learning_rate": 1.3140758215044292e-06, + "loss": 0.4675, + "step": 48734 + }, + { + "epoch": 1.25, + "learning_rate": 1.3140495511132895e-06, + "loss": 0.6611, + "step": 48735 + }, + { + "epoch": 1.25, + "learning_rate": 1.3140232804816966e-06, + "loss": 0.7217, + "step": 48736 + }, + { + "epoch": 1.25, + "learning_rate": 1.313997009609671e-06, + "loss": 0.6309, + "step": 48737 + }, + { + "epoch": 1.25, + "learning_rate": 1.3139707384972316e-06, + "loss": 0.6436, + "step": 48738 + }, + { + "epoch": 1.25, + "learning_rate": 1.3139444671443995e-06, + "loss": 0.7168, + "step": 48739 + }, + { + "epoch": 1.25, + "learning_rate": 1.3139181955511947e-06, + "loss": 0.6445, + "step": 48740 + }, + { + "epoch": 1.25, + "learning_rate": 1.3138919237176369e-06, + "loss": 0.5649, + "step": 48741 + }, + { + "epoch": 1.25, + "learning_rate": 1.3138656516437468e-06, + "loss": 0.6577, + "step": 48742 + }, + { + "epoch": 1.25, + "learning_rate": 1.313839379329544e-06, + "loss": 0.5864, + "step": 48743 + }, + { + "epoch": 1.25, + "learning_rate": 1.3138131067750486e-06, + "loss": 0.6743, + "step": 48744 + }, + { + "epoch": 1.25, + "learning_rate": 1.3137868339802814e-06, + "loss": 0.624, + "step": 48745 + }, + { + "epoch": 1.25, + "learning_rate": 1.313760560945262e-06, + "loss": 0.6025, + "step": 48746 + }, + { + "epoch": 1.25, + "learning_rate": 1.3137342876700105e-06, + "loss": 0.5688, + "step": 48747 + }, + { + "epoch": 1.25, + "learning_rate": 1.3137080141545467e-06, + "loss": 0.7949, + "step": 48748 + }, + { + "epoch": 1.25, + "learning_rate": 1.3136817403988916e-06, + "loss": 0.6445, + "step": 48749 + }, + { + "epoch": 1.25, + "learning_rate": 1.3136554664030643e-06, + "loss": 0.6323, + "step": 48750 + }, + { + "epoch": 1.25, + "learning_rate": 1.313629192167086e-06, + "loss": 0.6553, + "step": 48751 + }, + { + "epoch": 1.25, + "learning_rate": 1.313602917690976e-06, + "loss": 0.5918, + "step": 48752 + }, + { + "epoch": 1.25, + "learning_rate": 1.3135766429747545e-06, + "loss": 0.5181, + "step": 48753 + }, + { + "epoch": 1.25, + "learning_rate": 1.3135503680184418e-06, + "loss": 0.6191, + "step": 48754 + }, + { + "epoch": 1.25, + "learning_rate": 1.3135240928220583e-06, + "loss": 0.6689, + "step": 48755 + }, + { + "epoch": 1.25, + "learning_rate": 1.3134978173856234e-06, + "loss": 0.5649, + "step": 48756 + }, + { + "epoch": 1.25, + "learning_rate": 1.3134715417091584e-06, + "loss": 0.6096, + "step": 48757 + }, + { + "epoch": 1.25, + "learning_rate": 1.313445265792682e-06, + "loss": 0.6558, + "step": 48758 + }, + { + "epoch": 1.25, + "learning_rate": 1.313418989636215e-06, + "loss": 0.7275, + "step": 48759 + }, + { + "epoch": 1.25, + "learning_rate": 1.3133927132397778e-06, + "loss": 0.521, + "step": 48760 + }, + { + "epoch": 1.25, + "learning_rate": 1.3133664366033899e-06, + "loss": 0.6743, + "step": 48761 + }, + { + "epoch": 1.25, + "learning_rate": 1.313340159727072e-06, + "loss": 0.7012, + "step": 48762 + }, + { + "epoch": 1.25, + "learning_rate": 1.313313882610844e-06, + "loss": 0.4312, + "step": 48763 + }, + { + "epoch": 1.25, + "learning_rate": 1.3132876052547253e-06, + "loss": 0.6758, + "step": 48764 + }, + { + "epoch": 1.25, + "learning_rate": 1.3132613276587373e-06, + "loss": 0.6343, + "step": 48765 + }, + { + "epoch": 1.25, + "learning_rate": 1.3132350498228992e-06, + "loss": 0.7705, + "step": 48766 + }, + { + "epoch": 1.25, + "learning_rate": 1.3132087717472319e-06, + "loss": 0.7695, + "step": 48767 + }, + { + "epoch": 1.25, + "learning_rate": 1.3131824934317546e-06, + "loss": 0.6309, + "step": 48768 + }, + { + "epoch": 1.25, + "learning_rate": 1.3131562148764878e-06, + "loss": 0.6191, + "step": 48769 + }, + { + "epoch": 1.25, + "learning_rate": 1.3131299360814519e-06, + "loss": 0.5728, + "step": 48770 + }, + { + "epoch": 1.25, + "learning_rate": 1.3131036570466666e-06, + "loss": 0.8135, + "step": 48771 + }, + { + "epoch": 1.25, + "learning_rate": 1.3130773777721529e-06, + "loss": 0.4854, + "step": 48772 + }, + { + "epoch": 1.25, + "learning_rate": 1.3130510982579294e-06, + "loss": 0.6865, + "step": 48773 + }, + { + "epoch": 1.25, + "learning_rate": 1.3130248185040176e-06, + "loss": 0.5771, + "step": 48774 + }, + { + "epoch": 1.25, + "learning_rate": 1.3129985385104368e-06, + "loss": 0.3909, + "step": 48775 + }, + { + "epoch": 1.25, + "learning_rate": 1.3129722582772075e-06, + "loss": 0.7451, + "step": 48776 + }, + { + "epoch": 1.25, + "learning_rate": 1.3129459778043499e-06, + "loss": 0.5083, + "step": 48777 + }, + { + "epoch": 1.25, + "learning_rate": 1.312919697091884e-06, + "loss": 0.7988, + "step": 48778 + }, + { + "epoch": 1.25, + "learning_rate": 1.3128934161398295e-06, + "loss": 0.7646, + "step": 48779 + }, + { + "epoch": 1.25, + "learning_rate": 1.312867134948207e-06, + "loss": 0.7568, + "step": 48780 + }, + { + "epoch": 1.25, + "learning_rate": 1.3128408535170366e-06, + "loss": 0.6484, + "step": 48781 + }, + { + "epoch": 1.25, + "learning_rate": 1.3128145718463386e-06, + "loss": 0.7324, + "step": 48782 + }, + { + "epoch": 1.25, + "learning_rate": 1.3127882899361325e-06, + "loss": 0.6455, + "step": 48783 + }, + { + "epoch": 1.25, + "learning_rate": 1.312762007786439e-06, + "loss": 0.6162, + "step": 48784 + }, + { + "epoch": 1.25, + "learning_rate": 1.3127357253972778e-06, + "loss": 0.7031, + "step": 48785 + }, + { + "epoch": 1.25, + "learning_rate": 1.3127094427686694e-06, + "loss": 0.6416, + "step": 48786 + }, + { + "epoch": 1.25, + "learning_rate": 1.3126831599006338e-06, + "loss": 0.6401, + "step": 48787 + }, + { + "epoch": 1.25, + "learning_rate": 1.3126568767931907e-06, + "loss": 0.6836, + "step": 48788 + }, + { + "epoch": 1.25, + "learning_rate": 1.312630593446361e-06, + "loss": 0.5884, + "step": 48789 + }, + { + "epoch": 1.25, + "learning_rate": 1.3126043098601645e-06, + "loss": 0.6934, + "step": 48790 + }, + { + "epoch": 1.25, + "learning_rate": 1.3125780260346208e-06, + "loss": 0.6758, + "step": 48791 + }, + { + "epoch": 1.25, + "learning_rate": 1.312551741969751e-06, + "loss": 0.6118, + "step": 48792 + }, + { + "epoch": 1.25, + "learning_rate": 1.3125254576655744e-06, + "loss": 0.6509, + "step": 48793 + }, + { + "epoch": 1.25, + "learning_rate": 1.3124991731221112e-06, + "loss": 0.7666, + "step": 48794 + }, + { + "epoch": 1.25, + "learning_rate": 1.3124728883393822e-06, + "loss": 0.5217, + "step": 48795 + }, + { + "epoch": 1.25, + "learning_rate": 1.3124466033174068e-06, + "loss": 0.5742, + "step": 48796 + }, + { + "epoch": 1.25, + "learning_rate": 1.3124203180562059e-06, + "loss": 0.6719, + "step": 48797 + }, + { + "epoch": 1.25, + "learning_rate": 1.3123940325557987e-06, + "loss": 0.4382, + "step": 48798 + }, + { + "epoch": 1.25, + "learning_rate": 1.3123677468162058e-06, + "loss": 0.604, + "step": 48799 + }, + { + "epoch": 1.25, + "learning_rate": 1.3123414608374472e-06, + "loss": 0.7275, + "step": 48800 + }, + { + "epoch": 1.25, + "learning_rate": 1.312315174619543e-06, + "loss": 0.4717, + "step": 48801 + }, + { + "epoch": 1.25, + "learning_rate": 1.312288888162514e-06, + "loss": 0.5552, + "step": 48802 + }, + { + "epoch": 1.25, + "learning_rate": 1.3122626014663794e-06, + "loss": 0.569, + "step": 48803 + }, + { + "epoch": 1.25, + "learning_rate": 1.3122363145311595e-06, + "loss": 0.6538, + "step": 48804 + }, + { + "epoch": 1.25, + "learning_rate": 1.3122100273568748e-06, + "loss": 0.6531, + "step": 48805 + }, + { + "epoch": 1.25, + "learning_rate": 1.312183739943545e-06, + "loss": 0.4962, + "step": 48806 + }, + { + "epoch": 1.25, + "learning_rate": 1.3121574522911906e-06, + "loss": 0.5679, + "step": 48807 + }, + { + "epoch": 1.25, + "learning_rate": 1.3121311643998318e-06, + "loss": 0.7812, + "step": 48808 + }, + { + "epoch": 1.25, + "learning_rate": 1.3121048762694886e-06, + "loss": 0.6592, + "step": 48809 + }, + { + "epoch": 1.25, + "learning_rate": 1.3120785879001805e-06, + "loss": 0.4205, + "step": 48810 + }, + { + "epoch": 1.25, + "learning_rate": 1.3120522992919288e-06, + "loss": 0.5941, + "step": 48811 + }, + { + "epoch": 1.25, + "learning_rate": 1.3120260104447527e-06, + "loss": 0.8066, + "step": 48812 + }, + { + "epoch": 1.25, + "learning_rate": 1.3119997213586723e-06, + "loss": 0.6104, + "step": 48813 + }, + { + "epoch": 1.25, + "learning_rate": 1.3119734320337088e-06, + "loss": 0.708, + "step": 48814 + }, + { + "epoch": 1.25, + "learning_rate": 1.311947142469881e-06, + "loss": 0.7139, + "step": 48815 + }, + { + "epoch": 1.25, + "learning_rate": 1.31192085266721e-06, + "loss": 0.439, + "step": 48816 + }, + { + "epoch": 1.25, + "learning_rate": 1.3118945626257154e-06, + "loss": 0.6299, + "step": 48817 + }, + { + "epoch": 1.25, + "learning_rate": 1.3118682723454173e-06, + "loss": 0.5156, + "step": 48818 + }, + { + "epoch": 1.25, + "learning_rate": 1.311841981826336e-06, + "loss": 0.6147, + "step": 48819 + }, + { + "epoch": 1.25, + "learning_rate": 1.3118156910684919e-06, + "loss": 0.5679, + "step": 48820 + }, + { + "epoch": 1.25, + "learning_rate": 1.3117894000719046e-06, + "loss": 0.5327, + "step": 48821 + }, + { + "epoch": 1.25, + "learning_rate": 1.3117631088365948e-06, + "loss": 0.6924, + "step": 48822 + }, + { + "epoch": 1.25, + "learning_rate": 1.311736817362582e-06, + "loss": 0.6167, + "step": 48823 + }, + { + "epoch": 1.25, + "learning_rate": 1.311710525649887e-06, + "loss": 0.7764, + "step": 48824 + }, + { + "epoch": 1.25, + "learning_rate": 1.3116842336985292e-06, + "loss": 0.6035, + "step": 48825 + }, + { + "epoch": 1.25, + "learning_rate": 1.3116579415085294e-06, + "loss": 0.7603, + "step": 48826 + }, + { + "epoch": 1.25, + "learning_rate": 1.3116316490799074e-06, + "loss": 0.5654, + "step": 48827 + }, + { + "epoch": 1.25, + "learning_rate": 1.3116053564126834e-06, + "loss": 0.7578, + "step": 48828 + }, + { + "epoch": 1.25, + "learning_rate": 1.3115790635068773e-06, + "loss": 0.5459, + "step": 48829 + }, + { + "epoch": 1.25, + "learning_rate": 1.3115527703625096e-06, + "loss": 0.6475, + "step": 48830 + }, + { + "epoch": 1.25, + "learning_rate": 1.3115264769796e-06, + "loss": 0.7725, + "step": 48831 + }, + { + "epoch": 1.25, + "learning_rate": 1.3115001833581691e-06, + "loss": 0.5991, + "step": 48832 + }, + { + "epoch": 1.25, + "learning_rate": 1.3114738894982372e-06, + "loss": 0.6924, + "step": 48833 + }, + { + "epoch": 1.25, + "learning_rate": 1.3114475953998235e-06, + "loss": 0.4938, + "step": 48834 + }, + { + "epoch": 1.25, + "learning_rate": 1.3114213010629489e-06, + "loss": 0.6279, + "step": 48835 + }, + { + "epoch": 1.25, + "learning_rate": 1.3113950064876336e-06, + "loss": 0.6509, + "step": 48836 + }, + { + "epoch": 1.25, + "learning_rate": 1.3113687116738972e-06, + "loss": 0.6357, + "step": 48837 + }, + { + "epoch": 1.25, + "learning_rate": 1.3113424166217598e-06, + "loss": 0.7148, + "step": 48838 + }, + { + "epoch": 1.25, + "learning_rate": 1.3113161213312424e-06, + "loss": 0.7188, + "step": 48839 + }, + { + "epoch": 1.25, + "learning_rate": 1.3112898258023641e-06, + "loss": 0.7163, + "step": 48840 + }, + { + "epoch": 1.25, + "learning_rate": 1.3112635300351458e-06, + "loss": 0.7065, + "step": 48841 + }, + { + "epoch": 1.25, + "learning_rate": 1.3112372340296072e-06, + "loss": 0.5742, + "step": 48842 + }, + { + "epoch": 1.25, + "learning_rate": 1.3112109377857688e-06, + "loss": 0.6538, + "step": 48843 + }, + { + "epoch": 1.25, + "learning_rate": 1.31118464130365e-06, + "loss": 0.8057, + "step": 48844 + }, + { + "epoch": 1.25, + "learning_rate": 1.3111583445832719e-06, + "loss": 0.6709, + "step": 48845 + }, + { + "epoch": 1.25, + "learning_rate": 1.3111320476246537e-06, + "loss": 0.8223, + "step": 48846 + }, + { + "epoch": 1.25, + "learning_rate": 1.3111057504278166e-06, + "loss": 0.5249, + "step": 48847 + }, + { + "epoch": 1.25, + "learning_rate": 1.3110794529927796e-06, + "loss": 0.6787, + "step": 48848 + }, + { + "epoch": 1.25, + "learning_rate": 1.3110531553195635e-06, + "loss": 0.7158, + "step": 48849 + }, + { + "epoch": 1.25, + "learning_rate": 1.3110268574081885e-06, + "loss": 0.5566, + "step": 48850 + }, + { + "epoch": 1.25, + "learning_rate": 1.3110005592586744e-06, + "loss": 0.6431, + "step": 48851 + }, + { + "epoch": 1.25, + "learning_rate": 1.3109742608710415e-06, + "loss": 0.6831, + "step": 48852 + }, + { + "epoch": 1.25, + "learning_rate": 1.31094796224531e-06, + "loss": 0.6777, + "step": 48853 + }, + { + "epoch": 1.25, + "learning_rate": 1.3109216633814998e-06, + "loss": 0.6357, + "step": 48854 + }, + { + "epoch": 1.25, + "learning_rate": 1.3108953642796311e-06, + "loss": 0.7837, + "step": 48855 + }, + { + "epoch": 1.25, + "learning_rate": 1.310869064939724e-06, + "loss": 0.5615, + "step": 48856 + }, + { + "epoch": 1.25, + "learning_rate": 1.3108427653617991e-06, + "loss": 0.8135, + "step": 48857 + }, + { + "epoch": 1.25, + "learning_rate": 1.3108164655458762e-06, + "loss": 0.7666, + "step": 48858 + }, + { + "epoch": 1.25, + "learning_rate": 1.3107901654919752e-06, + "loss": 0.6328, + "step": 48859 + }, + { + "epoch": 1.25, + "learning_rate": 1.3107638652001165e-06, + "loss": 0.7246, + "step": 48860 + }, + { + "epoch": 1.25, + "learning_rate": 1.31073756467032e-06, + "loss": 0.8008, + "step": 48861 + }, + { + "epoch": 1.25, + "learning_rate": 1.3107112639026069e-06, + "loss": 0.5371, + "step": 48862 + }, + { + "epoch": 1.25, + "learning_rate": 1.3106849628969953e-06, + "loss": 0.6846, + "step": 48863 + }, + { + "epoch": 1.25, + "learning_rate": 1.3106586616535072e-06, + "loss": 0.7051, + "step": 48864 + }, + { + "epoch": 1.25, + "learning_rate": 1.3106323601721618e-06, + "loss": 0.7529, + "step": 48865 + }, + { + "epoch": 1.25, + "learning_rate": 1.3106060584529796e-06, + "loss": 0.4922, + "step": 48866 + }, + { + "epoch": 1.25, + "learning_rate": 1.3105797564959808e-06, + "loss": 0.5425, + "step": 48867 + }, + { + "epoch": 1.25, + "learning_rate": 1.3105534543011851e-06, + "loss": 0.7764, + "step": 48868 + }, + { + "epoch": 1.25, + "learning_rate": 1.310527151868613e-06, + "loss": 0.7334, + "step": 48869 + }, + { + "epoch": 1.25, + "learning_rate": 1.3105008491982845e-06, + "loss": 0.5664, + "step": 48870 + }, + { + "epoch": 1.25, + "learning_rate": 1.3104745462902195e-06, + "loss": 0.6177, + "step": 48871 + }, + { + "epoch": 1.25, + "learning_rate": 1.3104482431444392e-06, + "loss": 0.6348, + "step": 48872 + }, + { + "epoch": 1.25, + "learning_rate": 1.3104219397609622e-06, + "loss": 0.749, + "step": 48873 + }, + { + "epoch": 1.25, + "learning_rate": 1.3103956361398098e-06, + "loss": 0.7295, + "step": 48874 + }, + { + "epoch": 1.25, + "learning_rate": 1.3103693322810014e-06, + "loss": 0.7295, + "step": 48875 + }, + { + "epoch": 1.25, + "learning_rate": 1.3103430281845577e-06, + "loss": 0.5049, + "step": 48876 + }, + { + "epoch": 1.25, + "learning_rate": 1.3103167238504986e-06, + "loss": 0.6689, + "step": 48877 + }, + { + "epoch": 1.25, + "learning_rate": 1.3102904192788441e-06, + "loss": 0.6606, + "step": 48878 + }, + { + "epoch": 1.25, + "learning_rate": 1.3102641144696148e-06, + "loss": 0.5693, + "step": 48879 + }, + { + "epoch": 1.25, + "learning_rate": 1.3102378094228304e-06, + "loss": 0.4746, + "step": 48880 + }, + { + "epoch": 1.25, + "learning_rate": 1.310211504138511e-06, + "loss": 0.708, + "step": 48881 + }, + { + "epoch": 1.25, + "learning_rate": 1.3101851986166769e-06, + "loss": 0.6738, + "step": 48882 + }, + { + "epoch": 1.25, + "learning_rate": 1.3101588928573487e-06, + "loss": 0.6279, + "step": 48883 + }, + { + "epoch": 1.25, + "learning_rate": 1.3101325868605457e-06, + "loss": 0.7695, + "step": 48884 + }, + { + "epoch": 1.25, + "learning_rate": 1.3101062806262886e-06, + "loss": 0.6719, + "step": 48885 + }, + { + "epoch": 1.25, + "learning_rate": 1.3100799741545972e-06, + "loss": 0.7852, + "step": 48886 + }, + { + "epoch": 1.25, + "learning_rate": 1.310053667445492e-06, + "loss": 0.6504, + "step": 48887 + }, + { + "epoch": 1.25, + "learning_rate": 1.310027360498993e-06, + "loss": 0.4548, + "step": 48888 + }, + { + "epoch": 1.25, + "learning_rate": 1.31000105331512e-06, + "loss": 0.5161, + "step": 48889 + }, + { + "epoch": 1.25, + "learning_rate": 1.3099747458938937e-06, + "loss": 0.5354, + "step": 48890 + }, + { + "epoch": 1.25, + "learning_rate": 1.309948438235334e-06, + "loss": 0.6553, + "step": 48891 + }, + { + "epoch": 1.25, + "learning_rate": 1.309922130339461e-06, + "loss": 0.5371, + "step": 48892 + }, + { + "epoch": 1.25, + "learning_rate": 1.3098958222062951e-06, + "loss": 0.7378, + "step": 48893 + }, + { + "epoch": 1.25, + "learning_rate": 1.3098695138358555e-06, + "loss": 0.834, + "step": 48894 + }, + { + "epoch": 1.25, + "learning_rate": 1.3098432052281638e-06, + "loss": 0.5231, + "step": 48895 + }, + { + "epoch": 1.25, + "learning_rate": 1.309816896383239e-06, + "loss": 0.6914, + "step": 48896 + }, + { + "epoch": 1.25, + "learning_rate": 1.309790587301102e-06, + "loss": 0.8125, + "step": 48897 + }, + { + "epoch": 1.25, + "learning_rate": 1.3097642779817722e-06, + "loss": 0.7559, + "step": 48898 + }, + { + "epoch": 1.25, + "learning_rate": 1.3097379684252703e-06, + "loss": 0.5884, + "step": 48899 + }, + { + "epoch": 1.25, + "learning_rate": 1.3097116586316165e-06, + "loss": 0.7168, + "step": 48900 + }, + { + "epoch": 1.25, + "learning_rate": 1.3096853486008303e-06, + "loss": 0.4878, + "step": 48901 + }, + { + "epoch": 1.25, + "learning_rate": 1.3096590383329326e-06, + "loss": 0.8184, + "step": 48902 + }, + { + "epoch": 1.25, + "learning_rate": 1.3096327278279429e-06, + "loss": 0.6145, + "step": 48903 + }, + { + "epoch": 1.25, + "learning_rate": 1.309606417085882e-06, + "loss": 0.6523, + "step": 48904 + }, + { + "epoch": 1.25, + "learning_rate": 1.3095801061067695e-06, + "loss": 1.0234, + "step": 48905 + }, + { + "epoch": 1.25, + "learning_rate": 1.309553794890626e-06, + "loss": 0.4172, + "step": 48906 + }, + { + "epoch": 1.25, + "learning_rate": 1.3095274834374709e-06, + "loss": 0.4716, + "step": 48907 + }, + { + "epoch": 1.25, + "learning_rate": 1.3095011717473251e-06, + "loss": 0.6279, + "step": 48908 + }, + { + "epoch": 1.25, + "learning_rate": 1.3094748598202086e-06, + "loss": 0.5059, + "step": 48909 + }, + { + "epoch": 1.25, + "learning_rate": 1.3094485476561415e-06, + "loss": 0.5952, + "step": 48910 + }, + { + "epoch": 1.25, + "learning_rate": 1.3094222352551439e-06, + "loss": 0.603, + "step": 48911 + }, + { + "epoch": 1.25, + "learning_rate": 1.3093959226172358e-06, + "loss": 0.4216, + "step": 48912 + }, + { + "epoch": 1.25, + "learning_rate": 1.3093696097424372e-06, + "loss": 0.7412, + "step": 48913 + }, + { + "epoch": 1.25, + "learning_rate": 1.3093432966307687e-06, + "loss": 0.6133, + "step": 48914 + }, + { + "epoch": 1.25, + "learning_rate": 1.3093169832822502e-06, + "loss": 0.5854, + "step": 48915 + }, + { + "epoch": 1.25, + "learning_rate": 1.3092906696969021e-06, + "loss": 0.6133, + "step": 48916 + }, + { + "epoch": 1.25, + "learning_rate": 1.3092643558747444e-06, + "loss": 0.5535, + "step": 48917 + }, + { + "epoch": 1.25, + "learning_rate": 1.309238041815797e-06, + "loss": 0.6333, + "step": 48918 + }, + { + "epoch": 1.25, + "learning_rate": 1.3092117275200803e-06, + "loss": 0.5234, + "step": 48919 + }, + { + "epoch": 1.25, + "learning_rate": 1.3091854129876143e-06, + "loss": 0.5669, + "step": 48920 + }, + { + "epoch": 1.25, + "learning_rate": 1.3091590982184195e-06, + "loss": 0.8091, + "step": 48921 + }, + { + "epoch": 1.25, + "learning_rate": 1.3091327832125154e-06, + "loss": 0.6824, + "step": 48922 + }, + { + "epoch": 1.25, + "learning_rate": 1.3091064679699228e-06, + "loss": 0.6514, + "step": 48923 + }, + { + "epoch": 1.25, + "learning_rate": 1.3090801524906617e-06, + "loss": 0.5774, + "step": 48924 + }, + { + "epoch": 1.25, + "learning_rate": 1.309053836774752e-06, + "loss": 0.6504, + "step": 48925 + }, + { + "epoch": 1.25, + "learning_rate": 1.3090275208222142e-06, + "loss": 0.6265, + "step": 48926 + }, + { + "epoch": 1.25, + "learning_rate": 1.309001204633068e-06, + "loss": 0.668, + "step": 48927 + }, + { + "epoch": 1.25, + "learning_rate": 1.3089748882073338e-06, + "loss": 0.6968, + "step": 48928 + }, + { + "epoch": 1.25, + "learning_rate": 1.3089485715450316e-06, + "loss": 0.6841, + "step": 48929 + }, + { + "epoch": 1.25, + "learning_rate": 1.3089222546461819e-06, + "loss": 0.7744, + "step": 48930 + }, + { + "epoch": 1.25, + "learning_rate": 1.3088959375108045e-06, + "loss": 0.5298, + "step": 48931 + }, + { + "epoch": 1.25, + "learning_rate": 1.3088696201389197e-06, + "loss": 0.6763, + "step": 48932 + }, + { + "epoch": 1.25, + "learning_rate": 1.3088433025305478e-06, + "loss": 0.8066, + "step": 48933 + }, + { + "epoch": 1.25, + "learning_rate": 1.3088169846857086e-06, + "loss": 0.6646, + "step": 48934 + }, + { + "epoch": 1.25, + "learning_rate": 1.3087906666044227e-06, + "loss": 0.6123, + "step": 48935 + }, + { + "epoch": 1.25, + "learning_rate": 1.30876434828671e-06, + "loss": 0.6851, + "step": 48936 + }, + { + "epoch": 1.25, + "learning_rate": 1.3087380297325904e-06, + "loss": 0.5574, + "step": 48937 + }, + { + "epoch": 1.25, + "learning_rate": 1.3087117109420842e-06, + "loss": 0.7646, + "step": 48938 + }, + { + "epoch": 1.25, + "learning_rate": 1.3086853919152118e-06, + "loss": 0.7598, + "step": 48939 + }, + { + "epoch": 1.25, + "learning_rate": 1.308659072651993e-06, + "loss": 0.708, + "step": 48940 + }, + { + "epoch": 1.25, + "learning_rate": 1.3086327531524483e-06, + "loss": 0.6299, + "step": 48941 + }, + { + "epoch": 1.25, + "learning_rate": 1.308606433416598e-06, + "loss": 0.5396, + "step": 48942 + }, + { + "epoch": 1.25, + "learning_rate": 1.3085801134444615e-06, + "loss": 0.6655, + "step": 48943 + }, + { + "epoch": 1.25, + "learning_rate": 1.3085537932360592e-06, + "loss": 0.7432, + "step": 48944 + }, + { + "epoch": 1.25, + "learning_rate": 1.3085274727914119e-06, + "loss": 0.6396, + "step": 48945 + }, + { + "epoch": 1.25, + "learning_rate": 1.3085011521105393e-06, + "loss": 0.9316, + "step": 48946 + }, + { + "epoch": 1.25, + "learning_rate": 1.3084748311934614e-06, + "loss": 0.5493, + "step": 48947 + }, + { + "epoch": 1.25, + "learning_rate": 1.3084485100401987e-06, + "loss": 0.5723, + "step": 48948 + }, + { + "epoch": 1.25, + "learning_rate": 1.3084221886507706e-06, + "loss": 0.5859, + "step": 48949 + }, + { + "epoch": 1.25, + "learning_rate": 1.3083958670251984e-06, + "loss": 0.7725, + "step": 48950 + }, + { + "epoch": 1.25, + "learning_rate": 1.3083695451635015e-06, + "loss": 0.7676, + "step": 48951 + }, + { + "epoch": 1.25, + "learning_rate": 1.3083432230657003e-06, + "loss": 0.6079, + "step": 48952 + }, + { + "epoch": 1.25, + "learning_rate": 1.3083169007318146e-06, + "loss": 0.6108, + "step": 48953 + }, + { + "epoch": 1.25, + "learning_rate": 1.3082905781618652e-06, + "loss": 0.5938, + "step": 48954 + }, + { + "epoch": 1.25, + "learning_rate": 1.3082642553558714e-06, + "loss": 0.6689, + "step": 48955 + }, + { + "epoch": 1.25, + "learning_rate": 1.3082379323138543e-06, + "loss": 0.7178, + "step": 48956 + }, + { + "epoch": 1.25, + "learning_rate": 1.3082116090358332e-06, + "loss": 0.5535, + "step": 48957 + }, + { + "epoch": 1.25, + "learning_rate": 1.3081852855218292e-06, + "loss": 0.7393, + "step": 48958 + }, + { + "epoch": 1.25, + "learning_rate": 1.3081589617718614e-06, + "loss": 0.5488, + "step": 48959 + }, + { + "epoch": 1.25, + "learning_rate": 1.3081326377859506e-06, + "loss": 0.7773, + "step": 48960 + }, + { + "epoch": 1.25, + "learning_rate": 1.308106313564117e-06, + "loss": 0.8652, + "step": 48961 + }, + { + "epoch": 1.25, + "learning_rate": 1.3080799891063803e-06, + "loss": 0.6367, + "step": 48962 + }, + { + "epoch": 1.25, + "learning_rate": 1.308053664412761e-06, + "loss": 0.5012, + "step": 48963 + }, + { + "epoch": 1.25, + "learning_rate": 1.308027339483279e-06, + "loss": 0.5879, + "step": 48964 + }, + { + "epoch": 1.25, + "learning_rate": 1.3080010143179547e-06, + "loss": 0.6699, + "step": 48965 + }, + { + "epoch": 1.26, + "learning_rate": 1.3079746889168082e-06, + "loss": 0.7275, + "step": 48966 + }, + { + "epoch": 1.26, + "learning_rate": 1.30794836327986e-06, + "loss": 0.8213, + "step": 48967 + }, + { + "epoch": 1.26, + "learning_rate": 1.3079220374071294e-06, + "loss": 0.5771, + "step": 48968 + }, + { + "epoch": 1.26, + "learning_rate": 1.3078957112986371e-06, + "loss": 0.6074, + "step": 48969 + }, + { + "epoch": 1.26, + "learning_rate": 1.3078693849544034e-06, + "loss": 0.5801, + "step": 48970 + }, + { + "epoch": 1.26, + "learning_rate": 1.3078430583744484e-06, + "loss": 0.6611, + "step": 48971 + }, + { + "epoch": 1.26, + "learning_rate": 1.3078167315587919e-06, + "loss": 0.4805, + "step": 48972 + }, + { + "epoch": 1.26, + "learning_rate": 1.3077904045074544e-06, + "loss": 0.7056, + "step": 48973 + }, + { + "epoch": 1.26, + "learning_rate": 1.3077640772204556e-06, + "loss": 0.5977, + "step": 48974 + }, + { + "epoch": 1.26, + "learning_rate": 1.3077377496978167e-06, + "loss": 0.626, + "step": 48975 + }, + { + "epoch": 1.26, + "learning_rate": 1.3077114219395565e-06, + "loss": 0.8574, + "step": 48976 + }, + { + "epoch": 1.26, + "learning_rate": 1.3076850939456962e-06, + "loss": 0.6274, + "step": 48977 + }, + { + "epoch": 1.26, + "learning_rate": 1.3076587657162553e-06, + "loss": 0.5859, + "step": 48978 + }, + { + "epoch": 1.26, + "learning_rate": 1.3076324372512543e-06, + "loss": 0.6489, + "step": 48979 + }, + { + "epoch": 1.26, + "learning_rate": 1.3076061085507132e-06, + "loss": 0.7207, + "step": 48980 + }, + { + "epoch": 1.26, + "learning_rate": 1.3075797796146529e-06, + "loss": 0.8145, + "step": 48981 + }, + { + "epoch": 1.26, + "learning_rate": 1.3075534504430921e-06, + "loss": 0.6826, + "step": 48982 + }, + { + "epoch": 1.26, + "learning_rate": 1.307527121036052e-06, + "loss": 1.043, + "step": 48983 + }, + { + "epoch": 1.26, + "learning_rate": 1.3075007913935525e-06, + "loss": 0.6035, + "step": 48984 + }, + { + "epoch": 1.26, + "learning_rate": 1.307474461515614e-06, + "loss": 0.8184, + "step": 48985 + }, + { + "epoch": 1.26, + "learning_rate": 1.3074481314022563e-06, + "loss": 0.7646, + "step": 48986 + }, + { + "epoch": 1.26, + "learning_rate": 1.3074218010534996e-06, + "loss": 0.5103, + "step": 48987 + }, + { + "epoch": 1.26, + "learning_rate": 1.3073954704693643e-06, + "loss": 0.7427, + "step": 48988 + }, + { + "epoch": 1.26, + "learning_rate": 1.3073691396498705e-06, + "loss": 0.6177, + "step": 48989 + }, + { + "epoch": 1.26, + "learning_rate": 1.307342808595038e-06, + "loss": 0.6494, + "step": 48990 + }, + { + "epoch": 1.26, + "learning_rate": 1.3073164773048875e-06, + "loss": 0.5024, + "step": 48991 + }, + { + "epoch": 1.26, + "learning_rate": 1.307290145779439e-06, + "loss": 0.5342, + "step": 48992 + }, + { + "epoch": 1.26, + "learning_rate": 1.3072638140187122e-06, + "loss": 0.6104, + "step": 48993 + }, + { + "epoch": 1.26, + "learning_rate": 1.307237482022728e-06, + "loss": 0.6836, + "step": 48994 + }, + { + "epoch": 1.26, + "learning_rate": 1.3072111497915058e-06, + "loss": 0.7197, + "step": 48995 + }, + { + "epoch": 1.26, + "learning_rate": 1.3071848173250665e-06, + "loss": 0.6338, + "step": 48996 + }, + { + "epoch": 1.26, + "learning_rate": 1.3071584846234295e-06, + "loss": 0.6104, + "step": 48997 + }, + { + "epoch": 1.26, + "learning_rate": 1.307132151686616e-06, + "loss": 0.6772, + "step": 48998 + }, + { + "epoch": 1.26, + "learning_rate": 1.3071058185146448e-06, + "loss": 0.7017, + "step": 48999 + }, + { + "epoch": 1.26, + "learning_rate": 1.3070794851075374e-06, + "loss": 0.7676, + "step": 49000 + }, + { + "epoch": 1.26, + "learning_rate": 1.307053151465313e-06, + "loss": 0.71, + "step": 49001 + }, + { + "epoch": 1.26, + "learning_rate": 1.3070268175879924e-06, + "loss": 0.6519, + "step": 49002 + }, + { + "epoch": 1.26, + "learning_rate": 1.3070004834755951e-06, + "loss": 0.6768, + "step": 49003 + }, + { + "epoch": 1.26, + "learning_rate": 1.306974149128142e-06, + "loss": 0.6416, + "step": 49004 + }, + { + "epoch": 1.26, + "learning_rate": 1.3069478145456526e-06, + "loss": 0.8984, + "step": 49005 + }, + { + "epoch": 1.26, + "learning_rate": 1.3069214797281479e-06, + "loss": 0.8594, + "step": 49006 + }, + { + "epoch": 1.26, + "learning_rate": 1.3068951446756472e-06, + "loss": 0.6182, + "step": 49007 + }, + { + "epoch": 1.26, + "learning_rate": 1.3068688093881708e-06, + "loss": 0.5327, + "step": 49008 + }, + { + "epoch": 1.26, + "learning_rate": 1.3068424738657392e-06, + "loss": 0.7373, + "step": 49009 + }, + { + "epoch": 1.26, + "learning_rate": 1.3068161381083726e-06, + "loss": 0.5738, + "step": 49010 + }, + { + "epoch": 1.26, + "learning_rate": 1.306789802116091e-06, + "loss": 0.6582, + "step": 49011 + }, + { + "epoch": 1.26, + "learning_rate": 1.3067634658889141e-06, + "loss": 0.7373, + "step": 49012 + }, + { + "epoch": 1.26, + "learning_rate": 1.306737129426863e-06, + "loss": 0.582, + "step": 49013 + }, + { + "epoch": 1.26, + "learning_rate": 1.306710792729957e-06, + "loss": 0.5459, + "step": 49014 + }, + { + "epoch": 1.26, + "learning_rate": 1.3066844557982171e-06, + "loss": 0.5178, + "step": 49015 + }, + { + "epoch": 1.26, + "learning_rate": 1.3066581186316628e-06, + "loss": 0.6152, + "step": 49016 + }, + { + "epoch": 1.26, + "learning_rate": 1.3066317812303145e-06, + "loss": 0.6255, + "step": 49017 + }, + { + "epoch": 1.26, + "learning_rate": 1.3066054435941922e-06, + "loss": 0.7412, + "step": 49018 + }, + { + "epoch": 1.26, + "learning_rate": 1.3065791057233164e-06, + "loss": 0.6006, + "step": 49019 + }, + { + "epoch": 1.26, + "learning_rate": 1.3065527676177068e-06, + "loss": 0.4966, + "step": 49020 + }, + { + "epoch": 1.26, + "learning_rate": 1.3065264292773844e-06, + "loss": 0.4592, + "step": 49021 + }, + { + "epoch": 1.26, + "learning_rate": 1.3065000907023682e-06, + "loss": 0.7002, + "step": 49022 + }, + { + "epoch": 1.26, + "learning_rate": 1.3064737518926794e-06, + "loss": 0.584, + "step": 49023 + }, + { + "epoch": 1.26, + "learning_rate": 1.3064474128483373e-06, + "loss": 0.5449, + "step": 49024 + }, + { + "epoch": 1.26, + "learning_rate": 1.3064210735693628e-06, + "loss": 0.5728, + "step": 49025 + }, + { + "epoch": 1.26, + "learning_rate": 1.306394734055776e-06, + "loss": 0.5132, + "step": 49026 + }, + { + "epoch": 1.26, + "learning_rate": 1.3063683943075964e-06, + "loss": 0.6143, + "step": 49027 + }, + { + "epoch": 1.26, + "learning_rate": 1.306342054324845e-06, + "loss": 0.6768, + "step": 49028 + }, + { + "epoch": 1.26, + "learning_rate": 1.3063157141075411e-06, + "loss": 0.6318, + "step": 49029 + }, + { + "epoch": 1.26, + "learning_rate": 1.3062893736557056e-06, + "loss": 0.623, + "step": 49030 + }, + { + "epoch": 1.26, + "learning_rate": 1.3062630329693585e-06, + "loss": 0.7168, + "step": 49031 + }, + { + "epoch": 1.26, + "learning_rate": 1.30623669204852e-06, + "loss": 0.7373, + "step": 49032 + }, + { + "epoch": 1.26, + "learning_rate": 1.30621035089321e-06, + "loss": 1.0176, + "step": 49033 + }, + { + "epoch": 1.26, + "learning_rate": 1.3061840095034484e-06, + "loss": 0.5513, + "step": 49034 + }, + { + "epoch": 1.26, + "learning_rate": 1.3061576678792564e-06, + "loss": 0.6089, + "step": 49035 + }, + { + "epoch": 1.26, + "learning_rate": 1.3061313260206532e-06, + "loss": 0.7139, + "step": 49036 + }, + { + "epoch": 1.26, + "learning_rate": 1.3061049839276593e-06, + "loss": 0.6541, + "step": 49037 + }, + { + "epoch": 1.26, + "learning_rate": 1.3060786416002952e-06, + "loss": 0.709, + "step": 49038 + }, + { + "epoch": 1.26, + "learning_rate": 1.3060522990385802e-06, + "loss": 0.6973, + "step": 49039 + }, + { + "epoch": 1.26, + "learning_rate": 1.3060259562425356e-06, + "loss": 0.7129, + "step": 49040 + }, + { + "epoch": 1.26, + "learning_rate": 1.305999613212181e-06, + "loss": 0.6406, + "step": 49041 + }, + { + "epoch": 1.26, + "learning_rate": 1.3059732699475361e-06, + "loss": 0.7021, + "step": 49042 + }, + { + "epoch": 1.26, + "learning_rate": 1.3059469264486217e-06, + "loss": 0.6536, + "step": 49043 + }, + { + "epoch": 1.26, + "learning_rate": 1.305920582715458e-06, + "loss": 0.4204, + "step": 49044 + }, + { + "epoch": 1.26, + "learning_rate": 1.3058942387480647e-06, + "loss": 0.5911, + "step": 49045 + }, + { + "epoch": 1.26, + "learning_rate": 1.3058678945464627e-06, + "loss": 0.7598, + "step": 49046 + }, + { + "epoch": 1.26, + "learning_rate": 1.3058415501106712e-06, + "loss": 0.623, + "step": 49047 + }, + { + "epoch": 1.26, + "learning_rate": 1.3058152054407113e-06, + "loss": 0.5908, + "step": 49048 + }, + { + "epoch": 1.26, + "learning_rate": 1.3057888605366025e-06, + "loss": 0.7959, + "step": 49049 + }, + { + "epoch": 1.26, + "learning_rate": 1.3057625153983654e-06, + "loss": 0.7852, + "step": 49050 + }, + { + "epoch": 1.26, + "learning_rate": 1.30573617002602e-06, + "loss": 0.7349, + "step": 49051 + }, + { + "epoch": 1.26, + "learning_rate": 1.3057098244195864e-06, + "loss": 0.5991, + "step": 49052 + }, + { + "epoch": 1.26, + "learning_rate": 1.3056834785790845e-06, + "loss": 0.5908, + "step": 49053 + }, + { + "epoch": 1.26, + "learning_rate": 1.3056571325045354e-06, + "loss": 0.5037, + "step": 49054 + }, + { + "epoch": 1.26, + "learning_rate": 1.305630786195958e-06, + "loss": 0.6641, + "step": 49055 + }, + { + "epoch": 1.26, + "learning_rate": 1.3056044396533738e-06, + "loss": 0.6523, + "step": 49056 + }, + { + "epoch": 1.26, + "learning_rate": 1.3055780928768023e-06, + "loss": 0.6621, + "step": 49057 + }, + { + "epoch": 1.26, + "learning_rate": 1.3055517458662634e-06, + "loss": 0.791, + "step": 49058 + }, + { + "epoch": 1.26, + "learning_rate": 1.3055253986217775e-06, + "loss": 0.5498, + "step": 49059 + }, + { + "epoch": 1.26, + "learning_rate": 1.3054990511433653e-06, + "loss": 0.5801, + "step": 49060 + }, + { + "epoch": 1.26, + "learning_rate": 1.3054727034310464e-06, + "loss": 0.7246, + "step": 49061 + }, + { + "epoch": 1.26, + "learning_rate": 1.3054463554848408e-06, + "loss": 0.6393, + "step": 49062 + }, + { + "epoch": 1.26, + "learning_rate": 1.305420007304769e-06, + "loss": 0.6611, + "step": 49063 + }, + { + "epoch": 1.26, + "learning_rate": 1.3053936588908513e-06, + "loss": 0.6294, + "step": 49064 + }, + { + "epoch": 1.26, + "learning_rate": 1.3053673102431078e-06, + "loss": 0.7725, + "step": 49065 + }, + { + "epoch": 1.26, + "learning_rate": 1.3053409613615584e-06, + "loss": 0.5132, + "step": 49066 + }, + { + "epoch": 1.26, + "learning_rate": 1.3053146122462239e-06, + "loss": 0.6826, + "step": 49067 + }, + { + "epoch": 1.26, + "learning_rate": 1.3052882628971235e-06, + "loss": 0.6411, + "step": 49068 + }, + { + "epoch": 1.26, + "learning_rate": 1.305261913314278e-06, + "loss": 0.4893, + "step": 49069 + }, + { + "epoch": 1.26, + "learning_rate": 1.3052355634977076e-06, + "loss": 0.6196, + "step": 49070 + }, + { + "epoch": 1.26, + "learning_rate": 1.3052092134474325e-06, + "loss": 0.7246, + "step": 49071 + }, + { + "epoch": 1.26, + "learning_rate": 1.3051828631634727e-06, + "loss": 0.7695, + "step": 49072 + }, + { + "epoch": 1.26, + "learning_rate": 1.3051565126458485e-06, + "loss": 0.6206, + "step": 49073 + }, + { + "epoch": 1.26, + "learning_rate": 1.3051301618945795e-06, + "loss": 0.6846, + "step": 49074 + }, + { + "epoch": 1.26, + "learning_rate": 1.3051038109096868e-06, + "loss": 0.626, + "step": 49075 + }, + { + "epoch": 1.26, + "learning_rate": 1.3050774596911902e-06, + "loss": 0.707, + "step": 49076 + }, + { + "epoch": 1.26, + "learning_rate": 1.3050511082391095e-06, + "loss": 0.3888, + "step": 49077 + }, + { + "epoch": 1.26, + "learning_rate": 1.3050247565534653e-06, + "loss": 0.6421, + "step": 49078 + }, + { + "epoch": 1.26, + "learning_rate": 1.3049984046342777e-06, + "loss": 0.7354, + "step": 49079 + }, + { + "epoch": 1.26, + "learning_rate": 1.3049720524815669e-06, + "loss": 0.5632, + "step": 49080 + }, + { + "epoch": 1.26, + "learning_rate": 1.304945700095353e-06, + "loss": 0.7422, + "step": 49081 + }, + { + "epoch": 1.26, + "learning_rate": 1.3049193474756562e-06, + "loss": 0.6013, + "step": 49082 + }, + { + "epoch": 1.26, + "learning_rate": 1.3048929946224966e-06, + "loss": 0.748, + "step": 49083 + }, + { + "epoch": 1.26, + "learning_rate": 1.3048666415358945e-06, + "loss": 0.7129, + "step": 49084 + }, + { + "epoch": 1.26, + "learning_rate": 1.3048402882158698e-06, + "loss": 0.5762, + "step": 49085 + }, + { + "epoch": 1.26, + "learning_rate": 1.3048139346624434e-06, + "loss": 0.6934, + "step": 49086 + }, + { + "epoch": 1.26, + "learning_rate": 1.3047875808756345e-06, + "loss": 0.6553, + "step": 49087 + }, + { + "epoch": 1.26, + "learning_rate": 1.3047612268554643e-06, + "loss": 0.7793, + "step": 49088 + }, + { + "epoch": 1.26, + "learning_rate": 1.3047348726019519e-06, + "loss": 0.5293, + "step": 49089 + }, + { + "epoch": 1.26, + "learning_rate": 1.3047085181151183e-06, + "loss": 0.5693, + "step": 49090 + }, + { + "epoch": 1.26, + "learning_rate": 1.3046821633949833e-06, + "loss": 0.5615, + "step": 49091 + }, + { + "epoch": 1.26, + "learning_rate": 1.3046558084415674e-06, + "loss": 0.6538, + "step": 49092 + }, + { + "epoch": 1.26, + "learning_rate": 1.3046294532548902e-06, + "loss": 0.6758, + "step": 49093 + }, + { + "epoch": 1.26, + "learning_rate": 1.3046030978349726e-06, + "loss": 0.54, + "step": 49094 + }, + { + "epoch": 1.26, + "learning_rate": 1.3045767421818341e-06, + "loss": 0.522, + "step": 49095 + }, + { + "epoch": 1.26, + "learning_rate": 1.3045503862954955e-06, + "loss": 0.8721, + "step": 49096 + }, + { + "epoch": 1.26, + "learning_rate": 1.3045240301759763e-06, + "loss": 0.7012, + "step": 49097 + }, + { + "epoch": 1.26, + "learning_rate": 1.3044976738232973e-06, + "loss": 0.6611, + "step": 49098 + }, + { + "epoch": 1.26, + "learning_rate": 1.3044713172374784e-06, + "loss": 0.6729, + "step": 49099 + }, + { + "epoch": 1.26, + "learning_rate": 1.30444496041854e-06, + "loss": 0.7344, + "step": 49100 + }, + { + "epoch": 1.26, + "learning_rate": 1.3044186033665016e-06, + "loss": 0.5771, + "step": 49101 + }, + { + "epoch": 1.26, + "learning_rate": 1.3043922460813842e-06, + "loss": 0.5332, + "step": 49102 + }, + { + "epoch": 1.26, + "learning_rate": 1.3043658885632075e-06, + "loss": 0.8291, + "step": 49103 + }, + { + "epoch": 1.26, + "learning_rate": 1.304339530811992e-06, + "loss": 0.645, + "step": 49104 + }, + { + "epoch": 1.26, + "learning_rate": 1.3043131728277577e-06, + "loss": 0.7227, + "step": 49105 + }, + { + "epoch": 1.26, + "learning_rate": 1.3042868146105248e-06, + "loss": 0.7373, + "step": 49106 + }, + { + "epoch": 1.26, + "learning_rate": 1.3042604561603133e-06, + "loss": 0.6816, + "step": 49107 + }, + { + "epoch": 1.26, + "learning_rate": 1.3042340974771437e-06, + "loss": 0.7471, + "step": 49108 + }, + { + "epoch": 1.26, + "learning_rate": 1.3042077385610361e-06, + "loss": 0.4557, + "step": 49109 + }, + { + "epoch": 1.26, + "learning_rate": 1.3041813794120104e-06, + "loss": 0.6572, + "step": 49110 + }, + { + "epoch": 1.26, + "learning_rate": 1.3041550200300875e-06, + "loss": 0.5918, + "step": 49111 + }, + { + "epoch": 1.26, + "learning_rate": 1.3041286604152866e-06, + "loss": 0.6523, + "step": 49112 + }, + { + "epoch": 1.26, + "learning_rate": 1.3041023005676286e-06, + "loss": 0.5869, + "step": 49113 + }, + { + "epoch": 1.26, + "learning_rate": 1.304075940487133e-06, + "loss": 0.7031, + "step": 49114 + }, + { + "epoch": 1.26, + "learning_rate": 1.304049580173821e-06, + "loss": 0.8184, + "step": 49115 + }, + { + "epoch": 1.26, + "learning_rate": 1.3040232196277122e-06, + "loss": 0.9551, + "step": 49116 + }, + { + "epoch": 1.26, + "learning_rate": 1.303996858848827e-06, + "loss": 0.6685, + "step": 49117 + }, + { + "epoch": 1.26, + "learning_rate": 1.3039704978371847e-06, + "loss": 0.6289, + "step": 49118 + }, + { + "epoch": 1.26, + "learning_rate": 1.3039441365928063e-06, + "loss": 0.6675, + "step": 49119 + }, + { + "epoch": 1.26, + "learning_rate": 1.303917775115712e-06, + "loss": 0.6143, + "step": 49120 + }, + { + "epoch": 1.26, + "learning_rate": 1.3038914134059221e-06, + "loss": 0.4495, + "step": 49121 + }, + { + "epoch": 1.26, + "learning_rate": 1.303865051463456e-06, + "loss": 0.6401, + "step": 49122 + }, + { + "epoch": 1.26, + "learning_rate": 1.3038386892883348e-06, + "loss": 0.7529, + "step": 49123 + }, + { + "epoch": 1.26, + "learning_rate": 1.3038123268805781e-06, + "loss": 0.5856, + "step": 49124 + }, + { + "epoch": 1.26, + "learning_rate": 1.3037859642402063e-06, + "loss": 0.4905, + "step": 49125 + }, + { + "epoch": 1.26, + "learning_rate": 1.3037596013672398e-06, + "loss": 0.7021, + "step": 49126 + }, + { + "epoch": 1.26, + "learning_rate": 1.3037332382616982e-06, + "loss": 0.645, + "step": 49127 + }, + { + "epoch": 1.26, + "learning_rate": 1.3037068749236022e-06, + "loss": 0.5691, + "step": 49128 + }, + { + "epoch": 1.26, + "learning_rate": 1.3036805113529716e-06, + "loss": 0.6768, + "step": 49129 + }, + { + "epoch": 1.26, + "learning_rate": 1.303654147549827e-06, + "loss": 0.5083, + "step": 49130 + }, + { + "epoch": 1.26, + "learning_rate": 1.3036277835141884e-06, + "loss": 0.5393, + "step": 49131 + }, + { + "epoch": 1.26, + "learning_rate": 1.303601419246076e-06, + "loss": 0.5767, + "step": 49132 + }, + { + "epoch": 1.26, + "learning_rate": 1.3035750547455097e-06, + "loss": 0.527, + "step": 49133 + }, + { + "epoch": 1.26, + "learning_rate": 1.3035486900125104e-06, + "loss": 0.6543, + "step": 49134 + }, + { + "epoch": 1.26, + "learning_rate": 1.3035223250470972e-06, + "loss": 0.4976, + "step": 49135 + }, + { + "epoch": 1.26, + "learning_rate": 1.3034959598492913e-06, + "loss": 0.5813, + "step": 49136 + }, + { + "epoch": 1.26, + "learning_rate": 1.3034695944191125e-06, + "loss": 0.7178, + "step": 49137 + }, + { + "epoch": 1.26, + "learning_rate": 1.3034432287565808e-06, + "loss": 0.7168, + "step": 49138 + }, + { + "epoch": 1.26, + "learning_rate": 1.3034168628617167e-06, + "loss": 0.4937, + "step": 49139 + }, + { + "epoch": 1.26, + "learning_rate": 1.3033904967345403e-06, + "loss": 0.5552, + "step": 49140 + }, + { + "epoch": 1.26, + "learning_rate": 1.3033641303750717e-06, + "loss": 0.6348, + "step": 49141 + }, + { + "epoch": 1.26, + "learning_rate": 1.3033377637833314e-06, + "loss": 0.8076, + "step": 49142 + }, + { + "epoch": 1.26, + "learning_rate": 1.303311396959339e-06, + "loss": 0.6309, + "step": 49143 + }, + { + "epoch": 1.26, + "learning_rate": 1.303285029903115e-06, + "loss": 0.6934, + "step": 49144 + }, + { + "epoch": 1.26, + "learning_rate": 1.3032586626146796e-06, + "loss": 0.6252, + "step": 49145 + }, + { + "epoch": 1.26, + "learning_rate": 1.303232295094053e-06, + "loss": 0.8584, + "step": 49146 + }, + { + "epoch": 1.26, + "learning_rate": 1.3032059273412555e-06, + "loss": 0.666, + "step": 49147 + }, + { + "epoch": 1.26, + "learning_rate": 1.303179559356307e-06, + "loss": 0.665, + "step": 49148 + }, + { + "epoch": 1.26, + "learning_rate": 1.3031531911392279e-06, + "loss": 0.6465, + "step": 49149 + }, + { + "epoch": 1.26, + "learning_rate": 1.3031268226900385e-06, + "loss": 0.6064, + "step": 49150 + }, + { + "epoch": 1.26, + "learning_rate": 1.303100454008759e-06, + "loss": 0.7578, + "step": 49151 + }, + { + "epoch": 1.26, + "learning_rate": 1.303074085095409e-06, + "loss": 0.7852, + "step": 49152 + }, + { + "epoch": 1.26, + "learning_rate": 1.3030477159500093e-06, + "loss": 0.5923, + "step": 49153 + }, + { + "epoch": 1.26, + "learning_rate": 1.3030213465725797e-06, + "loss": 0.4659, + "step": 49154 + }, + { + "epoch": 1.26, + "learning_rate": 1.3029949769631405e-06, + "loss": 0.6768, + "step": 49155 + }, + { + "epoch": 1.26, + "learning_rate": 1.3029686071217123e-06, + "loss": 0.6436, + "step": 49156 + }, + { + "epoch": 1.26, + "learning_rate": 1.302942237048315e-06, + "loss": 0.7598, + "step": 49157 + }, + { + "epoch": 1.26, + "learning_rate": 1.3029158667429684e-06, + "loss": 0.6377, + "step": 49158 + }, + { + "epoch": 1.26, + "learning_rate": 1.3028894962056935e-06, + "loss": 0.6104, + "step": 49159 + }, + { + "epoch": 1.26, + "learning_rate": 1.3028631254365098e-06, + "loss": 0.585, + "step": 49160 + }, + { + "epoch": 1.26, + "learning_rate": 1.302836754435438e-06, + "loss": 0.7139, + "step": 49161 + }, + { + "epoch": 1.26, + "learning_rate": 1.3028103832024977e-06, + "loss": 0.5264, + "step": 49162 + }, + { + "epoch": 1.26, + "learning_rate": 1.3027840117377093e-06, + "loss": 0.7412, + "step": 49163 + }, + { + "epoch": 1.26, + "learning_rate": 1.3027576400410933e-06, + "loss": 0.7363, + "step": 49164 + }, + { + "epoch": 1.26, + "learning_rate": 1.30273126811267e-06, + "loss": 0.5425, + "step": 49165 + }, + { + "epoch": 1.26, + "learning_rate": 1.3027048959524586e-06, + "loss": 0.7725, + "step": 49166 + }, + { + "epoch": 1.26, + "learning_rate": 1.3026785235604804e-06, + "loss": 0.6367, + "step": 49167 + }, + { + "epoch": 1.26, + "learning_rate": 1.3026521509367552e-06, + "loss": 0.5938, + "step": 49168 + }, + { + "epoch": 1.26, + "learning_rate": 1.3026257780813032e-06, + "loss": 0.6362, + "step": 49169 + }, + { + "epoch": 1.26, + "learning_rate": 1.3025994049941441e-06, + "loss": 0.5361, + "step": 49170 + }, + { + "epoch": 1.26, + "learning_rate": 1.3025730316752993e-06, + "loss": 0.7285, + "step": 49171 + }, + { + "epoch": 1.26, + "learning_rate": 1.3025466581247877e-06, + "loss": 0.6826, + "step": 49172 + }, + { + "epoch": 1.26, + "learning_rate": 1.3025202843426302e-06, + "loss": 0.7109, + "step": 49173 + }, + { + "epoch": 1.26, + "learning_rate": 1.3024939103288467e-06, + "loss": 0.6934, + "step": 49174 + }, + { + "epoch": 1.26, + "learning_rate": 1.3024675360834575e-06, + "loss": 0.6416, + "step": 49175 + }, + { + "epoch": 1.26, + "learning_rate": 1.3024411616064831e-06, + "loss": 0.874, + "step": 49176 + }, + { + "epoch": 1.26, + "learning_rate": 1.3024147868979433e-06, + "loss": 0.6538, + "step": 49177 + }, + { + "epoch": 1.26, + "learning_rate": 1.3023884119578585e-06, + "loss": 0.6235, + "step": 49178 + }, + { + "epoch": 1.26, + "learning_rate": 1.3023620367862485e-06, + "loss": 0.5862, + "step": 49179 + }, + { + "epoch": 1.26, + "learning_rate": 1.302335661383134e-06, + "loss": 0.7231, + "step": 49180 + }, + { + "epoch": 1.26, + "learning_rate": 1.302309285748535e-06, + "loss": 0.666, + "step": 49181 + }, + { + "epoch": 1.26, + "learning_rate": 1.3022829098824717e-06, + "loss": 0.396, + "step": 49182 + }, + { + "epoch": 1.26, + "learning_rate": 1.302256533784964e-06, + "loss": 0.5596, + "step": 49183 + }, + { + "epoch": 1.26, + "learning_rate": 1.3022301574560326e-06, + "loss": 0.7832, + "step": 49184 + }, + { + "epoch": 1.26, + "learning_rate": 1.3022037808956975e-06, + "loss": 0.6104, + "step": 49185 + }, + { + "epoch": 1.26, + "learning_rate": 1.3021774041039788e-06, + "loss": 0.7686, + "step": 49186 + }, + { + "epoch": 1.26, + "learning_rate": 1.3021510270808966e-06, + "loss": 0.7285, + "step": 49187 + }, + { + "epoch": 1.26, + "learning_rate": 1.3021246498264716e-06, + "loss": 0.7705, + "step": 49188 + }, + { + "epoch": 1.26, + "learning_rate": 1.3020982723407233e-06, + "loss": 0.668, + "step": 49189 + }, + { + "epoch": 1.26, + "learning_rate": 1.3020718946236724e-06, + "loss": 0.5425, + "step": 49190 + }, + { + "epoch": 1.26, + "learning_rate": 1.302045516675339e-06, + "loss": 0.6504, + "step": 49191 + }, + { + "epoch": 1.26, + "learning_rate": 1.302019138495743e-06, + "loss": 0.6548, + "step": 49192 + }, + { + "epoch": 1.26, + "learning_rate": 1.301992760084905e-06, + "loss": 0.498, + "step": 49193 + }, + { + "epoch": 1.26, + "learning_rate": 1.301966381442845e-06, + "loss": 0.6729, + "step": 49194 + }, + { + "epoch": 1.26, + "learning_rate": 1.3019400025695835e-06, + "loss": 0.7197, + "step": 49195 + }, + { + "epoch": 1.26, + "learning_rate": 1.30191362346514e-06, + "loss": 0.561, + "step": 49196 + }, + { + "epoch": 1.26, + "learning_rate": 1.3018872441295353e-06, + "loss": 0.6309, + "step": 49197 + }, + { + "epoch": 1.26, + "learning_rate": 1.3018608645627893e-06, + "loss": 0.8154, + "step": 49198 + }, + { + "epoch": 1.26, + "learning_rate": 1.3018344847649225e-06, + "loss": 0.5786, + "step": 49199 + }, + { + "epoch": 1.26, + "learning_rate": 1.3018081047359549e-06, + "loss": 0.6084, + "step": 49200 + }, + { + "epoch": 1.26, + "learning_rate": 1.301781724475907e-06, + "loss": 0.7207, + "step": 49201 + }, + { + "epoch": 1.26, + "learning_rate": 1.3017553439847979e-06, + "loss": 0.7529, + "step": 49202 + }, + { + "epoch": 1.26, + "learning_rate": 1.3017289632626491e-06, + "loss": 0.5541, + "step": 49203 + }, + { + "epoch": 1.26, + "learning_rate": 1.3017025823094802e-06, + "loss": 0.7393, + "step": 49204 + }, + { + "epoch": 1.26, + "learning_rate": 1.3016762011253119e-06, + "loss": 0.7344, + "step": 49205 + }, + { + "epoch": 1.26, + "learning_rate": 1.3016498197101636e-06, + "loss": 0.6816, + "step": 49206 + }, + { + "epoch": 1.26, + "learning_rate": 1.301623438064056e-06, + "loss": 0.4802, + "step": 49207 + }, + { + "epoch": 1.26, + "learning_rate": 1.301597056187009e-06, + "loss": 0.6006, + "step": 49208 + }, + { + "epoch": 1.26, + "learning_rate": 1.3015706740790433e-06, + "loss": 0.6172, + "step": 49209 + }, + { + "epoch": 1.26, + "learning_rate": 1.3015442917401789e-06, + "loss": 0.5605, + "step": 49210 + }, + { + "epoch": 1.26, + "learning_rate": 1.3015179091704353e-06, + "loss": 0.6997, + "step": 49211 + }, + { + "epoch": 1.26, + "learning_rate": 1.3014915263698338e-06, + "loss": 0.4829, + "step": 49212 + }, + { + "epoch": 1.26, + "learning_rate": 1.3014651433383941e-06, + "loss": 0.7637, + "step": 49213 + }, + { + "epoch": 1.26, + "learning_rate": 1.3014387600761363e-06, + "loss": 0.6445, + "step": 49214 + }, + { + "epoch": 1.26, + "learning_rate": 1.3014123765830807e-06, + "loss": 0.6675, + "step": 49215 + }, + { + "epoch": 1.26, + "learning_rate": 1.3013859928592475e-06, + "loss": 0.751, + "step": 49216 + }, + { + "epoch": 1.26, + "learning_rate": 1.3013596089046568e-06, + "loss": 0.7734, + "step": 49217 + }, + { + "epoch": 1.26, + "learning_rate": 1.3013332247193291e-06, + "loss": 0.5808, + "step": 49218 + }, + { + "epoch": 1.26, + "learning_rate": 1.3013068403032841e-06, + "loss": 0.8223, + "step": 49219 + }, + { + "epoch": 1.26, + "learning_rate": 1.301280455656543e-06, + "loss": 0.7285, + "step": 49220 + }, + { + "epoch": 1.26, + "learning_rate": 1.3012540707791246e-06, + "loss": 0.6768, + "step": 49221 + }, + { + "epoch": 1.26, + "learning_rate": 1.30122768567105e-06, + "loss": 0.6211, + "step": 49222 + }, + { + "epoch": 1.26, + "learning_rate": 1.3012013003323393e-06, + "loss": 0.5146, + "step": 49223 + }, + { + "epoch": 1.26, + "learning_rate": 1.3011749147630123e-06, + "loss": 0.6377, + "step": 49224 + }, + { + "epoch": 1.26, + "learning_rate": 1.3011485289630902e-06, + "loss": 0.5137, + "step": 49225 + }, + { + "epoch": 1.26, + "learning_rate": 1.301122142932592e-06, + "loss": 0.428, + "step": 49226 + }, + { + "epoch": 1.26, + "learning_rate": 1.3010957566715383e-06, + "loss": 0.7441, + "step": 49227 + }, + { + "epoch": 1.26, + "learning_rate": 1.3010693701799498e-06, + "loss": 0.6416, + "step": 49228 + }, + { + "epoch": 1.26, + "learning_rate": 1.301042983457846e-06, + "loss": 0.7168, + "step": 49229 + }, + { + "epoch": 1.26, + "learning_rate": 1.3010165965052477e-06, + "loss": 0.7266, + "step": 49230 + }, + { + "epoch": 1.26, + "learning_rate": 1.300990209322175e-06, + "loss": 0.6846, + "step": 49231 + }, + { + "epoch": 1.26, + "learning_rate": 1.3009638219086477e-06, + "loss": 0.4612, + "step": 49232 + }, + { + "epoch": 1.26, + "learning_rate": 1.300937434264686e-06, + "loss": 0.6973, + "step": 49233 + }, + { + "epoch": 1.26, + "learning_rate": 1.3009110463903106e-06, + "loss": 0.7627, + "step": 49234 + }, + { + "epoch": 1.26, + "learning_rate": 1.3008846582855415e-06, + "loss": 0.6572, + "step": 49235 + }, + { + "epoch": 1.26, + "learning_rate": 1.3008582699503987e-06, + "loss": 0.6396, + "step": 49236 + }, + { + "epoch": 1.26, + "learning_rate": 1.3008318813849026e-06, + "loss": 0.7754, + "step": 49237 + }, + { + "epoch": 1.26, + "learning_rate": 1.3008054925890732e-06, + "loss": 0.7207, + "step": 49238 + }, + { + "epoch": 1.26, + "learning_rate": 1.3007791035629311e-06, + "loss": 0.7568, + "step": 49239 + }, + { + "epoch": 1.26, + "learning_rate": 1.3007527143064962e-06, + "loss": 0.7471, + "step": 49240 + }, + { + "epoch": 1.26, + "learning_rate": 1.300726324819789e-06, + "loss": 0.5903, + "step": 49241 + }, + { + "epoch": 1.26, + "learning_rate": 1.3006999351028291e-06, + "loss": 0.7051, + "step": 49242 + }, + { + "epoch": 1.26, + "learning_rate": 1.3006735451556374e-06, + "loss": 0.6719, + "step": 49243 + }, + { + "epoch": 1.26, + "learning_rate": 1.3006471549782333e-06, + "loss": 0.8047, + "step": 49244 + }, + { + "epoch": 1.26, + "learning_rate": 1.3006207645706383e-06, + "loss": 0.5334, + "step": 49245 + }, + { + "epoch": 1.26, + "learning_rate": 1.3005943739328712e-06, + "loss": 0.6582, + "step": 49246 + }, + { + "epoch": 1.26, + "learning_rate": 1.300567983064953e-06, + "loss": 0.6062, + "step": 49247 + }, + { + "epoch": 1.26, + "learning_rate": 1.3005415919669036e-06, + "loss": 0.7354, + "step": 49248 + }, + { + "epoch": 1.26, + "learning_rate": 1.3005152006387435e-06, + "loss": 0.6494, + "step": 49249 + }, + { + "epoch": 1.26, + "learning_rate": 1.3004888090804927e-06, + "loss": 0.5303, + "step": 49250 + }, + { + "epoch": 1.26, + "learning_rate": 1.3004624172921713e-06, + "loss": 0.5918, + "step": 49251 + }, + { + "epoch": 1.26, + "learning_rate": 1.3004360252737996e-06, + "loss": 0.668, + "step": 49252 + }, + { + "epoch": 1.26, + "learning_rate": 1.300409633025398e-06, + "loss": 0.5615, + "step": 49253 + }, + { + "epoch": 1.26, + "learning_rate": 1.3003832405469864e-06, + "loss": 0.6592, + "step": 49254 + }, + { + "epoch": 1.26, + "learning_rate": 1.3003568478385854e-06, + "loss": 0.6489, + "step": 49255 + }, + { + "epoch": 1.26, + "learning_rate": 1.300330454900215e-06, + "loss": 0.8018, + "step": 49256 + }, + { + "epoch": 1.26, + "learning_rate": 1.300304061731895e-06, + "loss": 0.6514, + "step": 49257 + }, + { + "epoch": 1.26, + "learning_rate": 1.3002776683336462e-06, + "loss": 0.6133, + "step": 49258 + }, + { + "epoch": 1.26, + "learning_rate": 1.3002512747054888e-06, + "loss": 0.6187, + "step": 49259 + }, + { + "epoch": 1.26, + "learning_rate": 1.3002248808474426e-06, + "loss": 0.564, + "step": 49260 + }, + { + "epoch": 1.26, + "learning_rate": 1.300198486759528e-06, + "loss": 0.6436, + "step": 49261 + }, + { + "epoch": 1.26, + "learning_rate": 1.3001720924417652e-06, + "loss": 0.6904, + "step": 49262 + }, + { + "epoch": 1.26, + "learning_rate": 1.3001456978941745e-06, + "loss": 0.6377, + "step": 49263 + }, + { + "epoch": 1.26, + "learning_rate": 1.300119303116776e-06, + "loss": 0.6802, + "step": 49264 + }, + { + "epoch": 1.26, + "learning_rate": 1.30009290810959e-06, + "loss": 0.7646, + "step": 49265 + }, + { + "epoch": 1.26, + "learning_rate": 1.3000665128726368e-06, + "loss": 0.5098, + "step": 49266 + }, + { + "epoch": 1.26, + "learning_rate": 1.300040117405936e-06, + "loss": 0.6245, + "step": 49267 + }, + { + "epoch": 1.26, + "learning_rate": 1.3000137217095088e-06, + "loss": 0.4888, + "step": 49268 + }, + { + "epoch": 1.26, + "learning_rate": 1.2999873257833745e-06, + "loss": 0.6611, + "step": 49269 + }, + { + "epoch": 1.26, + "learning_rate": 1.299960929627554e-06, + "loss": 0.6074, + "step": 49270 + }, + { + "epoch": 1.26, + "learning_rate": 1.299934533242067e-06, + "loss": 0.4646, + "step": 49271 + }, + { + "epoch": 1.26, + "learning_rate": 1.299908136626934e-06, + "loss": 0.437, + "step": 49272 + }, + { + "epoch": 1.26, + "learning_rate": 1.2998817397821752e-06, + "loss": 0.7705, + "step": 49273 + }, + { + "epoch": 1.26, + "learning_rate": 1.2998553427078104e-06, + "loss": 0.8574, + "step": 49274 + }, + { + "epoch": 1.26, + "learning_rate": 1.2998289454038608e-06, + "loss": 0.6904, + "step": 49275 + }, + { + "epoch": 1.26, + "learning_rate": 1.2998025478703457e-06, + "loss": 0.7354, + "step": 49276 + }, + { + "epoch": 1.26, + "learning_rate": 1.2997761501072853e-06, + "loss": 0.5972, + "step": 49277 + }, + { + "epoch": 1.26, + "learning_rate": 1.2997497521147e-06, + "loss": 0.5825, + "step": 49278 + }, + { + "epoch": 1.26, + "learning_rate": 1.2997233538926104e-06, + "loss": 0.4094, + "step": 49279 + }, + { + "epoch": 1.26, + "learning_rate": 1.2996969554410364e-06, + "loss": 0.7168, + "step": 49280 + }, + { + "epoch": 1.26, + "learning_rate": 1.2996705567599981e-06, + "loss": 0.668, + "step": 49281 + }, + { + "epoch": 1.26, + "learning_rate": 1.2996441578495158e-06, + "loss": 0.6782, + "step": 49282 + }, + { + "epoch": 1.26, + "learning_rate": 1.29961775870961e-06, + "loss": 0.5396, + "step": 49283 + }, + { + "epoch": 1.26, + "learning_rate": 1.2995913593403003e-06, + "loss": 0.6895, + "step": 49284 + }, + { + "epoch": 1.26, + "learning_rate": 1.299564959741608e-06, + "loss": 0.8135, + "step": 49285 + }, + { + "epoch": 1.26, + "learning_rate": 1.2995385599135517e-06, + "loss": 0.7031, + "step": 49286 + }, + { + "epoch": 1.26, + "learning_rate": 1.299512159856153e-06, + "loss": 0.6201, + "step": 49287 + }, + { + "epoch": 1.26, + "learning_rate": 1.2994857595694314e-06, + "loss": 0.6484, + "step": 49288 + }, + { + "epoch": 1.26, + "learning_rate": 1.2994593590534074e-06, + "loss": 0.6504, + "step": 49289 + }, + { + "epoch": 1.26, + "learning_rate": 1.2994329583081012e-06, + "loss": 0.575, + "step": 49290 + }, + { + "epoch": 1.26, + "learning_rate": 1.299406557333533e-06, + "loss": 0.8252, + "step": 49291 + }, + { + "epoch": 1.26, + "learning_rate": 1.2993801561297227e-06, + "loss": 0.6992, + "step": 49292 + }, + { + "epoch": 1.26, + "learning_rate": 1.299353754696691e-06, + "loss": 0.6226, + "step": 49293 + }, + { + "epoch": 1.26, + "learning_rate": 1.2993273530344577e-06, + "loss": 0.6655, + "step": 49294 + }, + { + "epoch": 1.26, + "learning_rate": 1.2993009511430435e-06, + "loss": 0.5718, + "step": 49295 + }, + { + "epoch": 1.26, + "learning_rate": 1.299274549022468e-06, + "loss": 0.6924, + "step": 49296 + }, + { + "epoch": 1.26, + "learning_rate": 1.299248146672752e-06, + "loss": 0.7007, + "step": 49297 + }, + { + "epoch": 1.26, + "learning_rate": 1.2992217440939153e-06, + "loss": 0.6455, + "step": 49298 + }, + { + "epoch": 1.26, + "learning_rate": 1.2991953412859784e-06, + "loss": 0.6777, + "step": 49299 + }, + { + "epoch": 1.26, + "learning_rate": 1.2991689382489614e-06, + "loss": 0.5281, + "step": 49300 + }, + { + "epoch": 1.26, + "learning_rate": 1.2991425349828842e-06, + "loss": 0.6689, + "step": 49301 + }, + { + "epoch": 1.26, + "learning_rate": 1.2991161314877677e-06, + "loss": 0.8564, + "step": 49302 + }, + { + "epoch": 1.26, + "learning_rate": 1.2990897277636314e-06, + "loss": 0.7168, + "step": 49303 + }, + { + "epoch": 1.26, + "learning_rate": 1.299063323810496e-06, + "loss": 0.6484, + "step": 49304 + }, + { + "epoch": 1.26, + "learning_rate": 1.2990369196283817e-06, + "loss": 0.5469, + "step": 49305 + }, + { + "epoch": 1.26, + "learning_rate": 1.2990105152173085e-06, + "loss": 0.6055, + "step": 49306 + }, + { + "epoch": 1.26, + "learning_rate": 1.2989841105772965e-06, + "loss": 0.6294, + "step": 49307 + }, + { + "epoch": 1.26, + "learning_rate": 1.2989577057083662e-06, + "loss": 0.6758, + "step": 49308 + }, + { + "epoch": 1.26, + "learning_rate": 1.2989313006105378e-06, + "loss": 0.6934, + "step": 49309 + }, + { + "epoch": 1.26, + "learning_rate": 1.2989048952838317e-06, + "loss": 0.5049, + "step": 49310 + }, + { + "epoch": 1.26, + "learning_rate": 1.2988784897282675e-06, + "loss": 0.5552, + "step": 49311 + }, + { + "epoch": 1.26, + "learning_rate": 1.2988520839438659e-06, + "loss": 0.8555, + "step": 49312 + }, + { + "epoch": 1.26, + "learning_rate": 1.2988256779306468e-06, + "loss": 0.7109, + "step": 49313 + }, + { + "epoch": 1.26, + "learning_rate": 1.298799271688631e-06, + "loss": 0.6279, + "step": 49314 + }, + { + "epoch": 1.26, + "learning_rate": 1.2987728652178383e-06, + "loss": 0.6973, + "step": 49315 + }, + { + "epoch": 1.26, + "learning_rate": 1.2987464585182888e-06, + "loss": 0.6104, + "step": 49316 + }, + { + "epoch": 1.26, + "learning_rate": 1.2987200515900027e-06, + "loss": 0.4702, + "step": 49317 + }, + { + "epoch": 1.26, + "learning_rate": 1.2986936444330005e-06, + "loss": 0.6006, + "step": 49318 + }, + { + "epoch": 1.26, + "learning_rate": 1.2986672370473023e-06, + "loss": 0.4835, + "step": 49319 + }, + { + "epoch": 1.26, + "learning_rate": 1.2986408294329284e-06, + "loss": 0.3215, + "step": 49320 + }, + { + "epoch": 1.26, + "learning_rate": 1.298614421589899e-06, + "loss": 0.5972, + "step": 49321 + }, + { + "epoch": 1.26, + "learning_rate": 1.2985880135182346e-06, + "loss": 0.833, + "step": 49322 + }, + { + "epoch": 1.26, + "learning_rate": 1.2985616052179544e-06, + "loss": 0.5291, + "step": 49323 + }, + { + "epoch": 1.26, + "learning_rate": 1.2985351966890796e-06, + "loss": 0.6055, + "step": 49324 + }, + { + "epoch": 1.26, + "learning_rate": 1.2985087879316303e-06, + "loss": 0.7832, + "step": 49325 + }, + { + "epoch": 1.26, + "learning_rate": 1.2984823789456263e-06, + "loss": 0.501, + "step": 49326 + }, + { + "epoch": 1.26, + "learning_rate": 1.298455969731088e-06, + "loss": 0.5913, + "step": 49327 + }, + { + "epoch": 1.26, + "learning_rate": 1.2984295602880359e-06, + "loss": 0.5083, + "step": 49328 + }, + { + "epoch": 1.26, + "learning_rate": 1.29840315061649e-06, + "loss": 0.6357, + "step": 49329 + }, + { + "epoch": 1.26, + "learning_rate": 1.2983767407164705e-06, + "loss": 0.7295, + "step": 49330 + }, + { + "epoch": 1.26, + "learning_rate": 1.2983503305879977e-06, + "loss": 0.5782, + "step": 49331 + }, + { + "epoch": 1.26, + "learning_rate": 1.2983239202310916e-06, + "loss": 0.8652, + "step": 49332 + }, + { + "epoch": 1.26, + "learning_rate": 1.298297509645773e-06, + "loss": 0.7461, + "step": 49333 + }, + { + "epoch": 1.26, + "learning_rate": 1.2982710988320611e-06, + "loss": 0.7266, + "step": 49334 + }, + { + "epoch": 1.26, + "learning_rate": 1.2982446877899774e-06, + "loss": 0.667, + "step": 49335 + }, + { + "epoch": 1.26, + "learning_rate": 1.298218276519541e-06, + "loss": 0.6782, + "step": 49336 + }, + { + "epoch": 1.26, + "learning_rate": 1.2981918650207726e-06, + "loss": 0.7534, + "step": 49337 + }, + { + "epoch": 1.26, + "learning_rate": 1.2981654532936922e-06, + "loss": 0.665, + "step": 49338 + }, + { + "epoch": 1.26, + "learning_rate": 1.2981390413383206e-06, + "loss": 0.5073, + "step": 49339 + }, + { + "epoch": 1.26, + "learning_rate": 1.2981126291546778e-06, + "loss": 0.647, + "step": 49340 + }, + { + "epoch": 1.26, + "learning_rate": 1.2980862167427836e-06, + "loss": 0.7886, + "step": 49341 + }, + { + "epoch": 1.26, + "learning_rate": 1.2980598041026585e-06, + "loss": 0.7578, + "step": 49342 + }, + { + "epoch": 1.26, + "learning_rate": 1.2980333912343226e-06, + "loss": 0.7461, + "step": 49343 + }, + { + "epoch": 1.26, + "learning_rate": 1.2980069781377962e-06, + "loss": 0.7676, + "step": 49344 + }, + { + "epoch": 1.26, + "learning_rate": 1.2979805648130997e-06, + "loss": 0.6621, + "step": 49345 + }, + { + "epoch": 1.26, + "learning_rate": 1.2979541512602533e-06, + "loss": 0.564, + "step": 49346 + }, + { + "epoch": 1.26, + "learning_rate": 1.2979277374792769e-06, + "loss": 0.7676, + "step": 49347 + }, + { + "epoch": 1.26, + "learning_rate": 1.2979013234701913e-06, + "loss": 0.7334, + "step": 49348 + }, + { + "epoch": 1.26, + "learning_rate": 1.297874909233016e-06, + "loss": 0.7363, + "step": 49349 + }, + { + "epoch": 1.26, + "learning_rate": 1.2978484947677717e-06, + "loss": 0.5068, + "step": 49350 + }, + { + "epoch": 1.26, + "learning_rate": 1.2978220800744783e-06, + "loss": 0.5142, + "step": 49351 + }, + { + "epoch": 1.26, + "learning_rate": 1.2977956651531566e-06, + "loss": 0.4229, + "step": 49352 + }, + { + "epoch": 1.26, + "learning_rate": 1.297769250003826e-06, + "loss": 0.5293, + "step": 49353 + }, + { + "epoch": 1.26, + "learning_rate": 1.2977428346265075e-06, + "loss": 0.7471, + "step": 49354 + }, + { + "epoch": 1.26, + "learning_rate": 1.2977164190212212e-06, + "loss": 0.7275, + "step": 49355 + }, + { + "epoch": 1.27, + "learning_rate": 1.2976900031879868e-06, + "loss": 0.7988, + "step": 49356 + }, + { + "epoch": 1.27, + "learning_rate": 1.2976635871268246e-06, + "loss": 0.6592, + "step": 49357 + }, + { + "epoch": 1.27, + "learning_rate": 1.2976371708377556e-06, + "loss": 0.4094, + "step": 49358 + }, + { + "epoch": 1.27, + "learning_rate": 1.297610754320799e-06, + "loss": 0.7241, + "step": 49359 + }, + { + "epoch": 1.27, + "learning_rate": 1.2975843375759762e-06, + "loss": 0.5532, + "step": 49360 + }, + { + "epoch": 1.27, + "learning_rate": 1.2975579206033063e-06, + "loss": 0.708, + "step": 49361 + }, + { + "epoch": 1.27, + "learning_rate": 1.29753150340281e-06, + "loss": 0.8125, + "step": 49362 + }, + { + "epoch": 1.27, + "learning_rate": 1.2975050859745076e-06, + "loss": 0.7607, + "step": 49363 + }, + { + "epoch": 1.27, + "learning_rate": 1.2974786683184191e-06, + "loss": 0.709, + "step": 49364 + }, + { + "epoch": 1.27, + "learning_rate": 1.297452250434565e-06, + "loss": 0.5603, + "step": 49365 + }, + { + "epoch": 1.27, + "learning_rate": 1.2974258323229656e-06, + "loss": 0.7104, + "step": 49366 + }, + { + "epoch": 1.27, + "learning_rate": 1.2973994139836405e-06, + "loss": 0.3921, + "step": 49367 + }, + { + "epoch": 1.27, + "learning_rate": 1.2973729954166107e-06, + "loss": 0.6846, + "step": 49368 + }, + { + "epoch": 1.27, + "learning_rate": 1.2973465766218956e-06, + "loss": 0.8145, + "step": 49369 + }, + { + "epoch": 1.27, + "learning_rate": 1.2973201575995164e-06, + "loss": 0.7402, + "step": 49370 + }, + { + "epoch": 1.27, + "learning_rate": 1.2972937383494924e-06, + "loss": 0.5532, + "step": 49371 + }, + { + "epoch": 1.27, + "learning_rate": 1.2972673188718443e-06, + "loss": 0.3977, + "step": 49372 + }, + { + "epoch": 1.27, + "learning_rate": 1.2972408991665926e-06, + "loss": 0.5698, + "step": 49373 + }, + { + "epoch": 1.27, + "learning_rate": 1.297214479233757e-06, + "loss": 0.4995, + "step": 49374 + }, + { + "epoch": 1.27, + "learning_rate": 1.2971880590733582e-06, + "loss": 0.6357, + "step": 49375 + }, + { + "epoch": 1.27, + "learning_rate": 1.297161638685416e-06, + "loss": 0.5918, + "step": 49376 + }, + { + "epoch": 1.27, + "learning_rate": 1.2971352180699506e-06, + "loss": 0.6484, + "step": 49377 + }, + { + "epoch": 1.27, + "learning_rate": 1.2971087972269825e-06, + "loss": 0.7812, + "step": 49378 + }, + { + "epoch": 1.27, + "learning_rate": 1.2970823761565322e-06, + "loss": 0.5962, + "step": 49379 + }, + { + "epoch": 1.27, + "learning_rate": 1.2970559548586192e-06, + "loss": 0.6914, + "step": 49380 + }, + { + "epoch": 1.27, + "learning_rate": 1.2970295333332644e-06, + "loss": 0.7822, + "step": 49381 + }, + { + "epoch": 1.27, + "learning_rate": 1.2970031115804873e-06, + "loss": 0.6543, + "step": 49382 + }, + { + "epoch": 1.27, + "learning_rate": 1.2969766896003088e-06, + "loss": 0.5508, + "step": 49383 + }, + { + "epoch": 1.27, + "learning_rate": 1.296950267392749e-06, + "loss": 0.7505, + "step": 49384 + }, + { + "epoch": 1.27, + "learning_rate": 1.2969238449578284e-06, + "loss": 0.5796, + "step": 49385 + }, + { + "epoch": 1.27, + "learning_rate": 1.2968974222955662e-06, + "loss": 0.7471, + "step": 49386 + }, + { + "epoch": 1.27, + "learning_rate": 1.2968709994059837e-06, + "loss": 0.6768, + "step": 49387 + }, + { + "epoch": 1.27, + "learning_rate": 1.2968445762891005e-06, + "loss": 0.424, + "step": 49388 + }, + { + "epoch": 1.27, + "learning_rate": 1.296818152944937e-06, + "loss": 0.6348, + "step": 49389 + }, + { + "epoch": 1.27, + "learning_rate": 1.2967917293735138e-06, + "loss": 0.543, + "step": 49390 + }, + { + "epoch": 1.27, + "learning_rate": 1.2967653055748504e-06, + "loss": 0.7163, + "step": 49391 + }, + { + "epoch": 1.27, + "learning_rate": 1.296738881548968e-06, + "loss": 0.7422, + "step": 49392 + }, + { + "epoch": 1.27, + "learning_rate": 1.2967124572958857e-06, + "loss": 0.6533, + "step": 49393 + }, + { + "epoch": 1.27, + "learning_rate": 1.2966860328156247e-06, + "loss": 0.6154, + "step": 49394 + }, + { + "epoch": 1.27, + "learning_rate": 1.2966596081082049e-06, + "loss": 0.6514, + "step": 49395 + }, + { + "epoch": 1.27, + "learning_rate": 1.2966331831736464e-06, + "loss": 0.603, + "step": 49396 + }, + { + "epoch": 1.27, + "learning_rate": 1.2966067580119694e-06, + "loss": 0.79, + "step": 49397 + }, + { + "epoch": 1.27, + "learning_rate": 1.2965803326231941e-06, + "loss": 0.6592, + "step": 49398 + }, + { + "epoch": 1.27, + "learning_rate": 1.296553907007341e-06, + "loss": 0.582, + "step": 49399 + }, + { + "epoch": 1.27, + "learning_rate": 1.2965274811644305e-06, + "loss": 0.749, + "step": 49400 + }, + { + "epoch": 1.27, + "learning_rate": 1.2965010550944822e-06, + "loss": 0.605, + "step": 49401 + }, + { + "epoch": 1.27, + "learning_rate": 1.2964746287975167e-06, + "loss": 0.5776, + "step": 49402 + }, + { + "epoch": 1.27, + "learning_rate": 1.2964482022735543e-06, + "loss": 0.5586, + "step": 49403 + }, + { + "epoch": 1.27, + "learning_rate": 1.2964217755226152e-06, + "loss": 0.6304, + "step": 49404 + }, + { + "epoch": 1.27, + "learning_rate": 1.2963953485447197e-06, + "loss": 0.5664, + "step": 49405 + }, + { + "epoch": 1.27, + "learning_rate": 1.2963689213398877e-06, + "loss": 0.7734, + "step": 49406 + }, + { + "epoch": 1.27, + "learning_rate": 1.2963424939081395e-06, + "loss": 0.7617, + "step": 49407 + }, + { + "epoch": 1.27, + "learning_rate": 1.2963160662494957e-06, + "loss": 0.5745, + "step": 49408 + }, + { + "epoch": 1.27, + "learning_rate": 1.296289638363976e-06, + "loss": 0.7617, + "step": 49409 + }, + { + "epoch": 1.27, + "learning_rate": 1.2962632102516013e-06, + "loss": 0.7686, + "step": 49410 + }, + { + "epoch": 1.27, + "learning_rate": 1.2962367819123916e-06, + "loss": 0.667, + "step": 49411 + }, + { + "epoch": 1.27, + "learning_rate": 1.296210353346367e-06, + "loss": 0.5186, + "step": 49412 + }, + { + "epoch": 1.27, + "learning_rate": 1.2961839245535471e-06, + "loss": 0.4419, + "step": 49413 + }, + { + "epoch": 1.27, + "learning_rate": 1.2961574955339533e-06, + "loss": 0.752, + "step": 49414 + }, + { + "epoch": 1.27, + "learning_rate": 1.2961310662876056e-06, + "loss": 0.748, + "step": 49415 + }, + { + "epoch": 1.27, + "learning_rate": 1.2961046368145235e-06, + "loss": 0.7192, + "step": 49416 + }, + { + "epoch": 1.27, + "learning_rate": 1.2960782071147279e-06, + "loss": 0.6167, + "step": 49417 + }, + { + "epoch": 1.27, + "learning_rate": 1.2960517771882385e-06, + "loss": 0.6504, + "step": 49418 + }, + { + "epoch": 1.27, + "learning_rate": 1.2960253470350762e-06, + "loss": 0.7725, + "step": 49419 + }, + { + "epoch": 1.27, + "learning_rate": 1.295998916655261e-06, + "loss": 0.533, + "step": 49420 + }, + { + "epoch": 1.27, + "learning_rate": 1.295972486048813e-06, + "loss": 0.6006, + "step": 49421 + }, + { + "epoch": 1.27, + "learning_rate": 1.295946055215752e-06, + "loss": 0.6631, + "step": 49422 + }, + { + "epoch": 1.27, + "learning_rate": 1.295919624156099e-06, + "loss": 0.5465, + "step": 49423 + }, + { + "epoch": 1.27, + "learning_rate": 1.295893192869874e-06, + "loss": 0.5757, + "step": 49424 + }, + { + "epoch": 1.27, + "learning_rate": 1.2958667613570974e-06, + "loss": 0.8027, + "step": 49425 + }, + { + "epoch": 1.27, + "learning_rate": 1.2958403296177888e-06, + "loss": 0.6816, + "step": 49426 + }, + { + "epoch": 1.27, + "learning_rate": 1.2958138976519692e-06, + "loss": 0.7231, + "step": 49427 + }, + { + "epoch": 1.27, + "learning_rate": 1.2957874654596584e-06, + "loss": 0.6445, + "step": 49428 + }, + { + "epoch": 1.27, + "learning_rate": 1.2957610330408765e-06, + "loss": 0.6475, + "step": 49429 + }, + { + "epoch": 1.27, + "learning_rate": 1.2957346003956445e-06, + "loss": 0.6621, + "step": 49430 + }, + { + "epoch": 1.27, + "learning_rate": 1.2957081675239818e-06, + "loss": 0.8262, + "step": 49431 + }, + { + "epoch": 1.27, + "learning_rate": 1.2956817344259089e-06, + "loss": 0.4218, + "step": 49432 + }, + { + "epoch": 1.27, + "learning_rate": 1.295655301101446e-06, + "loss": 0.5883, + "step": 49433 + }, + { + "epoch": 1.27, + "learning_rate": 1.2956288675506135e-06, + "loss": 0.7207, + "step": 49434 + }, + { + "epoch": 1.27, + "learning_rate": 1.2956024337734319e-06, + "loss": 0.6362, + "step": 49435 + }, + { + "epoch": 1.27, + "learning_rate": 1.295575999769921e-06, + "loss": 0.626, + "step": 49436 + }, + { + "epoch": 1.27, + "learning_rate": 1.2955495655401009e-06, + "loss": 0.6445, + "step": 49437 + }, + { + "epoch": 1.27, + "learning_rate": 1.295523131083992e-06, + "loss": 0.4246, + "step": 49438 + }, + { + "epoch": 1.27, + "learning_rate": 1.295496696401615e-06, + "loss": 0.5693, + "step": 49439 + }, + { + "epoch": 1.27, + "learning_rate": 1.2954702614929898e-06, + "loss": 0.7061, + "step": 49440 + }, + { + "epoch": 1.27, + "learning_rate": 1.2954438263581362e-06, + "loss": 0.6885, + "step": 49441 + }, + { + "epoch": 1.27, + "learning_rate": 1.2954173909970752e-06, + "loss": 0.7324, + "step": 49442 + }, + { + "epoch": 1.27, + "learning_rate": 1.2953909554098261e-06, + "loss": 0.5144, + "step": 49443 + }, + { + "epoch": 1.27, + "learning_rate": 1.2953645195964106e-06, + "loss": 0.5293, + "step": 49444 + }, + { + "epoch": 1.27, + "learning_rate": 1.2953380835568474e-06, + "loss": 0.6406, + "step": 49445 + }, + { + "epoch": 1.27, + "learning_rate": 1.2953116472911577e-06, + "loss": 0.6807, + "step": 49446 + }, + { + "epoch": 1.27, + "learning_rate": 1.2952852107993613e-06, + "loss": 0.4824, + "step": 49447 + }, + { + "epoch": 1.27, + "learning_rate": 1.2952587740814787e-06, + "loss": 0.5308, + "step": 49448 + }, + { + "epoch": 1.27, + "learning_rate": 1.2952323371375298e-06, + "loss": 0.4717, + "step": 49449 + }, + { + "epoch": 1.27, + "learning_rate": 1.2952058999675357e-06, + "loss": 0.6082, + "step": 49450 + }, + { + "epoch": 1.27, + "learning_rate": 1.2951794625715153e-06, + "loss": 0.8018, + "step": 49451 + }, + { + "epoch": 1.27, + "learning_rate": 1.29515302494949e-06, + "loss": 0.6143, + "step": 49452 + }, + { + "epoch": 1.27, + "learning_rate": 1.2951265871014793e-06, + "loss": 0.624, + "step": 49453 + }, + { + "epoch": 1.27, + "learning_rate": 1.2951001490275041e-06, + "loss": 0.626, + "step": 49454 + }, + { + "epoch": 1.27, + "learning_rate": 1.2950737107275842e-06, + "loss": 0.7598, + "step": 49455 + }, + { + "epoch": 1.27, + "learning_rate": 1.2950472722017398e-06, + "loss": 0.772, + "step": 49456 + }, + { + "epoch": 1.27, + "learning_rate": 1.2950208334499913e-06, + "loss": 0.7842, + "step": 49457 + }, + { + "epoch": 1.27, + "learning_rate": 1.294994394472359e-06, + "loss": 0.7783, + "step": 49458 + }, + { + "epoch": 1.27, + "learning_rate": 1.2949679552688627e-06, + "loss": 0.5583, + "step": 49459 + }, + { + "epoch": 1.27, + "learning_rate": 1.2949415158395232e-06, + "loss": 0.5422, + "step": 49460 + }, + { + "epoch": 1.27, + "learning_rate": 1.2949150761843609e-06, + "loss": 0.6704, + "step": 49461 + }, + { + "epoch": 1.27, + "learning_rate": 1.294888636303395e-06, + "loss": 0.647, + "step": 49462 + }, + { + "epoch": 1.27, + "learning_rate": 1.2948621961966471e-06, + "loss": 0.6548, + "step": 49463 + }, + { + "epoch": 1.27, + "learning_rate": 1.2948357558641363e-06, + "loss": 0.5269, + "step": 49464 + }, + { + "epoch": 1.27, + "learning_rate": 1.2948093153058836e-06, + "loss": 0.6982, + "step": 49465 + }, + { + "epoch": 1.27, + "learning_rate": 1.2947828745219089e-06, + "loss": 0.6299, + "step": 49466 + }, + { + "epoch": 1.27, + "learning_rate": 1.2947564335122325e-06, + "loss": 0.8164, + "step": 49467 + }, + { + "epoch": 1.27, + "learning_rate": 1.2947299922768746e-06, + "loss": 0.5, + "step": 49468 + }, + { + "epoch": 1.27, + "learning_rate": 1.2947035508158554e-06, + "loss": 0.6807, + "step": 49469 + }, + { + "epoch": 1.27, + "learning_rate": 1.2946771091291955e-06, + "loss": 0.6602, + "step": 49470 + }, + { + "epoch": 1.27, + "learning_rate": 1.294650667216915e-06, + "loss": 0.6377, + "step": 49471 + }, + { + "epoch": 1.27, + "learning_rate": 1.2946242250790336e-06, + "loss": 0.6016, + "step": 49472 + }, + { + "epoch": 1.27, + "learning_rate": 1.2945977827155722e-06, + "loss": 0.8271, + "step": 49473 + }, + { + "epoch": 1.27, + "learning_rate": 1.2945713401265506e-06, + "loss": 0.6816, + "step": 49474 + }, + { + "epoch": 1.27, + "learning_rate": 1.2945448973119897e-06, + "loss": 0.6602, + "step": 49475 + }, + { + "epoch": 1.27, + "learning_rate": 1.2945184542719089e-06, + "loss": 0.7588, + "step": 49476 + }, + { + "epoch": 1.27, + "learning_rate": 1.294492011006329e-06, + "loss": 0.665, + "step": 49477 + }, + { + "epoch": 1.27, + "learning_rate": 1.2944655675152702e-06, + "loss": 0.5972, + "step": 49478 + }, + { + "epoch": 1.27, + "learning_rate": 1.2944391237987527e-06, + "loss": 0.7056, + "step": 49479 + }, + { + "epoch": 1.27, + "learning_rate": 1.2944126798567967e-06, + "loss": 0.5708, + "step": 49480 + }, + { + "epoch": 1.27, + "learning_rate": 1.2943862356894221e-06, + "loss": 0.6074, + "step": 49481 + }, + { + "epoch": 1.27, + "learning_rate": 1.29435979129665e-06, + "loss": 0.4777, + "step": 49482 + }, + { + "epoch": 1.27, + "learning_rate": 1.2943333466784995e-06, + "loss": 0.5825, + "step": 49483 + }, + { + "epoch": 1.27, + "learning_rate": 1.2943069018349921e-06, + "loss": 0.7212, + "step": 49484 + }, + { + "epoch": 1.27, + "learning_rate": 1.294280456766147e-06, + "loss": 0.7412, + "step": 49485 + }, + { + "epoch": 1.27, + "learning_rate": 1.2942540114719856e-06, + "loss": 0.5298, + "step": 49486 + }, + { + "epoch": 1.27, + "learning_rate": 1.2942275659525268e-06, + "loss": 0.6162, + "step": 49487 + }, + { + "epoch": 1.27, + "learning_rate": 1.2942011202077917e-06, + "loss": 0.5215, + "step": 49488 + }, + { + "epoch": 1.27, + "learning_rate": 1.2941746742378001e-06, + "loss": 0.7451, + "step": 49489 + }, + { + "epoch": 1.27, + "learning_rate": 1.2941482280425728e-06, + "loss": 0.5647, + "step": 49490 + }, + { + "epoch": 1.27, + "learning_rate": 1.2941217816221296e-06, + "loss": 0.7979, + "step": 49491 + }, + { + "epoch": 1.27, + "learning_rate": 1.2940953349764908e-06, + "loss": 0.6865, + "step": 49492 + }, + { + "epoch": 1.27, + "learning_rate": 1.2940688881056765e-06, + "loss": 0.7686, + "step": 49493 + }, + { + "epoch": 1.27, + "learning_rate": 1.2940424410097078e-06, + "loss": 0.324, + "step": 49494 + }, + { + "epoch": 1.27, + "learning_rate": 1.2940159936886036e-06, + "loss": 0.6548, + "step": 49495 + }, + { + "epoch": 1.27, + "learning_rate": 1.2939895461423854e-06, + "loss": 0.5107, + "step": 49496 + }, + { + "epoch": 1.27, + "learning_rate": 1.2939630983710728e-06, + "loss": 0.6509, + "step": 49497 + }, + { + "epoch": 1.27, + "learning_rate": 1.293936650374686e-06, + "loss": 0.5732, + "step": 49498 + }, + { + "epoch": 1.27, + "learning_rate": 1.2939102021532456e-06, + "loss": 0.8467, + "step": 49499 + }, + { + "epoch": 1.27, + "learning_rate": 1.2938837537067715e-06, + "loss": 0.6182, + "step": 49500 + }, + { + "epoch": 1.27, + "learning_rate": 1.2938573050352843e-06, + "loss": 0.6353, + "step": 49501 + }, + { + "epoch": 1.27, + "learning_rate": 1.293830856138804e-06, + "loss": 0.6055, + "step": 49502 + }, + { + "epoch": 1.27, + "learning_rate": 1.293804407017351e-06, + "loss": 0.7742, + "step": 49503 + }, + { + "epoch": 1.27, + "learning_rate": 1.2937779576709456e-06, + "loss": 0.834, + "step": 49504 + }, + { + "epoch": 1.27, + "learning_rate": 1.2937515080996075e-06, + "loss": 0.7461, + "step": 49505 + }, + { + "epoch": 1.27, + "learning_rate": 1.2937250583033577e-06, + "loss": 0.7109, + "step": 49506 + }, + { + "epoch": 1.27, + "learning_rate": 1.2936986082822162e-06, + "loss": 0.7432, + "step": 49507 + }, + { + "epoch": 1.27, + "learning_rate": 1.2936721580362026e-06, + "loss": 0.4458, + "step": 49508 + }, + { + "epoch": 1.27, + "learning_rate": 1.2936457075653385e-06, + "loss": 0.5781, + "step": 49509 + }, + { + "epoch": 1.27, + "learning_rate": 1.293619256869643e-06, + "loss": 0.6196, + "step": 49510 + }, + { + "epoch": 1.27, + "learning_rate": 1.2935928059491369e-06, + "loss": 0.7021, + "step": 49511 + }, + { + "epoch": 1.27, + "learning_rate": 1.29356635480384e-06, + "loss": 0.5996, + "step": 49512 + }, + { + "epoch": 1.27, + "learning_rate": 1.293539903433773e-06, + "loss": 0.6812, + "step": 49513 + }, + { + "epoch": 1.27, + "learning_rate": 1.293513451838956e-06, + "loss": 0.625, + "step": 49514 + }, + { + "epoch": 1.27, + "learning_rate": 1.2934870000194094e-06, + "loss": 0.54, + "step": 49515 + }, + { + "epoch": 1.27, + "learning_rate": 1.293460547975153e-06, + "loss": 0.7051, + "step": 49516 + }, + { + "epoch": 1.27, + "learning_rate": 1.2934340957062075e-06, + "loss": 0.7246, + "step": 49517 + }, + { + "epoch": 1.27, + "learning_rate": 1.2934076432125928e-06, + "loss": 0.532, + "step": 49518 + }, + { + "epoch": 1.27, + "learning_rate": 1.2933811904943298e-06, + "loss": 0.8604, + "step": 49519 + }, + { + "epoch": 1.27, + "learning_rate": 1.293354737551438e-06, + "loss": 0.5762, + "step": 49520 + }, + { + "epoch": 1.27, + "learning_rate": 1.293328284383938e-06, + "loss": 0.8115, + "step": 49521 + }, + { + "epoch": 1.27, + "learning_rate": 1.29330183099185e-06, + "loss": 0.7861, + "step": 49522 + }, + { + "epoch": 1.27, + "learning_rate": 1.2932753773751946e-06, + "loss": 0.7695, + "step": 49523 + }, + { + "epoch": 1.27, + "learning_rate": 1.2932489235339915e-06, + "loss": 0.6074, + "step": 49524 + }, + { + "epoch": 1.27, + "learning_rate": 1.293222469468261e-06, + "loss": 0.5693, + "step": 49525 + }, + { + "epoch": 1.27, + "learning_rate": 1.2931960151780237e-06, + "loss": 0.8359, + "step": 49526 + }, + { + "epoch": 1.27, + "learning_rate": 1.2931695606632995e-06, + "loss": 0.667, + "step": 49527 + }, + { + "epoch": 1.27, + "learning_rate": 1.293143105924109e-06, + "loss": 0.4868, + "step": 49528 + }, + { + "epoch": 1.27, + "learning_rate": 1.2931166509604725e-06, + "loss": 0.7529, + "step": 49529 + }, + { + "epoch": 1.27, + "learning_rate": 1.29309019577241e-06, + "loss": 0.7363, + "step": 49530 + }, + { + "epoch": 1.27, + "learning_rate": 1.2930637403599415e-06, + "loss": 0.6306, + "step": 49531 + }, + { + "epoch": 1.27, + "learning_rate": 1.293037284723088e-06, + "loss": 0.7861, + "step": 49532 + }, + { + "epoch": 1.27, + "learning_rate": 1.2930108288618688e-06, + "loss": 0.5513, + "step": 49533 + }, + { + "epoch": 1.27, + "learning_rate": 1.2929843727763053e-06, + "loss": 0.7432, + "step": 49534 + }, + { + "epoch": 1.27, + "learning_rate": 1.2929579164664165e-06, + "loss": 0.623, + "step": 49535 + }, + { + "epoch": 1.27, + "learning_rate": 1.292931459932224e-06, + "loss": 0.6826, + "step": 49536 + }, + { + "epoch": 1.27, + "learning_rate": 1.2929050031737468e-06, + "loss": 0.6631, + "step": 49537 + }, + { + "epoch": 1.27, + "learning_rate": 1.2928785461910058e-06, + "loss": 0.5223, + "step": 49538 + }, + { + "epoch": 1.27, + "learning_rate": 1.2928520889840212e-06, + "loss": 0.6514, + "step": 49539 + }, + { + "epoch": 1.27, + "learning_rate": 1.2928256315528134e-06, + "loss": 0.3564, + "step": 49540 + }, + { + "epoch": 1.27, + "learning_rate": 1.2927991738974022e-06, + "loss": 0.6343, + "step": 49541 + }, + { + "epoch": 1.27, + "learning_rate": 1.2927727160178083e-06, + "loss": 0.4607, + "step": 49542 + }, + { + "epoch": 1.27, + "learning_rate": 1.2927462579140516e-06, + "loss": 0.625, + "step": 49543 + }, + { + "epoch": 1.27, + "learning_rate": 1.2927197995861528e-06, + "loss": 0.7939, + "step": 49544 + }, + { + "epoch": 1.27, + "learning_rate": 1.2926933410341318e-06, + "loss": 0.7422, + "step": 49545 + }, + { + "epoch": 1.27, + "learning_rate": 1.292666882258009e-06, + "loss": 0.5332, + "step": 49546 + }, + { + "epoch": 1.27, + "learning_rate": 1.2926404232578048e-06, + "loss": 0.585, + "step": 49547 + }, + { + "epoch": 1.27, + "learning_rate": 1.2926139640335389e-06, + "loss": 0.5479, + "step": 49548 + }, + { + "epoch": 1.27, + "learning_rate": 1.2925875045852323e-06, + "loss": 0.5505, + "step": 49549 + }, + { + "epoch": 1.27, + "learning_rate": 1.2925610449129044e-06, + "loss": 0.6768, + "step": 49550 + }, + { + "epoch": 1.27, + "learning_rate": 1.2925345850165765e-06, + "loss": 0.6665, + "step": 49551 + }, + { + "epoch": 1.27, + "learning_rate": 1.2925081248962682e-06, + "loss": 0.6553, + "step": 49552 + }, + { + "epoch": 1.27, + "learning_rate": 1.2924816645519996e-06, + "loss": 0.6304, + "step": 49553 + }, + { + "epoch": 1.27, + "learning_rate": 1.2924552039837914e-06, + "loss": 0.6631, + "step": 49554 + }, + { + "epoch": 1.27, + "learning_rate": 1.2924287431916642e-06, + "loss": 0.6895, + "step": 49555 + }, + { + "epoch": 1.27, + "learning_rate": 1.292402282175637e-06, + "loss": 0.5752, + "step": 49556 + }, + { + "epoch": 1.27, + "learning_rate": 1.2923758209357311e-06, + "loss": 0.6201, + "step": 49557 + }, + { + "epoch": 1.27, + "learning_rate": 1.2923493594719662e-06, + "loss": 0.625, + "step": 49558 + }, + { + "epoch": 1.27, + "learning_rate": 1.2923228977843636e-06, + "loss": 0.4032, + "step": 49559 + }, + { + "epoch": 1.27, + "learning_rate": 1.2922964358729422e-06, + "loss": 0.7588, + "step": 49560 + }, + { + "epoch": 1.27, + "learning_rate": 1.292269973737723e-06, + "loss": 0.6843, + "step": 49561 + }, + { + "epoch": 1.27, + "learning_rate": 1.292243511378726e-06, + "loss": 0.5923, + "step": 49562 + }, + { + "epoch": 1.27, + "learning_rate": 1.2922170487959716e-06, + "loss": 0.5894, + "step": 49563 + }, + { + "epoch": 1.27, + "learning_rate": 1.2921905859894803e-06, + "loss": 0.5356, + "step": 49564 + }, + { + "epoch": 1.27, + "learning_rate": 1.2921641229592722e-06, + "loss": 0.7754, + "step": 49565 + }, + { + "epoch": 1.27, + "learning_rate": 1.292137659705367e-06, + "loss": 0.6025, + "step": 49566 + }, + { + "epoch": 1.27, + "learning_rate": 1.2921111962277856e-06, + "loss": 0.4844, + "step": 49567 + }, + { + "epoch": 1.27, + "learning_rate": 1.2920847325265478e-06, + "loss": 0.5339, + "step": 49568 + }, + { + "epoch": 1.27, + "learning_rate": 1.2920582686016745e-06, + "loss": 0.6372, + "step": 49569 + }, + { + "epoch": 1.27, + "learning_rate": 1.292031804453186e-06, + "loss": 0.6387, + "step": 49570 + }, + { + "epoch": 1.27, + "learning_rate": 1.2920053400811015e-06, + "loss": 0.5137, + "step": 49571 + }, + { + "epoch": 1.27, + "learning_rate": 1.2919788754854422e-06, + "loss": 0.6787, + "step": 49572 + }, + { + "epoch": 1.27, + "learning_rate": 1.2919524106662279e-06, + "loss": 0.8047, + "step": 49573 + }, + { + "epoch": 1.27, + "learning_rate": 1.2919259456234794e-06, + "loss": 0.5825, + "step": 49574 + }, + { + "epoch": 1.27, + "learning_rate": 1.2918994803572165e-06, + "loss": 0.4768, + "step": 49575 + }, + { + "epoch": 1.27, + "learning_rate": 1.2918730148674594e-06, + "loss": 0.5962, + "step": 49576 + }, + { + "epoch": 1.27, + "learning_rate": 1.2918465491542287e-06, + "loss": 0.6772, + "step": 49577 + }, + { + "epoch": 1.27, + "learning_rate": 1.2918200832175447e-06, + "loss": 0.6309, + "step": 49578 + }, + { + "epoch": 1.27, + "learning_rate": 1.2917936170574275e-06, + "loss": 0.6211, + "step": 49579 + }, + { + "epoch": 1.27, + "learning_rate": 1.291767150673897e-06, + "loss": 0.6367, + "step": 49580 + }, + { + "epoch": 1.27, + "learning_rate": 1.291740684066974e-06, + "loss": 0.6562, + "step": 49581 + }, + { + "epoch": 1.27, + "learning_rate": 1.2917142172366786e-06, + "loss": 0.5259, + "step": 49582 + }, + { + "epoch": 1.27, + "learning_rate": 1.2916877501830308e-06, + "loss": 0.6968, + "step": 49583 + }, + { + "epoch": 1.27, + "learning_rate": 1.2916612829060517e-06, + "loss": 0.6802, + "step": 49584 + }, + { + "epoch": 1.27, + "learning_rate": 1.2916348154057604e-06, + "loss": 0.6572, + "step": 49585 + }, + { + "epoch": 1.27, + "learning_rate": 1.2916083476821778e-06, + "loss": 0.7061, + "step": 49586 + }, + { + "epoch": 1.27, + "learning_rate": 1.291581879735324e-06, + "loss": 0.5869, + "step": 49587 + }, + { + "epoch": 1.27, + "learning_rate": 1.2915554115652196e-06, + "loss": 0.8262, + "step": 49588 + }, + { + "epoch": 1.27, + "learning_rate": 1.2915289431718845e-06, + "loss": 0.6748, + "step": 49589 + }, + { + "epoch": 1.27, + "learning_rate": 1.291502474555339e-06, + "loss": 0.7871, + "step": 49590 + }, + { + "epoch": 1.27, + "learning_rate": 1.2914760057156039e-06, + "loss": 0.8096, + "step": 49591 + }, + { + "epoch": 1.27, + "learning_rate": 1.2914495366526988e-06, + "loss": 0.6184, + "step": 49592 + }, + { + "epoch": 1.27, + "learning_rate": 1.2914230673666439e-06, + "loss": 0.7666, + "step": 49593 + }, + { + "epoch": 1.27, + "learning_rate": 1.2913965978574602e-06, + "loss": 0.4758, + "step": 49594 + }, + { + "epoch": 1.27, + "learning_rate": 1.2913701281251674e-06, + "loss": 0.5889, + "step": 49595 + }, + { + "epoch": 1.27, + "learning_rate": 1.2913436581697856e-06, + "loss": 0.6904, + "step": 49596 + }, + { + "epoch": 1.27, + "learning_rate": 1.2913171879913356e-06, + "loss": 0.5649, + "step": 49597 + }, + { + "epoch": 1.27, + "learning_rate": 1.2912907175898372e-06, + "loss": 0.5459, + "step": 49598 + }, + { + "epoch": 1.27, + "learning_rate": 1.2912642469653115e-06, + "loss": 0.5215, + "step": 49599 + }, + { + "epoch": 1.27, + "learning_rate": 1.2912377761177774e-06, + "loss": 0.8408, + "step": 49600 + }, + { + "epoch": 1.27, + "learning_rate": 1.2912113050472564e-06, + "loss": 0.4722, + "step": 49601 + }, + { + "epoch": 1.27, + "learning_rate": 1.291184833753768e-06, + "loss": 0.686, + "step": 49602 + }, + { + "epoch": 1.27, + "learning_rate": 1.291158362237333e-06, + "loss": 0.5918, + "step": 49603 + }, + { + "epoch": 1.27, + "learning_rate": 1.2911318904979714e-06, + "loss": 0.7891, + "step": 49604 + }, + { + "epoch": 1.27, + "learning_rate": 1.2911054185357036e-06, + "loss": 0.6357, + "step": 49605 + }, + { + "epoch": 1.27, + "learning_rate": 1.2910789463505493e-06, + "loss": 0.5343, + "step": 49606 + }, + { + "epoch": 1.27, + "learning_rate": 1.2910524739425296e-06, + "loss": 0.6367, + "step": 49607 + }, + { + "epoch": 1.27, + "learning_rate": 1.2910260013116645e-06, + "loss": 0.5679, + "step": 49608 + }, + { + "epoch": 1.27, + "learning_rate": 1.2909995284579742e-06, + "loss": 0.6406, + "step": 49609 + }, + { + "epoch": 1.27, + "learning_rate": 1.2909730553814786e-06, + "loss": 0.603, + "step": 49610 + }, + { + "epoch": 1.27, + "learning_rate": 1.2909465820821986e-06, + "loss": 0.604, + "step": 49611 + }, + { + "epoch": 1.27, + "learning_rate": 1.290920108560154e-06, + "loss": 0.564, + "step": 49612 + }, + { + "epoch": 1.27, + "learning_rate": 1.2908936348153651e-06, + "loss": 0.7471, + "step": 49613 + }, + { + "epoch": 1.27, + "learning_rate": 1.2908671608478528e-06, + "loss": 0.543, + "step": 49614 + }, + { + "epoch": 1.27, + "learning_rate": 1.2908406866576364e-06, + "loss": 0.7344, + "step": 49615 + }, + { + "epoch": 1.27, + "learning_rate": 1.290814212244737e-06, + "loss": 0.6304, + "step": 49616 + }, + { + "epoch": 1.27, + "learning_rate": 1.2907877376091743e-06, + "loss": 0.665, + "step": 49617 + }, + { + "epoch": 1.27, + "learning_rate": 1.290761262750969e-06, + "loss": 0.5669, + "step": 49618 + }, + { + "epoch": 1.27, + "learning_rate": 1.2907347876701412e-06, + "loss": 0.7412, + "step": 49619 + }, + { + "epoch": 1.27, + "learning_rate": 1.290708312366711e-06, + "loss": 0.6699, + "step": 49620 + }, + { + "epoch": 1.27, + "learning_rate": 1.2906818368406986e-06, + "loss": 0.731, + "step": 49621 + }, + { + "epoch": 1.27, + "learning_rate": 1.2906553610921247e-06, + "loss": 0.6406, + "step": 49622 + }, + { + "epoch": 1.27, + "learning_rate": 1.2906288851210093e-06, + "loss": 0.5339, + "step": 49623 + }, + { + "epoch": 1.27, + "learning_rate": 1.290602408927373e-06, + "loss": 0.627, + "step": 49624 + }, + { + "epoch": 1.27, + "learning_rate": 1.2905759325112355e-06, + "loss": 0.5972, + "step": 49625 + }, + { + "epoch": 1.27, + "learning_rate": 1.2905494558726175e-06, + "loss": 0.7227, + "step": 49626 + }, + { + "epoch": 1.27, + "learning_rate": 1.2905229790115391e-06, + "loss": 0.5972, + "step": 49627 + }, + { + "epoch": 1.27, + "learning_rate": 1.2904965019280206e-06, + "loss": 0.6406, + "step": 49628 + }, + { + "epoch": 1.27, + "learning_rate": 1.2904700246220822e-06, + "loss": 0.7041, + "step": 49629 + }, + { + "epoch": 1.27, + "learning_rate": 1.2904435470937448e-06, + "loss": 0.7244, + "step": 49630 + }, + { + "epoch": 1.27, + "learning_rate": 1.2904170693430273e-06, + "loss": 0.7129, + "step": 49631 + }, + { + "epoch": 1.27, + "learning_rate": 1.2903905913699514e-06, + "loss": 0.6021, + "step": 49632 + }, + { + "epoch": 1.27, + "learning_rate": 1.2903641131745363e-06, + "loss": 0.8164, + "step": 49633 + }, + { + "epoch": 1.27, + "learning_rate": 1.290337634756803e-06, + "loss": 0.667, + "step": 49634 + }, + { + "epoch": 1.27, + "learning_rate": 1.290311156116772e-06, + "loss": 0.5796, + "step": 49635 + }, + { + "epoch": 1.27, + "learning_rate": 1.2902846772544622e-06, + "loss": 0.7119, + "step": 49636 + }, + { + "epoch": 1.27, + "learning_rate": 1.2902581981698953e-06, + "loss": 0.751, + "step": 49637 + }, + { + "epoch": 1.27, + "learning_rate": 1.2902317188630912e-06, + "loss": 0.5562, + "step": 49638 + }, + { + "epoch": 1.27, + "learning_rate": 1.2902052393340696e-06, + "loss": 0.6816, + "step": 49639 + }, + { + "epoch": 1.27, + "learning_rate": 1.2901787595828513e-06, + "loss": 0.5078, + "step": 49640 + }, + { + "epoch": 1.27, + "learning_rate": 1.2901522796094567e-06, + "loss": 0.5015, + "step": 49641 + }, + { + "epoch": 1.27, + "learning_rate": 1.2901257994139054e-06, + "loss": 0.6914, + "step": 49642 + }, + { + "epoch": 1.27, + "learning_rate": 1.2900993189962183e-06, + "loss": 0.5132, + "step": 49643 + }, + { + "epoch": 1.27, + "learning_rate": 1.2900728383564159e-06, + "loss": 0.5107, + "step": 49644 + }, + { + "epoch": 1.27, + "learning_rate": 1.2900463574945178e-06, + "loss": 0.6279, + "step": 49645 + }, + { + "epoch": 1.27, + "learning_rate": 1.2900198764105444e-06, + "loss": 0.7222, + "step": 49646 + }, + { + "epoch": 1.27, + "learning_rate": 1.289993395104516e-06, + "loss": 0.8701, + "step": 49647 + }, + { + "epoch": 1.27, + "learning_rate": 1.2899669135764532e-06, + "loss": 0.5366, + "step": 49648 + }, + { + "epoch": 1.27, + "learning_rate": 1.2899404318263765e-06, + "loss": 0.6172, + "step": 49649 + }, + { + "epoch": 1.27, + "learning_rate": 1.289913949854305e-06, + "loss": 0.7568, + "step": 49650 + }, + { + "epoch": 1.27, + "learning_rate": 1.28988746766026e-06, + "loss": 0.71, + "step": 49651 + }, + { + "epoch": 1.27, + "learning_rate": 1.2898609852442614e-06, + "loss": 0.6763, + "step": 49652 + }, + { + "epoch": 1.27, + "learning_rate": 1.2898345026063298e-06, + "loss": 0.447, + "step": 49653 + }, + { + "epoch": 1.27, + "learning_rate": 1.2898080197464854e-06, + "loss": 0.4778, + "step": 49654 + }, + { + "epoch": 1.27, + "learning_rate": 1.289781536664748e-06, + "loss": 0.7646, + "step": 49655 + }, + { + "epoch": 1.27, + "learning_rate": 1.289755053361138e-06, + "loss": 0.6582, + "step": 49656 + }, + { + "epoch": 1.27, + "learning_rate": 1.2897285698356765e-06, + "loss": 0.478, + "step": 49657 + }, + { + "epoch": 1.27, + "learning_rate": 1.2897020860883824e-06, + "loss": 0.5825, + "step": 49658 + }, + { + "epoch": 1.27, + "learning_rate": 1.2896756021192774e-06, + "loss": 0.4797, + "step": 49659 + }, + { + "epoch": 1.27, + "learning_rate": 1.2896491179283808e-06, + "loss": 0.6191, + "step": 49660 + }, + { + "epoch": 1.27, + "learning_rate": 1.2896226335157132e-06, + "loss": 0.3131, + "step": 49661 + }, + { + "epoch": 1.27, + "learning_rate": 1.2895961488812947e-06, + "loss": 0.6387, + "step": 49662 + }, + { + "epoch": 1.27, + "learning_rate": 1.289569664025146e-06, + "loss": 0.6787, + "step": 49663 + }, + { + "epoch": 1.27, + "learning_rate": 1.2895431789472872e-06, + "loss": 0.4617, + "step": 49664 + }, + { + "epoch": 1.27, + "learning_rate": 1.2895166936477384e-06, + "loss": 0.6035, + "step": 49665 + }, + { + "epoch": 1.27, + "learning_rate": 1.28949020812652e-06, + "loss": 0.7207, + "step": 49666 + }, + { + "epoch": 1.27, + "learning_rate": 1.289463722383652e-06, + "loss": 0.6028, + "step": 49667 + }, + { + "epoch": 1.27, + "learning_rate": 1.2894372364191552e-06, + "loss": 0.7812, + "step": 49668 + }, + { + "epoch": 1.27, + "learning_rate": 1.2894107502330496e-06, + "loss": 0.6807, + "step": 49669 + }, + { + "epoch": 1.27, + "learning_rate": 1.2893842638253555e-06, + "loss": 0.5029, + "step": 49670 + }, + { + "epoch": 1.27, + "learning_rate": 1.2893577771960931e-06, + "loss": 0.6938, + "step": 49671 + }, + { + "epoch": 1.27, + "learning_rate": 1.289331290345283e-06, + "loss": 0.3943, + "step": 49672 + }, + { + "epoch": 1.27, + "learning_rate": 1.2893048032729448e-06, + "loss": 0.6602, + "step": 49673 + }, + { + "epoch": 1.27, + "learning_rate": 1.2892783159790997e-06, + "loss": 0.6055, + "step": 49674 + }, + { + "epoch": 1.27, + "learning_rate": 1.289251828463767e-06, + "loss": 0.6738, + "step": 49675 + }, + { + "epoch": 1.27, + "learning_rate": 1.2892253407269678e-06, + "loss": 0.7314, + "step": 49676 + }, + { + "epoch": 1.27, + "learning_rate": 1.289198852768722e-06, + "loss": 0.4062, + "step": 49677 + }, + { + "epoch": 1.27, + "learning_rate": 1.2891723645890498e-06, + "loss": 0.6562, + "step": 49678 + }, + { + "epoch": 1.27, + "learning_rate": 1.289145876187972e-06, + "loss": 0.7383, + "step": 49679 + }, + { + "epoch": 1.27, + "learning_rate": 1.289119387565508e-06, + "loss": 0.7549, + "step": 49680 + }, + { + "epoch": 1.27, + "learning_rate": 1.2890928987216788e-06, + "loss": 0.6091, + "step": 49681 + }, + { + "epoch": 1.27, + "learning_rate": 1.2890664096565044e-06, + "loss": 0.6689, + "step": 49682 + }, + { + "epoch": 1.27, + "learning_rate": 1.289039920370005e-06, + "loss": 0.4302, + "step": 49683 + }, + { + "epoch": 1.27, + "learning_rate": 1.2890134308622015e-06, + "loss": 0.5381, + "step": 49684 + }, + { + "epoch": 1.27, + "learning_rate": 1.2889869411331134e-06, + "loss": 0.6157, + "step": 49685 + }, + { + "epoch": 1.27, + "learning_rate": 1.2889604511827612e-06, + "loss": 0.7178, + "step": 49686 + }, + { + "epoch": 1.27, + "learning_rate": 1.2889339610111653e-06, + "loss": 0.7969, + "step": 49687 + }, + { + "epoch": 1.27, + "learning_rate": 1.288907470618346e-06, + "loss": 0.7881, + "step": 49688 + }, + { + "epoch": 1.27, + "learning_rate": 1.2888809800043238e-06, + "loss": 0.5476, + "step": 49689 + }, + { + "epoch": 1.27, + "learning_rate": 1.2888544891691184e-06, + "loss": 0.6826, + "step": 49690 + }, + { + "epoch": 1.27, + "learning_rate": 1.2888279981127506e-06, + "loss": 0.708, + "step": 49691 + }, + { + "epoch": 1.27, + "learning_rate": 1.2888015068352404e-06, + "loss": 0.7373, + "step": 49692 + }, + { + "epoch": 1.27, + "learning_rate": 1.2887750153366079e-06, + "loss": 0.7646, + "step": 49693 + }, + { + "epoch": 1.27, + "learning_rate": 1.288748523616874e-06, + "loss": 0.6641, + "step": 49694 + }, + { + "epoch": 1.27, + "learning_rate": 1.2887220316760585e-06, + "loss": 0.7598, + "step": 49695 + }, + { + "epoch": 1.27, + "learning_rate": 1.2886955395141819e-06, + "loss": 0.6611, + "step": 49696 + }, + { + "epoch": 1.27, + "learning_rate": 1.2886690471312642e-06, + "loss": 0.6953, + "step": 49697 + }, + { + "epoch": 1.27, + "learning_rate": 1.2886425545273261e-06, + "loss": 0.5742, + "step": 49698 + }, + { + "epoch": 1.27, + "learning_rate": 1.2886160617023878e-06, + "loss": 0.7126, + "step": 49699 + }, + { + "epoch": 1.27, + "learning_rate": 1.2885895686564688e-06, + "loss": 0.7197, + "step": 49700 + }, + { + "epoch": 1.27, + "learning_rate": 1.288563075389591e-06, + "loss": 0.7607, + "step": 49701 + }, + { + "epoch": 1.27, + "learning_rate": 1.288536581901773e-06, + "loss": 0.7466, + "step": 49702 + }, + { + "epoch": 1.27, + "learning_rate": 1.288510088193036e-06, + "loss": 0.6616, + "step": 49703 + }, + { + "epoch": 1.27, + "learning_rate": 1.2884835942634e-06, + "loss": 0.6416, + "step": 49704 + }, + { + "epoch": 1.27, + "learning_rate": 1.2884571001128854e-06, + "loss": 0.5771, + "step": 49705 + }, + { + "epoch": 1.27, + "learning_rate": 1.2884306057415127e-06, + "loss": 0.7158, + "step": 49706 + }, + { + "epoch": 1.27, + "learning_rate": 1.2884041111493016e-06, + "loss": 0.7363, + "step": 49707 + }, + { + "epoch": 1.27, + "learning_rate": 1.2883776163362729e-06, + "loss": 0.8809, + "step": 49708 + }, + { + "epoch": 1.27, + "learning_rate": 1.2883511213024467e-06, + "loss": 0.6084, + "step": 49709 + }, + { + "epoch": 1.27, + "learning_rate": 1.2883246260478436e-06, + "loss": 0.5723, + "step": 49710 + }, + { + "epoch": 1.27, + "learning_rate": 1.2882981305724831e-06, + "loss": 0.793, + "step": 49711 + }, + { + "epoch": 1.27, + "learning_rate": 1.2882716348763863e-06, + "loss": 0.7373, + "step": 49712 + }, + { + "epoch": 1.27, + "learning_rate": 1.288245138959573e-06, + "loss": 0.6377, + "step": 49713 + }, + { + "epoch": 1.27, + "learning_rate": 1.2882186428220638e-06, + "loss": 0.5889, + "step": 49714 + }, + { + "epoch": 1.27, + "learning_rate": 1.2881921464638788e-06, + "loss": 0.7451, + "step": 49715 + }, + { + "epoch": 1.27, + "learning_rate": 1.2881656498850383e-06, + "loss": 0.6963, + "step": 49716 + }, + { + "epoch": 1.27, + "learning_rate": 1.2881391530855622e-06, + "loss": 0.6099, + "step": 49717 + }, + { + "epoch": 1.27, + "learning_rate": 1.2881126560654718e-06, + "loss": 0.7178, + "step": 49718 + }, + { + "epoch": 1.27, + "learning_rate": 1.2880861588247867e-06, + "loss": 0.6621, + "step": 49719 + }, + { + "epoch": 1.27, + "learning_rate": 1.2880596613635274e-06, + "loss": 0.6724, + "step": 49720 + }, + { + "epoch": 1.27, + "learning_rate": 1.2880331636817134e-06, + "loss": 0.5742, + "step": 49721 + }, + { + "epoch": 1.27, + "learning_rate": 1.2880066657793662e-06, + "loss": 0.6631, + "step": 49722 + }, + { + "epoch": 1.27, + "learning_rate": 1.2879801676565051e-06, + "loss": 0.7344, + "step": 49723 + }, + { + "epoch": 1.27, + "learning_rate": 1.2879536693131514e-06, + "loss": 0.6738, + "step": 49724 + }, + { + "epoch": 1.27, + "learning_rate": 1.2879271707493246e-06, + "loss": 0.593, + "step": 49725 + }, + { + "epoch": 1.27, + "learning_rate": 1.287900671965045e-06, + "loss": 0.7969, + "step": 49726 + }, + { + "epoch": 1.27, + "learning_rate": 1.2878741729603332e-06, + "loss": 0.792, + "step": 49727 + }, + { + "epoch": 1.27, + "learning_rate": 1.2878476737352096e-06, + "loss": 0.6572, + "step": 49728 + }, + { + "epoch": 1.27, + "learning_rate": 1.2878211742896943e-06, + "loss": 0.7041, + "step": 49729 + }, + { + "epoch": 1.27, + "learning_rate": 1.287794674623807e-06, + "loss": 0.6675, + "step": 49730 + }, + { + "epoch": 1.27, + "learning_rate": 1.2877681747375691e-06, + "loss": 0.7412, + "step": 49731 + }, + { + "epoch": 1.27, + "learning_rate": 1.2877416746309999e-06, + "loss": 0.5791, + "step": 49732 + }, + { + "epoch": 1.27, + "learning_rate": 1.2877151743041206e-06, + "loss": 0.5928, + "step": 49733 + }, + { + "epoch": 1.27, + "learning_rate": 1.2876886737569508e-06, + "loss": 0.7656, + "step": 49734 + }, + { + "epoch": 1.27, + "learning_rate": 1.2876621729895113e-06, + "loss": 0.7637, + "step": 49735 + }, + { + "epoch": 1.27, + "learning_rate": 1.2876356720018215e-06, + "loss": 0.6108, + "step": 49736 + }, + { + "epoch": 1.27, + "learning_rate": 1.2876091707939028e-06, + "loss": 0.8789, + "step": 49737 + }, + { + "epoch": 1.27, + "learning_rate": 1.2875826693657745e-06, + "loss": 0.707, + "step": 49738 + }, + { + "epoch": 1.27, + "learning_rate": 1.287556167717458e-06, + "loss": 0.4795, + "step": 49739 + }, + { + "epoch": 1.27, + "learning_rate": 1.2875296658489725e-06, + "loss": 0.7422, + "step": 49740 + }, + { + "epoch": 1.27, + "learning_rate": 1.2875031637603388e-06, + "loss": 0.6218, + "step": 49741 + }, + { + "epoch": 1.27, + "learning_rate": 1.2874766614515773e-06, + "loss": 0.5718, + "step": 49742 + }, + { + "epoch": 1.27, + "learning_rate": 1.287450158922708e-06, + "loss": 0.5576, + "step": 49743 + }, + { + "epoch": 1.27, + "learning_rate": 1.2874236561737514e-06, + "loss": 0.5449, + "step": 49744 + }, + { + "epoch": 1.27, + "learning_rate": 1.2873971532047278e-06, + "loss": 0.6826, + "step": 49745 + }, + { + "epoch": 1.28, + "learning_rate": 1.2873706500156574e-06, + "loss": 0.7773, + "step": 49746 + }, + { + "epoch": 1.28, + "learning_rate": 1.2873441466065605e-06, + "loss": 0.75, + "step": 49747 + }, + { + "epoch": 1.28, + "learning_rate": 1.2873176429774572e-06, + "loss": 0.6318, + "step": 49748 + }, + { + "epoch": 1.28, + "learning_rate": 1.2872911391283681e-06, + "loss": 0.7598, + "step": 49749 + }, + { + "epoch": 1.28, + "learning_rate": 1.2872646350593136e-06, + "loss": 0.5991, + "step": 49750 + }, + { + "epoch": 1.28, + "learning_rate": 1.2872381307703135e-06, + "loss": 0.4819, + "step": 49751 + }, + { + "epoch": 1.28, + "learning_rate": 1.2872116262613886e-06, + "loss": 0.5859, + "step": 49752 + }, + { + "epoch": 1.28, + "learning_rate": 1.2871851215325587e-06, + "loss": 0.7891, + "step": 49753 + }, + { + "epoch": 1.28, + "learning_rate": 1.2871586165838445e-06, + "loss": 0.666, + "step": 49754 + }, + { + "epoch": 1.28, + "learning_rate": 1.287132111415266e-06, + "loss": 0.6582, + "step": 49755 + }, + { + "epoch": 1.28, + "learning_rate": 1.2871056060268439e-06, + "loss": 0.6025, + "step": 49756 + }, + { + "epoch": 1.28, + "learning_rate": 1.287079100418598e-06, + "loss": 0.7744, + "step": 49757 + }, + { + "epoch": 1.28, + "learning_rate": 1.287052594590549e-06, + "loss": 0.5859, + "step": 49758 + }, + { + "epoch": 1.28, + "learning_rate": 1.2870260885427172e-06, + "loss": 0.6421, + "step": 49759 + }, + { + "epoch": 1.28, + "learning_rate": 1.2869995822751225e-06, + "loss": 0.8018, + "step": 49760 + }, + { + "epoch": 1.28, + "learning_rate": 1.2869730757877853e-06, + "loss": 0.6431, + "step": 49761 + }, + { + "epoch": 1.28, + "learning_rate": 1.2869465690807262e-06, + "loss": 0.75, + "step": 49762 + }, + { + "epoch": 1.28, + "learning_rate": 1.286920062153965e-06, + "loss": 0.7363, + "step": 49763 + }, + { + "epoch": 1.28, + "learning_rate": 1.286893555007523e-06, + "loss": 0.625, + "step": 49764 + }, + { + "epoch": 1.28, + "learning_rate": 1.2868670476414192e-06, + "loss": 0.6636, + "step": 49765 + }, + { + "epoch": 1.28, + "learning_rate": 1.2868405400556746e-06, + "loss": 0.7002, + "step": 49766 + }, + { + "epoch": 1.28, + "learning_rate": 1.2868140322503094e-06, + "loss": 0.5559, + "step": 49767 + }, + { + "epoch": 1.28, + "learning_rate": 1.286787524225344e-06, + "loss": 0.6738, + "step": 49768 + }, + { + "epoch": 1.28, + "learning_rate": 1.2867610159807986e-06, + "loss": 0.6934, + "step": 49769 + }, + { + "epoch": 1.28, + "learning_rate": 1.286734507516693e-06, + "loss": 0.54, + "step": 49770 + }, + { + "epoch": 1.28, + "learning_rate": 1.2867079988330485e-06, + "loss": 0.6631, + "step": 49771 + }, + { + "epoch": 1.28, + "learning_rate": 1.2866814899298848e-06, + "loss": 0.6289, + "step": 49772 + }, + { + "epoch": 1.28, + "learning_rate": 1.286654980807222e-06, + "loss": 0.5378, + "step": 49773 + }, + { + "epoch": 1.28, + "learning_rate": 1.2866284714650807e-06, + "loss": 0.5537, + "step": 49774 + }, + { + "epoch": 1.28, + "learning_rate": 1.2866019619034817e-06, + "loss": 0.8145, + "step": 49775 + }, + { + "epoch": 1.28, + "learning_rate": 1.286575452122444e-06, + "loss": 0.6689, + "step": 49776 + }, + { + "epoch": 1.28, + "learning_rate": 1.286548942121989e-06, + "loss": 0.6719, + "step": 49777 + }, + { + "epoch": 1.28, + "learning_rate": 1.2865224319021365e-06, + "loss": 0.4871, + "step": 49778 + }, + { + "epoch": 1.28, + "learning_rate": 1.2864959214629073e-06, + "loss": 0.6719, + "step": 49779 + }, + { + "epoch": 1.28, + "learning_rate": 1.286469410804321e-06, + "loss": 0.6685, + "step": 49780 + }, + { + "epoch": 1.28, + "learning_rate": 1.2864428999263988e-06, + "loss": 0.6738, + "step": 49781 + }, + { + "epoch": 1.28, + "learning_rate": 1.2864163888291597e-06, + "loss": 0.5723, + "step": 49782 + }, + { + "epoch": 1.28, + "learning_rate": 1.286389877512625e-06, + "loss": 0.5361, + "step": 49783 + }, + { + "epoch": 1.28, + "learning_rate": 1.2863633659768152e-06, + "loss": 0.4668, + "step": 49784 + }, + { + "epoch": 1.28, + "learning_rate": 1.2863368542217496e-06, + "loss": 0.5688, + "step": 49785 + }, + { + "epoch": 1.28, + "learning_rate": 1.2863103422474491e-06, + "loss": 0.8076, + "step": 49786 + }, + { + "epoch": 1.28, + "learning_rate": 1.286283830053934e-06, + "loss": 0.6357, + "step": 49787 + }, + { + "epoch": 1.28, + "learning_rate": 1.2862573176412248e-06, + "loss": 0.6621, + "step": 49788 + }, + { + "epoch": 1.28, + "learning_rate": 1.2862308050093414e-06, + "loss": 0.6963, + "step": 49789 + }, + { + "epoch": 1.28, + "learning_rate": 1.2862042921583039e-06, + "loss": 0.4126, + "step": 49790 + }, + { + "epoch": 1.28, + "learning_rate": 1.2861777790881332e-06, + "loss": 0.6396, + "step": 49791 + }, + { + "epoch": 1.28, + "learning_rate": 1.286151265798849e-06, + "loss": 0.5747, + "step": 49792 + }, + { + "epoch": 1.28, + "learning_rate": 1.2861247522904724e-06, + "loss": 0.4932, + "step": 49793 + }, + { + "epoch": 1.28, + "learning_rate": 1.286098238563023e-06, + "loss": 0.752, + "step": 49794 + }, + { + "epoch": 1.28, + "learning_rate": 1.2860717246165214e-06, + "loss": 0.7275, + "step": 49795 + }, + { + "epoch": 1.28, + "learning_rate": 1.2860452104509878e-06, + "loss": 0.6875, + "step": 49796 + }, + { + "epoch": 1.28, + "learning_rate": 1.2860186960664424e-06, + "loss": 0.6084, + "step": 49797 + }, + { + "epoch": 1.28, + "learning_rate": 1.2859921814629062e-06, + "loss": 0.6357, + "step": 49798 + }, + { + "epoch": 1.28, + "learning_rate": 1.2859656666403984e-06, + "loss": 0.6064, + "step": 49799 + }, + { + "epoch": 1.28, + "learning_rate": 1.28593915159894e-06, + "loss": 0.5889, + "step": 49800 + }, + { + "epoch": 1.28, + "learning_rate": 1.285912636338551e-06, + "loss": 0.7715, + "step": 49801 + }, + { + "epoch": 1.28, + "learning_rate": 1.285886120859252e-06, + "loss": 0.5679, + "step": 49802 + }, + { + "epoch": 1.28, + "learning_rate": 1.2858596051610633e-06, + "loss": 0.7705, + "step": 49803 + }, + { + "epoch": 1.28, + "learning_rate": 1.2858330892440049e-06, + "loss": 0.6284, + "step": 49804 + }, + { + "epoch": 1.28, + "learning_rate": 1.285806573108097e-06, + "loss": 0.8154, + "step": 49805 + }, + { + "epoch": 1.28, + "learning_rate": 1.2857800567533603e-06, + "loss": 0.5837, + "step": 49806 + }, + { + "epoch": 1.28, + "learning_rate": 1.2857535401798148e-06, + "loss": 0.6807, + "step": 49807 + }, + { + "epoch": 1.28, + "learning_rate": 1.2857270233874815e-06, + "loss": 0.4802, + "step": 49808 + }, + { + "epoch": 1.28, + "learning_rate": 1.2857005063763797e-06, + "loss": 0.6543, + "step": 49809 + }, + { + "epoch": 1.28, + "learning_rate": 1.2856739891465302e-06, + "loss": 0.7222, + "step": 49810 + }, + { + "epoch": 1.28, + "learning_rate": 1.2856474716979532e-06, + "loss": 0.6914, + "step": 49811 + }, + { + "epoch": 1.28, + "learning_rate": 1.2856209540306694e-06, + "loss": 0.7461, + "step": 49812 + }, + { + "epoch": 1.28, + "learning_rate": 1.2855944361446984e-06, + "loss": 0.6636, + "step": 49813 + }, + { + "epoch": 1.28, + "learning_rate": 1.285567918040061e-06, + "loss": 0.6221, + "step": 49814 + }, + { + "epoch": 1.28, + "learning_rate": 1.2855413997167774e-06, + "loss": 0.4624, + "step": 49815 + }, + { + "epoch": 1.28, + "learning_rate": 1.2855148811748677e-06, + "loss": 0.5581, + "step": 49816 + }, + { + "epoch": 1.28, + "learning_rate": 1.2854883624143526e-06, + "loss": 0.6094, + "step": 49817 + }, + { + "epoch": 1.28, + "learning_rate": 1.2854618434352525e-06, + "loss": 0.7402, + "step": 49818 + }, + { + "epoch": 1.28, + "learning_rate": 1.285435324237587e-06, + "loss": 0.6216, + "step": 49819 + }, + { + "epoch": 1.28, + "learning_rate": 1.2854088048213767e-06, + "loss": 0.6816, + "step": 49820 + }, + { + "epoch": 1.28, + "learning_rate": 1.285382285186642e-06, + "loss": 0.5857, + "step": 49821 + }, + { + "epoch": 1.28, + "learning_rate": 1.2853557653334033e-06, + "loss": 0.6709, + "step": 49822 + }, + { + "epoch": 1.28, + "learning_rate": 1.285329245261681e-06, + "loss": 0.6147, + "step": 49823 + }, + { + "epoch": 1.28, + "learning_rate": 1.2853027249714953e-06, + "loss": 0.4081, + "step": 49824 + }, + { + "epoch": 1.28, + "learning_rate": 1.2852762044628663e-06, + "loss": 0.5205, + "step": 49825 + }, + { + "epoch": 1.28, + "learning_rate": 1.285249683735814e-06, + "loss": 0.7876, + "step": 49826 + }, + { + "epoch": 1.28, + "learning_rate": 1.2852231627903596e-06, + "loss": 0.7324, + "step": 49827 + }, + { + "epoch": 1.28, + "learning_rate": 1.2851966416265227e-06, + "loss": 0.4612, + "step": 49828 + }, + { + "epoch": 1.28, + "learning_rate": 1.2851701202443241e-06, + "loss": 0.3921, + "step": 49829 + }, + { + "epoch": 1.28, + "learning_rate": 1.2851435986437835e-06, + "loss": 0.7734, + "step": 49830 + }, + { + "epoch": 1.28, + "learning_rate": 1.2851170768249219e-06, + "loss": 0.5693, + "step": 49831 + }, + { + "epoch": 1.28, + "learning_rate": 1.2850905547877589e-06, + "loss": 0.6699, + "step": 49832 + }, + { + "epoch": 1.28, + "learning_rate": 1.2850640325323155e-06, + "loss": 0.394, + "step": 49833 + }, + { + "epoch": 1.28, + "learning_rate": 1.2850375100586118e-06, + "loss": 0.5972, + "step": 49834 + }, + { + "epoch": 1.28, + "learning_rate": 1.2850109873666678e-06, + "loss": 0.5542, + "step": 49835 + }, + { + "epoch": 1.28, + "learning_rate": 1.2849844644565035e-06, + "loss": 0.6157, + "step": 49836 + }, + { + "epoch": 1.28, + "learning_rate": 1.2849579413281403e-06, + "loss": 0.6855, + "step": 49837 + }, + { + "epoch": 1.28, + "learning_rate": 1.284931417981598e-06, + "loss": 0.6787, + "step": 49838 + }, + { + "epoch": 1.28, + "learning_rate": 1.2849048944168962e-06, + "loss": 0.6121, + "step": 49839 + }, + { + "epoch": 1.28, + "learning_rate": 1.2848783706340563e-06, + "loss": 0.5029, + "step": 49840 + }, + { + "epoch": 1.28, + "learning_rate": 1.284851846633098e-06, + "loss": 0.6777, + "step": 49841 + }, + { + "epoch": 1.28, + "learning_rate": 1.2848253224140417e-06, + "loss": 0.5457, + "step": 49842 + }, + { + "epoch": 1.28, + "learning_rate": 1.284798797976908e-06, + "loss": 0.6792, + "step": 49843 + }, + { + "epoch": 1.28, + "learning_rate": 1.2847722733217167e-06, + "loss": 0.6387, + "step": 49844 + }, + { + "epoch": 1.28, + "learning_rate": 1.2847457484484882e-06, + "loss": 0.7607, + "step": 49845 + }, + { + "epoch": 1.28, + "learning_rate": 1.2847192233572433e-06, + "loss": 0.666, + "step": 49846 + }, + { + "epoch": 1.28, + "learning_rate": 1.2846926980480017e-06, + "loss": 0.6318, + "step": 49847 + }, + { + "epoch": 1.28, + "learning_rate": 1.2846661725207845e-06, + "loss": 0.7119, + "step": 49848 + }, + { + "epoch": 1.28, + "learning_rate": 1.2846396467756111e-06, + "loss": 0.5203, + "step": 49849 + }, + { + "epoch": 1.28, + "learning_rate": 1.2846131208125025e-06, + "loss": 0.5244, + "step": 49850 + }, + { + "epoch": 1.28, + "learning_rate": 1.2845865946314783e-06, + "loss": 0.5896, + "step": 49851 + }, + { + "epoch": 1.28, + "learning_rate": 1.2845600682325594e-06, + "loss": 0.6904, + "step": 49852 + }, + { + "epoch": 1.28, + "learning_rate": 1.284533541615766e-06, + "loss": 0.5938, + "step": 49853 + }, + { + "epoch": 1.28, + "learning_rate": 1.2845070147811185e-06, + "loss": 0.6582, + "step": 49854 + }, + { + "epoch": 1.28, + "learning_rate": 1.2844804877286368e-06, + "loss": 0.5713, + "step": 49855 + }, + { + "epoch": 1.28, + "learning_rate": 1.2844539604583416e-06, + "loss": 0.5635, + "step": 49856 + }, + { + "epoch": 1.28, + "learning_rate": 1.2844274329702529e-06, + "loss": 0.7539, + "step": 49857 + }, + { + "epoch": 1.28, + "learning_rate": 1.2844009052643913e-06, + "loss": 0.7617, + "step": 49858 + }, + { + "epoch": 1.28, + "learning_rate": 1.284374377340777e-06, + "loss": 0.5737, + "step": 49859 + }, + { + "epoch": 1.28, + "learning_rate": 1.2843478491994305e-06, + "loss": 0.6855, + "step": 49860 + }, + { + "epoch": 1.28, + "learning_rate": 1.2843213208403716e-06, + "loss": 0.6768, + "step": 49861 + }, + { + "epoch": 1.28, + "learning_rate": 1.2842947922636213e-06, + "loss": 0.8887, + "step": 49862 + }, + { + "epoch": 1.28, + "learning_rate": 1.2842682634691992e-06, + "loss": 0.5845, + "step": 49863 + }, + { + "epoch": 1.28, + "learning_rate": 1.2842417344571262e-06, + "loss": 0.5557, + "step": 49864 + }, + { + "epoch": 1.28, + "learning_rate": 1.2842152052274221e-06, + "loss": 0.7861, + "step": 49865 + }, + { + "epoch": 1.28, + "learning_rate": 1.2841886757801076e-06, + "loss": 0.4514, + "step": 49866 + }, + { + "epoch": 1.28, + "learning_rate": 1.2841621461152033e-06, + "loss": 0.4895, + "step": 49867 + }, + { + "epoch": 1.28, + "learning_rate": 1.2841356162327288e-06, + "loss": 0.7759, + "step": 49868 + }, + { + "epoch": 1.28, + "learning_rate": 1.284109086132705e-06, + "loss": 0.627, + "step": 49869 + }, + { + "epoch": 1.28, + "learning_rate": 1.2840825558151513e-06, + "loss": 0.7148, + "step": 49870 + }, + { + "epoch": 1.28, + "learning_rate": 1.2840560252800892e-06, + "loss": 0.7725, + "step": 49871 + }, + { + "epoch": 1.28, + "learning_rate": 1.284029494527538e-06, + "loss": 0.5452, + "step": 49872 + }, + { + "epoch": 1.28, + "learning_rate": 1.2840029635575192e-06, + "loss": 0.8066, + "step": 49873 + }, + { + "epoch": 1.28, + "learning_rate": 1.2839764323700517e-06, + "loss": 0.7764, + "step": 49874 + }, + { + "epoch": 1.28, + "learning_rate": 1.2839499009651566e-06, + "loss": 0.6753, + "step": 49875 + }, + { + "epoch": 1.28, + "learning_rate": 1.2839233693428542e-06, + "loss": 0.5427, + "step": 49876 + }, + { + "epoch": 1.28, + "learning_rate": 1.2838968375031649e-06, + "loss": 0.7754, + "step": 49877 + }, + { + "epoch": 1.28, + "learning_rate": 1.2838703054461086e-06, + "loss": 0.5815, + "step": 49878 + }, + { + "epoch": 1.28, + "learning_rate": 1.2838437731717062e-06, + "loss": 0.5015, + "step": 49879 + }, + { + "epoch": 1.28, + "learning_rate": 1.2838172406799773e-06, + "loss": 0.47, + "step": 49880 + }, + { + "epoch": 1.28, + "learning_rate": 1.2837907079709428e-06, + "loss": 0.4756, + "step": 49881 + }, + { + "epoch": 1.28, + "learning_rate": 1.2837641750446226e-06, + "loss": 0.6943, + "step": 49882 + }, + { + "epoch": 1.28, + "learning_rate": 1.2837376419010376e-06, + "loss": 0.5991, + "step": 49883 + }, + { + "epoch": 1.28, + "learning_rate": 1.2837111085402075e-06, + "loss": 0.6172, + "step": 49884 + }, + { + "epoch": 1.28, + "learning_rate": 1.2836845749621528e-06, + "loss": 0.8359, + "step": 49885 + }, + { + "epoch": 1.28, + "learning_rate": 1.283658041166894e-06, + "loss": 0.5288, + "step": 49886 + }, + { + "epoch": 1.28, + "learning_rate": 1.283631507154451e-06, + "loss": 0.6914, + "step": 49887 + }, + { + "epoch": 1.28, + "learning_rate": 1.283604972924845e-06, + "loss": 0.6387, + "step": 49888 + }, + { + "epoch": 1.28, + "learning_rate": 1.283578438478095e-06, + "loss": 0.5308, + "step": 49889 + }, + { + "epoch": 1.28, + "learning_rate": 1.2835519038142225e-06, + "loss": 0.6431, + "step": 49890 + }, + { + "epoch": 1.28, + "learning_rate": 1.2835253689332471e-06, + "loss": 0.6768, + "step": 49891 + }, + { + "epoch": 1.28, + "learning_rate": 1.2834988338351895e-06, + "loss": 0.6968, + "step": 49892 + }, + { + "epoch": 1.28, + "learning_rate": 1.28347229852007e-06, + "loss": 0.6943, + "step": 49893 + }, + { + "epoch": 1.28, + "learning_rate": 1.2834457629879086e-06, + "loss": 0.7607, + "step": 49894 + }, + { + "epoch": 1.28, + "learning_rate": 1.2834192272387257e-06, + "loss": 0.7256, + "step": 49895 + }, + { + "epoch": 1.28, + "learning_rate": 1.2833926912725419e-06, + "loss": 0.5615, + "step": 49896 + }, + { + "epoch": 1.28, + "learning_rate": 1.283366155089377e-06, + "loss": 0.6772, + "step": 49897 + }, + { + "epoch": 1.28, + "learning_rate": 1.2833396186892525e-06, + "loss": 0.6592, + "step": 49898 + }, + { + "epoch": 1.28, + "learning_rate": 1.2833130820721872e-06, + "loss": 0.5435, + "step": 49899 + }, + { + "epoch": 1.28, + "learning_rate": 1.2832865452382022e-06, + "loss": 0.7461, + "step": 49900 + }, + { + "epoch": 1.28, + "learning_rate": 1.2832600081873178e-06, + "loss": 0.6357, + "step": 49901 + }, + { + "epoch": 1.28, + "learning_rate": 1.2832334709195541e-06, + "loss": 0.7031, + "step": 49902 + }, + { + "epoch": 1.28, + "learning_rate": 1.2832069334349318e-06, + "loss": 0.7686, + "step": 49903 + }, + { + "epoch": 1.28, + "learning_rate": 1.2831803957334706e-06, + "loss": 0.5229, + "step": 49904 + }, + { + "epoch": 1.28, + "learning_rate": 1.2831538578151918e-06, + "loss": 0.6611, + "step": 49905 + }, + { + "epoch": 1.28, + "learning_rate": 1.2831273196801145e-06, + "loss": 0.5488, + "step": 49906 + }, + { + "epoch": 1.28, + "learning_rate": 1.28310078132826e-06, + "loss": 0.6577, + "step": 49907 + }, + { + "epoch": 1.28, + "learning_rate": 1.283074242759648e-06, + "loss": 0.5508, + "step": 49908 + }, + { + "epoch": 1.28, + "learning_rate": 1.2830477039742992e-06, + "loss": 0.8721, + "step": 49909 + }, + { + "epoch": 1.28, + "learning_rate": 1.2830211649722337e-06, + "loss": 0.6919, + "step": 49910 + }, + { + "epoch": 1.28, + "learning_rate": 1.2829946257534721e-06, + "loss": 0.8428, + "step": 49911 + }, + { + "epoch": 1.28, + "learning_rate": 1.2829680863180343e-06, + "loss": 0.5513, + "step": 49912 + }, + { + "epoch": 1.28, + "learning_rate": 1.2829415466659413e-06, + "loss": 0.6396, + "step": 49913 + }, + { + "epoch": 1.28, + "learning_rate": 1.2829150067972124e-06, + "loss": 0.5923, + "step": 49914 + }, + { + "epoch": 1.28, + "learning_rate": 1.2828884667118688e-06, + "loss": 0.6934, + "step": 49915 + }, + { + "epoch": 1.28, + "learning_rate": 1.2828619264099303e-06, + "loss": 0.5366, + "step": 49916 + }, + { + "epoch": 1.28, + "learning_rate": 1.2828353858914176e-06, + "loss": 0.455, + "step": 49917 + }, + { + "epoch": 1.28, + "learning_rate": 1.2828088451563509e-06, + "loss": 0.623, + "step": 49918 + }, + { + "epoch": 1.28, + "learning_rate": 1.2827823042047503e-06, + "loss": 0.71, + "step": 49919 + }, + { + "epoch": 1.28, + "learning_rate": 1.2827557630366363e-06, + "loss": 0.7852, + "step": 49920 + }, + { + "epoch": 1.28, + "learning_rate": 1.2827292216520293e-06, + "loss": 0.6753, + "step": 49921 + }, + { + "epoch": 1.28, + "learning_rate": 1.2827026800509495e-06, + "loss": 0.7461, + "step": 49922 + }, + { + "epoch": 1.28, + "learning_rate": 1.2826761382334171e-06, + "loss": 0.6675, + "step": 49923 + }, + { + "epoch": 1.28, + "learning_rate": 1.282649596199453e-06, + "loss": 0.748, + "step": 49924 + }, + { + "epoch": 1.28, + "learning_rate": 1.282623053949077e-06, + "loss": 0.5815, + "step": 49925 + }, + { + "epoch": 1.28, + "learning_rate": 1.2825965114823092e-06, + "loss": 0.708, + "step": 49926 + }, + { + "epoch": 1.28, + "learning_rate": 1.2825699687991704e-06, + "loss": 0.5786, + "step": 49927 + }, + { + "epoch": 1.28, + "learning_rate": 1.282543425899681e-06, + "loss": 0.4429, + "step": 49928 + }, + { + "epoch": 1.28, + "learning_rate": 1.2825168827838609e-06, + "loss": 0.7998, + "step": 49929 + }, + { + "epoch": 1.28, + "learning_rate": 1.2824903394517303e-06, + "loss": 0.8447, + "step": 49930 + }, + { + "epoch": 1.28, + "learning_rate": 1.2824637959033103e-06, + "loss": 0.5669, + "step": 49931 + }, + { + "epoch": 1.28, + "learning_rate": 1.2824372521386204e-06, + "loss": 0.5723, + "step": 49932 + }, + { + "epoch": 1.28, + "learning_rate": 1.2824107081576816e-06, + "loss": 0.8623, + "step": 49933 + }, + { + "epoch": 1.28, + "learning_rate": 1.282384163960514e-06, + "loss": 0.7285, + "step": 49934 + }, + { + "epoch": 1.28, + "learning_rate": 1.2823576195471372e-06, + "loss": 0.4231, + "step": 49935 + }, + { + "epoch": 1.28, + "learning_rate": 1.2823310749175728e-06, + "loss": 0.6484, + "step": 49936 + }, + { + "epoch": 1.28, + "learning_rate": 1.28230453007184e-06, + "loss": 0.5164, + "step": 49937 + }, + { + "epoch": 1.28, + "learning_rate": 1.2822779850099603e-06, + "loss": 0.6992, + "step": 49938 + }, + { + "epoch": 1.28, + "learning_rate": 1.2822514397319526e-06, + "loss": 0.7793, + "step": 49939 + }, + { + "epoch": 1.28, + "learning_rate": 1.2822248942378385e-06, + "loss": 0.4881, + "step": 49940 + }, + { + "epoch": 1.28, + "learning_rate": 1.282198348527637e-06, + "loss": 0.5269, + "step": 49941 + }, + { + "epoch": 1.28, + "learning_rate": 1.2821718026013699e-06, + "loss": 0.6719, + "step": 49942 + }, + { + "epoch": 1.28, + "learning_rate": 1.2821452564590567e-06, + "loss": 0.6318, + "step": 49943 + }, + { + "epoch": 1.28, + "learning_rate": 1.2821187101007178e-06, + "loss": 0.7061, + "step": 49944 + }, + { + "epoch": 1.28, + "learning_rate": 1.2820921635263734e-06, + "loss": 0.6992, + "step": 49945 + }, + { + "epoch": 1.28, + "learning_rate": 1.2820656167360445e-06, + "loss": 0.6565, + "step": 49946 + }, + { + "epoch": 1.28, + "learning_rate": 1.2820390697297504e-06, + "loss": 0.6592, + "step": 49947 + }, + { + "epoch": 1.28, + "learning_rate": 1.282012522507512e-06, + "loss": 0.6597, + "step": 49948 + }, + { + "epoch": 1.28, + "learning_rate": 1.2819859750693498e-06, + "loss": 0.6982, + "step": 49949 + }, + { + "epoch": 1.28, + "learning_rate": 1.2819594274152836e-06, + "loss": 0.645, + "step": 49950 + }, + { + "epoch": 1.28, + "learning_rate": 1.2819328795453345e-06, + "loss": 0.7402, + "step": 49951 + }, + { + "epoch": 1.28, + "learning_rate": 1.2819063314595223e-06, + "loss": 0.8701, + "step": 49952 + }, + { + "epoch": 1.28, + "learning_rate": 1.2818797831578672e-06, + "loss": 0.6465, + "step": 49953 + }, + { + "epoch": 1.28, + "learning_rate": 1.2818532346403895e-06, + "loss": 0.5757, + "step": 49954 + }, + { + "epoch": 1.28, + "learning_rate": 1.28182668590711e-06, + "loss": 0.6147, + "step": 49955 + }, + { + "epoch": 1.28, + "learning_rate": 1.2818001369580485e-06, + "loss": 0.8213, + "step": 49956 + }, + { + "epoch": 1.28, + "learning_rate": 1.2817735877932258e-06, + "loss": 0.8105, + "step": 49957 + }, + { + "epoch": 1.28, + "learning_rate": 1.281747038412662e-06, + "loss": 0.605, + "step": 49958 + }, + { + "epoch": 1.28, + "learning_rate": 1.2817204888163777e-06, + "loss": 0.6611, + "step": 49959 + }, + { + "epoch": 1.28, + "learning_rate": 1.2816939390043926e-06, + "loss": 0.7173, + "step": 49960 + }, + { + "epoch": 1.28, + "learning_rate": 1.2816673889767275e-06, + "loss": 0.8154, + "step": 49961 + }, + { + "epoch": 1.28, + "learning_rate": 1.2816408387334025e-06, + "loss": 0.7832, + "step": 49962 + }, + { + "epoch": 1.28, + "learning_rate": 1.2816142882744388e-06, + "loss": 0.5881, + "step": 49963 + }, + { + "epoch": 1.28, + "learning_rate": 1.2815877375998552e-06, + "loss": 0.7051, + "step": 49964 + }, + { + "epoch": 1.28, + "learning_rate": 1.281561186709673e-06, + "loss": 0.8047, + "step": 49965 + }, + { + "epoch": 1.28, + "learning_rate": 1.2815346356039124e-06, + "loss": 0.6016, + "step": 49966 + }, + { + "epoch": 1.28, + "learning_rate": 1.2815080842825935e-06, + "loss": 0.7529, + "step": 49967 + }, + { + "epoch": 1.28, + "learning_rate": 1.2814815327457372e-06, + "loss": 0.7275, + "step": 49968 + }, + { + "epoch": 1.28, + "learning_rate": 1.2814549809933633e-06, + "loss": 0.4721, + "step": 49969 + }, + { + "epoch": 1.28, + "learning_rate": 1.281428429025492e-06, + "loss": 0.7812, + "step": 49970 + }, + { + "epoch": 1.28, + "learning_rate": 1.281401876842144e-06, + "loss": 0.6235, + "step": 49971 + }, + { + "epoch": 1.28, + "learning_rate": 1.2813753244433394e-06, + "loss": 0.8057, + "step": 49972 + }, + { + "epoch": 1.28, + "learning_rate": 1.281348771829099e-06, + "loss": 0.5473, + "step": 49973 + }, + { + "epoch": 1.28, + "learning_rate": 1.2813222189994426e-06, + "loss": 0.5754, + "step": 49974 + }, + { + "epoch": 1.28, + "learning_rate": 1.2812956659543905e-06, + "loss": 0.4833, + "step": 49975 + }, + { + "epoch": 1.28, + "learning_rate": 1.2812691126939636e-06, + "loss": 0.6782, + "step": 49976 + }, + { + "epoch": 1.28, + "learning_rate": 1.2812425592181817e-06, + "loss": 0.6738, + "step": 49977 + }, + { + "epoch": 1.28, + "learning_rate": 1.2812160055270655e-06, + "loss": 0.5659, + "step": 49978 + }, + { + "epoch": 1.28, + "learning_rate": 1.2811894516206349e-06, + "loss": 0.623, + "step": 49979 + }, + { + "epoch": 1.28, + "learning_rate": 1.2811628974989106e-06, + "loss": 0.8408, + "step": 49980 + }, + { + "epoch": 1.28, + "learning_rate": 1.2811363431619126e-06, + "loss": 0.8096, + "step": 49981 + }, + { + "epoch": 1.28, + "learning_rate": 1.2811097886096617e-06, + "loss": 0.8076, + "step": 49982 + }, + { + "epoch": 1.28, + "learning_rate": 1.2810832338421777e-06, + "loss": 0.6675, + "step": 49983 + }, + { + "epoch": 1.28, + "learning_rate": 1.2810566788594815e-06, + "loss": 0.543, + "step": 49984 + }, + { + "epoch": 1.28, + "learning_rate": 1.2810301236615929e-06, + "loss": 0.8611, + "step": 49985 + }, + { + "epoch": 1.28, + "learning_rate": 1.2810035682485325e-06, + "loss": 0.7012, + "step": 49986 + }, + { + "epoch": 1.28, + "learning_rate": 1.2809770126203205e-06, + "loss": 0.6611, + "step": 49987 + }, + { + "epoch": 1.28, + "learning_rate": 1.2809504567769778e-06, + "loss": 0.6826, + "step": 49988 + }, + { + "epoch": 1.28, + "learning_rate": 1.2809239007185236e-06, + "loss": 0.7729, + "step": 49989 + }, + { + "epoch": 1.28, + "learning_rate": 1.280897344444979e-06, + "loss": 0.7529, + "step": 49990 + }, + { + "epoch": 1.28, + "learning_rate": 1.2808707879563645e-06, + "loss": 0.6372, + "step": 49991 + }, + { + "epoch": 1.28, + "learning_rate": 1.2808442312527001e-06, + "loss": 0.5225, + "step": 49992 + }, + { + "epoch": 1.28, + "learning_rate": 1.2808176743340063e-06, + "loss": 0.7949, + "step": 49993 + }, + { + "epoch": 1.28, + "learning_rate": 1.2807911172003027e-06, + "loss": 0.7002, + "step": 49994 + }, + { + "epoch": 1.28, + "learning_rate": 1.280764559851611e-06, + "loss": 0.5776, + "step": 49995 + }, + { + "epoch": 1.28, + "learning_rate": 1.2807380022879502e-06, + "loss": 0.8691, + "step": 49996 + }, + { + "epoch": 1.28, + "learning_rate": 1.2807114445093413e-06, + "loss": 0.6455, + "step": 49997 + }, + { + "epoch": 1.28, + "learning_rate": 1.280684886515805e-06, + "loss": 0.6733, + "step": 49998 + }, + { + "epoch": 1.28, + "learning_rate": 1.280658328307361e-06, + "loss": 0.6438, + "step": 49999 + }, + { + "epoch": 1.28, + "learning_rate": 1.2806317698840297e-06, + "loss": 0.4318, + "step": 50000 + }, + { + "epoch": 1.28, + "learning_rate": 1.2806052112458316e-06, + "loss": 0.6055, + "step": 50001 + }, + { + "epoch": 1.28, + "learning_rate": 1.2805786523927869e-06, + "loss": 0.6123, + "step": 50002 + }, + { + "epoch": 1.28, + "learning_rate": 1.2805520933249164e-06, + "loss": 0.5898, + "step": 50003 + }, + { + "epoch": 1.28, + "learning_rate": 1.2805255340422396e-06, + "loss": 0.5688, + "step": 50004 + }, + { + "epoch": 1.28, + "learning_rate": 1.2804989745447777e-06, + "loss": 0.7178, + "step": 50005 + }, + { + "epoch": 1.28, + "learning_rate": 1.2804724148325503e-06, + "loss": 0.6289, + "step": 50006 + }, + { + "epoch": 1.28, + "learning_rate": 1.2804458549055781e-06, + "loss": 0.564, + "step": 50007 + }, + { + "epoch": 1.28, + "learning_rate": 1.2804192947638816e-06, + "loss": 0.5579, + "step": 50008 + }, + { + "epoch": 1.28, + "learning_rate": 1.280392734407481e-06, + "loss": 0.6895, + "step": 50009 + }, + { + "epoch": 1.28, + "learning_rate": 1.2803661738363962e-06, + "loss": 0.6567, + "step": 50010 + }, + { + "epoch": 1.28, + "learning_rate": 1.2803396130506484e-06, + "loss": 0.7397, + "step": 50011 + }, + { + "epoch": 1.28, + "learning_rate": 1.280313052050257e-06, + "loss": 0.6379, + "step": 50012 + }, + { + "epoch": 1.28, + "learning_rate": 1.2802864908352428e-06, + "loss": 0.7109, + "step": 50013 + }, + { + "epoch": 1.28, + "learning_rate": 1.2802599294056264e-06, + "loss": 0.7236, + "step": 50014 + }, + { + "epoch": 1.28, + "learning_rate": 1.2802333677614278e-06, + "loss": 0.4922, + "step": 50015 + }, + { + "epoch": 1.28, + "learning_rate": 1.2802068059026674e-06, + "loss": 0.7051, + "step": 50016 + }, + { + "epoch": 1.28, + "learning_rate": 1.2801802438293654e-06, + "loss": 0.7998, + "step": 50017 + }, + { + "epoch": 1.28, + "learning_rate": 1.2801536815415423e-06, + "loss": 0.6426, + "step": 50018 + }, + { + "epoch": 1.28, + "learning_rate": 1.2801271190392185e-06, + "loss": 0.5845, + "step": 50019 + }, + { + "epoch": 1.28, + "learning_rate": 1.2801005563224141e-06, + "loss": 0.7568, + "step": 50020 + }, + { + "epoch": 1.28, + "learning_rate": 1.2800739933911495e-06, + "loss": 0.6973, + "step": 50021 + }, + { + "epoch": 1.28, + "learning_rate": 1.2800474302454455e-06, + "loss": 0.7236, + "step": 50022 + }, + { + "epoch": 1.28, + "learning_rate": 1.280020866885322e-06, + "loss": 0.8506, + "step": 50023 + }, + { + "epoch": 1.28, + "learning_rate": 1.2799943033107993e-06, + "loss": 0.8008, + "step": 50024 + }, + { + "epoch": 1.28, + "learning_rate": 1.2799677395218974e-06, + "loss": 0.603, + "step": 50025 + }, + { + "epoch": 1.28, + "learning_rate": 1.2799411755186378e-06, + "loss": 0.6621, + "step": 50026 + }, + { + "epoch": 1.28, + "learning_rate": 1.2799146113010395e-06, + "loss": 0.6377, + "step": 50027 + }, + { + "epoch": 1.28, + "learning_rate": 1.279888046869124e-06, + "loss": 0.6543, + "step": 50028 + }, + { + "epoch": 1.28, + "learning_rate": 1.2798614822229108e-06, + "loss": 0.5801, + "step": 50029 + }, + { + "epoch": 1.28, + "learning_rate": 1.2798349173624206e-06, + "loss": 0.5425, + "step": 50030 + }, + { + "epoch": 1.28, + "learning_rate": 1.2798083522876734e-06, + "loss": 0.709, + "step": 50031 + }, + { + "epoch": 1.28, + "learning_rate": 1.2797817869986902e-06, + "loss": 0.4893, + "step": 50032 + }, + { + "epoch": 1.28, + "learning_rate": 1.2797552214954907e-06, + "loss": 0.6509, + "step": 50033 + }, + { + "epoch": 1.28, + "learning_rate": 1.2797286557780958e-06, + "loss": 0.7119, + "step": 50034 + }, + { + "epoch": 1.28, + "learning_rate": 1.2797020898465252e-06, + "loss": 0.583, + "step": 50035 + }, + { + "epoch": 1.28, + "learning_rate": 1.2796755237007997e-06, + "loss": 0.708, + "step": 50036 + }, + { + "epoch": 1.28, + "learning_rate": 1.2796489573409393e-06, + "loss": 0.6382, + "step": 50037 + }, + { + "epoch": 1.28, + "learning_rate": 1.2796223907669647e-06, + "loss": 0.6763, + "step": 50038 + }, + { + "epoch": 1.28, + "learning_rate": 1.2795958239788965e-06, + "loss": 0.5918, + "step": 50039 + }, + { + "epoch": 1.28, + "learning_rate": 1.279569256976754e-06, + "loss": 0.7559, + "step": 50040 + }, + { + "epoch": 1.28, + "learning_rate": 1.2795426897605587e-06, + "loss": 0.5422, + "step": 50041 + }, + { + "epoch": 1.28, + "learning_rate": 1.27951612233033e-06, + "loss": 0.6523, + "step": 50042 + }, + { + "epoch": 1.28, + "learning_rate": 1.2794895546860889e-06, + "loss": 0.6226, + "step": 50043 + }, + { + "epoch": 1.28, + "learning_rate": 1.2794629868278553e-06, + "loss": 0.7617, + "step": 50044 + }, + { + "epoch": 1.28, + "learning_rate": 1.27943641875565e-06, + "loss": 0.6875, + "step": 50045 + }, + { + "epoch": 1.28, + "learning_rate": 1.2794098504694927e-06, + "loss": 0.79, + "step": 50046 + }, + { + "epoch": 1.28, + "learning_rate": 1.2793832819694044e-06, + "loss": 0.7734, + "step": 50047 + }, + { + "epoch": 1.28, + "learning_rate": 1.2793567132554052e-06, + "loss": 0.7744, + "step": 50048 + }, + { + "epoch": 1.28, + "learning_rate": 1.2793301443275155e-06, + "loss": 0.4707, + "step": 50049 + }, + { + "epoch": 1.28, + "learning_rate": 1.2793035751857553e-06, + "loss": 0.7441, + "step": 50050 + }, + { + "epoch": 1.28, + "learning_rate": 1.2792770058301451e-06, + "loss": 0.7266, + "step": 50051 + }, + { + "epoch": 1.28, + "learning_rate": 1.2792504362607055e-06, + "loss": 0.7637, + "step": 50052 + }, + { + "epoch": 1.28, + "learning_rate": 1.2792238664774572e-06, + "loss": 0.4741, + "step": 50053 + }, + { + "epoch": 1.28, + "learning_rate": 1.2791972964804192e-06, + "loss": 0.792, + "step": 50054 + }, + { + "epoch": 1.28, + "learning_rate": 1.2791707262696132e-06, + "loss": 0.7295, + "step": 50055 + }, + { + "epoch": 1.28, + "learning_rate": 1.2791441558450587e-06, + "loss": 0.6138, + "step": 50056 + }, + { + "epoch": 1.28, + "learning_rate": 1.2791175852067765e-06, + "loss": 0.7197, + "step": 50057 + }, + { + "epoch": 1.28, + "learning_rate": 1.279091014354787e-06, + "loss": 0.5908, + "step": 50058 + }, + { + "epoch": 1.28, + "learning_rate": 1.2790644432891098e-06, + "loss": 0.6147, + "step": 50059 + }, + { + "epoch": 1.28, + "learning_rate": 1.2790378720097662e-06, + "loss": 0.7842, + "step": 50060 + }, + { + "epoch": 1.28, + "learning_rate": 1.279011300516776e-06, + "loss": 0.6582, + "step": 50061 + }, + { + "epoch": 1.28, + "learning_rate": 1.2789847288101595e-06, + "loss": 0.7891, + "step": 50062 + }, + { + "epoch": 1.28, + "learning_rate": 1.2789581568899377e-06, + "loss": 0.5898, + "step": 50063 + }, + { + "epoch": 1.28, + "learning_rate": 1.2789315847561302e-06, + "loss": 0.7461, + "step": 50064 + }, + { + "epoch": 1.28, + "learning_rate": 1.2789050124087575e-06, + "loss": 0.6641, + "step": 50065 + }, + { + "epoch": 1.28, + "learning_rate": 1.2788784398478404e-06, + "loss": 0.498, + "step": 50066 + }, + { + "epoch": 1.28, + "learning_rate": 1.2788518670733983e-06, + "loss": 0.7939, + "step": 50067 + }, + { + "epoch": 1.28, + "learning_rate": 1.2788252940854527e-06, + "loss": 0.7988, + "step": 50068 + }, + { + "epoch": 1.28, + "learning_rate": 1.2787987208840233e-06, + "loss": 0.4325, + "step": 50069 + }, + { + "epoch": 1.28, + "learning_rate": 1.2787721474691305e-06, + "loss": 0.7939, + "step": 50070 + }, + { + "epoch": 1.28, + "learning_rate": 1.2787455738407943e-06, + "loss": 0.8105, + "step": 50071 + }, + { + "epoch": 1.28, + "learning_rate": 1.278718999999036e-06, + "loss": 0.6348, + "step": 50072 + }, + { + "epoch": 1.28, + "learning_rate": 1.2786924259438752e-06, + "loss": 0.7617, + "step": 50073 + }, + { + "epoch": 1.28, + "learning_rate": 1.2786658516753324e-06, + "loss": 0.7773, + "step": 50074 + }, + { + "epoch": 1.28, + "learning_rate": 1.2786392771934278e-06, + "loss": 0.7295, + "step": 50075 + }, + { + "epoch": 1.28, + "learning_rate": 1.278612702498182e-06, + "loss": 0.8125, + "step": 50076 + }, + { + "epoch": 1.28, + "learning_rate": 1.2785861275896153e-06, + "loss": 0.6606, + "step": 50077 + }, + { + "epoch": 1.28, + "learning_rate": 1.2785595524677485e-06, + "loss": 0.8027, + "step": 50078 + }, + { + "epoch": 1.28, + "learning_rate": 1.2785329771326005e-06, + "loss": 0.7734, + "step": 50079 + }, + { + "epoch": 1.28, + "learning_rate": 1.2785064015841933e-06, + "loss": 0.7319, + "step": 50080 + }, + { + "epoch": 1.28, + "learning_rate": 1.2784798258225462e-06, + "loss": 0.6514, + "step": 50081 + }, + { + "epoch": 1.28, + "learning_rate": 1.2784532498476801e-06, + "loss": 0.4204, + "step": 50082 + }, + { + "epoch": 1.28, + "learning_rate": 1.2784266736596153e-06, + "loss": 0.752, + "step": 50083 + }, + { + "epoch": 1.28, + "learning_rate": 1.2784000972583715e-06, + "loss": 0.549, + "step": 50084 + }, + { + "epoch": 1.28, + "learning_rate": 1.27837352064397e-06, + "loss": 0.5698, + "step": 50085 + }, + { + "epoch": 1.28, + "learning_rate": 1.2783469438164303e-06, + "loss": 0.6758, + "step": 50086 + }, + { + "epoch": 1.28, + "learning_rate": 1.2783203667757736e-06, + "loss": 0.5828, + "step": 50087 + }, + { + "epoch": 1.28, + "learning_rate": 1.2782937895220193e-06, + "loss": 0.7695, + "step": 50088 + }, + { + "epoch": 1.28, + "learning_rate": 1.2782672120551888e-06, + "loss": 0.6943, + "step": 50089 + }, + { + "epoch": 1.28, + "learning_rate": 1.2782406343753014e-06, + "loss": 0.5405, + "step": 50090 + }, + { + "epoch": 1.28, + "learning_rate": 1.2782140564823783e-06, + "loss": 0.5186, + "step": 50091 + }, + { + "epoch": 1.28, + "learning_rate": 1.2781874783764394e-06, + "loss": 0.6074, + "step": 50092 + }, + { + "epoch": 1.28, + "learning_rate": 1.278160900057505e-06, + "loss": 0.4954, + "step": 50093 + }, + { + "epoch": 1.28, + "learning_rate": 1.2781343215255958e-06, + "loss": 0.7197, + "step": 50094 + }, + { + "epoch": 1.28, + "learning_rate": 1.2781077427807319e-06, + "loss": 0.6704, + "step": 50095 + }, + { + "epoch": 1.28, + "learning_rate": 1.2780811638229332e-06, + "loss": 0.6201, + "step": 50096 + }, + { + "epoch": 1.28, + "learning_rate": 1.2780545846522212e-06, + "loss": 0.6602, + "step": 50097 + }, + { + "epoch": 1.28, + "learning_rate": 1.2780280052686152e-06, + "loss": 0.6426, + "step": 50098 + }, + { + "epoch": 1.28, + "learning_rate": 1.2780014256721364e-06, + "loss": 0.7034, + "step": 50099 + }, + { + "epoch": 1.28, + "learning_rate": 1.277974845862804e-06, + "loss": 0.6387, + "step": 50100 + }, + { + "epoch": 1.28, + "learning_rate": 1.2779482658406395e-06, + "loss": 0.6216, + "step": 50101 + }, + { + "epoch": 1.28, + "learning_rate": 1.2779216856056627e-06, + "loss": 0.7217, + "step": 50102 + }, + { + "epoch": 1.28, + "learning_rate": 1.277895105157894e-06, + "loss": 0.6807, + "step": 50103 + }, + { + "epoch": 1.28, + "learning_rate": 1.2778685244973539e-06, + "loss": 0.7227, + "step": 50104 + }, + { + "epoch": 1.28, + "learning_rate": 1.2778419436240626e-06, + "loss": 0.6191, + "step": 50105 + }, + { + "epoch": 1.28, + "learning_rate": 1.2778153625380403e-06, + "loss": 0.7598, + "step": 50106 + }, + { + "epoch": 1.28, + "learning_rate": 1.277788781239308e-06, + "loss": 0.7578, + "step": 50107 + }, + { + "epoch": 1.28, + "learning_rate": 1.2777621997278853e-06, + "loss": 0.5713, + "step": 50108 + }, + { + "epoch": 1.28, + "learning_rate": 1.277735618003793e-06, + "loss": 0.5518, + "step": 50109 + }, + { + "epoch": 1.28, + "learning_rate": 1.2777090360670511e-06, + "loss": 0.7539, + "step": 50110 + }, + { + "epoch": 1.28, + "learning_rate": 1.27768245391768e-06, + "loss": 0.8125, + "step": 50111 + }, + { + "epoch": 1.28, + "learning_rate": 1.2776558715557006e-06, + "loss": 0.6304, + "step": 50112 + }, + { + "epoch": 1.28, + "learning_rate": 1.2776292889811329e-06, + "loss": 0.7949, + "step": 50113 + }, + { + "epoch": 1.28, + "learning_rate": 1.277602706193997e-06, + "loss": 0.7241, + "step": 50114 + }, + { + "epoch": 1.28, + "learning_rate": 1.2775761231943133e-06, + "loss": 0.5693, + "step": 50115 + }, + { + "epoch": 1.28, + "learning_rate": 1.2775495399821026e-06, + "loss": 0.5967, + "step": 50116 + }, + { + "epoch": 1.28, + "learning_rate": 1.277522956557385e-06, + "loss": 0.7822, + "step": 50117 + }, + { + "epoch": 1.28, + "learning_rate": 1.2774963729201808e-06, + "loss": 0.5371, + "step": 50118 + }, + { + "epoch": 1.28, + "learning_rate": 1.2774697890705105e-06, + "loss": 0.7236, + "step": 50119 + }, + { + "epoch": 1.28, + "learning_rate": 1.277443205008394e-06, + "loss": 0.561, + "step": 50120 + }, + { + "epoch": 1.28, + "learning_rate": 1.2774166207338522e-06, + "loss": 0.6504, + "step": 50121 + }, + { + "epoch": 1.28, + "learning_rate": 1.2773900362469053e-06, + "loss": 0.6826, + "step": 50122 + }, + { + "epoch": 1.28, + "learning_rate": 1.2773634515475735e-06, + "loss": 0.5867, + "step": 50123 + }, + { + "epoch": 1.28, + "learning_rate": 1.2773368666358775e-06, + "loss": 0.6113, + "step": 50124 + }, + { + "epoch": 1.28, + "learning_rate": 1.277310281511837e-06, + "loss": 0.7539, + "step": 50125 + }, + { + "epoch": 1.28, + "learning_rate": 1.277283696175473e-06, + "loss": 0.6289, + "step": 50126 + }, + { + "epoch": 1.28, + "learning_rate": 1.2772571106268057e-06, + "loss": 0.5815, + "step": 50127 + }, + { + "epoch": 1.28, + "learning_rate": 1.2772305248658553e-06, + "loss": 0.6099, + "step": 50128 + }, + { + "epoch": 1.28, + "learning_rate": 1.2772039388926422e-06, + "loss": 0.5891, + "step": 50129 + }, + { + "epoch": 1.28, + "learning_rate": 1.2771773527071866e-06, + "loss": 0.7188, + "step": 50130 + }, + { + "epoch": 1.28, + "learning_rate": 1.2771507663095094e-06, + "loss": 0.6128, + "step": 50131 + }, + { + "epoch": 1.28, + "learning_rate": 1.2771241796996303e-06, + "loss": 0.6304, + "step": 50132 + }, + { + "epoch": 1.28, + "learning_rate": 1.2770975928775704e-06, + "loss": 0.6904, + "step": 50133 + }, + { + "epoch": 1.28, + "learning_rate": 1.2770710058433492e-06, + "loss": 0.7842, + "step": 50134 + }, + { + "epoch": 1.28, + "learning_rate": 1.2770444185969878e-06, + "loss": 0.7861, + "step": 50135 + }, + { + "epoch": 1.29, + "learning_rate": 1.2770178311385058e-06, + "loss": 0.7988, + "step": 50136 + }, + { + "epoch": 1.29, + "learning_rate": 1.2769912434679244e-06, + "loss": 0.8018, + "step": 50137 + }, + { + "epoch": 1.29, + "learning_rate": 1.2769646555852634e-06, + "loss": 0.7393, + "step": 50138 + }, + { + "epoch": 1.29, + "learning_rate": 1.2769380674905432e-06, + "loss": 0.5547, + "step": 50139 + }, + { + "epoch": 1.29, + "learning_rate": 1.2769114791837842e-06, + "loss": 0.7412, + "step": 50140 + }, + { + "epoch": 1.29, + "learning_rate": 1.2768848906650069e-06, + "loss": 0.6223, + "step": 50141 + }, + { + "epoch": 1.29, + "learning_rate": 1.2768583019342316e-06, + "loss": 0.5791, + "step": 50142 + }, + { + "epoch": 1.29, + "learning_rate": 1.2768317129914788e-06, + "loss": 0.6196, + "step": 50143 + }, + { + "epoch": 1.29, + "learning_rate": 1.2768051238367682e-06, + "loss": 0.7148, + "step": 50144 + }, + { + "epoch": 1.29, + "learning_rate": 1.2767785344701211e-06, + "loss": 0.627, + "step": 50145 + }, + { + "epoch": 1.29, + "learning_rate": 1.2767519448915572e-06, + "loss": 0.6008, + "step": 50146 + }, + { + "epoch": 1.29, + "learning_rate": 1.2767253551010972e-06, + "loss": 0.7031, + "step": 50147 + }, + { + "epoch": 1.29, + "learning_rate": 1.2766987650987614e-06, + "loss": 0.5928, + "step": 50148 + }, + { + "epoch": 1.29, + "learning_rate": 1.2766721748845697e-06, + "loss": 0.8047, + "step": 50149 + }, + { + "epoch": 1.29, + "learning_rate": 1.2766455844585431e-06, + "loss": 0.8359, + "step": 50150 + }, + { + "epoch": 1.29, + "learning_rate": 1.2766189938207016e-06, + "loss": 0.8164, + "step": 50151 + }, + { + "epoch": 1.29, + "learning_rate": 1.2765924029710658e-06, + "loss": 0.665, + "step": 50152 + }, + { + "epoch": 1.29, + "learning_rate": 1.2765658119096555e-06, + "loss": 0.707, + "step": 50153 + }, + { + "epoch": 1.29, + "learning_rate": 1.2765392206364923e-06, + "loss": 0.606, + "step": 50154 + }, + { + "epoch": 1.29, + "learning_rate": 1.276512629151595e-06, + "loss": 0.438, + "step": 50155 + }, + { + "epoch": 1.29, + "learning_rate": 1.2764860374549848e-06, + "loss": 0.7949, + "step": 50156 + }, + { + "epoch": 1.29, + "learning_rate": 1.2764594455466822e-06, + "loss": 0.6123, + "step": 50157 + }, + { + "epoch": 1.29, + "learning_rate": 1.2764328534267073e-06, + "loss": 0.7568, + "step": 50158 + }, + { + "epoch": 1.29, + "learning_rate": 1.2764062610950802e-06, + "loss": 0.6143, + "step": 50159 + }, + { + "epoch": 1.29, + "learning_rate": 1.2763796685518218e-06, + "loss": 0.6641, + "step": 50160 + }, + { + "epoch": 1.29, + "learning_rate": 1.276353075796952e-06, + "loss": 0.8994, + "step": 50161 + }, + { + "epoch": 1.29, + "learning_rate": 1.2763264828304915e-06, + "loss": 0.6277, + "step": 50162 + }, + { + "epoch": 1.29, + "learning_rate": 1.2762998896524605e-06, + "loss": 0.6616, + "step": 50163 + }, + { + "epoch": 1.29, + "learning_rate": 1.2762732962628795e-06, + "loss": 0.7451, + "step": 50164 + }, + { + "epoch": 1.29, + "learning_rate": 1.2762467026617682e-06, + "loss": 0.4626, + "step": 50165 + }, + { + "epoch": 1.29, + "learning_rate": 1.2762201088491483e-06, + "loss": 0.4655, + "step": 50166 + }, + { + "epoch": 1.29, + "learning_rate": 1.2761935148250388e-06, + "loss": 0.7285, + "step": 50167 + }, + { + "epoch": 1.29, + "learning_rate": 1.276166920589461e-06, + "loss": 0.4392, + "step": 50168 + }, + { + "epoch": 1.29, + "learning_rate": 1.2761403261424344e-06, + "loss": 0.7871, + "step": 50169 + }, + { + "epoch": 1.29, + "learning_rate": 1.2761137314839803e-06, + "loss": 0.6079, + "step": 50170 + }, + { + "epoch": 1.29, + "learning_rate": 1.2760871366141182e-06, + "loss": 0.8057, + "step": 50171 + }, + { + "epoch": 1.29, + "learning_rate": 1.2760605415328691e-06, + "loss": 0.5923, + "step": 50172 + }, + { + "epoch": 1.29, + "learning_rate": 1.276033946240253e-06, + "loss": 0.8232, + "step": 50173 + }, + { + "epoch": 1.29, + "learning_rate": 1.2760073507362907e-06, + "loss": 0.7383, + "step": 50174 + }, + { + "epoch": 1.29, + "learning_rate": 1.2759807550210023e-06, + "loss": 0.7285, + "step": 50175 + }, + { + "epoch": 1.29, + "learning_rate": 1.2759541590944075e-06, + "loss": 0.7734, + "step": 50176 + }, + { + "epoch": 1.29, + "learning_rate": 1.2759275629565282e-06, + "loss": 0.7158, + "step": 50177 + }, + { + "epoch": 1.29, + "learning_rate": 1.2759009666073832e-06, + "loss": 0.5654, + "step": 50178 + }, + { + "epoch": 1.29, + "learning_rate": 1.2758743700469937e-06, + "loss": 0.5413, + "step": 50179 + }, + { + "epoch": 1.29, + "learning_rate": 1.2758477732753798e-06, + "loss": 0.6724, + "step": 50180 + }, + { + "epoch": 1.29, + "learning_rate": 1.275821176292562e-06, + "loss": 0.6484, + "step": 50181 + }, + { + "epoch": 1.29, + "learning_rate": 1.2757945790985606e-06, + "loss": 0.8008, + "step": 50182 + }, + { + "epoch": 1.29, + "learning_rate": 1.2757679816933961e-06, + "loss": 0.6543, + "step": 50183 + }, + { + "epoch": 1.29, + "learning_rate": 1.2757413840770886e-06, + "loss": 0.75, + "step": 50184 + }, + { + "epoch": 1.29, + "learning_rate": 1.2757147862496587e-06, + "loss": 0.6025, + "step": 50185 + }, + { + "epoch": 1.29, + "learning_rate": 1.2756881882111264e-06, + "loss": 0.7979, + "step": 50186 + }, + { + "epoch": 1.29, + "learning_rate": 1.2756615899615129e-06, + "loss": 0.8086, + "step": 50187 + }, + { + "epoch": 1.29, + "learning_rate": 1.2756349915008376e-06, + "loss": 0.7832, + "step": 50188 + }, + { + "epoch": 1.29, + "learning_rate": 1.2756083928291212e-06, + "loss": 0.6226, + "step": 50189 + }, + { + "epoch": 1.29, + "learning_rate": 1.275581793946384e-06, + "loss": 0.5832, + "step": 50190 + }, + { + "epoch": 1.29, + "learning_rate": 1.2755551948526469e-06, + "loss": 0.5776, + "step": 50191 + }, + { + "epoch": 1.29, + "learning_rate": 1.2755285955479295e-06, + "loss": 0.6484, + "step": 50192 + }, + { + "epoch": 1.29, + "learning_rate": 1.2755019960322528e-06, + "loss": 0.644, + "step": 50193 + }, + { + "epoch": 1.29, + "learning_rate": 1.2754753963056368e-06, + "loss": 0.7744, + "step": 50194 + }, + { + "epoch": 1.29, + "learning_rate": 1.275448796368102e-06, + "loss": 0.6396, + "step": 50195 + }, + { + "epoch": 1.29, + "learning_rate": 1.2754221962196684e-06, + "loss": 0.6523, + "step": 50196 + }, + { + "epoch": 1.29, + "learning_rate": 1.275395595860357e-06, + "loss": 0.668, + "step": 50197 + }, + { + "epoch": 1.29, + "learning_rate": 1.2753689952901877e-06, + "loss": 0.6143, + "step": 50198 + }, + { + "epoch": 1.29, + "learning_rate": 1.2753423945091813e-06, + "loss": 0.7588, + "step": 50199 + }, + { + "epoch": 1.29, + "learning_rate": 1.2753157935173577e-06, + "loss": 0.5815, + "step": 50200 + }, + { + "epoch": 1.29, + "learning_rate": 1.2752891923147374e-06, + "loss": 0.6211, + "step": 50201 + }, + { + "epoch": 1.29, + "learning_rate": 1.275262590901341e-06, + "loss": 0.7393, + "step": 50202 + }, + { + "epoch": 1.29, + "learning_rate": 1.2752359892771884e-06, + "loss": 0.6074, + "step": 50203 + }, + { + "epoch": 1.29, + "learning_rate": 1.2752093874423006e-06, + "loss": 0.793, + "step": 50204 + }, + { + "epoch": 1.29, + "learning_rate": 1.2751827853966975e-06, + "loss": 0.5811, + "step": 50205 + }, + { + "epoch": 1.29, + "learning_rate": 1.2751561831403994e-06, + "loss": 0.7285, + "step": 50206 + }, + { + "epoch": 1.29, + "learning_rate": 1.2751295806734272e-06, + "loss": 0.6748, + "step": 50207 + }, + { + "epoch": 1.29, + "learning_rate": 1.2751029779958007e-06, + "loss": 0.5376, + "step": 50208 + }, + { + "epoch": 1.29, + "learning_rate": 1.2750763751075404e-06, + "loss": 0.6631, + "step": 50209 + }, + { + "epoch": 1.29, + "learning_rate": 1.275049772008667e-06, + "loss": 0.7559, + "step": 50210 + }, + { + "epoch": 1.29, + "learning_rate": 1.2750231686992003e-06, + "loss": 0.7109, + "step": 50211 + }, + { + "epoch": 1.29, + "learning_rate": 1.2749965651791617e-06, + "loss": 0.6816, + "step": 50212 + }, + { + "epoch": 1.29, + "learning_rate": 1.2749699614485703e-06, + "loss": 0.4856, + "step": 50213 + }, + { + "epoch": 1.29, + "learning_rate": 1.2749433575074474e-06, + "loss": 0.5747, + "step": 50214 + }, + { + "epoch": 1.29, + "learning_rate": 1.2749167533558125e-06, + "loss": 0.5449, + "step": 50215 + }, + { + "epoch": 1.29, + "learning_rate": 1.2748901489936867e-06, + "loss": 0.6548, + "step": 50216 + }, + { + "epoch": 1.29, + "learning_rate": 1.2748635444210905e-06, + "loss": 0.7617, + "step": 50217 + }, + { + "epoch": 1.29, + "learning_rate": 1.2748369396380434e-06, + "loss": 0.6963, + "step": 50218 + }, + { + "epoch": 1.29, + "learning_rate": 1.2748103346445667e-06, + "loss": 0.7412, + "step": 50219 + }, + { + "epoch": 1.29, + "learning_rate": 1.2747837294406801e-06, + "loss": 0.6528, + "step": 50220 + }, + { + "epoch": 1.29, + "learning_rate": 1.2747571240264043e-06, + "loss": 0.603, + "step": 50221 + }, + { + "epoch": 1.29, + "learning_rate": 1.2747305184017598e-06, + "loss": 0.6704, + "step": 50222 + }, + { + "epoch": 1.29, + "learning_rate": 1.2747039125667667e-06, + "loss": 0.5771, + "step": 50223 + }, + { + "epoch": 1.29, + "learning_rate": 1.274677306521445e-06, + "loss": 0.7627, + "step": 50224 + }, + { + "epoch": 1.29, + "learning_rate": 1.2746507002658162e-06, + "loss": 0.7588, + "step": 50225 + }, + { + "epoch": 1.29, + "learning_rate": 1.2746240937998995e-06, + "loss": 0.647, + "step": 50226 + }, + { + "epoch": 1.29, + "learning_rate": 1.274597487123716e-06, + "loss": 0.6602, + "step": 50227 + }, + { + "epoch": 1.29, + "learning_rate": 1.2745708802372858e-06, + "loss": 0.5898, + "step": 50228 + }, + { + "epoch": 1.29, + "learning_rate": 1.2745442731406293e-06, + "loss": 0.6807, + "step": 50229 + }, + { + "epoch": 1.29, + "learning_rate": 1.2745176658337666e-06, + "loss": 0.8564, + "step": 50230 + }, + { + "epoch": 1.29, + "learning_rate": 1.2744910583167187e-06, + "loss": 0.6777, + "step": 50231 + }, + { + "epoch": 1.29, + "learning_rate": 1.2744644505895057e-06, + "loss": 0.8066, + "step": 50232 + }, + { + "epoch": 1.29, + "learning_rate": 1.2744378426521477e-06, + "loss": 0.425, + "step": 50233 + }, + { + "epoch": 1.29, + "learning_rate": 1.2744112345046651e-06, + "loss": 0.749, + "step": 50234 + }, + { + "epoch": 1.29, + "learning_rate": 1.2743846261470785e-06, + "loss": 0.467, + "step": 50235 + }, + { + "epoch": 1.29, + "learning_rate": 1.2743580175794081e-06, + "loss": 0.6533, + "step": 50236 + }, + { + "epoch": 1.29, + "learning_rate": 1.2743314088016748e-06, + "loss": 0.5273, + "step": 50237 + }, + { + "epoch": 1.29, + "learning_rate": 1.2743047998138985e-06, + "loss": 0.2727, + "step": 50238 + }, + { + "epoch": 1.29, + "learning_rate": 1.274278190616099e-06, + "loss": 0.5203, + "step": 50239 + }, + { + "epoch": 1.29, + "learning_rate": 1.2742515812082981e-06, + "loss": 0.7844, + "step": 50240 + }, + { + "epoch": 1.29, + "learning_rate": 1.274224971590515e-06, + "loss": 0.7002, + "step": 50241 + }, + { + "epoch": 1.29, + "learning_rate": 1.2741983617627704e-06, + "loss": 0.8262, + "step": 50242 + }, + { + "epoch": 1.29, + "learning_rate": 1.2741717517250847e-06, + "loss": 0.6978, + "step": 50243 + }, + { + "epoch": 1.29, + "learning_rate": 1.2741451414774786e-06, + "loss": 0.5404, + "step": 50244 + }, + { + "epoch": 1.29, + "learning_rate": 1.2741185310199718e-06, + "loss": 0.6904, + "step": 50245 + }, + { + "epoch": 1.29, + "learning_rate": 1.2740919203525852e-06, + "loss": 0.689, + "step": 50246 + }, + { + "epoch": 1.29, + "learning_rate": 1.2740653094753393e-06, + "loss": 0.7598, + "step": 50247 + }, + { + "epoch": 1.29, + "learning_rate": 1.2740386983882538e-06, + "loss": 0.8125, + "step": 50248 + }, + { + "epoch": 1.29, + "learning_rate": 1.2740120870913497e-06, + "loss": 0.708, + "step": 50249 + }, + { + "epoch": 1.29, + "learning_rate": 1.273985475584647e-06, + "loss": 0.6338, + "step": 50250 + }, + { + "epoch": 1.29, + "learning_rate": 1.2739588638681662e-06, + "loss": 0.5239, + "step": 50251 + }, + { + "epoch": 1.29, + "learning_rate": 1.273932251941928e-06, + "loss": 0.5146, + "step": 50252 + }, + { + "epoch": 1.29, + "learning_rate": 1.273905639805952e-06, + "loss": 0.4871, + "step": 50253 + }, + { + "epoch": 1.29, + "learning_rate": 1.2738790274602593e-06, + "loss": 0.748, + "step": 50254 + }, + { + "epoch": 1.29, + "learning_rate": 1.27385241490487e-06, + "loss": 0.5288, + "step": 50255 + }, + { + "epoch": 1.29, + "learning_rate": 1.2738258021398045e-06, + "loss": 0.5288, + "step": 50256 + }, + { + "epoch": 1.29, + "learning_rate": 1.2737991891650832e-06, + "loss": 0.6641, + "step": 50257 + }, + { + "epoch": 1.29, + "learning_rate": 1.2737725759807264e-06, + "loss": 0.644, + "step": 50258 + }, + { + "epoch": 1.29, + "learning_rate": 1.2737459625867546e-06, + "loss": 0.7871, + "step": 50259 + }, + { + "epoch": 1.29, + "learning_rate": 1.273719348983188e-06, + "loss": 0.709, + "step": 50260 + }, + { + "epoch": 1.29, + "learning_rate": 1.2736927351700471e-06, + "loss": 0.5037, + "step": 50261 + }, + { + "epoch": 1.29, + "learning_rate": 1.2736661211473522e-06, + "loss": 0.6592, + "step": 50262 + }, + { + "epoch": 1.29, + "learning_rate": 1.273639506915124e-06, + "loss": 0.4792, + "step": 50263 + }, + { + "epoch": 1.29, + "learning_rate": 1.2736128924733823e-06, + "loss": 0.6113, + "step": 50264 + }, + { + "epoch": 1.29, + "learning_rate": 1.273586277822148e-06, + "loss": 0.5505, + "step": 50265 + }, + { + "epoch": 1.29, + "learning_rate": 1.2735596629614408e-06, + "loss": 0.6406, + "step": 50266 + }, + { + "epoch": 1.29, + "learning_rate": 1.2735330478912825e-06, + "loss": 0.9561, + "step": 50267 + }, + { + "epoch": 1.29, + "learning_rate": 1.2735064326116918e-06, + "loss": 0.6631, + "step": 50268 + }, + { + "epoch": 1.29, + "learning_rate": 1.2734798171226899e-06, + "loss": 0.6074, + "step": 50269 + }, + { + "epoch": 1.29, + "learning_rate": 1.2734532014242971e-06, + "loss": 0.9258, + "step": 50270 + }, + { + "epoch": 1.29, + "learning_rate": 1.2734265855165338e-06, + "loss": 0.521, + "step": 50271 + }, + { + "epoch": 1.29, + "learning_rate": 1.2733999693994205e-06, + "loss": 0.5356, + "step": 50272 + }, + { + "epoch": 1.29, + "learning_rate": 1.2733733530729774e-06, + "loss": 0.5977, + "step": 50273 + }, + { + "epoch": 1.29, + "learning_rate": 1.2733467365372246e-06, + "loss": 0.541, + "step": 50274 + }, + { + "epoch": 1.29, + "learning_rate": 1.2733201197921829e-06, + "loss": 0.6543, + "step": 50275 + }, + { + "epoch": 1.29, + "learning_rate": 1.2732935028378724e-06, + "loss": 0.7158, + "step": 50276 + }, + { + "epoch": 1.29, + "learning_rate": 1.273266885674314e-06, + "loss": 0.501, + "step": 50277 + }, + { + "epoch": 1.29, + "learning_rate": 1.2732402683015273e-06, + "loss": 0.5537, + "step": 50278 + }, + { + "epoch": 1.29, + "learning_rate": 1.2732136507195334e-06, + "loss": 0.7241, + "step": 50279 + }, + { + "epoch": 1.29, + "learning_rate": 1.273187032928352e-06, + "loss": 0.7402, + "step": 50280 + }, + { + "epoch": 1.29, + "learning_rate": 1.2731604149280043e-06, + "loss": 0.5576, + "step": 50281 + }, + { + "epoch": 1.29, + "learning_rate": 1.2731337967185102e-06, + "loss": 0.7261, + "step": 50282 + }, + { + "epoch": 1.29, + "learning_rate": 1.2731071782998898e-06, + "loss": 0.6523, + "step": 50283 + }, + { + "epoch": 1.29, + "learning_rate": 1.2730805596721639e-06, + "loss": 0.6685, + "step": 50284 + }, + { + "epoch": 1.29, + "learning_rate": 1.2730539408353531e-06, + "loss": 0.4866, + "step": 50285 + }, + { + "epoch": 1.29, + "learning_rate": 1.2730273217894769e-06, + "loss": 0.6211, + "step": 50286 + }, + { + "epoch": 1.29, + "learning_rate": 1.2730007025345567e-06, + "loss": 0.6094, + "step": 50287 + }, + { + "epoch": 1.29, + "learning_rate": 1.272974083070612e-06, + "loss": 0.4849, + "step": 50288 + }, + { + "epoch": 1.29, + "learning_rate": 1.2729474633976638e-06, + "loss": 0.5723, + "step": 50289 + }, + { + "epoch": 1.29, + "learning_rate": 1.2729208435157323e-06, + "loss": 0.5791, + "step": 50290 + }, + { + "epoch": 1.29, + "learning_rate": 1.2728942234248379e-06, + "loss": 0.6064, + "step": 50291 + }, + { + "epoch": 1.29, + "learning_rate": 1.2728676031250011e-06, + "loss": 0.7139, + "step": 50292 + }, + { + "epoch": 1.29, + "learning_rate": 1.2728409826162418e-06, + "loss": 0.6675, + "step": 50293 + }, + { + "epoch": 1.29, + "learning_rate": 1.2728143618985808e-06, + "loss": 0.5735, + "step": 50294 + }, + { + "epoch": 1.29, + "learning_rate": 1.2727877409720384e-06, + "loss": 0.5576, + "step": 50295 + }, + { + "epoch": 1.29, + "learning_rate": 1.272761119836635e-06, + "loss": 0.7393, + "step": 50296 + }, + { + "epoch": 1.29, + "learning_rate": 1.2727344984923912e-06, + "loss": 0.729, + "step": 50297 + }, + { + "epoch": 1.29, + "learning_rate": 1.2727078769393266e-06, + "loss": 0.5591, + "step": 50298 + }, + { + "epoch": 1.29, + "learning_rate": 1.2726812551774625e-06, + "loss": 0.7017, + "step": 50299 + }, + { + "epoch": 1.29, + "learning_rate": 1.2726546332068187e-06, + "loss": 0.549, + "step": 50300 + }, + { + "epoch": 1.29, + "learning_rate": 1.2726280110274159e-06, + "loss": 0.6377, + "step": 50301 + }, + { + "epoch": 1.29, + "learning_rate": 1.2726013886392747e-06, + "loss": 0.5862, + "step": 50302 + }, + { + "epoch": 1.29, + "learning_rate": 1.2725747660424144e-06, + "loss": 0.7246, + "step": 50303 + }, + { + "epoch": 1.29, + "learning_rate": 1.2725481432368566e-06, + "loss": 0.6294, + "step": 50304 + }, + { + "epoch": 1.29, + "learning_rate": 1.2725215202226212e-06, + "loss": 0.5479, + "step": 50305 + }, + { + "epoch": 1.29, + "learning_rate": 1.2724948969997284e-06, + "loss": 0.7051, + "step": 50306 + }, + { + "epoch": 1.29, + "learning_rate": 1.2724682735681991e-06, + "loss": 0.6567, + "step": 50307 + }, + { + "epoch": 1.29, + "learning_rate": 1.272441649928053e-06, + "loss": 0.6758, + "step": 50308 + }, + { + "epoch": 1.29, + "learning_rate": 1.2724150260793113e-06, + "loss": 0.6484, + "step": 50309 + }, + { + "epoch": 1.29, + "learning_rate": 1.2723884020219936e-06, + "loss": 0.75, + "step": 50310 + }, + { + "epoch": 1.29, + "learning_rate": 1.2723617777561207e-06, + "loss": 0.6011, + "step": 50311 + }, + { + "epoch": 1.29, + "learning_rate": 1.272335153281713e-06, + "loss": 0.7168, + "step": 50312 + }, + { + "epoch": 1.29, + "learning_rate": 1.2723085285987908e-06, + "loss": 0.6963, + "step": 50313 + }, + { + "epoch": 1.29, + "learning_rate": 1.2722819037073741e-06, + "loss": 0.8184, + "step": 50314 + }, + { + "epoch": 1.29, + "learning_rate": 1.272255278607484e-06, + "loss": 0.6748, + "step": 50315 + }, + { + "epoch": 1.29, + "learning_rate": 1.2722286532991406e-06, + "loss": 0.488, + "step": 50316 + }, + { + "epoch": 1.29, + "learning_rate": 1.2722020277823644e-06, + "loss": 0.5146, + "step": 50317 + }, + { + "epoch": 1.29, + "learning_rate": 1.2721754020571754e-06, + "loss": 0.8145, + "step": 50318 + }, + { + "epoch": 1.29, + "learning_rate": 1.2721487761235944e-06, + "loss": 0.71, + "step": 50319 + }, + { + "epoch": 1.29, + "learning_rate": 1.272122149981641e-06, + "loss": 0.7407, + "step": 50320 + }, + { + "epoch": 1.29, + "learning_rate": 1.2720955236313367e-06, + "loss": 0.7139, + "step": 50321 + }, + { + "epoch": 1.29, + "learning_rate": 1.2720688970727015e-06, + "loss": 0.6748, + "step": 50322 + }, + { + "epoch": 1.29, + "learning_rate": 1.2720422703057553e-06, + "loss": 0.5571, + "step": 50323 + }, + { + "epoch": 1.29, + "learning_rate": 1.2720156433305188e-06, + "loss": 0.6006, + "step": 50324 + }, + { + "epoch": 1.29, + "learning_rate": 1.2719890161470125e-06, + "loss": 0.6592, + "step": 50325 + }, + { + "epoch": 1.29, + "learning_rate": 1.2719623887552567e-06, + "loss": 0.6091, + "step": 50326 + }, + { + "epoch": 1.29, + "learning_rate": 1.2719357611552722e-06, + "loss": 0.6099, + "step": 50327 + }, + { + "epoch": 1.29, + "learning_rate": 1.2719091333470786e-06, + "loss": 0.6963, + "step": 50328 + }, + { + "epoch": 1.29, + "learning_rate": 1.2718825053306965e-06, + "loss": 0.6172, + "step": 50329 + }, + { + "epoch": 1.29, + "learning_rate": 1.271855877106147e-06, + "loss": 0.6162, + "step": 50330 + }, + { + "epoch": 1.29, + "learning_rate": 1.2718292486734497e-06, + "loss": 0.4771, + "step": 50331 + }, + { + "epoch": 1.29, + "learning_rate": 1.2718026200326252e-06, + "loss": 0.6484, + "step": 50332 + }, + { + "epoch": 1.29, + "learning_rate": 1.271775991183694e-06, + "loss": 0.5708, + "step": 50333 + }, + { + "epoch": 1.29, + "learning_rate": 1.2717493621266765e-06, + "loss": 0.5317, + "step": 50334 + }, + { + "epoch": 1.29, + "learning_rate": 1.2717227328615927e-06, + "loss": 0.7061, + "step": 50335 + }, + { + "epoch": 1.29, + "learning_rate": 1.2716961033884635e-06, + "loss": 0.7227, + "step": 50336 + }, + { + "epoch": 1.29, + "learning_rate": 1.271669473707309e-06, + "loss": 0.7012, + "step": 50337 + }, + { + "epoch": 1.29, + "learning_rate": 1.2716428438181499e-06, + "loss": 0.5513, + "step": 50338 + }, + { + "epoch": 1.29, + "learning_rate": 1.271616213721006e-06, + "loss": 0.4846, + "step": 50339 + }, + { + "epoch": 1.29, + "learning_rate": 1.2715895834158985e-06, + "loss": 0.6299, + "step": 50340 + }, + { + "epoch": 1.29, + "learning_rate": 1.271562952902847e-06, + "loss": 0.668, + "step": 50341 + }, + { + "epoch": 1.29, + "learning_rate": 1.2715363221818727e-06, + "loss": 0.6558, + "step": 50342 + }, + { + "epoch": 1.29, + "learning_rate": 1.2715096912529951e-06, + "loss": 0.6304, + "step": 50343 + }, + { + "epoch": 1.29, + "learning_rate": 1.271483060116235e-06, + "loss": 0.5044, + "step": 50344 + }, + { + "epoch": 1.29, + "learning_rate": 1.2714564287716126e-06, + "loss": 0.7422, + "step": 50345 + }, + { + "epoch": 1.29, + "learning_rate": 1.271429797219149e-06, + "loss": 0.6357, + "step": 50346 + }, + { + "epoch": 1.29, + "learning_rate": 1.271403165458864e-06, + "loss": 0.6602, + "step": 50347 + }, + { + "epoch": 1.29, + "learning_rate": 1.271376533490778e-06, + "loss": 0.6309, + "step": 50348 + }, + { + "epoch": 1.29, + "learning_rate": 1.2713499013149115e-06, + "loss": 0.8652, + "step": 50349 + }, + { + "epoch": 1.29, + "learning_rate": 1.2713232689312845e-06, + "loss": 0.8281, + "step": 50350 + }, + { + "epoch": 1.29, + "learning_rate": 1.271296636339918e-06, + "loss": 0.4961, + "step": 50351 + }, + { + "epoch": 1.29, + "learning_rate": 1.2712700035408322e-06, + "loss": 0.6875, + "step": 50352 + }, + { + "epoch": 1.29, + "learning_rate": 1.2712433705340475e-06, + "loss": 0.6836, + "step": 50353 + }, + { + "epoch": 1.29, + "learning_rate": 1.2712167373195839e-06, + "loss": 0.6953, + "step": 50354 + }, + { + "epoch": 1.29, + "learning_rate": 1.2711901038974623e-06, + "loss": 0.7227, + "step": 50355 + }, + { + "epoch": 1.29, + "learning_rate": 1.271163470267703e-06, + "loss": 0.4905, + "step": 50356 + }, + { + "epoch": 1.29, + "learning_rate": 1.2711368364303266e-06, + "loss": 0.7676, + "step": 50357 + }, + { + "epoch": 1.29, + "learning_rate": 1.2711102023853525e-06, + "loss": 0.7134, + "step": 50358 + }, + { + "epoch": 1.29, + "learning_rate": 1.2710835681328022e-06, + "loss": 0.5762, + "step": 50359 + }, + { + "epoch": 1.29, + "learning_rate": 1.2710569336726955e-06, + "loss": 0.6899, + "step": 50360 + }, + { + "epoch": 1.29, + "learning_rate": 1.2710302990050533e-06, + "loss": 0.4231, + "step": 50361 + }, + { + "epoch": 1.29, + "learning_rate": 1.2710036641298954e-06, + "loss": 0.6895, + "step": 50362 + }, + { + "epoch": 1.29, + "learning_rate": 1.2709770290472426e-06, + "loss": 0.7725, + "step": 50363 + }, + { + "epoch": 1.29, + "learning_rate": 1.2709503937571146e-06, + "loss": 0.7656, + "step": 50364 + }, + { + "epoch": 1.29, + "learning_rate": 1.270923758259533e-06, + "loss": 0.5115, + "step": 50365 + }, + { + "epoch": 1.29, + "learning_rate": 1.270897122554517e-06, + "loss": 0.6685, + "step": 50366 + }, + { + "epoch": 1.29, + "learning_rate": 1.2708704866420883e-06, + "loss": 0.6689, + "step": 50367 + }, + { + "epoch": 1.29, + "learning_rate": 1.270843850522266e-06, + "loss": 0.4001, + "step": 50368 + }, + { + "epoch": 1.29, + "learning_rate": 1.270817214195071e-06, + "loss": 0.6978, + "step": 50369 + }, + { + "epoch": 1.29, + "learning_rate": 1.2707905776605237e-06, + "loss": 0.7207, + "step": 50370 + }, + { + "epoch": 1.29, + "learning_rate": 1.2707639409186445e-06, + "loss": 0.553, + "step": 50371 + }, + { + "epoch": 1.29, + "learning_rate": 1.270737303969454e-06, + "loss": 0.5249, + "step": 50372 + }, + { + "epoch": 1.29, + "learning_rate": 1.2707106668129722e-06, + "loss": 0.5806, + "step": 50373 + }, + { + "epoch": 1.29, + "learning_rate": 1.2706840294492198e-06, + "loss": 0.623, + "step": 50374 + }, + { + "epoch": 1.29, + "learning_rate": 1.2706573918782174e-06, + "loss": 0.6138, + "step": 50375 + }, + { + "epoch": 1.29, + "learning_rate": 1.2706307540999845e-06, + "loss": 0.7109, + "step": 50376 + }, + { + "epoch": 1.29, + "learning_rate": 1.2706041161145422e-06, + "loss": 0.8008, + "step": 50377 + }, + { + "epoch": 1.29, + "learning_rate": 1.2705774779219112e-06, + "loss": 0.5798, + "step": 50378 + }, + { + "epoch": 1.29, + "learning_rate": 1.270550839522111e-06, + "loss": 0.7646, + "step": 50379 + }, + { + "epoch": 1.29, + "learning_rate": 1.2705242009151626e-06, + "loss": 0.6523, + "step": 50380 + }, + { + "epoch": 1.29, + "learning_rate": 1.2704975621010862e-06, + "loss": 0.6475, + "step": 50381 + }, + { + "epoch": 1.29, + "learning_rate": 1.2704709230799023e-06, + "loss": 0.7061, + "step": 50382 + }, + { + "epoch": 1.29, + "learning_rate": 1.2704442838516314e-06, + "loss": 0.7705, + "step": 50383 + }, + { + "epoch": 1.29, + "learning_rate": 1.2704176444162938e-06, + "loss": 0.7368, + "step": 50384 + }, + { + "epoch": 1.29, + "learning_rate": 1.2703910047739094e-06, + "loss": 0.7715, + "step": 50385 + }, + { + "epoch": 1.29, + "learning_rate": 1.2703643649244995e-06, + "loss": 0.5881, + "step": 50386 + }, + { + "epoch": 1.29, + "learning_rate": 1.2703377248680838e-06, + "loss": 0.6338, + "step": 50387 + }, + { + "epoch": 1.29, + "learning_rate": 1.2703110846046832e-06, + "loss": 0.5913, + "step": 50388 + }, + { + "epoch": 1.29, + "learning_rate": 1.2702844441343172e-06, + "loss": 0.6562, + "step": 50389 + }, + { + "epoch": 1.29, + "learning_rate": 1.2702578034570076e-06, + "loss": 0.6123, + "step": 50390 + }, + { + "epoch": 1.29, + "learning_rate": 1.2702311625727735e-06, + "loss": 0.5123, + "step": 50391 + }, + { + "epoch": 1.29, + "learning_rate": 1.270204521481636e-06, + "loss": 0.5513, + "step": 50392 + }, + { + "epoch": 1.29, + "learning_rate": 1.2701778801836153e-06, + "loss": 0.5552, + "step": 50393 + }, + { + "epoch": 1.29, + "learning_rate": 1.2701512386787318e-06, + "loss": 0.4775, + "step": 50394 + }, + { + "epoch": 1.29, + "learning_rate": 1.270124596967006e-06, + "loss": 0.5536, + "step": 50395 + }, + { + "epoch": 1.29, + "learning_rate": 1.2700979550484583e-06, + "loss": 0.6445, + "step": 50396 + }, + { + "epoch": 1.29, + "learning_rate": 1.2700713129231088e-06, + "loss": 0.7598, + "step": 50397 + }, + { + "epoch": 1.29, + "learning_rate": 1.2700446705909782e-06, + "loss": 0.6099, + "step": 50398 + }, + { + "epoch": 1.29, + "learning_rate": 1.2700180280520867e-06, + "loss": 0.7256, + "step": 50399 + }, + { + "epoch": 1.29, + "learning_rate": 1.2699913853064547e-06, + "loss": 0.6919, + "step": 50400 + }, + { + "epoch": 1.29, + "learning_rate": 1.2699647423541033e-06, + "loss": 0.7024, + "step": 50401 + }, + { + "epoch": 1.29, + "learning_rate": 1.269938099195052e-06, + "loss": 0.6904, + "step": 50402 + }, + { + "epoch": 1.29, + "learning_rate": 1.2699114558293213e-06, + "loss": 0.6714, + "step": 50403 + }, + { + "epoch": 1.29, + "learning_rate": 1.269884812256932e-06, + "loss": 0.7119, + "step": 50404 + }, + { + "epoch": 1.29, + "learning_rate": 1.2698581684779044e-06, + "loss": 0.6611, + "step": 50405 + }, + { + "epoch": 1.29, + "learning_rate": 1.2698315244922586e-06, + "loss": 0.6216, + "step": 50406 + }, + { + "epoch": 1.29, + "learning_rate": 1.2698048803000155e-06, + "loss": 0.7988, + "step": 50407 + }, + { + "epoch": 1.29, + "learning_rate": 1.2697782359011948e-06, + "loss": 0.6475, + "step": 50408 + }, + { + "epoch": 1.29, + "learning_rate": 1.2697515912958177e-06, + "loss": 0.5466, + "step": 50409 + }, + { + "epoch": 1.29, + "learning_rate": 1.2697249464839037e-06, + "loss": 0.6455, + "step": 50410 + }, + { + "epoch": 1.29, + "learning_rate": 1.2696983014654742e-06, + "loss": 0.6797, + "step": 50411 + }, + { + "epoch": 1.29, + "learning_rate": 1.2696716562405489e-06, + "loss": 0.7764, + "step": 50412 + }, + { + "epoch": 1.29, + "learning_rate": 1.2696450108091484e-06, + "loss": 0.6494, + "step": 50413 + }, + { + "epoch": 1.29, + "learning_rate": 1.2696183651712933e-06, + "loss": 0.5178, + "step": 50414 + }, + { + "epoch": 1.29, + "learning_rate": 1.2695917193270039e-06, + "loss": 0.6738, + "step": 50415 + }, + { + "epoch": 1.29, + "learning_rate": 1.2695650732763002e-06, + "loss": 0.6074, + "step": 50416 + }, + { + "epoch": 1.29, + "learning_rate": 1.269538427019203e-06, + "loss": 0.6519, + "step": 50417 + }, + { + "epoch": 1.29, + "learning_rate": 1.2695117805557324e-06, + "loss": 0.7354, + "step": 50418 + }, + { + "epoch": 1.29, + "learning_rate": 1.2694851338859095e-06, + "loss": 0.4683, + "step": 50419 + }, + { + "epoch": 1.29, + "learning_rate": 1.269458487009754e-06, + "loss": 0.708, + "step": 50420 + }, + { + "epoch": 1.29, + "learning_rate": 1.2694318399272866e-06, + "loss": 0.7686, + "step": 50421 + }, + { + "epoch": 1.29, + "learning_rate": 1.2694051926385274e-06, + "loss": 0.7266, + "step": 50422 + }, + { + "epoch": 1.29, + "learning_rate": 1.269378545143497e-06, + "loss": 0.7666, + "step": 50423 + }, + { + "epoch": 1.29, + "learning_rate": 1.2693518974422162e-06, + "loss": 0.6621, + "step": 50424 + }, + { + "epoch": 1.29, + "learning_rate": 1.2693252495347047e-06, + "loss": 0.4697, + "step": 50425 + }, + { + "epoch": 1.29, + "learning_rate": 1.2692986014209836e-06, + "loss": 0.8301, + "step": 50426 + }, + { + "epoch": 1.29, + "learning_rate": 1.2692719531010727e-06, + "loss": 0.5586, + "step": 50427 + }, + { + "epoch": 1.29, + "learning_rate": 1.2692453045749927e-06, + "loss": 0.6865, + "step": 50428 + }, + { + "epoch": 1.29, + "learning_rate": 1.2692186558427638e-06, + "loss": 0.813, + "step": 50429 + }, + { + "epoch": 1.29, + "learning_rate": 1.2691920069044066e-06, + "loss": 0.7617, + "step": 50430 + }, + { + "epoch": 1.29, + "learning_rate": 1.2691653577599417e-06, + "loss": 0.7217, + "step": 50431 + }, + { + "epoch": 1.29, + "learning_rate": 1.269138708409389e-06, + "loss": 0.583, + "step": 50432 + }, + { + "epoch": 1.29, + "learning_rate": 1.2691120588527692e-06, + "loss": 0.5945, + "step": 50433 + }, + { + "epoch": 1.29, + "learning_rate": 1.269085409090103e-06, + "loss": 0.5693, + "step": 50434 + }, + { + "epoch": 1.29, + "learning_rate": 1.26905875912141e-06, + "loss": 0.5391, + "step": 50435 + }, + { + "epoch": 1.29, + "learning_rate": 1.2690321089467114e-06, + "loss": 0.7441, + "step": 50436 + }, + { + "epoch": 1.29, + "learning_rate": 1.2690054585660272e-06, + "loss": 0.6572, + "step": 50437 + }, + { + "epoch": 1.29, + "learning_rate": 1.268978807979378e-06, + "loss": 0.4841, + "step": 50438 + }, + { + "epoch": 1.29, + "learning_rate": 1.268952157186784e-06, + "loss": 0.7178, + "step": 50439 + }, + { + "epoch": 1.29, + "learning_rate": 1.2689255061882656e-06, + "loss": 0.611, + "step": 50440 + }, + { + "epoch": 1.29, + "learning_rate": 1.2688988549838433e-06, + "loss": 0.6768, + "step": 50441 + }, + { + "epoch": 1.29, + "learning_rate": 1.2688722035735376e-06, + "loss": 0.563, + "step": 50442 + }, + { + "epoch": 1.29, + "learning_rate": 1.268845551957369e-06, + "loss": 0.6445, + "step": 50443 + }, + { + "epoch": 1.29, + "learning_rate": 1.2688189001353571e-06, + "loss": 0.7061, + "step": 50444 + }, + { + "epoch": 1.29, + "learning_rate": 1.2687922481075235e-06, + "loss": 0.6445, + "step": 50445 + }, + { + "epoch": 1.29, + "learning_rate": 1.268765595873888e-06, + "loss": 0.6343, + "step": 50446 + }, + { + "epoch": 1.29, + "learning_rate": 1.2687389434344709e-06, + "loss": 0.6387, + "step": 50447 + }, + { + "epoch": 1.29, + "learning_rate": 1.2687122907892928e-06, + "loss": 0.626, + "step": 50448 + }, + { + "epoch": 1.29, + "learning_rate": 1.268685637938374e-06, + "loss": 0.5562, + "step": 50449 + }, + { + "epoch": 1.29, + "learning_rate": 1.268658984881735e-06, + "loss": 0.6357, + "step": 50450 + }, + { + "epoch": 1.29, + "learning_rate": 1.2686323316193963e-06, + "loss": 0.5608, + "step": 50451 + }, + { + "epoch": 1.29, + "learning_rate": 1.2686056781513778e-06, + "loss": 0.6572, + "step": 50452 + }, + { + "epoch": 1.29, + "learning_rate": 1.2685790244777007e-06, + "loss": 0.6545, + "step": 50453 + }, + { + "epoch": 1.29, + "learning_rate": 1.2685523705983846e-06, + "loss": 0.5879, + "step": 50454 + }, + { + "epoch": 1.29, + "learning_rate": 1.2685257165134507e-06, + "loss": 0.4255, + "step": 50455 + }, + { + "epoch": 1.29, + "learning_rate": 1.2684990622229187e-06, + "loss": 0.5488, + "step": 50456 + }, + { + "epoch": 1.29, + "learning_rate": 1.2684724077268097e-06, + "loss": 0.7637, + "step": 50457 + }, + { + "epoch": 1.29, + "learning_rate": 1.2684457530251432e-06, + "loss": 0.613, + "step": 50458 + }, + { + "epoch": 1.29, + "learning_rate": 1.2684190981179403e-06, + "loss": 0.7715, + "step": 50459 + }, + { + "epoch": 1.29, + "learning_rate": 1.2683924430052213e-06, + "loss": 0.5693, + "step": 50460 + }, + { + "epoch": 1.29, + "learning_rate": 1.2683657876870067e-06, + "loss": 0.6897, + "step": 50461 + }, + { + "epoch": 1.29, + "learning_rate": 1.2683391321633165e-06, + "loss": 0.5952, + "step": 50462 + }, + { + "epoch": 1.29, + "learning_rate": 1.2683124764341714e-06, + "loss": 0.5889, + "step": 50463 + }, + { + "epoch": 1.29, + "learning_rate": 1.268285820499592e-06, + "loss": 0.7266, + "step": 50464 + }, + { + "epoch": 1.29, + "learning_rate": 1.2682591643595984e-06, + "loss": 0.5304, + "step": 50465 + }, + { + "epoch": 1.29, + "learning_rate": 1.268232508014211e-06, + "loss": 0.6416, + "step": 50466 + }, + { + "epoch": 1.29, + "learning_rate": 1.2682058514634504e-06, + "loss": 0.8398, + "step": 50467 + }, + { + "epoch": 1.29, + "learning_rate": 1.2681791947073368e-06, + "loss": 0.5999, + "step": 50468 + }, + { + "epoch": 1.29, + "learning_rate": 1.2681525377458905e-06, + "loss": 0.7275, + "step": 50469 + }, + { + "epoch": 1.29, + "learning_rate": 1.2681258805791326e-06, + "loss": 0.5732, + "step": 50470 + }, + { + "epoch": 1.29, + "learning_rate": 1.2680992232070828e-06, + "loss": 0.8291, + "step": 50471 + }, + { + "epoch": 1.29, + "learning_rate": 1.2680725656297619e-06, + "loss": 0.4656, + "step": 50472 + }, + { + "epoch": 1.29, + "learning_rate": 1.26804590784719e-06, + "loss": 0.6724, + "step": 50473 + }, + { + "epoch": 1.29, + "learning_rate": 1.2680192498593878e-06, + "loss": 0.543, + "step": 50474 + }, + { + "epoch": 1.29, + "learning_rate": 1.2679925916663753e-06, + "loss": 0.6133, + "step": 50475 + }, + { + "epoch": 1.29, + "learning_rate": 1.2679659332681738e-06, + "loss": 0.6353, + "step": 50476 + }, + { + "epoch": 1.29, + "learning_rate": 1.2679392746648026e-06, + "loss": 0.5774, + "step": 50477 + }, + { + "epoch": 1.29, + "learning_rate": 1.2679126158562826e-06, + "loss": 0.4004, + "step": 50478 + }, + { + "epoch": 1.29, + "learning_rate": 1.2678859568426344e-06, + "loss": 0.5854, + "step": 50479 + }, + { + "epoch": 1.29, + "learning_rate": 1.2678592976238783e-06, + "loss": 0.6924, + "step": 50480 + }, + { + "epoch": 1.29, + "learning_rate": 1.2678326382000346e-06, + "loss": 0.6494, + "step": 50481 + }, + { + "epoch": 1.29, + "learning_rate": 1.2678059785711237e-06, + "loss": 0.6128, + "step": 50482 + }, + { + "epoch": 1.29, + "learning_rate": 1.267779318737166e-06, + "loss": 0.5361, + "step": 50483 + }, + { + "epoch": 1.29, + "learning_rate": 1.2677526586981821e-06, + "loss": 0.6777, + "step": 50484 + }, + { + "epoch": 1.29, + "learning_rate": 1.2677259984541922e-06, + "loss": 0.7295, + "step": 50485 + }, + { + "epoch": 1.29, + "learning_rate": 1.267699338005217e-06, + "loss": 0.6387, + "step": 50486 + }, + { + "epoch": 1.29, + "learning_rate": 1.2676726773512767e-06, + "loss": 0.7129, + "step": 50487 + }, + { + "epoch": 1.29, + "learning_rate": 1.2676460164923915e-06, + "loss": 0.8672, + "step": 50488 + }, + { + "epoch": 1.29, + "learning_rate": 1.2676193554285823e-06, + "loss": 0.6484, + "step": 50489 + }, + { + "epoch": 1.29, + "learning_rate": 1.2675926941598691e-06, + "loss": 0.6982, + "step": 50490 + }, + { + "epoch": 1.29, + "learning_rate": 1.2675660326862726e-06, + "loss": 0.6152, + "step": 50491 + }, + { + "epoch": 1.29, + "learning_rate": 1.267539371007813e-06, + "loss": 0.7144, + "step": 50492 + }, + { + "epoch": 1.29, + "learning_rate": 1.267512709124511e-06, + "loss": 0.6748, + "step": 50493 + }, + { + "epoch": 1.29, + "learning_rate": 1.2674860470363867e-06, + "loss": 0.4336, + "step": 50494 + }, + { + "epoch": 1.29, + "learning_rate": 1.2674593847434607e-06, + "loss": 0.7725, + "step": 50495 + }, + { + "epoch": 1.29, + "learning_rate": 1.2674327222457533e-06, + "loss": 0.7998, + "step": 50496 + }, + { + "epoch": 1.29, + "learning_rate": 1.267406059543285e-06, + "loss": 0.6738, + "step": 50497 + }, + { + "epoch": 1.29, + "learning_rate": 1.267379396636076e-06, + "loss": 0.5049, + "step": 50498 + }, + { + "epoch": 1.29, + "learning_rate": 1.267352733524147e-06, + "loss": 0.7754, + "step": 50499 + }, + { + "epoch": 1.29, + "learning_rate": 1.267326070207518e-06, + "loss": 0.645, + "step": 50500 + }, + { + "epoch": 1.29, + "learning_rate": 1.2672994066862103e-06, + "loss": 0.584, + "step": 50501 + }, + { + "epoch": 1.29, + "learning_rate": 1.2672727429602435e-06, + "loss": 0.5985, + "step": 50502 + }, + { + "epoch": 1.29, + "learning_rate": 1.2672460790296382e-06, + "loss": 0.645, + "step": 50503 + }, + { + "epoch": 1.29, + "learning_rate": 1.2672194148944147e-06, + "loss": 0.8408, + "step": 50504 + }, + { + "epoch": 1.29, + "learning_rate": 1.2671927505545938e-06, + "loss": 0.6001, + "step": 50505 + }, + { + "epoch": 1.29, + "learning_rate": 1.2671660860101959e-06, + "loss": 0.5146, + "step": 50506 + }, + { + "epoch": 1.29, + "learning_rate": 1.2671394212612407e-06, + "loss": 0.5103, + "step": 50507 + }, + { + "epoch": 1.29, + "learning_rate": 1.2671127563077493e-06, + "loss": 0.7236, + "step": 50508 + }, + { + "epoch": 1.29, + "learning_rate": 1.2670860911497418e-06, + "loss": 0.7783, + "step": 50509 + }, + { + "epoch": 1.29, + "learning_rate": 1.2670594257872394e-06, + "loss": 0.5986, + "step": 50510 + }, + { + "epoch": 1.29, + "learning_rate": 1.2670327602202613e-06, + "loss": 0.6245, + "step": 50511 + }, + { + "epoch": 1.29, + "learning_rate": 1.2670060944488288e-06, + "loss": 0.5947, + "step": 50512 + }, + { + "epoch": 1.29, + "learning_rate": 1.2669794284729616e-06, + "loss": 0.7363, + "step": 50513 + }, + { + "epoch": 1.29, + "learning_rate": 1.266952762292681e-06, + "loss": 0.7266, + "step": 50514 + }, + { + "epoch": 1.29, + "learning_rate": 1.2669260959080066e-06, + "loss": 0.7725, + "step": 50515 + }, + { + "epoch": 1.29, + "learning_rate": 1.2668994293189594e-06, + "loss": 0.7549, + "step": 50516 + }, + { + "epoch": 1.29, + "learning_rate": 1.2668727625255596e-06, + "loss": 0.4727, + "step": 50517 + }, + { + "epoch": 1.29, + "learning_rate": 1.2668460955278274e-06, + "loss": 0.7236, + "step": 50518 + }, + { + "epoch": 1.29, + "learning_rate": 1.2668194283257833e-06, + "loss": 0.792, + "step": 50519 + }, + { + "epoch": 1.29, + "learning_rate": 1.2667927609194482e-06, + "loss": 0.7363, + "step": 50520 + }, + { + "epoch": 1.29, + "learning_rate": 1.266766093308842e-06, + "loss": 0.5232, + "step": 50521 + }, + { + "epoch": 1.29, + "learning_rate": 1.2667394254939854e-06, + "loss": 0.4951, + "step": 50522 + }, + { + "epoch": 1.29, + "learning_rate": 1.2667127574748984e-06, + "loss": 0.6201, + "step": 50523 + }, + { + "epoch": 1.29, + "learning_rate": 1.2666860892516017e-06, + "loss": 0.7017, + "step": 50524 + }, + { + "epoch": 1.29, + "learning_rate": 1.2666594208241159e-06, + "loss": 0.7891, + "step": 50525 + }, + { + "epoch": 1.3, + "learning_rate": 1.2666327521924612e-06, + "loss": 0.751, + "step": 50526 + }, + { + "epoch": 1.3, + "learning_rate": 1.2666060833566583e-06, + "loss": 0.6255, + "step": 50527 + }, + { + "epoch": 1.3, + "learning_rate": 1.2665794143167272e-06, + "loss": 0.6895, + "step": 50528 + }, + { + "epoch": 1.3, + "learning_rate": 1.2665527450726882e-06, + "loss": 0.5703, + "step": 50529 + }, + { + "epoch": 1.3, + "learning_rate": 1.2665260756245624e-06, + "loss": 0.6729, + "step": 50530 + }, + { + "epoch": 1.3, + "learning_rate": 1.2664994059723696e-06, + "loss": 0.4368, + "step": 50531 + }, + { + "epoch": 1.3, + "learning_rate": 1.2664727361161304e-06, + "loss": 0.7285, + "step": 50532 + }, + { + "epoch": 1.3, + "learning_rate": 1.2664460660558657e-06, + "loss": 0.624, + "step": 50533 + }, + { + "epoch": 1.3, + "learning_rate": 1.2664193957915949e-06, + "loss": 0.668, + "step": 50534 + }, + { + "epoch": 1.3, + "learning_rate": 1.2663927253233398e-06, + "loss": 0.5796, + "step": 50535 + }, + { + "epoch": 1.3, + "learning_rate": 1.2663660546511195e-06, + "loss": 0.6318, + "step": 50536 + }, + { + "epoch": 1.3, + "learning_rate": 1.2663393837749552e-06, + "loss": 0.6768, + "step": 50537 + }, + { + "epoch": 1.3, + "learning_rate": 1.2663127126948667e-06, + "loss": 0.3779, + "step": 50538 + }, + { + "epoch": 1.3, + "learning_rate": 1.266286041410875e-06, + "loss": 0.6992, + "step": 50539 + }, + { + "epoch": 1.3, + "learning_rate": 1.2662593699230005e-06, + "loss": 0.6855, + "step": 50540 + }, + { + "epoch": 1.3, + "learning_rate": 1.2662326982312634e-06, + "loss": 0.5371, + "step": 50541 + }, + { + "epoch": 1.3, + "learning_rate": 1.266206026335684e-06, + "loss": 0.5234, + "step": 50542 + }, + { + "epoch": 1.3, + "learning_rate": 1.2661793542362831e-06, + "loss": 0.6814, + "step": 50543 + }, + { + "epoch": 1.3, + "learning_rate": 1.2661526819330805e-06, + "loss": 0.7637, + "step": 50544 + }, + { + "epoch": 1.3, + "learning_rate": 1.2661260094260974e-06, + "loss": 0.6348, + "step": 50545 + }, + { + "epoch": 1.3, + "learning_rate": 1.2660993367153538e-06, + "loss": 0.5022, + "step": 50546 + }, + { + "epoch": 1.3, + "learning_rate": 1.2660726638008702e-06, + "loss": 0.4722, + "step": 50547 + }, + { + "epoch": 1.3, + "learning_rate": 1.2660459906826668e-06, + "loss": 0.7324, + "step": 50548 + }, + { + "epoch": 1.3, + "learning_rate": 1.2660193173607644e-06, + "loss": 0.6797, + "step": 50549 + }, + { + "epoch": 1.3, + "learning_rate": 1.265992643835183e-06, + "loss": 0.8184, + "step": 50550 + }, + { + "epoch": 1.3, + "learning_rate": 1.2659659701059435e-06, + "loss": 0.6025, + "step": 50551 + }, + { + "epoch": 1.3, + "learning_rate": 1.2659392961730663e-06, + "loss": 0.4937, + "step": 50552 + }, + { + "epoch": 1.3, + "learning_rate": 1.265912622036571e-06, + "loss": 0.4854, + "step": 50553 + }, + { + "epoch": 1.3, + "learning_rate": 1.265885947696479e-06, + "loss": 0.7588, + "step": 50554 + }, + { + "epoch": 1.3, + "learning_rate": 1.2658592731528102e-06, + "loss": 0.7354, + "step": 50555 + }, + { + "epoch": 1.3, + "learning_rate": 1.2658325984055855e-06, + "loss": 0.7129, + "step": 50556 + }, + { + "epoch": 1.3, + "learning_rate": 1.265805923454825e-06, + "loss": 0.7383, + "step": 50557 + }, + { + "epoch": 1.3, + "learning_rate": 1.2657792483005488e-06, + "loss": 0.6274, + "step": 50558 + }, + { + "epoch": 1.3, + "learning_rate": 1.2657525729427777e-06, + "loss": 0.6807, + "step": 50559 + }, + { + "epoch": 1.3, + "learning_rate": 1.265725897381532e-06, + "loss": 0.751, + "step": 50560 + }, + { + "epoch": 1.3, + "learning_rate": 1.2656992216168325e-06, + "loss": 0.6416, + "step": 50561 + }, + { + "epoch": 1.3, + "learning_rate": 1.2656725456486994e-06, + "loss": 0.5779, + "step": 50562 + }, + { + "epoch": 1.3, + "learning_rate": 1.2656458694771526e-06, + "loss": 0.5469, + "step": 50563 + }, + { + "epoch": 1.3, + "learning_rate": 1.2656191931022132e-06, + "loss": 0.5129, + "step": 50564 + }, + { + "epoch": 1.3, + "learning_rate": 1.2655925165239013e-06, + "loss": 0.7441, + "step": 50565 + }, + { + "epoch": 1.3, + "learning_rate": 1.2655658397422377e-06, + "loss": 0.8076, + "step": 50566 + }, + { + "epoch": 1.3, + "learning_rate": 1.2655391627572423e-06, + "loss": 0.6074, + "step": 50567 + }, + { + "epoch": 1.3, + "learning_rate": 1.2655124855689358e-06, + "loss": 0.6665, + "step": 50568 + }, + { + "epoch": 1.3, + "learning_rate": 1.2654858081773388e-06, + "loss": 0.5918, + "step": 50569 + }, + { + "epoch": 1.3, + "learning_rate": 1.2654591305824713e-06, + "loss": 0.6177, + "step": 50570 + }, + { + "epoch": 1.3, + "learning_rate": 1.265432452784354e-06, + "loss": 0.5288, + "step": 50571 + }, + { + "epoch": 1.3, + "learning_rate": 1.2654057747830072e-06, + "loss": 0.7119, + "step": 50572 + }, + { + "epoch": 1.3, + "learning_rate": 1.2653790965784517e-06, + "loss": 0.3145, + "step": 50573 + }, + { + "epoch": 1.3, + "learning_rate": 1.2653524181707074e-06, + "loss": 0.5366, + "step": 50574 + }, + { + "epoch": 1.3, + "learning_rate": 1.2653257395597946e-06, + "loss": 0.7266, + "step": 50575 + }, + { + "epoch": 1.3, + "learning_rate": 1.2652990607457348e-06, + "loss": 0.6514, + "step": 50576 + }, + { + "epoch": 1.3, + "learning_rate": 1.2652723817285473e-06, + "loss": 0.5879, + "step": 50577 + }, + { + "epoch": 1.3, + "learning_rate": 1.2652457025082528e-06, + "loss": 0.6499, + "step": 50578 + }, + { + "epoch": 1.3, + "learning_rate": 1.2652190230848723e-06, + "loss": 0.7676, + "step": 50579 + }, + { + "epoch": 1.3, + "learning_rate": 1.2651923434584253e-06, + "loss": 0.5728, + "step": 50580 + }, + { + "epoch": 1.3, + "learning_rate": 1.2651656636289332e-06, + "loss": 0.626, + "step": 50581 + }, + { + "epoch": 1.3, + "learning_rate": 1.2651389835964156e-06, + "loss": 0.5157, + "step": 50582 + }, + { + "epoch": 1.3, + "learning_rate": 1.2651123033608934e-06, + "loss": 0.6157, + "step": 50583 + }, + { + "epoch": 1.3, + "learning_rate": 1.2650856229223868e-06, + "loss": 0.6768, + "step": 50584 + }, + { + "epoch": 1.3, + "learning_rate": 1.2650589422809165e-06, + "loss": 0.5918, + "step": 50585 + }, + { + "epoch": 1.3, + "learning_rate": 1.2650322614365027e-06, + "loss": 0.8799, + "step": 50586 + }, + { + "epoch": 1.3, + "learning_rate": 1.265005580389166e-06, + "loss": 0.6777, + "step": 50587 + }, + { + "epoch": 1.3, + "learning_rate": 1.2649788991389263e-06, + "loss": 0.5126, + "step": 50588 + }, + { + "epoch": 1.3, + "learning_rate": 1.2649522176858048e-06, + "loss": 0.6493, + "step": 50589 + }, + { + "epoch": 1.3, + "learning_rate": 1.2649255360298213e-06, + "loss": 0.5625, + "step": 50590 + }, + { + "epoch": 1.3, + "learning_rate": 1.2648988541709971e-06, + "loss": 0.6514, + "step": 50591 + }, + { + "epoch": 1.3, + "learning_rate": 1.2648721721093511e-06, + "loss": 0.4382, + "step": 50592 + }, + { + "epoch": 1.3, + "learning_rate": 1.2648454898449055e-06, + "loss": 0.594, + "step": 50593 + }, + { + "epoch": 1.3, + "learning_rate": 1.2648188073776794e-06, + "loss": 0.7158, + "step": 50594 + }, + { + "epoch": 1.3, + "learning_rate": 1.2647921247076939e-06, + "loss": 0.5151, + "step": 50595 + }, + { + "epoch": 1.3, + "learning_rate": 1.2647654418349691e-06, + "loss": 0.6602, + "step": 50596 + }, + { + "epoch": 1.3, + "learning_rate": 1.2647387587595257e-06, + "loss": 0.7109, + "step": 50597 + }, + { + "epoch": 1.3, + "learning_rate": 1.264712075481384e-06, + "loss": 0.6543, + "step": 50598 + }, + { + "epoch": 1.3, + "learning_rate": 1.2646853920005642e-06, + "loss": 0.748, + "step": 50599 + }, + { + "epoch": 1.3, + "learning_rate": 1.2646587083170875e-06, + "loss": 0.6875, + "step": 50600 + }, + { + "epoch": 1.3, + "learning_rate": 1.2646320244309734e-06, + "loss": 0.6105, + "step": 50601 + }, + { + "epoch": 1.3, + "learning_rate": 1.2646053403422428e-06, + "loss": 0.7217, + "step": 50602 + }, + { + "epoch": 1.3, + "learning_rate": 1.264578656050916e-06, + "loss": 0.5803, + "step": 50603 + }, + { + "epoch": 1.3, + "learning_rate": 1.2645519715570134e-06, + "loss": 0.5093, + "step": 50604 + }, + { + "epoch": 1.3, + "learning_rate": 1.2645252868605556e-06, + "loss": 0.7344, + "step": 50605 + }, + { + "epoch": 1.3, + "learning_rate": 1.2644986019615633e-06, + "loss": 0.7109, + "step": 50606 + }, + { + "epoch": 1.3, + "learning_rate": 1.2644719168600562e-06, + "loss": 0.6484, + "step": 50607 + }, + { + "epoch": 1.3, + "learning_rate": 1.2644452315560555e-06, + "loss": 0.8389, + "step": 50608 + }, + { + "epoch": 1.3, + "learning_rate": 1.2644185460495807e-06, + "loss": 0.6934, + "step": 50609 + }, + { + "epoch": 1.3, + "learning_rate": 1.2643918603406532e-06, + "loss": 0.5457, + "step": 50610 + }, + { + "epoch": 1.3, + "learning_rate": 1.2643651744292928e-06, + "loss": 0.7871, + "step": 50611 + }, + { + "epoch": 1.3, + "learning_rate": 1.2643384883155204e-06, + "loss": 0.6758, + "step": 50612 + }, + { + "epoch": 1.3, + "learning_rate": 1.2643118019993558e-06, + "loss": 0.7314, + "step": 50613 + }, + { + "epoch": 1.3, + "learning_rate": 1.2642851154808197e-06, + "loss": 0.6162, + "step": 50614 + }, + { + "epoch": 1.3, + "learning_rate": 1.2642584287599328e-06, + "loss": 0.7344, + "step": 50615 + }, + { + "epoch": 1.3, + "learning_rate": 1.2642317418367156e-06, + "loss": 0.6602, + "step": 50616 + }, + { + "epoch": 1.3, + "learning_rate": 1.2642050547111884e-06, + "loss": 0.7998, + "step": 50617 + }, + { + "epoch": 1.3, + "learning_rate": 1.2641783673833714e-06, + "loss": 0.4782, + "step": 50618 + }, + { + "epoch": 1.3, + "learning_rate": 1.264151679853285e-06, + "loss": 0.6108, + "step": 50619 + }, + { + "epoch": 1.3, + "learning_rate": 1.26412499212095e-06, + "loss": 0.7979, + "step": 50620 + }, + { + "epoch": 1.3, + "learning_rate": 1.2640983041863865e-06, + "loss": 0.8135, + "step": 50621 + }, + { + "epoch": 1.3, + "learning_rate": 1.264071616049615e-06, + "loss": 0.618, + "step": 50622 + }, + { + "epoch": 1.3, + "learning_rate": 1.264044927710656e-06, + "loss": 0.6055, + "step": 50623 + }, + { + "epoch": 1.3, + "learning_rate": 1.26401823916953e-06, + "loss": 0.7188, + "step": 50624 + }, + { + "epoch": 1.3, + "learning_rate": 1.2639915504262576e-06, + "loss": 0.531, + "step": 50625 + }, + { + "epoch": 1.3, + "learning_rate": 1.263964861480859e-06, + "loss": 0.707, + "step": 50626 + }, + { + "epoch": 1.3, + "learning_rate": 1.2639381723333543e-06, + "loss": 0.4424, + "step": 50627 + }, + { + "epoch": 1.3, + "learning_rate": 1.2639114829837644e-06, + "loss": 0.5132, + "step": 50628 + }, + { + "epoch": 1.3, + "learning_rate": 1.2638847934321097e-06, + "loss": 0.6523, + "step": 50629 + }, + { + "epoch": 1.3, + "learning_rate": 1.2638581036784105e-06, + "loss": 0.6904, + "step": 50630 + }, + { + "epoch": 1.3, + "learning_rate": 1.2638314137226877e-06, + "loss": 0.5146, + "step": 50631 + }, + { + "epoch": 1.3, + "learning_rate": 1.2638047235649608e-06, + "loss": 0.6836, + "step": 50632 + }, + { + "epoch": 1.3, + "learning_rate": 1.2637780332052508e-06, + "loss": 0.9482, + "step": 50633 + }, + { + "epoch": 1.3, + "learning_rate": 1.263751342643578e-06, + "loss": 0.79, + "step": 50634 + }, + { + "epoch": 1.3, + "learning_rate": 1.263724651879963e-06, + "loss": 0.7544, + "step": 50635 + }, + { + "epoch": 1.3, + "learning_rate": 1.2636979609144266e-06, + "loss": 0.6826, + "step": 50636 + }, + { + "epoch": 1.3, + "learning_rate": 1.2636712697469885e-06, + "loss": 0.6611, + "step": 50637 + }, + { + "epoch": 1.3, + "learning_rate": 1.2636445783776693e-06, + "loss": 0.4753, + "step": 50638 + }, + { + "epoch": 1.3, + "learning_rate": 1.2636178868064894e-06, + "loss": 0.8496, + "step": 50639 + }, + { + "epoch": 1.3, + "learning_rate": 1.2635911950334697e-06, + "loss": 0.6953, + "step": 50640 + }, + { + "epoch": 1.3, + "learning_rate": 1.2635645030586303e-06, + "loss": 0.7598, + "step": 50641 + }, + { + "epoch": 1.3, + "learning_rate": 1.263537810881992e-06, + "loss": 0.834, + "step": 50642 + }, + { + "epoch": 1.3, + "learning_rate": 1.2635111185035744e-06, + "loss": 0.8252, + "step": 50643 + }, + { + "epoch": 1.3, + "learning_rate": 1.2634844259233985e-06, + "loss": 0.8496, + "step": 50644 + }, + { + "epoch": 1.3, + "learning_rate": 1.263457733141485e-06, + "loss": 0.623, + "step": 50645 + }, + { + "epoch": 1.3, + "learning_rate": 1.2634310401578541e-06, + "loss": 0.7749, + "step": 50646 + }, + { + "epoch": 1.3, + "learning_rate": 1.2634043469725257e-06, + "loss": 0.5986, + "step": 50647 + }, + { + "epoch": 1.3, + "learning_rate": 1.263377653585521e-06, + "loss": 0.6387, + "step": 50648 + }, + { + "epoch": 1.3, + "learning_rate": 1.2633509599968599e-06, + "loss": 0.6104, + "step": 50649 + }, + { + "epoch": 1.3, + "learning_rate": 1.2633242662065634e-06, + "loss": 0.6602, + "step": 50650 + }, + { + "epoch": 1.3, + "learning_rate": 1.2632975722146514e-06, + "loss": 0.6475, + "step": 50651 + }, + { + "epoch": 1.3, + "learning_rate": 1.2632708780211448e-06, + "loss": 0.6963, + "step": 50652 + }, + { + "epoch": 1.3, + "learning_rate": 1.2632441836260633e-06, + "loss": 0.7383, + "step": 50653 + }, + { + "epoch": 1.3, + "learning_rate": 1.2632174890294283e-06, + "loss": 0.6733, + "step": 50654 + }, + { + "epoch": 1.3, + "learning_rate": 1.2631907942312596e-06, + "loss": 0.7461, + "step": 50655 + }, + { + "epoch": 1.3, + "learning_rate": 1.2631640992315779e-06, + "loss": 0.5879, + "step": 50656 + }, + { + "epoch": 1.3, + "learning_rate": 1.2631374040304034e-06, + "loss": 0.7119, + "step": 50657 + }, + { + "epoch": 1.3, + "learning_rate": 1.2631107086277568e-06, + "loss": 0.8174, + "step": 50658 + }, + { + "epoch": 1.3, + "learning_rate": 1.2630840130236584e-06, + "loss": 0.5454, + "step": 50659 + }, + { + "epoch": 1.3, + "learning_rate": 1.2630573172181287e-06, + "loss": 0.6055, + "step": 50660 + }, + { + "epoch": 1.3, + "learning_rate": 1.263030621211188e-06, + "loss": 0.6826, + "step": 50661 + }, + { + "epoch": 1.3, + "learning_rate": 1.2630039250028568e-06, + "loss": 0.6909, + "step": 50662 + }, + { + "epoch": 1.3, + "learning_rate": 1.262977228593156e-06, + "loss": 0.5112, + "step": 50663 + }, + { + "epoch": 1.3, + "learning_rate": 1.2629505319821055e-06, + "loss": 0.7285, + "step": 50664 + }, + { + "epoch": 1.3, + "learning_rate": 1.2629238351697253e-06, + "loss": 0.8047, + "step": 50665 + }, + { + "epoch": 1.3, + "learning_rate": 1.262897138156037e-06, + "loss": 0.7744, + "step": 50666 + }, + { + "epoch": 1.3, + "learning_rate": 1.2628704409410605e-06, + "loss": 0.6729, + "step": 50667 + }, + { + "epoch": 1.3, + "learning_rate": 1.2628437435248157e-06, + "loss": 0.7256, + "step": 50668 + }, + { + "epoch": 1.3, + "learning_rate": 1.2628170459073238e-06, + "loss": 0.666, + "step": 50669 + }, + { + "epoch": 1.3, + "learning_rate": 1.2627903480886049e-06, + "loss": 0.7754, + "step": 50670 + }, + { + "epoch": 1.3, + "learning_rate": 1.2627636500686798e-06, + "loss": 0.603, + "step": 50671 + }, + { + "epoch": 1.3, + "learning_rate": 1.2627369518475682e-06, + "loss": 0.6016, + "step": 50672 + }, + { + "epoch": 1.3, + "learning_rate": 1.2627102534252915e-06, + "loss": 0.5757, + "step": 50673 + }, + { + "epoch": 1.3, + "learning_rate": 1.262683554801869e-06, + "loss": 0.6216, + "step": 50674 + }, + { + "epoch": 1.3, + "learning_rate": 1.2626568559773226e-06, + "loss": 0.5913, + "step": 50675 + }, + { + "epoch": 1.3, + "learning_rate": 1.2626301569516713e-06, + "loss": 0.6553, + "step": 50676 + }, + { + "epoch": 1.3, + "learning_rate": 1.2626034577249365e-06, + "loss": 0.7041, + "step": 50677 + }, + { + "epoch": 1.3, + "learning_rate": 1.2625767582971378e-06, + "loss": 0.6436, + "step": 50678 + }, + { + "epoch": 1.3, + "learning_rate": 1.2625500586682966e-06, + "loss": 0.6592, + "step": 50679 + }, + { + "epoch": 1.3, + "learning_rate": 1.262523358838433e-06, + "loss": 0.5879, + "step": 50680 + }, + { + "epoch": 1.3, + "learning_rate": 1.262496658807567e-06, + "loss": 0.7104, + "step": 50681 + }, + { + "epoch": 1.3, + "learning_rate": 1.2624699585757195e-06, + "loss": 0.8682, + "step": 50682 + }, + { + "epoch": 1.3, + "learning_rate": 1.2624432581429107e-06, + "loss": 0.6226, + "step": 50683 + }, + { + "epoch": 1.3, + "learning_rate": 1.2624165575091612e-06, + "loss": 0.7764, + "step": 50684 + }, + { + "epoch": 1.3, + "learning_rate": 1.2623898566744915e-06, + "loss": 0.7383, + "step": 50685 + }, + { + "epoch": 1.3, + "learning_rate": 1.262363155638922e-06, + "loss": 0.7627, + "step": 50686 + }, + { + "epoch": 1.3, + "learning_rate": 1.262336454402473e-06, + "loss": 0.6826, + "step": 50687 + }, + { + "epoch": 1.3, + "learning_rate": 1.2623097529651652e-06, + "loss": 0.7271, + "step": 50688 + }, + { + "epoch": 1.3, + "learning_rate": 1.2622830513270187e-06, + "loss": 0.8447, + "step": 50689 + }, + { + "epoch": 1.3, + "learning_rate": 1.2622563494880542e-06, + "loss": 0.4371, + "step": 50690 + }, + { + "epoch": 1.3, + "learning_rate": 1.262229647448292e-06, + "loss": 0.397, + "step": 50691 + }, + { + "epoch": 1.3, + "learning_rate": 1.2622029452077528e-06, + "loss": 0.5619, + "step": 50692 + }, + { + "epoch": 1.3, + "learning_rate": 1.2621762427664566e-06, + "loss": 0.7373, + "step": 50693 + }, + { + "epoch": 1.3, + "learning_rate": 1.2621495401244244e-06, + "loss": 0.6138, + "step": 50694 + }, + { + "epoch": 1.3, + "learning_rate": 1.262122837281676e-06, + "loss": 0.6392, + "step": 50695 + }, + { + "epoch": 1.3, + "learning_rate": 1.2620961342382326e-06, + "loss": 0.7676, + "step": 50696 + }, + { + "epoch": 1.3, + "learning_rate": 1.262069430994114e-06, + "loss": 0.4292, + "step": 50697 + }, + { + "epoch": 1.3, + "learning_rate": 1.262042727549341e-06, + "loss": 0.5288, + "step": 50698 + }, + { + "epoch": 1.3, + "learning_rate": 1.2620160239039336e-06, + "loss": 0.5557, + "step": 50699 + }, + { + "epoch": 1.3, + "learning_rate": 1.2619893200579133e-06, + "loss": 0.7023, + "step": 50700 + }, + { + "epoch": 1.3, + "learning_rate": 1.261962616011299e-06, + "loss": 0.5977, + "step": 50701 + }, + { + "epoch": 1.3, + "learning_rate": 1.2619359117641123e-06, + "loss": 0.5684, + "step": 50702 + }, + { + "epoch": 1.3, + "learning_rate": 1.2619092073163736e-06, + "loss": 0.6768, + "step": 50703 + }, + { + "epoch": 1.3, + "learning_rate": 1.2618825026681025e-06, + "loss": 0.7949, + "step": 50704 + }, + { + "epoch": 1.3, + "learning_rate": 1.2618557978193206e-06, + "loss": 0.4624, + "step": 50705 + }, + { + "epoch": 1.3, + "learning_rate": 1.2618290927700472e-06, + "loss": 0.5527, + "step": 50706 + }, + { + "epoch": 1.3, + "learning_rate": 1.2618023875203036e-06, + "loss": 0.7363, + "step": 50707 + }, + { + "epoch": 1.3, + "learning_rate": 1.2617756820701102e-06, + "loss": 0.5586, + "step": 50708 + }, + { + "epoch": 1.3, + "learning_rate": 1.2617489764194868e-06, + "loss": 0.6758, + "step": 50709 + }, + { + "epoch": 1.3, + "learning_rate": 1.2617222705684544e-06, + "loss": 0.667, + "step": 50710 + }, + { + "epoch": 1.3, + "learning_rate": 1.2616955645170333e-06, + "loss": 0.7422, + "step": 50711 + }, + { + "epoch": 1.3, + "learning_rate": 1.2616688582652437e-06, + "loss": 0.6987, + "step": 50712 + }, + { + "epoch": 1.3, + "learning_rate": 1.2616421518131066e-06, + "loss": 0.7148, + "step": 50713 + }, + { + "epoch": 1.3, + "learning_rate": 1.261615445160642e-06, + "loss": 0.5798, + "step": 50714 + }, + { + "epoch": 1.3, + "learning_rate": 1.2615887383078708e-06, + "loss": 0.5874, + "step": 50715 + }, + { + "epoch": 1.3, + "learning_rate": 1.2615620312548124e-06, + "loss": 0.5767, + "step": 50716 + }, + { + "epoch": 1.3, + "learning_rate": 1.2615353240014886e-06, + "loss": 0.8008, + "step": 50717 + }, + { + "epoch": 1.3, + "learning_rate": 1.261508616547919e-06, + "loss": 0.5562, + "step": 50718 + }, + { + "epoch": 1.3, + "learning_rate": 1.2614819088941243e-06, + "loss": 0.5288, + "step": 50719 + }, + { + "epoch": 1.3, + "learning_rate": 1.2614552010401251e-06, + "loss": 0.7024, + "step": 50720 + }, + { + "epoch": 1.3, + "learning_rate": 1.2614284929859416e-06, + "loss": 0.6206, + "step": 50721 + }, + { + "epoch": 1.3, + "learning_rate": 1.261401784731594e-06, + "loss": 0.6357, + "step": 50722 + }, + { + "epoch": 1.3, + "learning_rate": 1.2613750762771033e-06, + "loss": 0.6577, + "step": 50723 + }, + { + "epoch": 1.3, + "learning_rate": 1.2613483676224897e-06, + "loss": 0.8184, + "step": 50724 + }, + { + "epoch": 1.3, + "learning_rate": 1.2613216587677736e-06, + "loss": 0.5674, + "step": 50725 + }, + { + "epoch": 1.3, + "learning_rate": 1.261294949712976e-06, + "loss": 0.6567, + "step": 50726 + }, + { + "epoch": 1.3, + "learning_rate": 1.2612682404581166e-06, + "loss": 0.8291, + "step": 50727 + }, + { + "epoch": 1.3, + "learning_rate": 1.2612415310032156e-06, + "loss": 0.592, + "step": 50728 + }, + { + "epoch": 1.3, + "learning_rate": 1.2612148213482944e-06, + "loss": 0.8555, + "step": 50729 + }, + { + "epoch": 1.3, + "learning_rate": 1.2611881114933732e-06, + "loss": 0.5913, + "step": 50730 + }, + { + "epoch": 1.3, + "learning_rate": 1.261161401438472e-06, + "loss": 0.6279, + "step": 50731 + }, + { + "epoch": 1.3, + "learning_rate": 1.2611346911836118e-06, + "loss": 0.5986, + "step": 50732 + }, + { + "epoch": 1.3, + "learning_rate": 1.2611079807288124e-06, + "loss": 0.6748, + "step": 50733 + }, + { + "epoch": 1.3, + "learning_rate": 1.261081270074095e-06, + "loss": 0.5793, + "step": 50734 + }, + { + "epoch": 1.3, + "learning_rate": 1.2610545592194795e-06, + "loss": 0.7949, + "step": 50735 + }, + { + "epoch": 1.3, + "learning_rate": 1.2610278481649864e-06, + "loss": 0.5864, + "step": 50736 + }, + { + "epoch": 1.3, + "learning_rate": 1.2610011369106364e-06, + "loss": 0.8076, + "step": 50737 + }, + { + "epoch": 1.3, + "learning_rate": 1.26097442545645e-06, + "loss": 0.6689, + "step": 50738 + }, + { + "epoch": 1.3, + "learning_rate": 1.260947713802447e-06, + "loss": 0.7109, + "step": 50739 + }, + { + "epoch": 1.3, + "learning_rate": 1.2609210019486489e-06, + "loss": 0.5571, + "step": 50740 + }, + { + "epoch": 1.3, + "learning_rate": 1.2608942898950752e-06, + "loss": 0.6855, + "step": 50741 + }, + { + "epoch": 1.3, + "learning_rate": 1.260867577641747e-06, + "loss": 0.5916, + "step": 50742 + }, + { + "epoch": 1.3, + "learning_rate": 1.2608408651886842e-06, + "loss": 0.8525, + "step": 50743 + }, + { + "epoch": 1.3, + "learning_rate": 1.2608141525359077e-06, + "loss": 0.4844, + "step": 50744 + }, + { + "epoch": 1.3, + "learning_rate": 1.260787439683438e-06, + "loss": 0.5688, + "step": 50745 + }, + { + "epoch": 1.3, + "learning_rate": 1.2607607266312953e-06, + "loss": 0.5139, + "step": 50746 + }, + { + "epoch": 1.3, + "learning_rate": 1.2607340133794997e-06, + "loss": 0.4103, + "step": 50747 + }, + { + "epoch": 1.3, + "learning_rate": 1.2607072999280724e-06, + "loss": 0.7007, + "step": 50748 + }, + { + "epoch": 1.3, + "learning_rate": 1.2606805862770333e-06, + "loss": 0.6138, + "step": 50749 + }, + { + "epoch": 1.3, + "learning_rate": 1.2606538724264032e-06, + "loss": 0.5413, + "step": 50750 + }, + { + "epoch": 1.3, + "learning_rate": 1.2606271583762026e-06, + "loss": 0.6099, + "step": 50751 + }, + { + "epoch": 1.3, + "learning_rate": 1.2606004441264512e-06, + "loss": 0.7031, + "step": 50752 + }, + { + "epoch": 1.3, + "learning_rate": 1.2605737296771706e-06, + "loss": 0.7173, + "step": 50753 + }, + { + "epoch": 1.3, + "learning_rate": 1.2605470150283805e-06, + "loss": 0.6016, + "step": 50754 + }, + { + "epoch": 1.3, + "learning_rate": 1.2605203001801014e-06, + "loss": 0.7461, + "step": 50755 + }, + { + "epoch": 1.3, + "learning_rate": 1.260493585132354e-06, + "loss": 0.6436, + "step": 50756 + }, + { + "epoch": 1.3, + "learning_rate": 1.2604668698851586e-06, + "loss": 0.6807, + "step": 50757 + }, + { + "epoch": 1.3, + "learning_rate": 1.2604401544385356e-06, + "loss": 0.5488, + "step": 50758 + }, + { + "epoch": 1.3, + "learning_rate": 1.2604134387925057e-06, + "loss": 0.6709, + "step": 50759 + }, + { + "epoch": 1.3, + "learning_rate": 1.2603867229470893e-06, + "loss": 0.6372, + "step": 50760 + }, + { + "epoch": 1.3, + "learning_rate": 1.2603600069023065e-06, + "loss": 0.5532, + "step": 50761 + }, + { + "epoch": 1.3, + "learning_rate": 1.2603332906581781e-06, + "loss": 0.5591, + "step": 50762 + }, + { + "epoch": 1.3, + "learning_rate": 1.2603065742147245e-06, + "loss": 0.5884, + "step": 50763 + }, + { + "epoch": 1.3, + "learning_rate": 1.260279857571966e-06, + "loss": 0.6914, + "step": 50764 + }, + { + "epoch": 1.3, + "learning_rate": 1.2602531407299237e-06, + "loss": 0.5601, + "step": 50765 + }, + { + "epoch": 1.3, + "learning_rate": 1.2602264236886169e-06, + "loss": 0.6807, + "step": 50766 + }, + { + "epoch": 1.3, + "learning_rate": 1.260199706448067e-06, + "loss": 0.6895, + "step": 50767 + }, + { + "epoch": 1.3, + "learning_rate": 1.2601729890082941e-06, + "loss": 0.7773, + "step": 50768 + }, + { + "epoch": 1.3, + "learning_rate": 1.2601462713693187e-06, + "loss": 0.4268, + "step": 50769 + }, + { + "epoch": 1.3, + "learning_rate": 1.2601195535311613e-06, + "loss": 0.6587, + "step": 50770 + }, + { + "epoch": 1.3, + "learning_rate": 1.2600928354938422e-06, + "loss": 0.583, + "step": 50771 + }, + { + "epoch": 1.3, + "learning_rate": 1.260066117257382e-06, + "loss": 0.6123, + "step": 50772 + }, + { + "epoch": 1.3, + "learning_rate": 1.2600393988218013e-06, + "loss": 0.6831, + "step": 50773 + }, + { + "epoch": 1.3, + "learning_rate": 1.26001268018712e-06, + "loss": 0.7031, + "step": 50774 + }, + { + "epoch": 1.3, + "learning_rate": 1.2599859613533595e-06, + "loss": 0.6626, + "step": 50775 + }, + { + "epoch": 1.3, + "learning_rate": 1.2599592423205395e-06, + "loss": 0.635, + "step": 50776 + }, + { + "epoch": 1.3, + "learning_rate": 1.2599325230886805e-06, + "loss": 0.5278, + "step": 50777 + }, + { + "epoch": 1.3, + "learning_rate": 1.2599058036578032e-06, + "loss": 0.6255, + "step": 50778 + }, + { + "epoch": 1.3, + "learning_rate": 1.2598790840279279e-06, + "loss": 0.5347, + "step": 50779 + }, + { + "epoch": 1.3, + "learning_rate": 1.2598523641990752e-06, + "loss": 0.5168, + "step": 50780 + }, + { + "epoch": 1.3, + "learning_rate": 1.2598256441712657e-06, + "loss": 0.748, + "step": 50781 + }, + { + "epoch": 1.3, + "learning_rate": 1.2597989239445195e-06, + "loss": 0.6533, + "step": 50782 + }, + { + "epoch": 1.3, + "learning_rate": 1.2597722035188569e-06, + "loss": 0.6572, + "step": 50783 + }, + { + "epoch": 1.3, + "learning_rate": 1.259745482894299e-06, + "loss": 0.6572, + "step": 50784 + }, + { + "epoch": 1.3, + "learning_rate": 1.259718762070866e-06, + "loss": 0.7422, + "step": 50785 + }, + { + "epoch": 1.3, + "learning_rate": 1.259692041048578e-06, + "loss": 0.6211, + "step": 50786 + }, + { + "epoch": 1.3, + "learning_rate": 1.259665319827456e-06, + "loss": 0.6182, + "step": 50787 + }, + { + "epoch": 1.3, + "learning_rate": 1.2596385984075203e-06, + "loss": 0.585, + "step": 50788 + }, + { + "epoch": 1.3, + "learning_rate": 1.2596118767887906e-06, + "loss": 0.7344, + "step": 50789 + }, + { + "epoch": 1.3, + "learning_rate": 1.259585154971289e-06, + "loss": 0.6099, + "step": 50790 + }, + { + "epoch": 1.3, + "learning_rate": 1.2595584329550343e-06, + "loss": 0.7412, + "step": 50791 + }, + { + "epoch": 1.3, + "learning_rate": 1.2595317107400478e-06, + "loss": 0.5796, + "step": 50792 + }, + { + "epoch": 1.3, + "learning_rate": 1.2595049883263498e-06, + "loss": 0.5483, + "step": 50793 + }, + { + "epoch": 1.3, + "learning_rate": 1.2594782657139607e-06, + "loss": 0.751, + "step": 50794 + }, + { + "epoch": 1.3, + "learning_rate": 1.259451542902901e-06, + "loss": 0.6187, + "step": 50795 + }, + { + "epoch": 1.3, + "learning_rate": 1.2594248198931915e-06, + "loss": 0.4541, + "step": 50796 + }, + { + "epoch": 1.3, + "learning_rate": 1.259398096684852e-06, + "loss": 0.7139, + "step": 50797 + }, + { + "epoch": 1.3, + "learning_rate": 1.2593713732779034e-06, + "loss": 0.6421, + "step": 50798 + }, + { + "epoch": 1.3, + "learning_rate": 1.259344649672366e-06, + "loss": 0.6777, + "step": 50799 + }, + { + "epoch": 1.3, + "learning_rate": 1.2593179258682605e-06, + "loss": 0.7129, + "step": 50800 + }, + { + "epoch": 1.3, + "learning_rate": 1.2592912018656072e-06, + "loss": 0.5869, + "step": 50801 + }, + { + "epoch": 1.3, + "learning_rate": 1.2592644776644264e-06, + "loss": 0.6709, + "step": 50802 + }, + { + "epoch": 1.3, + "learning_rate": 1.2592377532647389e-06, + "loss": 0.6074, + "step": 50803 + }, + { + "epoch": 1.3, + "learning_rate": 1.2592110286665647e-06, + "loss": 0.7588, + "step": 50804 + }, + { + "epoch": 1.3, + "learning_rate": 1.259184303869925e-06, + "loss": 0.5977, + "step": 50805 + }, + { + "epoch": 1.3, + "learning_rate": 1.2591575788748391e-06, + "loss": 0.4714, + "step": 50806 + }, + { + "epoch": 1.3, + "learning_rate": 1.2591308536813287e-06, + "loss": 0.5967, + "step": 50807 + }, + { + "epoch": 1.3, + "learning_rate": 1.2591041282894135e-06, + "loss": 0.5371, + "step": 50808 + }, + { + "epoch": 1.3, + "learning_rate": 1.2590774026991142e-06, + "loss": 0.6558, + "step": 50809 + }, + { + "epoch": 1.3, + "learning_rate": 1.2590506769104513e-06, + "loss": 0.7705, + "step": 50810 + }, + { + "epoch": 1.3, + "learning_rate": 1.2590239509234453e-06, + "loss": 0.5308, + "step": 50811 + }, + { + "epoch": 1.3, + "learning_rate": 1.2589972247381164e-06, + "loss": 0.6361, + "step": 50812 + }, + { + "epoch": 1.3, + "learning_rate": 1.2589704983544853e-06, + "loss": 0.71, + "step": 50813 + }, + { + "epoch": 1.3, + "learning_rate": 1.2589437717725724e-06, + "loss": 0.6675, + "step": 50814 + }, + { + "epoch": 1.3, + "learning_rate": 1.2589170449923981e-06, + "loss": 0.5933, + "step": 50815 + }, + { + "epoch": 1.3, + "learning_rate": 1.2588903180139832e-06, + "loss": 0.7666, + "step": 50816 + }, + { + "epoch": 1.3, + "learning_rate": 1.2588635908373477e-06, + "loss": 0.6553, + "step": 50817 + }, + { + "epoch": 1.3, + "learning_rate": 1.2588368634625119e-06, + "loss": 0.5845, + "step": 50818 + }, + { + "epoch": 1.3, + "learning_rate": 1.2588101358894972e-06, + "loss": 0.5825, + "step": 50819 + }, + { + "epoch": 1.3, + "learning_rate": 1.2587834081183234e-06, + "loss": 0.6885, + "step": 50820 + }, + { + "epoch": 1.3, + "learning_rate": 1.2587566801490104e-06, + "loss": 0.7646, + "step": 50821 + }, + { + "epoch": 1.3, + "learning_rate": 1.25872995198158e-06, + "loss": 0.6914, + "step": 50822 + }, + { + "epoch": 1.3, + "learning_rate": 1.2587032236160516e-06, + "loss": 0.6758, + "step": 50823 + }, + { + "epoch": 1.3, + "learning_rate": 1.2586764950524463e-06, + "loss": 0.5283, + "step": 50824 + }, + { + "epoch": 1.3, + "learning_rate": 1.2586497662907843e-06, + "loss": 0.7314, + "step": 50825 + }, + { + "epoch": 1.3, + "learning_rate": 1.2586230373310858e-06, + "loss": 0.7812, + "step": 50826 + }, + { + "epoch": 1.3, + "learning_rate": 1.2585963081733714e-06, + "loss": 0.6143, + "step": 50827 + }, + { + "epoch": 1.3, + "learning_rate": 1.2585695788176622e-06, + "loss": 0.6626, + "step": 50828 + }, + { + "epoch": 1.3, + "learning_rate": 1.2585428492639778e-06, + "loss": 0.5752, + "step": 50829 + }, + { + "epoch": 1.3, + "learning_rate": 1.2585161195123396e-06, + "loss": 0.6064, + "step": 50830 + }, + { + "epoch": 1.3, + "learning_rate": 1.2584893895627668e-06, + "loss": 0.6484, + "step": 50831 + }, + { + "epoch": 1.3, + "learning_rate": 1.2584626594152806e-06, + "loss": 0.6284, + "step": 50832 + }, + { + "epoch": 1.3, + "learning_rate": 1.258435929069902e-06, + "loss": 0.707, + "step": 50833 + }, + { + "epoch": 1.3, + "learning_rate": 1.2584091985266504e-06, + "loss": 0.7451, + "step": 50834 + }, + { + "epoch": 1.3, + "learning_rate": 1.2583824677855467e-06, + "loss": 0.8379, + "step": 50835 + }, + { + "epoch": 1.3, + "learning_rate": 1.258355736846612e-06, + "loss": 0.5146, + "step": 50836 + }, + { + "epoch": 1.3, + "learning_rate": 1.2583290057098657e-06, + "loss": 0.71, + "step": 50837 + }, + { + "epoch": 1.3, + "learning_rate": 1.2583022743753289e-06, + "loss": 0.5288, + "step": 50838 + }, + { + "epoch": 1.3, + "learning_rate": 1.2582755428430217e-06, + "loss": 0.6465, + "step": 50839 + }, + { + "epoch": 1.3, + "learning_rate": 1.258248811112965e-06, + "loss": 0.54, + "step": 50840 + }, + { + "epoch": 1.3, + "learning_rate": 1.2582220791851792e-06, + "loss": 0.5947, + "step": 50841 + }, + { + "epoch": 1.3, + "learning_rate": 1.2581953470596843e-06, + "loss": 0.7144, + "step": 50842 + }, + { + "epoch": 1.3, + "learning_rate": 1.2581686147365014e-06, + "loss": 0.667, + "step": 50843 + }, + { + "epoch": 1.3, + "learning_rate": 1.2581418822156505e-06, + "loss": 0.7295, + "step": 50844 + }, + { + "epoch": 1.3, + "learning_rate": 1.2581151494971525e-06, + "loss": 0.7344, + "step": 50845 + }, + { + "epoch": 1.3, + "learning_rate": 1.258088416581027e-06, + "loss": 0.627, + "step": 50846 + }, + { + "epoch": 1.3, + "learning_rate": 1.2580616834672957e-06, + "loss": 0.6943, + "step": 50847 + }, + { + "epoch": 1.3, + "learning_rate": 1.258034950155978e-06, + "loss": 0.8076, + "step": 50848 + }, + { + "epoch": 1.3, + "learning_rate": 1.2580082166470949e-06, + "loss": 0.6602, + "step": 50849 + }, + { + "epoch": 1.3, + "learning_rate": 1.257981482940667e-06, + "loss": 0.5625, + "step": 50850 + }, + { + "epoch": 1.3, + "learning_rate": 1.2579547490367144e-06, + "loss": 0.8555, + "step": 50851 + }, + { + "epoch": 1.3, + "learning_rate": 1.2579280149352576e-06, + "loss": 0.5483, + "step": 50852 + }, + { + "epoch": 1.3, + "learning_rate": 1.2579012806363172e-06, + "loss": 0.8086, + "step": 50853 + }, + { + "epoch": 1.3, + "learning_rate": 1.2578745461399136e-06, + "loss": 0.5698, + "step": 50854 + }, + { + "epoch": 1.3, + "learning_rate": 1.2578478114460678e-06, + "loss": 0.7725, + "step": 50855 + }, + { + "epoch": 1.3, + "learning_rate": 1.2578210765547992e-06, + "loss": 0.533, + "step": 50856 + }, + { + "epoch": 1.3, + "learning_rate": 1.2577943414661292e-06, + "loss": 0.5801, + "step": 50857 + }, + { + "epoch": 1.3, + "learning_rate": 1.2577676061800778e-06, + "loss": 0.8379, + "step": 50858 + }, + { + "epoch": 1.3, + "learning_rate": 1.2577408706966654e-06, + "loss": 0.6133, + "step": 50859 + }, + { + "epoch": 1.3, + "learning_rate": 1.257714135015913e-06, + "loss": 0.6978, + "step": 50860 + }, + { + "epoch": 1.3, + "learning_rate": 1.2576873991378408e-06, + "loss": 0.7607, + "step": 50861 + }, + { + "epoch": 1.3, + "learning_rate": 1.2576606630624689e-06, + "loss": 0.5496, + "step": 50862 + }, + { + "epoch": 1.3, + "learning_rate": 1.257633926789818e-06, + "loss": 0.5898, + "step": 50863 + }, + { + "epoch": 1.3, + "learning_rate": 1.2576071903199087e-06, + "loss": 0.6486, + "step": 50864 + }, + { + "epoch": 1.3, + "learning_rate": 1.2575804536527619e-06, + "loss": 0.6768, + "step": 50865 + }, + { + "epoch": 1.3, + "learning_rate": 1.2575537167883972e-06, + "loss": 0.6382, + "step": 50866 + }, + { + "epoch": 1.3, + "learning_rate": 1.2575269797268353e-06, + "loss": 0.6201, + "step": 50867 + }, + { + "epoch": 1.3, + "learning_rate": 1.2575002424680971e-06, + "loss": 0.6797, + "step": 50868 + }, + { + "epoch": 1.3, + "learning_rate": 1.2574735050122027e-06, + "loss": 0.5925, + "step": 50869 + }, + { + "epoch": 1.3, + "learning_rate": 1.2574467673591728e-06, + "loss": 0.543, + "step": 50870 + }, + { + "epoch": 1.3, + "learning_rate": 1.2574200295090278e-06, + "loss": 0.6631, + "step": 50871 + }, + { + "epoch": 1.3, + "learning_rate": 1.257393291461788e-06, + "loss": 0.6665, + "step": 50872 + }, + { + "epoch": 1.3, + "learning_rate": 1.2573665532174737e-06, + "loss": 0.5552, + "step": 50873 + }, + { + "epoch": 1.3, + "learning_rate": 1.257339814776106e-06, + "loss": 0.5508, + "step": 50874 + }, + { + "epoch": 1.3, + "learning_rate": 1.2573130761377053e-06, + "loss": 0.7363, + "step": 50875 + }, + { + "epoch": 1.3, + "learning_rate": 1.2572863373022916e-06, + "loss": 0.8516, + "step": 50876 + }, + { + "epoch": 1.3, + "learning_rate": 1.2572595982698852e-06, + "loss": 0.7427, + "step": 50877 + }, + { + "epoch": 1.3, + "learning_rate": 1.2572328590405073e-06, + "loss": 0.6553, + "step": 50878 + }, + { + "epoch": 1.3, + "learning_rate": 1.2572061196141777e-06, + "loss": 0.5015, + "step": 50879 + }, + { + "epoch": 1.3, + "learning_rate": 1.2571793799909179e-06, + "loss": 0.6001, + "step": 50880 + }, + { + "epoch": 1.3, + "learning_rate": 1.257152640170747e-06, + "loss": 0.5664, + "step": 50881 + }, + { + "epoch": 1.3, + "learning_rate": 1.2571259001536864e-06, + "loss": 0.4287, + "step": 50882 + }, + { + "epoch": 1.3, + "learning_rate": 1.2570991599397562e-06, + "loss": 0.5984, + "step": 50883 + }, + { + "epoch": 1.3, + "learning_rate": 1.2570724195289772e-06, + "loss": 0.5229, + "step": 50884 + }, + { + "epoch": 1.3, + "learning_rate": 1.2570456789213697e-06, + "loss": 0.584, + "step": 50885 + }, + { + "epoch": 1.3, + "learning_rate": 1.2570189381169537e-06, + "loss": 0.6909, + "step": 50886 + }, + { + "epoch": 1.3, + "learning_rate": 1.2569921971157506e-06, + "loss": 0.708, + "step": 50887 + }, + { + "epoch": 1.3, + "learning_rate": 1.25696545591778e-06, + "loss": 0.6929, + "step": 50888 + }, + { + "epoch": 1.3, + "learning_rate": 1.2569387145230632e-06, + "loss": 0.6694, + "step": 50889 + }, + { + "epoch": 1.3, + "learning_rate": 1.25691197293162e-06, + "loss": 0.4186, + "step": 50890 + }, + { + "epoch": 1.3, + "learning_rate": 1.2568852311434712e-06, + "loss": 0.4822, + "step": 50891 + }, + { + "epoch": 1.3, + "learning_rate": 1.2568584891586368e-06, + "loss": 0.6602, + "step": 50892 + }, + { + "epoch": 1.3, + "learning_rate": 1.2568317469771384e-06, + "loss": 0.644, + "step": 50893 + }, + { + "epoch": 1.3, + "learning_rate": 1.2568050045989951e-06, + "loss": 0.5615, + "step": 50894 + }, + { + "epoch": 1.3, + "learning_rate": 1.2567782620242284e-06, + "loss": 0.915, + "step": 50895 + }, + { + "epoch": 1.3, + "learning_rate": 1.2567515192528582e-06, + "loss": 0.564, + "step": 50896 + }, + { + "epoch": 1.3, + "learning_rate": 1.2567247762849053e-06, + "loss": 0.4686, + "step": 50897 + }, + { + "epoch": 1.3, + "learning_rate": 1.2566980331203898e-06, + "loss": 0.7988, + "step": 50898 + }, + { + "epoch": 1.3, + "learning_rate": 1.2566712897593325e-06, + "loss": 0.6318, + "step": 50899 + }, + { + "epoch": 1.3, + "learning_rate": 1.2566445462017541e-06, + "loss": 0.365, + "step": 50900 + }, + { + "epoch": 1.3, + "learning_rate": 1.2566178024476747e-06, + "loss": 0.6777, + "step": 50901 + }, + { + "epoch": 1.3, + "learning_rate": 1.2565910584971145e-06, + "loss": 0.6465, + "step": 50902 + }, + { + "epoch": 1.3, + "learning_rate": 1.2565643143500945e-06, + "loss": 0.7568, + "step": 50903 + }, + { + "epoch": 1.3, + "learning_rate": 1.2565375700066349e-06, + "loss": 0.5383, + "step": 50904 + }, + { + "epoch": 1.3, + "learning_rate": 1.2565108254667564e-06, + "loss": 0.5977, + "step": 50905 + }, + { + "epoch": 1.3, + "learning_rate": 1.2564840807304795e-06, + "loss": 0.6587, + "step": 50906 + }, + { + "epoch": 1.3, + "learning_rate": 1.2564573357978242e-06, + "loss": 0.6943, + "step": 50907 + }, + { + "epoch": 1.3, + "learning_rate": 1.2564305906688114e-06, + "loss": 0.6333, + "step": 50908 + }, + { + "epoch": 1.3, + "learning_rate": 1.2564038453434617e-06, + "loss": 0.7012, + "step": 50909 + }, + { + "epoch": 1.3, + "learning_rate": 1.2563770998217954e-06, + "loss": 0.7017, + "step": 50910 + }, + { + "epoch": 1.3, + "learning_rate": 1.2563503541038328e-06, + "loss": 0.6152, + "step": 50911 + }, + { + "epoch": 1.3, + "learning_rate": 1.2563236081895946e-06, + "loss": 0.7222, + "step": 50912 + }, + { + "epoch": 1.3, + "learning_rate": 1.2562968620791008e-06, + "loss": 0.6626, + "step": 50913 + }, + { + "epoch": 1.3, + "learning_rate": 1.2562701157723728e-06, + "loss": 0.6201, + "step": 50914 + }, + { + "epoch": 1.3, + "learning_rate": 1.2562433692694304e-06, + "loss": 0.7363, + "step": 50915 + }, + { + "epoch": 1.31, + "learning_rate": 1.2562166225702942e-06, + "loss": 0.5227, + "step": 50916 + }, + { + "epoch": 1.31, + "learning_rate": 1.2561898756749844e-06, + "loss": 0.6072, + "step": 50917 + }, + { + "epoch": 1.31, + "learning_rate": 1.2561631285835223e-06, + "loss": 0.4697, + "step": 50918 + }, + { + "epoch": 1.31, + "learning_rate": 1.2561363812959273e-06, + "loss": 0.6455, + "step": 50919 + }, + { + "epoch": 1.31, + "learning_rate": 1.2561096338122212e-06, + "loss": 0.6533, + "step": 50920 + }, + { + "epoch": 1.31, + "learning_rate": 1.2560828861324231e-06, + "loss": 0.6797, + "step": 50921 + }, + { + "epoch": 1.31, + "learning_rate": 1.2560561382565547e-06, + "loss": 0.7061, + "step": 50922 + }, + { + "epoch": 1.31, + "learning_rate": 1.2560293901846352e-06, + "loss": 0.7695, + "step": 50923 + }, + { + "epoch": 1.31, + "learning_rate": 1.2560026419166862e-06, + "loss": 0.5615, + "step": 50924 + }, + { + "epoch": 1.31, + "learning_rate": 1.2559758934527275e-06, + "loss": 0.6553, + "step": 50925 + }, + { + "epoch": 1.31, + "learning_rate": 1.2559491447927802e-06, + "loss": 0.4731, + "step": 50926 + }, + { + "epoch": 1.31, + "learning_rate": 1.2559223959368641e-06, + "loss": 0.6387, + "step": 50927 + }, + { + "epoch": 1.31, + "learning_rate": 1.2558956468850001e-06, + "loss": 0.6382, + "step": 50928 + }, + { + "epoch": 1.31, + "learning_rate": 1.2558688976372085e-06, + "loss": 0.6631, + "step": 50929 + }, + { + "epoch": 1.31, + "learning_rate": 1.2558421481935099e-06, + "loss": 0.7695, + "step": 50930 + }, + { + "epoch": 1.31, + "learning_rate": 1.2558153985539249e-06, + "loss": 0.6826, + "step": 50931 + }, + { + "epoch": 1.31, + "learning_rate": 1.2557886487184735e-06, + "loss": 0.6582, + "step": 50932 + }, + { + "epoch": 1.31, + "learning_rate": 1.2557618986871766e-06, + "loss": 0.6284, + "step": 50933 + }, + { + "epoch": 1.31, + "learning_rate": 1.2557351484600546e-06, + "loss": 0.4844, + "step": 50934 + }, + { + "epoch": 1.31, + "learning_rate": 1.255708398037128e-06, + "loss": 0.538, + "step": 50935 + }, + { + "epoch": 1.31, + "learning_rate": 1.255681647418417e-06, + "loss": 0.6992, + "step": 50936 + }, + { + "epoch": 1.31, + "learning_rate": 1.255654896603943e-06, + "loss": 0.5034, + "step": 50937 + }, + { + "epoch": 1.31, + "learning_rate": 1.255628145593725e-06, + "loss": 0.7598, + "step": 50938 + }, + { + "epoch": 1.31, + "learning_rate": 1.2556013943877845e-06, + "loss": 0.7139, + "step": 50939 + }, + { + "epoch": 1.31, + "learning_rate": 1.255574642986142e-06, + "loss": 0.5381, + "step": 50940 + }, + { + "epoch": 1.31, + "learning_rate": 1.2555478913888178e-06, + "loss": 0.6567, + "step": 50941 + }, + { + "epoch": 1.31, + "learning_rate": 1.2555211395958318e-06, + "loss": 0.7012, + "step": 50942 + }, + { + "epoch": 1.31, + "learning_rate": 1.2554943876072055e-06, + "loss": 0.7266, + "step": 50943 + }, + { + "epoch": 1.31, + "learning_rate": 1.2554676354229586e-06, + "loss": 0.5962, + "step": 50944 + }, + { + "epoch": 1.31, + "learning_rate": 1.2554408830431125e-06, + "loss": 0.5359, + "step": 50945 + }, + { + "epoch": 1.31, + "learning_rate": 1.2554141304676864e-06, + "loss": 0.5752, + "step": 50946 + }, + { + "epoch": 1.31, + "learning_rate": 1.2553873776967017e-06, + "loss": 0.5901, + "step": 50947 + }, + { + "epoch": 1.31, + "learning_rate": 1.2553606247301782e-06, + "loss": 0.7139, + "step": 50948 + }, + { + "epoch": 1.31, + "learning_rate": 1.2553338715681374e-06, + "loss": 0.5391, + "step": 50949 + }, + { + "epoch": 1.31, + "learning_rate": 1.255307118210599e-06, + "loss": 0.6685, + "step": 50950 + }, + { + "epoch": 1.31, + "learning_rate": 1.2552803646575839e-06, + "loss": 0.4702, + "step": 50951 + }, + { + "epoch": 1.31, + "learning_rate": 1.255253610909112e-06, + "loss": 0.6104, + "step": 50952 + }, + { + "epoch": 1.31, + "learning_rate": 1.255226856965204e-06, + "loss": 0.4739, + "step": 50953 + }, + { + "epoch": 1.31, + "learning_rate": 1.2552001028258806e-06, + "loss": 0.708, + "step": 50954 + }, + { + "epoch": 1.31, + "learning_rate": 1.2551733484911626e-06, + "loss": 0.7373, + "step": 50955 + }, + { + "epoch": 1.31, + "learning_rate": 1.2551465939610698e-06, + "loss": 0.6641, + "step": 50956 + }, + { + "epoch": 1.31, + "learning_rate": 1.2551198392356233e-06, + "loss": 0.6304, + "step": 50957 + }, + { + "epoch": 1.31, + "learning_rate": 1.2550930843148432e-06, + "loss": 0.6904, + "step": 50958 + }, + { + "epoch": 1.31, + "learning_rate": 1.2550663291987495e-06, + "loss": 0.7383, + "step": 50959 + }, + { + "epoch": 1.31, + "learning_rate": 1.2550395738873641e-06, + "loss": 0.6963, + "step": 50960 + }, + { + "epoch": 1.31, + "learning_rate": 1.2550128183807061e-06, + "loss": 0.6123, + "step": 50961 + }, + { + "epoch": 1.31, + "learning_rate": 1.2549860626787964e-06, + "loss": 0.6777, + "step": 50962 + }, + { + "epoch": 1.31, + "learning_rate": 1.2549593067816558e-06, + "loss": 0.7676, + "step": 50963 + }, + { + "epoch": 1.31, + "learning_rate": 1.2549325506893046e-06, + "loss": 0.8955, + "step": 50964 + }, + { + "epoch": 1.31, + "learning_rate": 1.2549057944017633e-06, + "loss": 0.6348, + "step": 50965 + }, + { + "epoch": 1.31, + "learning_rate": 1.2548790379190523e-06, + "loss": 0.6357, + "step": 50966 + }, + { + "epoch": 1.31, + "learning_rate": 1.254852281241192e-06, + "loss": 0.668, + "step": 50967 + }, + { + "epoch": 1.31, + "learning_rate": 1.2548255243682034e-06, + "loss": 0.6328, + "step": 50968 + }, + { + "epoch": 1.31, + "learning_rate": 1.2547987673001064e-06, + "loss": 0.604, + "step": 50969 + }, + { + "epoch": 1.31, + "learning_rate": 1.2547720100369217e-06, + "loss": 0.6689, + "step": 50970 + }, + { + "epoch": 1.31, + "learning_rate": 1.2547452525786697e-06, + "loss": 0.7412, + "step": 50971 + }, + { + "epoch": 1.31, + "learning_rate": 1.254718494925371e-06, + "loss": 0.665, + "step": 50972 + }, + { + "epoch": 1.31, + "learning_rate": 1.254691737077046e-06, + "loss": 0.8184, + "step": 50973 + }, + { + "epoch": 1.31, + "learning_rate": 1.2546649790337155e-06, + "loss": 0.8271, + "step": 50974 + }, + { + "epoch": 1.31, + "learning_rate": 1.2546382207953997e-06, + "loss": 0.5869, + "step": 50975 + }, + { + "epoch": 1.31, + "learning_rate": 1.2546114623621188e-06, + "loss": 0.5996, + "step": 50976 + }, + { + "epoch": 1.31, + "learning_rate": 1.2545847037338936e-06, + "loss": 0.7007, + "step": 50977 + }, + { + "epoch": 1.31, + "learning_rate": 1.2545579449107448e-06, + "loss": 0.583, + "step": 50978 + }, + { + "epoch": 1.31, + "learning_rate": 1.254531185892693e-06, + "loss": 0.7461, + "step": 50979 + }, + { + "epoch": 1.31, + "learning_rate": 1.254504426679758e-06, + "loss": 0.7754, + "step": 50980 + }, + { + "epoch": 1.31, + "learning_rate": 1.2544776672719609e-06, + "loss": 0.8428, + "step": 50981 + }, + { + "epoch": 1.31, + "learning_rate": 1.2544509076693215e-06, + "loss": 0.7568, + "step": 50982 + }, + { + "epoch": 1.31, + "learning_rate": 1.2544241478718612e-06, + "loss": 0.7402, + "step": 50983 + }, + { + "epoch": 1.31, + "learning_rate": 1.2543973878795996e-06, + "loss": 0.5547, + "step": 50984 + }, + { + "epoch": 1.31, + "learning_rate": 1.2543706276925581e-06, + "loss": 0.7295, + "step": 50985 + }, + { + "epoch": 1.31, + "learning_rate": 1.2543438673107565e-06, + "loss": 0.7979, + "step": 50986 + }, + { + "epoch": 1.31, + "learning_rate": 1.2543171067342154e-06, + "loss": 0.646, + "step": 50987 + }, + { + "epoch": 1.31, + "learning_rate": 1.2542903459629551e-06, + "loss": 0.7539, + "step": 50988 + }, + { + "epoch": 1.31, + "learning_rate": 1.2542635849969972e-06, + "loss": 0.6257, + "step": 50989 + }, + { + "epoch": 1.31, + "learning_rate": 1.2542368238363608e-06, + "loss": 0.8135, + "step": 50990 + }, + { + "epoch": 1.31, + "learning_rate": 1.254210062481067e-06, + "loss": 0.6729, + "step": 50991 + }, + { + "epoch": 1.31, + "learning_rate": 1.2541833009311363e-06, + "loss": 0.6943, + "step": 50992 + }, + { + "epoch": 1.31, + "learning_rate": 1.254156539186589e-06, + "loss": 0.7646, + "step": 50993 + }, + { + "epoch": 1.31, + "learning_rate": 1.2541297772474462e-06, + "loss": 0.6641, + "step": 50994 + }, + { + "epoch": 1.31, + "learning_rate": 1.2541030151137273e-06, + "loss": 0.5991, + "step": 50995 + }, + { + "epoch": 1.31, + "learning_rate": 1.2540762527854539e-06, + "loss": 0.5466, + "step": 50996 + }, + { + "epoch": 1.31, + "learning_rate": 1.2540494902626458e-06, + "loss": 0.6289, + "step": 50997 + }, + { + "epoch": 1.31, + "learning_rate": 1.2540227275453234e-06, + "loss": 0.6592, + "step": 50998 + }, + { + "epoch": 1.31, + "learning_rate": 1.253995964633508e-06, + "loss": 0.7275, + "step": 50999 + }, + { + "epoch": 1.31, + "learning_rate": 1.253969201527219e-06, + "loss": 0.4639, + "step": 51000 + }, + { + "epoch": 1.31, + "learning_rate": 1.2539424382264777e-06, + "loss": 0.7148, + "step": 51001 + }, + { + "epoch": 1.31, + "learning_rate": 1.2539156747313046e-06, + "loss": 0.6873, + "step": 51002 + }, + { + "epoch": 1.31, + "learning_rate": 1.2538889110417196e-06, + "loss": 0.5999, + "step": 51003 + }, + { + "epoch": 1.31, + "learning_rate": 1.253862147157744e-06, + "loss": 0.5867, + "step": 51004 + }, + { + "epoch": 1.31, + "learning_rate": 1.2538353830793974e-06, + "loss": 0.6572, + "step": 51005 + }, + { + "epoch": 1.31, + "learning_rate": 1.2538086188067007e-06, + "loss": 0.709, + "step": 51006 + }, + { + "epoch": 1.31, + "learning_rate": 1.2537818543396746e-06, + "loss": 0.7598, + "step": 51007 + }, + { + "epoch": 1.31, + "learning_rate": 1.2537550896783393e-06, + "loss": 0.6016, + "step": 51008 + }, + { + "epoch": 1.31, + "learning_rate": 1.2537283248227155e-06, + "loss": 0.7676, + "step": 51009 + }, + { + "epoch": 1.31, + "learning_rate": 1.2537015597728238e-06, + "loss": 0.5947, + "step": 51010 + }, + { + "epoch": 1.31, + "learning_rate": 1.2536747945286839e-06, + "loss": 0.4133, + "step": 51011 + }, + { + "epoch": 1.31, + "learning_rate": 1.2536480290903172e-06, + "loss": 0.605, + "step": 51012 + }, + { + "epoch": 1.31, + "learning_rate": 1.253621263457744e-06, + "loss": 0.7246, + "step": 51013 + }, + { + "epoch": 1.31, + "learning_rate": 1.2535944976309847e-06, + "loss": 0.5793, + "step": 51014 + }, + { + "epoch": 1.31, + "learning_rate": 1.2535677316100595e-06, + "loss": 0.6592, + "step": 51015 + }, + { + "epoch": 1.31, + "learning_rate": 1.2535409653949892e-06, + "loss": 0.752, + "step": 51016 + }, + { + "epoch": 1.31, + "learning_rate": 1.253514198985794e-06, + "loss": 0.3582, + "step": 51017 + }, + { + "epoch": 1.31, + "learning_rate": 1.2534874323824952e-06, + "loss": 0.6396, + "step": 51018 + }, + { + "epoch": 1.31, + "learning_rate": 1.2534606655851122e-06, + "loss": 0.6934, + "step": 51019 + }, + { + "epoch": 1.31, + "learning_rate": 1.2534338985936664e-06, + "loss": 0.5317, + "step": 51020 + }, + { + "epoch": 1.31, + "learning_rate": 1.2534071314081778e-06, + "loss": 0.6157, + "step": 51021 + }, + { + "epoch": 1.31, + "learning_rate": 1.2533803640286666e-06, + "loss": 0.6689, + "step": 51022 + }, + { + "epoch": 1.31, + "learning_rate": 1.2533535964551542e-06, + "loss": 0.52, + "step": 51023 + }, + { + "epoch": 1.31, + "learning_rate": 1.2533268286876606e-06, + "loss": 0.7039, + "step": 51024 + }, + { + "epoch": 1.31, + "learning_rate": 1.2533000607262064e-06, + "loss": 0.8018, + "step": 51025 + }, + { + "epoch": 1.31, + "learning_rate": 1.2532732925708115e-06, + "loss": 0.7324, + "step": 51026 + }, + { + "epoch": 1.31, + "learning_rate": 1.2532465242214971e-06, + "loss": 0.5781, + "step": 51027 + }, + { + "epoch": 1.31, + "learning_rate": 1.2532197556782836e-06, + "loss": 0.8125, + "step": 51028 + }, + { + "epoch": 1.31, + "learning_rate": 1.2531929869411916e-06, + "loss": 0.7891, + "step": 51029 + }, + { + "epoch": 1.31, + "learning_rate": 1.2531662180102408e-06, + "loss": 0.7861, + "step": 51030 + }, + { + "epoch": 1.31, + "learning_rate": 1.2531394488854527e-06, + "loss": 0.5791, + "step": 51031 + }, + { + "epoch": 1.31, + "learning_rate": 1.253112679566847e-06, + "loss": 0.6709, + "step": 51032 + }, + { + "epoch": 1.31, + "learning_rate": 1.2530859100544448e-06, + "loss": 0.6182, + "step": 51033 + }, + { + "epoch": 1.31, + "learning_rate": 1.2530591403482666e-06, + "loss": 0.6211, + "step": 51034 + }, + { + "epoch": 1.31, + "learning_rate": 1.2530323704483322e-06, + "loss": 0.6367, + "step": 51035 + }, + { + "epoch": 1.31, + "learning_rate": 1.2530056003546627e-06, + "loss": 0.4634, + "step": 51036 + }, + { + "epoch": 1.31, + "learning_rate": 1.2529788300672785e-06, + "loss": 0.8945, + "step": 51037 + }, + { + "epoch": 1.31, + "learning_rate": 1.2529520595862e-06, + "loss": 0.6631, + "step": 51038 + }, + { + "epoch": 1.31, + "learning_rate": 1.2529252889114478e-06, + "loss": 0.5938, + "step": 51039 + }, + { + "epoch": 1.31, + "learning_rate": 1.2528985180430422e-06, + "loss": 0.7292, + "step": 51040 + }, + { + "epoch": 1.31, + "learning_rate": 1.2528717469810042e-06, + "loss": 0.5214, + "step": 51041 + }, + { + "epoch": 1.31, + "learning_rate": 1.2528449757253534e-06, + "loss": 0.7686, + "step": 51042 + }, + { + "epoch": 1.31, + "learning_rate": 1.2528182042761112e-06, + "loss": 0.6431, + "step": 51043 + }, + { + "epoch": 1.31, + "learning_rate": 1.2527914326332979e-06, + "loss": 0.4917, + "step": 51044 + }, + { + "epoch": 1.31, + "learning_rate": 1.252764660796933e-06, + "loss": 0.605, + "step": 51045 + }, + { + "epoch": 1.31, + "learning_rate": 1.2527378887670388e-06, + "loss": 0.6763, + "step": 51046 + }, + { + "epoch": 1.31, + "learning_rate": 1.2527111165436342e-06, + "loss": 0.4868, + "step": 51047 + }, + { + "epoch": 1.31, + "learning_rate": 1.2526843441267405e-06, + "loss": 0.34, + "step": 51048 + }, + { + "epoch": 1.31, + "learning_rate": 1.252657571516378e-06, + "loss": 0.5769, + "step": 51049 + }, + { + "epoch": 1.31, + "learning_rate": 1.2526307987125673e-06, + "loss": 0.7207, + "step": 51050 + }, + { + "epoch": 1.31, + "learning_rate": 1.2526040257153288e-06, + "loss": 0.6357, + "step": 51051 + }, + { + "epoch": 1.31, + "learning_rate": 1.2525772525246829e-06, + "loss": 0.7148, + "step": 51052 + }, + { + "epoch": 1.31, + "learning_rate": 1.25255047914065e-06, + "loss": 0.8545, + "step": 51053 + }, + { + "epoch": 1.31, + "learning_rate": 1.2525237055632513e-06, + "loss": 0.6406, + "step": 51054 + }, + { + "epoch": 1.31, + "learning_rate": 1.2524969317925065e-06, + "loss": 0.5552, + "step": 51055 + }, + { + "epoch": 1.31, + "learning_rate": 1.2524701578284367e-06, + "loss": 0.6592, + "step": 51056 + }, + { + "epoch": 1.31, + "learning_rate": 1.2524433836710616e-06, + "loss": 0.6982, + "step": 51057 + }, + { + "epoch": 1.31, + "learning_rate": 1.2524166093204028e-06, + "loss": 0.6826, + "step": 51058 + }, + { + "epoch": 1.31, + "learning_rate": 1.2523898347764798e-06, + "loss": 0.79, + "step": 51059 + }, + { + "epoch": 1.31, + "learning_rate": 1.2523630600393139e-06, + "loss": 0.6182, + "step": 51060 + }, + { + "epoch": 1.31, + "learning_rate": 1.2523362851089247e-06, + "loss": 0.6431, + "step": 51061 + }, + { + "epoch": 1.31, + "learning_rate": 1.2523095099853337e-06, + "loss": 0.7002, + "step": 51062 + }, + { + "epoch": 1.31, + "learning_rate": 1.2522827346685603e-06, + "loss": 0.626, + "step": 51063 + }, + { + "epoch": 1.31, + "learning_rate": 1.252255959158626e-06, + "loss": 0.3822, + "step": 51064 + }, + { + "epoch": 1.31, + "learning_rate": 1.252229183455551e-06, + "loss": 0.6431, + "step": 51065 + }, + { + "epoch": 1.31, + "learning_rate": 1.2522024075593556e-06, + "loss": 0.6338, + "step": 51066 + }, + { + "epoch": 1.31, + "learning_rate": 1.2521756314700604e-06, + "loss": 0.6104, + "step": 51067 + }, + { + "epoch": 1.31, + "learning_rate": 1.2521488551876857e-06, + "loss": 0.7539, + "step": 51068 + }, + { + "epoch": 1.31, + "learning_rate": 1.2521220787122525e-06, + "loss": 0.6665, + "step": 51069 + }, + { + "epoch": 1.31, + "learning_rate": 1.252095302043781e-06, + "loss": 0.7036, + "step": 51070 + }, + { + "epoch": 1.31, + "learning_rate": 1.2520685251822918e-06, + "loss": 0.5215, + "step": 51071 + }, + { + "epoch": 1.31, + "learning_rate": 1.252041748127805e-06, + "loss": 0.5435, + "step": 51072 + }, + { + "epoch": 1.31, + "learning_rate": 1.2520149708803418e-06, + "loss": 0.8154, + "step": 51073 + }, + { + "epoch": 1.31, + "learning_rate": 1.2519881934399221e-06, + "loss": 0.6904, + "step": 51074 + }, + { + "epoch": 1.31, + "learning_rate": 1.2519614158065667e-06, + "loss": 0.562, + "step": 51075 + }, + { + "epoch": 1.31, + "learning_rate": 1.251934637980296e-06, + "loss": 0.7246, + "step": 51076 + }, + { + "epoch": 1.31, + "learning_rate": 1.2519078599611307e-06, + "loss": 0.3274, + "step": 51077 + }, + { + "epoch": 1.31, + "learning_rate": 1.2518810817490906e-06, + "loss": 0.7217, + "step": 51078 + }, + { + "epoch": 1.31, + "learning_rate": 1.2518543033441975e-06, + "loss": 0.7539, + "step": 51079 + }, + { + "epoch": 1.31, + "learning_rate": 1.2518275247464704e-06, + "loss": 0.5037, + "step": 51080 + }, + { + "epoch": 1.31, + "learning_rate": 1.251800745955931e-06, + "loss": 0.5776, + "step": 51081 + }, + { + "epoch": 1.31, + "learning_rate": 1.2517739669725993e-06, + "loss": 0.6001, + "step": 51082 + }, + { + "epoch": 1.31, + "learning_rate": 1.2517471877964956e-06, + "loss": 0.623, + "step": 51083 + }, + { + "epoch": 1.31, + "learning_rate": 1.2517204084276412e-06, + "loss": 0.748, + "step": 51084 + }, + { + "epoch": 1.31, + "learning_rate": 1.2516936288660554e-06, + "loss": 0.6992, + "step": 51085 + }, + { + "epoch": 1.31, + "learning_rate": 1.2516668491117596e-06, + "loss": 0.5522, + "step": 51086 + }, + { + "epoch": 1.31, + "learning_rate": 1.2516400691647744e-06, + "loss": 0.5835, + "step": 51087 + }, + { + "epoch": 1.31, + "learning_rate": 1.2516132890251194e-06, + "loss": 0.6411, + "step": 51088 + }, + { + "epoch": 1.31, + "learning_rate": 1.2515865086928162e-06, + "loss": 0.626, + "step": 51089 + }, + { + "epoch": 1.31, + "learning_rate": 1.2515597281678845e-06, + "loss": 0.6699, + "step": 51090 + }, + { + "epoch": 1.31, + "learning_rate": 1.251532947450345e-06, + "loss": 0.7012, + "step": 51091 + }, + { + "epoch": 1.31, + "learning_rate": 1.2515061665402185e-06, + "loss": 0.7793, + "step": 51092 + }, + { + "epoch": 1.31, + "learning_rate": 1.251479385437525e-06, + "loss": 0.6514, + "step": 51093 + }, + { + "epoch": 1.31, + "learning_rate": 1.2514526041422859e-06, + "loss": 0.7441, + "step": 51094 + }, + { + "epoch": 1.31, + "learning_rate": 1.2514258226545204e-06, + "loss": 0.7017, + "step": 51095 + }, + { + "epoch": 1.31, + "learning_rate": 1.25139904097425e-06, + "loss": 0.7617, + "step": 51096 + }, + { + "epoch": 1.31, + "learning_rate": 1.2513722591014947e-06, + "loss": 0.6494, + "step": 51097 + }, + { + "epoch": 1.31, + "learning_rate": 1.2513454770362758e-06, + "loss": 0.7085, + "step": 51098 + }, + { + "epoch": 1.31, + "learning_rate": 1.251318694778613e-06, + "loss": 0.5645, + "step": 51099 + }, + { + "epoch": 1.31, + "learning_rate": 1.251291912328527e-06, + "loss": 0.4541, + "step": 51100 + }, + { + "epoch": 1.31, + "learning_rate": 1.2512651296860378e-06, + "loss": 0.7285, + "step": 51101 + }, + { + "epoch": 1.31, + "learning_rate": 1.251238346851167e-06, + "loss": 0.521, + "step": 51102 + }, + { + "epoch": 1.31, + "learning_rate": 1.2512115638239345e-06, + "loss": 0.6123, + "step": 51103 + }, + { + "epoch": 1.31, + "learning_rate": 1.251184780604361e-06, + "loss": 0.625, + "step": 51104 + }, + { + "epoch": 1.31, + "learning_rate": 1.2511579971924664e-06, + "loss": 0.6797, + "step": 51105 + }, + { + "epoch": 1.31, + "learning_rate": 1.251131213588272e-06, + "loss": 0.7061, + "step": 51106 + }, + { + "epoch": 1.31, + "learning_rate": 1.2511044297917978e-06, + "loss": 0.6885, + "step": 51107 + }, + { + "epoch": 1.31, + "learning_rate": 1.2510776458030648e-06, + "loss": 0.6875, + "step": 51108 + }, + { + "epoch": 1.31, + "learning_rate": 1.2510508616220929e-06, + "loss": 0.6211, + "step": 51109 + }, + { + "epoch": 1.31, + "learning_rate": 1.251024077248903e-06, + "loss": 0.6431, + "step": 51110 + }, + { + "epoch": 1.31, + "learning_rate": 1.2509972926835154e-06, + "loss": 0.668, + "step": 51111 + }, + { + "epoch": 1.31, + "learning_rate": 1.2509705079259508e-06, + "loss": 0.5649, + "step": 51112 + }, + { + "epoch": 1.31, + "learning_rate": 1.2509437229762296e-06, + "loss": 0.603, + "step": 51113 + }, + { + "epoch": 1.31, + "learning_rate": 1.2509169378343724e-06, + "loss": 0.7529, + "step": 51114 + }, + { + "epoch": 1.31, + "learning_rate": 1.2508901525003996e-06, + "loss": 0.6914, + "step": 51115 + }, + { + "epoch": 1.31, + "learning_rate": 1.2508633669743317e-06, + "loss": 0.6982, + "step": 51116 + }, + { + "epoch": 1.31, + "learning_rate": 1.2508365812561893e-06, + "loss": 0.6719, + "step": 51117 + }, + { + "epoch": 1.31, + "learning_rate": 1.2508097953459929e-06, + "loss": 0.6042, + "step": 51118 + }, + { + "epoch": 1.31, + "learning_rate": 1.250783009243763e-06, + "loss": 0.5728, + "step": 51119 + }, + { + "epoch": 1.31, + "learning_rate": 1.2507562229495199e-06, + "loss": 0.6904, + "step": 51120 + }, + { + "epoch": 1.31, + "learning_rate": 1.2507294364632845e-06, + "loss": 0.6992, + "step": 51121 + }, + { + "epoch": 1.31, + "learning_rate": 1.2507026497850769e-06, + "loss": 0.7217, + "step": 51122 + }, + { + "epoch": 1.31, + "learning_rate": 1.2506758629149178e-06, + "loss": 0.6323, + "step": 51123 + }, + { + "epoch": 1.31, + "learning_rate": 1.2506490758528281e-06, + "loss": 0.6729, + "step": 51124 + }, + { + "epoch": 1.31, + "learning_rate": 1.2506222885988278e-06, + "loss": 0.7832, + "step": 51125 + }, + { + "epoch": 1.31, + "learning_rate": 1.250595501152937e-06, + "loss": 0.5483, + "step": 51126 + }, + { + "epoch": 1.31, + "learning_rate": 1.2505687135151771e-06, + "loss": 0.4705, + "step": 51127 + }, + { + "epoch": 1.31, + "learning_rate": 1.2505419256855682e-06, + "loss": 0.7793, + "step": 51128 + }, + { + "epoch": 1.31, + "learning_rate": 1.250515137664131e-06, + "loss": 0.7217, + "step": 51129 + }, + { + "epoch": 1.31, + "learning_rate": 1.2504883494508861e-06, + "loss": 0.5432, + "step": 51130 + }, + { + "epoch": 1.31, + "learning_rate": 1.2504615610458536e-06, + "loss": 0.6895, + "step": 51131 + }, + { + "epoch": 1.31, + "learning_rate": 1.250434772449054e-06, + "loss": 0.6843, + "step": 51132 + }, + { + "epoch": 1.31, + "learning_rate": 1.2504079836605082e-06, + "loss": 0.7705, + "step": 51133 + }, + { + "epoch": 1.31, + "learning_rate": 1.2503811946802366e-06, + "loss": 0.7568, + "step": 51134 + }, + { + "epoch": 1.31, + "learning_rate": 1.2503544055082594e-06, + "loss": 0.7168, + "step": 51135 + }, + { + "epoch": 1.31, + "learning_rate": 1.2503276161445976e-06, + "loss": 0.6001, + "step": 51136 + }, + { + "epoch": 1.31, + "learning_rate": 1.250300826589271e-06, + "loss": 0.5425, + "step": 51137 + }, + { + "epoch": 1.31, + "learning_rate": 1.2502740368423007e-06, + "loss": 0.4839, + "step": 51138 + }, + { + "epoch": 1.31, + "learning_rate": 1.2502472469037075e-06, + "loss": 0.7278, + "step": 51139 + }, + { + "epoch": 1.31, + "learning_rate": 1.2502204567735113e-06, + "loss": 0.7622, + "step": 51140 + }, + { + "epoch": 1.31, + "learning_rate": 1.2501936664517324e-06, + "loss": 0.3378, + "step": 51141 + }, + { + "epoch": 1.31, + "learning_rate": 1.2501668759383924e-06, + "loss": 0.832, + "step": 51142 + }, + { + "epoch": 1.31, + "learning_rate": 1.2501400852335104e-06, + "loss": 0.5518, + "step": 51143 + }, + { + "epoch": 1.31, + "learning_rate": 1.2501132943371082e-06, + "loss": 0.626, + "step": 51144 + }, + { + "epoch": 1.31, + "learning_rate": 1.2500865032492055e-06, + "loss": 0.6895, + "step": 51145 + }, + { + "epoch": 1.31, + "learning_rate": 1.2500597119698233e-06, + "loss": 0.5996, + "step": 51146 + }, + { + "epoch": 1.31, + "learning_rate": 1.2500329204989815e-06, + "loss": 0.425, + "step": 51147 + }, + { + "epoch": 1.31, + "learning_rate": 1.2500061288367011e-06, + "loss": 0.7715, + "step": 51148 + }, + { + "epoch": 1.31, + "learning_rate": 1.2499793369830028e-06, + "loss": 0.624, + "step": 51149 + }, + { + "epoch": 1.31, + "learning_rate": 1.2499525449379068e-06, + "loss": 0.686, + "step": 51150 + }, + { + "epoch": 1.31, + "learning_rate": 1.249925752701433e-06, + "loss": 0.6372, + "step": 51151 + }, + { + "epoch": 1.31, + "learning_rate": 1.2498989602736032e-06, + "loss": 0.6377, + "step": 51152 + }, + { + "epoch": 1.31, + "learning_rate": 1.2498721676544367e-06, + "loss": 0.668, + "step": 51153 + }, + { + "epoch": 1.31, + "learning_rate": 1.2498453748439552e-06, + "loss": 0.7822, + "step": 51154 + }, + { + "epoch": 1.31, + "learning_rate": 1.2498185818421782e-06, + "loss": 0.4944, + "step": 51155 + }, + { + "epoch": 1.31, + "learning_rate": 1.2497917886491266e-06, + "loss": 0.645, + "step": 51156 + }, + { + "epoch": 1.31, + "learning_rate": 1.249764995264821e-06, + "loss": 0.5229, + "step": 51157 + }, + { + "epoch": 1.31, + "learning_rate": 1.2497382016892818e-06, + "loss": 0.7632, + "step": 51158 + }, + { + "epoch": 1.31, + "learning_rate": 1.24971140792253e-06, + "loss": 0.4893, + "step": 51159 + }, + { + "epoch": 1.31, + "learning_rate": 1.2496846139645849e-06, + "loss": 0.6191, + "step": 51160 + }, + { + "epoch": 1.31, + "learning_rate": 1.2496578198154681e-06, + "loss": 0.4551, + "step": 51161 + }, + { + "epoch": 1.31, + "learning_rate": 1.2496310254751997e-06, + "loss": 0.7959, + "step": 51162 + }, + { + "epoch": 1.31, + "learning_rate": 1.2496042309438007e-06, + "loss": 0.6592, + "step": 51163 + }, + { + "epoch": 1.31, + "learning_rate": 1.2495774362212907e-06, + "loss": 0.7539, + "step": 51164 + }, + { + "epoch": 1.31, + "learning_rate": 1.2495506413076911e-06, + "loss": 0.3979, + "step": 51165 + }, + { + "epoch": 1.31, + "learning_rate": 1.2495238462030217e-06, + "loss": 0.5103, + "step": 51166 + }, + { + "epoch": 1.31, + "learning_rate": 1.2494970509073037e-06, + "loss": 0.4592, + "step": 51167 + }, + { + "epoch": 1.31, + "learning_rate": 1.249470255420557e-06, + "loss": 0.8022, + "step": 51168 + }, + { + "epoch": 1.31, + "learning_rate": 1.2494434597428028e-06, + "loss": 0.6277, + "step": 51169 + }, + { + "epoch": 1.31, + "learning_rate": 1.249416663874061e-06, + "loss": 0.5474, + "step": 51170 + }, + { + "epoch": 1.31, + "learning_rate": 1.2493898678143521e-06, + "loss": 0.6611, + "step": 51171 + }, + { + "epoch": 1.31, + "learning_rate": 1.2493630715636969e-06, + "loss": 0.6074, + "step": 51172 + }, + { + "epoch": 1.31, + "learning_rate": 1.2493362751221161e-06, + "loss": 0.4633, + "step": 51173 + }, + { + "epoch": 1.31, + "learning_rate": 1.2493094784896299e-06, + "loss": 0.6152, + "step": 51174 + }, + { + "epoch": 1.31, + "learning_rate": 1.2492826816662588e-06, + "loss": 0.5752, + "step": 51175 + }, + { + "epoch": 1.31, + "learning_rate": 1.2492558846520234e-06, + "loss": 0.4756, + "step": 51176 + }, + { + "epoch": 1.31, + "learning_rate": 1.2492290874469443e-06, + "loss": 0.6045, + "step": 51177 + }, + { + "epoch": 1.31, + "learning_rate": 1.2492022900510419e-06, + "loss": 0.5752, + "step": 51178 + }, + { + "epoch": 1.31, + "learning_rate": 1.249175492464337e-06, + "loss": 0.266, + "step": 51179 + }, + { + "epoch": 1.31, + "learning_rate": 1.2491486946868498e-06, + "loss": 0.7666, + "step": 51180 + }, + { + "epoch": 1.31, + "learning_rate": 1.2491218967186004e-06, + "loss": 0.7314, + "step": 51181 + }, + { + "epoch": 1.31, + "learning_rate": 1.2490950985596104e-06, + "loss": 0.5315, + "step": 51182 + }, + { + "epoch": 1.31, + "learning_rate": 1.2490683002098995e-06, + "loss": 0.7754, + "step": 51183 + }, + { + "epoch": 1.31, + "learning_rate": 1.2490415016694886e-06, + "loss": 0.8027, + "step": 51184 + }, + { + "epoch": 1.31, + "learning_rate": 1.249014702938398e-06, + "loss": 0.6279, + "step": 51185 + }, + { + "epoch": 1.31, + "learning_rate": 1.2489879040166482e-06, + "loss": 0.6084, + "step": 51186 + }, + { + "epoch": 1.31, + "learning_rate": 1.2489611049042597e-06, + "loss": 0.7607, + "step": 51187 + }, + { + "epoch": 1.31, + "learning_rate": 1.2489343056012533e-06, + "loss": 0.7078, + "step": 51188 + }, + { + "epoch": 1.31, + "learning_rate": 1.2489075061076496e-06, + "loss": 0.6724, + "step": 51189 + }, + { + "epoch": 1.31, + "learning_rate": 1.2488807064234685e-06, + "loss": 0.3514, + "step": 51190 + }, + { + "epoch": 1.31, + "learning_rate": 1.248853906548731e-06, + "loss": 0.7705, + "step": 51191 + }, + { + "epoch": 1.31, + "learning_rate": 1.2488271064834575e-06, + "loss": 0.7451, + "step": 51192 + }, + { + "epoch": 1.31, + "learning_rate": 1.2488003062276683e-06, + "loss": 0.5742, + "step": 51193 + }, + { + "epoch": 1.31, + "learning_rate": 1.2487735057813849e-06, + "loss": 0.6592, + "step": 51194 + }, + { + "epoch": 1.31, + "learning_rate": 1.2487467051446263e-06, + "loss": 0.7593, + "step": 51195 + }, + { + "epoch": 1.31, + "learning_rate": 1.2487199043174142e-06, + "loss": 0.5234, + "step": 51196 + }, + { + "epoch": 1.31, + "learning_rate": 1.2486931032997682e-06, + "loss": 0.7051, + "step": 51197 + }, + { + "epoch": 1.31, + "learning_rate": 1.24866630209171e-06, + "loss": 0.7148, + "step": 51198 + }, + { + "epoch": 1.31, + "learning_rate": 1.2486395006932591e-06, + "loss": 0.6113, + "step": 51199 + }, + { + "epoch": 1.31, + "learning_rate": 1.2486126991044362e-06, + "loss": 0.5952, + "step": 51200 + }, + { + "epoch": 1.31, + "learning_rate": 1.2485858973252623e-06, + "loss": 0.7373, + "step": 51201 + }, + { + "epoch": 1.31, + "learning_rate": 1.2485590953557572e-06, + "loss": 0.6914, + "step": 51202 + }, + { + "epoch": 1.31, + "learning_rate": 1.2485322931959424e-06, + "loss": 0.7217, + "step": 51203 + }, + { + "epoch": 1.31, + "learning_rate": 1.2485054908458374e-06, + "loss": 0.6826, + "step": 51204 + }, + { + "epoch": 1.31, + "learning_rate": 1.2484786883054633e-06, + "loss": 0.5371, + "step": 51205 + }, + { + "epoch": 1.31, + "learning_rate": 1.2484518855748407e-06, + "loss": 0.6465, + "step": 51206 + }, + { + "epoch": 1.31, + "learning_rate": 1.2484250826539898e-06, + "loss": 0.6592, + "step": 51207 + }, + { + "epoch": 1.31, + "learning_rate": 1.248398279542931e-06, + "loss": 0.584, + "step": 51208 + }, + { + "epoch": 1.31, + "learning_rate": 1.2483714762416855e-06, + "loss": 0.7861, + "step": 51209 + }, + { + "epoch": 1.31, + "learning_rate": 1.2483446727502728e-06, + "loss": 0.644, + "step": 51210 + }, + { + "epoch": 1.31, + "learning_rate": 1.2483178690687146e-06, + "loss": 0.6016, + "step": 51211 + }, + { + "epoch": 1.31, + "learning_rate": 1.2482910651970305e-06, + "loss": 0.6943, + "step": 51212 + }, + { + "epoch": 1.31, + "learning_rate": 1.2482642611352411e-06, + "loss": 0.5315, + "step": 51213 + }, + { + "epoch": 1.31, + "learning_rate": 1.2482374568833678e-06, + "loss": 0.6205, + "step": 51214 + }, + { + "epoch": 1.31, + "learning_rate": 1.2482106524414302e-06, + "loss": 0.6765, + "step": 51215 + }, + { + "epoch": 1.31, + "learning_rate": 1.2481838478094487e-06, + "loss": 0.4043, + "step": 51216 + }, + { + "epoch": 1.31, + "learning_rate": 1.2481570429874447e-06, + "loss": 0.5939, + "step": 51217 + }, + { + "epoch": 1.31, + "learning_rate": 1.2481302379754381e-06, + "loss": 0.6436, + "step": 51218 + }, + { + "epoch": 1.31, + "learning_rate": 1.2481034327734498e-06, + "loss": 0.7832, + "step": 51219 + }, + { + "epoch": 1.31, + "learning_rate": 1.2480766273815002e-06, + "loss": 0.5859, + "step": 51220 + }, + { + "epoch": 1.31, + "learning_rate": 1.2480498217996096e-06, + "loss": 0.75, + "step": 51221 + }, + { + "epoch": 1.31, + "learning_rate": 1.2480230160277981e-06, + "loss": 0.5251, + "step": 51222 + }, + { + "epoch": 1.31, + "learning_rate": 1.2479962100660874e-06, + "loss": 0.4683, + "step": 51223 + }, + { + "epoch": 1.31, + "learning_rate": 1.2479694039144975e-06, + "loss": 0.6572, + "step": 51224 + }, + { + "epoch": 1.31, + "learning_rate": 1.2479425975730485e-06, + "loss": 0.6299, + "step": 51225 + }, + { + "epoch": 1.31, + "learning_rate": 1.2479157910417612e-06, + "loss": 0.7788, + "step": 51226 + }, + { + "epoch": 1.31, + "learning_rate": 1.2478889843206562e-06, + "loss": 0.752, + "step": 51227 + }, + { + "epoch": 1.31, + "learning_rate": 1.2478621774097542e-06, + "loss": 0.4456, + "step": 51228 + }, + { + "epoch": 1.31, + "learning_rate": 1.2478353703090757e-06, + "loss": 0.7559, + "step": 51229 + }, + { + "epoch": 1.31, + "learning_rate": 1.2478085630186408e-06, + "loss": 0.5879, + "step": 51230 + }, + { + "epoch": 1.31, + "learning_rate": 1.24778175553847e-06, + "loss": 0.5234, + "step": 51231 + }, + { + "epoch": 1.31, + "learning_rate": 1.2477549478685845e-06, + "loss": 0.7979, + "step": 51232 + }, + { + "epoch": 1.31, + "learning_rate": 1.2477281400090043e-06, + "loss": 0.7305, + "step": 51233 + }, + { + "epoch": 1.31, + "learning_rate": 1.2477013319597502e-06, + "loss": 0.5022, + "step": 51234 + }, + { + "epoch": 1.31, + "learning_rate": 1.2476745237208423e-06, + "loss": 0.6064, + "step": 51235 + }, + { + "epoch": 1.31, + "learning_rate": 1.2476477152923014e-06, + "loss": 0.5781, + "step": 51236 + }, + { + "epoch": 1.31, + "learning_rate": 1.2476209066741484e-06, + "loss": 0.5308, + "step": 51237 + }, + { + "epoch": 1.31, + "learning_rate": 1.2475940978664033e-06, + "loss": 0.4844, + "step": 51238 + }, + { + "epoch": 1.31, + "learning_rate": 1.2475672888690868e-06, + "loss": 0.5132, + "step": 51239 + }, + { + "epoch": 1.31, + "learning_rate": 1.2475404796822193e-06, + "loss": 0.5605, + "step": 51240 + }, + { + "epoch": 1.31, + "learning_rate": 1.2475136703058214e-06, + "loss": 0.668, + "step": 51241 + }, + { + "epoch": 1.31, + "learning_rate": 1.2474868607399137e-06, + "loss": 0.6123, + "step": 51242 + }, + { + "epoch": 1.31, + "learning_rate": 1.2474600509845166e-06, + "loss": 0.5571, + "step": 51243 + }, + { + "epoch": 1.31, + "learning_rate": 1.2474332410396508e-06, + "loss": 0.6439, + "step": 51244 + }, + { + "epoch": 1.31, + "learning_rate": 1.247406430905337e-06, + "loss": 0.6675, + "step": 51245 + }, + { + "epoch": 1.31, + "learning_rate": 1.247379620581595e-06, + "loss": 0.6699, + "step": 51246 + }, + { + "epoch": 1.31, + "learning_rate": 1.247352810068446e-06, + "loss": 0.624, + "step": 51247 + }, + { + "epoch": 1.31, + "learning_rate": 1.2473259993659105e-06, + "loss": 0.5854, + "step": 51248 + }, + { + "epoch": 1.31, + "learning_rate": 1.2472991884740089e-06, + "loss": 0.5913, + "step": 51249 + }, + { + "epoch": 1.31, + "learning_rate": 1.2472723773927613e-06, + "loss": 0.6577, + "step": 51250 + }, + { + "epoch": 1.31, + "learning_rate": 1.247245566122189e-06, + "loss": 0.6196, + "step": 51251 + }, + { + "epoch": 1.31, + "learning_rate": 1.247218754662312e-06, + "loss": 0.6797, + "step": 51252 + }, + { + "epoch": 1.31, + "learning_rate": 1.2471919430131508e-06, + "loss": 0.6152, + "step": 51253 + }, + { + "epoch": 1.31, + "learning_rate": 1.2471651311747263e-06, + "loss": 0.7363, + "step": 51254 + }, + { + "epoch": 1.31, + "learning_rate": 1.2471383191470588e-06, + "loss": 0.6196, + "step": 51255 + }, + { + "epoch": 1.31, + "learning_rate": 1.2471115069301687e-06, + "loss": 0.6289, + "step": 51256 + }, + { + "epoch": 1.31, + "learning_rate": 1.247084694524077e-06, + "loss": 0.5747, + "step": 51257 + }, + { + "epoch": 1.31, + "learning_rate": 1.2470578819288033e-06, + "loss": 0.5942, + "step": 51258 + }, + { + "epoch": 1.31, + "learning_rate": 1.2470310691443696e-06, + "loss": 0.6514, + "step": 51259 + }, + { + "epoch": 1.31, + "learning_rate": 1.247004256170795e-06, + "loss": 0.6494, + "step": 51260 + }, + { + "epoch": 1.31, + "learning_rate": 1.2469774430081005e-06, + "loss": 0.6689, + "step": 51261 + }, + { + "epoch": 1.31, + "learning_rate": 1.246950629656307e-06, + "loss": 0.7197, + "step": 51262 + }, + { + "epoch": 1.31, + "learning_rate": 1.2469238161154348e-06, + "loss": 0.8047, + "step": 51263 + }, + { + "epoch": 1.31, + "learning_rate": 1.2468970023855044e-06, + "loss": 0.7627, + "step": 51264 + }, + { + "epoch": 1.31, + "learning_rate": 1.246870188466536e-06, + "loss": 0.6519, + "step": 51265 + }, + { + "epoch": 1.31, + "learning_rate": 1.2468433743585506e-06, + "loss": 0.4253, + "step": 51266 + }, + { + "epoch": 1.31, + "learning_rate": 1.2468165600615687e-06, + "loss": 0.6831, + "step": 51267 + }, + { + "epoch": 1.31, + "learning_rate": 1.2467897455756106e-06, + "loss": 0.6025, + "step": 51268 + }, + { + "epoch": 1.31, + "learning_rate": 1.2467629309006968e-06, + "loss": 0.4841, + "step": 51269 + }, + { + "epoch": 1.31, + "learning_rate": 1.2467361160368483e-06, + "loss": 0.7612, + "step": 51270 + }, + { + "epoch": 1.31, + "learning_rate": 1.246709300984085e-06, + "loss": 0.5791, + "step": 51271 + }, + { + "epoch": 1.31, + "learning_rate": 1.2466824857424281e-06, + "loss": 0.6709, + "step": 51272 + }, + { + "epoch": 1.31, + "learning_rate": 1.2466556703118976e-06, + "loss": 0.7305, + "step": 51273 + }, + { + "epoch": 1.31, + "learning_rate": 1.2466288546925141e-06, + "loss": 0.6514, + "step": 51274 + }, + { + "epoch": 1.31, + "learning_rate": 1.2466020388842982e-06, + "loss": 0.6914, + "step": 51275 + }, + { + "epoch": 1.31, + "learning_rate": 1.2465752228872706e-06, + "loss": 0.5811, + "step": 51276 + }, + { + "epoch": 1.31, + "learning_rate": 1.2465484067014514e-06, + "loss": 0.5259, + "step": 51277 + }, + { + "epoch": 1.31, + "learning_rate": 1.246521590326862e-06, + "loss": 0.7783, + "step": 51278 + }, + { + "epoch": 1.31, + "learning_rate": 1.2464947737635219e-06, + "loss": 0.6416, + "step": 51279 + }, + { + "epoch": 1.31, + "learning_rate": 1.246467957011452e-06, + "loss": 0.7559, + "step": 51280 + }, + { + "epoch": 1.31, + "learning_rate": 1.2464411400706732e-06, + "loss": 0.4675, + "step": 51281 + }, + { + "epoch": 1.31, + "learning_rate": 1.2464143229412053e-06, + "loss": 0.4624, + "step": 51282 + }, + { + "epoch": 1.31, + "learning_rate": 1.24638750562307e-06, + "loss": 0.6431, + "step": 51283 + }, + { + "epoch": 1.31, + "learning_rate": 1.2463606881162868e-06, + "loss": 0.8027, + "step": 51284 + }, + { + "epoch": 1.31, + "learning_rate": 1.2463338704208764e-06, + "loss": 0.6289, + "step": 51285 + }, + { + "epoch": 1.31, + "learning_rate": 1.2463070525368594e-06, + "loss": 0.7046, + "step": 51286 + }, + { + "epoch": 1.31, + "learning_rate": 1.2462802344642566e-06, + "loss": 0.752, + "step": 51287 + }, + { + "epoch": 1.31, + "learning_rate": 1.2462534162030885e-06, + "loss": 0.5752, + "step": 51288 + }, + { + "epoch": 1.31, + "learning_rate": 1.2462265977533753e-06, + "loss": 0.8662, + "step": 51289 + }, + { + "epoch": 1.31, + "learning_rate": 1.2461997791151376e-06, + "loss": 0.7246, + "step": 51290 + }, + { + "epoch": 1.31, + "learning_rate": 1.246172960288396e-06, + "loss": 0.7148, + "step": 51291 + }, + { + "epoch": 1.31, + "learning_rate": 1.2461461412731713e-06, + "loss": 0.7871, + "step": 51292 + }, + { + "epoch": 1.31, + "learning_rate": 1.246119322069484e-06, + "loss": 0.7354, + "step": 51293 + }, + { + "epoch": 1.31, + "learning_rate": 1.2460925026773542e-06, + "loss": 0.6904, + "step": 51294 + }, + { + "epoch": 1.31, + "learning_rate": 1.2460656830968029e-06, + "loss": 0.625, + "step": 51295 + }, + { + "epoch": 1.31, + "learning_rate": 1.24603886332785e-06, + "loss": 0.5781, + "step": 51296 + }, + { + "epoch": 1.31, + "learning_rate": 1.2460120433705167e-06, + "loss": 0.6172, + "step": 51297 + }, + { + "epoch": 1.31, + "learning_rate": 1.2459852232248234e-06, + "loss": 0.5444, + "step": 51298 + }, + { + "epoch": 1.31, + "learning_rate": 1.2459584028907903e-06, + "loss": 0.7139, + "step": 51299 + }, + { + "epoch": 1.31, + "learning_rate": 1.2459315823684382e-06, + "loss": 0.6143, + "step": 51300 + }, + { + "epoch": 1.31, + "learning_rate": 1.2459047616577878e-06, + "loss": 0.6309, + "step": 51301 + }, + { + "epoch": 1.31, + "learning_rate": 1.2458779407588592e-06, + "loss": 0.5161, + "step": 51302 + }, + { + "epoch": 1.31, + "learning_rate": 1.2458511196716734e-06, + "loss": 0.446, + "step": 51303 + }, + { + "epoch": 1.31, + "learning_rate": 1.2458242983962505e-06, + "loss": 0.5433, + "step": 51304 + }, + { + "epoch": 1.31, + "learning_rate": 1.2457974769326114e-06, + "loss": 0.7578, + "step": 51305 + }, + { + "epoch": 1.31, + "learning_rate": 1.2457706552807763e-06, + "loss": 0.5645, + "step": 51306 + }, + { + "epoch": 1.32, + "learning_rate": 1.245743833440766e-06, + "loss": 0.707, + "step": 51307 + }, + { + "epoch": 1.32, + "learning_rate": 1.245717011412601e-06, + "loss": 0.5664, + "step": 51308 + }, + { + "epoch": 1.32, + "learning_rate": 1.2456901891963017e-06, + "loss": 0.6875, + "step": 51309 + }, + { + "epoch": 1.32, + "learning_rate": 1.2456633667918889e-06, + "loss": 0.7212, + "step": 51310 + }, + { + "epoch": 1.32, + "learning_rate": 1.2456365441993826e-06, + "loss": 0.4624, + "step": 51311 + }, + { + "epoch": 1.32, + "learning_rate": 1.2456097214188038e-06, + "loss": 0.6958, + "step": 51312 + }, + { + "epoch": 1.32, + "learning_rate": 1.245582898450173e-06, + "loss": 0.7119, + "step": 51313 + }, + { + "epoch": 1.32, + "learning_rate": 1.2455560752935109e-06, + "loss": 0.6733, + "step": 51314 + }, + { + "epoch": 1.32, + "learning_rate": 1.2455292519488373e-06, + "loss": 0.6313, + "step": 51315 + }, + { + "epoch": 1.32, + "learning_rate": 1.2455024284161736e-06, + "loss": 0.5364, + "step": 51316 + }, + { + "epoch": 1.32, + "learning_rate": 1.2454756046955398e-06, + "loss": 0.7578, + "step": 51317 + }, + { + "epoch": 1.32, + "learning_rate": 1.2454487807869572e-06, + "loss": 0.6338, + "step": 51318 + }, + { + "epoch": 1.32, + "learning_rate": 1.245421956690445e-06, + "loss": 0.709, + "step": 51319 + }, + { + "epoch": 1.32, + "learning_rate": 1.2453951324060247e-06, + "loss": 0.7197, + "step": 51320 + }, + { + "epoch": 1.32, + "learning_rate": 1.2453683079337167e-06, + "loss": 0.5542, + "step": 51321 + }, + { + "epoch": 1.32, + "learning_rate": 1.2453414832735417e-06, + "loss": 0.6689, + "step": 51322 + }, + { + "epoch": 1.32, + "learning_rate": 1.2453146584255197e-06, + "loss": 0.6362, + "step": 51323 + }, + { + "epoch": 1.32, + "learning_rate": 1.2452878333896718e-06, + "loss": 0.5752, + "step": 51324 + }, + { + "epoch": 1.32, + "learning_rate": 1.2452610081660178e-06, + "loss": 0.7051, + "step": 51325 + }, + { + "epoch": 1.32, + "learning_rate": 1.2452341827545792e-06, + "loss": 0.7012, + "step": 51326 + }, + { + "epoch": 1.32, + "learning_rate": 1.2452073571553756e-06, + "loss": 0.563, + "step": 51327 + }, + { + "epoch": 1.32, + "learning_rate": 1.2451805313684286e-06, + "loss": 0.7036, + "step": 51328 + }, + { + "epoch": 1.32, + "learning_rate": 1.2451537053937577e-06, + "loss": 0.6943, + "step": 51329 + }, + { + "epoch": 1.32, + "learning_rate": 1.2451268792313843e-06, + "loss": 0.6846, + "step": 51330 + }, + { + "epoch": 1.32, + "learning_rate": 1.245100052881328e-06, + "loss": 0.7446, + "step": 51331 + }, + { + "epoch": 1.32, + "learning_rate": 1.2450732263436102e-06, + "loss": 0.6116, + "step": 51332 + }, + { + "epoch": 1.32, + "learning_rate": 1.245046399618251e-06, + "loss": 0.7432, + "step": 51333 + }, + { + "epoch": 1.32, + "learning_rate": 1.2450195727052708e-06, + "loss": 0.6338, + "step": 51334 + }, + { + "epoch": 1.32, + "learning_rate": 1.2449927456046907e-06, + "loss": 0.606, + "step": 51335 + }, + { + "epoch": 1.32, + "learning_rate": 1.2449659183165309e-06, + "loss": 0.748, + "step": 51336 + }, + { + "epoch": 1.32, + "learning_rate": 1.2449390908408118e-06, + "loss": 0.5378, + "step": 51337 + }, + { + "epoch": 1.32, + "learning_rate": 1.2449122631775545e-06, + "loss": 0.5757, + "step": 51338 + }, + { + "epoch": 1.32, + "learning_rate": 1.2448854353267789e-06, + "loss": 0.606, + "step": 51339 + }, + { + "epoch": 1.32, + "learning_rate": 1.2448586072885054e-06, + "loss": 0.7373, + "step": 51340 + }, + { + "epoch": 1.32, + "learning_rate": 1.2448317790627553e-06, + "loss": 0.5503, + "step": 51341 + }, + { + "epoch": 1.32, + "learning_rate": 1.2448049506495486e-06, + "loss": 0.7656, + "step": 51342 + }, + { + "epoch": 1.32, + "learning_rate": 1.2447781220489064e-06, + "loss": 0.6992, + "step": 51343 + }, + { + "epoch": 1.32, + "learning_rate": 1.2447512932608484e-06, + "loss": 0.7012, + "step": 51344 + }, + { + "epoch": 1.32, + "learning_rate": 1.2447244642853958e-06, + "loss": 0.668, + "step": 51345 + }, + { + "epoch": 1.32, + "learning_rate": 1.2446976351225685e-06, + "loss": 0.7339, + "step": 51346 + }, + { + "epoch": 1.32, + "learning_rate": 1.2446708057723882e-06, + "loss": 0.5015, + "step": 51347 + }, + { + "epoch": 1.32, + "learning_rate": 1.2446439762348744e-06, + "loss": 0.6016, + "step": 51348 + }, + { + "epoch": 1.32, + "learning_rate": 1.244617146510048e-06, + "loss": 0.4619, + "step": 51349 + }, + { + "epoch": 1.32, + "learning_rate": 1.2445903165979292e-06, + "loss": 0.6123, + "step": 51350 + }, + { + "epoch": 1.32, + "learning_rate": 1.2445634864985393e-06, + "loss": 0.6763, + "step": 51351 + }, + { + "epoch": 1.32, + "learning_rate": 1.2445366562118979e-06, + "loss": 0.582, + "step": 51352 + }, + { + "epoch": 1.32, + "learning_rate": 1.2445098257380264e-06, + "loss": 0.6724, + "step": 51353 + }, + { + "epoch": 1.32, + "learning_rate": 1.2444829950769448e-06, + "loss": 0.79, + "step": 51354 + }, + { + "epoch": 1.32, + "learning_rate": 1.2444561642286738e-06, + "loss": 0.4578, + "step": 51355 + }, + { + "epoch": 1.32, + "learning_rate": 1.2444293331932342e-06, + "loss": 0.6973, + "step": 51356 + }, + { + "epoch": 1.32, + "learning_rate": 1.2444025019706461e-06, + "loss": 0.8447, + "step": 51357 + }, + { + "epoch": 1.32, + "learning_rate": 1.2443756705609304e-06, + "loss": 0.3235, + "step": 51358 + }, + { + "epoch": 1.32, + "learning_rate": 1.244348838964107e-06, + "loss": 0.5938, + "step": 51359 + }, + { + "epoch": 1.32, + "learning_rate": 1.2443220071801974e-06, + "loss": 0.5444, + "step": 51360 + }, + { + "epoch": 1.32, + "learning_rate": 1.2442951752092214e-06, + "loss": 0.5522, + "step": 51361 + }, + { + "epoch": 1.32, + "learning_rate": 1.2442683430512e-06, + "loss": 0.6367, + "step": 51362 + }, + { + "epoch": 1.32, + "learning_rate": 1.2442415107061537e-06, + "loss": 0.7754, + "step": 51363 + }, + { + "epoch": 1.32, + "learning_rate": 1.2442146781741027e-06, + "loss": 0.6543, + "step": 51364 + }, + { + "epoch": 1.32, + "learning_rate": 1.2441878454550675e-06, + "loss": 0.4639, + "step": 51365 + }, + { + "epoch": 1.32, + "learning_rate": 1.2441610125490693e-06, + "loss": 0.5352, + "step": 51366 + }, + { + "epoch": 1.32, + "learning_rate": 1.244134179456128e-06, + "loss": 0.7422, + "step": 51367 + }, + { + "epoch": 1.32, + "learning_rate": 1.2441073461762649e-06, + "loss": 0.6406, + "step": 51368 + }, + { + "epoch": 1.32, + "learning_rate": 1.2440805127094993e-06, + "loss": 0.5933, + "step": 51369 + }, + { + "epoch": 1.32, + "learning_rate": 1.2440536790558528e-06, + "loss": 0.5627, + "step": 51370 + }, + { + "epoch": 1.32, + "learning_rate": 1.2440268452153456e-06, + "loss": 0.6289, + "step": 51371 + }, + { + "epoch": 1.32, + "learning_rate": 1.2440000111879983e-06, + "loss": 0.6172, + "step": 51372 + }, + { + "epoch": 1.32, + "learning_rate": 1.2439731769738316e-06, + "loss": 0.6797, + "step": 51373 + }, + { + "epoch": 1.32, + "learning_rate": 1.2439463425728656e-06, + "loss": 0.5037, + "step": 51374 + }, + { + "epoch": 1.32, + "learning_rate": 1.2439195079851211e-06, + "loss": 0.5479, + "step": 51375 + }, + { + "epoch": 1.32, + "learning_rate": 1.2438926732106188e-06, + "loss": 0.4956, + "step": 51376 + }, + { + "epoch": 1.32, + "learning_rate": 1.2438658382493788e-06, + "loss": 0.573, + "step": 51377 + }, + { + "epoch": 1.32, + "learning_rate": 1.243839003101422e-06, + "loss": 0.6855, + "step": 51378 + }, + { + "epoch": 1.32, + "learning_rate": 1.2438121677667692e-06, + "loss": 0.7383, + "step": 51379 + }, + { + "epoch": 1.32, + "learning_rate": 1.2437853322454403e-06, + "loss": 0.7832, + "step": 51380 + }, + { + "epoch": 1.32, + "learning_rate": 1.2437584965374567e-06, + "loss": 0.5247, + "step": 51381 + }, + { + "epoch": 1.32, + "learning_rate": 1.2437316606428376e-06, + "loss": 0.688, + "step": 51382 + }, + { + "epoch": 1.32, + "learning_rate": 1.2437048245616053e-06, + "loss": 0.6104, + "step": 51383 + }, + { + "epoch": 1.32, + "learning_rate": 1.2436779882937786e-06, + "loss": 0.6631, + "step": 51384 + }, + { + "epoch": 1.32, + "learning_rate": 1.2436511518393796e-06, + "loss": 0.5151, + "step": 51385 + }, + { + "epoch": 1.32, + "learning_rate": 1.2436243151984275e-06, + "loss": 0.3661, + "step": 51386 + }, + { + "epoch": 1.32, + "learning_rate": 1.2435974783709437e-06, + "loss": 0.7695, + "step": 51387 + }, + { + "epoch": 1.32, + "learning_rate": 1.2435706413569487e-06, + "loss": 0.6392, + "step": 51388 + }, + { + "epoch": 1.32, + "learning_rate": 1.2435438041564628e-06, + "loss": 0.7119, + "step": 51389 + }, + { + "epoch": 1.32, + "learning_rate": 1.2435169667695063e-06, + "loss": 0.416, + "step": 51390 + }, + { + "epoch": 1.32, + "learning_rate": 1.2434901291961001e-06, + "loss": 0.667, + "step": 51391 + }, + { + "epoch": 1.32, + "learning_rate": 1.243463291436265e-06, + "loss": 0.7871, + "step": 51392 + }, + { + "epoch": 1.32, + "learning_rate": 1.2434364534900213e-06, + "loss": 0.4519, + "step": 51393 + }, + { + "epoch": 1.32, + "learning_rate": 1.2434096153573891e-06, + "loss": 0.6797, + "step": 51394 + }, + { + "epoch": 1.32, + "learning_rate": 1.2433827770383896e-06, + "loss": 0.6499, + "step": 51395 + }, + { + "epoch": 1.32, + "learning_rate": 1.243355938533043e-06, + "loss": 0.6143, + "step": 51396 + }, + { + "epoch": 1.32, + "learning_rate": 1.24332909984137e-06, + "loss": 0.6104, + "step": 51397 + }, + { + "epoch": 1.32, + "learning_rate": 1.243302260963391e-06, + "loss": 0.814, + "step": 51398 + }, + { + "epoch": 1.32, + "learning_rate": 1.2432754218991269e-06, + "loss": 0.6475, + "step": 51399 + }, + { + "epoch": 1.32, + "learning_rate": 1.2432485826485978e-06, + "loss": 0.7529, + "step": 51400 + }, + { + "epoch": 1.32, + "learning_rate": 1.2432217432118243e-06, + "loss": 0.5707, + "step": 51401 + }, + { + "epoch": 1.32, + "learning_rate": 1.2431949035888273e-06, + "loss": 0.7246, + "step": 51402 + }, + { + "epoch": 1.32, + "learning_rate": 1.2431680637796272e-06, + "loss": 0.7803, + "step": 51403 + }, + { + "epoch": 1.32, + "learning_rate": 1.2431412237842444e-06, + "loss": 0.6958, + "step": 51404 + }, + { + "epoch": 1.32, + "learning_rate": 1.2431143836026995e-06, + "loss": 0.8662, + "step": 51405 + }, + { + "epoch": 1.32, + "learning_rate": 1.2430875432350131e-06, + "loss": 0.71, + "step": 51406 + }, + { + "epoch": 1.32, + "learning_rate": 1.2430607026812059e-06, + "loss": 0.7832, + "step": 51407 + }, + { + "epoch": 1.32, + "learning_rate": 1.2430338619412983e-06, + "loss": 0.6699, + "step": 51408 + }, + { + "epoch": 1.32, + "learning_rate": 1.2430070210153107e-06, + "loss": 0.7236, + "step": 51409 + }, + { + "epoch": 1.32, + "learning_rate": 1.242980179903264e-06, + "loss": 0.5288, + "step": 51410 + }, + { + "epoch": 1.32, + "learning_rate": 1.2429533386051783e-06, + "loss": 0.563, + "step": 51411 + }, + { + "epoch": 1.32, + "learning_rate": 1.2429264971210745e-06, + "loss": 0.5854, + "step": 51412 + }, + { + "epoch": 1.32, + "learning_rate": 1.242899655450973e-06, + "loss": 0.7168, + "step": 51413 + }, + { + "epoch": 1.32, + "learning_rate": 1.2428728135948945e-06, + "loss": 0.637, + "step": 51414 + }, + { + "epoch": 1.32, + "learning_rate": 1.2428459715528594e-06, + "loss": 0.6082, + "step": 51415 + }, + { + "epoch": 1.32, + "learning_rate": 1.2428191293248884e-06, + "loss": 0.7002, + "step": 51416 + }, + { + "epoch": 1.32, + "learning_rate": 1.2427922869110017e-06, + "loss": 0.6899, + "step": 51417 + }, + { + "epoch": 1.32, + "learning_rate": 1.2427654443112202e-06, + "loss": 0.7529, + "step": 51418 + }, + { + "epoch": 1.32, + "learning_rate": 1.2427386015255646e-06, + "loss": 0.7744, + "step": 51419 + }, + { + "epoch": 1.32, + "learning_rate": 1.2427117585540551e-06, + "loss": 0.5957, + "step": 51420 + }, + { + "epoch": 1.32, + "learning_rate": 1.2426849153967123e-06, + "loss": 0.6348, + "step": 51421 + }, + { + "epoch": 1.32, + "learning_rate": 1.242658072053557e-06, + "loss": 0.7402, + "step": 51422 + }, + { + "epoch": 1.32, + "learning_rate": 1.2426312285246092e-06, + "loss": 0.8174, + "step": 51423 + }, + { + "epoch": 1.32, + "learning_rate": 1.24260438480989e-06, + "loss": 0.5542, + "step": 51424 + }, + { + "epoch": 1.32, + "learning_rate": 1.24257754090942e-06, + "loss": 0.7334, + "step": 51425 + }, + { + "epoch": 1.32, + "learning_rate": 1.242550696823219e-06, + "loss": 0.4849, + "step": 51426 + }, + { + "epoch": 1.32, + "learning_rate": 1.2425238525513084e-06, + "loss": 0.6104, + "step": 51427 + }, + { + "epoch": 1.32, + "learning_rate": 1.2424970080937086e-06, + "loss": 0.6562, + "step": 51428 + }, + { + "epoch": 1.32, + "learning_rate": 1.2424701634504399e-06, + "loss": 0.6279, + "step": 51429 + }, + { + "epoch": 1.32, + "learning_rate": 1.2424433186215229e-06, + "loss": 0.502, + "step": 51430 + }, + { + "epoch": 1.32, + "learning_rate": 1.2424164736069782e-06, + "loss": 0.6074, + "step": 51431 + }, + { + "epoch": 1.32, + "learning_rate": 1.2423896284068263e-06, + "loss": 0.668, + "step": 51432 + }, + { + "epoch": 1.32, + "learning_rate": 1.242362783021088e-06, + "loss": 0.6191, + "step": 51433 + }, + { + "epoch": 1.32, + "learning_rate": 1.2423359374497836e-06, + "loss": 0.6514, + "step": 51434 + }, + { + "epoch": 1.32, + "learning_rate": 1.2423090916929335e-06, + "loss": 0.5923, + "step": 51435 + }, + { + "epoch": 1.32, + "learning_rate": 1.2422822457505585e-06, + "loss": 0.7246, + "step": 51436 + }, + { + "epoch": 1.32, + "learning_rate": 1.2422553996226792e-06, + "loss": 0.5557, + "step": 51437 + }, + { + "epoch": 1.32, + "learning_rate": 1.2422285533093162e-06, + "loss": 0.5356, + "step": 51438 + }, + { + "epoch": 1.32, + "learning_rate": 1.24220170681049e-06, + "loss": 0.6108, + "step": 51439 + }, + { + "epoch": 1.32, + "learning_rate": 1.2421748601262208e-06, + "loss": 0.593, + "step": 51440 + }, + { + "epoch": 1.32, + "learning_rate": 1.2421480132565296e-06, + "loss": 0.5503, + "step": 51441 + }, + { + "epoch": 1.32, + "learning_rate": 1.2421211662014366e-06, + "loss": 0.9531, + "step": 51442 + }, + { + "epoch": 1.32, + "learning_rate": 1.242094318960963e-06, + "loss": 0.7471, + "step": 51443 + }, + { + "epoch": 1.32, + "learning_rate": 1.2420674715351287e-06, + "loss": 0.7534, + "step": 51444 + }, + { + "epoch": 1.32, + "learning_rate": 1.2420406239239541e-06, + "loss": 0.6111, + "step": 51445 + }, + { + "epoch": 1.32, + "learning_rate": 1.2420137761274606e-06, + "loss": 0.5789, + "step": 51446 + }, + { + "epoch": 1.32, + "learning_rate": 1.241986928145668e-06, + "loss": 0.5347, + "step": 51447 + }, + { + "epoch": 1.32, + "learning_rate": 1.2419600799785973e-06, + "loss": 0.6924, + "step": 51448 + }, + { + "epoch": 1.32, + "learning_rate": 1.241933231626269e-06, + "loss": 0.6201, + "step": 51449 + }, + { + "epoch": 1.32, + "learning_rate": 1.2419063830887033e-06, + "loss": 0.6992, + "step": 51450 + }, + { + "epoch": 1.32, + "learning_rate": 1.241879534365921e-06, + "loss": 0.75, + "step": 51451 + }, + { + "epoch": 1.32, + "learning_rate": 1.2418526854579428e-06, + "loss": 0.793, + "step": 51452 + }, + { + "epoch": 1.32, + "learning_rate": 1.2418258363647892e-06, + "loss": 0.793, + "step": 51453 + }, + { + "epoch": 1.32, + "learning_rate": 1.2417989870864807e-06, + "loss": 0.5591, + "step": 51454 + }, + { + "epoch": 1.32, + "learning_rate": 1.2417721376230374e-06, + "loss": 0.7275, + "step": 51455 + }, + { + "epoch": 1.32, + "learning_rate": 1.2417452879744807e-06, + "loss": 0.4626, + "step": 51456 + }, + { + "epoch": 1.32, + "learning_rate": 1.2417184381408305e-06, + "loss": 0.7427, + "step": 51457 + }, + { + "epoch": 1.32, + "learning_rate": 1.241691588122108e-06, + "loss": 0.6055, + "step": 51458 + }, + { + "epoch": 1.32, + "learning_rate": 1.241664737918333e-06, + "loss": 0.6382, + "step": 51459 + }, + { + "epoch": 1.32, + "learning_rate": 1.2416378875295267e-06, + "loss": 0.7075, + "step": 51460 + }, + { + "epoch": 1.32, + "learning_rate": 1.2416110369557089e-06, + "loss": 0.7744, + "step": 51461 + }, + { + "epoch": 1.32, + "learning_rate": 1.241584186196901e-06, + "loss": 0.7217, + "step": 51462 + }, + { + "epoch": 1.32, + "learning_rate": 1.2415573352531233e-06, + "loss": 0.5659, + "step": 51463 + }, + { + "epoch": 1.32, + "learning_rate": 1.241530484124396e-06, + "loss": 0.7822, + "step": 51464 + }, + { + "epoch": 1.32, + "learning_rate": 1.24150363281074e-06, + "loss": 0.7529, + "step": 51465 + }, + { + "epoch": 1.32, + "learning_rate": 1.2414767813121757e-06, + "loss": 0.7939, + "step": 51466 + }, + { + "epoch": 1.32, + "learning_rate": 1.2414499296287238e-06, + "loss": 0.4503, + "step": 51467 + }, + { + "epoch": 1.32, + "learning_rate": 1.2414230777604048e-06, + "loss": 0.6123, + "step": 51468 + }, + { + "epoch": 1.32, + "learning_rate": 1.2413962257072395e-06, + "loss": 0.6006, + "step": 51469 + }, + { + "epoch": 1.32, + "learning_rate": 1.2413693734692476e-06, + "loss": 0.5166, + "step": 51470 + }, + { + "epoch": 1.32, + "learning_rate": 1.2413425210464507e-06, + "loss": 0.6372, + "step": 51471 + }, + { + "epoch": 1.32, + "learning_rate": 1.241315668438869e-06, + "loss": 0.7197, + "step": 51472 + }, + { + "epoch": 1.32, + "learning_rate": 1.2412888156465232e-06, + "loss": 0.4402, + "step": 51473 + }, + { + "epoch": 1.32, + "learning_rate": 1.241261962669433e-06, + "loss": 0.6255, + "step": 51474 + }, + { + "epoch": 1.32, + "learning_rate": 1.24123510950762e-06, + "loss": 0.5332, + "step": 51475 + }, + { + "epoch": 1.32, + "learning_rate": 1.2412082561611041e-06, + "loss": 0.6553, + "step": 51476 + }, + { + "epoch": 1.32, + "learning_rate": 1.2411814026299064e-06, + "loss": 0.6343, + "step": 51477 + }, + { + "epoch": 1.32, + "learning_rate": 1.2411545489140472e-06, + "loss": 0.5964, + "step": 51478 + }, + { + "epoch": 1.32, + "learning_rate": 1.241127695013547e-06, + "loss": 0.4475, + "step": 51479 + }, + { + "epoch": 1.32, + "learning_rate": 1.2411008409284262e-06, + "loss": 0.8018, + "step": 51480 + }, + { + "epoch": 1.32, + "learning_rate": 1.241073986658706e-06, + "loss": 0.6494, + "step": 51481 + }, + { + "epoch": 1.32, + "learning_rate": 1.241047132204406e-06, + "loss": 0.6533, + "step": 51482 + }, + { + "epoch": 1.32, + "learning_rate": 1.2410202775655478e-06, + "loss": 0.6626, + "step": 51483 + }, + { + "epoch": 1.32, + "learning_rate": 1.240993422742151e-06, + "loss": 0.573, + "step": 51484 + }, + { + "epoch": 1.32, + "learning_rate": 1.240966567734237e-06, + "loss": 0.6714, + "step": 51485 + }, + { + "epoch": 1.32, + "learning_rate": 1.2409397125418255e-06, + "loss": 0.6431, + "step": 51486 + }, + { + "epoch": 1.32, + "learning_rate": 1.240912857164938e-06, + "loss": 0.792, + "step": 51487 + }, + { + "epoch": 1.32, + "learning_rate": 1.2408860016035944e-06, + "loss": 0.6768, + "step": 51488 + }, + { + "epoch": 1.32, + "learning_rate": 1.2408591458578154e-06, + "loss": 0.4924, + "step": 51489 + }, + { + "epoch": 1.32, + "learning_rate": 1.240832289927622e-06, + "loss": 0.7832, + "step": 51490 + }, + { + "epoch": 1.32, + "learning_rate": 1.240805433813034e-06, + "loss": 0.7173, + "step": 51491 + }, + { + "epoch": 1.32, + "learning_rate": 1.2407785775140725e-06, + "loss": 0.6309, + "step": 51492 + }, + { + "epoch": 1.32, + "learning_rate": 1.240751721030758e-06, + "loss": 0.6953, + "step": 51493 + }, + { + "epoch": 1.32, + "learning_rate": 1.240724864363111e-06, + "loss": 0.6836, + "step": 51494 + }, + { + "epoch": 1.32, + "learning_rate": 1.2406980075111517e-06, + "loss": 0.4932, + "step": 51495 + }, + { + "epoch": 1.32, + "learning_rate": 1.2406711504749013e-06, + "loss": 0.7119, + "step": 51496 + }, + { + "epoch": 1.32, + "learning_rate": 1.24064429325438e-06, + "loss": 0.6875, + "step": 51497 + }, + { + "epoch": 1.32, + "learning_rate": 1.2406174358496086e-06, + "loss": 0.4922, + "step": 51498 + }, + { + "epoch": 1.32, + "learning_rate": 1.2405905782606072e-06, + "loss": 0.8066, + "step": 51499 + }, + { + "epoch": 1.32, + "learning_rate": 1.2405637204873967e-06, + "loss": 0.4535, + "step": 51500 + }, + { + "epoch": 1.32, + "learning_rate": 1.2405368625299977e-06, + "loss": 0.667, + "step": 51501 + }, + { + "epoch": 1.32, + "learning_rate": 1.2405100043884308e-06, + "loss": 0.5518, + "step": 51502 + }, + { + "epoch": 1.32, + "learning_rate": 1.2404831460627163e-06, + "loss": 0.6465, + "step": 51503 + }, + { + "epoch": 1.32, + "learning_rate": 1.240456287552875e-06, + "loss": 0.6377, + "step": 51504 + }, + { + "epoch": 1.32, + "learning_rate": 1.2404294288589272e-06, + "loss": 0.5913, + "step": 51505 + }, + { + "epoch": 1.32, + "learning_rate": 1.2404025699808937e-06, + "loss": 0.6699, + "step": 51506 + }, + { + "epoch": 1.32, + "learning_rate": 1.2403757109187948e-06, + "loss": 0.7402, + "step": 51507 + }, + { + "epoch": 1.32, + "learning_rate": 1.2403488516726518e-06, + "loss": 0.5615, + "step": 51508 + }, + { + "epoch": 1.32, + "learning_rate": 1.2403219922424845e-06, + "loss": 0.6406, + "step": 51509 + }, + { + "epoch": 1.32, + "learning_rate": 1.2402951326283137e-06, + "loss": 0.623, + "step": 51510 + }, + { + "epoch": 1.32, + "learning_rate": 1.24026827283016e-06, + "loss": 0.5122, + "step": 51511 + }, + { + "epoch": 1.32, + "learning_rate": 1.2402414128480438e-06, + "loss": 0.6985, + "step": 51512 + }, + { + "epoch": 1.32, + "learning_rate": 1.2402145526819859e-06, + "loss": 0.8213, + "step": 51513 + }, + { + "epoch": 1.32, + "learning_rate": 1.2401876923320067e-06, + "loss": 0.6572, + "step": 51514 + }, + { + "epoch": 1.32, + "learning_rate": 1.2401608317981269e-06, + "loss": 0.5596, + "step": 51515 + }, + { + "epoch": 1.32, + "learning_rate": 1.2401339710803666e-06, + "loss": 0.6216, + "step": 51516 + }, + { + "epoch": 1.32, + "learning_rate": 1.2401071101787472e-06, + "loss": 0.458, + "step": 51517 + }, + { + "epoch": 1.32, + "learning_rate": 1.2400802490932888e-06, + "loss": 0.2642, + "step": 51518 + }, + { + "epoch": 1.32, + "learning_rate": 1.240053387824012e-06, + "loss": 0.8389, + "step": 51519 + }, + { + "epoch": 1.32, + "learning_rate": 1.2400265263709374e-06, + "loss": 0.5579, + "step": 51520 + }, + { + "epoch": 1.32, + "learning_rate": 1.2399996647340854e-06, + "loss": 0.6973, + "step": 51521 + }, + { + "epoch": 1.32, + "learning_rate": 1.2399728029134765e-06, + "loss": 0.5464, + "step": 51522 + }, + { + "epoch": 1.32, + "learning_rate": 1.2399459409091319e-06, + "loss": 0.6934, + "step": 51523 + }, + { + "epoch": 1.32, + "learning_rate": 1.2399190787210715e-06, + "loss": 0.8115, + "step": 51524 + }, + { + "epoch": 1.32, + "learning_rate": 1.2398922163493159e-06, + "loss": 0.7295, + "step": 51525 + }, + { + "epoch": 1.32, + "learning_rate": 1.239865353793886e-06, + "loss": 0.7451, + "step": 51526 + }, + { + "epoch": 1.32, + "learning_rate": 1.2398384910548023e-06, + "loss": 0.6367, + "step": 51527 + }, + { + "epoch": 1.32, + "learning_rate": 1.2398116281320855e-06, + "loss": 0.7871, + "step": 51528 + }, + { + "epoch": 1.32, + "learning_rate": 1.2397847650257558e-06, + "loss": 0.6384, + "step": 51529 + }, + { + "epoch": 1.32, + "learning_rate": 1.2397579017358337e-06, + "loss": 0.4697, + "step": 51530 + }, + { + "epoch": 1.32, + "learning_rate": 1.2397310382623402e-06, + "loss": 0.6479, + "step": 51531 + }, + { + "epoch": 1.32, + "learning_rate": 1.2397041746052953e-06, + "loss": 0.5708, + "step": 51532 + }, + { + "epoch": 1.32, + "learning_rate": 1.2396773107647204e-06, + "loss": 0.5825, + "step": 51533 + }, + { + "epoch": 1.32, + "learning_rate": 1.2396504467406356e-06, + "loss": 0.6213, + "step": 51534 + }, + { + "epoch": 1.32, + "learning_rate": 1.2396235825330613e-06, + "loss": 0.7998, + "step": 51535 + }, + { + "epoch": 1.32, + "learning_rate": 1.2395967181420183e-06, + "loss": 0.7422, + "step": 51536 + }, + { + "epoch": 1.32, + "learning_rate": 1.2395698535675273e-06, + "loss": 0.5571, + "step": 51537 + }, + { + "epoch": 1.32, + "learning_rate": 1.2395429888096083e-06, + "loss": 0.8027, + "step": 51538 + }, + { + "epoch": 1.32, + "learning_rate": 1.2395161238682823e-06, + "loss": 0.5688, + "step": 51539 + }, + { + "epoch": 1.32, + "learning_rate": 1.2394892587435701e-06, + "loss": 0.6436, + "step": 51540 + }, + { + "epoch": 1.32, + "learning_rate": 1.2394623934354918e-06, + "loss": 0.5181, + "step": 51541 + }, + { + "epoch": 1.32, + "learning_rate": 1.239435527944068e-06, + "loss": 0.5088, + "step": 51542 + }, + { + "epoch": 1.32, + "learning_rate": 1.2394086622693199e-06, + "loss": 0.5093, + "step": 51543 + }, + { + "epoch": 1.32, + "learning_rate": 1.239381796411267e-06, + "loss": 0.6309, + "step": 51544 + }, + { + "epoch": 1.32, + "learning_rate": 1.239354930369931e-06, + "loss": 0.5581, + "step": 51545 + }, + { + "epoch": 1.32, + "learning_rate": 1.2393280641453317e-06, + "loss": 0.6875, + "step": 51546 + }, + { + "epoch": 1.32, + "learning_rate": 1.2393011977374897e-06, + "loss": 0.7207, + "step": 51547 + }, + { + "epoch": 1.32, + "learning_rate": 1.2392743311464263e-06, + "loss": 0.791, + "step": 51548 + }, + { + "epoch": 1.32, + "learning_rate": 1.239247464372161e-06, + "loss": 0.6514, + "step": 51549 + }, + { + "epoch": 1.32, + "learning_rate": 1.2392205974147152e-06, + "loss": 0.4048, + "step": 51550 + }, + { + "epoch": 1.32, + "learning_rate": 1.2391937302741088e-06, + "loss": 0.6353, + "step": 51551 + }, + { + "epoch": 1.32, + "learning_rate": 1.2391668629503633e-06, + "loss": 0.6133, + "step": 51552 + }, + { + "epoch": 1.32, + "learning_rate": 1.2391399954434987e-06, + "loss": 0.6465, + "step": 51553 + }, + { + "epoch": 1.32, + "learning_rate": 1.2391131277535353e-06, + "loss": 0.5796, + "step": 51554 + }, + { + "epoch": 1.32, + "learning_rate": 1.239086259880494e-06, + "loss": 0.7139, + "step": 51555 + }, + { + "epoch": 1.32, + "learning_rate": 1.2390593918243957e-06, + "loss": 0.7285, + "step": 51556 + }, + { + "epoch": 1.32, + "learning_rate": 1.2390325235852602e-06, + "loss": 0.7471, + "step": 51557 + }, + { + "epoch": 1.32, + "learning_rate": 1.2390056551631087e-06, + "loss": 0.7666, + "step": 51558 + }, + { + "epoch": 1.32, + "learning_rate": 1.2389787865579616e-06, + "loss": 0.6689, + "step": 51559 + }, + { + "epoch": 1.32, + "learning_rate": 1.2389519177698391e-06, + "loss": 0.6484, + "step": 51560 + }, + { + "epoch": 1.32, + "learning_rate": 1.2389250487987624e-06, + "loss": 0.6406, + "step": 51561 + }, + { + "epoch": 1.32, + "learning_rate": 1.2388981796447517e-06, + "loss": 0.8379, + "step": 51562 + }, + { + "epoch": 1.32, + "learning_rate": 1.2388713103078279e-06, + "loss": 0.7061, + "step": 51563 + }, + { + "epoch": 1.32, + "learning_rate": 1.2388444407880108e-06, + "loss": 0.6116, + "step": 51564 + }, + { + "epoch": 1.32, + "learning_rate": 1.2388175710853218e-06, + "loss": 0.7593, + "step": 51565 + }, + { + "epoch": 1.32, + "learning_rate": 1.2387907011997811e-06, + "loss": 0.5311, + "step": 51566 + }, + { + "epoch": 1.32, + "learning_rate": 1.2387638311314096e-06, + "loss": 0.8506, + "step": 51567 + }, + { + "epoch": 1.32, + "learning_rate": 1.2387369608802275e-06, + "loss": 0.7031, + "step": 51568 + }, + { + "epoch": 1.32, + "learning_rate": 1.2387100904462554e-06, + "loss": 0.7207, + "step": 51569 + }, + { + "epoch": 1.32, + "learning_rate": 1.2386832198295137e-06, + "loss": 0.708, + "step": 51570 + }, + { + "epoch": 1.32, + "learning_rate": 1.2386563490300238e-06, + "loss": 0.7129, + "step": 51571 + }, + { + "epoch": 1.32, + "learning_rate": 1.2386294780478054e-06, + "loss": 0.708, + "step": 51572 + }, + { + "epoch": 1.32, + "learning_rate": 1.2386026068828792e-06, + "loss": 0.6709, + "step": 51573 + }, + { + "epoch": 1.32, + "learning_rate": 1.238575735535266e-06, + "loss": 0.6758, + "step": 51574 + }, + { + "epoch": 1.32, + "learning_rate": 1.2385488640049866e-06, + "loss": 0.7266, + "step": 51575 + }, + { + "epoch": 1.32, + "learning_rate": 1.2385219922920608e-06, + "loss": 0.7505, + "step": 51576 + }, + { + "epoch": 1.32, + "learning_rate": 1.2384951203965105e-06, + "loss": 0.7393, + "step": 51577 + }, + { + "epoch": 1.32, + "learning_rate": 1.2384682483183549e-06, + "loss": 0.6294, + "step": 51578 + }, + { + "epoch": 1.32, + "learning_rate": 1.2384413760576152e-06, + "loss": 0.6738, + "step": 51579 + }, + { + "epoch": 1.32, + "learning_rate": 1.238414503614312e-06, + "loss": 0.5791, + "step": 51580 + }, + { + "epoch": 1.32, + "learning_rate": 1.2383876309884653e-06, + "loss": 0.6855, + "step": 51581 + }, + { + "epoch": 1.32, + "learning_rate": 1.238360758180097e-06, + "loss": 0.8916, + "step": 51582 + }, + { + "epoch": 1.32, + "learning_rate": 1.2383338851892262e-06, + "loss": 0.5635, + "step": 51583 + }, + { + "epoch": 1.32, + "learning_rate": 1.2383070120158743e-06, + "loss": 0.7207, + "step": 51584 + }, + { + "epoch": 1.32, + "learning_rate": 1.2382801386600615e-06, + "loss": 0.5361, + "step": 51585 + }, + { + "epoch": 1.32, + "learning_rate": 1.2382532651218087e-06, + "loss": 0.7332, + "step": 51586 + }, + { + "epoch": 1.32, + "learning_rate": 1.2382263914011364e-06, + "loss": 0.5366, + "step": 51587 + }, + { + "epoch": 1.32, + "learning_rate": 1.238199517498065e-06, + "loss": 0.7485, + "step": 51588 + }, + { + "epoch": 1.32, + "learning_rate": 1.2381726434126152e-06, + "loss": 0.6377, + "step": 51589 + }, + { + "epoch": 1.32, + "learning_rate": 1.2381457691448077e-06, + "loss": 0.6343, + "step": 51590 + }, + { + "epoch": 1.32, + "learning_rate": 1.2381188946946627e-06, + "loss": 0.6211, + "step": 51591 + }, + { + "epoch": 1.32, + "learning_rate": 1.2380920200622013e-06, + "loss": 0.4485, + "step": 51592 + }, + { + "epoch": 1.32, + "learning_rate": 1.2380651452474435e-06, + "loss": 0.7393, + "step": 51593 + }, + { + "epoch": 1.32, + "learning_rate": 1.2380382702504104e-06, + "loss": 0.4858, + "step": 51594 + }, + { + "epoch": 1.32, + "learning_rate": 1.2380113950711222e-06, + "loss": 0.5029, + "step": 51595 + }, + { + "epoch": 1.32, + "learning_rate": 1.2379845197095996e-06, + "loss": 0.4689, + "step": 51596 + }, + { + "epoch": 1.32, + "learning_rate": 1.2379576441658634e-06, + "loss": 0.5076, + "step": 51597 + }, + { + "epoch": 1.32, + "learning_rate": 1.2379307684399335e-06, + "loss": 0.7891, + "step": 51598 + }, + { + "epoch": 1.32, + "learning_rate": 1.2379038925318314e-06, + "loss": 0.4154, + "step": 51599 + }, + { + "epoch": 1.32, + "learning_rate": 1.2378770164415772e-06, + "loss": 0.7896, + "step": 51600 + }, + { + "epoch": 1.32, + "learning_rate": 1.2378501401691912e-06, + "loss": 0.6514, + "step": 51601 + }, + { + "epoch": 1.32, + "learning_rate": 1.2378232637146947e-06, + "loss": 0.7559, + "step": 51602 + }, + { + "epoch": 1.32, + "learning_rate": 1.2377963870781076e-06, + "loss": 0.6367, + "step": 51603 + }, + { + "epoch": 1.32, + "learning_rate": 1.2377695102594508e-06, + "loss": 0.6455, + "step": 51604 + }, + { + "epoch": 1.32, + "learning_rate": 1.2377426332587448e-06, + "loss": 0.8008, + "step": 51605 + }, + { + "epoch": 1.32, + "learning_rate": 1.23771575607601e-06, + "loss": 0.7178, + "step": 51606 + }, + { + "epoch": 1.32, + "learning_rate": 1.2376888787112677e-06, + "loss": 0.6768, + "step": 51607 + }, + { + "epoch": 1.32, + "learning_rate": 1.2376620011645376e-06, + "loss": 0.7549, + "step": 51608 + }, + { + "epoch": 1.32, + "learning_rate": 1.2376351234358406e-06, + "loss": 0.5552, + "step": 51609 + }, + { + "epoch": 1.32, + "learning_rate": 1.2376082455251972e-06, + "loss": 0.6294, + "step": 51610 + }, + { + "epoch": 1.32, + "learning_rate": 1.2375813674326283e-06, + "loss": 0.5825, + "step": 51611 + }, + { + "epoch": 1.32, + "learning_rate": 1.2375544891581544e-06, + "loss": 0.7012, + "step": 51612 + }, + { + "epoch": 1.32, + "learning_rate": 1.2375276107017958e-06, + "loss": 0.5776, + "step": 51613 + }, + { + "epoch": 1.32, + "learning_rate": 1.2375007320635731e-06, + "loss": 0.5349, + "step": 51614 + }, + { + "epoch": 1.32, + "learning_rate": 1.237473853243507e-06, + "loss": 0.6357, + "step": 51615 + }, + { + "epoch": 1.32, + "learning_rate": 1.2374469742416182e-06, + "loss": 0.729, + "step": 51616 + }, + { + "epoch": 1.32, + "learning_rate": 1.2374200950579277e-06, + "loss": 0.6626, + "step": 51617 + }, + { + "epoch": 1.32, + "learning_rate": 1.237393215692455e-06, + "loss": 0.6826, + "step": 51618 + }, + { + "epoch": 1.32, + "learning_rate": 1.2373663361452211e-06, + "loss": 0.6365, + "step": 51619 + }, + { + "epoch": 1.32, + "learning_rate": 1.237339456416247e-06, + "loss": 0.6172, + "step": 51620 + }, + { + "epoch": 1.32, + "learning_rate": 1.2373125765055528e-06, + "loss": 0.6021, + "step": 51621 + }, + { + "epoch": 1.32, + "learning_rate": 1.2372856964131596e-06, + "loss": 0.791, + "step": 51622 + }, + { + "epoch": 1.32, + "learning_rate": 1.2372588161390871e-06, + "loss": 0.8066, + "step": 51623 + }, + { + "epoch": 1.32, + "learning_rate": 1.2372319356833566e-06, + "loss": 0.6562, + "step": 51624 + }, + { + "epoch": 1.32, + "learning_rate": 1.2372050550459888e-06, + "loss": 0.5859, + "step": 51625 + }, + { + "epoch": 1.32, + "learning_rate": 1.2371781742270038e-06, + "loss": 0.6553, + "step": 51626 + }, + { + "epoch": 1.32, + "learning_rate": 1.2371512932264225e-06, + "loss": 0.7021, + "step": 51627 + }, + { + "epoch": 1.32, + "learning_rate": 1.2371244120442653e-06, + "loss": 0.6865, + "step": 51628 + }, + { + "epoch": 1.32, + "learning_rate": 1.2370975306805528e-06, + "loss": 0.5908, + "step": 51629 + }, + { + "epoch": 1.32, + "learning_rate": 1.2370706491353056e-06, + "loss": 0.6582, + "step": 51630 + }, + { + "epoch": 1.32, + "learning_rate": 1.2370437674085443e-06, + "loss": 0.6963, + "step": 51631 + }, + { + "epoch": 1.32, + "learning_rate": 1.2370168855002898e-06, + "loss": 0.697, + "step": 51632 + }, + { + "epoch": 1.32, + "learning_rate": 1.236990003410562e-06, + "loss": 0.5049, + "step": 51633 + }, + { + "epoch": 1.32, + "learning_rate": 1.2369631211393822e-06, + "loss": 0.645, + "step": 51634 + }, + { + "epoch": 1.32, + "learning_rate": 1.2369362386867702e-06, + "loss": 0.5796, + "step": 51635 + }, + { + "epoch": 1.32, + "learning_rate": 1.236909356052747e-06, + "loss": 0.4384, + "step": 51636 + }, + { + "epoch": 1.32, + "learning_rate": 1.2368824732373336e-06, + "loss": 0.6826, + "step": 51637 + }, + { + "epoch": 1.32, + "learning_rate": 1.23685559024055e-06, + "loss": 0.498, + "step": 51638 + }, + { + "epoch": 1.32, + "learning_rate": 1.2368287070624168e-06, + "loss": 0.446, + "step": 51639 + }, + { + "epoch": 1.32, + "learning_rate": 1.2368018237029549e-06, + "loss": 0.6353, + "step": 51640 + }, + { + "epoch": 1.32, + "learning_rate": 1.2367749401621847e-06, + "loss": 0.708, + "step": 51641 + }, + { + "epoch": 1.32, + "learning_rate": 1.236748056440127e-06, + "loss": 0.5427, + "step": 51642 + }, + { + "epoch": 1.32, + "learning_rate": 1.2367211725368021e-06, + "loss": 0.4436, + "step": 51643 + }, + { + "epoch": 1.32, + "learning_rate": 1.2366942884522304e-06, + "loss": 0.71, + "step": 51644 + }, + { + "epoch": 1.32, + "learning_rate": 1.236667404186433e-06, + "loss": 0.493, + "step": 51645 + }, + { + "epoch": 1.32, + "learning_rate": 1.2366405197394306e-06, + "loss": 0.6553, + "step": 51646 + }, + { + "epoch": 1.32, + "learning_rate": 1.2366136351112431e-06, + "loss": 0.6909, + "step": 51647 + }, + { + "epoch": 1.32, + "learning_rate": 1.2365867503018912e-06, + "loss": 0.6631, + "step": 51648 + }, + { + "epoch": 1.32, + "learning_rate": 1.236559865311396e-06, + "loss": 0.6299, + "step": 51649 + }, + { + "epoch": 1.32, + "learning_rate": 1.2365329801397775e-06, + "loss": 0.7471, + "step": 51650 + }, + { + "epoch": 1.32, + "learning_rate": 1.2365060947870569e-06, + "loss": 0.5723, + "step": 51651 + }, + { + "epoch": 1.32, + "learning_rate": 1.2364792092532544e-06, + "loss": 0.5605, + "step": 51652 + }, + { + "epoch": 1.32, + "learning_rate": 1.2364523235383905e-06, + "loss": 0.436, + "step": 51653 + }, + { + "epoch": 1.32, + "learning_rate": 1.2364254376424861e-06, + "loss": 0.6675, + "step": 51654 + }, + { + "epoch": 1.32, + "learning_rate": 1.2363985515655614e-06, + "loss": 0.7842, + "step": 51655 + }, + { + "epoch": 1.32, + "learning_rate": 1.2363716653076372e-06, + "loss": 0.5801, + "step": 51656 + }, + { + "epoch": 1.32, + "learning_rate": 1.2363447788687347e-06, + "loss": 0.6836, + "step": 51657 + }, + { + "epoch": 1.32, + "learning_rate": 1.2363178922488731e-06, + "loss": 0.708, + "step": 51658 + }, + { + "epoch": 1.32, + "learning_rate": 1.2362910054480739e-06, + "loss": 0.7339, + "step": 51659 + }, + { + "epoch": 1.32, + "learning_rate": 1.236264118466358e-06, + "loss": 0.6309, + "step": 51660 + }, + { + "epoch": 1.32, + "learning_rate": 1.236237231303745e-06, + "loss": 0.6587, + "step": 51661 + }, + { + "epoch": 1.32, + "learning_rate": 1.2362103439602563e-06, + "loss": 0.7236, + "step": 51662 + }, + { + "epoch": 1.32, + "learning_rate": 1.2361834564359122e-06, + "loss": 0.6035, + "step": 51663 + }, + { + "epoch": 1.32, + "learning_rate": 1.236156568730733e-06, + "loss": 0.6035, + "step": 51664 + }, + { + "epoch": 1.32, + "learning_rate": 1.2361296808447398e-06, + "loss": 0.5635, + "step": 51665 + }, + { + "epoch": 1.32, + "learning_rate": 1.2361027927779528e-06, + "loss": 0.7725, + "step": 51666 + }, + { + "epoch": 1.32, + "learning_rate": 1.236075904530393e-06, + "loss": 0.5823, + "step": 51667 + }, + { + "epoch": 1.32, + "learning_rate": 1.2360490161020806e-06, + "loss": 0.623, + "step": 51668 + }, + { + "epoch": 1.32, + "learning_rate": 1.2360221274930363e-06, + "loss": 0.6025, + "step": 51669 + }, + { + "epoch": 1.32, + "learning_rate": 1.2359952387032809e-06, + "loss": 0.4585, + "step": 51670 + }, + { + "epoch": 1.32, + "learning_rate": 1.2359683497328344e-06, + "loss": 0.7695, + "step": 51671 + }, + { + "epoch": 1.32, + "learning_rate": 1.2359414605817182e-06, + "loss": 0.6196, + "step": 51672 + }, + { + "epoch": 1.32, + "learning_rate": 1.2359145712499523e-06, + "loss": 0.7129, + "step": 51673 + }, + { + "epoch": 1.32, + "learning_rate": 1.2358876817375573e-06, + "loss": 0.6611, + "step": 51674 + }, + { + "epoch": 1.32, + "learning_rate": 1.2358607920445541e-06, + "loss": 0.4663, + "step": 51675 + }, + { + "epoch": 1.32, + "learning_rate": 1.2358339021709633e-06, + "loss": 0.7021, + "step": 51676 + }, + { + "epoch": 1.32, + "learning_rate": 1.2358070121168051e-06, + "loss": 0.6035, + "step": 51677 + }, + { + "epoch": 1.32, + "learning_rate": 1.2357801218821006e-06, + "loss": 0.6182, + "step": 51678 + }, + { + "epoch": 1.32, + "learning_rate": 1.2357532314668697e-06, + "loss": 0.7549, + "step": 51679 + }, + { + "epoch": 1.32, + "learning_rate": 1.2357263408711335e-06, + "loss": 0.5908, + "step": 51680 + }, + { + "epoch": 1.32, + "learning_rate": 1.2356994500949128e-06, + "loss": 0.7241, + "step": 51681 + }, + { + "epoch": 1.32, + "learning_rate": 1.2356725591382277e-06, + "loss": 0.5874, + "step": 51682 + }, + { + "epoch": 1.32, + "learning_rate": 1.2356456680010987e-06, + "loss": 0.5684, + "step": 51683 + }, + { + "epoch": 1.32, + "learning_rate": 1.235618776683547e-06, + "loss": 0.6504, + "step": 51684 + }, + { + "epoch": 1.32, + "learning_rate": 1.2355918851855925e-06, + "loss": 0.8232, + "step": 51685 + }, + { + "epoch": 1.32, + "learning_rate": 1.2355649935072563e-06, + "loss": 0.7822, + "step": 51686 + }, + { + "epoch": 1.32, + "learning_rate": 1.2355381016485588e-06, + "loss": 0.7188, + "step": 51687 + }, + { + "epoch": 1.32, + "learning_rate": 1.2355112096095206e-06, + "loss": 0.7705, + "step": 51688 + }, + { + "epoch": 1.32, + "learning_rate": 1.2354843173901623e-06, + "loss": 0.7139, + "step": 51689 + }, + { + "epoch": 1.32, + "learning_rate": 1.2354574249905047e-06, + "loss": 0.5459, + "step": 51690 + }, + { + "epoch": 1.32, + "learning_rate": 1.2354305324105677e-06, + "loss": 0.7969, + "step": 51691 + }, + { + "epoch": 1.32, + "learning_rate": 1.2354036396503729e-06, + "loss": 0.603, + "step": 51692 + }, + { + "epoch": 1.32, + "learning_rate": 1.23537674670994e-06, + "loss": 0.6294, + "step": 51693 + }, + { + "epoch": 1.32, + "learning_rate": 1.23534985358929e-06, + "loss": 0.625, + "step": 51694 + }, + { + "epoch": 1.32, + "learning_rate": 1.2353229602884436e-06, + "loss": 0.7349, + "step": 51695 + }, + { + "epoch": 1.32, + "learning_rate": 1.235296066807421e-06, + "loss": 0.8477, + "step": 51696 + }, + { + "epoch": 1.33, + "learning_rate": 1.2352691731462436e-06, + "loss": 0.6729, + "step": 51697 + }, + { + "epoch": 1.33, + "learning_rate": 1.2352422793049306e-06, + "loss": 0.7739, + "step": 51698 + }, + { + "epoch": 1.33, + "learning_rate": 1.2352153852835039e-06, + "loss": 0.6396, + "step": 51699 + }, + { + "epoch": 1.33, + "learning_rate": 1.2351884910819832e-06, + "loss": 0.6724, + "step": 51700 + }, + { + "epoch": 1.33, + "learning_rate": 1.2351615967003898e-06, + "loss": 0.7783, + "step": 51701 + }, + { + "epoch": 1.33, + "learning_rate": 1.235134702138744e-06, + "loss": 0.7832, + "step": 51702 + }, + { + "epoch": 1.33, + "learning_rate": 1.2351078073970665e-06, + "loss": 0.6543, + "step": 51703 + }, + { + "epoch": 1.33, + "learning_rate": 1.2350809124753774e-06, + "loss": 0.8154, + "step": 51704 + }, + { + "epoch": 1.33, + "learning_rate": 1.2350540173736978e-06, + "loss": 0.7754, + "step": 51705 + }, + { + "epoch": 1.33, + "learning_rate": 1.235027122092048e-06, + "loss": 0.6436, + "step": 51706 + }, + { + "epoch": 1.33, + "learning_rate": 1.2350002266304492e-06, + "loss": 0.8145, + "step": 51707 + }, + { + "epoch": 1.33, + "learning_rate": 1.234973330988921e-06, + "loss": 0.6416, + "step": 51708 + }, + { + "epoch": 1.33, + "learning_rate": 1.2349464351674847e-06, + "loss": 0.7451, + "step": 51709 + }, + { + "epoch": 1.33, + "learning_rate": 1.2349195391661606e-06, + "loss": 0.6052, + "step": 51710 + }, + { + "epoch": 1.33, + "learning_rate": 1.2348926429849697e-06, + "loss": 0.6953, + "step": 51711 + }, + { + "epoch": 1.33, + "learning_rate": 1.2348657466239324e-06, + "loss": 0.7734, + "step": 51712 + }, + { + "epoch": 1.33, + "learning_rate": 1.2348388500830689e-06, + "loss": 0.5371, + "step": 51713 + }, + { + "epoch": 1.33, + "learning_rate": 1.2348119533624002e-06, + "loss": 0.5444, + "step": 51714 + }, + { + "epoch": 1.33, + "learning_rate": 1.2347850564619466e-06, + "loss": 0.6963, + "step": 51715 + }, + { + "epoch": 1.33, + "learning_rate": 1.2347581593817291e-06, + "loss": 0.6797, + "step": 51716 + }, + { + "epoch": 1.33, + "learning_rate": 1.234731262121768e-06, + "loss": 0.6006, + "step": 51717 + }, + { + "epoch": 1.33, + "learning_rate": 1.234704364682084e-06, + "loss": 0.6216, + "step": 51718 + }, + { + "epoch": 1.33, + "learning_rate": 1.2346774670626975e-06, + "loss": 0.6525, + "step": 51719 + }, + { + "epoch": 1.33, + "learning_rate": 1.2346505692636296e-06, + "loss": 0.7539, + "step": 51720 + }, + { + "epoch": 1.33, + "learning_rate": 1.2346236712849002e-06, + "loss": 0.4746, + "step": 51721 + }, + { + "epoch": 1.33, + "learning_rate": 1.2345967731265305e-06, + "loss": 0.5469, + "step": 51722 + }, + { + "epoch": 1.33, + "learning_rate": 1.2345698747885407e-06, + "loss": 0.625, + "step": 51723 + }, + { + "epoch": 1.33, + "learning_rate": 1.2345429762709515e-06, + "loss": 0.6025, + "step": 51724 + }, + { + "epoch": 1.33, + "learning_rate": 1.2345160775737835e-06, + "loss": 0.707, + "step": 51725 + }, + { + "epoch": 1.33, + "learning_rate": 1.2344891786970574e-06, + "loss": 0.5791, + "step": 51726 + }, + { + "epoch": 1.33, + "learning_rate": 1.2344622796407938e-06, + "loss": 0.7959, + "step": 51727 + }, + { + "epoch": 1.33, + "learning_rate": 1.2344353804050133e-06, + "loss": 0.6807, + "step": 51728 + }, + { + "epoch": 1.33, + "learning_rate": 1.234408480989736e-06, + "loss": 0.6943, + "step": 51729 + }, + { + "epoch": 1.33, + "learning_rate": 1.234381581394983e-06, + "loss": 0.6426, + "step": 51730 + }, + { + "epoch": 1.33, + "learning_rate": 1.234354681620775e-06, + "loss": 0.6758, + "step": 51731 + }, + { + "epoch": 1.33, + "learning_rate": 1.2343277816671323e-06, + "loss": 0.5957, + "step": 51732 + }, + { + "epoch": 1.33, + "learning_rate": 1.2343008815340756e-06, + "loss": 0.6035, + "step": 51733 + }, + { + "epoch": 1.33, + "learning_rate": 1.2342739812216257e-06, + "loss": 0.7568, + "step": 51734 + }, + { + "epoch": 1.33, + "learning_rate": 1.2342470807298026e-06, + "loss": 0.5935, + "step": 51735 + }, + { + "epoch": 1.33, + "learning_rate": 1.2342201800586275e-06, + "loss": 0.646, + "step": 51736 + }, + { + "epoch": 1.33, + "learning_rate": 1.234193279208121e-06, + "loss": 0.6699, + "step": 51737 + }, + { + "epoch": 1.33, + "learning_rate": 1.2341663781783032e-06, + "loss": 0.5527, + "step": 51738 + }, + { + "epoch": 1.33, + "learning_rate": 1.2341394769691948e-06, + "loss": 0.6572, + "step": 51739 + }, + { + "epoch": 1.33, + "learning_rate": 1.2341125755808168e-06, + "loss": 0.7002, + "step": 51740 + }, + { + "epoch": 1.33, + "learning_rate": 1.2340856740131895e-06, + "loss": 0.4956, + "step": 51741 + }, + { + "epoch": 1.33, + "learning_rate": 1.2340587722663338e-06, + "loss": 0.5908, + "step": 51742 + }, + { + "epoch": 1.33, + "learning_rate": 1.2340318703402698e-06, + "loss": 0.748, + "step": 51743 + }, + { + "epoch": 1.33, + "learning_rate": 1.2340049682350184e-06, + "loss": 0.6738, + "step": 51744 + }, + { + "epoch": 1.33, + "learning_rate": 1.2339780659506002e-06, + "loss": 0.6543, + "step": 51745 + }, + { + "epoch": 1.33, + "learning_rate": 1.2339511634870356e-06, + "loss": 0.6479, + "step": 51746 + }, + { + "epoch": 1.33, + "learning_rate": 1.2339242608443456e-06, + "loss": 0.6406, + "step": 51747 + }, + { + "epoch": 1.33, + "learning_rate": 1.2338973580225505e-06, + "loss": 0.5459, + "step": 51748 + }, + { + "epoch": 1.33, + "learning_rate": 1.233870455021671e-06, + "loss": 0.606, + "step": 51749 + }, + { + "epoch": 1.33, + "learning_rate": 1.2338435518417272e-06, + "loss": 0.5908, + "step": 51750 + }, + { + "epoch": 1.33, + "learning_rate": 1.2338166484827406e-06, + "loss": 0.7285, + "step": 51751 + }, + { + "epoch": 1.33, + "learning_rate": 1.2337897449447314e-06, + "loss": 0.8574, + "step": 51752 + }, + { + "epoch": 1.33, + "learning_rate": 1.2337628412277199e-06, + "loss": 0.8032, + "step": 51753 + }, + { + "epoch": 1.33, + "learning_rate": 1.2337359373317269e-06, + "loss": 0.7139, + "step": 51754 + }, + { + "epoch": 1.33, + "learning_rate": 1.2337090332567732e-06, + "loss": 0.5596, + "step": 51755 + }, + { + "epoch": 1.33, + "learning_rate": 1.2336821290028789e-06, + "loss": 0.6484, + "step": 51756 + }, + { + "epoch": 1.33, + "learning_rate": 1.2336552245700654e-06, + "loss": 0.6309, + "step": 51757 + }, + { + "epoch": 1.33, + "learning_rate": 1.2336283199583528e-06, + "loss": 0.7432, + "step": 51758 + }, + { + "epoch": 1.33, + "learning_rate": 1.2336014151677613e-06, + "loss": 0.5942, + "step": 51759 + }, + { + "epoch": 1.33, + "learning_rate": 1.2335745101983124e-06, + "loss": 0.7291, + "step": 51760 + }, + { + "epoch": 1.33, + "learning_rate": 1.233547605050026e-06, + "loss": 0.5896, + "step": 51761 + }, + { + "epoch": 1.33, + "learning_rate": 1.2335206997229233e-06, + "loss": 0.7236, + "step": 51762 + }, + { + "epoch": 1.33, + "learning_rate": 1.233493794217024e-06, + "loss": 0.6113, + "step": 51763 + }, + { + "epoch": 1.33, + "learning_rate": 1.2334668885323495e-06, + "loss": 0.5737, + "step": 51764 + }, + { + "epoch": 1.33, + "learning_rate": 1.2334399826689202e-06, + "loss": 0.6396, + "step": 51765 + }, + { + "epoch": 1.33, + "learning_rate": 1.2334130766267564e-06, + "loss": 0.5444, + "step": 51766 + }, + { + "epoch": 1.33, + "learning_rate": 1.2333861704058793e-06, + "loss": 0.6982, + "step": 51767 + }, + { + "epoch": 1.33, + "learning_rate": 1.2333592640063089e-06, + "loss": 0.4624, + "step": 51768 + }, + { + "epoch": 1.33, + "learning_rate": 1.2333323574280662e-06, + "loss": 0.708, + "step": 51769 + }, + { + "epoch": 1.33, + "learning_rate": 1.2333054506711713e-06, + "loss": 0.7822, + "step": 51770 + }, + { + "epoch": 1.33, + "learning_rate": 1.2332785437356453e-06, + "loss": 0.6895, + "step": 51771 + }, + { + "epoch": 1.33, + "learning_rate": 1.233251636621509e-06, + "loss": 0.6289, + "step": 51772 + }, + { + "epoch": 1.33, + "learning_rate": 1.2332247293287821e-06, + "loss": 0.6362, + "step": 51773 + }, + { + "epoch": 1.33, + "learning_rate": 1.2331978218574861e-06, + "loss": 0.6982, + "step": 51774 + }, + { + "epoch": 1.33, + "learning_rate": 1.2331709142076409e-06, + "loss": 0.708, + "step": 51775 + }, + { + "epoch": 1.33, + "learning_rate": 1.233144006379268e-06, + "loss": 0.6484, + "step": 51776 + }, + { + "epoch": 1.33, + "learning_rate": 1.233117098372387e-06, + "loss": 0.7188, + "step": 51777 + }, + { + "epoch": 1.33, + "learning_rate": 1.2330901901870193e-06, + "loss": 0.7041, + "step": 51778 + }, + { + "epoch": 1.33, + "learning_rate": 1.233063281823185e-06, + "loss": 0.6963, + "step": 51779 + }, + { + "epoch": 1.33, + "learning_rate": 1.2330363732809047e-06, + "loss": 0.4473, + "step": 51780 + }, + { + "epoch": 1.33, + "learning_rate": 1.2330094645601993e-06, + "loss": 0.626, + "step": 51781 + }, + { + "epoch": 1.33, + "learning_rate": 1.2329825556610893e-06, + "loss": 0.8105, + "step": 51782 + }, + { + "epoch": 1.33, + "learning_rate": 1.2329556465835953e-06, + "loss": 0.5928, + "step": 51783 + }, + { + "epoch": 1.33, + "learning_rate": 1.2329287373277376e-06, + "loss": 0.7773, + "step": 51784 + }, + { + "epoch": 1.33, + "learning_rate": 1.2329018278935374e-06, + "loss": 0.6494, + "step": 51785 + }, + { + "epoch": 1.33, + "learning_rate": 1.2328749182810148e-06, + "loss": 0.4871, + "step": 51786 + }, + { + "epoch": 1.33, + "learning_rate": 1.2328480084901908e-06, + "loss": 0.6284, + "step": 51787 + }, + { + "epoch": 1.33, + "learning_rate": 1.2328210985210855e-06, + "loss": 0.6504, + "step": 51788 + }, + { + "epoch": 1.33, + "learning_rate": 1.2327941883737202e-06, + "loss": 0.5479, + "step": 51789 + }, + { + "epoch": 1.33, + "learning_rate": 1.2327672780481146e-06, + "loss": 0.7402, + "step": 51790 + }, + { + "epoch": 1.33, + "learning_rate": 1.2327403675442903e-06, + "loss": 0.8652, + "step": 51791 + }, + { + "epoch": 1.33, + "learning_rate": 1.232713456862267e-06, + "loss": 0.6196, + "step": 51792 + }, + { + "epoch": 1.33, + "learning_rate": 1.2326865460020659e-06, + "loss": 0.7305, + "step": 51793 + }, + { + "epoch": 1.33, + "learning_rate": 1.2326596349637073e-06, + "loss": 0.7715, + "step": 51794 + }, + { + "epoch": 1.33, + "learning_rate": 1.232632723747212e-06, + "loss": 0.6934, + "step": 51795 + }, + { + "epoch": 1.33, + "learning_rate": 1.2326058123526005e-06, + "loss": 0.7217, + "step": 51796 + }, + { + "epoch": 1.33, + "learning_rate": 1.2325789007798935e-06, + "loss": 0.6533, + "step": 51797 + }, + { + "epoch": 1.33, + "learning_rate": 1.2325519890291113e-06, + "loss": 0.392, + "step": 51798 + }, + { + "epoch": 1.33, + "learning_rate": 1.2325250771002748e-06, + "loss": 0.7051, + "step": 51799 + }, + { + "epoch": 1.33, + "learning_rate": 1.2324981649934044e-06, + "loss": 0.5073, + "step": 51800 + }, + { + "epoch": 1.33, + "learning_rate": 1.2324712527085212e-06, + "loss": 0.9043, + "step": 51801 + }, + { + "epoch": 1.33, + "learning_rate": 1.2324443402456454e-06, + "loss": 0.5459, + "step": 51802 + }, + { + "epoch": 1.33, + "learning_rate": 1.2324174276047977e-06, + "loss": 0.5664, + "step": 51803 + }, + { + "epoch": 1.33, + "learning_rate": 1.2323905147859982e-06, + "loss": 0.5703, + "step": 51804 + }, + { + "epoch": 1.33, + "learning_rate": 1.2323636017892685e-06, + "loss": 0.6919, + "step": 51805 + }, + { + "epoch": 1.33, + "learning_rate": 1.2323366886146284e-06, + "loss": 0.52, + "step": 51806 + }, + { + "epoch": 1.33, + "learning_rate": 1.232309775262099e-06, + "loss": 0.46, + "step": 51807 + }, + { + "epoch": 1.33, + "learning_rate": 1.2322828617317005e-06, + "loss": 0.6406, + "step": 51808 + }, + { + "epoch": 1.33, + "learning_rate": 1.2322559480234536e-06, + "loss": 0.6289, + "step": 51809 + }, + { + "epoch": 1.33, + "learning_rate": 1.2322290341373793e-06, + "loss": 0.7275, + "step": 51810 + }, + { + "epoch": 1.33, + "learning_rate": 1.2322021200734976e-06, + "loss": 0.6943, + "step": 51811 + }, + { + "epoch": 1.33, + "learning_rate": 1.2321752058318297e-06, + "loss": 0.4422, + "step": 51812 + }, + { + "epoch": 1.33, + "learning_rate": 1.2321482914123958e-06, + "loss": 0.5732, + "step": 51813 + }, + { + "epoch": 1.33, + "learning_rate": 1.2321213768152165e-06, + "loss": 0.6865, + "step": 51814 + }, + { + "epoch": 1.33, + "learning_rate": 1.2320944620403127e-06, + "loss": 0.623, + "step": 51815 + }, + { + "epoch": 1.33, + "learning_rate": 1.2320675470877047e-06, + "loss": 0.6934, + "step": 51816 + }, + { + "epoch": 1.33, + "learning_rate": 1.2320406319574135e-06, + "loss": 0.6514, + "step": 51817 + }, + { + "epoch": 1.33, + "learning_rate": 1.2320137166494593e-06, + "loss": 0.461, + "step": 51818 + }, + { + "epoch": 1.33, + "learning_rate": 1.2319868011638629e-06, + "loss": 0.6082, + "step": 51819 + }, + { + "epoch": 1.33, + "learning_rate": 1.2319598855006446e-06, + "loss": 0.748, + "step": 51820 + }, + { + "epoch": 1.33, + "learning_rate": 1.2319329696598254e-06, + "loss": 0.7549, + "step": 51821 + }, + { + "epoch": 1.33, + "learning_rate": 1.231906053641426e-06, + "loss": 0.5791, + "step": 51822 + }, + { + "epoch": 1.33, + "learning_rate": 1.2318791374454667e-06, + "loss": 0.4188, + "step": 51823 + }, + { + "epoch": 1.33, + "learning_rate": 1.2318522210719682e-06, + "loss": 0.7402, + "step": 51824 + }, + { + "epoch": 1.33, + "learning_rate": 1.231825304520951e-06, + "loss": 0.7324, + "step": 51825 + }, + { + "epoch": 1.33, + "learning_rate": 1.2317983877924361e-06, + "loss": 0.5757, + "step": 51826 + }, + { + "epoch": 1.33, + "learning_rate": 1.2317714708864438e-06, + "loss": 0.6143, + "step": 51827 + }, + { + "epoch": 1.33, + "learning_rate": 1.2317445538029944e-06, + "loss": 0.6211, + "step": 51828 + }, + { + "epoch": 1.33, + "learning_rate": 1.2317176365421092e-06, + "loss": 0.7734, + "step": 51829 + }, + { + "epoch": 1.33, + "learning_rate": 1.2316907191038082e-06, + "loss": 0.5811, + "step": 51830 + }, + { + "epoch": 1.33, + "learning_rate": 1.2316638014881123e-06, + "loss": 0.4929, + "step": 51831 + }, + { + "epoch": 1.33, + "learning_rate": 1.2316368836950425e-06, + "loss": 0.6782, + "step": 51832 + }, + { + "epoch": 1.33, + "learning_rate": 1.2316099657246187e-06, + "loss": 0.5217, + "step": 51833 + }, + { + "epoch": 1.33, + "learning_rate": 1.2315830475768614e-06, + "loss": 0.7441, + "step": 51834 + }, + { + "epoch": 1.33, + "learning_rate": 1.2315561292517922e-06, + "loss": 0.4978, + "step": 51835 + }, + { + "epoch": 1.33, + "learning_rate": 1.2315292107494307e-06, + "loss": 0.7139, + "step": 51836 + }, + { + "epoch": 1.33, + "learning_rate": 1.2315022920697983e-06, + "loss": 0.6694, + "step": 51837 + }, + { + "epoch": 1.33, + "learning_rate": 1.231475373212915e-06, + "loss": 0.624, + "step": 51838 + }, + { + "epoch": 1.33, + "learning_rate": 1.2314484541788016e-06, + "loss": 0.5735, + "step": 51839 + }, + { + "epoch": 1.33, + "learning_rate": 1.2314215349674789e-06, + "loss": 0.7031, + "step": 51840 + }, + { + "epoch": 1.33, + "learning_rate": 1.2313946155789674e-06, + "loss": 0.748, + "step": 51841 + }, + { + "epoch": 1.33, + "learning_rate": 1.2313676960132877e-06, + "loss": 0.623, + "step": 51842 + }, + { + "epoch": 1.33, + "learning_rate": 1.2313407762704604e-06, + "loss": 0.6123, + "step": 51843 + }, + { + "epoch": 1.33, + "learning_rate": 1.2313138563505059e-06, + "loss": 0.5737, + "step": 51844 + }, + { + "epoch": 1.33, + "learning_rate": 1.2312869362534452e-06, + "loss": 0.5469, + "step": 51845 + }, + { + "epoch": 1.33, + "learning_rate": 1.2312600159792985e-06, + "loss": 0.5504, + "step": 51846 + }, + { + "epoch": 1.33, + "learning_rate": 1.2312330955280868e-06, + "loss": 0.5244, + "step": 51847 + }, + { + "epoch": 1.33, + "learning_rate": 1.2312061748998308e-06, + "loss": 0.4705, + "step": 51848 + }, + { + "epoch": 1.33, + "learning_rate": 1.2311792540945504e-06, + "loss": 0.7041, + "step": 51849 + }, + { + "epoch": 1.33, + "learning_rate": 1.2311523331122668e-06, + "loss": 0.6875, + "step": 51850 + }, + { + "epoch": 1.33, + "learning_rate": 1.2311254119530005e-06, + "loss": 0.5675, + "step": 51851 + }, + { + "epoch": 1.33, + "learning_rate": 1.2310984906167725e-06, + "loss": 0.6333, + "step": 51852 + }, + { + "epoch": 1.33, + "learning_rate": 1.2310715691036026e-06, + "loss": 0.5999, + "step": 51853 + }, + { + "epoch": 1.33, + "learning_rate": 1.231044647413512e-06, + "loss": 0.7363, + "step": 51854 + }, + { + "epoch": 1.33, + "learning_rate": 1.2310177255465209e-06, + "loss": 0.8066, + "step": 51855 + }, + { + "epoch": 1.33, + "learning_rate": 1.2309908035026507e-06, + "loss": 0.6943, + "step": 51856 + }, + { + "epoch": 1.33, + "learning_rate": 1.2309638812819208e-06, + "loss": 0.6943, + "step": 51857 + }, + { + "epoch": 1.33, + "learning_rate": 1.2309369588843528e-06, + "loss": 0.6548, + "step": 51858 + }, + { + "epoch": 1.33, + "learning_rate": 1.2309100363099668e-06, + "loss": 0.5151, + "step": 51859 + }, + { + "epoch": 1.33, + "learning_rate": 1.2308831135587838e-06, + "loss": 0.6743, + "step": 51860 + }, + { + "epoch": 1.33, + "learning_rate": 1.2308561906308242e-06, + "loss": 0.665, + "step": 51861 + }, + { + "epoch": 1.33, + "learning_rate": 1.2308292675261088e-06, + "loss": 0.6504, + "step": 51862 + }, + { + "epoch": 1.33, + "learning_rate": 1.2308023442446576e-06, + "loss": 0.6714, + "step": 51863 + }, + { + "epoch": 1.33, + "learning_rate": 1.230775420786492e-06, + "loss": 0.7285, + "step": 51864 + }, + { + "epoch": 1.33, + "learning_rate": 1.230748497151632e-06, + "loss": 0.5532, + "step": 51865 + }, + { + "epoch": 1.33, + "learning_rate": 1.2307215733400987e-06, + "loss": 0.709, + "step": 51866 + }, + { + "epoch": 1.33, + "learning_rate": 1.2306946493519124e-06, + "loss": 0.7109, + "step": 51867 + }, + { + "epoch": 1.33, + "learning_rate": 1.2306677251870937e-06, + "loss": 0.4124, + "step": 51868 + }, + { + "epoch": 1.33, + "learning_rate": 1.2306408008456636e-06, + "loss": 0.3708, + "step": 51869 + }, + { + "epoch": 1.33, + "learning_rate": 1.2306138763276424e-06, + "loss": 0.6733, + "step": 51870 + }, + { + "epoch": 1.33, + "learning_rate": 1.2305869516330507e-06, + "loss": 0.7051, + "step": 51871 + }, + { + "epoch": 1.33, + "learning_rate": 1.2305600267619093e-06, + "loss": 0.791, + "step": 51872 + }, + { + "epoch": 1.33, + "learning_rate": 1.2305331017142383e-06, + "loss": 0.5637, + "step": 51873 + }, + { + "epoch": 1.33, + "learning_rate": 1.230506176490059e-06, + "loss": 0.5371, + "step": 51874 + }, + { + "epoch": 1.33, + "learning_rate": 1.2304792510893918e-06, + "loss": 0.9038, + "step": 51875 + }, + { + "epoch": 1.33, + "learning_rate": 1.230452325512257e-06, + "loss": 0.6929, + "step": 51876 + }, + { + "epoch": 1.33, + "learning_rate": 1.2304253997586758e-06, + "loss": 0.4978, + "step": 51877 + }, + { + "epoch": 1.33, + "learning_rate": 1.230398473828668e-06, + "loss": 0.6865, + "step": 51878 + }, + { + "epoch": 1.33, + "learning_rate": 1.230371547722255e-06, + "loss": 0.6875, + "step": 51879 + }, + { + "epoch": 1.33, + "learning_rate": 1.2303446214394569e-06, + "loss": 0.6094, + "step": 51880 + }, + { + "epoch": 1.33, + "learning_rate": 1.2303176949802949e-06, + "loss": 0.8096, + "step": 51881 + }, + { + "epoch": 1.33, + "learning_rate": 1.2302907683447886e-06, + "loss": 0.4673, + "step": 51882 + }, + { + "epoch": 1.33, + "learning_rate": 1.2302638415329598e-06, + "loss": 0.6748, + "step": 51883 + }, + { + "epoch": 1.33, + "learning_rate": 1.230236914544828e-06, + "loss": 0.6992, + "step": 51884 + }, + { + "epoch": 1.33, + "learning_rate": 1.230209987380415e-06, + "loss": 0.7148, + "step": 51885 + }, + { + "epoch": 1.33, + "learning_rate": 1.2301830600397407e-06, + "loss": 0.4826, + "step": 51886 + }, + { + "epoch": 1.33, + "learning_rate": 1.2301561325228258e-06, + "loss": 0.5703, + "step": 51887 + }, + { + "epoch": 1.33, + "learning_rate": 1.2301292048296905e-06, + "loss": 0.7451, + "step": 51888 + }, + { + "epoch": 1.33, + "learning_rate": 1.230102276960356e-06, + "loss": 0.4819, + "step": 51889 + }, + { + "epoch": 1.33, + "learning_rate": 1.230075348914843e-06, + "loss": 0.6072, + "step": 51890 + }, + { + "epoch": 1.33, + "learning_rate": 1.230048420693172e-06, + "loss": 0.4675, + "step": 51891 + }, + { + "epoch": 1.33, + "learning_rate": 1.2300214922953633e-06, + "loss": 0.6206, + "step": 51892 + }, + { + "epoch": 1.33, + "learning_rate": 1.2299945637214376e-06, + "loss": 0.7544, + "step": 51893 + }, + { + "epoch": 1.33, + "learning_rate": 1.2299676349714157e-06, + "loss": 0.7451, + "step": 51894 + }, + { + "epoch": 1.33, + "learning_rate": 1.229940706045318e-06, + "loss": 0.5957, + "step": 51895 + }, + { + "epoch": 1.33, + "learning_rate": 1.229913776943166e-06, + "loss": 0.5493, + "step": 51896 + }, + { + "epoch": 1.33, + "learning_rate": 1.2298868476649788e-06, + "loss": 0.626, + "step": 51897 + }, + { + "epoch": 1.33, + "learning_rate": 1.2298599182107784e-06, + "loss": 0.5977, + "step": 51898 + }, + { + "epoch": 1.33, + "learning_rate": 1.229832988580584e-06, + "loss": 0.5874, + "step": 51899 + }, + { + "epoch": 1.33, + "learning_rate": 1.2298060587744177e-06, + "loss": 0.4788, + "step": 51900 + }, + { + "epoch": 1.33, + "learning_rate": 1.2297791287922995e-06, + "loss": 0.7822, + "step": 51901 + }, + { + "epoch": 1.33, + "learning_rate": 1.22975219863425e-06, + "loss": 0.5991, + "step": 51902 + }, + { + "epoch": 1.33, + "learning_rate": 1.2297252683002895e-06, + "loss": 0.6069, + "step": 51903 + }, + { + "epoch": 1.33, + "learning_rate": 1.2296983377904391e-06, + "loss": 0.8447, + "step": 51904 + }, + { + "epoch": 1.33, + "learning_rate": 1.2296714071047189e-06, + "loss": 0.7734, + "step": 51905 + }, + { + "epoch": 1.33, + "learning_rate": 1.2296444762431506e-06, + "loss": 0.8398, + "step": 51906 + }, + { + "epoch": 1.33, + "learning_rate": 1.2296175452057533e-06, + "loss": 0.5698, + "step": 51907 + }, + { + "epoch": 1.33, + "learning_rate": 1.229590613992549e-06, + "loss": 0.7109, + "step": 51908 + }, + { + "epoch": 1.33, + "learning_rate": 1.2295636826035574e-06, + "loss": 0.5703, + "step": 51909 + }, + { + "epoch": 1.33, + "learning_rate": 1.2295367510387995e-06, + "loss": 0.7539, + "step": 51910 + }, + { + "epoch": 1.33, + "learning_rate": 1.229509819298296e-06, + "loss": 0.5859, + "step": 51911 + }, + { + "epoch": 1.33, + "learning_rate": 1.229482887382067e-06, + "loss": 0.7334, + "step": 51912 + }, + { + "epoch": 1.33, + "learning_rate": 1.2294559552901338e-06, + "loss": 0.3345, + "step": 51913 + }, + { + "epoch": 1.33, + "learning_rate": 1.2294290230225166e-06, + "loss": 0.7529, + "step": 51914 + }, + { + "epoch": 1.33, + "learning_rate": 1.2294020905792365e-06, + "loss": 0.6042, + "step": 51915 + }, + { + "epoch": 1.33, + "learning_rate": 1.2293751579603133e-06, + "loss": 0.7432, + "step": 51916 + }, + { + "epoch": 1.33, + "learning_rate": 1.2293482251657685e-06, + "loss": 0.6362, + "step": 51917 + }, + { + "epoch": 1.33, + "learning_rate": 1.229321292195622e-06, + "loss": 0.7656, + "step": 51918 + }, + { + "epoch": 1.33, + "learning_rate": 1.2292943590498947e-06, + "loss": 0.7363, + "step": 51919 + }, + { + "epoch": 1.33, + "learning_rate": 1.2292674257286073e-06, + "loss": 0.5181, + "step": 51920 + }, + { + "epoch": 1.33, + "learning_rate": 1.229240492231781e-06, + "loss": 0.6025, + "step": 51921 + }, + { + "epoch": 1.33, + "learning_rate": 1.229213558559435e-06, + "loss": 0.5656, + "step": 51922 + }, + { + "epoch": 1.33, + "learning_rate": 1.2291866247115909e-06, + "loss": 0.7432, + "step": 51923 + }, + { + "epoch": 1.33, + "learning_rate": 1.229159690688269e-06, + "loss": 0.6528, + "step": 51924 + }, + { + "epoch": 1.33, + "learning_rate": 1.2291327564894904e-06, + "loss": 0.8027, + "step": 51925 + }, + { + "epoch": 1.33, + "learning_rate": 1.2291058221152754e-06, + "loss": 0.6694, + "step": 51926 + }, + { + "epoch": 1.33, + "learning_rate": 1.2290788875656446e-06, + "loss": 0.7129, + "step": 51927 + }, + { + "epoch": 1.33, + "learning_rate": 1.2290519528406184e-06, + "loss": 0.6587, + "step": 51928 + }, + { + "epoch": 1.33, + "learning_rate": 1.2290250179402178e-06, + "loss": 0.7163, + "step": 51929 + }, + { + "epoch": 1.33, + "learning_rate": 1.228998082864463e-06, + "loss": 0.8184, + "step": 51930 + }, + { + "epoch": 1.33, + "learning_rate": 1.2289711476133754e-06, + "loss": 0.6602, + "step": 51931 + }, + { + "epoch": 1.33, + "learning_rate": 1.2289442121869748e-06, + "loss": 0.6826, + "step": 51932 + }, + { + "epoch": 1.33, + "learning_rate": 1.2289172765852822e-06, + "loss": 0.6406, + "step": 51933 + }, + { + "epoch": 1.33, + "learning_rate": 1.228890340808318e-06, + "loss": 0.7822, + "step": 51934 + }, + { + "epoch": 1.33, + "learning_rate": 1.2288634048561032e-06, + "loss": 0.4639, + "step": 51935 + }, + { + "epoch": 1.33, + "learning_rate": 1.2288364687286583e-06, + "loss": 0.7314, + "step": 51936 + }, + { + "epoch": 1.33, + "learning_rate": 1.2288095324260034e-06, + "loss": 0.7324, + "step": 51937 + }, + { + "epoch": 1.33, + "learning_rate": 1.22878259594816e-06, + "loss": 0.6636, + "step": 51938 + }, + { + "epoch": 1.33, + "learning_rate": 1.228755659295148e-06, + "loss": 0.7676, + "step": 51939 + }, + { + "epoch": 1.33, + "learning_rate": 1.2287287224669887e-06, + "loss": 0.6289, + "step": 51940 + }, + { + "epoch": 1.33, + "learning_rate": 1.228701785463702e-06, + "loss": 0.7842, + "step": 51941 + }, + { + "epoch": 1.33, + "learning_rate": 1.228674848285309e-06, + "loss": 0.7617, + "step": 51942 + }, + { + "epoch": 1.33, + "learning_rate": 1.22864791093183e-06, + "loss": 0.6294, + "step": 51943 + }, + { + "epoch": 1.33, + "learning_rate": 1.2286209734032863e-06, + "loss": 0.3983, + "step": 51944 + }, + { + "epoch": 1.33, + "learning_rate": 1.2285940356996973e-06, + "loss": 0.6572, + "step": 51945 + }, + { + "epoch": 1.33, + "learning_rate": 1.2285670978210849e-06, + "loss": 0.7725, + "step": 51946 + }, + { + "epoch": 1.33, + "learning_rate": 1.2285401597674689e-06, + "loss": 0.4485, + "step": 51947 + }, + { + "epoch": 1.33, + "learning_rate": 1.2285132215388705e-06, + "loss": 0.6562, + "step": 51948 + }, + { + "epoch": 1.33, + "learning_rate": 1.2284862831353098e-06, + "loss": 0.5981, + "step": 51949 + }, + { + "epoch": 1.33, + "learning_rate": 1.2284593445568076e-06, + "loss": 0.5347, + "step": 51950 + }, + { + "epoch": 1.33, + "learning_rate": 1.2284324058033848e-06, + "loss": 0.6841, + "step": 51951 + }, + { + "epoch": 1.33, + "learning_rate": 1.2284054668750618e-06, + "loss": 0.5258, + "step": 51952 + }, + { + "epoch": 1.33, + "learning_rate": 1.228378527771859e-06, + "loss": 0.75, + "step": 51953 + }, + { + "epoch": 1.33, + "learning_rate": 1.2283515884937977e-06, + "loss": 0.436, + "step": 51954 + }, + { + "epoch": 1.33, + "learning_rate": 1.2283246490408976e-06, + "loss": 0.7402, + "step": 51955 + }, + { + "epoch": 1.33, + "learning_rate": 1.22829770941318e-06, + "loss": 0.7725, + "step": 51956 + }, + { + "epoch": 1.33, + "learning_rate": 1.2282707696106653e-06, + "loss": 0.8018, + "step": 51957 + }, + { + "epoch": 1.33, + "learning_rate": 1.2282438296333742e-06, + "loss": 0.7441, + "step": 51958 + }, + { + "epoch": 1.33, + "learning_rate": 1.2282168894813274e-06, + "loss": 0.5083, + "step": 51959 + }, + { + "epoch": 1.33, + "learning_rate": 1.2281899491545454e-06, + "loss": 0.5947, + "step": 51960 + }, + { + "epoch": 1.33, + "learning_rate": 1.2281630086530489e-06, + "loss": 0.666, + "step": 51961 + }, + { + "epoch": 1.33, + "learning_rate": 1.2281360679768581e-06, + "loss": 0.6387, + "step": 51962 + }, + { + "epoch": 1.33, + "learning_rate": 1.2281091271259944e-06, + "loss": 0.7871, + "step": 51963 + }, + { + "epoch": 1.33, + "learning_rate": 1.2280821861004777e-06, + "loss": 0.7881, + "step": 51964 + }, + { + "epoch": 1.33, + "learning_rate": 1.2280552449003291e-06, + "loss": 0.6606, + "step": 51965 + }, + { + "epoch": 1.33, + "learning_rate": 1.2280283035255693e-06, + "loss": 0.5974, + "step": 51966 + }, + { + "epoch": 1.33, + "learning_rate": 1.2280013619762187e-06, + "loss": 0.7275, + "step": 51967 + }, + { + "epoch": 1.33, + "learning_rate": 1.2279744202522978e-06, + "loss": 0.9072, + "step": 51968 + }, + { + "epoch": 1.33, + "learning_rate": 1.2279474783538273e-06, + "loss": 0.6826, + "step": 51969 + }, + { + "epoch": 1.33, + "learning_rate": 1.2279205362808277e-06, + "loss": 0.6543, + "step": 51970 + }, + { + "epoch": 1.33, + "learning_rate": 1.2278935940333204e-06, + "loss": 0.7295, + "step": 51971 + }, + { + "epoch": 1.33, + "learning_rate": 1.227866651611325e-06, + "loss": 0.5308, + "step": 51972 + }, + { + "epoch": 1.33, + "learning_rate": 1.227839709014863e-06, + "loss": 0.5264, + "step": 51973 + }, + { + "epoch": 1.33, + "learning_rate": 1.2278127662439542e-06, + "loss": 0.7871, + "step": 51974 + }, + { + "epoch": 1.33, + "learning_rate": 1.2277858232986198e-06, + "loss": 0.6523, + "step": 51975 + }, + { + "epoch": 1.33, + "learning_rate": 1.22775888017888e-06, + "loss": 0.6245, + "step": 51976 + }, + { + "epoch": 1.33, + "learning_rate": 1.2277319368847561e-06, + "loss": 0.5828, + "step": 51977 + }, + { + "epoch": 1.33, + "learning_rate": 1.2277049934162681e-06, + "loss": 0.707, + "step": 51978 + }, + { + "epoch": 1.33, + "learning_rate": 1.227678049773437e-06, + "loss": 0.5806, + "step": 51979 + }, + { + "epoch": 1.33, + "learning_rate": 1.2276511059562831e-06, + "loss": 0.7285, + "step": 51980 + }, + { + "epoch": 1.33, + "learning_rate": 1.2276241619648273e-06, + "loss": 0.7969, + "step": 51981 + }, + { + "epoch": 1.33, + "learning_rate": 1.2275972177990903e-06, + "loss": 0.6294, + "step": 51982 + }, + { + "epoch": 1.33, + "learning_rate": 1.2275702734590922e-06, + "loss": 0.4729, + "step": 51983 + }, + { + "epoch": 1.33, + "learning_rate": 1.2275433289448544e-06, + "loss": 0.7656, + "step": 51984 + }, + { + "epoch": 1.33, + "learning_rate": 1.227516384256397e-06, + "loss": 0.573, + "step": 51985 + }, + { + "epoch": 1.33, + "learning_rate": 1.227489439393741e-06, + "loss": 0.7461, + "step": 51986 + }, + { + "epoch": 1.33, + "learning_rate": 1.2274624943569062e-06, + "loss": 0.6206, + "step": 51987 + }, + { + "epoch": 1.33, + "learning_rate": 1.2274355491459143e-06, + "loss": 0.7793, + "step": 51988 + }, + { + "epoch": 1.33, + "learning_rate": 1.2274086037607854e-06, + "loss": 0.585, + "step": 51989 + }, + { + "epoch": 1.33, + "learning_rate": 1.2273816582015401e-06, + "loss": 0.7725, + "step": 51990 + }, + { + "epoch": 1.33, + "learning_rate": 1.227354712468199e-06, + "loss": 0.7871, + "step": 51991 + }, + { + "epoch": 1.33, + "learning_rate": 1.2273277665607833e-06, + "loss": 0.7822, + "step": 51992 + }, + { + "epoch": 1.33, + "learning_rate": 1.2273008204793128e-06, + "loss": 0.6895, + "step": 51993 + }, + { + "epoch": 1.33, + "learning_rate": 1.2272738742238085e-06, + "loss": 0.7285, + "step": 51994 + }, + { + "epoch": 1.33, + "learning_rate": 1.227246927794291e-06, + "loss": 0.6782, + "step": 51995 + }, + { + "epoch": 1.33, + "learning_rate": 1.2272199811907813e-06, + "loss": 0.6851, + "step": 51996 + }, + { + "epoch": 1.33, + "learning_rate": 1.2271930344132994e-06, + "loss": 0.7578, + "step": 51997 + }, + { + "epoch": 1.33, + "learning_rate": 1.2271660874618665e-06, + "loss": 0.6079, + "step": 51998 + }, + { + "epoch": 1.33, + "learning_rate": 1.2271391403365029e-06, + "loss": 0.5635, + "step": 51999 + }, + { + "epoch": 1.33, + "learning_rate": 1.227112193037229e-06, + "loss": 0.7236, + "step": 52000 + }, + { + "epoch": 1.33, + "learning_rate": 1.2270852455640662e-06, + "loss": 0.6504, + "step": 52001 + }, + { + "epoch": 1.33, + "learning_rate": 1.2270582979170344e-06, + "loss": 0.5835, + "step": 52002 + }, + { + "epoch": 1.33, + "learning_rate": 1.2270313500961544e-06, + "loss": 0.792, + "step": 52003 + }, + { + "epoch": 1.33, + "learning_rate": 1.227004402101447e-06, + "loss": 0.5269, + "step": 52004 + }, + { + "epoch": 1.33, + "learning_rate": 1.226977453932933e-06, + "loss": 0.5938, + "step": 52005 + }, + { + "epoch": 1.33, + "learning_rate": 1.2269505055906327e-06, + "loss": 0.6191, + "step": 52006 + }, + { + "epoch": 1.33, + "learning_rate": 1.226923557074567e-06, + "loss": 0.7051, + "step": 52007 + }, + { + "epoch": 1.33, + "learning_rate": 1.2268966083847559e-06, + "loss": 0.522, + "step": 52008 + }, + { + "epoch": 1.33, + "learning_rate": 1.2268696595212207e-06, + "loss": 0.7998, + "step": 52009 + }, + { + "epoch": 1.33, + "learning_rate": 1.226842710483982e-06, + "loss": 0.7451, + "step": 52010 + }, + { + "epoch": 1.33, + "learning_rate": 1.22681576127306e-06, + "loss": 0.5908, + "step": 52011 + }, + { + "epoch": 1.33, + "learning_rate": 1.2267888118884757e-06, + "loss": 0.6758, + "step": 52012 + }, + { + "epoch": 1.33, + "learning_rate": 1.2267618623302499e-06, + "loss": 0.6777, + "step": 52013 + }, + { + "epoch": 1.33, + "learning_rate": 1.2267349125984026e-06, + "loss": 0.6562, + "step": 52014 + }, + { + "epoch": 1.33, + "learning_rate": 1.2267079626929548e-06, + "loss": 0.5693, + "step": 52015 + }, + { + "epoch": 1.33, + "learning_rate": 1.2266810126139276e-06, + "loss": 0.4524, + "step": 52016 + }, + { + "epoch": 1.33, + "learning_rate": 1.226654062361341e-06, + "loss": 0.7617, + "step": 52017 + }, + { + "epoch": 1.33, + "learning_rate": 1.2266271119352155e-06, + "loss": 0.5396, + "step": 52018 + }, + { + "epoch": 1.33, + "learning_rate": 1.226600161335572e-06, + "loss": 0.5625, + "step": 52019 + }, + { + "epoch": 1.33, + "learning_rate": 1.2265732105624314e-06, + "loss": 0.8691, + "step": 52020 + }, + { + "epoch": 1.33, + "learning_rate": 1.226546259615814e-06, + "loss": 0.7744, + "step": 52021 + }, + { + "epoch": 1.33, + "learning_rate": 1.2265193084957408e-06, + "loss": 0.6592, + "step": 52022 + }, + { + "epoch": 1.33, + "learning_rate": 1.226492357202232e-06, + "loss": 0.6914, + "step": 52023 + }, + { + "epoch": 1.33, + "learning_rate": 1.2264654057353085e-06, + "loss": 0.4208, + "step": 52024 + }, + { + "epoch": 1.33, + "learning_rate": 1.226438454094991e-06, + "loss": 0.4604, + "step": 52025 + }, + { + "epoch": 1.33, + "learning_rate": 1.2264115022812997e-06, + "loss": 0.6318, + "step": 52026 + }, + { + "epoch": 1.33, + "learning_rate": 1.2263845502942553e-06, + "loss": 0.7461, + "step": 52027 + }, + { + "epoch": 1.33, + "learning_rate": 1.2263575981338792e-06, + "loss": 0.7705, + "step": 52028 + }, + { + "epoch": 1.33, + "learning_rate": 1.2263306458001909e-06, + "loss": 0.7773, + "step": 52029 + }, + { + "epoch": 1.33, + "learning_rate": 1.2263036932932123e-06, + "loss": 0.5903, + "step": 52030 + }, + { + "epoch": 1.33, + "learning_rate": 1.2262767406129631e-06, + "loss": 0.7061, + "step": 52031 + }, + { + "epoch": 1.33, + "learning_rate": 1.2262497877594642e-06, + "loss": 0.5767, + "step": 52032 + }, + { + "epoch": 1.33, + "learning_rate": 1.2262228347327358e-06, + "loss": 0.6982, + "step": 52033 + }, + { + "epoch": 1.33, + "learning_rate": 1.2261958815327998e-06, + "loss": 0.6812, + "step": 52034 + }, + { + "epoch": 1.33, + "learning_rate": 1.2261689281596752e-06, + "loss": 0.6172, + "step": 52035 + }, + { + "epoch": 1.33, + "learning_rate": 1.2261419746133842e-06, + "loss": 0.605, + "step": 52036 + }, + { + "epoch": 1.33, + "learning_rate": 1.2261150208939461e-06, + "loss": 0.5776, + "step": 52037 + }, + { + "epoch": 1.33, + "learning_rate": 1.2260880670013824e-06, + "loss": 0.6167, + "step": 52038 + }, + { + "epoch": 1.33, + "learning_rate": 1.2260611129357135e-06, + "loss": 0.6592, + "step": 52039 + }, + { + "epoch": 1.33, + "learning_rate": 1.22603415869696e-06, + "loss": 0.6943, + "step": 52040 + }, + { + "epoch": 1.33, + "learning_rate": 1.2260072042851423e-06, + "loss": 0.5617, + "step": 52041 + }, + { + "epoch": 1.33, + "learning_rate": 1.2259802497002816e-06, + "loss": 0.7285, + "step": 52042 + }, + { + "epoch": 1.33, + "learning_rate": 1.2259532949423978e-06, + "loss": 0.7783, + "step": 52043 + }, + { + "epoch": 1.33, + "learning_rate": 1.2259263400115125e-06, + "loss": 0.7871, + "step": 52044 + }, + { + "epoch": 1.33, + "learning_rate": 1.2258993849076452e-06, + "loss": 0.6594, + "step": 52045 + }, + { + "epoch": 1.33, + "learning_rate": 1.2258724296308177e-06, + "loss": 0.5889, + "step": 52046 + }, + { + "epoch": 1.33, + "learning_rate": 1.2258454741810499e-06, + "loss": 0.7715, + "step": 52047 + }, + { + "epoch": 1.33, + "learning_rate": 1.225818518558362e-06, + "loss": 0.5569, + "step": 52048 + }, + { + "epoch": 1.33, + "learning_rate": 1.225791562762776e-06, + "loss": 0.6367, + "step": 52049 + }, + { + "epoch": 1.33, + "learning_rate": 1.2257646067943114e-06, + "loss": 0.5774, + "step": 52050 + }, + { + "epoch": 1.33, + "learning_rate": 1.2257376506529895e-06, + "loss": 0.6592, + "step": 52051 + }, + { + "epoch": 1.33, + "learning_rate": 1.2257106943388306e-06, + "loss": 0.6885, + "step": 52052 + }, + { + "epoch": 1.33, + "learning_rate": 1.2256837378518553e-06, + "loss": 0.6514, + "step": 52053 + }, + { + "epoch": 1.33, + "learning_rate": 1.2256567811920842e-06, + "loss": 0.7285, + "step": 52054 + }, + { + "epoch": 1.33, + "learning_rate": 1.2256298243595381e-06, + "loss": 0.6396, + "step": 52055 + }, + { + "epoch": 1.33, + "learning_rate": 1.2256028673542377e-06, + "loss": 0.7168, + "step": 52056 + }, + { + "epoch": 1.33, + "learning_rate": 1.2255759101762039e-06, + "loss": 0.3921, + "step": 52057 + }, + { + "epoch": 1.33, + "learning_rate": 1.2255489528254566e-06, + "loss": 0.583, + "step": 52058 + }, + { + "epoch": 1.33, + "learning_rate": 1.2255219953020168e-06, + "loss": 0.6953, + "step": 52059 + }, + { + "epoch": 1.33, + "learning_rate": 1.2254950376059052e-06, + "loss": 0.5688, + "step": 52060 + }, + { + "epoch": 1.33, + "learning_rate": 1.2254680797371428e-06, + "loss": 0.6725, + "step": 52061 + }, + { + "epoch": 1.33, + "learning_rate": 1.2254411216957494e-06, + "loss": 0.5503, + "step": 52062 + }, + { + "epoch": 1.33, + "learning_rate": 1.2254141634817464e-06, + "loss": 0.4736, + "step": 52063 + }, + { + "epoch": 1.33, + "learning_rate": 1.225387205095154e-06, + "loss": 0.5679, + "step": 52064 + }, + { + "epoch": 1.33, + "learning_rate": 1.2253602465359929e-06, + "loss": 0.8252, + "step": 52065 + }, + { + "epoch": 1.33, + "learning_rate": 1.2253332878042841e-06, + "loss": 0.5625, + "step": 52066 + }, + { + "epoch": 1.33, + "learning_rate": 1.2253063289000475e-06, + "loss": 0.554, + "step": 52067 + }, + { + "epoch": 1.33, + "learning_rate": 1.2252793698233045e-06, + "loss": 0.7168, + "step": 52068 + }, + { + "epoch": 1.33, + "learning_rate": 1.2252524105740756e-06, + "loss": 0.5684, + "step": 52069 + }, + { + "epoch": 1.33, + "learning_rate": 1.225225451152381e-06, + "loss": 0.6968, + "step": 52070 + }, + { + "epoch": 1.33, + "learning_rate": 1.2251984915582418e-06, + "loss": 0.668, + "step": 52071 + }, + { + "epoch": 1.33, + "learning_rate": 1.2251715317916786e-06, + "loss": 0.541, + "step": 52072 + }, + { + "epoch": 1.33, + "learning_rate": 1.2251445718527116e-06, + "loss": 0.6514, + "step": 52073 + }, + { + "epoch": 1.33, + "learning_rate": 1.225117611741362e-06, + "loss": 0.6631, + "step": 52074 + }, + { + "epoch": 1.33, + "learning_rate": 1.2250906514576498e-06, + "loss": 0.7295, + "step": 52075 + }, + { + "epoch": 1.33, + "learning_rate": 1.2250636910015965e-06, + "loss": 0.6934, + "step": 52076 + }, + { + "epoch": 1.33, + "learning_rate": 1.2250367303732222e-06, + "loss": 0.7178, + "step": 52077 + }, + { + "epoch": 1.33, + "learning_rate": 1.2250097695725474e-06, + "loss": 0.7803, + "step": 52078 + }, + { + "epoch": 1.33, + "learning_rate": 1.224982808599593e-06, + "loss": 0.7666, + "step": 52079 + }, + { + "epoch": 1.33, + "learning_rate": 1.2249558474543798e-06, + "loss": 0.627, + "step": 52080 + }, + { + "epoch": 1.33, + "learning_rate": 1.2249288861369283e-06, + "loss": 0.7822, + "step": 52081 + }, + { + "epoch": 1.33, + "learning_rate": 1.2249019246472589e-06, + "loss": 0.7646, + "step": 52082 + }, + { + "epoch": 1.33, + "learning_rate": 1.2248749629853923e-06, + "loss": 0.7285, + "step": 52083 + }, + { + "epoch": 1.33, + "learning_rate": 1.2248480011513496e-06, + "loss": 0.624, + "step": 52084 + }, + { + "epoch": 1.33, + "learning_rate": 1.2248210391451508e-06, + "loss": 0.481, + "step": 52085 + }, + { + "epoch": 1.33, + "learning_rate": 1.2247940769668174e-06, + "loss": 0.7983, + "step": 52086 + }, + { + "epoch": 1.34, + "learning_rate": 1.224767114616369e-06, + "loss": 0.6255, + "step": 52087 + }, + { + "epoch": 1.34, + "learning_rate": 1.224740152093827e-06, + "loss": 0.7852, + "step": 52088 + }, + { + "epoch": 1.34, + "learning_rate": 1.2247131893992115e-06, + "loss": 0.606, + "step": 52089 + }, + { + "epoch": 1.34, + "learning_rate": 1.2246862265325437e-06, + "loss": 0.5791, + "step": 52090 + }, + { + "epoch": 1.34, + "learning_rate": 1.2246592634938442e-06, + "loss": 0.5605, + "step": 52091 + }, + { + "epoch": 1.34, + "learning_rate": 1.224632300283133e-06, + "loss": 0.6255, + "step": 52092 + }, + { + "epoch": 1.34, + "learning_rate": 1.2246053369004314e-06, + "loss": 0.604, + "step": 52093 + }, + { + "epoch": 1.34, + "learning_rate": 1.2245783733457596e-06, + "loss": 0.792, + "step": 52094 + }, + { + "epoch": 1.34, + "learning_rate": 1.2245514096191386e-06, + "loss": 0.7334, + "step": 52095 + }, + { + "epoch": 1.34, + "learning_rate": 1.2245244457205893e-06, + "loss": 0.668, + "step": 52096 + }, + { + "epoch": 1.34, + "learning_rate": 1.2244974816501314e-06, + "loss": 0.4081, + "step": 52097 + }, + { + "epoch": 1.34, + "learning_rate": 1.2244705174077862e-06, + "loss": 0.6494, + "step": 52098 + }, + { + "epoch": 1.34, + "learning_rate": 1.2244435529935746e-06, + "loss": 0.7773, + "step": 52099 + }, + { + "epoch": 1.34, + "learning_rate": 1.2244165884075164e-06, + "loss": 0.7773, + "step": 52100 + }, + { + "epoch": 1.34, + "learning_rate": 1.2243896236496334e-06, + "loss": 0.8467, + "step": 52101 + }, + { + "epoch": 1.34, + "learning_rate": 1.224362658719945e-06, + "loss": 0.6978, + "step": 52102 + }, + { + "epoch": 1.34, + "learning_rate": 1.2243356936184726e-06, + "loss": 0.5728, + "step": 52103 + }, + { + "epoch": 1.34, + "learning_rate": 1.2243087283452364e-06, + "loss": 0.625, + "step": 52104 + }, + { + "epoch": 1.34, + "learning_rate": 1.2242817629002577e-06, + "loss": 0.5156, + "step": 52105 + }, + { + "epoch": 1.34, + "learning_rate": 1.2242547972835569e-06, + "loss": 0.6069, + "step": 52106 + }, + { + "epoch": 1.34, + "learning_rate": 1.2242278314951542e-06, + "loss": 0.7529, + "step": 52107 + }, + { + "epoch": 1.34, + "learning_rate": 1.2242008655350706e-06, + "loss": 0.7412, + "step": 52108 + }, + { + "epoch": 1.34, + "learning_rate": 1.2241738994033267e-06, + "loss": 0.6934, + "step": 52109 + }, + { + "epoch": 1.34, + "learning_rate": 1.2241469330999433e-06, + "loss": 0.5872, + "step": 52110 + }, + { + "epoch": 1.34, + "learning_rate": 1.2241199666249408e-06, + "loss": 0.6572, + "step": 52111 + }, + { + "epoch": 1.34, + "learning_rate": 1.2240929999783398e-06, + "loss": 0.3173, + "step": 52112 + }, + { + "epoch": 1.34, + "learning_rate": 1.2240660331601614e-06, + "loss": 0.5632, + "step": 52113 + }, + { + "epoch": 1.34, + "learning_rate": 1.2240390661704257e-06, + "loss": 0.4365, + "step": 52114 + }, + { + "epoch": 1.34, + "learning_rate": 1.2240120990091537e-06, + "loss": 0.5957, + "step": 52115 + }, + { + "epoch": 1.34, + "learning_rate": 1.2239851316763658e-06, + "loss": 0.5698, + "step": 52116 + }, + { + "epoch": 1.34, + "learning_rate": 1.223958164172083e-06, + "loss": 0.6406, + "step": 52117 + }, + { + "epoch": 1.34, + "learning_rate": 1.2239311964963254e-06, + "loss": 0.6523, + "step": 52118 + }, + { + "epoch": 1.34, + "learning_rate": 1.223904228649114e-06, + "loss": 0.7139, + "step": 52119 + }, + { + "epoch": 1.34, + "learning_rate": 1.2238772606304698e-06, + "loss": 0.6279, + "step": 52120 + }, + { + "epoch": 1.34, + "learning_rate": 1.223850292440413e-06, + "loss": 0.7236, + "step": 52121 + }, + { + "epoch": 1.34, + "learning_rate": 1.2238233240789644e-06, + "loss": 0.6738, + "step": 52122 + }, + { + "epoch": 1.34, + "learning_rate": 1.223796355546144e-06, + "loss": 0.7051, + "step": 52123 + }, + { + "epoch": 1.34, + "learning_rate": 1.2237693868419738e-06, + "loss": 0.6289, + "step": 52124 + }, + { + "epoch": 1.34, + "learning_rate": 1.2237424179664731e-06, + "loss": 0.6675, + "step": 52125 + }, + { + "epoch": 1.34, + "learning_rate": 1.2237154489196634e-06, + "loss": 0.6338, + "step": 52126 + }, + { + "epoch": 1.34, + "learning_rate": 1.223688479701565e-06, + "loss": 0.6313, + "step": 52127 + }, + { + "epoch": 1.34, + "learning_rate": 1.2236615103121985e-06, + "loss": 0.6111, + "step": 52128 + }, + { + "epoch": 1.34, + "learning_rate": 1.2236345407515846e-06, + "loss": 0.606, + "step": 52129 + }, + { + "epoch": 1.34, + "learning_rate": 1.2236075710197444e-06, + "loss": 0.6509, + "step": 52130 + }, + { + "epoch": 1.34, + "learning_rate": 1.2235806011166981e-06, + "loss": 0.5195, + "step": 52131 + }, + { + "epoch": 1.34, + "learning_rate": 1.223553631042466e-06, + "loss": 0.5151, + "step": 52132 + }, + { + "epoch": 1.34, + "learning_rate": 1.2235266607970696e-06, + "loss": 0.6875, + "step": 52133 + }, + { + "epoch": 1.34, + "learning_rate": 1.2234996903805289e-06, + "loss": 0.6992, + "step": 52134 + }, + { + "epoch": 1.34, + "learning_rate": 1.2234727197928646e-06, + "loss": 0.585, + "step": 52135 + }, + { + "epoch": 1.34, + "learning_rate": 1.2234457490340978e-06, + "loss": 0.6787, + "step": 52136 + }, + { + "epoch": 1.34, + "learning_rate": 1.223418778104249e-06, + "loss": 0.5825, + "step": 52137 + }, + { + "epoch": 1.34, + "learning_rate": 1.2233918070033382e-06, + "loss": 0.5085, + "step": 52138 + }, + { + "epoch": 1.34, + "learning_rate": 1.2233648357313867e-06, + "loss": 0.6138, + "step": 52139 + }, + { + "epoch": 1.34, + "learning_rate": 1.223337864288415e-06, + "loss": 0.7441, + "step": 52140 + }, + { + "epoch": 1.34, + "learning_rate": 1.2233108926744444e-06, + "loss": 0.7524, + "step": 52141 + }, + { + "epoch": 1.34, + "learning_rate": 1.2232839208894942e-06, + "loss": 0.6279, + "step": 52142 + }, + { + "epoch": 1.34, + "learning_rate": 1.2232569489335863e-06, + "loss": 0.7725, + "step": 52143 + }, + { + "epoch": 1.34, + "learning_rate": 1.2232299768067403e-06, + "loss": 0.8242, + "step": 52144 + }, + { + "epoch": 1.34, + "learning_rate": 1.2232030045089775e-06, + "loss": 0.6777, + "step": 52145 + }, + { + "epoch": 1.34, + "learning_rate": 1.2231760320403189e-06, + "loss": 0.4377, + "step": 52146 + }, + { + "epoch": 1.34, + "learning_rate": 1.2231490594007842e-06, + "loss": 0.4834, + "step": 52147 + }, + { + "epoch": 1.34, + "learning_rate": 1.2231220865903945e-06, + "loss": 0.7471, + "step": 52148 + }, + { + "epoch": 1.34, + "learning_rate": 1.2230951136091708e-06, + "loss": 0.7817, + "step": 52149 + }, + { + "epoch": 1.34, + "learning_rate": 1.2230681404571333e-06, + "loss": 0.5791, + "step": 52150 + }, + { + "epoch": 1.34, + "learning_rate": 1.223041167134303e-06, + "loss": 0.6543, + "step": 52151 + }, + { + "epoch": 1.34, + "learning_rate": 1.2230141936406996e-06, + "loss": 0.6216, + "step": 52152 + }, + { + "epoch": 1.34, + "learning_rate": 1.2229872199763451e-06, + "loss": 0.6797, + "step": 52153 + }, + { + "epoch": 1.34, + "learning_rate": 1.2229602461412592e-06, + "loss": 0.6021, + "step": 52154 + }, + { + "epoch": 1.34, + "learning_rate": 1.222933272135463e-06, + "loss": 0.6099, + "step": 52155 + }, + { + "epoch": 1.34, + "learning_rate": 1.2229062979589773e-06, + "loss": 0.4802, + "step": 52156 + }, + { + "epoch": 1.34, + "learning_rate": 1.2228793236118223e-06, + "loss": 0.667, + "step": 52157 + }, + { + "epoch": 1.34, + "learning_rate": 1.2228523490940188e-06, + "loss": 0.7295, + "step": 52158 + }, + { + "epoch": 1.34, + "learning_rate": 1.2228253744055876e-06, + "loss": 0.5552, + "step": 52159 + }, + { + "epoch": 1.34, + "learning_rate": 1.2227983995465495e-06, + "loss": 0.7197, + "step": 52160 + }, + { + "epoch": 1.34, + "learning_rate": 1.2227714245169244e-06, + "loss": 0.7539, + "step": 52161 + }, + { + "epoch": 1.34, + "learning_rate": 1.2227444493167335e-06, + "loss": 0.8057, + "step": 52162 + }, + { + "epoch": 1.34, + "learning_rate": 1.2227174739459979e-06, + "loss": 0.6063, + "step": 52163 + }, + { + "epoch": 1.34, + "learning_rate": 1.2226904984047373e-06, + "loss": 0.5376, + "step": 52164 + }, + { + "epoch": 1.34, + "learning_rate": 1.222663522692973e-06, + "loss": 0.6445, + "step": 52165 + }, + { + "epoch": 1.34, + "learning_rate": 1.2226365468107257e-06, + "loss": 0.6602, + "step": 52166 + }, + { + "epoch": 1.34, + "learning_rate": 1.2226095707580154e-06, + "loss": 0.6436, + "step": 52167 + }, + { + "epoch": 1.34, + "learning_rate": 1.2225825945348635e-06, + "loss": 0.7285, + "step": 52168 + }, + { + "epoch": 1.34, + "learning_rate": 1.22255561814129e-06, + "loss": 0.5247, + "step": 52169 + }, + { + "epoch": 1.34, + "learning_rate": 1.2225286415773167e-06, + "loss": 0.427, + "step": 52170 + }, + { + "epoch": 1.34, + "learning_rate": 1.2225016648429628e-06, + "loss": 0.7871, + "step": 52171 + }, + { + "epoch": 1.34, + "learning_rate": 1.2224746879382494e-06, + "loss": 0.5757, + "step": 52172 + }, + { + "epoch": 1.34, + "learning_rate": 1.2224477108631977e-06, + "loss": 0.5671, + "step": 52173 + }, + { + "epoch": 1.34, + "learning_rate": 1.222420733617828e-06, + "loss": 0.5088, + "step": 52174 + }, + { + "epoch": 1.34, + "learning_rate": 1.222393756202161e-06, + "loss": 0.605, + "step": 52175 + }, + { + "epoch": 1.34, + "learning_rate": 1.2223667786162174e-06, + "loss": 0.7998, + "step": 52176 + }, + { + "epoch": 1.34, + "learning_rate": 1.2223398008600176e-06, + "loss": 0.5728, + "step": 52177 + }, + { + "epoch": 1.34, + "learning_rate": 1.2223128229335826e-06, + "loss": 0.626, + "step": 52178 + }, + { + "epoch": 1.34, + "learning_rate": 1.2222858448369327e-06, + "loss": 0.7295, + "step": 52179 + }, + { + "epoch": 1.34, + "learning_rate": 1.2222588665700888e-06, + "loss": 0.7002, + "step": 52180 + }, + { + "epoch": 1.34, + "learning_rate": 1.2222318881330716e-06, + "loss": 0.3877, + "step": 52181 + }, + { + "epoch": 1.34, + "learning_rate": 1.2222049095259014e-06, + "loss": 0.5464, + "step": 52182 + }, + { + "epoch": 1.34, + "learning_rate": 1.2221779307485996e-06, + "loss": 0.7676, + "step": 52183 + }, + { + "epoch": 1.34, + "learning_rate": 1.2221509518011858e-06, + "loss": 0.6738, + "step": 52184 + }, + { + "epoch": 1.34, + "learning_rate": 1.2221239726836818e-06, + "loss": 0.7124, + "step": 52185 + }, + { + "epoch": 1.34, + "learning_rate": 1.2220969933961075e-06, + "loss": 0.6406, + "step": 52186 + }, + { + "epoch": 1.34, + "learning_rate": 1.2220700139384836e-06, + "loss": 0.6997, + "step": 52187 + }, + { + "epoch": 1.34, + "learning_rate": 1.2220430343108308e-06, + "loss": 0.6328, + "step": 52188 + }, + { + "epoch": 1.34, + "learning_rate": 1.2220160545131702e-06, + "loss": 0.7222, + "step": 52189 + }, + { + "epoch": 1.34, + "learning_rate": 1.221989074545522e-06, + "loss": 0.751, + "step": 52190 + }, + { + "epoch": 1.34, + "learning_rate": 1.221962094407907e-06, + "loss": 0.6782, + "step": 52191 + }, + { + "epoch": 1.34, + "learning_rate": 1.2219351141003455e-06, + "loss": 0.7832, + "step": 52192 + }, + { + "epoch": 1.34, + "learning_rate": 1.2219081336228588e-06, + "loss": 0.5928, + "step": 52193 + }, + { + "epoch": 1.34, + "learning_rate": 1.2218811529754672e-06, + "loss": 0.6294, + "step": 52194 + }, + { + "epoch": 1.34, + "learning_rate": 1.2218541721581913e-06, + "loss": 0.6758, + "step": 52195 + }, + { + "epoch": 1.34, + "learning_rate": 1.2218271911710521e-06, + "loss": 0.5713, + "step": 52196 + }, + { + "epoch": 1.34, + "learning_rate": 1.2218002100140699e-06, + "loss": 0.5928, + "step": 52197 + }, + { + "epoch": 1.34, + "learning_rate": 1.2217732286872654e-06, + "loss": 0.7285, + "step": 52198 + }, + { + "epoch": 1.34, + "learning_rate": 1.2217462471906593e-06, + "loss": 0.4734, + "step": 52199 + }, + { + "epoch": 1.34, + "learning_rate": 1.2217192655242725e-06, + "loss": 0.3972, + "step": 52200 + }, + { + "epoch": 1.34, + "learning_rate": 1.221692283688125e-06, + "loss": 0.5317, + "step": 52201 + }, + { + "epoch": 1.34, + "learning_rate": 1.2216653016822386e-06, + "loss": 0.5051, + "step": 52202 + }, + { + "epoch": 1.34, + "learning_rate": 1.221638319506633e-06, + "loss": 0.7725, + "step": 52203 + }, + { + "epoch": 1.34, + "learning_rate": 1.2216113371613289e-06, + "loss": 0.6436, + "step": 52204 + }, + { + "epoch": 1.34, + "learning_rate": 1.2215843546463472e-06, + "loss": 0.793, + "step": 52205 + }, + { + "epoch": 1.34, + "learning_rate": 1.2215573719617086e-06, + "loss": 0.6577, + "step": 52206 + }, + { + "epoch": 1.34, + "learning_rate": 1.2215303891074337e-06, + "loss": 0.6372, + "step": 52207 + }, + { + "epoch": 1.34, + "learning_rate": 1.2215034060835434e-06, + "loss": 0.7578, + "step": 52208 + }, + { + "epoch": 1.34, + "learning_rate": 1.2214764228900579e-06, + "loss": 0.5449, + "step": 52209 + }, + { + "epoch": 1.34, + "learning_rate": 1.2214494395269982e-06, + "loss": 0.6055, + "step": 52210 + }, + { + "epoch": 1.34, + "learning_rate": 1.2214224559943848e-06, + "loss": 0.481, + "step": 52211 + }, + { + "epoch": 1.34, + "learning_rate": 1.2213954722922386e-06, + "loss": 0.6201, + "step": 52212 + }, + { + "epoch": 1.34, + "learning_rate": 1.2213684884205797e-06, + "loss": 0.6846, + "step": 52213 + }, + { + "epoch": 1.34, + "learning_rate": 1.2213415043794293e-06, + "loss": 0.7051, + "step": 52214 + }, + { + "epoch": 1.34, + "learning_rate": 1.221314520168808e-06, + "loss": 0.6851, + "step": 52215 + }, + { + "epoch": 1.34, + "learning_rate": 1.2212875357887362e-06, + "loss": 0.666, + "step": 52216 + }, + { + "epoch": 1.34, + "learning_rate": 1.2212605512392347e-06, + "loss": 0.7959, + "step": 52217 + }, + { + "epoch": 1.34, + "learning_rate": 1.2212335665203243e-06, + "loss": 0.6064, + "step": 52218 + }, + { + "epoch": 1.34, + "learning_rate": 1.2212065816320254e-06, + "loss": 0.606, + "step": 52219 + }, + { + "epoch": 1.34, + "learning_rate": 1.221179596574359e-06, + "loss": 0.5181, + "step": 52220 + }, + { + "epoch": 1.34, + "learning_rate": 1.2211526113473453e-06, + "loss": 0.668, + "step": 52221 + }, + { + "epoch": 1.34, + "learning_rate": 1.2211256259510053e-06, + "loss": 0.6621, + "step": 52222 + }, + { + "epoch": 1.34, + "learning_rate": 1.2210986403853595e-06, + "loss": 0.5796, + "step": 52223 + }, + { + "epoch": 1.34, + "learning_rate": 1.221071654650429e-06, + "loss": 0.3679, + "step": 52224 + }, + { + "epoch": 1.34, + "learning_rate": 1.221044668746234e-06, + "loss": 0.5488, + "step": 52225 + }, + { + "epoch": 1.34, + "learning_rate": 1.2210176826727947e-06, + "loss": 0.6504, + "step": 52226 + }, + { + "epoch": 1.34, + "learning_rate": 1.2209906964301328e-06, + "loss": 0.7021, + "step": 52227 + }, + { + "epoch": 1.34, + "learning_rate": 1.2209637100182683e-06, + "loss": 0.6826, + "step": 52228 + }, + { + "epoch": 1.34, + "learning_rate": 1.220936723437222e-06, + "loss": 0.7383, + "step": 52229 + }, + { + "epoch": 1.34, + "learning_rate": 1.220909736687015e-06, + "loss": 0.7114, + "step": 52230 + }, + { + "epoch": 1.34, + "learning_rate": 1.2208827497676675e-06, + "loss": 0.7363, + "step": 52231 + }, + { + "epoch": 1.34, + "learning_rate": 1.2208557626791998e-06, + "loss": 0.5483, + "step": 52232 + }, + { + "epoch": 1.34, + "learning_rate": 1.2208287754216332e-06, + "loss": 0.5337, + "step": 52233 + }, + { + "epoch": 1.34, + "learning_rate": 1.2208017879949883e-06, + "loss": 0.7275, + "step": 52234 + }, + { + "epoch": 1.34, + "learning_rate": 1.2207748003992857e-06, + "loss": 0.7415, + "step": 52235 + }, + { + "epoch": 1.34, + "learning_rate": 1.2207478126345459e-06, + "loss": 0.6377, + "step": 52236 + }, + { + "epoch": 1.34, + "learning_rate": 1.2207208247007895e-06, + "loss": 0.5918, + "step": 52237 + }, + { + "epoch": 1.34, + "learning_rate": 1.2206938365980373e-06, + "loss": 0.5579, + "step": 52238 + }, + { + "epoch": 1.34, + "learning_rate": 1.2206668483263102e-06, + "loss": 0.6187, + "step": 52239 + }, + { + "epoch": 1.34, + "learning_rate": 1.2206398598856285e-06, + "loss": 0.564, + "step": 52240 + }, + { + "epoch": 1.34, + "learning_rate": 1.220612871276013e-06, + "loss": 0.6633, + "step": 52241 + }, + { + "epoch": 1.34, + "learning_rate": 1.2205858824974843e-06, + "loss": 0.5962, + "step": 52242 + }, + { + "epoch": 1.34, + "learning_rate": 1.2205588935500633e-06, + "loss": 0.6621, + "step": 52243 + }, + { + "epoch": 1.34, + "learning_rate": 1.2205319044337703e-06, + "loss": 0.55, + "step": 52244 + }, + { + "epoch": 1.34, + "learning_rate": 1.2205049151486265e-06, + "loss": 0.791, + "step": 52245 + }, + { + "epoch": 1.34, + "learning_rate": 1.2204779256946518e-06, + "loss": 0.5737, + "step": 52246 + }, + { + "epoch": 1.34, + "learning_rate": 1.2204509360718675e-06, + "loss": 0.626, + "step": 52247 + }, + { + "epoch": 1.34, + "learning_rate": 1.220423946280294e-06, + "loss": 0.5234, + "step": 52248 + }, + { + "epoch": 1.34, + "learning_rate": 1.220396956319952e-06, + "loss": 0.5986, + "step": 52249 + }, + { + "epoch": 1.34, + "learning_rate": 1.2203699661908627e-06, + "loss": 0.561, + "step": 52250 + }, + { + "epoch": 1.34, + "learning_rate": 1.2203429758930454e-06, + "loss": 0.7412, + "step": 52251 + }, + { + "epoch": 1.34, + "learning_rate": 1.2203159854265222e-06, + "loss": 0.7598, + "step": 52252 + }, + { + "epoch": 1.34, + "learning_rate": 1.2202889947913129e-06, + "loss": 0.7451, + "step": 52253 + }, + { + "epoch": 1.34, + "learning_rate": 1.2202620039874385e-06, + "loss": 0.3427, + "step": 52254 + }, + { + "epoch": 1.34, + "learning_rate": 1.2202350130149197e-06, + "loss": 0.6035, + "step": 52255 + }, + { + "epoch": 1.34, + "learning_rate": 1.2202080218737771e-06, + "loss": 0.7568, + "step": 52256 + }, + { + "epoch": 1.34, + "learning_rate": 1.2201810305640312e-06, + "loss": 0.7266, + "step": 52257 + }, + { + "epoch": 1.34, + "learning_rate": 1.220154039085703e-06, + "loss": 0.5464, + "step": 52258 + }, + { + "epoch": 1.34, + "learning_rate": 1.2201270474388126e-06, + "loss": 0.8105, + "step": 52259 + }, + { + "epoch": 1.34, + "learning_rate": 1.2201000556233816e-06, + "loss": 0.6265, + "step": 52260 + }, + { + "epoch": 1.34, + "learning_rate": 1.2200730636394296e-06, + "loss": 0.5537, + "step": 52261 + }, + { + "epoch": 1.34, + "learning_rate": 1.2200460714869782e-06, + "loss": 0.6147, + "step": 52262 + }, + { + "epoch": 1.34, + "learning_rate": 1.220019079166047e-06, + "loss": 0.8047, + "step": 52263 + }, + { + "epoch": 1.34, + "learning_rate": 1.219992086676658e-06, + "loss": 0.7471, + "step": 52264 + }, + { + "epoch": 1.34, + "learning_rate": 1.219965094018831e-06, + "loss": 0.5015, + "step": 52265 + }, + { + "epoch": 1.34, + "learning_rate": 1.219938101192587e-06, + "loss": 0.5278, + "step": 52266 + }, + { + "epoch": 1.34, + "learning_rate": 1.219911108197946e-06, + "loss": 0.4126, + "step": 52267 + }, + { + "epoch": 1.34, + "learning_rate": 1.2198841150349296e-06, + "loss": 0.7344, + "step": 52268 + }, + { + "epoch": 1.34, + "learning_rate": 1.2198571217035576e-06, + "loss": 0.707, + "step": 52269 + }, + { + "epoch": 1.34, + "learning_rate": 1.2198301282038514e-06, + "loss": 0.6274, + "step": 52270 + }, + { + "epoch": 1.34, + "learning_rate": 1.2198031345358314e-06, + "loss": 0.6406, + "step": 52271 + }, + { + "epoch": 1.34, + "learning_rate": 1.2197761406995181e-06, + "loss": 0.4661, + "step": 52272 + }, + { + "epoch": 1.34, + "learning_rate": 1.2197491466949326e-06, + "loss": 0.668, + "step": 52273 + }, + { + "epoch": 1.34, + "learning_rate": 1.2197221525220948e-06, + "loss": 0.7129, + "step": 52274 + }, + { + "epoch": 1.34, + "learning_rate": 1.2196951581810266e-06, + "loss": 0.6992, + "step": 52275 + }, + { + "epoch": 1.34, + "learning_rate": 1.2196681636717475e-06, + "loss": 0.6816, + "step": 52276 + }, + { + "epoch": 1.34, + "learning_rate": 1.2196411689942786e-06, + "loss": 0.605, + "step": 52277 + }, + { + "epoch": 1.34, + "learning_rate": 1.2196141741486404e-06, + "loss": 0.5787, + "step": 52278 + }, + { + "epoch": 1.34, + "learning_rate": 1.2195871791348537e-06, + "loss": 0.751, + "step": 52279 + }, + { + "epoch": 1.34, + "learning_rate": 1.2195601839529394e-06, + "loss": 0.5942, + "step": 52280 + }, + { + "epoch": 1.34, + "learning_rate": 1.219533188602918e-06, + "loss": 0.6572, + "step": 52281 + }, + { + "epoch": 1.34, + "learning_rate": 1.2195061930848099e-06, + "loss": 0.6021, + "step": 52282 + }, + { + "epoch": 1.34, + "learning_rate": 1.2194791973986363e-06, + "loss": 0.4277, + "step": 52283 + }, + { + "epoch": 1.34, + "learning_rate": 1.2194522015444174e-06, + "loss": 0.6235, + "step": 52284 + }, + { + "epoch": 1.34, + "learning_rate": 1.2194252055221742e-06, + "loss": 0.6699, + "step": 52285 + }, + { + "epoch": 1.34, + "learning_rate": 1.219398209331927e-06, + "loss": 0.668, + "step": 52286 + }, + { + "epoch": 1.34, + "learning_rate": 1.2193712129736967e-06, + "loss": 0.5601, + "step": 52287 + }, + { + "epoch": 1.34, + "learning_rate": 1.2193442164475038e-06, + "loss": 0.6758, + "step": 52288 + }, + { + "epoch": 1.34, + "learning_rate": 1.2193172197533693e-06, + "loss": 0.7446, + "step": 52289 + }, + { + "epoch": 1.34, + "learning_rate": 1.2192902228913137e-06, + "loss": 0.7412, + "step": 52290 + }, + { + "epoch": 1.34, + "learning_rate": 1.2192632258613578e-06, + "loss": 0.4156, + "step": 52291 + }, + { + "epoch": 1.34, + "learning_rate": 1.2192362286635218e-06, + "loss": 0.6851, + "step": 52292 + }, + { + "epoch": 1.34, + "learning_rate": 1.219209231297827e-06, + "loss": 0.4758, + "step": 52293 + }, + { + "epoch": 1.34, + "learning_rate": 1.2191822337642936e-06, + "loss": 0.7168, + "step": 52294 + }, + { + "epoch": 1.34, + "learning_rate": 1.2191552360629427e-06, + "loss": 0.6177, + "step": 52295 + }, + { + "epoch": 1.34, + "learning_rate": 1.2191282381937944e-06, + "loss": 0.6655, + "step": 52296 + }, + { + "epoch": 1.34, + "learning_rate": 1.2191012401568696e-06, + "loss": 0.7007, + "step": 52297 + }, + { + "epoch": 1.34, + "learning_rate": 1.2190742419521893e-06, + "loss": 0.5493, + "step": 52298 + }, + { + "epoch": 1.34, + "learning_rate": 1.2190472435797738e-06, + "loss": 0.8281, + "step": 52299 + }, + { + "epoch": 1.34, + "learning_rate": 1.2190202450396443e-06, + "loss": 0.6743, + "step": 52300 + }, + { + "epoch": 1.34, + "learning_rate": 1.2189932463318207e-06, + "loss": 0.6758, + "step": 52301 + }, + { + "epoch": 1.34, + "learning_rate": 1.2189662474563241e-06, + "loss": 0.6797, + "step": 52302 + }, + { + "epoch": 1.34, + "learning_rate": 1.2189392484131748e-06, + "loss": 0.7578, + "step": 52303 + }, + { + "epoch": 1.34, + "learning_rate": 1.2189122492023942e-06, + "loss": 0.6738, + "step": 52304 + }, + { + "epoch": 1.34, + "learning_rate": 1.2188852498240026e-06, + "loss": 0.6895, + "step": 52305 + }, + { + "epoch": 1.34, + "learning_rate": 1.2188582502780204e-06, + "loss": 0.7939, + "step": 52306 + }, + { + "epoch": 1.34, + "learning_rate": 1.2188312505644684e-06, + "loss": 0.8149, + "step": 52307 + }, + { + "epoch": 1.34, + "learning_rate": 1.2188042506833678e-06, + "loss": 0.7612, + "step": 52308 + }, + { + "epoch": 1.34, + "learning_rate": 1.2187772506347385e-06, + "loss": 0.7432, + "step": 52309 + }, + { + "epoch": 1.34, + "learning_rate": 1.2187502504186016e-06, + "loss": 0.6499, + "step": 52310 + }, + { + "epoch": 1.34, + "learning_rate": 1.2187232500349777e-06, + "loss": 0.6206, + "step": 52311 + }, + { + "epoch": 1.34, + "learning_rate": 1.2186962494838878e-06, + "loss": 0.4639, + "step": 52312 + }, + { + "epoch": 1.34, + "learning_rate": 1.2186692487653516e-06, + "loss": 0.7246, + "step": 52313 + }, + { + "epoch": 1.34, + "learning_rate": 1.2186422478793908e-06, + "loss": 0.7383, + "step": 52314 + }, + { + "epoch": 1.34, + "learning_rate": 1.2186152468260256e-06, + "loss": 0.4672, + "step": 52315 + }, + { + "epoch": 1.34, + "learning_rate": 1.2185882456052765e-06, + "loss": 0.5693, + "step": 52316 + }, + { + "epoch": 1.34, + "learning_rate": 1.218561244217165e-06, + "loss": 0.7622, + "step": 52317 + }, + { + "epoch": 1.34, + "learning_rate": 1.2185342426617106e-06, + "loss": 0.4612, + "step": 52318 + }, + { + "epoch": 1.34, + "learning_rate": 1.218507240938935e-06, + "loss": 0.7539, + "step": 52319 + }, + { + "epoch": 1.34, + "learning_rate": 1.2184802390488584e-06, + "loss": 0.7793, + "step": 52320 + }, + { + "epoch": 1.34, + "learning_rate": 1.2184532369915015e-06, + "loss": 0.6709, + "step": 52321 + }, + { + "epoch": 1.34, + "learning_rate": 1.2184262347668847e-06, + "loss": 0.4741, + "step": 52322 + }, + { + "epoch": 1.34, + "learning_rate": 1.2183992323750294e-06, + "loss": 0.8066, + "step": 52323 + }, + { + "epoch": 1.34, + "learning_rate": 1.2183722298159555e-06, + "loss": 0.6182, + "step": 52324 + }, + { + "epoch": 1.34, + "learning_rate": 1.2183452270896846e-06, + "loss": 0.667, + "step": 52325 + }, + { + "epoch": 1.34, + "learning_rate": 1.2183182241962362e-06, + "loss": 0.5845, + "step": 52326 + }, + { + "epoch": 1.34, + "learning_rate": 1.2182912211356319e-06, + "loss": 0.7363, + "step": 52327 + }, + { + "epoch": 1.34, + "learning_rate": 1.2182642179078918e-06, + "loss": 0.6411, + "step": 52328 + }, + { + "epoch": 1.34, + "learning_rate": 1.2182372145130368e-06, + "loss": 0.6846, + "step": 52329 + }, + { + "epoch": 1.34, + "learning_rate": 1.2182102109510878e-06, + "loss": 0.4487, + "step": 52330 + }, + { + "epoch": 1.34, + "learning_rate": 1.2181832072220654e-06, + "loss": 0.626, + "step": 52331 + }, + { + "epoch": 1.34, + "learning_rate": 1.2181562033259898e-06, + "loss": 0.5757, + "step": 52332 + }, + { + "epoch": 1.34, + "learning_rate": 1.2181291992628824e-06, + "loss": 0.6396, + "step": 52333 + }, + { + "epoch": 1.34, + "learning_rate": 1.218102195032763e-06, + "loss": 0.7471, + "step": 52334 + }, + { + "epoch": 1.34, + "learning_rate": 1.2180751906356532e-06, + "loss": 0.5513, + "step": 52335 + }, + { + "epoch": 1.34, + "learning_rate": 1.2180481860715731e-06, + "loss": 0.6641, + "step": 52336 + }, + { + "epoch": 1.34, + "learning_rate": 1.2180211813405433e-06, + "loss": 0.7344, + "step": 52337 + }, + { + "epoch": 1.34, + "learning_rate": 1.2179941764425852e-06, + "loss": 0.752, + "step": 52338 + }, + { + "epoch": 1.34, + "learning_rate": 1.217967171377719e-06, + "loss": 0.7871, + "step": 52339 + }, + { + "epoch": 1.34, + "learning_rate": 1.217940166145965e-06, + "loss": 0.7256, + "step": 52340 + }, + { + "epoch": 1.34, + "learning_rate": 1.2179131607473443e-06, + "loss": 0.7656, + "step": 52341 + }, + { + "epoch": 1.34, + "learning_rate": 1.2178861551818775e-06, + "loss": 0.6055, + "step": 52342 + }, + { + "epoch": 1.34, + "learning_rate": 1.2178591494495854e-06, + "loss": 0.6167, + "step": 52343 + }, + { + "epoch": 1.34, + "learning_rate": 1.2178321435504887e-06, + "loss": 0.7383, + "step": 52344 + }, + { + "epoch": 1.34, + "learning_rate": 1.2178051374846076e-06, + "loss": 0.6836, + "step": 52345 + }, + { + "epoch": 1.34, + "learning_rate": 1.2177781312519635e-06, + "loss": 0.5974, + "step": 52346 + }, + { + "epoch": 1.34, + "learning_rate": 1.2177511248525763e-06, + "loss": 0.6416, + "step": 52347 + }, + { + "epoch": 1.34, + "learning_rate": 1.2177241182864672e-06, + "loss": 0.4988, + "step": 52348 + }, + { + "epoch": 1.34, + "learning_rate": 1.2176971115536567e-06, + "loss": 0.6611, + "step": 52349 + }, + { + "epoch": 1.34, + "learning_rate": 1.217670104654166e-06, + "loss": 0.4407, + "step": 52350 + }, + { + "epoch": 1.34, + "learning_rate": 1.2176430975880147e-06, + "loss": 0.7676, + "step": 52351 + }, + { + "epoch": 1.34, + "learning_rate": 1.2176160903552244e-06, + "loss": 0.5033, + "step": 52352 + }, + { + "epoch": 1.34, + "learning_rate": 1.2175890829558153e-06, + "loss": 0.8174, + "step": 52353 + }, + { + "epoch": 1.34, + "learning_rate": 1.2175620753898083e-06, + "loss": 0.7168, + "step": 52354 + }, + { + "epoch": 1.34, + "learning_rate": 1.2175350676572243e-06, + "loss": 0.6484, + "step": 52355 + }, + { + "epoch": 1.34, + "learning_rate": 1.2175080597580836e-06, + "loss": 0.7529, + "step": 52356 + }, + { + "epoch": 1.34, + "learning_rate": 1.2174810516924066e-06, + "loss": 0.5842, + "step": 52357 + }, + { + "epoch": 1.34, + "learning_rate": 1.2174540434602146e-06, + "loss": 0.4377, + "step": 52358 + }, + { + "epoch": 1.34, + "learning_rate": 1.2174270350615282e-06, + "loss": 0.6865, + "step": 52359 + }, + { + "epoch": 1.34, + "learning_rate": 1.2174000264963677e-06, + "loss": 0.6924, + "step": 52360 + }, + { + "epoch": 1.34, + "learning_rate": 1.2173730177647541e-06, + "loss": 0.3939, + "step": 52361 + }, + { + "epoch": 1.34, + "learning_rate": 1.2173460088667078e-06, + "loss": 0.5503, + "step": 52362 + }, + { + "epoch": 1.34, + "learning_rate": 1.2173189998022499e-06, + "loss": 0.5215, + "step": 52363 + }, + { + "epoch": 1.34, + "learning_rate": 1.2172919905714005e-06, + "loss": 0.4844, + "step": 52364 + }, + { + "epoch": 1.34, + "learning_rate": 1.217264981174181e-06, + "loss": 0.5737, + "step": 52365 + }, + { + "epoch": 1.34, + "learning_rate": 1.2172379716106116e-06, + "loss": 0.521, + "step": 52366 + }, + { + "epoch": 1.34, + "learning_rate": 1.217210961880713e-06, + "loss": 0.4507, + "step": 52367 + }, + { + "epoch": 1.34, + "learning_rate": 1.2171839519845056e-06, + "loss": 0.5227, + "step": 52368 + }, + { + "epoch": 1.34, + "learning_rate": 1.2171569419220112e-06, + "loss": 0.6309, + "step": 52369 + }, + { + "epoch": 1.34, + "learning_rate": 1.2171299316932493e-06, + "loss": 0.6274, + "step": 52370 + }, + { + "epoch": 1.34, + "learning_rate": 1.217102921298241e-06, + "loss": 0.7588, + "step": 52371 + }, + { + "epoch": 1.34, + "learning_rate": 1.217075910737007e-06, + "loss": 0.5532, + "step": 52372 + }, + { + "epoch": 1.34, + "learning_rate": 1.2170489000095678e-06, + "loss": 0.6816, + "step": 52373 + }, + { + "epoch": 1.34, + "learning_rate": 1.2170218891159443e-06, + "loss": 0.4741, + "step": 52374 + }, + { + "epoch": 1.34, + "learning_rate": 1.2169948780561577e-06, + "loss": 0.7578, + "step": 52375 + }, + { + "epoch": 1.34, + "learning_rate": 1.2169678668302272e-06, + "loss": 0.6582, + "step": 52376 + }, + { + "epoch": 1.34, + "learning_rate": 1.216940855438175e-06, + "loss": 0.6982, + "step": 52377 + }, + { + "epoch": 1.34, + "learning_rate": 1.2169138438800207e-06, + "loss": 0.6094, + "step": 52378 + }, + { + "epoch": 1.34, + "learning_rate": 1.2168868321557857e-06, + "loss": 0.6221, + "step": 52379 + }, + { + "epoch": 1.34, + "learning_rate": 1.2168598202654905e-06, + "loss": 0.5449, + "step": 52380 + }, + { + "epoch": 1.34, + "learning_rate": 1.2168328082091555e-06, + "loss": 0.6953, + "step": 52381 + }, + { + "epoch": 1.34, + "learning_rate": 1.216805795986802e-06, + "loss": 0.6958, + "step": 52382 + }, + { + "epoch": 1.34, + "learning_rate": 1.2167787835984497e-06, + "loss": 0.6553, + "step": 52383 + }, + { + "epoch": 1.34, + "learning_rate": 1.2167517710441203e-06, + "loss": 0.5728, + "step": 52384 + }, + { + "epoch": 1.34, + "learning_rate": 1.2167247583238338e-06, + "loss": 0.5972, + "step": 52385 + }, + { + "epoch": 1.34, + "learning_rate": 1.2166977454376112e-06, + "loss": 0.4932, + "step": 52386 + }, + { + "epoch": 1.34, + "learning_rate": 1.2166707323854731e-06, + "loss": 0.5112, + "step": 52387 + }, + { + "epoch": 1.34, + "learning_rate": 1.2166437191674402e-06, + "loss": 0.4392, + "step": 52388 + }, + { + "epoch": 1.34, + "learning_rate": 1.2166167057835329e-06, + "loss": 0.5708, + "step": 52389 + }, + { + "epoch": 1.34, + "learning_rate": 1.2165896922337726e-06, + "loss": 0.6265, + "step": 52390 + }, + { + "epoch": 1.34, + "learning_rate": 1.2165626785181792e-06, + "loss": 0.7314, + "step": 52391 + }, + { + "epoch": 1.34, + "learning_rate": 1.2165356646367739e-06, + "loss": 0.6948, + "step": 52392 + }, + { + "epoch": 1.34, + "learning_rate": 1.216508650589577e-06, + "loss": 0.6123, + "step": 52393 + }, + { + "epoch": 1.34, + "learning_rate": 1.2164816363766095e-06, + "loss": 0.6484, + "step": 52394 + }, + { + "epoch": 1.34, + "learning_rate": 1.2164546219978922e-06, + "loss": 0.3704, + "step": 52395 + }, + { + "epoch": 1.34, + "learning_rate": 1.2164276074534451e-06, + "loss": 0.7168, + "step": 52396 + }, + { + "epoch": 1.34, + "learning_rate": 1.2164005927432896e-06, + "loss": 0.6528, + "step": 52397 + }, + { + "epoch": 1.34, + "learning_rate": 1.2163735778674461e-06, + "loss": 0.7754, + "step": 52398 + }, + { + "epoch": 1.34, + "learning_rate": 1.216346562825935e-06, + "loss": 0.7412, + "step": 52399 + }, + { + "epoch": 1.34, + "learning_rate": 1.2163195476187777e-06, + "loss": 0.7202, + "step": 52400 + }, + { + "epoch": 1.34, + "learning_rate": 1.2162925322459946e-06, + "loss": 0.7129, + "step": 52401 + }, + { + "epoch": 1.34, + "learning_rate": 1.216265516707606e-06, + "loss": 0.6445, + "step": 52402 + }, + { + "epoch": 1.34, + "learning_rate": 1.2162385010036324e-06, + "loss": 0.6875, + "step": 52403 + }, + { + "epoch": 1.34, + "learning_rate": 1.2162114851340956e-06, + "loss": 0.6201, + "step": 52404 + }, + { + "epoch": 1.34, + "learning_rate": 1.2161844690990154e-06, + "loss": 0.7383, + "step": 52405 + }, + { + "epoch": 1.34, + "learning_rate": 1.2161574528984124e-06, + "loss": 0.6392, + "step": 52406 + }, + { + "epoch": 1.34, + "learning_rate": 1.2161304365323079e-06, + "loss": 0.793, + "step": 52407 + }, + { + "epoch": 1.34, + "learning_rate": 1.216103420000722e-06, + "loss": 0.585, + "step": 52408 + }, + { + "epoch": 1.34, + "learning_rate": 1.2160764033036759e-06, + "loss": 0.6416, + "step": 52409 + }, + { + "epoch": 1.34, + "learning_rate": 1.2160493864411901e-06, + "loss": 0.521, + "step": 52410 + }, + { + "epoch": 1.34, + "learning_rate": 1.2160223694132852e-06, + "loss": 0.625, + "step": 52411 + }, + { + "epoch": 1.34, + "learning_rate": 1.2159953522199814e-06, + "loss": 0.5977, + "step": 52412 + }, + { + "epoch": 1.34, + "learning_rate": 1.2159683348613006e-06, + "loss": 0.5684, + "step": 52413 + }, + { + "epoch": 1.34, + "learning_rate": 1.2159413173372624e-06, + "loss": 0.6499, + "step": 52414 + }, + { + "epoch": 1.34, + "learning_rate": 1.2159142996478878e-06, + "loss": 0.6084, + "step": 52415 + }, + { + "epoch": 1.34, + "learning_rate": 1.2158872817931979e-06, + "loss": 0.6421, + "step": 52416 + }, + { + "epoch": 1.34, + "learning_rate": 1.2158602637732128e-06, + "loss": 0.667, + "step": 52417 + }, + { + "epoch": 1.34, + "learning_rate": 1.2158332455879532e-06, + "loss": 0.7217, + "step": 52418 + }, + { + "epoch": 1.34, + "learning_rate": 1.2158062272374404e-06, + "loss": 0.7515, + "step": 52419 + }, + { + "epoch": 1.34, + "learning_rate": 1.2157792087216946e-06, + "loss": 0.5613, + "step": 52420 + }, + { + "epoch": 1.34, + "learning_rate": 1.2157521900407366e-06, + "loss": 0.6113, + "step": 52421 + }, + { + "epoch": 1.34, + "learning_rate": 1.2157251711945866e-06, + "loss": 0.6826, + "step": 52422 + }, + { + "epoch": 1.34, + "learning_rate": 1.2156981521832663e-06, + "loss": 0.5391, + "step": 52423 + }, + { + "epoch": 1.34, + "learning_rate": 1.2156711330067954e-06, + "loss": 0.6133, + "step": 52424 + }, + { + "epoch": 1.34, + "learning_rate": 1.2156441136651956e-06, + "loss": 0.5591, + "step": 52425 + }, + { + "epoch": 1.34, + "learning_rate": 1.2156170941584867e-06, + "loss": 0.7212, + "step": 52426 + }, + { + "epoch": 1.34, + "learning_rate": 1.2155900744866895e-06, + "loss": 0.6094, + "step": 52427 + }, + { + "epoch": 1.34, + "learning_rate": 1.2155630546498251e-06, + "loss": 0.6548, + "step": 52428 + }, + { + "epoch": 1.34, + "learning_rate": 1.2155360346479142e-06, + "loss": 0.7422, + "step": 52429 + }, + { + "epoch": 1.34, + "learning_rate": 1.2155090144809772e-06, + "loss": 0.6343, + "step": 52430 + }, + { + "epoch": 1.34, + "learning_rate": 1.2154819941490346e-06, + "loss": 0.75, + "step": 52431 + }, + { + "epoch": 1.34, + "learning_rate": 1.2154549736521075e-06, + "loss": 0.7295, + "step": 52432 + }, + { + "epoch": 1.34, + "learning_rate": 1.2154279529902163e-06, + "loss": 0.7363, + "step": 52433 + }, + { + "epoch": 1.34, + "learning_rate": 1.2154009321633819e-06, + "loss": 0.7158, + "step": 52434 + }, + { + "epoch": 1.34, + "learning_rate": 1.215373911171625e-06, + "loss": 0.7295, + "step": 52435 + }, + { + "epoch": 1.34, + "learning_rate": 1.215346890014966e-06, + "loss": 0.5154, + "step": 52436 + }, + { + "epoch": 1.34, + "learning_rate": 1.215319868693426e-06, + "loss": 0.5552, + "step": 52437 + }, + { + "epoch": 1.34, + "learning_rate": 1.2152928472070255e-06, + "loss": 0.6851, + "step": 52438 + }, + { + "epoch": 1.34, + "learning_rate": 1.2152658255557847e-06, + "loss": 0.7349, + "step": 52439 + }, + { + "epoch": 1.34, + "learning_rate": 1.2152388037397256e-06, + "loss": 0.6021, + "step": 52440 + }, + { + "epoch": 1.34, + "learning_rate": 1.2152117817588675e-06, + "loss": 0.6699, + "step": 52441 + }, + { + "epoch": 1.34, + "learning_rate": 1.2151847596132316e-06, + "loss": 0.6562, + "step": 52442 + }, + { + "epoch": 1.34, + "learning_rate": 1.2151577373028386e-06, + "loss": 0.6177, + "step": 52443 + }, + { + "epoch": 1.34, + "learning_rate": 1.2151307148277094e-06, + "loss": 0.8857, + "step": 52444 + }, + { + "epoch": 1.34, + "learning_rate": 1.2151036921878646e-06, + "loss": 0.5781, + "step": 52445 + }, + { + "epoch": 1.34, + "learning_rate": 1.2150766693833247e-06, + "loss": 0.6709, + "step": 52446 + }, + { + "epoch": 1.34, + "learning_rate": 1.2150496464141103e-06, + "loss": 0.647, + "step": 52447 + }, + { + "epoch": 1.34, + "learning_rate": 1.2150226232802424e-06, + "loss": 0.751, + "step": 52448 + }, + { + "epoch": 1.34, + "learning_rate": 1.2149955999817417e-06, + "loss": 0.5489, + "step": 52449 + }, + { + "epoch": 1.34, + "learning_rate": 1.2149685765186285e-06, + "loss": 0.6279, + "step": 52450 + }, + { + "epoch": 1.34, + "learning_rate": 1.2149415528909236e-06, + "loss": 0.7959, + "step": 52451 + }, + { + "epoch": 1.34, + "learning_rate": 1.2149145290986483e-06, + "loss": 0.6597, + "step": 52452 + }, + { + "epoch": 1.34, + "learning_rate": 1.2148875051418226e-06, + "loss": 0.4551, + "step": 52453 + }, + { + "epoch": 1.34, + "learning_rate": 1.2148604810204674e-06, + "loss": 0.7656, + "step": 52454 + }, + { + "epoch": 1.34, + "learning_rate": 1.2148334567346035e-06, + "loss": 0.6558, + "step": 52455 + }, + { + "epoch": 1.34, + "learning_rate": 1.2148064322842514e-06, + "loss": 0.7227, + "step": 52456 + }, + { + "epoch": 1.34, + "learning_rate": 1.2147794076694319e-06, + "loss": 0.7861, + "step": 52457 + }, + { + "epoch": 1.34, + "learning_rate": 1.2147523828901656e-06, + "loss": 0.5322, + "step": 52458 + }, + { + "epoch": 1.34, + "learning_rate": 1.2147253579464737e-06, + "loss": 0.6943, + "step": 52459 + }, + { + "epoch": 1.34, + "learning_rate": 1.2146983328383761e-06, + "loss": 0.5083, + "step": 52460 + }, + { + "epoch": 1.34, + "learning_rate": 1.214671307565894e-06, + "loss": 0.7578, + "step": 52461 + }, + { + "epoch": 1.34, + "learning_rate": 1.2146442821290477e-06, + "loss": 0.7075, + "step": 52462 + }, + { + "epoch": 1.34, + "learning_rate": 1.2146172565278586e-06, + "loss": 0.4963, + "step": 52463 + }, + { + "epoch": 1.34, + "learning_rate": 1.2145902307623465e-06, + "loss": 0.7002, + "step": 52464 + }, + { + "epoch": 1.34, + "learning_rate": 1.2145632048325327e-06, + "loss": 0.6934, + "step": 52465 + }, + { + "epoch": 1.34, + "learning_rate": 1.2145361787384375e-06, + "loss": 0.6519, + "step": 52466 + }, + { + "epoch": 1.34, + "learning_rate": 1.2145091524800821e-06, + "loss": 0.665, + "step": 52467 + }, + { + "epoch": 1.34, + "learning_rate": 1.2144821260574866e-06, + "loss": 0.5032, + "step": 52468 + }, + { + "epoch": 1.34, + "learning_rate": 1.2144550994706723e-06, + "loss": 0.5811, + "step": 52469 + }, + { + "epoch": 1.34, + "learning_rate": 1.2144280727196599e-06, + "loss": 0.6982, + "step": 52470 + }, + { + "epoch": 1.34, + "learning_rate": 1.2144010458044692e-06, + "loss": 0.4561, + "step": 52471 + }, + { + "epoch": 1.34, + "learning_rate": 1.2143740187251218e-06, + "loss": 0.6406, + "step": 52472 + }, + { + "epoch": 1.34, + "learning_rate": 1.2143469914816376e-06, + "loss": 0.5088, + "step": 52473 + }, + { + "epoch": 1.34, + "learning_rate": 1.2143199640740385e-06, + "loss": 0.6064, + "step": 52474 + }, + { + "epoch": 1.34, + "learning_rate": 1.2142929365023439e-06, + "loss": 0.7002, + "step": 52475 + }, + { + "epoch": 1.34, + "learning_rate": 1.2142659087665752e-06, + "loss": 0.6973, + "step": 52476 + }, + { + "epoch": 1.35, + "learning_rate": 1.2142388808667527e-06, + "loss": 0.7251, + "step": 52477 + }, + { + "epoch": 1.35, + "learning_rate": 1.2142118528028978e-06, + "loss": 0.6239, + "step": 52478 + }, + { + "epoch": 1.35, + "learning_rate": 1.2141848245750305e-06, + "loss": 0.5638, + "step": 52479 + }, + { + "epoch": 1.35, + "learning_rate": 1.2141577961831719e-06, + "loss": 0.6426, + "step": 52480 + }, + { + "epoch": 1.35, + "learning_rate": 1.2141307676273423e-06, + "loss": 0.5417, + "step": 52481 + }, + { + "epoch": 1.35, + "learning_rate": 1.2141037389075627e-06, + "loss": 0.6455, + "step": 52482 + }, + { + "epoch": 1.35, + "learning_rate": 1.2140767100238537e-06, + "loss": 0.5771, + "step": 52483 + }, + { + "epoch": 1.35, + "learning_rate": 1.2140496809762361e-06, + "loss": 0.5182, + "step": 52484 + }, + { + "epoch": 1.35, + "learning_rate": 1.2140226517647304e-06, + "loss": 0.7549, + "step": 52485 + }, + { + "epoch": 1.35, + "learning_rate": 1.2139956223893575e-06, + "loss": 0.7178, + "step": 52486 + }, + { + "epoch": 1.35, + "learning_rate": 1.2139685928501377e-06, + "loss": 0.6343, + "step": 52487 + }, + { + "epoch": 1.35, + "learning_rate": 1.2139415631470924e-06, + "loss": 0.6338, + "step": 52488 + }, + { + "epoch": 1.35, + "learning_rate": 1.2139145332802417e-06, + "loss": 0.6841, + "step": 52489 + }, + { + "epoch": 1.35, + "learning_rate": 1.2138875032496062e-06, + "loss": 0.5713, + "step": 52490 + }, + { + "epoch": 1.35, + "learning_rate": 1.2138604730552073e-06, + "loss": 0.5991, + "step": 52491 + }, + { + "epoch": 1.35, + "learning_rate": 1.213833442697065e-06, + "loss": 0.7046, + "step": 52492 + }, + { + "epoch": 1.35, + "learning_rate": 1.2138064121752004e-06, + "loss": 0.5713, + "step": 52493 + }, + { + "epoch": 1.35, + "learning_rate": 1.213779381489634e-06, + "loss": 0.8574, + "step": 52494 + }, + { + "epoch": 1.35, + "learning_rate": 1.2137523506403868e-06, + "loss": 0.7979, + "step": 52495 + }, + { + "epoch": 1.35, + "learning_rate": 1.2137253196274788e-06, + "loss": 0.7383, + "step": 52496 + }, + { + "epoch": 1.35, + "learning_rate": 1.2136982884509314e-06, + "loss": 0.5266, + "step": 52497 + }, + { + "epoch": 1.35, + "learning_rate": 1.213671257110765e-06, + "loss": 0.71, + "step": 52498 + }, + { + "epoch": 1.35, + "learning_rate": 1.2136442256070005e-06, + "loss": 0.647, + "step": 52499 + }, + { + "epoch": 1.35, + "learning_rate": 1.2136171939396582e-06, + "loss": 0.6919, + "step": 52500 + }, + { + "epoch": 1.35, + "learning_rate": 1.2135901621087595e-06, + "loss": 0.3462, + "step": 52501 + }, + { + "epoch": 1.35, + "learning_rate": 1.2135631301143238e-06, + "loss": 0.6367, + "step": 52502 + }, + { + "epoch": 1.35, + "learning_rate": 1.2135360979563733e-06, + "loss": 0.5938, + "step": 52503 + }, + { + "epoch": 1.35, + "learning_rate": 1.2135090656349281e-06, + "loss": 0.5248, + "step": 52504 + }, + { + "epoch": 1.35, + "learning_rate": 1.2134820331500085e-06, + "loss": 0.7559, + "step": 52505 + }, + { + "epoch": 1.35, + "learning_rate": 1.2134550005016355e-06, + "loss": 0.708, + "step": 52506 + }, + { + "epoch": 1.35, + "learning_rate": 1.21342796768983e-06, + "loss": 0.5938, + "step": 52507 + }, + { + "epoch": 1.35, + "learning_rate": 1.2134009347146124e-06, + "loss": 0.7598, + "step": 52508 + }, + { + "epoch": 1.35, + "learning_rate": 1.2133739015760038e-06, + "loss": 0.5767, + "step": 52509 + }, + { + "epoch": 1.35, + "learning_rate": 1.2133468682740241e-06, + "loss": 0.4258, + "step": 52510 + }, + { + "epoch": 1.35, + "learning_rate": 1.2133198348086948e-06, + "loss": 0.5483, + "step": 52511 + }, + { + "epoch": 1.35, + "learning_rate": 1.2132928011800364e-06, + "loss": 0.6455, + "step": 52512 + }, + { + "epoch": 1.35, + "learning_rate": 1.2132657673880693e-06, + "loss": 0.4917, + "step": 52513 + }, + { + "epoch": 1.35, + "learning_rate": 1.2132387334328147e-06, + "loss": 0.71, + "step": 52514 + }, + { + "epoch": 1.35, + "learning_rate": 1.2132116993142925e-06, + "loss": 0.7051, + "step": 52515 + }, + { + "epoch": 1.35, + "learning_rate": 1.2131846650325244e-06, + "loss": 0.7148, + "step": 52516 + }, + { + "epoch": 1.35, + "learning_rate": 1.2131576305875301e-06, + "loss": 0.5408, + "step": 52517 + }, + { + "epoch": 1.35, + "learning_rate": 1.2131305959793314e-06, + "loss": 0.627, + "step": 52518 + }, + { + "epoch": 1.35, + "learning_rate": 1.213103561207948e-06, + "loss": 0.8662, + "step": 52519 + }, + { + "epoch": 1.35, + "learning_rate": 1.2130765262734013e-06, + "loss": 0.6777, + "step": 52520 + }, + { + "epoch": 1.35, + "learning_rate": 1.2130494911757114e-06, + "loss": 0.6127, + "step": 52521 + }, + { + "epoch": 1.35, + "learning_rate": 1.2130224559148997e-06, + "loss": 0.4995, + "step": 52522 + }, + { + "epoch": 1.35, + "learning_rate": 1.212995420490986e-06, + "loss": 0.6221, + "step": 52523 + }, + { + "epoch": 1.35, + "learning_rate": 1.212968384903992e-06, + "loss": 0.6519, + "step": 52524 + }, + { + "epoch": 1.35, + "learning_rate": 1.2129413491539375e-06, + "loss": 0.6846, + "step": 52525 + }, + { + "epoch": 1.35, + "learning_rate": 1.2129143132408439e-06, + "loss": 0.6729, + "step": 52526 + }, + { + "epoch": 1.35, + "learning_rate": 1.2128872771647312e-06, + "loss": 0.7803, + "step": 52527 + }, + { + "epoch": 1.35, + "learning_rate": 1.2128602409256207e-06, + "loss": 0.6191, + "step": 52528 + }, + { + "epoch": 1.35, + "learning_rate": 1.2128332045235333e-06, + "loss": 0.6846, + "step": 52529 + }, + { + "epoch": 1.35, + "learning_rate": 1.2128061679584888e-06, + "loss": 0.7119, + "step": 52530 + }, + { + "epoch": 1.35, + "learning_rate": 1.2127791312305084e-06, + "loss": 0.5791, + "step": 52531 + }, + { + "epoch": 1.35, + "learning_rate": 1.212752094339613e-06, + "loss": 0.5249, + "step": 52532 + }, + { + "epoch": 1.35, + "learning_rate": 1.212725057285823e-06, + "loss": 0.6592, + "step": 52533 + }, + { + "epoch": 1.35, + "learning_rate": 1.2126980200691593e-06, + "loss": 0.6768, + "step": 52534 + }, + { + "epoch": 1.35, + "learning_rate": 1.2126709826896426e-06, + "loss": 0.689, + "step": 52535 + }, + { + "epoch": 1.35, + "learning_rate": 1.2126439451472934e-06, + "loss": 0.7646, + "step": 52536 + }, + { + "epoch": 1.35, + "learning_rate": 1.2126169074421324e-06, + "loss": 0.7168, + "step": 52537 + }, + { + "epoch": 1.35, + "learning_rate": 1.2125898695741806e-06, + "loss": 0.6299, + "step": 52538 + }, + { + "epoch": 1.35, + "learning_rate": 1.2125628315434585e-06, + "loss": 0.5493, + "step": 52539 + }, + { + "epoch": 1.35, + "learning_rate": 1.2125357933499864e-06, + "loss": 0.5576, + "step": 52540 + }, + { + "epoch": 1.35, + "learning_rate": 1.2125087549937859e-06, + "loss": 0.5405, + "step": 52541 + }, + { + "epoch": 1.35, + "learning_rate": 1.212481716474877e-06, + "loss": 0.7588, + "step": 52542 + }, + { + "epoch": 1.35, + "learning_rate": 1.2124546777932805e-06, + "loss": 0.5908, + "step": 52543 + }, + { + "epoch": 1.35, + "learning_rate": 1.2124276389490175e-06, + "loss": 0.8638, + "step": 52544 + }, + { + "epoch": 1.35, + "learning_rate": 1.2124005999421086e-06, + "loss": 0.5994, + "step": 52545 + }, + { + "epoch": 1.35, + "learning_rate": 1.2123735607725737e-06, + "loss": 0.2734, + "step": 52546 + }, + { + "epoch": 1.35, + "learning_rate": 1.2123465214404344e-06, + "loss": 0.7148, + "step": 52547 + }, + { + "epoch": 1.35, + "learning_rate": 1.2123194819457113e-06, + "loss": 0.7041, + "step": 52548 + }, + { + "epoch": 1.35, + "learning_rate": 1.212292442288425e-06, + "loss": 0.7061, + "step": 52549 + }, + { + "epoch": 1.35, + "learning_rate": 1.2122654024685959e-06, + "loss": 0.7139, + "step": 52550 + }, + { + "epoch": 1.35, + "learning_rate": 1.212238362486245e-06, + "loss": 0.6768, + "step": 52551 + }, + { + "epoch": 1.35, + "learning_rate": 1.212211322341393e-06, + "loss": 0.5469, + "step": 52552 + }, + { + "epoch": 1.35, + "learning_rate": 1.2121842820340604e-06, + "loss": 0.6172, + "step": 52553 + }, + { + "epoch": 1.35, + "learning_rate": 1.2121572415642682e-06, + "loss": 0.792, + "step": 52554 + }, + { + "epoch": 1.35, + "learning_rate": 1.212130200932037e-06, + "loss": 0.7412, + "step": 52555 + }, + { + "epoch": 1.35, + "learning_rate": 1.2121031601373873e-06, + "loss": 0.5048, + "step": 52556 + }, + { + "epoch": 1.35, + "learning_rate": 1.2120761191803402e-06, + "loss": 0.5547, + "step": 52557 + }, + { + "epoch": 1.35, + "learning_rate": 1.2120490780609158e-06, + "loss": 0.6104, + "step": 52558 + }, + { + "epoch": 1.35, + "learning_rate": 1.2120220367791353e-06, + "loss": 0.6577, + "step": 52559 + }, + { + "epoch": 1.35, + "learning_rate": 1.2119949953350197e-06, + "loss": 0.6543, + "step": 52560 + }, + { + "epoch": 1.35, + "learning_rate": 1.2119679537285886e-06, + "loss": 0.5464, + "step": 52561 + }, + { + "epoch": 1.35, + "learning_rate": 1.2119409119598637e-06, + "loss": 0.4226, + "step": 52562 + }, + { + "epoch": 1.35, + "learning_rate": 1.2119138700288653e-06, + "loss": 0.7803, + "step": 52563 + }, + { + "epoch": 1.35, + "learning_rate": 1.2118868279356148e-06, + "loss": 0.5566, + "step": 52564 + }, + { + "epoch": 1.35, + "learning_rate": 1.2118597856801316e-06, + "loss": 0.4297, + "step": 52565 + }, + { + "epoch": 1.35, + "learning_rate": 1.2118327432624373e-06, + "loss": 0.5272, + "step": 52566 + }, + { + "epoch": 1.35, + "learning_rate": 1.2118057006825524e-06, + "loss": 0.5483, + "step": 52567 + }, + { + "epoch": 1.35, + "learning_rate": 1.2117786579404977e-06, + "loss": 0.7236, + "step": 52568 + }, + { + "epoch": 1.35, + "learning_rate": 1.2117516150362938e-06, + "loss": 0.6555, + "step": 52569 + }, + { + "epoch": 1.35, + "learning_rate": 1.2117245719699614e-06, + "loss": 0.8018, + "step": 52570 + }, + { + "epoch": 1.35, + "learning_rate": 1.2116975287415211e-06, + "loss": 0.7471, + "step": 52571 + }, + { + "epoch": 1.35, + "learning_rate": 1.2116704853509939e-06, + "loss": 0.7285, + "step": 52572 + }, + { + "epoch": 1.35, + "learning_rate": 1.2116434417984e-06, + "loss": 0.6699, + "step": 52573 + }, + { + "epoch": 1.35, + "learning_rate": 1.2116163980837613e-06, + "loss": 0.8066, + "step": 52574 + }, + { + "epoch": 1.35, + "learning_rate": 1.2115893542070967e-06, + "loss": 0.4863, + "step": 52575 + }, + { + "epoch": 1.35, + "learning_rate": 1.2115623101684285e-06, + "loss": 0.626, + "step": 52576 + }, + { + "epoch": 1.35, + "learning_rate": 1.2115352659677763e-06, + "loss": 0.5344, + "step": 52577 + }, + { + "epoch": 1.35, + "learning_rate": 1.2115082216051615e-06, + "loss": 0.6355, + "step": 52578 + }, + { + "epoch": 1.35, + "learning_rate": 1.2114811770806047e-06, + "loss": 0.7236, + "step": 52579 + }, + { + "epoch": 1.35, + "learning_rate": 1.2114541323941261e-06, + "loss": 0.6423, + "step": 52580 + }, + { + "epoch": 1.35, + "learning_rate": 1.211427087545747e-06, + "loss": 0.7168, + "step": 52581 + }, + { + "epoch": 1.35, + "learning_rate": 1.2114000425354882e-06, + "loss": 0.6709, + "step": 52582 + }, + { + "epoch": 1.35, + "learning_rate": 1.2113729973633697e-06, + "loss": 0.6074, + "step": 52583 + }, + { + "epoch": 1.35, + "learning_rate": 1.211345952029413e-06, + "loss": 0.6436, + "step": 52584 + }, + { + "epoch": 1.35, + "learning_rate": 1.2113189065336383e-06, + "loss": 0.625, + "step": 52585 + }, + { + "epoch": 1.35, + "learning_rate": 1.2112918608760661e-06, + "loss": 0.6572, + "step": 52586 + }, + { + "epoch": 1.35, + "learning_rate": 1.2112648150567176e-06, + "loss": 0.6621, + "step": 52587 + }, + { + "epoch": 1.35, + "learning_rate": 1.2112377690756132e-06, + "loss": 0.6748, + "step": 52588 + }, + { + "epoch": 1.35, + "learning_rate": 1.2112107229327744e-06, + "loss": 0.4443, + "step": 52589 + }, + { + "epoch": 1.35, + "learning_rate": 1.2111836766282206e-06, + "loss": 0.5156, + "step": 52590 + }, + { + "epoch": 1.35, + "learning_rate": 1.2111566301619736e-06, + "loss": 0.6709, + "step": 52591 + }, + { + "epoch": 1.35, + "learning_rate": 1.2111295835340532e-06, + "loss": 0.6748, + "step": 52592 + }, + { + "epoch": 1.35, + "learning_rate": 1.211102536744481e-06, + "loss": 0.6694, + "step": 52593 + }, + { + "epoch": 1.35, + "learning_rate": 1.2110754897932771e-06, + "loss": 0.6802, + "step": 52594 + }, + { + "epoch": 1.35, + "learning_rate": 1.2110484426804625e-06, + "loss": 0.5137, + "step": 52595 + }, + { + "epoch": 1.35, + "learning_rate": 1.2110213954060578e-06, + "loss": 0.5669, + "step": 52596 + }, + { + "epoch": 1.35, + "learning_rate": 1.2109943479700836e-06, + "loss": 0.7178, + "step": 52597 + }, + { + "epoch": 1.35, + "learning_rate": 1.2109673003725608e-06, + "loss": 0.8369, + "step": 52598 + }, + { + "epoch": 1.35, + "learning_rate": 1.2109402526135102e-06, + "loss": 0.4404, + "step": 52599 + }, + { + "epoch": 1.35, + "learning_rate": 1.210913204692952e-06, + "loss": 0.6523, + "step": 52600 + }, + { + "epoch": 1.35, + "learning_rate": 1.2108861566109076e-06, + "loss": 0.5713, + "step": 52601 + }, + { + "epoch": 1.35, + "learning_rate": 1.2108591083673972e-06, + "loss": 0.6753, + "step": 52602 + }, + { + "epoch": 1.35, + "learning_rate": 1.2108320599624417e-06, + "loss": 0.7173, + "step": 52603 + }, + { + "epoch": 1.35, + "learning_rate": 1.210805011396062e-06, + "loss": 0.6318, + "step": 52604 + }, + { + "epoch": 1.35, + "learning_rate": 1.210777962668278e-06, + "loss": 0.6426, + "step": 52605 + }, + { + "epoch": 1.35, + "learning_rate": 1.2107509137791113e-06, + "loss": 0.8105, + "step": 52606 + }, + { + "epoch": 1.35, + "learning_rate": 1.2107238647285824e-06, + "loss": 0.6191, + "step": 52607 + }, + { + "epoch": 1.35, + "learning_rate": 1.210696815516712e-06, + "loss": 0.6982, + "step": 52608 + }, + { + "epoch": 1.35, + "learning_rate": 1.2106697661435208e-06, + "loss": 0.365, + "step": 52609 + }, + { + "epoch": 1.35, + "learning_rate": 1.2106427166090294e-06, + "loss": 0.6309, + "step": 52610 + }, + { + "epoch": 1.35, + "learning_rate": 1.2106156669132584e-06, + "loss": 0.7031, + "step": 52611 + }, + { + "epoch": 1.35, + "learning_rate": 1.2105886170562288e-06, + "loss": 0.665, + "step": 52612 + }, + { + "epoch": 1.35, + "learning_rate": 1.210561567037961e-06, + "loss": 0.6416, + "step": 52613 + }, + { + "epoch": 1.35, + "learning_rate": 1.210534516858476e-06, + "loss": 0.4758, + "step": 52614 + }, + { + "epoch": 1.35, + "learning_rate": 1.2105074665177945e-06, + "loss": 0.5767, + "step": 52615 + }, + { + "epoch": 1.35, + "learning_rate": 1.210480416015937e-06, + "loss": 0.6851, + "step": 52616 + }, + { + "epoch": 1.35, + "learning_rate": 1.2104533653529243e-06, + "loss": 0.8125, + "step": 52617 + }, + { + "epoch": 1.35, + "learning_rate": 1.210426314528777e-06, + "loss": 0.6787, + "step": 52618 + }, + { + "epoch": 1.35, + "learning_rate": 1.2103992635435165e-06, + "loss": 0.6519, + "step": 52619 + }, + { + "epoch": 1.35, + "learning_rate": 1.2103722123971624e-06, + "loss": 0.6338, + "step": 52620 + }, + { + "epoch": 1.35, + "learning_rate": 1.2103451610897363e-06, + "loss": 0.7783, + "step": 52621 + }, + { + "epoch": 1.35, + "learning_rate": 1.2103181096212585e-06, + "loss": 0.6299, + "step": 52622 + }, + { + "epoch": 1.35, + "learning_rate": 1.2102910579917493e-06, + "loss": 0.7168, + "step": 52623 + }, + { + "epoch": 1.35, + "learning_rate": 1.2102640062012306e-06, + "loss": 0.4712, + "step": 52624 + }, + { + "epoch": 1.35, + "learning_rate": 1.2102369542497221e-06, + "loss": 0.6689, + "step": 52625 + }, + { + "epoch": 1.35, + "learning_rate": 1.2102099021372452e-06, + "loss": 0.6318, + "step": 52626 + }, + { + "epoch": 1.35, + "learning_rate": 1.2101828498638197e-06, + "loss": 0.4614, + "step": 52627 + }, + { + "epoch": 1.35, + "learning_rate": 1.2101557974294672e-06, + "loss": 0.3591, + "step": 52628 + }, + { + "epoch": 1.35, + "learning_rate": 1.210128744834208e-06, + "loss": 0.6138, + "step": 52629 + }, + { + "epoch": 1.35, + "learning_rate": 1.2101016920780626e-06, + "loss": 0.6318, + "step": 52630 + }, + { + "epoch": 1.35, + "learning_rate": 1.2100746391610524e-06, + "loss": 0.5215, + "step": 52631 + }, + { + "epoch": 1.35, + "learning_rate": 1.2100475860831974e-06, + "loss": 0.626, + "step": 52632 + }, + { + "epoch": 1.35, + "learning_rate": 1.2100205328445187e-06, + "loss": 0.5759, + "step": 52633 + }, + { + "epoch": 1.35, + "learning_rate": 1.209993479445037e-06, + "loss": 0.6484, + "step": 52634 + }, + { + "epoch": 1.35, + "learning_rate": 1.2099664258847733e-06, + "loss": 0.6992, + "step": 52635 + }, + { + "epoch": 1.35, + "learning_rate": 1.2099393721637473e-06, + "loss": 0.9102, + "step": 52636 + }, + { + "epoch": 1.35, + "learning_rate": 1.2099123182819807e-06, + "loss": 0.6855, + "step": 52637 + }, + { + "epoch": 1.35, + "learning_rate": 1.2098852642394939e-06, + "loss": 0.5356, + "step": 52638 + }, + { + "epoch": 1.35, + "learning_rate": 1.2098582100363077e-06, + "loss": 0.6094, + "step": 52639 + }, + { + "epoch": 1.35, + "learning_rate": 1.2098311556724426e-06, + "loss": 0.6396, + "step": 52640 + }, + { + "epoch": 1.35, + "learning_rate": 1.2098041011479195e-06, + "loss": 0.8057, + "step": 52641 + }, + { + "epoch": 1.35, + "learning_rate": 1.2097770464627589e-06, + "loss": 0.8545, + "step": 52642 + }, + { + "epoch": 1.35, + "learning_rate": 1.2097499916169818e-06, + "loss": 0.5979, + "step": 52643 + }, + { + "epoch": 1.35, + "learning_rate": 1.2097229366106087e-06, + "loss": 0.6611, + "step": 52644 + }, + { + "epoch": 1.35, + "learning_rate": 1.2096958814436604e-06, + "loss": 0.5608, + "step": 52645 + }, + { + "epoch": 1.35, + "learning_rate": 1.2096688261161575e-06, + "loss": 0.4512, + "step": 52646 + }, + { + "epoch": 1.35, + "learning_rate": 1.209641770628121e-06, + "loss": 0.5425, + "step": 52647 + }, + { + "epoch": 1.35, + "learning_rate": 1.2096147149795712e-06, + "loss": 0.6523, + "step": 52648 + }, + { + "epoch": 1.35, + "learning_rate": 1.2095876591705292e-06, + "loss": 0.6187, + "step": 52649 + }, + { + "epoch": 1.35, + "learning_rate": 1.2095606032010157e-06, + "loss": 0.6143, + "step": 52650 + }, + { + "epoch": 1.35, + "learning_rate": 1.209533547071051e-06, + "loss": 0.7324, + "step": 52651 + }, + { + "epoch": 1.35, + "learning_rate": 1.2095064907806565e-06, + "loss": 0.6089, + "step": 52652 + }, + { + "epoch": 1.35, + "learning_rate": 1.209479434329852e-06, + "loss": 0.645, + "step": 52653 + }, + { + "epoch": 1.35, + "learning_rate": 1.2094523777186593e-06, + "loss": 0.7324, + "step": 52654 + }, + { + "epoch": 1.35, + "learning_rate": 1.2094253209470982e-06, + "loss": 0.5, + "step": 52655 + }, + { + "epoch": 1.35, + "learning_rate": 1.20939826401519e-06, + "loss": 0.6602, + "step": 52656 + }, + { + "epoch": 1.35, + "learning_rate": 1.2093712069229546e-06, + "loss": 0.4984, + "step": 52657 + }, + { + "epoch": 1.35, + "learning_rate": 1.2093441496704138e-06, + "loss": 0.7119, + "step": 52658 + }, + { + "epoch": 1.35, + "learning_rate": 1.2093170922575878e-06, + "loss": 0.8335, + "step": 52659 + }, + { + "epoch": 1.35, + "learning_rate": 1.2092900346844971e-06, + "loss": 0.5879, + "step": 52660 + }, + { + "epoch": 1.35, + "learning_rate": 1.209262976951163e-06, + "loss": 0.627, + "step": 52661 + }, + { + "epoch": 1.35, + "learning_rate": 1.2092359190576056e-06, + "loss": 0.7227, + "step": 52662 + }, + { + "epoch": 1.35, + "learning_rate": 1.2092088610038456e-06, + "loss": 0.5483, + "step": 52663 + }, + { + "epoch": 1.35, + "learning_rate": 1.2091818027899047e-06, + "loss": 0.6606, + "step": 52664 + }, + { + "epoch": 1.35, + "learning_rate": 1.2091547444158023e-06, + "loss": 0.542, + "step": 52665 + }, + { + "epoch": 1.35, + "learning_rate": 1.20912768588156e-06, + "loss": 0.5527, + "step": 52666 + }, + { + "epoch": 1.35, + "learning_rate": 1.209100627187198e-06, + "loss": 0.5742, + "step": 52667 + }, + { + "epoch": 1.35, + "learning_rate": 1.2090735683327375e-06, + "loss": 0.7334, + "step": 52668 + }, + { + "epoch": 1.35, + "learning_rate": 1.209046509318199e-06, + "loss": 1.0098, + "step": 52669 + }, + { + "epoch": 1.35, + "learning_rate": 1.209019450143603e-06, + "loss": 0.6216, + "step": 52670 + }, + { + "epoch": 1.35, + "learning_rate": 1.2089923908089708e-06, + "loss": 0.6807, + "step": 52671 + }, + { + "epoch": 1.35, + "learning_rate": 1.2089653313143224e-06, + "loss": 0.5388, + "step": 52672 + }, + { + "epoch": 1.35, + "learning_rate": 1.2089382716596788e-06, + "loss": 0.7656, + "step": 52673 + }, + { + "epoch": 1.35, + "learning_rate": 1.2089112118450611e-06, + "loss": 0.6152, + "step": 52674 + }, + { + "epoch": 1.35, + "learning_rate": 1.2088841518704896e-06, + "loss": 0.6846, + "step": 52675 + }, + { + "epoch": 1.35, + "learning_rate": 1.2088570917359849e-06, + "loss": 0.6213, + "step": 52676 + }, + { + "epoch": 1.35, + "learning_rate": 1.208830031441568e-06, + "loss": 0.6357, + "step": 52677 + }, + { + "epoch": 1.35, + "learning_rate": 1.2088029709872594e-06, + "loss": 0.6885, + "step": 52678 + }, + { + "epoch": 1.35, + "learning_rate": 1.2087759103730806e-06, + "loss": 0.6582, + "step": 52679 + }, + { + "epoch": 1.35, + "learning_rate": 1.208748849599051e-06, + "loss": 0.5359, + "step": 52680 + }, + { + "epoch": 1.35, + "learning_rate": 1.2087217886651924e-06, + "loss": 0.6538, + "step": 52681 + }, + { + "epoch": 1.35, + "learning_rate": 1.2086947275715247e-06, + "loss": 0.5889, + "step": 52682 + }, + { + "epoch": 1.35, + "learning_rate": 1.2086676663180695e-06, + "loss": 0.4463, + "step": 52683 + }, + { + "epoch": 1.35, + "learning_rate": 1.2086406049048468e-06, + "loss": 0.5859, + "step": 52684 + }, + { + "epoch": 1.35, + "learning_rate": 1.2086135433318777e-06, + "loss": 0.6934, + "step": 52685 + }, + { + "epoch": 1.35, + "learning_rate": 1.2085864815991826e-06, + "loss": 0.5199, + "step": 52686 + }, + { + "epoch": 1.35, + "learning_rate": 1.2085594197067827e-06, + "loss": 0.3151, + "step": 52687 + }, + { + "epoch": 1.35, + "learning_rate": 1.2085323576546981e-06, + "loss": 0.7773, + "step": 52688 + }, + { + "epoch": 1.35, + "learning_rate": 1.2085052954429504e-06, + "loss": 0.6953, + "step": 52689 + }, + { + "epoch": 1.35, + "learning_rate": 1.2084782330715595e-06, + "loss": 0.6406, + "step": 52690 + }, + { + "epoch": 1.35, + "learning_rate": 1.2084511705405462e-06, + "loss": 0.6826, + "step": 52691 + }, + { + "epoch": 1.35, + "learning_rate": 1.2084241078499315e-06, + "loss": 0.7002, + "step": 52692 + }, + { + "epoch": 1.35, + "learning_rate": 1.2083970449997363e-06, + "loss": 0.6592, + "step": 52693 + }, + { + "epoch": 1.35, + "learning_rate": 1.208369981989981e-06, + "loss": 0.5149, + "step": 52694 + }, + { + "epoch": 1.35, + "learning_rate": 1.2083429188206862e-06, + "loss": 0.6069, + "step": 52695 + }, + { + "epoch": 1.35, + "learning_rate": 1.2083158554918728e-06, + "loss": 0.6978, + "step": 52696 + }, + { + "epoch": 1.35, + "learning_rate": 1.2082887920035615e-06, + "loss": 0.8301, + "step": 52697 + }, + { + "epoch": 1.35, + "learning_rate": 1.2082617283557731e-06, + "loss": 0.6138, + "step": 52698 + }, + { + "epoch": 1.35, + "learning_rate": 1.2082346645485287e-06, + "loss": 0.6338, + "step": 52699 + }, + { + "epoch": 1.35, + "learning_rate": 1.2082076005818483e-06, + "loss": 0.5593, + "step": 52700 + }, + { + "epoch": 1.35, + "learning_rate": 1.2081805364557527e-06, + "loss": 0.5198, + "step": 52701 + }, + { + "epoch": 1.35, + "learning_rate": 1.208153472170263e-06, + "loss": 0.5259, + "step": 52702 + }, + { + "epoch": 1.35, + "learning_rate": 1.2081264077253995e-06, + "loss": 0.5933, + "step": 52703 + }, + { + "epoch": 1.35, + "learning_rate": 1.208099343121184e-06, + "loss": 0.5572, + "step": 52704 + }, + { + "epoch": 1.35, + "learning_rate": 1.2080722783576357e-06, + "loss": 0.6494, + "step": 52705 + }, + { + "epoch": 1.35, + "learning_rate": 1.208045213434776e-06, + "loss": 0.6245, + "step": 52706 + }, + { + "epoch": 1.35, + "learning_rate": 1.2080181483526256e-06, + "loss": 0.6558, + "step": 52707 + }, + { + "epoch": 1.35, + "learning_rate": 1.2079910831112058e-06, + "loss": 0.7808, + "step": 52708 + }, + { + "epoch": 1.35, + "learning_rate": 1.2079640177105363e-06, + "loss": 0.6562, + "step": 52709 + }, + { + "epoch": 1.35, + "learning_rate": 1.2079369521506386e-06, + "loss": 0.5542, + "step": 52710 + }, + { + "epoch": 1.35, + "learning_rate": 1.207909886431533e-06, + "loss": 0.7588, + "step": 52711 + }, + { + "epoch": 1.35, + "learning_rate": 1.2078828205532403e-06, + "loss": 0.605, + "step": 52712 + }, + { + "epoch": 1.35, + "learning_rate": 1.2078557545157814e-06, + "loss": 0.7402, + "step": 52713 + }, + { + "epoch": 1.35, + "learning_rate": 1.2078286883191768e-06, + "loss": 0.6748, + "step": 52714 + }, + { + "epoch": 1.35, + "learning_rate": 1.2078016219634474e-06, + "loss": 0.6396, + "step": 52715 + }, + { + "epoch": 1.35, + "learning_rate": 1.2077745554486139e-06, + "loss": 0.6514, + "step": 52716 + }, + { + "epoch": 1.35, + "learning_rate": 1.2077474887746967e-06, + "loss": 0.6816, + "step": 52717 + }, + { + "epoch": 1.35, + "learning_rate": 1.2077204219417172e-06, + "loss": 0.6348, + "step": 52718 + }, + { + "epoch": 1.35, + "learning_rate": 1.2076933549496958e-06, + "loss": 0.5283, + "step": 52719 + }, + { + "epoch": 1.35, + "learning_rate": 1.2076662877986526e-06, + "loss": 0.6548, + "step": 52720 + }, + { + "epoch": 1.35, + "learning_rate": 1.2076392204886093e-06, + "loss": 0.7061, + "step": 52721 + }, + { + "epoch": 1.35, + "learning_rate": 1.2076121530195858e-06, + "loss": 0.5352, + "step": 52722 + }, + { + "epoch": 1.35, + "learning_rate": 1.2075850853916033e-06, + "loss": 0.7998, + "step": 52723 + }, + { + "epoch": 1.35, + "learning_rate": 1.207558017604683e-06, + "loss": 0.7397, + "step": 52724 + }, + { + "epoch": 1.35, + "learning_rate": 1.2075309496588447e-06, + "loss": 0.5942, + "step": 52725 + }, + { + "epoch": 1.35, + "learning_rate": 1.2075038815541091e-06, + "loss": 0.5024, + "step": 52726 + }, + { + "epoch": 1.35, + "learning_rate": 1.207476813290498e-06, + "loss": 0.6211, + "step": 52727 + }, + { + "epoch": 1.35, + "learning_rate": 1.207449744868031e-06, + "loss": 0.792, + "step": 52728 + }, + { + "epoch": 1.35, + "learning_rate": 1.2074226762867297e-06, + "loss": 0.4819, + "step": 52729 + }, + { + "epoch": 1.35, + "learning_rate": 1.207395607546614e-06, + "loss": 0.7295, + "step": 52730 + }, + { + "epoch": 1.35, + "learning_rate": 1.2073685386477052e-06, + "loss": 0.5566, + "step": 52731 + }, + { + "epoch": 1.35, + "learning_rate": 1.2073414695900237e-06, + "loss": 0.8271, + "step": 52732 + }, + { + "epoch": 1.35, + "learning_rate": 1.2073144003735904e-06, + "loss": 0.5581, + "step": 52733 + }, + { + "epoch": 1.35, + "learning_rate": 1.2072873309984262e-06, + "loss": 0.6309, + "step": 52734 + }, + { + "epoch": 1.35, + "learning_rate": 1.2072602614645514e-06, + "loss": 0.4832, + "step": 52735 + }, + { + "epoch": 1.35, + "learning_rate": 1.207233191771987e-06, + "loss": 0.5791, + "step": 52736 + }, + { + "epoch": 1.35, + "learning_rate": 1.2072061219207538e-06, + "loss": 0.4927, + "step": 52737 + }, + { + "epoch": 1.35, + "learning_rate": 1.207179051910872e-06, + "loss": 0.5142, + "step": 52738 + }, + { + "epoch": 1.35, + "learning_rate": 1.2071519817423632e-06, + "loss": 0.5059, + "step": 52739 + }, + { + "epoch": 1.35, + "learning_rate": 1.2071249114152476e-06, + "loss": 0.5869, + "step": 52740 + }, + { + "epoch": 1.35, + "learning_rate": 1.2070978409295457e-06, + "loss": 0.4834, + "step": 52741 + }, + { + "epoch": 1.35, + "learning_rate": 1.2070707702852787e-06, + "loss": 0.5093, + "step": 52742 + }, + { + "epoch": 1.35, + "learning_rate": 1.207043699482467e-06, + "loss": 0.666, + "step": 52743 + }, + { + "epoch": 1.35, + "learning_rate": 1.2070166285211315e-06, + "loss": 0.8164, + "step": 52744 + }, + { + "epoch": 1.35, + "learning_rate": 1.2069895574012928e-06, + "loss": 0.7148, + "step": 52745 + }, + { + "epoch": 1.35, + "learning_rate": 1.2069624861229722e-06, + "loss": 0.5708, + "step": 52746 + }, + { + "epoch": 1.35, + "learning_rate": 1.2069354146861894e-06, + "loss": 0.583, + "step": 52747 + }, + { + "epoch": 1.35, + "learning_rate": 1.2069083430909662e-06, + "loss": 0.7949, + "step": 52748 + }, + { + "epoch": 1.35, + "learning_rate": 1.2068812713373222e-06, + "loss": 0.6436, + "step": 52749 + }, + { + "epoch": 1.35, + "learning_rate": 1.206854199425279e-06, + "loss": 0.7734, + "step": 52750 + }, + { + "epoch": 1.35, + "learning_rate": 1.206827127354857e-06, + "loss": 0.6274, + "step": 52751 + }, + { + "epoch": 1.35, + "learning_rate": 1.2068000551260772e-06, + "loss": 0.6729, + "step": 52752 + }, + { + "epoch": 1.35, + "learning_rate": 1.2067729827389599e-06, + "loss": 0.624, + "step": 52753 + }, + { + "epoch": 1.35, + "learning_rate": 1.206745910193526e-06, + "loss": 0.583, + "step": 52754 + }, + { + "epoch": 1.35, + "learning_rate": 1.206718837489796e-06, + "loss": 0.6738, + "step": 52755 + }, + { + "epoch": 1.35, + "learning_rate": 1.2066917646277914e-06, + "loss": 0.7109, + "step": 52756 + }, + { + "epoch": 1.35, + "learning_rate": 1.206664691607532e-06, + "loss": 0.6357, + "step": 52757 + }, + { + "epoch": 1.35, + "learning_rate": 1.2066376184290392e-06, + "loss": 0.7412, + "step": 52758 + }, + { + "epoch": 1.35, + "learning_rate": 1.2066105450923336e-06, + "loss": 0.6777, + "step": 52759 + }, + { + "epoch": 1.35, + "learning_rate": 1.2065834715974355e-06, + "loss": 0.7979, + "step": 52760 + }, + { + "epoch": 1.35, + "learning_rate": 1.2065563979443663e-06, + "loss": 0.8174, + "step": 52761 + }, + { + "epoch": 1.35, + "learning_rate": 1.2065293241331462e-06, + "loss": 0.6396, + "step": 52762 + }, + { + "epoch": 1.35, + "learning_rate": 1.206502250163796e-06, + "loss": 0.6084, + "step": 52763 + }, + { + "epoch": 1.35, + "learning_rate": 1.2064751760363366e-06, + "loss": 0.5874, + "step": 52764 + }, + { + "epoch": 1.35, + "learning_rate": 1.2064481017507885e-06, + "loss": 0.6416, + "step": 52765 + }, + { + "epoch": 1.35, + "learning_rate": 1.2064210273071726e-06, + "loss": 0.6094, + "step": 52766 + }, + { + "epoch": 1.35, + "learning_rate": 1.2063939527055097e-06, + "loss": 0.5996, + "step": 52767 + }, + { + "epoch": 1.35, + "learning_rate": 1.2063668779458205e-06, + "loss": 0.6279, + "step": 52768 + }, + { + "epoch": 1.35, + "learning_rate": 1.2063398030281258e-06, + "loss": 0.6924, + "step": 52769 + }, + { + "epoch": 1.35, + "learning_rate": 1.2063127279524459e-06, + "loss": 0.5068, + "step": 52770 + }, + { + "epoch": 1.35, + "learning_rate": 1.206285652718802e-06, + "loss": 0.6836, + "step": 52771 + }, + { + "epoch": 1.35, + "learning_rate": 1.2062585773272145e-06, + "loss": 0.5615, + "step": 52772 + }, + { + "epoch": 1.35, + "learning_rate": 1.2062315017777046e-06, + "loss": 0.7432, + "step": 52773 + }, + { + "epoch": 1.35, + "learning_rate": 1.2062044260702925e-06, + "loss": 0.7388, + "step": 52774 + }, + { + "epoch": 1.35, + "learning_rate": 1.2061773502049993e-06, + "loss": 0.7373, + "step": 52775 + }, + { + "epoch": 1.35, + "learning_rate": 1.2061502741818453e-06, + "loss": 0.6719, + "step": 52776 + }, + { + "epoch": 1.35, + "learning_rate": 1.2061231980008515e-06, + "loss": 0.5889, + "step": 52777 + }, + { + "epoch": 1.35, + "learning_rate": 1.2060961216620388e-06, + "loss": 0.5063, + "step": 52778 + }, + { + "epoch": 1.35, + "learning_rate": 1.206069045165428e-06, + "loss": 0.6694, + "step": 52779 + }, + { + "epoch": 1.35, + "learning_rate": 1.2060419685110393e-06, + "loss": 0.5234, + "step": 52780 + }, + { + "epoch": 1.35, + "learning_rate": 1.206014891698894e-06, + "loss": 0.7246, + "step": 52781 + }, + { + "epoch": 1.35, + "learning_rate": 1.205987814729012e-06, + "loss": 0.79, + "step": 52782 + }, + { + "epoch": 1.35, + "learning_rate": 1.2059607376014152e-06, + "loss": 0.5396, + "step": 52783 + }, + { + "epoch": 1.35, + "learning_rate": 1.2059336603161236e-06, + "loss": 0.7061, + "step": 52784 + }, + { + "epoch": 1.35, + "learning_rate": 1.205906582873158e-06, + "loss": 0.6226, + "step": 52785 + }, + { + "epoch": 1.35, + "learning_rate": 1.2058795052725393e-06, + "loss": 0.5557, + "step": 52786 + }, + { + "epoch": 1.35, + "learning_rate": 1.2058524275142878e-06, + "loss": 0.6348, + "step": 52787 + }, + { + "epoch": 1.35, + "learning_rate": 1.2058253495984253e-06, + "loss": 0.5742, + "step": 52788 + }, + { + "epoch": 1.35, + "learning_rate": 1.205798271524971e-06, + "loss": 0.6045, + "step": 52789 + }, + { + "epoch": 1.35, + "learning_rate": 1.2057711932939467e-06, + "loss": 0.6196, + "step": 52790 + }, + { + "epoch": 1.35, + "learning_rate": 1.2057441149053729e-06, + "loss": 0.5493, + "step": 52791 + }, + { + "epoch": 1.35, + "learning_rate": 1.2057170363592702e-06, + "loss": 0.7539, + "step": 52792 + }, + { + "epoch": 1.35, + "learning_rate": 1.2056899576556597e-06, + "loss": 0.5085, + "step": 52793 + }, + { + "epoch": 1.35, + "learning_rate": 1.2056628787945618e-06, + "loss": 0.7012, + "step": 52794 + }, + { + "epoch": 1.35, + "learning_rate": 1.2056357997759968e-06, + "loss": 0.5505, + "step": 52795 + }, + { + "epoch": 1.35, + "learning_rate": 1.2056087205999863e-06, + "loss": 0.6572, + "step": 52796 + }, + { + "epoch": 1.35, + "learning_rate": 1.2055816412665504e-06, + "loss": 0.7764, + "step": 52797 + }, + { + "epoch": 1.35, + "learning_rate": 1.2055545617757108e-06, + "loss": 0.6733, + "step": 52798 + }, + { + "epoch": 1.35, + "learning_rate": 1.2055274821274868e-06, + "loss": 0.7832, + "step": 52799 + }, + { + "epoch": 1.35, + "learning_rate": 1.2055004023219002e-06, + "loss": 0.4985, + "step": 52800 + }, + { + "epoch": 1.35, + "learning_rate": 1.205473322358971e-06, + "loss": 0.3915, + "step": 52801 + }, + { + "epoch": 1.35, + "learning_rate": 1.2054462422387207e-06, + "loss": 0.5244, + "step": 52802 + }, + { + "epoch": 1.35, + "learning_rate": 1.2054191619611699e-06, + "loss": 0.6377, + "step": 52803 + }, + { + "epoch": 1.35, + "learning_rate": 1.2053920815263385e-06, + "loss": 0.7837, + "step": 52804 + }, + { + "epoch": 1.35, + "learning_rate": 1.2053650009342481e-06, + "loss": 0.6982, + "step": 52805 + }, + { + "epoch": 1.35, + "learning_rate": 1.2053379201849192e-06, + "loss": 0.8516, + "step": 52806 + }, + { + "epoch": 1.35, + "learning_rate": 1.2053108392783725e-06, + "loss": 0.709, + "step": 52807 + }, + { + "epoch": 1.35, + "learning_rate": 1.2052837582146287e-06, + "loss": 0.5088, + "step": 52808 + }, + { + "epoch": 1.35, + "learning_rate": 1.2052566769937084e-06, + "loss": 0.666, + "step": 52809 + }, + { + "epoch": 1.35, + "learning_rate": 1.2052295956156327e-06, + "loss": 0.6377, + "step": 52810 + }, + { + "epoch": 1.35, + "learning_rate": 1.205202514080422e-06, + "loss": 0.5959, + "step": 52811 + }, + { + "epoch": 1.35, + "learning_rate": 1.205175432388097e-06, + "loss": 0.6787, + "step": 52812 + }, + { + "epoch": 1.35, + "learning_rate": 1.2051483505386792e-06, + "loss": 0.7188, + "step": 52813 + }, + { + "epoch": 1.35, + "learning_rate": 1.2051212685321882e-06, + "loss": 0.6738, + "step": 52814 + }, + { + "epoch": 1.35, + "learning_rate": 1.2050941863686457e-06, + "loss": 0.6294, + "step": 52815 + }, + { + "epoch": 1.35, + "learning_rate": 1.2050671040480715e-06, + "loss": 0.4299, + "step": 52816 + }, + { + "epoch": 1.35, + "learning_rate": 1.2050400215704874e-06, + "loss": 0.6357, + "step": 52817 + }, + { + "epoch": 1.35, + "learning_rate": 1.2050129389359134e-06, + "loss": 0.6504, + "step": 52818 + }, + { + "epoch": 1.35, + "learning_rate": 1.2049858561443705e-06, + "loss": 0.5239, + "step": 52819 + }, + { + "epoch": 1.35, + "learning_rate": 1.2049587731958789e-06, + "loss": 0.5789, + "step": 52820 + }, + { + "epoch": 1.35, + "learning_rate": 1.2049316900904602e-06, + "loss": 0.9365, + "step": 52821 + }, + { + "epoch": 1.35, + "learning_rate": 1.2049046068281342e-06, + "loss": 0.6431, + "step": 52822 + }, + { + "epoch": 1.35, + "learning_rate": 1.2048775234089227e-06, + "loss": 0.7109, + "step": 52823 + }, + { + "epoch": 1.35, + "learning_rate": 1.204850439832846e-06, + "loss": 0.564, + "step": 52824 + }, + { + "epoch": 1.35, + "learning_rate": 1.2048233560999246e-06, + "loss": 0.5605, + "step": 52825 + }, + { + "epoch": 1.35, + "learning_rate": 1.2047962722101793e-06, + "loss": 0.4993, + "step": 52826 + }, + { + "epoch": 1.35, + "learning_rate": 1.2047691881636308e-06, + "loss": 0.6274, + "step": 52827 + }, + { + "epoch": 1.35, + "learning_rate": 1.2047421039603001e-06, + "loss": 0.6846, + "step": 52828 + }, + { + "epoch": 1.35, + "learning_rate": 1.2047150196002076e-06, + "loss": 0.7124, + "step": 52829 + }, + { + "epoch": 1.35, + "learning_rate": 1.2046879350833746e-06, + "loss": 0.6357, + "step": 52830 + }, + { + "epoch": 1.35, + "learning_rate": 1.2046608504098207e-06, + "loss": 0.7373, + "step": 52831 + }, + { + "epoch": 1.35, + "learning_rate": 1.2046337655795682e-06, + "loss": 0.8271, + "step": 52832 + }, + { + "epoch": 1.35, + "learning_rate": 1.204606680592637e-06, + "loss": 0.5295, + "step": 52833 + }, + { + "epoch": 1.35, + "learning_rate": 1.2045795954490474e-06, + "loss": 0.7266, + "step": 52834 + }, + { + "epoch": 1.35, + "learning_rate": 1.2045525101488207e-06, + "loss": 0.5879, + "step": 52835 + }, + { + "epoch": 1.35, + "learning_rate": 1.2045254246919778e-06, + "loss": 0.6709, + "step": 52836 + }, + { + "epoch": 1.35, + "learning_rate": 1.204498339078539e-06, + "loss": 0.6201, + "step": 52837 + }, + { + "epoch": 1.35, + "learning_rate": 1.2044712533085255e-06, + "loss": 0.7393, + "step": 52838 + }, + { + "epoch": 1.35, + "learning_rate": 1.2044441673819575e-06, + "loss": 0.6562, + "step": 52839 + }, + { + "epoch": 1.35, + "learning_rate": 1.2044170812988562e-06, + "loss": 0.6758, + "step": 52840 + }, + { + "epoch": 1.35, + "learning_rate": 1.2043899950592418e-06, + "loss": 0.6364, + "step": 52841 + }, + { + "epoch": 1.35, + "learning_rate": 1.2043629086631355e-06, + "loss": 0.585, + "step": 52842 + }, + { + "epoch": 1.35, + "learning_rate": 1.2043358221105581e-06, + "loss": 0.5249, + "step": 52843 + }, + { + "epoch": 1.35, + "learning_rate": 1.2043087354015301e-06, + "loss": 0.5386, + "step": 52844 + }, + { + "epoch": 1.35, + "learning_rate": 1.204281648536072e-06, + "loss": 0.5745, + "step": 52845 + }, + { + "epoch": 1.35, + "learning_rate": 1.2042545615142052e-06, + "loss": 0.6738, + "step": 52846 + }, + { + "epoch": 1.35, + "learning_rate": 1.20422747433595e-06, + "loss": 0.7461, + "step": 52847 + }, + { + "epoch": 1.35, + "learning_rate": 1.2042003870013272e-06, + "loss": 0.5771, + "step": 52848 + }, + { + "epoch": 1.35, + "learning_rate": 1.2041732995103575e-06, + "loss": 0.6191, + "step": 52849 + }, + { + "epoch": 1.35, + "learning_rate": 1.2041462118630616e-06, + "loss": 0.6304, + "step": 52850 + }, + { + "epoch": 1.35, + "learning_rate": 1.2041191240594606e-06, + "loss": 0.7354, + "step": 52851 + }, + { + "epoch": 1.35, + "learning_rate": 1.2040920360995748e-06, + "loss": 0.4292, + "step": 52852 + }, + { + "epoch": 1.35, + "learning_rate": 1.2040649479834252e-06, + "loss": 0.6113, + "step": 52853 + }, + { + "epoch": 1.35, + "learning_rate": 1.2040378597110323e-06, + "loss": 0.7119, + "step": 52854 + }, + { + "epoch": 1.35, + "learning_rate": 1.204010771282417e-06, + "loss": 0.7285, + "step": 52855 + }, + { + "epoch": 1.35, + "learning_rate": 1.2039836826976e-06, + "loss": 0.5723, + "step": 52856 + }, + { + "epoch": 1.35, + "learning_rate": 1.2039565939566024e-06, + "loss": 0.8125, + "step": 52857 + }, + { + "epoch": 1.35, + "learning_rate": 1.2039295050594444e-06, + "loss": 0.4546, + "step": 52858 + }, + { + "epoch": 1.35, + "learning_rate": 1.203902416006147e-06, + "loss": 0.5669, + "step": 52859 + }, + { + "epoch": 1.35, + "learning_rate": 1.2038753267967307e-06, + "loss": 0.6289, + "step": 52860 + }, + { + "epoch": 1.35, + "learning_rate": 1.2038482374312166e-06, + "loss": 0.5566, + "step": 52861 + }, + { + "epoch": 1.35, + "learning_rate": 1.2038211479096253e-06, + "loss": 0.7939, + "step": 52862 + }, + { + "epoch": 1.35, + "learning_rate": 1.2037940582319776e-06, + "loss": 0.4897, + "step": 52863 + }, + { + "epoch": 1.35, + "learning_rate": 1.2037669683982938e-06, + "loss": 0.4961, + "step": 52864 + }, + { + "epoch": 1.35, + "learning_rate": 1.2037398784085954e-06, + "loss": 0.5129, + "step": 52865 + }, + { + "epoch": 1.35, + "learning_rate": 1.2037127882629025e-06, + "loss": 0.5444, + "step": 52866 + }, + { + "epoch": 1.36, + "learning_rate": 1.2036856979612362e-06, + "loss": 0.5889, + "step": 52867 + }, + { + "epoch": 1.36, + "learning_rate": 1.2036586075036173e-06, + "loss": 0.3687, + "step": 52868 + }, + { + "epoch": 1.36, + "learning_rate": 1.2036315168900662e-06, + "loss": 0.8867, + "step": 52869 + }, + { + "epoch": 1.36, + "learning_rate": 1.2036044261206035e-06, + "loss": 0.5645, + "step": 52870 + }, + { + "epoch": 1.36, + "learning_rate": 1.2035773351952507e-06, + "loss": 0.7129, + "step": 52871 + }, + { + "epoch": 1.36, + "learning_rate": 1.2035502441140277e-06, + "loss": 0.6738, + "step": 52872 + }, + { + "epoch": 1.36, + "learning_rate": 1.203523152876956e-06, + "loss": 0.6299, + "step": 52873 + }, + { + "epoch": 1.36, + "learning_rate": 1.2034960614840558e-06, + "loss": 0.6689, + "step": 52874 + }, + { + "epoch": 1.36, + "learning_rate": 1.203468969935348e-06, + "loss": 0.6963, + "step": 52875 + }, + { + "epoch": 1.36, + "learning_rate": 1.2034418782308536e-06, + "loss": 0.5596, + "step": 52876 + }, + { + "epoch": 1.36, + "learning_rate": 1.2034147863705928e-06, + "loss": 0.4956, + "step": 52877 + }, + { + "epoch": 1.36, + "learning_rate": 1.2033876943545869e-06, + "loss": 0.6416, + "step": 52878 + }, + { + "epoch": 1.36, + "learning_rate": 1.2033606021828562e-06, + "loss": 0.6665, + "step": 52879 + }, + { + "epoch": 1.36, + "learning_rate": 1.2033335098554218e-06, + "loss": 0.6328, + "step": 52880 + }, + { + "epoch": 1.36, + "learning_rate": 1.203306417372304e-06, + "loss": 0.6616, + "step": 52881 + }, + { + "epoch": 1.36, + "learning_rate": 1.2032793247335241e-06, + "loss": 0.7168, + "step": 52882 + }, + { + "epoch": 1.36, + "learning_rate": 1.2032522319391025e-06, + "loss": 0.7041, + "step": 52883 + }, + { + "epoch": 1.36, + "learning_rate": 1.2032251389890601e-06, + "loss": 0.8604, + "step": 52884 + }, + { + "epoch": 1.36, + "learning_rate": 1.2031980458834174e-06, + "loss": 0.7305, + "step": 52885 + }, + { + "epoch": 1.36, + "learning_rate": 1.2031709526221953e-06, + "loss": 0.4582, + "step": 52886 + }, + { + "epoch": 1.36, + "learning_rate": 1.2031438592054145e-06, + "loss": 0.6626, + "step": 52887 + }, + { + "epoch": 1.36, + "learning_rate": 1.2031167656330963e-06, + "loss": 0.7041, + "step": 52888 + }, + { + "epoch": 1.36, + "learning_rate": 1.2030896719052604e-06, + "loss": 0.5801, + "step": 52889 + }, + { + "epoch": 1.36, + "learning_rate": 1.2030625780219284e-06, + "loss": 0.6133, + "step": 52890 + }, + { + "epoch": 1.36, + "learning_rate": 1.2030354839831203e-06, + "loss": 0.7432, + "step": 52891 + }, + { + "epoch": 1.36, + "learning_rate": 1.2030083897888575e-06, + "loss": 0.5537, + "step": 52892 + }, + { + "epoch": 1.36, + "learning_rate": 1.2029812954391605e-06, + "loss": 0.6992, + "step": 52893 + }, + { + "epoch": 1.36, + "learning_rate": 1.20295420093405e-06, + "loss": 0.5601, + "step": 52894 + }, + { + "epoch": 1.36, + "learning_rate": 1.2029271062735468e-06, + "loss": 0.4568, + "step": 52895 + }, + { + "epoch": 1.36, + "learning_rate": 1.2029000114576717e-06, + "loss": 0.6006, + "step": 52896 + }, + { + "epoch": 1.36, + "learning_rate": 1.2028729164864455e-06, + "loss": 0.5034, + "step": 52897 + }, + { + "epoch": 1.36, + "learning_rate": 1.2028458213598887e-06, + "loss": 0.5647, + "step": 52898 + }, + { + "epoch": 1.36, + "learning_rate": 1.2028187260780222e-06, + "loss": 0.5508, + "step": 52899 + }, + { + "epoch": 1.36, + "learning_rate": 1.2027916306408667e-06, + "loss": 0.7197, + "step": 52900 + }, + { + "epoch": 1.36, + "learning_rate": 1.202764535048443e-06, + "loss": 0.8926, + "step": 52901 + }, + { + "epoch": 1.36, + "learning_rate": 1.2027374393007716e-06, + "loss": 0.5474, + "step": 52902 + }, + { + "epoch": 1.36, + "learning_rate": 1.2027103433978743e-06, + "loss": 0.7734, + "step": 52903 + }, + { + "epoch": 1.36, + "learning_rate": 1.2026832473397702e-06, + "loss": 0.666, + "step": 52904 + }, + { + "epoch": 1.36, + "learning_rate": 1.202656151126481e-06, + "loss": 0.5503, + "step": 52905 + }, + { + "epoch": 1.36, + "learning_rate": 1.2026290547580274e-06, + "loss": 0.5315, + "step": 52906 + }, + { + "epoch": 1.36, + "learning_rate": 1.20260195823443e-06, + "loss": 0.6904, + "step": 52907 + }, + { + "epoch": 1.36, + "learning_rate": 1.2025748615557096e-06, + "loss": 0.5586, + "step": 52908 + }, + { + "epoch": 1.36, + "learning_rate": 1.2025477647218872e-06, + "loss": 0.6128, + "step": 52909 + }, + { + "epoch": 1.36, + "learning_rate": 1.202520667732983e-06, + "loss": 0.6338, + "step": 52910 + }, + { + "epoch": 1.36, + "learning_rate": 1.2024935705890177e-06, + "loss": 0.7178, + "step": 52911 + }, + { + "epoch": 1.36, + "learning_rate": 1.2024664732900128e-06, + "loss": 0.8662, + "step": 52912 + }, + { + "epoch": 1.36, + "learning_rate": 1.2024393758359888e-06, + "loss": 0.6323, + "step": 52913 + }, + { + "epoch": 1.36, + "learning_rate": 1.202412278226966e-06, + "loss": 0.708, + "step": 52914 + }, + { + "epoch": 1.36, + "learning_rate": 1.2023851804629657e-06, + "loss": 0.5972, + "step": 52915 + }, + { + "epoch": 1.36, + "learning_rate": 1.2023580825440079e-06, + "loss": 0.5542, + "step": 52916 + }, + { + "epoch": 1.36, + "learning_rate": 1.2023309844701142e-06, + "loss": 0.5938, + "step": 52917 + }, + { + "epoch": 1.36, + "learning_rate": 1.2023038862413049e-06, + "loss": 0.6523, + "step": 52918 + }, + { + "epoch": 1.36, + "learning_rate": 1.2022767878576008e-06, + "loss": 0.7227, + "step": 52919 + }, + { + "epoch": 1.36, + "learning_rate": 1.2022496893190225e-06, + "loss": 0.6777, + "step": 52920 + }, + { + "epoch": 1.36, + "learning_rate": 1.202222590625591e-06, + "loss": 0.748, + "step": 52921 + }, + { + "epoch": 1.36, + "learning_rate": 1.2021954917773272e-06, + "loss": 0.5986, + "step": 52922 + }, + { + "epoch": 1.36, + "learning_rate": 1.2021683927742514e-06, + "loss": 0.646, + "step": 52923 + }, + { + "epoch": 1.36, + "learning_rate": 1.2021412936163847e-06, + "loss": 0.7734, + "step": 52924 + }, + { + "epoch": 1.36, + "learning_rate": 1.2021141943037474e-06, + "loss": 0.6234, + "step": 52925 + }, + { + "epoch": 1.36, + "learning_rate": 1.2020870948363608e-06, + "loss": 0.5388, + "step": 52926 + }, + { + "epoch": 1.36, + "learning_rate": 1.2020599952142453e-06, + "loss": 0.6045, + "step": 52927 + }, + { + "epoch": 1.36, + "learning_rate": 1.2020328954374219e-06, + "loss": 0.6836, + "step": 52928 + }, + { + "epoch": 1.36, + "learning_rate": 1.202005795505911e-06, + "loss": 0.8174, + "step": 52929 + }, + { + "epoch": 1.36, + "learning_rate": 1.2019786954197338e-06, + "loss": 0.7456, + "step": 52930 + }, + { + "epoch": 1.36, + "learning_rate": 1.2019515951789105e-06, + "loss": 0.6831, + "step": 52931 + }, + { + "epoch": 1.36, + "learning_rate": 1.2019244947834623e-06, + "loss": 0.7852, + "step": 52932 + }, + { + "epoch": 1.36, + "learning_rate": 1.20189739423341e-06, + "loss": 0.6196, + "step": 52933 + }, + { + "epoch": 1.36, + "learning_rate": 1.2018702935287739e-06, + "loss": 0.707, + "step": 52934 + }, + { + "epoch": 1.36, + "learning_rate": 1.201843192669575e-06, + "loss": 0.7559, + "step": 52935 + }, + { + "epoch": 1.36, + "learning_rate": 1.2018160916558342e-06, + "loss": 0.3564, + "step": 52936 + }, + { + "epoch": 1.36, + "learning_rate": 1.2017889904875718e-06, + "loss": 0.6475, + "step": 52937 + }, + { + "epoch": 1.36, + "learning_rate": 1.2017618891648091e-06, + "loss": 0.6528, + "step": 52938 + }, + { + "epoch": 1.36, + "learning_rate": 1.2017347876875667e-06, + "loss": 0.709, + "step": 52939 + }, + { + "epoch": 1.36, + "learning_rate": 1.2017076860558648e-06, + "loss": 0.7266, + "step": 52940 + }, + { + "epoch": 1.36, + "learning_rate": 1.201680584269725e-06, + "loss": 0.708, + "step": 52941 + }, + { + "epoch": 1.36, + "learning_rate": 1.2016534823291677e-06, + "loss": 0.6621, + "step": 52942 + }, + { + "epoch": 1.36, + "learning_rate": 1.2016263802342135e-06, + "loss": 0.5044, + "step": 52943 + }, + { + "epoch": 1.36, + "learning_rate": 1.201599277984883e-06, + "loss": 0.7344, + "step": 52944 + }, + { + "epoch": 1.36, + "learning_rate": 1.2015721755811976e-06, + "loss": 0.6035, + "step": 52945 + }, + { + "epoch": 1.36, + "learning_rate": 1.2015450730231773e-06, + "loss": 0.6816, + "step": 52946 + }, + { + "epoch": 1.36, + "learning_rate": 1.2015179703108433e-06, + "loss": 0.5898, + "step": 52947 + }, + { + "epoch": 1.36, + "learning_rate": 1.2014908674442163e-06, + "loss": 0.7178, + "step": 52948 + }, + { + "epoch": 1.36, + "learning_rate": 1.2014637644233171e-06, + "loss": 0.7334, + "step": 52949 + }, + { + "epoch": 1.36, + "learning_rate": 1.2014366612481664e-06, + "loss": 0.6309, + "step": 52950 + }, + { + "epoch": 1.36, + "learning_rate": 1.2014095579187848e-06, + "loss": 0.7383, + "step": 52951 + }, + { + "epoch": 1.36, + "learning_rate": 1.201382454435193e-06, + "loss": 0.5447, + "step": 52952 + }, + { + "epoch": 1.36, + "learning_rate": 1.2013553507974124e-06, + "loss": 0.918, + "step": 52953 + }, + { + "epoch": 1.36, + "learning_rate": 1.2013282470054626e-06, + "loss": 0.7344, + "step": 52954 + }, + { + "epoch": 1.36, + "learning_rate": 1.2013011430593656e-06, + "loss": 0.5684, + "step": 52955 + }, + { + "epoch": 1.36, + "learning_rate": 1.2012740389591412e-06, + "loss": 0.8545, + "step": 52956 + }, + { + "epoch": 1.36, + "learning_rate": 1.2012469347048106e-06, + "loss": 0.791, + "step": 52957 + }, + { + "epoch": 1.36, + "learning_rate": 1.2012198302963946e-06, + "loss": 0.585, + "step": 52958 + }, + { + "epoch": 1.36, + "learning_rate": 1.2011927257339138e-06, + "loss": 0.7153, + "step": 52959 + }, + { + "epoch": 1.36, + "learning_rate": 1.201165621017389e-06, + "loss": 0.7002, + "step": 52960 + }, + { + "epoch": 1.36, + "learning_rate": 1.2011385161468408e-06, + "loss": 0.5879, + "step": 52961 + }, + { + "epoch": 1.36, + "learning_rate": 1.20111141112229e-06, + "loss": 0.7363, + "step": 52962 + }, + { + "epoch": 1.36, + "learning_rate": 1.2010843059437577e-06, + "loss": 0.6445, + "step": 52963 + }, + { + "epoch": 1.36, + "learning_rate": 1.2010572006112643e-06, + "loss": 0.6406, + "step": 52964 + }, + { + "epoch": 1.36, + "learning_rate": 1.2010300951248305e-06, + "loss": 0.5591, + "step": 52965 + }, + { + "epoch": 1.36, + "learning_rate": 1.2010029894844774e-06, + "loss": 0.7441, + "step": 52966 + }, + { + "epoch": 1.36, + "learning_rate": 1.2009758836902252e-06, + "loss": 0.7646, + "step": 52967 + }, + { + "epoch": 1.36, + "learning_rate": 1.2009487777420958e-06, + "loss": 0.5776, + "step": 52968 + }, + { + "epoch": 1.36, + "learning_rate": 1.2009216716401085e-06, + "loss": 0.7773, + "step": 52969 + }, + { + "epoch": 1.36, + "learning_rate": 1.2008945653842848e-06, + "loss": 0.5776, + "step": 52970 + }, + { + "epoch": 1.36, + "learning_rate": 1.2008674589746452e-06, + "loss": 0.7227, + "step": 52971 + }, + { + "epoch": 1.36, + "learning_rate": 1.200840352411211e-06, + "loss": 0.8301, + "step": 52972 + }, + { + "epoch": 1.36, + "learning_rate": 1.2008132456940026e-06, + "loss": 0.3735, + "step": 52973 + }, + { + "epoch": 1.36, + "learning_rate": 1.2007861388230404e-06, + "loss": 0.7246, + "step": 52974 + }, + { + "epoch": 1.36, + "learning_rate": 1.2007590317983456e-06, + "loss": 0.751, + "step": 52975 + }, + { + "epoch": 1.36, + "learning_rate": 1.200731924619939e-06, + "loss": 0.6436, + "step": 52976 + }, + { + "epoch": 1.36, + "learning_rate": 1.2007048172878409e-06, + "loss": 0.5481, + "step": 52977 + }, + { + "epoch": 1.36, + "learning_rate": 1.2006777098020728e-06, + "loss": 0.8057, + "step": 52978 + }, + { + "epoch": 1.36, + "learning_rate": 1.2006506021626548e-06, + "loss": 0.8311, + "step": 52979 + }, + { + "epoch": 1.36, + "learning_rate": 1.2006234943696078e-06, + "loss": 0.6108, + "step": 52980 + }, + { + "epoch": 1.36, + "learning_rate": 1.2005963864229526e-06, + "loss": 0.6143, + "step": 52981 + }, + { + "epoch": 1.36, + "learning_rate": 1.20056927832271e-06, + "loss": 0.6978, + "step": 52982 + }, + { + "epoch": 1.36, + "learning_rate": 1.2005421700689007e-06, + "loss": 0.6719, + "step": 52983 + }, + { + "epoch": 1.36, + "learning_rate": 1.2005150616615453e-06, + "loss": 0.5957, + "step": 52984 + }, + { + "epoch": 1.36, + "learning_rate": 1.200487953100665e-06, + "loss": 0.6067, + "step": 52985 + }, + { + "epoch": 1.36, + "learning_rate": 1.20046084438628e-06, + "loss": 0.6211, + "step": 52986 + }, + { + "epoch": 1.36, + "learning_rate": 1.2004337355184118e-06, + "loss": 0.5889, + "step": 52987 + }, + { + "epoch": 1.36, + "learning_rate": 1.2004066264970805e-06, + "loss": 0.7842, + "step": 52988 + }, + { + "epoch": 1.36, + "learning_rate": 1.2003795173223072e-06, + "loss": 0.6182, + "step": 52989 + }, + { + "epoch": 1.36, + "learning_rate": 1.2003524079941124e-06, + "loss": 0.5646, + "step": 52990 + }, + { + "epoch": 1.36, + "learning_rate": 1.2003252985125168e-06, + "loss": 0.7178, + "step": 52991 + }, + { + "epoch": 1.36, + "learning_rate": 1.2002981888775411e-06, + "loss": 0.5605, + "step": 52992 + }, + { + "epoch": 1.36, + "learning_rate": 1.2002710790892072e-06, + "loss": 0.7646, + "step": 52993 + }, + { + "epoch": 1.36, + "learning_rate": 1.2002439691475342e-06, + "loss": 0.6982, + "step": 52994 + }, + { + "epoch": 1.36, + "learning_rate": 1.2002168590525438e-06, + "loss": 0.707, + "step": 52995 + }, + { + "epoch": 1.36, + "learning_rate": 1.2001897488042566e-06, + "loss": 0.7217, + "step": 52996 + }, + { + "epoch": 1.36, + "learning_rate": 1.2001626384026932e-06, + "loss": 0.6333, + "step": 52997 + }, + { + "epoch": 1.36, + "learning_rate": 1.2001355278478747e-06, + "loss": 0.4363, + "step": 52998 + }, + { + "epoch": 1.36, + "learning_rate": 1.2001084171398215e-06, + "loss": 0.7334, + "step": 52999 + }, + { + "epoch": 1.36, + "learning_rate": 1.200081306278554e-06, + "loss": 0.7031, + "step": 53000 + }, + { + "epoch": 1.36, + "learning_rate": 1.2000541952640942e-06, + "loss": 0.5781, + "step": 53001 + }, + { + "epoch": 1.36, + "learning_rate": 1.2000270840964617e-06, + "loss": 0.6768, + "step": 53002 + }, + { + "epoch": 1.36, + "learning_rate": 1.1999999727756777e-06, + "loss": 0.7734, + "step": 53003 + }, + { + "epoch": 1.36, + "learning_rate": 1.1999728613017632e-06, + "loss": 0.7168, + "step": 53004 + }, + { + "epoch": 1.36, + "learning_rate": 1.1999457496747386e-06, + "loss": 0.6699, + "step": 53005 + }, + { + "epoch": 1.36, + "learning_rate": 1.1999186378946242e-06, + "loss": 0.5391, + "step": 53006 + }, + { + "epoch": 1.36, + "learning_rate": 1.199891525961442e-06, + "loss": 0.6187, + "step": 53007 + }, + { + "epoch": 1.36, + "learning_rate": 1.1998644138752117e-06, + "loss": 0.5884, + "step": 53008 + }, + { + "epoch": 1.36, + "learning_rate": 1.1998373016359543e-06, + "loss": 0.6885, + "step": 53009 + }, + { + "epoch": 1.36, + "learning_rate": 1.1998101892436907e-06, + "loss": 0.6602, + "step": 53010 + }, + { + "epoch": 1.36, + "learning_rate": 1.1997830766984415e-06, + "loss": 0.7031, + "step": 53011 + }, + { + "epoch": 1.36, + "learning_rate": 1.1997559640002281e-06, + "loss": 0.626, + "step": 53012 + }, + { + "epoch": 1.36, + "learning_rate": 1.1997288511490705e-06, + "loss": 0.6006, + "step": 53013 + }, + { + "epoch": 1.36, + "learning_rate": 1.1997017381449897e-06, + "loss": 0.7295, + "step": 53014 + }, + { + "epoch": 1.36, + "learning_rate": 1.1996746249880063e-06, + "loss": 0.6965, + "step": 53015 + }, + { + "epoch": 1.36, + "learning_rate": 1.1996475116781414e-06, + "loss": 0.6167, + "step": 53016 + }, + { + "epoch": 1.36, + "learning_rate": 1.1996203982154153e-06, + "loss": 0.5044, + "step": 53017 + }, + { + "epoch": 1.36, + "learning_rate": 1.1995932845998496e-06, + "loss": 0.626, + "step": 53018 + }, + { + "epoch": 1.36, + "learning_rate": 1.1995661708314639e-06, + "loss": 0.4576, + "step": 53019 + }, + { + "epoch": 1.36, + "learning_rate": 1.19953905691028e-06, + "loss": 0.647, + "step": 53020 + }, + { + "epoch": 1.36, + "learning_rate": 1.1995119428363178e-06, + "loss": 0.583, + "step": 53021 + }, + { + "epoch": 1.36, + "learning_rate": 1.199484828609599e-06, + "loss": 0.5718, + "step": 53022 + }, + { + "epoch": 1.36, + "learning_rate": 1.1994577142301433e-06, + "loss": 0.688, + "step": 53023 + }, + { + "epoch": 1.36, + "learning_rate": 1.1994305996979726e-06, + "loss": 0.6885, + "step": 53024 + }, + { + "epoch": 1.36, + "learning_rate": 1.1994034850131065e-06, + "loss": 0.5513, + "step": 53025 + }, + { + "epoch": 1.36, + "learning_rate": 1.1993763701755666e-06, + "loss": 0.5674, + "step": 53026 + }, + { + "epoch": 1.36, + "learning_rate": 1.1993492551853733e-06, + "loss": 0.5171, + "step": 53027 + }, + { + "epoch": 1.36, + "learning_rate": 1.1993221400425473e-06, + "loss": 0.5986, + "step": 53028 + }, + { + "epoch": 1.36, + "learning_rate": 1.1992950247471098e-06, + "loss": 0.5118, + "step": 53029 + }, + { + "epoch": 1.36, + "learning_rate": 1.199267909299081e-06, + "loss": 0.8975, + "step": 53030 + }, + { + "epoch": 1.36, + "learning_rate": 1.1992407936984822e-06, + "loss": 0.7842, + "step": 53031 + }, + { + "epoch": 1.36, + "learning_rate": 1.1992136779453337e-06, + "loss": 0.5962, + "step": 53032 + }, + { + "epoch": 1.36, + "learning_rate": 1.1991865620396567e-06, + "loss": 0.604, + "step": 53033 + }, + { + "epoch": 1.36, + "learning_rate": 1.199159445981471e-06, + "loss": 0.7373, + "step": 53034 + }, + { + "epoch": 1.36, + "learning_rate": 1.1991323297707987e-06, + "loss": 0.6504, + "step": 53035 + }, + { + "epoch": 1.36, + "learning_rate": 1.1991052134076599e-06, + "loss": 0.6196, + "step": 53036 + }, + { + "epoch": 1.36, + "learning_rate": 1.1990780968920754e-06, + "loss": 0.7178, + "step": 53037 + }, + { + "epoch": 1.36, + "learning_rate": 1.1990509802240658e-06, + "loss": 0.5977, + "step": 53038 + }, + { + "epoch": 1.36, + "learning_rate": 1.199023863403652e-06, + "loss": 0.7021, + "step": 53039 + }, + { + "epoch": 1.36, + "learning_rate": 1.1989967464308549e-06, + "loss": 0.7305, + "step": 53040 + }, + { + "epoch": 1.36, + "learning_rate": 1.198969629305695e-06, + "loss": 0.5879, + "step": 53041 + }, + { + "epoch": 1.36, + "learning_rate": 1.1989425120281932e-06, + "loss": 0.9111, + "step": 53042 + }, + { + "epoch": 1.36, + "learning_rate": 1.1989153945983706e-06, + "loss": 0.5662, + "step": 53043 + }, + { + "epoch": 1.36, + "learning_rate": 1.1988882770162472e-06, + "loss": 0.6738, + "step": 53044 + }, + { + "epoch": 1.36, + "learning_rate": 1.1988611592818446e-06, + "loss": 0.6895, + "step": 53045 + }, + { + "epoch": 1.36, + "learning_rate": 1.1988340413951826e-06, + "loss": 0.6133, + "step": 53046 + }, + { + "epoch": 1.36, + "learning_rate": 1.198806923356283e-06, + "loss": 0.3467, + "step": 53047 + }, + { + "epoch": 1.36, + "learning_rate": 1.1987798051651659e-06, + "loss": 0.791, + "step": 53048 + }, + { + "epoch": 1.36, + "learning_rate": 1.1987526868218523e-06, + "loss": 0.7119, + "step": 53049 + }, + { + "epoch": 1.36, + "learning_rate": 1.1987255683263627e-06, + "loss": 0.8555, + "step": 53050 + }, + { + "epoch": 1.36, + "learning_rate": 1.1986984496787182e-06, + "loss": 0.707, + "step": 53051 + }, + { + "epoch": 1.36, + "learning_rate": 1.1986713308789397e-06, + "loss": 0.7656, + "step": 53052 + }, + { + "epoch": 1.36, + "learning_rate": 1.1986442119270473e-06, + "loss": 0.5557, + "step": 53053 + }, + { + "epoch": 1.36, + "learning_rate": 1.1986170928230623e-06, + "loss": 0.6001, + "step": 53054 + }, + { + "epoch": 1.36, + "learning_rate": 1.1985899735670053e-06, + "loss": 0.709, + "step": 53055 + }, + { + "epoch": 1.36, + "learning_rate": 1.1985628541588972e-06, + "loss": 0.6172, + "step": 53056 + }, + { + "epoch": 1.36, + "learning_rate": 1.1985357345987588e-06, + "loss": 0.6111, + "step": 53057 + }, + { + "epoch": 1.36, + "learning_rate": 1.1985086148866103e-06, + "loss": 0.6348, + "step": 53058 + }, + { + "epoch": 1.36, + "learning_rate": 1.198481495022473e-06, + "loss": 0.7979, + "step": 53059 + }, + { + "epoch": 1.36, + "learning_rate": 1.1984543750063678e-06, + "loss": 0.5322, + "step": 53060 + }, + { + "epoch": 1.36, + "learning_rate": 1.1984272548383149e-06, + "loss": 0.5063, + "step": 53061 + }, + { + "epoch": 1.36, + "learning_rate": 1.198400134518336e-06, + "loss": 0.4961, + "step": 53062 + }, + { + "epoch": 1.36, + "learning_rate": 1.1983730140464502e-06, + "loss": 0.7344, + "step": 53063 + }, + { + "epoch": 1.36, + "learning_rate": 1.1983458934226802e-06, + "loss": 0.5815, + "step": 53064 + }, + { + "epoch": 1.36, + "learning_rate": 1.1983187726470454e-06, + "loss": 0.8223, + "step": 53065 + }, + { + "epoch": 1.36, + "learning_rate": 1.1982916517195671e-06, + "loss": 0.5825, + "step": 53066 + }, + { + "epoch": 1.36, + "learning_rate": 1.1982645306402664e-06, + "loss": 0.5166, + "step": 53067 + }, + { + "epoch": 1.36, + "learning_rate": 1.1982374094091632e-06, + "loss": 0.7529, + "step": 53068 + }, + { + "epoch": 1.36, + "learning_rate": 1.1982102880262788e-06, + "loss": 0.6299, + "step": 53069 + }, + { + "epoch": 1.36, + "learning_rate": 1.198183166491634e-06, + "loss": 0.4932, + "step": 53070 + }, + { + "epoch": 1.36, + "learning_rate": 1.1981560448052493e-06, + "loss": 0.7666, + "step": 53071 + }, + { + "epoch": 1.36, + "learning_rate": 1.198128922967146e-06, + "loss": 0.4243, + "step": 53072 + }, + { + "epoch": 1.36, + "learning_rate": 1.198101800977344e-06, + "loss": 0.7305, + "step": 53073 + }, + { + "epoch": 1.36, + "learning_rate": 1.1980746788358649e-06, + "loss": 0.6074, + "step": 53074 + }, + { + "epoch": 1.36, + "learning_rate": 1.198047556542729e-06, + "loss": 0.5547, + "step": 53075 + }, + { + "epoch": 1.36, + "learning_rate": 1.1980204340979573e-06, + "loss": 0.4724, + "step": 53076 + }, + { + "epoch": 1.36, + "learning_rate": 1.1979933115015703e-06, + "loss": 0.812, + "step": 53077 + }, + { + "epoch": 1.36, + "learning_rate": 1.197966188753589e-06, + "loss": 0.8213, + "step": 53078 + }, + { + "epoch": 1.36, + "learning_rate": 1.1979390658540342e-06, + "loss": 0.5547, + "step": 53079 + }, + { + "epoch": 1.36, + "learning_rate": 1.1979119428029264e-06, + "loss": 0.5439, + "step": 53080 + }, + { + "epoch": 1.36, + "learning_rate": 1.1978848196002864e-06, + "loss": 0.7139, + "step": 53081 + }, + { + "epoch": 1.36, + "learning_rate": 1.1978576962461356e-06, + "loss": 0.6924, + "step": 53082 + }, + { + "epoch": 1.36, + "learning_rate": 1.197830572740494e-06, + "loss": 0.7686, + "step": 53083 + }, + { + "epoch": 1.36, + "learning_rate": 1.1978034490833825e-06, + "loss": 0.7031, + "step": 53084 + }, + { + "epoch": 1.36, + "learning_rate": 1.197776325274822e-06, + "loss": 0.5586, + "step": 53085 + }, + { + "epoch": 1.36, + "learning_rate": 1.197749201314833e-06, + "loss": 0.584, + "step": 53086 + }, + { + "epoch": 1.36, + "learning_rate": 1.1977220772034373e-06, + "loss": 0.7935, + "step": 53087 + }, + { + "epoch": 1.36, + "learning_rate": 1.1976949529406541e-06, + "loss": 0.7002, + "step": 53088 + }, + { + "epoch": 1.36, + "learning_rate": 1.1976678285265057e-06, + "loss": 0.4824, + "step": 53089 + }, + { + "epoch": 1.36, + "learning_rate": 1.1976407039610115e-06, + "loss": 0.7656, + "step": 53090 + }, + { + "epoch": 1.36, + "learning_rate": 1.197613579244193e-06, + "loss": 0.75, + "step": 53091 + }, + { + "epoch": 1.36, + "learning_rate": 1.1975864543760712e-06, + "loss": 0.7588, + "step": 53092 + }, + { + "epoch": 1.36, + "learning_rate": 1.1975593293566664e-06, + "loss": 0.5659, + "step": 53093 + }, + { + "epoch": 1.36, + "learning_rate": 1.1975322041859994e-06, + "loss": 0.5076, + "step": 53094 + }, + { + "epoch": 1.36, + "learning_rate": 1.1975050788640913e-06, + "loss": 0.7012, + "step": 53095 + }, + { + "epoch": 1.36, + "learning_rate": 1.1974779533909622e-06, + "loss": 0.5815, + "step": 53096 + }, + { + "epoch": 1.36, + "learning_rate": 1.1974508277666339e-06, + "loss": 0.7451, + "step": 53097 + }, + { + "epoch": 1.36, + "learning_rate": 1.1974237019911262e-06, + "loss": 0.6958, + "step": 53098 + }, + { + "epoch": 1.36, + "learning_rate": 1.19739657606446e-06, + "loss": 0.4722, + "step": 53099 + }, + { + "epoch": 1.36, + "learning_rate": 1.1973694499866566e-06, + "loss": 0.6172, + "step": 53100 + }, + { + "epoch": 1.36, + "learning_rate": 1.1973423237577365e-06, + "loss": 0.5879, + "step": 53101 + }, + { + "epoch": 1.36, + "learning_rate": 1.197315197377721e-06, + "loss": 0.708, + "step": 53102 + }, + { + "epoch": 1.36, + "learning_rate": 1.1972880708466294e-06, + "loss": 0.5034, + "step": 53103 + }, + { + "epoch": 1.36, + "learning_rate": 1.1972609441644838e-06, + "loss": 0.5271, + "step": 53104 + }, + { + "epoch": 1.36, + "learning_rate": 1.1972338173313046e-06, + "loss": 0.5708, + "step": 53105 + }, + { + "epoch": 1.36, + "learning_rate": 1.1972066903471125e-06, + "loss": 0.7139, + "step": 53106 + }, + { + "epoch": 1.36, + "learning_rate": 1.1971795632119283e-06, + "loss": 0.7764, + "step": 53107 + }, + { + "epoch": 1.36, + "learning_rate": 1.197152435925773e-06, + "loss": 0.6274, + "step": 53108 + }, + { + "epoch": 1.36, + "learning_rate": 1.1971253084886667e-06, + "loss": 0.5254, + "step": 53109 + }, + { + "epoch": 1.36, + "learning_rate": 1.1970981809006308e-06, + "loss": 0.4862, + "step": 53110 + }, + { + "epoch": 1.36, + "learning_rate": 1.197071053161686e-06, + "loss": 0.7363, + "step": 53111 + }, + { + "epoch": 1.36, + "learning_rate": 1.1970439252718532e-06, + "loss": 0.7979, + "step": 53112 + }, + { + "epoch": 1.36, + "learning_rate": 1.1970167972311523e-06, + "loss": 0.7295, + "step": 53113 + }, + { + "epoch": 1.36, + "learning_rate": 1.196989669039605e-06, + "loss": 0.6602, + "step": 53114 + }, + { + "epoch": 1.36, + "learning_rate": 1.1969625406972318e-06, + "loss": 0.7617, + "step": 53115 + }, + { + "epoch": 1.36, + "learning_rate": 1.1969354122040533e-06, + "loss": 0.5861, + "step": 53116 + }, + { + "epoch": 1.36, + "learning_rate": 1.1969082835600908e-06, + "loss": 0.7461, + "step": 53117 + }, + { + "epoch": 1.36, + "learning_rate": 1.1968811547653641e-06, + "loss": 0.6689, + "step": 53118 + }, + { + "epoch": 1.36, + "learning_rate": 1.1968540258198952e-06, + "loss": 0.5601, + "step": 53119 + }, + { + "epoch": 1.36, + "learning_rate": 1.1968268967237035e-06, + "loss": 0.7021, + "step": 53120 + }, + { + "epoch": 1.36, + "learning_rate": 1.1967997674768112e-06, + "loss": 0.4207, + "step": 53121 + }, + { + "epoch": 1.36, + "learning_rate": 1.196772638079238e-06, + "loss": 0.6826, + "step": 53122 + }, + { + "epoch": 1.36, + "learning_rate": 1.1967455085310052e-06, + "loss": 0.6274, + "step": 53123 + }, + { + "epoch": 1.36, + "learning_rate": 1.196718378832133e-06, + "loss": 0.6099, + "step": 53124 + }, + { + "epoch": 1.36, + "learning_rate": 1.196691248982643e-06, + "loss": 0.6899, + "step": 53125 + }, + { + "epoch": 1.36, + "learning_rate": 1.1966641189825552e-06, + "loss": 0.666, + "step": 53126 + }, + { + "epoch": 1.36, + "learning_rate": 1.1966369888318912e-06, + "loss": 0.793, + "step": 53127 + }, + { + "epoch": 1.36, + "learning_rate": 1.1966098585306709e-06, + "loss": 0.8486, + "step": 53128 + }, + { + "epoch": 1.36, + "learning_rate": 1.1965827280789159e-06, + "loss": 0.6284, + "step": 53129 + }, + { + "epoch": 1.36, + "learning_rate": 1.196555597476646e-06, + "loss": 0.8975, + "step": 53130 + }, + { + "epoch": 1.36, + "learning_rate": 1.1965284667238829e-06, + "loss": 0.6943, + "step": 53131 + }, + { + "epoch": 1.36, + "learning_rate": 1.196501335820647e-06, + "loss": 0.5811, + "step": 53132 + }, + { + "epoch": 1.36, + "learning_rate": 1.196474204766959e-06, + "loss": 0.6904, + "step": 53133 + }, + { + "epoch": 1.36, + "learning_rate": 1.1964470735628395e-06, + "loss": 0.5835, + "step": 53134 + }, + { + "epoch": 1.36, + "learning_rate": 1.1964199422083096e-06, + "loss": 0.561, + "step": 53135 + }, + { + "epoch": 1.36, + "learning_rate": 1.19639281070339e-06, + "loss": 0.5415, + "step": 53136 + }, + { + "epoch": 1.36, + "learning_rate": 1.1963656790481015e-06, + "loss": 0.667, + "step": 53137 + }, + { + "epoch": 1.36, + "learning_rate": 1.1963385472424651e-06, + "loss": 0.5693, + "step": 53138 + }, + { + "epoch": 1.36, + "learning_rate": 1.196311415286501e-06, + "loss": 0.5659, + "step": 53139 + }, + { + "epoch": 1.36, + "learning_rate": 1.1962842831802301e-06, + "loss": 0.6211, + "step": 53140 + }, + { + "epoch": 1.36, + "learning_rate": 1.1962571509236738e-06, + "loss": 0.7188, + "step": 53141 + }, + { + "epoch": 1.36, + "learning_rate": 1.1962300185168524e-06, + "loss": 0.6904, + "step": 53142 + }, + { + "epoch": 1.36, + "learning_rate": 1.1962028859597864e-06, + "loss": 0.6992, + "step": 53143 + }, + { + "epoch": 1.36, + "learning_rate": 1.196175753252497e-06, + "loss": 0.6631, + "step": 53144 + }, + { + "epoch": 1.36, + "learning_rate": 1.1961486203950045e-06, + "loss": 0.5298, + "step": 53145 + }, + { + "epoch": 1.36, + "learning_rate": 1.1961214873873304e-06, + "loss": 0.6768, + "step": 53146 + }, + { + "epoch": 1.36, + "learning_rate": 1.1960943542294952e-06, + "loss": 0.6377, + "step": 53147 + }, + { + "epoch": 1.36, + "learning_rate": 1.1960672209215195e-06, + "loss": 0.7256, + "step": 53148 + }, + { + "epoch": 1.36, + "learning_rate": 1.196040087463424e-06, + "loss": 0.7188, + "step": 53149 + }, + { + "epoch": 1.36, + "learning_rate": 1.1960129538552296e-06, + "loss": 0.6943, + "step": 53150 + }, + { + "epoch": 1.36, + "learning_rate": 1.195985820096957e-06, + "loss": 0.6665, + "step": 53151 + }, + { + "epoch": 1.36, + "learning_rate": 1.1959586861886276e-06, + "loss": 0.7266, + "step": 53152 + }, + { + "epoch": 1.36, + "learning_rate": 1.1959315521302611e-06, + "loss": 0.7061, + "step": 53153 + }, + { + "epoch": 1.36, + "learning_rate": 1.1959044179218792e-06, + "loss": 0.7598, + "step": 53154 + }, + { + "epoch": 1.36, + "learning_rate": 1.1958772835635017e-06, + "loss": 0.6816, + "step": 53155 + }, + { + "epoch": 1.36, + "learning_rate": 1.1958501490551505e-06, + "loss": 0.5848, + "step": 53156 + }, + { + "epoch": 1.36, + "learning_rate": 1.1958230143968458e-06, + "loss": 0.6973, + "step": 53157 + }, + { + "epoch": 1.36, + "learning_rate": 1.1957958795886085e-06, + "loss": 0.9038, + "step": 53158 + }, + { + "epoch": 1.36, + "learning_rate": 1.1957687446304589e-06, + "loss": 0.5923, + "step": 53159 + }, + { + "epoch": 1.36, + "learning_rate": 1.1957416095224185e-06, + "loss": 0.7295, + "step": 53160 + }, + { + "epoch": 1.36, + "learning_rate": 1.1957144742645075e-06, + "loss": 0.6738, + "step": 53161 + }, + { + "epoch": 1.36, + "learning_rate": 1.1956873388567472e-06, + "loss": 0.6992, + "step": 53162 + }, + { + "epoch": 1.36, + "learning_rate": 1.195660203299158e-06, + "loss": 0.5942, + "step": 53163 + }, + { + "epoch": 1.36, + "learning_rate": 1.1956330675917605e-06, + "loss": 0.5771, + "step": 53164 + }, + { + "epoch": 1.36, + "learning_rate": 1.195605931734576e-06, + "loss": 0.7314, + "step": 53165 + }, + { + "epoch": 1.36, + "learning_rate": 1.1955787957276251e-06, + "loss": 0.7373, + "step": 53166 + }, + { + "epoch": 1.36, + "learning_rate": 1.1955516595709287e-06, + "loss": 0.5996, + "step": 53167 + }, + { + "epoch": 1.36, + "learning_rate": 1.195524523264507e-06, + "loss": 0.6313, + "step": 53168 + }, + { + "epoch": 1.36, + "learning_rate": 1.1954973868083812e-06, + "loss": 0.5063, + "step": 53169 + }, + { + "epoch": 1.36, + "learning_rate": 1.1954702502025723e-06, + "loss": 0.7671, + "step": 53170 + }, + { + "epoch": 1.36, + "learning_rate": 1.1954431134471007e-06, + "loss": 0.5225, + "step": 53171 + }, + { + "epoch": 1.36, + "learning_rate": 1.1954159765419873e-06, + "loss": 0.6885, + "step": 53172 + }, + { + "epoch": 1.36, + "learning_rate": 1.1953888394872528e-06, + "loss": 0.6641, + "step": 53173 + }, + { + "epoch": 1.36, + "learning_rate": 1.1953617022829181e-06, + "loss": 0.3948, + "step": 53174 + }, + { + "epoch": 1.36, + "learning_rate": 1.195334564929004e-06, + "loss": 0.7246, + "step": 53175 + }, + { + "epoch": 1.36, + "learning_rate": 1.1953074274255309e-06, + "loss": 0.4675, + "step": 53176 + }, + { + "epoch": 1.36, + "learning_rate": 1.1952802897725203e-06, + "loss": 0.4858, + "step": 53177 + }, + { + "epoch": 1.36, + "learning_rate": 1.1952531519699923e-06, + "loss": 0.7358, + "step": 53178 + }, + { + "epoch": 1.36, + "learning_rate": 1.195226014017968e-06, + "loss": 0.7563, + "step": 53179 + }, + { + "epoch": 1.36, + "learning_rate": 1.195198875916468e-06, + "loss": 0.6201, + "step": 53180 + }, + { + "epoch": 1.36, + "learning_rate": 1.1951717376655132e-06, + "loss": 0.6494, + "step": 53181 + }, + { + "epoch": 1.36, + "learning_rate": 1.1951445992651248e-06, + "loss": 0.708, + "step": 53182 + }, + { + "epoch": 1.36, + "learning_rate": 1.1951174607153227e-06, + "loss": 0.6602, + "step": 53183 + }, + { + "epoch": 1.36, + "learning_rate": 1.1950903220161284e-06, + "loss": 0.5996, + "step": 53184 + }, + { + "epoch": 1.36, + "learning_rate": 1.1950631831675621e-06, + "loss": 0.5674, + "step": 53185 + }, + { + "epoch": 1.36, + "learning_rate": 1.195036044169645e-06, + "loss": 0.7412, + "step": 53186 + }, + { + "epoch": 1.36, + "learning_rate": 1.1950089050223979e-06, + "loss": 0.6277, + "step": 53187 + }, + { + "epoch": 1.36, + "learning_rate": 1.1949817657258416e-06, + "loss": 0.6377, + "step": 53188 + }, + { + "epoch": 1.36, + "learning_rate": 1.1949546262799964e-06, + "loss": 0.5037, + "step": 53189 + }, + { + "epoch": 1.36, + "learning_rate": 1.1949274866848835e-06, + "loss": 0.6533, + "step": 53190 + }, + { + "epoch": 1.36, + "learning_rate": 1.1949003469405235e-06, + "loss": 0.7773, + "step": 53191 + }, + { + "epoch": 1.36, + "learning_rate": 1.1948732070469376e-06, + "loss": 0.5015, + "step": 53192 + }, + { + "epoch": 1.36, + "learning_rate": 1.1948460670041457e-06, + "loss": 0.6533, + "step": 53193 + }, + { + "epoch": 1.36, + "learning_rate": 1.1948189268121697e-06, + "loss": 0.6089, + "step": 53194 + }, + { + "epoch": 1.36, + "learning_rate": 1.1947917864710296e-06, + "loss": 0.5381, + "step": 53195 + }, + { + "epoch": 1.36, + "learning_rate": 1.1947646459807464e-06, + "loss": 0.7314, + "step": 53196 + }, + { + "epoch": 1.36, + "learning_rate": 1.1947375053413407e-06, + "loss": 0.7192, + "step": 53197 + }, + { + "epoch": 1.36, + "learning_rate": 1.1947103645528335e-06, + "loss": 0.5615, + "step": 53198 + }, + { + "epoch": 1.36, + "learning_rate": 1.1946832236152456e-06, + "loss": 0.6221, + "step": 53199 + }, + { + "epoch": 1.36, + "learning_rate": 1.1946560825285976e-06, + "loss": 0.4744, + "step": 53200 + }, + { + "epoch": 1.36, + "learning_rate": 1.1946289412929106e-06, + "loss": 0.6709, + "step": 53201 + }, + { + "epoch": 1.36, + "learning_rate": 1.1946017999082053e-06, + "loss": 0.5996, + "step": 53202 + }, + { + "epoch": 1.36, + "learning_rate": 1.1945746583745018e-06, + "loss": 0.4644, + "step": 53203 + }, + { + "epoch": 1.36, + "learning_rate": 1.1945475166918217e-06, + "loss": 0.5981, + "step": 53204 + }, + { + "epoch": 1.36, + "learning_rate": 1.1945203748601856e-06, + "loss": 0.7217, + "step": 53205 + }, + { + "epoch": 1.36, + "learning_rate": 1.194493232879614e-06, + "loss": 0.5337, + "step": 53206 + }, + { + "epoch": 1.36, + "learning_rate": 1.1944660907501281e-06, + "loss": 0.9414, + "step": 53207 + }, + { + "epoch": 1.36, + "learning_rate": 1.1944389484717482e-06, + "loss": 0.5117, + "step": 53208 + }, + { + "epoch": 1.36, + "learning_rate": 1.1944118060444957e-06, + "loss": 0.5406, + "step": 53209 + }, + { + "epoch": 1.36, + "learning_rate": 1.1943846634683907e-06, + "loss": 0.6943, + "step": 53210 + }, + { + "epoch": 1.36, + "learning_rate": 1.1943575207434544e-06, + "loss": 0.6826, + "step": 53211 + }, + { + "epoch": 1.36, + "learning_rate": 1.1943303778697075e-06, + "loss": 0.5552, + "step": 53212 + }, + { + "epoch": 1.36, + "learning_rate": 1.1943032348471708e-06, + "loss": 0.6943, + "step": 53213 + }, + { + "epoch": 1.36, + "learning_rate": 1.1942760916758649e-06, + "loss": 0.6699, + "step": 53214 + }, + { + "epoch": 1.36, + "learning_rate": 1.1942489483558108e-06, + "loss": 0.7607, + "step": 53215 + }, + { + "epoch": 1.36, + "learning_rate": 1.1942218048870295e-06, + "loss": 0.7412, + "step": 53216 + }, + { + "epoch": 1.36, + "learning_rate": 1.1941946612695413e-06, + "loss": 0.5664, + "step": 53217 + }, + { + "epoch": 1.36, + "learning_rate": 1.194167517503367e-06, + "loss": 0.6758, + "step": 53218 + }, + { + "epoch": 1.36, + "learning_rate": 1.1941403735885278e-06, + "loss": 0.4351, + "step": 53219 + }, + { + "epoch": 1.36, + "learning_rate": 1.194113229525044e-06, + "loss": 0.4722, + "step": 53220 + }, + { + "epoch": 1.36, + "learning_rate": 1.194086085312937e-06, + "loss": 0.6252, + "step": 53221 + }, + { + "epoch": 1.36, + "learning_rate": 1.1940589409522269e-06, + "loss": 0.6572, + "step": 53222 + }, + { + "epoch": 1.36, + "learning_rate": 1.194031796442935e-06, + "loss": 0.7656, + "step": 53223 + }, + { + "epoch": 1.36, + "learning_rate": 1.1940046517850815e-06, + "loss": 0.5815, + "step": 53224 + }, + { + "epoch": 1.36, + "learning_rate": 1.1939775069786878e-06, + "loss": 0.707, + "step": 53225 + }, + { + "epoch": 1.36, + "learning_rate": 1.1939503620237744e-06, + "loss": 0.6841, + "step": 53226 + }, + { + "epoch": 1.36, + "learning_rate": 1.1939232169203621e-06, + "loss": 0.7773, + "step": 53227 + }, + { + "epoch": 1.36, + "learning_rate": 1.1938960716684718e-06, + "loss": 0.6772, + "step": 53228 + }, + { + "epoch": 1.36, + "learning_rate": 1.193868926268124e-06, + "loss": 0.6543, + "step": 53229 + }, + { + "epoch": 1.36, + "learning_rate": 1.19384178071934e-06, + "loss": 0.6538, + "step": 53230 + }, + { + "epoch": 1.36, + "learning_rate": 1.1938146350221401e-06, + "loss": 0.7305, + "step": 53231 + }, + { + "epoch": 1.36, + "learning_rate": 1.1937874891765453e-06, + "loss": 0.6855, + "step": 53232 + }, + { + "epoch": 1.36, + "learning_rate": 1.1937603431825762e-06, + "loss": 0.5825, + "step": 53233 + }, + { + "epoch": 1.36, + "learning_rate": 1.1937331970402537e-06, + "loss": 0.6211, + "step": 53234 + }, + { + "epoch": 1.36, + "learning_rate": 1.1937060507495986e-06, + "loss": 0.6826, + "step": 53235 + }, + { + "epoch": 1.36, + "learning_rate": 1.193678904310632e-06, + "loss": 0.7959, + "step": 53236 + }, + { + "epoch": 1.36, + "learning_rate": 1.1936517577233743e-06, + "loss": 0.7632, + "step": 53237 + }, + { + "epoch": 1.36, + "learning_rate": 1.193624610987846e-06, + "loss": 0.6826, + "step": 53238 + }, + { + "epoch": 1.36, + "learning_rate": 1.1935974641040684e-06, + "loss": 0.5571, + "step": 53239 + }, + { + "epoch": 1.36, + "learning_rate": 1.1935703170720623e-06, + "loss": 0.4951, + "step": 53240 + }, + { + "epoch": 1.36, + "learning_rate": 1.1935431698918479e-06, + "loss": 0.7461, + "step": 53241 + }, + { + "epoch": 1.36, + "learning_rate": 1.1935160225634471e-06, + "loss": 0.6152, + "step": 53242 + }, + { + "epoch": 1.36, + "learning_rate": 1.1934888750868792e-06, + "loss": 0.6548, + "step": 53243 + }, + { + "epoch": 1.36, + "learning_rate": 1.1934617274621664e-06, + "loss": 0.6904, + "step": 53244 + }, + { + "epoch": 1.36, + "learning_rate": 1.1934345796893284e-06, + "loss": 0.6162, + "step": 53245 + }, + { + "epoch": 1.36, + "learning_rate": 1.1934074317683866e-06, + "loss": 0.5151, + "step": 53246 + }, + { + "epoch": 1.36, + "learning_rate": 1.1933802836993617e-06, + "loss": 0.6084, + "step": 53247 + }, + { + "epoch": 1.36, + "learning_rate": 1.1933531354822743e-06, + "loss": 0.5518, + "step": 53248 + }, + { + "epoch": 1.36, + "learning_rate": 1.1933259871171453e-06, + "loss": 0.7607, + "step": 53249 + }, + { + "epoch": 1.36, + "learning_rate": 1.1932988386039956e-06, + "loss": 0.4438, + "step": 53250 + }, + { + "epoch": 1.36, + "learning_rate": 1.1932716899428455e-06, + "loss": 0.4241, + "step": 53251 + }, + { + "epoch": 1.36, + "learning_rate": 1.1932445411337164e-06, + "loss": 0.5088, + "step": 53252 + }, + { + "epoch": 1.36, + "learning_rate": 1.193217392176629e-06, + "loss": 0.9141, + "step": 53253 + }, + { + "epoch": 1.36, + "learning_rate": 1.1931902430716037e-06, + "loss": 0.6943, + "step": 53254 + }, + { + "epoch": 1.36, + "learning_rate": 1.1931630938186617e-06, + "loss": 0.7109, + "step": 53255 + }, + { + "epoch": 1.36, + "learning_rate": 1.1931359444178234e-06, + "loss": 0.5718, + "step": 53256 + }, + { + "epoch": 1.37, + "learning_rate": 1.19310879486911e-06, + "loss": 0.7998, + "step": 53257 + }, + { + "epoch": 1.37, + "learning_rate": 1.1930816451725417e-06, + "loss": 0.5977, + "step": 53258 + }, + { + "epoch": 1.37, + "learning_rate": 1.1930544953281402e-06, + "loss": 0.7725, + "step": 53259 + }, + { + "epoch": 1.37, + "learning_rate": 1.1930273453359255e-06, + "loss": 0.5359, + "step": 53260 + }, + { + "epoch": 1.37, + "learning_rate": 1.1930001951959185e-06, + "loss": 0.4628, + "step": 53261 + }, + { + "epoch": 1.37, + "learning_rate": 1.1929730449081403e-06, + "loss": 0.4663, + "step": 53262 + }, + { + "epoch": 1.37, + "learning_rate": 1.1929458944726116e-06, + "loss": 0.6816, + "step": 53263 + }, + { + "epoch": 1.37, + "learning_rate": 1.1929187438893528e-06, + "loss": 0.6492, + "step": 53264 + }, + { + "epoch": 1.37, + "learning_rate": 1.1928915931583851e-06, + "loss": 0.6426, + "step": 53265 + }, + { + "epoch": 1.37, + "learning_rate": 1.192864442279729e-06, + "loss": 0.6323, + "step": 53266 + }, + { + "epoch": 1.37, + "learning_rate": 1.192837291253406e-06, + "loss": 0.7749, + "step": 53267 + }, + { + "epoch": 1.37, + "learning_rate": 1.1928101400794362e-06, + "loss": 0.752, + "step": 53268 + }, + { + "epoch": 1.37, + "learning_rate": 1.1927829887578403e-06, + "loss": 0.5405, + "step": 53269 + }, + { + "epoch": 1.37, + "learning_rate": 1.1927558372886392e-06, + "loss": 0.7607, + "step": 53270 + }, + { + "epoch": 1.37, + "learning_rate": 1.192728685671854e-06, + "loss": 0.7227, + "step": 53271 + }, + { + "epoch": 1.37, + "learning_rate": 1.1927015339075056e-06, + "loss": 0.6895, + "step": 53272 + }, + { + "epoch": 1.37, + "learning_rate": 1.192674381995614e-06, + "loss": 0.5159, + "step": 53273 + }, + { + "epoch": 1.37, + "learning_rate": 1.1926472299362009e-06, + "loss": 0.7324, + "step": 53274 + }, + { + "epoch": 1.37, + "learning_rate": 1.1926200777292866e-06, + "loss": 0.5671, + "step": 53275 + }, + { + "epoch": 1.37, + "learning_rate": 1.1925929253748916e-06, + "loss": 0.6626, + "step": 53276 + }, + { + "epoch": 1.37, + "learning_rate": 1.1925657728730374e-06, + "loss": 0.4912, + "step": 53277 + }, + { + "epoch": 1.37, + "learning_rate": 1.1925386202237443e-06, + "loss": 0.5244, + "step": 53278 + }, + { + "epoch": 1.37, + "learning_rate": 1.1925114674270331e-06, + "loss": 0.7729, + "step": 53279 + }, + { + "epoch": 1.37, + "learning_rate": 1.1924843144829251e-06, + "loss": 0.6543, + "step": 53280 + }, + { + "epoch": 1.37, + "learning_rate": 1.1924571613914403e-06, + "loss": 0.6885, + "step": 53281 + }, + { + "epoch": 1.37, + "learning_rate": 1.1924300081526004e-06, + "loss": 0.4902, + "step": 53282 + }, + { + "epoch": 1.37, + "learning_rate": 1.1924028547664253e-06, + "loss": 0.3378, + "step": 53283 + }, + { + "epoch": 1.37, + "learning_rate": 1.1923757012329362e-06, + "loss": 0.7354, + "step": 53284 + }, + { + "epoch": 1.37, + "learning_rate": 1.192348547552154e-06, + "loss": 0.8594, + "step": 53285 + }, + { + "epoch": 1.37, + "learning_rate": 1.1923213937240995e-06, + "loss": 0.5061, + "step": 53286 + }, + { + "epoch": 1.37, + "learning_rate": 1.1922942397487932e-06, + "loss": 0.5928, + "step": 53287 + }, + { + "epoch": 1.37, + "learning_rate": 1.192267085626256e-06, + "loss": 0.6157, + "step": 53288 + }, + { + "epoch": 1.37, + "learning_rate": 1.1922399313565087e-06, + "loss": 0.6411, + "step": 53289 + }, + { + "epoch": 1.37, + "learning_rate": 1.1922127769395723e-06, + "loss": 0.7285, + "step": 53290 + }, + { + "epoch": 1.37, + "learning_rate": 1.192185622375467e-06, + "loss": 0.8135, + "step": 53291 + }, + { + "epoch": 1.37, + "learning_rate": 1.1921584676642144e-06, + "loss": 0.4991, + "step": 53292 + }, + { + "epoch": 1.37, + "learning_rate": 1.1921313128058348e-06, + "loss": 0.7314, + "step": 53293 + }, + { + "epoch": 1.37, + "learning_rate": 1.1921041578003493e-06, + "loss": 0.5481, + "step": 53294 + }, + { + "epoch": 1.37, + "learning_rate": 1.192077002647778e-06, + "loss": 0.6992, + "step": 53295 + }, + { + "epoch": 1.37, + "learning_rate": 1.1920498473481425e-06, + "loss": 0.5115, + "step": 53296 + }, + { + "epoch": 1.37, + "learning_rate": 1.1920226919014633e-06, + "loss": 0.7979, + "step": 53297 + }, + { + "epoch": 1.37, + "learning_rate": 1.1919955363077608e-06, + "loss": 0.5957, + "step": 53298 + }, + { + "epoch": 1.37, + "learning_rate": 1.1919683805670566e-06, + "loss": 0.8184, + "step": 53299 + }, + { + "epoch": 1.37, + "learning_rate": 1.1919412246793706e-06, + "loss": 0.6562, + "step": 53300 + }, + { + "epoch": 1.37, + "learning_rate": 1.1919140686447242e-06, + "loss": 0.6211, + "step": 53301 + }, + { + "epoch": 1.37, + "learning_rate": 1.1918869124631383e-06, + "loss": 0.8662, + "step": 53302 + }, + { + "epoch": 1.37, + "learning_rate": 1.1918597561346332e-06, + "loss": 0.7695, + "step": 53303 + }, + { + "epoch": 1.37, + "learning_rate": 1.1918325996592298e-06, + "loss": 0.791, + "step": 53304 + }, + { + "epoch": 1.37, + "learning_rate": 1.1918054430369492e-06, + "loss": 0.6416, + "step": 53305 + }, + { + "epoch": 1.37, + "learning_rate": 1.1917782862678117e-06, + "loss": 0.5977, + "step": 53306 + }, + { + "epoch": 1.37, + "learning_rate": 1.1917511293518389e-06, + "loss": 0.5016, + "step": 53307 + }, + { + "epoch": 1.37, + "learning_rate": 1.1917239722890507e-06, + "loss": 0.7861, + "step": 53308 + }, + { + "epoch": 1.37, + "learning_rate": 1.1916968150794682e-06, + "loss": 0.7188, + "step": 53309 + }, + { + "epoch": 1.37, + "learning_rate": 1.1916696577231121e-06, + "loss": 0.8291, + "step": 53310 + }, + { + "epoch": 1.37, + "learning_rate": 1.1916425002200038e-06, + "loss": 0.6084, + "step": 53311 + }, + { + "epoch": 1.37, + "learning_rate": 1.1916153425701636e-06, + "loss": 0.7588, + "step": 53312 + }, + { + "epoch": 1.37, + "learning_rate": 1.1915881847736124e-06, + "loss": 0.6875, + "step": 53313 + }, + { + "epoch": 1.37, + "learning_rate": 1.1915610268303706e-06, + "loss": 0.6221, + "step": 53314 + }, + { + "epoch": 1.37, + "learning_rate": 1.1915338687404597e-06, + "loss": 0.5605, + "step": 53315 + }, + { + "epoch": 1.37, + "learning_rate": 1.1915067105038996e-06, + "loss": 0.7109, + "step": 53316 + }, + { + "epoch": 1.37, + "learning_rate": 1.191479552120712e-06, + "loss": 0.5363, + "step": 53317 + }, + { + "epoch": 1.37, + "learning_rate": 1.1914523935909172e-06, + "loss": 0.5724, + "step": 53318 + }, + { + "epoch": 1.37, + "learning_rate": 1.1914252349145362e-06, + "loss": 0.6631, + "step": 53319 + }, + { + "epoch": 1.37, + "learning_rate": 1.1913980760915898e-06, + "loss": 0.665, + "step": 53320 + }, + { + "epoch": 1.37, + "learning_rate": 1.1913709171220985e-06, + "loss": 0.6533, + "step": 53321 + }, + { + "epoch": 1.37, + "learning_rate": 1.1913437580060834e-06, + "loss": 0.5752, + "step": 53322 + }, + { + "epoch": 1.37, + "learning_rate": 1.191316598743565e-06, + "loss": 0.4548, + "step": 53323 + }, + { + "epoch": 1.37, + "learning_rate": 1.1912894393345645e-06, + "loss": 0.4397, + "step": 53324 + }, + { + "epoch": 1.37, + "learning_rate": 1.1912622797791024e-06, + "loss": 0.6812, + "step": 53325 + }, + { + "epoch": 1.37, + "learning_rate": 1.1912351200771995e-06, + "loss": 0.7725, + "step": 53326 + }, + { + "epoch": 1.37, + "learning_rate": 1.1912079602288768e-06, + "loss": 0.6733, + "step": 53327 + }, + { + "epoch": 1.37, + "learning_rate": 1.1911808002341548e-06, + "loss": 0.6826, + "step": 53328 + }, + { + "epoch": 1.37, + "learning_rate": 1.1911536400930545e-06, + "loss": 0.5249, + "step": 53329 + }, + { + "epoch": 1.37, + "learning_rate": 1.1911264798055967e-06, + "loss": 0.6455, + "step": 53330 + }, + { + "epoch": 1.37, + "learning_rate": 1.191099319371802e-06, + "loss": 0.6174, + "step": 53331 + }, + { + "epoch": 1.37, + "learning_rate": 1.1910721587916916e-06, + "loss": 0.6555, + "step": 53332 + }, + { + "epoch": 1.37, + "learning_rate": 1.1910449980652858e-06, + "loss": 0.5996, + "step": 53333 + }, + { + "epoch": 1.37, + "learning_rate": 1.1910178371926059e-06, + "loss": 0.6914, + "step": 53334 + }, + { + "epoch": 1.37, + "learning_rate": 1.1909906761736718e-06, + "loss": 0.4974, + "step": 53335 + }, + { + "epoch": 1.37, + "learning_rate": 1.1909635150085055e-06, + "loss": 0.7676, + "step": 53336 + }, + { + "epoch": 1.37, + "learning_rate": 1.1909363536971271e-06, + "loss": 0.5776, + "step": 53337 + }, + { + "epoch": 1.37, + "learning_rate": 1.1909091922395576e-06, + "loss": 0.7446, + "step": 53338 + }, + { + "epoch": 1.37, + "learning_rate": 1.1908820306358174e-06, + "loss": 0.5693, + "step": 53339 + }, + { + "epoch": 1.37, + "learning_rate": 1.190854868885928e-06, + "loss": 0.6616, + "step": 53340 + }, + { + "epoch": 1.37, + "learning_rate": 1.1908277069899094e-06, + "loss": 0.5298, + "step": 53341 + }, + { + "epoch": 1.37, + "learning_rate": 1.1908005449477832e-06, + "loss": 0.5352, + "step": 53342 + }, + { + "epoch": 1.37, + "learning_rate": 1.1907733827595695e-06, + "loss": 0.7842, + "step": 53343 + }, + { + "epoch": 1.37, + "learning_rate": 1.1907462204252894e-06, + "loss": 0.665, + "step": 53344 + }, + { + "epoch": 1.37, + "learning_rate": 1.1907190579449638e-06, + "loss": 0.6328, + "step": 53345 + }, + { + "epoch": 1.37, + "learning_rate": 1.1906918953186134e-06, + "loss": 0.5237, + "step": 53346 + }, + { + "epoch": 1.37, + "learning_rate": 1.190664732546259e-06, + "loss": 0.5065, + "step": 53347 + }, + { + "epoch": 1.37, + "learning_rate": 1.190637569627921e-06, + "loss": 0.6523, + "step": 53348 + }, + { + "epoch": 1.37, + "learning_rate": 1.1906104065636212e-06, + "loss": 0.6426, + "step": 53349 + }, + { + "epoch": 1.37, + "learning_rate": 1.1905832433533794e-06, + "loss": 0.8516, + "step": 53350 + }, + { + "epoch": 1.37, + "learning_rate": 1.1905560799972173e-06, + "loss": 0.6914, + "step": 53351 + }, + { + "epoch": 1.37, + "learning_rate": 1.1905289164951544e-06, + "loss": 0.4146, + "step": 53352 + }, + { + "epoch": 1.37, + "learning_rate": 1.1905017528472126e-06, + "loss": 0.6782, + "step": 53353 + }, + { + "epoch": 1.37, + "learning_rate": 1.1904745890534123e-06, + "loss": 0.8125, + "step": 53354 + }, + { + "epoch": 1.37, + "learning_rate": 1.1904474251137744e-06, + "loss": 0.6299, + "step": 53355 + }, + { + "epoch": 1.37, + "learning_rate": 1.1904202610283199e-06, + "loss": 0.6602, + "step": 53356 + }, + { + "epoch": 1.37, + "learning_rate": 1.1903930967970692e-06, + "loss": 0.6548, + "step": 53357 + }, + { + "epoch": 1.37, + "learning_rate": 1.190365932420043e-06, + "loss": 0.8623, + "step": 53358 + }, + { + "epoch": 1.37, + "learning_rate": 1.1903387678972628e-06, + "loss": 0.7891, + "step": 53359 + }, + { + "epoch": 1.37, + "learning_rate": 1.1903116032287484e-06, + "loss": 0.6973, + "step": 53360 + }, + { + "epoch": 1.37, + "learning_rate": 1.1902844384145216e-06, + "loss": 0.6188, + "step": 53361 + }, + { + "epoch": 1.37, + "learning_rate": 1.1902572734546028e-06, + "loss": 0.6758, + "step": 53362 + }, + { + "epoch": 1.37, + "learning_rate": 1.1902301083490123e-06, + "loss": 0.6416, + "step": 53363 + }, + { + "epoch": 1.37, + "learning_rate": 1.1902029430977718e-06, + "loss": 0.6631, + "step": 53364 + }, + { + "epoch": 1.37, + "learning_rate": 1.1901757777009015e-06, + "loss": 0.7734, + "step": 53365 + }, + { + "epoch": 1.37, + "learning_rate": 1.1901486121584225e-06, + "loss": 0.688, + "step": 53366 + }, + { + "epoch": 1.37, + "learning_rate": 1.190121446470355e-06, + "loss": 0.6904, + "step": 53367 + }, + { + "epoch": 1.37, + "learning_rate": 1.1900942806367206e-06, + "loss": 0.605, + "step": 53368 + }, + { + "epoch": 1.37, + "learning_rate": 1.1900671146575396e-06, + "loss": 0.6143, + "step": 53369 + }, + { + "epoch": 1.37, + "learning_rate": 1.1900399485328332e-06, + "loss": 0.5825, + "step": 53370 + }, + { + "epoch": 1.37, + "learning_rate": 1.190012782262622e-06, + "loss": 0.5605, + "step": 53371 + }, + { + "epoch": 1.37, + "learning_rate": 1.1899856158469265e-06, + "loss": 0.8369, + "step": 53372 + }, + { + "epoch": 1.37, + "learning_rate": 1.1899584492857677e-06, + "loss": 0.7158, + "step": 53373 + }, + { + "epoch": 1.37, + "learning_rate": 1.1899312825791666e-06, + "loss": 0.6541, + "step": 53374 + }, + { + "epoch": 1.37, + "learning_rate": 1.1899041157271437e-06, + "loss": 0.7188, + "step": 53375 + }, + { + "epoch": 1.37, + "learning_rate": 1.1898769487297202e-06, + "loss": 0.6743, + "step": 53376 + }, + { + "epoch": 1.37, + "learning_rate": 1.1898497815869164e-06, + "loss": 0.6519, + "step": 53377 + }, + { + "epoch": 1.37, + "learning_rate": 1.1898226142987535e-06, + "loss": 0.6426, + "step": 53378 + }, + { + "epoch": 1.37, + "learning_rate": 1.189795446865252e-06, + "loss": 0.7227, + "step": 53379 + }, + { + "epoch": 1.37, + "learning_rate": 1.1897682792864331e-06, + "loss": 0.6211, + "step": 53380 + }, + { + "epoch": 1.37, + "learning_rate": 1.1897411115623172e-06, + "loss": 0.6421, + "step": 53381 + }, + { + "epoch": 1.37, + "learning_rate": 1.1897139436929253e-06, + "loss": 0.7998, + "step": 53382 + }, + { + "epoch": 1.37, + "learning_rate": 1.189686775678278e-06, + "loss": 0.7715, + "step": 53383 + }, + { + "epoch": 1.37, + "learning_rate": 1.1896596075183966e-06, + "loss": 0.6204, + "step": 53384 + }, + { + "epoch": 1.37, + "learning_rate": 1.1896324392133012e-06, + "loss": 0.6125, + "step": 53385 + }, + { + "epoch": 1.37, + "learning_rate": 1.189605270763013e-06, + "loss": 0.4751, + "step": 53386 + }, + { + "epoch": 1.37, + "learning_rate": 1.189578102167553e-06, + "loss": 0.584, + "step": 53387 + }, + { + "epoch": 1.37, + "learning_rate": 1.1895509334269417e-06, + "loss": 0.5186, + "step": 53388 + }, + { + "epoch": 1.37, + "learning_rate": 1.1895237645411999e-06, + "loss": 0.488, + "step": 53389 + }, + { + "epoch": 1.37, + "learning_rate": 1.1894965955103482e-06, + "loss": 0.6299, + "step": 53390 + }, + { + "epoch": 1.37, + "learning_rate": 1.1894694263344082e-06, + "loss": 0.5371, + "step": 53391 + }, + { + "epoch": 1.37, + "learning_rate": 1.1894422570134e-06, + "loss": 0.655, + "step": 53392 + }, + { + "epoch": 1.37, + "learning_rate": 1.1894150875473444e-06, + "loss": 0.6943, + "step": 53393 + }, + { + "epoch": 1.37, + "learning_rate": 1.1893879179362623e-06, + "loss": 0.5054, + "step": 53394 + }, + { + "epoch": 1.37, + "learning_rate": 1.1893607481801748e-06, + "loss": 0.5991, + "step": 53395 + }, + { + "epoch": 1.37, + "learning_rate": 1.1893335782791025e-06, + "loss": 0.729, + "step": 53396 + }, + { + "epoch": 1.37, + "learning_rate": 1.1893064082330661e-06, + "loss": 0.7368, + "step": 53397 + }, + { + "epoch": 1.37, + "learning_rate": 1.1892792380420864e-06, + "loss": 0.5798, + "step": 53398 + }, + { + "epoch": 1.37, + "learning_rate": 1.1892520677061846e-06, + "loss": 0.5894, + "step": 53399 + }, + { + "epoch": 1.37, + "learning_rate": 1.1892248972253808e-06, + "loss": 0.4562, + "step": 53400 + }, + { + "epoch": 1.37, + "learning_rate": 1.1891977265996966e-06, + "loss": 0.4027, + "step": 53401 + }, + { + "epoch": 1.37, + "learning_rate": 1.189170555829152e-06, + "loss": 0.5854, + "step": 53402 + }, + { + "epoch": 1.37, + "learning_rate": 1.1891433849137684e-06, + "loss": 0.5479, + "step": 53403 + }, + { + "epoch": 1.37, + "learning_rate": 1.1891162138535663e-06, + "loss": 0.6367, + "step": 53404 + }, + { + "epoch": 1.37, + "learning_rate": 1.1890890426485668e-06, + "loss": 0.7285, + "step": 53405 + }, + { + "epoch": 1.37, + "learning_rate": 1.1890618712987905e-06, + "loss": 0.6689, + "step": 53406 + }, + { + "epoch": 1.37, + "learning_rate": 1.189034699804258e-06, + "loss": 0.6602, + "step": 53407 + }, + { + "epoch": 1.37, + "learning_rate": 1.1890075281649905e-06, + "loss": 0.4929, + "step": 53408 + }, + { + "epoch": 1.37, + "learning_rate": 1.1889803563810086e-06, + "loss": 0.6406, + "step": 53409 + }, + { + "epoch": 1.37, + "learning_rate": 1.1889531844523331e-06, + "loss": 0.5864, + "step": 53410 + }, + { + "epoch": 1.37, + "learning_rate": 1.1889260123789849e-06, + "loss": 0.7549, + "step": 53411 + }, + { + "epoch": 1.37, + "learning_rate": 1.1888988401609847e-06, + "loss": 0.7065, + "step": 53412 + }, + { + "epoch": 1.37, + "learning_rate": 1.1888716677983533e-06, + "loss": 0.6914, + "step": 53413 + }, + { + "epoch": 1.37, + "learning_rate": 1.1888444952911116e-06, + "loss": 0.7456, + "step": 53414 + }, + { + "epoch": 1.37, + "learning_rate": 1.1888173226392802e-06, + "loss": 0.7197, + "step": 53415 + }, + { + "epoch": 1.37, + "learning_rate": 1.1887901498428805e-06, + "loss": 0.6416, + "step": 53416 + }, + { + "epoch": 1.37, + "learning_rate": 1.1887629769019322e-06, + "loss": 0.728, + "step": 53417 + }, + { + "epoch": 1.37, + "learning_rate": 1.1887358038164573e-06, + "loss": 0.7402, + "step": 53418 + }, + { + "epoch": 1.37, + "learning_rate": 1.1887086305864758e-06, + "loss": 0.5264, + "step": 53419 + }, + { + "epoch": 1.37, + "learning_rate": 1.1886814572120089e-06, + "loss": 0.6926, + "step": 53420 + }, + { + "epoch": 1.37, + "learning_rate": 1.1886542836930773e-06, + "loss": 0.7734, + "step": 53421 + }, + { + "epoch": 1.37, + "learning_rate": 1.1886271100297019e-06, + "loss": 0.6318, + "step": 53422 + }, + { + "epoch": 1.37, + "learning_rate": 1.188599936221903e-06, + "loss": 0.5325, + "step": 53423 + }, + { + "epoch": 1.37, + "learning_rate": 1.188572762269702e-06, + "loss": 0.6172, + "step": 53424 + }, + { + "epoch": 1.37, + "learning_rate": 1.1885455881731197e-06, + "loss": 0.7339, + "step": 53425 + }, + { + "epoch": 1.37, + "learning_rate": 1.1885184139321764e-06, + "loss": 0.7207, + "step": 53426 + }, + { + "epoch": 1.37, + "learning_rate": 1.1884912395468936e-06, + "loss": 0.8271, + "step": 53427 + }, + { + "epoch": 1.37, + "learning_rate": 1.1884640650172915e-06, + "loss": 0.7109, + "step": 53428 + }, + { + "epoch": 1.37, + "learning_rate": 1.188436890343391e-06, + "loss": 0.7119, + "step": 53429 + }, + { + "epoch": 1.37, + "learning_rate": 1.1884097155252133e-06, + "loss": 0.6816, + "step": 53430 + }, + { + "epoch": 1.37, + "learning_rate": 1.188382540562779e-06, + "loss": 0.5928, + "step": 53431 + }, + { + "epoch": 1.37, + "learning_rate": 1.1883553654561085e-06, + "loss": 0.6846, + "step": 53432 + }, + { + "epoch": 1.37, + "learning_rate": 1.188328190205223e-06, + "loss": 0.5356, + "step": 53433 + }, + { + "epoch": 1.37, + "learning_rate": 1.1883010148101434e-06, + "loss": 0.5117, + "step": 53434 + }, + { + "epoch": 1.37, + "learning_rate": 1.1882738392708904e-06, + "loss": 0.6382, + "step": 53435 + }, + { + "epoch": 1.37, + "learning_rate": 1.1882466635874848e-06, + "loss": 0.7344, + "step": 53436 + }, + { + "epoch": 1.37, + "learning_rate": 1.1882194877599473e-06, + "loss": 0.7314, + "step": 53437 + }, + { + "epoch": 1.37, + "learning_rate": 1.188192311788299e-06, + "loss": 0.5762, + "step": 53438 + }, + { + "epoch": 1.37, + "learning_rate": 1.1881651356725602e-06, + "loss": 0.7446, + "step": 53439 + }, + { + "epoch": 1.37, + "learning_rate": 1.1881379594127518e-06, + "loss": 0.5381, + "step": 53440 + }, + { + "epoch": 1.37, + "learning_rate": 1.1881107830088957e-06, + "loss": 0.7051, + "step": 53441 + }, + { + "epoch": 1.37, + "learning_rate": 1.188083606461011e-06, + "loss": 0.6313, + "step": 53442 + }, + { + "epoch": 1.37, + "learning_rate": 1.1880564297691196e-06, + "loss": 0.7939, + "step": 53443 + }, + { + "epoch": 1.37, + "learning_rate": 1.1880292529332422e-06, + "loss": 0.7041, + "step": 53444 + }, + { + "epoch": 1.37, + "learning_rate": 1.188002075953399e-06, + "loss": 0.752, + "step": 53445 + }, + { + "epoch": 1.37, + "learning_rate": 1.1879748988296117e-06, + "loss": 0.4944, + "step": 53446 + }, + { + "epoch": 1.37, + "learning_rate": 1.1879477215619008e-06, + "loss": 0.4282, + "step": 53447 + }, + { + "epoch": 1.37, + "learning_rate": 1.1879205441502862e-06, + "loss": 0.752, + "step": 53448 + }, + { + "epoch": 1.37, + "learning_rate": 1.18789336659479e-06, + "loss": 0.6094, + "step": 53449 + }, + { + "epoch": 1.37, + "learning_rate": 1.1878661888954325e-06, + "loss": 0.6099, + "step": 53450 + }, + { + "epoch": 1.37, + "learning_rate": 1.1878390110522344e-06, + "loss": 0.6335, + "step": 53451 + }, + { + "epoch": 1.37, + "learning_rate": 1.1878118330652168e-06, + "loss": 0.6313, + "step": 53452 + }, + { + "epoch": 1.37, + "learning_rate": 1.1877846549343998e-06, + "loss": 0.603, + "step": 53453 + }, + { + "epoch": 1.37, + "learning_rate": 1.1877574766598052e-06, + "loss": 0.8076, + "step": 53454 + }, + { + "epoch": 1.37, + "learning_rate": 1.1877302982414534e-06, + "loss": 0.6875, + "step": 53455 + }, + { + "epoch": 1.37, + "learning_rate": 1.187703119679365e-06, + "loss": 0.627, + "step": 53456 + }, + { + "epoch": 1.37, + "learning_rate": 1.1876759409735609e-06, + "loss": 0.8369, + "step": 53457 + }, + { + "epoch": 1.37, + "learning_rate": 1.1876487621240619e-06, + "loss": 0.5645, + "step": 53458 + }, + { + "epoch": 1.37, + "learning_rate": 1.187621583130889e-06, + "loss": 0.7598, + "step": 53459 + }, + { + "epoch": 1.37, + "learning_rate": 1.1875944039940628e-06, + "loss": 0.7188, + "step": 53460 + }, + { + "epoch": 1.37, + "learning_rate": 1.187567224713604e-06, + "loss": 0.7622, + "step": 53461 + }, + { + "epoch": 1.37, + "learning_rate": 1.187540045289534e-06, + "loss": 0.6953, + "step": 53462 + }, + { + "epoch": 1.37, + "learning_rate": 1.1875128657218729e-06, + "loss": 0.7764, + "step": 53463 + }, + { + "epoch": 1.37, + "learning_rate": 1.1874856860106421e-06, + "loss": 0.6516, + "step": 53464 + }, + { + "epoch": 1.37, + "learning_rate": 1.187458506155862e-06, + "loss": 0.5728, + "step": 53465 + }, + { + "epoch": 1.37, + "learning_rate": 1.1874313261575536e-06, + "loss": 0.4644, + "step": 53466 + }, + { + "epoch": 1.37, + "learning_rate": 1.1874041460157375e-06, + "loss": 0.6875, + "step": 53467 + }, + { + "epoch": 1.37, + "learning_rate": 1.1873769657304349e-06, + "loss": 0.6592, + "step": 53468 + }, + { + "epoch": 1.37, + "learning_rate": 1.187349785301666e-06, + "loss": 0.7812, + "step": 53469 + }, + { + "epoch": 1.37, + "learning_rate": 1.1873226047294522e-06, + "loss": 0.6357, + "step": 53470 + }, + { + "epoch": 1.37, + "learning_rate": 1.1872954240138142e-06, + "loss": 0.7197, + "step": 53471 + }, + { + "epoch": 1.37, + "learning_rate": 1.1872682431547728e-06, + "loss": 0.4937, + "step": 53472 + }, + { + "epoch": 1.37, + "learning_rate": 1.1872410621523483e-06, + "loss": 0.627, + "step": 53473 + }, + { + "epoch": 1.37, + "learning_rate": 1.187213881006562e-06, + "loss": 0.7051, + "step": 53474 + }, + { + "epoch": 1.37, + "learning_rate": 1.1871866997174348e-06, + "loss": 0.7676, + "step": 53475 + }, + { + "epoch": 1.37, + "learning_rate": 1.1871595182849874e-06, + "loss": 0.7124, + "step": 53476 + }, + { + "epoch": 1.37, + "learning_rate": 1.1871323367092406e-06, + "loss": 0.645, + "step": 53477 + }, + { + "epoch": 1.37, + "learning_rate": 1.1871051549902149e-06, + "loss": 0.6826, + "step": 53478 + }, + { + "epoch": 1.37, + "learning_rate": 1.1870779731279317e-06, + "loss": 0.5151, + "step": 53479 + }, + { + "epoch": 1.37, + "learning_rate": 1.187050791122411e-06, + "loss": 0.6279, + "step": 53480 + }, + { + "epoch": 1.37, + "learning_rate": 1.1870236089736749e-06, + "loss": 0.5801, + "step": 53481 + }, + { + "epoch": 1.37, + "learning_rate": 1.1869964266817427e-06, + "loss": 0.5334, + "step": 53482 + }, + { + "epoch": 1.37, + "learning_rate": 1.1869692442466364e-06, + "loss": 0.6367, + "step": 53483 + }, + { + "epoch": 1.37, + "learning_rate": 1.1869420616683761e-06, + "loss": 0.6152, + "step": 53484 + }, + { + "epoch": 1.37, + "learning_rate": 1.186914878946983e-06, + "loss": 0.677, + "step": 53485 + }, + { + "epoch": 1.37, + "learning_rate": 1.1868876960824776e-06, + "loss": 0.6011, + "step": 53486 + }, + { + "epoch": 1.37, + "learning_rate": 1.186860513074881e-06, + "loss": 0.5103, + "step": 53487 + }, + { + "epoch": 1.37, + "learning_rate": 1.1868333299242138e-06, + "loss": 0.6553, + "step": 53488 + }, + { + "epoch": 1.37, + "learning_rate": 1.186806146630497e-06, + "loss": 0.5991, + "step": 53489 + }, + { + "epoch": 1.37, + "learning_rate": 1.1867789631937512e-06, + "loss": 0.5139, + "step": 53490 + }, + { + "epoch": 1.37, + "learning_rate": 1.1867517796139978e-06, + "loss": 0.6294, + "step": 53491 + }, + { + "epoch": 1.37, + "learning_rate": 1.1867245958912567e-06, + "loss": 0.6938, + "step": 53492 + }, + { + "epoch": 1.37, + "learning_rate": 1.1866974120255492e-06, + "loss": 0.623, + "step": 53493 + }, + { + "epoch": 1.37, + "learning_rate": 1.1866702280168962e-06, + "loss": 0.6621, + "step": 53494 + }, + { + "epoch": 1.37, + "learning_rate": 1.1866430438653182e-06, + "loss": 0.6616, + "step": 53495 + }, + { + "epoch": 1.37, + "learning_rate": 1.1866158595708365e-06, + "loss": 0.6514, + "step": 53496 + }, + { + "epoch": 1.37, + "learning_rate": 1.1865886751334713e-06, + "loss": 0.5767, + "step": 53497 + }, + { + "epoch": 1.37, + "learning_rate": 1.1865614905532439e-06, + "loss": 0.6963, + "step": 53498 + }, + { + "epoch": 1.37, + "learning_rate": 1.186534305830175e-06, + "loss": 0.6604, + "step": 53499 + }, + { + "epoch": 1.37, + "learning_rate": 1.1865071209642852e-06, + "loss": 0.7012, + "step": 53500 + }, + { + "epoch": 1.37, + "learning_rate": 1.1864799359555954e-06, + "loss": 0.4697, + "step": 53501 + }, + { + "epoch": 1.37, + "learning_rate": 1.1864527508041268e-06, + "loss": 0.7607, + "step": 53502 + }, + { + "epoch": 1.37, + "learning_rate": 1.1864255655098995e-06, + "loss": 0.5383, + "step": 53503 + }, + { + "epoch": 1.37, + "learning_rate": 1.186398380072935e-06, + "loss": 0.585, + "step": 53504 + }, + { + "epoch": 1.37, + "learning_rate": 1.1863711944932536e-06, + "loss": 0.7104, + "step": 53505 + }, + { + "epoch": 1.37, + "learning_rate": 1.1863440087708772e-06, + "loss": 0.8164, + "step": 53506 + }, + { + "epoch": 1.37, + "learning_rate": 1.1863168229058249e-06, + "loss": 0.6133, + "step": 53507 + }, + { + "epoch": 1.37, + "learning_rate": 1.1862896368981186e-06, + "loss": 0.6787, + "step": 53508 + }, + { + "epoch": 1.37, + "learning_rate": 1.1862624507477788e-06, + "loss": 0.5513, + "step": 53509 + }, + { + "epoch": 1.37, + "learning_rate": 1.1862352644548264e-06, + "loss": 0.5527, + "step": 53510 + }, + { + "epoch": 1.37, + "learning_rate": 1.1862080780192825e-06, + "loss": 0.6167, + "step": 53511 + }, + { + "epoch": 1.37, + "learning_rate": 1.1861808914411674e-06, + "loss": 0.6709, + "step": 53512 + }, + { + "epoch": 1.37, + "learning_rate": 1.1861537047205018e-06, + "loss": 0.7217, + "step": 53513 + }, + { + "epoch": 1.37, + "learning_rate": 1.1861265178573074e-06, + "loss": 0.7139, + "step": 53514 + }, + { + "epoch": 1.37, + "learning_rate": 1.1860993308516042e-06, + "loss": 0.5151, + "step": 53515 + }, + { + "epoch": 1.37, + "learning_rate": 1.1860721437034137e-06, + "loss": 0.7568, + "step": 53516 + }, + { + "epoch": 1.37, + "learning_rate": 1.186044956412756e-06, + "loss": 0.6299, + "step": 53517 + }, + { + "epoch": 1.37, + "learning_rate": 1.1860177689796525e-06, + "loss": 0.5132, + "step": 53518 + }, + { + "epoch": 1.37, + "learning_rate": 1.1859905814041234e-06, + "loss": 0.5706, + "step": 53519 + }, + { + "epoch": 1.37, + "learning_rate": 1.18596339368619e-06, + "loss": 0.4561, + "step": 53520 + }, + { + "epoch": 1.37, + "learning_rate": 1.185936205825873e-06, + "loss": 0.6709, + "step": 53521 + }, + { + "epoch": 1.37, + "learning_rate": 1.185909017823193e-06, + "loss": 0.6133, + "step": 53522 + }, + { + "epoch": 1.37, + "learning_rate": 1.1858818296781712e-06, + "loss": 0.6265, + "step": 53523 + }, + { + "epoch": 1.37, + "learning_rate": 1.185854641390828e-06, + "loss": 0.5303, + "step": 53524 + }, + { + "epoch": 1.37, + "learning_rate": 1.1858274529611848e-06, + "loss": 0.697, + "step": 53525 + }, + { + "epoch": 1.37, + "learning_rate": 1.1858002643892619e-06, + "loss": 0.6211, + "step": 53526 + }, + { + "epoch": 1.37, + "learning_rate": 1.1857730756750806e-06, + "loss": 0.5532, + "step": 53527 + }, + { + "epoch": 1.37, + "learning_rate": 1.1857458868186609e-06, + "loss": 0.6973, + "step": 53528 + }, + { + "epoch": 1.37, + "learning_rate": 1.1857186978200243e-06, + "loss": 0.6411, + "step": 53529 + }, + { + "epoch": 1.37, + "learning_rate": 1.1856915086791915e-06, + "loss": 0.7578, + "step": 53530 + }, + { + "epoch": 1.37, + "learning_rate": 1.1856643193961833e-06, + "loss": 0.6016, + "step": 53531 + }, + { + "epoch": 1.37, + "learning_rate": 1.1856371299710202e-06, + "loss": 0.5649, + "step": 53532 + }, + { + "epoch": 1.37, + "learning_rate": 1.1856099404037236e-06, + "loss": 0.6816, + "step": 53533 + }, + { + "epoch": 1.37, + "learning_rate": 1.1855827506943138e-06, + "loss": 0.4543, + "step": 53534 + }, + { + "epoch": 1.37, + "learning_rate": 1.1855555608428118e-06, + "loss": 0.7812, + "step": 53535 + }, + { + "epoch": 1.37, + "learning_rate": 1.1855283708492385e-06, + "loss": 0.6729, + "step": 53536 + }, + { + "epoch": 1.37, + "learning_rate": 1.1855011807136148e-06, + "loss": 0.689, + "step": 53537 + }, + { + "epoch": 1.37, + "learning_rate": 1.185473990435961e-06, + "loss": 0.7642, + "step": 53538 + }, + { + "epoch": 1.37, + "learning_rate": 1.1854468000162987e-06, + "loss": 0.5266, + "step": 53539 + }, + { + "epoch": 1.37, + "learning_rate": 1.185419609454648e-06, + "loss": 0.7031, + "step": 53540 + }, + { + "epoch": 1.37, + "learning_rate": 1.1853924187510302e-06, + "loss": 0.7144, + "step": 53541 + }, + { + "epoch": 1.37, + "learning_rate": 1.1853652279054662e-06, + "loss": 0.4802, + "step": 53542 + }, + { + "epoch": 1.37, + "learning_rate": 1.1853380369179762e-06, + "loss": 0.7324, + "step": 53543 + }, + { + "epoch": 1.37, + "learning_rate": 1.1853108457885815e-06, + "loss": 0.4045, + "step": 53544 + }, + { + "epoch": 1.37, + "learning_rate": 1.1852836545173028e-06, + "loss": 0.4648, + "step": 53545 + }, + { + "epoch": 1.37, + "learning_rate": 1.185256463104161e-06, + "loss": 0.5435, + "step": 53546 + }, + { + "epoch": 1.37, + "learning_rate": 1.1852292715491767e-06, + "loss": 0.5502, + "step": 53547 + }, + { + "epoch": 1.37, + "learning_rate": 1.185202079852371e-06, + "loss": 0.6289, + "step": 53548 + }, + { + "epoch": 1.37, + "learning_rate": 1.1851748880137641e-06, + "loss": 0.6826, + "step": 53549 + }, + { + "epoch": 1.37, + "learning_rate": 1.1851476960333779e-06, + "loss": 0.6094, + "step": 53550 + }, + { + "epoch": 1.37, + "learning_rate": 1.1851205039112326e-06, + "loss": 0.5132, + "step": 53551 + }, + { + "epoch": 1.37, + "learning_rate": 1.185093311647349e-06, + "loss": 0.6475, + "step": 53552 + }, + { + "epoch": 1.37, + "learning_rate": 1.1850661192417478e-06, + "loss": 0.6855, + "step": 53553 + }, + { + "epoch": 1.37, + "learning_rate": 1.18503892669445e-06, + "loss": 0.6328, + "step": 53554 + }, + { + "epoch": 1.37, + "learning_rate": 1.1850117340054762e-06, + "loss": 0.3855, + "step": 53555 + }, + { + "epoch": 1.37, + "learning_rate": 1.184984541174848e-06, + "loss": 0.6196, + "step": 53556 + }, + { + "epoch": 1.37, + "learning_rate": 1.1849573482025852e-06, + "loss": 0.5139, + "step": 53557 + }, + { + "epoch": 1.37, + "learning_rate": 1.1849301550887092e-06, + "loss": 0.6216, + "step": 53558 + }, + { + "epoch": 1.37, + "learning_rate": 1.1849029618332404e-06, + "loss": 0.6455, + "step": 53559 + }, + { + "epoch": 1.37, + "learning_rate": 1.1848757684362002e-06, + "loss": 0.7241, + "step": 53560 + }, + { + "epoch": 1.37, + "learning_rate": 1.1848485748976092e-06, + "loss": 0.7178, + "step": 53561 + }, + { + "epoch": 1.37, + "learning_rate": 1.1848213812174878e-06, + "loss": 0.7207, + "step": 53562 + }, + { + "epoch": 1.37, + "learning_rate": 1.1847941873958575e-06, + "loss": 0.6084, + "step": 53563 + }, + { + "epoch": 1.37, + "learning_rate": 1.1847669934327386e-06, + "loss": 0.7441, + "step": 53564 + }, + { + "epoch": 1.37, + "learning_rate": 1.1847397993281521e-06, + "loss": 0.6855, + "step": 53565 + }, + { + "epoch": 1.37, + "learning_rate": 1.184712605082119e-06, + "loss": 0.4775, + "step": 53566 + }, + { + "epoch": 1.37, + "learning_rate": 1.18468541069466e-06, + "loss": 0.7153, + "step": 53567 + }, + { + "epoch": 1.37, + "learning_rate": 1.1846582161657956e-06, + "loss": 0.6699, + "step": 53568 + }, + { + "epoch": 1.37, + "learning_rate": 1.1846310214955471e-06, + "loss": 0.5635, + "step": 53569 + }, + { + "epoch": 1.37, + "learning_rate": 1.1846038266839348e-06, + "loss": 0.5303, + "step": 53570 + }, + { + "epoch": 1.37, + "learning_rate": 1.1845766317309804e-06, + "loss": 0.6641, + "step": 53571 + }, + { + "epoch": 1.37, + "learning_rate": 1.1845494366367037e-06, + "loss": 0.6533, + "step": 53572 + }, + { + "epoch": 1.37, + "learning_rate": 1.1845222414011262e-06, + "loss": 0.5366, + "step": 53573 + }, + { + "epoch": 1.37, + "learning_rate": 1.1844950460242682e-06, + "loss": 0.668, + "step": 53574 + }, + { + "epoch": 1.37, + "learning_rate": 1.1844678505061512e-06, + "loss": 0.6753, + "step": 53575 + }, + { + "epoch": 1.37, + "learning_rate": 1.1844406548467955e-06, + "loss": 0.6758, + "step": 53576 + }, + { + "epoch": 1.37, + "learning_rate": 1.1844134590462222e-06, + "loss": 0.5273, + "step": 53577 + }, + { + "epoch": 1.37, + "learning_rate": 1.1843862631044517e-06, + "loss": 0.6519, + "step": 53578 + }, + { + "epoch": 1.37, + "learning_rate": 1.1843590670215054e-06, + "loss": 0.6802, + "step": 53579 + }, + { + "epoch": 1.37, + "learning_rate": 1.1843318707974036e-06, + "loss": 0.6582, + "step": 53580 + }, + { + "epoch": 1.37, + "learning_rate": 1.184304674432168e-06, + "loss": 0.5564, + "step": 53581 + }, + { + "epoch": 1.37, + "learning_rate": 1.1842774779258178e-06, + "loss": 0.5625, + "step": 53582 + }, + { + "epoch": 1.37, + "learning_rate": 1.1842502812783755e-06, + "loss": 0.6768, + "step": 53583 + }, + { + "epoch": 1.37, + "learning_rate": 1.1842230844898609e-06, + "loss": 0.47, + "step": 53584 + }, + { + "epoch": 1.37, + "learning_rate": 1.1841958875602954e-06, + "loss": 0.5928, + "step": 53585 + }, + { + "epoch": 1.37, + "learning_rate": 1.1841686904896993e-06, + "loss": 0.6514, + "step": 53586 + }, + { + "epoch": 1.37, + "learning_rate": 1.1841414932780937e-06, + "loss": 0.4919, + "step": 53587 + }, + { + "epoch": 1.37, + "learning_rate": 1.1841142959254996e-06, + "loss": 0.7529, + "step": 53588 + }, + { + "epoch": 1.37, + "learning_rate": 1.1840870984319375e-06, + "loss": 0.8643, + "step": 53589 + }, + { + "epoch": 1.37, + "learning_rate": 1.1840599007974286e-06, + "loss": 0.5981, + "step": 53590 + }, + { + "epoch": 1.37, + "learning_rate": 1.1840327030219934e-06, + "loss": 0.6924, + "step": 53591 + }, + { + "epoch": 1.37, + "learning_rate": 1.184005505105653e-06, + "loss": 0.5728, + "step": 53592 + }, + { + "epoch": 1.37, + "learning_rate": 1.1839783070484276e-06, + "loss": 0.6914, + "step": 53593 + }, + { + "epoch": 1.37, + "learning_rate": 1.1839511088503388e-06, + "loss": 0.7246, + "step": 53594 + }, + { + "epoch": 1.37, + "learning_rate": 1.1839239105114069e-06, + "loss": 0.7139, + "step": 53595 + }, + { + "epoch": 1.37, + "learning_rate": 1.1838967120316533e-06, + "loss": 0.6162, + "step": 53596 + }, + { + "epoch": 1.37, + "learning_rate": 1.1838695134110982e-06, + "loss": 0.8418, + "step": 53597 + }, + { + "epoch": 1.37, + "learning_rate": 1.1838423146497628e-06, + "loss": 0.6304, + "step": 53598 + }, + { + "epoch": 1.37, + "learning_rate": 1.1838151157476674e-06, + "loss": 0.7959, + "step": 53599 + }, + { + "epoch": 1.37, + "learning_rate": 1.1837879167048335e-06, + "loss": 0.6562, + "step": 53600 + }, + { + "epoch": 1.37, + "learning_rate": 1.1837607175212818e-06, + "loss": 0.6807, + "step": 53601 + }, + { + "epoch": 1.37, + "learning_rate": 1.1837335181970328e-06, + "loss": 0.6729, + "step": 53602 + }, + { + "epoch": 1.37, + "learning_rate": 1.1837063187321073e-06, + "loss": 0.665, + "step": 53603 + }, + { + "epoch": 1.37, + "learning_rate": 1.1836791191265266e-06, + "loss": 0.6416, + "step": 53604 + }, + { + "epoch": 1.37, + "learning_rate": 1.183651919380311e-06, + "loss": 0.6465, + "step": 53605 + }, + { + "epoch": 1.37, + "learning_rate": 1.1836247194934816e-06, + "loss": 0.4937, + "step": 53606 + }, + { + "epoch": 1.37, + "learning_rate": 1.1835975194660595e-06, + "loss": 0.6113, + "step": 53607 + }, + { + "epoch": 1.37, + "learning_rate": 1.183570319298065e-06, + "loss": 0.6465, + "step": 53608 + }, + { + "epoch": 1.37, + "learning_rate": 1.183543118989519e-06, + "loss": 0.7715, + "step": 53609 + }, + { + "epoch": 1.37, + "learning_rate": 1.183515918540443e-06, + "loss": 0.7471, + "step": 53610 + }, + { + "epoch": 1.37, + "learning_rate": 1.1834887179508568e-06, + "loss": 0.5879, + "step": 53611 + }, + { + "epoch": 1.37, + "learning_rate": 1.1834615172207817e-06, + "loss": 0.7441, + "step": 53612 + }, + { + "epoch": 1.37, + "learning_rate": 1.1834343163502387e-06, + "loss": 0.7412, + "step": 53613 + }, + { + "epoch": 1.37, + "learning_rate": 1.1834071153392484e-06, + "loss": 0.6577, + "step": 53614 + }, + { + "epoch": 1.37, + "learning_rate": 1.183379914187832e-06, + "loss": 0.7754, + "step": 53615 + }, + { + "epoch": 1.37, + "learning_rate": 1.1833527128960098e-06, + "loss": 0.6816, + "step": 53616 + }, + { + "epoch": 1.37, + "learning_rate": 1.183325511463803e-06, + "loss": 0.6816, + "step": 53617 + }, + { + "epoch": 1.37, + "learning_rate": 1.1832983098912318e-06, + "loss": 0.8027, + "step": 53618 + }, + { + "epoch": 1.37, + "learning_rate": 1.1832711081783182e-06, + "loss": 0.6841, + "step": 53619 + }, + { + "epoch": 1.37, + "learning_rate": 1.183243906325082e-06, + "loss": 0.4758, + "step": 53620 + }, + { + "epoch": 1.37, + "learning_rate": 1.1832167043315446e-06, + "loss": 0.3127, + "step": 53621 + }, + { + "epoch": 1.37, + "learning_rate": 1.1831895021977263e-06, + "loss": 0.7861, + "step": 53622 + }, + { + "epoch": 1.37, + "learning_rate": 1.1831622999236484e-06, + "loss": 0.6626, + "step": 53623 + }, + { + "epoch": 1.37, + "learning_rate": 1.1831350975093312e-06, + "loss": 0.5879, + "step": 53624 + }, + { + "epoch": 1.37, + "learning_rate": 1.183107894954796e-06, + "loss": 0.6807, + "step": 53625 + }, + { + "epoch": 1.37, + "learning_rate": 1.1830806922600639e-06, + "loss": 0.467, + "step": 53626 + }, + { + "epoch": 1.37, + "learning_rate": 1.1830534894251552e-06, + "loss": 0.5059, + "step": 53627 + }, + { + "epoch": 1.37, + "learning_rate": 1.1830262864500907e-06, + "loss": 0.6816, + "step": 53628 + }, + { + "epoch": 1.37, + "learning_rate": 1.1829990833348913e-06, + "loss": 0.6116, + "step": 53629 + }, + { + "epoch": 1.37, + "learning_rate": 1.1829718800795781e-06, + "loss": 0.6543, + "step": 53630 + }, + { + "epoch": 1.37, + "learning_rate": 1.1829446766841716e-06, + "loss": 0.6387, + "step": 53631 + }, + { + "epoch": 1.37, + "learning_rate": 1.182917473148693e-06, + "loss": 0.6387, + "step": 53632 + }, + { + "epoch": 1.37, + "learning_rate": 1.1828902694731624e-06, + "loss": 0.5732, + "step": 53633 + }, + { + "epoch": 1.37, + "learning_rate": 1.1828630656576018e-06, + "loss": 0.6748, + "step": 53634 + }, + { + "epoch": 1.37, + "learning_rate": 1.182835861702031e-06, + "loss": 0.73, + "step": 53635 + }, + { + "epoch": 1.37, + "learning_rate": 1.1828086576064712e-06, + "loss": 0.6504, + "step": 53636 + }, + { + "epoch": 1.37, + "learning_rate": 1.1827814533709433e-06, + "loss": 0.6162, + "step": 53637 + }, + { + "epoch": 1.37, + "learning_rate": 1.182754248995468e-06, + "loss": 0.7607, + "step": 53638 + }, + { + "epoch": 1.37, + "learning_rate": 1.182727044480066e-06, + "loss": 0.749, + "step": 53639 + }, + { + "epoch": 1.37, + "learning_rate": 1.1826998398247588e-06, + "loss": 0.6924, + "step": 53640 + }, + { + "epoch": 1.37, + "learning_rate": 1.1826726350295662e-06, + "loss": 0.7207, + "step": 53641 + }, + { + "epoch": 1.37, + "learning_rate": 1.18264543009451e-06, + "loss": 0.5645, + "step": 53642 + }, + { + "epoch": 1.37, + "learning_rate": 1.1826182250196101e-06, + "loss": 0.7363, + "step": 53643 + }, + { + "epoch": 1.37, + "learning_rate": 1.182591019804888e-06, + "loss": 0.7119, + "step": 53644 + }, + { + "epoch": 1.37, + "learning_rate": 1.1825638144503646e-06, + "loss": 0.8232, + "step": 53645 + }, + { + "epoch": 1.37, + "learning_rate": 1.1825366089560604e-06, + "loss": 0.6543, + "step": 53646 + }, + { + "epoch": 1.38, + "learning_rate": 1.1825094033219962e-06, + "loss": 0.5869, + "step": 53647 + }, + { + "epoch": 1.38, + "learning_rate": 1.182482197548193e-06, + "loss": 0.6548, + "step": 53648 + }, + { + "epoch": 1.38, + "learning_rate": 1.1824549916346714e-06, + "loss": 0.6621, + "step": 53649 + }, + { + "epoch": 1.38, + "learning_rate": 1.1824277855814525e-06, + "loss": 0.4805, + "step": 53650 + }, + { + "epoch": 1.38, + "learning_rate": 1.1824005793885573e-06, + "loss": 0.7129, + "step": 53651 + }, + { + "epoch": 1.38, + "learning_rate": 1.182373373056006e-06, + "loss": 0.5029, + "step": 53652 + }, + { + "epoch": 1.38, + "learning_rate": 1.1823461665838199e-06, + "loss": 0.6602, + "step": 53653 + }, + { + "epoch": 1.38, + "learning_rate": 1.1823189599720198e-06, + "loss": 0.6787, + "step": 53654 + }, + { + "epoch": 1.38, + "learning_rate": 1.1822917532206264e-06, + "loss": 0.4357, + "step": 53655 + }, + { + "epoch": 1.38, + "learning_rate": 1.1822645463296606e-06, + "loss": 0.5317, + "step": 53656 + }, + { + "epoch": 1.38, + "learning_rate": 1.1822373392991434e-06, + "loss": 0.5923, + "step": 53657 + }, + { + "epoch": 1.38, + "learning_rate": 1.1822101321290952e-06, + "loss": 0.5654, + "step": 53658 + }, + { + "epoch": 1.38, + "learning_rate": 1.182182924819537e-06, + "loss": 0.563, + "step": 53659 + }, + { + "epoch": 1.38, + "learning_rate": 1.18215571737049e-06, + "loss": 0.6025, + "step": 53660 + }, + { + "epoch": 1.38, + "learning_rate": 1.1821285097819747e-06, + "loss": 0.5225, + "step": 53661 + }, + { + "epoch": 1.38, + "learning_rate": 1.1821013020540118e-06, + "loss": 0.4792, + "step": 53662 + }, + { + "epoch": 1.38, + "learning_rate": 1.1820740941866222e-06, + "loss": 0.5775, + "step": 53663 + }, + { + "epoch": 1.38, + "learning_rate": 1.182046886179827e-06, + "loss": 0.686, + "step": 53664 + }, + { + "epoch": 1.38, + "learning_rate": 1.1820196780336474e-06, + "loss": 0.5542, + "step": 53665 + }, + { + "epoch": 1.38, + "learning_rate": 1.1819924697481029e-06, + "loss": 0.6562, + "step": 53666 + }, + { + "epoch": 1.38, + "learning_rate": 1.1819652613232154e-06, + "loss": 0.7031, + "step": 53667 + }, + { + "epoch": 1.38, + "learning_rate": 1.1819380527590055e-06, + "loss": 0.958, + "step": 53668 + }, + { + "epoch": 1.38, + "learning_rate": 1.1819108440554938e-06, + "loss": 0.4774, + "step": 53669 + }, + { + "epoch": 1.38, + "learning_rate": 1.1818836352127017e-06, + "loss": 0.6836, + "step": 53670 + }, + { + "epoch": 1.38, + "learning_rate": 1.1818564262306496e-06, + "loss": 0.6416, + "step": 53671 + }, + { + "epoch": 1.38, + "learning_rate": 1.1818292171093582e-06, + "loss": 0.6436, + "step": 53672 + }, + { + "epoch": 1.38, + "learning_rate": 1.1818020078488486e-06, + "loss": 0.6211, + "step": 53673 + }, + { + "epoch": 1.38, + "learning_rate": 1.1817747984491415e-06, + "loss": 0.4407, + "step": 53674 + }, + { + "epoch": 1.38, + "learning_rate": 1.181747588910258e-06, + "loss": 0.4749, + "step": 53675 + }, + { + "epoch": 1.38, + "learning_rate": 1.1817203792322185e-06, + "loss": 0.7549, + "step": 53676 + }, + { + "epoch": 1.38, + "learning_rate": 1.1816931694150442e-06, + "loss": 0.6484, + "step": 53677 + }, + { + "epoch": 1.38, + "learning_rate": 1.1816659594587557e-06, + "loss": 0.4785, + "step": 53678 + }, + { + "epoch": 1.38, + "learning_rate": 1.1816387493633739e-06, + "loss": 0.625, + "step": 53679 + }, + { + "epoch": 1.38, + "learning_rate": 1.1816115391289202e-06, + "loss": 0.7461, + "step": 53680 + }, + { + "epoch": 1.38, + "learning_rate": 1.1815843287554142e-06, + "loss": 0.708, + "step": 53681 + }, + { + "epoch": 1.38, + "learning_rate": 1.1815571182428777e-06, + "loss": 0.6875, + "step": 53682 + }, + { + "epoch": 1.38, + "learning_rate": 1.181529907591331e-06, + "loss": 0.6367, + "step": 53683 + }, + { + "epoch": 1.38, + "learning_rate": 1.1815026968007954e-06, + "loss": 0.626, + "step": 53684 + }, + { + "epoch": 1.38, + "learning_rate": 1.181475485871292e-06, + "loss": 0.6113, + "step": 53685 + }, + { + "epoch": 1.38, + "learning_rate": 1.1814482748028405e-06, + "loss": 0.7666, + "step": 53686 + }, + { + "epoch": 1.38, + "learning_rate": 1.1814210635954628e-06, + "loss": 0.6797, + "step": 53687 + }, + { + "epoch": 1.38, + "learning_rate": 1.181393852249179e-06, + "loss": 0.616, + "step": 53688 + }, + { + "epoch": 1.38, + "learning_rate": 1.1813666407640103e-06, + "loss": 0.7324, + "step": 53689 + }, + { + "epoch": 1.38, + "learning_rate": 1.181339429139978e-06, + "loss": 0.8545, + "step": 53690 + }, + { + "epoch": 1.38, + "learning_rate": 1.1813122173771018e-06, + "loss": 0.6904, + "step": 53691 + }, + { + "epoch": 1.38, + "learning_rate": 1.1812850054754035e-06, + "loss": 0.5864, + "step": 53692 + }, + { + "epoch": 1.38, + "learning_rate": 1.1812577934349035e-06, + "loss": 0.6523, + "step": 53693 + }, + { + "epoch": 1.38, + "learning_rate": 1.181230581255623e-06, + "loss": 0.752, + "step": 53694 + }, + { + "epoch": 1.38, + "learning_rate": 1.1812033689375822e-06, + "loss": 0.7441, + "step": 53695 + }, + { + "epoch": 1.38, + "learning_rate": 1.1811761564808023e-06, + "loss": 0.6587, + "step": 53696 + }, + { + "epoch": 1.38, + "learning_rate": 1.1811489438853044e-06, + "loss": 0.5879, + "step": 53697 + }, + { + "epoch": 1.38, + "learning_rate": 1.1811217311511092e-06, + "loss": 0.6621, + "step": 53698 + }, + { + "epoch": 1.38, + "learning_rate": 1.181094518278237e-06, + "loss": 0.7061, + "step": 53699 + }, + { + "epoch": 1.38, + "learning_rate": 1.1810673052667094e-06, + "loss": 0.5662, + "step": 53700 + }, + { + "epoch": 1.38, + "learning_rate": 1.1810400921165468e-06, + "loss": 0.7119, + "step": 53701 + }, + { + "epoch": 1.38, + "learning_rate": 1.18101287882777e-06, + "loss": 0.8184, + "step": 53702 + }, + { + "epoch": 1.38, + "learning_rate": 1.1809856654004003e-06, + "loss": 0.4626, + "step": 53703 + }, + { + "epoch": 1.38, + "learning_rate": 1.1809584518344574e-06, + "loss": 0.6763, + "step": 53704 + }, + { + "epoch": 1.38, + "learning_rate": 1.180931238129964e-06, + "loss": 0.4454, + "step": 53705 + }, + { + "epoch": 1.38, + "learning_rate": 1.1809040242869392e-06, + "loss": 0.7334, + "step": 53706 + }, + { + "epoch": 1.38, + "learning_rate": 1.1808768103054047e-06, + "loss": 0.5903, + "step": 53707 + }, + { + "epoch": 1.38, + "learning_rate": 1.1808495961853811e-06, + "loss": 0.5859, + "step": 53708 + }, + { + "epoch": 1.38, + "learning_rate": 1.1808223819268893e-06, + "loss": 0.6724, + "step": 53709 + }, + { + "epoch": 1.38, + "learning_rate": 1.1807951675299501e-06, + "loss": 0.6191, + "step": 53710 + }, + { + "epoch": 1.38, + "learning_rate": 1.1807679529945844e-06, + "loss": 0.7715, + "step": 53711 + }, + { + "epoch": 1.38, + "learning_rate": 1.180740738320813e-06, + "loss": 0.7266, + "step": 53712 + }, + { + "epoch": 1.38, + "learning_rate": 1.1807135235086566e-06, + "loss": 0.4241, + "step": 53713 + }, + { + "epoch": 1.38, + "learning_rate": 1.1806863085581361e-06, + "loss": 0.707, + "step": 53714 + }, + { + "epoch": 1.38, + "learning_rate": 1.180659093469273e-06, + "loss": 0.4907, + "step": 53715 + }, + { + "epoch": 1.38, + "learning_rate": 1.1806318782420867e-06, + "loss": 0.7266, + "step": 53716 + }, + { + "epoch": 1.38, + "learning_rate": 1.1806046628765996e-06, + "loss": 0.4781, + "step": 53717 + }, + { + "epoch": 1.38, + "learning_rate": 1.180577447372831e-06, + "loss": 0.7842, + "step": 53718 + }, + { + "epoch": 1.38, + "learning_rate": 1.1805502317308035e-06, + "loss": 0.6519, + "step": 53719 + }, + { + "epoch": 1.38, + "learning_rate": 1.1805230159505365e-06, + "loss": 0.603, + "step": 53720 + }, + { + "epoch": 1.38, + "learning_rate": 1.180495800032051e-06, + "loss": 0.5337, + "step": 53721 + }, + { + "epoch": 1.38, + "learning_rate": 1.1804685839753688e-06, + "loss": 0.6455, + "step": 53722 + }, + { + "epoch": 1.38, + "learning_rate": 1.1804413677805097e-06, + "loss": 0.5385, + "step": 53723 + }, + { + "epoch": 1.38, + "learning_rate": 1.180414151447495e-06, + "loss": 0.5439, + "step": 53724 + }, + { + "epoch": 1.38, + "learning_rate": 1.1803869349763456e-06, + "loss": 0.7559, + "step": 53725 + }, + { + "epoch": 1.38, + "learning_rate": 1.1803597183670822e-06, + "loss": 0.6553, + "step": 53726 + }, + { + "epoch": 1.38, + "learning_rate": 1.1803325016197255e-06, + "loss": 0.5923, + "step": 53727 + }, + { + "epoch": 1.38, + "learning_rate": 1.1803052847342967e-06, + "loss": 0.6248, + "step": 53728 + }, + { + "epoch": 1.38, + "learning_rate": 1.1802780677108162e-06, + "loss": 0.5596, + "step": 53729 + }, + { + "epoch": 1.38, + "learning_rate": 1.1802508505493055e-06, + "loss": 0.752, + "step": 53730 + }, + { + "epoch": 1.38, + "learning_rate": 1.1802236332497843e-06, + "loss": 0.6924, + "step": 53731 + }, + { + "epoch": 1.38, + "learning_rate": 1.180196415812275e-06, + "loss": 0.7554, + "step": 53732 + }, + { + "epoch": 1.38, + "learning_rate": 1.180169198236797e-06, + "loss": 0.7197, + "step": 53733 + }, + { + "epoch": 1.38, + "learning_rate": 1.1801419805233719e-06, + "loss": 0.791, + "step": 53734 + }, + { + "epoch": 1.38, + "learning_rate": 1.1801147626720202e-06, + "loss": 0.6201, + "step": 53735 + }, + { + "epoch": 1.38, + "learning_rate": 1.1800875446827633e-06, + "loss": 0.6104, + "step": 53736 + }, + { + "epoch": 1.38, + "learning_rate": 1.1800603265556212e-06, + "loss": 0.6963, + "step": 53737 + }, + { + "epoch": 1.38, + "learning_rate": 1.1800331082906155e-06, + "loss": 0.5679, + "step": 53738 + }, + { + "epoch": 1.38, + "learning_rate": 1.1800058898877666e-06, + "loss": 0.8389, + "step": 53739 + }, + { + "epoch": 1.38, + "learning_rate": 1.1799786713470954e-06, + "loss": 0.5587, + "step": 53740 + }, + { + "epoch": 1.38, + "learning_rate": 1.179951452668623e-06, + "loss": 0.6875, + "step": 53741 + }, + { + "epoch": 1.38, + "learning_rate": 1.1799242338523697e-06, + "loss": 0.3728, + "step": 53742 + }, + { + "epoch": 1.38, + "learning_rate": 1.179897014898357e-06, + "loss": 0.5115, + "step": 53743 + }, + { + "epoch": 1.38, + "learning_rate": 1.1798697958066055e-06, + "loss": 0.5967, + "step": 53744 + }, + { + "epoch": 1.38, + "learning_rate": 1.179842576577136e-06, + "loss": 0.5273, + "step": 53745 + }, + { + "epoch": 1.38, + "learning_rate": 1.179815357209969e-06, + "loss": 0.5099, + "step": 53746 + }, + { + "epoch": 1.38, + "learning_rate": 1.1797881377051259e-06, + "loss": 0.6084, + "step": 53747 + }, + { + "epoch": 1.38, + "learning_rate": 1.179760918062627e-06, + "loss": 0.7256, + "step": 53748 + }, + { + "epoch": 1.38, + "learning_rate": 1.1797336982824937e-06, + "loss": 0.5952, + "step": 53749 + }, + { + "epoch": 1.38, + "learning_rate": 1.1797064783647465e-06, + "loss": 0.6646, + "step": 53750 + }, + { + "epoch": 1.38, + "learning_rate": 1.1796792583094064e-06, + "loss": 0.6699, + "step": 53751 + }, + { + "epoch": 1.38, + "learning_rate": 1.1796520381164941e-06, + "loss": 0.4773, + "step": 53752 + }, + { + "epoch": 1.38, + "learning_rate": 1.1796248177860303e-06, + "loss": 0.75, + "step": 53753 + }, + { + "epoch": 1.38, + "learning_rate": 1.179597597318036e-06, + "loss": 0.5942, + "step": 53754 + }, + { + "epoch": 1.38, + "learning_rate": 1.1795703767125326e-06, + "loss": 0.6128, + "step": 53755 + }, + { + "epoch": 1.38, + "learning_rate": 1.1795431559695402e-06, + "loss": 0.6274, + "step": 53756 + }, + { + "epoch": 1.38, + "learning_rate": 1.1795159350890795e-06, + "loss": 0.6455, + "step": 53757 + }, + { + "epoch": 1.38, + "learning_rate": 1.179488714071172e-06, + "loss": 0.7168, + "step": 53758 + }, + { + "epoch": 1.38, + "learning_rate": 1.1794614929158382e-06, + "loss": 0.6826, + "step": 53759 + }, + { + "epoch": 1.38, + "learning_rate": 1.179434271623099e-06, + "loss": 0.5723, + "step": 53760 + }, + { + "epoch": 1.38, + "learning_rate": 1.1794070501929753e-06, + "loss": 0.5254, + "step": 53761 + }, + { + "epoch": 1.38, + "learning_rate": 1.1793798286254876e-06, + "loss": 0.6904, + "step": 53762 + }, + { + "epoch": 1.38, + "learning_rate": 1.1793526069206574e-06, + "loss": 0.6494, + "step": 53763 + }, + { + "epoch": 1.38, + "learning_rate": 1.1793253850785049e-06, + "loss": 0.6387, + "step": 53764 + }, + { + "epoch": 1.38, + "learning_rate": 1.179298163099051e-06, + "loss": 0.6981, + "step": 53765 + }, + { + "epoch": 1.38, + "learning_rate": 1.1792709409823172e-06, + "loss": 0.7734, + "step": 53766 + }, + { + "epoch": 1.38, + "learning_rate": 1.1792437187283235e-06, + "loss": 0.6152, + "step": 53767 + }, + { + "epoch": 1.38, + "learning_rate": 1.1792164963370914e-06, + "loss": 0.7344, + "step": 53768 + }, + { + "epoch": 1.38, + "learning_rate": 1.179189273808641e-06, + "loss": 0.8438, + "step": 53769 + }, + { + "epoch": 1.38, + "learning_rate": 1.1791620511429946e-06, + "loss": 0.6914, + "step": 53770 + }, + { + "epoch": 1.38, + "learning_rate": 1.1791348283401712e-06, + "loss": 0.5027, + "step": 53771 + }, + { + "epoch": 1.38, + "learning_rate": 1.1791076054001928e-06, + "loss": 0.707, + "step": 53772 + }, + { + "epoch": 1.38, + "learning_rate": 1.1790803823230798e-06, + "loss": 0.7539, + "step": 53773 + }, + { + "epoch": 1.38, + "learning_rate": 1.1790531591088534e-06, + "loss": 0.876, + "step": 53774 + }, + { + "epoch": 1.38, + "learning_rate": 1.1790259357575338e-06, + "loss": 0.6738, + "step": 53775 + }, + { + "epoch": 1.38, + "learning_rate": 1.1789987122691426e-06, + "loss": 0.7061, + "step": 53776 + }, + { + "epoch": 1.38, + "learning_rate": 1.1789714886437003e-06, + "loss": 0.7803, + "step": 53777 + }, + { + "epoch": 1.38, + "learning_rate": 1.1789442648812278e-06, + "loss": 0.7607, + "step": 53778 + }, + { + "epoch": 1.38, + "learning_rate": 1.1789170409817457e-06, + "loss": 0.562, + "step": 53779 + }, + { + "epoch": 1.38, + "learning_rate": 1.1788898169452754e-06, + "loss": 0.6865, + "step": 53780 + }, + { + "epoch": 1.38, + "learning_rate": 1.1788625927718373e-06, + "loss": 0.584, + "step": 53781 + }, + { + "epoch": 1.38, + "learning_rate": 1.1788353684614521e-06, + "loss": 0.5649, + "step": 53782 + }, + { + "epoch": 1.38, + "learning_rate": 1.178808144014141e-06, + "loss": 0.7119, + "step": 53783 + }, + { + "epoch": 1.38, + "learning_rate": 1.1787809194299247e-06, + "loss": 0.6445, + "step": 53784 + }, + { + "epoch": 1.38, + "learning_rate": 1.178753694708824e-06, + "loss": 0.7266, + "step": 53785 + }, + { + "epoch": 1.38, + "learning_rate": 1.1787264698508599e-06, + "loss": 0.6289, + "step": 53786 + }, + { + "epoch": 1.38, + "learning_rate": 1.1786992448560533e-06, + "loss": 0.6855, + "step": 53787 + }, + { + "epoch": 1.38, + "learning_rate": 1.1786720197244248e-06, + "loss": 0.6919, + "step": 53788 + }, + { + "epoch": 1.38, + "learning_rate": 1.1786447944559952e-06, + "loss": 0.4189, + "step": 53789 + }, + { + "epoch": 1.38, + "learning_rate": 1.1786175690507855e-06, + "loss": 0.6184, + "step": 53790 + }, + { + "epoch": 1.38, + "learning_rate": 1.178590343508817e-06, + "loss": 0.5757, + "step": 53791 + }, + { + "epoch": 1.38, + "learning_rate": 1.1785631178301096e-06, + "loss": 0.6434, + "step": 53792 + }, + { + "epoch": 1.38, + "learning_rate": 1.1785358920146848e-06, + "loss": 0.645, + "step": 53793 + }, + { + "epoch": 1.38, + "learning_rate": 1.1785086660625632e-06, + "loss": 0.7207, + "step": 53794 + }, + { + "epoch": 1.38, + "learning_rate": 1.178481439973766e-06, + "loss": 0.5784, + "step": 53795 + }, + { + "epoch": 1.38, + "learning_rate": 1.1784542137483134e-06, + "loss": 0.4985, + "step": 53796 + }, + { + "epoch": 1.38, + "learning_rate": 1.1784269873862267e-06, + "loss": 0.644, + "step": 53797 + }, + { + "epoch": 1.38, + "learning_rate": 1.1783997608875266e-06, + "loss": 0.668, + "step": 53798 + }, + { + "epoch": 1.38, + "learning_rate": 1.1783725342522345e-06, + "loss": 0.5288, + "step": 53799 + }, + { + "epoch": 1.38, + "learning_rate": 1.17834530748037e-06, + "loss": 0.6763, + "step": 53800 + }, + { + "epoch": 1.38, + "learning_rate": 1.1783180805719553e-06, + "loss": 0.8047, + "step": 53801 + }, + { + "epoch": 1.38, + "learning_rate": 1.1782908535270103e-06, + "loss": 0.5503, + "step": 53802 + }, + { + "epoch": 1.38, + "learning_rate": 1.1782636263455566e-06, + "loss": 0.6514, + "step": 53803 + }, + { + "epoch": 1.38, + "learning_rate": 1.1782363990276141e-06, + "loss": 0.5859, + "step": 53804 + }, + { + "epoch": 1.38, + "learning_rate": 1.1782091715732047e-06, + "loss": 0.6689, + "step": 53805 + }, + { + "epoch": 1.38, + "learning_rate": 1.1781819439823484e-06, + "loss": 0.6553, + "step": 53806 + }, + { + "epoch": 1.38, + "learning_rate": 1.1781547162550665e-06, + "loss": 0.5757, + "step": 53807 + }, + { + "epoch": 1.38, + "learning_rate": 1.1781274883913794e-06, + "loss": 0.6226, + "step": 53808 + }, + { + "epoch": 1.38, + "learning_rate": 1.1781002603913086e-06, + "loss": 0.8848, + "step": 53809 + }, + { + "epoch": 1.38, + "learning_rate": 1.1780730322548745e-06, + "loss": 0.5232, + "step": 53810 + }, + { + "epoch": 1.38, + "learning_rate": 1.178045803982098e-06, + "loss": 0.4868, + "step": 53811 + }, + { + "epoch": 1.38, + "learning_rate": 1.1780185755730003e-06, + "loss": 0.668, + "step": 53812 + }, + { + "epoch": 1.38, + "learning_rate": 1.1779913470276017e-06, + "loss": 0.6816, + "step": 53813 + }, + { + "epoch": 1.38, + "learning_rate": 1.1779641183459234e-06, + "loss": 0.7544, + "step": 53814 + }, + { + "epoch": 1.38, + "learning_rate": 1.1779368895279864e-06, + "loss": 0.6709, + "step": 53815 + }, + { + "epoch": 1.38, + "learning_rate": 1.1779096605738113e-06, + "loss": 0.6475, + "step": 53816 + }, + { + "epoch": 1.38, + "learning_rate": 1.1778824314834185e-06, + "loss": 0.8711, + "step": 53817 + }, + { + "epoch": 1.38, + "learning_rate": 1.1778552022568296e-06, + "loss": 0.7744, + "step": 53818 + }, + { + "epoch": 1.38, + "learning_rate": 1.177827972894065e-06, + "loss": 0.7686, + "step": 53819 + }, + { + "epoch": 1.38, + "learning_rate": 1.177800743395146e-06, + "loss": 0.6396, + "step": 53820 + }, + { + "epoch": 1.38, + "learning_rate": 1.1777735137600928e-06, + "loss": 0.7188, + "step": 53821 + }, + { + "epoch": 1.38, + "learning_rate": 1.1777462839889267e-06, + "loss": 0.6914, + "step": 53822 + }, + { + "epoch": 1.38, + "learning_rate": 1.1777190540816684e-06, + "loss": 0.6943, + "step": 53823 + }, + { + "epoch": 1.38, + "learning_rate": 1.177691824038339e-06, + "loss": 0.3308, + "step": 53824 + }, + { + "epoch": 1.38, + "learning_rate": 1.1776645938589591e-06, + "loss": 0.6025, + "step": 53825 + }, + { + "epoch": 1.38, + "learning_rate": 1.1776373635435494e-06, + "loss": 0.6182, + "step": 53826 + }, + { + "epoch": 1.38, + "learning_rate": 1.1776101330921311e-06, + "loss": 0.77, + "step": 53827 + }, + { + "epoch": 1.38, + "learning_rate": 1.1775829025047249e-06, + "loss": 0.709, + "step": 53828 + }, + { + "epoch": 1.38, + "learning_rate": 1.1775556717813512e-06, + "loss": 0.6816, + "step": 53829 + }, + { + "epoch": 1.38, + "learning_rate": 1.1775284409220318e-06, + "loss": 0.646, + "step": 53830 + }, + { + "epoch": 1.38, + "learning_rate": 1.177501209926787e-06, + "loss": 0.5459, + "step": 53831 + }, + { + "epoch": 1.38, + "learning_rate": 1.1774739787956373e-06, + "loss": 0.7847, + "step": 53832 + }, + { + "epoch": 1.38, + "learning_rate": 1.1774467475286043e-06, + "loss": 0.6963, + "step": 53833 + }, + { + "epoch": 1.38, + "learning_rate": 1.1774195161257086e-06, + "loss": 0.6279, + "step": 53834 + }, + { + "epoch": 1.38, + "learning_rate": 1.1773922845869707e-06, + "loss": 0.6318, + "step": 53835 + }, + { + "epoch": 1.38, + "learning_rate": 1.1773650529124114e-06, + "loss": 0.5503, + "step": 53836 + }, + { + "epoch": 1.38, + "learning_rate": 1.1773378211020525e-06, + "loss": 0.7275, + "step": 53837 + }, + { + "epoch": 1.38, + "learning_rate": 1.1773105891559137e-06, + "loss": 0.4917, + "step": 53838 + }, + { + "epoch": 1.38, + "learning_rate": 1.1772833570740163e-06, + "loss": 0.6953, + "step": 53839 + }, + { + "epoch": 1.38, + "learning_rate": 1.1772561248563815e-06, + "loss": 0.5109, + "step": 53840 + }, + { + "epoch": 1.38, + "learning_rate": 1.1772288925030295e-06, + "loss": 0.6367, + "step": 53841 + }, + { + "epoch": 1.38, + "learning_rate": 1.1772016600139818e-06, + "loss": 0.7617, + "step": 53842 + }, + { + "epoch": 1.38, + "learning_rate": 1.1771744273892587e-06, + "loss": 0.7471, + "step": 53843 + }, + { + "epoch": 1.38, + "learning_rate": 1.1771471946288813e-06, + "loss": 0.584, + "step": 53844 + }, + { + "epoch": 1.38, + "learning_rate": 1.177119961732871e-06, + "loss": 0.7207, + "step": 53845 + }, + { + "epoch": 1.38, + "learning_rate": 1.1770927287012474e-06, + "loss": 0.7705, + "step": 53846 + }, + { + "epoch": 1.38, + "learning_rate": 1.1770654955340323e-06, + "loss": 0.7686, + "step": 53847 + }, + { + "epoch": 1.38, + "learning_rate": 1.177038262231246e-06, + "loss": 0.625, + "step": 53848 + }, + { + "epoch": 1.38, + "learning_rate": 1.17701102879291e-06, + "loss": 0.7383, + "step": 53849 + }, + { + "epoch": 1.38, + "learning_rate": 1.1769837952190447e-06, + "loss": 0.5864, + "step": 53850 + }, + { + "epoch": 1.38, + "learning_rate": 1.1769565615096714e-06, + "loss": 0.4856, + "step": 53851 + }, + { + "epoch": 1.38, + "learning_rate": 1.1769293276648098e-06, + "loss": 0.5825, + "step": 53852 + }, + { + "epoch": 1.38, + "learning_rate": 1.176902093684482e-06, + "loss": 0.752, + "step": 53853 + }, + { + "epoch": 1.38, + "learning_rate": 1.1768748595687084e-06, + "loss": 0.7754, + "step": 53854 + }, + { + "epoch": 1.38, + "learning_rate": 1.1768476253175098e-06, + "loss": 0.6389, + "step": 53855 + }, + { + "epoch": 1.38, + "learning_rate": 1.1768203909309074e-06, + "loss": 0.6318, + "step": 53856 + }, + { + "epoch": 1.38, + "learning_rate": 1.1767931564089213e-06, + "loss": 0.5461, + "step": 53857 + }, + { + "epoch": 1.38, + "learning_rate": 1.176765921751573e-06, + "loss": 0.7666, + "step": 53858 + }, + { + "epoch": 1.38, + "learning_rate": 1.1767386869588828e-06, + "loss": 0.6118, + "step": 53859 + }, + { + "epoch": 1.38, + "learning_rate": 1.1767114520308728e-06, + "loss": 0.7158, + "step": 53860 + }, + { + "epoch": 1.38, + "learning_rate": 1.1766842169675624e-06, + "loss": 0.3524, + "step": 53861 + }, + { + "epoch": 1.38, + "learning_rate": 1.1766569817689732e-06, + "loss": 0.5938, + "step": 53862 + }, + { + "epoch": 1.38, + "learning_rate": 1.1766297464351253e-06, + "loss": 0.5107, + "step": 53863 + }, + { + "epoch": 1.38, + "learning_rate": 1.1766025109660407e-06, + "loss": 0.5176, + "step": 53864 + }, + { + "epoch": 1.38, + "learning_rate": 1.1765752753617397e-06, + "loss": 0.6748, + "step": 53865 + }, + { + "epoch": 1.38, + "learning_rate": 1.1765480396222429e-06, + "loss": 0.6924, + "step": 53866 + }, + { + "epoch": 1.38, + "learning_rate": 1.1765208037475714e-06, + "loss": 0.5923, + "step": 53867 + }, + { + "epoch": 1.38, + "learning_rate": 1.1764935677377462e-06, + "loss": 0.6626, + "step": 53868 + }, + { + "epoch": 1.38, + "learning_rate": 1.1764663315927876e-06, + "loss": 0.749, + "step": 53869 + }, + { + "epoch": 1.38, + "learning_rate": 1.1764390953127175e-06, + "loss": 0.5757, + "step": 53870 + }, + { + "epoch": 1.38, + "learning_rate": 1.1764118588975556e-06, + "loss": 0.5278, + "step": 53871 + }, + { + "epoch": 1.38, + "learning_rate": 1.1763846223473235e-06, + "loss": 0.7607, + "step": 53872 + }, + { + "epoch": 1.38, + "learning_rate": 1.1763573856620416e-06, + "loss": 0.8105, + "step": 53873 + }, + { + "epoch": 1.38, + "learning_rate": 1.176330148841731e-06, + "loss": 0.4636, + "step": 53874 + }, + { + "epoch": 1.38, + "learning_rate": 1.1763029118864127e-06, + "loss": 0.5596, + "step": 53875 + }, + { + "epoch": 1.38, + "learning_rate": 1.176275674796107e-06, + "loss": 0.7163, + "step": 53876 + }, + { + "epoch": 1.38, + "learning_rate": 1.1762484375708355e-06, + "loss": 0.5588, + "step": 53877 + }, + { + "epoch": 1.38, + "learning_rate": 1.1762212002106184e-06, + "loss": 0.6807, + "step": 53878 + }, + { + "epoch": 1.38, + "learning_rate": 1.1761939627154768e-06, + "loss": 0.6016, + "step": 53879 + }, + { + "epoch": 1.38, + "learning_rate": 1.176166725085432e-06, + "loss": 0.6885, + "step": 53880 + }, + { + "epoch": 1.38, + "learning_rate": 1.1761394873205042e-06, + "loss": 0.5732, + "step": 53881 + }, + { + "epoch": 1.38, + "learning_rate": 1.1761122494207144e-06, + "loss": 0.5923, + "step": 53882 + }, + { + "epoch": 1.38, + "learning_rate": 1.1760850113860835e-06, + "loss": 0.6577, + "step": 53883 + }, + { + "epoch": 1.38, + "learning_rate": 1.1760577732166324e-06, + "loss": 0.6455, + "step": 53884 + }, + { + "epoch": 1.38, + "learning_rate": 1.1760305349123822e-06, + "loss": 0.71, + "step": 53885 + }, + { + "epoch": 1.38, + "learning_rate": 1.1760032964733535e-06, + "loss": 0.7998, + "step": 53886 + }, + { + "epoch": 1.38, + "learning_rate": 1.175976057899567e-06, + "loss": 0.4808, + "step": 53887 + }, + { + "epoch": 1.38, + "learning_rate": 1.1759488191910436e-06, + "loss": 0.5879, + "step": 53888 + }, + { + "epoch": 1.38, + "learning_rate": 1.1759215803478046e-06, + "loss": 0.5889, + "step": 53889 + }, + { + "epoch": 1.38, + "learning_rate": 1.1758943413698704e-06, + "loss": 0.6372, + "step": 53890 + }, + { + "epoch": 1.38, + "learning_rate": 1.1758671022572623e-06, + "loss": 0.6787, + "step": 53891 + }, + { + "epoch": 1.38, + "learning_rate": 1.1758398630100002e-06, + "loss": 0.7168, + "step": 53892 + }, + { + "epoch": 1.38, + "learning_rate": 1.175812623628106e-06, + "loss": 0.9678, + "step": 53893 + }, + { + "epoch": 1.38, + "learning_rate": 1.1757853841116e-06, + "loss": 0.7148, + "step": 53894 + }, + { + "epoch": 1.38, + "learning_rate": 1.1757581444605037e-06, + "loss": 0.6177, + "step": 53895 + }, + { + "epoch": 1.38, + "learning_rate": 1.1757309046748368e-06, + "loss": 0.6963, + "step": 53896 + }, + { + "epoch": 1.38, + "learning_rate": 1.1757036647546212e-06, + "loss": 0.6431, + "step": 53897 + }, + { + "epoch": 1.38, + "learning_rate": 1.1756764246998771e-06, + "loss": 0.6689, + "step": 53898 + }, + { + "epoch": 1.38, + "learning_rate": 1.1756491845106257e-06, + "loss": 0.567, + "step": 53899 + }, + { + "epoch": 1.38, + "learning_rate": 1.1756219441868883e-06, + "loss": 0.6304, + "step": 53900 + }, + { + "epoch": 1.38, + "learning_rate": 1.1755947037286846e-06, + "loss": 0.5781, + "step": 53901 + }, + { + "epoch": 1.38, + "learning_rate": 1.1755674631360363e-06, + "loss": 0.5332, + "step": 53902 + }, + { + "epoch": 1.38, + "learning_rate": 1.175540222408964e-06, + "loss": 0.4915, + "step": 53903 + }, + { + "epoch": 1.38, + "learning_rate": 1.1755129815474888e-06, + "loss": 0.6396, + "step": 53904 + }, + { + "epoch": 1.38, + "learning_rate": 1.1754857405516316e-06, + "loss": 0.4846, + "step": 53905 + }, + { + "epoch": 1.38, + "learning_rate": 1.175458499421413e-06, + "loss": 0.5564, + "step": 53906 + }, + { + "epoch": 1.38, + "learning_rate": 1.1754312581568535e-06, + "loss": 0.7236, + "step": 53907 + }, + { + "epoch": 1.38, + "learning_rate": 1.1754040167579746e-06, + "loss": 0.6768, + "step": 53908 + }, + { + "epoch": 1.38, + "learning_rate": 1.1753767752247968e-06, + "loss": 0.7915, + "step": 53909 + }, + { + "epoch": 1.38, + "learning_rate": 1.1753495335573413e-06, + "loss": 0.7271, + "step": 53910 + }, + { + "epoch": 1.38, + "learning_rate": 1.1753222917556284e-06, + "loss": 0.6929, + "step": 53911 + }, + { + "epoch": 1.38, + "learning_rate": 1.1752950498196794e-06, + "loss": 0.7412, + "step": 53912 + }, + { + "epoch": 1.38, + "learning_rate": 1.175267807749515e-06, + "loss": 0.6543, + "step": 53913 + }, + { + "epoch": 1.38, + "learning_rate": 1.1752405655451562e-06, + "loss": 0.6279, + "step": 53914 + }, + { + "epoch": 1.38, + "learning_rate": 1.1752133232066237e-06, + "loss": 0.7285, + "step": 53915 + }, + { + "epoch": 1.38, + "learning_rate": 1.1751860807339387e-06, + "loss": 0.5645, + "step": 53916 + }, + { + "epoch": 1.38, + "learning_rate": 1.1751588381271212e-06, + "loss": 0.5728, + "step": 53917 + }, + { + "epoch": 1.38, + "learning_rate": 1.1751315953861932e-06, + "loss": 0.4258, + "step": 53918 + }, + { + "epoch": 1.38, + "learning_rate": 1.1751043525111743e-06, + "loss": 0.751, + "step": 53919 + }, + { + "epoch": 1.38, + "learning_rate": 1.1750771095020867e-06, + "loss": 0.6089, + "step": 53920 + }, + { + "epoch": 1.38, + "learning_rate": 1.1750498663589506e-06, + "loss": 0.7051, + "step": 53921 + }, + { + "epoch": 1.38, + "learning_rate": 1.1750226230817863e-06, + "loss": 0.708, + "step": 53922 + }, + { + "epoch": 1.38, + "learning_rate": 1.1749953796706157e-06, + "loss": 0.4186, + "step": 53923 + }, + { + "epoch": 1.38, + "learning_rate": 1.1749681361254591e-06, + "loss": 0.6211, + "step": 53924 + }, + { + "epoch": 1.38, + "learning_rate": 1.1749408924463375e-06, + "loss": 0.5498, + "step": 53925 + }, + { + "epoch": 1.38, + "learning_rate": 1.1749136486332716e-06, + "loss": 0.4297, + "step": 53926 + }, + { + "epoch": 1.38, + "learning_rate": 1.1748864046862824e-06, + "loss": 0.4937, + "step": 53927 + }, + { + "epoch": 1.38, + "learning_rate": 1.1748591606053904e-06, + "loss": 0.6899, + "step": 53928 + }, + { + "epoch": 1.38, + "learning_rate": 1.1748319163906172e-06, + "loss": 0.8223, + "step": 53929 + }, + { + "epoch": 1.38, + "learning_rate": 1.1748046720419832e-06, + "loss": 0.7051, + "step": 53930 + }, + { + "epoch": 1.38, + "learning_rate": 1.1747774275595092e-06, + "loss": 0.688, + "step": 53931 + }, + { + "epoch": 1.38, + "learning_rate": 1.174750182943216e-06, + "loss": 0.7778, + "step": 53932 + }, + { + "epoch": 1.38, + "learning_rate": 1.174722938193125e-06, + "loss": 0.5784, + "step": 53933 + }, + { + "epoch": 1.38, + "learning_rate": 1.1746956933092565e-06, + "loss": 0.6855, + "step": 53934 + }, + { + "epoch": 1.38, + "learning_rate": 1.1746684482916316e-06, + "loss": 0.8135, + "step": 53935 + }, + { + "epoch": 1.38, + "learning_rate": 1.1746412031402708e-06, + "loss": 0.3057, + "step": 53936 + }, + { + "epoch": 1.38, + "learning_rate": 1.1746139578551954e-06, + "loss": 0.6455, + "step": 53937 + }, + { + "epoch": 1.38, + "learning_rate": 1.1745867124364261e-06, + "loss": 0.6367, + "step": 53938 + }, + { + "epoch": 1.38, + "learning_rate": 1.174559466883984e-06, + "loss": 0.5803, + "step": 53939 + }, + { + "epoch": 1.38, + "learning_rate": 1.1745322211978898e-06, + "loss": 0.814, + "step": 53940 + }, + { + "epoch": 1.38, + "learning_rate": 1.174504975378164e-06, + "loss": 0.6509, + "step": 53941 + }, + { + "epoch": 1.38, + "learning_rate": 1.1744777294248278e-06, + "loss": 0.5732, + "step": 53942 + }, + { + "epoch": 1.38, + "learning_rate": 1.1744504833379024e-06, + "loss": 0.6709, + "step": 53943 + }, + { + "epoch": 1.38, + "learning_rate": 1.174423237117408e-06, + "loss": 0.7441, + "step": 53944 + }, + { + "epoch": 1.38, + "learning_rate": 1.1743959907633656e-06, + "loss": 0.7676, + "step": 53945 + }, + { + "epoch": 1.38, + "learning_rate": 1.1743687442757963e-06, + "loss": 0.6567, + "step": 53946 + }, + { + "epoch": 1.38, + "learning_rate": 1.1743414976547209e-06, + "loss": 0.6504, + "step": 53947 + }, + { + "epoch": 1.38, + "learning_rate": 1.1743142509001603e-06, + "loss": 0.5996, + "step": 53948 + }, + { + "epoch": 1.38, + "learning_rate": 1.1742870040121352e-06, + "loss": 0.7021, + "step": 53949 + }, + { + "epoch": 1.38, + "learning_rate": 1.1742597569906667e-06, + "loss": 0.3569, + "step": 53950 + }, + { + "epoch": 1.38, + "learning_rate": 1.1742325098357752e-06, + "loss": 0.833, + "step": 53951 + }, + { + "epoch": 1.38, + "learning_rate": 1.1742052625474822e-06, + "loss": 0.5952, + "step": 53952 + }, + { + "epoch": 1.38, + "learning_rate": 1.174178015125808e-06, + "loss": 0.6387, + "step": 53953 + }, + { + "epoch": 1.38, + "learning_rate": 1.1741507675707741e-06, + "loss": 0.7188, + "step": 53954 + }, + { + "epoch": 1.38, + "learning_rate": 1.1741235198824006e-06, + "loss": 0.6978, + "step": 53955 + }, + { + "epoch": 1.38, + "learning_rate": 1.1740962720607091e-06, + "loss": 0.5825, + "step": 53956 + }, + { + "epoch": 1.38, + "learning_rate": 1.1740690241057196e-06, + "loss": 0.6787, + "step": 53957 + }, + { + "epoch": 1.38, + "learning_rate": 1.1740417760174538e-06, + "loss": 0.5693, + "step": 53958 + }, + { + "epoch": 1.38, + "learning_rate": 1.174014527795932e-06, + "loss": 0.4382, + "step": 53959 + }, + { + "epoch": 1.38, + "learning_rate": 1.1739872794411757e-06, + "loss": 0.6597, + "step": 53960 + }, + { + "epoch": 1.38, + "learning_rate": 1.1739600309532047e-06, + "loss": 0.6875, + "step": 53961 + }, + { + "epoch": 1.38, + "learning_rate": 1.173932782332041e-06, + "loss": 0.5527, + "step": 53962 + }, + { + "epoch": 1.38, + "learning_rate": 1.1739055335777046e-06, + "loss": 0.7627, + "step": 53963 + }, + { + "epoch": 1.38, + "learning_rate": 1.173878284690217e-06, + "loss": 0.5908, + "step": 53964 + }, + { + "epoch": 1.38, + "learning_rate": 1.1738510356695989e-06, + "loss": 0.667, + "step": 53965 + }, + { + "epoch": 1.38, + "learning_rate": 1.1738237865158706e-06, + "loss": 0.6162, + "step": 53966 + }, + { + "epoch": 1.38, + "learning_rate": 1.1737965372290537e-06, + "loss": 0.5259, + "step": 53967 + }, + { + "epoch": 1.38, + "learning_rate": 1.173769287809169e-06, + "loss": 0.5386, + "step": 53968 + }, + { + "epoch": 1.38, + "learning_rate": 1.173742038256237e-06, + "loss": 0.7363, + "step": 53969 + }, + { + "epoch": 1.38, + "learning_rate": 1.1737147885702782e-06, + "loss": 0.5498, + "step": 53970 + }, + { + "epoch": 1.38, + "learning_rate": 1.1736875387513146e-06, + "loss": 0.627, + "step": 53971 + }, + { + "epoch": 1.38, + "learning_rate": 1.173660288799366e-06, + "loss": 0.5293, + "step": 53972 + }, + { + "epoch": 1.38, + "learning_rate": 1.173633038714454e-06, + "loss": 0.6582, + "step": 53973 + }, + { + "epoch": 1.38, + "learning_rate": 1.1736057884965992e-06, + "loss": 0.5596, + "step": 53974 + }, + { + "epoch": 1.38, + "learning_rate": 1.1735785381458224e-06, + "loss": 0.7402, + "step": 53975 + }, + { + "epoch": 1.38, + "learning_rate": 1.1735512876621444e-06, + "loss": 0.8125, + "step": 53976 + }, + { + "epoch": 1.38, + "learning_rate": 1.1735240370455862e-06, + "loss": 0.625, + "step": 53977 + }, + { + "epoch": 1.38, + "learning_rate": 1.1734967862961685e-06, + "loss": 0.6709, + "step": 53978 + }, + { + "epoch": 1.38, + "learning_rate": 1.1734695354139126e-06, + "loss": 0.7559, + "step": 53979 + }, + { + "epoch": 1.38, + "learning_rate": 1.1734422843988387e-06, + "loss": 0.6123, + "step": 53980 + }, + { + "epoch": 1.38, + "learning_rate": 1.1734150332509683e-06, + "loss": 0.5859, + "step": 53981 + }, + { + "epoch": 1.38, + "learning_rate": 1.1733877819703214e-06, + "loss": 0.6914, + "step": 53982 + }, + { + "epoch": 1.38, + "learning_rate": 1.1733605305569202e-06, + "loss": 0.7471, + "step": 53983 + }, + { + "epoch": 1.38, + "learning_rate": 1.1733332790107846e-06, + "loss": 0.6079, + "step": 53984 + }, + { + "epoch": 1.38, + "learning_rate": 1.1733060273319355e-06, + "loss": 0.7559, + "step": 53985 + }, + { + "epoch": 1.38, + "learning_rate": 1.1732787755203938e-06, + "loss": 0.4907, + "step": 53986 + }, + { + "epoch": 1.38, + "learning_rate": 1.1732515235761811e-06, + "loss": 0.7163, + "step": 53987 + }, + { + "epoch": 1.38, + "learning_rate": 1.173224271499317e-06, + "loss": 0.4446, + "step": 53988 + }, + { + "epoch": 1.38, + "learning_rate": 1.1731970192898235e-06, + "loss": 0.8242, + "step": 53989 + }, + { + "epoch": 1.38, + "learning_rate": 1.1731697669477209e-06, + "loss": 0.5898, + "step": 53990 + }, + { + "epoch": 1.38, + "learning_rate": 1.17314251447303e-06, + "loss": 0.6528, + "step": 53991 + }, + { + "epoch": 1.38, + "learning_rate": 1.173115261865772e-06, + "loss": 0.7832, + "step": 53992 + }, + { + "epoch": 1.38, + "learning_rate": 1.1730880091259674e-06, + "loss": 0.6001, + "step": 53993 + }, + { + "epoch": 1.38, + "learning_rate": 1.1730607562536379e-06, + "loss": 0.6953, + "step": 53994 + }, + { + "epoch": 1.38, + "learning_rate": 1.173033503248803e-06, + "loss": 0.6382, + "step": 53995 + }, + { + "epoch": 1.38, + "learning_rate": 1.1730062501114848e-06, + "loss": 0.7017, + "step": 53996 + }, + { + "epoch": 1.38, + "learning_rate": 1.1729789968417033e-06, + "loss": 0.5112, + "step": 53997 + }, + { + "epoch": 1.38, + "learning_rate": 1.1729517434394799e-06, + "loss": 0.6108, + "step": 53998 + }, + { + "epoch": 1.38, + "learning_rate": 1.1729244899048354e-06, + "loss": 0.6426, + "step": 53999 + }, + { + "epoch": 1.38, + "learning_rate": 1.1728972362377905e-06, + "loss": 0.6748, + "step": 54000 + }, + { + "epoch": 1.38, + "learning_rate": 1.1728699824383658e-06, + "loss": 0.4592, + "step": 54001 + }, + { + "epoch": 1.38, + "learning_rate": 1.1728427285065829e-06, + "loss": 0.873, + "step": 54002 + }, + { + "epoch": 1.38, + "learning_rate": 1.172815474442462e-06, + "loss": 0.8398, + "step": 54003 + }, + { + "epoch": 1.38, + "learning_rate": 1.1727882202460248e-06, + "loss": 0.5227, + "step": 54004 + }, + { + "epoch": 1.38, + "learning_rate": 1.172760965917291e-06, + "loss": 0.7178, + "step": 54005 + }, + { + "epoch": 1.38, + "learning_rate": 1.1727337114562825e-06, + "loss": 0.6094, + "step": 54006 + }, + { + "epoch": 1.38, + "learning_rate": 1.1727064568630193e-06, + "loss": 0.6816, + "step": 54007 + }, + { + "epoch": 1.38, + "learning_rate": 1.1726792021375232e-06, + "loss": 0.5684, + "step": 54008 + }, + { + "epoch": 1.38, + "learning_rate": 1.1726519472798142e-06, + "loss": 0.542, + "step": 54009 + }, + { + "epoch": 1.38, + "learning_rate": 1.1726246922899135e-06, + "loss": 0.6792, + "step": 54010 + }, + { + "epoch": 1.38, + "learning_rate": 1.1725974371678423e-06, + "loss": 0.6367, + "step": 54011 + }, + { + "epoch": 1.38, + "learning_rate": 1.172570181913621e-06, + "loss": 0.6001, + "step": 54012 + }, + { + "epoch": 1.38, + "learning_rate": 1.1725429265272707e-06, + "loss": 0.5757, + "step": 54013 + }, + { + "epoch": 1.38, + "learning_rate": 1.1725156710088123e-06, + "loss": 0.6123, + "step": 54014 + }, + { + "epoch": 1.38, + "learning_rate": 1.1724884153582664e-06, + "loss": 0.7656, + "step": 54015 + }, + { + "epoch": 1.38, + "learning_rate": 1.172461159575654e-06, + "loss": 0.2573, + "step": 54016 + }, + { + "epoch": 1.38, + "learning_rate": 1.1724339036609962e-06, + "loss": 0.6113, + "step": 54017 + }, + { + "epoch": 1.38, + "learning_rate": 1.1724066476143135e-06, + "loss": 0.6001, + "step": 54018 + }, + { + "epoch": 1.38, + "learning_rate": 1.1723793914356274e-06, + "loss": 0.6863, + "step": 54019 + }, + { + "epoch": 1.38, + "learning_rate": 1.1723521351249578e-06, + "loss": 0.5208, + "step": 54020 + }, + { + "epoch": 1.38, + "learning_rate": 1.1723248786823266e-06, + "loss": 0.7402, + "step": 54021 + }, + { + "epoch": 1.38, + "learning_rate": 1.1722976221077536e-06, + "loss": 0.5244, + "step": 54022 + }, + { + "epoch": 1.38, + "learning_rate": 1.1722703654012606e-06, + "loss": 0.6729, + "step": 54023 + }, + { + "epoch": 1.38, + "learning_rate": 1.172243108562868e-06, + "loss": 0.6558, + "step": 54024 + }, + { + "epoch": 1.38, + "learning_rate": 1.1722158515925971e-06, + "loss": 0.5122, + "step": 54025 + }, + { + "epoch": 1.38, + "learning_rate": 1.172188594490468e-06, + "loss": 0.6455, + "step": 54026 + }, + { + "epoch": 1.38, + "learning_rate": 1.172161337256502e-06, + "loss": 0.4795, + "step": 54027 + }, + { + "epoch": 1.38, + "learning_rate": 1.17213407989072e-06, + "loss": 0.7402, + "step": 54028 + }, + { + "epoch": 1.38, + "learning_rate": 1.172106822393143e-06, + "loss": 0.6685, + "step": 54029 + }, + { + "epoch": 1.38, + "learning_rate": 1.172079564763792e-06, + "loss": 0.7842, + "step": 54030 + }, + { + "epoch": 1.38, + "learning_rate": 1.1720523070026873e-06, + "loss": 0.6211, + "step": 54031 + }, + { + "epoch": 1.38, + "learning_rate": 1.1720250491098499e-06, + "loss": 0.6543, + "step": 54032 + }, + { + "epoch": 1.38, + "learning_rate": 1.171997791085301e-06, + "loss": 0.7842, + "step": 54033 + }, + { + "epoch": 1.38, + "learning_rate": 1.1719705329290613e-06, + "loss": 0.4955, + "step": 54034 + }, + { + "epoch": 1.38, + "learning_rate": 1.1719432746411514e-06, + "loss": 0.5674, + "step": 54035 + }, + { + "epoch": 1.38, + "learning_rate": 1.171916016221593e-06, + "loss": 0.6255, + "step": 54036 + }, + { + "epoch": 1.38, + "learning_rate": 1.171888757670406e-06, + "loss": 0.562, + "step": 54037 + }, + { + "epoch": 1.39, + "learning_rate": 1.1718614989876117e-06, + "loss": 0.7617, + "step": 54038 + }, + { + "epoch": 1.39, + "learning_rate": 1.171834240173231e-06, + "loss": 0.7695, + "step": 54039 + }, + { + "epoch": 1.39, + "learning_rate": 1.1718069812272847e-06, + "loss": 0.6963, + "step": 54040 + }, + { + "epoch": 1.39, + "learning_rate": 1.1717797221497938e-06, + "loss": 0.7451, + "step": 54041 + }, + { + "epoch": 1.39, + "learning_rate": 1.171752462940779e-06, + "loss": 0.7432, + "step": 54042 + }, + { + "epoch": 1.39, + "learning_rate": 1.1717252036002611e-06, + "loss": 0.6108, + "step": 54043 + }, + { + "epoch": 1.39, + "learning_rate": 1.1716979441282616e-06, + "loss": 0.6265, + "step": 54044 + }, + { + "epoch": 1.39, + "learning_rate": 1.1716706845248005e-06, + "loss": 0.6462, + "step": 54045 + }, + { + "epoch": 1.39, + "learning_rate": 1.1716434247898992e-06, + "loss": 0.6094, + "step": 54046 + }, + { + "epoch": 1.39, + "learning_rate": 1.1716161649235782e-06, + "loss": 0.6523, + "step": 54047 + }, + { + "epoch": 1.39, + "learning_rate": 1.1715889049258588e-06, + "loss": 0.5645, + "step": 54048 + }, + { + "epoch": 1.39, + "learning_rate": 1.1715616447967615e-06, + "loss": 0.5864, + "step": 54049 + }, + { + "epoch": 1.39, + "learning_rate": 1.1715343845363075e-06, + "loss": 0.7227, + "step": 54050 + }, + { + "epoch": 1.39, + "learning_rate": 1.1715071241445173e-06, + "loss": 0.7051, + "step": 54051 + }, + { + "epoch": 1.39, + "learning_rate": 1.1714798636214122e-06, + "loss": 0.4463, + "step": 54052 + }, + { + "epoch": 1.39, + "learning_rate": 1.1714526029670126e-06, + "loss": 0.8057, + "step": 54053 + }, + { + "epoch": 1.39, + "learning_rate": 1.1714253421813397e-06, + "loss": 0.7393, + "step": 54054 + }, + { + "epoch": 1.39, + "learning_rate": 1.1713980812644147e-06, + "loss": 0.5239, + "step": 54055 + }, + { + "epoch": 1.39, + "learning_rate": 1.1713708202162576e-06, + "loss": 0.7549, + "step": 54056 + }, + { + "epoch": 1.39, + "learning_rate": 1.1713435590368898e-06, + "loss": 0.6221, + "step": 54057 + }, + { + "epoch": 1.39, + "learning_rate": 1.1713162977263323e-06, + "loss": 0.4668, + "step": 54058 + }, + { + "epoch": 1.39, + "learning_rate": 1.1712890362846058e-06, + "loss": 0.7598, + "step": 54059 + }, + { + "epoch": 1.39, + "learning_rate": 1.1712617747117308e-06, + "loss": 0.7793, + "step": 54060 + }, + { + "epoch": 1.39, + "learning_rate": 1.1712345130077288e-06, + "loss": 0.7705, + "step": 54061 + }, + { + "epoch": 1.39, + "learning_rate": 1.1712072511726203e-06, + "loss": 0.7002, + "step": 54062 + }, + { + "epoch": 1.39, + "learning_rate": 1.1711799892064264e-06, + "loss": 0.4927, + "step": 54063 + }, + { + "epoch": 1.39, + "learning_rate": 1.171152727109168e-06, + "loss": 0.5703, + "step": 54064 + }, + { + "epoch": 1.39, + "learning_rate": 1.1711254648808657e-06, + "loss": 0.6128, + "step": 54065 + }, + { + "epoch": 1.39, + "learning_rate": 1.1710982025215404e-06, + "loss": 0.7451, + "step": 54066 + }, + { + "epoch": 1.39, + "learning_rate": 1.171070940031213e-06, + "loss": 0.7036, + "step": 54067 + }, + { + "epoch": 1.39, + "learning_rate": 1.1710436774099047e-06, + "loss": 0.6465, + "step": 54068 + }, + { + "epoch": 1.39, + "learning_rate": 1.1710164146576363e-06, + "loss": 0.749, + "step": 54069 + }, + { + "epoch": 1.39, + "learning_rate": 1.1709891517744278e-06, + "loss": 0.6636, + "step": 54070 + }, + { + "epoch": 1.39, + "learning_rate": 1.1709618887603011e-06, + "loss": 0.8389, + "step": 54071 + }, + { + "epoch": 1.39, + "learning_rate": 1.1709346256152767e-06, + "loss": 0.4331, + "step": 54072 + }, + { + "epoch": 1.39, + "learning_rate": 1.170907362339376e-06, + "loss": 0.5381, + "step": 54073 + }, + { + "epoch": 1.39, + "learning_rate": 1.170880098932619e-06, + "loss": 0.5391, + "step": 54074 + }, + { + "epoch": 1.39, + "learning_rate": 1.170852835395027e-06, + "loss": 0.6802, + "step": 54075 + }, + { + "epoch": 1.39, + "learning_rate": 1.1708255717266206e-06, + "loss": 0.4626, + "step": 54076 + }, + { + "epoch": 1.39, + "learning_rate": 1.1707983079274212e-06, + "loss": 0.7974, + "step": 54077 + }, + { + "epoch": 1.39, + "learning_rate": 1.1707710439974492e-06, + "loss": 0.5278, + "step": 54078 + }, + { + "epoch": 1.39, + "learning_rate": 1.1707437799367259e-06, + "loss": 0.7178, + "step": 54079 + }, + { + "epoch": 1.39, + "learning_rate": 1.1707165157452718e-06, + "loss": 0.6169, + "step": 54080 + }, + { + "epoch": 1.39, + "learning_rate": 1.170689251423108e-06, + "loss": 0.6953, + "step": 54081 + }, + { + "epoch": 1.39, + "learning_rate": 1.170661986970255e-06, + "loss": 0.5938, + "step": 54082 + }, + { + "epoch": 1.39, + "learning_rate": 1.170634722386734e-06, + "loss": 0.6162, + "step": 54083 + }, + { + "epoch": 1.39, + "learning_rate": 1.1706074576725665e-06, + "loss": 0.5684, + "step": 54084 + }, + { + "epoch": 1.39, + "learning_rate": 1.170580192827772e-06, + "loss": 0.647, + "step": 54085 + }, + { + "epoch": 1.39, + "learning_rate": 1.1705529278523725e-06, + "loss": 0.4531, + "step": 54086 + }, + { + "epoch": 1.39, + "learning_rate": 1.1705256627463883e-06, + "loss": 0.8623, + "step": 54087 + }, + { + "epoch": 1.39, + "learning_rate": 1.1704983975098404e-06, + "loss": 0.7061, + "step": 54088 + }, + { + "epoch": 1.39, + "learning_rate": 1.1704711321427498e-06, + "loss": 0.5388, + "step": 54089 + }, + { + "epoch": 1.39, + "learning_rate": 1.1704438666451373e-06, + "loss": 0.6318, + "step": 54090 + }, + { + "epoch": 1.39, + "learning_rate": 1.1704166010170235e-06, + "loss": 0.5752, + "step": 54091 + }, + { + "epoch": 1.39, + "learning_rate": 1.17038933525843e-06, + "loss": 0.6465, + "step": 54092 + }, + { + "epoch": 1.39, + "learning_rate": 1.1703620693693767e-06, + "loss": 0.489, + "step": 54093 + }, + { + "epoch": 1.39, + "learning_rate": 1.1703348033498856e-06, + "loss": 0.7236, + "step": 54094 + }, + { + "epoch": 1.39, + "learning_rate": 1.1703075371999764e-06, + "loss": 0.5575, + "step": 54095 + }, + { + "epoch": 1.39, + "learning_rate": 1.1702802709196712e-06, + "loss": 0.7266, + "step": 54096 + }, + { + "epoch": 1.39, + "learning_rate": 1.1702530045089895e-06, + "loss": 0.8398, + "step": 54097 + }, + { + "epoch": 1.39, + "learning_rate": 1.1702257379679532e-06, + "loss": 0.582, + "step": 54098 + }, + { + "epoch": 1.39, + "learning_rate": 1.1701984712965832e-06, + "loss": 0.7305, + "step": 54099 + }, + { + "epoch": 1.39, + "learning_rate": 1.1701712044948995e-06, + "loss": 0.6064, + "step": 54100 + }, + { + "epoch": 1.39, + "learning_rate": 1.1701439375629238e-06, + "loss": 0.7808, + "step": 54101 + }, + { + "epoch": 1.39, + "learning_rate": 1.1701166705006767e-06, + "loss": 0.7373, + "step": 54102 + }, + { + "epoch": 1.39, + "learning_rate": 1.1700894033081792e-06, + "loss": 0.6074, + "step": 54103 + }, + { + "epoch": 1.39, + "learning_rate": 1.1700621359854519e-06, + "loss": 0.6284, + "step": 54104 + }, + { + "epoch": 1.39, + "learning_rate": 1.170034868532516e-06, + "loss": 0.6953, + "step": 54105 + }, + { + "epoch": 1.39, + "learning_rate": 1.170007600949392e-06, + "loss": 0.7891, + "step": 54106 + }, + { + "epoch": 1.39, + "learning_rate": 1.169980333236101e-06, + "loss": 0.5806, + "step": 54107 + }, + { + "epoch": 1.39, + "learning_rate": 1.1699530653926638e-06, + "loss": 0.6724, + "step": 54108 + }, + { + "epoch": 1.39, + "learning_rate": 1.169925797419102e-06, + "loss": 0.6855, + "step": 54109 + }, + { + "epoch": 1.39, + "learning_rate": 1.1698985293154354e-06, + "loss": 0.6807, + "step": 54110 + }, + { + "epoch": 1.39, + "learning_rate": 1.1698712610816852e-06, + "loss": 0.6807, + "step": 54111 + }, + { + "epoch": 1.39, + "learning_rate": 1.1698439927178722e-06, + "loss": 0.6353, + "step": 54112 + }, + { + "epoch": 1.39, + "learning_rate": 1.169816724224018e-06, + "loss": 0.521, + "step": 54113 + }, + { + "epoch": 1.39, + "learning_rate": 1.1697894556001427e-06, + "loss": 0.6943, + "step": 54114 + }, + { + "epoch": 1.39, + "learning_rate": 1.1697621868462675e-06, + "loss": 0.7261, + "step": 54115 + }, + { + "epoch": 1.39, + "learning_rate": 1.169734917962413e-06, + "loss": 0.6533, + "step": 54116 + }, + { + "epoch": 1.39, + "learning_rate": 1.1697076489486005e-06, + "loss": 0.5078, + "step": 54117 + }, + { + "epoch": 1.39, + "learning_rate": 1.1696803798048502e-06, + "loss": 0.876, + "step": 54118 + }, + { + "epoch": 1.39, + "learning_rate": 1.169653110531184e-06, + "loss": 0.6401, + "step": 54119 + }, + { + "epoch": 1.39, + "learning_rate": 1.169625841127622e-06, + "loss": 0.5454, + "step": 54120 + }, + { + "epoch": 1.39, + "learning_rate": 1.1695985715941853e-06, + "loss": 0.5581, + "step": 54121 + }, + { + "epoch": 1.39, + "learning_rate": 1.1695713019308947e-06, + "loss": 0.8018, + "step": 54122 + }, + { + "epoch": 1.39, + "learning_rate": 1.1695440321377712e-06, + "loss": 0.5439, + "step": 54123 + }, + { + "epoch": 1.39, + "learning_rate": 1.1695167622148357e-06, + "loss": 0.5242, + "step": 54124 + }, + { + "epoch": 1.39, + "learning_rate": 1.1694894921621087e-06, + "loss": 0.7295, + "step": 54125 + }, + { + "epoch": 1.39, + "learning_rate": 1.1694622219796117e-06, + "loss": 0.6426, + "step": 54126 + }, + { + "epoch": 1.39, + "learning_rate": 1.1694349516673652e-06, + "loss": 0.438, + "step": 54127 + }, + { + "epoch": 1.39, + "learning_rate": 1.1694076812253902e-06, + "loss": 0.5947, + "step": 54128 + }, + { + "epoch": 1.39, + "learning_rate": 1.1693804106537075e-06, + "loss": 0.4265, + "step": 54129 + }, + { + "epoch": 1.39, + "learning_rate": 1.169353139952338e-06, + "loss": 0.667, + "step": 54130 + }, + { + "epoch": 1.39, + "learning_rate": 1.1693258691213026e-06, + "loss": 0.7412, + "step": 54131 + }, + { + "epoch": 1.39, + "learning_rate": 1.169298598160622e-06, + "loss": 0.6523, + "step": 54132 + }, + { + "epoch": 1.39, + "learning_rate": 1.1692713270703173e-06, + "loss": 0.7363, + "step": 54133 + }, + { + "epoch": 1.39, + "learning_rate": 1.1692440558504099e-06, + "loss": 0.4717, + "step": 54134 + }, + { + "epoch": 1.39, + "learning_rate": 1.1692167845009193e-06, + "loss": 0.7129, + "step": 54135 + }, + { + "epoch": 1.39, + "learning_rate": 1.1691895130218676e-06, + "loss": 0.6006, + "step": 54136 + }, + { + "epoch": 1.39, + "learning_rate": 1.169162241413275e-06, + "loss": 0.4907, + "step": 54137 + }, + { + "epoch": 1.39, + "learning_rate": 1.1691349696751628e-06, + "loss": 0.6963, + "step": 54138 + }, + { + "epoch": 1.39, + "learning_rate": 1.1691076978075521e-06, + "loss": 0.6455, + "step": 54139 + }, + { + "epoch": 1.39, + "learning_rate": 1.169080425810463e-06, + "loss": 0.6211, + "step": 54140 + }, + { + "epoch": 1.39, + "learning_rate": 1.1690531536839168e-06, + "loss": 0.4861, + "step": 54141 + }, + { + "epoch": 1.39, + "learning_rate": 1.1690258814279345e-06, + "loss": 0.6719, + "step": 54142 + }, + { + "epoch": 1.39, + "learning_rate": 1.1689986090425366e-06, + "loss": 0.7334, + "step": 54143 + }, + { + "epoch": 1.39, + "learning_rate": 1.1689713365277445e-06, + "loss": 0.5059, + "step": 54144 + }, + { + "epoch": 1.39, + "learning_rate": 1.1689440638835788e-06, + "loss": 0.7148, + "step": 54145 + }, + { + "epoch": 1.39, + "learning_rate": 1.16891679111006e-06, + "loss": 0.4995, + "step": 54146 + }, + { + "epoch": 1.39, + "learning_rate": 1.1688895182072101e-06, + "loss": 0.6602, + "step": 54147 + }, + { + "epoch": 1.39, + "learning_rate": 1.1688622451750488e-06, + "loss": 0.5859, + "step": 54148 + }, + { + "epoch": 1.39, + "learning_rate": 1.1688349720135978e-06, + "loss": 0.6978, + "step": 54149 + }, + { + "epoch": 1.39, + "learning_rate": 1.168807698722877e-06, + "loss": 0.6665, + "step": 54150 + }, + { + "epoch": 1.39, + "learning_rate": 1.1687804253029083e-06, + "loss": 0.5537, + "step": 54151 + }, + { + "epoch": 1.39, + "learning_rate": 1.168753151753712e-06, + "loss": 0.5413, + "step": 54152 + }, + { + "epoch": 1.39, + "learning_rate": 1.1687258780753095e-06, + "loss": 0.448, + "step": 54153 + }, + { + "epoch": 1.39, + "learning_rate": 1.1686986042677212e-06, + "loss": 0.5625, + "step": 54154 + }, + { + "epoch": 1.39, + "learning_rate": 1.1686713303309683e-06, + "loss": 0.6807, + "step": 54155 + }, + { + "epoch": 1.39, + "learning_rate": 1.1686440562650712e-06, + "loss": 0.6479, + "step": 54156 + }, + { + "epoch": 1.39, + "learning_rate": 1.1686167820700511e-06, + "loss": 0.4851, + "step": 54157 + }, + { + "epoch": 1.39, + "learning_rate": 1.168589507745929e-06, + "loss": 0.6973, + "step": 54158 + }, + { + "epoch": 1.39, + "learning_rate": 1.1685622332927261e-06, + "loss": 0.6406, + "step": 54159 + }, + { + "epoch": 1.39, + "learning_rate": 1.1685349587104623e-06, + "loss": 0.4972, + "step": 54160 + }, + { + "epoch": 1.39, + "learning_rate": 1.168507683999159e-06, + "loss": 0.6895, + "step": 54161 + }, + { + "epoch": 1.39, + "learning_rate": 1.1684804091588372e-06, + "loss": 0.707, + "step": 54162 + }, + { + "epoch": 1.39, + "learning_rate": 1.1684531341895178e-06, + "loss": 0.7339, + "step": 54163 + }, + { + "epoch": 1.39, + "learning_rate": 1.1684258590912216e-06, + "loss": 0.7861, + "step": 54164 + }, + { + "epoch": 1.39, + "learning_rate": 1.1683985838639693e-06, + "loss": 0.8301, + "step": 54165 + }, + { + "epoch": 1.39, + "learning_rate": 1.1683713085077823e-06, + "loss": 0.5928, + "step": 54166 + }, + { + "epoch": 1.39, + "learning_rate": 1.1683440330226809e-06, + "loss": 0.7627, + "step": 54167 + }, + { + "epoch": 1.39, + "learning_rate": 1.168316757408686e-06, + "loss": 0.542, + "step": 54168 + }, + { + "epoch": 1.39, + "learning_rate": 1.168289481665819e-06, + "loss": 0.7207, + "step": 54169 + }, + { + "epoch": 1.39, + "learning_rate": 1.1682622057941005e-06, + "loss": 0.6577, + "step": 54170 + }, + { + "epoch": 1.39, + "learning_rate": 1.168234929793551e-06, + "loss": 0.6118, + "step": 54171 + }, + { + "epoch": 1.39, + "learning_rate": 1.1682076536641922e-06, + "loss": 0.6094, + "step": 54172 + }, + { + "epoch": 1.39, + "learning_rate": 1.168180377406044e-06, + "loss": 0.6274, + "step": 54173 + }, + { + "epoch": 1.39, + "learning_rate": 1.1681531010191287e-06, + "loss": 0.75, + "step": 54174 + }, + { + "epoch": 1.39, + "learning_rate": 1.1681258245034655e-06, + "loss": 0.7393, + "step": 54175 + }, + { + "epoch": 1.39, + "learning_rate": 1.1680985478590763e-06, + "loss": 0.4712, + "step": 54176 + }, + { + "epoch": 1.39, + "learning_rate": 1.1680712710859818e-06, + "loss": 0.6299, + "step": 54177 + }, + { + "epoch": 1.39, + "learning_rate": 1.1680439941842028e-06, + "loss": 0.4067, + "step": 54178 + }, + { + "epoch": 1.39, + "learning_rate": 1.1680167171537605e-06, + "loss": 0.6465, + "step": 54179 + }, + { + "epoch": 1.39, + "learning_rate": 1.1679894399946754e-06, + "loss": 0.623, + "step": 54180 + }, + { + "epoch": 1.39, + "learning_rate": 1.1679621627069685e-06, + "loss": 0.551, + "step": 54181 + }, + { + "epoch": 1.39, + "learning_rate": 1.1679348852906605e-06, + "loss": 0.6201, + "step": 54182 + }, + { + "epoch": 1.39, + "learning_rate": 1.1679076077457725e-06, + "loss": 0.8164, + "step": 54183 + }, + { + "epoch": 1.39, + "learning_rate": 1.167880330072326e-06, + "loss": 0.4707, + "step": 54184 + }, + { + "epoch": 1.39, + "learning_rate": 1.1678530522703405e-06, + "loss": 0.6047, + "step": 54185 + }, + { + "epoch": 1.39, + "learning_rate": 1.1678257743398378e-06, + "loss": 0.6426, + "step": 54186 + }, + { + "epoch": 1.39, + "learning_rate": 1.1677984962808388e-06, + "loss": 0.6797, + "step": 54187 + }, + { + "epoch": 1.39, + "learning_rate": 1.167771218093364e-06, + "loss": 0.5615, + "step": 54188 + }, + { + "epoch": 1.39, + "learning_rate": 1.1677439397774347e-06, + "loss": 0.8057, + "step": 54189 + }, + { + "epoch": 1.39, + "learning_rate": 1.1677166613330714e-06, + "loss": 0.6353, + "step": 54190 + }, + { + "epoch": 1.39, + "learning_rate": 1.1676893827602952e-06, + "loss": 0.6182, + "step": 54191 + }, + { + "epoch": 1.39, + "learning_rate": 1.1676621040591267e-06, + "loss": 0.7109, + "step": 54192 + }, + { + "epoch": 1.39, + "learning_rate": 1.1676348252295875e-06, + "loss": 0.8506, + "step": 54193 + }, + { + "epoch": 1.39, + "learning_rate": 1.1676075462716978e-06, + "loss": 0.5935, + "step": 54194 + }, + { + "epoch": 1.39, + "learning_rate": 1.167580267185479e-06, + "loss": 0.5745, + "step": 54195 + }, + { + "epoch": 1.39, + "learning_rate": 1.1675529879709514e-06, + "loss": 0.5083, + "step": 54196 + }, + { + "epoch": 1.39, + "learning_rate": 1.1675257086281363e-06, + "loss": 0.6431, + "step": 54197 + }, + { + "epoch": 1.39, + "learning_rate": 1.1674984291570543e-06, + "loss": 0.5903, + "step": 54198 + }, + { + "epoch": 1.39, + "learning_rate": 1.1674711495577268e-06, + "loss": 0.6826, + "step": 54199 + }, + { + "epoch": 1.39, + "learning_rate": 1.1674438698301739e-06, + "loss": 0.5811, + "step": 54200 + }, + { + "epoch": 1.39, + "learning_rate": 1.1674165899744174e-06, + "loss": 0.5977, + "step": 54201 + }, + { + "epoch": 1.39, + "learning_rate": 1.167389309990477e-06, + "loss": 0.7041, + "step": 54202 + }, + { + "epoch": 1.39, + "learning_rate": 1.167362029878375e-06, + "loss": 0.7793, + "step": 54203 + }, + { + "epoch": 1.39, + "learning_rate": 1.1673347496381313e-06, + "loss": 0.7373, + "step": 54204 + }, + { + "epoch": 1.39, + "learning_rate": 1.167307469269767e-06, + "loss": 0.5859, + "step": 54205 + }, + { + "epoch": 1.39, + "learning_rate": 1.1672801887733033e-06, + "loss": 0.7432, + "step": 54206 + }, + { + "epoch": 1.39, + "learning_rate": 1.1672529081487607e-06, + "loss": 0.5303, + "step": 54207 + }, + { + "epoch": 1.39, + "learning_rate": 1.16722562739616e-06, + "loss": 0.6411, + "step": 54208 + }, + { + "epoch": 1.39, + "learning_rate": 1.1671983465155228e-06, + "loss": 0.6816, + "step": 54209 + }, + { + "epoch": 1.39, + "learning_rate": 1.1671710655068694e-06, + "loss": 0.5269, + "step": 54210 + }, + { + "epoch": 1.39, + "learning_rate": 1.1671437843702208e-06, + "loss": 0.3887, + "step": 54211 + }, + { + "epoch": 1.39, + "learning_rate": 1.1671165031055975e-06, + "loss": 0.7773, + "step": 54212 + }, + { + "epoch": 1.39, + "learning_rate": 1.1670892217130213e-06, + "loss": 0.8208, + "step": 54213 + }, + { + "epoch": 1.39, + "learning_rate": 1.1670619401925124e-06, + "loss": 0.8203, + "step": 54214 + }, + { + "epoch": 1.39, + "learning_rate": 1.1670346585440916e-06, + "loss": 0.5161, + "step": 54215 + }, + { + "epoch": 1.39, + "learning_rate": 1.1670073767677804e-06, + "loss": 0.7168, + "step": 54216 + }, + { + "epoch": 1.39, + "learning_rate": 1.1669800948635988e-06, + "loss": 0.8213, + "step": 54217 + }, + { + "epoch": 1.39, + "learning_rate": 1.1669528128315688e-06, + "loss": 0.625, + "step": 54218 + }, + { + "epoch": 1.39, + "learning_rate": 1.1669255306717105e-06, + "loss": 0.6353, + "step": 54219 + }, + { + "epoch": 1.39, + "learning_rate": 1.166898248384045e-06, + "loss": 0.6709, + "step": 54220 + }, + { + "epoch": 1.39, + "learning_rate": 1.1668709659685932e-06, + "loss": 0.6958, + "step": 54221 + }, + { + "epoch": 1.39, + "learning_rate": 1.1668436834253759e-06, + "loss": 0.7256, + "step": 54222 + }, + { + "epoch": 1.39, + "learning_rate": 1.1668164007544143e-06, + "loss": 0.6904, + "step": 54223 + }, + { + "epoch": 1.39, + "learning_rate": 1.1667891179557289e-06, + "loss": 0.5703, + "step": 54224 + }, + { + "epoch": 1.39, + "learning_rate": 1.1667618350293405e-06, + "loss": 0.7314, + "step": 54225 + }, + { + "epoch": 1.39, + "learning_rate": 1.1667345519752704e-06, + "loss": 0.5371, + "step": 54226 + }, + { + "epoch": 1.39, + "learning_rate": 1.1667072687935393e-06, + "loss": 0.7715, + "step": 54227 + }, + { + "epoch": 1.39, + "learning_rate": 1.1666799854841684e-06, + "loss": 0.6465, + "step": 54228 + }, + { + "epoch": 1.39, + "learning_rate": 1.1666527020471782e-06, + "loss": 0.709, + "step": 54229 + }, + { + "epoch": 1.39, + "learning_rate": 1.1666254184825895e-06, + "loss": 0.7832, + "step": 54230 + }, + { + "epoch": 1.39, + "learning_rate": 1.1665981347904232e-06, + "loss": 0.6489, + "step": 54231 + }, + { + "epoch": 1.39, + "learning_rate": 1.1665708509707007e-06, + "loss": 0.627, + "step": 54232 + }, + { + "epoch": 1.39, + "learning_rate": 1.1665435670234426e-06, + "loss": 0.6641, + "step": 54233 + }, + { + "epoch": 1.39, + "learning_rate": 1.1665162829486694e-06, + "loss": 0.6304, + "step": 54234 + }, + { + "epoch": 1.39, + "learning_rate": 1.1664889987464026e-06, + "loss": 0.7148, + "step": 54235 + }, + { + "epoch": 1.39, + "learning_rate": 1.1664617144166627e-06, + "loss": 0.752, + "step": 54236 + }, + { + "epoch": 1.39, + "learning_rate": 1.1664344299594709e-06, + "loss": 0.4512, + "step": 54237 + }, + { + "epoch": 1.39, + "learning_rate": 1.1664071453748478e-06, + "loss": 0.4971, + "step": 54238 + }, + { + "epoch": 1.39, + "learning_rate": 1.1663798606628147e-06, + "loss": 0.5913, + "step": 54239 + }, + { + "epoch": 1.39, + "learning_rate": 1.1663525758233916e-06, + "loss": 0.5085, + "step": 54240 + }, + { + "epoch": 1.39, + "learning_rate": 1.1663252908566004e-06, + "loss": 0.5979, + "step": 54241 + }, + { + "epoch": 1.39, + "learning_rate": 1.1662980057624612e-06, + "loss": 0.5822, + "step": 54242 + }, + { + "epoch": 1.39, + "learning_rate": 1.1662707205409958e-06, + "loss": 0.6953, + "step": 54243 + }, + { + "epoch": 1.39, + "learning_rate": 1.166243435192224e-06, + "loss": 0.6836, + "step": 54244 + }, + { + "epoch": 1.39, + "learning_rate": 1.1662161497161678e-06, + "loss": 0.5139, + "step": 54245 + }, + { + "epoch": 1.39, + "learning_rate": 1.166188864112847e-06, + "loss": 0.4673, + "step": 54246 + }, + { + "epoch": 1.39, + "learning_rate": 1.1661615783822835e-06, + "loss": 0.7129, + "step": 54247 + }, + { + "epoch": 1.39, + "learning_rate": 1.1661342925244974e-06, + "loss": 0.7607, + "step": 54248 + }, + { + "epoch": 1.39, + "learning_rate": 1.1661070065395102e-06, + "loss": 0.5684, + "step": 54249 + }, + { + "epoch": 1.39, + "learning_rate": 1.166079720427342e-06, + "loss": 0.6875, + "step": 54250 + }, + { + "epoch": 1.39, + "learning_rate": 1.1660524341880146e-06, + "loss": 0.8057, + "step": 54251 + }, + { + "epoch": 1.39, + "learning_rate": 1.1660251478215485e-06, + "loss": 0.5336, + "step": 54252 + }, + { + "epoch": 1.39, + "learning_rate": 1.1659978613279645e-06, + "loss": 0.8193, + "step": 54253 + }, + { + "epoch": 1.39, + "learning_rate": 1.1659705747072837e-06, + "loss": 0.6177, + "step": 54254 + }, + { + "epoch": 1.39, + "learning_rate": 1.1659432879595263e-06, + "loss": 0.4197, + "step": 54255 + }, + { + "epoch": 1.39, + "learning_rate": 1.1659160010847144e-06, + "loss": 0.6729, + "step": 54256 + }, + { + "epoch": 1.39, + "learning_rate": 1.165888714082868e-06, + "loss": 0.6135, + "step": 54257 + }, + { + "epoch": 1.39, + "learning_rate": 1.1658614269540083e-06, + "loss": 0.6294, + "step": 54258 + }, + { + "epoch": 1.39, + "learning_rate": 1.1658341396981559e-06, + "loss": 0.7422, + "step": 54259 + }, + { + "epoch": 1.39, + "learning_rate": 1.1658068523153324e-06, + "loss": 0.6035, + "step": 54260 + }, + { + "epoch": 1.39, + "learning_rate": 1.1657795648055577e-06, + "loss": 0.7666, + "step": 54261 + }, + { + "epoch": 1.39, + "learning_rate": 1.1657522771688534e-06, + "loss": 0.7158, + "step": 54262 + }, + { + "epoch": 1.39, + "learning_rate": 1.1657249894052403e-06, + "loss": 0.8389, + "step": 54263 + }, + { + "epoch": 1.39, + "learning_rate": 1.1656977015147393e-06, + "loss": 0.5908, + "step": 54264 + }, + { + "epoch": 1.39, + "learning_rate": 1.165670413497371e-06, + "loss": 0.4788, + "step": 54265 + }, + { + "epoch": 1.39, + "learning_rate": 1.1656431253531564e-06, + "loss": 0.7998, + "step": 54266 + }, + { + "epoch": 1.39, + "learning_rate": 1.1656158370821165e-06, + "loss": 0.5981, + "step": 54267 + }, + { + "epoch": 1.39, + "learning_rate": 1.1655885486842725e-06, + "loss": 0.7031, + "step": 54268 + }, + { + "epoch": 1.39, + "learning_rate": 1.1655612601596445e-06, + "loss": 0.7363, + "step": 54269 + }, + { + "epoch": 1.39, + "learning_rate": 1.165533971508254e-06, + "loss": 0.4259, + "step": 54270 + }, + { + "epoch": 1.39, + "learning_rate": 1.1655066827301219e-06, + "loss": 0.584, + "step": 54271 + }, + { + "epoch": 1.39, + "learning_rate": 1.1654793938252689e-06, + "loss": 0.7031, + "step": 54272 + }, + { + "epoch": 1.39, + "learning_rate": 1.165452104793716e-06, + "loss": 0.7705, + "step": 54273 + }, + { + "epoch": 1.39, + "learning_rate": 1.165424815635484e-06, + "loss": 0.582, + "step": 54274 + }, + { + "epoch": 1.39, + "learning_rate": 1.1653975263505935e-06, + "loss": 0.6855, + "step": 54275 + }, + { + "epoch": 1.39, + "learning_rate": 1.1653702369390662e-06, + "loss": 0.5244, + "step": 54276 + }, + { + "epoch": 1.39, + "learning_rate": 1.165342947400922e-06, + "loss": 0.7334, + "step": 54277 + }, + { + "epoch": 1.39, + "learning_rate": 1.1653156577361826e-06, + "loss": 0.6646, + "step": 54278 + }, + { + "epoch": 1.39, + "learning_rate": 1.1652883679448688e-06, + "loss": 0.5815, + "step": 54279 + }, + { + "epoch": 1.39, + "learning_rate": 1.165261078027001e-06, + "loss": 0.6333, + "step": 54280 + }, + { + "epoch": 1.39, + "learning_rate": 1.1652337879826005e-06, + "loss": 0.6187, + "step": 54281 + }, + { + "epoch": 1.39, + "learning_rate": 1.1652064978116878e-06, + "loss": 0.5874, + "step": 54282 + }, + { + "epoch": 1.39, + "learning_rate": 1.1651792075142847e-06, + "loss": 0.79, + "step": 54283 + }, + { + "epoch": 1.39, + "learning_rate": 1.1651519170904109e-06, + "loss": 0.5264, + "step": 54284 + }, + { + "epoch": 1.39, + "learning_rate": 1.1651246265400882e-06, + "loss": 0.6641, + "step": 54285 + }, + { + "epoch": 1.39, + "learning_rate": 1.1650973358633369e-06, + "loss": 0.6616, + "step": 54286 + }, + { + "epoch": 1.39, + "learning_rate": 1.1650700450601785e-06, + "loss": 0.7021, + "step": 54287 + }, + { + "epoch": 1.39, + "learning_rate": 1.1650427541306336e-06, + "loss": 0.7314, + "step": 54288 + }, + { + "epoch": 1.39, + "learning_rate": 1.1650154630747229e-06, + "loss": 0.4194, + "step": 54289 + }, + { + "epoch": 1.39, + "learning_rate": 1.164988171892467e-06, + "loss": 0.71, + "step": 54290 + }, + { + "epoch": 1.39, + "learning_rate": 1.1649608805838878e-06, + "loss": 0.7578, + "step": 54291 + }, + { + "epoch": 1.39, + "learning_rate": 1.1649335891490052e-06, + "loss": 0.5239, + "step": 54292 + }, + { + "epoch": 1.39, + "learning_rate": 1.1649062975878412e-06, + "loss": 0.4751, + "step": 54293 + }, + { + "epoch": 1.39, + "learning_rate": 1.1648790059004155e-06, + "loss": 0.79, + "step": 54294 + }, + { + "epoch": 1.39, + "learning_rate": 1.1648517140867498e-06, + "loss": 0.8242, + "step": 54295 + }, + { + "epoch": 1.39, + "learning_rate": 1.1648244221468644e-06, + "loss": 0.5959, + "step": 54296 + }, + { + "epoch": 1.39, + "learning_rate": 1.1647971300807807e-06, + "loss": 0.4927, + "step": 54297 + }, + { + "epoch": 1.39, + "learning_rate": 1.1647698378885196e-06, + "loss": 0.5635, + "step": 54298 + }, + { + "epoch": 1.39, + "learning_rate": 1.1647425455701014e-06, + "loss": 0.708, + "step": 54299 + }, + { + "epoch": 1.39, + "learning_rate": 1.1647152531255476e-06, + "loss": 0.5947, + "step": 54300 + }, + { + "epoch": 1.39, + "learning_rate": 1.164687960554879e-06, + "loss": 0.6704, + "step": 54301 + }, + { + "epoch": 1.39, + "learning_rate": 1.1646606678581164e-06, + "loss": 0.7529, + "step": 54302 + }, + { + "epoch": 1.39, + "learning_rate": 1.1646333750352805e-06, + "loss": 0.5659, + "step": 54303 + }, + { + "epoch": 1.39, + "learning_rate": 1.1646060820863928e-06, + "loss": 0.481, + "step": 54304 + }, + { + "epoch": 1.39, + "learning_rate": 1.1645787890114733e-06, + "loss": 0.5164, + "step": 54305 + }, + { + "epoch": 1.39, + "learning_rate": 1.1645514958105436e-06, + "loss": 0.4172, + "step": 54306 + }, + { + "epoch": 1.39, + "learning_rate": 1.1645242024836242e-06, + "loss": 0.6504, + "step": 54307 + }, + { + "epoch": 1.39, + "learning_rate": 1.1644969090307369e-06, + "loss": 0.5659, + "step": 54308 + }, + { + "epoch": 1.39, + "learning_rate": 1.164469615451901e-06, + "loss": 0.6484, + "step": 54309 + }, + { + "epoch": 1.39, + "learning_rate": 1.1644423217471389e-06, + "loss": 0.7041, + "step": 54310 + }, + { + "epoch": 1.39, + "learning_rate": 1.1644150279164704e-06, + "loss": 0.5352, + "step": 54311 + }, + { + "epoch": 1.39, + "learning_rate": 1.1643877339599171e-06, + "loss": 0.5498, + "step": 54312 + }, + { + "epoch": 1.39, + "learning_rate": 1.1643604398774999e-06, + "loss": 0.623, + "step": 54313 + }, + { + "epoch": 1.39, + "learning_rate": 1.1643331456692391e-06, + "loss": 0.6211, + "step": 54314 + }, + { + "epoch": 1.39, + "learning_rate": 1.164305851335156e-06, + "loss": 0.625, + "step": 54315 + }, + { + "epoch": 1.39, + "learning_rate": 1.1642785568752715e-06, + "loss": 0.7339, + "step": 54316 + }, + { + "epoch": 1.39, + "learning_rate": 1.1642512622896063e-06, + "loss": 0.6587, + "step": 54317 + }, + { + "epoch": 1.39, + "learning_rate": 1.164223967578182e-06, + "loss": 0.6709, + "step": 54318 + }, + { + "epoch": 1.39, + "learning_rate": 1.1641966727410185e-06, + "loss": 0.6226, + "step": 54319 + }, + { + "epoch": 1.39, + "learning_rate": 1.1641693777781374e-06, + "loss": 0.7197, + "step": 54320 + }, + { + "epoch": 1.39, + "learning_rate": 1.1641420826895591e-06, + "loss": 0.8027, + "step": 54321 + }, + { + "epoch": 1.39, + "learning_rate": 1.164114787475305e-06, + "loss": 0.75, + "step": 54322 + }, + { + "epoch": 1.39, + "learning_rate": 1.1640874921353958e-06, + "loss": 0.6416, + "step": 54323 + }, + { + "epoch": 1.39, + "learning_rate": 1.164060196669852e-06, + "loss": 0.8311, + "step": 54324 + }, + { + "epoch": 1.39, + "learning_rate": 1.164032901078695e-06, + "loss": 0.7256, + "step": 54325 + }, + { + "epoch": 1.39, + "learning_rate": 1.1640056053619455e-06, + "loss": 0.6934, + "step": 54326 + }, + { + "epoch": 1.39, + "learning_rate": 1.1639783095196246e-06, + "loss": 0.7744, + "step": 54327 + }, + { + "epoch": 1.39, + "learning_rate": 1.1639510135517533e-06, + "loss": 0.5576, + "step": 54328 + }, + { + "epoch": 1.39, + "learning_rate": 1.1639237174583521e-06, + "loss": 0.4854, + "step": 54329 + }, + { + "epoch": 1.39, + "learning_rate": 1.1638964212394418e-06, + "loss": 0.6704, + "step": 54330 + }, + { + "epoch": 1.39, + "learning_rate": 1.1638691248950436e-06, + "loss": 0.5845, + "step": 54331 + }, + { + "epoch": 1.39, + "learning_rate": 1.1638418284251782e-06, + "loss": 0.6182, + "step": 54332 + }, + { + "epoch": 1.39, + "learning_rate": 1.163814531829867e-06, + "loss": 0.4802, + "step": 54333 + }, + { + "epoch": 1.39, + "learning_rate": 1.1637872351091304e-06, + "loss": 0.7266, + "step": 54334 + }, + { + "epoch": 1.39, + "learning_rate": 1.1637599382629895e-06, + "loss": 0.6748, + "step": 54335 + }, + { + "epoch": 1.39, + "learning_rate": 1.163732641291465e-06, + "loss": 0.6816, + "step": 54336 + }, + { + "epoch": 1.39, + "learning_rate": 1.1637053441945782e-06, + "loss": 0.5, + "step": 54337 + }, + { + "epoch": 1.39, + "learning_rate": 1.1636780469723495e-06, + "loss": 0.6357, + "step": 54338 + }, + { + "epoch": 1.39, + "learning_rate": 1.1636507496248002e-06, + "loss": 0.6953, + "step": 54339 + }, + { + "epoch": 1.39, + "learning_rate": 1.1636234521519508e-06, + "loss": 0.6816, + "step": 54340 + }, + { + "epoch": 1.39, + "learning_rate": 1.1635961545538227e-06, + "loss": 0.5708, + "step": 54341 + }, + { + "epoch": 1.39, + "learning_rate": 1.1635688568304363e-06, + "loss": 0.6255, + "step": 54342 + }, + { + "epoch": 1.39, + "learning_rate": 1.163541558981813e-06, + "loss": 0.6416, + "step": 54343 + }, + { + "epoch": 1.39, + "learning_rate": 1.1635142610079732e-06, + "loss": 0.6172, + "step": 54344 + }, + { + "epoch": 1.39, + "learning_rate": 1.1634869629089382e-06, + "loss": 0.7007, + "step": 54345 + }, + { + "epoch": 1.39, + "learning_rate": 1.1634596646847287e-06, + "loss": 0.5889, + "step": 54346 + }, + { + "epoch": 1.39, + "learning_rate": 1.163432366335366e-06, + "loss": 0.5129, + "step": 54347 + }, + { + "epoch": 1.39, + "learning_rate": 1.1634050678608705e-06, + "loss": 0.6592, + "step": 54348 + }, + { + "epoch": 1.39, + "learning_rate": 1.1633777692612627e-06, + "loss": 0.4365, + "step": 54349 + }, + { + "epoch": 1.39, + "learning_rate": 1.1633504705365647e-06, + "loss": 0.5776, + "step": 54350 + }, + { + "epoch": 1.39, + "learning_rate": 1.1633231716867964e-06, + "loss": 0.6357, + "step": 54351 + }, + { + "epoch": 1.39, + "learning_rate": 1.1632958727119793e-06, + "loss": 0.7119, + "step": 54352 + }, + { + "epoch": 1.39, + "learning_rate": 1.163268573612134e-06, + "loss": 0.5693, + "step": 54353 + }, + { + "epoch": 1.39, + "learning_rate": 1.1632412743872812e-06, + "loss": 0.5986, + "step": 54354 + }, + { + "epoch": 1.39, + "learning_rate": 1.1632139750374422e-06, + "loss": 0.7207, + "step": 54355 + }, + { + "epoch": 1.39, + "learning_rate": 1.1631866755626378e-06, + "loss": 0.5784, + "step": 54356 + }, + { + "epoch": 1.39, + "learning_rate": 1.163159375962889e-06, + "loss": 0.5615, + "step": 54357 + }, + { + "epoch": 1.39, + "learning_rate": 1.1631320762382166e-06, + "loss": 0.7246, + "step": 54358 + }, + { + "epoch": 1.39, + "learning_rate": 1.1631047763886413e-06, + "loss": 0.4436, + "step": 54359 + }, + { + "epoch": 1.39, + "learning_rate": 1.1630774764141842e-06, + "loss": 0.7334, + "step": 54360 + }, + { + "epoch": 1.39, + "learning_rate": 1.163050176314866e-06, + "loss": 0.6777, + "step": 54361 + }, + { + "epoch": 1.39, + "learning_rate": 1.163022876090708e-06, + "loss": 0.7256, + "step": 54362 + }, + { + "epoch": 1.39, + "learning_rate": 1.162995575741731e-06, + "loss": 0.5957, + "step": 54363 + }, + { + "epoch": 1.39, + "learning_rate": 1.1629682752679554e-06, + "loss": 0.72, + "step": 54364 + }, + { + "epoch": 1.39, + "learning_rate": 1.1629409746694028e-06, + "loss": 0.7451, + "step": 54365 + }, + { + "epoch": 1.39, + "learning_rate": 1.1629136739460937e-06, + "loss": 0.6592, + "step": 54366 + }, + { + "epoch": 1.39, + "learning_rate": 1.1628863730980489e-06, + "loss": 0.5796, + "step": 54367 + }, + { + "epoch": 1.39, + "learning_rate": 1.1628590721252898e-06, + "loss": 0.731, + "step": 54368 + }, + { + "epoch": 1.39, + "learning_rate": 1.1628317710278367e-06, + "loss": 0.6973, + "step": 54369 + }, + { + "epoch": 1.39, + "learning_rate": 1.162804469805711e-06, + "loss": 0.8115, + "step": 54370 + }, + { + "epoch": 1.39, + "learning_rate": 1.1627771684589333e-06, + "loss": 0.5835, + "step": 54371 + }, + { + "epoch": 1.39, + "learning_rate": 1.1627498669875247e-06, + "loss": 0.6587, + "step": 54372 + }, + { + "epoch": 1.39, + "learning_rate": 1.1627225653915062e-06, + "loss": 0.6641, + "step": 54373 + }, + { + "epoch": 1.39, + "learning_rate": 1.1626952636708981e-06, + "loss": 0.4263, + "step": 54374 + }, + { + "epoch": 1.39, + "learning_rate": 1.162667961825722e-06, + "loss": 0.7207, + "step": 54375 + }, + { + "epoch": 1.39, + "learning_rate": 1.1626406598559983e-06, + "loss": 0.7524, + "step": 54376 + }, + { + "epoch": 1.39, + "learning_rate": 1.1626133577617485e-06, + "loss": 0.6104, + "step": 54377 + }, + { + "epoch": 1.39, + "learning_rate": 1.162586055542993e-06, + "loss": 0.6992, + "step": 54378 + }, + { + "epoch": 1.39, + "learning_rate": 1.1625587531997527e-06, + "loss": 0.6777, + "step": 54379 + }, + { + "epoch": 1.39, + "learning_rate": 1.1625314507320485e-06, + "loss": 0.7295, + "step": 54380 + }, + { + "epoch": 1.39, + "learning_rate": 1.1625041481399016e-06, + "loss": 0.7549, + "step": 54381 + }, + { + "epoch": 1.39, + "learning_rate": 1.1624768454233327e-06, + "loss": 0.5996, + "step": 54382 + }, + { + "epoch": 1.39, + "learning_rate": 1.1624495425823631e-06, + "loss": 0.6289, + "step": 54383 + }, + { + "epoch": 1.39, + "learning_rate": 1.1624222396170129e-06, + "loss": 0.6772, + "step": 54384 + }, + { + "epoch": 1.39, + "learning_rate": 1.1623949365273036e-06, + "loss": 0.5981, + "step": 54385 + }, + { + "epoch": 1.39, + "learning_rate": 1.162367633313256e-06, + "loss": 0.6646, + "step": 54386 + }, + { + "epoch": 1.39, + "learning_rate": 1.1623403299748908e-06, + "loss": 0.5308, + "step": 54387 + }, + { + "epoch": 1.39, + "learning_rate": 1.1623130265122293e-06, + "loss": 0.5757, + "step": 54388 + }, + { + "epoch": 1.39, + "learning_rate": 1.162285722925292e-06, + "loss": 0.5415, + "step": 54389 + }, + { + "epoch": 1.39, + "learning_rate": 1.1622584192141002e-06, + "loss": 0.5547, + "step": 54390 + }, + { + "epoch": 1.39, + "learning_rate": 1.1622311153786745e-06, + "loss": 0.7422, + "step": 54391 + }, + { + "epoch": 1.39, + "learning_rate": 1.1622038114190357e-06, + "loss": 0.4966, + "step": 54392 + }, + { + "epoch": 1.39, + "learning_rate": 1.1621765073352053e-06, + "loss": 0.4707, + "step": 54393 + }, + { + "epoch": 1.39, + "learning_rate": 1.1621492031272035e-06, + "loss": 0.7139, + "step": 54394 + }, + { + "epoch": 1.39, + "learning_rate": 1.1621218987950515e-06, + "loss": 0.583, + "step": 54395 + }, + { + "epoch": 1.39, + "learning_rate": 1.1620945943387703e-06, + "loss": 0.4612, + "step": 54396 + }, + { + "epoch": 1.39, + "learning_rate": 1.1620672897583805e-06, + "loss": 0.6309, + "step": 54397 + }, + { + "epoch": 1.39, + "learning_rate": 1.1620399850539038e-06, + "loss": 0.6831, + "step": 54398 + }, + { + "epoch": 1.39, + "learning_rate": 1.16201268022536e-06, + "loss": 0.6251, + "step": 54399 + }, + { + "epoch": 1.39, + "learning_rate": 1.161985375272771e-06, + "loss": 0.4927, + "step": 54400 + }, + { + "epoch": 1.39, + "learning_rate": 1.1619580701961567e-06, + "loss": 0.7178, + "step": 54401 + }, + { + "epoch": 1.39, + "learning_rate": 1.161930764995539e-06, + "loss": 0.8809, + "step": 54402 + }, + { + "epoch": 1.39, + "learning_rate": 1.1619034596709382e-06, + "loss": 0.6523, + "step": 54403 + }, + { + "epoch": 1.39, + "learning_rate": 1.1618761542223753e-06, + "loss": 0.5854, + "step": 54404 + }, + { + "epoch": 1.39, + "learning_rate": 1.1618488486498712e-06, + "loss": 0.6367, + "step": 54405 + }, + { + "epoch": 1.39, + "learning_rate": 1.1618215429534472e-06, + "loss": 0.583, + "step": 54406 + }, + { + "epoch": 1.39, + "learning_rate": 1.1617942371331235e-06, + "loss": 0.5659, + "step": 54407 + }, + { + "epoch": 1.39, + "learning_rate": 1.1617669311889216e-06, + "loss": 0.7109, + "step": 54408 + }, + { + "epoch": 1.39, + "learning_rate": 1.1617396251208622e-06, + "loss": 0.5024, + "step": 54409 + }, + { + "epoch": 1.39, + "learning_rate": 1.1617123189289663e-06, + "loss": 0.625, + "step": 54410 + }, + { + "epoch": 1.39, + "learning_rate": 1.1616850126132545e-06, + "loss": 0.7344, + "step": 54411 + }, + { + "epoch": 1.39, + "learning_rate": 1.161657706173748e-06, + "loss": 0.5684, + "step": 54412 + }, + { + "epoch": 1.39, + "learning_rate": 1.1616303996104677e-06, + "loss": 0.5674, + "step": 54413 + }, + { + "epoch": 1.39, + "learning_rate": 1.1616030929234345e-06, + "loss": 0.6812, + "step": 54414 + }, + { + "epoch": 1.39, + "learning_rate": 1.161575786112669e-06, + "loss": 0.9375, + "step": 54415 + }, + { + "epoch": 1.39, + "learning_rate": 1.1615484791781924e-06, + "loss": 0.6416, + "step": 54416 + }, + { + "epoch": 1.39, + "learning_rate": 1.1615211721200258e-06, + "loss": 0.5459, + "step": 54417 + }, + { + "epoch": 1.39, + "learning_rate": 1.1614938649381896e-06, + "loss": 0.6885, + "step": 54418 + }, + { + "epoch": 1.39, + "learning_rate": 1.1614665576327052e-06, + "loss": 0.5649, + "step": 54419 + }, + { + "epoch": 1.39, + "learning_rate": 1.161439250203593e-06, + "loss": 0.8291, + "step": 54420 + }, + { + "epoch": 1.39, + "learning_rate": 1.1614119426508744e-06, + "loss": 0.7666, + "step": 54421 + }, + { + "epoch": 1.39, + "learning_rate": 1.16138463497457e-06, + "loss": 0.7617, + "step": 54422 + }, + { + "epoch": 1.39, + "learning_rate": 1.161357327174701e-06, + "loss": 0.6021, + "step": 54423 + }, + { + "epoch": 1.39, + "learning_rate": 1.1613300192512877e-06, + "loss": 0.6055, + "step": 54424 + }, + { + "epoch": 1.39, + "learning_rate": 1.1613027112043518e-06, + "loss": 0.6558, + "step": 54425 + }, + { + "epoch": 1.39, + "learning_rate": 1.1612754030339135e-06, + "loss": 0.751, + "step": 54426 + }, + { + "epoch": 1.39, + "learning_rate": 1.1612480947399944e-06, + "loss": 0.7246, + "step": 54427 + }, + { + "epoch": 1.4, + "learning_rate": 1.1612207863226152e-06, + "loss": 0.5942, + "step": 54428 + }, + { + "epoch": 1.4, + "learning_rate": 1.1611934777817963e-06, + "loss": 0.5, + "step": 54429 + }, + { + "epoch": 1.4, + "learning_rate": 1.1611661691175586e-06, + "loss": 0.655, + "step": 54430 + }, + { + "epoch": 1.4, + "learning_rate": 1.1611388603299241e-06, + "loss": 0.5366, + "step": 54431 + }, + { + "epoch": 1.4, + "learning_rate": 1.1611115514189125e-06, + "loss": 0.6719, + "step": 54432 + }, + { + "epoch": 1.4, + "learning_rate": 1.1610842423845455e-06, + "loss": 0.7451, + "step": 54433 + }, + { + "epoch": 1.4, + "learning_rate": 1.1610569332268436e-06, + "loss": 0.6704, + "step": 54434 + }, + { + "epoch": 1.4, + "learning_rate": 1.1610296239458277e-06, + "loss": 0.6533, + "step": 54435 + }, + { + "epoch": 1.4, + "learning_rate": 1.1610023145415189e-06, + "loss": 0.6582, + "step": 54436 + }, + { + "epoch": 1.4, + "learning_rate": 1.1609750050139382e-06, + "loss": 0.4041, + "step": 54437 + }, + { + "epoch": 1.4, + "learning_rate": 1.1609476953631062e-06, + "loss": 0.7642, + "step": 54438 + }, + { + "epoch": 1.4, + "learning_rate": 1.1609203855890438e-06, + "loss": 0.7637, + "step": 54439 + }, + { + "epoch": 1.4, + "learning_rate": 1.1608930756917722e-06, + "loss": 0.6179, + "step": 54440 + }, + { + "epoch": 1.4, + "learning_rate": 1.1608657656713121e-06, + "loss": 0.6738, + "step": 54441 + }, + { + "epoch": 1.4, + "learning_rate": 1.1608384555276844e-06, + "loss": 0.6318, + "step": 54442 + }, + { + "epoch": 1.4, + "learning_rate": 1.1608111452609103e-06, + "loss": 0.7412, + "step": 54443 + }, + { + "epoch": 1.4, + "learning_rate": 1.1607838348710105e-06, + "loss": 0.6201, + "step": 54444 + }, + { + "epoch": 1.4, + "learning_rate": 1.1607565243580057e-06, + "loss": 0.6367, + "step": 54445 + }, + { + "epoch": 1.4, + "learning_rate": 1.1607292137219174e-06, + "loss": 0.5874, + "step": 54446 + }, + { + "epoch": 1.4, + "learning_rate": 1.1607019029627659e-06, + "loss": 0.564, + "step": 54447 + }, + { + "epoch": 1.4, + "learning_rate": 1.1606745920805724e-06, + "loss": 0.6953, + "step": 54448 + }, + { + "epoch": 1.4, + "learning_rate": 1.1606472810753576e-06, + "loss": 0.625, + "step": 54449 + }, + { + "epoch": 1.4, + "learning_rate": 1.1606199699471426e-06, + "loss": 0.7842, + "step": 54450 + }, + { + "epoch": 1.4, + "learning_rate": 1.1605926586959483e-06, + "loss": 0.7822, + "step": 54451 + }, + { + "epoch": 1.4, + "learning_rate": 1.1605653473217956e-06, + "loss": 0.6406, + "step": 54452 + }, + { + "epoch": 1.4, + "learning_rate": 1.1605380358247055e-06, + "loss": 0.6465, + "step": 54453 + }, + { + "epoch": 1.4, + "learning_rate": 1.1605107242046987e-06, + "loss": 0.5845, + "step": 54454 + }, + { + "epoch": 1.4, + "learning_rate": 1.1604834124617961e-06, + "loss": 0.6504, + "step": 54455 + }, + { + "epoch": 1.4, + "learning_rate": 1.160456100596019e-06, + "loss": 0.5469, + "step": 54456 + }, + { + "epoch": 1.4, + "learning_rate": 1.1604287886073878e-06, + "loss": 0.6621, + "step": 54457 + }, + { + "epoch": 1.4, + "learning_rate": 1.1604014764959238e-06, + "loss": 0.4147, + "step": 54458 + }, + { + "epoch": 1.4, + "learning_rate": 1.1603741642616479e-06, + "loss": 0.5884, + "step": 54459 + }, + { + "epoch": 1.4, + "learning_rate": 1.1603468519045805e-06, + "loss": 0.7559, + "step": 54460 + }, + { + "epoch": 1.4, + "learning_rate": 1.1603195394247432e-06, + "loss": 0.5667, + "step": 54461 + }, + { + "epoch": 1.4, + "learning_rate": 1.1602922268221561e-06, + "loss": 0.5925, + "step": 54462 + }, + { + "epoch": 1.4, + "learning_rate": 1.1602649140968414e-06, + "loss": 0.793, + "step": 54463 + }, + { + "epoch": 1.4, + "learning_rate": 1.160237601248819e-06, + "loss": 0.5239, + "step": 54464 + }, + { + "epoch": 1.4, + "learning_rate": 1.1602102882781097e-06, + "loss": 0.7363, + "step": 54465 + }, + { + "epoch": 1.4, + "learning_rate": 1.1601829751847348e-06, + "loss": 0.666, + "step": 54466 + }, + { + "epoch": 1.4, + "learning_rate": 1.1601556619687155e-06, + "loss": 0.5366, + "step": 54467 + }, + { + "epoch": 1.4, + "learning_rate": 1.160128348630072e-06, + "loss": 0.7007, + "step": 54468 + }, + { + "epoch": 1.4, + "learning_rate": 1.160101035168826e-06, + "loss": 0.5095, + "step": 54469 + }, + { + "epoch": 1.4, + "learning_rate": 1.1600737215849974e-06, + "loss": 0.6533, + "step": 54470 + }, + { + "epoch": 1.4, + "learning_rate": 1.160046407878608e-06, + "loss": 0.7471, + "step": 54471 + }, + { + "epoch": 1.4, + "learning_rate": 1.1600190940496784e-06, + "loss": 0.4827, + "step": 54472 + }, + { + "epoch": 1.4, + "learning_rate": 1.15999178009823e-06, + "loss": 0.6709, + "step": 54473 + }, + { + "epoch": 1.4, + "learning_rate": 1.1599644660242827e-06, + "loss": 0.6914, + "step": 54474 + }, + { + "epoch": 1.4, + "learning_rate": 1.1599371518278583e-06, + "loss": 0.7227, + "step": 54475 + }, + { + "epoch": 1.4, + "learning_rate": 1.159909837508977e-06, + "loss": 0.5742, + "step": 54476 + }, + { + "epoch": 1.4, + "learning_rate": 1.1598825230676603e-06, + "loss": 0.6851, + "step": 54477 + }, + { + "epoch": 1.4, + "learning_rate": 1.159855208503929e-06, + "loss": 0.5938, + "step": 54478 + }, + { + "epoch": 1.4, + "learning_rate": 1.1598278938178037e-06, + "loss": 0.547, + "step": 54479 + }, + { + "epoch": 1.4, + "learning_rate": 1.1598005790093055e-06, + "loss": 0.7256, + "step": 54480 + }, + { + "epoch": 1.4, + "learning_rate": 1.1597732640784555e-06, + "loss": 0.5303, + "step": 54481 + }, + { + "epoch": 1.4, + "learning_rate": 1.1597459490252746e-06, + "loss": 0.6855, + "step": 54482 + }, + { + "epoch": 1.4, + "learning_rate": 1.1597186338497833e-06, + "loss": 0.7754, + "step": 54483 + }, + { + "epoch": 1.4, + "learning_rate": 1.159691318552003e-06, + "loss": 0.5132, + "step": 54484 + }, + { + "epoch": 1.4, + "learning_rate": 1.1596640031319542e-06, + "loss": 0.6338, + "step": 54485 + }, + { + "epoch": 1.4, + "learning_rate": 1.1596366875896583e-06, + "loss": 0.6025, + "step": 54486 + }, + { + "epoch": 1.4, + "learning_rate": 1.1596093719251354e-06, + "loss": 0.8008, + "step": 54487 + }, + { + "epoch": 1.4, + "learning_rate": 1.1595820561384075e-06, + "loss": 0.748, + "step": 54488 + }, + { + "epoch": 1.4, + "learning_rate": 1.1595547402294947e-06, + "loss": 0.7051, + "step": 54489 + }, + { + "epoch": 1.4, + "learning_rate": 1.1595274241984183e-06, + "loss": 0.7793, + "step": 54490 + }, + { + "epoch": 1.4, + "learning_rate": 1.159500108045199e-06, + "loss": 0.5654, + "step": 54491 + }, + { + "epoch": 1.4, + "learning_rate": 1.1594727917698576e-06, + "loss": 0.668, + "step": 54492 + }, + { + "epoch": 1.4, + "learning_rate": 1.1594454753724156e-06, + "loss": 0.6543, + "step": 54493 + }, + { + "epoch": 1.4, + "learning_rate": 1.1594181588528934e-06, + "loss": 0.6641, + "step": 54494 + }, + { + "epoch": 1.4, + "learning_rate": 1.159390842211312e-06, + "loss": 0.5938, + "step": 54495 + }, + { + "epoch": 1.4, + "learning_rate": 1.1593635254476923e-06, + "loss": 0.5151, + "step": 54496 + }, + { + "epoch": 1.4, + "learning_rate": 1.1593362085620552e-06, + "loss": 0.7412, + "step": 54497 + }, + { + "epoch": 1.4, + "learning_rate": 1.159308891554422e-06, + "loss": 0.699, + "step": 54498 + }, + { + "epoch": 1.4, + "learning_rate": 1.1592815744248132e-06, + "loss": 0.6362, + "step": 54499 + }, + { + "epoch": 1.4, + "learning_rate": 1.1592542571732498e-06, + "loss": 0.7002, + "step": 54500 + }, + { + "epoch": 1.4, + "learning_rate": 1.1592269397997525e-06, + "loss": 0.6699, + "step": 54501 + }, + { + "epoch": 1.4, + "learning_rate": 1.1591996223043427e-06, + "loss": 0.6602, + "step": 54502 + }, + { + "epoch": 1.4, + "learning_rate": 1.159172304687041e-06, + "loss": 0.7725, + "step": 54503 + }, + { + "epoch": 1.4, + "learning_rate": 1.1591449869478684e-06, + "loss": 0.5747, + "step": 54504 + }, + { + "epoch": 1.4, + "learning_rate": 1.1591176690868457e-06, + "loss": 0.5411, + "step": 54505 + }, + { + "epoch": 1.4, + "learning_rate": 1.159090351103994e-06, + "loss": 0.5371, + "step": 54506 + }, + { + "epoch": 1.4, + "learning_rate": 1.1590630329993343e-06, + "loss": 0.7031, + "step": 54507 + }, + { + "epoch": 1.4, + "learning_rate": 1.1590357147728873e-06, + "loss": 0.8174, + "step": 54508 + }, + { + "epoch": 1.4, + "learning_rate": 1.159008396424674e-06, + "loss": 0.6157, + "step": 54509 + }, + { + "epoch": 1.4, + "learning_rate": 1.1589810779547149e-06, + "loss": 0.7134, + "step": 54510 + }, + { + "epoch": 1.4, + "learning_rate": 1.1589537593630317e-06, + "loss": 0.6504, + "step": 54511 + }, + { + "epoch": 1.4, + "learning_rate": 1.1589264406496446e-06, + "loss": 0.5708, + "step": 54512 + }, + { + "epoch": 1.4, + "learning_rate": 1.1588991218145752e-06, + "loss": 0.5818, + "step": 54513 + }, + { + "epoch": 1.4, + "learning_rate": 1.1588718028578437e-06, + "loss": 0.7017, + "step": 54514 + }, + { + "epoch": 1.4, + "learning_rate": 1.1588444837794716e-06, + "loss": 0.7218, + "step": 54515 + }, + { + "epoch": 1.4, + "learning_rate": 1.1588171645794794e-06, + "loss": 0.7314, + "step": 54516 + }, + { + "epoch": 1.4, + "learning_rate": 1.1587898452578886e-06, + "loss": 0.5693, + "step": 54517 + }, + { + "epoch": 1.4, + "learning_rate": 1.1587625258147192e-06, + "loss": 0.54, + "step": 54518 + }, + { + "epoch": 1.4, + "learning_rate": 1.158735206249993e-06, + "loss": 0.5806, + "step": 54519 + }, + { + "epoch": 1.4, + "learning_rate": 1.1587078865637301e-06, + "loss": 0.5645, + "step": 54520 + }, + { + "epoch": 1.4, + "learning_rate": 1.1586805667559522e-06, + "loss": 0.7188, + "step": 54521 + }, + { + "epoch": 1.4, + "learning_rate": 1.15865324682668e-06, + "loss": 0.6738, + "step": 54522 + }, + { + "epoch": 1.4, + "learning_rate": 1.1586259267759339e-06, + "loss": 0.6904, + "step": 54523 + }, + { + "epoch": 1.4, + "learning_rate": 1.1585986066037357e-06, + "loss": 0.5469, + "step": 54524 + }, + { + "epoch": 1.4, + "learning_rate": 1.1585712863101054e-06, + "loss": 1.1729, + "step": 54525 + }, + { + "epoch": 1.4, + "learning_rate": 1.1585439658950647e-06, + "loss": 0.5781, + "step": 54526 + }, + { + "epoch": 1.4, + "learning_rate": 1.158516645358634e-06, + "loss": 0.6392, + "step": 54527 + }, + { + "epoch": 1.4, + "learning_rate": 1.1584893247008347e-06, + "loss": 0.54, + "step": 54528 + }, + { + "epoch": 1.4, + "learning_rate": 1.158462003921687e-06, + "loss": 0.7461, + "step": 54529 + }, + { + "epoch": 1.4, + "learning_rate": 1.1584346830212124e-06, + "loss": 0.7354, + "step": 54530 + }, + { + "epoch": 1.4, + "learning_rate": 1.1584073619994314e-06, + "loss": 0.5825, + "step": 54531 + }, + { + "epoch": 1.4, + "learning_rate": 1.1583800408563658e-06, + "loss": 0.5679, + "step": 54532 + }, + { + "epoch": 1.4, + "learning_rate": 1.1583527195920353e-06, + "loss": 0.7012, + "step": 54533 + }, + { + "epoch": 1.4, + "learning_rate": 1.1583253982064615e-06, + "loss": 0.7305, + "step": 54534 + }, + { + "epoch": 1.4, + "learning_rate": 1.1582980766996653e-06, + "loss": 0.791, + "step": 54535 + }, + { + "epoch": 1.4, + "learning_rate": 1.1582707550716678e-06, + "loss": 0.5657, + "step": 54536 + }, + { + "epoch": 1.4, + "learning_rate": 1.1582434333224893e-06, + "loss": 0.5525, + "step": 54537 + }, + { + "epoch": 1.4, + "learning_rate": 1.1582161114521514e-06, + "loss": 0.79, + "step": 54538 + }, + { + "epoch": 1.4, + "learning_rate": 1.1581887894606744e-06, + "loss": 0.668, + "step": 54539 + }, + { + "epoch": 1.4, + "learning_rate": 1.1581614673480796e-06, + "loss": 0.6338, + "step": 54540 + }, + { + "epoch": 1.4, + "learning_rate": 1.1581341451143876e-06, + "loss": 0.6323, + "step": 54541 + }, + { + "epoch": 1.4, + "learning_rate": 1.15810682275962e-06, + "loss": 0.6565, + "step": 54542 + }, + { + "epoch": 1.4, + "learning_rate": 1.158079500283797e-06, + "loss": 0.5239, + "step": 54543 + }, + { + "epoch": 1.4, + "learning_rate": 1.1580521776869402e-06, + "loss": 0.5439, + "step": 54544 + }, + { + "epoch": 1.4, + "learning_rate": 1.1580248549690693e-06, + "loss": 0.6436, + "step": 54545 + }, + { + "epoch": 1.4, + "learning_rate": 1.1579975321302067e-06, + "loss": 0.5444, + "step": 54546 + }, + { + "epoch": 1.4, + "learning_rate": 1.1579702091703726e-06, + "loss": 0.6077, + "step": 54547 + }, + { + "epoch": 1.4, + "learning_rate": 1.1579428860895876e-06, + "loss": 0.7236, + "step": 54548 + }, + { + "epoch": 1.4, + "learning_rate": 1.1579155628878734e-06, + "loss": 0.7227, + "step": 54549 + }, + { + "epoch": 1.4, + "learning_rate": 1.1578882395652503e-06, + "loss": 0.7017, + "step": 54550 + }, + { + "epoch": 1.4, + "learning_rate": 1.1578609161217394e-06, + "loss": 0.5986, + "step": 54551 + }, + { + "epoch": 1.4, + "learning_rate": 1.157833592557362e-06, + "loss": 0.7031, + "step": 54552 + }, + { + "epoch": 1.4, + "learning_rate": 1.1578062688721384e-06, + "loss": 0.7256, + "step": 54553 + }, + { + "epoch": 1.4, + "learning_rate": 1.1577789450660897e-06, + "loss": 0.6353, + "step": 54554 + }, + { + "epoch": 1.4, + "learning_rate": 1.157751621139237e-06, + "loss": 0.6338, + "step": 54555 + }, + { + "epoch": 1.4, + "learning_rate": 1.157724297091601e-06, + "loss": 0.5566, + "step": 54556 + }, + { + "epoch": 1.4, + "learning_rate": 1.1576969729232034e-06, + "loss": 0.6646, + "step": 54557 + }, + { + "epoch": 1.4, + "learning_rate": 1.1576696486340638e-06, + "loss": 0.7197, + "step": 54558 + }, + { + "epoch": 1.4, + "learning_rate": 1.157642324224204e-06, + "loss": 0.5008, + "step": 54559 + }, + { + "epoch": 1.4, + "learning_rate": 1.1576149996936446e-06, + "loss": 0.7607, + "step": 54560 + }, + { + "epoch": 1.4, + "learning_rate": 1.157587675042407e-06, + "loss": 0.6562, + "step": 54561 + }, + { + "epoch": 1.4, + "learning_rate": 1.1575603502705115e-06, + "loss": 0.5532, + "step": 54562 + }, + { + "epoch": 1.4, + "learning_rate": 1.1575330253779793e-06, + "loss": 0.5884, + "step": 54563 + }, + { + "epoch": 1.4, + "learning_rate": 1.1575057003648313e-06, + "loss": 0.9023, + "step": 54564 + }, + { + "epoch": 1.4, + "learning_rate": 1.1574783752310885e-06, + "loss": 0.625, + "step": 54565 + }, + { + "epoch": 1.4, + "learning_rate": 1.1574510499767716e-06, + "loss": 0.8223, + "step": 54566 + }, + { + "epoch": 1.4, + "learning_rate": 1.1574237246019018e-06, + "loss": 0.6006, + "step": 54567 + }, + { + "epoch": 1.4, + "learning_rate": 1.1573963991065e-06, + "loss": 0.6611, + "step": 54568 + }, + { + "epoch": 1.4, + "learning_rate": 1.1573690734905867e-06, + "loss": 0.7988, + "step": 54569 + }, + { + "epoch": 1.4, + "learning_rate": 1.1573417477541834e-06, + "loss": 0.6069, + "step": 54570 + }, + { + "epoch": 1.4, + "learning_rate": 1.1573144218973105e-06, + "loss": 0.5728, + "step": 54571 + }, + { + "epoch": 1.4, + "learning_rate": 1.1572870959199896e-06, + "loss": 0.6357, + "step": 54572 + }, + { + "epoch": 1.4, + "learning_rate": 1.157259769822241e-06, + "loss": 0.7344, + "step": 54573 + }, + { + "epoch": 1.4, + "learning_rate": 1.1572324436040859e-06, + "loss": 0.6367, + "step": 54574 + }, + { + "epoch": 1.4, + "learning_rate": 1.1572051172655448e-06, + "loss": 0.4639, + "step": 54575 + }, + { + "epoch": 1.4, + "learning_rate": 1.1571777908066394e-06, + "loss": 0.438, + "step": 54576 + }, + { + "epoch": 1.4, + "learning_rate": 1.15715046422739e-06, + "loss": 0.7754, + "step": 54577 + }, + { + "epoch": 1.4, + "learning_rate": 1.1571231375278176e-06, + "loss": 0.834, + "step": 54578 + }, + { + "epoch": 1.4, + "learning_rate": 1.1570958107079433e-06, + "loss": 0.5767, + "step": 54579 + }, + { + "epoch": 1.4, + "learning_rate": 1.1570684837677882e-06, + "loss": 0.7617, + "step": 54580 + }, + { + "epoch": 1.4, + "learning_rate": 1.1570411567073726e-06, + "loss": 0.5691, + "step": 54581 + }, + { + "epoch": 1.4, + "learning_rate": 1.1570138295267183e-06, + "loss": 0.5762, + "step": 54582 + }, + { + "epoch": 1.4, + "learning_rate": 1.156986502225845e-06, + "loss": 0.645, + "step": 54583 + }, + { + "epoch": 1.4, + "learning_rate": 1.1569591748047751e-06, + "loss": 0.7432, + "step": 54584 + }, + { + "epoch": 1.4, + "learning_rate": 1.1569318472635284e-06, + "loss": 0.7197, + "step": 54585 + }, + { + "epoch": 1.4, + "learning_rate": 1.1569045196021264e-06, + "loss": 0.8115, + "step": 54586 + }, + { + "epoch": 1.4, + "learning_rate": 1.1568771918205897e-06, + "loss": 0.5576, + "step": 54587 + }, + { + "epoch": 1.4, + "learning_rate": 1.1568498639189393e-06, + "loss": 0.7197, + "step": 54588 + }, + { + "epoch": 1.4, + "learning_rate": 1.1568225358971961e-06, + "loss": 0.7227, + "step": 54589 + }, + { + "epoch": 1.4, + "learning_rate": 1.1567952077553814e-06, + "loss": 0.6621, + "step": 54590 + }, + { + "epoch": 1.4, + "learning_rate": 1.1567678794935154e-06, + "loss": 0.5806, + "step": 54591 + }, + { + "epoch": 1.4, + "learning_rate": 1.1567405511116198e-06, + "loss": 0.6914, + "step": 54592 + }, + { + "epoch": 1.4, + "learning_rate": 1.1567132226097148e-06, + "loss": 0.5903, + "step": 54593 + }, + { + "epoch": 1.4, + "learning_rate": 1.156685893987822e-06, + "loss": 0.6992, + "step": 54594 + }, + { + "epoch": 1.4, + "learning_rate": 1.1566585652459619e-06, + "loss": 0.6875, + "step": 54595 + }, + { + "epoch": 1.4, + "learning_rate": 1.1566312363841556e-06, + "loss": 0.7158, + "step": 54596 + }, + { + "epoch": 1.4, + "learning_rate": 1.156603907402424e-06, + "loss": 0.6768, + "step": 54597 + }, + { + "epoch": 1.4, + "learning_rate": 1.156576578300788e-06, + "loss": 0.7393, + "step": 54598 + }, + { + "epoch": 1.4, + "learning_rate": 1.1565492490792686e-06, + "loss": 0.7979, + "step": 54599 + }, + { + "epoch": 1.4, + "learning_rate": 1.1565219197378862e-06, + "loss": 0.5815, + "step": 54600 + }, + { + "epoch": 1.4, + "learning_rate": 1.1564945902766625e-06, + "loss": 0.6851, + "step": 54601 + }, + { + "epoch": 1.4, + "learning_rate": 1.156467260695618e-06, + "loss": 0.5771, + "step": 54602 + }, + { + "epoch": 1.4, + "learning_rate": 1.156439930994774e-06, + "loss": 0.6592, + "step": 54603 + }, + { + "epoch": 1.4, + "learning_rate": 1.1564126011741505e-06, + "loss": 0.7773, + "step": 54604 + }, + { + "epoch": 1.4, + "learning_rate": 1.1563852712337698e-06, + "loss": 0.5796, + "step": 54605 + }, + { + "epoch": 1.4, + "learning_rate": 1.1563579411736516e-06, + "loss": 0.4402, + "step": 54606 + }, + { + "epoch": 1.4, + "learning_rate": 1.1563306109938177e-06, + "loss": 0.5747, + "step": 54607 + }, + { + "epoch": 1.4, + "learning_rate": 1.1563032806942882e-06, + "loss": 0.6543, + "step": 54608 + }, + { + "epoch": 1.4, + "learning_rate": 1.1562759502750848e-06, + "loss": 0.499, + "step": 54609 + }, + { + "epoch": 1.4, + "learning_rate": 1.1562486197362278e-06, + "loss": 0.6982, + "step": 54610 + }, + { + "epoch": 1.4, + "learning_rate": 1.1562212890777384e-06, + "loss": 0.6021, + "step": 54611 + }, + { + "epoch": 1.4, + "learning_rate": 1.156193958299638e-06, + "loss": 0.6733, + "step": 54612 + }, + { + "epoch": 1.4, + "learning_rate": 1.1561666274019466e-06, + "loss": 0.6528, + "step": 54613 + }, + { + "epoch": 1.4, + "learning_rate": 1.1561392963846858e-06, + "loss": 0.5588, + "step": 54614 + }, + { + "epoch": 1.4, + "learning_rate": 1.156111965247876e-06, + "loss": 0.5718, + "step": 54615 + }, + { + "epoch": 1.4, + "learning_rate": 1.1560846339915392e-06, + "loss": 0.5012, + "step": 54616 + }, + { + "epoch": 1.4, + "learning_rate": 1.156057302615695e-06, + "loss": 0.7051, + "step": 54617 + }, + { + "epoch": 1.4, + "learning_rate": 1.156029971120365e-06, + "loss": 0.6265, + "step": 54618 + }, + { + "epoch": 1.4, + "learning_rate": 1.15600263950557e-06, + "loss": 0.6143, + "step": 54619 + }, + { + "epoch": 1.4, + "learning_rate": 1.155975307771331e-06, + "loss": 0.9043, + "step": 54620 + }, + { + "epoch": 1.4, + "learning_rate": 1.1559479759176686e-06, + "loss": 0.877, + "step": 54621 + }, + { + "epoch": 1.4, + "learning_rate": 1.1559206439446048e-06, + "loss": 0.75, + "step": 54622 + }, + { + "epoch": 1.4, + "learning_rate": 1.155893311852159e-06, + "loss": 0.7178, + "step": 54623 + }, + { + "epoch": 1.4, + "learning_rate": 1.155865979640353e-06, + "loss": 0.7236, + "step": 54624 + }, + { + "epoch": 1.4, + "learning_rate": 1.1558386473092076e-06, + "loss": 0.6377, + "step": 54625 + }, + { + "epoch": 1.4, + "learning_rate": 1.1558113148587438e-06, + "loss": 0.4927, + "step": 54626 + }, + { + "epoch": 1.4, + "learning_rate": 1.1557839822889826e-06, + "loss": 0.6748, + "step": 54627 + }, + { + "epoch": 1.4, + "learning_rate": 1.1557566495999445e-06, + "loss": 0.7021, + "step": 54628 + }, + { + "epoch": 1.4, + "learning_rate": 1.1557293167916506e-06, + "loss": 0.7422, + "step": 54629 + }, + { + "epoch": 1.4, + "learning_rate": 1.1557019838641222e-06, + "loss": 0.7227, + "step": 54630 + }, + { + "epoch": 1.4, + "learning_rate": 1.1556746508173798e-06, + "loss": 0.5632, + "step": 54631 + }, + { + "epoch": 1.4, + "learning_rate": 1.1556473176514446e-06, + "loss": 0.521, + "step": 54632 + }, + { + "epoch": 1.4, + "learning_rate": 1.1556199843663372e-06, + "loss": 0.7148, + "step": 54633 + }, + { + "epoch": 1.4, + "learning_rate": 1.155592650962079e-06, + "loss": 0.6914, + "step": 54634 + }, + { + "epoch": 1.4, + "learning_rate": 1.1555653174386903e-06, + "loss": 0.7637, + "step": 54635 + }, + { + "epoch": 1.4, + "learning_rate": 1.1555379837961928e-06, + "loss": 0.7109, + "step": 54636 + }, + { + "epoch": 1.4, + "learning_rate": 1.1555106500346069e-06, + "loss": 0.5127, + "step": 54637 + }, + { + "epoch": 1.4, + "learning_rate": 1.1554833161539534e-06, + "loss": 0.6914, + "step": 54638 + }, + { + "epoch": 1.4, + "learning_rate": 1.1554559821542538e-06, + "loss": 0.6709, + "step": 54639 + }, + { + "epoch": 1.4, + "learning_rate": 1.1554286480355285e-06, + "loss": 0.6777, + "step": 54640 + }, + { + "epoch": 1.4, + "learning_rate": 1.1554013137977985e-06, + "loss": 0.5352, + "step": 54641 + }, + { + "epoch": 1.4, + "learning_rate": 1.1553739794410851e-06, + "loss": 0.6812, + "step": 54642 + }, + { + "epoch": 1.4, + "learning_rate": 1.155346644965409e-06, + "loss": 0.6426, + "step": 54643 + }, + { + "epoch": 1.4, + "learning_rate": 1.155319310370791e-06, + "loss": 0.6572, + "step": 54644 + }, + { + "epoch": 1.4, + "learning_rate": 1.1552919756572522e-06, + "loss": 0.5776, + "step": 54645 + }, + { + "epoch": 1.4, + "learning_rate": 1.1552646408248134e-06, + "loss": 0.5441, + "step": 54646 + }, + { + "epoch": 1.4, + "learning_rate": 1.1552373058734958e-06, + "loss": 0.5737, + "step": 54647 + }, + { + "epoch": 1.4, + "learning_rate": 1.15520997080332e-06, + "loss": 0.7715, + "step": 54648 + }, + { + "epoch": 1.4, + "learning_rate": 1.155182635614307e-06, + "loss": 0.689, + "step": 54649 + }, + { + "epoch": 1.4, + "learning_rate": 1.1551553003064777e-06, + "loss": 0.6836, + "step": 54650 + }, + { + "epoch": 1.4, + "learning_rate": 1.1551279648798535e-06, + "loss": 0.5947, + "step": 54651 + }, + { + "epoch": 1.4, + "learning_rate": 1.1551006293344548e-06, + "loss": 0.4717, + "step": 54652 + }, + { + "epoch": 1.4, + "learning_rate": 1.1550732936703027e-06, + "loss": 0.4756, + "step": 54653 + }, + { + "epoch": 1.4, + "learning_rate": 1.1550459578874177e-06, + "loss": 0.6338, + "step": 54654 + }, + { + "epoch": 1.4, + "learning_rate": 1.1550186219858215e-06, + "loss": 0.6328, + "step": 54655 + }, + { + "epoch": 1.4, + "learning_rate": 1.1549912859655345e-06, + "loss": 0.5396, + "step": 54656 + }, + { + "epoch": 1.4, + "learning_rate": 1.154963949826578e-06, + "loss": 0.562, + "step": 54657 + }, + { + "epoch": 1.4, + "learning_rate": 1.1549366135689729e-06, + "loss": 0.8027, + "step": 54658 + }, + { + "epoch": 1.4, + "learning_rate": 1.1549092771927394e-06, + "loss": 0.7061, + "step": 54659 + }, + { + "epoch": 1.4, + "learning_rate": 1.1548819406978993e-06, + "loss": 0.833, + "step": 54660 + }, + { + "epoch": 1.4, + "learning_rate": 1.1548546040844733e-06, + "loss": 0.5366, + "step": 54661 + }, + { + "epoch": 1.4, + "learning_rate": 1.1548272673524824e-06, + "loss": 0.8701, + "step": 54662 + }, + { + "epoch": 1.4, + "learning_rate": 1.154799930501947e-06, + "loss": 0.6147, + "step": 54663 + }, + { + "epoch": 1.4, + "learning_rate": 1.1547725935328887e-06, + "loss": 0.709, + "step": 54664 + }, + { + "epoch": 1.4, + "learning_rate": 1.1547452564453278e-06, + "loss": 0.5566, + "step": 54665 + }, + { + "epoch": 1.4, + "learning_rate": 1.1547179192392858e-06, + "loss": 0.6227, + "step": 54666 + }, + { + "epoch": 1.4, + "learning_rate": 1.1546905819147835e-06, + "loss": 0.4922, + "step": 54667 + }, + { + "epoch": 1.4, + "learning_rate": 1.1546632444718416e-06, + "loss": 0.6274, + "step": 54668 + }, + { + "epoch": 1.4, + "learning_rate": 1.1546359069104812e-06, + "loss": 0.7578, + "step": 54669 + }, + { + "epoch": 1.4, + "learning_rate": 1.154608569230723e-06, + "loss": 0.7656, + "step": 54670 + }, + { + "epoch": 1.4, + "learning_rate": 1.1545812314325883e-06, + "loss": 0.6289, + "step": 54671 + }, + { + "epoch": 1.4, + "learning_rate": 1.154553893516098e-06, + "loss": 0.5332, + "step": 54672 + }, + { + "epoch": 1.4, + "learning_rate": 1.1545265554812727e-06, + "loss": 0.7134, + "step": 54673 + }, + { + "epoch": 1.4, + "learning_rate": 1.1544992173281335e-06, + "loss": 0.5081, + "step": 54674 + }, + { + "epoch": 1.4, + "learning_rate": 1.1544718790567013e-06, + "loss": 0.4851, + "step": 54675 + }, + { + "epoch": 1.4, + "learning_rate": 1.1544445406669973e-06, + "loss": 0.7705, + "step": 54676 + }, + { + "epoch": 1.4, + "learning_rate": 1.1544172021590423e-06, + "loss": 0.623, + "step": 54677 + }, + { + "epoch": 1.4, + "learning_rate": 1.1543898635328569e-06, + "loss": 0.4204, + "step": 54678 + }, + { + "epoch": 1.4, + "learning_rate": 1.1543625247884622e-06, + "loss": 0.7178, + "step": 54679 + }, + { + "epoch": 1.4, + "learning_rate": 1.1543351859258796e-06, + "loss": 0.6167, + "step": 54680 + }, + { + "epoch": 1.4, + "learning_rate": 1.1543078469451293e-06, + "loss": 0.5337, + "step": 54681 + }, + { + "epoch": 1.4, + "learning_rate": 1.1542805078462327e-06, + "loss": 0.7119, + "step": 54682 + }, + { + "epoch": 1.4, + "learning_rate": 1.1542531686292106e-06, + "loss": 0.5403, + "step": 54683 + }, + { + "epoch": 1.4, + "learning_rate": 1.1542258292940838e-06, + "loss": 0.7314, + "step": 54684 + }, + { + "epoch": 1.4, + "learning_rate": 1.1541984898408736e-06, + "loss": 0.5241, + "step": 54685 + }, + { + "epoch": 1.4, + "learning_rate": 1.1541711502696005e-06, + "loss": 0.7461, + "step": 54686 + }, + { + "epoch": 1.4, + "learning_rate": 1.1541438105802862e-06, + "loss": 0.5996, + "step": 54687 + }, + { + "epoch": 1.4, + "learning_rate": 1.1541164707729505e-06, + "loss": 0.8984, + "step": 54688 + }, + { + "epoch": 1.4, + "learning_rate": 1.1540891308476151e-06, + "loss": 0.4963, + "step": 54689 + }, + { + "epoch": 1.4, + "learning_rate": 1.1540617908043005e-06, + "loss": 0.4175, + "step": 54690 + }, + { + "epoch": 1.4, + "learning_rate": 1.1540344506430281e-06, + "loss": 0.6484, + "step": 54691 + }, + { + "epoch": 1.4, + "learning_rate": 1.1540071103638187e-06, + "loss": 0.5913, + "step": 54692 + }, + { + "epoch": 1.4, + "learning_rate": 1.153979769966693e-06, + "loss": 0.8516, + "step": 54693 + }, + { + "epoch": 1.4, + "learning_rate": 1.1539524294516719e-06, + "loss": 0.5054, + "step": 54694 + }, + { + "epoch": 1.4, + "learning_rate": 1.1539250888187768e-06, + "loss": 1.1191, + "step": 54695 + }, + { + "epoch": 1.4, + "learning_rate": 1.1538977480680281e-06, + "loss": 0.6538, + "step": 54696 + }, + { + "epoch": 1.4, + "learning_rate": 1.1538704071994472e-06, + "loss": 0.5625, + "step": 54697 + }, + { + "epoch": 1.4, + "learning_rate": 1.1538430662130544e-06, + "loss": 0.875, + "step": 54698 + }, + { + "epoch": 1.4, + "learning_rate": 1.1538157251088715e-06, + "loss": 0.5718, + "step": 54699 + }, + { + "epoch": 1.4, + "learning_rate": 1.1537883838869186e-06, + "loss": 0.8564, + "step": 54700 + }, + { + "epoch": 1.4, + "learning_rate": 1.1537610425472174e-06, + "loss": 0.6113, + "step": 54701 + }, + { + "epoch": 1.4, + "learning_rate": 1.1537337010897883e-06, + "loss": 0.6509, + "step": 54702 + }, + { + "epoch": 1.4, + "learning_rate": 1.153706359514652e-06, + "loss": 0.4712, + "step": 54703 + }, + { + "epoch": 1.4, + "learning_rate": 1.1536790178218304e-06, + "loss": 0.4368, + "step": 54704 + }, + { + "epoch": 1.4, + "learning_rate": 1.1536516760113434e-06, + "loss": 0.709, + "step": 54705 + }, + { + "epoch": 1.4, + "learning_rate": 1.1536243340832125e-06, + "loss": 0.5908, + "step": 54706 + }, + { + "epoch": 1.4, + "learning_rate": 1.1535969920374587e-06, + "loss": 0.668, + "step": 54707 + }, + { + "epoch": 1.4, + "learning_rate": 1.1535696498741026e-06, + "loss": 0.5947, + "step": 54708 + }, + { + "epoch": 1.4, + "learning_rate": 1.1535423075931652e-06, + "loss": 0.7131, + "step": 54709 + }, + { + "epoch": 1.4, + "learning_rate": 1.1535149651946677e-06, + "loss": 0.6079, + "step": 54710 + }, + { + "epoch": 1.4, + "learning_rate": 1.1534876226786306e-06, + "loss": 0.6465, + "step": 54711 + }, + { + "epoch": 1.4, + "learning_rate": 1.1534602800450755e-06, + "loss": 0.5239, + "step": 54712 + }, + { + "epoch": 1.4, + "learning_rate": 1.1534329372940223e-06, + "loss": 0.6885, + "step": 54713 + }, + { + "epoch": 1.4, + "learning_rate": 1.153405594425493e-06, + "loss": 0.6143, + "step": 54714 + }, + { + "epoch": 1.4, + "learning_rate": 1.1533782514395079e-06, + "loss": 0.9043, + "step": 54715 + }, + { + "epoch": 1.4, + "learning_rate": 1.1533509083360881e-06, + "loss": 0.627, + "step": 54716 + }, + { + "epoch": 1.4, + "learning_rate": 1.1533235651152548e-06, + "loss": 0.5859, + "step": 54717 + }, + { + "epoch": 1.4, + "learning_rate": 1.1532962217770288e-06, + "loss": 0.3745, + "step": 54718 + }, + { + "epoch": 1.4, + "learning_rate": 1.1532688783214304e-06, + "loss": 0.8076, + "step": 54719 + }, + { + "epoch": 1.4, + "learning_rate": 1.1532415347484814e-06, + "loss": 0.8926, + "step": 54720 + }, + { + "epoch": 1.4, + "learning_rate": 1.1532141910582023e-06, + "loss": 0.54, + "step": 54721 + }, + { + "epoch": 1.4, + "learning_rate": 1.1531868472506142e-06, + "loss": 0.6606, + "step": 54722 + }, + { + "epoch": 1.4, + "learning_rate": 1.1531595033257381e-06, + "loss": 0.4712, + "step": 54723 + }, + { + "epoch": 1.4, + "learning_rate": 1.1531321592835948e-06, + "loss": 0.491, + "step": 54724 + }, + { + "epoch": 1.4, + "learning_rate": 1.153104815124205e-06, + "loss": 0.603, + "step": 54725 + }, + { + "epoch": 1.4, + "learning_rate": 1.1530774708475901e-06, + "loss": 0.792, + "step": 54726 + }, + { + "epoch": 1.4, + "learning_rate": 1.153050126453771e-06, + "loss": 0.6255, + "step": 54727 + }, + { + "epoch": 1.4, + "learning_rate": 1.1530227819427677e-06, + "loss": 0.4858, + "step": 54728 + }, + { + "epoch": 1.4, + "learning_rate": 1.1529954373146027e-06, + "loss": 0.6299, + "step": 54729 + }, + { + "epoch": 1.4, + "learning_rate": 1.1529680925692956e-06, + "loss": 0.6641, + "step": 54730 + }, + { + "epoch": 1.4, + "learning_rate": 1.1529407477068682e-06, + "loss": 0.5713, + "step": 54731 + }, + { + "epoch": 1.4, + "learning_rate": 1.152913402727341e-06, + "loss": 0.498, + "step": 54732 + }, + { + "epoch": 1.4, + "learning_rate": 1.1528860576307352e-06, + "loss": 0.7744, + "step": 54733 + }, + { + "epoch": 1.4, + "learning_rate": 1.1528587124170711e-06, + "loss": 0.6963, + "step": 54734 + }, + { + "epoch": 1.4, + "learning_rate": 1.1528313670863704e-06, + "loss": 0.792, + "step": 54735 + }, + { + "epoch": 1.4, + "learning_rate": 1.1528040216386536e-06, + "loss": 0.6274, + "step": 54736 + }, + { + "epoch": 1.4, + "learning_rate": 1.1527766760739423e-06, + "loss": 0.5718, + "step": 54737 + }, + { + "epoch": 1.4, + "learning_rate": 1.1527493303922565e-06, + "loss": 0.7393, + "step": 54738 + }, + { + "epoch": 1.4, + "learning_rate": 1.1527219845936177e-06, + "loss": 0.6541, + "step": 54739 + }, + { + "epoch": 1.4, + "learning_rate": 1.1526946386780465e-06, + "loss": 0.7266, + "step": 54740 + }, + { + "epoch": 1.4, + "learning_rate": 1.1526672926455642e-06, + "loss": 0.6982, + "step": 54741 + }, + { + "epoch": 1.4, + "learning_rate": 1.1526399464961915e-06, + "loss": 0.552, + "step": 54742 + }, + { + "epoch": 1.4, + "learning_rate": 1.1526126002299497e-06, + "loss": 0.6587, + "step": 54743 + }, + { + "epoch": 1.4, + "learning_rate": 1.152585253846859e-06, + "loss": 0.645, + "step": 54744 + }, + { + "epoch": 1.4, + "learning_rate": 1.1525579073469412e-06, + "loss": 0.8662, + "step": 54745 + }, + { + "epoch": 1.4, + "learning_rate": 1.1525305607302162e-06, + "loss": 0.6328, + "step": 54746 + }, + { + "epoch": 1.4, + "learning_rate": 1.152503213996706e-06, + "loss": 0.6689, + "step": 54747 + }, + { + "epoch": 1.4, + "learning_rate": 1.1524758671464315e-06, + "loss": 0.5483, + "step": 54748 + }, + { + "epoch": 1.4, + "learning_rate": 1.1524485201794126e-06, + "loss": 0.6538, + "step": 54749 + }, + { + "epoch": 1.4, + "learning_rate": 1.152421173095671e-06, + "loss": 0.7314, + "step": 54750 + }, + { + "epoch": 1.4, + "learning_rate": 1.1523938258952275e-06, + "loss": 0.6709, + "step": 54751 + }, + { + "epoch": 1.4, + "learning_rate": 1.1523664785781035e-06, + "loss": 0.6318, + "step": 54752 + }, + { + "epoch": 1.4, + "learning_rate": 1.1523391311443189e-06, + "loss": 0.6992, + "step": 54753 + }, + { + "epoch": 1.4, + "learning_rate": 1.1523117835938955e-06, + "loss": 0.7236, + "step": 54754 + }, + { + "epoch": 1.4, + "learning_rate": 1.1522844359268539e-06, + "loss": 0.6943, + "step": 54755 + }, + { + "epoch": 1.4, + "learning_rate": 1.1522570881432154e-06, + "loss": 0.5054, + "step": 54756 + }, + { + "epoch": 1.4, + "learning_rate": 1.1522297402430003e-06, + "loss": 0.8594, + "step": 54757 + }, + { + "epoch": 1.4, + "learning_rate": 1.1522023922262304e-06, + "loss": 0.6084, + "step": 54758 + }, + { + "epoch": 1.4, + "learning_rate": 1.1521750440929255e-06, + "loss": 0.6543, + "step": 54759 + }, + { + "epoch": 1.4, + "learning_rate": 1.1521476958431074e-06, + "loss": 0.6553, + "step": 54760 + }, + { + "epoch": 1.4, + "learning_rate": 1.1521203474767967e-06, + "loss": 0.7188, + "step": 54761 + }, + { + "epoch": 1.4, + "learning_rate": 1.1520929989940147e-06, + "loss": 0.6484, + "step": 54762 + }, + { + "epoch": 1.4, + "learning_rate": 1.1520656503947818e-06, + "loss": 0.7227, + "step": 54763 + }, + { + "epoch": 1.4, + "learning_rate": 1.1520383016791195e-06, + "loss": 0.6431, + "step": 54764 + }, + { + "epoch": 1.4, + "learning_rate": 1.152010952847048e-06, + "loss": 0.7061, + "step": 54765 + }, + { + "epoch": 1.4, + "learning_rate": 1.1519836038985894e-06, + "loss": 0.6978, + "step": 54766 + }, + { + "epoch": 1.4, + "learning_rate": 1.1519562548337636e-06, + "loss": 0.6553, + "step": 54767 + }, + { + "epoch": 1.4, + "learning_rate": 1.1519289056525915e-06, + "loss": 0.7324, + "step": 54768 + }, + { + "epoch": 1.4, + "learning_rate": 1.151901556355095e-06, + "loss": 0.5464, + "step": 54769 + }, + { + "epoch": 1.4, + "learning_rate": 1.1518742069412943e-06, + "loss": 0.6343, + "step": 54770 + }, + { + "epoch": 1.4, + "learning_rate": 1.1518468574112103e-06, + "loss": 0.6387, + "step": 54771 + }, + { + "epoch": 1.4, + "learning_rate": 1.1518195077648645e-06, + "loss": 0.6416, + "step": 54772 + }, + { + "epoch": 1.4, + "learning_rate": 1.151792158002277e-06, + "loss": 0.5864, + "step": 54773 + }, + { + "epoch": 1.4, + "learning_rate": 1.1517648081234694e-06, + "loss": 0.708, + "step": 54774 + }, + { + "epoch": 1.4, + "learning_rate": 1.1517374581284628e-06, + "loss": 0.8291, + "step": 54775 + }, + { + "epoch": 1.4, + "learning_rate": 1.1517101080172773e-06, + "loss": 0.7773, + "step": 54776 + }, + { + "epoch": 1.4, + "learning_rate": 1.151682757789935e-06, + "loss": 0.4812, + "step": 54777 + }, + { + "epoch": 1.4, + "learning_rate": 1.1516554074464554e-06, + "loss": 0.5999, + "step": 54778 + }, + { + "epoch": 1.4, + "learning_rate": 1.1516280569868608e-06, + "loss": 0.7153, + "step": 54779 + }, + { + "epoch": 1.4, + "learning_rate": 1.1516007064111715e-06, + "loss": 0.6787, + "step": 54780 + }, + { + "epoch": 1.4, + "learning_rate": 1.1515733557194083e-06, + "loss": 0.5908, + "step": 54781 + }, + { + "epoch": 1.4, + "learning_rate": 1.1515460049115927e-06, + "loss": 0.4066, + "step": 54782 + }, + { + "epoch": 1.4, + "learning_rate": 1.1515186539877451e-06, + "loss": 0.5205, + "step": 54783 + }, + { + "epoch": 1.4, + "learning_rate": 1.1514913029478863e-06, + "loss": 0.7148, + "step": 54784 + }, + { + "epoch": 1.4, + "learning_rate": 1.151463951792038e-06, + "loss": 0.5479, + "step": 54785 + }, + { + "epoch": 1.4, + "learning_rate": 1.1514366005202202e-06, + "loss": 0.7188, + "step": 54786 + }, + { + "epoch": 1.4, + "learning_rate": 1.151409249132455e-06, + "loss": 0.6738, + "step": 54787 + }, + { + "epoch": 1.4, + "learning_rate": 1.1513818976287625e-06, + "loss": 0.7041, + "step": 54788 + }, + { + "epoch": 1.4, + "learning_rate": 1.1513545460091638e-06, + "loss": 0.7871, + "step": 54789 + }, + { + "epoch": 1.4, + "learning_rate": 1.1513271942736798e-06, + "loss": 0.7773, + "step": 54790 + }, + { + "epoch": 1.4, + "learning_rate": 1.1512998424223316e-06, + "loss": 0.5632, + "step": 54791 + }, + { + "epoch": 1.4, + "learning_rate": 1.15127249045514e-06, + "loss": 0.5037, + "step": 54792 + }, + { + "epoch": 1.4, + "learning_rate": 1.151245138372126e-06, + "loss": 0.4626, + "step": 54793 + }, + { + "epoch": 1.4, + "learning_rate": 1.1512177861733108e-06, + "loss": 0.6396, + "step": 54794 + }, + { + "epoch": 1.4, + "learning_rate": 1.1511904338587146e-06, + "loss": 0.5957, + "step": 54795 + }, + { + "epoch": 1.4, + "learning_rate": 1.1511630814283593e-06, + "loss": 0.3574, + "step": 54796 + }, + { + "epoch": 1.4, + "learning_rate": 1.1511357288822652e-06, + "loss": 0.856, + "step": 54797 + }, + { + "epoch": 1.4, + "learning_rate": 1.1511083762204536e-06, + "loss": 0.8135, + "step": 54798 + }, + { + "epoch": 1.4, + "learning_rate": 1.1510810234429448e-06, + "loss": 0.6963, + "step": 54799 + }, + { + "epoch": 1.4, + "learning_rate": 1.1510536705497608e-06, + "loss": 0.5713, + "step": 54800 + }, + { + "epoch": 1.4, + "learning_rate": 1.1510263175409213e-06, + "loss": 0.7441, + "step": 54801 + }, + { + "epoch": 1.4, + "learning_rate": 1.1509989644164485e-06, + "loss": 0.7158, + "step": 54802 + }, + { + "epoch": 1.4, + "learning_rate": 1.1509716111763625e-06, + "loss": 0.5957, + "step": 54803 + }, + { + "epoch": 1.4, + "learning_rate": 1.1509442578206845e-06, + "loss": 0.7393, + "step": 54804 + }, + { + "epoch": 1.4, + "learning_rate": 1.1509169043494354e-06, + "loss": 0.5752, + "step": 54805 + }, + { + "epoch": 1.4, + "learning_rate": 1.1508895507626361e-06, + "loss": 0.6899, + "step": 54806 + }, + { + "epoch": 1.4, + "learning_rate": 1.150862197060308e-06, + "loss": 0.5771, + "step": 54807 + }, + { + "epoch": 1.4, + "learning_rate": 1.150834843242471e-06, + "loss": 0.6572, + "step": 54808 + }, + { + "epoch": 1.4, + "learning_rate": 1.1508074893091471e-06, + "loss": 0.5312, + "step": 54809 + }, + { + "epoch": 1.4, + "learning_rate": 1.1507801352603569e-06, + "loss": 0.7158, + "step": 54810 + }, + { + "epoch": 1.4, + "learning_rate": 1.150752781096121e-06, + "loss": 0.7607, + "step": 54811 + }, + { + "epoch": 1.4, + "learning_rate": 1.1507254268164607e-06, + "loss": 0.6436, + "step": 54812 + }, + { + "epoch": 1.4, + "learning_rate": 1.150698072421397e-06, + "loss": 0.6484, + "step": 54813 + }, + { + "epoch": 1.4, + "learning_rate": 1.1506707179109505e-06, + "loss": 0.6309, + "step": 54814 + }, + { + "epoch": 1.4, + "learning_rate": 1.1506433632851427e-06, + "loss": 0.4707, + "step": 54815 + }, + { + "epoch": 1.4, + "learning_rate": 1.150616008543994e-06, + "loss": 0.71, + "step": 54816 + }, + { + "epoch": 1.4, + "learning_rate": 1.1505886536875255e-06, + "loss": 0.6736, + "step": 54817 + }, + { + "epoch": 1.41, + "learning_rate": 1.1505612987157583e-06, + "loss": 0.6553, + "step": 54818 + }, + { + "epoch": 1.41, + "learning_rate": 1.1505339436287132e-06, + "loss": 0.7617, + "step": 54819 + }, + { + "epoch": 1.41, + "learning_rate": 1.1505065884264112e-06, + "loss": 0.7324, + "step": 54820 + }, + { + "epoch": 1.41, + "learning_rate": 1.1504792331088734e-06, + "loss": 0.7725, + "step": 54821 + }, + { + "epoch": 1.41, + "learning_rate": 1.15045187767612e-06, + "loss": 0.7393, + "step": 54822 + }, + { + "epoch": 1.41, + "learning_rate": 1.1504245221281733e-06, + "loss": 0.832, + "step": 54823 + }, + { + "epoch": 1.41, + "learning_rate": 1.1503971664650528e-06, + "loss": 0.6304, + "step": 54824 + }, + { + "epoch": 1.41, + "learning_rate": 1.1503698106867802e-06, + "loss": 0.6191, + "step": 54825 + }, + { + "epoch": 1.41, + "learning_rate": 1.1503424547933767e-06, + "loss": 0.7842, + "step": 54826 + }, + { + "epoch": 1.41, + "learning_rate": 1.1503150987848626e-06, + "loss": 0.8457, + "step": 54827 + }, + { + "epoch": 1.41, + "learning_rate": 1.1502877426612592e-06, + "loss": 0.6533, + "step": 54828 + }, + { + "epoch": 1.41, + "learning_rate": 1.1502603864225874e-06, + "loss": 0.6318, + "step": 54829 + }, + { + "epoch": 1.41, + "learning_rate": 1.150233030068868e-06, + "loss": 0.8037, + "step": 54830 + }, + { + "epoch": 1.41, + "learning_rate": 1.1502056736001224e-06, + "loss": 0.6875, + "step": 54831 + }, + { + "epoch": 1.41, + "learning_rate": 1.1501783170163713e-06, + "loss": 0.5459, + "step": 54832 + }, + { + "epoch": 1.41, + "learning_rate": 1.1501509603176352e-06, + "loss": 0.521, + "step": 54833 + }, + { + "epoch": 1.41, + "learning_rate": 1.1501236035039354e-06, + "loss": 0.6206, + "step": 54834 + }, + { + "epoch": 1.41, + "learning_rate": 1.150096246575293e-06, + "loss": 0.522, + "step": 54835 + }, + { + "epoch": 1.41, + "learning_rate": 1.150068889531729e-06, + "loss": 0.5581, + "step": 54836 + }, + { + "epoch": 1.41, + "learning_rate": 1.1500415323732638e-06, + "loss": 0.6899, + "step": 54837 + }, + { + "epoch": 1.41, + "learning_rate": 1.1500141750999188e-06, + "loss": 0.7539, + "step": 54838 + }, + { + "epoch": 1.41, + "learning_rate": 1.149986817711715e-06, + "loss": 0.4944, + "step": 54839 + }, + { + "epoch": 1.41, + "learning_rate": 1.149959460208673e-06, + "loss": 0.6777, + "step": 54840 + }, + { + "epoch": 1.41, + "learning_rate": 1.1499321025908141e-06, + "loss": 0.6455, + "step": 54841 + }, + { + "epoch": 1.41, + "learning_rate": 1.1499047448581592e-06, + "loss": 0.5981, + "step": 54842 + }, + { + "epoch": 1.41, + "learning_rate": 1.1498773870107288e-06, + "loss": 0.5989, + "step": 54843 + }, + { + "epoch": 1.41, + "learning_rate": 1.1498500290485442e-06, + "loss": 0.6846, + "step": 54844 + }, + { + "epoch": 1.41, + "learning_rate": 1.1498226709716263e-06, + "loss": 0.917, + "step": 54845 + }, + { + "epoch": 1.41, + "learning_rate": 1.1497953127799966e-06, + "loss": 0.5132, + "step": 54846 + }, + { + "epoch": 1.41, + "learning_rate": 1.149767954473675e-06, + "loss": 0.5503, + "step": 54847 + }, + { + "epoch": 1.41, + "learning_rate": 1.1497405960526832e-06, + "loss": 0.4716, + "step": 54848 + }, + { + "epoch": 1.41, + "learning_rate": 1.1497132375170414e-06, + "loss": 0.73, + "step": 54849 + }, + { + "epoch": 1.41, + "learning_rate": 1.1496858788667716e-06, + "loss": 0.7246, + "step": 54850 + }, + { + "epoch": 1.41, + "learning_rate": 1.1496585201018943e-06, + "loss": 0.6411, + "step": 54851 + }, + { + "epoch": 1.41, + "learning_rate": 1.14963116122243e-06, + "loss": 0.748, + "step": 54852 + }, + { + "epoch": 1.41, + "learning_rate": 1.1496038022284e-06, + "loss": 0.6846, + "step": 54853 + }, + { + "epoch": 1.41, + "learning_rate": 1.1495764431198255e-06, + "loss": 0.604, + "step": 54854 + }, + { + "epoch": 1.41, + "learning_rate": 1.1495490838967267e-06, + "loss": 0.7168, + "step": 54855 + }, + { + "epoch": 1.41, + "learning_rate": 1.1495217245591256e-06, + "loss": 0.5864, + "step": 54856 + }, + { + "epoch": 1.41, + "learning_rate": 1.1494943651070425e-06, + "loss": 0.7725, + "step": 54857 + }, + { + "epoch": 1.41, + "learning_rate": 1.1494670055404983e-06, + "loss": 0.6621, + "step": 54858 + }, + { + "epoch": 1.41, + "learning_rate": 1.1494396458595139e-06, + "loss": 0.6611, + "step": 54859 + }, + { + "epoch": 1.41, + "learning_rate": 1.149412286064111e-06, + "loss": 0.7715, + "step": 54860 + }, + { + "epoch": 1.41, + "learning_rate": 1.1493849261543096e-06, + "loss": 0.5679, + "step": 54861 + }, + { + "epoch": 1.41, + "learning_rate": 1.149357566130131e-06, + "loss": 0.584, + "step": 54862 + }, + { + "epoch": 1.41, + "learning_rate": 1.1493302059915962e-06, + "loss": 0.6846, + "step": 54863 + }, + { + "epoch": 1.41, + "learning_rate": 1.149302845738726e-06, + "loss": 0.6108, + "step": 54864 + }, + { + "epoch": 1.41, + "learning_rate": 1.1492754853715415e-06, + "loss": 0.6133, + "step": 54865 + }, + { + "epoch": 1.41, + "learning_rate": 1.1492481248900641e-06, + "loss": 0.7852, + "step": 54866 + }, + { + "epoch": 1.41, + "learning_rate": 1.149220764294314e-06, + "loss": 0.6104, + "step": 54867 + }, + { + "epoch": 1.41, + "learning_rate": 1.149193403584312e-06, + "loss": 0.6299, + "step": 54868 + }, + { + "epoch": 1.41, + "learning_rate": 1.14916604276008e-06, + "loss": 0.6514, + "step": 54869 + }, + { + "epoch": 1.41, + "learning_rate": 1.1491386818216382e-06, + "loss": 0.6763, + "step": 54870 + }, + { + "epoch": 1.41, + "learning_rate": 1.1491113207690082e-06, + "loss": 0.7441, + "step": 54871 + }, + { + "epoch": 1.41, + "learning_rate": 1.14908395960221e-06, + "loss": 0.4758, + "step": 54872 + }, + { + "epoch": 1.41, + "learning_rate": 1.1490565983212652e-06, + "loss": 0.8379, + "step": 54873 + }, + { + "epoch": 1.41, + "learning_rate": 1.1490292369261944e-06, + "loss": 0.71, + "step": 54874 + }, + { + "epoch": 1.41, + "learning_rate": 1.1490018754170192e-06, + "loss": 0.6445, + "step": 54875 + }, + { + "epoch": 1.41, + "learning_rate": 1.1489745137937598e-06, + "loss": 0.7061, + "step": 54876 + }, + { + "epoch": 1.41, + "learning_rate": 1.1489471520564379e-06, + "loss": 0.5398, + "step": 54877 + }, + { + "epoch": 1.41, + "learning_rate": 1.1489197902050734e-06, + "loss": 0.7637, + "step": 54878 + }, + { + "epoch": 1.41, + "learning_rate": 1.148892428239688e-06, + "loss": 0.6807, + "step": 54879 + }, + { + "epoch": 1.41, + "learning_rate": 1.1488650661603027e-06, + "loss": 0.6621, + "step": 54880 + }, + { + "epoch": 1.41, + "learning_rate": 1.1488377039669383e-06, + "loss": 0.707, + "step": 54881 + }, + { + "epoch": 1.41, + "learning_rate": 1.1488103416596157e-06, + "loss": 0.6611, + "step": 54882 + }, + { + "epoch": 1.41, + "learning_rate": 1.1487829792383556e-06, + "loss": 0.7266, + "step": 54883 + }, + { + "epoch": 1.41, + "learning_rate": 1.1487556167031795e-06, + "loss": 0.7129, + "step": 54884 + }, + { + "epoch": 1.41, + "learning_rate": 1.148728254054108e-06, + "loss": 0.6035, + "step": 54885 + }, + { + "epoch": 1.41, + "learning_rate": 1.1487008912911621e-06, + "loss": 0.6904, + "step": 54886 + }, + { + "epoch": 1.41, + "learning_rate": 1.1486735284143628e-06, + "loss": 0.8057, + "step": 54887 + }, + { + "epoch": 1.41, + "learning_rate": 1.148646165423731e-06, + "loss": 0.8213, + "step": 54888 + }, + { + "epoch": 1.41, + "learning_rate": 1.1486188023192875e-06, + "loss": 0.7207, + "step": 54889 + }, + { + "epoch": 1.41, + "learning_rate": 1.1485914391010536e-06, + "loss": 0.5474, + "step": 54890 + }, + { + "epoch": 1.41, + "learning_rate": 1.1485640757690501e-06, + "loss": 0.5312, + "step": 54891 + }, + { + "epoch": 1.41, + "learning_rate": 1.1485367123232982e-06, + "loss": 0.6387, + "step": 54892 + }, + { + "epoch": 1.41, + "learning_rate": 1.1485093487638178e-06, + "loss": 0.6406, + "step": 54893 + }, + { + "epoch": 1.41, + "learning_rate": 1.1484819850906311e-06, + "loss": 0.6602, + "step": 54894 + }, + { + "epoch": 1.41, + "learning_rate": 1.1484546213037584e-06, + "loss": 0.6416, + "step": 54895 + }, + { + "epoch": 1.41, + "learning_rate": 1.1484272574032213e-06, + "loss": 0.4658, + "step": 54896 + }, + { + "epoch": 1.41, + "learning_rate": 1.1483998933890397e-06, + "loss": 0.6108, + "step": 54897 + }, + { + "epoch": 1.41, + "learning_rate": 1.1483725292612354e-06, + "loss": 0.6514, + "step": 54898 + }, + { + "epoch": 1.41, + "learning_rate": 1.1483451650198287e-06, + "loss": 0.6987, + "step": 54899 + }, + { + "epoch": 1.41, + "learning_rate": 1.1483178006648415e-06, + "loss": 0.5349, + "step": 54900 + }, + { + "epoch": 1.41, + "learning_rate": 1.1482904361962939e-06, + "loss": 0.6396, + "step": 54901 + }, + { + "epoch": 1.41, + "learning_rate": 1.148263071614207e-06, + "loss": 0.6699, + "step": 54902 + }, + { + "epoch": 1.41, + "learning_rate": 1.1482357069186022e-06, + "loss": 0.5143, + "step": 54903 + }, + { + "epoch": 1.41, + "learning_rate": 1.1482083421094996e-06, + "loss": 0.5679, + "step": 54904 + }, + { + "epoch": 1.41, + "learning_rate": 1.1481809771869213e-06, + "loss": 0.6787, + "step": 54905 + }, + { + "epoch": 1.41, + "learning_rate": 1.1481536121508874e-06, + "loss": 0.7627, + "step": 54906 + }, + { + "epoch": 1.41, + "learning_rate": 1.1481262470014193e-06, + "loss": 0.7119, + "step": 54907 + }, + { + "epoch": 1.41, + "learning_rate": 1.1480988817385373e-06, + "loss": 0.5898, + "step": 54908 + }, + { + "epoch": 1.41, + "learning_rate": 1.1480715163622632e-06, + "loss": 0.8926, + "step": 54909 + }, + { + "epoch": 1.41, + "learning_rate": 1.148044150872617e-06, + "loss": 0.6133, + "step": 54910 + }, + { + "epoch": 1.41, + "learning_rate": 1.148016785269621e-06, + "loss": 0.6514, + "step": 54911 + }, + { + "epoch": 1.41, + "learning_rate": 1.1479894195532947e-06, + "loss": 0.6626, + "step": 54912 + }, + { + "epoch": 1.41, + "learning_rate": 1.14796205372366e-06, + "loss": 0.5708, + "step": 54913 + }, + { + "epoch": 1.41, + "learning_rate": 1.1479346877807374e-06, + "loss": 0.4532, + "step": 54914 + }, + { + "epoch": 1.41, + "learning_rate": 1.1479073217245482e-06, + "loss": 0.6211, + "step": 54915 + }, + { + "epoch": 1.41, + "learning_rate": 1.147879955555113e-06, + "loss": 0.3706, + "step": 54916 + }, + { + "epoch": 1.41, + "learning_rate": 1.1478525892724531e-06, + "loss": 0.7305, + "step": 54917 + }, + { + "epoch": 1.41, + "learning_rate": 1.147825222876589e-06, + "loss": 0.75, + "step": 54918 + }, + { + "epoch": 1.41, + "learning_rate": 1.1477978563675423e-06, + "loss": 0.5298, + "step": 54919 + }, + { + "epoch": 1.41, + "learning_rate": 1.1477704897453331e-06, + "loss": 0.5413, + "step": 54920 + }, + { + "epoch": 1.41, + "learning_rate": 1.1477431230099832e-06, + "loss": 0.6914, + "step": 54921 + }, + { + "epoch": 1.41, + "learning_rate": 1.1477157561615131e-06, + "loss": 0.6401, + "step": 54922 + }, + { + "epoch": 1.41, + "learning_rate": 1.1476883891999438e-06, + "loss": 0.5723, + "step": 54923 + }, + { + "epoch": 1.41, + "learning_rate": 1.1476610221252962e-06, + "loss": 0.6338, + "step": 54924 + }, + { + "epoch": 1.41, + "learning_rate": 1.1476336549375915e-06, + "loss": 0.7578, + "step": 54925 + }, + { + "epoch": 1.41, + "learning_rate": 1.1476062876368507e-06, + "loss": 0.6494, + "step": 54926 + }, + { + "epoch": 1.41, + "learning_rate": 1.147578920223094e-06, + "loss": 0.8271, + "step": 54927 + }, + { + "epoch": 1.41, + "learning_rate": 1.1475515526963433e-06, + "loss": 0.7119, + "step": 54928 + }, + { + "epoch": 1.41, + "learning_rate": 1.1475241850566188e-06, + "loss": 0.5513, + "step": 54929 + }, + { + "epoch": 1.41, + "learning_rate": 1.1474968173039423e-06, + "loss": 0.6299, + "step": 54930 + }, + { + "epoch": 1.41, + "learning_rate": 1.147469449438334e-06, + "loss": 0.5833, + "step": 54931 + }, + { + "epoch": 1.41, + "learning_rate": 1.1474420814598153e-06, + "loss": 0.8447, + "step": 54932 + }, + { + "epoch": 1.41, + "learning_rate": 1.1474147133684067e-06, + "loss": 0.5244, + "step": 54933 + }, + { + "epoch": 1.41, + "learning_rate": 1.1473873451641297e-06, + "loss": 0.7441, + "step": 54934 + }, + { + "epoch": 1.41, + "learning_rate": 1.1473599768470049e-06, + "loss": 0.5374, + "step": 54935 + }, + { + "epoch": 1.41, + "learning_rate": 1.1473326084170533e-06, + "loss": 0.7041, + "step": 54936 + }, + { + "epoch": 1.41, + "learning_rate": 1.147305239874296e-06, + "loss": 0.6709, + "step": 54937 + }, + { + "epoch": 1.41, + "learning_rate": 1.1472778712187536e-06, + "loss": 0.8096, + "step": 54938 + }, + { + "epoch": 1.41, + "learning_rate": 1.1472505024504475e-06, + "loss": 0.752, + "step": 54939 + }, + { + "epoch": 1.41, + "learning_rate": 1.1472231335693986e-06, + "loss": 0.791, + "step": 54940 + }, + { + "epoch": 1.41, + "learning_rate": 1.1471957645756274e-06, + "loss": 0.6951, + "step": 54941 + }, + { + "epoch": 1.41, + "learning_rate": 1.1471683954691553e-06, + "loss": 0.7734, + "step": 54942 + }, + { + "epoch": 1.41, + "learning_rate": 1.1471410262500032e-06, + "loss": 0.5239, + "step": 54943 + }, + { + "epoch": 1.41, + "learning_rate": 1.1471136569181917e-06, + "loss": 0.5645, + "step": 54944 + }, + { + "epoch": 1.41, + "learning_rate": 1.1470862874737423e-06, + "loss": 0.7266, + "step": 54945 + }, + { + "epoch": 1.41, + "learning_rate": 1.147058917916676e-06, + "loss": 0.6421, + "step": 54946 + }, + { + "epoch": 1.41, + "learning_rate": 1.1470315482470129e-06, + "loss": 0.7861, + "step": 54947 + }, + { + "epoch": 1.41, + "learning_rate": 1.1470041784647745e-06, + "loss": 0.7051, + "step": 54948 + }, + { + "epoch": 1.41, + "learning_rate": 1.146976808569982e-06, + "loss": 0.541, + "step": 54949 + }, + { + "epoch": 1.41, + "learning_rate": 1.1469494385626562e-06, + "loss": 0.5962, + "step": 54950 + }, + { + "epoch": 1.41, + "learning_rate": 1.146922068442818e-06, + "loss": 0.625, + "step": 54951 + }, + { + "epoch": 1.41, + "learning_rate": 1.1468946982104881e-06, + "loss": 0.5459, + "step": 54952 + }, + { + "epoch": 1.41, + "learning_rate": 1.1468673278656877e-06, + "loss": 0.7637, + "step": 54953 + }, + { + "epoch": 1.41, + "learning_rate": 1.1468399574084378e-06, + "loss": 0.5486, + "step": 54954 + }, + { + "epoch": 1.41, + "learning_rate": 1.1468125868387592e-06, + "loss": 0.6123, + "step": 54955 + }, + { + "epoch": 1.41, + "learning_rate": 1.146785216156673e-06, + "loss": 0.665, + "step": 54956 + }, + { + "epoch": 1.41, + "learning_rate": 1.1467578453622004e-06, + "loss": 0.4861, + "step": 54957 + }, + { + "epoch": 1.41, + "learning_rate": 1.1467304744553617e-06, + "loss": 0.5083, + "step": 54958 + }, + { + "epoch": 1.41, + "learning_rate": 1.1467031034361784e-06, + "loss": 0.6426, + "step": 54959 + }, + { + "epoch": 1.41, + "learning_rate": 1.1466757323046712e-06, + "loss": 0.4635, + "step": 54960 + }, + { + "epoch": 1.41, + "learning_rate": 1.1466483610608612e-06, + "loss": 0.7002, + "step": 54961 + }, + { + "epoch": 1.41, + "learning_rate": 1.146620989704769e-06, + "loss": 0.7139, + "step": 54962 + }, + { + "epoch": 1.41, + "learning_rate": 1.1465936182364165e-06, + "loss": 0.4458, + "step": 54963 + }, + { + "epoch": 1.41, + "learning_rate": 1.1465662466558234e-06, + "loss": 0.7705, + "step": 54964 + }, + { + "epoch": 1.41, + "learning_rate": 1.1465388749630116e-06, + "loss": 0.6299, + "step": 54965 + }, + { + "epoch": 1.41, + "learning_rate": 1.1465115031580018e-06, + "loss": 0.5928, + "step": 54966 + }, + { + "epoch": 1.41, + "learning_rate": 1.1464841312408147e-06, + "loss": 0.6162, + "step": 54967 + }, + { + "epoch": 1.41, + "learning_rate": 1.1464567592114712e-06, + "loss": 0.5659, + "step": 54968 + }, + { + "epoch": 1.41, + "learning_rate": 1.1464293870699928e-06, + "loss": 0.7822, + "step": 54969 + }, + { + "epoch": 1.41, + "learning_rate": 1.1464020148163998e-06, + "loss": 0.3828, + "step": 54970 + }, + { + "epoch": 1.41, + "learning_rate": 1.146374642450714e-06, + "loss": 0.6411, + "step": 54971 + }, + { + "epoch": 1.41, + "learning_rate": 1.1463472699729556e-06, + "loss": 0.6006, + "step": 54972 + }, + { + "epoch": 1.41, + "learning_rate": 1.1463198973831456e-06, + "loss": 0.7285, + "step": 54973 + }, + { + "epoch": 1.41, + "learning_rate": 1.1462925246813056e-06, + "loss": 0.4812, + "step": 54974 + }, + { + "epoch": 1.41, + "learning_rate": 1.146265151867456e-06, + "loss": 0.6982, + "step": 54975 + }, + { + "epoch": 1.41, + "learning_rate": 1.146237778941618e-06, + "loss": 0.7461, + "step": 54976 + }, + { + "epoch": 1.41, + "learning_rate": 1.1462104059038122e-06, + "loss": 0.8926, + "step": 54977 + }, + { + "epoch": 1.41, + "learning_rate": 1.14618303275406e-06, + "loss": 0.5854, + "step": 54978 + }, + { + "epoch": 1.41, + "learning_rate": 1.146155659492382e-06, + "loss": 0.5299, + "step": 54979 + }, + { + "epoch": 1.41, + "learning_rate": 1.1461282861187996e-06, + "loss": 0.5864, + "step": 54980 + }, + { + "epoch": 1.41, + "learning_rate": 1.1461009126333334e-06, + "loss": 0.6211, + "step": 54981 + }, + { + "epoch": 1.41, + "learning_rate": 1.1460735390360046e-06, + "loss": 0.6426, + "step": 54982 + }, + { + "epoch": 1.41, + "learning_rate": 1.1460461653268336e-06, + "loss": 0.6733, + "step": 54983 + }, + { + "epoch": 1.41, + "learning_rate": 1.146018791505842e-06, + "loss": 0.6982, + "step": 54984 + }, + { + "epoch": 1.41, + "learning_rate": 1.1459914175730502e-06, + "loss": 0.6445, + "step": 54985 + }, + { + "epoch": 1.41, + "learning_rate": 1.1459640435284802e-06, + "loss": 0.7568, + "step": 54986 + }, + { + "epoch": 1.41, + "learning_rate": 1.1459366693721518e-06, + "loss": 0.6107, + "step": 54987 + }, + { + "epoch": 1.41, + "learning_rate": 1.1459092951040864e-06, + "loss": 0.4104, + "step": 54988 + }, + { + "epoch": 1.41, + "learning_rate": 1.1458819207243048e-06, + "loss": 0.7207, + "step": 54989 + }, + { + "epoch": 1.41, + "learning_rate": 1.1458545462328284e-06, + "loss": 0.4985, + "step": 54990 + }, + { + "epoch": 1.41, + "learning_rate": 1.1458271716296778e-06, + "loss": 0.6963, + "step": 54991 + }, + { + "epoch": 1.41, + "learning_rate": 1.1457997969148741e-06, + "loss": 0.4436, + "step": 54992 + }, + { + "epoch": 1.41, + "learning_rate": 1.145772422088438e-06, + "loss": 0.834, + "step": 54993 + }, + { + "epoch": 1.41, + "learning_rate": 1.1457450471503906e-06, + "loss": 0.7441, + "step": 54994 + }, + { + "epoch": 1.41, + "learning_rate": 1.1457176721007533e-06, + "loss": 0.668, + "step": 54995 + }, + { + "epoch": 1.41, + "learning_rate": 1.1456902969395466e-06, + "loss": 0.5833, + "step": 54996 + }, + { + "epoch": 1.41, + "learning_rate": 1.1456629216667915e-06, + "loss": 0.6206, + "step": 54997 + }, + { + "epoch": 1.41, + "learning_rate": 1.1456355462825086e-06, + "loss": 0.5967, + "step": 54998 + }, + { + "epoch": 1.41, + "learning_rate": 1.1456081707867198e-06, + "loss": 0.5664, + "step": 54999 + }, + { + "epoch": 1.41, + "learning_rate": 1.1455807951794452e-06, + "loss": 0.4116, + "step": 55000 + }, + { + "epoch": 1.41, + "learning_rate": 1.1455534194607063e-06, + "loss": 0.6611, + "step": 55001 + }, + { + "epoch": 1.41, + "learning_rate": 1.1455260436305237e-06, + "loss": 0.6943, + "step": 55002 + }, + { + "epoch": 1.41, + "learning_rate": 1.1454986676889186e-06, + "loss": 0.5419, + "step": 55003 + }, + { + "epoch": 1.41, + "learning_rate": 1.1454712916359117e-06, + "loss": 0.646, + "step": 55004 + }, + { + "epoch": 1.41, + "learning_rate": 1.1454439154715242e-06, + "loss": 0.668, + "step": 55005 + }, + { + "epoch": 1.41, + "learning_rate": 1.145416539195777e-06, + "loss": 0.6963, + "step": 55006 + }, + { + "epoch": 1.41, + "learning_rate": 1.145389162808691e-06, + "loss": 0.7812, + "step": 55007 + }, + { + "epoch": 1.41, + "learning_rate": 1.1453617863102874e-06, + "loss": 0.6758, + "step": 55008 + }, + { + "epoch": 1.41, + "learning_rate": 1.1453344097005867e-06, + "loss": 0.6904, + "step": 55009 + }, + { + "epoch": 1.41, + "learning_rate": 1.14530703297961e-06, + "loss": 0.7041, + "step": 55010 + }, + { + "epoch": 1.41, + "learning_rate": 1.1452796561473788e-06, + "loss": 0.8125, + "step": 55011 + }, + { + "epoch": 1.41, + "learning_rate": 1.1452522792039135e-06, + "loss": 0.8535, + "step": 55012 + }, + { + "epoch": 1.41, + "learning_rate": 1.1452249021492353e-06, + "loss": 0.6162, + "step": 55013 + }, + { + "epoch": 1.41, + "learning_rate": 1.1451975249833648e-06, + "loss": 0.5413, + "step": 55014 + }, + { + "epoch": 1.41, + "learning_rate": 1.1451701477063233e-06, + "loss": 0.5547, + "step": 55015 + }, + { + "epoch": 1.41, + "learning_rate": 1.145142770318132e-06, + "loss": 0.6069, + "step": 55016 + }, + { + "epoch": 1.41, + "learning_rate": 1.145115392818811e-06, + "loss": 0.519, + "step": 55017 + }, + { + "epoch": 1.41, + "learning_rate": 1.1450880152083825e-06, + "loss": 0.6758, + "step": 55018 + }, + { + "epoch": 1.41, + "learning_rate": 1.1450606374868662e-06, + "loss": 0.5522, + "step": 55019 + }, + { + "epoch": 1.41, + "learning_rate": 1.1450332596542837e-06, + "loss": 0.6055, + "step": 55020 + }, + { + "epoch": 1.41, + "learning_rate": 1.1450058817106563e-06, + "loss": 0.5278, + "step": 55021 + }, + { + "epoch": 1.41, + "learning_rate": 1.1449785036560042e-06, + "loss": 0.6006, + "step": 55022 + }, + { + "epoch": 1.41, + "learning_rate": 1.1449511254903487e-06, + "loss": 0.793, + "step": 55023 + }, + { + "epoch": 1.41, + "learning_rate": 1.144923747213711e-06, + "loss": 0.7251, + "step": 55024 + }, + { + "epoch": 1.41, + "learning_rate": 1.1448963688261117e-06, + "loss": 0.5249, + "step": 55025 + }, + { + "epoch": 1.41, + "learning_rate": 1.1448689903275724e-06, + "loss": 0.6416, + "step": 55026 + }, + { + "epoch": 1.41, + "learning_rate": 1.144841611718113e-06, + "loss": 0.7656, + "step": 55027 + }, + { + "epoch": 1.41, + "learning_rate": 1.144814232997755e-06, + "loss": 0.6997, + "step": 55028 + }, + { + "epoch": 1.41, + "learning_rate": 1.1447868541665195e-06, + "loss": 0.6733, + "step": 55029 + }, + { + "epoch": 1.41, + "learning_rate": 1.1447594752244276e-06, + "loss": 0.8545, + "step": 55030 + }, + { + "epoch": 1.41, + "learning_rate": 1.1447320961714998e-06, + "loss": 0.7266, + "step": 55031 + }, + { + "epoch": 1.41, + "learning_rate": 1.1447047170077576e-06, + "loss": 0.666, + "step": 55032 + }, + { + "epoch": 1.41, + "learning_rate": 1.1446773377332212e-06, + "loss": 0.771, + "step": 55033 + }, + { + "epoch": 1.41, + "learning_rate": 1.1446499583479126e-06, + "loss": 0.7842, + "step": 55034 + }, + { + "epoch": 1.41, + "learning_rate": 1.1446225788518515e-06, + "loss": 0.8262, + "step": 55035 + }, + { + "epoch": 1.41, + "learning_rate": 1.14459519924506e-06, + "loss": 0.6704, + "step": 55036 + }, + { + "epoch": 1.41, + "learning_rate": 1.1445678195275584e-06, + "loss": 0.6548, + "step": 55037 + }, + { + "epoch": 1.41, + "learning_rate": 1.1445404396993678e-06, + "loss": 0.6301, + "step": 55038 + }, + { + "epoch": 1.41, + "learning_rate": 1.1445130597605094e-06, + "loss": 0.614, + "step": 55039 + }, + { + "epoch": 1.41, + "learning_rate": 1.1444856797110044e-06, + "loss": 0.7178, + "step": 55040 + }, + { + "epoch": 1.41, + "learning_rate": 1.144458299550873e-06, + "loss": 0.5215, + "step": 55041 + }, + { + "epoch": 1.41, + "learning_rate": 1.1444309192801363e-06, + "loss": 0.5903, + "step": 55042 + }, + { + "epoch": 1.41, + "learning_rate": 1.1444035388988156e-06, + "loss": 0.6816, + "step": 55043 + }, + { + "epoch": 1.41, + "learning_rate": 1.1443761584069315e-06, + "loss": 0.6553, + "step": 55044 + }, + { + "epoch": 1.41, + "learning_rate": 1.1443487778045056e-06, + "loss": 0.5659, + "step": 55045 + }, + { + "epoch": 1.41, + "learning_rate": 1.1443213970915583e-06, + "loss": 0.7002, + "step": 55046 + }, + { + "epoch": 1.41, + "learning_rate": 1.1442940162681112e-06, + "loss": 0.6387, + "step": 55047 + }, + { + "epoch": 1.41, + "learning_rate": 1.1442666353341841e-06, + "loss": 0.7783, + "step": 55048 + }, + { + "epoch": 1.41, + "learning_rate": 1.1442392542897993e-06, + "loss": 0.6445, + "step": 55049 + }, + { + "epoch": 1.41, + "learning_rate": 1.1442118731349766e-06, + "loss": 0.647, + "step": 55050 + }, + { + "epoch": 1.41, + "learning_rate": 1.1441844918697378e-06, + "loss": 0.752, + "step": 55051 + }, + { + "epoch": 1.41, + "learning_rate": 1.1441571104941034e-06, + "loss": 0.6865, + "step": 55052 + }, + { + "epoch": 1.41, + "learning_rate": 1.1441297290080946e-06, + "loss": 0.667, + "step": 55053 + }, + { + "epoch": 1.41, + "learning_rate": 1.1441023474117325e-06, + "loss": 0.688, + "step": 55054 + }, + { + "epoch": 1.41, + "learning_rate": 1.1440749657050377e-06, + "loss": 0.7246, + "step": 55055 + }, + { + "epoch": 1.41, + "learning_rate": 1.1440475838880311e-06, + "loss": 0.6704, + "step": 55056 + }, + { + "epoch": 1.41, + "learning_rate": 1.1440202019607343e-06, + "loss": 0.7627, + "step": 55057 + }, + { + "epoch": 1.41, + "learning_rate": 1.1439928199231675e-06, + "loss": 0.8533, + "step": 55058 + }, + { + "epoch": 1.41, + "learning_rate": 1.1439654377753522e-06, + "loss": 0.6494, + "step": 55059 + }, + { + "epoch": 1.41, + "learning_rate": 1.1439380555173091e-06, + "loss": 0.6777, + "step": 55060 + }, + { + "epoch": 1.41, + "learning_rate": 1.1439106731490594e-06, + "loss": 0.6284, + "step": 55061 + }, + { + "epoch": 1.41, + "learning_rate": 1.1438832906706236e-06, + "loss": 0.6538, + "step": 55062 + }, + { + "epoch": 1.41, + "learning_rate": 1.1438559080820232e-06, + "loss": 0.6797, + "step": 55063 + }, + { + "epoch": 1.41, + "learning_rate": 1.1438285253832792e-06, + "loss": 0.8135, + "step": 55064 + }, + { + "epoch": 1.41, + "learning_rate": 1.1438011425744119e-06, + "loss": 0.6812, + "step": 55065 + }, + { + "epoch": 1.41, + "learning_rate": 1.143773759655443e-06, + "loss": 0.6567, + "step": 55066 + }, + { + "epoch": 1.41, + "learning_rate": 1.1437463766263928e-06, + "loss": 0.4688, + "step": 55067 + }, + { + "epoch": 1.41, + "learning_rate": 1.143718993487283e-06, + "loss": 0.751, + "step": 55068 + }, + { + "epoch": 1.41, + "learning_rate": 1.1436916102381338e-06, + "loss": 0.6506, + "step": 55069 + }, + { + "epoch": 1.41, + "learning_rate": 1.1436642268789667e-06, + "loss": 0.6992, + "step": 55070 + }, + { + "epoch": 1.41, + "learning_rate": 1.1436368434098025e-06, + "loss": 0.6924, + "step": 55071 + }, + { + "epoch": 1.41, + "learning_rate": 1.1436094598306622e-06, + "loss": 0.5957, + "step": 55072 + }, + { + "epoch": 1.41, + "learning_rate": 1.1435820761415667e-06, + "loss": 0.6758, + "step": 55073 + }, + { + "epoch": 1.41, + "learning_rate": 1.143554692342537e-06, + "loss": 0.8691, + "step": 55074 + }, + { + "epoch": 1.41, + "learning_rate": 1.143527308433594e-06, + "loss": 0.6455, + "step": 55075 + }, + { + "epoch": 1.41, + "learning_rate": 1.143499924414759e-06, + "loss": 0.585, + "step": 55076 + }, + { + "epoch": 1.41, + "learning_rate": 1.1434725402860526e-06, + "loss": 0.5159, + "step": 55077 + }, + { + "epoch": 1.41, + "learning_rate": 1.1434451560474957e-06, + "loss": 0.6802, + "step": 55078 + }, + { + "epoch": 1.41, + "learning_rate": 1.1434177716991094e-06, + "loss": 0.9199, + "step": 55079 + }, + { + "epoch": 1.41, + "learning_rate": 1.143390387240915e-06, + "loss": 0.541, + "step": 55080 + }, + { + "epoch": 1.41, + "learning_rate": 1.1433630026729331e-06, + "loss": 0.6528, + "step": 55081 + }, + { + "epoch": 1.41, + "learning_rate": 1.1433356179951846e-06, + "loss": 0.6758, + "step": 55082 + }, + { + "epoch": 1.41, + "learning_rate": 1.1433082332076906e-06, + "loss": 0.5312, + "step": 55083 + }, + { + "epoch": 1.41, + "learning_rate": 1.1432808483104722e-06, + "loss": 0.6846, + "step": 55084 + }, + { + "epoch": 1.41, + "learning_rate": 1.1432534633035501e-06, + "loss": 0.7266, + "step": 55085 + }, + { + "epoch": 1.41, + "learning_rate": 1.1432260781869455e-06, + "loss": 0.8135, + "step": 55086 + }, + { + "epoch": 1.41, + "learning_rate": 1.1431986929606794e-06, + "loss": 0.5584, + "step": 55087 + }, + { + "epoch": 1.41, + "learning_rate": 1.1431713076247725e-06, + "loss": 0.7217, + "step": 55088 + }, + { + "epoch": 1.41, + "learning_rate": 1.1431439221792461e-06, + "loss": 0.6782, + "step": 55089 + }, + { + "epoch": 1.41, + "learning_rate": 1.1431165366241207e-06, + "loss": 0.6842, + "step": 55090 + }, + { + "epoch": 1.41, + "learning_rate": 1.1430891509594178e-06, + "loss": 0.6865, + "step": 55091 + }, + { + "epoch": 1.41, + "learning_rate": 1.143061765185158e-06, + "loss": 0.624, + "step": 55092 + }, + { + "epoch": 1.41, + "learning_rate": 1.1430343793013625e-06, + "loss": 0.6255, + "step": 55093 + }, + { + "epoch": 1.41, + "learning_rate": 1.1430069933080517e-06, + "loss": 0.8008, + "step": 55094 + }, + { + "epoch": 1.41, + "learning_rate": 1.1429796072052472e-06, + "loss": 0.7666, + "step": 55095 + }, + { + "epoch": 1.41, + "learning_rate": 1.1429522209929704e-06, + "loss": 0.6533, + "step": 55096 + }, + { + "epoch": 1.41, + "learning_rate": 1.1429248346712412e-06, + "loss": 0.584, + "step": 55097 + }, + { + "epoch": 1.41, + "learning_rate": 1.1428974482400809e-06, + "loss": 0.7227, + "step": 55098 + }, + { + "epoch": 1.41, + "learning_rate": 1.1428700616995105e-06, + "loss": 0.627, + "step": 55099 + }, + { + "epoch": 1.41, + "learning_rate": 1.1428426750495512e-06, + "loss": 0.7354, + "step": 55100 + }, + { + "epoch": 1.41, + "learning_rate": 1.1428152882902243e-06, + "loss": 0.585, + "step": 55101 + }, + { + "epoch": 1.41, + "learning_rate": 1.1427879014215498e-06, + "loss": 0.5728, + "step": 55102 + }, + { + "epoch": 1.41, + "learning_rate": 1.1427605144435492e-06, + "loss": 0.645, + "step": 55103 + }, + { + "epoch": 1.41, + "learning_rate": 1.1427331273562435e-06, + "loss": 0.6001, + "step": 55104 + }, + { + "epoch": 1.41, + "learning_rate": 1.1427057401596538e-06, + "loss": 0.665, + "step": 55105 + }, + { + "epoch": 1.41, + "learning_rate": 1.1426783528538007e-06, + "loss": 0.6016, + "step": 55106 + }, + { + "epoch": 1.41, + "learning_rate": 1.142650965438705e-06, + "loss": 0.6001, + "step": 55107 + }, + { + "epoch": 1.41, + "learning_rate": 1.1426235779143887e-06, + "loss": 0.5732, + "step": 55108 + }, + { + "epoch": 1.41, + "learning_rate": 1.1425961902808717e-06, + "loss": 0.4312, + "step": 55109 + }, + { + "epoch": 1.41, + "learning_rate": 1.1425688025381755e-06, + "loss": 0.6711, + "step": 55110 + }, + { + "epoch": 1.41, + "learning_rate": 1.1425414146863209e-06, + "loss": 0.3315, + "step": 55111 + }, + { + "epoch": 1.41, + "learning_rate": 1.1425140267253288e-06, + "loss": 0.3545, + "step": 55112 + }, + { + "epoch": 1.41, + "learning_rate": 1.14248663865522e-06, + "loss": 0.6123, + "step": 55113 + }, + { + "epoch": 1.41, + "learning_rate": 1.142459250476016e-06, + "loss": 0.5322, + "step": 55114 + }, + { + "epoch": 1.41, + "learning_rate": 1.1424318621877379e-06, + "loss": 0.5625, + "step": 55115 + }, + { + "epoch": 1.41, + "learning_rate": 1.1424044737904057e-06, + "loss": 0.6387, + "step": 55116 + }, + { + "epoch": 1.41, + "learning_rate": 1.1423770852840411e-06, + "loss": 0.7324, + "step": 55117 + }, + { + "epoch": 1.41, + "learning_rate": 1.142349696668665e-06, + "loss": 0.6904, + "step": 55118 + }, + { + "epoch": 1.41, + "learning_rate": 1.1423223079442981e-06, + "loss": 0.6562, + "step": 55119 + }, + { + "epoch": 1.41, + "learning_rate": 1.142294919110962e-06, + "loss": 0.7061, + "step": 55120 + }, + { + "epoch": 1.41, + "learning_rate": 1.1422675301686767e-06, + "loss": 0.6611, + "step": 55121 + }, + { + "epoch": 1.41, + "learning_rate": 1.142240141117464e-06, + "loss": 0.6953, + "step": 55122 + }, + { + "epoch": 1.41, + "learning_rate": 1.1422127519573444e-06, + "loss": 0.6519, + "step": 55123 + }, + { + "epoch": 1.41, + "learning_rate": 1.142185362688339e-06, + "loss": 0.6875, + "step": 55124 + }, + { + "epoch": 1.41, + "learning_rate": 1.1421579733104689e-06, + "loss": 0.6543, + "step": 55125 + }, + { + "epoch": 1.41, + "learning_rate": 1.142130583823755e-06, + "loss": 0.6577, + "step": 55126 + }, + { + "epoch": 1.41, + "learning_rate": 1.1421031942282182e-06, + "loss": 0.6519, + "step": 55127 + }, + { + "epoch": 1.41, + "learning_rate": 1.1420758045238794e-06, + "loss": 0.4346, + "step": 55128 + }, + { + "epoch": 1.41, + "learning_rate": 1.1420484147107599e-06, + "loss": 0.7349, + "step": 55129 + }, + { + "epoch": 1.41, + "learning_rate": 1.1420210247888804e-06, + "loss": 0.4702, + "step": 55130 + }, + { + "epoch": 1.41, + "learning_rate": 1.1419936347582622e-06, + "loss": 0.4873, + "step": 55131 + }, + { + "epoch": 1.41, + "learning_rate": 1.1419662446189255e-06, + "loss": 0.644, + "step": 55132 + }, + { + "epoch": 1.41, + "learning_rate": 1.1419388543708922e-06, + "loss": 0.501, + "step": 55133 + }, + { + "epoch": 1.41, + "learning_rate": 1.1419114640141822e-06, + "loss": 0.6572, + "step": 55134 + }, + { + "epoch": 1.41, + "learning_rate": 1.141884073548818e-06, + "loss": 0.6978, + "step": 55135 + }, + { + "epoch": 1.41, + "learning_rate": 1.1418566829748191e-06, + "loss": 0.8799, + "step": 55136 + }, + { + "epoch": 1.41, + "learning_rate": 1.1418292922922073e-06, + "loss": 0.6631, + "step": 55137 + }, + { + "epoch": 1.41, + "learning_rate": 1.1418019015010033e-06, + "loss": 0.7393, + "step": 55138 + }, + { + "epoch": 1.41, + "learning_rate": 1.1417745106012279e-06, + "loss": 0.7939, + "step": 55139 + }, + { + "epoch": 1.41, + "learning_rate": 1.1417471195929025e-06, + "loss": 0.5237, + "step": 55140 + }, + { + "epoch": 1.41, + "learning_rate": 1.1417197284760478e-06, + "loss": 0.7529, + "step": 55141 + }, + { + "epoch": 1.41, + "learning_rate": 1.1416923372506845e-06, + "loss": 0.7246, + "step": 55142 + }, + { + "epoch": 1.41, + "learning_rate": 1.1416649459168344e-06, + "loss": 0.5234, + "step": 55143 + }, + { + "epoch": 1.41, + "learning_rate": 1.1416375544745177e-06, + "loss": 0.6318, + "step": 55144 + }, + { + "epoch": 1.41, + "learning_rate": 1.1416101629237557e-06, + "loss": 0.7676, + "step": 55145 + }, + { + "epoch": 1.41, + "learning_rate": 1.1415827712645693e-06, + "loss": 0.6177, + "step": 55146 + }, + { + "epoch": 1.41, + "learning_rate": 1.1415553794969795e-06, + "loss": 0.606, + "step": 55147 + }, + { + "epoch": 1.41, + "learning_rate": 1.1415279876210073e-06, + "loss": 0.4443, + "step": 55148 + }, + { + "epoch": 1.41, + "learning_rate": 1.1415005956366737e-06, + "loss": 0.4619, + "step": 55149 + }, + { + "epoch": 1.41, + "learning_rate": 1.1414732035439994e-06, + "loss": 0.7393, + "step": 55150 + }, + { + "epoch": 1.41, + "learning_rate": 1.1414458113430054e-06, + "loss": 0.5732, + "step": 55151 + }, + { + "epoch": 1.41, + "learning_rate": 1.1414184190337132e-06, + "loss": 0.6699, + "step": 55152 + }, + { + "epoch": 1.41, + "learning_rate": 1.1413910266161432e-06, + "loss": 0.4863, + "step": 55153 + }, + { + "epoch": 1.41, + "learning_rate": 1.1413636340903168e-06, + "loss": 0.5259, + "step": 55154 + }, + { + "epoch": 1.41, + "learning_rate": 1.1413362414562548e-06, + "loss": 0.7646, + "step": 55155 + }, + { + "epoch": 1.41, + "learning_rate": 1.141308848713978e-06, + "loss": 0.7393, + "step": 55156 + }, + { + "epoch": 1.41, + "learning_rate": 1.1412814558635073e-06, + "loss": 0.6396, + "step": 55157 + }, + { + "epoch": 1.41, + "learning_rate": 1.1412540629048641e-06, + "loss": 0.7207, + "step": 55158 + }, + { + "epoch": 1.41, + "learning_rate": 1.141226669838069e-06, + "loss": 0.7852, + "step": 55159 + }, + { + "epoch": 1.41, + "learning_rate": 1.1411992766631437e-06, + "loss": 0.6772, + "step": 55160 + }, + { + "epoch": 1.41, + "learning_rate": 1.141171883380108e-06, + "loss": 0.5605, + "step": 55161 + }, + { + "epoch": 1.41, + "learning_rate": 1.1411444899889837e-06, + "loss": 0.6304, + "step": 55162 + }, + { + "epoch": 1.41, + "learning_rate": 1.1411170964897917e-06, + "loss": 0.8525, + "step": 55163 + }, + { + "epoch": 1.41, + "learning_rate": 1.1410897028825525e-06, + "loss": 0.7188, + "step": 55164 + }, + { + "epoch": 1.41, + "learning_rate": 1.1410623091672877e-06, + "loss": 0.7236, + "step": 55165 + }, + { + "epoch": 1.41, + "learning_rate": 1.141034915344018e-06, + "loss": 0.7402, + "step": 55166 + }, + { + "epoch": 1.41, + "learning_rate": 1.1410075214127638e-06, + "loss": 0.7026, + "step": 55167 + }, + { + "epoch": 1.41, + "learning_rate": 1.140980127373547e-06, + "loss": 0.6016, + "step": 55168 + }, + { + "epoch": 1.41, + "learning_rate": 1.1409527332263881e-06, + "loss": 0.4503, + "step": 55169 + }, + { + "epoch": 1.41, + "learning_rate": 1.1409253389713085e-06, + "loss": 0.353, + "step": 55170 + }, + { + "epoch": 1.41, + "learning_rate": 1.1408979446083286e-06, + "loss": 0.6431, + "step": 55171 + }, + { + "epoch": 1.41, + "learning_rate": 1.1408705501374695e-06, + "loss": 0.7959, + "step": 55172 + }, + { + "epoch": 1.41, + "learning_rate": 1.1408431555587526e-06, + "loss": 0.75, + "step": 55173 + }, + { + "epoch": 1.41, + "learning_rate": 1.1408157608721982e-06, + "loss": 0.5132, + "step": 55174 + }, + { + "epoch": 1.41, + "learning_rate": 1.1407883660778284e-06, + "loss": 0.5132, + "step": 55175 + }, + { + "epoch": 1.41, + "learning_rate": 1.1407609711756627e-06, + "loss": 0.6201, + "step": 55176 + }, + { + "epoch": 1.41, + "learning_rate": 1.140733576165723e-06, + "loss": 0.4622, + "step": 55177 + }, + { + "epoch": 1.41, + "learning_rate": 1.1407061810480298e-06, + "loss": 0.7026, + "step": 55178 + }, + { + "epoch": 1.41, + "learning_rate": 1.140678785822605e-06, + "loss": 0.6196, + "step": 55179 + }, + { + "epoch": 1.41, + "learning_rate": 1.1406513904894684e-06, + "loss": 0.7939, + "step": 55180 + }, + { + "epoch": 1.41, + "learning_rate": 1.1406239950486415e-06, + "loss": 0.5317, + "step": 55181 + }, + { + "epoch": 1.41, + "learning_rate": 1.1405965995001454e-06, + "loss": 0.7246, + "step": 55182 + }, + { + "epoch": 1.41, + "learning_rate": 1.1405692038440011e-06, + "loss": 0.6484, + "step": 55183 + }, + { + "epoch": 1.41, + "learning_rate": 1.1405418080802292e-06, + "loss": 0.564, + "step": 55184 + }, + { + "epoch": 1.41, + "learning_rate": 1.1405144122088511e-06, + "loss": 0.5211, + "step": 55185 + }, + { + "epoch": 1.41, + "learning_rate": 1.1404870162298873e-06, + "loss": 0.71, + "step": 55186 + }, + { + "epoch": 1.41, + "learning_rate": 1.1404596201433595e-06, + "loss": 0.6987, + "step": 55187 + }, + { + "epoch": 1.41, + "learning_rate": 1.1404322239492876e-06, + "loss": 0.834, + "step": 55188 + }, + { + "epoch": 1.41, + "learning_rate": 1.1404048276476937e-06, + "loss": 0.7031, + "step": 55189 + }, + { + "epoch": 1.41, + "learning_rate": 1.140377431238598e-06, + "loss": 0.5894, + "step": 55190 + }, + { + "epoch": 1.41, + "learning_rate": 1.1403500347220218e-06, + "loss": 0.5405, + "step": 55191 + }, + { + "epoch": 1.41, + "learning_rate": 1.1403226380979863e-06, + "loss": 0.6689, + "step": 55192 + }, + { + "epoch": 1.41, + "learning_rate": 1.140295241366512e-06, + "loss": 0.7695, + "step": 55193 + }, + { + "epoch": 1.41, + "learning_rate": 1.14026784452762e-06, + "loss": 0.6313, + "step": 55194 + }, + { + "epoch": 1.41, + "learning_rate": 1.1402404475813314e-06, + "loss": 0.4775, + "step": 55195 + }, + { + "epoch": 1.41, + "learning_rate": 1.1402130505276672e-06, + "loss": 0.7246, + "step": 55196 + }, + { + "epoch": 1.41, + "learning_rate": 1.1401856533666482e-06, + "loss": 0.4802, + "step": 55197 + }, + { + "epoch": 1.41, + "learning_rate": 1.1401582560982957e-06, + "loss": 0.7144, + "step": 55198 + }, + { + "epoch": 1.41, + "learning_rate": 1.14013085872263e-06, + "loss": 0.8066, + "step": 55199 + }, + { + "epoch": 1.41, + "learning_rate": 1.1401034612396733e-06, + "loss": 0.6943, + "step": 55200 + }, + { + "epoch": 1.41, + "learning_rate": 1.1400760636494453e-06, + "loss": 0.6055, + "step": 55201 + }, + { + "epoch": 1.41, + "learning_rate": 1.1400486659519678e-06, + "loss": 0.5898, + "step": 55202 + }, + { + "epoch": 1.41, + "learning_rate": 1.140021268147261e-06, + "loss": 0.7676, + "step": 55203 + }, + { + "epoch": 1.41, + "learning_rate": 1.139993870235347e-06, + "loss": 0.6431, + "step": 55204 + }, + { + "epoch": 1.41, + "learning_rate": 1.1399664722162456e-06, + "loss": 0.4868, + "step": 55205 + }, + { + "epoch": 1.41, + "learning_rate": 1.1399390740899786e-06, + "loss": 0.7119, + "step": 55206 + }, + { + "epoch": 1.41, + "learning_rate": 1.1399116758565665e-06, + "loss": 0.6016, + "step": 55207 + }, + { + "epoch": 1.42, + "learning_rate": 1.1398842775160306e-06, + "loss": 0.689, + "step": 55208 + }, + { + "epoch": 1.42, + "learning_rate": 1.1398568790683916e-06, + "loss": 0.5813, + "step": 55209 + }, + { + "epoch": 1.42, + "learning_rate": 1.139829480513671e-06, + "loss": 0.7871, + "step": 55210 + }, + { + "epoch": 1.42, + "learning_rate": 1.1398020818518889e-06, + "loss": 0.7266, + "step": 55211 + }, + { + "epoch": 1.42, + "learning_rate": 1.139774683083067e-06, + "loss": 0.5682, + "step": 55212 + }, + { + "epoch": 1.42, + "learning_rate": 1.139747284207226e-06, + "loss": 0.7166, + "step": 55213 + }, + { + "epoch": 1.42, + "learning_rate": 1.139719885224387e-06, + "loss": 0.6177, + "step": 55214 + }, + { + "epoch": 1.42, + "learning_rate": 1.139692486134571e-06, + "loss": 0.8633, + "step": 55215 + }, + { + "epoch": 1.42, + "learning_rate": 1.1396650869377985e-06, + "loss": 0.5269, + "step": 55216 + }, + { + "epoch": 1.42, + "learning_rate": 1.1396376876340913e-06, + "loss": 0.6396, + "step": 55217 + }, + { + "epoch": 1.42, + "learning_rate": 1.1396102882234694e-06, + "loss": 0.6626, + "step": 55218 + }, + { + "epoch": 1.42, + "learning_rate": 1.1395828887059548e-06, + "loss": 0.6953, + "step": 55219 + }, + { + "epoch": 1.42, + "learning_rate": 1.1395554890815679e-06, + "loss": 0.7402, + "step": 55220 + }, + { + "epoch": 1.42, + "learning_rate": 1.1395280893503299e-06, + "loss": 0.571, + "step": 55221 + }, + { + "epoch": 1.42, + "learning_rate": 1.1395006895122615e-06, + "loss": 0.6914, + "step": 55222 + }, + { + "epoch": 1.42, + "learning_rate": 1.1394732895673838e-06, + "loss": 0.6328, + "step": 55223 + }, + { + "epoch": 1.42, + "learning_rate": 1.1394458895157177e-06, + "loss": 0.5762, + "step": 55224 + }, + { + "epoch": 1.42, + "learning_rate": 1.139418489357285e-06, + "loss": 0.8047, + "step": 55225 + }, + { + "epoch": 1.42, + "learning_rate": 1.1393910890921051e-06, + "loss": 0.6382, + "step": 55226 + }, + { + "epoch": 1.42, + "learning_rate": 1.1393636887202002e-06, + "loss": 0.6953, + "step": 55227 + }, + { + "epoch": 1.42, + "learning_rate": 1.139336288241591e-06, + "loss": 0.7129, + "step": 55228 + }, + { + "epoch": 1.42, + "learning_rate": 1.1393088876562983e-06, + "loss": 0.6855, + "step": 55229 + }, + { + "epoch": 1.42, + "learning_rate": 1.1392814869643432e-06, + "loss": 0.584, + "step": 55230 + }, + { + "epoch": 1.42, + "learning_rate": 1.1392540861657467e-06, + "loss": 0.7412, + "step": 55231 + }, + { + "epoch": 1.42, + "learning_rate": 1.1392266852605297e-06, + "loss": 0.6205, + "step": 55232 + }, + { + "epoch": 1.42, + "learning_rate": 1.1391992842487132e-06, + "loss": 0.7139, + "step": 55233 + }, + { + "epoch": 1.42, + "learning_rate": 1.1391718831303184e-06, + "loss": 0.5625, + "step": 55234 + }, + { + "epoch": 1.42, + "learning_rate": 1.139144481905366e-06, + "loss": 0.5859, + "step": 55235 + }, + { + "epoch": 1.42, + "learning_rate": 1.139117080573877e-06, + "loss": 0.6582, + "step": 55236 + }, + { + "epoch": 1.42, + "learning_rate": 1.1390896791358723e-06, + "loss": 0.6045, + "step": 55237 + }, + { + "epoch": 1.42, + "learning_rate": 1.1390622775913735e-06, + "loss": 0.6128, + "step": 55238 + }, + { + "epoch": 1.42, + "learning_rate": 1.1390348759404008e-06, + "loss": 0.7471, + "step": 55239 + }, + { + "epoch": 1.42, + "learning_rate": 1.1390074741829757e-06, + "loss": 0.5439, + "step": 55240 + }, + { + "epoch": 1.42, + "learning_rate": 1.1389800723191185e-06, + "loss": 0.7358, + "step": 55241 + }, + { + "epoch": 1.42, + "learning_rate": 1.138952670348851e-06, + "loss": 0.6182, + "step": 55242 + }, + { + "epoch": 1.42, + "learning_rate": 1.1389252682721934e-06, + "loss": 0.7568, + "step": 55243 + }, + { + "epoch": 1.42, + "learning_rate": 1.1388978660891677e-06, + "loss": 0.6357, + "step": 55244 + }, + { + "epoch": 1.42, + "learning_rate": 1.138870463799794e-06, + "loss": 0.7822, + "step": 55245 + }, + { + "epoch": 1.42, + "learning_rate": 1.1388430614040938e-06, + "loss": 0.7773, + "step": 55246 + }, + { + "epoch": 1.42, + "learning_rate": 1.1388156589020876e-06, + "loss": 0.6494, + "step": 55247 + }, + { + "epoch": 1.42, + "learning_rate": 1.1387882562937967e-06, + "loss": 0.6855, + "step": 55248 + }, + { + "epoch": 1.42, + "learning_rate": 1.138760853579242e-06, + "loss": 0.8262, + "step": 55249 + }, + { + "epoch": 1.42, + "learning_rate": 1.1387334507584447e-06, + "loss": 0.7266, + "step": 55250 + }, + { + "epoch": 1.42, + "learning_rate": 1.1387060478314251e-06, + "loss": 0.6382, + "step": 55251 + }, + { + "epoch": 1.42, + "learning_rate": 1.1386786447982053e-06, + "loss": 0.5728, + "step": 55252 + }, + { + "epoch": 1.42, + "learning_rate": 1.138651241658805e-06, + "loss": 0.665, + "step": 55253 + }, + { + "epoch": 1.42, + "learning_rate": 1.1386238384132463e-06, + "loss": 0.625, + "step": 55254 + }, + { + "epoch": 1.42, + "learning_rate": 1.1385964350615495e-06, + "loss": 0.6616, + "step": 55255 + }, + { + "epoch": 1.42, + "learning_rate": 1.138569031603736e-06, + "loss": 0.5361, + "step": 55256 + }, + { + "epoch": 1.42, + "learning_rate": 1.1385416280398262e-06, + "loss": 0.7227, + "step": 55257 + }, + { + "epoch": 1.42, + "learning_rate": 1.1385142243698416e-06, + "loss": 0.8789, + "step": 55258 + }, + { + "epoch": 1.42, + "learning_rate": 1.138486820593803e-06, + "loss": 0.6377, + "step": 55259 + }, + { + "epoch": 1.42, + "learning_rate": 1.1384594167117314e-06, + "loss": 0.5669, + "step": 55260 + }, + { + "epoch": 1.42, + "learning_rate": 1.138432012723648e-06, + "loss": 0.5771, + "step": 55261 + }, + { + "epoch": 1.42, + "learning_rate": 1.138404608629573e-06, + "loss": 0.9062, + "step": 55262 + }, + { + "epoch": 1.42, + "learning_rate": 1.1383772044295286e-06, + "loss": 0.6543, + "step": 55263 + }, + { + "epoch": 1.42, + "learning_rate": 1.1383498001235347e-06, + "loss": 0.6782, + "step": 55264 + }, + { + "epoch": 1.42, + "learning_rate": 1.1383223957116133e-06, + "loss": 0.6567, + "step": 55265 + }, + { + "epoch": 1.42, + "learning_rate": 1.1382949911937843e-06, + "loss": 0.6543, + "step": 55266 + }, + { + "epoch": 1.42, + "learning_rate": 1.1382675865700692e-06, + "loss": 0.6201, + "step": 55267 + }, + { + "epoch": 1.42, + "learning_rate": 1.138240181840489e-06, + "loss": 0.7275, + "step": 55268 + }, + { + "epoch": 1.42, + "learning_rate": 1.1382127770050649e-06, + "loss": 0.6802, + "step": 55269 + }, + { + "epoch": 1.42, + "learning_rate": 1.1381853720638174e-06, + "loss": 0.7334, + "step": 55270 + }, + { + "epoch": 1.42, + "learning_rate": 1.1381579670167677e-06, + "loss": 0.627, + "step": 55271 + }, + { + "epoch": 1.42, + "learning_rate": 1.138130561863937e-06, + "loss": 0.4626, + "step": 55272 + }, + { + "epoch": 1.42, + "learning_rate": 1.1381031566053458e-06, + "loss": 0.6143, + "step": 55273 + }, + { + "epoch": 1.42, + "learning_rate": 1.1380757512410156e-06, + "loss": 0.5205, + "step": 55274 + }, + { + "epoch": 1.42, + "learning_rate": 1.1380483457709674e-06, + "loss": 0.5388, + "step": 55275 + }, + { + "epoch": 1.42, + "learning_rate": 1.1380209401952213e-06, + "loss": 0.5803, + "step": 55276 + }, + { + "epoch": 1.42, + "learning_rate": 1.1379935345137992e-06, + "loss": 0.4988, + "step": 55277 + }, + { + "epoch": 1.42, + "learning_rate": 1.1379661287267218e-06, + "loss": 0.6257, + "step": 55278 + }, + { + "epoch": 1.42, + "learning_rate": 1.13793872283401e-06, + "loss": 0.6816, + "step": 55279 + }, + { + "epoch": 1.42, + "learning_rate": 1.1379113168356852e-06, + "loss": 0.679, + "step": 55280 + }, + { + "epoch": 1.42, + "learning_rate": 1.1378839107317675e-06, + "loss": 0.6499, + "step": 55281 + }, + { + "epoch": 1.42, + "learning_rate": 1.1378565045222787e-06, + "loss": 0.6162, + "step": 55282 + }, + { + "epoch": 1.42, + "learning_rate": 1.1378290982072396e-06, + "loss": 0.6787, + "step": 55283 + }, + { + "epoch": 1.42, + "learning_rate": 1.1378016917866709e-06, + "loss": 0.6172, + "step": 55284 + }, + { + "epoch": 1.42, + "learning_rate": 1.137774285260594e-06, + "loss": 0.542, + "step": 55285 + }, + { + "epoch": 1.42, + "learning_rate": 1.1377468786290297e-06, + "loss": 0.709, + "step": 55286 + }, + { + "epoch": 1.42, + "learning_rate": 1.1377194718919985e-06, + "loss": 0.7012, + "step": 55287 + }, + { + "epoch": 1.42, + "learning_rate": 1.1376920650495222e-06, + "loss": 0.4895, + "step": 55288 + }, + { + "epoch": 1.42, + "learning_rate": 1.1376646581016213e-06, + "loss": 0.7246, + "step": 55289 + }, + { + "epoch": 1.42, + "learning_rate": 1.1376372510483171e-06, + "loss": 0.9531, + "step": 55290 + }, + { + "epoch": 1.42, + "learning_rate": 1.1376098438896302e-06, + "loss": 0.5972, + "step": 55291 + }, + { + "epoch": 1.42, + "learning_rate": 1.137582436625582e-06, + "loss": 0.7861, + "step": 55292 + }, + { + "epoch": 1.42, + "learning_rate": 1.1375550292561929e-06, + "loss": 0.6738, + "step": 55293 + }, + { + "epoch": 1.42, + "learning_rate": 1.1375276217814845e-06, + "loss": 0.6406, + "step": 55294 + }, + { + "epoch": 1.42, + "learning_rate": 1.1375002142014776e-06, + "loss": 0.6023, + "step": 55295 + }, + { + "epoch": 1.42, + "learning_rate": 1.1374728065161928e-06, + "loss": 0.5544, + "step": 55296 + }, + { + "epoch": 1.42, + "learning_rate": 1.1374453987256517e-06, + "loss": 0.6602, + "step": 55297 + }, + { + "epoch": 1.42, + "learning_rate": 1.1374179908298748e-06, + "loss": 0.6836, + "step": 55298 + }, + { + "epoch": 1.42, + "learning_rate": 1.137390582828883e-06, + "loss": 0.6943, + "step": 55299 + }, + { + "epoch": 1.42, + "learning_rate": 1.1373631747226982e-06, + "loss": 0.6064, + "step": 55300 + }, + { + "epoch": 1.42, + "learning_rate": 1.13733576651134e-06, + "loss": 0.6836, + "step": 55301 + }, + { + "epoch": 1.42, + "learning_rate": 1.1373083581948306e-06, + "loss": 0.5132, + "step": 55302 + }, + { + "epoch": 1.42, + "learning_rate": 1.1372809497731902e-06, + "loss": 0.5343, + "step": 55303 + }, + { + "epoch": 1.42, + "learning_rate": 1.1372535412464407e-06, + "loss": 0.6934, + "step": 55304 + }, + { + "epoch": 1.42, + "learning_rate": 1.137226132614602e-06, + "loss": 0.4474, + "step": 55305 + }, + { + "epoch": 1.42, + "learning_rate": 1.1371987238776953e-06, + "loss": 0.7012, + "step": 55306 + }, + { + "epoch": 1.42, + "learning_rate": 1.1371713150357422e-06, + "loss": 0.7744, + "step": 55307 + }, + { + "epoch": 1.42, + "learning_rate": 1.1371439060887632e-06, + "loss": 0.7529, + "step": 55308 + }, + { + "epoch": 1.42, + "learning_rate": 1.1371164970367798e-06, + "loss": 0.5142, + "step": 55309 + }, + { + "epoch": 1.42, + "learning_rate": 1.1370890878798123e-06, + "loss": 0.7705, + "step": 55310 + }, + { + "epoch": 1.42, + "learning_rate": 1.137061678617882e-06, + "loss": 0.6836, + "step": 55311 + }, + { + "epoch": 1.42, + "learning_rate": 1.1370342692510097e-06, + "loss": 0.6338, + "step": 55312 + }, + { + "epoch": 1.42, + "learning_rate": 1.1370068597792168e-06, + "loss": 0.7213, + "step": 55313 + }, + { + "epoch": 1.42, + "learning_rate": 1.1369794502025237e-06, + "loss": 0.6445, + "step": 55314 + }, + { + "epoch": 1.42, + "learning_rate": 1.1369520405209525e-06, + "loss": 0.6069, + "step": 55315 + }, + { + "epoch": 1.42, + "learning_rate": 1.1369246307345227e-06, + "loss": 0.6846, + "step": 55316 + }, + { + "epoch": 1.42, + "learning_rate": 1.1368972208432564e-06, + "loss": 0.793, + "step": 55317 + }, + { + "epoch": 1.42, + "learning_rate": 1.1368698108471738e-06, + "loss": 0.8145, + "step": 55318 + }, + { + "epoch": 1.42, + "learning_rate": 1.1368424007462967e-06, + "loss": 0.5603, + "step": 55319 + }, + { + "epoch": 1.42, + "learning_rate": 1.1368149905406455e-06, + "loss": 0.6924, + "step": 55320 + }, + { + "epoch": 1.42, + "learning_rate": 1.1367875802302413e-06, + "loss": 0.5765, + "step": 55321 + }, + { + "epoch": 1.42, + "learning_rate": 1.136760169815105e-06, + "loss": 0.6454, + "step": 55322 + }, + { + "epoch": 1.42, + "learning_rate": 1.136732759295258e-06, + "loss": 0.5938, + "step": 55323 + }, + { + "epoch": 1.42, + "learning_rate": 1.1367053486707207e-06, + "loss": 0.6621, + "step": 55324 + }, + { + "epoch": 1.42, + "learning_rate": 1.1366779379415148e-06, + "loss": 0.6895, + "step": 55325 + }, + { + "epoch": 1.42, + "learning_rate": 1.1366505271076607e-06, + "loss": 0.5234, + "step": 55326 + }, + { + "epoch": 1.42, + "learning_rate": 1.1366231161691794e-06, + "loss": 0.6174, + "step": 55327 + }, + { + "epoch": 1.42, + "learning_rate": 1.1365957051260923e-06, + "loss": 0.6277, + "step": 55328 + }, + { + "epoch": 1.42, + "learning_rate": 1.1365682939784202e-06, + "loss": 0.7539, + "step": 55329 + }, + { + "epoch": 1.42, + "learning_rate": 1.136540882726184e-06, + "loss": 0.5649, + "step": 55330 + }, + { + "epoch": 1.42, + "learning_rate": 1.1365134713694045e-06, + "loss": 0.4976, + "step": 55331 + }, + { + "epoch": 1.42, + "learning_rate": 1.136486059908103e-06, + "loss": 0.751, + "step": 55332 + }, + { + "epoch": 1.42, + "learning_rate": 1.1364586483423004e-06, + "loss": 0.7266, + "step": 55333 + }, + { + "epoch": 1.42, + "learning_rate": 1.136431236672018e-06, + "loss": 0.6499, + "step": 55334 + }, + { + "epoch": 1.42, + "learning_rate": 1.1364038248972761e-06, + "loss": 0.6113, + "step": 55335 + }, + { + "epoch": 1.42, + "learning_rate": 1.1363764130180961e-06, + "loss": 0.624, + "step": 55336 + }, + { + "epoch": 1.42, + "learning_rate": 1.1363490010344992e-06, + "loss": 0.6011, + "step": 55337 + }, + { + "epoch": 1.42, + "learning_rate": 1.136321588946506e-06, + "loss": 0.6167, + "step": 55338 + }, + { + "epoch": 1.42, + "learning_rate": 1.1362941767541374e-06, + "loss": 0.6973, + "step": 55339 + }, + { + "epoch": 1.42, + "learning_rate": 1.1362667644574151e-06, + "loss": 0.4526, + "step": 55340 + }, + { + "epoch": 1.42, + "learning_rate": 1.136239352056359e-06, + "loss": 0.7129, + "step": 55341 + }, + { + "epoch": 1.42, + "learning_rate": 1.1362119395509914e-06, + "loss": 0.5728, + "step": 55342 + }, + { + "epoch": 1.42, + "learning_rate": 1.1361845269413319e-06, + "loss": 0.6484, + "step": 55343 + }, + { + "epoch": 1.42, + "learning_rate": 1.1361571142274024e-06, + "loss": 0.6924, + "step": 55344 + }, + { + "epoch": 1.42, + "learning_rate": 1.136129701409224e-06, + "loss": 0.6534, + "step": 55345 + }, + { + "epoch": 1.42, + "learning_rate": 1.136102288486817e-06, + "loss": 0.6206, + "step": 55346 + }, + { + "epoch": 1.42, + "learning_rate": 1.1360748754602028e-06, + "loss": 0.6963, + "step": 55347 + }, + { + "epoch": 1.42, + "learning_rate": 1.1360474623294022e-06, + "loss": 0.7607, + "step": 55348 + }, + { + "epoch": 1.42, + "learning_rate": 1.1360200490944363e-06, + "loss": 0.6638, + "step": 55349 + }, + { + "epoch": 1.42, + "learning_rate": 1.1359926357553265e-06, + "loss": 0.6865, + "step": 55350 + }, + { + "epoch": 1.42, + "learning_rate": 1.135965222312093e-06, + "loss": 0.7266, + "step": 55351 + }, + { + "epoch": 1.42, + "learning_rate": 1.1359378087647574e-06, + "loss": 0.7373, + "step": 55352 + }, + { + "epoch": 1.42, + "learning_rate": 1.1359103951133401e-06, + "loss": 0.6514, + "step": 55353 + }, + { + "epoch": 1.42, + "learning_rate": 1.1358829813578627e-06, + "loss": 0.7046, + "step": 55354 + }, + { + "epoch": 1.42, + "learning_rate": 1.1358555674983464e-06, + "loss": 0.6055, + "step": 55355 + }, + { + "epoch": 1.42, + "learning_rate": 1.135828153534811e-06, + "loss": 0.7119, + "step": 55356 + }, + { + "epoch": 1.42, + "learning_rate": 1.1358007394672789e-06, + "loss": 0.5156, + "step": 55357 + }, + { + "epoch": 1.42, + "learning_rate": 1.1357733252957698e-06, + "loss": 0.8184, + "step": 55358 + }, + { + "epoch": 1.42, + "learning_rate": 1.135745911020306e-06, + "loss": 0.7393, + "step": 55359 + }, + { + "epoch": 1.42, + "learning_rate": 1.1357184966409072e-06, + "loss": 0.6353, + "step": 55360 + }, + { + "epoch": 1.42, + "learning_rate": 1.1356910821575952e-06, + "loss": 0.605, + "step": 55361 + }, + { + "epoch": 1.42, + "learning_rate": 1.1356636675703905e-06, + "loss": 0.6528, + "step": 55362 + }, + { + "epoch": 1.42, + "learning_rate": 1.1356362528793148e-06, + "loss": 0.5413, + "step": 55363 + }, + { + "epoch": 1.42, + "learning_rate": 1.1356088380843885e-06, + "loss": 0.7041, + "step": 55364 + }, + { + "epoch": 1.42, + "learning_rate": 1.1355814231856328e-06, + "loss": 0.645, + "step": 55365 + }, + { + "epoch": 1.42, + "learning_rate": 1.1355540081830686e-06, + "loss": 0.5488, + "step": 55366 + }, + { + "epoch": 1.42, + "learning_rate": 1.1355265930767168e-06, + "loss": 0.7324, + "step": 55367 + }, + { + "epoch": 1.42, + "learning_rate": 1.1354991778665986e-06, + "loss": 0.6382, + "step": 55368 + }, + { + "epoch": 1.42, + "learning_rate": 1.135471762552735e-06, + "loss": 0.6719, + "step": 55369 + }, + { + "epoch": 1.42, + "learning_rate": 1.1354443471351469e-06, + "loss": 0.6855, + "step": 55370 + }, + { + "epoch": 1.42, + "learning_rate": 1.1354169316138548e-06, + "loss": 0.5791, + "step": 55371 + }, + { + "epoch": 1.42, + "learning_rate": 1.1353895159888808e-06, + "loss": 0.6826, + "step": 55372 + }, + { + "epoch": 1.42, + "learning_rate": 1.135362100260245e-06, + "loss": 0.4307, + "step": 55373 + }, + { + "epoch": 1.42, + "learning_rate": 1.1353346844279687e-06, + "loss": 0.6719, + "step": 55374 + }, + { + "epoch": 1.42, + "learning_rate": 1.135307268492073e-06, + "loss": 0.4353, + "step": 55375 + }, + { + "epoch": 1.42, + "learning_rate": 1.135279852452579e-06, + "loss": 0.6572, + "step": 55376 + }, + { + "epoch": 1.42, + "learning_rate": 1.1352524363095067e-06, + "loss": 0.749, + "step": 55377 + }, + { + "epoch": 1.42, + "learning_rate": 1.135225020062878e-06, + "loss": 0.5444, + "step": 55378 + }, + { + "epoch": 1.42, + "learning_rate": 1.135197603712714e-06, + "loss": 0.6133, + "step": 55379 + }, + { + "epoch": 1.42, + "learning_rate": 1.1351701872590355e-06, + "loss": 0.6554, + "step": 55380 + }, + { + "epoch": 1.42, + "learning_rate": 1.1351427707018632e-06, + "loss": 0.7881, + "step": 55381 + }, + { + "epoch": 1.42, + "learning_rate": 1.1351153540412185e-06, + "loss": 0.6553, + "step": 55382 + }, + { + "epoch": 1.42, + "learning_rate": 1.1350879372771218e-06, + "loss": 0.8213, + "step": 55383 + }, + { + "epoch": 1.42, + "learning_rate": 1.1350605204095947e-06, + "loss": 0.7217, + "step": 55384 + }, + { + "epoch": 1.42, + "learning_rate": 1.135033103438658e-06, + "loss": 0.6, + "step": 55385 + }, + { + "epoch": 1.42, + "learning_rate": 1.1350056863643326e-06, + "loss": 0.4761, + "step": 55386 + }, + { + "epoch": 1.42, + "learning_rate": 1.1349782691866397e-06, + "loss": 0.5151, + "step": 55387 + }, + { + "epoch": 1.42, + "learning_rate": 1.1349508519055998e-06, + "loss": 0.4888, + "step": 55388 + }, + { + "epoch": 1.42, + "learning_rate": 1.1349234345212347e-06, + "loss": 0.5691, + "step": 55389 + }, + { + "epoch": 1.42, + "learning_rate": 1.134896017033565e-06, + "loss": 0.583, + "step": 55390 + }, + { + "epoch": 1.42, + "learning_rate": 1.134868599442611e-06, + "loss": 0.6685, + "step": 55391 + }, + { + "epoch": 1.42, + "learning_rate": 1.1348411817483948e-06, + "loss": 0.7275, + "step": 55392 + }, + { + "epoch": 1.42, + "learning_rate": 1.1348137639509365e-06, + "loss": 0.6162, + "step": 55393 + }, + { + "epoch": 1.42, + "learning_rate": 1.1347863460502578e-06, + "loss": 0.6602, + "step": 55394 + }, + { + "epoch": 1.42, + "learning_rate": 1.1347589280463795e-06, + "loss": 0.7559, + "step": 55395 + }, + { + "epoch": 1.42, + "learning_rate": 1.134731509939322e-06, + "loss": 0.7432, + "step": 55396 + }, + { + "epoch": 1.42, + "learning_rate": 1.1347040917291071e-06, + "loss": 0.7686, + "step": 55397 + }, + { + "epoch": 1.42, + "learning_rate": 1.1346766734157554e-06, + "loss": 0.8584, + "step": 55398 + }, + { + "epoch": 1.42, + "learning_rate": 1.134649254999288e-06, + "loss": 0.5938, + "step": 55399 + }, + { + "epoch": 1.42, + "learning_rate": 1.134621836479726e-06, + "loss": 0.7471, + "step": 55400 + }, + { + "epoch": 1.42, + "learning_rate": 1.1345944178570903e-06, + "loss": 0.7412, + "step": 55401 + }, + { + "epoch": 1.42, + "learning_rate": 1.1345669991314014e-06, + "loss": 0.6406, + "step": 55402 + }, + { + "epoch": 1.42, + "learning_rate": 1.1345395803026812e-06, + "loss": 0.7139, + "step": 55403 + }, + { + "epoch": 1.42, + "learning_rate": 1.13451216137095e-06, + "loss": 0.7783, + "step": 55404 + }, + { + "epoch": 1.42, + "learning_rate": 1.1344847423362291e-06, + "loss": 0.6582, + "step": 55405 + }, + { + "epoch": 1.42, + "learning_rate": 1.1344573231985392e-06, + "loss": 0.6128, + "step": 55406 + }, + { + "epoch": 1.42, + "learning_rate": 1.134429903957902e-06, + "loss": 0.5232, + "step": 55407 + }, + { + "epoch": 1.42, + "learning_rate": 1.1344024846143373e-06, + "loss": 0.6626, + "step": 55408 + }, + { + "epoch": 1.42, + "learning_rate": 1.1343750651678677e-06, + "loss": 0.5762, + "step": 55409 + }, + { + "epoch": 1.42, + "learning_rate": 1.1343476456185126e-06, + "loss": 0.6738, + "step": 55410 + }, + { + "epoch": 1.42, + "learning_rate": 1.1343202259662938e-06, + "loss": 0.6768, + "step": 55411 + }, + { + "epoch": 1.42, + "learning_rate": 1.1342928062112323e-06, + "loss": 0.6201, + "step": 55412 + }, + { + "epoch": 1.42, + "learning_rate": 1.134265386353349e-06, + "loss": 0.5245, + "step": 55413 + }, + { + "epoch": 1.42, + "learning_rate": 1.134237966392665e-06, + "loss": 0.6108, + "step": 55414 + }, + { + "epoch": 1.42, + "learning_rate": 1.1342105463292006e-06, + "loss": 0.8262, + "step": 55415 + }, + { + "epoch": 1.42, + "learning_rate": 1.1341831261629777e-06, + "loss": 0.6082, + "step": 55416 + }, + { + "epoch": 1.42, + "learning_rate": 1.134155705894017e-06, + "loss": 0.6636, + "step": 55417 + }, + { + "epoch": 1.42, + "learning_rate": 1.1341282855223393e-06, + "loss": 0.6631, + "step": 55418 + }, + { + "epoch": 1.42, + "learning_rate": 1.134100865047966e-06, + "loss": 0.603, + "step": 55419 + }, + { + "epoch": 1.42, + "learning_rate": 1.1340734444709176e-06, + "loss": 0.6199, + "step": 55420 + }, + { + "epoch": 1.42, + "learning_rate": 1.1340460237912154e-06, + "loss": 0.6294, + "step": 55421 + }, + { + "epoch": 1.42, + "learning_rate": 1.1340186030088804e-06, + "loss": 0.6255, + "step": 55422 + }, + { + "epoch": 1.42, + "learning_rate": 1.1339911821239333e-06, + "loss": 0.626, + "step": 55423 + }, + { + "epoch": 1.42, + "learning_rate": 1.1339637611363956e-06, + "loss": 0.6782, + "step": 55424 + }, + { + "epoch": 1.42, + "learning_rate": 1.1339363400462878e-06, + "loss": 0.7979, + "step": 55425 + }, + { + "epoch": 1.42, + "learning_rate": 1.1339089188536313e-06, + "loss": 0.7334, + "step": 55426 + }, + { + "epoch": 1.42, + "learning_rate": 1.1338814975584465e-06, + "loss": 0.7236, + "step": 55427 + }, + { + "epoch": 1.42, + "learning_rate": 1.1338540761607553e-06, + "loss": 0.7686, + "step": 55428 + }, + { + "epoch": 1.42, + "learning_rate": 1.1338266546605779e-06, + "loss": 0.6807, + "step": 55429 + }, + { + "epoch": 1.42, + "learning_rate": 1.1337992330579357e-06, + "loss": 0.626, + "step": 55430 + }, + { + "epoch": 1.42, + "learning_rate": 1.1337718113528493e-06, + "loss": 0.835, + "step": 55431 + }, + { + "epoch": 1.42, + "learning_rate": 1.1337443895453404e-06, + "loss": 0.583, + "step": 55432 + }, + { + "epoch": 1.42, + "learning_rate": 1.1337169676354292e-06, + "loss": 0.7695, + "step": 55433 + }, + { + "epoch": 1.42, + "learning_rate": 1.1336895456231373e-06, + "loss": 0.4667, + "step": 55434 + }, + { + "epoch": 1.42, + "learning_rate": 1.1336621235084855e-06, + "loss": 0.5947, + "step": 55435 + }, + { + "epoch": 1.42, + "learning_rate": 1.1336347012914946e-06, + "loss": 0.7656, + "step": 55436 + }, + { + "epoch": 1.42, + "learning_rate": 1.1336072789721858e-06, + "loss": 0.5679, + "step": 55437 + }, + { + "epoch": 1.42, + "learning_rate": 1.1335798565505801e-06, + "loss": 0.7158, + "step": 55438 + }, + { + "epoch": 1.42, + "learning_rate": 1.1335524340266983e-06, + "loss": 0.6865, + "step": 55439 + }, + { + "epoch": 1.42, + "learning_rate": 1.1335250114005617e-06, + "loss": 0.6406, + "step": 55440 + }, + { + "epoch": 1.42, + "learning_rate": 1.1334975886721911e-06, + "loss": 0.8467, + "step": 55441 + }, + { + "epoch": 1.42, + "learning_rate": 1.1334701658416072e-06, + "loss": 0.6772, + "step": 55442 + }, + { + "epoch": 1.42, + "learning_rate": 1.133442742908832e-06, + "loss": 0.9326, + "step": 55443 + }, + { + "epoch": 1.42, + "learning_rate": 1.1334153198738854e-06, + "loss": 0.385, + "step": 55444 + }, + { + "epoch": 1.42, + "learning_rate": 1.133387896736789e-06, + "loss": 0.3667, + "step": 55445 + }, + { + "epoch": 1.42, + "learning_rate": 1.1333604734975634e-06, + "loss": 0.8838, + "step": 55446 + }, + { + "epoch": 1.42, + "learning_rate": 1.13333305015623e-06, + "loss": 0.6807, + "step": 55447 + }, + { + "epoch": 1.42, + "learning_rate": 1.1333056267128094e-06, + "loss": 0.8477, + "step": 55448 + }, + { + "epoch": 1.42, + "learning_rate": 1.1332782031673231e-06, + "loss": 0.6514, + "step": 55449 + }, + { + "epoch": 1.42, + "learning_rate": 1.1332507795197916e-06, + "loss": 0.6035, + "step": 55450 + }, + { + "epoch": 1.42, + "learning_rate": 1.1332233557702362e-06, + "loss": 0.7549, + "step": 55451 + }, + { + "epoch": 1.42, + "learning_rate": 1.1331959319186777e-06, + "loss": 0.5557, + "step": 55452 + }, + { + "epoch": 1.42, + "learning_rate": 1.1331685079651373e-06, + "loss": 0.6885, + "step": 55453 + }, + { + "epoch": 1.42, + "learning_rate": 1.1331410839096357e-06, + "loss": 0.6582, + "step": 55454 + }, + { + "epoch": 1.42, + "learning_rate": 1.1331136597521946e-06, + "loss": 0.5869, + "step": 55455 + }, + { + "epoch": 1.42, + "learning_rate": 1.133086235492834e-06, + "loss": 0.5449, + "step": 55456 + }, + { + "epoch": 1.42, + "learning_rate": 1.1330588111315755e-06, + "loss": 0.5659, + "step": 55457 + }, + { + "epoch": 1.42, + "learning_rate": 1.13303138666844e-06, + "loss": 0.4731, + "step": 55458 + }, + { + "epoch": 1.42, + "learning_rate": 1.1330039621034485e-06, + "loss": 0.7811, + "step": 55459 + }, + { + "epoch": 1.42, + "learning_rate": 1.132976537436622e-06, + "loss": 0.5986, + "step": 55460 + }, + { + "epoch": 1.42, + "learning_rate": 1.1329491126679815e-06, + "loss": 0.6079, + "step": 55461 + }, + { + "epoch": 1.42, + "learning_rate": 1.132921687797548e-06, + "loss": 0.6816, + "step": 55462 + }, + { + "epoch": 1.42, + "learning_rate": 1.1328942628253425e-06, + "loss": 0.5293, + "step": 55463 + }, + { + "epoch": 1.42, + "learning_rate": 1.1328668377513858e-06, + "loss": 0.6665, + "step": 55464 + }, + { + "epoch": 1.42, + "learning_rate": 1.1328394125756993e-06, + "loss": 0.5503, + "step": 55465 + }, + { + "epoch": 1.42, + "learning_rate": 1.1328119872983036e-06, + "loss": 0.6855, + "step": 55466 + }, + { + "epoch": 1.42, + "learning_rate": 1.1327845619192198e-06, + "loss": 0.7471, + "step": 55467 + }, + { + "epoch": 1.42, + "learning_rate": 1.132757136438469e-06, + "loss": 0.7119, + "step": 55468 + }, + { + "epoch": 1.42, + "learning_rate": 1.1327297108560724e-06, + "loss": 0.583, + "step": 55469 + }, + { + "epoch": 1.42, + "learning_rate": 1.1327022851720507e-06, + "loss": 0.5781, + "step": 55470 + }, + { + "epoch": 1.42, + "learning_rate": 1.1326748593864248e-06, + "loss": 0.5244, + "step": 55471 + }, + { + "epoch": 1.42, + "learning_rate": 1.132647433499216e-06, + "loss": 0.6758, + "step": 55472 + }, + { + "epoch": 1.42, + "learning_rate": 1.132620007510445e-06, + "loss": 0.6094, + "step": 55473 + }, + { + "epoch": 1.42, + "learning_rate": 1.132592581420133e-06, + "loss": 0.6748, + "step": 55474 + }, + { + "epoch": 1.42, + "learning_rate": 1.132565155228301e-06, + "loss": 0.6909, + "step": 55475 + }, + { + "epoch": 1.42, + "learning_rate": 1.13253772893497e-06, + "loss": 0.8008, + "step": 55476 + }, + { + "epoch": 1.42, + "learning_rate": 1.1325103025401608e-06, + "loss": 0.7095, + "step": 55477 + }, + { + "epoch": 1.42, + "learning_rate": 1.1324828760438946e-06, + "loss": 0.7373, + "step": 55478 + }, + { + "epoch": 1.42, + "learning_rate": 1.1324554494461926e-06, + "loss": 0.6265, + "step": 55479 + }, + { + "epoch": 1.42, + "learning_rate": 1.1324280227470754e-06, + "loss": 0.7236, + "step": 55480 + }, + { + "epoch": 1.42, + "learning_rate": 1.132400595946564e-06, + "loss": 0.6885, + "step": 55481 + }, + { + "epoch": 1.42, + "learning_rate": 1.1323731690446799e-06, + "loss": 0.6533, + "step": 55482 + }, + { + "epoch": 1.42, + "learning_rate": 1.1323457420414433e-06, + "loss": 0.6763, + "step": 55483 + }, + { + "epoch": 1.42, + "learning_rate": 1.132318314936876e-06, + "loss": 0.6992, + "step": 55484 + }, + { + "epoch": 1.42, + "learning_rate": 1.1322908877309988e-06, + "loss": 0.7744, + "step": 55485 + }, + { + "epoch": 1.42, + "learning_rate": 1.132263460423832e-06, + "loss": 0.708, + "step": 55486 + }, + { + "epoch": 1.42, + "learning_rate": 1.1322360330153975e-06, + "loss": 0.8301, + "step": 55487 + }, + { + "epoch": 1.42, + "learning_rate": 1.1322086055057156e-06, + "loss": 0.7275, + "step": 55488 + }, + { + "epoch": 1.42, + "learning_rate": 1.1321811778948083e-06, + "loss": 0.7109, + "step": 55489 + }, + { + "epoch": 1.42, + "learning_rate": 1.1321537501826954e-06, + "loss": 0.707, + "step": 55490 + }, + { + "epoch": 1.42, + "learning_rate": 1.1321263223693986e-06, + "loss": 0.6851, + "step": 55491 + }, + { + "epoch": 1.42, + "learning_rate": 1.1320988944549388e-06, + "loss": 0.7051, + "step": 55492 + }, + { + "epoch": 1.42, + "learning_rate": 1.132071466439337e-06, + "loss": 0.5786, + "step": 55493 + }, + { + "epoch": 1.42, + "learning_rate": 1.132044038322614e-06, + "loss": 0.5562, + "step": 55494 + }, + { + "epoch": 1.42, + "learning_rate": 1.1320166101047911e-06, + "loss": 0.6895, + "step": 55495 + }, + { + "epoch": 1.42, + "learning_rate": 1.1319891817858892e-06, + "loss": 0.5784, + "step": 55496 + }, + { + "epoch": 1.42, + "learning_rate": 1.1319617533659292e-06, + "loss": 0.7363, + "step": 55497 + }, + { + "epoch": 1.42, + "learning_rate": 1.1319343248449318e-06, + "loss": 0.6807, + "step": 55498 + }, + { + "epoch": 1.42, + "learning_rate": 1.131906896222919e-06, + "loss": 0.6013, + "step": 55499 + }, + { + "epoch": 1.42, + "learning_rate": 1.1318794674999107e-06, + "loss": 0.5708, + "step": 55500 + }, + { + "epoch": 1.42, + "learning_rate": 1.1318520386759285e-06, + "loss": 0.7246, + "step": 55501 + }, + { + "epoch": 1.42, + "learning_rate": 1.131824609750993e-06, + "loss": 0.604, + "step": 55502 + }, + { + "epoch": 1.42, + "learning_rate": 1.131797180725126e-06, + "loss": 0.54, + "step": 55503 + }, + { + "epoch": 1.42, + "learning_rate": 1.1317697515983474e-06, + "loss": 0.6206, + "step": 55504 + }, + { + "epoch": 1.42, + "learning_rate": 1.131742322370679e-06, + "loss": 0.5947, + "step": 55505 + }, + { + "epoch": 1.42, + "learning_rate": 1.1317148930421416e-06, + "loss": 0.6885, + "step": 55506 + }, + { + "epoch": 1.42, + "learning_rate": 1.131687463612756e-06, + "loss": 0.7178, + "step": 55507 + }, + { + "epoch": 1.42, + "learning_rate": 1.1316600340825435e-06, + "loss": 0.7979, + "step": 55508 + }, + { + "epoch": 1.42, + "learning_rate": 1.1316326044515249e-06, + "loss": 0.531, + "step": 55509 + }, + { + "epoch": 1.42, + "learning_rate": 1.1316051747197216e-06, + "loss": 0.605, + "step": 55510 + }, + { + "epoch": 1.42, + "learning_rate": 1.1315777448871538e-06, + "loss": 0.6924, + "step": 55511 + }, + { + "epoch": 1.42, + "learning_rate": 1.1315503149538432e-06, + "loss": 0.7139, + "step": 55512 + }, + { + "epoch": 1.42, + "learning_rate": 1.1315228849198103e-06, + "loss": 0.4918, + "step": 55513 + }, + { + "epoch": 1.42, + "learning_rate": 1.1314954547850768e-06, + "loss": 0.4121, + "step": 55514 + }, + { + "epoch": 1.42, + "learning_rate": 1.1314680245496631e-06, + "loss": 0.6289, + "step": 55515 + }, + { + "epoch": 1.42, + "learning_rate": 1.1314405942135903e-06, + "loss": 0.6621, + "step": 55516 + }, + { + "epoch": 1.42, + "learning_rate": 1.1314131637768794e-06, + "loss": 0.791, + "step": 55517 + }, + { + "epoch": 1.42, + "learning_rate": 1.1313857332395518e-06, + "loss": 0.6836, + "step": 55518 + }, + { + "epoch": 1.42, + "learning_rate": 1.131358302601628e-06, + "loss": 0.439, + "step": 55519 + }, + { + "epoch": 1.42, + "learning_rate": 1.1313308718631293e-06, + "loss": 0.7236, + "step": 55520 + }, + { + "epoch": 1.42, + "learning_rate": 1.1313034410240762e-06, + "loss": 0.7275, + "step": 55521 + }, + { + "epoch": 1.42, + "learning_rate": 1.1312760100844906e-06, + "loss": 0.5898, + "step": 55522 + }, + { + "epoch": 1.42, + "learning_rate": 1.1312485790443926e-06, + "loss": 0.7588, + "step": 55523 + }, + { + "epoch": 1.42, + "learning_rate": 1.1312211479038039e-06, + "loss": 0.7549, + "step": 55524 + }, + { + "epoch": 1.42, + "learning_rate": 1.131193716662745e-06, + "loss": 0.3342, + "step": 55525 + }, + { + "epoch": 1.42, + "learning_rate": 1.1311662853212373e-06, + "loss": 0.7344, + "step": 55526 + }, + { + "epoch": 1.42, + "learning_rate": 1.1311388538793014e-06, + "loss": 0.6787, + "step": 55527 + }, + { + "epoch": 1.42, + "learning_rate": 1.1311114223369586e-06, + "loss": 0.5896, + "step": 55528 + }, + { + "epoch": 1.42, + "learning_rate": 1.13108399069423e-06, + "loss": 0.6611, + "step": 55529 + }, + { + "epoch": 1.42, + "learning_rate": 1.131056558951136e-06, + "loss": 0.5566, + "step": 55530 + }, + { + "epoch": 1.42, + "learning_rate": 1.131029127107698e-06, + "loss": 0.6826, + "step": 55531 + }, + { + "epoch": 1.42, + "learning_rate": 1.1310016951639375e-06, + "loss": 0.5249, + "step": 55532 + }, + { + "epoch": 1.42, + "learning_rate": 1.1309742631198746e-06, + "loss": 0.5437, + "step": 55533 + }, + { + "epoch": 1.42, + "learning_rate": 1.130946830975531e-06, + "loss": 0.4716, + "step": 55534 + }, + { + "epoch": 1.42, + "learning_rate": 1.1309193987309275e-06, + "loss": 0.5601, + "step": 55535 + }, + { + "epoch": 1.42, + "learning_rate": 1.1308919663860847e-06, + "loss": 0.709, + "step": 55536 + }, + { + "epoch": 1.42, + "learning_rate": 1.1308645339410244e-06, + "loss": 0.6582, + "step": 55537 + }, + { + "epoch": 1.42, + "learning_rate": 1.1308371013957665e-06, + "loss": 0.5955, + "step": 55538 + }, + { + "epoch": 1.42, + "learning_rate": 1.1308096687503335e-06, + "loss": 0.6992, + "step": 55539 + }, + { + "epoch": 1.42, + "learning_rate": 1.1307822360047448e-06, + "loss": 0.5205, + "step": 55540 + }, + { + "epoch": 1.42, + "learning_rate": 1.1307548031590225e-06, + "loss": 0.7715, + "step": 55541 + }, + { + "epoch": 1.42, + "learning_rate": 1.130727370213187e-06, + "loss": 0.7568, + "step": 55542 + }, + { + "epoch": 1.42, + "learning_rate": 1.13069993716726e-06, + "loss": 0.5444, + "step": 55543 + }, + { + "epoch": 1.42, + "learning_rate": 1.1306725040212616e-06, + "loss": 0.8564, + "step": 55544 + }, + { + "epoch": 1.42, + "learning_rate": 1.1306450707752135e-06, + "loss": 0.7266, + "step": 55545 + }, + { + "epoch": 1.42, + "learning_rate": 1.1306176374291365e-06, + "loss": 0.4856, + "step": 55546 + }, + { + "epoch": 1.42, + "learning_rate": 1.1305902039830516e-06, + "loss": 0.709, + "step": 55547 + }, + { + "epoch": 1.42, + "learning_rate": 1.1305627704369795e-06, + "loss": 0.6885, + "step": 55548 + }, + { + "epoch": 1.42, + "learning_rate": 1.1305353367909419e-06, + "loss": 0.5811, + "step": 55549 + }, + { + "epoch": 1.42, + "learning_rate": 1.1305079030449594e-06, + "loss": 0.5513, + "step": 55550 + }, + { + "epoch": 1.42, + "learning_rate": 1.1304804691990523e-06, + "loss": 0.6777, + "step": 55551 + }, + { + "epoch": 1.42, + "learning_rate": 1.1304530352532432e-06, + "loss": 0.8369, + "step": 55552 + }, + { + "epoch": 1.42, + "learning_rate": 1.1304256012075517e-06, + "loss": 0.6982, + "step": 55553 + }, + { + "epoch": 1.42, + "learning_rate": 1.1303981670619995e-06, + "loss": 0.6714, + "step": 55554 + }, + { + "epoch": 1.42, + "learning_rate": 1.1303707328166072e-06, + "loss": 0.6201, + "step": 55555 + }, + { + "epoch": 1.42, + "learning_rate": 1.1303432984713962e-06, + "loss": 0.5425, + "step": 55556 + }, + { + "epoch": 1.42, + "learning_rate": 1.1303158640263871e-06, + "loss": 0.5679, + "step": 55557 + }, + { + "epoch": 1.42, + "learning_rate": 1.1302884294816016e-06, + "loss": 0.5952, + "step": 55558 + }, + { + "epoch": 1.42, + "learning_rate": 1.1302609948370602e-06, + "loss": 0.728, + "step": 55559 + }, + { + "epoch": 1.42, + "learning_rate": 1.1302335600927838e-06, + "loss": 0.5269, + "step": 55560 + }, + { + "epoch": 1.42, + "learning_rate": 1.1302061252487934e-06, + "loss": 0.7275, + "step": 55561 + }, + { + "epoch": 1.42, + "learning_rate": 1.1301786903051104e-06, + "loss": 0.5591, + "step": 55562 + }, + { + "epoch": 1.42, + "learning_rate": 1.1301512552617549e-06, + "loss": 0.4902, + "step": 55563 + }, + { + "epoch": 1.42, + "learning_rate": 1.1301238201187496e-06, + "loss": 0.6553, + "step": 55564 + }, + { + "epoch": 1.42, + "learning_rate": 1.1300963848761135e-06, + "loss": 0.5068, + "step": 55565 + }, + { + "epoch": 1.42, + "learning_rate": 1.1300689495338693e-06, + "loss": 0.4978, + "step": 55566 + }, + { + "epoch": 1.42, + "learning_rate": 1.1300415140920367e-06, + "loss": 0.5459, + "step": 55567 + }, + { + "epoch": 1.42, + "learning_rate": 1.1300140785506377e-06, + "loss": 0.5332, + "step": 55568 + }, + { + "epoch": 1.42, + "learning_rate": 1.1299866429096929e-06, + "loss": 0.6348, + "step": 55569 + }, + { + "epoch": 1.42, + "learning_rate": 1.1299592071692231e-06, + "loss": 0.6841, + "step": 55570 + }, + { + "epoch": 1.42, + "learning_rate": 1.1299317713292497e-06, + "loss": 0.5483, + "step": 55571 + }, + { + "epoch": 1.42, + "learning_rate": 1.1299043353897935e-06, + "loss": 0.6338, + "step": 55572 + }, + { + "epoch": 1.42, + "learning_rate": 1.1298768993508753e-06, + "loss": 0.6621, + "step": 55573 + }, + { + "epoch": 1.42, + "learning_rate": 1.1298494632125167e-06, + "loss": 0.5867, + "step": 55574 + }, + { + "epoch": 1.42, + "learning_rate": 1.129822026974738e-06, + "loss": 0.7178, + "step": 55575 + }, + { + "epoch": 1.42, + "learning_rate": 1.1297945906375605e-06, + "loss": 0.7178, + "step": 55576 + }, + { + "epoch": 1.42, + "learning_rate": 1.1297671542010056e-06, + "loss": 0.6167, + "step": 55577 + }, + { + "epoch": 1.42, + "learning_rate": 1.1297397176650936e-06, + "loss": 0.6924, + "step": 55578 + }, + { + "epoch": 1.42, + "learning_rate": 1.1297122810298464e-06, + "loss": 0.7275, + "step": 55579 + }, + { + "epoch": 1.42, + "learning_rate": 1.129684844295284e-06, + "loss": 0.4966, + "step": 55580 + }, + { + "epoch": 1.42, + "learning_rate": 1.1296574074614281e-06, + "loss": 0.752, + "step": 55581 + }, + { + "epoch": 1.42, + "learning_rate": 1.129629970528299e-06, + "loss": 0.7207, + "step": 55582 + }, + { + "epoch": 1.42, + "learning_rate": 1.1296025334959187e-06, + "loss": 0.6768, + "step": 55583 + }, + { + "epoch": 1.42, + "learning_rate": 1.1295750963643076e-06, + "loss": 0.6357, + "step": 55584 + }, + { + "epoch": 1.42, + "learning_rate": 1.129547659133487e-06, + "loss": 0.5234, + "step": 55585 + }, + { + "epoch": 1.42, + "learning_rate": 1.1295202218034772e-06, + "loss": 0.7412, + "step": 55586 + }, + { + "epoch": 1.42, + "learning_rate": 1.1294927843743e-06, + "loss": 0.4834, + "step": 55587 + }, + { + "epoch": 1.42, + "learning_rate": 1.129465346845976e-06, + "loss": 0.7637, + "step": 55588 + }, + { + "epoch": 1.42, + "learning_rate": 1.1294379092185268e-06, + "loss": 0.6592, + "step": 55589 + }, + { + "epoch": 1.42, + "learning_rate": 1.1294104714919725e-06, + "loss": 0.5864, + "step": 55590 + }, + { + "epoch": 1.42, + "learning_rate": 1.1293830336663349e-06, + "loss": 0.7715, + "step": 55591 + }, + { + "epoch": 1.42, + "learning_rate": 1.1293555957416342e-06, + "loss": 0.7207, + "step": 55592 + }, + { + "epoch": 1.42, + "learning_rate": 1.129328157717892e-06, + "loss": 0.7104, + "step": 55593 + }, + { + "epoch": 1.42, + "learning_rate": 1.1293007195951295e-06, + "loss": 0.5537, + "step": 55594 + }, + { + "epoch": 1.42, + "learning_rate": 1.129273281373367e-06, + "loss": 0.5415, + "step": 55595 + }, + { + "epoch": 1.42, + "learning_rate": 1.1292458430526262e-06, + "loss": 0.4839, + "step": 55596 + }, + { + "epoch": 1.42, + "learning_rate": 1.1292184046329273e-06, + "loss": 0.7002, + "step": 55597 + }, + { + "epoch": 1.43, + "learning_rate": 1.1291909661142925e-06, + "loss": 0.6289, + "step": 55598 + }, + { + "epoch": 1.43, + "learning_rate": 1.1291635274967417e-06, + "loss": 0.6504, + "step": 55599 + }, + { + "epoch": 1.43, + "learning_rate": 1.1291360887802964e-06, + "loss": 0.5933, + "step": 55600 + }, + { + "epoch": 1.43, + "learning_rate": 1.1291086499649775e-06, + "loss": 0.6865, + "step": 55601 + }, + { + "epoch": 1.43, + "learning_rate": 1.1290812110508061e-06, + "loss": 0.6714, + "step": 55602 + }, + { + "epoch": 1.43, + "learning_rate": 1.129053772037803e-06, + "loss": 0.6309, + "step": 55603 + }, + { + "epoch": 1.43, + "learning_rate": 1.1290263329259899e-06, + "loss": 0.5342, + "step": 55604 + }, + { + "epoch": 1.43, + "learning_rate": 1.1289988937153867e-06, + "loss": 0.5181, + "step": 55605 + }, + { + "epoch": 1.43, + "learning_rate": 1.1289714544060152e-06, + "loss": 0.6277, + "step": 55606 + }, + { + "epoch": 1.43, + "learning_rate": 1.128944014997896e-06, + "loss": 0.6924, + "step": 55607 + }, + { + "epoch": 1.43, + "learning_rate": 1.1289165754910506e-06, + "loss": 0.6445, + "step": 55608 + }, + { + "epoch": 1.43, + "learning_rate": 1.1288891358854994e-06, + "loss": 0.4623, + "step": 55609 + }, + { + "epoch": 1.43, + "learning_rate": 1.128861696181264e-06, + "loss": 0.6191, + "step": 55610 + }, + { + "epoch": 1.43, + "learning_rate": 1.1288342563783648e-06, + "loss": 0.6538, + "step": 55611 + }, + { + "epoch": 1.43, + "learning_rate": 1.1288068164768235e-06, + "loss": 0.5762, + "step": 55612 + }, + { + "epoch": 1.43, + "learning_rate": 1.1287793764766602e-06, + "loss": 0.6313, + "step": 55613 + }, + { + "epoch": 1.43, + "learning_rate": 1.128751936377897e-06, + "loss": 0.667, + "step": 55614 + }, + { + "epoch": 1.43, + "learning_rate": 1.1287244961805542e-06, + "loss": 0.6743, + "step": 55615 + }, + { + "epoch": 1.43, + "learning_rate": 1.1286970558846532e-06, + "loss": 0.4663, + "step": 55616 + }, + { + "epoch": 1.43, + "learning_rate": 1.1286696154902143e-06, + "loss": 0.5977, + "step": 55617 + }, + { + "epoch": 1.43, + "learning_rate": 1.1286421749972593e-06, + "loss": 0.606, + "step": 55618 + }, + { + "epoch": 1.43, + "learning_rate": 1.1286147344058088e-06, + "loss": 0.7065, + "step": 55619 + }, + { + "epoch": 1.43, + "learning_rate": 1.1285872937158837e-06, + "loss": 0.7949, + "step": 55620 + }, + { + "epoch": 1.43, + "learning_rate": 1.1285598529275055e-06, + "loss": 0.5986, + "step": 55621 + }, + { + "epoch": 1.43, + "learning_rate": 1.1285324120406948e-06, + "loss": 0.6953, + "step": 55622 + }, + { + "epoch": 1.43, + "learning_rate": 1.1285049710554728e-06, + "loss": 0.7607, + "step": 55623 + }, + { + "epoch": 1.43, + "learning_rate": 1.1284775299718608e-06, + "loss": 0.7168, + "step": 55624 + }, + { + "epoch": 1.43, + "learning_rate": 1.128450088789879e-06, + "loss": 0.7471, + "step": 55625 + }, + { + "epoch": 1.43, + "learning_rate": 1.128422647509549e-06, + "loss": 0.5615, + "step": 55626 + }, + { + "epoch": 1.43, + "learning_rate": 1.1283952061308916e-06, + "loss": 0.4561, + "step": 55627 + }, + { + "epoch": 1.43, + "learning_rate": 1.128367764653928e-06, + "loss": 0.488, + "step": 55628 + }, + { + "epoch": 1.43, + "learning_rate": 1.1283403230786795e-06, + "loss": 0.667, + "step": 55629 + }, + { + "epoch": 1.43, + "learning_rate": 1.1283128814051658e-06, + "loss": 0.5903, + "step": 55630 + }, + { + "epoch": 1.43, + "learning_rate": 1.1282854396334096e-06, + "loss": 0.5796, + "step": 55631 + }, + { + "epoch": 1.43, + "learning_rate": 1.1282579977634309e-06, + "loss": 0.7227, + "step": 55632 + }, + { + "epoch": 1.43, + "learning_rate": 1.128230555795251e-06, + "loss": 0.666, + "step": 55633 + }, + { + "epoch": 1.43, + "learning_rate": 1.1282031137288907e-06, + "loss": 0.5571, + "step": 55634 + }, + { + "epoch": 1.43, + "learning_rate": 1.1281756715643713e-06, + "loss": 0.6904, + "step": 55635 + }, + { + "epoch": 1.43, + "learning_rate": 1.1281482293017135e-06, + "loss": 0.5771, + "step": 55636 + }, + { + "epoch": 1.43, + "learning_rate": 1.1281207869409387e-06, + "loss": 0.4575, + "step": 55637 + }, + { + "epoch": 1.43, + "learning_rate": 1.1280933444820675e-06, + "loss": 0.6855, + "step": 55638 + }, + { + "epoch": 1.43, + "learning_rate": 1.1280659019251213e-06, + "loss": 0.5747, + "step": 55639 + }, + { + "epoch": 1.43, + "learning_rate": 1.1280384592701208e-06, + "loss": 0.5615, + "step": 55640 + }, + { + "epoch": 1.43, + "learning_rate": 1.1280110165170873e-06, + "loss": 0.748, + "step": 55641 + }, + { + "epoch": 1.43, + "learning_rate": 1.1279835736660416e-06, + "loss": 0.5134, + "step": 55642 + }, + { + "epoch": 1.43, + "learning_rate": 1.1279561307170046e-06, + "loss": 0.6494, + "step": 55643 + }, + { + "epoch": 1.43, + "learning_rate": 1.1279286876699978e-06, + "loss": 0.6816, + "step": 55644 + }, + { + "epoch": 1.43, + "learning_rate": 1.1279012445250415e-06, + "loss": 0.5527, + "step": 55645 + }, + { + "epoch": 1.43, + "learning_rate": 1.1278738012821574e-06, + "loss": 0.6597, + "step": 55646 + }, + { + "epoch": 1.43, + "learning_rate": 1.1278463579413659e-06, + "loss": 0.8828, + "step": 55647 + }, + { + "epoch": 1.43, + "learning_rate": 1.1278189145026887e-06, + "loss": 0.4614, + "step": 55648 + }, + { + "epoch": 1.43, + "learning_rate": 1.1277914709661463e-06, + "loss": 0.7227, + "step": 55649 + }, + { + "epoch": 1.43, + "learning_rate": 1.1277640273317598e-06, + "loss": 0.613, + "step": 55650 + }, + { + "epoch": 1.43, + "learning_rate": 1.1277365835995503e-06, + "loss": 0.6338, + "step": 55651 + }, + { + "epoch": 1.43, + "learning_rate": 1.1277091397695386e-06, + "loss": 0.8506, + "step": 55652 + }, + { + "epoch": 1.43, + "learning_rate": 1.127681695841746e-06, + "loss": 0.6729, + "step": 55653 + }, + { + "epoch": 1.43, + "learning_rate": 1.1276542518161937e-06, + "loss": 0.5112, + "step": 55654 + }, + { + "epoch": 1.43, + "learning_rate": 1.127626807692902e-06, + "loss": 0.4298, + "step": 55655 + }, + { + "epoch": 1.43, + "learning_rate": 1.1275993634718926e-06, + "loss": 0.5593, + "step": 55656 + }, + { + "epoch": 1.43, + "learning_rate": 1.1275719191531858e-06, + "loss": 0.6335, + "step": 55657 + }, + { + "epoch": 1.43, + "learning_rate": 1.1275444747368034e-06, + "loss": 0.791, + "step": 55658 + }, + { + "epoch": 1.43, + "learning_rate": 1.1275170302227662e-06, + "loss": 0.6401, + "step": 55659 + }, + { + "epoch": 1.43, + "learning_rate": 1.1274895856110947e-06, + "loss": 0.79, + "step": 55660 + }, + { + "epoch": 1.43, + "learning_rate": 1.1274621409018105e-06, + "loss": 0.6294, + "step": 55661 + }, + { + "epoch": 1.43, + "learning_rate": 1.1274346960949343e-06, + "loss": 0.5293, + "step": 55662 + }, + { + "epoch": 1.43, + "learning_rate": 1.127407251190487e-06, + "loss": 0.7114, + "step": 55663 + }, + { + "epoch": 1.43, + "learning_rate": 1.1273798061884903e-06, + "loss": 0.5195, + "step": 55664 + }, + { + "epoch": 1.43, + "learning_rate": 1.1273523610889646e-06, + "loss": 0.605, + "step": 55665 + }, + { + "epoch": 1.43, + "learning_rate": 1.1273249158919306e-06, + "loss": 0.7529, + "step": 55666 + }, + { + "epoch": 1.43, + "learning_rate": 1.1272974705974103e-06, + "loss": 0.6172, + "step": 55667 + }, + { + "epoch": 1.43, + "learning_rate": 1.127270025205424e-06, + "loss": 0.6436, + "step": 55668 + }, + { + "epoch": 1.43, + "learning_rate": 1.1272425797159933e-06, + "loss": 0.6064, + "step": 55669 + }, + { + "epoch": 1.43, + "learning_rate": 1.127215134129138e-06, + "loss": 0.4329, + "step": 55670 + }, + { + "epoch": 1.43, + "learning_rate": 1.1271876884448806e-06, + "loss": 0.7432, + "step": 55671 + }, + { + "epoch": 1.43, + "learning_rate": 1.127160242663241e-06, + "loss": 0.5687, + "step": 55672 + }, + { + "epoch": 1.43, + "learning_rate": 1.1271327967842408e-06, + "loss": 0.6021, + "step": 55673 + }, + { + "epoch": 1.43, + "learning_rate": 1.1271053508079012e-06, + "loss": 0.6069, + "step": 55674 + }, + { + "epoch": 1.43, + "learning_rate": 1.1270779047342425e-06, + "loss": 0.7842, + "step": 55675 + }, + { + "epoch": 1.43, + "learning_rate": 1.127050458563286e-06, + "loss": 0.627, + "step": 55676 + }, + { + "epoch": 1.43, + "learning_rate": 1.1270230122950531e-06, + "loss": 0.7417, + "step": 55677 + }, + { + "epoch": 1.43, + "learning_rate": 1.1269955659295643e-06, + "loss": 0.5859, + "step": 55678 + }, + { + "epoch": 1.43, + "learning_rate": 1.126968119466841e-06, + "loss": 0.5269, + "step": 55679 + }, + { + "epoch": 1.43, + "learning_rate": 1.1269406729069039e-06, + "loss": 0.7227, + "step": 55680 + }, + { + "epoch": 1.43, + "learning_rate": 1.1269132262497742e-06, + "loss": 0.4767, + "step": 55681 + }, + { + "epoch": 1.43, + "learning_rate": 1.126885779495473e-06, + "loss": 0.52, + "step": 55682 + }, + { + "epoch": 1.43, + "learning_rate": 1.1268583326440212e-06, + "loss": 0.5405, + "step": 55683 + }, + { + "epoch": 1.43, + "learning_rate": 1.1268308856954395e-06, + "loss": 0.7793, + "step": 55684 + }, + { + "epoch": 1.43, + "learning_rate": 1.1268034386497496e-06, + "loss": 0.6523, + "step": 55685 + }, + { + "epoch": 1.43, + "learning_rate": 1.1267759915069719e-06, + "loss": 0.5664, + "step": 55686 + }, + { + "epoch": 1.43, + "learning_rate": 1.1267485442671276e-06, + "loss": 0.8311, + "step": 55687 + }, + { + "epoch": 1.43, + "learning_rate": 1.1267210969302379e-06, + "loss": 0.6016, + "step": 55688 + }, + { + "epoch": 1.43, + "learning_rate": 1.1266936494963237e-06, + "loss": 0.6855, + "step": 55689 + }, + { + "epoch": 1.43, + "learning_rate": 1.126666201965406e-06, + "loss": 0.7007, + "step": 55690 + }, + { + "epoch": 1.43, + "learning_rate": 1.1266387543375057e-06, + "loss": 0.7549, + "step": 55691 + }, + { + "epoch": 1.43, + "learning_rate": 1.1266113066126442e-06, + "loss": 0.7109, + "step": 55692 + }, + { + "epoch": 1.43, + "learning_rate": 1.1265838587908419e-06, + "loss": 0.519, + "step": 55693 + }, + { + "epoch": 1.43, + "learning_rate": 1.1265564108721206e-06, + "loss": 0.6636, + "step": 55694 + }, + { + "epoch": 1.43, + "learning_rate": 1.1265289628565004e-06, + "loss": 0.6592, + "step": 55695 + }, + { + "epoch": 1.43, + "learning_rate": 1.1265015147440032e-06, + "loss": 0.6855, + "step": 55696 + }, + { + "epoch": 1.43, + "learning_rate": 1.1264740665346492e-06, + "loss": 0.614, + "step": 55697 + }, + { + "epoch": 1.43, + "learning_rate": 1.1264466182284603e-06, + "loss": 0.5137, + "step": 55698 + }, + { + "epoch": 1.43, + "learning_rate": 1.1264191698254566e-06, + "loss": 0.6108, + "step": 55699 + }, + { + "epoch": 1.43, + "learning_rate": 1.1263917213256597e-06, + "loss": 0.5527, + "step": 55700 + }, + { + "epoch": 1.43, + "learning_rate": 1.1263642727290905e-06, + "loss": 0.7373, + "step": 55701 + }, + { + "epoch": 1.43, + "learning_rate": 1.12633682403577e-06, + "loss": 0.626, + "step": 55702 + }, + { + "epoch": 1.43, + "learning_rate": 1.1263093752457191e-06, + "loss": 0.5898, + "step": 55703 + }, + { + "epoch": 1.43, + "learning_rate": 1.126281926358959e-06, + "loss": 0.6201, + "step": 55704 + }, + { + "epoch": 1.43, + "learning_rate": 1.1262544773755107e-06, + "loss": 0.6797, + "step": 55705 + }, + { + "epoch": 1.43, + "learning_rate": 1.126227028295395e-06, + "loss": 0.6113, + "step": 55706 + }, + { + "epoch": 1.43, + "learning_rate": 1.126199579118633e-06, + "loss": 0.5559, + "step": 55707 + }, + { + "epoch": 1.43, + "learning_rate": 1.126172129845246e-06, + "loss": 0.5425, + "step": 55708 + }, + { + "epoch": 1.43, + "learning_rate": 1.1261446804752547e-06, + "loss": 0.5476, + "step": 55709 + }, + { + "epoch": 1.43, + "learning_rate": 1.1261172310086804e-06, + "loss": 0.7998, + "step": 55710 + }, + { + "epoch": 1.43, + "learning_rate": 1.1260897814455438e-06, + "loss": 0.7881, + "step": 55711 + }, + { + "epoch": 1.43, + "learning_rate": 1.1260623317858659e-06, + "loss": 0.4966, + "step": 55712 + }, + { + "epoch": 1.43, + "learning_rate": 1.1260348820296682e-06, + "loss": 0.7734, + "step": 55713 + }, + { + "epoch": 1.43, + "learning_rate": 1.126007432176971e-06, + "loss": 0.7334, + "step": 55714 + }, + { + "epoch": 1.43, + "learning_rate": 1.125979982227796e-06, + "loss": 0.71, + "step": 55715 + }, + { + "epoch": 1.43, + "learning_rate": 1.1259525321821636e-06, + "loss": 0.6572, + "step": 55716 + }, + { + "epoch": 1.43, + "learning_rate": 1.1259250820400956e-06, + "loss": 0.5112, + "step": 55717 + }, + { + "epoch": 1.43, + "learning_rate": 1.1258976318016124e-06, + "loss": 0.7773, + "step": 55718 + }, + { + "epoch": 1.43, + "learning_rate": 1.125870181466735e-06, + "loss": 0.8203, + "step": 55719 + }, + { + "epoch": 1.43, + "learning_rate": 1.1258427310354845e-06, + "loss": 0.7812, + "step": 55720 + }, + { + "epoch": 1.43, + "learning_rate": 1.1258152805078825e-06, + "loss": 0.7363, + "step": 55721 + }, + { + "epoch": 1.43, + "learning_rate": 1.1257878298839489e-06, + "loss": 0.646, + "step": 55722 + }, + { + "epoch": 1.43, + "learning_rate": 1.125760379163706e-06, + "loss": 0.5737, + "step": 55723 + }, + { + "epoch": 1.43, + "learning_rate": 1.1257329283471737e-06, + "loss": 0.6758, + "step": 55724 + }, + { + "epoch": 1.43, + "learning_rate": 1.1257054774343735e-06, + "loss": 0.5664, + "step": 55725 + }, + { + "epoch": 1.43, + "learning_rate": 1.1256780264253266e-06, + "loss": 0.5938, + "step": 55726 + }, + { + "epoch": 1.43, + "learning_rate": 1.1256505753200536e-06, + "loss": 0.5664, + "step": 55727 + }, + { + "epoch": 1.43, + "learning_rate": 1.1256231241185758e-06, + "loss": 0.6055, + "step": 55728 + }, + { + "epoch": 1.43, + "learning_rate": 1.125595672820914e-06, + "loss": 0.8506, + "step": 55729 + }, + { + "epoch": 1.43, + "learning_rate": 1.1255682214270896e-06, + "loss": 0.6538, + "step": 55730 + }, + { + "epoch": 1.43, + "learning_rate": 1.1255407699371234e-06, + "loss": 0.5957, + "step": 55731 + }, + { + "epoch": 1.43, + "learning_rate": 1.1255133183510364e-06, + "loss": 0.6147, + "step": 55732 + }, + { + "epoch": 1.43, + "learning_rate": 1.1254858666688497e-06, + "loss": 0.71, + "step": 55733 + }, + { + "epoch": 1.43, + "learning_rate": 1.1254584148905842e-06, + "loss": 0.4722, + "step": 55734 + }, + { + "epoch": 1.43, + "learning_rate": 1.1254309630162605e-06, + "loss": 0.8311, + "step": 55735 + }, + { + "epoch": 1.43, + "learning_rate": 1.1254035110459005e-06, + "loss": 0.6719, + "step": 55736 + }, + { + "epoch": 1.43, + "learning_rate": 1.1253760589795246e-06, + "loss": 0.4453, + "step": 55737 + }, + { + "epoch": 1.43, + "learning_rate": 1.1253486068171545e-06, + "loss": 0.8535, + "step": 55738 + }, + { + "epoch": 1.43, + "learning_rate": 1.1253211545588102e-06, + "loss": 0.5166, + "step": 55739 + }, + { + "epoch": 1.43, + "learning_rate": 1.1252937022045134e-06, + "loss": 0.6553, + "step": 55740 + }, + { + "epoch": 1.43, + "learning_rate": 1.125266249754285e-06, + "loss": 0.5466, + "step": 55741 + }, + { + "epoch": 1.43, + "learning_rate": 1.1252387972081461e-06, + "loss": 0.6631, + "step": 55742 + }, + { + "epoch": 1.43, + "learning_rate": 1.1252113445661175e-06, + "loss": 0.7754, + "step": 55743 + }, + { + "epoch": 1.43, + "learning_rate": 1.1251838918282205e-06, + "loss": 0.6016, + "step": 55744 + }, + { + "epoch": 1.43, + "learning_rate": 1.1251564389944758e-06, + "loss": 0.7344, + "step": 55745 + }, + { + "epoch": 1.43, + "learning_rate": 1.1251289860649045e-06, + "loss": 0.5347, + "step": 55746 + }, + { + "epoch": 1.43, + "learning_rate": 1.1251015330395276e-06, + "loss": 0.6062, + "step": 55747 + }, + { + "epoch": 1.43, + "learning_rate": 1.1250740799183664e-06, + "loss": 0.481, + "step": 55748 + }, + { + "epoch": 1.43, + "learning_rate": 1.1250466267014417e-06, + "loss": 0.6719, + "step": 55749 + }, + { + "epoch": 1.43, + "learning_rate": 1.1250191733887746e-06, + "loss": 0.6709, + "step": 55750 + }, + { + "epoch": 1.43, + "learning_rate": 1.124991719980386e-06, + "loss": 0.6187, + "step": 55751 + }, + { + "epoch": 1.43, + "learning_rate": 1.124964266476297e-06, + "loss": 0.564, + "step": 55752 + }, + { + "epoch": 1.43, + "learning_rate": 1.124936812876529e-06, + "loss": 0.8242, + "step": 55753 + }, + { + "epoch": 1.43, + "learning_rate": 1.1249093591811018e-06, + "loss": 0.5298, + "step": 55754 + }, + { + "epoch": 1.43, + "learning_rate": 1.1248819053900378e-06, + "loss": 0.6157, + "step": 55755 + }, + { + "epoch": 1.43, + "learning_rate": 1.1248544515033572e-06, + "loss": 0.6392, + "step": 55756 + }, + { + "epoch": 1.43, + "learning_rate": 1.1248269975210815e-06, + "loss": 0.6597, + "step": 55757 + }, + { + "epoch": 1.43, + "learning_rate": 1.1247995434432315e-06, + "loss": 0.7383, + "step": 55758 + }, + { + "epoch": 1.43, + "learning_rate": 1.1247720892698282e-06, + "loss": 0.7021, + "step": 55759 + }, + { + "epoch": 1.43, + "learning_rate": 1.1247446350008926e-06, + "loss": 0.6768, + "step": 55760 + }, + { + "epoch": 1.43, + "learning_rate": 1.124717180636446e-06, + "loss": 0.6196, + "step": 55761 + }, + { + "epoch": 1.43, + "learning_rate": 1.1246897261765088e-06, + "loss": 0.748, + "step": 55762 + }, + { + "epoch": 1.43, + "learning_rate": 1.1246622716211026e-06, + "loss": 0.7559, + "step": 55763 + }, + { + "epoch": 1.43, + "learning_rate": 1.1246348169702482e-06, + "loss": 0.5234, + "step": 55764 + }, + { + "epoch": 1.43, + "learning_rate": 1.124607362223967e-06, + "loss": 0.5455, + "step": 55765 + }, + { + "epoch": 1.43, + "learning_rate": 1.124579907382279e-06, + "loss": 0.752, + "step": 55766 + }, + { + "epoch": 1.43, + "learning_rate": 1.1245524524452063e-06, + "loss": 0.6309, + "step": 55767 + }, + { + "epoch": 1.43, + "learning_rate": 1.1245249974127695e-06, + "loss": 0.5298, + "step": 55768 + }, + { + "epoch": 1.43, + "learning_rate": 1.1244975422849897e-06, + "loss": 0.6138, + "step": 55769 + }, + { + "epoch": 1.43, + "learning_rate": 1.1244700870618874e-06, + "loss": 0.6289, + "step": 55770 + }, + { + "epoch": 1.43, + "learning_rate": 1.1244426317434848e-06, + "loss": 0.6689, + "step": 55771 + }, + { + "epoch": 1.43, + "learning_rate": 1.1244151763298016e-06, + "loss": 0.5908, + "step": 55772 + }, + { + "epoch": 1.43, + "learning_rate": 1.1243877208208595e-06, + "loss": 0.8096, + "step": 55773 + }, + { + "epoch": 1.43, + "learning_rate": 1.1243602652166799e-06, + "loss": 0.6143, + "step": 55774 + }, + { + "epoch": 1.43, + "learning_rate": 1.124332809517283e-06, + "loss": 0.6689, + "step": 55775 + }, + { + "epoch": 1.43, + "learning_rate": 1.12430535372269e-06, + "loss": 0.5566, + "step": 55776 + }, + { + "epoch": 1.43, + "learning_rate": 1.1242778978329224e-06, + "loss": 0.6777, + "step": 55777 + }, + { + "epoch": 1.43, + "learning_rate": 1.124250441848001e-06, + "loss": 0.8096, + "step": 55778 + }, + { + "epoch": 1.43, + "learning_rate": 1.1242229857679466e-06, + "loss": 0.7007, + "step": 55779 + }, + { + "epoch": 1.43, + "learning_rate": 1.1241955295927805e-06, + "loss": 0.5464, + "step": 55780 + }, + { + "epoch": 1.43, + "learning_rate": 1.1241680733225231e-06, + "loss": 0.5771, + "step": 55781 + }, + { + "epoch": 1.43, + "learning_rate": 1.1241406169571965e-06, + "loss": 0.3837, + "step": 55782 + }, + { + "epoch": 1.43, + "learning_rate": 1.124113160496821e-06, + "loss": 0.5505, + "step": 55783 + }, + { + "epoch": 1.43, + "learning_rate": 1.1240857039414177e-06, + "loss": 0.8262, + "step": 55784 + }, + { + "epoch": 1.43, + "learning_rate": 1.1240582472910077e-06, + "loss": 0.5759, + "step": 55785 + }, + { + "epoch": 1.43, + "learning_rate": 1.1240307905456119e-06, + "loss": 0.6191, + "step": 55786 + }, + { + "epoch": 1.43, + "learning_rate": 1.1240033337052516e-06, + "loss": 0.5869, + "step": 55787 + }, + { + "epoch": 1.43, + "learning_rate": 1.1239758767699476e-06, + "loss": 0.8682, + "step": 55788 + }, + { + "epoch": 1.43, + "learning_rate": 1.1239484197397208e-06, + "loss": 0.6641, + "step": 55789 + }, + { + "epoch": 1.43, + "learning_rate": 1.1239209626145927e-06, + "loss": 0.7266, + "step": 55790 + }, + { + "epoch": 1.43, + "learning_rate": 1.1238935053945837e-06, + "loss": 0.6787, + "step": 55791 + }, + { + "epoch": 1.43, + "learning_rate": 1.1238660480797154e-06, + "loss": 0.7549, + "step": 55792 + }, + { + "epoch": 1.43, + "learning_rate": 1.1238385906700085e-06, + "loss": 0.7031, + "step": 55793 + }, + { + "epoch": 1.43, + "learning_rate": 1.1238111331654838e-06, + "loss": 0.646, + "step": 55794 + }, + { + "epoch": 1.43, + "learning_rate": 1.1237836755661629e-06, + "loss": 0.8057, + "step": 55795 + }, + { + "epoch": 1.43, + "learning_rate": 1.1237562178720666e-06, + "loss": 0.6172, + "step": 55796 + }, + { + "epoch": 1.43, + "learning_rate": 1.1237287600832156e-06, + "loss": 0.603, + "step": 55797 + }, + { + "epoch": 1.43, + "learning_rate": 1.1237013021996313e-06, + "loss": 0.6611, + "step": 55798 + }, + { + "epoch": 1.43, + "learning_rate": 1.1236738442213347e-06, + "loss": 0.6592, + "step": 55799 + }, + { + "epoch": 1.43, + "learning_rate": 1.1236463861483464e-06, + "loss": 0.7129, + "step": 55800 + }, + { + "epoch": 1.43, + "learning_rate": 1.123618927980688e-06, + "loss": 0.6025, + "step": 55801 + }, + { + "epoch": 1.43, + "learning_rate": 1.12359146971838e-06, + "loss": 0.7119, + "step": 55802 + }, + { + "epoch": 1.43, + "learning_rate": 1.1235640113614443e-06, + "loss": 0.6875, + "step": 55803 + }, + { + "epoch": 1.43, + "learning_rate": 1.123536552909901e-06, + "loss": 0.7344, + "step": 55804 + }, + { + "epoch": 1.43, + "learning_rate": 1.1235090943637713e-06, + "loss": 0.7119, + "step": 55805 + }, + { + "epoch": 1.43, + "learning_rate": 1.1234816357230763e-06, + "loss": 0.748, + "step": 55806 + }, + { + "epoch": 1.43, + "learning_rate": 1.1234541769878375e-06, + "loss": 0.6553, + "step": 55807 + }, + { + "epoch": 1.43, + "learning_rate": 1.1234267181580752e-06, + "loss": 0.6543, + "step": 55808 + }, + { + "epoch": 1.43, + "learning_rate": 1.1233992592338108e-06, + "loss": 0.6953, + "step": 55809 + }, + { + "epoch": 1.43, + "learning_rate": 1.1233718002150652e-06, + "loss": 0.5737, + "step": 55810 + }, + { + "epoch": 1.43, + "learning_rate": 1.1233443411018597e-06, + "loss": 0.5786, + "step": 55811 + }, + { + "epoch": 1.43, + "learning_rate": 1.1233168818942146e-06, + "loss": 0.5649, + "step": 55812 + }, + { + "epoch": 1.43, + "learning_rate": 1.1232894225921523e-06, + "loss": 0.6553, + "step": 55813 + }, + { + "epoch": 1.43, + "learning_rate": 1.1232619631956922e-06, + "loss": 0.6777, + "step": 55814 + }, + { + "epoch": 1.43, + "learning_rate": 1.1232345037048566e-06, + "loss": 0.5396, + "step": 55815 + }, + { + "epoch": 1.43, + "learning_rate": 1.1232070441196655e-06, + "loss": 0.6348, + "step": 55816 + }, + { + "epoch": 1.43, + "learning_rate": 1.1231795844401405e-06, + "loss": 0.8955, + "step": 55817 + }, + { + "epoch": 1.43, + "learning_rate": 1.1231521246663029e-06, + "loss": 0.709, + "step": 55818 + }, + { + "epoch": 1.43, + "learning_rate": 1.1231246647981731e-06, + "loss": 0.5864, + "step": 55819 + }, + { + "epoch": 1.43, + "learning_rate": 1.1230972048357728e-06, + "loss": 0.6875, + "step": 55820 + }, + { + "epoch": 1.43, + "learning_rate": 1.123069744779122e-06, + "loss": 0.627, + "step": 55821 + }, + { + "epoch": 1.43, + "learning_rate": 1.1230422846282428e-06, + "loss": 0.6328, + "step": 55822 + }, + { + "epoch": 1.43, + "learning_rate": 1.1230148243831559e-06, + "loss": 0.6528, + "step": 55823 + }, + { + "epoch": 1.43, + "learning_rate": 1.1229873640438818e-06, + "loss": 0.6777, + "step": 55824 + }, + { + "epoch": 1.43, + "learning_rate": 1.122959903610442e-06, + "loss": 0.5488, + "step": 55825 + }, + { + "epoch": 1.43, + "learning_rate": 1.1229324430828577e-06, + "loss": 0.8604, + "step": 55826 + }, + { + "epoch": 1.43, + "learning_rate": 1.1229049824611495e-06, + "loss": 0.6421, + "step": 55827 + }, + { + "epoch": 1.43, + "learning_rate": 1.1228775217453388e-06, + "loss": 0.5972, + "step": 55828 + }, + { + "epoch": 1.43, + "learning_rate": 1.1228500609354462e-06, + "loss": 0.5122, + "step": 55829 + }, + { + "epoch": 1.43, + "learning_rate": 1.122822600031493e-06, + "loss": 0.6602, + "step": 55830 + }, + { + "epoch": 1.43, + "learning_rate": 1.1227951390335003e-06, + "loss": 0.7559, + "step": 55831 + }, + { + "epoch": 1.43, + "learning_rate": 1.122767677941489e-06, + "loss": 0.7344, + "step": 55832 + }, + { + "epoch": 1.43, + "learning_rate": 1.12274021675548e-06, + "loss": 0.6812, + "step": 55833 + }, + { + "epoch": 1.43, + "learning_rate": 1.1227127554754947e-06, + "loss": 0.79, + "step": 55834 + }, + { + "epoch": 1.43, + "learning_rate": 1.1226852941015534e-06, + "loss": 0.5752, + "step": 55835 + }, + { + "epoch": 1.43, + "learning_rate": 1.1226578326336783e-06, + "loss": 0.6062, + "step": 55836 + }, + { + "epoch": 1.43, + "learning_rate": 1.1226303710718892e-06, + "loss": 0.5791, + "step": 55837 + }, + { + "epoch": 1.43, + "learning_rate": 1.1226029094162078e-06, + "loss": 0.4514, + "step": 55838 + }, + { + "epoch": 1.43, + "learning_rate": 1.1225754476666552e-06, + "loss": 0.5801, + "step": 55839 + }, + { + "epoch": 1.43, + "learning_rate": 1.1225479858232518e-06, + "loss": 0.71, + "step": 55840 + }, + { + "epoch": 1.43, + "learning_rate": 1.1225205238860194e-06, + "loss": 0.7031, + "step": 55841 + }, + { + "epoch": 1.43, + "learning_rate": 1.1224930618549785e-06, + "loss": 0.6143, + "step": 55842 + }, + { + "epoch": 1.43, + "learning_rate": 1.1224655997301503e-06, + "loss": 0.7803, + "step": 55843 + }, + { + "epoch": 1.43, + "learning_rate": 1.1224381375115558e-06, + "loss": 0.75, + "step": 55844 + }, + { + "epoch": 1.43, + "learning_rate": 1.1224106751992161e-06, + "loss": 1.0029, + "step": 55845 + }, + { + "epoch": 1.43, + "learning_rate": 1.122383212793152e-06, + "loss": 0.4937, + "step": 55846 + }, + { + "epoch": 1.43, + "learning_rate": 1.1223557502933851e-06, + "loss": 0.6362, + "step": 55847 + }, + { + "epoch": 1.43, + "learning_rate": 1.1223282876999358e-06, + "loss": 0.6323, + "step": 55848 + }, + { + "epoch": 1.43, + "learning_rate": 1.1223008250128257e-06, + "loss": 0.79, + "step": 55849 + }, + { + "epoch": 1.43, + "learning_rate": 1.1222733622320747e-06, + "loss": 0.7783, + "step": 55850 + }, + { + "epoch": 1.43, + "learning_rate": 1.1222458993577054e-06, + "loss": 0.6426, + "step": 55851 + }, + { + "epoch": 1.43, + "learning_rate": 1.1222184363897374e-06, + "loss": 0.751, + "step": 55852 + }, + { + "epoch": 1.43, + "learning_rate": 1.1221909733281929e-06, + "loss": 0.6167, + "step": 55853 + }, + { + "epoch": 1.43, + "learning_rate": 1.1221635101730923e-06, + "loss": 0.6133, + "step": 55854 + }, + { + "epoch": 1.43, + "learning_rate": 1.1221360469244565e-06, + "loss": 0.3987, + "step": 55855 + }, + { + "epoch": 1.43, + "learning_rate": 1.1221085835823065e-06, + "loss": 0.7695, + "step": 55856 + }, + { + "epoch": 1.43, + "learning_rate": 1.1220811201466641e-06, + "loss": 0.709, + "step": 55857 + }, + { + "epoch": 1.43, + "learning_rate": 1.1220536566175495e-06, + "loss": 0.583, + "step": 55858 + }, + { + "epoch": 1.43, + "learning_rate": 1.1220261929949844e-06, + "loss": 0.7227, + "step": 55859 + }, + { + "epoch": 1.43, + "learning_rate": 1.1219987292789889e-06, + "loss": 0.5146, + "step": 55860 + }, + { + "epoch": 1.43, + "learning_rate": 1.121971265469585e-06, + "loss": 0.4863, + "step": 55861 + }, + { + "epoch": 1.43, + "learning_rate": 1.1219438015667931e-06, + "loss": 0.4697, + "step": 55862 + }, + { + "epoch": 1.43, + "learning_rate": 1.1219163375706343e-06, + "loss": 0.5918, + "step": 55863 + }, + { + "epoch": 1.43, + "learning_rate": 1.1218888734811302e-06, + "loss": 0.8486, + "step": 55864 + }, + { + "epoch": 1.43, + "learning_rate": 1.121861409298301e-06, + "loss": 0.6533, + "step": 55865 + }, + { + "epoch": 1.43, + "learning_rate": 1.1218339450221683e-06, + "loss": 0.6582, + "step": 55866 + }, + { + "epoch": 1.43, + "learning_rate": 1.1218064806527528e-06, + "loss": 0.7451, + "step": 55867 + }, + { + "epoch": 1.43, + "learning_rate": 1.121779016190076e-06, + "loss": 0.5742, + "step": 55868 + }, + { + "epoch": 1.43, + "learning_rate": 1.1217515516341584e-06, + "loss": 0.665, + "step": 55869 + }, + { + "epoch": 1.43, + "learning_rate": 1.1217240869850213e-06, + "loss": 0.6226, + "step": 55870 + }, + { + "epoch": 1.43, + "learning_rate": 1.1216966222426853e-06, + "loss": 0.7725, + "step": 55871 + }, + { + "epoch": 1.43, + "learning_rate": 1.1216691574071724e-06, + "loss": 0.7432, + "step": 55872 + }, + { + "epoch": 1.43, + "learning_rate": 1.121641692478503e-06, + "loss": 0.5178, + "step": 55873 + }, + { + "epoch": 1.43, + "learning_rate": 1.1216142274566977e-06, + "loss": 0.5618, + "step": 55874 + }, + { + "epoch": 1.43, + "learning_rate": 1.121586762341778e-06, + "loss": 0.7803, + "step": 55875 + }, + { + "epoch": 1.43, + "learning_rate": 1.1215592971337652e-06, + "loss": 0.5386, + "step": 55876 + }, + { + "epoch": 1.43, + "learning_rate": 1.1215318318326797e-06, + "loss": 0.4722, + "step": 55877 + }, + { + "epoch": 1.43, + "learning_rate": 1.1215043664385432e-06, + "loss": 0.6021, + "step": 55878 + }, + { + "epoch": 1.43, + "learning_rate": 1.1214769009513762e-06, + "loss": 0.624, + "step": 55879 + }, + { + "epoch": 1.43, + "learning_rate": 1.1214494353712002e-06, + "loss": 0.7051, + "step": 55880 + }, + { + "epoch": 1.43, + "learning_rate": 1.1214219696980353e-06, + "loss": 0.7705, + "step": 55881 + }, + { + "epoch": 1.43, + "learning_rate": 1.121394503931904e-06, + "loss": 0.5771, + "step": 55882 + }, + { + "epoch": 1.43, + "learning_rate": 1.121367038072826e-06, + "loss": 0.6504, + "step": 55883 + }, + { + "epoch": 1.43, + "learning_rate": 1.1213395721208228e-06, + "loss": 0.8398, + "step": 55884 + }, + { + "epoch": 1.43, + "learning_rate": 1.1213121060759156e-06, + "loss": 0.592, + "step": 55885 + }, + { + "epoch": 1.43, + "learning_rate": 1.1212846399381255e-06, + "loss": 0.6914, + "step": 55886 + }, + { + "epoch": 1.43, + "learning_rate": 1.121257173707473e-06, + "loss": 0.7422, + "step": 55887 + }, + { + "epoch": 1.43, + "learning_rate": 1.1212297073839798e-06, + "loss": 0.791, + "step": 55888 + }, + { + "epoch": 1.43, + "learning_rate": 1.1212022409676666e-06, + "loss": 0.353, + "step": 55889 + }, + { + "epoch": 1.43, + "learning_rate": 1.1211747744585537e-06, + "loss": 0.7949, + "step": 55890 + }, + { + "epoch": 1.43, + "learning_rate": 1.1211473078566636e-06, + "loss": 0.6279, + "step": 55891 + }, + { + "epoch": 1.43, + "learning_rate": 1.1211198411620163e-06, + "loss": 0.5073, + "step": 55892 + }, + { + "epoch": 1.43, + "learning_rate": 1.1210923743746334e-06, + "loss": 0.5906, + "step": 55893 + }, + { + "epoch": 1.43, + "learning_rate": 1.1210649074945351e-06, + "loss": 0.7432, + "step": 55894 + }, + { + "epoch": 1.43, + "learning_rate": 1.1210374405217433e-06, + "loss": 0.6758, + "step": 55895 + }, + { + "epoch": 1.43, + "learning_rate": 1.1210099734562787e-06, + "loss": 0.4965, + "step": 55896 + }, + { + "epoch": 1.43, + "learning_rate": 1.1209825062981622e-06, + "loss": 0.793, + "step": 55897 + }, + { + "epoch": 1.43, + "learning_rate": 1.1209550390474152e-06, + "loss": 0.7637, + "step": 55898 + }, + { + "epoch": 1.43, + "learning_rate": 1.1209275717040583e-06, + "loss": 0.627, + "step": 55899 + }, + { + "epoch": 1.43, + "learning_rate": 1.1209001042681125e-06, + "loss": 0.6084, + "step": 55900 + }, + { + "epoch": 1.43, + "learning_rate": 1.1208726367395995e-06, + "loss": 0.6816, + "step": 55901 + }, + { + "epoch": 1.43, + "learning_rate": 1.1208451691185395e-06, + "loss": 0.8516, + "step": 55902 + }, + { + "epoch": 1.43, + "learning_rate": 1.1208177014049542e-06, + "loss": 0.7285, + "step": 55903 + }, + { + "epoch": 1.43, + "learning_rate": 1.1207902335988643e-06, + "loss": 0.6045, + "step": 55904 + }, + { + "epoch": 1.43, + "learning_rate": 1.120762765700291e-06, + "loss": 0.4946, + "step": 55905 + }, + { + "epoch": 1.43, + "learning_rate": 1.1207352977092547e-06, + "loss": 0.5864, + "step": 55906 + }, + { + "epoch": 1.43, + "learning_rate": 1.1207078296257772e-06, + "loss": 0.4766, + "step": 55907 + }, + { + "epoch": 1.43, + "learning_rate": 1.1206803614498795e-06, + "loss": 0.6572, + "step": 55908 + }, + { + "epoch": 1.43, + "learning_rate": 1.1206528931815819e-06, + "loss": 0.5911, + "step": 55909 + }, + { + "epoch": 1.43, + "learning_rate": 1.1206254248209064e-06, + "loss": 0.6631, + "step": 55910 + }, + { + "epoch": 1.43, + "learning_rate": 1.1205979563678733e-06, + "loss": 0.6348, + "step": 55911 + }, + { + "epoch": 1.43, + "learning_rate": 1.120570487822504e-06, + "loss": 0.7256, + "step": 55912 + }, + { + "epoch": 1.43, + "learning_rate": 1.1205430191848196e-06, + "loss": 0.6826, + "step": 55913 + }, + { + "epoch": 1.43, + "learning_rate": 1.1205155504548408e-06, + "loss": 0.6865, + "step": 55914 + }, + { + "epoch": 1.43, + "learning_rate": 1.1204880816325885e-06, + "loss": 0.6992, + "step": 55915 + }, + { + "epoch": 1.43, + "learning_rate": 1.1204606127180842e-06, + "loss": 0.6836, + "step": 55916 + }, + { + "epoch": 1.43, + "learning_rate": 1.1204331437113488e-06, + "loss": 0.6758, + "step": 55917 + }, + { + "epoch": 1.43, + "learning_rate": 1.1204056746124035e-06, + "loss": 0.7471, + "step": 55918 + }, + { + "epoch": 1.43, + "learning_rate": 1.1203782054212688e-06, + "loss": 0.7915, + "step": 55919 + }, + { + "epoch": 1.43, + "learning_rate": 1.1203507361379661e-06, + "loss": 0.6472, + "step": 55920 + }, + { + "epoch": 1.43, + "learning_rate": 1.1203232667625162e-06, + "loss": 0.6279, + "step": 55921 + }, + { + "epoch": 1.43, + "learning_rate": 1.1202957972949407e-06, + "loss": 0.8564, + "step": 55922 + }, + { + "epoch": 1.43, + "learning_rate": 1.12026832773526e-06, + "loss": 0.8359, + "step": 55923 + }, + { + "epoch": 1.43, + "learning_rate": 1.1202408580834957e-06, + "loss": 0.834, + "step": 55924 + }, + { + "epoch": 1.43, + "learning_rate": 1.120213388339668e-06, + "loss": 0.7402, + "step": 55925 + }, + { + "epoch": 1.43, + "learning_rate": 1.1201859185037987e-06, + "loss": 0.5566, + "step": 55926 + }, + { + "epoch": 1.43, + "learning_rate": 1.1201584485759084e-06, + "loss": 0.8027, + "step": 55927 + }, + { + "epoch": 1.43, + "learning_rate": 1.1201309785560185e-06, + "loss": 0.6768, + "step": 55928 + }, + { + "epoch": 1.43, + "learning_rate": 1.1201035084441497e-06, + "loss": 0.4767, + "step": 55929 + }, + { + "epoch": 1.43, + "learning_rate": 1.1200760382403231e-06, + "loss": 0.749, + "step": 55930 + }, + { + "epoch": 1.43, + "learning_rate": 1.12004856794456e-06, + "loss": 0.6357, + "step": 55931 + }, + { + "epoch": 1.43, + "learning_rate": 1.1200210975568814e-06, + "loss": 0.9248, + "step": 55932 + }, + { + "epoch": 1.43, + "learning_rate": 1.1199936270773078e-06, + "loss": 0.8086, + "step": 55933 + }, + { + "epoch": 1.43, + "learning_rate": 1.1199661565058607e-06, + "loss": 0.7554, + "step": 55934 + }, + { + "epoch": 1.43, + "learning_rate": 1.119938685842561e-06, + "loss": 0.5239, + "step": 55935 + }, + { + "epoch": 1.43, + "learning_rate": 1.1199112150874297e-06, + "loss": 0.6943, + "step": 55936 + }, + { + "epoch": 1.43, + "learning_rate": 1.119883744240488e-06, + "loss": 0.6885, + "step": 55937 + }, + { + "epoch": 1.43, + "learning_rate": 1.1198562733017571e-06, + "loss": 0.5996, + "step": 55938 + }, + { + "epoch": 1.43, + "learning_rate": 1.1198288022712574e-06, + "loss": 0.7207, + "step": 55939 + }, + { + "epoch": 1.43, + "learning_rate": 1.1198013311490104e-06, + "loss": 0.6812, + "step": 55940 + }, + { + "epoch": 1.43, + "learning_rate": 1.1197738599350371e-06, + "loss": 0.8584, + "step": 55941 + }, + { + "epoch": 1.43, + "learning_rate": 1.1197463886293582e-06, + "loss": 0.8711, + "step": 55942 + }, + { + "epoch": 1.43, + "learning_rate": 1.1197189172319955e-06, + "loss": 0.438, + "step": 55943 + }, + { + "epoch": 1.43, + "learning_rate": 1.119691445742969e-06, + "loss": 0.6465, + "step": 55944 + }, + { + "epoch": 1.43, + "learning_rate": 1.1196639741623006e-06, + "loss": 0.6738, + "step": 55945 + }, + { + "epoch": 1.43, + "learning_rate": 1.1196365024900108e-06, + "loss": 0.6641, + "step": 55946 + }, + { + "epoch": 1.43, + "learning_rate": 1.119609030726121e-06, + "loss": 0.6016, + "step": 55947 + }, + { + "epoch": 1.43, + "learning_rate": 1.119581558870652e-06, + "loss": 0.7158, + "step": 55948 + }, + { + "epoch": 1.43, + "learning_rate": 1.1195540869236248e-06, + "loss": 0.6426, + "step": 55949 + }, + { + "epoch": 1.43, + "learning_rate": 1.1195266148850605e-06, + "loss": 0.7217, + "step": 55950 + }, + { + "epoch": 1.43, + "learning_rate": 1.1194991427549805e-06, + "loss": 0.645, + "step": 55951 + }, + { + "epoch": 1.43, + "learning_rate": 1.119471670533405e-06, + "loss": 0.604, + "step": 55952 + }, + { + "epoch": 1.43, + "learning_rate": 1.1194441982203559e-06, + "loss": 0.5798, + "step": 55953 + }, + { + "epoch": 1.43, + "learning_rate": 1.1194167258158537e-06, + "loss": 0.5151, + "step": 55954 + }, + { + "epoch": 1.43, + "learning_rate": 1.1193892533199196e-06, + "loss": 0.6943, + "step": 55955 + }, + { + "epoch": 1.43, + "learning_rate": 1.1193617807325747e-06, + "loss": 0.4072, + "step": 55956 + }, + { + "epoch": 1.43, + "learning_rate": 1.11933430805384e-06, + "loss": 0.7451, + "step": 55957 + }, + { + "epoch": 1.43, + "learning_rate": 1.119306835283737e-06, + "loss": 0.6631, + "step": 55958 + }, + { + "epoch": 1.43, + "learning_rate": 1.1192793624222854e-06, + "loss": 0.665, + "step": 55959 + }, + { + "epoch": 1.43, + "learning_rate": 1.1192518894695075e-06, + "loss": 0.6826, + "step": 55960 + }, + { + "epoch": 1.43, + "learning_rate": 1.1192244164254236e-06, + "loss": 0.7256, + "step": 55961 + }, + { + "epoch": 1.43, + "learning_rate": 1.1191969432900555e-06, + "loss": 0.6953, + "step": 55962 + }, + { + "epoch": 1.43, + "learning_rate": 1.1191694700634235e-06, + "loss": 0.6899, + "step": 55963 + }, + { + "epoch": 1.43, + "learning_rate": 1.1191419967455492e-06, + "loss": 0.8076, + "step": 55964 + }, + { + "epoch": 1.43, + "learning_rate": 1.119114523336453e-06, + "loss": 0.6953, + "step": 55965 + }, + { + "epoch": 1.43, + "learning_rate": 1.1190870498361563e-06, + "loss": 0.5691, + "step": 55966 + }, + { + "epoch": 1.43, + "learning_rate": 1.1190595762446802e-06, + "loss": 0.6973, + "step": 55967 + }, + { + "epoch": 1.43, + "learning_rate": 1.119032102562046e-06, + "loss": 0.4985, + "step": 55968 + }, + { + "epoch": 1.43, + "learning_rate": 1.119004628788274e-06, + "loss": 0.6406, + "step": 55969 + }, + { + "epoch": 1.43, + "learning_rate": 1.1189771549233857e-06, + "loss": 0.6328, + "step": 55970 + }, + { + "epoch": 1.43, + "learning_rate": 1.118949680967402e-06, + "loss": 0.4556, + "step": 55971 + }, + { + "epoch": 1.43, + "learning_rate": 1.1189222069203442e-06, + "loss": 0.7354, + "step": 55972 + }, + { + "epoch": 1.43, + "learning_rate": 1.118894732782233e-06, + "loss": 0.5737, + "step": 55973 + }, + { + "epoch": 1.43, + "learning_rate": 1.1188672585530895e-06, + "loss": 0.6411, + "step": 55974 + }, + { + "epoch": 1.43, + "learning_rate": 1.118839784232935e-06, + "loss": 0.6104, + "step": 55975 + }, + { + "epoch": 1.43, + "learning_rate": 1.1188123098217902e-06, + "loss": 0.7007, + "step": 55976 + }, + { + "epoch": 1.43, + "learning_rate": 1.118784835319676e-06, + "loss": 0.6104, + "step": 55977 + }, + { + "epoch": 1.43, + "learning_rate": 1.1187573607266144e-06, + "loss": 0.6562, + "step": 55978 + }, + { + "epoch": 1.43, + "learning_rate": 1.1187298860426252e-06, + "loss": 0.4512, + "step": 55979 + }, + { + "epoch": 1.43, + "learning_rate": 1.1187024112677301e-06, + "loss": 0.7246, + "step": 55980 + }, + { + "epoch": 1.43, + "learning_rate": 1.11867493640195e-06, + "loss": 0.7168, + "step": 55981 + }, + { + "epoch": 1.43, + "learning_rate": 1.118647461445306e-06, + "loss": 0.4673, + "step": 55982 + }, + { + "epoch": 1.43, + "learning_rate": 1.1186199863978194e-06, + "loss": 0.6411, + "step": 55983 + }, + { + "epoch": 1.43, + "learning_rate": 1.1185925112595106e-06, + "loss": 0.6396, + "step": 55984 + }, + { + "epoch": 1.43, + "learning_rate": 1.118565036030401e-06, + "loss": 0.522, + "step": 55985 + }, + { + "epoch": 1.43, + "learning_rate": 1.1185375607105114e-06, + "loss": 0.791, + "step": 55986 + }, + { + "epoch": 1.43, + "learning_rate": 1.1185100852998634e-06, + "loss": 0.5977, + "step": 55987 + }, + { + "epoch": 1.44, + "learning_rate": 1.1184826097984777e-06, + "loss": 0.709, + "step": 55988 + }, + { + "epoch": 1.44, + "learning_rate": 1.1184551342063752e-06, + "loss": 0.5334, + "step": 55989 + }, + { + "epoch": 1.44, + "learning_rate": 1.1184276585235768e-06, + "loss": 0.6128, + "step": 55990 + }, + { + "epoch": 1.44, + "learning_rate": 1.1184001827501042e-06, + "loss": 0.6284, + "step": 55991 + }, + { + "epoch": 1.44, + "learning_rate": 1.1183727068859777e-06, + "loss": 0.6272, + "step": 55992 + }, + { + "epoch": 1.44, + "learning_rate": 1.1183452309312186e-06, + "loss": 0.5781, + "step": 55993 + }, + { + "epoch": 1.44, + "learning_rate": 1.1183177548858484e-06, + "loss": 0.7861, + "step": 55994 + }, + { + "epoch": 1.44, + "learning_rate": 1.1182902787498876e-06, + "loss": 0.6426, + "step": 55995 + }, + { + "epoch": 1.44, + "learning_rate": 1.1182628025233572e-06, + "loss": 0.6426, + "step": 55996 + }, + { + "epoch": 1.44, + "learning_rate": 1.1182353262062785e-06, + "loss": 0.6748, + "step": 55997 + }, + { + "epoch": 1.44, + "learning_rate": 1.1182078497986724e-06, + "loss": 0.5938, + "step": 55998 + }, + { + "epoch": 1.44, + "learning_rate": 1.11818037330056e-06, + "loss": 0.7334, + "step": 55999 + }, + { + "epoch": 1.44, + "learning_rate": 1.1181528967119625e-06, + "loss": 0.4976, + "step": 56000 + }, + { + "epoch": 1.44, + "learning_rate": 1.1181254200329005e-06, + "loss": 0.5425, + "step": 56001 + }, + { + "epoch": 1.44, + "learning_rate": 1.1180979432633955e-06, + "loss": 0.4893, + "step": 56002 + }, + { + "epoch": 1.44, + "learning_rate": 1.1180704664034682e-06, + "loss": 0.6411, + "step": 56003 + }, + { + "epoch": 1.44, + "learning_rate": 1.1180429894531399e-06, + "loss": 0.4149, + "step": 56004 + }, + { + "epoch": 1.44, + "learning_rate": 1.1180155124124312e-06, + "loss": 0.5498, + "step": 56005 + }, + { + "epoch": 1.44, + "learning_rate": 1.1179880352813638e-06, + "loss": 0.7744, + "step": 56006 + }, + { + "epoch": 1.44, + "learning_rate": 1.1179605580599583e-06, + "loss": 0.5923, + "step": 56007 + }, + { + "epoch": 1.44, + "learning_rate": 1.117933080748236e-06, + "loss": 0.7021, + "step": 56008 + }, + { + "epoch": 1.44, + "learning_rate": 1.1179056033462173e-06, + "loss": 0.6997, + "step": 56009 + }, + { + "epoch": 1.44, + "learning_rate": 1.117878125853924e-06, + "loss": 0.7939, + "step": 56010 + }, + { + "epoch": 1.44, + "learning_rate": 1.1178506482713767e-06, + "loss": 0.5752, + "step": 56011 + }, + { + "epoch": 1.44, + "learning_rate": 1.117823170598597e-06, + "loss": 0.5635, + "step": 56012 + }, + { + "epoch": 1.44, + "learning_rate": 1.117795692835605e-06, + "loss": 0.5347, + "step": 56013 + }, + { + "epoch": 1.44, + "learning_rate": 1.1177682149824223e-06, + "loss": 0.6738, + "step": 56014 + }, + { + "epoch": 1.44, + "learning_rate": 1.1177407370390702e-06, + "loss": 0.5967, + "step": 56015 + }, + { + "epoch": 1.44, + "learning_rate": 1.117713259005569e-06, + "loss": 0.6946, + "step": 56016 + }, + { + "epoch": 1.44, + "learning_rate": 1.1176857808819406e-06, + "loss": 0.7422, + "step": 56017 + }, + { + "epoch": 1.44, + "learning_rate": 1.1176583026682053e-06, + "loss": 0.5417, + "step": 56018 + }, + { + "epoch": 1.44, + "learning_rate": 1.1176308243643848e-06, + "loss": 0.6157, + "step": 56019 + }, + { + "epoch": 1.44, + "learning_rate": 1.1176033459704995e-06, + "loss": 0.417, + "step": 56020 + }, + { + "epoch": 1.44, + "learning_rate": 1.1175758674865708e-06, + "loss": 0.455, + "step": 56021 + }, + { + "epoch": 1.44, + "learning_rate": 1.1175483889126196e-06, + "loss": 0.6812, + "step": 56022 + }, + { + "epoch": 1.44, + "learning_rate": 1.1175209102486674e-06, + "loss": 0.7627, + "step": 56023 + }, + { + "epoch": 1.44, + "learning_rate": 1.1174934314947343e-06, + "loss": 0.5425, + "step": 56024 + }, + { + "epoch": 1.44, + "learning_rate": 1.1174659526508422e-06, + "loss": 0.6216, + "step": 56025 + }, + { + "epoch": 1.44, + "learning_rate": 1.1174384737170115e-06, + "loss": 0.5267, + "step": 56026 + }, + { + "epoch": 1.44, + "learning_rate": 1.117410994693264e-06, + "loss": 0.647, + "step": 56027 + }, + { + "epoch": 1.44, + "learning_rate": 1.1173835155796199e-06, + "loss": 0.7607, + "step": 56028 + }, + { + "epoch": 1.44, + "learning_rate": 1.117356036376101e-06, + "loss": 0.6738, + "step": 56029 + }, + { + "epoch": 1.44, + "learning_rate": 1.1173285570827276e-06, + "loss": 0.4844, + "step": 56030 + }, + { + "epoch": 1.44, + "learning_rate": 1.1173010776995214e-06, + "loss": 0.6758, + "step": 56031 + }, + { + "epoch": 1.44, + "learning_rate": 1.1172735982265032e-06, + "loss": 0.7168, + "step": 56032 + }, + { + "epoch": 1.44, + "learning_rate": 1.1172461186636938e-06, + "loss": 0.5859, + "step": 56033 + }, + { + "epoch": 1.44, + "learning_rate": 1.1172186390111144e-06, + "loss": 0.6494, + "step": 56034 + }, + { + "epoch": 1.44, + "learning_rate": 1.117191159268786e-06, + "loss": 0.667, + "step": 56035 + }, + { + "epoch": 1.44, + "learning_rate": 1.1171636794367301e-06, + "loss": 0.4904, + "step": 56036 + }, + { + "epoch": 1.44, + "learning_rate": 1.117136199514967e-06, + "loss": 0.7852, + "step": 56037 + }, + { + "epoch": 1.44, + "learning_rate": 1.1171087195035186e-06, + "loss": 0.749, + "step": 56038 + }, + { + "epoch": 1.44, + "learning_rate": 1.1170812394024051e-06, + "loss": 0.5969, + "step": 56039 + }, + { + "epoch": 1.44, + "learning_rate": 1.1170537592116478e-06, + "loss": 0.4333, + "step": 56040 + }, + { + "epoch": 1.44, + "learning_rate": 1.117026278931268e-06, + "loss": 0.7275, + "step": 56041 + }, + { + "epoch": 1.44, + "learning_rate": 1.1169987985612863e-06, + "loss": 0.5454, + "step": 56042 + }, + { + "epoch": 1.44, + "learning_rate": 1.1169713181017242e-06, + "loss": 0.6826, + "step": 56043 + }, + { + "epoch": 1.44, + "learning_rate": 1.1169438375526025e-06, + "loss": 0.5879, + "step": 56044 + }, + { + "epoch": 1.44, + "learning_rate": 1.116916356913942e-06, + "loss": 0.6096, + "step": 56045 + }, + { + "epoch": 1.44, + "learning_rate": 1.1168888761857644e-06, + "loss": 0.793, + "step": 56046 + }, + { + "epoch": 1.44, + "learning_rate": 1.1168613953680903e-06, + "loss": 0.7324, + "step": 56047 + }, + { + "epoch": 1.44, + "learning_rate": 1.116833914460941e-06, + "loss": 0.7734, + "step": 56048 + }, + { + "epoch": 1.44, + "learning_rate": 1.116806433464337e-06, + "loss": 0.5811, + "step": 56049 + }, + { + "epoch": 1.44, + "learning_rate": 1.1167789523782999e-06, + "loss": 0.6543, + "step": 56050 + }, + { + "epoch": 1.44, + "learning_rate": 1.11675147120285e-06, + "loss": 0.6514, + "step": 56051 + }, + { + "epoch": 1.44, + "learning_rate": 1.1167239899380097e-06, + "loss": 0.6069, + "step": 56052 + }, + { + "epoch": 1.44, + "learning_rate": 1.1166965085837987e-06, + "loss": 0.9902, + "step": 56053 + }, + { + "epoch": 1.44, + "learning_rate": 1.1166690271402386e-06, + "loss": 0.5962, + "step": 56054 + }, + { + "epoch": 1.44, + "learning_rate": 1.1166415456073504e-06, + "loss": 0.488, + "step": 56055 + }, + { + "epoch": 1.44, + "learning_rate": 1.1166140639851551e-06, + "loss": 0.5186, + "step": 56056 + }, + { + "epoch": 1.44, + "learning_rate": 1.1165865822736739e-06, + "loss": 0.7314, + "step": 56057 + }, + { + "epoch": 1.44, + "learning_rate": 1.1165591004729278e-06, + "loss": 0.5776, + "step": 56058 + }, + { + "epoch": 1.44, + "learning_rate": 1.1165316185829373e-06, + "loss": 0.5889, + "step": 56059 + }, + { + "epoch": 1.44, + "learning_rate": 1.1165041366037244e-06, + "loss": 0.5526, + "step": 56060 + }, + { + "epoch": 1.44, + "learning_rate": 1.1164766545353094e-06, + "loss": 0.8545, + "step": 56061 + }, + { + "epoch": 1.44, + "learning_rate": 1.1164491723777137e-06, + "loss": 0.7227, + "step": 56062 + }, + { + "epoch": 1.44, + "learning_rate": 1.1164216901309582e-06, + "loss": 0.6294, + "step": 56063 + }, + { + "epoch": 1.44, + "learning_rate": 1.116394207795064e-06, + "loss": 0.5259, + "step": 56064 + }, + { + "epoch": 1.44, + "learning_rate": 1.1163667253700519e-06, + "loss": 0.5293, + "step": 56065 + }, + { + "epoch": 1.44, + "learning_rate": 1.1163392428559432e-06, + "loss": 0.5957, + "step": 56066 + }, + { + "epoch": 1.44, + "learning_rate": 1.1163117602527592e-06, + "loss": 0.6104, + "step": 56067 + }, + { + "epoch": 1.44, + "learning_rate": 1.11628427756052e-06, + "loss": 0.6846, + "step": 56068 + }, + { + "epoch": 1.44, + "learning_rate": 1.116256794779248e-06, + "loss": 0.6113, + "step": 56069 + }, + { + "epoch": 1.44, + "learning_rate": 1.116229311908963e-06, + "loss": 0.5088, + "step": 56070 + }, + { + "epoch": 1.44, + "learning_rate": 1.1162018289496868e-06, + "loss": 0.7163, + "step": 56071 + }, + { + "epoch": 1.44, + "learning_rate": 1.1161743459014404e-06, + "loss": 0.7725, + "step": 56072 + }, + { + "epoch": 1.44, + "learning_rate": 1.1161468627642443e-06, + "loss": 0.5996, + "step": 56073 + }, + { + "epoch": 1.44, + "learning_rate": 1.11611937953812e-06, + "loss": 0.5226, + "step": 56074 + }, + { + "epoch": 1.44, + "learning_rate": 1.1160918962230884e-06, + "loss": 0.4551, + "step": 56075 + }, + { + "epoch": 1.44, + "learning_rate": 1.1160644128191703e-06, + "loss": 0.5898, + "step": 56076 + }, + { + "epoch": 1.44, + "learning_rate": 1.1160369293263876e-06, + "loss": 0.7627, + "step": 56077 + }, + { + "epoch": 1.44, + "learning_rate": 1.1160094457447603e-06, + "loss": 0.7373, + "step": 56078 + }, + { + "epoch": 1.44, + "learning_rate": 1.1159819620743102e-06, + "loss": 0.7515, + "step": 56079 + }, + { + "epoch": 1.44, + "learning_rate": 1.1159544783150577e-06, + "loss": 0.6685, + "step": 56080 + }, + { + "epoch": 1.44, + "learning_rate": 1.1159269944670246e-06, + "loss": 0.6045, + "step": 56081 + }, + { + "epoch": 1.44, + "learning_rate": 1.1158995105302313e-06, + "loss": 0.5063, + "step": 56082 + }, + { + "epoch": 1.44, + "learning_rate": 1.115872026504699e-06, + "loss": 0.7148, + "step": 56083 + }, + { + "epoch": 1.44, + "learning_rate": 1.115844542390449e-06, + "loss": 0.5073, + "step": 56084 + }, + { + "epoch": 1.44, + "learning_rate": 1.1158170581875022e-06, + "loss": 0.6045, + "step": 56085 + }, + { + "epoch": 1.44, + "learning_rate": 1.1157895738958794e-06, + "loss": 0.7607, + "step": 56086 + }, + { + "epoch": 1.44, + "learning_rate": 1.1157620895156019e-06, + "loss": 0.6196, + "step": 56087 + }, + { + "epoch": 1.44, + "learning_rate": 1.1157346050466906e-06, + "loss": 0.6348, + "step": 56088 + }, + { + "epoch": 1.44, + "learning_rate": 1.1157071204891668e-06, + "loss": 0.5947, + "step": 56089 + }, + { + "epoch": 1.44, + "learning_rate": 1.1156796358430514e-06, + "loss": 0.7456, + "step": 56090 + }, + { + "epoch": 1.44, + "learning_rate": 1.115652151108365e-06, + "loss": 0.7026, + "step": 56091 + }, + { + "epoch": 1.44, + "learning_rate": 1.1156246662851298e-06, + "loss": 0.4658, + "step": 56092 + }, + { + "epoch": 1.44, + "learning_rate": 1.1155971813733658e-06, + "loss": 0.7168, + "step": 56093 + }, + { + "epoch": 1.44, + "learning_rate": 1.1155696963730942e-06, + "loss": 0.6035, + "step": 56094 + }, + { + "epoch": 1.44, + "learning_rate": 1.1155422112843363e-06, + "loss": 0.7227, + "step": 56095 + }, + { + "epoch": 1.44, + "learning_rate": 1.115514726107113e-06, + "loss": 0.5825, + "step": 56096 + }, + { + "epoch": 1.44, + "learning_rate": 1.1154872408414455e-06, + "loss": 0.6699, + "step": 56097 + }, + { + "epoch": 1.44, + "learning_rate": 1.1154597554873548e-06, + "loss": 0.6895, + "step": 56098 + }, + { + "epoch": 1.44, + "learning_rate": 1.1154322700448615e-06, + "loss": 0.6533, + "step": 56099 + }, + { + "epoch": 1.44, + "learning_rate": 1.1154047845139874e-06, + "loss": 0.7549, + "step": 56100 + }, + { + "epoch": 1.44, + "learning_rate": 1.1153772988947528e-06, + "loss": 0.5684, + "step": 56101 + }, + { + "epoch": 1.44, + "learning_rate": 1.1153498131871796e-06, + "loss": 0.6665, + "step": 56102 + }, + { + "epoch": 1.44, + "learning_rate": 1.1153223273912876e-06, + "loss": 0.6592, + "step": 56103 + }, + { + "epoch": 1.44, + "learning_rate": 1.1152948415070993e-06, + "loss": 0.71, + "step": 56104 + }, + { + "epoch": 1.44, + "learning_rate": 1.1152673555346347e-06, + "loss": 0.7021, + "step": 56105 + }, + { + "epoch": 1.44, + "learning_rate": 1.1152398694739154e-06, + "loss": 0.4054, + "step": 56106 + }, + { + "epoch": 1.44, + "learning_rate": 1.1152123833249623e-06, + "loss": 0.4995, + "step": 56107 + }, + { + "epoch": 1.44, + "learning_rate": 1.115184897087796e-06, + "loss": 0.7715, + "step": 56108 + }, + { + "epoch": 1.44, + "learning_rate": 1.115157410762438e-06, + "loss": 0.3291, + "step": 56109 + }, + { + "epoch": 1.44, + "learning_rate": 1.1151299243489094e-06, + "loss": 0.7812, + "step": 56110 + }, + { + "epoch": 1.44, + "learning_rate": 1.1151024378472311e-06, + "loss": 0.5278, + "step": 56111 + }, + { + "epoch": 1.44, + "learning_rate": 1.1150749512574243e-06, + "loss": 0.5847, + "step": 56112 + }, + { + "epoch": 1.44, + "learning_rate": 1.1150474645795096e-06, + "loss": 0.6235, + "step": 56113 + }, + { + "epoch": 1.44, + "learning_rate": 1.1150199778135085e-06, + "loss": 0.7744, + "step": 56114 + }, + { + "epoch": 1.44, + "learning_rate": 1.1149924909594418e-06, + "loss": 0.6006, + "step": 56115 + }, + { + "epoch": 1.44, + "learning_rate": 1.1149650040173305e-06, + "loss": 0.5485, + "step": 56116 + }, + { + "epoch": 1.44, + "learning_rate": 1.1149375169871964e-06, + "loss": 0.689, + "step": 56117 + }, + { + "epoch": 1.44, + "learning_rate": 1.1149100298690594e-06, + "loss": 0.6013, + "step": 56118 + }, + { + "epoch": 1.44, + "learning_rate": 1.1148825426629415e-06, + "loss": 0.5591, + "step": 56119 + }, + { + "epoch": 1.44, + "learning_rate": 1.1148550553688628e-06, + "loss": 0.7812, + "step": 56120 + }, + { + "epoch": 1.44, + "learning_rate": 1.114827567986845e-06, + "loss": 0.6475, + "step": 56121 + }, + { + "epoch": 1.44, + "learning_rate": 1.114800080516909e-06, + "loss": 0.4561, + "step": 56122 + }, + { + "epoch": 1.44, + "learning_rate": 1.1147725929590763e-06, + "loss": 0.6025, + "step": 56123 + }, + { + "epoch": 1.44, + "learning_rate": 1.114745105313367e-06, + "loss": 0.5347, + "step": 56124 + }, + { + "epoch": 1.44, + "learning_rate": 1.1147176175798027e-06, + "loss": 0.5701, + "step": 56125 + }, + { + "epoch": 1.44, + "learning_rate": 1.1146901297584045e-06, + "loss": 0.5947, + "step": 56126 + }, + { + "epoch": 1.44, + "learning_rate": 1.1146626418491933e-06, + "loss": 0.6953, + "step": 56127 + }, + { + "epoch": 1.44, + "learning_rate": 1.1146351538521903e-06, + "loss": 0.5425, + "step": 56128 + }, + { + "epoch": 1.44, + "learning_rate": 1.1146076657674166e-06, + "loss": 0.7544, + "step": 56129 + }, + { + "epoch": 1.44, + "learning_rate": 1.1145801775948927e-06, + "loss": 0.6777, + "step": 56130 + }, + { + "epoch": 1.44, + "learning_rate": 1.1145526893346402e-06, + "loss": 0.7354, + "step": 56131 + }, + { + "epoch": 1.44, + "learning_rate": 1.11452520098668e-06, + "loss": 0.6182, + "step": 56132 + }, + { + "epoch": 1.44, + "learning_rate": 1.1144977125510329e-06, + "loss": 0.6196, + "step": 56133 + }, + { + "epoch": 1.44, + "learning_rate": 1.1144702240277205e-06, + "loss": 0.645, + "step": 56134 + }, + { + "epoch": 1.44, + "learning_rate": 1.114442735416763e-06, + "loss": 0.8311, + "step": 56135 + }, + { + "epoch": 1.44, + "learning_rate": 1.1144152467181824e-06, + "loss": 0.7324, + "step": 56136 + }, + { + "epoch": 1.44, + "learning_rate": 1.1143877579319993e-06, + "loss": 0.5928, + "step": 56137 + }, + { + "epoch": 1.44, + "learning_rate": 1.1143602690582348e-06, + "loss": 0.8369, + "step": 56138 + }, + { + "epoch": 1.44, + "learning_rate": 1.1143327800969096e-06, + "loss": 0.6377, + "step": 56139 + }, + { + "epoch": 1.44, + "learning_rate": 1.1143052910480453e-06, + "loss": 0.6016, + "step": 56140 + }, + { + "epoch": 1.44, + "learning_rate": 1.1142778019116623e-06, + "loss": 0.6846, + "step": 56141 + }, + { + "epoch": 1.44, + "learning_rate": 1.1142503126877827e-06, + "loss": 0.5918, + "step": 56142 + }, + { + "epoch": 1.44, + "learning_rate": 1.1142228233764263e-06, + "loss": 0.6714, + "step": 56143 + }, + { + "epoch": 1.44, + "learning_rate": 1.1141953339776151e-06, + "loss": 0.5918, + "step": 56144 + }, + { + "epoch": 1.44, + "learning_rate": 1.1141678444913696e-06, + "loss": 0.6426, + "step": 56145 + }, + { + "epoch": 1.44, + "learning_rate": 1.114140354917711e-06, + "loss": 0.7427, + "step": 56146 + }, + { + "epoch": 1.44, + "learning_rate": 1.1141128652566608e-06, + "loss": 0.6875, + "step": 56147 + }, + { + "epoch": 1.44, + "learning_rate": 1.1140853755082393e-06, + "loss": 0.5864, + "step": 56148 + }, + { + "epoch": 1.44, + "learning_rate": 1.1140578856724676e-06, + "loss": 0.6306, + "step": 56149 + }, + { + "epoch": 1.44, + "learning_rate": 1.1140303957493676e-06, + "loss": 0.4751, + "step": 56150 + }, + { + "epoch": 1.44, + "learning_rate": 1.114002905738959e-06, + "loss": 0.6072, + "step": 56151 + }, + { + "epoch": 1.44, + "learning_rate": 1.1139754156412642e-06, + "loss": 0.7783, + "step": 56152 + }, + { + "epoch": 1.44, + "learning_rate": 1.1139479254563036e-06, + "loss": 0.5911, + "step": 56153 + }, + { + "epoch": 1.44, + "learning_rate": 1.1139204351840983e-06, + "loss": 0.7124, + "step": 56154 + }, + { + "epoch": 1.44, + "learning_rate": 1.1138929448246692e-06, + "loss": 0.5645, + "step": 56155 + }, + { + "epoch": 1.44, + "learning_rate": 1.1138654543780375e-06, + "loss": 0.7168, + "step": 56156 + }, + { + "epoch": 1.44, + "learning_rate": 1.1138379638442248e-06, + "loss": 0.8301, + "step": 56157 + }, + { + "epoch": 1.44, + "learning_rate": 1.113810473223251e-06, + "loss": 0.6812, + "step": 56158 + }, + { + "epoch": 1.44, + "learning_rate": 1.1137829825151378e-06, + "loss": 0.626, + "step": 56159 + }, + { + "epoch": 1.44, + "learning_rate": 1.1137554917199063e-06, + "loss": 0.7812, + "step": 56160 + }, + { + "epoch": 1.44, + "learning_rate": 1.1137280008375775e-06, + "loss": 0.7217, + "step": 56161 + }, + { + "epoch": 1.44, + "learning_rate": 1.1137005098681726e-06, + "loss": 0.5591, + "step": 56162 + }, + { + "epoch": 1.44, + "learning_rate": 1.1136730188117123e-06, + "loss": 0.6294, + "step": 56163 + }, + { + "epoch": 1.44, + "learning_rate": 1.1136455276682174e-06, + "loss": 0.5186, + "step": 56164 + }, + { + "epoch": 1.44, + "learning_rate": 1.11361803643771e-06, + "loss": 0.5942, + "step": 56165 + }, + { + "epoch": 1.44, + "learning_rate": 1.11359054512021e-06, + "loss": 0.8398, + "step": 56166 + }, + { + "epoch": 1.44, + "learning_rate": 1.1135630537157392e-06, + "loss": 0.5264, + "step": 56167 + }, + { + "epoch": 1.44, + "learning_rate": 1.1135355622243183e-06, + "loss": 0.8037, + "step": 56168 + }, + { + "epoch": 1.44, + "learning_rate": 1.1135080706459686e-06, + "loss": 0.7002, + "step": 56169 + }, + { + "epoch": 1.44, + "learning_rate": 1.1134805789807107e-06, + "loss": 0.5952, + "step": 56170 + }, + { + "epoch": 1.44, + "learning_rate": 1.1134530872285661e-06, + "loss": 0.7715, + "step": 56171 + }, + { + "epoch": 1.44, + "learning_rate": 1.1134255953895557e-06, + "loss": 0.6807, + "step": 56172 + }, + { + "epoch": 1.44, + "learning_rate": 1.1133981034637004e-06, + "loss": 0.5659, + "step": 56173 + }, + { + "epoch": 1.44, + "learning_rate": 1.1133706114510216e-06, + "loss": 0.5739, + "step": 56174 + }, + { + "epoch": 1.44, + "learning_rate": 1.1133431193515399e-06, + "loss": 0.6187, + "step": 56175 + }, + { + "epoch": 1.44, + "learning_rate": 1.1133156271652767e-06, + "loss": 0.625, + "step": 56176 + }, + { + "epoch": 1.44, + "learning_rate": 1.113288134892253e-06, + "loss": 0.4863, + "step": 56177 + }, + { + "epoch": 1.44, + "learning_rate": 1.1132606425324898e-06, + "loss": 0.625, + "step": 56178 + }, + { + "epoch": 1.44, + "learning_rate": 1.113233150086008e-06, + "loss": 0.6797, + "step": 56179 + }, + { + "epoch": 1.44, + "learning_rate": 1.1132056575528288e-06, + "loss": 0.6064, + "step": 56180 + }, + { + "epoch": 1.44, + "learning_rate": 1.113178164932973e-06, + "loss": 0.6558, + "step": 56181 + }, + { + "epoch": 1.44, + "learning_rate": 1.1131506722264625e-06, + "loss": 0.5703, + "step": 56182 + }, + { + "epoch": 1.44, + "learning_rate": 1.1131231794333174e-06, + "loss": 0.5815, + "step": 56183 + }, + { + "epoch": 1.44, + "learning_rate": 1.1130956865535591e-06, + "loss": 0.6104, + "step": 56184 + }, + { + "epoch": 1.44, + "learning_rate": 1.1130681935872085e-06, + "loss": 0.7725, + "step": 56185 + }, + { + "epoch": 1.44, + "learning_rate": 1.1130407005342868e-06, + "loss": 0.7295, + "step": 56186 + }, + { + "epoch": 1.44, + "learning_rate": 1.1130132073948153e-06, + "loss": 0.6636, + "step": 56187 + }, + { + "epoch": 1.44, + "learning_rate": 1.1129857141688145e-06, + "loss": 0.7168, + "step": 56188 + }, + { + "epoch": 1.44, + "learning_rate": 1.1129582208563057e-06, + "loss": 0.6992, + "step": 56189 + }, + { + "epoch": 1.44, + "learning_rate": 1.1129307274573103e-06, + "loss": 0.584, + "step": 56190 + }, + { + "epoch": 1.44, + "learning_rate": 1.1129032339718487e-06, + "loss": 0.667, + "step": 56191 + }, + { + "epoch": 1.44, + "learning_rate": 1.1128757403999428e-06, + "loss": 0.7139, + "step": 56192 + }, + { + "epoch": 1.44, + "learning_rate": 1.1128482467416128e-06, + "loss": 0.7275, + "step": 56193 + }, + { + "epoch": 1.44, + "learning_rate": 1.1128207529968801e-06, + "loss": 0.7568, + "step": 56194 + }, + { + "epoch": 1.44, + "learning_rate": 1.1127932591657654e-06, + "loss": 0.9424, + "step": 56195 + }, + { + "epoch": 1.44, + "learning_rate": 1.1127657652482905e-06, + "loss": 0.6626, + "step": 56196 + }, + { + "epoch": 1.44, + "learning_rate": 1.112738271244476e-06, + "loss": 0.5125, + "step": 56197 + }, + { + "epoch": 1.44, + "learning_rate": 1.1127107771543427e-06, + "loss": 0.6304, + "step": 56198 + }, + { + "epoch": 1.44, + "learning_rate": 1.1126832829779123e-06, + "loss": 0.55, + "step": 56199 + }, + { + "epoch": 1.44, + "learning_rate": 1.1126557887152053e-06, + "loss": 0.5474, + "step": 56200 + }, + { + "epoch": 1.44, + "learning_rate": 1.1126282943662432e-06, + "loss": 0.7305, + "step": 56201 + }, + { + "epoch": 1.44, + "learning_rate": 1.1126007999310465e-06, + "loss": 0.5562, + "step": 56202 + }, + { + "epoch": 1.44, + "learning_rate": 1.1125733054096368e-06, + "loss": 0.4964, + "step": 56203 + }, + { + "epoch": 1.44, + "learning_rate": 1.1125458108020344e-06, + "loss": 0.5952, + "step": 56204 + }, + { + "epoch": 1.44, + "learning_rate": 1.1125183161082613e-06, + "loss": 0.7676, + "step": 56205 + }, + { + "epoch": 1.44, + "learning_rate": 1.1124908213283377e-06, + "loss": 0.4214, + "step": 56206 + }, + { + "epoch": 1.44, + "learning_rate": 1.112463326462286e-06, + "loss": 0.6299, + "step": 56207 + }, + { + "epoch": 1.44, + "learning_rate": 1.1124358315101252e-06, + "loss": 0.6885, + "step": 56208 + }, + { + "epoch": 1.44, + "learning_rate": 1.112408336471878e-06, + "loss": 0.6553, + "step": 56209 + }, + { + "epoch": 1.44, + "learning_rate": 1.1123808413475645e-06, + "loss": 0.7197, + "step": 56210 + }, + { + "epoch": 1.44, + "learning_rate": 1.1123533461372065e-06, + "loss": 0.6167, + "step": 56211 + }, + { + "epoch": 1.44, + "learning_rate": 1.112325850840825e-06, + "loss": 0.7695, + "step": 56212 + }, + { + "epoch": 1.44, + "learning_rate": 1.1122983554584405e-06, + "loss": 0.6416, + "step": 56213 + }, + { + "epoch": 1.44, + "learning_rate": 1.112270859990074e-06, + "loss": 0.751, + "step": 56214 + }, + { + "epoch": 1.44, + "learning_rate": 1.112243364435747e-06, + "loss": 0.7578, + "step": 56215 + }, + { + "epoch": 1.44, + "learning_rate": 1.1122158687954803e-06, + "loss": 0.6855, + "step": 56216 + }, + { + "epoch": 1.44, + "learning_rate": 1.1121883730692955e-06, + "loss": 0.6284, + "step": 56217 + }, + { + "epoch": 1.44, + "learning_rate": 1.1121608772572132e-06, + "loss": 0.7568, + "step": 56218 + }, + { + "epoch": 1.44, + "learning_rate": 1.1121333813592542e-06, + "loss": 0.6021, + "step": 56219 + }, + { + "epoch": 1.44, + "learning_rate": 1.1121058853754397e-06, + "loss": 0.4985, + "step": 56220 + }, + { + "epoch": 1.44, + "learning_rate": 1.1120783893057911e-06, + "loss": 0.6072, + "step": 56221 + }, + { + "epoch": 1.44, + "learning_rate": 1.1120508931503295e-06, + "loss": 0.6846, + "step": 56222 + }, + { + "epoch": 1.44, + "learning_rate": 1.112023396909075e-06, + "loss": 0.7461, + "step": 56223 + }, + { + "epoch": 1.44, + "learning_rate": 1.11199590058205e-06, + "loss": 0.6367, + "step": 56224 + }, + { + "epoch": 1.44, + "learning_rate": 1.1119684041692745e-06, + "loss": 0.605, + "step": 56225 + }, + { + "epoch": 1.44, + "learning_rate": 1.11194090767077e-06, + "loss": 0.55, + "step": 56226 + }, + { + "epoch": 1.44, + "learning_rate": 1.1119134110865576e-06, + "loss": 0.4449, + "step": 56227 + }, + { + "epoch": 1.44, + "learning_rate": 1.1118859144166583e-06, + "loss": 0.6157, + "step": 56228 + }, + { + "epoch": 1.44, + "learning_rate": 1.111858417661093e-06, + "loss": 0.7402, + "step": 56229 + }, + { + "epoch": 1.44, + "learning_rate": 1.1118309208198828e-06, + "loss": 0.8242, + "step": 56230 + }, + { + "epoch": 1.44, + "learning_rate": 1.1118034238930488e-06, + "loss": 0.7559, + "step": 56231 + }, + { + "epoch": 1.44, + "learning_rate": 1.1117759268806123e-06, + "loss": 0.6514, + "step": 56232 + }, + { + "epoch": 1.44, + "learning_rate": 1.111748429782594e-06, + "loss": 0.7012, + "step": 56233 + }, + { + "epoch": 1.44, + "learning_rate": 1.111720932599015e-06, + "loss": 0.5139, + "step": 56234 + }, + { + "epoch": 1.44, + "learning_rate": 1.1116934353298961e-06, + "loss": 0.708, + "step": 56235 + }, + { + "epoch": 1.44, + "learning_rate": 1.111665937975259e-06, + "loss": 0.5293, + "step": 56236 + }, + { + "epoch": 1.44, + "learning_rate": 1.1116384405351247e-06, + "loss": 0.7295, + "step": 56237 + }, + { + "epoch": 1.44, + "learning_rate": 1.1116109430095137e-06, + "loss": 0.7212, + "step": 56238 + }, + { + "epoch": 1.44, + "learning_rate": 1.1115834453984471e-06, + "loss": 0.8047, + "step": 56239 + }, + { + "epoch": 1.44, + "learning_rate": 1.1115559477019464e-06, + "loss": 0.5708, + "step": 56240 + }, + { + "epoch": 1.44, + "learning_rate": 1.1115284499200324e-06, + "loss": 0.6548, + "step": 56241 + }, + { + "epoch": 1.44, + "learning_rate": 1.1115009520527262e-06, + "loss": 0.7363, + "step": 56242 + }, + { + "epoch": 1.44, + "learning_rate": 1.1114734541000491e-06, + "loss": 0.5742, + "step": 56243 + }, + { + "epoch": 1.44, + "learning_rate": 1.1114459560620216e-06, + "loss": 0.4998, + "step": 56244 + }, + { + "epoch": 1.44, + "learning_rate": 1.1114184579386652e-06, + "loss": 0.7236, + "step": 56245 + }, + { + "epoch": 1.44, + "learning_rate": 1.1113909597300007e-06, + "loss": 0.5808, + "step": 56246 + }, + { + "epoch": 1.44, + "learning_rate": 1.1113634614360496e-06, + "loss": 0.6262, + "step": 56247 + }, + { + "epoch": 1.44, + "learning_rate": 1.1113359630568323e-06, + "loss": 0.6899, + "step": 56248 + }, + { + "epoch": 1.44, + "learning_rate": 1.11130846459237e-06, + "loss": 0.6479, + "step": 56249 + }, + { + "epoch": 1.44, + "learning_rate": 1.1112809660426842e-06, + "loss": 0.522, + "step": 56250 + }, + { + "epoch": 1.44, + "learning_rate": 1.1112534674077957e-06, + "loss": 0.7188, + "step": 56251 + }, + { + "epoch": 1.44, + "learning_rate": 1.1112259686877255e-06, + "loss": 0.6997, + "step": 56252 + }, + { + "epoch": 1.44, + "learning_rate": 1.1111984698824947e-06, + "loss": 0.6248, + "step": 56253 + }, + { + "epoch": 1.44, + "learning_rate": 1.1111709709921242e-06, + "loss": 0.8174, + "step": 56254 + }, + { + "epoch": 1.44, + "learning_rate": 1.1111434720166353e-06, + "loss": 0.646, + "step": 56255 + }, + { + "epoch": 1.44, + "learning_rate": 1.1111159729560488e-06, + "loss": 0.7075, + "step": 56256 + }, + { + "epoch": 1.44, + "learning_rate": 1.1110884738103863e-06, + "loss": 0.6392, + "step": 56257 + }, + { + "epoch": 1.44, + "learning_rate": 1.1110609745796682e-06, + "loss": 0.7383, + "step": 56258 + }, + { + "epoch": 1.44, + "learning_rate": 1.1110334752639158e-06, + "loss": 0.5527, + "step": 56259 + }, + { + "epoch": 1.44, + "learning_rate": 1.11100597586315e-06, + "loss": 0.7061, + "step": 56260 + }, + { + "epoch": 1.44, + "learning_rate": 1.1109784763773924e-06, + "loss": 0.7324, + "step": 56261 + }, + { + "epoch": 1.44, + "learning_rate": 1.1109509768066636e-06, + "loss": 0.8184, + "step": 56262 + }, + { + "epoch": 1.44, + "learning_rate": 1.1109234771509846e-06, + "loss": 0.6719, + "step": 56263 + }, + { + "epoch": 1.44, + "learning_rate": 1.1108959774103768e-06, + "loss": 0.623, + "step": 56264 + }, + { + "epoch": 1.44, + "learning_rate": 1.110868477584861e-06, + "loss": 0.7734, + "step": 56265 + }, + { + "epoch": 1.44, + "learning_rate": 1.110840977674458e-06, + "loss": 0.623, + "step": 56266 + }, + { + "epoch": 1.44, + "learning_rate": 1.1108134776791892e-06, + "loss": 0.7168, + "step": 56267 + }, + { + "epoch": 1.44, + "learning_rate": 1.110785977599076e-06, + "loss": 0.4246, + "step": 56268 + }, + { + "epoch": 1.44, + "learning_rate": 1.1107584774341388e-06, + "loss": 0.6787, + "step": 56269 + }, + { + "epoch": 1.44, + "learning_rate": 1.110730977184399e-06, + "loss": 0.5225, + "step": 56270 + }, + { + "epoch": 1.44, + "learning_rate": 1.1107034768498774e-06, + "loss": 0.7051, + "step": 56271 + }, + { + "epoch": 1.44, + "learning_rate": 1.1106759764305957e-06, + "loss": 0.5703, + "step": 56272 + }, + { + "epoch": 1.44, + "learning_rate": 1.110648475926574e-06, + "loss": 0.5923, + "step": 56273 + }, + { + "epoch": 1.44, + "learning_rate": 1.1106209753378342e-06, + "loss": 0.6182, + "step": 56274 + }, + { + "epoch": 1.44, + "learning_rate": 1.1105934746643968e-06, + "loss": 0.6816, + "step": 56275 + }, + { + "epoch": 1.44, + "learning_rate": 1.1105659739062832e-06, + "loss": 0.4753, + "step": 56276 + }, + { + "epoch": 1.44, + "learning_rate": 1.110538473063514e-06, + "loss": 0.6772, + "step": 56277 + }, + { + "epoch": 1.44, + "learning_rate": 1.110510972136111e-06, + "loss": 0.75, + "step": 56278 + }, + { + "epoch": 1.44, + "learning_rate": 1.1104834711240944e-06, + "loss": 0.4956, + "step": 56279 + }, + { + "epoch": 1.44, + "learning_rate": 1.1104559700274862e-06, + "loss": 0.5151, + "step": 56280 + }, + { + "epoch": 1.44, + "learning_rate": 1.1104284688463063e-06, + "loss": 0.6826, + "step": 56281 + }, + { + "epoch": 1.44, + "learning_rate": 1.1104009675805771e-06, + "loss": 0.7178, + "step": 56282 + }, + { + "epoch": 1.44, + "learning_rate": 1.1103734662303185e-06, + "loss": 0.7144, + "step": 56283 + }, + { + "epoch": 1.44, + "learning_rate": 1.1103459647955525e-06, + "loss": 0.6943, + "step": 56284 + }, + { + "epoch": 1.44, + "learning_rate": 1.110318463276299e-06, + "loss": 0.5605, + "step": 56285 + }, + { + "epoch": 1.44, + "learning_rate": 1.1102909616725803e-06, + "loss": 0.6787, + "step": 56286 + }, + { + "epoch": 1.44, + "learning_rate": 1.1102634599844165e-06, + "loss": 0.6406, + "step": 56287 + }, + { + "epoch": 1.44, + "learning_rate": 1.110235958211829e-06, + "loss": 0.52, + "step": 56288 + }, + { + "epoch": 1.44, + "learning_rate": 1.110208456354839e-06, + "loss": 0.5923, + "step": 56289 + }, + { + "epoch": 1.44, + "learning_rate": 1.1101809544134674e-06, + "loss": 0.6514, + "step": 56290 + }, + { + "epoch": 1.44, + "learning_rate": 1.1101534523877356e-06, + "loss": 0.6924, + "step": 56291 + }, + { + "epoch": 1.44, + "learning_rate": 1.110125950277664e-06, + "loss": 0.5315, + "step": 56292 + }, + { + "epoch": 1.44, + "learning_rate": 1.1100984480832744e-06, + "loss": 0.7354, + "step": 56293 + }, + { + "epoch": 1.44, + "learning_rate": 1.1100709458045872e-06, + "loss": 0.5557, + "step": 56294 + }, + { + "epoch": 1.44, + "learning_rate": 1.110043443441624e-06, + "loss": 0.4961, + "step": 56295 + }, + { + "epoch": 1.44, + "learning_rate": 1.1100159409944052e-06, + "loss": 0.8467, + "step": 56296 + }, + { + "epoch": 1.44, + "learning_rate": 1.1099884384629526e-06, + "loss": 0.7793, + "step": 56297 + }, + { + "epoch": 1.44, + "learning_rate": 1.1099609358472869e-06, + "loss": 0.5791, + "step": 56298 + }, + { + "epoch": 1.44, + "learning_rate": 1.1099334331474288e-06, + "loss": 0.623, + "step": 56299 + }, + { + "epoch": 1.44, + "learning_rate": 1.1099059303633999e-06, + "loss": 0.7744, + "step": 56300 + }, + { + "epoch": 1.44, + "learning_rate": 1.1098784274952216e-06, + "loss": 0.7256, + "step": 56301 + }, + { + "epoch": 1.44, + "learning_rate": 1.1098509245429138e-06, + "loss": 0.6189, + "step": 56302 + }, + { + "epoch": 1.44, + "learning_rate": 1.1098234215064983e-06, + "loss": 0.5659, + "step": 56303 + }, + { + "epoch": 1.44, + "learning_rate": 1.109795918385996e-06, + "loss": 0.6904, + "step": 56304 + }, + { + "epoch": 1.44, + "learning_rate": 1.1097684151814281e-06, + "loss": 0.6465, + "step": 56305 + }, + { + "epoch": 1.44, + "learning_rate": 1.1097409118928157e-06, + "loss": 0.4412, + "step": 56306 + }, + { + "epoch": 1.44, + "learning_rate": 1.1097134085201795e-06, + "loss": 0.7998, + "step": 56307 + }, + { + "epoch": 1.44, + "learning_rate": 1.1096859050635412e-06, + "loss": 0.7002, + "step": 56308 + }, + { + "epoch": 1.44, + "learning_rate": 1.1096584015229214e-06, + "loss": 0.542, + "step": 56309 + }, + { + "epoch": 1.44, + "learning_rate": 1.1096308978983406e-06, + "loss": 0.6914, + "step": 56310 + }, + { + "epoch": 1.44, + "learning_rate": 1.109603394189821e-06, + "loss": 0.7559, + "step": 56311 + }, + { + "epoch": 1.44, + "learning_rate": 1.109575890397383e-06, + "loss": 0.6787, + "step": 56312 + }, + { + "epoch": 1.44, + "learning_rate": 1.1095483865210478e-06, + "loss": 0.75, + "step": 56313 + }, + { + "epoch": 1.44, + "learning_rate": 1.1095208825608365e-06, + "loss": 0.7959, + "step": 56314 + }, + { + "epoch": 1.44, + "learning_rate": 1.1094933785167698e-06, + "loss": 0.8008, + "step": 56315 + }, + { + "epoch": 1.44, + "learning_rate": 1.1094658743888694e-06, + "loss": 0.749, + "step": 56316 + }, + { + "epoch": 1.44, + "learning_rate": 1.1094383701771556e-06, + "loss": 0.5176, + "step": 56317 + }, + { + "epoch": 1.44, + "learning_rate": 1.1094108658816504e-06, + "loss": 0.5708, + "step": 56318 + }, + { + "epoch": 1.44, + "learning_rate": 1.109383361502374e-06, + "loss": 0.6504, + "step": 56319 + }, + { + "epoch": 1.44, + "learning_rate": 1.1093558570393478e-06, + "loss": 0.6553, + "step": 56320 + }, + { + "epoch": 1.44, + "learning_rate": 1.109328352492593e-06, + "loss": 0.6279, + "step": 56321 + }, + { + "epoch": 1.44, + "learning_rate": 1.1093008478621304e-06, + "loss": 0.7393, + "step": 56322 + }, + { + "epoch": 1.44, + "learning_rate": 1.109273343147981e-06, + "loss": 0.5605, + "step": 56323 + }, + { + "epoch": 1.44, + "learning_rate": 1.1092458383501663e-06, + "loss": 0.541, + "step": 56324 + }, + { + "epoch": 1.44, + "learning_rate": 1.1092183334687068e-06, + "loss": 0.623, + "step": 56325 + }, + { + "epoch": 1.44, + "learning_rate": 1.1091908285036243e-06, + "loss": 0.5776, + "step": 56326 + }, + { + "epoch": 1.44, + "learning_rate": 1.1091633234549392e-06, + "loss": 0.5137, + "step": 56327 + }, + { + "epoch": 1.44, + "learning_rate": 1.1091358183226728e-06, + "loss": 0.6768, + "step": 56328 + }, + { + "epoch": 1.44, + "learning_rate": 1.1091083131068457e-06, + "loss": 0.6855, + "step": 56329 + }, + { + "epoch": 1.44, + "learning_rate": 1.1090808078074797e-06, + "loss": 0.5562, + "step": 56330 + }, + { + "epoch": 1.44, + "learning_rate": 1.109053302424596e-06, + "loss": 0.5269, + "step": 56331 + }, + { + "epoch": 1.44, + "learning_rate": 1.1090257969582144e-06, + "loss": 0.5513, + "step": 56332 + }, + { + "epoch": 1.44, + "learning_rate": 1.108998291408357e-06, + "loss": 0.6992, + "step": 56333 + }, + { + "epoch": 1.44, + "learning_rate": 1.1089707857750448e-06, + "loss": 0.6943, + "step": 56334 + }, + { + "epoch": 1.44, + "learning_rate": 1.1089432800582985e-06, + "loss": 0.4468, + "step": 56335 + }, + { + "epoch": 1.44, + "learning_rate": 1.1089157742581396e-06, + "loss": 0.8467, + "step": 56336 + }, + { + "epoch": 1.44, + "learning_rate": 1.1088882683745888e-06, + "loss": 0.4954, + "step": 56337 + }, + { + "epoch": 1.44, + "learning_rate": 1.108860762407667e-06, + "loss": 0.5854, + "step": 56338 + }, + { + "epoch": 1.44, + "learning_rate": 1.1088332563573958e-06, + "loss": 0.7012, + "step": 56339 + }, + { + "epoch": 1.44, + "learning_rate": 1.1088057502237958e-06, + "loss": 0.6221, + "step": 56340 + }, + { + "epoch": 1.44, + "learning_rate": 1.1087782440068886e-06, + "loss": 0.5713, + "step": 56341 + }, + { + "epoch": 1.44, + "learning_rate": 1.1087507377066944e-06, + "loss": 0.6562, + "step": 56342 + }, + { + "epoch": 1.44, + "learning_rate": 1.1087232313232351e-06, + "loss": 0.6064, + "step": 56343 + }, + { + "epoch": 1.44, + "learning_rate": 1.1086957248565312e-06, + "loss": 0.7764, + "step": 56344 + }, + { + "epoch": 1.44, + "learning_rate": 1.1086682183066043e-06, + "loss": 0.4702, + "step": 56345 + }, + { + "epoch": 1.44, + "learning_rate": 1.108640711673475e-06, + "loss": 0.543, + "step": 56346 + }, + { + "epoch": 1.44, + "learning_rate": 1.1086132049571645e-06, + "loss": 0.6382, + "step": 56347 + }, + { + "epoch": 1.44, + "learning_rate": 1.1085856981576935e-06, + "loss": 0.8457, + "step": 56348 + }, + { + "epoch": 1.44, + "learning_rate": 1.1085581912750838e-06, + "loss": 0.7754, + "step": 56349 + }, + { + "epoch": 1.44, + "learning_rate": 1.1085306843093561e-06, + "loss": 0.6768, + "step": 56350 + }, + { + "epoch": 1.44, + "learning_rate": 1.1085031772605313e-06, + "loss": 0.7783, + "step": 56351 + }, + { + "epoch": 1.44, + "learning_rate": 1.108475670128631e-06, + "loss": 0.5879, + "step": 56352 + }, + { + "epoch": 1.44, + "learning_rate": 1.1084481629136752e-06, + "loss": 0.5151, + "step": 56353 + }, + { + "epoch": 1.44, + "learning_rate": 1.1084206556156861e-06, + "loss": 0.5261, + "step": 56354 + }, + { + "epoch": 1.44, + "learning_rate": 1.1083931482346842e-06, + "loss": 0.3376, + "step": 56355 + }, + { + "epoch": 1.44, + "learning_rate": 1.1083656407706906e-06, + "loss": 0.5752, + "step": 56356 + }, + { + "epoch": 1.44, + "learning_rate": 1.1083381332237262e-06, + "loss": 0.6621, + "step": 56357 + }, + { + "epoch": 1.44, + "learning_rate": 1.1083106255938126e-06, + "loss": 0.6328, + "step": 56358 + }, + { + "epoch": 1.44, + "learning_rate": 1.1082831178809705e-06, + "loss": 0.6274, + "step": 56359 + }, + { + "epoch": 1.44, + "learning_rate": 1.108255610085221e-06, + "loss": 0.7412, + "step": 56360 + }, + { + "epoch": 1.44, + "learning_rate": 1.1082281022065849e-06, + "loss": 0.6602, + "step": 56361 + }, + { + "epoch": 1.44, + "learning_rate": 1.1082005942450838e-06, + "loss": 0.5127, + "step": 56362 + }, + { + "epoch": 1.44, + "learning_rate": 1.1081730862007384e-06, + "loss": 0.5073, + "step": 56363 + }, + { + "epoch": 1.44, + "learning_rate": 1.1081455780735699e-06, + "loss": 0.5725, + "step": 56364 + }, + { + "epoch": 1.44, + "learning_rate": 1.108118069863599e-06, + "loss": 0.6663, + "step": 56365 + }, + { + "epoch": 1.44, + "learning_rate": 1.1080905615708475e-06, + "loss": 0.876, + "step": 56366 + }, + { + "epoch": 1.44, + "learning_rate": 1.1080630531953357e-06, + "loss": 0.7949, + "step": 56367 + }, + { + "epoch": 1.44, + "learning_rate": 1.1080355447370853e-06, + "loss": 0.6421, + "step": 56368 + }, + { + "epoch": 1.44, + "learning_rate": 1.1080080361961167e-06, + "loss": 0.5767, + "step": 56369 + }, + { + "epoch": 1.44, + "learning_rate": 1.1079805275724513e-06, + "loss": 0.6582, + "step": 56370 + }, + { + "epoch": 1.44, + "learning_rate": 1.1079530188661105e-06, + "loss": 0.4937, + "step": 56371 + }, + { + "epoch": 1.44, + "learning_rate": 1.107925510077115e-06, + "loss": 0.5122, + "step": 56372 + }, + { + "epoch": 1.44, + "learning_rate": 1.1078980012054858e-06, + "loss": 0.6206, + "step": 56373 + }, + { + "epoch": 1.44, + "learning_rate": 1.1078704922512439e-06, + "loss": 0.6416, + "step": 56374 + }, + { + "epoch": 1.44, + "learning_rate": 1.1078429832144105e-06, + "loss": 0.6274, + "step": 56375 + }, + { + "epoch": 1.44, + "learning_rate": 1.107815474095007e-06, + "loss": 0.396, + "step": 56376 + }, + { + "epoch": 1.44, + "learning_rate": 1.1077879648930541e-06, + "loss": 0.55, + "step": 56377 + }, + { + "epoch": 1.44, + "learning_rate": 1.1077604556085727e-06, + "loss": 0.7539, + "step": 56378 + }, + { + "epoch": 1.45, + "learning_rate": 1.1077329462415843e-06, + "loss": 0.6768, + "step": 56379 + }, + { + "epoch": 1.45, + "learning_rate": 1.1077054367921094e-06, + "loss": 0.6792, + "step": 56380 + }, + { + "epoch": 1.45, + "learning_rate": 1.1076779272601698e-06, + "loss": 0.4214, + "step": 56381 + }, + { + "epoch": 1.45, + "learning_rate": 1.107650417645786e-06, + "loss": 0.4958, + "step": 56382 + }, + { + "epoch": 1.45, + "learning_rate": 1.1076229079489793e-06, + "loss": 0.5068, + "step": 56383 + }, + { + "epoch": 1.45, + "learning_rate": 1.1075953981697704e-06, + "loss": 0.8047, + "step": 56384 + }, + { + "epoch": 1.45, + "learning_rate": 1.1075678883081808e-06, + "loss": 0.5239, + "step": 56385 + }, + { + "epoch": 1.45, + "learning_rate": 1.1075403783642317e-06, + "loss": 0.6343, + "step": 56386 + }, + { + "epoch": 1.45, + "learning_rate": 1.1075128683379436e-06, + "loss": 0.5698, + "step": 56387 + }, + { + "epoch": 1.45, + "learning_rate": 1.1074853582293378e-06, + "loss": 0.7754, + "step": 56388 + }, + { + "epoch": 1.45, + "learning_rate": 1.1074578480384356e-06, + "loss": 0.6689, + "step": 56389 + }, + { + "epoch": 1.45, + "learning_rate": 1.1074303377652576e-06, + "loss": 0.6948, + "step": 56390 + }, + { + "epoch": 1.45, + "learning_rate": 1.1074028274098254e-06, + "loss": 0.5737, + "step": 56391 + }, + { + "epoch": 1.45, + "learning_rate": 1.1073753169721596e-06, + "loss": 0.7168, + "step": 56392 + }, + { + "epoch": 1.45, + "learning_rate": 1.1073478064522817e-06, + "loss": 0.439, + "step": 56393 + }, + { + "epoch": 1.45, + "learning_rate": 1.107320295850212e-06, + "loss": 0.7207, + "step": 56394 + }, + { + "epoch": 1.45, + "learning_rate": 1.1072927851659727e-06, + "loss": 0.7285, + "step": 56395 + }, + { + "epoch": 1.45, + "learning_rate": 1.107265274399584e-06, + "loss": 0.4409, + "step": 56396 + }, + { + "epoch": 1.45, + "learning_rate": 1.107237763551067e-06, + "loss": 0.5796, + "step": 56397 + }, + { + "epoch": 1.45, + "learning_rate": 1.1072102526204433e-06, + "loss": 0.5122, + "step": 56398 + }, + { + "epoch": 1.45, + "learning_rate": 1.1071827416077334e-06, + "loss": 0.6602, + "step": 56399 + }, + { + "epoch": 1.45, + "learning_rate": 1.1071552305129587e-06, + "loss": 0.5249, + "step": 56400 + }, + { + "epoch": 1.45, + "learning_rate": 1.1071277193361404e-06, + "loss": 0.5356, + "step": 56401 + }, + { + "epoch": 1.45, + "learning_rate": 1.107100208077299e-06, + "loss": 0.668, + "step": 56402 + }, + { + "epoch": 1.45, + "learning_rate": 1.1070726967364558e-06, + "loss": 0.7998, + "step": 56403 + }, + { + "epoch": 1.45, + "learning_rate": 1.1070451853136324e-06, + "loss": 0.6387, + "step": 56404 + }, + { + "epoch": 1.45, + "learning_rate": 1.1070176738088491e-06, + "loss": 0.4573, + "step": 56405 + }, + { + "epoch": 1.45, + "learning_rate": 1.1069901622221277e-06, + "loss": 0.6602, + "step": 56406 + }, + { + "epoch": 1.45, + "learning_rate": 1.1069626505534884e-06, + "loss": 0.6387, + "step": 56407 + }, + { + "epoch": 1.45, + "learning_rate": 1.1069351388029529e-06, + "loss": 0.707, + "step": 56408 + }, + { + "epoch": 1.45, + "learning_rate": 1.1069076269705416e-06, + "loss": 0.6396, + "step": 56409 + }, + { + "epoch": 1.45, + "learning_rate": 1.1068801150562768e-06, + "loss": 0.6543, + "step": 56410 + }, + { + "epoch": 1.45, + "learning_rate": 1.1068526030601786e-06, + "loss": 0.6377, + "step": 56411 + }, + { + "epoch": 1.45, + "learning_rate": 1.106825090982268e-06, + "loss": 0.5571, + "step": 56412 + }, + { + "epoch": 1.45, + "learning_rate": 1.1067975788225664e-06, + "loss": 0.708, + "step": 56413 + }, + { + "epoch": 1.45, + "learning_rate": 1.106770066581095e-06, + "loss": 0.6528, + "step": 56414 + }, + { + "epoch": 1.45, + "learning_rate": 1.1067425542578747e-06, + "loss": 0.5525, + "step": 56415 + }, + { + "epoch": 1.45, + "learning_rate": 1.1067150418529263e-06, + "loss": 0.7188, + "step": 56416 + }, + { + "epoch": 1.45, + "learning_rate": 1.1066875293662711e-06, + "loss": 0.646, + "step": 56417 + }, + { + "epoch": 1.45, + "learning_rate": 1.1066600167979306e-06, + "loss": 0.5967, + "step": 56418 + }, + { + "epoch": 1.45, + "learning_rate": 1.1066325041479247e-06, + "loss": 0.5171, + "step": 56419 + }, + { + "epoch": 1.45, + "learning_rate": 1.1066049914162757e-06, + "loss": 0.7012, + "step": 56420 + }, + { + "epoch": 1.45, + "learning_rate": 1.1065774786030042e-06, + "loss": 0.6699, + "step": 56421 + }, + { + "epoch": 1.45, + "learning_rate": 1.106549965708131e-06, + "loss": 0.7427, + "step": 56422 + }, + { + "epoch": 1.45, + "learning_rate": 1.1065224527316775e-06, + "loss": 0.665, + "step": 56423 + }, + { + "epoch": 1.45, + "learning_rate": 1.1064949396736644e-06, + "loss": 0.7812, + "step": 56424 + }, + { + "epoch": 1.45, + "learning_rate": 1.1064674265341135e-06, + "loss": 0.791, + "step": 56425 + }, + { + "epoch": 1.45, + "learning_rate": 1.1064399133130451e-06, + "loss": 0.6885, + "step": 56426 + }, + { + "epoch": 1.45, + "learning_rate": 1.1064124000104805e-06, + "loss": 0.6421, + "step": 56427 + }, + { + "epoch": 1.45, + "learning_rate": 1.106384886626441e-06, + "loss": 0.6074, + "step": 56428 + }, + { + "epoch": 1.45, + "learning_rate": 1.1063573731609474e-06, + "loss": 0.6631, + "step": 56429 + }, + { + "epoch": 1.45, + "learning_rate": 1.1063298596140206e-06, + "loss": 0.7188, + "step": 56430 + }, + { + "epoch": 1.45, + "learning_rate": 1.1063023459856825e-06, + "loss": 0.6631, + "step": 56431 + }, + { + "epoch": 1.45, + "learning_rate": 1.1062748322759532e-06, + "loss": 0.6045, + "step": 56432 + }, + { + "epoch": 1.45, + "learning_rate": 1.1062473184848542e-06, + "loss": 0.6421, + "step": 56433 + }, + { + "epoch": 1.45, + "learning_rate": 1.1062198046124062e-06, + "loss": 0.5811, + "step": 56434 + }, + { + "epoch": 1.45, + "learning_rate": 1.106192290658631e-06, + "loss": 0.6694, + "step": 56435 + }, + { + "epoch": 1.45, + "learning_rate": 1.1061647766235492e-06, + "loss": 0.6523, + "step": 56436 + }, + { + "epoch": 1.45, + "learning_rate": 1.106137262507182e-06, + "loss": 0.6421, + "step": 56437 + }, + { + "epoch": 1.45, + "learning_rate": 1.10610974830955e-06, + "loss": 0.665, + "step": 56438 + }, + { + "epoch": 1.45, + "learning_rate": 1.106082234030675e-06, + "loss": 0.6768, + "step": 56439 + }, + { + "epoch": 1.45, + "learning_rate": 1.1060547196705774e-06, + "loss": 0.6299, + "step": 56440 + }, + { + "epoch": 1.45, + "learning_rate": 1.1060272052292789e-06, + "loss": 0.54, + "step": 56441 + }, + { + "epoch": 1.45, + "learning_rate": 1.1059996907068e-06, + "loss": 0.667, + "step": 56442 + }, + { + "epoch": 1.45, + "learning_rate": 1.1059721761031622e-06, + "loss": 0.4976, + "step": 56443 + }, + { + "epoch": 1.45, + "learning_rate": 1.1059446614183862e-06, + "loss": 0.4941, + "step": 56444 + }, + { + "epoch": 1.45, + "learning_rate": 1.1059171466524934e-06, + "loss": 0.627, + "step": 56445 + }, + { + "epoch": 1.45, + "learning_rate": 1.1058896318055047e-06, + "loss": 0.7412, + "step": 56446 + }, + { + "epoch": 1.45, + "learning_rate": 1.105862116877441e-06, + "loss": 0.7568, + "step": 56447 + }, + { + "epoch": 1.45, + "learning_rate": 1.1058346018683239e-06, + "loss": 0.4224, + "step": 56448 + }, + { + "epoch": 1.45, + "learning_rate": 1.1058070867781736e-06, + "loss": 0.5396, + "step": 56449 + }, + { + "epoch": 1.45, + "learning_rate": 1.105779571607012e-06, + "loss": 0.6636, + "step": 56450 + }, + { + "epoch": 1.45, + "learning_rate": 1.10575205635486e-06, + "loss": 0.5659, + "step": 56451 + }, + { + "epoch": 1.45, + "learning_rate": 1.105724541021738e-06, + "loss": 0.7783, + "step": 56452 + }, + { + "epoch": 1.45, + "learning_rate": 1.1056970256076682e-06, + "loss": 0.6167, + "step": 56453 + }, + { + "epoch": 1.45, + "learning_rate": 1.1056695101126704e-06, + "loss": 0.6367, + "step": 56454 + }, + { + "epoch": 1.45, + "learning_rate": 1.1056419945367668e-06, + "loss": 0.6982, + "step": 56455 + }, + { + "epoch": 1.45, + "learning_rate": 1.105614478879978e-06, + "loss": 0.3494, + "step": 56456 + }, + { + "epoch": 1.45, + "learning_rate": 1.1055869631423247e-06, + "loss": 0.7383, + "step": 56457 + }, + { + "epoch": 1.45, + "learning_rate": 1.1055594473238285e-06, + "loss": 0.7461, + "step": 56458 + }, + { + "epoch": 1.45, + "learning_rate": 1.1055319314245104e-06, + "loss": 0.6602, + "step": 56459 + }, + { + "epoch": 1.45, + "learning_rate": 1.105504415444391e-06, + "loss": 0.79, + "step": 56460 + }, + { + "epoch": 1.45, + "learning_rate": 1.1054768993834923e-06, + "loss": 0.6338, + "step": 56461 + }, + { + "epoch": 1.45, + "learning_rate": 1.1054493832418344e-06, + "loss": 0.624, + "step": 56462 + }, + { + "epoch": 1.45, + "learning_rate": 1.1054218670194386e-06, + "loss": 0.6167, + "step": 56463 + }, + { + "epoch": 1.45, + "learning_rate": 1.1053943507163265e-06, + "loss": 0.7227, + "step": 56464 + }, + { + "epoch": 1.45, + "learning_rate": 1.1053668343325185e-06, + "loss": 0.6294, + "step": 56465 + }, + { + "epoch": 1.45, + "learning_rate": 1.1053393178680362e-06, + "loss": 0.6362, + "step": 56466 + }, + { + "epoch": 1.45, + "learning_rate": 1.1053118013229004e-06, + "loss": 0.7896, + "step": 56467 + }, + { + "epoch": 1.45, + "learning_rate": 1.105284284697132e-06, + "loss": 0.614, + "step": 56468 + }, + { + "epoch": 1.45, + "learning_rate": 1.1052567679907522e-06, + "loss": 0.4172, + "step": 56469 + }, + { + "epoch": 1.45, + "learning_rate": 1.105229251203782e-06, + "loss": 0.4801, + "step": 56470 + }, + { + "epoch": 1.45, + "learning_rate": 1.1052017343362435e-06, + "loss": 0.543, + "step": 56471 + }, + { + "epoch": 1.45, + "learning_rate": 1.1051742173881562e-06, + "loss": 0.8379, + "step": 56472 + }, + { + "epoch": 1.45, + "learning_rate": 1.1051467003595418e-06, + "loss": 0.7559, + "step": 56473 + }, + { + "epoch": 1.45, + "learning_rate": 1.1051191832504215e-06, + "loss": 0.5366, + "step": 56474 + }, + { + "epoch": 1.45, + "learning_rate": 1.1050916660608162e-06, + "loss": 0.708, + "step": 56475 + }, + { + "epoch": 1.45, + "learning_rate": 1.1050641487907474e-06, + "loss": 0.6836, + "step": 56476 + }, + { + "epoch": 1.45, + "learning_rate": 1.1050366314402354e-06, + "loss": 0.7637, + "step": 56477 + }, + { + "epoch": 1.45, + "learning_rate": 1.105009114009302e-06, + "loss": 0.6006, + "step": 56478 + }, + { + "epoch": 1.45, + "learning_rate": 1.1049815964979677e-06, + "loss": 0.668, + "step": 56479 + }, + { + "epoch": 1.45, + "learning_rate": 1.1049540789062538e-06, + "loss": 0.4856, + "step": 56480 + }, + { + "epoch": 1.45, + "learning_rate": 1.1049265612341816e-06, + "loss": 0.665, + "step": 56481 + }, + { + "epoch": 1.45, + "learning_rate": 1.1048990434817718e-06, + "loss": 0.5898, + "step": 56482 + }, + { + "epoch": 1.45, + "learning_rate": 1.1048715256490457e-06, + "loss": 0.5728, + "step": 56483 + }, + { + "epoch": 1.45, + "learning_rate": 1.104844007736024e-06, + "loss": 0.645, + "step": 56484 + }, + { + "epoch": 1.45, + "learning_rate": 1.1048164897427287e-06, + "loss": 0.6846, + "step": 56485 + }, + { + "epoch": 1.45, + "learning_rate": 1.1047889716691799e-06, + "loss": 0.6699, + "step": 56486 + }, + { + "epoch": 1.45, + "learning_rate": 1.1047614535153986e-06, + "loss": 0.7446, + "step": 56487 + }, + { + "epoch": 1.45, + "learning_rate": 1.1047339352814067e-06, + "loss": 0.645, + "step": 56488 + }, + { + "epoch": 1.45, + "learning_rate": 1.1047064169672246e-06, + "loss": 0.8428, + "step": 56489 + }, + { + "epoch": 1.45, + "learning_rate": 1.1046788985728739e-06, + "loss": 0.6172, + "step": 56490 + }, + { + "epoch": 1.45, + "learning_rate": 1.1046513800983755e-06, + "loss": 0.5469, + "step": 56491 + }, + { + "epoch": 1.45, + "learning_rate": 1.10462386154375e-06, + "loss": 0.6511, + "step": 56492 + }, + { + "epoch": 1.45, + "learning_rate": 1.1045963429090189e-06, + "loss": 0.8008, + "step": 56493 + }, + { + "epoch": 1.45, + "learning_rate": 1.1045688241942032e-06, + "loss": 0.667, + "step": 56494 + }, + { + "epoch": 1.45, + "learning_rate": 1.1045413053993237e-06, + "loss": 0.6187, + "step": 56495 + }, + { + "epoch": 1.45, + "learning_rate": 1.1045137865244025e-06, + "loss": 0.7109, + "step": 56496 + }, + { + "epoch": 1.45, + "learning_rate": 1.1044862675694592e-06, + "loss": 0.6216, + "step": 56497 + }, + { + "epoch": 1.45, + "learning_rate": 1.1044587485345157e-06, + "loss": 0.6528, + "step": 56498 + }, + { + "epoch": 1.45, + "learning_rate": 1.104431229419593e-06, + "loss": 0.5991, + "step": 56499 + }, + { + "epoch": 1.45, + "learning_rate": 1.1044037102247124e-06, + "loss": 0.7646, + "step": 56500 + }, + { + "epoch": 1.45, + "learning_rate": 1.1043761909498943e-06, + "loss": 0.6465, + "step": 56501 + }, + { + "epoch": 1.45, + "learning_rate": 1.1043486715951605e-06, + "loss": 0.5569, + "step": 56502 + }, + { + "epoch": 1.45, + "learning_rate": 1.1043211521605314e-06, + "loss": 0.6479, + "step": 56503 + }, + { + "epoch": 1.45, + "learning_rate": 1.1042936326460284e-06, + "loss": 0.7061, + "step": 56504 + }, + { + "epoch": 1.45, + "learning_rate": 1.1042661130516724e-06, + "loss": 0.626, + "step": 56505 + }, + { + "epoch": 1.45, + "learning_rate": 1.104238593377485e-06, + "loss": 0.5887, + "step": 56506 + }, + { + "epoch": 1.45, + "learning_rate": 1.104211073623487e-06, + "loss": 0.665, + "step": 56507 + }, + { + "epoch": 1.45, + "learning_rate": 1.104183553789699e-06, + "loss": 0.5913, + "step": 56508 + }, + { + "epoch": 1.45, + "learning_rate": 1.1041560338761425e-06, + "loss": 0.603, + "step": 56509 + }, + { + "epoch": 1.45, + "learning_rate": 1.1041285138828387e-06, + "loss": 0.6504, + "step": 56510 + }, + { + "epoch": 1.45, + "learning_rate": 1.1041009938098084e-06, + "loss": 0.7207, + "step": 56511 + }, + { + "epoch": 1.45, + "learning_rate": 1.1040734736570726e-06, + "loss": 0.5156, + "step": 56512 + }, + { + "epoch": 1.45, + "learning_rate": 1.1040459534246526e-06, + "loss": 0.7041, + "step": 56513 + }, + { + "epoch": 1.45, + "learning_rate": 1.1040184331125694e-06, + "loss": 0.7168, + "step": 56514 + }, + { + "epoch": 1.45, + "learning_rate": 1.1039909127208443e-06, + "loss": 0.6016, + "step": 56515 + }, + { + "epoch": 1.45, + "learning_rate": 1.103963392249498e-06, + "loss": 0.7021, + "step": 56516 + }, + { + "epoch": 1.45, + "learning_rate": 1.1039358716985518e-06, + "loss": 0.5471, + "step": 56517 + }, + { + "epoch": 1.45, + "learning_rate": 1.1039083510680263e-06, + "loss": 0.6567, + "step": 56518 + }, + { + "epoch": 1.45, + "learning_rate": 1.1038808303579435e-06, + "loss": 0.7568, + "step": 56519 + }, + { + "epoch": 1.45, + "learning_rate": 1.1038533095683234e-06, + "loss": 0.8018, + "step": 56520 + }, + { + "epoch": 1.45, + "learning_rate": 1.103825788699188e-06, + "loss": 0.4438, + "step": 56521 + }, + { + "epoch": 1.45, + "learning_rate": 1.1037982677505577e-06, + "loss": 0.6138, + "step": 56522 + }, + { + "epoch": 1.45, + "learning_rate": 1.103770746722454e-06, + "loss": 0.6147, + "step": 56523 + }, + { + "epoch": 1.45, + "learning_rate": 1.1037432256148978e-06, + "loss": 0.604, + "step": 56524 + }, + { + "epoch": 1.45, + "learning_rate": 1.10371570442791e-06, + "loss": 0.7559, + "step": 56525 + }, + { + "epoch": 1.45, + "learning_rate": 1.1036881831615122e-06, + "loss": 0.6504, + "step": 56526 + }, + { + "epoch": 1.45, + "learning_rate": 1.103660661815725e-06, + "loss": 0.6074, + "step": 56527 + }, + { + "epoch": 1.45, + "learning_rate": 1.1036331403905693e-06, + "loss": 0.7148, + "step": 56528 + }, + { + "epoch": 1.45, + "learning_rate": 1.1036056188860667e-06, + "loss": 0.6362, + "step": 56529 + }, + { + "epoch": 1.45, + "learning_rate": 1.1035780973022378e-06, + "loss": 0.6865, + "step": 56530 + }, + { + "epoch": 1.45, + "learning_rate": 1.1035505756391044e-06, + "loss": 0.5837, + "step": 56531 + }, + { + "epoch": 1.45, + "learning_rate": 1.1035230538966868e-06, + "loss": 0.7344, + "step": 56532 + }, + { + "epoch": 1.45, + "learning_rate": 1.1034955320750062e-06, + "loss": 0.71, + "step": 56533 + }, + { + "epoch": 1.45, + "learning_rate": 1.103468010174084e-06, + "loss": 0.4575, + "step": 56534 + }, + { + "epoch": 1.45, + "learning_rate": 1.1034404881939413e-06, + "loss": 0.5784, + "step": 56535 + }, + { + "epoch": 1.45, + "learning_rate": 1.103412966134599e-06, + "loss": 0.6333, + "step": 56536 + }, + { + "epoch": 1.45, + "learning_rate": 1.1033854439960776e-06, + "loss": 0.832, + "step": 56537 + }, + { + "epoch": 1.45, + "learning_rate": 1.1033579217783992e-06, + "loss": 0.5659, + "step": 56538 + }, + { + "epoch": 1.45, + "learning_rate": 1.1033303994815841e-06, + "loss": 0.7041, + "step": 56539 + }, + { + "epoch": 1.45, + "learning_rate": 1.1033028771056539e-06, + "loss": 0.6006, + "step": 56540 + }, + { + "epoch": 1.45, + "learning_rate": 1.1032753546506296e-06, + "loss": 0.5479, + "step": 56541 + }, + { + "epoch": 1.45, + "learning_rate": 1.1032478321165318e-06, + "loss": 0.7539, + "step": 56542 + }, + { + "epoch": 1.45, + "learning_rate": 1.103220309503382e-06, + "loss": 0.6562, + "step": 56543 + }, + { + "epoch": 1.45, + "learning_rate": 1.103192786811201e-06, + "loss": 0.6602, + "step": 56544 + }, + { + "epoch": 1.45, + "learning_rate": 1.1031652640400099e-06, + "loss": 0.4248, + "step": 56545 + }, + { + "epoch": 1.45, + "learning_rate": 1.1031377411898303e-06, + "loss": 0.6362, + "step": 56546 + }, + { + "epoch": 1.45, + "learning_rate": 1.1031102182606825e-06, + "loss": 0.7539, + "step": 56547 + }, + { + "epoch": 1.45, + "learning_rate": 1.1030826952525885e-06, + "loss": 0.8184, + "step": 56548 + }, + { + "epoch": 1.45, + "learning_rate": 1.1030551721655684e-06, + "loss": 0.6245, + "step": 56549 + }, + { + "epoch": 1.45, + "learning_rate": 1.1030276489996437e-06, + "loss": 0.6348, + "step": 56550 + }, + { + "epoch": 1.45, + "learning_rate": 1.1030001257548355e-06, + "loss": 0.5728, + "step": 56551 + }, + { + "epoch": 1.45, + "learning_rate": 1.102972602431165e-06, + "loss": 0.6831, + "step": 56552 + }, + { + "epoch": 1.45, + "learning_rate": 1.1029450790286528e-06, + "loss": 0.6719, + "step": 56553 + }, + { + "epoch": 1.45, + "learning_rate": 1.1029175555473204e-06, + "loss": 0.6768, + "step": 56554 + }, + { + "epoch": 1.45, + "learning_rate": 1.1028900319871887e-06, + "loss": 0.7285, + "step": 56555 + }, + { + "epoch": 1.45, + "learning_rate": 1.1028625083482792e-06, + "loss": 0.6777, + "step": 56556 + }, + { + "epoch": 1.45, + "learning_rate": 1.1028349846306123e-06, + "loss": 0.6387, + "step": 56557 + }, + { + "epoch": 1.45, + "learning_rate": 1.1028074608342093e-06, + "loss": 0.6328, + "step": 56558 + }, + { + "epoch": 1.45, + "learning_rate": 1.1027799369590915e-06, + "loss": 0.5278, + "step": 56559 + }, + { + "epoch": 1.45, + "learning_rate": 1.1027524130052799e-06, + "loss": 0.5601, + "step": 56560 + }, + { + "epoch": 1.45, + "learning_rate": 1.1027248889727956e-06, + "loss": 0.6846, + "step": 56561 + }, + { + "epoch": 1.45, + "learning_rate": 1.1026973648616593e-06, + "loss": 0.6277, + "step": 56562 + }, + { + "epoch": 1.45, + "learning_rate": 1.1026698406718927e-06, + "loss": 0.4536, + "step": 56563 + }, + { + "epoch": 1.45, + "learning_rate": 1.102642316403516e-06, + "loss": 0.5352, + "step": 56564 + }, + { + "epoch": 1.45, + "learning_rate": 1.1026147920565512e-06, + "loss": 0.8076, + "step": 56565 + }, + { + "epoch": 1.45, + "learning_rate": 1.102587267631019e-06, + "loss": 0.5332, + "step": 56566 + }, + { + "epoch": 1.45, + "learning_rate": 1.1025597431269402e-06, + "loss": 0.6172, + "step": 56567 + }, + { + "epoch": 1.45, + "learning_rate": 1.1025322185443362e-06, + "loss": 0.5342, + "step": 56568 + }, + { + "epoch": 1.45, + "learning_rate": 1.1025046938832282e-06, + "loss": 0.6729, + "step": 56569 + }, + { + "epoch": 1.45, + "learning_rate": 1.1024771691436366e-06, + "loss": 0.6685, + "step": 56570 + }, + { + "epoch": 1.45, + "learning_rate": 1.1024496443255835e-06, + "loss": 0.6455, + "step": 56571 + }, + { + "epoch": 1.45, + "learning_rate": 1.102422119429089e-06, + "loss": 0.458, + "step": 56572 + }, + { + "epoch": 1.45, + "learning_rate": 1.1023945944541747e-06, + "loss": 0.4507, + "step": 56573 + }, + { + "epoch": 1.45, + "learning_rate": 1.1023670694008616e-06, + "loss": 0.5264, + "step": 56574 + }, + { + "epoch": 1.45, + "learning_rate": 1.1023395442691707e-06, + "loss": 0.6709, + "step": 56575 + }, + { + "epoch": 1.45, + "learning_rate": 1.1023120190591232e-06, + "loss": 0.7988, + "step": 56576 + }, + { + "epoch": 1.45, + "learning_rate": 1.10228449377074e-06, + "loss": 0.6143, + "step": 56577 + }, + { + "epoch": 1.45, + "learning_rate": 1.1022569684040423e-06, + "loss": 0.6001, + "step": 56578 + }, + { + "epoch": 1.45, + "learning_rate": 1.102229442959051e-06, + "loss": 0.6233, + "step": 56579 + }, + { + "epoch": 1.45, + "learning_rate": 1.1022019174357877e-06, + "loss": 0.6689, + "step": 56580 + }, + { + "epoch": 1.45, + "learning_rate": 1.102174391834273e-06, + "loss": 0.3196, + "step": 56581 + }, + { + "epoch": 1.45, + "learning_rate": 1.102146866154528e-06, + "loss": 0.6592, + "step": 56582 + }, + { + "epoch": 1.45, + "learning_rate": 1.1021193403965737e-06, + "loss": 0.6851, + "step": 56583 + }, + { + "epoch": 1.45, + "learning_rate": 1.1020918145604313e-06, + "loss": 0.5137, + "step": 56584 + }, + { + "epoch": 1.45, + "learning_rate": 1.102064288646122e-06, + "loss": 0.6709, + "step": 56585 + }, + { + "epoch": 1.45, + "learning_rate": 1.102036762653667e-06, + "loss": 0.7402, + "step": 56586 + }, + { + "epoch": 1.45, + "learning_rate": 1.1020092365830867e-06, + "loss": 0.5933, + "step": 56587 + }, + { + "epoch": 1.45, + "learning_rate": 1.1019817104344027e-06, + "loss": 0.5391, + "step": 56588 + }, + { + "epoch": 1.45, + "learning_rate": 1.1019541842076362e-06, + "loss": 0.6177, + "step": 56589 + }, + { + "epoch": 1.45, + "learning_rate": 1.1019266579028082e-06, + "loss": 0.6763, + "step": 56590 + }, + { + "epoch": 1.45, + "learning_rate": 1.1018991315199392e-06, + "loss": 0.6611, + "step": 56591 + }, + { + "epoch": 1.45, + "learning_rate": 1.1018716050590511e-06, + "loss": 0.6963, + "step": 56592 + }, + { + "epoch": 1.45, + "learning_rate": 1.1018440785201642e-06, + "loss": 0.6162, + "step": 56593 + }, + { + "epoch": 1.45, + "learning_rate": 1.1018165519033003e-06, + "loss": 0.7451, + "step": 56594 + }, + { + "epoch": 1.45, + "learning_rate": 1.10178902520848e-06, + "loss": 0.6963, + "step": 56595 + }, + { + "epoch": 1.45, + "learning_rate": 1.1017614984357246e-06, + "loss": 0.483, + "step": 56596 + }, + { + "epoch": 1.45, + "learning_rate": 1.101733971585055e-06, + "loss": 0.6191, + "step": 56597 + }, + { + "epoch": 1.45, + "learning_rate": 1.1017064446564925e-06, + "loss": 0.6934, + "step": 56598 + }, + { + "epoch": 1.45, + "learning_rate": 1.101678917650058e-06, + "loss": 0.6914, + "step": 56599 + }, + { + "epoch": 1.45, + "learning_rate": 1.1016513905657727e-06, + "loss": 0.5852, + "step": 56600 + }, + { + "epoch": 1.45, + "learning_rate": 1.1016238634036576e-06, + "loss": 0.7051, + "step": 56601 + }, + { + "epoch": 1.45, + "learning_rate": 1.1015963361637334e-06, + "loss": 0.5098, + "step": 56602 + }, + { + "epoch": 1.45, + "learning_rate": 1.1015688088460221e-06, + "loss": 0.4705, + "step": 56603 + }, + { + "epoch": 1.45, + "learning_rate": 1.101541281450544e-06, + "loss": 0.4229, + "step": 56604 + }, + { + "epoch": 1.45, + "learning_rate": 1.1015137539773208e-06, + "loss": 0.666, + "step": 56605 + }, + { + "epoch": 1.45, + "learning_rate": 1.1014862264263724e-06, + "loss": 0.6196, + "step": 56606 + }, + { + "epoch": 1.45, + "learning_rate": 1.1014586987977213e-06, + "loss": 0.7593, + "step": 56607 + }, + { + "epoch": 1.45, + "learning_rate": 1.1014311710913875e-06, + "loss": 0.6187, + "step": 56608 + }, + { + "epoch": 1.45, + "learning_rate": 1.1014036433073928e-06, + "loss": 0.5039, + "step": 56609 + }, + { + "epoch": 1.45, + "learning_rate": 1.1013761154457579e-06, + "loss": 0.7217, + "step": 56610 + }, + { + "epoch": 1.45, + "learning_rate": 1.101348587506504e-06, + "loss": 0.748, + "step": 56611 + }, + { + "epoch": 1.45, + "learning_rate": 1.101321059489652e-06, + "loss": 0.6333, + "step": 56612 + }, + { + "epoch": 1.45, + "learning_rate": 1.1012935313952233e-06, + "loss": 0.6177, + "step": 56613 + }, + { + "epoch": 1.45, + "learning_rate": 1.1012660032232389e-06, + "loss": 0.7764, + "step": 56614 + }, + { + "epoch": 1.45, + "learning_rate": 1.1012384749737198e-06, + "loss": 0.561, + "step": 56615 + }, + { + "epoch": 1.45, + "learning_rate": 1.1012109466466868e-06, + "loss": 0.7354, + "step": 56616 + }, + { + "epoch": 1.45, + "learning_rate": 1.1011834182421613e-06, + "loss": 0.7598, + "step": 56617 + }, + { + "epoch": 1.45, + "learning_rate": 1.1011558897601643e-06, + "loss": 0.8389, + "step": 56618 + }, + { + "epoch": 1.45, + "learning_rate": 1.101128361200717e-06, + "loss": 0.8037, + "step": 56619 + }, + { + "epoch": 1.45, + "learning_rate": 1.1011008325638402e-06, + "loss": 0.5759, + "step": 56620 + }, + { + "epoch": 1.45, + "learning_rate": 1.1010733038495552e-06, + "loss": 0.6973, + "step": 56621 + }, + { + "epoch": 1.45, + "learning_rate": 1.101045775057883e-06, + "loss": 0.6167, + "step": 56622 + }, + { + "epoch": 1.45, + "learning_rate": 1.1010182461888446e-06, + "loss": 0.6406, + "step": 56623 + }, + { + "epoch": 1.45, + "learning_rate": 1.1009907172424615e-06, + "loss": 0.4915, + "step": 56624 + }, + { + "epoch": 1.45, + "learning_rate": 1.1009631882187543e-06, + "loss": 0.5762, + "step": 56625 + }, + { + "epoch": 1.45, + "learning_rate": 1.1009356591177441e-06, + "loss": 0.708, + "step": 56626 + }, + { + "epoch": 1.45, + "learning_rate": 1.1009081299394524e-06, + "loss": 0.4434, + "step": 56627 + }, + { + "epoch": 1.45, + "learning_rate": 1.1008806006838995e-06, + "loss": 0.6699, + "step": 56628 + }, + { + "epoch": 1.45, + "learning_rate": 1.1008530713511073e-06, + "loss": 0.5122, + "step": 56629 + }, + { + "epoch": 1.45, + "learning_rate": 1.1008255419410967e-06, + "loss": 0.6191, + "step": 56630 + }, + { + "epoch": 1.45, + "learning_rate": 1.1007980124538882e-06, + "loss": 0.5195, + "step": 56631 + }, + { + "epoch": 1.45, + "learning_rate": 1.1007704828895038e-06, + "loss": 0.6558, + "step": 56632 + }, + { + "epoch": 1.45, + "learning_rate": 1.1007429532479636e-06, + "loss": 0.4116, + "step": 56633 + }, + { + "epoch": 1.45, + "learning_rate": 1.1007154235292893e-06, + "loss": 0.5103, + "step": 56634 + }, + { + "epoch": 1.45, + "learning_rate": 1.100687893733502e-06, + "loss": 0.7344, + "step": 56635 + }, + { + "epoch": 1.45, + "learning_rate": 1.1006603638606225e-06, + "loss": 0.7012, + "step": 56636 + }, + { + "epoch": 1.45, + "learning_rate": 1.1006328339106719e-06, + "loss": 0.6414, + "step": 56637 + }, + { + "epoch": 1.45, + "learning_rate": 1.1006053038836713e-06, + "loss": 0.5527, + "step": 56638 + }, + { + "epoch": 1.45, + "learning_rate": 1.100577773779642e-06, + "loss": 0.7227, + "step": 56639 + }, + { + "epoch": 1.45, + "learning_rate": 1.1005502435986049e-06, + "loss": 0.4365, + "step": 56640 + }, + { + "epoch": 1.45, + "learning_rate": 1.1005227133405812e-06, + "loss": 0.6777, + "step": 56641 + }, + { + "epoch": 1.45, + "learning_rate": 1.1004951830055918e-06, + "loss": 0.6782, + "step": 56642 + }, + { + "epoch": 1.45, + "learning_rate": 1.1004676525936575e-06, + "loss": 0.2974, + "step": 56643 + }, + { + "epoch": 1.45, + "learning_rate": 1.1004401221048004e-06, + "loss": 0.5361, + "step": 56644 + }, + { + "epoch": 1.45, + "learning_rate": 1.1004125915390405e-06, + "loss": 0.5715, + "step": 56645 + }, + { + "epoch": 1.45, + "learning_rate": 1.1003850608963994e-06, + "loss": 0.752, + "step": 56646 + }, + { + "epoch": 1.45, + "learning_rate": 1.1003575301768981e-06, + "loss": 0.7012, + "step": 56647 + }, + { + "epoch": 1.45, + "learning_rate": 1.1003299993805575e-06, + "loss": 0.6572, + "step": 56648 + }, + { + "epoch": 1.45, + "learning_rate": 1.100302468507399e-06, + "loss": 0.5986, + "step": 56649 + }, + { + "epoch": 1.45, + "learning_rate": 1.1002749375574433e-06, + "loss": 0.707, + "step": 56650 + }, + { + "epoch": 1.45, + "learning_rate": 1.1002474065307122e-06, + "loss": 0.5713, + "step": 56651 + }, + { + "epoch": 1.45, + "learning_rate": 1.1002198754272257e-06, + "loss": 0.595, + "step": 56652 + }, + { + "epoch": 1.45, + "learning_rate": 1.1001923442470059e-06, + "loss": 0.6543, + "step": 56653 + }, + { + "epoch": 1.45, + "learning_rate": 1.100164812990073e-06, + "loss": 0.54, + "step": 56654 + }, + { + "epoch": 1.45, + "learning_rate": 1.100137281656449e-06, + "loss": 0.6484, + "step": 56655 + }, + { + "epoch": 1.45, + "learning_rate": 1.100109750246154e-06, + "loss": 0.5527, + "step": 56656 + }, + { + "epoch": 1.45, + "learning_rate": 1.1000822187592098e-06, + "loss": 0.7207, + "step": 56657 + }, + { + "epoch": 1.45, + "learning_rate": 1.1000546871956372e-06, + "loss": 0.7158, + "step": 56658 + }, + { + "epoch": 1.45, + "learning_rate": 1.1000271555554573e-06, + "loss": 0.7422, + "step": 56659 + }, + { + "epoch": 1.45, + "learning_rate": 1.0999996238386912e-06, + "loss": 0.6997, + "step": 56660 + }, + { + "epoch": 1.45, + "learning_rate": 1.0999720920453601e-06, + "loss": 0.6924, + "step": 56661 + }, + { + "epoch": 1.45, + "learning_rate": 1.0999445601754848e-06, + "loss": 0.5986, + "step": 56662 + }, + { + "epoch": 1.45, + "learning_rate": 1.0999170282290868e-06, + "loss": 0.6523, + "step": 56663 + }, + { + "epoch": 1.45, + "learning_rate": 1.0998894962061867e-06, + "loss": 0.6035, + "step": 56664 + }, + { + "epoch": 1.45, + "learning_rate": 1.099861964106806e-06, + "loss": 0.4531, + "step": 56665 + }, + { + "epoch": 1.45, + "learning_rate": 1.0998344319309653e-06, + "loss": 0.5991, + "step": 56666 + }, + { + "epoch": 1.45, + "learning_rate": 1.099806899678686e-06, + "loss": 0.6914, + "step": 56667 + }, + { + "epoch": 1.45, + "learning_rate": 1.0997793673499894e-06, + "loss": 0.3951, + "step": 56668 + }, + { + "epoch": 1.45, + "learning_rate": 1.099751834944896e-06, + "loss": 0.6123, + "step": 56669 + }, + { + "epoch": 1.45, + "learning_rate": 1.0997243024634277e-06, + "loss": 0.5977, + "step": 56670 + }, + { + "epoch": 1.45, + "learning_rate": 1.0996967699056045e-06, + "loss": 0.6592, + "step": 56671 + }, + { + "epoch": 1.45, + "learning_rate": 1.0996692372714486e-06, + "loss": 0.6436, + "step": 56672 + }, + { + "epoch": 1.45, + "learning_rate": 1.09964170456098e-06, + "loss": 0.7129, + "step": 56673 + }, + { + "epoch": 1.45, + "learning_rate": 1.0996141717742208e-06, + "loss": 0.7407, + "step": 56674 + }, + { + "epoch": 1.45, + "learning_rate": 1.0995866389111917e-06, + "loss": 0.6309, + "step": 56675 + }, + { + "epoch": 1.45, + "learning_rate": 1.0995591059719134e-06, + "loss": 0.5547, + "step": 56676 + }, + { + "epoch": 1.45, + "learning_rate": 1.0995315729564071e-06, + "loss": 0.6196, + "step": 56677 + }, + { + "epoch": 1.45, + "learning_rate": 1.0995040398646944e-06, + "loss": 0.7012, + "step": 56678 + }, + { + "epoch": 1.45, + "learning_rate": 1.0994765066967957e-06, + "loss": 0.6104, + "step": 56679 + }, + { + "epoch": 1.45, + "learning_rate": 1.0994489734527329e-06, + "loss": 0.5745, + "step": 56680 + }, + { + "epoch": 1.45, + "learning_rate": 1.0994214401325262e-06, + "loss": 0.5231, + "step": 56681 + }, + { + "epoch": 1.45, + "learning_rate": 1.0993939067361973e-06, + "loss": 0.5986, + "step": 56682 + }, + { + "epoch": 1.45, + "learning_rate": 1.0993663732637666e-06, + "loss": 0.5654, + "step": 56683 + }, + { + "epoch": 1.45, + "learning_rate": 1.0993388397152562e-06, + "loss": 0.6284, + "step": 56684 + }, + { + "epoch": 1.45, + "learning_rate": 1.0993113060906865e-06, + "loss": 0.7295, + "step": 56685 + }, + { + "epoch": 1.45, + "learning_rate": 1.0992837723900784e-06, + "loss": 0.6416, + "step": 56686 + }, + { + "epoch": 1.45, + "learning_rate": 1.0992562386134533e-06, + "loss": 0.8086, + "step": 56687 + }, + { + "epoch": 1.45, + "learning_rate": 1.0992287047608327e-06, + "loss": 0.6133, + "step": 56688 + }, + { + "epoch": 1.45, + "learning_rate": 1.0992011708322366e-06, + "loss": 0.8076, + "step": 56689 + }, + { + "epoch": 1.45, + "learning_rate": 1.0991736368276874e-06, + "loss": 0.6313, + "step": 56690 + }, + { + "epoch": 1.45, + "learning_rate": 1.0991461027472052e-06, + "loss": 0.6992, + "step": 56691 + }, + { + "epoch": 1.45, + "learning_rate": 1.099118568590811e-06, + "loss": 0.6836, + "step": 56692 + }, + { + "epoch": 1.45, + "learning_rate": 1.0990910343585269e-06, + "loss": 0.6104, + "step": 56693 + }, + { + "epoch": 1.45, + "learning_rate": 1.099063500050373e-06, + "loss": 0.6245, + "step": 56694 + }, + { + "epoch": 1.45, + "learning_rate": 1.099035965666371e-06, + "loss": 0.6108, + "step": 56695 + }, + { + "epoch": 1.45, + "learning_rate": 1.0990084312065415e-06, + "loss": 0.5784, + "step": 56696 + }, + { + "epoch": 1.45, + "learning_rate": 1.098980896670906e-06, + "loss": 0.6504, + "step": 56697 + }, + { + "epoch": 1.45, + "learning_rate": 1.098953362059485e-06, + "loss": 0.6094, + "step": 56698 + }, + { + "epoch": 1.45, + "learning_rate": 1.0989258273723004e-06, + "loss": 0.5684, + "step": 56699 + }, + { + "epoch": 1.45, + "learning_rate": 1.0988982926093726e-06, + "loss": 0.7168, + "step": 56700 + }, + { + "epoch": 1.45, + "learning_rate": 1.098870757770723e-06, + "loss": 0.5254, + "step": 56701 + }, + { + "epoch": 1.45, + "learning_rate": 1.0988432228563724e-06, + "loss": 0.7627, + "step": 56702 + }, + { + "epoch": 1.45, + "learning_rate": 1.0988156878663423e-06, + "loss": 0.5981, + "step": 56703 + }, + { + "epoch": 1.45, + "learning_rate": 1.0987881528006534e-06, + "loss": 0.6602, + "step": 56704 + }, + { + "epoch": 1.45, + "learning_rate": 1.0987606176593274e-06, + "loss": 0.7236, + "step": 56705 + }, + { + "epoch": 1.45, + "learning_rate": 1.0987330824423847e-06, + "loss": 0.8428, + "step": 56706 + }, + { + "epoch": 1.45, + "learning_rate": 1.0987055471498463e-06, + "loss": 0.4424, + "step": 56707 + }, + { + "epoch": 1.45, + "learning_rate": 1.0986780117817338e-06, + "loss": 0.8184, + "step": 56708 + }, + { + "epoch": 1.45, + "learning_rate": 1.098650476338068e-06, + "loss": 0.6484, + "step": 56709 + }, + { + "epoch": 1.45, + "learning_rate": 1.0986229408188705e-06, + "loss": 0.4733, + "step": 56710 + }, + { + "epoch": 1.45, + "learning_rate": 1.0985954052241615e-06, + "loss": 0.6626, + "step": 56711 + }, + { + "epoch": 1.45, + "learning_rate": 1.0985678695539627e-06, + "loss": 0.6514, + "step": 56712 + }, + { + "epoch": 1.45, + "learning_rate": 1.0985403338082948e-06, + "loss": 0.7246, + "step": 56713 + }, + { + "epoch": 1.45, + "learning_rate": 1.0985127979871793e-06, + "loss": 0.5447, + "step": 56714 + }, + { + "epoch": 1.45, + "learning_rate": 1.0984852620906372e-06, + "loss": 0.5869, + "step": 56715 + }, + { + "epoch": 1.45, + "learning_rate": 1.0984577261186893e-06, + "loss": 0.7363, + "step": 56716 + }, + { + "epoch": 1.45, + "learning_rate": 1.0984301900713568e-06, + "loss": 0.4236, + "step": 56717 + }, + { + "epoch": 1.45, + "learning_rate": 1.0984026539486612e-06, + "loss": 0.7334, + "step": 56718 + }, + { + "epoch": 1.45, + "learning_rate": 1.0983751177506224e-06, + "loss": 0.7065, + "step": 56719 + }, + { + "epoch": 1.45, + "learning_rate": 1.098347581477263e-06, + "loss": 0.6074, + "step": 56720 + }, + { + "epoch": 1.45, + "learning_rate": 1.0983200451286032e-06, + "loss": 0.605, + "step": 56721 + }, + { + "epoch": 1.45, + "learning_rate": 1.0982925087046644e-06, + "loss": 0.5889, + "step": 56722 + }, + { + "epoch": 1.45, + "learning_rate": 1.0982649722054672e-06, + "loss": 0.7549, + "step": 56723 + }, + { + "epoch": 1.45, + "learning_rate": 1.0982374356310333e-06, + "loss": 0.7979, + "step": 56724 + }, + { + "epoch": 1.45, + "learning_rate": 1.0982098989813834e-06, + "loss": 0.6592, + "step": 56725 + }, + { + "epoch": 1.45, + "learning_rate": 1.0981823622565389e-06, + "loss": 0.6992, + "step": 56726 + }, + { + "epoch": 1.45, + "learning_rate": 1.0981548254565205e-06, + "loss": 0.8091, + "step": 56727 + }, + { + "epoch": 1.45, + "learning_rate": 1.0981272885813494e-06, + "loss": 0.5894, + "step": 56728 + }, + { + "epoch": 1.45, + "learning_rate": 1.0980997516310467e-06, + "loss": 0.7158, + "step": 56729 + }, + { + "epoch": 1.45, + "learning_rate": 1.0980722146056338e-06, + "loss": 0.7471, + "step": 56730 + }, + { + "epoch": 1.45, + "learning_rate": 1.0980446775051314e-06, + "loss": 0.5647, + "step": 56731 + }, + { + "epoch": 1.45, + "learning_rate": 1.0980171403295609e-06, + "loss": 0.6719, + "step": 56732 + }, + { + "epoch": 1.45, + "learning_rate": 1.0979896030789426e-06, + "loss": 0.5535, + "step": 56733 + }, + { + "epoch": 1.45, + "learning_rate": 1.0979620657532986e-06, + "loss": 0.5576, + "step": 56734 + }, + { + "epoch": 1.45, + "learning_rate": 1.0979345283526495e-06, + "loss": 0.5015, + "step": 56735 + }, + { + "epoch": 1.45, + "learning_rate": 1.0979069908770163e-06, + "loss": 0.6304, + "step": 56736 + }, + { + "epoch": 1.45, + "learning_rate": 1.0978794533264205e-06, + "loss": 0.6019, + "step": 56737 + }, + { + "epoch": 1.45, + "learning_rate": 1.0978519157008826e-06, + "loss": 0.4805, + "step": 56738 + }, + { + "epoch": 1.45, + "learning_rate": 1.097824378000424e-06, + "loss": 0.6025, + "step": 56739 + }, + { + "epoch": 1.45, + "learning_rate": 1.0977968402250658e-06, + "loss": 0.7637, + "step": 56740 + }, + { + "epoch": 1.45, + "learning_rate": 1.0977693023748294e-06, + "loss": 0.8003, + "step": 56741 + }, + { + "epoch": 1.45, + "learning_rate": 1.097741764449735e-06, + "loss": 0.8115, + "step": 56742 + }, + { + "epoch": 1.45, + "learning_rate": 1.0977142264498048e-06, + "loss": 0.7285, + "step": 56743 + }, + { + "epoch": 1.45, + "learning_rate": 1.0976866883750589e-06, + "loss": 0.749, + "step": 56744 + }, + { + "epoch": 1.45, + "learning_rate": 1.097659150225519e-06, + "loss": 0.8984, + "step": 56745 + }, + { + "epoch": 1.45, + "learning_rate": 1.097631612001206e-06, + "loss": 0.5142, + "step": 56746 + }, + { + "epoch": 1.45, + "learning_rate": 1.097604073702141e-06, + "loss": 0.6216, + "step": 56747 + }, + { + "epoch": 1.45, + "learning_rate": 1.0975765353283447e-06, + "loss": 0.5035, + "step": 56748 + }, + { + "epoch": 1.45, + "learning_rate": 1.0975489968798387e-06, + "loss": 0.6621, + "step": 56749 + }, + { + "epoch": 1.45, + "learning_rate": 1.0975214583566438e-06, + "loss": 0.5767, + "step": 56750 + }, + { + "epoch": 1.45, + "learning_rate": 1.0974939197587816e-06, + "loss": 0.6211, + "step": 56751 + }, + { + "epoch": 1.45, + "learning_rate": 1.0974663810862724e-06, + "loss": 0.6016, + "step": 56752 + }, + { + "epoch": 1.45, + "learning_rate": 1.097438842339138e-06, + "loss": 0.5576, + "step": 56753 + }, + { + "epoch": 1.45, + "learning_rate": 1.0974113035173987e-06, + "loss": 0.5081, + "step": 56754 + }, + { + "epoch": 1.45, + "learning_rate": 1.0973837646210764e-06, + "loss": 0.4861, + "step": 56755 + }, + { + "epoch": 1.45, + "learning_rate": 1.0973562256501918e-06, + "loss": 0.6514, + "step": 56756 + }, + { + "epoch": 1.45, + "learning_rate": 1.0973286866047658e-06, + "loss": 0.5967, + "step": 56757 + }, + { + "epoch": 1.45, + "learning_rate": 1.09730114748482e-06, + "loss": 0.5308, + "step": 56758 + }, + { + "epoch": 1.45, + "learning_rate": 1.0972736082903748e-06, + "loss": 0.6289, + "step": 56759 + }, + { + "epoch": 1.45, + "learning_rate": 1.0972460690214522e-06, + "loss": 0.751, + "step": 56760 + }, + { + "epoch": 1.45, + "learning_rate": 1.0972185296780724e-06, + "loss": 0.665, + "step": 56761 + }, + { + "epoch": 1.45, + "learning_rate": 1.097190990260257e-06, + "loss": 0.7583, + "step": 56762 + }, + { + "epoch": 1.45, + "learning_rate": 1.0971634507680268e-06, + "loss": 0.6885, + "step": 56763 + }, + { + "epoch": 1.45, + "learning_rate": 1.0971359112014028e-06, + "loss": 0.5957, + "step": 56764 + }, + { + "epoch": 1.45, + "learning_rate": 1.0971083715604068e-06, + "loss": 0.6855, + "step": 56765 + }, + { + "epoch": 1.45, + "learning_rate": 1.0970808318450592e-06, + "loss": 0.9736, + "step": 56766 + }, + { + "epoch": 1.45, + "learning_rate": 1.0970532920553812e-06, + "loss": 0.6663, + "step": 56767 + }, + { + "epoch": 1.45, + "learning_rate": 1.097025752191394e-06, + "loss": 0.7373, + "step": 56768 + }, + { + "epoch": 1.46, + "learning_rate": 1.0969982122531186e-06, + "loss": 0.7295, + "step": 56769 + }, + { + "epoch": 1.46, + "learning_rate": 1.0969706722405762e-06, + "loss": 0.6836, + "step": 56770 + }, + { + "epoch": 1.46, + "learning_rate": 1.0969431321537877e-06, + "loss": 0.7231, + "step": 56771 + }, + { + "epoch": 1.46, + "learning_rate": 1.0969155919927744e-06, + "loss": 0.5112, + "step": 56772 + }, + { + "epoch": 1.46, + "learning_rate": 1.0968880517575573e-06, + "loss": 0.6279, + "step": 56773 + }, + { + "epoch": 1.46, + "learning_rate": 1.0968605114481573e-06, + "loss": 0.6284, + "step": 56774 + }, + { + "epoch": 1.46, + "learning_rate": 1.0968329710645959e-06, + "loss": 0.5999, + "step": 56775 + }, + { + "epoch": 1.46, + "learning_rate": 1.0968054306068936e-06, + "loss": 0.6533, + "step": 56776 + }, + { + "epoch": 1.46, + "learning_rate": 1.0967778900750722e-06, + "loss": 0.665, + "step": 56777 + }, + { + "epoch": 1.46, + "learning_rate": 1.0967503494691523e-06, + "loss": 0.7852, + "step": 56778 + }, + { + "epoch": 1.46, + "learning_rate": 1.096722808789155e-06, + "loss": 0.543, + "step": 56779 + }, + { + "epoch": 1.46, + "learning_rate": 1.0966952680351017e-06, + "loss": 0.583, + "step": 56780 + }, + { + "epoch": 1.46, + "learning_rate": 1.096667727207013e-06, + "loss": 0.7451, + "step": 56781 + }, + { + "epoch": 1.46, + "learning_rate": 1.0966401863049104e-06, + "loss": 0.6592, + "step": 56782 + }, + { + "epoch": 1.46, + "learning_rate": 1.0966126453288148e-06, + "loss": 0.4889, + "step": 56783 + }, + { + "epoch": 1.46, + "learning_rate": 1.0965851042787475e-06, + "loss": 0.5464, + "step": 56784 + }, + { + "epoch": 1.46, + "learning_rate": 1.0965575631547298e-06, + "loss": 0.6841, + "step": 56785 + }, + { + "epoch": 1.46, + "learning_rate": 1.0965300219567817e-06, + "loss": 0.4351, + "step": 56786 + }, + { + "epoch": 1.46, + "learning_rate": 1.0965024806849251e-06, + "loss": 0.644, + "step": 56787 + }, + { + "epoch": 1.46, + "learning_rate": 1.0964749393391813e-06, + "loss": 0.7676, + "step": 56788 + }, + { + "epoch": 1.46, + "learning_rate": 1.0964473979195708e-06, + "loss": 0.6128, + "step": 56789 + }, + { + "epoch": 1.46, + "learning_rate": 1.0964198564261152e-06, + "loss": 0.6831, + "step": 56790 + }, + { + "epoch": 1.46, + "learning_rate": 1.0963923148588351e-06, + "loss": 0.6558, + "step": 56791 + }, + { + "epoch": 1.46, + "learning_rate": 1.096364773217752e-06, + "loss": 0.626, + "step": 56792 + }, + { + "epoch": 1.46, + "learning_rate": 1.096337231502887e-06, + "loss": 0.7285, + "step": 56793 + }, + { + "epoch": 1.46, + "learning_rate": 1.0963096897142606e-06, + "loss": 0.6313, + "step": 56794 + }, + { + "epoch": 1.46, + "learning_rate": 1.0962821478518946e-06, + "loss": 0.511, + "step": 56795 + }, + { + "epoch": 1.46, + "learning_rate": 1.0962546059158097e-06, + "loss": 0.7656, + "step": 56796 + }, + { + "epoch": 1.46, + "learning_rate": 1.096227063906027e-06, + "loss": 0.6699, + "step": 56797 + }, + { + "epoch": 1.46, + "learning_rate": 1.0961995218225677e-06, + "loss": 0.6885, + "step": 56798 + }, + { + "epoch": 1.46, + "learning_rate": 1.0961719796654529e-06, + "loss": 0.5815, + "step": 56799 + }, + { + "epoch": 1.46, + "learning_rate": 1.0961444374347038e-06, + "loss": 0.626, + "step": 56800 + }, + { + "epoch": 1.46, + "learning_rate": 1.096116895130341e-06, + "loss": 0.5811, + "step": 56801 + }, + { + "epoch": 1.46, + "learning_rate": 1.096089352752386e-06, + "loss": 0.4661, + "step": 56802 + }, + { + "epoch": 1.46, + "learning_rate": 1.0960618103008599e-06, + "loss": 0.707, + "step": 56803 + }, + { + "epoch": 1.46, + "learning_rate": 1.0960342677757836e-06, + "loss": 0.6045, + "step": 56804 + }, + { + "epoch": 1.46, + "learning_rate": 1.0960067251771782e-06, + "loss": 0.8018, + "step": 56805 + }, + { + "epoch": 1.46, + "learning_rate": 1.0959791825050653e-06, + "loss": 0.5312, + "step": 56806 + }, + { + "epoch": 1.46, + "learning_rate": 1.095951639759465e-06, + "loss": 0.5903, + "step": 56807 + }, + { + "epoch": 1.46, + "learning_rate": 1.0959240969403994e-06, + "loss": 0.5641, + "step": 56808 + }, + { + "epoch": 1.46, + "learning_rate": 1.0958965540478887e-06, + "loss": 0.6401, + "step": 56809 + }, + { + "epoch": 1.46, + "learning_rate": 1.0958690110819548e-06, + "loss": 0.6313, + "step": 56810 + }, + { + "epoch": 1.46, + "learning_rate": 1.0958414680426183e-06, + "loss": 0.709, + "step": 56811 + }, + { + "epoch": 1.46, + "learning_rate": 1.0958139249299004e-06, + "loss": 0.5229, + "step": 56812 + }, + { + "epoch": 1.46, + "learning_rate": 1.0957863817438218e-06, + "loss": 0.6099, + "step": 56813 + }, + { + "epoch": 1.46, + "learning_rate": 1.0957588384844043e-06, + "loss": 0.7412, + "step": 56814 + }, + { + "epoch": 1.46, + "learning_rate": 1.095731295151669e-06, + "loss": 0.4451, + "step": 56815 + }, + { + "epoch": 1.46, + "learning_rate": 1.0957037517456362e-06, + "loss": 0.7109, + "step": 56816 + }, + { + "epoch": 1.46, + "learning_rate": 1.0956762082663273e-06, + "loss": 0.4841, + "step": 56817 + }, + { + "epoch": 1.46, + "learning_rate": 1.095648664713764e-06, + "loss": 0.6768, + "step": 56818 + }, + { + "epoch": 1.46, + "learning_rate": 1.0956211210879665e-06, + "loss": 0.5889, + "step": 56819 + }, + { + "epoch": 1.46, + "learning_rate": 1.0955935773889565e-06, + "loss": 0.7236, + "step": 56820 + }, + { + "epoch": 1.46, + "learning_rate": 1.0955660336167548e-06, + "loss": 0.6562, + "step": 56821 + }, + { + "epoch": 1.46, + "learning_rate": 1.0955384897713826e-06, + "loss": 0.7305, + "step": 56822 + }, + { + "epoch": 1.46, + "learning_rate": 1.095510945852861e-06, + "loss": 0.4229, + "step": 56823 + }, + { + "epoch": 1.46, + "learning_rate": 1.0954834018612112e-06, + "loss": 0.5901, + "step": 56824 + }, + { + "epoch": 1.46, + "learning_rate": 1.095455857796454e-06, + "loss": 0.708, + "step": 56825 + }, + { + "epoch": 1.46, + "learning_rate": 1.0954283136586107e-06, + "loss": 0.6211, + "step": 56826 + }, + { + "epoch": 1.46, + "learning_rate": 1.0954007694477023e-06, + "loss": 0.5664, + "step": 56827 + }, + { + "epoch": 1.46, + "learning_rate": 1.0953732251637498e-06, + "loss": 0.5469, + "step": 56828 + }, + { + "epoch": 1.46, + "learning_rate": 1.0953456808067748e-06, + "loss": 0.6465, + "step": 56829 + }, + { + "epoch": 1.46, + "learning_rate": 1.0953181363767976e-06, + "loss": 0.6187, + "step": 56830 + }, + { + "epoch": 1.46, + "learning_rate": 1.09529059187384e-06, + "loss": 0.6455, + "step": 56831 + }, + { + "epoch": 1.46, + "learning_rate": 1.0952630472979223e-06, + "loss": 0.7529, + "step": 56832 + }, + { + "epoch": 1.46, + "learning_rate": 1.0952355026490665e-06, + "loss": 0.6929, + "step": 56833 + }, + { + "epoch": 1.46, + "learning_rate": 1.0952079579272928e-06, + "loss": 0.6699, + "step": 56834 + }, + { + "epoch": 1.46, + "learning_rate": 1.0951804131326234e-06, + "loss": 0.48, + "step": 56835 + }, + { + "epoch": 1.46, + "learning_rate": 1.0951528682650784e-06, + "loss": 0.6992, + "step": 56836 + }, + { + "epoch": 1.46, + "learning_rate": 1.0951253233246791e-06, + "loss": 0.7231, + "step": 56837 + }, + { + "epoch": 1.46, + "learning_rate": 1.0950977783114467e-06, + "loss": 0.5801, + "step": 56838 + }, + { + "epoch": 1.46, + "learning_rate": 1.0950702332254025e-06, + "loss": 0.5168, + "step": 56839 + }, + { + "epoch": 1.46, + "learning_rate": 1.0950426880665672e-06, + "loss": 0.6104, + "step": 56840 + }, + { + "epoch": 1.46, + "learning_rate": 1.0950151428349625e-06, + "loss": 0.667, + "step": 56841 + }, + { + "epoch": 1.46, + "learning_rate": 1.0949875975306087e-06, + "loss": 0.4958, + "step": 56842 + }, + { + "epoch": 1.46, + "learning_rate": 1.0949600521535273e-06, + "loss": 0.3528, + "step": 56843 + }, + { + "epoch": 1.46, + "learning_rate": 1.0949325067037392e-06, + "loss": 0.6294, + "step": 56844 + }, + { + "epoch": 1.46, + "learning_rate": 1.0949049611812659e-06, + "loss": 0.6289, + "step": 56845 + }, + { + "epoch": 1.46, + "learning_rate": 1.0948774155861282e-06, + "loss": 0.4341, + "step": 56846 + }, + { + "epoch": 1.46, + "learning_rate": 1.0948498699183472e-06, + "loss": 0.6816, + "step": 56847 + }, + { + "epoch": 1.46, + "learning_rate": 1.094822324177944e-06, + "loss": 0.9326, + "step": 56848 + }, + { + "epoch": 1.46, + "learning_rate": 1.0947947783649397e-06, + "loss": 0.6523, + "step": 56849 + }, + { + "epoch": 1.46, + "learning_rate": 1.0947672324793554e-06, + "loss": 0.6465, + "step": 56850 + }, + { + "epoch": 1.46, + "learning_rate": 1.0947396865212125e-06, + "loss": 0.7236, + "step": 56851 + }, + { + "epoch": 1.46, + "learning_rate": 1.0947121404905313e-06, + "loss": 0.6719, + "step": 56852 + }, + { + "epoch": 1.46, + "learning_rate": 1.0946845943873334e-06, + "loss": 0.6396, + "step": 56853 + }, + { + "epoch": 1.46, + "learning_rate": 1.0946570482116402e-06, + "loss": 0.6831, + "step": 56854 + }, + { + "epoch": 1.46, + "learning_rate": 1.0946295019634723e-06, + "loss": 0.6821, + "step": 56855 + }, + { + "epoch": 1.46, + "learning_rate": 1.0946019556428509e-06, + "loss": 0.7197, + "step": 56856 + }, + { + "epoch": 1.46, + "learning_rate": 1.094574409249797e-06, + "loss": 0.6436, + "step": 56857 + }, + { + "epoch": 1.46, + "learning_rate": 1.0945468627843322e-06, + "loss": 0.8809, + "step": 56858 + }, + { + "epoch": 1.46, + "learning_rate": 1.0945193162464767e-06, + "loss": 0.5054, + "step": 56859 + }, + { + "epoch": 1.46, + "learning_rate": 1.0944917696362528e-06, + "loss": 0.6616, + "step": 56860 + }, + { + "epoch": 1.46, + "learning_rate": 1.0944642229536802e-06, + "loss": 0.4873, + "step": 56861 + }, + { + "epoch": 1.46, + "learning_rate": 1.0944366761987812e-06, + "loss": 0.7012, + "step": 56862 + }, + { + "epoch": 1.46, + "learning_rate": 1.0944091293715758e-06, + "loss": 0.6079, + "step": 56863 + }, + { + "epoch": 1.46, + "learning_rate": 1.0943815824720861e-06, + "loss": 0.6855, + "step": 56864 + }, + { + "epoch": 1.46, + "learning_rate": 1.094354035500333e-06, + "loss": 0.6758, + "step": 56865 + }, + { + "epoch": 1.46, + "learning_rate": 1.0943264884563367e-06, + "loss": 0.4119, + "step": 56866 + }, + { + "epoch": 1.46, + "learning_rate": 1.0942989413401194e-06, + "loss": 0.5295, + "step": 56867 + }, + { + "epoch": 1.46, + "learning_rate": 1.0942713941517017e-06, + "loss": 0.6846, + "step": 56868 + }, + { + "epoch": 1.46, + "learning_rate": 1.0942438468911043e-06, + "loss": 0.6387, + "step": 56869 + }, + { + "epoch": 1.46, + "learning_rate": 1.0942162995583493e-06, + "loss": 0.5229, + "step": 56870 + }, + { + "epoch": 1.46, + "learning_rate": 1.0941887521534569e-06, + "loss": 0.7119, + "step": 56871 + }, + { + "epoch": 1.46, + "learning_rate": 1.0941612046764485e-06, + "loss": 0.6504, + "step": 56872 + }, + { + "epoch": 1.46, + "learning_rate": 1.0941336571273453e-06, + "loss": 0.3577, + "step": 56873 + }, + { + "epoch": 1.46, + "learning_rate": 1.0941061095061681e-06, + "loss": 0.5127, + "step": 56874 + }, + { + "epoch": 1.46, + "learning_rate": 1.0940785618129387e-06, + "loss": 0.7275, + "step": 56875 + }, + { + "epoch": 1.46, + "learning_rate": 1.0940510140476772e-06, + "loss": 0.6113, + "step": 56876 + }, + { + "epoch": 1.46, + "learning_rate": 1.0940234662104053e-06, + "loss": 0.624, + "step": 56877 + }, + { + "epoch": 1.46, + "learning_rate": 1.0939959183011438e-06, + "loss": 0.4521, + "step": 56878 + }, + { + "epoch": 1.46, + "learning_rate": 1.093968370319914e-06, + "loss": 0.5913, + "step": 56879 + }, + { + "epoch": 1.46, + "learning_rate": 1.0939408222667373e-06, + "loss": 0.5835, + "step": 56880 + }, + { + "epoch": 1.46, + "learning_rate": 1.0939132741416342e-06, + "loss": 0.6245, + "step": 56881 + }, + { + "epoch": 1.46, + "learning_rate": 1.0938857259446258e-06, + "loss": 0.4857, + "step": 56882 + }, + { + "epoch": 1.46, + "learning_rate": 1.0938581776757337e-06, + "loss": 0.5073, + "step": 56883 + }, + { + "epoch": 1.46, + "learning_rate": 1.0938306293349785e-06, + "loss": 0.5234, + "step": 56884 + }, + { + "epoch": 1.46, + "learning_rate": 1.0938030809223818e-06, + "loss": 0.7324, + "step": 56885 + }, + { + "epoch": 1.46, + "learning_rate": 1.093775532437964e-06, + "loss": 0.752, + "step": 56886 + }, + { + "epoch": 1.46, + "learning_rate": 1.093747983881747e-06, + "loss": 0.6111, + "step": 56887 + }, + { + "epoch": 1.46, + "learning_rate": 1.093720435253751e-06, + "loss": 0.6846, + "step": 56888 + }, + { + "epoch": 1.46, + "learning_rate": 1.093692886553998e-06, + "loss": 0.5632, + "step": 56889 + }, + { + "epoch": 1.46, + "learning_rate": 1.0936653377825085e-06, + "loss": 0.7227, + "step": 56890 + }, + { + "epoch": 1.46, + "learning_rate": 1.0936377889393035e-06, + "loss": 0.6533, + "step": 56891 + }, + { + "epoch": 1.46, + "learning_rate": 1.0936102400244048e-06, + "loss": 0.5403, + "step": 56892 + }, + { + "epoch": 1.46, + "learning_rate": 1.0935826910378325e-06, + "loss": 0.5364, + "step": 56893 + }, + { + "epoch": 1.46, + "learning_rate": 1.0935551419796089e-06, + "loss": 0.7041, + "step": 56894 + }, + { + "epoch": 1.46, + "learning_rate": 1.093527592849754e-06, + "loss": 0.4595, + "step": 56895 + }, + { + "epoch": 1.46, + "learning_rate": 1.0935000436482894e-06, + "loss": 0.5249, + "step": 56896 + }, + { + "epoch": 1.46, + "learning_rate": 1.0934724943752362e-06, + "loss": 0.6069, + "step": 56897 + }, + { + "epoch": 1.46, + "learning_rate": 1.0934449450306154e-06, + "loss": 0.4019, + "step": 56898 + }, + { + "epoch": 1.46, + "learning_rate": 1.0934173956144482e-06, + "loss": 0.7041, + "step": 56899 + }, + { + "epoch": 1.46, + "learning_rate": 1.0933898461267555e-06, + "loss": 0.5117, + "step": 56900 + }, + { + "epoch": 1.46, + "learning_rate": 1.0933622965675582e-06, + "loss": 0.7222, + "step": 56901 + }, + { + "epoch": 1.46, + "learning_rate": 1.0933347469368782e-06, + "loss": 0.7471, + "step": 56902 + }, + { + "epoch": 1.46, + "learning_rate": 1.0933071972347354e-06, + "loss": 0.7368, + "step": 56903 + }, + { + "epoch": 1.46, + "learning_rate": 1.0932796474611522e-06, + "loss": 0.6733, + "step": 56904 + }, + { + "epoch": 1.46, + "learning_rate": 1.0932520976161489e-06, + "loss": 0.502, + "step": 56905 + }, + { + "epoch": 1.46, + "learning_rate": 1.0932245476997468e-06, + "loss": 0.6807, + "step": 56906 + }, + { + "epoch": 1.46, + "learning_rate": 1.0931969977119665e-06, + "loss": 0.5605, + "step": 56907 + }, + { + "epoch": 1.46, + "learning_rate": 1.09316944765283e-06, + "loss": 0.6445, + "step": 56908 + }, + { + "epoch": 1.46, + "learning_rate": 1.093141897522358e-06, + "loss": 0.7324, + "step": 56909 + }, + { + "epoch": 1.46, + "learning_rate": 1.0931143473205713e-06, + "loss": 0.5645, + "step": 56910 + }, + { + "epoch": 1.46, + "learning_rate": 1.0930867970474913e-06, + "loss": 0.8154, + "step": 56911 + }, + { + "epoch": 1.46, + "learning_rate": 1.0930592467031387e-06, + "loss": 0.6323, + "step": 56912 + }, + { + "epoch": 1.46, + "learning_rate": 1.0930316962875354e-06, + "loss": 0.5229, + "step": 56913 + }, + { + "epoch": 1.46, + "learning_rate": 1.093004145800702e-06, + "loss": 0.5498, + "step": 56914 + }, + { + "epoch": 1.46, + "learning_rate": 1.0929765952426596e-06, + "loss": 0.3368, + "step": 56915 + }, + { + "epoch": 1.46, + "learning_rate": 1.0929490446134289e-06, + "loss": 0.6172, + "step": 56916 + }, + { + "epoch": 1.46, + "learning_rate": 1.0929214939130315e-06, + "loss": 0.7734, + "step": 56917 + }, + { + "epoch": 1.46, + "learning_rate": 1.0928939431414885e-06, + "loss": 0.6707, + "step": 56918 + }, + { + "epoch": 1.46, + "learning_rate": 1.092866392298821e-06, + "loss": 0.6577, + "step": 56919 + }, + { + "epoch": 1.46, + "learning_rate": 1.0928388413850499e-06, + "loss": 0.6611, + "step": 56920 + }, + { + "epoch": 1.46, + "learning_rate": 1.0928112904001962e-06, + "loss": 0.5918, + "step": 56921 + }, + { + "epoch": 1.46, + "learning_rate": 1.0927837393442811e-06, + "loss": 0.7812, + "step": 56922 + }, + { + "epoch": 1.46, + "learning_rate": 1.0927561882173262e-06, + "loss": 0.7461, + "step": 56923 + }, + { + "epoch": 1.46, + "learning_rate": 1.0927286370193521e-06, + "loss": 0.7314, + "step": 56924 + }, + { + "epoch": 1.46, + "learning_rate": 1.0927010857503797e-06, + "loss": 0.6174, + "step": 56925 + }, + { + "epoch": 1.46, + "learning_rate": 1.09267353441043e-06, + "loss": 0.6221, + "step": 56926 + }, + { + "epoch": 1.46, + "learning_rate": 1.0926459829995252e-06, + "loss": 0.8174, + "step": 56927 + }, + { + "epoch": 1.46, + "learning_rate": 1.092618431517685e-06, + "loss": 0.7607, + "step": 56928 + }, + { + "epoch": 1.46, + "learning_rate": 1.0925908799649314e-06, + "loss": 0.6069, + "step": 56929 + }, + { + "epoch": 1.46, + "learning_rate": 1.0925633283412851e-06, + "loss": 0.6968, + "step": 56930 + }, + { + "epoch": 1.46, + "learning_rate": 1.0925357766467676e-06, + "loss": 0.7554, + "step": 56931 + }, + { + "epoch": 1.46, + "learning_rate": 1.0925082248813995e-06, + "loss": 0.8115, + "step": 56932 + }, + { + "epoch": 1.46, + "learning_rate": 1.0924806730452021e-06, + "loss": 0.5391, + "step": 56933 + }, + { + "epoch": 1.46, + "learning_rate": 1.0924531211381966e-06, + "loss": 0.6924, + "step": 56934 + }, + { + "epoch": 1.46, + "learning_rate": 1.092425569160404e-06, + "loss": 0.667, + "step": 56935 + }, + { + "epoch": 1.46, + "learning_rate": 1.0923980171118452e-06, + "loss": 0.6748, + "step": 56936 + }, + { + "epoch": 1.46, + "learning_rate": 1.0923704649925415e-06, + "loss": 0.707, + "step": 56937 + }, + { + "epoch": 1.46, + "learning_rate": 1.092342912802514e-06, + "loss": 0.8252, + "step": 56938 + }, + { + "epoch": 1.46, + "learning_rate": 1.092315360541784e-06, + "loss": 0.6963, + "step": 56939 + }, + { + "epoch": 1.46, + "learning_rate": 1.0922878082103724e-06, + "loss": 0.5947, + "step": 56940 + }, + { + "epoch": 1.46, + "learning_rate": 1.0922602558082999e-06, + "loss": 0.6792, + "step": 56941 + }, + { + "epoch": 1.46, + "learning_rate": 1.0922327033355884e-06, + "loss": 0.5603, + "step": 56942 + }, + { + "epoch": 1.46, + "learning_rate": 1.092205150792258e-06, + "loss": 0.5981, + "step": 56943 + }, + { + "epoch": 1.46, + "learning_rate": 1.092177598178331e-06, + "loss": 0.708, + "step": 56944 + }, + { + "epoch": 1.46, + "learning_rate": 1.0921500454938272e-06, + "loss": 0.4836, + "step": 56945 + }, + { + "epoch": 1.46, + "learning_rate": 1.092122492738769e-06, + "loss": 0.6846, + "step": 56946 + }, + { + "epoch": 1.46, + "learning_rate": 1.0920949399131763e-06, + "loss": 0.4636, + "step": 56947 + }, + { + "epoch": 1.46, + "learning_rate": 1.092067387017071e-06, + "loss": 0.5264, + "step": 56948 + }, + { + "epoch": 1.46, + "learning_rate": 1.092039834050474e-06, + "loss": 0.457, + "step": 56949 + }, + { + "epoch": 1.46, + "learning_rate": 1.0920122810134063e-06, + "loss": 0.4454, + "step": 56950 + }, + { + "epoch": 1.46, + "learning_rate": 1.0919847279058887e-06, + "loss": 0.8047, + "step": 56951 + }, + { + "epoch": 1.46, + "learning_rate": 1.091957174727943e-06, + "loss": 0.4622, + "step": 56952 + }, + { + "epoch": 1.46, + "learning_rate": 1.0919296214795897e-06, + "loss": 0.7002, + "step": 56953 + }, + { + "epoch": 1.46, + "learning_rate": 1.0919020681608505e-06, + "loss": 0.3604, + "step": 56954 + }, + { + "epoch": 1.46, + "learning_rate": 1.0918745147717457e-06, + "loss": 0.625, + "step": 56955 + }, + { + "epoch": 1.46, + "learning_rate": 1.0918469613122967e-06, + "loss": 0.6426, + "step": 56956 + }, + { + "epoch": 1.46, + "learning_rate": 1.091819407782525e-06, + "loss": 0.5688, + "step": 56957 + }, + { + "epoch": 1.46, + "learning_rate": 1.0917918541824515e-06, + "loss": 0.6504, + "step": 56958 + }, + { + "epoch": 1.46, + "learning_rate": 1.091764300512097e-06, + "loss": 0.7129, + "step": 56959 + }, + { + "epoch": 1.46, + "learning_rate": 1.0917367467714829e-06, + "loss": 0.5048, + "step": 56960 + }, + { + "epoch": 1.46, + "learning_rate": 1.0917091929606302e-06, + "loss": 0.8037, + "step": 56961 + }, + { + "epoch": 1.46, + "learning_rate": 1.0916816390795597e-06, + "loss": 0.7236, + "step": 56962 + }, + { + "epoch": 1.46, + "learning_rate": 1.091654085128293e-06, + "loss": 0.6133, + "step": 56963 + }, + { + "epoch": 1.46, + "learning_rate": 1.0916265311068511e-06, + "loss": 0.7153, + "step": 56964 + }, + { + "epoch": 1.46, + "learning_rate": 1.091598977015255e-06, + "loss": 0.7295, + "step": 56965 + }, + { + "epoch": 1.46, + "learning_rate": 1.0915714228535254e-06, + "loss": 0.6172, + "step": 56966 + }, + { + "epoch": 1.46, + "learning_rate": 1.091543868621684e-06, + "loss": 0.709, + "step": 56967 + }, + { + "epoch": 1.46, + "learning_rate": 1.0915163143197517e-06, + "loss": 0.5054, + "step": 56968 + }, + { + "epoch": 1.46, + "learning_rate": 1.0914887599477499e-06, + "loss": 0.7432, + "step": 56969 + }, + { + "epoch": 1.46, + "learning_rate": 1.0914612055056986e-06, + "loss": 0.7021, + "step": 56970 + }, + { + "epoch": 1.46, + "learning_rate": 1.0914336509936202e-06, + "loss": 0.5845, + "step": 56971 + }, + { + "epoch": 1.46, + "learning_rate": 1.0914060964115351e-06, + "loss": 0.6296, + "step": 56972 + }, + { + "epoch": 1.46, + "learning_rate": 1.0913785417594646e-06, + "loss": 0.7295, + "step": 56973 + }, + { + "epoch": 1.46, + "learning_rate": 1.0913509870374298e-06, + "loss": 0.6191, + "step": 56974 + }, + { + "epoch": 1.46, + "learning_rate": 1.0913234322454516e-06, + "loss": 0.623, + "step": 56975 + }, + { + "epoch": 1.46, + "learning_rate": 1.0912958773835511e-06, + "loss": 0.6963, + "step": 56976 + }, + { + "epoch": 1.46, + "learning_rate": 1.09126832245175e-06, + "loss": 0.7812, + "step": 56977 + }, + { + "epoch": 1.46, + "learning_rate": 1.0912407674500686e-06, + "loss": 0.561, + "step": 56978 + }, + { + "epoch": 1.46, + "learning_rate": 1.0912132123785285e-06, + "loss": 0.7383, + "step": 56979 + }, + { + "epoch": 1.46, + "learning_rate": 1.0911856572371508e-06, + "loss": 0.594, + "step": 56980 + }, + { + "epoch": 1.46, + "learning_rate": 1.091158102025956e-06, + "loss": 0.6836, + "step": 56981 + }, + { + "epoch": 1.46, + "learning_rate": 1.0911305467449658e-06, + "loss": 0.4771, + "step": 56982 + }, + { + "epoch": 1.46, + "learning_rate": 1.091102991394201e-06, + "loss": 0.8076, + "step": 56983 + }, + { + "epoch": 1.46, + "learning_rate": 1.0910754359736836e-06, + "loss": 0.5361, + "step": 56984 + }, + { + "epoch": 1.46, + "learning_rate": 1.091047880483433e-06, + "loss": 0.6069, + "step": 56985 + }, + { + "epoch": 1.46, + "learning_rate": 1.0910203249234718e-06, + "loss": 0.5374, + "step": 56986 + }, + { + "epoch": 1.46, + "learning_rate": 1.0909927692938202e-06, + "loss": 0.7256, + "step": 56987 + }, + { + "epoch": 1.46, + "learning_rate": 1.0909652135944995e-06, + "loss": 0.7207, + "step": 56988 + }, + { + "epoch": 1.46, + "learning_rate": 1.0909376578255314e-06, + "loss": 0.564, + "step": 56989 + }, + { + "epoch": 1.46, + "learning_rate": 1.0909101019869362e-06, + "loss": 0.6875, + "step": 56990 + }, + { + "epoch": 1.46, + "learning_rate": 1.0908825460787351e-06, + "loss": 0.6221, + "step": 56991 + }, + { + "epoch": 1.46, + "learning_rate": 1.0908549901009498e-06, + "loss": 0.6572, + "step": 56992 + }, + { + "epoch": 1.46, + "learning_rate": 1.0908274340536009e-06, + "loss": 0.6824, + "step": 56993 + }, + { + "epoch": 1.46, + "learning_rate": 1.0907998779367099e-06, + "loss": 0.8145, + "step": 56994 + }, + { + "epoch": 1.46, + "learning_rate": 1.0907723217502972e-06, + "loss": 0.6777, + "step": 56995 + }, + { + "epoch": 1.46, + "learning_rate": 1.0907447654943844e-06, + "loss": 0.6191, + "step": 56996 + }, + { + "epoch": 1.46, + "learning_rate": 1.0907172091689924e-06, + "loss": 0.5586, + "step": 56997 + }, + { + "epoch": 1.46, + "learning_rate": 1.0906896527741425e-06, + "loss": 0.5991, + "step": 56998 + }, + { + "epoch": 1.46, + "learning_rate": 1.0906620963098558e-06, + "loss": 0.6821, + "step": 56999 + }, + { + "epoch": 1.46, + "learning_rate": 1.0906345397761533e-06, + "loss": 0.5967, + "step": 57000 + }, + { + "epoch": 1.46, + "learning_rate": 1.090606983173056e-06, + "loss": 0.6709, + "step": 57001 + }, + { + "epoch": 1.46, + "learning_rate": 1.090579426500585e-06, + "loss": 0.6846, + "step": 57002 + }, + { + "epoch": 1.46, + "learning_rate": 1.0905518697587617e-06, + "loss": 0.4976, + "step": 57003 + }, + { + "epoch": 1.46, + "learning_rate": 1.090524312947607e-06, + "loss": 0.5015, + "step": 57004 + }, + { + "epoch": 1.46, + "learning_rate": 1.0904967560671418e-06, + "loss": 0.6787, + "step": 57005 + }, + { + "epoch": 1.46, + "learning_rate": 1.0904691991173875e-06, + "loss": 0.562, + "step": 57006 + }, + { + "epoch": 1.46, + "learning_rate": 1.0904416420983651e-06, + "loss": 0.6582, + "step": 57007 + }, + { + "epoch": 1.46, + "learning_rate": 1.0904140850100955e-06, + "loss": 0.7168, + "step": 57008 + }, + { + "epoch": 1.46, + "learning_rate": 1.0903865278526006e-06, + "loss": 0.5601, + "step": 57009 + }, + { + "epoch": 1.46, + "learning_rate": 1.0903589706259002e-06, + "loss": 0.6064, + "step": 57010 + }, + { + "epoch": 1.46, + "learning_rate": 1.0903314133300166e-06, + "loss": 0.7266, + "step": 57011 + }, + { + "epoch": 1.46, + "learning_rate": 1.09030385596497e-06, + "loss": 0.6543, + "step": 57012 + }, + { + "epoch": 1.46, + "learning_rate": 1.0902762985307821e-06, + "loss": 0.7285, + "step": 57013 + }, + { + "epoch": 1.46, + "learning_rate": 1.090248741027474e-06, + "loss": 0.5049, + "step": 57014 + }, + { + "epoch": 1.46, + "learning_rate": 1.0902211834550664e-06, + "loss": 0.9189, + "step": 57015 + }, + { + "epoch": 1.46, + "learning_rate": 1.0901936258135802e-06, + "loss": 0.5674, + "step": 57016 + }, + { + "epoch": 1.46, + "learning_rate": 1.0901660681030374e-06, + "loss": 0.7041, + "step": 57017 + }, + { + "epoch": 1.46, + "learning_rate": 1.0901385103234583e-06, + "loss": 0.6172, + "step": 57018 + }, + { + "epoch": 1.46, + "learning_rate": 1.0901109524748643e-06, + "loss": 0.6982, + "step": 57019 + }, + { + "epoch": 1.46, + "learning_rate": 1.0900833945572768e-06, + "loss": 0.8213, + "step": 57020 + }, + { + "epoch": 1.46, + "learning_rate": 1.0900558365707162e-06, + "loss": 0.4783, + "step": 57021 + }, + { + "epoch": 1.46, + "learning_rate": 1.090028278515204e-06, + "loss": 0.7314, + "step": 57022 + }, + { + "epoch": 1.46, + "learning_rate": 1.0900007203907615e-06, + "loss": 0.6084, + "step": 57023 + }, + { + "epoch": 1.46, + "learning_rate": 1.0899731621974097e-06, + "loss": 0.6372, + "step": 57024 + }, + { + "epoch": 1.46, + "learning_rate": 1.0899456039351691e-06, + "loss": 0.7573, + "step": 57025 + }, + { + "epoch": 1.46, + "learning_rate": 1.0899180456040618e-06, + "loss": 0.8203, + "step": 57026 + }, + { + "epoch": 1.46, + "learning_rate": 1.0898904872041079e-06, + "loss": 0.5903, + "step": 57027 + }, + { + "epoch": 1.46, + "learning_rate": 1.0898629287353293e-06, + "loss": 0.7822, + "step": 57028 + }, + { + "epoch": 1.46, + "learning_rate": 1.089835370197747e-06, + "loss": 0.562, + "step": 57029 + }, + { + "epoch": 1.46, + "learning_rate": 1.0898078115913817e-06, + "loss": 0.6079, + "step": 57030 + }, + { + "epoch": 1.46, + "learning_rate": 1.0897802529162545e-06, + "loss": 0.5884, + "step": 57031 + }, + { + "epoch": 1.46, + "learning_rate": 1.089752694172387e-06, + "loss": 0.7256, + "step": 57032 + }, + { + "epoch": 1.46, + "learning_rate": 1.0897251353597996e-06, + "loss": 0.7373, + "step": 57033 + }, + { + "epoch": 1.46, + "learning_rate": 1.0896975764785141e-06, + "loss": 0.7559, + "step": 57034 + }, + { + "epoch": 1.46, + "learning_rate": 1.0896700175285512e-06, + "loss": 0.647, + "step": 57035 + }, + { + "epoch": 1.46, + "learning_rate": 1.0896424585099322e-06, + "loss": 0.5938, + "step": 57036 + }, + { + "epoch": 1.46, + "learning_rate": 1.0896148994226778e-06, + "loss": 0.4333, + "step": 57037 + }, + { + "epoch": 1.46, + "learning_rate": 1.0895873402668096e-06, + "loss": 0.6992, + "step": 57038 + }, + { + "epoch": 1.46, + "learning_rate": 1.0895597810423485e-06, + "loss": 0.8135, + "step": 57039 + }, + { + "epoch": 1.46, + "learning_rate": 1.0895322217493156e-06, + "loss": 0.5771, + "step": 57040 + }, + { + "epoch": 1.46, + "learning_rate": 1.0895046623877317e-06, + "loss": 0.7051, + "step": 57041 + }, + { + "epoch": 1.46, + "learning_rate": 1.0894771029576187e-06, + "loss": 0.8242, + "step": 57042 + }, + { + "epoch": 1.46, + "learning_rate": 1.0894495434589967e-06, + "loss": 0.6875, + "step": 57043 + }, + { + "epoch": 1.46, + "learning_rate": 1.0894219838918877e-06, + "loss": 0.6313, + "step": 57044 + }, + { + "epoch": 1.46, + "learning_rate": 1.0893944242563122e-06, + "loss": 0.6499, + "step": 57045 + }, + { + "epoch": 1.46, + "learning_rate": 1.0893668645522913e-06, + "loss": 0.8184, + "step": 57046 + }, + { + "epoch": 1.46, + "learning_rate": 1.0893393047798467e-06, + "loss": 0.5708, + "step": 57047 + }, + { + "epoch": 1.46, + "learning_rate": 1.089311744938999e-06, + "loss": 0.7363, + "step": 57048 + }, + { + "epoch": 1.46, + "learning_rate": 1.0892841850297694e-06, + "loss": 0.7666, + "step": 57049 + }, + { + "epoch": 1.46, + "learning_rate": 1.089256625052179e-06, + "loss": 0.6929, + "step": 57050 + }, + { + "epoch": 1.46, + "learning_rate": 1.0892290650062487e-06, + "loss": 0.6414, + "step": 57051 + }, + { + "epoch": 1.46, + "learning_rate": 1.0892015048919999e-06, + "loss": 0.7476, + "step": 57052 + }, + { + "epoch": 1.46, + "learning_rate": 1.0891739447094536e-06, + "loss": 0.6069, + "step": 57053 + }, + { + "epoch": 1.46, + "learning_rate": 1.089146384458631e-06, + "loss": 0.7324, + "step": 57054 + }, + { + "epoch": 1.46, + "learning_rate": 1.0891188241395533e-06, + "loss": 0.8867, + "step": 57055 + }, + { + "epoch": 1.46, + "learning_rate": 1.0890912637522411e-06, + "loss": 0.6904, + "step": 57056 + }, + { + "epoch": 1.46, + "learning_rate": 1.089063703296716e-06, + "loss": 0.6963, + "step": 57057 + }, + { + "epoch": 1.46, + "learning_rate": 1.0890361427729986e-06, + "loss": 0.7461, + "step": 57058 + }, + { + "epoch": 1.46, + "learning_rate": 1.0890085821811108e-06, + "loss": 0.5735, + "step": 57059 + }, + { + "epoch": 1.46, + "learning_rate": 1.0889810215210728e-06, + "loss": 0.5161, + "step": 57060 + }, + { + "epoch": 1.46, + "learning_rate": 1.0889534607929065e-06, + "loss": 0.6777, + "step": 57061 + }, + { + "epoch": 1.46, + "learning_rate": 1.0889258999966322e-06, + "loss": 0.7139, + "step": 57062 + }, + { + "epoch": 1.46, + "learning_rate": 1.0888983391322717e-06, + "loss": 0.5424, + "step": 57063 + }, + { + "epoch": 1.46, + "learning_rate": 1.088870778199846e-06, + "loss": 0.8076, + "step": 57064 + }, + { + "epoch": 1.46, + "learning_rate": 1.0888432171993757e-06, + "loss": 0.7344, + "step": 57065 + }, + { + "epoch": 1.46, + "learning_rate": 1.0888156561308824e-06, + "loss": 0.6396, + "step": 57066 + }, + { + "epoch": 1.46, + "learning_rate": 1.088788094994387e-06, + "loss": 0.7021, + "step": 57067 + }, + { + "epoch": 1.46, + "learning_rate": 1.0887605337899105e-06, + "loss": 0.7246, + "step": 57068 + }, + { + "epoch": 1.46, + "learning_rate": 1.0887329725174743e-06, + "loss": 0.7168, + "step": 57069 + }, + { + "epoch": 1.46, + "learning_rate": 1.0887054111770994e-06, + "loss": 0.623, + "step": 57070 + }, + { + "epoch": 1.46, + "learning_rate": 1.0886778497688066e-06, + "loss": 0.8057, + "step": 57071 + }, + { + "epoch": 1.46, + "learning_rate": 1.0886502882926174e-06, + "loss": 0.709, + "step": 57072 + }, + { + "epoch": 1.46, + "learning_rate": 1.0886227267485526e-06, + "loss": 0.6982, + "step": 57073 + }, + { + "epoch": 1.46, + "learning_rate": 1.0885951651366338e-06, + "loss": 0.6279, + "step": 57074 + }, + { + "epoch": 1.46, + "learning_rate": 1.0885676034568817e-06, + "loss": 0.6353, + "step": 57075 + }, + { + "epoch": 1.46, + "learning_rate": 1.0885400417093174e-06, + "loss": 0.6514, + "step": 57076 + }, + { + "epoch": 1.46, + "learning_rate": 1.0885124798939618e-06, + "loss": 0.5371, + "step": 57077 + }, + { + "epoch": 1.46, + "learning_rate": 1.0884849180108365e-06, + "loss": 0.6543, + "step": 57078 + }, + { + "epoch": 1.46, + "learning_rate": 1.0884573560599625e-06, + "loss": 0.5718, + "step": 57079 + }, + { + "epoch": 1.46, + "learning_rate": 1.0884297940413605e-06, + "loss": 0.6602, + "step": 57080 + }, + { + "epoch": 1.46, + "learning_rate": 1.0884022319550516e-06, + "loss": 0.5908, + "step": 57081 + }, + { + "epoch": 1.46, + "learning_rate": 1.0883746698010576e-06, + "loss": 0.7803, + "step": 57082 + }, + { + "epoch": 1.46, + "learning_rate": 1.088347107579399e-06, + "loss": 0.8027, + "step": 57083 + }, + { + "epoch": 1.46, + "learning_rate": 1.0883195452900974e-06, + "loss": 0.4956, + "step": 57084 + }, + { + "epoch": 1.46, + "learning_rate": 1.0882919829331734e-06, + "loss": 0.7793, + "step": 57085 + }, + { + "epoch": 1.46, + "learning_rate": 1.0882644205086485e-06, + "loss": 0.6973, + "step": 57086 + }, + { + "epoch": 1.46, + "learning_rate": 1.088236858016543e-06, + "loss": 0.6899, + "step": 57087 + }, + { + "epoch": 1.46, + "learning_rate": 1.0882092954568792e-06, + "loss": 0.5956, + "step": 57088 + }, + { + "epoch": 1.46, + "learning_rate": 1.0881817328296775e-06, + "loss": 0.4443, + "step": 57089 + }, + { + "epoch": 1.46, + "learning_rate": 1.0881541701349586e-06, + "loss": 0.667, + "step": 57090 + }, + { + "epoch": 1.46, + "learning_rate": 1.0881266073727443e-06, + "loss": 0.5605, + "step": 57091 + }, + { + "epoch": 1.46, + "learning_rate": 1.0880990445430558e-06, + "loss": 0.6826, + "step": 57092 + }, + { + "epoch": 1.46, + "learning_rate": 1.0880714816459139e-06, + "loss": 0.5101, + "step": 57093 + }, + { + "epoch": 1.46, + "learning_rate": 1.0880439186813394e-06, + "loss": 0.5197, + "step": 57094 + }, + { + "epoch": 1.46, + "learning_rate": 1.088016355649354e-06, + "loss": 0.8662, + "step": 57095 + }, + { + "epoch": 1.46, + "learning_rate": 1.0879887925499785e-06, + "loss": 0.6616, + "step": 57096 + }, + { + "epoch": 1.46, + "learning_rate": 1.0879612293832338e-06, + "loss": 0.623, + "step": 57097 + }, + { + "epoch": 1.46, + "learning_rate": 1.0879336661491415e-06, + "loss": 0.8652, + "step": 57098 + }, + { + "epoch": 1.46, + "learning_rate": 1.0879061028477225e-06, + "loss": 0.6577, + "step": 57099 + }, + { + "epoch": 1.46, + "learning_rate": 1.0878785394789975e-06, + "loss": 0.7979, + "step": 57100 + }, + { + "epoch": 1.46, + "learning_rate": 1.0878509760429882e-06, + "loss": 0.9111, + "step": 57101 + }, + { + "epoch": 1.46, + "learning_rate": 1.0878234125397152e-06, + "loss": 0.625, + "step": 57102 + }, + { + "epoch": 1.46, + "learning_rate": 1.0877958489692e-06, + "loss": 0.6484, + "step": 57103 + }, + { + "epoch": 1.46, + "learning_rate": 1.0877682853314637e-06, + "loss": 0.7197, + "step": 57104 + }, + { + "epoch": 1.46, + "learning_rate": 1.0877407216265274e-06, + "loss": 0.6572, + "step": 57105 + }, + { + "epoch": 1.46, + "learning_rate": 1.0877131578544114e-06, + "loss": 0.8301, + "step": 57106 + }, + { + "epoch": 1.46, + "learning_rate": 1.087685594015138e-06, + "loss": 0.8311, + "step": 57107 + }, + { + "epoch": 1.46, + "learning_rate": 1.0876580301087275e-06, + "loss": 0.6606, + "step": 57108 + }, + { + "epoch": 1.46, + "learning_rate": 1.0876304661352014e-06, + "loss": 0.5508, + "step": 57109 + }, + { + "epoch": 1.46, + "learning_rate": 1.0876029020945809e-06, + "loss": 0.6025, + "step": 57110 + }, + { + "epoch": 1.46, + "learning_rate": 1.0875753379868865e-06, + "loss": 0.626, + "step": 57111 + }, + { + "epoch": 1.46, + "learning_rate": 1.08754777381214e-06, + "loss": 0.8164, + "step": 57112 + }, + { + "epoch": 1.46, + "learning_rate": 1.087520209570362e-06, + "loss": 0.6826, + "step": 57113 + }, + { + "epoch": 1.46, + "learning_rate": 1.087492645261574e-06, + "loss": 0.6451, + "step": 57114 + }, + { + "epoch": 1.46, + "learning_rate": 1.0874650808857965e-06, + "loss": 0.4966, + "step": 57115 + }, + { + "epoch": 1.46, + "learning_rate": 1.0874375164430513e-06, + "loss": 0.563, + "step": 57116 + }, + { + "epoch": 1.46, + "learning_rate": 1.0874099519333593e-06, + "loss": 0.6572, + "step": 57117 + }, + { + "epoch": 1.46, + "learning_rate": 1.0873823873567414e-06, + "loss": 0.5884, + "step": 57118 + }, + { + "epoch": 1.46, + "learning_rate": 1.0873548227132189e-06, + "loss": 0.6216, + "step": 57119 + }, + { + "epoch": 1.46, + "learning_rate": 1.0873272580028127e-06, + "loss": 0.4543, + "step": 57120 + }, + { + "epoch": 1.46, + "learning_rate": 1.0872996932255441e-06, + "loss": 0.582, + "step": 57121 + }, + { + "epoch": 1.46, + "learning_rate": 1.087272128381434e-06, + "loss": 0.7236, + "step": 57122 + }, + { + "epoch": 1.46, + "learning_rate": 1.0872445634705038e-06, + "loss": 0.7168, + "step": 57123 + }, + { + "epoch": 1.46, + "learning_rate": 1.0872169984927745e-06, + "loss": 0.5996, + "step": 57124 + }, + { + "epoch": 1.46, + "learning_rate": 1.0871894334482672e-06, + "loss": 0.604, + "step": 57125 + }, + { + "epoch": 1.46, + "learning_rate": 1.0871618683370028e-06, + "loss": 0.7461, + "step": 57126 + }, + { + "epoch": 1.46, + "learning_rate": 1.0871343031590027e-06, + "loss": 0.7627, + "step": 57127 + }, + { + "epoch": 1.46, + "learning_rate": 1.0871067379142877e-06, + "loss": 0.6958, + "step": 57128 + }, + { + "epoch": 1.46, + "learning_rate": 1.0870791726028793e-06, + "loss": 0.7256, + "step": 57129 + }, + { + "epoch": 1.46, + "learning_rate": 1.0870516072247981e-06, + "loss": 0.647, + "step": 57130 + }, + { + "epoch": 1.46, + "learning_rate": 1.0870240417800657e-06, + "loss": 0.7656, + "step": 57131 + }, + { + "epoch": 1.46, + "learning_rate": 1.0869964762687028e-06, + "loss": 0.6387, + "step": 57132 + }, + { + "epoch": 1.46, + "learning_rate": 1.0869689106907306e-06, + "loss": 0.7773, + "step": 57133 + }, + { + "epoch": 1.46, + "learning_rate": 1.0869413450461706e-06, + "loss": 0.7158, + "step": 57134 + }, + { + "epoch": 1.46, + "learning_rate": 1.0869137793350435e-06, + "loss": 0.75, + "step": 57135 + }, + { + "epoch": 1.46, + "learning_rate": 1.0868862135573707e-06, + "loss": 0.6709, + "step": 57136 + }, + { + "epoch": 1.46, + "learning_rate": 1.0868586477131729e-06, + "loss": 0.564, + "step": 57137 + }, + { + "epoch": 1.46, + "learning_rate": 1.0868310818024715e-06, + "loss": 0.6201, + "step": 57138 + }, + { + "epoch": 1.46, + "learning_rate": 1.0868035158252878e-06, + "loss": 0.708, + "step": 57139 + }, + { + "epoch": 1.46, + "learning_rate": 1.086775949781642e-06, + "loss": 0.6973, + "step": 57140 + }, + { + "epoch": 1.46, + "learning_rate": 1.0867483836715563e-06, + "loss": 0.5906, + "step": 57141 + }, + { + "epoch": 1.46, + "learning_rate": 1.0867208174950513e-06, + "loss": 0.6904, + "step": 57142 + }, + { + "epoch": 1.46, + "learning_rate": 1.086693251252148e-06, + "loss": 0.707, + "step": 57143 + }, + { + "epoch": 1.46, + "learning_rate": 1.0866656849428679e-06, + "loss": 0.5498, + "step": 57144 + }, + { + "epoch": 1.46, + "learning_rate": 1.0866381185672318e-06, + "loss": 0.6084, + "step": 57145 + }, + { + "epoch": 1.46, + "learning_rate": 1.0866105521252606e-06, + "loss": 0.5007, + "step": 57146 + }, + { + "epoch": 1.46, + "learning_rate": 1.0865829856169762e-06, + "loss": 0.6982, + "step": 57147 + }, + { + "epoch": 1.46, + "learning_rate": 1.0865554190423987e-06, + "loss": 0.6494, + "step": 57148 + }, + { + "epoch": 1.46, + "learning_rate": 1.0865278524015503e-06, + "loss": 0.6785, + "step": 57149 + }, + { + "epoch": 1.46, + "learning_rate": 1.0865002856944507e-06, + "loss": 0.5522, + "step": 57150 + }, + { + "epoch": 1.46, + "learning_rate": 1.0864727189211225e-06, + "loss": 0.7036, + "step": 57151 + }, + { + "epoch": 1.46, + "learning_rate": 1.0864451520815856e-06, + "loss": 0.6321, + "step": 57152 + }, + { + "epoch": 1.46, + "learning_rate": 1.0864175851758619e-06, + "loss": 0.4064, + "step": 57153 + }, + { + "epoch": 1.46, + "learning_rate": 1.0863900182039722e-06, + "loss": 0.6963, + "step": 57154 + }, + { + "epoch": 1.46, + "learning_rate": 1.0863624511659375e-06, + "loss": 0.5669, + "step": 57155 + }, + { + "epoch": 1.46, + "learning_rate": 1.0863348840617792e-06, + "loss": 0.6963, + "step": 57156 + }, + { + "epoch": 1.46, + "learning_rate": 1.0863073168915182e-06, + "loss": 0.7305, + "step": 57157 + }, + { + "epoch": 1.46, + "learning_rate": 1.0862797496551757e-06, + "loss": 0.603, + "step": 57158 + }, + { + "epoch": 1.47, + "learning_rate": 1.0862521823527725e-06, + "loss": 0.6309, + "step": 57159 + }, + { + "epoch": 1.47, + "learning_rate": 1.0862246149843304e-06, + "loss": 0.5933, + "step": 57160 + }, + { + "epoch": 1.47, + "learning_rate": 1.0861970475498697e-06, + "loss": 0.6431, + "step": 57161 + }, + { + "epoch": 1.47, + "learning_rate": 1.0861694800494122e-06, + "loss": 0.499, + "step": 57162 + }, + { + "epoch": 1.47, + "learning_rate": 1.0861419124829783e-06, + "loss": 0.6924, + "step": 57163 + }, + { + "epoch": 1.47, + "learning_rate": 1.08611434485059e-06, + "loss": 0.5635, + "step": 57164 + }, + { + "epoch": 1.47, + "learning_rate": 1.0860867771522676e-06, + "loss": 0.6211, + "step": 57165 + }, + { + "epoch": 1.47, + "learning_rate": 1.0860592093880326e-06, + "loss": 0.6582, + "step": 57166 + }, + { + "epoch": 1.47, + "learning_rate": 1.0860316415579058e-06, + "loss": 0.6729, + "step": 57167 + }, + { + "epoch": 1.47, + "learning_rate": 1.0860040736619087e-06, + "loss": 0.6543, + "step": 57168 + }, + { + "epoch": 1.47, + "learning_rate": 1.0859765057000624e-06, + "loss": 0.6777, + "step": 57169 + }, + { + "epoch": 1.47, + "learning_rate": 1.085948937672388e-06, + "loss": 0.5201, + "step": 57170 + }, + { + "epoch": 1.47, + "learning_rate": 1.0859213695789057e-06, + "loss": 0.6343, + "step": 57171 + }, + { + "epoch": 1.47, + "learning_rate": 1.085893801419638e-06, + "loss": 0.5688, + "step": 57172 + }, + { + "epoch": 1.47, + "learning_rate": 1.0858662331946048e-06, + "loss": 0.4475, + "step": 57173 + }, + { + "epoch": 1.47, + "learning_rate": 1.0858386649038285e-06, + "loss": 0.6392, + "step": 57174 + }, + { + "epoch": 1.47, + "learning_rate": 1.085811096547329e-06, + "loss": 0.8359, + "step": 57175 + }, + { + "epoch": 1.47, + "learning_rate": 1.0857835281251282e-06, + "loss": 0.7324, + "step": 57176 + }, + { + "epoch": 1.47, + "learning_rate": 1.0857559596372465e-06, + "loss": 0.585, + "step": 57177 + }, + { + "epoch": 1.47, + "learning_rate": 1.0857283910837057e-06, + "loss": 0.708, + "step": 57178 + }, + { + "epoch": 1.47, + "learning_rate": 1.0857008224645265e-06, + "loss": 0.7529, + "step": 57179 + }, + { + "epoch": 1.47, + "learning_rate": 1.08567325377973e-06, + "loss": 0.6895, + "step": 57180 + }, + { + "epoch": 1.47, + "learning_rate": 1.0856456850293377e-06, + "loss": 0.5962, + "step": 57181 + }, + { + "epoch": 1.47, + "learning_rate": 1.0856181162133702e-06, + "loss": 0.7324, + "step": 57182 + }, + { + "epoch": 1.47, + "learning_rate": 1.0855905473318492e-06, + "loss": 0.5724, + "step": 57183 + }, + { + "epoch": 1.47, + "learning_rate": 1.085562978384795e-06, + "loss": 0.6934, + "step": 57184 + }, + { + "epoch": 1.47, + "learning_rate": 1.0855354093722295e-06, + "loss": 0.7617, + "step": 57185 + }, + { + "epoch": 1.47, + "learning_rate": 1.0855078402941731e-06, + "loss": 0.8369, + "step": 57186 + }, + { + "epoch": 1.47, + "learning_rate": 1.0854802711506477e-06, + "loss": 0.7334, + "step": 57187 + }, + { + "epoch": 1.47, + "learning_rate": 1.0854527019416737e-06, + "loss": 0.6973, + "step": 57188 + }, + { + "epoch": 1.47, + "learning_rate": 1.0854251326672728e-06, + "loss": 0.6658, + "step": 57189 + }, + { + "epoch": 1.47, + "learning_rate": 1.0853975633274654e-06, + "loss": 0.4663, + "step": 57190 + }, + { + "epoch": 1.47, + "learning_rate": 1.0853699939222733e-06, + "loss": 0.7109, + "step": 57191 + }, + { + "epoch": 1.47, + "learning_rate": 1.0853424244517171e-06, + "loss": 0.6113, + "step": 57192 + }, + { + "epoch": 1.47, + "learning_rate": 1.0853148549158185e-06, + "loss": 0.625, + "step": 57193 + }, + { + "epoch": 1.47, + "learning_rate": 1.0852872853145977e-06, + "loss": 0.7559, + "step": 57194 + }, + { + "epoch": 1.47, + "learning_rate": 1.0852597156480769e-06, + "loss": 0.6777, + "step": 57195 + }, + { + "epoch": 1.47, + "learning_rate": 1.0852321459162762e-06, + "loss": 0.749, + "step": 57196 + }, + { + "epoch": 1.47, + "learning_rate": 1.0852045761192174e-06, + "loss": 0.5835, + "step": 57197 + }, + { + "epoch": 1.47, + "learning_rate": 1.0851770062569214e-06, + "loss": 0.5341, + "step": 57198 + }, + { + "epoch": 1.47, + "learning_rate": 1.0851494363294092e-06, + "loss": 0.6172, + "step": 57199 + }, + { + "epoch": 1.47, + "learning_rate": 1.085121866336702e-06, + "loss": 0.5371, + "step": 57200 + }, + { + "epoch": 1.47, + "learning_rate": 1.085094296278821e-06, + "loss": 0.491, + "step": 57201 + }, + { + "epoch": 1.47, + "learning_rate": 1.0850667261557871e-06, + "loss": 0.6943, + "step": 57202 + }, + { + "epoch": 1.47, + "learning_rate": 1.0850391559676215e-06, + "loss": 0.707, + "step": 57203 + }, + { + "epoch": 1.47, + "learning_rate": 1.0850115857143456e-06, + "loss": 0.52, + "step": 57204 + }, + { + "epoch": 1.47, + "learning_rate": 1.0849840153959798e-06, + "loss": 0.7012, + "step": 57205 + }, + { + "epoch": 1.47, + "learning_rate": 1.084956445012546e-06, + "loss": 0.6221, + "step": 57206 + }, + { + "epoch": 1.47, + "learning_rate": 1.0849288745640646e-06, + "loss": 0.6445, + "step": 57207 + }, + { + "epoch": 1.47, + "learning_rate": 1.0849013040505575e-06, + "loss": 0.7715, + "step": 57208 + }, + { + "epoch": 1.47, + "learning_rate": 1.084873733472045e-06, + "loss": 0.6992, + "step": 57209 + }, + { + "epoch": 1.47, + "learning_rate": 1.0848461628285487e-06, + "loss": 0.6636, + "step": 57210 + }, + { + "epoch": 1.47, + "learning_rate": 1.0848185921200897e-06, + "loss": 0.6465, + "step": 57211 + }, + { + "epoch": 1.47, + "learning_rate": 1.0847910213466888e-06, + "loss": 0.7002, + "step": 57212 + }, + { + "epoch": 1.47, + "learning_rate": 1.0847634505083675e-06, + "loss": 0.6191, + "step": 57213 + }, + { + "epoch": 1.47, + "learning_rate": 1.0847358796051468e-06, + "loss": 0.5308, + "step": 57214 + }, + { + "epoch": 1.47, + "learning_rate": 1.0847083086370476e-06, + "loss": 0.7705, + "step": 57215 + }, + { + "epoch": 1.47, + "learning_rate": 1.0846807376040913e-06, + "loss": 0.6514, + "step": 57216 + }, + { + "epoch": 1.47, + "learning_rate": 1.0846531665062986e-06, + "loss": 0.7236, + "step": 57217 + }, + { + "epoch": 1.47, + "learning_rate": 1.0846255953436912e-06, + "loss": 0.623, + "step": 57218 + }, + { + "epoch": 1.47, + "learning_rate": 1.0845980241162896e-06, + "loss": 0.665, + "step": 57219 + }, + { + "epoch": 1.47, + "learning_rate": 1.0845704528241151e-06, + "loss": 0.5986, + "step": 57220 + }, + { + "epoch": 1.47, + "learning_rate": 1.0845428814671888e-06, + "loss": 0.665, + "step": 57221 + }, + { + "epoch": 1.47, + "learning_rate": 1.0845153100455323e-06, + "loss": 0.5535, + "step": 57222 + }, + { + "epoch": 1.47, + "learning_rate": 1.0844877385591662e-06, + "loss": 0.6309, + "step": 57223 + }, + { + "epoch": 1.47, + "learning_rate": 1.0844601670081116e-06, + "loss": 0.6685, + "step": 57224 + }, + { + "epoch": 1.47, + "learning_rate": 1.0844325953923898e-06, + "loss": 0.6475, + "step": 57225 + }, + { + "epoch": 1.47, + "learning_rate": 1.0844050237120217e-06, + "loss": 0.48, + "step": 57226 + }, + { + "epoch": 1.47, + "learning_rate": 1.0843774519670287e-06, + "loss": 0.7256, + "step": 57227 + }, + { + "epoch": 1.47, + "learning_rate": 1.0843498801574317e-06, + "loss": 0.7402, + "step": 57228 + }, + { + "epoch": 1.47, + "learning_rate": 1.0843223082832522e-06, + "loss": 0.7061, + "step": 57229 + }, + { + "epoch": 1.47, + "learning_rate": 1.0842947363445104e-06, + "loss": 0.6812, + "step": 57230 + }, + { + "epoch": 1.47, + "learning_rate": 1.0842671643412285e-06, + "loss": 0.6157, + "step": 57231 + }, + { + "epoch": 1.47, + "learning_rate": 1.0842395922734269e-06, + "loss": 0.6113, + "step": 57232 + }, + { + "epoch": 1.47, + "learning_rate": 1.084212020141127e-06, + "loss": 0.5544, + "step": 57233 + }, + { + "epoch": 1.47, + "learning_rate": 1.0841844479443498e-06, + "loss": 0.688, + "step": 57234 + }, + { + "epoch": 1.47, + "learning_rate": 1.0841568756831163e-06, + "loss": 0.6035, + "step": 57235 + }, + { + "epoch": 1.47, + "learning_rate": 1.084129303357448e-06, + "loss": 0.6948, + "step": 57236 + }, + { + "epoch": 1.47, + "learning_rate": 1.0841017309673655e-06, + "loss": 0.7529, + "step": 57237 + }, + { + "epoch": 1.47, + "learning_rate": 1.0840741585128903e-06, + "loss": 0.4619, + "step": 57238 + }, + { + "epoch": 1.47, + "learning_rate": 1.0840465859940436e-06, + "loss": 0.6816, + "step": 57239 + }, + { + "epoch": 1.47, + "learning_rate": 1.0840190134108459e-06, + "loss": 0.5615, + "step": 57240 + }, + { + "epoch": 1.47, + "learning_rate": 1.0839914407633188e-06, + "loss": 0.6299, + "step": 57241 + }, + { + "epoch": 1.47, + "learning_rate": 1.0839638680514832e-06, + "loss": 0.6162, + "step": 57242 + }, + { + "epoch": 1.47, + "learning_rate": 1.0839362952753608e-06, + "loss": 0.6494, + "step": 57243 + }, + { + "epoch": 1.47, + "learning_rate": 1.083908722434972e-06, + "loss": 0.6982, + "step": 57244 + }, + { + "epoch": 1.47, + "learning_rate": 1.083881149530338e-06, + "loss": 0.8506, + "step": 57245 + }, + { + "epoch": 1.47, + "learning_rate": 1.08385357656148e-06, + "loss": 0.6787, + "step": 57246 + }, + { + "epoch": 1.47, + "learning_rate": 1.0838260035284195e-06, + "loss": 0.7222, + "step": 57247 + }, + { + "epoch": 1.47, + "learning_rate": 1.0837984304311772e-06, + "loss": 0.6567, + "step": 57248 + }, + { + "epoch": 1.47, + "learning_rate": 1.0837708572697742e-06, + "loss": 0.7427, + "step": 57249 + }, + { + "epoch": 1.47, + "learning_rate": 1.0837432840442316e-06, + "loss": 0.5601, + "step": 57250 + }, + { + "epoch": 1.47, + "learning_rate": 1.0837157107545707e-06, + "loss": 0.6924, + "step": 57251 + }, + { + "epoch": 1.47, + "learning_rate": 1.0836881374008128e-06, + "loss": 0.5874, + "step": 57252 + }, + { + "epoch": 1.47, + "learning_rate": 1.0836605639829784e-06, + "loss": 0.662, + "step": 57253 + }, + { + "epoch": 1.47, + "learning_rate": 1.083632990501089e-06, + "loss": 0.7637, + "step": 57254 + }, + { + "epoch": 1.47, + "learning_rate": 1.0836054169551656e-06, + "loss": 0.7285, + "step": 57255 + }, + { + "epoch": 1.47, + "learning_rate": 1.0835778433452295e-06, + "loss": 0.5786, + "step": 57256 + }, + { + "epoch": 1.47, + "learning_rate": 1.0835502696713018e-06, + "loss": 0.6631, + "step": 57257 + }, + { + "epoch": 1.47, + "learning_rate": 1.0835226959334036e-06, + "loss": 0.5586, + "step": 57258 + }, + { + "epoch": 1.47, + "learning_rate": 1.0834951221315556e-06, + "loss": 0.7148, + "step": 57259 + }, + { + "epoch": 1.47, + "learning_rate": 1.0834675482657794e-06, + "loss": 0.6885, + "step": 57260 + }, + { + "epoch": 1.47, + "learning_rate": 1.0834399743360955e-06, + "loss": 0.5076, + "step": 57261 + }, + { + "epoch": 1.47, + "learning_rate": 1.083412400342526e-06, + "loss": 0.6748, + "step": 57262 + }, + { + "epoch": 1.47, + "learning_rate": 1.0833848262850913e-06, + "loss": 0.7812, + "step": 57263 + }, + { + "epoch": 1.47, + "learning_rate": 1.0833572521638128e-06, + "loss": 0.7432, + "step": 57264 + }, + { + "epoch": 1.47, + "learning_rate": 1.083329677978711e-06, + "loss": 0.5398, + "step": 57265 + }, + { + "epoch": 1.47, + "learning_rate": 1.083302103729808e-06, + "loss": 0.5869, + "step": 57266 + }, + { + "epoch": 1.47, + "learning_rate": 1.0832745294171242e-06, + "loss": 0.6533, + "step": 57267 + }, + { + "epoch": 1.47, + "learning_rate": 1.083246955040681e-06, + "loss": 0.6416, + "step": 57268 + }, + { + "epoch": 1.47, + "learning_rate": 1.0832193806004994e-06, + "loss": 0.6289, + "step": 57269 + }, + { + "epoch": 1.47, + "learning_rate": 1.0831918060966003e-06, + "loss": 0.7002, + "step": 57270 + }, + { + "epoch": 1.47, + "learning_rate": 1.0831642315290055e-06, + "loss": 0.7881, + "step": 57271 + }, + { + "epoch": 1.47, + "learning_rate": 1.0831366568977353e-06, + "loss": 0.5811, + "step": 57272 + }, + { + "epoch": 1.47, + "learning_rate": 1.0831090822028116e-06, + "loss": 0.6821, + "step": 57273 + }, + { + "epoch": 1.47, + "learning_rate": 1.0830815074442548e-06, + "loss": 0.6846, + "step": 57274 + }, + { + "epoch": 1.47, + "learning_rate": 1.0830539326220864e-06, + "loss": 0.6733, + "step": 57275 + }, + { + "epoch": 1.47, + "learning_rate": 1.0830263577363273e-06, + "loss": 0.5613, + "step": 57276 + }, + { + "epoch": 1.47, + "learning_rate": 1.082998782786999e-06, + "loss": 0.5942, + "step": 57277 + }, + { + "epoch": 1.47, + "learning_rate": 1.082971207774122e-06, + "loss": 0.5935, + "step": 57278 + }, + { + "epoch": 1.47, + "learning_rate": 1.082943632697718e-06, + "loss": 0.6104, + "step": 57279 + }, + { + "epoch": 1.47, + "learning_rate": 1.0829160575578078e-06, + "loss": 0.6064, + "step": 57280 + }, + { + "epoch": 1.47, + "learning_rate": 1.0828884823544125e-06, + "loss": 0.6577, + "step": 57281 + }, + { + "epoch": 1.47, + "learning_rate": 1.0828609070875531e-06, + "loss": 0.7344, + "step": 57282 + }, + { + "epoch": 1.47, + "learning_rate": 1.0828333317572518e-06, + "loss": 0.6631, + "step": 57283 + }, + { + "epoch": 1.47, + "learning_rate": 1.082805756363528e-06, + "loss": 0.5762, + "step": 57284 + }, + { + "epoch": 1.47, + "learning_rate": 1.082778180906404e-06, + "loss": 0.7178, + "step": 57285 + }, + { + "epoch": 1.47, + "learning_rate": 1.0827506053859e-06, + "loss": 0.6904, + "step": 57286 + }, + { + "epoch": 1.47, + "learning_rate": 1.0827230298020384e-06, + "loss": 0.6338, + "step": 57287 + }, + { + "epoch": 1.47, + "learning_rate": 1.0826954541548392e-06, + "loss": 0.7202, + "step": 57288 + }, + { + "epoch": 1.47, + "learning_rate": 1.082667878444324e-06, + "loss": 0.4659, + "step": 57289 + }, + { + "epoch": 1.47, + "learning_rate": 1.0826403026705137e-06, + "loss": 0.6216, + "step": 57290 + }, + { + "epoch": 1.47, + "learning_rate": 1.0826127268334298e-06, + "loss": 0.7305, + "step": 57291 + }, + { + "epoch": 1.47, + "learning_rate": 1.0825851509330927e-06, + "loss": 0.7119, + "step": 57292 + }, + { + "epoch": 1.47, + "learning_rate": 1.0825575749695241e-06, + "loss": 0.4788, + "step": 57293 + }, + { + "epoch": 1.47, + "learning_rate": 1.0825299989427451e-06, + "loss": 0.5712, + "step": 57294 + }, + { + "epoch": 1.47, + "learning_rate": 1.0825024228527766e-06, + "loss": 0.709, + "step": 57295 + }, + { + "epoch": 1.47, + "learning_rate": 1.08247484669964e-06, + "loss": 0.6934, + "step": 57296 + }, + { + "epoch": 1.47, + "learning_rate": 1.082447270483356e-06, + "loss": 0.5928, + "step": 57297 + }, + { + "epoch": 1.47, + "learning_rate": 1.082419694203946e-06, + "loss": 0.7354, + "step": 57298 + }, + { + "epoch": 1.47, + "learning_rate": 1.0823921178614307e-06, + "loss": 0.5464, + "step": 57299 + }, + { + "epoch": 1.47, + "learning_rate": 1.0823645414558319e-06, + "loss": 0.5312, + "step": 57300 + }, + { + "epoch": 1.47, + "learning_rate": 1.0823369649871701e-06, + "loss": 0.6025, + "step": 57301 + }, + { + "epoch": 1.47, + "learning_rate": 1.0823093884554667e-06, + "loss": 0.7441, + "step": 57302 + }, + { + "epoch": 1.47, + "learning_rate": 1.082281811860743e-06, + "loss": 0.5332, + "step": 57303 + }, + { + "epoch": 1.47, + "learning_rate": 1.08225423520302e-06, + "loss": 0.457, + "step": 57304 + }, + { + "epoch": 1.47, + "learning_rate": 1.0822266584823183e-06, + "loss": 0.4556, + "step": 57305 + }, + { + "epoch": 1.47, + "learning_rate": 1.0821990816986596e-06, + "loss": 0.7041, + "step": 57306 + }, + { + "epoch": 1.47, + "learning_rate": 1.082171504852065e-06, + "loss": 0.7383, + "step": 57307 + }, + { + "epoch": 1.47, + "learning_rate": 1.0821439279425556e-06, + "loss": 0.5154, + "step": 57308 + }, + { + "epoch": 1.47, + "learning_rate": 1.082116350970152e-06, + "loss": 0.6221, + "step": 57309 + }, + { + "epoch": 1.47, + "learning_rate": 1.0820887739348758e-06, + "loss": 0.7158, + "step": 57310 + }, + { + "epoch": 1.47, + "learning_rate": 1.0820611968367479e-06, + "loss": 0.7129, + "step": 57311 + }, + { + "epoch": 1.47, + "learning_rate": 1.0820336196757898e-06, + "loss": 0.5879, + "step": 57312 + }, + { + "epoch": 1.47, + "learning_rate": 1.0820060424520222e-06, + "loss": 0.4717, + "step": 57313 + }, + { + "epoch": 1.47, + "learning_rate": 1.081978465165466e-06, + "loss": 0.7178, + "step": 57314 + }, + { + "epoch": 1.47, + "learning_rate": 1.081950887816143e-06, + "loss": 0.7861, + "step": 57315 + }, + { + "epoch": 1.47, + "learning_rate": 1.0819233104040737e-06, + "loss": 0.7422, + "step": 57316 + }, + { + "epoch": 1.47, + "learning_rate": 1.08189573292928e-06, + "loss": 0.5625, + "step": 57317 + }, + { + "epoch": 1.47, + "learning_rate": 1.0818681553917821e-06, + "loss": 0.7725, + "step": 57318 + }, + { + "epoch": 1.47, + "learning_rate": 1.0818405777916017e-06, + "loss": 0.7578, + "step": 57319 + }, + { + "epoch": 1.47, + "learning_rate": 1.0818130001287595e-06, + "loss": 0.5549, + "step": 57320 + }, + { + "epoch": 1.47, + "learning_rate": 1.0817854224032773e-06, + "loss": 0.6279, + "step": 57321 + }, + { + "epoch": 1.47, + "learning_rate": 1.0817578446151752e-06, + "loss": 0.6987, + "step": 57322 + }, + { + "epoch": 1.47, + "learning_rate": 1.0817302667644754e-06, + "loss": 0.7842, + "step": 57323 + }, + { + "epoch": 1.47, + "learning_rate": 1.0817026888511982e-06, + "loss": 0.7236, + "step": 57324 + }, + { + "epoch": 1.47, + "learning_rate": 1.081675110875365e-06, + "loss": 0.6602, + "step": 57325 + }, + { + "epoch": 1.47, + "learning_rate": 1.0816475328369969e-06, + "loss": 0.7061, + "step": 57326 + }, + { + "epoch": 1.47, + "learning_rate": 1.0816199547361152e-06, + "loss": 0.6406, + "step": 57327 + }, + { + "epoch": 1.47, + "learning_rate": 1.0815923765727408e-06, + "loss": 0.6064, + "step": 57328 + }, + { + "epoch": 1.47, + "learning_rate": 1.0815647983468949e-06, + "loss": 0.6125, + "step": 57329 + }, + { + "epoch": 1.47, + "learning_rate": 1.0815372200585984e-06, + "loss": 0.6816, + "step": 57330 + }, + { + "epoch": 1.47, + "learning_rate": 1.081509641707873e-06, + "loss": 0.7256, + "step": 57331 + }, + { + "epoch": 1.47, + "learning_rate": 1.0814820632947389e-06, + "loss": 0.4702, + "step": 57332 + }, + { + "epoch": 1.47, + "learning_rate": 1.0814544848192179e-06, + "loss": 0.5996, + "step": 57333 + }, + { + "epoch": 1.47, + "learning_rate": 1.081426906281331e-06, + "loss": 0.6211, + "step": 57334 + }, + { + "epoch": 1.47, + "learning_rate": 1.0813993276810993e-06, + "loss": 0.6924, + "step": 57335 + }, + { + "epoch": 1.47, + "learning_rate": 1.081371749018544e-06, + "loss": 0.7109, + "step": 57336 + }, + { + "epoch": 1.47, + "learning_rate": 1.0813441702936859e-06, + "loss": 0.7344, + "step": 57337 + }, + { + "epoch": 1.47, + "learning_rate": 1.0813165915065465e-06, + "loss": 0.7539, + "step": 57338 + }, + { + "epoch": 1.47, + "learning_rate": 1.0812890126571462e-06, + "loss": 0.3594, + "step": 57339 + }, + { + "epoch": 1.47, + "learning_rate": 1.0812614337455073e-06, + "loss": 0.4241, + "step": 57340 + }, + { + "epoch": 1.47, + "learning_rate": 1.0812338547716497e-06, + "loss": 0.5972, + "step": 57341 + }, + { + "epoch": 1.47, + "learning_rate": 1.0812062757355955e-06, + "loss": 0.4285, + "step": 57342 + }, + { + "epoch": 1.47, + "learning_rate": 1.0811786966373653e-06, + "loss": 0.5061, + "step": 57343 + }, + { + "epoch": 1.47, + "learning_rate": 1.0811511174769803e-06, + "loss": 0.5491, + "step": 57344 + }, + { + "epoch": 1.47, + "learning_rate": 1.0811235382544614e-06, + "loss": 0.6504, + "step": 57345 + }, + { + "epoch": 1.47, + "learning_rate": 1.0810959589698303e-06, + "loss": 0.6123, + "step": 57346 + }, + { + "epoch": 1.47, + "learning_rate": 1.0810683796231072e-06, + "loss": 0.624, + "step": 57347 + }, + { + "epoch": 1.47, + "learning_rate": 1.0810408002143145e-06, + "loss": 0.6973, + "step": 57348 + }, + { + "epoch": 1.47, + "learning_rate": 1.0810132207434722e-06, + "loss": 0.7344, + "step": 57349 + }, + { + "epoch": 1.47, + "learning_rate": 1.0809856412106018e-06, + "loss": 0.4521, + "step": 57350 + }, + { + "epoch": 1.47, + "learning_rate": 1.0809580616157243e-06, + "loss": 0.6748, + "step": 57351 + }, + { + "epoch": 1.47, + "learning_rate": 1.0809304819588612e-06, + "loss": 0.5186, + "step": 57352 + }, + { + "epoch": 1.47, + "learning_rate": 1.080902902240033e-06, + "loss": 0.6519, + "step": 57353 + }, + { + "epoch": 1.47, + "learning_rate": 1.0808753224592616e-06, + "loss": 0.8145, + "step": 57354 + }, + { + "epoch": 1.47, + "learning_rate": 1.0808477426165674e-06, + "loss": 0.6279, + "step": 57355 + }, + { + "epoch": 1.47, + "learning_rate": 1.080820162711972e-06, + "loss": 0.7354, + "step": 57356 + }, + { + "epoch": 1.47, + "learning_rate": 1.080792582745496e-06, + "loss": 0.3844, + "step": 57357 + }, + { + "epoch": 1.47, + "learning_rate": 1.0807650027171612e-06, + "loss": 0.7168, + "step": 57358 + }, + { + "epoch": 1.47, + "learning_rate": 1.080737422626988e-06, + "loss": 0.6943, + "step": 57359 + }, + { + "epoch": 1.47, + "learning_rate": 1.080709842474998e-06, + "loss": 0.5991, + "step": 57360 + }, + { + "epoch": 1.47, + "learning_rate": 1.0806822622612124e-06, + "loss": 0.5752, + "step": 57361 + }, + { + "epoch": 1.47, + "learning_rate": 1.0806546819856517e-06, + "loss": 0.6328, + "step": 57362 + }, + { + "epoch": 1.47, + "learning_rate": 1.0806271016483379e-06, + "loss": 0.6411, + "step": 57363 + }, + { + "epoch": 1.47, + "learning_rate": 1.0805995212492913e-06, + "loss": 0.7256, + "step": 57364 + }, + { + "epoch": 1.47, + "learning_rate": 1.0805719407885334e-06, + "loss": 0.5715, + "step": 57365 + }, + { + "epoch": 1.47, + "learning_rate": 1.080544360266085e-06, + "loss": 0.6152, + "step": 57366 + }, + { + "epoch": 1.47, + "learning_rate": 1.080516779681968e-06, + "loss": 0.7021, + "step": 57367 + }, + { + "epoch": 1.47, + "learning_rate": 1.0804891990362028e-06, + "loss": 0.4789, + "step": 57368 + }, + { + "epoch": 1.47, + "learning_rate": 1.080461618328811e-06, + "loss": 0.5278, + "step": 57369 + }, + { + "epoch": 1.47, + "learning_rate": 1.080434037559813e-06, + "loss": 0.5635, + "step": 57370 + }, + { + "epoch": 1.47, + "learning_rate": 1.0804064567292305e-06, + "loss": 0.4868, + "step": 57371 + }, + { + "epoch": 1.47, + "learning_rate": 1.0803788758370843e-06, + "loss": 0.666, + "step": 57372 + }, + { + "epoch": 1.47, + "learning_rate": 1.080351294883396e-06, + "loss": 0.6631, + "step": 57373 + }, + { + "epoch": 1.47, + "learning_rate": 1.0803237138681865e-06, + "loss": 0.7109, + "step": 57374 + }, + { + "epoch": 1.47, + "learning_rate": 1.0802961327914765e-06, + "loss": 0.625, + "step": 57375 + }, + { + "epoch": 1.47, + "learning_rate": 1.0802685516532875e-06, + "loss": 0.4843, + "step": 57376 + }, + { + "epoch": 1.47, + "learning_rate": 1.0802409704536406e-06, + "loss": 0.7275, + "step": 57377 + }, + { + "epoch": 1.47, + "learning_rate": 1.0802133891925569e-06, + "loss": 0.7656, + "step": 57378 + }, + { + "epoch": 1.47, + "learning_rate": 1.0801858078700573e-06, + "loss": 0.8008, + "step": 57379 + }, + { + "epoch": 1.47, + "learning_rate": 1.0801582264861636e-06, + "loss": 0.7812, + "step": 57380 + }, + { + "epoch": 1.47, + "learning_rate": 1.080130645040896e-06, + "loss": 0.5483, + "step": 57381 + }, + { + "epoch": 1.47, + "learning_rate": 1.080103063534276e-06, + "loss": 0.5073, + "step": 57382 + }, + { + "epoch": 1.47, + "learning_rate": 1.0800754819663252e-06, + "loss": 0.6646, + "step": 57383 + }, + { + "epoch": 1.47, + "learning_rate": 1.080047900337064e-06, + "loss": 0.6709, + "step": 57384 + }, + { + "epoch": 1.47, + "learning_rate": 1.0800203186465138e-06, + "loss": 0.605, + "step": 57385 + }, + { + "epoch": 1.47, + "learning_rate": 1.0799927368946956e-06, + "loss": 0.5767, + "step": 57386 + }, + { + "epoch": 1.47, + "learning_rate": 1.0799651550816308e-06, + "loss": 0.5322, + "step": 57387 + }, + { + "epoch": 1.47, + "learning_rate": 1.0799375732073406e-06, + "loss": 0.6577, + "step": 57388 + }, + { + "epoch": 1.47, + "learning_rate": 1.0799099912718456e-06, + "loss": 0.6807, + "step": 57389 + }, + { + "epoch": 1.47, + "learning_rate": 1.0798824092751672e-06, + "loss": 0.542, + "step": 57390 + }, + { + "epoch": 1.47, + "learning_rate": 1.0798548272173264e-06, + "loss": 0.7412, + "step": 57391 + }, + { + "epoch": 1.47, + "learning_rate": 1.0798272450983448e-06, + "loss": 0.748, + "step": 57392 + }, + { + "epoch": 1.47, + "learning_rate": 1.0797996629182429e-06, + "loss": 0.6289, + "step": 57393 + }, + { + "epoch": 1.47, + "learning_rate": 1.079772080677042e-06, + "loss": 0.6836, + "step": 57394 + }, + { + "epoch": 1.47, + "learning_rate": 1.0797444983747634e-06, + "loss": 0.5425, + "step": 57395 + }, + { + "epoch": 1.47, + "learning_rate": 1.0797169160114281e-06, + "loss": 0.6494, + "step": 57396 + }, + { + "epoch": 1.47, + "learning_rate": 1.0796893335870571e-06, + "loss": 0.7422, + "step": 57397 + }, + { + "epoch": 1.47, + "learning_rate": 1.079661751101672e-06, + "loss": 0.6846, + "step": 57398 + }, + { + "epoch": 1.47, + "learning_rate": 1.0796341685552933e-06, + "loss": 0.6057, + "step": 57399 + }, + { + "epoch": 1.47, + "learning_rate": 1.0796065859479424e-06, + "loss": 0.5972, + "step": 57400 + }, + { + "epoch": 1.47, + "learning_rate": 1.07957900327964e-06, + "loss": 0.665, + "step": 57401 + }, + { + "epoch": 1.47, + "learning_rate": 1.0795514205504081e-06, + "loss": 0.8848, + "step": 57402 + }, + { + "epoch": 1.47, + "learning_rate": 1.0795238377602673e-06, + "loss": 0.748, + "step": 57403 + }, + { + "epoch": 1.47, + "learning_rate": 1.0794962549092386e-06, + "loss": 0.6743, + "step": 57404 + }, + { + "epoch": 1.47, + "learning_rate": 1.0794686719973434e-06, + "loss": 0.687, + "step": 57405 + }, + { + "epoch": 1.47, + "learning_rate": 1.0794410890246026e-06, + "loss": 0.6611, + "step": 57406 + }, + { + "epoch": 1.47, + "learning_rate": 1.0794135059910374e-06, + "loss": 0.4016, + "step": 57407 + }, + { + "epoch": 1.47, + "learning_rate": 1.079385922896669e-06, + "loss": 0.707, + "step": 57408 + }, + { + "epoch": 1.47, + "learning_rate": 1.0793583397415186e-06, + "loss": 0.7705, + "step": 57409 + }, + { + "epoch": 1.47, + "learning_rate": 1.079330756525607e-06, + "loss": 0.5522, + "step": 57410 + }, + { + "epoch": 1.47, + "learning_rate": 1.0793031732489554e-06, + "loss": 0.6904, + "step": 57411 + }, + { + "epoch": 1.47, + "learning_rate": 1.0792755899115852e-06, + "loss": 0.6836, + "step": 57412 + }, + { + "epoch": 1.47, + "learning_rate": 1.0792480065135174e-06, + "loss": 0.6191, + "step": 57413 + }, + { + "epoch": 1.47, + "learning_rate": 1.0792204230547728e-06, + "loss": 0.6411, + "step": 57414 + }, + { + "epoch": 1.47, + "learning_rate": 1.0791928395353728e-06, + "loss": 0.5955, + "step": 57415 + }, + { + "epoch": 1.47, + "learning_rate": 1.0791652559553384e-06, + "loss": 0.5413, + "step": 57416 + }, + { + "epoch": 1.47, + "learning_rate": 1.079137672314691e-06, + "loss": 0.6958, + "step": 57417 + }, + { + "epoch": 1.47, + "learning_rate": 1.0791100886134515e-06, + "loss": 0.7109, + "step": 57418 + }, + { + "epoch": 1.47, + "learning_rate": 1.079082504851641e-06, + "loss": 0.5621, + "step": 57419 + }, + { + "epoch": 1.47, + "learning_rate": 1.0790549210292805e-06, + "loss": 0.6274, + "step": 57420 + }, + { + "epoch": 1.47, + "learning_rate": 1.0790273371463916e-06, + "loss": 0.6147, + "step": 57421 + }, + { + "epoch": 1.47, + "learning_rate": 1.0789997532029946e-06, + "loss": 0.7441, + "step": 57422 + }, + { + "epoch": 1.47, + "learning_rate": 1.0789721691991115e-06, + "loss": 0.6089, + "step": 57423 + }, + { + "epoch": 1.47, + "learning_rate": 1.0789445851347632e-06, + "loss": 0.7715, + "step": 57424 + }, + { + "epoch": 1.47, + "learning_rate": 1.0789170010099703e-06, + "loss": 0.6357, + "step": 57425 + }, + { + "epoch": 1.47, + "learning_rate": 1.0788894168247546e-06, + "loss": 0.5488, + "step": 57426 + }, + { + "epoch": 1.47, + "learning_rate": 1.0788618325791367e-06, + "loss": 0.7612, + "step": 57427 + }, + { + "epoch": 1.47, + "learning_rate": 1.0788342482731381e-06, + "loss": 0.5828, + "step": 57428 + }, + { + "epoch": 1.47, + "learning_rate": 1.0788066639067793e-06, + "loss": 0.6021, + "step": 57429 + }, + { + "epoch": 1.47, + "learning_rate": 1.0787790794800824e-06, + "loss": 0.6221, + "step": 57430 + }, + { + "epoch": 1.47, + "learning_rate": 1.0787514949930675e-06, + "loss": 0.7549, + "step": 57431 + }, + { + "epoch": 1.47, + "learning_rate": 1.0787239104457567e-06, + "loss": 0.5454, + "step": 57432 + }, + { + "epoch": 1.47, + "learning_rate": 1.0786963258381703e-06, + "loss": 0.637, + "step": 57433 + }, + { + "epoch": 1.47, + "learning_rate": 1.07866874117033e-06, + "loss": 0.4211, + "step": 57434 + }, + { + "epoch": 1.47, + "learning_rate": 1.0786411564422562e-06, + "loss": 0.6138, + "step": 57435 + }, + { + "epoch": 1.47, + "learning_rate": 1.0786135716539708e-06, + "loss": 0.7485, + "step": 57436 + }, + { + "epoch": 1.47, + "learning_rate": 1.0785859868054946e-06, + "loss": 0.7305, + "step": 57437 + }, + { + "epoch": 1.47, + "learning_rate": 1.0785584018968488e-06, + "loss": 0.623, + "step": 57438 + }, + { + "epoch": 1.47, + "learning_rate": 1.0785308169280543e-06, + "loss": 0.752, + "step": 57439 + }, + { + "epoch": 1.47, + "learning_rate": 1.0785032318991326e-06, + "loss": 0.6616, + "step": 57440 + }, + { + "epoch": 1.47, + "learning_rate": 1.0784756468101039e-06, + "loss": 0.3821, + "step": 57441 + }, + { + "epoch": 1.47, + "learning_rate": 1.0784480616609907e-06, + "loss": 0.7549, + "step": 57442 + }, + { + "epoch": 1.47, + "learning_rate": 1.0784204764518132e-06, + "loss": 0.6309, + "step": 57443 + }, + { + "epoch": 1.47, + "learning_rate": 1.078392891182593e-06, + "loss": 0.4417, + "step": 57444 + }, + { + "epoch": 1.47, + "learning_rate": 1.0783653058533505e-06, + "loss": 0.668, + "step": 57445 + }, + { + "epoch": 1.47, + "learning_rate": 1.0783377204641075e-06, + "loss": 0.5693, + "step": 57446 + }, + { + "epoch": 1.47, + "learning_rate": 1.0783101350148848e-06, + "loss": 0.7427, + "step": 57447 + }, + { + "epoch": 1.47, + "learning_rate": 1.0782825495057037e-06, + "loss": 0.4513, + "step": 57448 + }, + { + "epoch": 1.47, + "learning_rate": 1.0782549639365854e-06, + "loss": 0.7236, + "step": 57449 + }, + { + "epoch": 1.47, + "learning_rate": 1.0782273783075508e-06, + "loss": 0.6045, + "step": 57450 + }, + { + "epoch": 1.47, + "learning_rate": 1.078199792618621e-06, + "loss": 0.708, + "step": 57451 + }, + { + "epoch": 1.47, + "learning_rate": 1.0781722068698172e-06, + "loss": 0.4653, + "step": 57452 + }, + { + "epoch": 1.47, + "learning_rate": 1.078144621061161e-06, + "loss": 0.5991, + "step": 57453 + }, + { + "epoch": 1.47, + "learning_rate": 1.0781170351926724e-06, + "loss": 0.7666, + "step": 57454 + }, + { + "epoch": 1.47, + "learning_rate": 1.0780894492643734e-06, + "loss": 0.6621, + "step": 57455 + }, + { + "epoch": 1.47, + "learning_rate": 1.078061863276285e-06, + "loss": 0.8193, + "step": 57456 + }, + { + "epoch": 1.47, + "learning_rate": 1.0780342772284283e-06, + "loss": 0.6113, + "step": 57457 + }, + { + "epoch": 1.47, + "learning_rate": 1.0780066911208243e-06, + "loss": 0.7432, + "step": 57458 + }, + { + "epoch": 1.47, + "learning_rate": 1.077979104953494e-06, + "loss": 0.7002, + "step": 57459 + }, + { + "epoch": 1.47, + "learning_rate": 1.0779515187264586e-06, + "loss": 0.7881, + "step": 57460 + }, + { + "epoch": 1.47, + "learning_rate": 1.0779239324397396e-06, + "loss": 0.5537, + "step": 57461 + }, + { + "epoch": 1.47, + "learning_rate": 1.0778963460933576e-06, + "loss": 0.6348, + "step": 57462 + }, + { + "epoch": 1.47, + "learning_rate": 1.0778687596873344e-06, + "loss": 0.5161, + "step": 57463 + }, + { + "epoch": 1.47, + "learning_rate": 1.0778411732216902e-06, + "loss": 0.5378, + "step": 57464 + }, + { + "epoch": 1.47, + "learning_rate": 1.0778135866964466e-06, + "loss": 0.4395, + "step": 57465 + }, + { + "epoch": 1.47, + "learning_rate": 1.0777860001116249e-06, + "loss": 0.7495, + "step": 57466 + }, + { + "epoch": 1.47, + "learning_rate": 1.077758413467246e-06, + "loss": 0.439, + "step": 57467 + }, + { + "epoch": 1.47, + "learning_rate": 1.077730826763331e-06, + "loss": 0.6045, + "step": 57468 + }, + { + "epoch": 1.47, + "learning_rate": 1.0777032399999009e-06, + "loss": 0.5093, + "step": 57469 + }, + { + "epoch": 1.47, + "learning_rate": 1.0776756531769773e-06, + "loss": 0.5771, + "step": 57470 + }, + { + "epoch": 1.47, + "learning_rate": 1.077648066294581e-06, + "loss": 0.5264, + "step": 57471 + }, + { + "epoch": 1.47, + "learning_rate": 1.077620479352733e-06, + "loss": 0.7148, + "step": 57472 + }, + { + "epoch": 1.47, + "learning_rate": 1.0775928923514546e-06, + "loss": 0.5596, + "step": 57473 + }, + { + "epoch": 1.47, + "learning_rate": 1.077565305290767e-06, + "loss": 0.5957, + "step": 57474 + }, + { + "epoch": 1.47, + "learning_rate": 1.077537718170691e-06, + "loss": 0.7949, + "step": 57475 + }, + { + "epoch": 1.47, + "learning_rate": 1.0775101309912483e-06, + "loss": 0.5317, + "step": 57476 + }, + { + "epoch": 1.47, + "learning_rate": 1.0774825437524593e-06, + "loss": 0.6562, + "step": 57477 + }, + { + "epoch": 1.47, + "learning_rate": 1.0774549564543459e-06, + "loss": 0.5879, + "step": 57478 + }, + { + "epoch": 1.47, + "learning_rate": 1.0774273690969282e-06, + "loss": 0.6091, + "step": 57479 + }, + { + "epoch": 1.47, + "learning_rate": 1.0773997816802282e-06, + "loss": 0.5933, + "step": 57480 + }, + { + "epoch": 1.47, + "learning_rate": 1.0773721942042668e-06, + "loss": 0.7383, + "step": 57481 + }, + { + "epoch": 1.47, + "learning_rate": 1.0773446066690653e-06, + "loss": 0.7285, + "step": 57482 + }, + { + "epoch": 1.47, + "learning_rate": 1.0773170190746444e-06, + "loss": 0.6265, + "step": 57483 + }, + { + "epoch": 1.47, + "learning_rate": 1.0772894314210253e-06, + "loss": 0.4624, + "step": 57484 + }, + { + "epoch": 1.47, + "learning_rate": 1.077261843708229e-06, + "loss": 0.6392, + "step": 57485 + }, + { + "epoch": 1.47, + "learning_rate": 1.0772342559362773e-06, + "loss": 0.5742, + "step": 57486 + }, + { + "epoch": 1.47, + "learning_rate": 1.0772066681051908e-06, + "loss": 0.667, + "step": 57487 + }, + { + "epoch": 1.47, + "learning_rate": 1.0771790802149905e-06, + "loss": 0.5693, + "step": 57488 + }, + { + "epoch": 1.47, + "learning_rate": 1.077151492265698e-06, + "loss": 0.5913, + "step": 57489 + }, + { + "epoch": 1.47, + "learning_rate": 1.077123904257334e-06, + "loss": 0.7227, + "step": 57490 + }, + { + "epoch": 1.47, + "learning_rate": 1.0770963161899196e-06, + "loss": 0.7969, + "step": 57491 + }, + { + "epoch": 1.47, + "learning_rate": 1.0770687280634765e-06, + "loss": 0.5381, + "step": 57492 + }, + { + "epoch": 1.47, + "learning_rate": 1.0770411398780253e-06, + "loss": 0.52, + "step": 57493 + }, + { + "epoch": 1.47, + "learning_rate": 1.077013551633587e-06, + "loss": 0.708, + "step": 57494 + }, + { + "epoch": 1.47, + "learning_rate": 1.0769859633301832e-06, + "loss": 0.6514, + "step": 57495 + }, + { + "epoch": 1.47, + "learning_rate": 1.0769583749678345e-06, + "loss": 0.7148, + "step": 57496 + }, + { + "epoch": 1.47, + "learning_rate": 1.0769307865465627e-06, + "loss": 0.6514, + "step": 57497 + }, + { + "epoch": 1.47, + "learning_rate": 1.0769031980663883e-06, + "loss": 0.7666, + "step": 57498 + }, + { + "epoch": 1.47, + "learning_rate": 1.0768756095273328e-06, + "loss": 0.7578, + "step": 57499 + }, + { + "epoch": 1.47, + "learning_rate": 1.0768480209294168e-06, + "loss": 0.7236, + "step": 57500 + }, + { + "epoch": 1.47, + "learning_rate": 1.0768204322726622e-06, + "loss": 0.6729, + "step": 57501 + }, + { + "epoch": 1.47, + "learning_rate": 1.0767928435570897e-06, + "loss": 0.645, + "step": 57502 + }, + { + "epoch": 1.47, + "learning_rate": 1.0767652547827205e-06, + "loss": 0.6494, + "step": 57503 + }, + { + "epoch": 1.47, + "learning_rate": 1.0767376659495753e-06, + "loss": 0.541, + "step": 57504 + }, + { + "epoch": 1.47, + "learning_rate": 1.076710077057676e-06, + "loss": 0.5427, + "step": 57505 + }, + { + "epoch": 1.47, + "learning_rate": 1.076682488107043e-06, + "loss": 0.5806, + "step": 57506 + }, + { + "epoch": 1.47, + "learning_rate": 1.076654899097698e-06, + "loss": 0.666, + "step": 57507 + }, + { + "epoch": 1.47, + "learning_rate": 1.0766273100296616e-06, + "loss": 0.6001, + "step": 57508 + }, + { + "epoch": 1.47, + "learning_rate": 1.0765997209029556e-06, + "loss": 0.8369, + "step": 57509 + }, + { + "epoch": 1.47, + "learning_rate": 1.0765721317176002e-06, + "loss": 0.7246, + "step": 57510 + }, + { + "epoch": 1.47, + "learning_rate": 1.0765445424736174e-06, + "loss": 0.4216, + "step": 57511 + }, + { + "epoch": 1.47, + "learning_rate": 1.076516953171028e-06, + "loss": 0.4208, + "step": 57512 + }, + { + "epoch": 1.47, + "learning_rate": 1.076489363809853e-06, + "loss": 0.8428, + "step": 57513 + }, + { + "epoch": 1.47, + "learning_rate": 1.0764617743901133e-06, + "loss": 0.5283, + "step": 57514 + }, + { + "epoch": 1.47, + "learning_rate": 1.0764341849118306e-06, + "loss": 0.5918, + "step": 57515 + }, + { + "epoch": 1.47, + "learning_rate": 1.0764065953750258e-06, + "loss": 0.7471, + "step": 57516 + }, + { + "epoch": 1.47, + "learning_rate": 1.0763790057797202e-06, + "loss": 0.5713, + "step": 57517 + }, + { + "epoch": 1.47, + "learning_rate": 1.0763514161259345e-06, + "loss": 0.6689, + "step": 57518 + }, + { + "epoch": 1.47, + "learning_rate": 1.0763238264136898e-06, + "loss": 0.7061, + "step": 57519 + }, + { + "epoch": 1.47, + "learning_rate": 1.0762962366430078e-06, + "loss": 0.7178, + "step": 57520 + }, + { + "epoch": 1.47, + "learning_rate": 1.0762686468139088e-06, + "loss": 0.6318, + "step": 57521 + }, + { + "epoch": 1.47, + "learning_rate": 1.076241056926415e-06, + "loss": 0.7773, + "step": 57522 + }, + { + "epoch": 1.47, + "learning_rate": 1.0762134669805466e-06, + "loss": 0.6641, + "step": 57523 + }, + { + "epoch": 1.47, + "learning_rate": 1.0761858769763253e-06, + "loss": 0.7148, + "step": 57524 + }, + { + "epoch": 1.47, + "learning_rate": 1.0761582869137716e-06, + "loss": 0.5684, + "step": 57525 + }, + { + "epoch": 1.47, + "learning_rate": 1.0761306967929075e-06, + "loss": 0.7363, + "step": 57526 + }, + { + "epoch": 1.47, + "learning_rate": 1.076103106613753e-06, + "loss": 0.6421, + "step": 57527 + }, + { + "epoch": 1.47, + "learning_rate": 1.0760755163763305e-06, + "loss": 0.6914, + "step": 57528 + }, + { + "epoch": 1.47, + "learning_rate": 1.07604792608066e-06, + "loss": 0.6575, + "step": 57529 + }, + { + "epoch": 1.47, + "learning_rate": 1.0760203357267633e-06, + "loss": 0.5669, + "step": 57530 + }, + { + "epoch": 1.47, + "learning_rate": 1.075992745314661e-06, + "loss": 0.6152, + "step": 57531 + }, + { + "epoch": 1.47, + "learning_rate": 1.075965154844375e-06, + "loss": 0.6328, + "step": 57532 + }, + { + "epoch": 1.47, + "learning_rate": 1.0759375643159258e-06, + "loss": 0.7412, + "step": 57533 + }, + { + "epoch": 1.47, + "learning_rate": 1.0759099737293348e-06, + "loss": 0.748, + "step": 57534 + }, + { + "epoch": 1.47, + "learning_rate": 1.0758823830846227e-06, + "loss": 0.7019, + "step": 57535 + }, + { + "epoch": 1.47, + "learning_rate": 1.0758547923818114e-06, + "loss": 0.6172, + "step": 57536 + }, + { + "epoch": 1.47, + "learning_rate": 1.0758272016209213e-06, + "loss": 0.71, + "step": 57537 + }, + { + "epoch": 1.47, + "learning_rate": 1.0757996108019735e-06, + "loss": 0.5566, + "step": 57538 + }, + { + "epoch": 1.47, + "learning_rate": 1.07577201992499e-06, + "loss": 0.6934, + "step": 57539 + }, + { + "epoch": 1.47, + "learning_rate": 1.0757444289899909e-06, + "loss": 0.6396, + "step": 57540 + }, + { + "epoch": 1.47, + "learning_rate": 1.0757168379969981e-06, + "loss": 0.7061, + "step": 57541 + }, + { + "epoch": 1.47, + "learning_rate": 1.0756892469460323e-06, + "loss": 0.7041, + "step": 57542 + }, + { + "epoch": 1.47, + "learning_rate": 1.0756616558371147e-06, + "loss": 0.6714, + "step": 57543 + }, + { + "epoch": 1.47, + "learning_rate": 1.0756340646702663e-06, + "loss": 0.6001, + "step": 57544 + }, + { + "epoch": 1.47, + "learning_rate": 1.0756064734455086e-06, + "loss": 0.5388, + "step": 57545 + }, + { + "epoch": 1.47, + "learning_rate": 1.0755788821628624e-06, + "loss": 0.4956, + "step": 57546 + }, + { + "epoch": 1.47, + "learning_rate": 1.0755512908223492e-06, + "loss": 0.6069, + "step": 57547 + }, + { + "epoch": 1.47, + "learning_rate": 1.0755236994239896e-06, + "loss": 0.6123, + "step": 57548 + }, + { + "epoch": 1.48, + "learning_rate": 1.0754961079678049e-06, + "loss": 0.709, + "step": 57549 + }, + { + "epoch": 1.48, + "learning_rate": 1.0754685164538162e-06, + "loss": 0.4456, + "step": 57550 + }, + { + "epoch": 1.48, + "learning_rate": 1.0754409248820452e-06, + "loss": 0.6987, + "step": 57551 + }, + { + "epoch": 1.48, + "learning_rate": 1.0754133332525123e-06, + "loss": 0.6934, + "step": 57552 + }, + { + "epoch": 1.48, + "learning_rate": 1.0753857415652388e-06, + "loss": 0.624, + "step": 57553 + }, + { + "epoch": 1.48, + "learning_rate": 1.0753581498202458e-06, + "loss": 0.8232, + "step": 57554 + }, + { + "epoch": 1.48, + "learning_rate": 1.0753305580175548e-06, + "loss": 0.6289, + "step": 57555 + }, + { + "epoch": 1.48, + "learning_rate": 1.075302966157186e-06, + "loss": 0.6152, + "step": 57556 + }, + { + "epoch": 1.48, + "learning_rate": 1.075275374239162e-06, + "loss": 0.7627, + "step": 57557 + }, + { + "epoch": 1.48, + "learning_rate": 1.0752477822635028e-06, + "loss": 0.7017, + "step": 57558 + }, + { + "epoch": 1.48, + "learning_rate": 1.0752201902302298e-06, + "loss": 0.7354, + "step": 57559 + }, + { + "epoch": 1.48, + "learning_rate": 1.0751925981393644e-06, + "loss": 0.542, + "step": 57560 + }, + { + "epoch": 1.48, + "learning_rate": 1.0751650059909272e-06, + "loss": 0.6641, + "step": 57561 + }, + { + "epoch": 1.48, + "learning_rate": 1.0751374137849399e-06, + "loss": 0.6875, + "step": 57562 + }, + { + "epoch": 1.48, + "learning_rate": 1.075109821521423e-06, + "loss": 0.5796, + "step": 57563 + }, + { + "epoch": 1.48, + "learning_rate": 1.075082229200398e-06, + "loss": 0.5439, + "step": 57564 + }, + { + "epoch": 1.48, + "learning_rate": 1.075054636821886e-06, + "loss": 0.6113, + "step": 57565 + }, + { + "epoch": 1.48, + "learning_rate": 1.0750270443859084e-06, + "loss": 0.8682, + "step": 57566 + }, + { + "epoch": 1.48, + "learning_rate": 1.074999451892486e-06, + "loss": 0.6855, + "step": 57567 + }, + { + "epoch": 1.48, + "learning_rate": 1.0749718593416397e-06, + "loss": 0.6592, + "step": 57568 + }, + { + "epoch": 1.48, + "learning_rate": 1.074944266733391e-06, + "loss": 0.6172, + "step": 57569 + }, + { + "epoch": 1.48, + "learning_rate": 1.074916674067761e-06, + "loss": 0.5035, + "step": 57570 + }, + { + "epoch": 1.48, + "learning_rate": 1.0748890813447703e-06, + "loss": 0.6865, + "step": 57571 + }, + { + "epoch": 1.48, + "learning_rate": 1.0748614885644413e-06, + "loss": 0.4342, + "step": 57572 + }, + { + "epoch": 1.48, + "learning_rate": 1.0748338957267938e-06, + "loss": 0.6548, + "step": 57573 + }, + { + "epoch": 1.48, + "learning_rate": 1.0748063028318495e-06, + "loss": 0.7354, + "step": 57574 + }, + { + "epoch": 1.48, + "learning_rate": 1.0747787098796293e-06, + "loss": 0.7109, + "step": 57575 + }, + { + "epoch": 1.48, + "learning_rate": 1.0747511168701546e-06, + "loss": 0.5962, + "step": 57576 + }, + { + "epoch": 1.48, + "learning_rate": 1.0747235238034467e-06, + "loss": 0.6016, + "step": 57577 + }, + { + "epoch": 1.48, + "learning_rate": 1.0746959306795257e-06, + "loss": 0.6245, + "step": 57578 + }, + { + "epoch": 1.48, + "learning_rate": 1.0746683374984142e-06, + "loss": 0.6147, + "step": 57579 + }, + { + "epoch": 1.48, + "learning_rate": 1.0746407442601323e-06, + "loss": 0.5513, + "step": 57580 + }, + { + "epoch": 1.48, + "learning_rate": 1.0746131509647014e-06, + "loss": 0.6548, + "step": 57581 + }, + { + "epoch": 1.48, + "learning_rate": 1.0745855576121425e-06, + "loss": 0.4275, + "step": 57582 + }, + { + "epoch": 1.48, + "learning_rate": 1.0745579642024773e-06, + "loss": 0.749, + "step": 57583 + }, + { + "epoch": 1.48, + "learning_rate": 1.0745303707357261e-06, + "loss": 0.6416, + "step": 57584 + }, + { + "epoch": 1.48, + "learning_rate": 1.0745027772119106e-06, + "loss": 0.7217, + "step": 57585 + }, + { + "epoch": 1.48, + "learning_rate": 1.0744751836310515e-06, + "loss": 0.7188, + "step": 57586 + }, + { + "epoch": 1.48, + "learning_rate": 1.0744475899931707e-06, + "loss": 0.6372, + "step": 57587 + }, + { + "epoch": 1.48, + "learning_rate": 1.0744199962982883e-06, + "loss": 0.7158, + "step": 57588 + }, + { + "epoch": 1.48, + "learning_rate": 1.0743924025464263e-06, + "loss": 0.6455, + "step": 57589 + }, + { + "epoch": 1.48, + "learning_rate": 1.0743648087376048e-06, + "loss": 0.7139, + "step": 57590 + }, + { + "epoch": 1.48, + "learning_rate": 1.0743372148718463e-06, + "loss": 0.4658, + "step": 57591 + }, + { + "epoch": 1.48, + "learning_rate": 1.0743096209491711e-06, + "loss": 0.5859, + "step": 57592 + }, + { + "epoch": 1.48, + "learning_rate": 1.0742820269696001e-06, + "loss": 0.6797, + "step": 57593 + }, + { + "epoch": 1.48, + "learning_rate": 1.0742544329331551e-06, + "loss": 0.5222, + "step": 57594 + }, + { + "epoch": 1.48, + "learning_rate": 1.0742268388398569e-06, + "loss": 0.7041, + "step": 57595 + }, + { + "epoch": 1.48, + "learning_rate": 1.074199244689726e-06, + "loss": 0.7373, + "step": 57596 + }, + { + "epoch": 1.48, + "learning_rate": 1.0741716504827852e-06, + "loss": 0.5562, + "step": 57597 + }, + { + "epoch": 1.48, + "learning_rate": 1.074144056219054e-06, + "loss": 0.6265, + "step": 57598 + }, + { + "epoch": 1.48, + "learning_rate": 1.074116461898554e-06, + "loss": 0.7217, + "step": 57599 + }, + { + "epoch": 1.48, + "learning_rate": 1.0740888675213064e-06, + "loss": 0.6709, + "step": 57600 + }, + { + "epoch": 1.48, + "learning_rate": 1.0740612730873327e-06, + "loss": 0.7412, + "step": 57601 + }, + { + "epoch": 1.48, + "learning_rate": 1.0740336785966536e-06, + "loss": 0.5303, + "step": 57602 + }, + { + "epoch": 1.48, + "learning_rate": 1.07400608404929e-06, + "loss": 0.709, + "step": 57603 + }, + { + "epoch": 1.48, + "learning_rate": 1.0739784894452634e-06, + "loss": 0.7842, + "step": 57604 + }, + { + "epoch": 1.48, + "learning_rate": 1.073950894784595e-06, + "loss": 0.5151, + "step": 57605 + }, + { + "epoch": 1.48, + "learning_rate": 1.0739233000673061e-06, + "loss": 0.5928, + "step": 57606 + }, + { + "epoch": 1.48, + "learning_rate": 1.0738957052934173e-06, + "loss": 0.4004, + "step": 57607 + }, + { + "epoch": 1.48, + "learning_rate": 1.0738681104629498e-06, + "loss": 0.4071, + "step": 57608 + }, + { + "epoch": 1.48, + "learning_rate": 1.073840515575925e-06, + "loss": 0.4524, + "step": 57609 + }, + { + "epoch": 1.48, + "learning_rate": 1.073812920632364e-06, + "loss": 0.6362, + "step": 57610 + }, + { + "epoch": 1.48, + "learning_rate": 1.0737853256322875e-06, + "loss": 0.6162, + "step": 57611 + }, + { + "epoch": 1.48, + "learning_rate": 1.0737577305757175e-06, + "loss": 0.6875, + "step": 57612 + }, + { + "epoch": 1.48, + "learning_rate": 1.0737301354626743e-06, + "loss": 0.6274, + "step": 57613 + }, + { + "epoch": 1.48, + "learning_rate": 1.0737025402931794e-06, + "loss": 0.6426, + "step": 57614 + }, + { + "epoch": 1.48, + "learning_rate": 1.0736749450672536e-06, + "loss": 0.6304, + "step": 57615 + }, + { + "epoch": 1.48, + "learning_rate": 1.0736473497849186e-06, + "loss": 0.7607, + "step": 57616 + }, + { + "epoch": 1.48, + "learning_rate": 1.0736197544461952e-06, + "loss": 0.6172, + "step": 57617 + }, + { + "epoch": 1.48, + "learning_rate": 1.0735921590511043e-06, + "loss": 0.5383, + "step": 57618 + }, + { + "epoch": 1.48, + "learning_rate": 1.0735645635996674e-06, + "loss": 0.7939, + "step": 57619 + }, + { + "epoch": 1.48, + "learning_rate": 1.0735369680919054e-06, + "loss": 0.7393, + "step": 57620 + }, + { + "epoch": 1.48, + "learning_rate": 1.0735093725278397e-06, + "loss": 0.6338, + "step": 57621 + }, + { + "epoch": 1.48, + "learning_rate": 1.0734817769074913e-06, + "loss": 0.5708, + "step": 57622 + }, + { + "epoch": 1.48, + "learning_rate": 1.073454181230881e-06, + "loss": 0.4712, + "step": 57623 + }, + { + "epoch": 1.48, + "learning_rate": 1.0734265854980308e-06, + "loss": 0.7744, + "step": 57624 + }, + { + "epoch": 1.48, + "learning_rate": 1.0733989897089604e-06, + "loss": 0.8018, + "step": 57625 + }, + { + "epoch": 1.48, + "learning_rate": 1.0733713938636925e-06, + "loss": 0.6006, + "step": 57626 + }, + { + "epoch": 1.48, + "learning_rate": 1.0733437979622471e-06, + "loss": 0.7012, + "step": 57627 + }, + { + "epoch": 1.48, + "learning_rate": 1.0733162020046456e-06, + "loss": 0.6592, + "step": 57628 + }, + { + "epoch": 1.48, + "learning_rate": 1.0732886059909093e-06, + "loss": 0.6543, + "step": 57629 + }, + { + "epoch": 1.48, + "learning_rate": 1.0732610099210595e-06, + "loss": 0.6328, + "step": 57630 + }, + { + "epoch": 1.48, + "learning_rate": 1.0732334137951172e-06, + "loss": 0.5303, + "step": 57631 + }, + { + "epoch": 1.48, + "learning_rate": 1.0732058176131034e-06, + "loss": 0.6514, + "step": 57632 + }, + { + "epoch": 1.48, + "learning_rate": 1.0731782213750391e-06, + "loss": 0.6875, + "step": 57633 + }, + { + "epoch": 1.48, + "learning_rate": 1.0731506250809457e-06, + "loss": 0.7031, + "step": 57634 + }, + { + "epoch": 1.48, + "learning_rate": 1.0731230287308442e-06, + "loss": 0.6592, + "step": 57635 + }, + { + "epoch": 1.48, + "learning_rate": 1.0730954323247557e-06, + "loss": 0.7031, + "step": 57636 + }, + { + "epoch": 1.48, + "learning_rate": 1.0730678358627016e-06, + "loss": 0.9004, + "step": 57637 + }, + { + "epoch": 1.48, + "learning_rate": 1.0730402393447025e-06, + "loss": 0.6836, + "step": 57638 + }, + { + "epoch": 1.48, + "learning_rate": 1.0730126427707801e-06, + "loss": 0.6948, + "step": 57639 + }, + { + "epoch": 1.48, + "learning_rate": 1.072985046140955e-06, + "loss": 0.7383, + "step": 57640 + }, + { + "epoch": 1.48, + "learning_rate": 1.072957449455249e-06, + "loss": 0.6719, + "step": 57641 + }, + { + "epoch": 1.48, + "learning_rate": 1.0729298527136824e-06, + "loss": 0.6211, + "step": 57642 + }, + { + "epoch": 1.48, + "learning_rate": 1.0729022559162772e-06, + "loss": 0.5249, + "step": 57643 + }, + { + "epoch": 1.48, + "learning_rate": 1.0728746590630538e-06, + "loss": 0.6162, + "step": 57644 + }, + { + "epoch": 1.48, + "learning_rate": 1.0728470621540337e-06, + "loss": 0.7588, + "step": 57645 + }, + { + "epoch": 1.48, + "learning_rate": 1.0728194651892379e-06, + "loss": 0.5952, + "step": 57646 + }, + { + "epoch": 1.48, + "learning_rate": 1.0727918681686877e-06, + "loss": 0.574, + "step": 57647 + }, + { + "epoch": 1.48, + "learning_rate": 1.0727642710924043e-06, + "loss": 0.4351, + "step": 57648 + }, + { + "epoch": 1.48, + "learning_rate": 1.0727366739604082e-06, + "loss": 0.6011, + "step": 57649 + }, + { + "epoch": 1.48, + "learning_rate": 1.072709076772721e-06, + "loss": 0.8701, + "step": 57650 + }, + { + "epoch": 1.48, + "learning_rate": 1.0726814795293642e-06, + "loss": 0.5469, + "step": 57651 + }, + { + "epoch": 1.48, + "learning_rate": 1.0726538822303586e-06, + "loss": 0.6387, + "step": 57652 + }, + { + "epoch": 1.48, + "learning_rate": 1.0726262848757249e-06, + "loss": 0.6982, + "step": 57653 + }, + { + "epoch": 1.48, + "learning_rate": 1.0725986874654847e-06, + "loss": 0.7354, + "step": 57654 + }, + { + "epoch": 1.48, + "learning_rate": 1.0725710899996587e-06, + "loss": 0.3763, + "step": 57655 + }, + { + "epoch": 1.48, + "learning_rate": 1.0725434924782688e-06, + "loss": 0.7686, + "step": 57656 + }, + { + "epoch": 1.48, + "learning_rate": 1.0725158949013355e-06, + "loss": 0.5005, + "step": 57657 + }, + { + "epoch": 1.48, + "learning_rate": 1.0724882972688801e-06, + "loss": 0.6685, + "step": 57658 + }, + { + "epoch": 1.48, + "learning_rate": 1.0724606995809237e-06, + "loss": 0.6523, + "step": 57659 + }, + { + "epoch": 1.48, + "learning_rate": 1.0724331018374877e-06, + "loss": 0.5781, + "step": 57660 + }, + { + "epoch": 1.48, + "learning_rate": 1.0724055040385929e-06, + "loss": 0.7646, + "step": 57661 + }, + { + "epoch": 1.48, + "learning_rate": 1.0723779061842606e-06, + "loss": 0.6475, + "step": 57662 + }, + { + "epoch": 1.48, + "learning_rate": 1.0723503082745118e-06, + "loss": 0.6279, + "step": 57663 + }, + { + "epoch": 1.48, + "learning_rate": 1.0723227103093677e-06, + "loss": 0.6641, + "step": 57664 + }, + { + "epoch": 1.48, + "learning_rate": 1.0722951122888492e-06, + "loss": 0.7744, + "step": 57665 + }, + { + "epoch": 1.48, + "learning_rate": 1.072267514212978e-06, + "loss": 0.7158, + "step": 57666 + }, + { + "epoch": 1.48, + "learning_rate": 1.0722399160817747e-06, + "loss": 0.7529, + "step": 57667 + }, + { + "epoch": 1.48, + "learning_rate": 1.0722123178952604e-06, + "loss": 0.5962, + "step": 57668 + }, + { + "epoch": 1.48, + "learning_rate": 1.072184719653457e-06, + "loss": 0.5615, + "step": 57669 + }, + { + "epoch": 1.48, + "learning_rate": 1.0721571213563847e-06, + "loss": 0.5195, + "step": 57670 + }, + { + "epoch": 1.48, + "learning_rate": 1.072129523004065e-06, + "loss": 0.748, + "step": 57671 + }, + { + "epoch": 1.48, + "learning_rate": 1.0721019245965192e-06, + "loss": 0.7725, + "step": 57672 + }, + { + "epoch": 1.48, + "learning_rate": 1.0720743261337684e-06, + "loss": 0.5869, + "step": 57673 + }, + { + "epoch": 1.48, + "learning_rate": 1.0720467276158332e-06, + "loss": 0.6504, + "step": 57674 + }, + { + "epoch": 1.48, + "learning_rate": 1.0720191290427355e-06, + "loss": 0.7266, + "step": 57675 + }, + { + "epoch": 1.48, + "learning_rate": 1.0719915304144958e-06, + "loss": 0.6348, + "step": 57676 + }, + { + "epoch": 1.48, + "learning_rate": 1.0719639317311357e-06, + "loss": 0.6416, + "step": 57677 + }, + { + "epoch": 1.48, + "learning_rate": 1.0719363329926757e-06, + "loss": 0.6548, + "step": 57678 + }, + { + "epoch": 1.48, + "learning_rate": 1.071908734199138e-06, + "loss": 0.8008, + "step": 57679 + }, + { + "epoch": 1.48, + "learning_rate": 1.0718811353505426e-06, + "loss": 0.8145, + "step": 57680 + }, + { + "epoch": 1.48, + "learning_rate": 1.0718535364469114e-06, + "loss": 0.5562, + "step": 57681 + }, + { + "epoch": 1.48, + "learning_rate": 1.0718259374882652e-06, + "loss": 0.688, + "step": 57682 + }, + { + "epoch": 1.48, + "learning_rate": 1.0717983384746251e-06, + "loss": 0.6289, + "step": 57683 + }, + { + "epoch": 1.48, + "learning_rate": 1.0717707394060122e-06, + "loss": 0.5811, + "step": 57684 + }, + { + "epoch": 1.48, + "learning_rate": 1.0717431402824478e-06, + "loss": 0.584, + "step": 57685 + }, + { + "epoch": 1.48, + "learning_rate": 1.0717155411039532e-06, + "loss": 0.5508, + "step": 57686 + }, + { + "epoch": 1.48, + "learning_rate": 1.0716879418705494e-06, + "loss": 0.4966, + "step": 57687 + }, + { + "epoch": 1.48, + "learning_rate": 1.071660342582257e-06, + "loss": 0.7383, + "step": 57688 + }, + { + "epoch": 1.48, + "learning_rate": 1.0716327432390978e-06, + "loss": 0.6055, + "step": 57689 + }, + { + "epoch": 1.48, + "learning_rate": 1.0716051438410927e-06, + "loss": 0.5752, + "step": 57690 + }, + { + "epoch": 1.48, + "learning_rate": 1.0715775443882629e-06, + "loss": 0.6982, + "step": 57691 + }, + { + "epoch": 1.48, + "learning_rate": 1.0715499448806294e-06, + "loss": 0.5444, + "step": 57692 + }, + { + "epoch": 1.48, + "learning_rate": 1.0715223453182132e-06, + "loss": 0.5908, + "step": 57693 + }, + { + "epoch": 1.48, + "learning_rate": 1.071494745701036e-06, + "loss": 0.4692, + "step": 57694 + }, + { + "epoch": 1.48, + "learning_rate": 1.0714671460291183e-06, + "loss": 0.6665, + "step": 57695 + }, + { + "epoch": 1.48, + "learning_rate": 1.0714395463024815e-06, + "loss": 0.5205, + "step": 57696 + }, + { + "epoch": 1.48, + "learning_rate": 1.071411946521147e-06, + "loss": 0.6123, + "step": 57697 + }, + { + "epoch": 1.48, + "learning_rate": 1.0713843466851353e-06, + "loss": 0.7256, + "step": 57698 + }, + { + "epoch": 1.48, + "learning_rate": 1.071356746794468e-06, + "loss": 0.6421, + "step": 57699 + }, + { + "epoch": 1.48, + "learning_rate": 1.071329146849166e-06, + "loss": 0.5376, + "step": 57700 + }, + { + "epoch": 1.48, + "learning_rate": 1.0713015468492508e-06, + "loss": 0.6836, + "step": 57701 + }, + { + "epoch": 1.48, + "learning_rate": 1.0712739467947434e-06, + "loss": 0.8467, + "step": 57702 + }, + { + "epoch": 1.48, + "learning_rate": 1.0712463466856645e-06, + "loss": 0.6001, + "step": 57703 + }, + { + "epoch": 1.48, + "learning_rate": 1.0712187465220358e-06, + "loss": 0.7051, + "step": 57704 + }, + { + "epoch": 1.48, + "learning_rate": 1.0711911463038778e-06, + "loss": 0.5762, + "step": 57705 + }, + { + "epoch": 1.48, + "learning_rate": 1.0711635460312122e-06, + "loss": 0.5273, + "step": 57706 + }, + { + "epoch": 1.48, + "learning_rate": 1.07113594570406e-06, + "loss": 0.6279, + "step": 57707 + }, + { + "epoch": 1.48, + "learning_rate": 1.0711083453224425e-06, + "loss": 0.7197, + "step": 57708 + }, + { + "epoch": 1.48, + "learning_rate": 1.0710807448863804e-06, + "loss": 0.7861, + "step": 57709 + }, + { + "epoch": 1.48, + "learning_rate": 1.071053144395895e-06, + "loss": 0.5137, + "step": 57710 + }, + { + "epoch": 1.48, + "learning_rate": 1.0710255438510072e-06, + "loss": 0.5232, + "step": 57711 + }, + { + "epoch": 1.48, + "learning_rate": 1.0709979432517389e-06, + "loss": 0.5996, + "step": 57712 + }, + { + "epoch": 1.48, + "learning_rate": 1.0709703425981105e-06, + "loss": 0.6211, + "step": 57713 + }, + { + "epoch": 1.48, + "learning_rate": 1.0709427418901435e-06, + "loss": 0.6267, + "step": 57714 + }, + { + "epoch": 1.48, + "learning_rate": 1.0709151411278587e-06, + "loss": 0.7773, + "step": 57715 + }, + { + "epoch": 1.48, + "learning_rate": 1.0708875403112775e-06, + "loss": 0.6982, + "step": 57716 + }, + { + "epoch": 1.48, + "learning_rate": 1.0708599394404212e-06, + "loss": 0.6685, + "step": 57717 + }, + { + "epoch": 1.48, + "learning_rate": 1.0708323385153105e-06, + "loss": 0.7012, + "step": 57718 + }, + { + "epoch": 1.48, + "learning_rate": 1.0708047375359668e-06, + "loss": 0.5679, + "step": 57719 + }, + { + "epoch": 1.48, + "learning_rate": 1.0707771365024109e-06, + "loss": 0.5083, + "step": 57720 + }, + { + "epoch": 1.48, + "learning_rate": 1.0707495354146645e-06, + "loss": 0.543, + "step": 57721 + }, + { + "epoch": 1.48, + "learning_rate": 1.0707219342727485e-06, + "loss": 0.71, + "step": 57722 + }, + { + "epoch": 1.48, + "learning_rate": 1.0706943330766839e-06, + "loss": 0.7549, + "step": 57723 + }, + { + "epoch": 1.48, + "learning_rate": 1.0706667318264916e-06, + "loss": 0.7539, + "step": 57724 + }, + { + "epoch": 1.48, + "learning_rate": 1.0706391305221933e-06, + "loss": 0.3938, + "step": 57725 + }, + { + "epoch": 1.48, + "learning_rate": 1.0706115291638098e-06, + "loss": 0.752, + "step": 57726 + }, + { + "epoch": 1.48, + "learning_rate": 1.0705839277513627e-06, + "loss": 0.5554, + "step": 57727 + }, + { + "epoch": 1.48, + "learning_rate": 1.070556326284872e-06, + "loss": 0.8242, + "step": 57728 + }, + { + "epoch": 1.48, + "learning_rate": 1.0705287247643602e-06, + "loss": 0.6772, + "step": 57729 + }, + { + "epoch": 1.48, + "learning_rate": 1.0705011231898473e-06, + "loss": 0.5645, + "step": 57730 + }, + { + "epoch": 1.48, + "learning_rate": 1.0704735215613551e-06, + "loss": 0.5688, + "step": 57731 + }, + { + "epoch": 1.48, + "learning_rate": 1.0704459198789049e-06, + "loss": 0.5879, + "step": 57732 + }, + { + "epoch": 1.48, + "learning_rate": 1.0704183181425172e-06, + "loss": 0.707, + "step": 57733 + }, + { + "epoch": 1.48, + "learning_rate": 1.0703907163522132e-06, + "loss": 0.7266, + "step": 57734 + }, + { + "epoch": 1.48, + "learning_rate": 1.0703631145080148e-06, + "loss": 0.6387, + "step": 57735 + }, + { + "epoch": 1.48, + "learning_rate": 1.070335512609942e-06, + "loss": 0.4852, + "step": 57736 + }, + { + "epoch": 1.48, + "learning_rate": 1.0703079106580172e-06, + "loss": 0.6504, + "step": 57737 + }, + { + "epoch": 1.48, + "learning_rate": 1.0702803086522603e-06, + "loss": 0.7539, + "step": 57738 + }, + { + "epoch": 1.48, + "learning_rate": 1.0702527065926932e-06, + "loss": 0.7793, + "step": 57739 + }, + { + "epoch": 1.48, + "learning_rate": 1.070225104479337e-06, + "loss": 0.4559, + "step": 57740 + }, + { + "epoch": 1.48, + "learning_rate": 1.070197502312212e-06, + "loss": 0.709, + "step": 57741 + }, + { + "epoch": 1.48, + "learning_rate": 1.0701699000913409e-06, + "loss": 0.511, + "step": 57742 + }, + { + "epoch": 1.48, + "learning_rate": 1.0701422978167434e-06, + "loss": 0.686, + "step": 57743 + }, + { + "epoch": 1.48, + "learning_rate": 1.0701146954884415e-06, + "loss": 0.7305, + "step": 57744 + }, + { + "epoch": 1.48, + "learning_rate": 1.0700870931064555e-06, + "loss": 0.5894, + "step": 57745 + }, + { + "epoch": 1.48, + "learning_rate": 1.0700594906708077e-06, + "loss": 0.7168, + "step": 57746 + }, + { + "epoch": 1.48, + "learning_rate": 1.0700318881815183e-06, + "loss": 0.7441, + "step": 57747 + }, + { + "epoch": 1.48, + "learning_rate": 1.0700042856386085e-06, + "loss": 0.708, + "step": 57748 + }, + { + "epoch": 1.48, + "learning_rate": 1.0699766830420998e-06, + "loss": 0.7402, + "step": 57749 + }, + { + "epoch": 1.48, + "learning_rate": 1.069949080392013e-06, + "loss": 0.5923, + "step": 57750 + }, + { + "epoch": 1.48, + "learning_rate": 1.0699214776883693e-06, + "loss": 0.6396, + "step": 57751 + }, + { + "epoch": 1.48, + "learning_rate": 1.0698938749311905e-06, + "loss": 0.7412, + "step": 57752 + }, + { + "epoch": 1.48, + "learning_rate": 1.0698662721204967e-06, + "loss": 0.6172, + "step": 57753 + }, + { + "epoch": 1.48, + "learning_rate": 1.06983866925631e-06, + "loss": 0.5315, + "step": 57754 + }, + { + "epoch": 1.48, + "learning_rate": 1.0698110663386504e-06, + "loss": 0.665, + "step": 57755 + }, + { + "epoch": 1.48, + "learning_rate": 1.06978346336754e-06, + "loss": 0.7314, + "step": 57756 + }, + { + "epoch": 1.48, + "learning_rate": 1.0697558603429997e-06, + "loss": 0.6426, + "step": 57757 + }, + { + "epoch": 1.48, + "learning_rate": 1.0697282572650504e-06, + "loss": 0.6357, + "step": 57758 + }, + { + "epoch": 1.48, + "learning_rate": 1.0697006541337134e-06, + "loss": 0.7236, + "step": 57759 + }, + { + "epoch": 1.48, + "learning_rate": 1.06967305094901e-06, + "loss": 0.4971, + "step": 57760 + }, + { + "epoch": 1.48, + "learning_rate": 1.0696454477109606e-06, + "loss": 0.8311, + "step": 57761 + }, + { + "epoch": 1.48, + "learning_rate": 1.0696178444195873e-06, + "loss": 0.5381, + "step": 57762 + }, + { + "epoch": 1.48, + "learning_rate": 1.069590241074911e-06, + "loss": 0.7129, + "step": 57763 + }, + { + "epoch": 1.48, + "learning_rate": 1.0695626376769521e-06, + "loss": 0.5903, + "step": 57764 + }, + { + "epoch": 1.48, + "learning_rate": 1.0695350342257327e-06, + "loss": 0.5967, + "step": 57765 + }, + { + "epoch": 1.48, + "learning_rate": 1.0695074307212735e-06, + "loss": 0.8252, + "step": 57766 + }, + { + "epoch": 1.48, + "learning_rate": 1.0694798271635958e-06, + "loss": 0.6006, + "step": 57767 + }, + { + "epoch": 1.48, + "learning_rate": 1.0694522235527204e-06, + "loss": 0.6001, + "step": 57768 + }, + { + "epoch": 1.48, + "learning_rate": 1.0694246198886686e-06, + "loss": 0.7705, + "step": 57769 + }, + { + "epoch": 1.48, + "learning_rate": 1.0693970161714613e-06, + "loss": 0.7627, + "step": 57770 + }, + { + "epoch": 1.48, + "learning_rate": 1.0693694124011206e-06, + "loss": 0.7915, + "step": 57771 + }, + { + "epoch": 1.48, + "learning_rate": 1.0693418085776662e-06, + "loss": 0.6982, + "step": 57772 + }, + { + "epoch": 1.48, + "learning_rate": 1.0693142047011202e-06, + "loss": 0.4844, + "step": 57773 + }, + { + "epoch": 1.48, + "learning_rate": 1.0692866007715036e-06, + "loss": 0.5938, + "step": 57774 + }, + { + "epoch": 1.48, + "learning_rate": 1.0692589967888375e-06, + "loss": 0.7422, + "step": 57775 + }, + { + "epoch": 1.48, + "learning_rate": 1.069231392753143e-06, + "loss": 0.7627, + "step": 57776 + }, + { + "epoch": 1.48, + "learning_rate": 1.069203788664441e-06, + "loss": 0.575, + "step": 57777 + }, + { + "epoch": 1.48, + "learning_rate": 1.069176184522753e-06, + "loss": 0.7695, + "step": 57778 + }, + { + "epoch": 1.48, + "learning_rate": 1.0691485803280998e-06, + "loss": 0.7798, + "step": 57779 + }, + { + "epoch": 1.48, + "learning_rate": 1.0691209760805026e-06, + "loss": 0.4749, + "step": 57780 + }, + { + "epoch": 1.48, + "learning_rate": 1.0690933717799831e-06, + "loss": 0.5996, + "step": 57781 + }, + { + "epoch": 1.48, + "learning_rate": 1.0690657674265616e-06, + "loss": 0.6853, + "step": 57782 + }, + { + "epoch": 1.48, + "learning_rate": 1.0690381630202597e-06, + "loss": 0.5874, + "step": 57783 + }, + { + "epoch": 1.48, + "learning_rate": 1.0690105585610986e-06, + "loss": 0.6465, + "step": 57784 + }, + { + "epoch": 1.48, + "learning_rate": 1.0689829540490992e-06, + "loss": 0.6982, + "step": 57785 + }, + { + "epoch": 1.48, + "learning_rate": 1.0689553494842828e-06, + "loss": 0.5459, + "step": 57786 + }, + { + "epoch": 1.48, + "learning_rate": 1.0689277448666702e-06, + "loss": 0.6641, + "step": 57787 + }, + { + "epoch": 1.48, + "learning_rate": 1.068900140196283e-06, + "loss": 0.5303, + "step": 57788 + }, + { + "epoch": 1.48, + "learning_rate": 1.068872535473142e-06, + "loss": 0.5319, + "step": 57789 + }, + { + "epoch": 1.48, + "learning_rate": 1.0688449306972686e-06, + "loss": 0.7275, + "step": 57790 + }, + { + "epoch": 1.48, + "learning_rate": 1.0688173258686838e-06, + "loss": 0.6709, + "step": 57791 + }, + { + "epoch": 1.48, + "learning_rate": 1.068789720987409e-06, + "loss": 0.6377, + "step": 57792 + }, + { + "epoch": 1.48, + "learning_rate": 1.0687621160534646e-06, + "loss": 0.752, + "step": 57793 + }, + { + "epoch": 1.48, + "learning_rate": 1.0687345110668724e-06, + "loss": 0.6997, + "step": 57794 + }, + { + "epoch": 1.48, + "learning_rate": 1.0687069060276532e-06, + "loss": 0.7432, + "step": 57795 + }, + { + "epoch": 1.48, + "learning_rate": 1.0686793009358288e-06, + "loss": 0.6816, + "step": 57796 + }, + { + "epoch": 1.48, + "learning_rate": 1.0686516957914191e-06, + "loss": 0.71, + "step": 57797 + }, + { + "epoch": 1.48, + "learning_rate": 1.0686240905944466e-06, + "loss": 0.8066, + "step": 57798 + }, + { + "epoch": 1.48, + "learning_rate": 1.0685964853449312e-06, + "loss": 0.7559, + "step": 57799 + }, + { + "epoch": 1.48, + "learning_rate": 1.0685688800428948e-06, + "loss": 0.646, + "step": 57800 + }, + { + "epoch": 1.48, + "learning_rate": 1.0685412746883587e-06, + "loss": 0.4226, + "step": 57801 + }, + { + "epoch": 1.48, + "learning_rate": 1.0685136692813434e-06, + "loss": 0.4697, + "step": 57802 + }, + { + "epoch": 1.48, + "learning_rate": 1.0684860638218705e-06, + "loss": 0.7578, + "step": 57803 + }, + { + "epoch": 1.48, + "learning_rate": 1.0684584583099608e-06, + "loss": 0.7949, + "step": 57804 + }, + { + "epoch": 1.48, + "learning_rate": 1.0684308527456356e-06, + "loss": 0.7217, + "step": 57805 + }, + { + "epoch": 1.48, + "learning_rate": 1.0684032471289161e-06, + "loss": 0.667, + "step": 57806 + }, + { + "epoch": 1.48, + "learning_rate": 1.0683756414598235e-06, + "loss": 0.6992, + "step": 57807 + }, + { + "epoch": 1.48, + "learning_rate": 1.0683480357383786e-06, + "loss": 0.6123, + "step": 57808 + }, + { + "epoch": 1.48, + "learning_rate": 1.068320429964603e-06, + "loss": 0.6592, + "step": 57809 + }, + { + "epoch": 1.48, + "learning_rate": 1.0682928241385172e-06, + "loss": 0.6675, + "step": 57810 + }, + { + "epoch": 1.48, + "learning_rate": 1.0682652182601433e-06, + "loss": 0.5908, + "step": 57811 + }, + { + "epoch": 1.48, + "learning_rate": 1.0682376123295014e-06, + "loss": 0.6855, + "step": 57812 + }, + { + "epoch": 1.48, + "learning_rate": 1.0682100063466134e-06, + "loss": 0.6309, + "step": 57813 + }, + { + "epoch": 1.48, + "learning_rate": 1.0681824003114996e-06, + "loss": 0.6826, + "step": 57814 + }, + { + "epoch": 1.48, + "learning_rate": 1.0681547942241822e-06, + "loss": 0.5664, + "step": 57815 + }, + { + "epoch": 1.48, + "learning_rate": 1.0681271880846818e-06, + "loss": 0.7285, + "step": 57816 + }, + { + "epoch": 1.48, + "learning_rate": 1.0680995818930195e-06, + "loss": 0.624, + "step": 57817 + }, + { + "epoch": 1.48, + "learning_rate": 1.068071975649216e-06, + "loss": 0.6387, + "step": 57818 + }, + { + "epoch": 1.48, + "learning_rate": 1.0680443693532935e-06, + "loss": 0.6094, + "step": 57819 + }, + { + "epoch": 1.48, + "learning_rate": 1.068016763005272e-06, + "loss": 0.6807, + "step": 57820 + }, + { + "epoch": 1.48, + "learning_rate": 1.0679891566051737e-06, + "loss": 0.5024, + "step": 57821 + }, + { + "epoch": 1.48, + "learning_rate": 1.0679615501530193e-06, + "loss": 0.531, + "step": 57822 + }, + { + "epoch": 1.48, + "learning_rate": 1.0679339436488297e-06, + "loss": 0.6826, + "step": 57823 + }, + { + "epoch": 1.48, + "learning_rate": 1.067906337092626e-06, + "loss": 0.8779, + "step": 57824 + }, + { + "epoch": 1.48, + "learning_rate": 1.0678787304844297e-06, + "loss": 0.5688, + "step": 57825 + }, + { + "epoch": 1.48, + "learning_rate": 1.0678511238242618e-06, + "loss": 0.6914, + "step": 57826 + }, + { + "epoch": 1.48, + "learning_rate": 1.0678235171121432e-06, + "loss": 0.6001, + "step": 57827 + }, + { + "epoch": 1.48, + "learning_rate": 1.0677959103480956e-06, + "loss": 0.6536, + "step": 57828 + }, + { + "epoch": 1.48, + "learning_rate": 1.0677683035321394e-06, + "loss": 0.4469, + "step": 57829 + }, + { + "epoch": 1.48, + "learning_rate": 1.0677406966642964e-06, + "loss": 0.5908, + "step": 57830 + }, + { + "epoch": 1.48, + "learning_rate": 1.0677130897445874e-06, + "loss": 0.5073, + "step": 57831 + }, + { + "epoch": 1.48, + "learning_rate": 1.0676854827730336e-06, + "loss": 0.511, + "step": 57832 + }, + { + "epoch": 1.48, + "learning_rate": 1.067657875749656e-06, + "loss": 0.6104, + "step": 57833 + }, + { + "epoch": 1.48, + "learning_rate": 1.0676302686744763e-06, + "loss": 0.6738, + "step": 57834 + }, + { + "epoch": 1.48, + "learning_rate": 1.0676026615475147e-06, + "loss": 0.5466, + "step": 57835 + }, + { + "epoch": 1.48, + "learning_rate": 1.0675750543687934e-06, + "loss": 0.6282, + "step": 57836 + }, + { + "epoch": 1.48, + "learning_rate": 1.0675474471383326e-06, + "loss": 0.7285, + "step": 57837 + }, + { + "epoch": 1.48, + "learning_rate": 1.0675198398561538e-06, + "loss": 0.7598, + "step": 57838 + }, + { + "epoch": 1.48, + "learning_rate": 1.0674922325222781e-06, + "loss": 0.48, + "step": 57839 + }, + { + "epoch": 1.48, + "learning_rate": 1.067464625136727e-06, + "loss": 0.6875, + "step": 57840 + }, + { + "epoch": 1.48, + "learning_rate": 1.0674370176995214e-06, + "loss": 0.5786, + "step": 57841 + }, + { + "epoch": 1.48, + "learning_rate": 1.067409410210682e-06, + "loss": 0.4648, + "step": 57842 + }, + { + "epoch": 1.48, + "learning_rate": 1.0673818026702303e-06, + "loss": 0.5413, + "step": 57843 + }, + { + "epoch": 1.48, + "learning_rate": 1.0673541950781876e-06, + "loss": 0.5347, + "step": 57844 + }, + { + "epoch": 1.48, + "learning_rate": 1.0673265874345748e-06, + "loss": 0.7529, + "step": 57845 + }, + { + "epoch": 1.48, + "learning_rate": 1.0672989797394133e-06, + "loss": 0.6333, + "step": 57846 + }, + { + "epoch": 1.48, + "learning_rate": 1.0672713719927243e-06, + "loss": 0.7607, + "step": 57847 + }, + { + "epoch": 1.48, + "learning_rate": 1.0672437641945282e-06, + "loss": 0.5957, + "step": 57848 + }, + { + "epoch": 1.48, + "learning_rate": 1.0672161563448469e-06, + "loss": 0.7539, + "step": 57849 + }, + { + "epoch": 1.48, + "learning_rate": 1.0671885484437014e-06, + "loss": 0.7422, + "step": 57850 + }, + { + "epoch": 1.48, + "learning_rate": 1.0671609404911126e-06, + "loss": 0.5068, + "step": 57851 + }, + { + "epoch": 1.48, + "learning_rate": 1.0671333324871017e-06, + "loss": 0.7212, + "step": 57852 + }, + { + "epoch": 1.48, + "learning_rate": 1.0671057244316898e-06, + "loss": 0.4622, + "step": 57853 + }, + { + "epoch": 1.48, + "learning_rate": 1.0670781163248983e-06, + "loss": 0.542, + "step": 57854 + }, + { + "epoch": 1.48, + "learning_rate": 1.067050508166748e-06, + "loss": 0.5679, + "step": 57855 + }, + { + "epoch": 1.48, + "learning_rate": 1.0670228999572606e-06, + "loss": 0.5894, + "step": 57856 + }, + { + "epoch": 1.48, + "learning_rate": 1.0669952916964566e-06, + "loss": 0.5796, + "step": 57857 + }, + { + "epoch": 1.48, + "learning_rate": 1.066967683384357e-06, + "loss": 0.7158, + "step": 57858 + }, + { + "epoch": 1.48, + "learning_rate": 1.0669400750209839e-06, + "loss": 0.6436, + "step": 57859 + }, + { + "epoch": 1.48, + "learning_rate": 1.0669124666063577e-06, + "loss": 0.7109, + "step": 57860 + }, + { + "epoch": 1.48, + "learning_rate": 1.0668848581404997e-06, + "loss": 0.6377, + "step": 57861 + }, + { + "epoch": 1.48, + "learning_rate": 1.066857249623431e-06, + "loss": 0.7188, + "step": 57862 + }, + { + "epoch": 1.48, + "learning_rate": 1.0668296410551727e-06, + "loss": 0.5879, + "step": 57863 + }, + { + "epoch": 1.48, + "learning_rate": 1.0668020324357458e-06, + "loss": 0.6475, + "step": 57864 + }, + { + "epoch": 1.48, + "learning_rate": 1.066774423765172e-06, + "loss": 0.4983, + "step": 57865 + }, + { + "epoch": 1.48, + "learning_rate": 1.0667468150434723e-06, + "loss": 0.6143, + "step": 57866 + }, + { + "epoch": 1.48, + "learning_rate": 1.0667192062706674e-06, + "loss": 0.7334, + "step": 57867 + }, + { + "epoch": 1.48, + "learning_rate": 1.0666915974467785e-06, + "loss": 0.6265, + "step": 57868 + }, + { + "epoch": 1.48, + "learning_rate": 1.0666639885718272e-06, + "loss": 0.6904, + "step": 57869 + }, + { + "epoch": 1.48, + "learning_rate": 1.066636379645834e-06, + "loss": 0.6982, + "step": 57870 + }, + { + "epoch": 1.48, + "learning_rate": 1.0666087706688205e-06, + "loss": 0.6335, + "step": 57871 + }, + { + "epoch": 1.48, + "learning_rate": 1.066581161640808e-06, + "loss": 0.5435, + "step": 57872 + }, + { + "epoch": 1.48, + "learning_rate": 1.066553552561817e-06, + "loss": 0.6396, + "step": 57873 + }, + { + "epoch": 1.48, + "learning_rate": 1.0665259434318691e-06, + "loss": 0.5439, + "step": 57874 + }, + { + "epoch": 1.48, + "learning_rate": 1.0664983342509854e-06, + "loss": 0.6338, + "step": 57875 + }, + { + "epoch": 1.48, + "learning_rate": 1.0664707250191873e-06, + "loss": 0.6548, + "step": 57876 + }, + { + "epoch": 1.48, + "learning_rate": 1.0664431157364952e-06, + "loss": 0.61, + "step": 57877 + }, + { + "epoch": 1.48, + "learning_rate": 1.0664155064029308e-06, + "loss": 0.748, + "step": 57878 + }, + { + "epoch": 1.48, + "learning_rate": 1.066387897018515e-06, + "loss": 0.8008, + "step": 57879 + }, + { + "epoch": 1.48, + "learning_rate": 1.0663602875832691e-06, + "loss": 0.7412, + "step": 57880 + }, + { + "epoch": 1.48, + "learning_rate": 1.0663326780972144e-06, + "loss": 0.4973, + "step": 57881 + }, + { + "epoch": 1.48, + "learning_rate": 1.0663050685603716e-06, + "loss": 0.6167, + "step": 57882 + }, + { + "epoch": 1.48, + "learning_rate": 1.0662774589727619e-06, + "loss": 0.6484, + "step": 57883 + }, + { + "epoch": 1.48, + "learning_rate": 1.066249849334407e-06, + "loss": 0.5474, + "step": 57884 + }, + { + "epoch": 1.48, + "learning_rate": 1.0662222396453272e-06, + "loss": 0.8496, + "step": 57885 + }, + { + "epoch": 1.48, + "learning_rate": 1.0661946299055447e-06, + "loss": 0.584, + "step": 57886 + }, + { + "epoch": 1.48, + "learning_rate": 1.0661670201150794e-06, + "loss": 0.5291, + "step": 57887 + }, + { + "epoch": 1.48, + "learning_rate": 1.0661394102739534e-06, + "loss": 0.8438, + "step": 57888 + }, + { + "epoch": 1.48, + "learning_rate": 1.0661118003821873e-06, + "loss": 0.7764, + "step": 57889 + }, + { + "epoch": 1.48, + "learning_rate": 1.0660841904398023e-06, + "loss": 0.541, + "step": 57890 + }, + { + "epoch": 1.48, + "learning_rate": 1.06605658044682e-06, + "loss": 0.6465, + "step": 57891 + }, + { + "epoch": 1.48, + "learning_rate": 1.066028970403261e-06, + "loss": 0.6758, + "step": 57892 + }, + { + "epoch": 1.48, + "learning_rate": 1.0660013603091468e-06, + "loss": 1.0078, + "step": 57893 + }, + { + "epoch": 1.48, + "learning_rate": 1.0659737501644984e-06, + "loss": 0.6123, + "step": 57894 + }, + { + "epoch": 1.48, + "learning_rate": 1.0659461399693369e-06, + "loss": 0.6284, + "step": 57895 + }, + { + "epoch": 1.48, + "learning_rate": 1.0659185297236832e-06, + "loss": 0.4224, + "step": 57896 + }, + { + "epoch": 1.48, + "learning_rate": 1.0658909194275592e-06, + "loss": 0.5137, + "step": 57897 + }, + { + "epoch": 1.48, + "learning_rate": 1.065863309080985e-06, + "loss": 0.8096, + "step": 57898 + }, + { + "epoch": 1.48, + "learning_rate": 1.0658356986839826e-06, + "loss": 0.748, + "step": 57899 + }, + { + "epoch": 1.48, + "learning_rate": 1.0658080882365728e-06, + "loss": 0.5376, + "step": 57900 + }, + { + "epoch": 1.48, + "learning_rate": 1.065780477738777e-06, + "loss": 0.5518, + "step": 57901 + }, + { + "epoch": 1.48, + "learning_rate": 1.065752867190616e-06, + "loss": 0.5166, + "step": 57902 + }, + { + "epoch": 1.48, + "learning_rate": 1.065725256592111e-06, + "loss": 0.6089, + "step": 57903 + }, + { + "epoch": 1.48, + "learning_rate": 1.0656976459432828e-06, + "loss": 0.7178, + "step": 57904 + }, + { + "epoch": 1.48, + "learning_rate": 1.0656700352441535e-06, + "loss": 0.3619, + "step": 57905 + }, + { + "epoch": 1.48, + "learning_rate": 1.0656424244947434e-06, + "loss": 0.7046, + "step": 57906 + }, + { + "epoch": 1.48, + "learning_rate": 1.0656148136950742e-06, + "loss": 0.5942, + "step": 57907 + }, + { + "epoch": 1.48, + "learning_rate": 1.0655872028451665e-06, + "loss": 0.7178, + "step": 57908 + }, + { + "epoch": 1.48, + "learning_rate": 1.0655595919450417e-06, + "loss": 0.6953, + "step": 57909 + }, + { + "epoch": 1.48, + "learning_rate": 1.0655319809947207e-06, + "loss": 0.604, + "step": 57910 + }, + { + "epoch": 1.48, + "learning_rate": 1.0655043699942251e-06, + "loss": 0.5732, + "step": 57911 + }, + { + "epoch": 1.48, + "learning_rate": 1.065476758943576e-06, + "loss": 0.4907, + "step": 57912 + }, + { + "epoch": 1.48, + "learning_rate": 1.0654491478427945e-06, + "loss": 0.5684, + "step": 57913 + }, + { + "epoch": 1.48, + "learning_rate": 1.065421536691901e-06, + "loss": 0.7305, + "step": 57914 + }, + { + "epoch": 1.48, + "learning_rate": 1.0653939254909177e-06, + "loss": 0.5587, + "step": 57915 + }, + { + "epoch": 1.48, + "learning_rate": 1.0653663142398653e-06, + "loss": 0.6016, + "step": 57916 + }, + { + "epoch": 1.48, + "learning_rate": 1.0653387029387643e-06, + "loss": 0.5518, + "step": 57917 + }, + { + "epoch": 1.48, + "learning_rate": 1.065311091587637e-06, + "loss": 0.6948, + "step": 57918 + }, + { + "epoch": 1.48, + "learning_rate": 1.0652834801865037e-06, + "loss": 0.5488, + "step": 57919 + }, + { + "epoch": 1.48, + "learning_rate": 1.0652558687353864e-06, + "loss": 0.585, + "step": 57920 + }, + { + "epoch": 1.48, + "learning_rate": 1.0652282572343053e-06, + "loss": 0.5889, + "step": 57921 + }, + { + "epoch": 1.48, + "learning_rate": 1.065200645683282e-06, + "loss": 0.7051, + "step": 57922 + }, + { + "epoch": 1.48, + "learning_rate": 1.0651730340823373e-06, + "loss": 0.8379, + "step": 57923 + }, + { + "epoch": 1.48, + "learning_rate": 1.065145422431493e-06, + "loss": 0.6086, + "step": 57924 + }, + { + "epoch": 1.48, + "learning_rate": 1.0651178107307694e-06, + "loss": 0.6738, + "step": 57925 + }, + { + "epoch": 1.48, + "learning_rate": 1.0650901989801888e-06, + "loss": 0.5543, + "step": 57926 + }, + { + "epoch": 1.48, + "learning_rate": 1.065062587179771e-06, + "loss": 0.5913, + "step": 57927 + }, + { + "epoch": 1.48, + "learning_rate": 1.065034975329538e-06, + "loss": 0.6079, + "step": 57928 + }, + { + "epoch": 1.48, + "learning_rate": 1.0650073634295104e-06, + "loss": 0.6035, + "step": 57929 + }, + { + "epoch": 1.48, + "learning_rate": 1.06497975147971e-06, + "loss": 0.5464, + "step": 57930 + }, + { + "epoch": 1.48, + "learning_rate": 1.0649521394801575e-06, + "loss": 0.5308, + "step": 57931 + }, + { + "epoch": 1.48, + "learning_rate": 1.0649245274308743e-06, + "loss": 0.6353, + "step": 57932 + }, + { + "epoch": 1.48, + "learning_rate": 1.064896915331881e-06, + "loss": 0.6689, + "step": 57933 + }, + { + "epoch": 1.48, + "learning_rate": 1.0648693031831993e-06, + "loss": 0.5012, + "step": 57934 + }, + { + "epoch": 1.48, + "learning_rate": 1.06484169098485e-06, + "loss": 0.752, + "step": 57935 + }, + { + "epoch": 1.48, + "learning_rate": 1.064814078736855e-06, + "loss": 0.5503, + "step": 57936 + }, + { + "epoch": 1.48, + "learning_rate": 1.0647864664392342e-06, + "loss": 0.5479, + "step": 57937 + }, + { + "epoch": 1.48, + "learning_rate": 1.0647588540920096e-06, + "loss": 0.7021, + "step": 57938 + }, + { + "epoch": 1.49, + "learning_rate": 1.0647312416952022e-06, + "loss": 0.5664, + "step": 57939 + }, + { + "epoch": 1.49, + "learning_rate": 1.064703629248833e-06, + "loss": 0.5638, + "step": 57940 + }, + { + "epoch": 1.49, + "learning_rate": 1.0646760167529233e-06, + "loss": 0.6143, + "step": 57941 + }, + { + "epoch": 1.49, + "learning_rate": 1.0646484042074938e-06, + "loss": 0.7051, + "step": 57942 + }, + { + "epoch": 1.49, + "learning_rate": 1.0646207916125665e-06, + "loss": 0.7676, + "step": 57943 + }, + { + "epoch": 1.49, + "learning_rate": 1.0645931789681614e-06, + "loss": 0.7466, + "step": 57944 + }, + { + "epoch": 1.49, + "learning_rate": 1.0645655662743008e-06, + "loss": 0.5552, + "step": 57945 + }, + { + "epoch": 1.49, + "learning_rate": 1.0645379535310052e-06, + "loss": 0.4966, + "step": 57946 + }, + { + "epoch": 1.49, + "learning_rate": 1.064510340738296e-06, + "loss": 0.835, + "step": 57947 + }, + { + "epoch": 1.49, + "learning_rate": 1.064482727896194e-06, + "loss": 0.751, + "step": 57948 + }, + { + "epoch": 1.49, + "learning_rate": 1.0644551150047204e-06, + "loss": 0.729, + "step": 57949 + }, + { + "epoch": 1.49, + "learning_rate": 1.0644275020638965e-06, + "loss": 0.5242, + "step": 57950 + }, + { + "epoch": 1.49, + "learning_rate": 1.0643998890737438e-06, + "loss": 0.6104, + "step": 57951 + }, + { + "epoch": 1.49, + "learning_rate": 1.0643722760342825e-06, + "loss": 0.7114, + "step": 57952 + }, + { + "epoch": 1.49, + "learning_rate": 1.0643446629455348e-06, + "loss": 0.8223, + "step": 57953 + }, + { + "epoch": 1.49, + "learning_rate": 1.0643170498075212e-06, + "loss": 0.6978, + "step": 57954 + }, + { + "epoch": 1.49, + "learning_rate": 1.0642894366202629e-06, + "loss": 0.645, + "step": 57955 + }, + { + "epoch": 1.49, + "learning_rate": 1.0642618233837813e-06, + "loss": 0.6719, + "step": 57956 + }, + { + "epoch": 1.49, + "learning_rate": 1.0642342100980973e-06, + "loss": 0.6763, + "step": 57957 + }, + { + "epoch": 1.49, + "learning_rate": 1.064206596763232e-06, + "loss": 0.6074, + "step": 57958 + }, + { + "epoch": 1.49, + "learning_rate": 1.0641789833792067e-06, + "loss": 0.5012, + "step": 57959 + }, + { + "epoch": 1.49, + "learning_rate": 1.0641513699460424e-06, + "loss": 0.6904, + "step": 57960 + }, + { + "epoch": 1.49, + "learning_rate": 1.0641237564637606e-06, + "loss": 0.6113, + "step": 57961 + }, + { + "epoch": 1.49, + "learning_rate": 1.0640961429323822e-06, + "loss": 0.6494, + "step": 57962 + }, + { + "epoch": 1.49, + "learning_rate": 1.0640685293519282e-06, + "loss": 0.5293, + "step": 57963 + }, + { + "epoch": 1.49, + "learning_rate": 1.06404091572242e-06, + "loss": 0.4924, + "step": 57964 + }, + { + "epoch": 1.49, + "learning_rate": 1.0640133020438785e-06, + "loss": 0.8525, + "step": 57965 + }, + { + "epoch": 1.49, + "learning_rate": 1.063985688316325e-06, + "loss": 0.6523, + "step": 57966 + }, + { + "epoch": 1.49, + "learning_rate": 1.0639580745397805e-06, + "loss": 0.6162, + "step": 57967 + }, + { + "epoch": 1.49, + "learning_rate": 1.0639304607142663e-06, + "loss": 0.5034, + "step": 57968 + }, + { + "epoch": 1.49, + "learning_rate": 1.0639028468398036e-06, + "loss": 0.6406, + "step": 57969 + }, + { + "epoch": 1.49, + "learning_rate": 1.063875232916413e-06, + "loss": 0.6025, + "step": 57970 + }, + { + "epoch": 1.49, + "learning_rate": 1.0638476189441167e-06, + "loss": 0.573, + "step": 57971 + }, + { + "epoch": 1.49, + "learning_rate": 1.0638200049229352e-06, + "loss": 0.7002, + "step": 57972 + }, + { + "epoch": 1.49, + "learning_rate": 1.063792390852889e-06, + "loss": 0.6113, + "step": 57973 + }, + { + "epoch": 1.49, + "learning_rate": 1.0637647767340004e-06, + "loss": 0.6777, + "step": 57974 + }, + { + "epoch": 1.49, + "learning_rate": 1.0637371625662896e-06, + "loss": 0.6362, + "step": 57975 + }, + { + "epoch": 1.49, + "learning_rate": 1.0637095483497789e-06, + "loss": 0.5562, + "step": 57976 + }, + { + "epoch": 1.49, + "learning_rate": 1.0636819340844883e-06, + "loss": 0.7637, + "step": 57977 + }, + { + "epoch": 1.49, + "learning_rate": 1.0636543197704392e-06, + "loss": 0.5486, + "step": 57978 + }, + { + "epoch": 1.49, + "learning_rate": 1.063626705407653e-06, + "loss": 0.5166, + "step": 57979 + }, + { + "epoch": 1.49, + "learning_rate": 1.063599090996151e-06, + "loss": 0.7344, + "step": 57980 + }, + { + "epoch": 1.49, + "learning_rate": 1.0635714765359541e-06, + "loss": 0.5337, + "step": 57981 + }, + { + "epoch": 1.49, + "learning_rate": 1.0635438620270832e-06, + "loss": 0.709, + "step": 57982 + }, + { + "epoch": 1.49, + "learning_rate": 1.0635162474695597e-06, + "loss": 0.7598, + "step": 57983 + }, + { + "epoch": 1.49, + "learning_rate": 1.0634886328634047e-06, + "loss": 0.5859, + "step": 57984 + }, + { + "epoch": 1.49, + "learning_rate": 1.0634610182086396e-06, + "loss": 0.6021, + "step": 57985 + }, + { + "epoch": 1.49, + "learning_rate": 1.0634334035052854e-06, + "loss": 0.6504, + "step": 57986 + }, + { + "epoch": 1.49, + "learning_rate": 1.0634057887533633e-06, + "loss": 0.8164, + "step": 57987 + }, + { + "epoch": 1.49, + "learning_rate": 1.0633781739528936e-06, + "loss": 0.6797, + "step": 57988 + }, + { + "epoch": 1.49, + "learning_rate": 1.0633505591038987e-06, + "loss": 0.5479, + "step": 57989 + }, + { + "epoch": 1.49, + "learning_rate": 1.0633229442063987e-06, + "loss": 0.7988, + "step": 57990 + }, + { + "epoch": 1.49, + "learning_rate": 1.0632953292604158e-06, + "loss": 0.6162, + "step": 57991 + }, + { + "epoch": 1.49, + "learning_rate": 1.0632677142659703e-06, + "loss": 0.6582, + "step": 57992 + }, + { + "epoch": 1.49, + "learning_rate": 1.0632400992230836e-06, + "loss": 0.7334, + "step": 57993 + }, + { + "epoch": 1.49, + "learning_rate": 1.063212484131777e-06, + "loss": 0.6387, + "step": 57994 + }, + { + "epoch": 1.49, + "learning_rate": 1.0631848689920715e-06, + "loss": 0.5518, + "step": 57995 + }, + { + "epoch": 1.49, + "learning_rate": 1.063157253803988e-06, + "loss": 0.7031, + "step": 57996 + }, + { + "epoch": 1.49, + "learning_rate": 1.0631296385675483e-06, + "loss": 0.6182, + "step": 57997 + }, + { + "epoch": 1.49, + "learning_rate": 1.0631020232827727e-06, + "loss": 0.6445, + "step": 57998 + }, + { + "epoch": 1.49, + "learning_rate": 1.0630744079496832e-06, + "loss": 0.4954, + "step": 57999 + }, + { + "epoch": 1.49, + "learning_rate": 1.0630467925683e-06, + "loss": 0.5391, + "step": 58000 + }, + { + "epoch": 1.49, + "learning_rate": 1.0630191771386451e-06, + "loss": 0.606, + "step": 58001 + }, + { + "epoch": 1.49, + "learning_rate": 1.0629915616607395e-06, + "loss": 0.7881, + "step": 58002 + }, + { + "epoch": 1.49, + "learning_rate": 1.062963946134604e-06, + "loss": 0.7715, + "step": 58003 + }, + { + "epoch": 1.49, + "learning_rate": 1.0629363305602597e-06, + "loss": 0.8105, + "step": 58004 + }, + { + "epoch": 1.49, + "learning_rate": 1.0629087149377282e-06, + "loss": 0.4823, + "step": 58005 + }, + { + "epoch": 1.49, + "learning_rate": 1.0628810992670303e-06, + "loss": 0.5054, + "step": 58006 + }, + { + "epoch": 1.49, + "learning_rate": 1.062853483548187e-06, + "loss": 0.8369, + "step": 58007 + }, + { + "epoch": 1.49, + "learning_rate": 1.0628258677812201e-06, + "loss": 0.729, + "step": 58008 + }, + { + "epoch": 1.49, + "learning_rate": 1.06279825196615e-06, + "loss": 0.6846, + "step": 58009 + }, + { + "epoch": 1.49, + "learning_rate": 1.0627706361029984e-06, + "loss": 0.7188, + "step": 58010 + }, + { + "epoch": 1.49, + "learning_rate": 1.0627430201917863e-06, + "loss": 0.7715, + "step": 58011 + }, + { + "epoch": 1.49, + "learning_rate": 1.0627154042325345e-06, + "loss": 0.7002, + "step": 58012 + }, + { + "epoch": 1.49, + "learning_rate": 1.0626877882252644e-06, + "loss": 0.6963, + "step": 58013 + }, + { + "epoch": 1.49, + "learning_rate": 1.0626601721699971e-06, + "loss": 0.6611, + "step": 58014 + }, + { + "epoch": 1.49, + "learning_rate": 1.0626325560667538e-06, + "loss": 0.7324, + "step": 58015 + }, + { + "epoch": 1.49, + "learning_rate": 1.0626049399155558e-06, + "loss": 0.458, + "step": 58016 + }, + { + "epoch": 1.49, + "learning_rate": 1.0625773237164239e-06, + "loss": 0.6924, + "step": 58017 + }, + { + "epoch": 1.49, + "learning_rate": 1.0625497074693797e-06, + "loss": 0.6543, + "step": 58018 + }, + { + "epoch": 1.49, + "learning_rate": 1.0625220911744437e-06, + "loss": 0.5732, + "step": 58019 + }, + { + "epoch": 1.49, + "learning_rate": 1.0624944748316378e-06, + "loss": 0.8242, + "step": 58020 + }, + { + "epoch": 1.49, + "learning_rate": 1.0624668584409826e-06, + "loss": 0.3826, + "step": 58021 + }, + { + "epoch": 1.49, + "learning_rate": 1.0624392420024992e-06, + "loss": 0.7939, + "step": 58022 + }, + { + "epoch": 1.49, + "learning_rate": 1.062411625516209e-06, + "loss": 0.5111, + "step": 58023 + }, + { + "epoch": 1.49, + "learning_rate": 1.0623840089821334e-06, + "loss": 0.7451, + "step": 58024 + }, + { + "epoch": 1.49, + "learning_rate": 1.0623563924002927e-06, + "loss": 0.5903, + "step": 58025 + }, + { + "epoch": 1.49, + "learning_rate": 1.0623287757707092e-06, + "loss": 0.7812, + "step": 58026 + }, + { + "epoch": 1.49, + "learning_rate": 1.062301159093403e-06, + "loss": 0.5969, + "step": 58027 + }, + { + "epoch": 1.49, + "learning_rate": 1.0622735423683957e-06, + "loss": 0.6748, + "step": 58028 + }, + { + "epoch": 1.49, + "learning_rate": 1.0622459255957085e-06, + "loss": 0.5039, + "step": 58029 + }, + { + "epoch": 1.49, + "learning_rate": 1.0622183087753624e-06, + "loss": 0.8594, + "step": 58030 + }, + { + "epoch": 1.49, + "learning_rate": 1.062190691907379e-06, + "loss": 0.4807, + "step": 58031 + }, + { + "epoch": 1.49, + "learning_rate": 1.0621630749917782e-06, + "loss": 0.5413, + "step": 58032 + }, + { + "epoch": 1.49, + "learning_rate": 1.0621354580285825e-06, + "loss": 0.4648, + "step": 58033 + }, + { + "epoch": 1.49, + "learning_rate": 1.0621078410178126e-06, + "loss": 0.6323, + "step": 58034 + }, + { + "epoch": 1.49, + "learning_rate": 1.0620802239594894e-06, + "loss": 0.6582, + "step": 58035 + }, + { + "epoch": 1.49, + "learning_rate": 1.0620526068536347e-06, + "loss": 0.6611, + "step": 58036 + }, + { + "epoch": 1.49, + "learning_rate": 1.0620249897002687e-06, + "loss": 0.6982, + "step": 58037 + }, + { + "epoch": 1.49, + "learning_rate": 1.061997372499413e-06, + "loss": 0.6023, + "step": 58038 + }, + { + "epoch": 1.49, + "learning_rate": 1.061969755251089e-06, + "loss": 0.4709, + "step": 58039 + }, + { + "epoch": 1.49, + "learning_rate": 1.0619421379553172e-06, + "loss": 0.261, + "step": 58040 + }, + { + "epoch": 1.49, + "learning_rate": 1.06191452061212e-06, + "loss": 0.6553, + "step": 58041 + }, + { + "epoch": 1.49, + "learning_rate": 1.0618869032215167e-06, + "loss": 0.6396, + "step": 58042 + }, + { + "epoch": 1.49, + "learning_rate": 1.06185928578353e-06, + "loss": 0.7051, + "step": 58043 + }, + { + "epoch": 1.49, + "learning_rate": 1.0618316682981802e-06, + "loss": 0.8613, + "step": 58044 + }, + { + "epoch": 1.49, + "learning_rate": 1.061804050765489e-06, + "loss": 0.6372, + "step": 58045 + }, + { + "epoch": 1.49, + "learning_rate": 1.0617764331854772e-06, + "loss": 0.4725, + "step": 58046 + }, + { + "epoch": 1.49, + "learning_rate": 1.0617488155581662e-06, + "loss": 0.5691, + "step": 58047 + }, + { + "epoch": 1.49, + "learning_rate": 1.0617211978835768e-06, + "loss": 0.6519, + "step": 58048 + }, + { + "epoch": 1.49, + "learning_rate": 1.06169358016173e-06, + "loss": 0.5732, + "step": 58049 + }, + { + "epoch": 1.49, + "learning_rate": 1.0616659623926475e-06, + "loss": 0.6538, + "step": 58050 + }, + { + "epoch": 1.49, + "learning_rate": 1.0616383445763505e-06, + "loss": 0.5447, + "step": 58051 + }, + { + "epoch": 1.49, + "learning_rate": 1.0616107267128598e-06, + "loss": 0.6748, + "step": 58052 + }, + { + "epoch": 1.49, + "learning_rate": 1.0615831088021962e-06, + "loss": 0.6279, + "step": 58053 + }, + { + "epoch": 1.49, + "learning_rate": 1.0615554908443816e-06, + "loss": 0.5972, + "step": 58054 + }, + { + "epoch": 1.49, + "learning_rate": 1.0615278728394363e-06, + "loss": 0.6611, + "step": 58055 + }, + { + "epoch": 1.49, + "learning_rate": 1.0615002547873828e-06, + "loss": 0.5981, + "step": 58056 + }, + { + "epoch": 1.49, + "learning_rate": 1.0614726366882407e-06, + "loss": 0.554, + "step": 58057 + }, + { + "epoch": 1.49, + "learning_rate": 1.061445018542032e-06, + "loss": 0.7559, + "step": 58058 + }, + { + "epoch": 1.49, + "learning_rate": 1.0614174003487774e-06, + "loss": 0.7988, + "step": 58059 + }, + { + "epoch": 1.49, + "learning_rate": 1.0613897821084989e-06, + "loss": 0.5579, + "step": 58060 + }, + { + "epoch": 1.49, + "learning_rate": 1.0613621638212166e-06, + "loss": 0.5349, + "step": 58061 + }, + { + "epoch": 1.49, + "learning_rate": 1.0613345454869524e-06, + "loss": 0.6074, + "step": 58062 + }, + { + "epoch": 1.49, + "learning_rate": 1.061306927105727e-06, + "loss": 0.5996, + "step": 58063 + }, + { + "epoch": 1.49, + "learning_rate": 1.0612793086775618e-06, + "loss": 0.6104, + "step": 58064 + }, + { + "epoch": 1.49, + "learning_rate": 1.061251690202478e-06, + "loss": 0.4724, + "step": 58065 + }, + { + "epoch": 1.49, + "learning_rate": 1.0612240716804964e-06, + "loss": 0.542, + "step": 58066 + }, + { + "epoch": 1.49, + "learning_rate": 1.0611964531116381e-06, + "loss": 0.7646, + "step": 58067 + }, + { + "epoch": 1.49, + "learning_rate": 1.0611688344959248e-06, + "loss": 0.606, + "step": 58068 + }, + { + "epoch": 1.49, + "learning_rate": 1.0611412158333773e-06, + "loss": 0.5383, + "step": 58069 + }, + { + "epoch": 1.49, + "learning_rate": 1.0611135971240168e-06, + "loss": 0.5752, + "step": 58070 + }, + { + "epoch": 1.49, + "learning_rate": 1.0610859783678643e-06, + "loss": 0.6816, + "step": 58071 + }, + { + "epoch": 1.49, + "learning_rate": 1.0610583595649413e-06, + "loss": 0.7812, + "step": 58072 + }, + { + "epoch": 1.49, + "learning_rate": 1.0610307407152683e-06, + "loss": 0.543, + "step": 58073 + }, + { + "epoch": 1.49, + "learning_rate": 1.061003121818867e-06, + "loss": 0.6846, + "step": 58074 + }, + { + "epoch": 1.49, + "learning_rate": 1.060975502875759e-06, + "loss": 0.6362, + "step": 58075 + }, + { + "epoch": 1.49, + "learning_rate": 1.0609478838859643e-06, + "loss": 0.7822, + "step": 58076 + }, + { + "epoch": 1.49, + "learning_rate": 1.060920264849505e-06, + "loss": 0.6807, + "step": 58077 + }, + { + "epoch": 1.49, + "learning_rate": 1.0608926457664011e-06, + "loss": 0.7314, + "step": 58078 + }, + { + "epoch": 1.49, + "learning_rate": 1.0608650266366751e-06, + "loss": 0.5508, + "step": 58079 + }, + { + "epoch": 1.49, + "learning_rate": 1.0608374074603475e-06, + "loss": 0.7168, + "step": 58080 + }, + { + "epoch": 1.49, + "learning_rate": 1.0608097882374396e-06, + "loss": 0.7041, + "step": 58081 + }, + { + "epoch": 1.49, + "learning_rate": 1.060782168967972e-06, + "loss": 0.6704, + "step": 58082 + }, + { + "epoch": 1.49, + "learning_rate": 1.0607545496519668e-06, + "loss": 0.7393, + "step": 58083 + }, + { + "epoch": 1.49, + "learning_rate": 1.0607269302894442e-06, + "loss": 0.689, + "step": 58084 + }, + { + "epoch": 1.49, + "learning_rate": 1.060699310880426e-06, + "loss": 0.6885, + "step": 58085 + }, + { + "epoch": 1.49, + "learning_rate": 1.0606716914249331e-06, + "loss": 0.7305, + "step": 58086 + }, + { + "epoch": 1.49, + "learning_rate": 1.0606440719229868e-06, + "loss": 0.5732, + "step": 58087 + }, + { + "epoch": 1.49, + "learning_rate": 1.0606164523746078e-06, + "loss": 0.7119, + "step": 58088 + }, + { + "epoch": 1.49, + "learning_rate": 1.060588832779818e-06, + "loss": 0.7148, + "step": 58089 + }, + { + "epoch": 1.49, + "learning_rate": 1.060561213138638e-06, + "loss": 0.5051, + "step": 58090 + }, + { + "epoch": 1.49, + "learning_rate": 1.0605335934510887e-06, + "loss": 0.6494, + "step": 58091 + }, + { + "epoch": 1.49, + "learning_rate": 1.0605059737171917e-06, + "loss": 0.502, + "step": 58092 + }, + { + "epoch": 1.49, + "learning_rate": 1.0604783539369683e-06, + "loss": 0.709, + "step": 58093 + }, + { + "epoch": 1.49, + "learning_rate": 1.0604507341104392e-06, + "loss": 0.8369, + "step": 58094 + }, + { + "epoch": 1.49, + "learning_rate": 1.060423114237626e-06, + "loss": 0.7002, + "step": 58095 + }, + { + "epoch": 1.49, + "learning_rate": 1.0603954943185496e-06, + "loss": 0.6172, + "step": 58096 + }, + { + "epoch": 1.49, + "learning_rate": 1.060367874353231e-06, + "loss": 0.6211, + "step": 58097 + }, + { + "epoch": 1.49, + "learning_rate": 1.0603402543416916e-06, + "loss": 0.5898, + "step": 58098 + }, + { + "epoch": 1.49, + "learning_rate": 1.060312634283952e-06, + "loss": 0.6846, + "step": 58099 + }, + { + "epoch": 1.49, + "learning_rate": 1.0602850141800344e-06, + "loss": 0.6548, + "step": 58100 + }, + { + "epoch": 1.49, + "learning_rate": 1.060257394029959e-06, + "loss": 0.521, + "step": 58101 + }, + { + "epoch": 1.49, + "learning_rate": 1.0602297738337474e-06, + "loss": 0.5654, + "step": 58102 + }, + { + "epoch": 1.49, + "learning_rate": 1.0602021535914205e-06, + "loss": 0.6455, + "step": 58103 + }, + { + "epoch": 1.49, + "learning_rate": 1.0601745333029996e-06, + "loss": 0.457, + "step": 58104 + }, + { + "epoch": 1.49, + "learning_rate": 1.060146912968506e-06, + "loss": 0.6436, + "step": 58105 + }, + { + "epoch": 1.49, + "learning_rate": 1.0601192925879606e-06, + "loss": 0.6709, + "step": 58106 + }, + { + "epoch": 1.49, + "learning_rate": 1.0600916721613846e-06, + "loss": 0.6943, + "step": 58107 + }, + { + "epoch": 1.49, + "learning_rate": 1.0600640516887993e-06, + "loss": 0.5928, + "step": 58108 + }, + { + "epoch": 1.49, + "learning_rate": 1.0600364311702254e-06, + "loss": 0.6221, + "step": 58109 + }, + { + "epoch": 1.49, + "learning_rate": 1.0600088106056849e-06, + "loss": 0.748, + "step": 58110 + }, + { + "epoch": 1.49, + "learning_rate": 1.0599811899951977e-06, + "loss": 0.5771, + "step": 58111 + }, + { + "epoch": 1.49, + "learning_rate": 1.0599535693387861e-06, + "loss": 0.6387, + "step": 58112 + }, + { + "epoch": 1.49, + "learning_rate": 1.0599259486364706e-06, + "loss": 0.7598, + "step": 58113 + }, + { + "epoch": 1.49, + "learning_rate": 1.0598983278882728e-06, + "loss": 0.6128, + "step": 58114 + }, + { + "epoch": 1.49, + "learning_rate": 1.0598707070942137e-06, + "loss": 0.6221, + "step": 58115 + }, + { + "epoch": 1.49, + "learning_rate": 1.059843086254314e-06, + "loss": 0.5803, + "step": 58116 + }, + { + "epoch": 1.49, + "learning_rate": 1.0598154653685954e-06, + "loss": 0.6798, + "step": 58117 + }, + { + "epoch": 1.49, + "learning_rate": 1.0597878444370787e-06, + "loss": 0.6919, + "step": 58118 + }, + { + "epoch": 1.49, + "learning_rate": 1.0597602234597854e-06, + "loss": 0.5869, + "step": 58119 + }, + { + "epoch": 1.49, + "learning_rate": 1.0597326024367364e-06, + "loss": 0.7627, + "step": 58120 + }, + { + "epoch": 1.49, + "learning_rate": 1.0597049813679528e-06, + "loss": 0.7441, + "step": 58121 + }, + { + "epoch": 1.49, + "learning_rate": 1.0596773602534556e-06, + "loss": 0.5972, + "step": 58122 + }, + { + "epoch": 1.49, + "learning_rate": 1.0596497390932667e-06, + "loss": 0.7783, + "step": 58123 + }, + { + "epoch": 1.49, + "learning_rate": 1.0596221178874062e-06, + "loss": 0.5428, + "step": 58124 + }, + { + "epoch": 1.49, + "learning_rate": 1.0595944966358966e-06, + "loss": 0.8584, + "step": 58125 + }, + { + "epoch": 1.49, + "learning_rate": 1.0595668753387575e-06, + "loss": 0.6978, + "step": 58126 + }, + { + "epoch": 1.49, + "learning_rate": 1.059539253996011e-06, + "loss": 0.6934, + "step": 58127 + }, + { + "epoch": 1.49, + "learning_rate": 1.0595116326076778e-06, + "loss": 0.7344, + "step": 58128 + }, + { + "epoch": 1.49, + "learning_rate": 1.0594840111737797e-06, + "loss": 0.709, + "step": 58129 + }, + { + "epoch": 1.49, + "learning_rate": 1.0594563896943373e-06, + "loss": 0.8003, + "step": 58130 + }, + { + "epoch": 1.49, + "learning_rate": 1.0594287681693718e-06, + "loss": 0.6631, + "step": 58131 + }, + { + "epoch": 1.49, + "learning_rate": 1.0594011465989043e-06, + "loss": 0.5277, + "step": 58132 + }, + { + "epoch": 1.49, + "learning_rate": 1.0593735249829564e-06, + "loss": 0.5554, + "step": 58133 + }, + { + "epoch": 1.49, + "learning_rate": 1.0593459033215487e-06, + "loss": 0.6953, + "step": 58134 + }, + { + "epoch": 1.49, + "learning_rate": 1.0593182816147025e-06, + "loss": 0.584, + "step": 58135 + }, + { + "epoch": 1.49, + "learning_rate": 1.059290659862439e-06, + "loss": 0.749, + "step": 58136 + }, + { + "epoch": 1.49, + "learning_rate": 1.0592630380647797e-06, + "loss": 0.5386, + "step": 58137 + }, + { + "epoch": 1.49, + "learning_rate": 1.059235416221745e-06, + "loss": 0.5209, + "step": 58138 + }, + { + "epoch": 1.49, + "learning_rate": 1.0592077943333569e-06, + "loss": 0.563, + "step": 58139 + }, + { + "epoch": 1.49, + "learning_rate": 1.059180172399636e-06, + "loss": 0.7725, + "step": 58140 + }, + { + "epoch": 1.49, + "learning_rate": 1.0591525504206033e-06, + "loss": 0.7773, + "step": 58141 + }, + { + "epoch": 1.49, + "learning_rate": 1.0591249283962805e-06, + "loss": 0.6562, + "step": 58142 + }, + { + "epoch": 1.49, + "learning_rate": 1.0590973063266882e-06, + "loss": 0.6162, + "step": 58143 + }, + { + "epoch": 1.49, + "learning_rate": 1.059069684211848e-06, + "loss": 0.708, + "step": 58144 + }, + { + "epoch": 1.49, + "learning_rate": 1.0590420620517809e-06, + "loss": 0.6655, + "step": 58145 + }, + { + "epoch": 1.49, + "learning_rate": 1.059014439846508e-06, + "loss": 0.7754, + "step": 58146 + }, + { + "epoch": 1.49, + "learning_rate": 1.0589868175960502e-06, + "loss": 0.6069, + "step": 58147 + }, + { + "epoch": 1.49, + "learning_rate": 1.058959195300429e-06, + "loss": 0.6992, + "step": 58148 + }, + { + "epoch": 1.49, + "learning_rate": 1.0589315729596654e-06, + "loss": 0.6294, + "step": 58149 + }, + { + "epoch": 1.49, + "learning_rate": 1.0589039505737808e-06, + "loss": 0.609, + "step": 58150 + }, + { + "epoch": 1.49, + "learning_rate": 1.0588763281427962e-06, + "loss": 0.5664, + "step": 58151 + }, + { + "epoch": 1.49, + "learning_rate": 1.0588487056667326e-06, + "loss": 0.7832, + "step": 58152 + }, + { + "epoch": 1.49, + "learning_rate": 1.058821083145611e-06, + "loss": 0.7549, + "step": 58153 + }, + { + "epoch": 1.49, + "learning_rate": 1.0587934605794533e-06, + "loss": 0.6377, + "step": 58154 + }, + { + "epoch": 1.49, + "learning_rate": 1.0587658379682798e-06, + "loss": 0.8076, + "step": 58155 + }, + { + "epoch": 1.49, + "learning_rate": 1.0587382153121123e-06, + "loss": 0.446, + "step": 58156 + }, + { + "epoch": 1.49, + "learning_rate": 1.0587105926109712e-06, + "loss": 0.7617, + "step": 58157 + }, + { + "epoch": 1.49, + "learning_rate": 1.0586829698648785e-06, + "loss": 0.5039, + "step": 58158 + }, + { + "epoch": 1.49, + "learning_rate": 1.0586553470738545e-06, + "loss": 0.6016, + "step": 58159 + }, + { + "epoch": 1.49, + "learning_rate": 1.058627724237921e-06, + "loss": 0.7119, + "step": 58160 + }, + { + "epoch": 1.49, + "learning_rate": 1.0586001013570993e-06, + "loss": 0.6748, + "step": 58161 + }, + { + "epoch": 1.49, + "learning_rate": 1.0585724784314098e-06, + "loss": 0.625, + "step": 58162 + }, + { + "epoch": 1.49, + "learning_rate": 1.0585448554608743e-06, + "loss": 0.5459, + "step": 58163 + }, + { + "epoch": 1.49, + "learning_rate": 1.0585172324455134e-06, + "loss": 0.791, + "step": 58164 + }, + { + "epoch": 1.49, + "learning_rate": 1.058489609385349e-06, + "loss": 0.5205, + "step": 58165 + }, + { + "epoch": 1.49, + "learning_rate": 1.0584619862804014e-06, + "loss": 0.7998, + "step": 58166 + }, + { + "epoch": 1.49, + "learning_rate": 1.0584343631306922e-06, + "loss": 0.6865, + "step": 58167 + }, + { + "epoch": 1.49, + "learning_rate": 1.0584067399362423e-06, + "loss": 0.6543, + "step": 58168 + }, + { + "epoch": 1.49, + "learning_rate": 1.0583791166970735e-06, + "loss": 0.771, + "step": 58169 + }, + { + "epoch": 1.49, + "learning_rate": 1.0583514934132062e-06, + "loss": 0.7197, + "step": 58170 + }, + { + "epoch": 1.49, + "learning_rate": 1.058323870084662e-06, + "loss": 0.647, + "step": 58171 + }, + { + "epoch": 1.49, + "learning_rate": 1.0582962467114618e-06, + "loss": 0.5942, + "step": 58172 + }, + { + "epoch": 1.49, + "learning_rate": 1.0582686232936268e-06, + "loss": 0.6523, + "step": 58173 + }, + { + "epoch": 1.49, + "learning_rate": 1.0582409998311782e-06, + "loss": 0.5836, + "step": 58174 + }, + { + "epoch": 1.49, + "learning_rate": 1.0582133763241376e-06, + "loss": 0.4434, + "step": 58175 + }, + { + "epoch": 1.49, + "learning_rate": 1.058185752772525e-06, + "loss": 0.5903, + "step": 58176 + }, + { + "epoch": 1.49, + "learning_rate": 1.0581581291763628e-06, + "loss": 0.5986, + "step": 58177 + }, + { + "epoch": 1.49, + "learning_rate": 1.0581305055356711e-06, + "loss": 0.5933, + "step": 58178 + }, + { + "epoch": 1.49, + "learning_rate": 1.058102881850472e-06, + "loss": 0.6445, + "step": 58179 + }, + { + "epoch": 1.49, + "learning_rate": 1.058075258120786e-06, + "loss": 0.7559, + "step": 58180 + }, + { + "epoch": 1.49, + "learning_rate": 1.0580476343466343e-06, + "loss": 0.7251, + "step": 58181 + }, + { + "epoch": 1.49, + "learning_rate": 1.0580200105280383e-06, + "loss": 0.6865, + "step": 58182 + }, + { + "epoch": 1.49, + "learning_rate": 1.057992386665019e-06, + "loss": 0.623, + "step": 58183 + }, + { + "epoch": 1.49, + "learning_rate": 1.0579647627575979e-06, + "loss": 0.7988, + "step": 58184 + }, + { + "epoch": 1.49, + "learning_rate": 1.0579371388057957e-06, + "loss": 0.5908, + "step": 58185 + }, + { + "epoch": 1.49, + "learning_rate": 1.0579095148096335e-06, + "loss": 0.7129, + "step": 58186 + }, + { + "epoch": 1.49, + "learning_rate": 1.0578818907691326e-06, + "loss": 0.7676, + "step": 58187 + }, + { + "epoch": 1.49, + "learning_rate": 1.0578542666843145e-06, + "loss": 0.5232, + "step": 58188 + }, + { + "epoch": 1.49, + "learning_rate": 1.0578266425551995e-06, + "loss": 0.6567, + "step": 58189 + }, + { + "epoch": 1.49, + "learning_rate": 1.0577990183818102e-06, + "loss": 0.5382, + "step": 58190 + }, + { + "epoch": 1.49, + "learning_rate": 1.0577713941641663e-06, + "loss": 0.584, + "step": 58191 + }, + { + "epoch": 1.49, + "learning_rate": 1.0577437699022895e-06, + "loss": 0.75, + "step": 58192 + }, + { + "epoch": 1.49, + "learning_rate": 1.057716145596201e-06, + "loss": 0.5786, + "step": 58193 + }, + { + "epoch": 1.49, + "learning_rate": 1.0576885212459219e-06, + "loss": 0.5837, + "step": 58194 + }, + { + "epoch": 1.49, + "learning_rate": 1.0576608968514734e-06, + "loss": 0.4268, + "step": 58195 + }, + { + "epoch": 1.49, + "learning_rate": 1.0576332724128767e-06, + "loss": 0.6758, + "step": 58196 + }, + { + "epoch": 1.49, + "learning_rate": 1.0576056479301526e-06, + "loss": 0.6074, + "step": 58197 + }, + { + "epoch": 1.49, + "learning_rate": 1.0575780234033224e-06, + "loss": 0.6953, + "step": 58198 + }, + { + "epoch": 1.49, + "learning_rate": 1.0575503988324076e-06, + "loss": 0.7119, + "step": 58199 + }, + { + "epoch": 1.49, + "learning_rate": 1.0575227742174294e-06, + "loss": 0.6367, + "step": 58200 + }, + { + "epoch": 1.49, + "learning_rate": 1.057495149558408e-06, + "loss": 0.7334, + "step": 58201 + }, + { + "epoch": 1.49, + "learning_rate": 1.0574675248553658e-06, + "loss": 0.485, + "step": 58202 + }, + { + "epoch": 1.49, + "learning_rate": 1.057439900108323e-06, + "loss": 0.4888, + "step": 58203 + }, + { + "epoch": 1.49, + "learning_rate": 1.057412275317301e-06, + "loss": 0.4397, + "step": 58204 + }, + { + "epoch": 1.49, + "learning_rate": 1.0573846504823216e-06, + "loss": 0.7412, + "step": 58205 + }, + { + "epoch": 1.49, + "learning_rate": 1.0573570256034048e-06, + "loss": 0.5068, + "step": 58206 + }, + { + "epoch": 1.49, + "learning_rate": 1.057329400680573e-06, + "loss": 0.709, + "step": 58207 + }, + { + "epoch": 1.49, + "learning_rate": 1.0573017757138461e-06, + "loss": 0.5859, + "step": 58208 + }, + { + "epoch": 1.49, + "learning_rate": 1.0572741507032462e-06, + "loss": 0.7588, + "step": 58209 + }, + { + "epoch": 1.49, + "learning_rate": 1.057246525648794e-06, + "loss": 0.707, + "step": 58210 + }, + { + "epoch": 1.49, + "learning_rate": 1.0572189005505108e-06, + "loss": 0.4924, + "step": 58211 + }, + { + "epoch": 1.49, + "learning_rate": 1.0571912754084175e-06, + "loss": 0.6816, + "step": 58212 + }, + { + "epoch": 1.49, + "learning_rate": 1.0571636502225358e-06, + "loss": 0.6299, + "step": 58213 + }, + { + "epoch": 1.49, + "learning_rate": 1.0571360249928865e-06, + "loss": 0.4675, + "step": 58214 + }, + { + "epoch": 1.49, + "learning_rate": 1.057108399719491e-06, + "loss": 0.6685, + "step": 58215 + }, + { + "epoch": 1.49, + "learning_rate": 1.0570807744023696e-06, + "loss": 0.5898, + "step": 58216 + }, + { + "epoch": 1.49, + "learning_rate": 1.0570531490415444e-06, + "loss": 0.4187, + "step": 58217 + }, + { + "epoch": 1.49, + "learning_rate": 1.0570255236370363e-06, + "loss": 0.71, + "step": 58218 + }, + { + "epoch": 1.49, + "learning_rate": 1.0569978981888663e-06, + "loss": 0.562, + "step": 58219 + }, + { + "epoch": 1.49, + "learning_rate": 1.0569702726970555e-06, + "loss": 0.6953, + "step": 58220 + }, + { + "epoch": 1.49, + "learning_rate": 1.0569426471616253e-06, + "loss": 0.7031, + "step": 58221 + }, + { + "epoch": 1.49, + "learning_rate": 1.0569150215825968e-06, + "loss": 0.7074, + "step": 58222 + }, + { + "epoch": 1.49, + "learning_rate": 1.056887395959991e-06, + "loss": 0.6631, + "step": 58223 + }, + { + "epoch": 1.49, + "learning_rate": 1.0568597702938291e-06, + "loss": 0.6904, + "step": 58224 + }, + { + "epoch": 1.49, + "learning_rate": 1.0568321445841325e-06, + "loss": 0.5918, + "step": 58225 + }, + { + "epoch": 1.49, + "learning_rate": 1.056804518830922e-06, + "loss": 0.6826, + "step": 58226 + }, + { + "epoch": 1.49, + "learning_rate": 1.056776893034219e-06, + "loss": 0.4463, + "step": 58227 + }, + { + "epoch": 1.49, + "learning_rate": 1.056749267194044e-06, + "loss": 0.7339, + "step": 58228 + }, + { + "epoch": 1.49, + "learning_rate": 1.0567216413104194e-06, + "loss": 0.6143, + "step": 58229 + }, + { + "epoch": 1.49, + "learning_rate": 1.0566940153833654e-06, + "loss": 0.5266, + "step": 58230 + }, + { + "epoch": 1.49, + "learning_rate": 1.0566663894129033e-06, + "loss": 0.645, + "step": 58231 + }, + { + "epoch": 1.49, + "learning_rate": 1.0566387633990545e-06, + "loss": 0.7129, + "step": 58232 + }, + { + "epoch": 1.49, + "learning_rate": 1.0566111373418399e-06, + "loss": 0.7285, + "step": 58233 + }, + { + "epoch": 1.49, + "learning_rate": 1.0565835112412807e-06, + "loss": 0.5386, + "step": 58234 + }, + { + "epoch": 1.49, + "learning_rate": 1.0565558850973983e-06, + "loss": 0.708, + "step": 58235 + }, + { + "epoch": 1.49, + "learning_rate": 1.0565282589102135e-06, + "loss": 0.9082, + "step": 58236 + }, + { + "epoch": 1.49, + "learning_rate": 1.0565006326797477e-06, + "loss": 0.5706, + "step": 58237 + }, + { + "epoch": 1.49, + "learning_rate": 1.056473006406022e-06, + "loss": 0.6719, + "step": 58238 + }, + { + "epoch": 1.49, + "learning_rate": 1.056445380089057e-06, + "loss": 0.6797, + "step": 58239 + }, + { + "epoch": 1.49, + "learning_rate": 1.0564177537288751e-06, + "loss": 0.6616, + "step": 58240 + }, + { + "epoch": 1.49, + "learning_rate": 1.0563901273254966e-06, + "loss": 0.7139, + "step": 58241 + }, + { + "epoch": 1.49, + "learning_rate": 1.0563625008789425e-06, + "loss": 0.8149, + "step": 58242 + }, + { + "epoch": 1.49, + "learning_rate": 1.0563348743892341e-06, + "loss": 0.7969, + "step": 58243 + }, + { + "epoch": 1.49, + "learning_rate": 1.056307247856393e-06, + "loss": 0.6279, + "step": 58244 + }, + { + "epoch": 1.49, + "learning_rate": 1.0562796212804401e-06, + "loss": 0.7754, + "step": 58245 + }, + { + "epoch": 1.49, + "learning_rate": 1.0562519946613964e-06, + "loss": 0.6475, + "step": 58246 + }, + { + "epoch": 1.49, + "learning_rate": 1.0562243679992828e-06, + "loss": 0.624, + "step": 58247 + }, + { + "epoch": 1.49, + "learning_rate": 1.056196741294121e-06, + "loss": 0.7363, + "step": 58248 + }, + { + "epoch": 1.49, + "learning_rate": 1.056169114545932e-06, + "loss": 0.9355, + "step": 58249 + }, + { + "epoch": 1.49, + "learning_rate": 1.0561414877547368e-06, + "loss": 0.4019, + "step": 58250 + }, + { + "epoch": 1.49, + "learning_rate": 1.056113860920557e-06, + "loss": 0.792, + "step": 58251 + }, + { + "epoch": 1.49, + "learning_rate": 1.0560862340434127e-06, + "loss": 0.7158, + "step": 58252 + }, + { + "epoch": 1.49, + "learning_rate": 1.0560586071233263e-06, + "loss": 0.7578, + "step": 58253 + }, + { + "epoch": 1.49, + "learning_rate": 1.0560309801603182e-06, + "loss": 0.645, + "step": 58254 + }, + { + "epoch": 1.49, + "learning_rate": 1.0560033531544102e-06, + "loss": 0.7188, + "step": 58255 + }, + { + "epoch": 1.49, + "learning_rate": 1.0559757261056224e-06, + "loss": 0.6533, + "step": 58256 + }, + { + "epoch": 1.49, + "learning_rate": 1.055948099013977e-06, + "loss": 0.6089, + "step": 58257 + }, + { + "epoch": 1.49, + "learning_rate": 1.0559204718794942e-06, + "loss": 0.6748, + "step": 58258 + }, + { + "epoch": 1.49, + "learning_rate": 1.055892844702196e-06, + "loss": 0.749, + "step": 58259 + }, + { + "epoch": 1.49, + "learning_rate": 1.0558652174821033e-06, + "loss": 0.7656, + "step": 58260 + }, + { + "epoch": 1.49, + "learning_rate": 1.055837590219237e-06, + "loss": 0.5234, + "step": 58261 + }, + { + "epoch": 1.49, + "learning_rate": 1.0558099629136183e-06, + "loss": 0.6016, + "step": 58262 + }, + { + "epoch": 1.49, + "learning_rate": 1.0557823355652686e-06, + "loss": 0.6201, + "step": 58263 + }, + { + "epoch": 1.49, + "learning_rate": 1.0557547081742088e-06, + "loss": 0.6597, + "step": 58264 + }, + { + "epoch": 1.49, + "learning_rate": 1.0557270807404608e-06, + "loss": 0.5327, + "step": 58265 + }, + { + "epoch": 1.49, + "learning_rate": 1.0556994532640447e-06, + "loss": 0.5654, + "step": 58266 + }, + { + "epoch": 1.49, + "learning_rate": 1.0556718257449819e-06, + "loss": 0.4829, + "step": 58267 + }, + { + "epoch": 1.49, + "learning_rate": 1.055644198183294e-06, + "loss": 0.6851, + "step": 58268 + }, + { + "epoch": 1.49, + "learning_rate": 1.055616570579002e-06, + "loss": 0.8701, + "step": 58269 + }, + { + "epoch": 1.49, + "learning_rate": 1.0555889429321267e-06, + "loss": 0.5017, + "step": 58270 + }, + { + "epoch": 1.49, + "learning_rate": 1.0555613152426894e-06, + "loss": 0.479, + "step": 58271 + }, + { + "epoch": 1.49, + "learning_rate": 1.0555336875107115e-06, + "loss": 0.8398, + "step": 58272 + }, + { + "epoch": 1.49, + "learning_rate": 1.0555060597362143e-06, + "loss": 0.6182, + "step": 58273 + }, + { + "epoch": 1.49, + "learning_rate": 1.0554784319192183e-06, + "loss": 0.8008, + "step": 58274 + }, + { + "epoch": 1.49, + "learning_rate": 1.055450804059745e-06, + "loss": 0.6279, + "step": 58275 + }, + { + "epoch": 1.49, + "learning_rate": 1.0554231761578159e-06, + "loss": 0.4871, + "step": 58276 + }, + { + "epoch": 1.49, + "learning_rate": 1.0553955482134513e-06, + "loss": 0.7476, + "step": 58277 + }, + { + "epoch": 1.49, + "learning_rate": 1.0553679202266734e-06, + "loss": 0.7451, + "step": 58278 + }, + { + "epoch": 1.49, + "learning_rate": 1.0553402921975024e-06, + "loss": 0.665, + "step": 58279 + }, + { + "epoch": 1.49, + "learning_rate": 1.0553126641259604e-06, + "loss": 0.6069, + "step": 58280 + }, + { + "epoch": 1.49, + "learning_rate": 1.0552850360120675e-06, + "loss": 0.6782, + "step": 58281 + }, + { + "epoch": 1.49, + "learning_rate": 1.0552574078558457e-06, + "loss": 0.3735, + "step": 58282 + }, + { + "epoch": 1.49, + "learning_rate": 1.0552297796573158e-06, + "loss": 0.709, + "step": 58283 + }, + { + "epoch": 1.49, + "learning_rate": 1.055202151416499e-06, + "loss": 0.6494, + "step": 58284 + }, + { + "epoch": 1.49, + "learning_rate": 1.0551745231334165e-06, + "loss": 0.5156, + "step": 58285 + }, + { + "epoch": 1.49, + "learning_rate": 1.0551468948080893e-06, + "loss": 0.5635, + "step": 58286 + }, + { + "epoch": 1.49, + "learning_rate": 1.0551192664405385e-06, + "loss": 0.6831, + "step": 58287 + }, + { + "epoch": 1.49, + "learning_rate": 1.0550916380307856e-06, + "loss": 0.5298, + "step": 58288 + }, + { + "epoch": 1.49, + "learning_rate": 1.0550640095788516e-06, + "loss": 0.7158, + "step": 58289 + }, + { + "epoch": 1.49, + "learning_rate": 1.0550363810847577e-06, + "loss": 0.7559, + "step": 58290 + }, + { + "epoch": 1.49, + "learning_rate": 1.055008752548525e-06, + "loss": 0.665, + "step": 58291 + }, + { + "epoch": 1.49, + "learning_rate": 1.0549811239701745e-06, + "loss": 0.6416, + "step": 58292 + }, + { + "epoch": 1.49, + "learning_rate": 1.0549534953497272e-06, + "loss": 0.6016, + "step": 58293 + }, + { + "epoch": 1.49, + "learning_rate": 1.0549258666872049e-06, + "loss": 0.7432, + "step": 58294 + }, + { + "epoch": 1.49, + "learning_rate": 1.0548982379826284e-06, + "loss": 0.5854, + "step": 58295 + }, + { + "epoch": 1.49, + "learning_rate": 1.0548706092360184e-06, + "loss": 0.5308, + "step": 58296 + }, + { + "epoch": 1.49, + "learning_rate": 1.054842980447397e-06, + "loss": 0.4374, + "step": 58297 + }, + { + "epoch": 1.49, + "learning_rate": 1.0548153516167846e-06, + "loss": 0.5562, + "step": 58298 + }, + { + "epoch": 1.49, + "learning_rate": 1.0547877227442027e-06, + "loss": 0.4853, + "step": 58299 + }, + { + "epoch": 1.49, + "learning_rate": 1.0547600938296724e-06, + "loss": 0.8037, + "step": 58300 + }, + { + "epoch": 1.49, + "learning_rate": 1.054732464873215e-06, + "loss": 0.6055, + "step": 58301 + }, + { + "epoch": 1.49, + "learning_rate": 1.0547048358748509e-06, + "loss": 0.6455, + "step": 58302 + }, + { + "epoch": 1.49, + "learning_rate": 1.0546772068346025e-06, + "loss": 0.479, + "step": 58303 + }, + { + "epoch": 1.49, + "learning_rate": 1.0546495777524894e-06, + "loss": 0.5101, + "step": 58304 + }, + { + "epoch": 1.49, + "learning_rate": 1.0546219486285347e-06, + "loss": 0.749, + "step": 58305 + }, + { + "epoch": 1.49, + "learning_rate": 1.0545943194627579e-06, + "loss": 0.6709, + "step": 58306 + }, + { + "epoch": 1.49, + "learning_rate": 1.0545666902551806e-06, + "loss": 0.6973, + "step": 58307 + }, + { + "epoch": 1.49, + "learning_rate": 1.0545390610058241e-06, + "loss": 0.6108, + "step": 58308 + }, + { + "epoch": 1.49, + "learning_rate": 1.05451143171471e-06, + "loss": 0.6055, + "step": 58309 + }, + { + "epoch": 1.49, + "learning_rate": 1.0544838023818587e-06, + "loss": 0.6406, + "step": 58310 + }, + { + "epoch": 1.49, + "learning_rate": 1.0544561730072919e-06, + "loss": 0.7979, + "step": 58311 + }, + { + "epoch": 1.49, + "learning_rate": 1.05442854359103e-06, + "loss": 0.5227, + "step": 58312 + }, + { + "epoch": 1.49, + "learning_rate": 1.054400914133095e-06, + "loss": 0.531, + "step": 58313 + }, + { + "epoch": 1.49, + "learning_rate": 1.0543732846335077e-06, + "loss": 0.7109, + "step": 58314 + }, + { + "epoch": 1.49, + "learning_rate": 1.0543456550922892e-06, + "loss": 0.6606, + "step": 58315 + }, + { + "epoch": 1.49, + "learning_rate": 1.0543180255094607e-06, + "loss": 0.6846, + "step": 58316 + }, + { + "epoch": 1.49, + "learning_rate": 1.0542903958850438e-06, + "loss": 0.4963, + "step": 58317 + }, + { + "epoch": 1.49, + "learning_rate": 1.0542627662190589e-06, + "loss": 0.7451, + "step": 58318 + }, + { + "epoch": 1.49, + "learning_rate": 1.0542351365115274e-06, + "loss": 0.6392, + "step": 58319 + }, + { + "epoch": 1.49, + "learning_rate": 1.0542075067624708e-06, + "loss": 0.5283, + "step": 58320 + }, + { + "epoch": 1.49, + "learning_rate": 1.0541798769719096e-06, + "loss": 0.4907, + "step": 58321 + }, + { + "epoch": 1.49, + "learning_rate": 1.0541522471398658e-06, + "loss": 0.6709, + "step": 58322 + }, + { + "epoch": 1.49, + "learning_rate": 1.0541246172663597e-06, + "loss": 0.6426, + "step": 58323 + }, + { + "epoch": 1.49, + "learning_rate": 1.0540969873514134e-06, + "loss": 0.5371, + "step": 58324 + }, + { + "epoch": 1.49, + "learning_rate": 1.0540693573950472e-06, + "loss": 0.6685, + "step": 58325 + }, + { + "epoch": 1.49, + "learning_rate": 1.0540417273972826e-06, + "loss": 0.6201, + "step": 58326 + }, + { + "epoch": 1.49, + "learning_rate": 1.0540140973581406e-06, + "loss": 0.5547, + "step": 58327 + }, + { + "epoch": 1.49, + "learning_rate": 1.053986467277643e-06, + "loss": 0.7168, + "step": 58328 + }, + { + "epoch": 1.5, + "learning_rate": 1.0539588371558097e-06, + "loss": 0.606, + "step": 58329 + }, + { + "epoch": 1.5, + "learning_rate": 1.0539312069926634e-06, + "loss": 0.3275, + "step": 58330 + }, + { + "epoch": 1.5, + "learning_rate": 1.053903576788224e-06, + "loss": 0.8062, + "step": 58331 + }, + { + "epoch": 1.5, + "learning_rate": 1.0538759465425131e-06, + "loss": 0.5244, + "step": 58332 + }, + { + "epoch": 1.5, + "learning_rate": 1.0538483162555516e-06, + "loss": 0.7559, + "step": 58333 + }, + { + "epoch": 1.5, + "learning_rate": 1.0538206859273615e-06, + "loss": 0.4357, + "step": 58334 + }, + { + "epoch": 1.5, + "learning_rate": 1.0537930555579631e-06, + "loss": 0.5488, + "step": 58335 + }, + { + "epoch": 1.5, + "learning_rate": 1.053765425147378e-06, + "loss": 0.6025, + "step": 58336 + }, + { + "epoch": 1.5, + "learning_rate": 1.0537377946956267e-06, + "loss": 0.5386, + "step": 58337 + }, + { + "epoch": 1.5, + "learning_rate": 1.0537101642027312e-06, + "loss": 0.7031, + "step": 58338 + }, + { + "epoch": 1.5, + "learning_rate": 1.0536825336687122e-06, + "loss": 0.5957, + "step": 58339 + }, + { + "epoch": 1.5, + "learning_rate": 1.053654903093591e-06, + "loss": 0.53, + "step": 58340 + }, + { + "epoch": 1.5, + "learning_rate": 1.0536272724773888e-06, + "loss": 0.6128, + "step": 58341 + }, + { + "epoch": 1.5, + "learning_rate": 1.0535996418201266e-06, + "loss": 0.7031, + "step": 58342 + }, + { + "epoch": 1.5, + "learning_rate": 1.0535720111218255e-06, + "loss": 0.6494, + "step": 58343 + }, + { + "epoch": 1.5, + "learning_rate": 1.0535443803825067e-06, + "loss": 0.6904, + "step": 58344 + }, + { + "epoch": 1.5, + "learning_rate": 1.0535167496021922e-06, + "loss": 0.6084, + "step": 58345 + }, + { + "epoch": 1.5, + "learning_rate": 1.0534891187809016e-06, + "loss": 0.8672, + "step": 58346 + }, + { + "epoch": 1.5, + "learning_rate": 1.0534614879186569e-06, + "loss": 0.6631, + "step": 58347 + }, + { + "epoch": 1.5, + "learning_rate": 1.0534338570154794e-06, + "loss": 0.6406, + "step": 58348 + }, + { + "epoch": 1.5, + "learning_rate": 1.0534062260713901e-06, + "loss": 0.5269, + "step": 58349 + }, + { + "epoch": 1.5, + "learning_rate": 1.05337859508641e-06, + "loss": 0.502, + "step": 58350 + }, + { + "epoch": 1.5, + "learning_rate": 1.0533509640605605e-06, + "loss": 0.668, + "step": 58351 + }, + { + "epoch": 1.5, + "learning_rate": 1.0533233329938622e-06, + "loss": 0.8418, + "step": 58352 + }, + { + "epoch": 1.5, + "learning_rate": 1.053295701886337e-06, + "loss": 0.5957, + "step": 58353 + }, + { + "epoch": 1.5, + "learning_rate": 1.0532680707380058e-06, + "loss": 0.7471, + "step": 58354 + }, + { + "epoch": 1.5, + "learning_rate": 1.0532404395488896e-06, + "loss": 0.7188, + "step": 58355 + }, + { + "epoch": 1.5, + "learning_rate": 1.0532128083190096e-06, + "loss": 0.6108, + "step": 58356 + }, + { + "epoch": 1.5, + "learning_rate": 1.053185177048387e-06, + "loss": 0.5371, + "step": 58357 + }, + { + "epoch": 1.5, + "learning_rate": 1.053157545737043e-06, + "loss": 0.6167, + "step": 58358 + }, + { + "epoch": 1.5, + "learning_rate": 1.0531299143849985e-06, + "loss": 0.7061, + "step": 58359 + }, + { + "epoch": 1.5, + "learning_rate": 1.0531022829922753e-06, + "loss": 0.5898, + "step": 58360 + }, + { + "epoch": 1.5, + "learning_rate": 1.0530746515588937e-06, + "loss": 0.7451, + "step": 58361 + }, + { + "epoch": 1.5, + "learning_rate": 1.0530470200848755e-06, + "loss": 0.7266, + "step": 58362 + }, + { + "epoch": 1.5, + "learning_rate": 1.0530193885702416e-06, + "loss": 0.6211, + "step": 58363 + }, + { + "epoch": 1.5, + "learning_rate": 1.0529917570150132e-06, + "loss": 0.6328, + "step": 58364 + }, + { + "epoch": 1.5, + "learning_rate": 1.0529641254192113e-06, + "loss": 0.71, + "step": 58365 + }, + { + "epoch": 1.5, + "learning_rate": 1.0529364937828575e-06, + "loss": 0.5649, + "step": 58366 + }, + { + "epoch": 1.5, + "learning_rate": 1.0529088621059724e-06, + "loss": 0.7007, + "step": 58367 + }, + { + "epoch": 1.5, + "learning_rate": 1.0528812303885776e-06, + "loss": 0.6582, + "step": 58368 + }, + { + "epoch": 1.5, + "learning_rate": 1.052853598630694e-06, + "loss": 0.5229, + "step": 58369 + }, + { + "epoch": 1.5, + "learning_rate": 1.052825966832343e-06, + "loss": 0.5342, + "step": 58370 + }, + { + "epoch": 1.5, + "learning_rate": 1.0527983349935453e-06, + "loss": 0.5176, + "step": 58371 + }, + { + "epoch": 1.5, + "learning_rate": 1.0527707031143224e-06, + "loss": 0.6494, + "step": 58372 + }, + { + "epoch": 1.5, + "learning_rate": 1.0527430711946954e-06, + "loss": 0.7686, + "step": 58373 + }, + { + "epoch": 1.5, + "learning_rate": 1.0527154392346858e-06, + "loss": 0.79, + "step": 58374 + }, + { + "epoch": 1.5, + "learning_rate": 1.052687807234314e-06, + "loss": 0.5869, + "step": 58375 + }, + { + "epoch": 1.5, + "learning_rate": 1.0526601751936018e-06, + "loss": 0.6963, + "step": 58376 + }, + { + "epoch": 1.5, + "learning_rate": 1.0526325431125697e-06, + "loss": 0.6631, + "step": 58377 + }, + { + "epoch": 1.5, + "learning_rate": 1.0526049109912396e-06, + "loss": 0.6562, + "step": 58378 + }, + { + "epoch": 1.5, + "learning_rate": 1.0525772788296326e-06, + "loss": 0.5176, + "step": 58379 + }, + { + "epoch": 1.5, + "learning_rate": 1.0525496466277693e-06, + "loss": 0.6836, + "step": 58380 + }, + { + "epoch": 1.5, + "learning_rate": 1.052522014385671e-06, + "loss": 0.6465, + "step": 58381 + }, + { + "epoch": 1.5, + "learning_rate": 1.0524943821033592e-06, + "loss": 0.3567, + "step": 58382 + }, + { + "epoch": 1.5, + "learning_rate": 1.0524667497808548e-06, + "loss": 0.7266, + "step": 58383 + }, + { + "epoch": 1.5, + "learning_rate": 1.052439117418179e-06, + "loss": 0.7344, + "step": 58384 + }, + { + "epoch": 1.5, + "learning_rate": 1.0524114850153532e-06, + "loss": 0.6719, + "step": 58385 + }, + { + "epoch": 1.5, + "learning_rate": 1.0523838525723981e-06, + "loss": 0.5991, + "step": 58386 + }, + { + "epoch": 1.5, + "learning_rate": 1.0523562200893352e-06, + "loss": 0.6299, + "step": 58387 + }, + { + "epoch": 1.5, + "learning_rate": 1.0523285875661853e-06, + "loss": 0.5327, + "step": 58388 + }, + { + "epoch": 1.5, + "learning_rate": 1.0523009550029704e-06, + "loss": 0.6558, + "step": 58389 + }, + { + "epoch": 1.5, + "learning_rate": 1.0522733223997105e-06, + "loss": 0.6025, + "step": 58390 + }, + { + "epoch": 1.5, + "learning_rate": 1.0522456897564276e-06, + "loss": 0.7576, + "step": 58391 + }, + { + "epoch": 1.5, + "learning_rate": 1.0522180570731424e-06, + "loss": 0.6602, + "step": 58392 + }, + { + "epoch": 1.5, + "learning_rate": 1.0521904243498765e-06, + "loss": 0.7266, + "step": 58393 + }, + { + "epoch": 1.5, + "learning_rate": 1.0521627915866507e-06, + "loss": 0.4976, + "step": 58394 + }, + { + "epoch": 1.5, + "learning_rate": 1.0521351587834861e-06, + "loss": 0.5437, + "step": 58395 + }, + { + "epoch": 1.5, + "learning_rate": 1.052107525940404e-06, + "loss": 0.6641, + "step": 58396 + }, + { + "epoch": 1.5, + "learning_rate": 1.0520798930574257e-06, + "loss": 0.7031, + "step": 58397 + }, + { + "epoch": 1.5, + "learning_rate": 1.052052260134572e-06, + "loss": 0.542, + "step": 58398 + }, + { + "epoch": 1.5, + "learning_rate": 1.0520246271718646e-06, + "loss": 0.6348, + "step": 58399 + }, + { + "epoch": 1.5, + "learning_rate": 1.0519969941693242e-06, + "loss": 0.6953, + "step": 58400 + }, + { + "epoch": 1.5, + "learning_rate": 1.0519693611269721e-06, + "loss": 0.5923, + "step": 58401 + }, + { + "epoch": 1.5, + "learning_rate": 1.0519417280448292e-06, + "loss": 0.7402, + "step": 58402 + }, + { + "epoch": 1.5, + "learning_rate": 1.0519140949229173e-06, + "loss": 0.6699, + "step": 58403 + }, + { + "epoch": 1.5, + "learning_rate": 1.051886461761257e-06, + "loss": 0.7725, + "step": 58404 + }, + { + "epoch": 1.5, + "learning_rate": 1.0518588285598695e-06, + "loss": 0.5859, + "step": 58405 + }, + { + "epoch": 1.5, + "learning_rate": 1.0518311953187762e-06, + "loss": 0.6069, + "step": 58406 + }, + { + "epoch": 1.5, + "learning_rate": 1.0518035620379981e-06, + "loss": 0.6616, + "step": 58407 + }, + { + "epoch": 1.5, + "learning_rate": 1.0517759287175565e-06, + "loss": 0.4846, + "step": 58408 + }, + { + "epoch": 1.5, + "learning_rate": 1.0517482953574722e-06, + "loss": 0.4429, + "step": 58409 + }, + { + "epoch": 1.5, + "learning_rate": 1.051720661957767e-06, + "loss": 0.7173, + "step": 58410 + }, + { + "epoch": 1.5, + "learning_rate": 1.0516930285184614e-06, + "loss": 0.5498, + "step": 58411 + }, + { + "epoch": 1.5, + "learning_rate": 1.051665395039577e-06, + "loss": 0.5005, + "step": 58412 + }, + { + "epoch": 1.5, + "learning_rate": 1.0516377615211346e-06, + "loss": 0.7881, + "step": 58413 + }, + { + "epoch": 1.5, + "learning_rate": 1.0516101279631557e-06, + "loss": 0.5669, + "step": 58414 + }, + { + "epoch": 1.5, + "learning_rate": 1.051582494365661e-06, + "loss": 0.8184, + "step": 58415 + }, + { + "epoch": 1.5, + "learning_rate": 1.0515548607286723e-06, + "loss": 0.481, + "step": 58416 + }, + { + "epoch": 1.5, + "learning_rate": 1.0515272270522103e-06, + "loss": 0.6465, + "step": 58417 + }, + { + "epoch": 1.5, + "learning_rate": 1.0514995933362961e-06, + "loss": 0.5596, + "step": 58418 + }, + { + "epoch": 1.5, + "learning_rate": 1.0514719595809514e-06, + "loss": 0.4922, + "step": 58419 + }, + { + "epoch": 1.5, + "learning_rate": 1.0514443257861967e-06, + "loss": 0.5581, + "step": 58420 + }, + { + "epoch": 1.5, + "learning_rate": 1.0514166919520533e-06, + "loss": 0.6582, + "step": 58421 + }, + { + "epoch": 1.5, + "learning_rate": 1.051389058078543e-06, + "loss": 0.6973, + "step": 58422 + }, + { + "epoch": 1.5, + "learning_rate": 1.0513614241656858e-06, + "loss": 0.7744, + "step": 58423 + }, + { + "epoch": 1.5, + "learning_rate": 1.051333790213504e-06, + "loss": 0.7041, + "step": 58424 + }, + { + "epoch": 1.5, + "learning_rate": 1.0513061562220182e-06, + "loss": 0.5425, + "step": 58425 + }, + { + "epoch": 1.5, + "learning_rate": 1.0512785221912497e-06, + "loss": 0.7051, + "step": 58426 + }, + { + "epoch": 1.5, + "learning_rate": 1.0512508881212195e-06, + "loss": 0.625, + "step": 58427 + }, + { + "epoch": 1.5, + "learning_rate": 1.0512232540119487e-06, + "loss": 0.5669, + "step": 58428 + }, + { + "epoch": 1.5, + "learning_rate": 1.051195619863459e-06, + "loss": 0.8115, + "step": 58429 + }, + { + "epoch": 1.5, + "learning_rate": 1.0511679856757707e-06, + "loss": 0.709, + "step": 58430 + }, + { + "epoch": 1.5, + "learning_rate": 1.0511403514489056e-06, + "loss": 0.7324, + "step": 58431 + }, + { + "epoch": 1.5, + "learning_rate": 1.0511127171828846e-06, + "loss": 0.752, + "step": 58432 + }, + { + "epoch": 1.5, + "learning_rate": 1.051085082877729e-06, + "loss": 0.5711, + "step": 58433 + }, + { + "epoch": 1.5, + "learning_rate": 1.0510574485334603e-06, + "loss": 0.4685, + "step": 58434 + }, + { + "epoch": 1.5, + "learning_rate": 1.051029814150099e-06, + "loss": 0.5928, + "step": 58435 + }, + { + "epoch": 1.5, + "learning_rate": 1.0510021797276662e-06, + "loss": 0.4385, + "step": 58436 + }, + { + "epoch": 1.5, + "learning_rate": 1.0509745452661838e-06, + "loss": 0.5908, + "step": 58437 + }, + { + "epoch": 1.5, + "learning_rate": 1.0509469107656721e-06, + "loss": 0.7393, + "step": 58438 + }, + { + "epoch": 1.5, + "learning_rate": 1.0509192762261534e-06, + "loss": 0.7256, + "step": 58439 + }, + { + "epoch": 1.5, + "learning_rate": 1.0508916416476474e-06, + "loss": 0.563, + "step": 58440 + }, + { + "epoch": 1.5, + "learning_rate": 1.0508640070301763e-06, + "loss": 0.5493, + "step": 58441 + }, + { + "epoch": 1.5, + "learning_rate": 1.050836372373761e-06, + "loss": 0.7881, + "step": 58442 + }, + { + "epoch": 1.5, + "learning_rate": 1.0508087376784228e-06, + "loss": 0.5332, + "step": 58443 + }, + { + "epoch": 1.5, + "learning_rate": 1.0507811029441823e-06, + "loss": 0.5649, + "step": 58444 + }, + { + "epoch": 1.5, + "learning_rate": 1.0507534681710614e-06, + "loss": 0.7373, + "step": 58445 + }, + { + "epoch": 1.5, + "learning_rate": 1.0507258333590807e-06, + "loss": 0.6641, + "step": 58446 + }, + { + "epoch": 1.5, + "learning_rate": 1.0506981985082617e-06, + "loss": 0.668, + "step": 58447 + }, + { + "epoch": 1.5, + "learning_rate": 1.0506705636186252e-06, + "loss": 0.8242, + "step": 58448 + }, + { + "epoch": 1.5, + "learning_rate": 1.0506429286901928e-06, + "loss": 0.7422, + "step": 58449 + }, + { + "epoch": 1.5, + "learning_rate": 1.0506152937229852e-06, + "loss": 0.4829, + "step": 58450 + }, + { + "epoch": 1.5, + "learning_rate": 1.0505876587170238e-06, + "loss": 0.6865, + "step": 58451 + }, + { + "epoch": 1.5, + "learning_rate": 1.0505600236723302e-06, + "loss": 0.4529, + "step": 58452 + }, + { + "epoch": 1.5, + "learning_rate": 1.0505323885889248e-06, + "loss": 0.6343, + "step": 58453 + }, + { + "epoch": 1.5, + "learning_rate": 1.0505047534668292e-06, + "loss": 0.6841, + "step": 58454 + }, + { + "epoch": 1.5, + "learning_rate": 1.050477118306064e-06, + "loss": 0.6855, + "step": 58455 + }, + { + "epoch": 1.5, + "learning_rate": 1.0504494831066514e-06, + "loss": 0.7075, + "step": 58456 + }, + { + "epoch": 1.5, + "learning_rate": 1.0504218478686116e-06, + "loss": 0.4905, + "step": 58457 + }, + { + "epoch": 1.5, + "learning_rate": 1.050394212591966e-06, + "loss": 0.7246, + "step": 58458 + }, + { + "epoch": 1.5, + "learning_rate": 1.0503665772767362e-06, + "loss": 0.7607, + "step": 58459 + }, + { + "epoch": 1.5, + "learning_rate": 1.050338941922943e-06, + "loss": 0.6377, + "step": 58460 + }, + { + "epoch": 1.5, + "learning_rate": 1.0503113065306073e-06, + "loss": 0.7266, + "step": 58461 + }, + { + "epoch": 1.5, + "learning_rate": 1.0502836710997507e-06, + "loss": 0.6348, + "step": 58462 + }, + { + "epoch": 1.5, + "learning_rate": 1.0502560356303939e-06, + "loss": 0.7598, + "step": 58463 + }, + { + "epoch": 1.5, + "learning_rate": 1.0502284001225591e-06, + "loss": 0.6421, + "step": 58464 + }, + { + "epoch": 1.5, + "learning_rate": 1.0502007645762663e-06, + "loss": 0.5757, + "step": 58465 + }, + { + "epoch": 1.5, + "learning_rate": 1.050173128991537e-06, + "loss": 0.752, + "step": 58466 + }, + { + "epoch": 1.5, + "learning_rate": 1.0501454933683925e-06, + "loss": 0.7529, + "step": 58467 + }, + { + "epoch": 1.5, + "learning_rate": 1.0501178577068539e-06, + "loss": 0.6558, + "step": 58468 + }, + { + "epoch": 1.5, + "learning_rate": 1.0500902220069425e-06, + "loss": 0.5107, + "step": 58469 + }, + { + "epoch": 1.5, + "learning_rate": 1.0500625862686792e-06, + "loss": 0.7188, + "step": 58470 + }, + { + "epoch": 1.5, + "learning_rate": 1.0500349504920851e-06, + "loss": 0.563, + "step": 58471 + }, + { + "epoch": 1.5, + "learning_rate": 1.050007314677182e-06, + "loss": 0.6797, + "step": 58472 + }, + { + "epoch": 1.5, + "learning_rate": 1.0499796788239901e-06, + "loss": 0.665, + "step": 58473 + }, + { + "epoch": 1.5, + "learning_rate": 1.0499520429325312e-06, + "loss": 0.5664, + "step": 58474 + }, + { + "epoch": 1.5, + "learning_rate": 1.0499244070028266e-06, + "loss": 0.7046, + "step": 58475 + }, + { + "epoch": 1.5, + "learning_rate": 1.0498967710348966e-06, + "loss": 0.7495, + "step": 58476 + }, + { + "epoch": 1.5, + "learning_rate": 1.0498691350287636e-06, + "loss": 0.7468, + "step": 58477 + }, + { + "epoch": 1.5, + "learning_rate": 1.0498414989844476e-06, + "loss": 0.5112, + "step": 58478 + }, + { + "epoch": 1.5, + "learning_rate": 1.0498138629019709e-06, + "loss": 0.6641, + "step": 58479 + }, + { + "epoch": 1.5, + "learning_rate": 1.0497862267813533e-06, + "loss": 0.748, + "step": 58480 + }, + { + "epoch": 1.5, + "learning_rate": 1.0497585906226169e-06, + "loss": 0.5366, + "step": 58481 + }, + { + "epoch": 1.5, + "learning_rate": 1.0497309544257826e-06, + "loss": 0.4563, + "step": 58482 + }, + { + "epoch": 1.5, + "learning_rate": 1.049703318190872e-06, + "loss": 0.6519, + "step": 58483 + }, + { + "epoch": 1.5, + "learning_rate": 1.0496756819179053e-06, + "loss": 0.7637, + "step": 58484 + }, + { + "epoch": 1.5, + "learning_rate": 1.0496480456069046e-06, + "loss": 0.6484, + "step": 58485 + }, + { + "epoch": 1.5, + "learning_rate": 1.0496204092578905e-06, + "loss": 0.6177, + "step": 58486 + }, + { + "epoch": 1.5, + "learning_rate": 1.0495927728708845e-06, + "loss": 0.6758, + "step": 58487 + }, + { + "epoch": 1.5, + "learning_rate": 1.049565136445907e-06, + "loss": 0.4912, + "step": 58488 + }, + { + "epoch": 1.5, + "learning_rate": 1.0495374999829807e-06, + "loss": 0.5452, + "step": 58489 + }, + { + "epoch": 1.5, + "learning_rate": 1.0495098634821252e-06, + "loss": 0.5887, + "step": 58490 + }, + { + "epoch": 1.5, + "learning_rate": 1.0494822269433624e-06, + "loss": 0.5928, + "step": 58491 + }, + { + "epoch": 1.5, + "learning_rate": 1.049454590366713e-06, + "loss": 0.7236, + "step": 58492 + }, + { + "epoch": 1.5, + "learning_rate": 1.049426953752199e-06, + "loss": 0.6738, + "step": 58493 + }, + { + "epoch": 1.5, + "learning_rate": 1.049399317099841e-06, + "loss": 0.4467, + "step": 58494 + }, + { + "epoch": 1.5, + "learning_rate": 1.04937168040966e-06, + "loss": 0.5649, + "step": 58495 + }, + { + "epoch": 1.5, + "learning_rate": 1.0493440436816773e-06, + "loss": 0.4194, + "step": 58496 + }, + { + "epoch": 1.5, + "learning_rate": 1.0493164069159144e-06, + "loss": 0.6748, + "step": 58497 + }, + { + "epoch": 1.5, + "learning_rate": 1.049288770112392e-06, + "loss": 0.5095, + "step": 58498 + }, + { + "epoch": 1.5, + "learning_rate": 1.0492611332711319e-06, + "loss": 0.748, + "step": 58499 + }, + { + "epoch": 1.5, + "learning_rate": 1.0492334963921542e-06, + "loss": 0.7246, + "step": 58500 + }, + { + "epoch": 1.5, + "learning_rate": 1.049205859475481e-06, + "loss": 0.6831, + "step": 58501 + }, + { + "epoch": 1.5, + "learning_rate": 1.0491782225211332e-06, + "loss": 0.5317, + "step": 58502 + }, + { + "epoch": 1.5, + "learning_rate": 1.0491505855291316e-06, + "loss": 0.7314, + "step": 58503 + }, + { + "epoch": 1.5, + "learning_rate": 1.0491229484994981e-06, + "loss": 0.6484, + "step": 58504 + }, + { + "epoch": 1.5, + "learning_rate": 1.0490953114322529e-06, + "loss": 0.7314, + "step": 58505 + }, + { + "epoch": 1.5, + "learning_rate": 1.0490676743274181e-06, + "loss": 0.8418, + "step": 58506 + }, + { + "epoch": 1.5, + "learning_rate": 1.0490400371850141e-06, + "loss": 0.666, + "step": 58507 + }, + { + "epoch": 1.5, + "learning_rate": 1.0490124000050626e-06, + "loss": 0.452, + "step": 58508 + }, + { + "epoch": 1.5, + "learning_rate": 1.0489847627875846e-06, + "loss": 0.6348, + "step": 58509 + }, + { + "epoch": 1.5, + "learning_rate": 1.0489571255326012e-06, + "loss": 0.6235, + "step": 58510 + }, + { + "epoch": 1.5, + "learning_rate": 1.0489294882401335e-06, + "loss": 0.5095, + "step": 58511 + }, + { + "epoch": 1.5, + "learning_rate": 1.0489018509102027e-06, + "loss": 0.6445, + "step": 58512 + }, + { + "epoch": 1.5, + "learning_rate": 1.04887421354283e-06, + "loss": 0.5103, + "step": 58513 + }, + { + "epoch": 1.5, + "learning_rate": 1.0488465761380367e-06, + "loss": 0.6973, + "step": 58514 + }, + { + "epoch": 1.5, + "learning_rate": 1.0488189386958436e-06, + "loss": 0.708, + "step": 58515 + }, + { + "epoch": 1.5, + "learning_rate": 1.0487913012162726e-06, + "loss": 0.6338, + "step": 58516 + }, + { + "epoch": 1.5, + "learning_rate": 1.0487636636993437e-06, + "loss": 0.6152, + "step": 58517 + }, + { + "epoch": 1.5, + "learning_rate": 1.048736026145079e-06, + "loss": 0.4949, + "step": 58518 + }, + { + "epoch": 1.5, + "learning_rate": 1.0487083885534996e-06, + "loss": 0.4866, + "step": 58519 + }, + { + "epoch": 1.5, + "learning_rate": 1.0486807509246259e-06, + "loss": 0.5415, + "step": 58520 + }, + { + "epoch": 1.5, + "learning_rate": 1.04865311325848e-06, + "loss": 0.6895, + "step": 58521 + }, + { + "epoch": 1.5, + "learning_rate": 1.0486254755550823e-06, + "loss": 0.5312, + "step": 58522 + }, + { + "epoch": 1.5, + "learning_rate": 1.0485978378144547e-06, + "loss": 0.7021, + "step": 58523 + }, + { + "epoch": 1.5, + "learning_rate": 1.0485702000366178e-06, + "loss": 0.5151, + "step": 58524 + }, + { + "epoch": 1.5, + "learning_rate": 1.048542562221593e-06, + "loss": 0.5029, + "step": 58525 + }, + { + "epoch": 1.5, + "learning_rate": 1.0485149243694012e-06, + "loss": 0.5942, + "step": 58526 + }, + { + "epoch": 1.5, + "learning_rate": 1.0484872864800638e-06, + "loss": 0.5752, + "step": 58527 + }, + { + "epoch": 1.5, + "learning_rate": 1.0484596485536018e-06, + "loss": 0.5535, + "step": 58528 + }, + { + "epoch": 1.5, + "learning_rate": 1.048432010590037e-06, + "loss": 0.6758, + "step": 58529 + }, + { + "epoch": 1.5, + "learning_rate": 1.0484043725893896e-06, + "loss": 0.6392, + "step": 58530 + }, + { + "epoch": 1.5, + "learning_rate": 1.0483767345516813e-06, + "loss": 0.7549, + "step": 58531 + }, + { + "epoch": 1.5, + "learning_rate": 1.0483490964769331e-06, + "loss": 0.6555, + "step": 58532 + }, + { + "epoch": 1.5, + "learning_rate": 1.0483214583651662e-06, + "loss": 0.6724, + "step": 58533 + }, + { + "epoch": 1.5, + "learning_rate": 1.0482938202164021e-06, + "loss": 0.5034, + "step": 58534 + }, + { + "epoch": 1.5, + "learning_rate": 1.0482661820306612e-06, + "loss": 0.6235, + "step": 58535 + }, + { + "epoch": 1.5, + "learning_rate": 1.0482385438079654e-06, + "loss": 0.6943, + "step": 58536 + }, + { + "epoch": 1.5, + "learning_rate": 1.0482109055483355e-06, + "loss": 0.6572, + "step": 58537 + }, + { + "epoch": 1.5, + "learning_rate": 1.0481832672517926e-06, + "loss": 0.5591, + "step": 58538 + }, + { + "epoch": 1.5, + "learning_rate": 1.048155628918358e-06, + "loss": 0.6704, + "step": 58539 + }, + { + "epoch": 1.5, + "learning_rate": 1.0481279905480528e-06, + "loss": 0.6299, + "step": 58540 + }, + { + "epoch": 1.5, + "learning_rate": 1.0481003521408984e-06, + "loss": 0.6289, + "step": 58541 + }, + { + "epoch": 1.5, + "learning_rate": 1.0480727136969156e-06, + "loss": 0.4922, + "step": 58542 + }, + { + "epoch": 1.5, + "learning_rate": 1.048045075216126e-06, + "loss": 0.5938, + "step": 58543 + }, + { + "epoch": 1.5, + "learning_rate": 1.0480174366985503e-06, + "loss": 0.5967, + "step": 58544 + }, + { + "epoch": 1.5, + "learning_rate": 1.04798979814421e-06, + "loss": 0.6548, + "step": 58545 + }, + { + "epoch": 1.5, + "learning_rate": 1.047962159553126e-06, + "loss": 0.5098, + "step": 58546 + }, + { + "epoch": 1.5, + "learning_rate": 1.0479345209253194e-06, + "loss": 0.7256, + "step": 58547 + }, + { + "epoch": 1.5, + "learning_rate": 1.047906882260812e-06, + "loss": 0.6855, + "step": 58548 + }, + { + "epoch": 1.5, + "learning_rate": 1.0478792435596242e-06, + "loss": 0.6299, + "step": 58549 + }, + { + "epoch": 1.5, + "learning_rate": 1.0478516048217775e-06, + "loss": 0.7217, + "step": 58550 + }, + { + "epoch": 1.5, + "learning_rate": 1.0478239660472929e-06, + "loss": 0.6904, + "step": 58551 + }, + { + "epoch": 1.5, + "learning_rate": 1.0477963272361918e-06, + "loss": 0.5503, + "step": 58552 + }, + { + "epoch": 1.5, + "learning_rate": 1.0477686883884951e-06, + "loss": 0.6113, + "step": 58553 + }, + { + "epoch": 1.5, + "learning_rate": 1.0477410495042246e-06, + "loss": 0.5396, + "step": 58554 + }, + { + "epoch": 1.5, + "learning_rate": 1.0477134105834004e-06, + "loss": 0.6748, + "step": 58555 + }, + { + "epoch": 1.5, + "learning_rate": 1.0476857716260447e-06, + "loss": 0.6758, + "step": 58556 + }, + { + "epoch": 1.5, + "learning_rate": 1.0476581326321779e-06, + "loss": 0.605, + "step": 58557 + }, + { + "epoch": 1.5, + "learning_rate": 1.0476304936018215e-06, + "loss": 0.6587, + "step": 58558 + }, + { + "epoch": 1.5, + "learning_rate": 1.047602854534997e-06, + "loss": 0.6025, + "step": 58559 + }, + { + "epoch": 1.5, + "learning_rate": 1.0475752154317248e-06, + "loss": 0.5339, + "step": 58560 + }, + { + "epoch": 1.5, + "learning_rate": 1.0475475762920262e-06, + "loss": 0.6143, + "step": 58561 + }, + { + "epoch": 1.5, + "learning_rate": 1.047519937115923e-06, + "loss": 0.8467, + "step": 58562 + }, + { + "epoch": 1.5, + "learning_rate": 1.0474922979034356e-06, + "loss": 0.6562, + "step": 58563 + }, + { + "epoch": 1.5, + "learning_rate": 1.0474646586545858e-06, + "loss": 0.4539, + "step": 58564 + }, + { + "epoch": 1.5, + "learning_rate": 1.0474370193693947e-06, + "loss": 0.625, + "step": 58565 + }, + { + "epoch": 1.5, + "learning_rate": 1.0474093800478828e-06, + "loss": 0.4083, + "step": 58566 + }, + { + "epoch": 1.5, + "learning_rate": 1.0473817406900722e-06, + "loss": 0.6465, + "step": 58567 + }, + { + "epoch": 1.5, + "learning_rate": 1.0473541012959831e-06, + "loss": 0.6035, + "step": 58568 + }, + { + "epoch": 1.5, + "learning_rate": 1.0473264618656377e-06, + "loss": 0.8369, + "step": 58569 + }, + { + "epoch": 1.5, + "learning_rate": 1.0472988223990562e-06, + "loss": 0.7686, + "step": 58570 + }, + { + "epoch": 1.5, + "learning_rate": 1.0472711828962604e-06, + "loss": 0.7598, + "step": 58571 + }, + { + "epoch": 1.5, + "learning_rate": 1.0472435433572709e-06, + "loss": 0.7588, + "step": 58572 + }, + { + "epoch": 1.5, + "learning_rate": 1.0472159037821092e-06, + "loss": 0.5759, + "step": 58573 + }, + { + "epoch": 1.5, + "learning_rate": 1.0471882641707969e-06, + "loss": 0.5776, + "step": 58574 + }, + { + "epoch": 1.5, + "learning_rate": 1.0471606245233546e-06, + "loss": 0.5869, + "step": 58575 + }, + { + "epoch": 1.5, + "learning_rate": 1.0471329848398032e-06, + "loss": 0.5088, + "step": 58576 + }, + { + "epoch": 1.5, + "learning_rate": 1.0471053451201647e-06, + "loss": 0.6152, + "step": 58577 + }, + { + "epoch": 1.5, + "learning_rate": 1.0470777053644592e-06, + "loss": 0.7422, + "step": 58578 + }, + { + "epoch": 1.5, + "learning_rate": 1.0470500655727092e-06, + "loss": 0.6768, + "step": 58579 + }, + { + "epoch": 1.5, + "learning_rate": 1.0470224257449346e-06, + "loss": 0.6431, + "step": 58580 + }, + { + "epoch": 1.5, + "learning_rate": 1.0469947858811575e-06, + "loss": 0.4226, + "step": 58581 + }, + { + "epoch": 1.5, + "learning_rate": 1.046967145981398e-06, + "loss": 0.6553, + "step": 58582 + }, + { + "epoch": 1.5, + "learning_rate": 1.0469395060456784e-06, + "loss": 0.5879, + "step": 58583 + }, + { + "epoch": 1.5, + "learning_rate": 1.0469118660740194e-06, + "loss": 0.5923, + "step": 58584 + }, + { + "epoch": 1.5, + "learning_rate": 1.046884226066442e-06, + "loss": 0.6768, + "step": 58585 + }, + { + "epoch": 1.5, + "learning_rate": 1.0468565860229675e-06, + "loss": 0.6377, + "step": 58586 + }, + { + "epoch": 1.5, + "learning_rate": 1.046828945943617e-06, + "loss": 0.6074, + "step": 58587 + }, + { + "epoch": 1.5, + "learning_rate": 1.046801305828412e-06, + "loss": 0.5229, + "step": 58588 + }, + { + "epoch": 1.5, + "learning_rate": 1.046773665677373e-06, + "loss": 0.6621, + "step": 58589 + }, + { + "epoch": 1.5, + "learning_rate": 1.0467460254905221e-06, + "loss": 0.7012, + "step": 58590 + }, + { + "epoch": 1.5, + "learning_rate": 1.0467183852678794e-06, + "loss": 0.6479, + "step": 58591 + }, + { + "epoch": 1.5, + "learning_rate": 1.046690745009467e-06, + "loss": 0.7725, + "step": 58592 + }, + { + "epoch": 1.5, + "learning_rate": 1.0466631047153052e-06, + "loss": 0.4902, + "step": 58593 + }, + { + "epoch": 1.5, + "learning_rate": 1.046635464385416e-06, + "loss": 0.6245, + "step": 58594 + }, + { + "epoch": 1.5, + "learning_rate": 1.04660782401982e-06, + "loss": 0.6846, + "step": 58595 + }, + { + "epoch": 1.5, + "learning_rate": 1.0465801836185387e-06, + "loss": 0.7529, + "step": 58596 + }, + { + "epoch": 1.5, + "learning_rate": 1.0465525431815926e-06, + "loss": 0.6401, + "step": 58597 + }, + { + "epoch": 1.5, + "learning_rate": 1.0465249027090038e-06, + "loss": 0.5767, + "step": 58598 + }, + { + "epoch": 1.5, + "learning_rate": 1.046497262200793e-06, + "loss": 0.4673, + "step": 58599 + }, + { + "epoch": 1.5, + "learning_rate": 1.0464696216569813e-06, + "loss": 0.752, + "step": 58600 + }, + { + "epoch": 1.5, + "learning_rate": 1.0464419810775899e-06, + "loss": 0.6152, + "step": 58601 + }, + { + "epoch": 1.5, + "learning_rate": 1.04641434046264e-06, + "loss": 0.605, + "step": 58602 + }, + { + "epoch": 1.5, + "learning_rate": 1.0463866998121527e-06, + "loss": 0.5776, + "step": 58603 + }, + { + "epoch": 1.5, + "learning_rate": 1.0463590591261496e-06, + "loss": 0.5586, + "step": 58604 + }, + { + "epoch": 1.5, + "learning_rate": 1.0463314184046512e-06, + "loss": 0.4041, + "step": 58605 + }, + { + "epoch": 1.5, + "learning_rate": 1.0463037776476792e-06, + "loss": 0.7783, + "step": 58606 + }, + { + "epoch": 1.5, + "learning_rate": 1.0462761368552541e-06, + "loss": 0.6953, + "step": 58607 + }, + { + "epoch": 1.5, + "learning_rate": 1.046248496027398e-06, + "loss": 0.7861, + "step": 58608 + }, + { + "epoch": 1.5, + "learning_rate": 1.0462208551641313e-06, + "loss": 0.6387, + "step": 58609 + }, + { + "epoch": 1.5, + "learning_rate": 1.0461932142654751e-06, + "loss": 0.6382, + "step": 58610 + }, + { + "epoch": 1.5, + "learning_rate": 1.0461655733314514e-06, + "loss": 0.5511, + "step": 58611 + }, + { + "epoch": 1.5, + "learning_rate": 1.0461379323620805e-06, + "loss": 0.4585, + "step": 58612 + }, + { + "epoch": 1.5, + "learning_rate": 1.0461102913573841e-06, + "loss": 0.5942, + "step": 58613 + }, + { + "epoch": 1.5, + "learning_rate": 1.0460826503173832e-06, + "loss": 0.6455, + "step": 58614 + }, + { + "epoch": 1.5, + "learning_rate": 1.046055009242099e-06, + "loss": 0.4969, + "step": 58615 + }, + { + "epoch": 1.5, + "learning_rate": 1.046027368131552e-06, + "loss": 0.7148, + "step": 58616 + }, + { + "epoch": 1.5, + "learning_rate": 1.0459997269857645e-06, + "loss": 0.7793, + "step": 58617 + }, + { + "epoch": 1.5, + "learning_rate": 1.045972085804757e-06, + "loss": 0.7383, + "step": 58618 + }, + { + "epoch": 1.5, + "learning_rate": 1.0459444445885512e-06, + "loss": 0.8477, + "step": 58619 + }, + { + "epoch": 1.5, + "learning_rate": 1.0459168033371673e-06, + "loss": 0.6484, + "step": 58620 + }, + { + "epoch": 1.5, + "learning_rate": 1.0458891620506272e-06, + "loss": 0.542, + "step": 58621 + }, + { + "epoch": 1.5, + "learning_rate": 1.0458615207289519e-06, + "loss": 0.6753, + "step": 58622 + }, + { + "epoch": 1.5, + "learning_rate": 1.0458338793721623e-06, + "loss": 0.5867, + "step": 58623 + }, + { + "epoch": 1.5, + "learning_rate": 1.0458062379802802e-06, + "loss": 0.6304, + "step": 58624 + }, + { + "epoch": 1.5, + "learning_rate": 1.0457785965533263e-06, + "loss": 0.6479, + "step": 58625 + }, + { + "epoch": 1.5, + "learning_rate": 1.0457509550913215e-06, + "loss": 0.6113, + "step": 58626 + }, + { + "epoch": 1.5, + "learning_rate": 1.0457233135942876e-06, + "loss": 0.4907, + "step": 58627 + }, + { + "epoch": 1.5, + "learning_rate": 1.0456956720622452e-06, + "loss": 0.6377, + "step": 58628 + }, + { + "epoch": 1.5, + "learning_rate": 1.045668030495216e-06, + "loss": 0.644, + "step": 58629 + }, + { + "epoch": 1.5, + "learning_rate": 1.0456403888932208e-06, + "loss": 0.6152, + "step": 58630 + }, + { + "epoch": 1.5, + "learning_rate": 1.0456127472562808e-06, + "loss": 0.5205, + "step": 58631 + }, + { + "epoch": 1.5, + "learning_rate": 1.0455851055844174e-06, + "loss": 0.6992, + "step": 58632 + }, + { + "epoch": 1.5, + "learning_rate": 1.0455574638776514e-06, + "loss": 0.7256, + "step": 58633 + }, + { + "epoch": 1.5, + "learning_rate": 1.0455298221360042e-06, + "loss": 0.8281, + "step": 58634 + }, + { + "epoch": 1.5, + "learning_rate": 1.0455021803594967e-06, + "loss": 0.6875, + "step": 58635 + }, + { + "epoch": 1.5, + "learning_rate": 1.0454745385481508e-06, + "loss": 0.6885, + "step": 58636 + }, + { + "epoch": 1.5, + "learning_rate": 1.0454468967019864e-06, + "loss": 0.5, + "step": 58637 + }, + { + "epoch": 1.5, + "learning_rate": 1.0454192548210258e-06, + "loss": 0.6284, + "step": 58638 + }, + { + "epoch": 1.5, + "learning_rate": 1.04539161290529e-06, + "loss": 0.5679, + "step": 58639 + }, + { + "epoch": 1.5, + "learning_rate": 1.0453639709547996e-06, + "loss": 0.748, + "step": 58640 + }, + { + "epoch": 1.5, + "learning_rate": 1.0453363289695762e-06, + "loss": 0.6392, + "step": 58641 + }, + { + "epoch": 1.5, + "learning_rate": 1.0453086869496408e-06, + "loss": 0.6943, + "step": 58642 + }, + { + "epoch": 1.5, + "learning_rate": 1.0452810448950146e-06, + "loss": 0.5957, + "step": 58643 + }, + { + "epoch": 1.5, + "learning_rate": 1.0452534028057193e-06, + "loss": 0.7393, + "step": 58644 + }, + { + "epoch": 1.5, + "learning_rate": 1.045225760681775e-06, + "loss": 0.4663, + "step": 58645 + }, + { + "epoch": 1.5, + "learning_rate": 1.0451981185232035e-06, + "loss": 0.6797, + "step": 58646 + }, + { + "epoch": 1.5, + "learning_rate": 1.0451704763300256e-06, + "loss": 0.7051, + "step": 58647 + }, + { + "epoch": 1.5, + "learning_rate": 1.0451428341022633e-06, + "loss": 0.8662, + "step": 58648 + }, + { + "epoch": 1.5, + "learning_rate": 1.0451151918399368e-06, + "loss": 0.7617, + "step": 58649 + }, + { + "epoch": 1.5, + "learning_rate": 1.045087549543068e-06, + "loss": 0.6284, + "step": 58650 + }, + { + "epoch": 1.5, + "learning_rate": 1.0450599072116774e-06, + "loss": 0.8438, + "step": 58651 + }, + { + "epoch": 1.5, + "learning_rate": 1.0450322648457868e-06, + "loss": 0.4927, + "step": 58652 + }, + { + "epoch": 1.5, + "learning_rate": 1.0450046224454167e-06, + "loss": 0.7959, + "step": 58653 + }, + { + "epoch": 1.5, + "learning_rate": 1.044976980010589e-06, + "loss": 0.5374, + "step": 58654 + }, + { + "epoch": 1.5, + "learning_rate": 1.0449493375413242e-06, + "loss": 0.4966, + "step": 58655 + }, + { + "epoch": 1.5, + "learning_rate": 1.0449216950376438e-06, + "loss": 0.6406, + "step": 58656 + }, + { + "epoch": 1.5, + "learning_rate": 1.0448940524995692e-06, + "loss": 0.6553, + "step": 58657 + }, + { + "epoch": 1.5, + "learning_rate": 1.0448664099271211e-06, + "loss": 0.6963, + "step": 58658 + }, + { + "epoch": 1.5, + "learning_rate": 1.044838767320321e-06, + "loss": 0.7666, + "step": 58659 + }, + { + "epoch": 1.5, + "learning_rate": 1.0448111246791898e-06, + "loss": 0.7393, + "step": 58660 + }, + { + "epoch": 1.5, + "learning_rate": 1.0447834820037487e-06, + "loss": 0.7441, + "step": 58661 + }, + { + "epoch": 1.5, + "learning_rate": 1.044755839294019e-06, + "loss": 0.7148, + "step": 58662 + }, + { + "epoch": 1.5, + "learning_rate": 1.044728196550022e-06, + "loss": 0.5586, + "step": 58663 + }, + { + "epoch": 1.5, + "learning_rate": 1.0447005537717784e-06, + "loss": 0.8389, + "step": 58664 + }, + { + "epoch": 1.5, + "learning_rate": 1.0446729109593098e-06, + "loss": 0.6426, + "step": 58665 + }, + { + "epoch": 1.5, + "learning_rate": 1.044645268112637e-06, + "loss": 0.5996, + "step": 58666 + }, + { + "epoch": 1.5, + "learning_rate": 1.0446176252317815e-06, + "loss": 0.5227, + "step": 58667 + }, + { + "epoch": 1.5, + "learning_rate": 1.0445899823167645e-06, + "loss": 0.575, + "step": 58668 + }, + { + "epoch": 1.5, + "learning_rate": 1.044562339367607e-06, + "loss": 0.5474, + "step": 58669 + }, + { + "epoch": 1.5, + "learning_rate": 1.0445346963843297e-06, + "loss": 0.7422, + "step": 58670 + }, + { + "epoch": 1.5, + "learning_rate": 1.044507053366955e-06, + "loss": 0.6772, + "step": 58671 + }, + { + "epoch": 1.5, + "learning_rate": 1.0444794103155026e-06, + "loss": 0.5298, + "step": 58672 + }, + { + "epoch": 1.5, + "learning_rate": 1.0444517672299946e-06, + "loss": 0.625, + "step": 58673 + }, + { + "epoch": 1.5, + "learning_rate": 1.0444241241104522e-06, + "loss": 0.5879, + "step": 58674 + }, + { + "epoch": 1.5, + "learning_rate": 1.0443964809568957e-06, + "loss": 0.3336, + "step": 58675 + }, + { + "epoch": 1.5, + "learning_rate": 1.0443688377693472e-06, + "loss": 0.4768, + "step": 58676 + }, + { + "epoch": 1.5, + "learning_rate": 1.0443411945478273e-06, + "loss": 0.4497, + "step": 58677 + }, + { + "epoch": 1.5, + "learning_rate": 1.044313551292358e-06, + "loss": 0.6851, + "step": 58678 + }, + { + "epoch": 1.5, + "learning_rate": 1.0442859080029593e-06, + "loss": 0.5322, + "step": 58679 + }, + { + "epoch": 1.5, + "learning_rate": 1.0442582646796532e-06, + "loss": 0.6367, + "step": 58680 + }, + { + "epoch": 1.5, + "learning_rate": 1.0442306213224603e-06, + "loss": 0.7881, + "step": 58681 + }, + { + "epoch": 1.5, + "learning_rate": 1.044202977931402e-06, + "loss": 0.7305, + "step": 58682 + }, + { + "epoch": 1.5, + "learning_rate": 1.0441753345064999e-06, + "loss": 0.8281, + "step": 58683 + }, + { + "epoch": 1.5, + "learning_rate": 1.0441476910477748e-06, + "loss": 0.5469, + "step": 58684 + }, + { + "epoch": 1.5, + "learning_rate": 1.0441200475552473e-06, + "loss": 0.7891, + "step": 58685 + }, + { + "epoch": 1.5, + "learning_rate": 1.0440924040289396e-06, + "loss": 0.5791, + "step": 58686 + }, + { + "epoch": 1.5, + "learning_rate": 1.044064760468872e-06, + "loss": 0.6631, + "step": 58687 + }, + { + "epoch": 1.5, + "learning_rate": 1.0440371168750666e-06, + "loss": 0.6055, + "step": 58688 + }, + { + "epoch": 1.5, + "learning_rate": 1.0440094732475435e-06, + "loss": 0.5894, + "step": 58689 + }, + { + "epoch": 1.5, + "learning_rate": 1.0439818295863246e-06, + "loss": 0.7217, + "step": 58690 + }, + { + "epoch": 1.5, + "learning_rate": 1.0439541858914306e-06, + "loss": 0.5195, + "step": 58691 + }, + { + "epoch": 1.5, + "learning_rate": 1.0439265421628832e-06, + "loss": 0.582, + "step": 58692 + }, + { + "epoch": 1.5, + "learning_rate": 1.043898898400703e-06, + "loss": 0.6084, + "step": 58693 + }, + { + "epoch": 1.5, + "learning_rate": 1.0438712546049115e-06, + "loss": 0.5107, + "step": 58694 + }, + { + "epoch": 1.5, + "learning_rate": 1.04384361077553e-06, + "loss": 0.6006, + "step": 58695 + }, + { + "epoch": 1.5, + "learning_rate": 1.0438159669125795e-06, + "loss": 0.5933, + "step": 58696 + }, + { + "epoch": 1.5, + "learning_rate": 1.0437883230160807e-06, + "loss": 0.6284, + "step": 58697 + }, + { + "epoch": 1.5, + "learning_rate": 1.0437606790860554e-06, + "loss": 0.6001, + "step": 58698 + }, + { + "epoch": 1.5, + "learning_rate": 1.0437330351225247e-06, + "loss": 0.6201, + "step": 58699 + }, + { + "epoch": 1.5, + "learning_rate": 1.0437053911255093e-06, + "loss": 0.6279, + "step": 58700 + }, + { + "epoch": 1.5, + "learning_rate": 1.043677747095031e-06, + "loss": 0.6069, + "step": 58701 + }, + { + "epoch": 1.5, + "learning_rate": 1.0436501030311105e-06, + "loss": 0.6455, + "step": 58702 + }, + { + "epoch": 1.5, + "learning_rate": 1.0436224589337695e-06, + "loss": 0.5942, + "step": 58703 + }, + { + "epoch": 1.5, + "learning_rate": 1.0435948148030282e-06, + "loss": 0.6689, + "step": 58704 + }, + { + "epoch": 1.5, + "learning_rate": 1.0435671706389089e-06, + "loss": 0.5508, + "step": 58705 + }, + { + "epoch": 1.5, + "learning_rate": 1.0435395264414317e-06, + "loss": 0.6914, + "step": 58706 + }, + { + "epoch": 1.5, + "learning_rate": 1.0435118822106185e-06, + "loss": 0.7178, + "step": 58707 + }, + { + "epoch": 1.5, + "learning_rate": 1.0434842379464906e-06, + "loss": 0.5938, + "step": 58708 + }, + { + "epoch": 1.5, + "learning_rate": 1.0434565936490685e-06, + "loss": 0.6025, + "step": 58709 + }, + { + "epoch": 1.5, + "learning_rate": 1.0434289493183738e-06, + "loss": 0.7324, + "step": 58710 + }, + { + "epoch": 1.5, + "learning_rate": 1.0434013049544273e-06, + "loss": 0.5627, + "step": 58711 + }, + { + "epoch": 1.5, + "learning_rate": 1.0433736605572505e-06, + "loss": 0.7178, + "step": 58712 + }, + { + "epoch": 1.5, + "learning_rate": 1.0433460161268649e-06, + "loss": 0.6475, + "step": 58713 + }, + { + "epoch": 1.5, + "learning_rate": 1.0433183716632908e-06, + "loss": 0.6699, + "step": 58714 + }, + { + "epoch": 1.5, + "learning_rate": 1.04329072716655e-06, + "loss": 0.7461, + "step": 58715 + }, + { + "epoch": 1.5, + "learning_rate": 1.0432630826366632e-06, + "loss": 0.6836, + "step": 58716 + }, + { + "epoch": 1.5, + "learning_rate": 1.043235438073652e-06, + "loss": 0.7227, + "step": 58717 + }, + { + "epoch": 1.5, + "learning_rate": 1.0432077934775377e-06, + "loss": 0.6362, + "step": 58718 + }, + { + "epoch": 1.5, + "learning_rate": 1.0431801488483408e-06, + "loss": 0.689, + "step": 58719 + }, + { + "epoch": 1.51, + "learning_rate": 1.0431525041860829e-06, + "loss": 0.6157, + "step": 58720 + }, + { + "epoch": 1.51, + "learning_rate": 1.0431248594907852e-06, + "loss": 0.792, + "step": 58721 + }, + { + "epoch": 1.51, + "learning_rate": 1.0430972147624686e-06, + "loss": 0.6973, + "step": 58722 + }, + { + "epoch": 1.51, + "learning_rate": 1.0430695700011547e-06, + "loss": 0.6572, + "step": 58723 + }, + { + "epoch": 1.51, + "learning_rate": 1.0430419252068644e-06, + "loss": 0.7617, + "step": 58724 + }, + { + "epoch": 1.51, + "learning_rate": 1.0430142803796187e-06, + "loss": 0.5459, + "step": 58725 + }, + { + "epoch": 1.51, + "learning_rate": 1.0429866355194393e-06, + "loss": 0.7461, + "step": 58726 + }, + { + "epoch": 1.51, + "learning_rate": 1.0429589906263465e-06, + "loss": 0.6611, + "step": 58727 + }, + { + "epoch": 1.51, + "learning_rate": 1.0429313457003625e-06, + "loss": 0.6047, + "step": 58728 + }, + { + "epoch": 1.51, + "learning_rate": 1.0429037007415075e-06, + "loss": 0.4412, + "step": 58729 + }, + { + "epoch": 1.51, + "learning_rate": 1.0428760557498034e-06, + "loss": 0.6816, + "step": 58730 + }, + { + "epoch": 1.51, + "learning_rate": 1.042848410725271e-06, + "loss": 0.667, + "step": 58731 + }, + { + "epoch": 1.51, + "learning_rate": 1.0428207656679313e-06, + "loss": 0.7041, + "step": 58732 + }, + { + "epoch": 1.51, + "learning_rate": 1.042793120577806e-06, + "loss": 0.6924, + "step": 58733 + }, + { + "epoch": 1.51, + "learning_rate": 1.042765475454916e-06, + "loss": 0.8447, + "step": 58734 + }, + { + "epoch": 1.51, + "learning_rate": 1.0427378302992821e-06, + "loss": 0.6641, + "step": 58735 + }, + { + "epoch": 1.51, + "learning_rate": 1.0427101851109261e-06, + "loss": 0.6748, + "step": 58736 + }, + { + "epoch": 1.51, + "learning_rate": 1.0426825398898687e-06, + "loss": 0.5391, + "step": 58737 + }, + { + "epoch": 1.51, + "learning_rate": 1.0426548946361315e-06, + "loss": 0.5601, + "step": 58738 + }, + { + "epoch": 1.51, + "learning_rate": 1.0426272493497353e-06, + "loss": 0.5444, + "step": 58739 + }, + { + "epoch": 1.51, + "learning_rate": 1.0425996040307012e-06, + "loss": 0.5571, + "step": 58740 + }, + { + "epoch": 1.51, + "learning_rate": 1.0425719586790508e-06, + "loss": 0.623, + "step": 58741 + }, + { + "epoch": 1.51, + "learning_rate": 1.0425443132948048e-06, + "loss": 0.6758, + "step": 58742 + }, + { + "epoch": 1.51, + "learning_rate": 1.0425166678779848e-06, + "loss": 0.6143, + "step": 58743 + }, + { + "epoch": 1.51, + "learning_rate": 1.0424890224286115e-06, + "loss": 0.5557, + "step": 58744 + }, + { + "epoch": 1.51, + "learning_rate": 1.0424613769467065e-06, + "loss": 0.6963, + "step": 58745 + }, + { + "epoch": 1.51, + "learning_rate": 1.0424337314322907e-06, + "loss": 0.6445, + "step": 58746 + }, + { + "epoch": 1.51, + "learning_rate": 1.0424060858853852e-06, + "loss": 0.7212, + "step": 58747 + }, + { + "epoch": 1.51, + "learning_rate": 1.0423784403060117e-06, + "loss": 0.6001, + "step": 58748 + }, + { + "epoch": 1.51, + "learning_rate": 1.0423507946941907e-06, + "loss": 0.4915, + "step": 58749 + }, + { + "epoch": 1.51, + "learning_rate": 1.0423231490499436e-06, + "loss": 0.6125, + "step": 58750 + }, + { + "epoch": 1.51, + "learning_rate": 1.0422955033732917e-06, + "loss": 0.6719, + "step": 58751 + }, + { + "epoch": 1.51, + "learning_rate": 1.0422678576642559e-06, + "loss": 0.5439, + "step": 58752 + }, + { + "epoch": 1.51, + "learning_rate": 1.0422402119228579e-06, + "loss": 0.8643, + "step": 58753 + }, + { + "epoch": 1.51, + "learning_rate": 1.042212566149118e-06, + "loss": 0.5845, + "step": 58754 + }, + { + "epoch": 1.51, + "learning_rate": 1.0421849203430584e-06, + "loss": 0.4346, + "step": 58755 + }, + { + "epoch": 1.51, + "learning_rate": 1.0421572745046995e-06, + "loss": 0.8096, + "step": 58756 + }, + { + "epoch": 1.51, + "learning_rate": 1.0421296286340629e-06, + "loss": 0.7412, + "step": 58757 + }, + { + "epoch": 1.51, + "learning_rate": 1.0421019827311694e-06, + "loss": 0.6187, + "step": 58758 + }, + { + "epoch": 1.51, + "learning_rate": 1.0420743367960403e-06, + "loss": 0.5757, + "step": 58759 + }, + { + "epoch": 1.51, + "learning_rate": 1.042046690828697e-06, + "loss": 0.6357, + "step": 58760 + }, + { + "epoch": 1.51, + "learning_rate": 1.0420190448291603e-06, + "loss": 0.7432, + "step": 58761 + }, + { + "epoch": 1.51, + "learning_rate": 1.0419913987974515e-06, + "loss": 0.5493, + "step": 58762 + }, + { + "epoch": 1.51, + "learning_rate": 1.041963752733592e-06, + "loss": 0.6699, + "step": 58763 + }, + { + "epoch": 1.51, + "learning_rate": 1.0419361066376026e-06, + "loss": 0.6797, + "step": 58764 + }, + { + "epoch": 1.51, + "learning_rate": 1.0419084605095048e-06, + "loss": 0.7002, + "step": 58765 + }, + { + "epoch": 1.51, + "learning_rate": 1.0418808143493196e-06, + "loss": 0.6548, + "step": 58766 + }, + { + "epoch": 1.51, + "learning_rate": 1.0418531681570682e-06, + "loss": 0.5938, + "step": 58767 + }, + { + "epoch": 1.51, + "learning_rate": 1.0418255219327718e-06, + "loss": 0.5659, + "step": 58768 + }, + { + "epoch": 1.51, + "learning_rate": 1.0417978756764515e-06, + "loss": 0.6006, + "step": 58769 + }, + { + "epoch": 1.51, + "learning_rate": 1.0417702293881285e-06, + "loss": 0.5493, + "step": 58770 + }, + { + "epoch": 1.51, + "learning_rate": 1.0417425830678237e-06, + "loss": 0.7393, + "step": 58771 + }, + { + "epoch": 1.51, + "learning_rate": 1.041714936715559e-06, + "loss": 0.4741, + "step": 58772 + }, + { + "epoch": 1.51, + "learning_rate": 1.0416872903313548e-06, + "loss": 0.5869, + "step": 58773 + }, + { + "epoch": 1.51, + "learning_rate": 1.0416596439152326e-06, + "loss": 0.7373, + "step": 58774 + }, + { + "epoch": 1.51, + "learning_rate": 1.0416319974672132e-06, + "loss": 0.6943, + "step": 58775 + }, + { + "epoch": 1.51, + "learning_rate": 1.0416043509873186e-06, + "loss": 0.6816, + "step": 58776 + }, + { + "epoch": 1.51, + "learning_rate": 1.041576704475569e-06, + "loss": 0.7051, + "step": 58777 + }, + { + "epoch": 1.51, + "learning_rate": 1.0415490579319866e-06, + "loss": 0.5557, + "step": 58778 + }, + { + "epoch": 1.51, + "learning_rate": 1.0415214113565915e-06, + "loss": 0.447, + "step": 58779 + }, + { + "epoch": 1.51, + "learning_rate": 1.0414937647494058e-06, + "loss": 0.4597, + "step": 58780 + }, + { + "epoch": 1.51, + "learning_rate": 1.0414661181104497e-06, + "loss": 0.6978, + "step": 58781 + }, + { + "epoch": 1.51, + "learning_rate": 1.0414384714397452e-06, + "loss": 0.7979, + "step": 58782 + }, + { + "epoch": 1.51, + "learning_rate": 1.0414108247373131e-06, + "loss": 0.7686, + "step": 58783 + }, + { + "epoch": 1.51, + "learning_rate": 1.0413831780031747e-06, + "loss": 0.6675, + "step": 58784 + }, + { + "epoch": 1.51, + "learning_rate": 1.0413555312373512e-06, + "loss": 0.4761, + "step": 58785 + }, + { + "epoch": 1.51, + "learning_rate": 1.0413278844398636e-06, + "loss": 0.6924, + "step": 58786 + }, + { + "epoch": 1.51, + "learning_rate": 1.041300237610733e-06, + "loss": 0.5234, + "step": 58787 + }, + { + "epoch": 1.51, + "learning_rate": 1.041272590749981e-06, + "loss": 0.7031, + "step": 58788 + }, + { + "epoch": 1.51, + "learning_rate": 1.0412449438576282e-06, + "loss": 0.6709, + "step": 58789 + }, + { + "epoch": 1.51, + "learning_rate": 1.0412172969336958e-06, + "loss": 0.6411, + "step": 58790 + }, + { + "epoch": 1.51, + "learning_rate": 1.0411896499782059e-06, + "loss": 0.7988, + "step": 58791 + }, + { + "epoch": 1.51, + "learning_rate": 1.0411620029911784e-06, + "loss": 0.6035, + "step": 58792 + }, + { + "epoch": 1.51, + "learning_rate": 1.0411343559726355e-06, + "loss": 0.5701, + "step": 58793 + }, + { + "epoch": 1.51, + "learning_rate": 1.0411067089225975e-06, + "loss": 0.4143, + "step": 58794 + }, + { + "epoch": 1.51, + "learning_rate": 1.0410790618410864e-06, + "loss": 0.4883, + "step": 58795 + }, + { + "epoch": 1.51, + "learning_rate": 1.0410514147281225e-06, + "loss": 0.5679, + "step": 58796 + }, + { + "epoch": 1.51, + "learning_rate": 1.0410237675837277e-06, + "loss": 0.625, + "step": 58797 + }, + { + "epoch": 1.51, + "learning_rate": 1.0409961204079228e-06, + "loss": 0.5234, + "step": 58798 + }, + { + "epoch": 1.51, + "learning_rate": 1.0409684732007292e-06, + "loss": 0.5459, + "step": 58799 + }, + { + "epoch": 1.51, + "learning_rate": 1.0409408259621674e-06, + "loss": 0.8066, + "step": 58800 + }, + { + "epoch": 1.51, + "learning_rate": 1.0409131786922597e-06, + "loss": 0.7163, + "step": 58801 + }, + { + "epoch": 1.51, + "learning_rate": 1.0408855313910264e-06, + "loss": 0.6812, + "step": 58802 + }, + { + "epoch": 1.51, + "learning_rate": 1.040857884058489e-06, + "loss": 0.7236, + "step": 58803 + }, + { + "epoch": 1.51, + "learning_rate": 1.0408302366946687e-06, + "loss": 0.5183, + "step": 58804 + }, + { + "epoch": 1.51, + "learning_rate": 1.0408025892995865e-06, + "loss": 0.7773, + "step": 58805 + }, + { + "epoch": 1.51, + "learning_rate": 1.0407749418732633e-06, + "loss": 0.6299, + "step": 58806 + }, + { + "epoch": 1.51, + "learning_rate": 1.0407472944157209e-06, + "loss": 0.6924, + "step": 58807 + }, + { + "epoch": 1.51, + "learning_rate": 1.0407196469269803e-06, + "loss": 0.3357, + "step": 58808 + }, + { + "epoch": 1.51, + "learning_rate": 1.0406919994070622e-06, + "loss": 0.6499, + "step": 58809 + }, + { + "epoch": 1.51, + "learning_rate": 1.0406643518559884e-06, + "loss": 0.647, + "step": 58810 + }, + { + "epoch": 1.51, + "learning_rate": 1.0406367042737797e-06, + "loss": 0.5857, + "step": 58811 + }, + { + "epoch": 1.51, + "learning_rate": 1.040609056660457e-06, + "loss": 0.6133, + "step": 58812 + }, + { + "epoch": 1.51, + "learning_rate": 1.0405814090160422e-06, + "loss": 0.502, + "step": 58813 + }, + { + "epoch": 1.51, + "learning_rate": 1.040553761340556e-06, + "loss": 0.6597, + "step": 58814 + }, + { + "epoch": 1.51, + "learning_rate": 1.0405261136340198e-06, + "loss": 0.8496, + "step": 58815 + }, + { + "epoch": 1.51, + "learning_rate": 1.0404984658964544e-06, + "loss": 0.7432, + "step": 58816 + }, + { + "epoch": 1.51, + "learning_rate": 1.0404708181278813e-06, + "loss": 0.4575, + "step": 58817 + }, + { + "epoch": 1.51, + "learning_rate": 1.0404431703283215e-06, + "loss": 0.8276, + "step": 58818 + }, + { + "epoch": 1.51, + "learning_rate": 1.0404155224977962e-06, + "loss": 0.6177, + "step": 58819 + }, + { + "epoch": 1.51, + "learning_rate": 1.0403878746363268e-06, + "loss": 0.5623, + "step": 58820 + }, + { + "epoch": 1.51, + "learning_rate": 1.040360226743934e-06, + "loss": 0.709, + "step": 58821 + }, + { + "epoch": 1.51, + "learning_rate": 1.0403325788206394e-06, + "loss": 0.7061, + "step": 58822 + }, + { + "epoch": 1.51, + "learning_rate": 1.040304930866464e-06, + "loss": 0.792, + "step": 58823 + }, + { + "epoch": 1.51, + "learning_rate": 1.0402772828814288e-06, + "loss": 0.5425, + "step": 58824 + }, + { + "epoch": 1.51, + "learning_rate": 1.040249634865555e-06, + "loss": 0.395, + "step": 58825 + }, + { + "epoch": 1.51, + "learning_rate": 1.0402219868188644e-06, + "loss": 0.6372, + "step": 58826 + }, + { + "epoch": 1.51, + "learning_rate": 1.0401943387413772e-06, + "loss": 0.6089, + "step": 58827 + }, + { + "epoch": 1.51, + "learning_rate": 1.0401666906331153e-06, + "loss": 0.6021, + "step": 58828 + }, + { + "epoch": 1.51, + "learning_rate": 1.0401390424940997e-06, + "loss": 0.6641, + "step": 58829 + }, + { + "epoch": 1.51, + "learning_rate": 1.0401113943243512e-06, + "loss": 0.7764, + "step": 58830 + }, + { + "epoch": 1.51, + "learning_rate": 1.0400837461238914e-06, + "loss": 0.6777, + "step": 58831 + }, + { + "epoch": 1.51, + "learning_rate": 1.0400560978927413e-06, + "loss": 0.7568, + "step": 58832 + }, + { + "epoch": 1.51, + "learning_rate": 1.0400284496309222e-06, + "loss": 0.6602, + "step": 58833 + }, + { + "epoch": 1.51, + "learning_rate": 1.040000801338455e-06, + "loss": 0.5764, + "step": 58834 + }, + { + "epoch": 1.51, + "learning_rate": 1.039973153015361e-06, + "loss": 0.5654, + "step": 58835 + }, + { + "epoch": 1.51, + "learning_rate": 1.0399455046616614e-06, + "loss": 0.7085, + "step": 58836 + }, + { + "epoch": 1.51, + "learning_rate": 1.0399178562773776e-06, + "loss": 0.6724, + "step": 58837 + }, + { + "epoch": 1.51, + "learning_rate": 1.0398902078625304e-06, + "loss": 0.6396, + "step": 58838 + }, + { + "epoch": 1.51, + "learning_rate": 1.039862559417141e-06, + "loss": 0.6582, + "step": 58839 + }, + { + "epoch": 1.51, + "learning_rate": 1.0398349109412308e-06, + "loss": 0.5049, + "step": 58840 + }, + { + "epoch": 1.51, + "learning_rate": 1.0398072624348206e-06, + "loss": 0.6309, + "step": 58841 + }, + { + "epoch": 1.51, + "learning_rate": 1.039779613897932e-06, + "loss": 0.5654, + "step": 58842 + }, + { + "epoch": 1.51, + "learning_rate": 1.0397519653305863e-06, + "loss": 0.7061, + "step": 58843 + }, + { + "epoch": 1.51, + "learning_rate": 1.0397243167328039e-06, + "loss": 0.6509, + "step": 58844 + }, + { + "epoch": 1.51, + "learning_rate": 1.0396966681046064e-06, + "loss": 0.5732, + "step": 58845 + }, + { + "epoch": 1.51, + "learning_rate": 1.039669019446015e-06, + "loss": 0.7031, + "step": 58846 + }, + { + "epoch": 1.51, + "learning_rate": 1.039641370757051e-06, + "loss": 0.6846, + "step": 58847 + }, + { + "epoch": 1.51, + "learning_rate": 1.0396137220377357e-06, + "loss": 0.7227, + "step": 58848 + }, + { + "epoch": 1.51, + "learning_rate": 1.0395860732880896e-06, + "loss": 0.5596, + "step": 58849 + }, + { + "epoch": 1.51, + "learning_rate": 1.0395584245081344e-06, + "loss": 0.6084, + "step": 58850 + }, + { + "epoch": 1.51, + "learning_rate": 1.039530775697891e-06, + "loss": 0.6816, + "step": 58851 + }, + { + "epoch": 1.51, + "learning_rate": 1.0395031268573808e-06, + "loss": 0.7471, + "step": 58852 + }, + { + "epoch": 1.51, + "learning_rate": 1.0394754779866249e-06, + "loss": 0.7725, + "step": 58853 + }, + { + "epoch": 1.51, + "learning_rate": 1.0394478290856445e-06, + "loss": 0.7041, + "step": 58854 + }, + { + "epoch": 1.51, + "learning_rate": 1.0394201801544604e-06, + "loss": 0.6309, + "step": 58855 + }, + { + "epoch": 1.51, + "learning_rate": 1.0393925311930944e-06, + "loss": 0.6042, + "step": 58856 + }, + { + "epoch": 1.51, + "learning_rate": 1.039364882201567e-06, + "loss": 0.6333, + "step": 58857 + }, + { + "epoch": 1.51, + "learning_rate": 1.0393372331799005e-06, + "loss": 0.5581, + "step": 58858 + }, + { + "epoch": 1.51, + "learning_rate": 1.0393095841281146e-06, + "loss": 0.6211, + "step": 58859 + }, + { + "epoch": 1.51, + "learning_rate": 1.0392819350462312e-06, + "loss": 0.7061, + "step": 58860 + }, + { + "epoch": 1.51, + "learning_rate": 1.0392542859342714e-06, + "loss": 0.6533, + "step": 58861 + }, + { + "epoch": 1.51, + "learning_rate": 1.0392266367922566e-06, + "loss": 0.7119, + "step": 58862 + }, + { + "epoch": 1.51, + "learning_rate": 1.0391989876202079e-06, + "loss": 0.4331, + "step": 58863 + }, + { + "epoch": 1.51, + "learning_rate": 1.0391713384181462e-06, + "loss": 0.7754, + "step": 58864 + }, + { + "epoch": 1.51, + "learning_rate": 1.0391436891860926e-06, + "loss": 0.543, + "step": 58865 + }, + { + "epoch": 1.51, + "learning_rate": 1.0391160399240689e-06, + "loss": 0.6025, + "step": 58866 + }, + { + "epoch": 1.51, + "learning_rate": 1.0390883906320953e-06, + "loss": 0.5815, + "step": 58867 + }, + { + "epoch": 1.51, + "learning_rate": 1.0390607413101942e-06, + "loss": 0.8203, + "step": 58868 + }, + { + "epoch": 1.51, + "learning_rate": 1.0390330919583854e-06, + "loss": 0.7666, + "step": 58869 + }, + { + "epoch": 1.51, + "learning_rate": 1.0390054425766911e-06, + "loss": 0.4297, + "step": 58870 + }, + { + "epoch": 1.51, + "learning_rate": 1.038977793165132e-06, + "loss": 0.4929, + "step": 58871 + }, + { + "epoch": 1.51, + "learning_rate": 1.0389501437237295e-06, + "loss": 0.7275, + "step": 58872 + }, + { + "epoch": 1.51, + "learning_rate": 1.0389224942525047e-06, + "loss": 0.4639, + "step": 58873 + }, + { + "epoch": 1.51, + "learning_rate": 1.0388948447514786e-06, + "loss": 0.7549, + "step": 58874 + }, + { + "epoch": 1.51, + "learning_rate": 1.0388671952206724e-06, + "loss": 0.6816, + "step": 58875 + }, + { + "epoch": 1.51, + "learning_rate": 1.0388395456601077e-06, + "loss": 0.522, + "step": 58876 + }, + { + "epoch": 1.51, + "learning_rate": 1.0388118960698051e-06, + "loss": 0.5254, + "step": 58877 + }, + { + "epoch": 1.51, + "learning_rate": 1.0387842464497863e-06, + "loss": 0.8662, + "step": 58878 + }, + { + "epoch": 1.51, + "learning_rate": 1.038756596800072e-06, + "loss": 0.6333, + "step": 58879 + }, + { + "epoch": 1.51, + "learning_rate": 1.0387289471206835e-06, + "loss": 0.6631, + "step": 58880 + }, + { + "epoch": 1.51, + "learning_rate": 1.038701297411642e-06, + "loss": 0.5488, + "step": 58881 + }, + { + "epoch": 1.51, + "learning_rate": 1.0386736476729686e-06, + "loss": 0.8271, + "step": 58882 + }, + { + "epoch": 1.51, + "learning_rate": 1.0386459979046852e-06, + "loss": 0.6689, + "step": 58883 + }, + { + "epoch": 1.51, + "learning_rate": 1.0386183481068117e-06, + "loss": 0.5718, + "step": 58884 + }, + { + "epoch": 1.51, + "learning_rate": 1.03859069827937e-06, + "loss": 0.5977, + "step": 58885 + }, + { + "epoch": 1.51, + "learning_rate": 1.0385630484223811e-06, + "loss": 0.7012, + "step": 58886 + }, + { + "epoch": 1.51, + "learning_rate": 1.0385353985358665e-06, + "loss": 0.7812, + "step": 58887 + }, + { + "epoch": 1.51, + "learning_rate": 1.0385077486198473e-06, + "loss": 0.6055, + "step": 58888 + }, + { + "epoch": 1.51, + "learning_rate": 1.038480098674344e-06, + "loss": 0.4277, + "step": 58889 + }, + { + "epoch": 1.51, + "learning_rate": 1.0384524486993783e-06, + "loss": 0.6099, + "step": 58890 + }, + { + "epoch": 1.51, + "learning_rate": 1.0384247986949717e-06, + "loss": 0.6855, + "step": 58891 + }, + { + "epoch": 1.51, + "learning_rate": 1.0383971486611447e-06, + "loss": 0.6582, + "step": 58892 + }, + { + "epoch": 1.51, + "learning_rate": 1.0383694985979193e-06, + "loss": 0.5459, + "step": 58893 + }, + { + "epoch": 1.51, + "learning_rate": 1.0383418485053156e-06, + "loss": 0.8086, + "step": 58894 + }, + { + "epoch": 1.51, + "learning_rate": 1.0383141983833552e-06, + "loss": 0.7764, + "step": 58895 + }, + { + "epoch": 1.51, + "learning_rate": 1.0382865482320595e-06, + "loss": 0.6494, + "step": 58896 + }, + { + "epoch": 1.51, + "learning_rate": 1.0382588980514497e-06, + "loss": 0.6357, + "step": 58897 + }, + { + "epoch": 1.51, + "learning_rate": 1.038231247841547e-06, + "loss": 0.8164, + "step": 58898 + }, + { + "epoch": 1.51, + "learning_rate": 1.038203597602372e-06, + "loss": 0.5947, + "step": 58899 + }, + { + "epoch": 1.51, + "learning_rate": 1.0381759473339465e-06, + "loss": 0.5845, + "step": 58900 + }, + { + "epoch": 1.51, + "learning_rate": 1.0381482970362912e-06, + "loss": 0.7598, + "step": 58901 + }, + { + "epoch": 1.51, + "learning_rate": 1.0381206467094276e-06, + "loss": 0.5449, + "step": 58902 + }, + { + "epoch": 1.51, + "learning_rate": 1.038092996353377e-06, + "loss": 0.583, + "step": 58903 + }, + { + "epoch": 1.51, + "learning_rate": 1.0380653459681602e-06, + "loss": 0.6172, + "step": 58904 + }, + { + "epoch": 1.51, + "learning_rate": 1.0380376955537983e-06, + "loss": 0.5488, + "step": 58905 + }, + { + "epoch": 1.51, + "learning_rate": 1.0380100451103129e-06, + "loss": 0.7598, + "step": 58906 + }, + { + "epoch": 1.51, + "learning_rate": 1.037982394637725e-06, + "loss": 0.6421, + "step": 58907 + }, + { + "epoch": 1.51, + "learning_rate": 1.037954744136056e-06, + "loss": 0.623, + "step": 58908 + }, + { + "epoch": 1.51, + "learning_rate": 1.0379270936053261e-06, + "loss": 0.6562, + "step": 58909 + }, + { + "epoch": 1.51, + "learning_rate": 1.0378994430455577e-06, + "loss": 0.7339, + "step": 58910 + }, + { + "epoch": 1.51, + "learning_rate": 1.037871792456771e-06, + "loss": 0.6367, + "step": 58911 + }, + { + "epoch": 1.51, + "learning_rate": 1.0378441418389878e-06, + "loss": 0.4038, + "step": 58912 + }, + { + "epoch": 1.51, + "learning_rate": 1.0378164911922293e-06, + "loss": 0.7139, + "step": 58913 + }, + { + "epoch": 1.51, + "learning_rate": 1.0377888405165165e-06, + "loss": 0.6494, + "step": 58914 + }, + { + "epoch": 1.51, + "learning_rate": 1.03776118981187e-06, + "loss": 0.7012, + "step": 58915 + }, + { + "epoch": 1.51, + "learning_rate": 1.037733539078312e-06, + "loss": 0.5566, + "step": 58916 + }, + { + "epoch": 1.51, + "learning_rate": 1.0377058883158628e-06, + "loss": 0.7109, + "step": 58917 + }, + { + "epoch": 1.51, + "learning_rate": 1.0376782375245444e-06, + "loss": 0.6665, + "step": 58918 + }, + { + "epoch": 1.51, + "learning_rate": 1.0376505867043773e-06, + "loss": 0.5713, + "step": 58919 + }, + { + "epoch": 1.51, + "learning_rate": 1.0376229358553825e-06, + "loss": 0.6099, + "step": 58920 + }, + { + "epoch": 1.51, + "learning_rate": 1.037595284977582e-06, + "loss": 0.626, + "step": 58921 + }, + { + "epoch": 1.51, + "learning_rate": 1.0375676340709963e-06, + "loss": 0.748, + "step": 58922 + }, + { + "epoch": 1.51, + "learning_rate": 1.0375399831356471e-06, + "loss": 0.5571, + "step": 58923 + }, + { + "epoch": 1.51, + "learning_rate": 1.0375123321715547e-06, + "loss": 0.3448, + "step": 58924 + }, + { + "epoch": 1.51, + "learning_rate": 1.0374846811787411e-06, + "loss": 0.6455, + "step": 58925 + }, + { + "epoch": 1.51, + "learning_rate": 1.037457030157227e-06, + "loss": 0.6484, + "step": 58926 + }, + { + "epoch": 1.51, + "learning_rate": 1.0374293791070342e-06, + "loss": 0.4635, + "step": 58927 + }, + { + "epoch": 1.51, + "learning_rate": 1.0374017280281835e-06, + "loss": 0.4885, + "step": 58928 + }, + { + "epoch": 1.51, + "learning_rate": 1.0373740769206958e-06, + "loss": 0.6797, + "step": 58929 + }, + { + "epoch": 1.51, + "learning_rate": 1.0373464257845926e-06, + "loss": 0.7393, + "step": 58930 + }, + { + "epoch": 1.51, + "learning_rate": 1.0373187746198948e-06, + "loss": 0.5806, + "step": 58931 + }, + { + "epoch": 1.51, + "learning_rate": 1.0372911234266235e-06, + "loss": 0.5996, + "step": 58932 + }, + { + "epoch": 1.51, + "learning_rate": 1.0372634722048008e-06, + "loss": 0.6694, + "step": 58933 + }, + { + "epoch": 1.51, + "learning_rate": 1.0372358209544466e-06, + "loss": 0.593, + "step": 58934 + }, + { + "epoch": 1.51, + "learning_rate": 1.0372081696755828e-06, + "loss": 0.8135, + "step": 58935 + }, + { + "epoch": 1.51, + "learning_rate": 1.0371805183682303e-06, + "loss": 0.5583, + "step": 58936 + }, + { + "epoch": 1.51, + "learning_rate": 1.0371528670324105e-06, + "loss": 0.4648, + "step": 58937 + }, + { + "epoch": 1.51, + "learning_rate": 1.0371252156681445e-06, + "loss": 0.7119, + "step": 58938 + }, + { + "epoch": 1.51, + "learning_rate": 1.0370975642754535e-06, + "loss": 0.625, + "step": 58939 + }, + { + "epoch": 1.51, + "learning_rate": 1.0370699128543582e-06, + "loss": 0.6592, + "step": 58940 + }, + { + "epoch": 1.51, + "learning_rate": 1.0370422614048806e-06, + "loss": 0.7065, + "step": 58941 + }, + { + "epoch": 1.51, + "learning_rate": 1.037014609927041e-06, + "loss": 0.791, + "step": 58942 + }, + { + "epoch": 1.51, + "learning_rate": 1.0369869584208616e-06, + "loss": 0.7324, + "step": 58943 + }, + { + "epoch": 1.51, + "learning_rate": 1.0369593068863628e-06, + "loss": 0.6138, + "step": 58944 + }, + { + "epoch": 1.51, + "learning_rate": 1.0369316553235657e-06, + "loss": 0.6787, + "step": 58945 + }, + { + "epoch": 1.51, + "learning_rate": 1.0369040037324918e-06, + "loss": 0.7256, + "step": 58946 + }, + { + "epoch": 1.51, + "learning_rate": 1.0368763521131623e-06, + "loss": 0.6348, + "step": 58947 + }, + { + "epoch": 1.51, + "learning_rate": 1.0368487004655984e-06, + "loss": 0.5908, + "step": 58948 + }, + { + "epoch": 1.51, + "learning_rate": 1.0368210487898208e-06, + "loss": 0.5139, + "step": 58949 + }, + { + "epoch": 1.51, + "learning_rate": 1.0367933970858513e-06, + "loss": 0.8223, + "step": 58950 + }, + { + "epoch": 1.51, + "learning_rate": 1.0367657453537107e-06, + "loss": 0.749, + "step": 58951 + }, + { + "epoch": 1.51, + "learning_rate": 1.0367380935934205e-06, + "loss": 0.5327, + "step": 58952 + }, + { + "epoch": 1.51, + "learning_rate": 1.0367104418050013e-06, + "loss": 0.7568, + "step": 58953 + }, + { + "epoch": 1.51, + "learning_rate": 1.0366827899884746e-06, + "loss": 0.7197, + "step": 58954 + }, + { + "epoch": 1.51, + "learning_rate": 1.0366551381438618e-06, + "loss": 0.6611, + "step": 58955 + }, + { + "epoch": 1.51, + "learning_rate": 1.0366274862711837e-06, + "loss": 0.5527, + "step": 58956 + }, + { + "epoch": 1.51, + "learning_rate": 1.0365998343704617e-06, + "loss": 0.6875, + "step": 58957 + }, + { + "epoch": 1.51, + "learning_rate": 1.036572182441717e-06, + "loss": 0.5715, + "step": 58958 + }, + { + "epoch": 1.51, + "learning_rate": 1.0365445304849703e-06, + "loss": 0.8408, + "step": 58959 + }, + { + "epoch": 1.51, + "learning_rate": 1.0365168785002432e-06, + "loss": 0.7324, + "step": 58960 + }, + { + "epoch": 1.51, + "learning_rate": 1.0364892264875569e-06, + "loss": 0.7148, + "step": 58961 + }, + { + "epoch": 1.51, + "learning_rate": 1.0364615744469326e-06, + "loss": 0.4624, + "step": 58962 + }, + { + "epoch": 1.51, + "learning_rate": 1.0364339223783914e-06, + "loss": 0.5288, + "step": 58963 + }, + { + "epoch": 1.51, + "learning_rate": 1.036406270281954e-06, + "loss": 0.7148, + "step": 58964 + }, + { + "epoch": 1.51, + "learning_rate": 1.0363786181576424e-06, + "loss": 0.6592, + "step": 58965 + }, + { + "epoch": 1.51, + "learning_rate": 1.0363509660054773e-06, + "loss": 0.4767, + "step": 58966 + }, + { + "epoch": 1.51, + "learning_rate": 1.0363233138254799e-06, + "loss": 0.48, + "step": 58967 + }, + { + "epoch": 1.51, + "learning_rate": 1.0362956616176712e-06, + "loss": 0.6265, + "step": 58968 + }, + { + "epoch": 1.51, + "learning_rate": 1.0362680093820729e-06, + "loss": 0.6831, + "step": 58969 + }, + { + "epoch": 1.51, + "learning_rate": 1.0362403571187054e-06, + "loss": 0.4761, + "step": 58970 + }, + { + "epoch": 1.51, + "learning_rate": 1.0362127048275908e-06, + "loss": 0.5173, + "step": 58971 + }, + { + "epoch": 1.51, + "learning_rate": 1.0361850525087497e-06, + "loss": 0.6069, + "step": 58972 + }, + { + "epoch": 1.51, + "learning_rate": 1.0361574001622034e-06, + "loss": 0.6763, + "step": 58973 + }, + { + "epoch": 1.51, + "learning_rate": 1.0361297477879727e-06, + "loss": 0.6943, + "step": 58974 + }, + { + "epoch": 1.51, + "learning_rate": 1.0361020953860795e-06, + "loss": 0.6704, + "step": 58975 + }, + { + "epoch": 1.51, + "learning_rate": 1.0360744429565443e-06, + "loss": 0.7205, + "step": 58976 + }, + { + "epoch": 1.51, + "learning_rate": 1.036046790499389e-06, + "loss": 0.553, + "step": 58977 + }, + { + "epoch": 1.51, + "learning_rate": 1.0360191380146338e-06, + "loss": 0.5498, + "step": 58978 + }, + { + "epoch": 1.51, + "learning_rate": 1.0359914855023007e-06, + "loss": 0.667, + "step": 58979 + }, + { + "epoch": 1.51, + "learning_rate": 1.0359638329624103e-06, + "loss": 0.6484, + "step": 58980 + }, + { + "epoch": 1.51, + "learning_rate": 1.0359361803949844e-06, + "loss": 0.7568, + "step": 58981 + }, + { + "epoch": 1.51, + "learning_rate": 1.0359085278000436e-06, + "loss": 0.6709, + "step": 58982 + }, + { + "epoch": 1.51, + "learning_rate": 1.0358808751776096e-06, + "loss": 0.5903, + "step": 58983 + }, + { + "epoch": 1.51, + "learning_rate": 1.0358532225277028e-06, + "loss": 0.6172, + "step": 58984 + }, + { + "epoch": 1.51, + "learning_rate": 1.0358255698503453e-06, + "loss": 0.6982, + "step": 58985 + }, + { + "epoch": 1.51, + "learning_rate": 1.0357979171455574e-06, + "loss": 0.7168, + "step": 58986 + }, + { + "epoch": 1.51, + "learning_rate": 1.0357702644133608e-06, + "loss": 0.4629, + "step": 58987 + }, + { + "epoch": 1.51, + "learning_rate": 1.0357426116537766e-06, + "loss": 0.6826, + "step": 58988 + }, + { + "epoch": 1.51, + "learning_rate": 1.035714958866826e-06, + "loss": 0.9453, + "step": 58989 + }, + { + "epoch": 1.51, + "learning_rate": 1.03568730605253e-06, + "loss": 0.5552, + "step": 58990 + }, + { + "epoch": 1.51, + "learning_rate": 1.0356596532109099e-06, + "loss": 0.6846, + "step": 58991 + }, + { + "epoch": 1.51, + "learning_rate": 1.035632000341987e-06, + "loss": 0.6904, + "step": 58992 + }, + { + "epoch": 1.51, + "learning_rate": 1.035604347445782e-06, + "loss": 0.6387, + "step": 58993 + }, + { + "epoch": 1.51, + "learning_rate": 1.0355766945223166e-06, + "loss": 0.6504, + "step": 58994 + }, + { + "epoch": 1.51, + "learning_rate": 1.0355490415716115e-06, + "loss": 0.6816, + "step": 58995 + }, + { + "epoch": 1.51, + "learning_rate": 1.0355213885936885e-06, + "loss": 0.7139, + "step": 58996 + }, + { + "epoch": 1.51, + "learning_rate": 1.0354937355885682e-06, + "loss": 0.7217, + "step": 58997 + }, + { + "epoch": 1.51, + "learning_rate": 1.0354660825562722e-06, + "loss": 0.5776, + "step": 58998 + }, + { + "epoch": 1.51, + "learning_rate": 1.0354384294968213e-06, + "loss": 0.8604, + "step": 58999 + }, + { + "epoch": 1.51, + "learning_rate": 1.0354107764102367e-06, + "loss": 0.5859, + "step": 59000 + }, + { + "epoch": 1.51, + "learning_rate": 1.0353831232965398e-06, + "loss": 0.6768, + "step": 59001 + }, + { + "epoch": 1.51, + "learning_rate": 1.035355470155752e-06, + "loss": 0.7119, + "step": 59002 + }, + { + "epoch": 1.51, + "learning_rate": 1.0353278169878934e-06, + "loss": 0.6465, + "step": 59003 + }, + { + "epoch": 1.51, + "learning_rate": 1.0353001637929867e-06, + "loss": 0.666, + "step": 59004 + }, + { + "epoch": 1.51, + "learning_rate": 1.0352725105710515e-06, + "loss": 0.7305, + "step": 59005 + }, + { + "epoch": 1.51, + "learning_rate": 1.0352448573221102e-06, + "loss": 0.5483, + "step": 59006 + }, + { + "epoch": 1.51, + "learning_rate": 1.0352172040461838e-06, + "loss": 0.4958, + "step": 59007 + }, + { + "epoch": 1.51, + "learning_rate": 1.0351895507432926e-06, + "loss": 0.8193, + "step": 59008 + }, + { + "epoch": 1.51, + "learning_rate": 1.0351618974134588e-06, + "loss": 0.5845, + "step": 59009 + }, + { + "epoch": 1.51, + "learning_rate": 1.0351342440567031e-06, + "loss": 0.6748, + "step": 59010 + }, + { + "epoch": 1.51, + "learning_rate": 1.0351065906730465e-06, + "loss": 0.6719, + "step": 59011 + }, + { + "epoch": 1.51, + "learning_rate": 1.0350789372625105e-06, + "loss": 0.6572, + "step": 59012 + }, + { + "epoch": 1.51, + "learning_rate": 1.0350512838251164e-06, + "loss": 0.6953, + "step": 59013 + }, + { + "epoch": 1.51, + "learning_rate": 1.035023630360885e-06, + "loss": 0.6226, + "step": 59014 + }, + { + "epoch": 1.51, + "learning_rate": 1.0349959768698375e-06, + "loss": 0.832, + "step": 59015 + }, + { + "epoch": 1.51, + "learning_rate": 1.0349683233519951e-06, + "loss": 0.6104, + "step": 59016 + }, + { + "epoch": 1.51, + "learning_rate": 1.0349406698073798e-06, + "loss": 0.6606, + "step": 59017 + }, + { + "epoch": 1.51, + "learning_rate": 1.0349130162360111e-06, + "loss": 0.7087, + "step": 59018 + }, + { + "epoch": 1.51, + "learning_rate": 1.0348853626379116e-06, + "loss": 0.6641, + "step": 59019 + }, + { + "epoch": 1.51, + "learning_rate": 1.034857709013102e-06, + "loss": 0.6577, + "step": 59020 + }, + { + "epoch": 1.51, + "learning_rate": 1.0348300553616031e-06, + "loss": 0.6836, + "step": 59021 + }, + { + "epoch": 1.51, + "learning_rate": 1.034802401683437e-06, + "loss": 0.4834, + "step": 59022 + }, + { + "epoch": 1.51, + "learning_rate": 1.034774747978624e-06, + "loss": 0.5962, + "step": 59023 + }, + { + "epoch": 1.51, + "learning_rate": 1.0347470942471851e-06, + "loss": 0.4722, + "step": 59024 + }, + { + "epoch": 1.51, + "learning_rate": 1.0347194404891427e-06, + "loss": 0.5493, + "step": 59025 + }, + { + "epoch": 1.51, + "learning_rate": 1.0346917867045166e-06, + "loss": 0.7251, + "step": 59026 + }, + { + "epoch": 1.51, + "learning_rate": 1.034664132893329e-06, + "loss": 0.6167, + "step": 59027 + }, + { + "epoch": 1.51, + "learning_rate": 1.0346364790556008e-06, + "loss": 0.3945, + "step": 59028 + }, + { + "epoch": 1.51, + "learning_rate": 1.0346088251913527e-06, + "loss": 0.5795, + "step": 59029 + }, + { + "epoch": 1.51, + "learning_rate": 1.0345811713006063e-06, + "loss": 0.7617, + "step": 59030 + }, + { + "epoch": 1.51, + "learning_rate": 1.0345535173833828e-06, + "loss": 0.5449, + "step": 59031 + }, + { + "epoch": 1.51, + "learning_rate": 1.0345258634397032e-06, + "loss": 0.5752, + "step": 59032 + }, + { + "epoch": 1.51, + "learning_rate": 1.0344982094695885e-06, + "loss": 0.3206, + "step": 59033 + }, + { + "epoch": 1.51, + "learning_rate": 1.0344705554730603e-06, + "loss": 0.499, + "step": 59034 + }, + { + "epoch": 1.51, + "learning_rate": 1.0344429014501394e-06, + "loss": 0.6287, + "step": 59035 + }, + { + "epoch": 1.51, + "learning_rate": 1.0344152474008477e-06, + "loss": 0.5454, + "step": 59036 + }, + { + "epoch": 1.51, + "learning_rate": 1.0343875933252054e-06, + "loss": 0.4938, + "step": 59037 + }, + { + "epoch": 1.51, + "learning_rate": 1.0343599392232343e-06, + "loss": 0.7471, + "step": 59038 + }, + { + "epoch": 1.51, + "learning_rate": 1.034332285094955e-06, + "loss": 0.7607, + "step": 59039 + }, + { + "epoch": 1.51, + "learning_rate": 1.0343046309403894e-06, + "loss": 0.4756, + "step": 59040 + }, + { + "epoch": 1.51, + "learning_rate": 1.034276976759558e-06, + "loss": 0.751, + "step": 59041 + }, + { + "epoch": 1.51, + "learning_rate": 1.034249322552483e-06, + "loss": 0.486, + "step": 59042 + }, + { + "epoch": 1.51, + "learning_rate": 1.034221668319184e-06, + "loss": 0.3964, + "step": 59043 + }, + { + "epoch": 1.51, + "learning_rate": 1.0341940140596837e-06, + "loss": 0.5742, + "step": 59044 + }, + { + "epoch": 1.51, + "learning_rate": 1.034166359774002e-06, + "loss": 0.75, + "step": 59045 + }, + { + "epoch": 1.51, + "learning_rate": 1.0341387054621612e-06, + "loss": 0.6084, + "step": 59046 + }, + { + "epoch": 1.51, + "learning_rate": 1.034111051124182e-06, + "loss": 0.4961, + "step": 59047 + }, + { + "epoch": 1.51, + "learning_rate": 1.0340833967600853e-06, + "loss": 0.4958, + "step": 59048 + }, + { + "epoch": 1.51, + "learning_rate": 1.0340557423698922e-06, + "loss": 0.8477, + "step": 59049 + }, + { + "epoch": 1.51, + "learning_rate": 1.0340280879536247e-06, + "loss": 0.5347, + "step": 59050 + }, + { + "epoch": 1.51, + "learning_rate": 1.0340004335113031e-06, + "loss": 0.5879, + "step": 59051 + }, + { + "epoch": 1.51, + "learning_rate": 1.0339727790429492e-06, + "loss": 0.6079, + "step": 59052 + }, + { + "epoch": 1.51, + "learning_rate": 1.033945124548584e-06, + "loss": 0.7197, + "step": 59053 + }, + { + "epoch": 1.51, + "learning_rate": 1.0339174700282282e-06, + "loss": 0.6157, + "step": 59054 + }, + { + "epoch": 1.51, + "learning_rate": 1.0338898154819035e-06, + "loss": 0.5447, + "step": 59055 + }, + { + "epoch": 1.51, + "learning_rate": 1.0338621609096311e-06, + "loss": 0.5352, + "step": 59056 + }, + { + "epoch": 1.51, + "learning_rate": 1.033834506311432e-06, + "loss": 0.8145, + "step": 59057 + }, + { + "epoch": 1.51, + "learning_rate": 1.0338068516873271e-06, + "loss": 0.7109, + "step": 59058 + }, + { + "epoch": 1.51, + "learning_rate": 1.033779197037338e-06, + "loss": 0.7092, + "step": 59059 + }, + { + "epoch": 1.51, + "learning_rate": 1.0337515423614856e-06, + "loss": 0.3816, + "step": 59060 + }, + { + "epoch": 1.51, + "learning_rate": 1.0337238876597913e-06, + "loss": 0.6191, + "step": 59061 + }, + { + "epoch": 1.51, + "learning_rate": 1.0336962329322763e-06, + "loss": 0.6055, + "step": 59062 + }, + { + "epoch": 1.51, + "learning_rate": 1.0336685781789616e-06, + "loss": 0.7471, + "step": 59063 + }, + { + "epoch": 1.51, + "learning_rate": 1.0336409233998682e-06, + "loss": 0.7939, + "step": 59064 + }, + { + "epoch": 1.51, + "learning_rate": 1.0336132685950178e-06, + "loss": 0.7227, + "step": 59065 + }, + { + "epoch": 1.51, + "learning_rate": 1.033585613764431e-06, + "loss": 0.7178, + "step": 59066 + }, + { + "epoch": 1.51, + "learning_rate": 1.0335579589081295e-06, + "loss": 0.6523, + "step": 59067 + }, + { + "epoch": 1.51, + "learning_rate": 1.033530304026134e-06, + "loss": 0.6553, + "step": 59068 + }, + { + "epoch": 1.51, + "learning_rate": 1.033502649118466e-06, + "loss": 0.5977, + "step": 59069 + }, + { + "epoch": 1.51, + "learning_rate": 1.0334749941851464e-06, + "loss": 0.5127, + "step": 59070 + }, + { + "epoch": 1.51, + "learning_rate": 1.0334473392261966e-06, + "loss": 0.5151, + "step": 59071 + }, + { + "epoch": 1.51, + "learning_rate": 1.033419684241638e-06, + "loss": 0.5703, + "step": 59072 + }, + { + "epoch": 1.51, + "learning_rate": 1.033392029231491e-06, + "loss": 0.6982, + "step": 59073 + }, + { + "epoch": 1.51, + "learning_rate": 1.0333643741957776e-06, + "loss": 0.5781, + "step": 59074 + }, + { + "epoch": 1.51, + "learning_rate": 1.0333367191345186e-06, + "loss": 0.7764, + "step": 59075 + }, + { + "epoch": 1.51, + "learning_rate": 1.033309064047735e-06, + "loss": 0.5571, + "step": 59076 + }, + { + "epoch": 1.51, + "learning_rate": 1.0332814089354482e-06, + "loss": 0.4095, + "step": 59077 + }, + { + "epoch": 1.51, + "learning_rate": 1.0332537537976797e-06, + "loss": 0.5781, + "step": 59078 + }, + { + "epoch": 1.51, + "learning_rate": 1.0332260986344498e-06, + "loss": 0.5693, + "step": 59079 + }, + { + "epoch": 1.51, + "learning_rate": 1.0331984434457808e-06, + "loss": 0.7681, + "step": 59080 + }, + { + "epoch": 1.51, + "learning_rate": 1.0331707882316928e-06, + "loss": 0.6602, + "step": 59081 + }, + { + "epoch": 1.51, + "learning_rate": 1.0331431329922077e-06, + "loss": 0.5859, + "step": 59082 + }, + { + "epoch": 1.51, + "learning_rate": 1.0331154777273464e-06, + "loss": 0.7012, + "step": 59083 + }, + { + "epoch": 1.51, + "learning_rate": 1.0330878224371302e-06, + "loss": 0.5232, + "step": 59084 + }, + { + "epoch": 1.51, + "learning_rate": 1.0330601671215797e-06, + "loss": 0.6426, + "step": 59085 + }, + { + "epoch": 1.51, + "learning_rate": 1.033032511780717e-06, + "loss": 0.564, + "step": 59086 + }, + { + "epoch": 1.51, + "learning_rate": 1.0330048564145628e-06, + "loss": 0.7148, + "step": 59087 + }, + { + "epoch": 1.51, + "learning_rate": 1.0329772010231383e-06, + "loss": 0.6733, + "step": 59088 + }, + { + "epoch": 1.51, + "learning_rate": 1.0329495456064645e-06, + "loss": 0.4561, + "step": 59089 + }, + { + "epoch": 1.51, + "learning_rate": 1.032921890164563e-06, + "loss": 0.665, + "step": 59090 + }, + { + "epoch": 1.51, + "learning_rate": 1.0328942346974543e-06, + "loss": 0.5615, + "step": 59091 + }, + { + "epoch": 1.51, + "learning_rate": 1.0328665792051606e-06, + "loss": 0.6008, + "step": 59092 + }, + { + "epoch": 1.51, + "learning_rate": 1.032838923687702e-06, + "loss": 0.5967, + "step": 59093 + }, + { + "epoch": 1.51, + "learning_rate": 1.0328112681451002e-06, + "loss": 0.7822, + "step": 59094 + }, + { + "epoch": 1.51, + "learning_rate": 1.0327836125773763e-06, + "loss": 0.7148, + "step": 59095 + }, + { + "epoch": 1.51, + "learning_rate": 1.0327559569845517e-06, + "loss": 0.5708, + "step": 59096 + }, + { + "epoch": 1.51, + "learning_rate": 1.0327283013666473e-06, + "loss": 0.4622, + "step": 59097 + }, + { + "epoch": 1.51, + "learning_rate": 1.0327006457236842e-06, + "loss": 0.6123, + "step": 59098 + }, + { + "epoch": 1.51, + "learning_rate": 1.0326729900556839e-06, + "loss": 0.5303, + "step": 59099 + }, + { + "epoch": 1.51, + "learning_rate": 1.032645334362667e-06, + "loss": 0.5542, + "step": 59100 + }, + { + "epoch": 1.51, + "learning_rate": 1.0326176786446556e-06, + "loss": 0.7432, + "step": 59101 + }, + { + "epoch": 1.51, + "learning_rate": 1.0325900229016703e-06, + "loss": 0.6323, + "step": 59102 + }, + { + "epoch": 1.51, + "learning_rate": 1.0325623671337321e-06, + "loss": 0.6211, + "step": 59103 + }, + { + "epoch": 1.51, + "learning_rate": 1.0325347113408622e-06, + "loss": 0.6621, + "step": 59104 + }, + { + "epoch": 1.51, + "learning_rate": 1.0325070555230824e-06, + "loss": 0.5962, + "step": 59105 + }, + { + "epoch": 1.51, + "learning_rate": 1.032479399680413e-06, + "loss": 0.397, + "step": 59106 + }, + { + "epoch": 1.51, + "learning_rate": 1.0324517438128764e-06, + "loss": 0.5908, + "step": 59107 + }, + { + "epoch": 1.51, + "learning_rate": 1.0324240879204922e-06, + "loss": 0.6797, + "step": 59108 + }, + { + "epoch": 1.51, + "learning_rate": 1.0323964320032827e-06, + "loss": 0.4375, + "step": 59109 + }, + { + "epoch": 1.52, + "learning_rate": 1.0323687760612685e-06, + "loss": 0.5958, + "step": 59110 + }, + { + "epoch": 1.52, + "learning_rate": 1.0323411200944712e-06, + "loss": 0.7178, + "step": 59111 + }, + { + "epoch": 1.52, + "learning_rate": 1.032313464102912e-06, + "loss": 0.8262, + "step": 59112 + }, + { + "epoch": 1.52, + "learning_rate": 1.0322858080866117e-06, + "loss": 0.665, + "step": 59113 + }, + { + "epoch": 1.52, + "learning_rate": 1.0322581520455912e-06, + "loss": 0.5854, + "step": 59114 + }, + { + "epoch": 1.52, + "learning_rate": 1.0322304959798727e-06, + "loss": 0.6611, + "step": 59115 + }, + { + "epoch": 1.52, + "learning_rate": 1.0322028398894764e-06, + "loss": 0.6816, + "step": 59116 + }, + { + "epoch": 1.52, + "learning_rate": 1.0321751837744241e-06, + "loss": 0.6904, + "step": 59117 + }, + { + "epoch": 1.52, + "learning_rate": 1.0321475276347368e-06, + "loss": 0.6699, + "step": 59118 + }, + { + "epoch": 1.52, + "learning_rate": 1.0321198714704355e-06, + "loss": 0.8008, + "step": 59119 + }, + { + "epoch": 1.52, + "learning_rate": 1.0320922152815415e-06, + "loss": 0.6626, + "step": 59120 + }, + { + "epoch": 1.52, + "learning_rate": 1.0320645590680762e-06, + "loss": 0.5957, + "step": 59121 + }, + { + "epoch": 1.52, + "learning_rate": 1.0320369028300602e-06, + "loss": 0.6807, + "step": 59122 + }, + { + "epoch": 1.52, + "learning_rate": 1.032009246567515e-06, + "loss": 0.5454, + "step": 59123 + }, + { + "epoch": 1.52, + "learning_rate": 1.031981590280462e-06, + "loss": 0.7246, + "step": 59124 + }, + { + "epoch": 1.52, + "learning_rate": 1.0319539339689222e-06, + "loss": 0.7979, + "step": 59125 + }, + { + "epoch": 1.52, + "learning_rate": 1.0319262776329165e-06, + "loss": 0.7246, + "step": 59126 + }, + { + "epoch": 1.52, + "learning_rate": 1.0318986212724666e-06, + "loss": 0.5698, + "step": 59127 + }, + { + "epoch": 1.52, + "learning_rate": 1.0318709648875933e-06, + "loss": 0.4902, + "step": 59128 + }, + { + "epoch": 1.52, + "learning_rate": 1.0318433084783176e-06, + "loss": 0.6577, + "step": 59129 + }, + { + "epoch": 1.52, + "learning_rate": 1.0318156520446613e-06, + "loss": 0.7197, + "step": 59130 + }, + { + "epoch": 1.52, + "learning_rate": 1.0317879955866448e-06, + "loss": 0.541, + "step": 59131 + }, + { + "epoch": 1.52, + "learning_rate": 1.0317603391042901e-06, + "loss": 0.6821, + "step": 59132 + }, + { + "epoch": 1.52, + "learning_rate": 1.0317326825976177e-06, + "loss": 0.5918, + "step": 59133 + }, + { + "epoch": 1.52, + "learning_rate": 1.0317050260666492e-06, + "loss": 0.647, + "step": 59134 + }, + { + "epoch": 1.52, + "learning_rate": 1.0316773695114056e-06, + "loss": 0.626, + "step": 59135 + }, + { + "epoch": 1.52, + "learning_rate": 1.031649712931908e-06, + "loss": 0.5717, + "step": 59136 + }, + { + "epoch": 1.52, + "learning_rate": 1.0316220563281782e-06, + "loss": 0.8037, + "step": 59137 + }, + { + "epoch": 1.52, + "learning_rate": 1.0315943997002363e-06, + "loss": 0.5596, + "step": 59138 + }, + { + "epoch": 1.52, + "learning_rate": 1.031566743048104e-06, + "loss": 0.7393, + "step": 59139 + }, + { + "epoch": 1.52, + "learning_rate": 1.0315390863718027e-06, + "loss": 0.6042, + "step": 59140 + }, + { + "epoch": 1.52, + "learning_rate": 1.0315114296713533e-06, + "loss": 0.5396, + "step": 59141 + }, + { + "epoch": 1.52, + "learning_rate": 1.031483772946777e-06, + "loss": 0.6133, + "step": 59142 + }, + { + "epoch": 1.52, + "learning_rate": 1.031456116198095e-06, + "loss": 0.7832, + "step": 59143 + }, + { + "epoch": 1.52, + "learning_rate": 1.0314284594253285e-06, + "loss": 0.584, + "step": 59144 + }, + { + "epoch": 1.52, + "learning_rate": 1.0314008026284988e-06, + "loss": 0.5825, + "step": 59145 + }, + { + "epoch": 1.52, + "learning_rate": 1.031373145807627e-06, + "loss": 0.7012, + "step": 59146 + }, + { + "epoch": 1.52, + "learning_rate": 1.0313454889627343e-06, + "loss": 0.6699, + "step": 59147 + }, + { + "epoch": 1.52, + "learning_rate": 1.0313178320938414e-06, + "loss": 0.7822, + "step": 59148 + }, + { + "epoch": 1.52, + "learning_rate": 1.03129017520097e-06, + "loss": 0.6641, + "step": 59149 + }, + { + "epoch": 1.52, + "learning_rate": 1.0312625182841412e-06, + "loss": 0.5669, + "step": 59150 + }, + { + "epoch": 1.52, + "learning_rate": 1.031234861343376e-06, + "loss": 0.6372, + "step": 59151 + }, + { + "epoch": 1.52, + "learning_rate": 1.0312072043786962e-06, + "loss": 0.647, + "step": 59152 + }, + { + "epoch": 1.52, + "learning_rate": 1.0311795473901222e-06, + "loss": 0.7285, + "step": 59153 + }, + { + "epoch": 1.52, + "learning_rate": 1.0311518903776752e-06, + "loss": 0.6738, + "step": 59154 + }, + { + "epoch": 1.52, + "learning_rate": 1.031124233341377e-06, + "loss": 0.7423, + "step": 59155 + }, + { + "epoch": 1.52, + "learning_rate": 1.031096576281248e-06, + "loss": 0.488, + "step": 59156 + }, + { + "epoch": 1.52, + "learning_rate": 1.0310689191973104e-06, + "loss": 0.6472, + "step": 59157 + }, + { + "epoch": 1.52, + "learning_rate": 1.031041262089584e-06, + "loss": 0.5801, + "step": 59158 + }, + { + "epoch": 1.52, + "learning_rate": 1.0310136049580912e-06, + "loss": 0.8027, + "step": 59159 + }, + { + "epoch": 1.52, + "learning_rate": 1.0309859478028527e-06, + "loss": 0.6714, + "step": 59160 + }, + { + "epoch": 1.52, + "learning_rate": 1.0309582906238896e-06, + "loss": 0.5713, + "step": 59161 + }, + { + "epoch": 1.52, + "learning_rate": 1.0309306334212231e-06, + "loss": 0.7559, + "step": 59162 + }, + { + "epoch": 1.52, + "learning_rate": 1.0309029761948745e-06, + "loss": 0.7021, + "step": 59163 + }, + { + "epoch": 1.52, + "learning_rate": 1.0308753189448648e-06, + "loss": 0.6689, + "step": 59164 + }, + { + "epoch": 1.52, + "learning_rate": 1.0308476616712155e-06, + "loss": 0.413, + "step": 59165 + }, + { + "epoch": 1.52, + "learning_rate": 1.0308200043739476e-06, + "loss": 0.562, + "step": 59166 + }, + { + "epoch": 1.52, + "learning_rate": 1.0307923470530819e-06, + "loss": 0.6602, + "step": 59167 + }, + { + "epoch": 1.52, + "learning_rate": 1.0307646897086401e-06, + "loss": 0.582, + "step": 59168 + }, + { + "epoch": 1.52, + "learning_rate": 1.0307370323406432e-06, + "loss": 0.6758, + "step": 59169 + }, + { + "epoch": 1.52, + "learning_rate": 1.0307093749491125e-06, + "loss": 0.6299, + "step": 59170 + }, + { + "epoch": 1.52, + "learning_rate": 1.0306817175340687e-06, + "loss": 0.6709, + "step": 59171 + }, + { + "epoch": 1.52, + "learning_rate": 1.0306540600955338e-06, + "loss": 0.6948, + "step": 59172 + }, + { + "epoch": 1.52, + "learning_rate": 1.0306264026335281e-06, + "loss": 0.6172, + "step": 59173 + }, + { + "epoch": 1.52, + "learning_rate": 1.0305987451480736e-06, + "loss": 0.8633, + "step": 59174 + }, + { + "epoch": 1.52, + "learning_rate": 1.0305710876391905e-06, + "loss": 0.6201, + "step": 59175 + }, + { + "epoch": 1.52, + "learning_rate": 1.0305434301069008e-06, + "loss": 0.6465, + "step": 59176 + }, + { + "epoch": 1.52, + "learning_rate": 1.0305157725512255e-06, + "loss": 0.6709, + "step": 59177 + }, + { + "epoch": 1.52, + "learning_rate": 1.0304881149721857e-06, + "loss": 0.564, + "step": 59178 + }, + { + "epoch": 1.52, + "learning_rate": 1.0304604573698022e-06, + "loss": 0.7559, + "step": 59179 + }, + { + "epoch": 1.52, + "learning_rate": 1.0304327997440966e-06, + "loss": 0.5786, + "step": 59180 + }, + { + "epoch": 1.52, + "learning_rate": 1.0304051420950902e-06, + "loss": 0.8828, + "step": 59181 + }, + { + "epoch": 1.52, + "learning_rate": 1.030377484422804e-06, + "loss": 0.6101, + "step": 59182 + }, + { + "epoch": 1.52, + "learning_rate": 1.030349826727259e-06, + "loss": 0.457, + "step": 59183 + }, + { + "epoch": 1.52, + "learning_rate": 1.0303221690084766e-06, + "loss": 0.4658, + "step": 59184 + }, + { + "epoch": 1.52, + "learning_rate": 1.030294511266478e-06, + "loss": 0.4958, + "step": 59185 + }, + { + "epoch": 1.52, + "learning_rate": 1.030266853501284e-06, + "loss": 0.7144, + "step": 59186 + }, + { + "epoch": 1.52, + "learning_rate": 1.0302391957129166e-06, + "loss": 0.7148, + "step": 59187 + }, + { + "epoch": 1.52, + "learning_rate": 1.0302115379013959e-06, + "loss": 0.6216, + "step": 59188 + }, + { + "epoch": 1.52, + "learning_rate": 1.030183880066744e-06, + "loss": 0.7158, + "step": 59189 + }, + { + "epoch": 1.52, + "learning_rate": 1.0301562222089811e-06, + "loss": 0.604, + "step": 59190 + }, + { + "epoch": 1.52, + "learning_rate": 1.0301285643281297e-06, + "loss": 0.6213, + "step": 59191 + }, + { + "epoch": 1.52, + "learning_rate": 1.03010090642421e-06, + "loss": 0.6602, + "step": 59192 + }, + { + "epoch": 1.52, + "learning_rate": 1.0300732484972433e-06, + "loss": 0.6265, + "step": 59193 + }, + { + "epoch": 1.52, + "learning_rate": 1.030045590547251e-06, + "loss": 0.5864, + "step": 59194 + }, + { + "epoch": 1.52, + "learning_rate": 1.030017932574254e-06, + "loss": 0.645, + "step": 59195 + }, + { + "epoch": 1.52, + "learning_rate": 1.0299902745782736e-06, + "loss": 0.6553, + "step": 59196 + }, + { + "epoch": 1.52, + "learning_rate": 1.0299626165593316e-06, + "loss": 0.626, + "step": 59197 + }, + { + "epoch": 1.52, + "learning_rate": 1.029934958517448e-06, + "loss": 0.6113, + "step": 59198 + }, + { + "epoch": 1.52, + "learning_rate": 1.0299073004526448e-06, + "loss": 0.7109, + "step": 59199 + }, + { + "epoch": 1.52, + "learning_rate": 1.0298796423649428e-06, + "loss": 0.6523, + "step": 59200 + }, + { + "epoch": 1.52, + "learning_rate": 1.0298519842543635e-06, + "loss": 0.5427, + "step": 59201 + }, + { + "epoch": 1.52, + "learning_rate": 1.029824326120928e-06, + "loss": 0.7451, + "step": 59202 + }, + { + "epoch": 1.52, + "learning_rate": 1.0297966679646572e-06, + "loss": 0.6885, + "step": 59203 + }, + { + "epoch": 1.52, + "learning_rate": 1.0297690097855724e-06, + "loss": 0.6216, + "step": 59204 + }, + { + "epoch": 1.52, + "learning_rate": 1.029741351583695e-06, + "loss": 0.814, + "step": 59205 + }, + { + "epoch": 1.52, + "learning_rate": 1.0297136933590457e-06, + "loss": 0.5938, + "step": 59206 + }, + { + "epoch": 1.52, + "learning_rate": 1.0296860351116465e-06, + "loss": 0.6626, + "step": 59207 + }, + { + "epoch": 1.52, + "learning_rate": 1.029658376841518e-06, + "loss": 0.7246, + "step": 59208 + }, + { + "epoch": 1.52, + "learning_rate": 1.0296307185486812e-06, + "loss": 0.5972, + "step": 59209 + }, + { + "epoch": 1.52, + "learning_rate": 1.0296030602331574e-06, + "loss": 0.417, + "step": 59210 + }, + { + "epoch": 1.52, + "learning_rate": 1.0295754018949683e-06, + "loss": 0.5449, + "step": 59211 + }, + { + "epoch": 1.52, + "learning_rate": 1.0295477435341344e-06, + "loss": 0.6182, + "step": 59212 + }, + { + "epoch": 1.52, + "learning_rate": 1.0295200851506772e-06, + "loss": 0.637, + "step": 59213 + }, + { + "epoch": 1.52, + "learning_rate": 1.0294924267446179e-06, + "loss": 0.6792, + "step": 59214 + }, + { + "epoch": 1.52, + "learning_rate": 1.0294647683159773e-06, + "loss": 0.7383, + "step": 59215 + }, + { + "epoch": 1.52, + "learning_rate": 1.029437109864777e-06, + "loss": 0.4993, + "step": 59216 + }, + { + "epoch": 1.52, + "learning_rate": 1.0294094513910386e-06, + "loss": 0.7949, + "step": 59217 + }, + { + "epoch": 1.52, + "learning_rate": 1.0293817928947824e-06, + "loss": 0.7422, + "step": 59218 + }, + { + "epoch": 1.52, + "learning_rate": 1.0293541343760294e-06, + "loss": 0.6094, + "step": 59219 + }, + { + "epoch": 1.52, + "learning_rate": 1.0293264758348018e-06, + "loss": 0.5923, + "step": 59220 + }, + { + "epoch": 1.52, + "learning_rate": 1.02929881727112e-06, + "loss": 0.7129, + "step": 59221 + }, + { + "epoch": 1.52, + "learning_rate": 1.029271158685006e-06, + "loss": 0.7036, + "step": 59222 + }, + { + "epoch": 1.52, + "learning_rate": 1.0292435000764802e-06, + "loss": 0.5996, + "step": 59223 + }, + { + "epoch": 1.52, + "learning_rate": 1.029215841445564e-06, + "loss": 0.5718, + "step": 59224 + }, + { + "epoch": 1.52, + "learning_rate": 1.029188182792278e-06, + "loss": 0.583, + "step": 59225 + }, + { + "epoch": 1.52, + "learning_rate": 1.0291605241166443e-06, + "loss": 0.7754, + "step": 59226 + }, + { + "epoch": 1.52, + "learning_rate": 1.0291328654186839e-06, + "loss": 0.5935, + "step": 59227 + }, + { + "epoch": 1.52, + "learning_rate": 1.029105206698418e-06, + "loss": 0.5693, + "step": 59228 + }, + { + "epoch": 1.52, + "learning_rate": 1.0290775479558671e-06, + "loss": 0.6377, + "step": 59229 + }, + { + "epoch": 1.52, + "learning_rate": 1.029049889191053e-06, + "loss": 0.7368, + "step": 59230 + }, + { + "epoch": 1.52, + "learning_rate": 1.0290222304039966e-06, + "loss": 0.666, + "step": 59231 + }, + { + "epoch": 1.52, + "learning_rate": 1.0289945715947195e-06, + "loss": 0.6465, + "step": 59232 + }, + { + "epoch": 1.52, + "learning_rate": 1.0289669127632426e-06, + "loss": 0.7539, + "step": 59233 + }, + { + "epoch": 1.52, + "learning_rate": 1.0289392539095867e-06, + "loss": 0.4158, + "step": 59234 + }, + { + "epoch": 1.52, + "learning_rate": 1.0289115950337736e-06, + "loss": 0.5889, + "step": 59235 + }, + { + "epoch": 1.52, + "learning_rate": 1.028883936135824e-06, + "loss": 0.666, + "step": 59236 + }, + { + "epoch": 1.52, + "learning_rate": 1.0288562772157602e-06, + "loss": 0.7783, + "step": 59237 + }, + { + "epoch": 1.52, + "learning_rate": 1.0288286182736014e-06, + "loss": 0.7754, + "step": 59238 + }, + { + "epoch": 1.52, + "learning_rate": 1.0288009593093703e-06, + "loss": 0.5869, + "step": 59239 + }, + { + "epoch": 1.52, + "learning_rate": 1.0287733003230873e-06, + "loss": 0.5938, + "step": 59240 + }, + { + "epoch": 1.52, + "learning_rate": 1.0287456413147745e-06, + "loss": 0.3835, + "step": 59241 + }, + { + "epoch": 1.52, + "learning_rate": 1.0287179822844523e-06, + "loss": 0.4558, + "step": 59242 + }, + { + "epoch": 1.52, + "learning_rate": 1.0286903232321418e-06, + "loss": 0.5454, + "step": 59243 + }, + { + "epoch": 1.52, + "learning_rate": 1.0286626641578644e-06, + "loss": 0.686, + "step": 59244 + }, + { + "epoch": 1.52, + "learning_rate": 1.0286350050616418e-06, + "loss": 0.6519, + "step": 59245 + }, + { + "epoch": 1.52, + "learning_rate": 1.0286073459434944e-06, + "loss": 0.7227, + "step": 59246 + }, + { + "epoch": 1.52, + "learning_rate": 1.0285796868034436e-06, + "loss": 0.7783, + "step": 59247 + }, + { + "epoch": 1.52, + "learning_rate": 1.0285520276415105e-06, + "loss": 0.4767, + "step": 59248 + }, + { + "epoch": 1.52, + "learning_rate": 1.0285243684577168e-06, + "loss": 0.5996, + "step": 59249 + }, + { + "epoch": 1.52, + "learning_rate": 1.028496709252083e-06, + "loss": 0.6621, + "step": 59250 + }, + { + "epoch": 1.52, + "learning_rate": 1.0284690500246306e-06, + "loss": 0.6318, + "step": 59251 + }, + { + "epoch": 1.52, + "learning_rate": 1.0284413907753811e-06, + "loss": 0.7056, + "step": 59252 + }, + { + "epoch": 1.52, + "learning_rate": 1.0284137315043549e-06, + "loss": 0.7275, + "step": 59253 + }, + { + "epoch": 1.52, + "learning_rate": 1.0283860722115739e-06, + "loss": 0.7529, + "step": 59254 + }, + { + "epoch": 1.52, + "learning_rate": 1.0283584128970588e-06, + "loss": 0.4888, + "step": 59255 + }, + { + "epoch": 1.52, + "learning_rate": 1.0283307535608311e-06, + "loss": 0.5466, + "step": 59256 + }, + { + "epoch": 1.52, + "learning_rate": 1.0283030942029118e-06, + "loss": 0.6221, + "step": 59257 + }, + { + "epoch": 1.52, + "learning_rate": 1.028275434823322e-06, + "loss": 0.5347, + "step": 59258 + }, + { + "epoch": 1.52, + "learning_rate": 1.028247775422083e-06, + "loss": 0.793, + "step": 59259 + }, + { + "epoch": 1.52, + "learning_rate": 1.0282201159992164e-06, + "loss": 0.7051, + "step": 59260 + }, + { + "epoch": 1.52, + "learning_rate": 1.0281924565547425e-06, + "loss": 0.5767, + "step": 59261 + }, + { + "epoch": 1.52, + "learning_rate": 1.0281647970886833e-06, + "loss": 0.7695, + "step": 59262 + }, + { + "epoch": 1.52, + "learning_rate": 1.0281371376010593e-06, + "loss": 0.667, + "step": 59263 + }, + { + "epoch": 1.52, + "learning_rate": 1.0281094780918919e-06, + "loss": 0.6973, + "step": 59264 + }, + { + "epoch": 1.52, + "learning_rate": 1.0280818185612026e-06, + "loss": 0.5764, + "step": 59265 + }, + { + "epoch": 1.52, + "learning_rate": 1.0280541590090126e-06, + "loss": 0.665, + "step": 59266 + }, + { + "epoch": 1.52, + "learning_rate": 1.0280264994353424e-06, + "loss": 0.4692, + "step": 59267 + }, + { + "epoch": 1.52, + "learning_rate": 1.0279988398402138e-06, + "loss": 0.5913, + "step": 59268 + }, + { + "epoch": 1.52, + "learning_rate": 1.0279711802236474e-06, + "loss": 0.7266, + "step": 59269 + }, + { + "epoch": 1.52, + "learning_rate": 1.0279435205856653e-06, + "loss": 0.6729, + "step": 59270 + }, + { + "epoch": 1.52, + "learning_rate": 1.027915860926288e-06, + "loss": 0.4204, + "step": 59271 + }, + { + "epoch": 1.52, + "learning_rate": 1.0278882012455364e-06, + "loss": 0.5271, + "step": 59272 + }, + { + "epoch": 1.52, + "learning_rate": 1.0278605415434325e-06, + "loss": 0.7573, + "step": 59273 + }, + { + "epoch": 1.52, + "learning_rate": 1.0278328818199968e-06, + "loss": 0.8223, + "step": 59274 + }, + { + "epoch": 1.52, + "learning_rate": 1.0278052220752509e-06, + "loss": 0.5952, + "step": 59275 + }, + { + "epoch": 1.52, + "learning_rate": 1.0277775623092158e-06, + "loss": 0.6309, + "step": 59276 + }, + { + "epoch": 1.52, + "learning_rate": 1.0277499025219128e-06, + "loss": 0.7183, + "step": 59277 + }, + { + "epoch": 1.52, + "learning_rate": 1.0277222427133628e-06, + "loss": 0.511, + "step": 59278 + }, + { + "epoch": 1.52, + "learning_rate": 1.0276945828835872e-06, + "loss": 0.5767, + "step": 59279 + }, + { + "epoch": 1.52, + "learning_rate": 1.0276669230326068e-06, + "loss": 0.6123, + "step": 59280 + }, + { + "epoch": 1.52, + "learning_rate": 1.027639263160444e-06, + "loss": 0.6201, + "step": 59281 + }, + { + "epoch": 1.52, + "learning_rate": 1.0276116032671184e-06, + "loss": 0.5798, + "step": 59282 + }, + { + "epoch": 1.52, + "learning_rate": 1.027583943352652e-06, + "loss": 0.6592, + "step": 59283 + }, + { + "epoch": 1.52, + "learning_rate": 1.0275562834170657e-06, + "loss": 0.5923, + "step": 59284 + }, + { + "epoch": 1.52, + "learning_rate": 1.0275286234603811e-06, + "loss": 0.834, + "step": 59285 + }, + { + "epoch": 1.52, + "learning_rate": 1.0275009634826192e-06, + "loss": 0.6387, + "step": 59286 + }, + { + "epoch": 1.52, + "learning_rate": 1.0274733034838008e-06, + "loss": 0.5908, + "step": 59287 + }, + { + "epoch": 1.52, + "learning_rate": 1.027445643463947e-06, + "loss": 0.585, + "step": 59288 + }, + { + "epoch": 1.52, + "learning_rate": 1.02741798342308e-06, + "loss": 0.6289, + "step": 59289 + }, + { + "epoch": 1.52, + "learning_rate": 1.02739032336122e-06, + "loss": 0.751, + "step": 59290 + }, + { + "epoch": 1.52, + "learning_rate": 1.0273626632783887e-06, + "loss": 0.6172, + "step": 59291 + }, + { + "epoch": 1.52, + "learning_rate": 1.0273350031746069e-06, + "loss": 0.481, + "step": 59292 + }, + { + "epoch": 1.52, + "learning_rate": 1.027307343049896e-06, + "loss": 0.5986, + "step": 59293 + }, + { + "epoch": 1.52, + "learning_rate": 1.027279682904277e-06, + "loss": 0.6855, + "step": 59294 + }, + { + "epoch": 1.52, + "learning_rate": 1.0272520227377713e-06, + "loss": 0.5591, + "step": 59295 + }, + { + "epoch": 1.52, + "learning_rate": 1.0272243625504e-06, + "loss": 0.7227, + "step": 59296 + }, + { + "epoch": 1.52, + "learning_rate": 1.027196702342184e-06, + "loss": 0.5593, + "step": 59297 + }, + { + "epoch": 1.52, + "learning_rate": 1.027169042113145e-06, + "loss": 0.75, + "step": 59298 + }, + { + "epoch": 1.52, + "learning_rate": 1.027141381863304e-06, + "loss": 0.7227, + "step": 59299 + }, + { + "epoch": 1.52, + "learning_rate": 1.0271137215926816e-06, + "loss": 0.6226, + "step": 59300 + }, + { + "epoch": 1.52, + "learning_rate": 1.0270860613013002e-06, + "loss": 0.9805, + "step": 59301 + }, + { + "epoch": 1.52, + "learning_rate": 1.0270584009891799e-06, + "loss": 0.6553, + "step": 59302 + }, + { + "epoch": 1.52, + "learning_rate": 1.0270307406563419e-06, + "loss": 0.6689, + "step": 59303 + }, + { + "epoch": 1.52, + "learning_rate": 1.0270030803028082e-06, + "loss": 0.832, + "step": 59304 + }, + { + "epoch": 1.52, + "learning_rate": 1.0269754199285992e-06, + "loss": 0.5835, + "step": 59305 + }, + { + "epoch": 1.52, + "learning_rate": 1.0269477595337366e-06, + "loss": 0.6743, + "step": 59306 + }, + { + "epoch": 1.52, + "learning_rate": 1.026920099118241e-06, + "loss": 0.5605, + "step": 59307 + }, + { + "epoch": 1.52, + "learning_rate": 1.0268924386821342e-06, + "loss": 0.6118, + "step": 59308 + }, + { + "epoch": 1.52, + "learning_rate": 1.026864778225437e-06, + "loss": 0.7412, + "step": 59309 + }, + { + "epoch": 1.52, + "learning_rate": 1.0268371177481708e-06, + "loss": 0.7598, + "step": 59310 + }, + { + "epoch": 1.52, + "learning_rate": 1.0268094572503564e-06, + "loss": 0.4661, + "step": 59311 + }, + { + "epoch": 1.52, + "learning_rate": 1.0267817967320155e-06, + "loss": 0.6177, + "step": 59312 + }, + { + "epoch": 1.52, + "learning_rate": 1.0267541361931685e-06, + "loss": 0.6265, + "step": 59313 + }, + { + "epoch": 1.52, + "learning_rate": 1.0267264756338376e-06, + "loss": 0.6982, + "step": 59314 + }, + { + "epoch": 1.52, + "learning_rate": 1.0266988150540431e-06, + "loss": 0.5737, + "step": 59315 + }, + { + "epoch": 1.52, + "learning_rate": 1.0266711544538075e-06, + "loss": 0.6953, + "step": 59316 + }, + { + "epoch": 1.52, + "learning_rate": 1.0266434938331498e-06, + "loss": 0.7725, + "step": 59317 + }, + { + "epoch": 1.52, + "learning_rate": 1.026615833192093e-06, + "loss": 0.4285, + "step": 59318 + }, + { + "epoch": 1.52, + "learning_rate": 1.0265881725306576e-06, + "loss": 0.7383, + "step": 59319 + }, + { + "epoch": 1.52, + "learning_rate": 1.026560511848865e-06, + "loss": 0.5381, + "step": 59320 + }, + { + "epoch": 1.52, + "learning_rate": 1.0265328511467358e-06, + "loss": 0.582, + "step": 59321 + }, + { + "epoch": 1.52, + "learning_rate": 1.0265051904242917e-06, + "loss": 0.5229, + "step": 59322 + }, + { + "epoch": 1.52, + "learning_rate": 1.0264775296815542e-06, + "loss": 0.667, + "step": 59323 + }, + { + "epoch": 1.52, + "learning_rate": 1.0264498689185436e-06, + "loss": 0.6099, + "step": 59324 + }, + { + "epoch": 1.52, + "learning_rate": 1.026422208135282e-06, + "loss": 0.5491, + "step": 59325 + }, + { + "epoch": 1.52, + "learning_rate": 1.02639454733179e-06, + "loss": 0.5532, + "step": 59326 + }, + { + "epoch": 1.52, + "learning_rate": 1.026366886508089e-06, + "loss": 0.5376, + "step": 59327 + }, + { + "epoch": 1.52, + "learning_rate": 1.0263392256641997e-06, + "loss": 0.7539, + "step": 59328 + }, + { + "epoch": 1.52, + "learning_rate": 1.0263115648001442e-06, + "loss": 0.6948, + "step": 59329 + }, + { + "epoch": 1.52, + "learning_rate": 1.0262839039159426e-06, + "loss": 0.4434, + "step": 59330 + }, + { + "epoch": 1.52, + "learning_rate": 1.026256243011617e-06, + "loss": 0.4946, + "step": 59331 + }, + { + "epoch": 1.52, + "learning_rate": 1.026228582087188e-06, + "loss": 0.54, + "step": 59332 + }, + { + "epoch": 1.52, + "learning_rate": 1.0262009211426773e-06, + "loss": 0.6797, + "step": 59333 + }, + { + "epoch": 1.52, + "learning_rate": 1.0261732601781052e-06, + "loss": 0.6362, + "step": 59334 + }, + { + "epoch": 1.52, + "learning_rate": 1.0261455991934938e-06, + "loss": 0.6089, + "step": 59335 + }, + { + "epoch": 1.52, + "learning_rate": 1.026117938188864e-06, + "loss": 0.6411, + "step": 59336 + }, + { + "epoch": 1.52, + "learning_rate": 1.0260902771642367e-06, + "loss": 0.7017, + "step": 59337 + }, + { + "epoch": 1.52, + "learning_rate": 1.0260626161196334e-06, + "loss": 0.7676, + "step": 59338 + }, + { + "epoch": 1.52, + "learning_rate": 1.026034955055075e-06, + "loss": 0.6572, + "step": 59339 + }, + { + "epoch": 1.52, + "learning_rate": 1.0260072939705827e-06, + "loss": 0.8301, + "step": 59340 + }, + { + "epoch": 1.52, + "learning_rate": 1.0259796328661782e-06, + "loss": 0.6343, + "step": 59341 + }, + { + "epoch": 1.52, + "learning_rate": 1.0259519717418822e-06, + "loss": 0.7197, + "step": 59342 + }, + { + "epoch": 1.52, + "learning_rate": 1.0259243105977159e-06, + "loss": 0.5833, + "step": 59343 + }, + { + "epoch": 1.52, + "learning_rate": 1.0258966494337004e-06, + "loss": 0.9023, + "step": 59344 + }, + { + "epoch": 1.52, + "learning_rate": 1.0258689882498573e-06, + "loss": 0.4688, + "step": 59345 + }, + { + "epoch": 1.52, + "learning_rate": 1.0258413270462074e-06, + "loss": 0.6382, + "step": 59346 + }, + { + "epoch": 1.52, + "learning_rate": 1.025813665822772e-06, + "loss": 0.3816, + "step": 59347 + }, + { + "epoch": 1.52, + "learning_rate": 1.0257860045795722e-06, + "loss": 0.7686, + "step": 59348 + }, + { + "epoch": 1.52, + "learning_rate": 1.025758343316629e-06, + "loss": 0.71, + "step": 59349 + }, + { + "epoch": 1.52, + "learning_rate": 1.0257306820339642e-06, + "loss": 0.7285, + "step": 59350 + }, + { + "epoch": 1.52, + "learning_rate": 1.0257030207315986e-06, + "loss": 0.6035, + "step": 59351 + }, + { + "epoch": 1.52, + "learning_rate": 1.0256753594095532e-06, + "loss": 0.5229, + "step": 59352 + }, + { + "epoch": 1.52, + "learning_rate": 1.0256476980678492e-06, + "loss": 0.5835, + "step": 59353 + }, + { + "epoch": 1.52, + "learning_rate": 1.0256200367065085e-06, + "loss": 0.52, + "step": 59354 + }, + { + "epoch": 1.52, + "learning_rate": 1.0255923753255511e-06, + "loss": 0.7139, + "step": 59355 + }, + { + "epoch": 1.52, + "learning_rate": 1.0255647139249993e-06, + "loss": 0.8535, + "step": 59356 + }, + { + "epoch": 1.52, + "learning_rate": 1.0255370525048735e-06, + "loss": 0.5415, + "step": 59357 + }, + { + "epoch": 1.52, + "learning_rate": 1.0255093910651953e-06, + "loss": 0.7051, + "step": 59358 + }, + { + "epoch": 1.52, + "learning_rate": 1.0254817296059854e-06, + "loss": 0.707, + "step": 59359 + }, + { + "epoch": 1.52, + "learning_rate": 1.0254540681272656e-06, + "loss": 0.7012, + "step": 59360 + }, + { + "epoch": 1.52, + "learning_rate": 1.0254264066290567e-06, + "loss": 0.73, + "step": 59361 + }, + { + "epoch": 1.52, + "learning_rate": 1.0253987451113801e-06, + "loss": 0.7383, + "step": 59362 + }, + { + "epoch": 1.52, + "learning_rate": 1.0253710835742566e-06, + "loss": 0.585, + "step": 59363 + }, + { + "epoch": 1.52, + "learning_rate": 1.025343422017708e-06, + "loss": 0.834, + "step": 59364 + }, + { + "epoch": 1.52, + "learning_rate": 1.0253157604417545e-06, + "loss": 0.6111, + "step": 59365 + }, + { + "epoch": 1.52, + "learning_rate": 1.0252880988464186e-06, + "loss": 0.5825, + "step": 59366 + }, + { + "epoch": 1.52, + "learning_rate": 1.0252604372317204e-06, + "loss": 0.6387, + "step": 59367 + }, + { + "epoch": 1.52, + "learning_rate": 1.0252327755976812e-06, + "loss": 0.835, + "step": 59368 + }, + { + "epoch": 1.52, + "learning_rate": 1.0252051139443227e-06, + "loss": 0.7148, + "step": 59369 + }, + { + "epoch": 1.52, + "learning_rate": 1.0251774522716658e-06, + "loss": 0.6157, + "step": 59370 + }, + { + "epoch": 1.52, + "learning_rate": 1.025149790579732e-06, + "loss": 0.7061, + "step": 59371 + }, + { + "epoch": 1.52, + "learning_rate": 1.0251221288685416e-06, + "loss": 0.5215, + "step": 59372 + }, + { + "epoch": 1.52, + "learning_rate": 1.0250944671381169e-06, + "loss": 0.6875, + "step": 59373 + }, + { + "epoch": 1.52, + "learning_rate": 1.0250668053884778e-06, + "loss": 0.5693, + "step": 59374 + }, + { + "epoch": 1.52, + "learning_rate": 1.0250391436196469e-06, + "loss": 0.6626, + "step": 59375 + }, + { + "epoch": 1.52, + "learning_rate": 1.0250114818316442e-06, + "loss": 0.4661, + "step": 59376 + }, + { + "epoch": 1.52, + "learning_rate": 1.0249838200244918e-06, + "loss": 0.7178, + "step": 59377 + }, + { + "epoch": 1.52, + "learning_rate": 1.02495615819821e-06, + "loss": 0.8125, + "step": 59378 + }, + { + "epoch": 1.52, + "learning_rate": 1.0249284963528207e-06, + "loss": 0.4993, + "step": 59379 + }, + { + "epoch": 1.52, + "learning_rate": 1.0249008344883445e-06, + "loss": 0.5596, + "step": 59380 + }, + { + "epoch": 1.52, + "learning_rate": 1.0248731726048033e-06, + "loss": 0.7139, + "step": 59381 + }, + { + "epoch": 1.52, + "learning_rate": 1.0248455107022177e-06, + "loss": 0.6807, + "step": 59382 + }, + { + "epoch": 1.52, + "learning_rate": 1.024817848780609e-06, + "loss": 0.7354, + "step": 59383 + }, + { + "epoch": 1.52, + "learning_rate": 1.0247901868399982e-06, + "loss": 0.4683, + "step": 59384 + }, + { + "epoch": 1.52, + "learning_rate": 1.0247625248804068e-06, + "loss": 0.7432, + "step": 59385 + }, + { + "epoch": 1.52, + "learning_rate": 1.024734862901856e-06, + "loss": 0.5918, + "step": 59386 + }, + { + "epoch": 1.52, + "learning_rate": 1.0247072009043667e-06, + "loss": 0.6445, + "step": 59387 + }, + { + "epoch": 1.52, + "learning_rate": 1.0246795388879603e-06, + "loss": 0.5732, + "step": 59388 + }, + { + "epoch": 1.52, + "learning_rate": 1.0246518768526581e-06, + "loss": 0.6709, + "step": 59389 + }, + { + "epoch": 1.52, + "learning_rate": 1.0246242147984807e-06, + "loss": 0.6758, + "step": 59390 + }, + { + "epoch": 1.52, + "learning_rate": 1.0245965527254501e-06, + "loss": 0.8398, + "step": 59391 + }, + { + "epoch": 1.52, + "learning_rate": 1.024568890633587e-06, + "loss": 0.5322, + "step": 59392 + }, + { + "epoch": 1.52, + "learning_rate": 1.0245412285229123e-06, + "loss": 0.7119, + "step": 59393 + }, + { + "epoch": 1.52, + "learning_rate": 1.0245135663934476e-06, + "loss": 0.6294, + "step": 59394 + }, + { + "epoch": 1.52, + "learning_rate": 1.0244859042452141e-06, + "loss": 0.6313, + "step": 59395 + }, + { + "epoch": 1.52, + "learning_rate": 1.024458242078233e-06, + "loss": 0.7529, + "step": 59396 + }, + { + "epoch": 1.52, + "learning_rate": 1.024430579892525e-06, + "loss": 0.561, + "step": 59397 + }, + { + "epoch": 1.52, + "learning_rate": 1.024402917688112e-06, + "loss": 0.875, + "step": 59398 + }, + { + "epoch": 1.52, + "learning_rate": 1.0243752554650145e-06, + "loss": 0.6416, + "step": 59399 + }, + { + "epoch": 1.52, + "learning_rate": 1.0243475932232542e-06, + "loss": 0.623, + "step": 59400 + }, + { + "epoch": 1.52, + "learning_rate": 1.0243199309628522e-06, + "loss": 0.5015, + "step": 59401 + }, + { + "epoch": 1.52, + "learning_rate": 1.0242922686838294e-06, + "loss": 0.5576, + "step": 59402 + }, + { + "epoch": 1.52, + "learning_rate": 1.0242646063862068e-06, + "loss": 0.6274, + "step": 59403 + }, + { + "epoch": 1.52, + "learning_rate": 1.0242369440700063e-06, + "loss": 0.3384, + "step": 59404 + }, + { + "epoch": 1.52, + "learning_rate": 1.0242092817352483e-06, + "loss": 0.6777, + "step": 59405 + }, + { + "epoch": 1.52, + "learning_rate": 1.024181619381955e-06, + "loss": 0.4412, + "step": 59406 + }, + { + "epoch": 1.52, + "learning_rate": 1.0241539570101462e-06, + "loss": 0.7373, + "step": 59407 + }, + { + "epoch": 1.52, + "learning_rate": 1.0241262946198443e-06, + "loss": 0.7402, + "step": 59408 + }, + { + "epoch": 1.52, + "learning_rate": 1.0240986322110698e-06, + "loss": 0.5752, + "step": 59409 + }, + { + "epoch": 1.52, + "learning_rate": 1.0240709697838444e-06, + "loss": 0.5327, + "step": 59410 + }, + { + "epoch": 1.52, + "learning_rate": 1.0240433073381888e-06, + "loss": 0.6152, + "step": 59411 + }, + { + "epoch": 1.52, + "learning_rate": 1.024015644874124e-06, + "loss": 0.5579, + "step": 59412 + }, + { + "epoch": 1.52, + "learning_rate": 1.023987982391672e-06, + "loss": 0.6108, + "step": 59413 + }, + { + "epoch": 1.52, + "learning_rate": 1.0239603198908534e-06, + "loss": 0.6255, + "step": 59414 + }, + { + "epoch": 1.52, + "learning_rate": 1.0239326573716893e-06, + "loss": 0.5479, + "step": 59415 + }, + { + "epoch": 1.52, + "learning_rate": 1.0239049948342014e-06, + "loss": 0.71, + "step": 59416 + }, + { + "epoch": 1.52, + "learning_rate": 1.0238773322784102e-06, + "loss": 0.6792, + "step": 59417 + }, + { + "epoch": 1.52, + "learning_rate": 1.0238496697043372e-06, + "loss": 0.6221, + "step": 59418 + }, + { + "epoch": 1.52, + "learning_rate": 1.0238220071120037e-06, + "loss": 0.8418, + "step": 59419 + }, + { + "epoch": 1.52, + "learning_rate": 1.0237943445014307e-06, + "loss": 0.6157, + "step": 59420 + }, + { + "epoch": 1.52, + "learning_rate": 1.02376668187264e-06, + "loss": 0.6895, + "step": 59421 + }, + { + "epoch": 1.52, + "learning_rate": 1.0237390192256517e-06, + "loss": 0.707, + "step": 59422 + }, + { + "epoch": 1.52, + "learning_rate": 1.0237113565604878e-06, + "loss": 0.5166, + "step": 59423 + }, + { + "epoch": 1.52, + "learning_rate": 1.023683693877169e-06, + "loss": 0.6572, + "step": 59424 + }, + { + "epoch": 1.52, + "learning_rate": 1.0236560311757167e-06, + "loss": 0.7603, + "step": 59425 + }, + { + "epoch": 1.52, + "learning_rate": 1.0236283684561523e-06, + "loss": 0.6895, + "step": 59426 + }, + { + "epoch": 1.52, + "learning_rate": 1.0236007057184965e-06, + "loss": 0.7002, + "step": 59427 + }, + { + "epoch": 1.52, + "learning_rate": 1.0235730429627708e-06, + "loss": 0.5215, + "step": 59428 + }, + { + "epoch": 1.52, + "learning_rate": 1.0235453801889964e-06, + "loss": 0.7095, + "step": 59429 + }, + { + "epoch": 1.52, + "learning_rate": 1.023517717397194e-06, + "loss": 0.6626, + "step": 59430 + }, + { + "epoch": 1.52, + "learning_rate": 1.0234900545873855e-06, + "loss": 0.6875, + "step": 59431 + }, + { + "epoch": 1.52, + "learning_rate": 1.0234623917595917e-06, + "loss": 0.5957, + "step": 59432 + }, + { + "epoch": 1.52, + "learning_rate": 1.0234347289138338e-06, + "loss": 0.5942, + "step": 59433 + }, + { + "epoch": 1.52, + "learning_rate": 1.0234070660501332e-06, + "loss": 0.6841, + "step": 59434 + }, + { + "epoch": 1.52, + "learning_rate": 1.0233794031685106e-06, + "loss": 0.7617, + "step": 59435 + }, + { + "epoch": 1.52, + "learning_rate": 1.0233517402689877e-06, + "loss": 0.6479, + "step": 59436 + }, + { + "epoch": 1.52, + "learning_rate": 1.0233240773515852e-06, + "loss": 0.4231, + "step": 59437 + }, + { + "epoch": 1.52, + "learning_rate": 1.0232964144163247e-06, + "loss": 0.7207, + "step": 59438 + }, + { + "epoch": 1.52, + "learning_rate": 1.023268751463227e-06, + "loss": 0.4351, + "step": 59439 + }, + { + "epoch": 1.52, + "learning_rate": 1.0232410884923137e-06, + "loss": 0.7026, + "step": 59440 + }, + { + "epoch": 1.52, + "learning_rate": 1.0232134255036059e-06, + "loss": 0.5266, + "step": 59441 + }, + { + "epoch": 1.52, + "learning_rate": 1.0231857624971245e-06, + "loss": 0.7246, + "step": 59442 + }, + { + "epoch": 1.52, + "learning_rate": 1.0231580994728906e-06, + "loss": 0.6514, + "step": 59443 + }, + { + "epoch": 1.52, + "learning_rate": 1.023130436430926e-06, + "loss": 0.8066, + "step": 59444 + }, + { + "epoch": 1.52, + "learning_rate": 1.023102773371251e-06, + "loss": 0.6831, + "step": 59445 + }, + { + "epoch": 1.52, + "learning_rate": 1.0230751102938877e-06, + "loss": 0.6309, + "step": 59446 + }, + { + "epoch": 1.52, + "learning_rate": 1.0230474471988567e-06, + "loss": 0.7168, + "step": 59447 + }, + { + "epoch": 1.52, + "learning_rate": 1.0230197840861794e-06, + "loss": 0.7559, + "step": 59448 + }, + { + "epoch": 1.52, + "learning_rate": 1.0229921209558767e-06, + "loss": 0.7012, + "step": 59449 + }, + { + "epoch": 1.52, + "learning_rate": 1.0229644578079702e-06, + "loss": 0.6675, + "step": 59450 + }, + { + "epoch": 1.52, + "learning_rate": 1.0229367946424807e-06, + "loss": 0.6572, + "step": 59451 + }, + { + "epoch": 1.52, + "learning_rate": 1.0229091314594298e-06, + "loss": 0.583, + "step": 59452 + }, + { + "epoch": 1.52, + "learning_rate": 1.0228814682588383e-06, + "loss": 0.5084, + "step": 59453 + }, + { + "epoch": 1.52, + "learning_rate": 1.0228538050407275e-06, + "loss": 0.624, + "step": 59454 + }, + { + "epoch": 1.52, + "learning_rate": 1.0228261418051182e-06, + "loss": 0.3838, + "step": 59455 + }, + { + "epoch": 1.52, + "learning_rate": 1.0227984785520325e-06, + "loss": 0.644, + "step": 59456 + }, + { + "epoch": 1.52, + "learning_rate": 1.0227708152814912e-06, + "loss": 0.5852, + "step": 59457 + }, + { + "epoch": 1.52, + "learning_rate": 1.0227431519935147e-06, + "loss": 0.7354, + "step": 59458 + }, + { + "epoch": 1.52, + "learning_rate": 1.0227154886881254e-06, + "loss": 0.6318, + "step": 59459 + }, + { + "epoch": 1.52, + "learning_rate": 1.0226878253653435e-06, + "loss": 0.5728, + "step": 59460 + }, + { + "epoch": 1.52, + "learning_rate": 1.0226601620251908e-06, + "loss": 0.5874, + "step": 59461 + }, + { + "epoch": 1.52, + "learning_rate": 1.0226324986676882e-06, + "loss": 0.5571, + "step": 59462 + }, + { + "epoch": 1.52, + "learning_rate": 1.022604835292857e-06, + "loss": 0.6743, + "step": 59463 + }, + { + "epoch": 1.52, + "learning_rate": 1.0225771719007182e-06, + "loss": 0.6904, + "step": 59464 + }, + { + "epoch": 1.52, + "learning_rate": 1.0225495084912933e-06, + "loss": 0.7109, + "step": 59465 + }, + { + "epoch": 1.52, + "learning_rate": 1.0225218450646029e-06, + "loss": 0.792, + "step": 59466 + }, + { + "epoch": 1.52, + "learning_rate": 1.022494181620669e-06, + "loss": 0.5693, + "step": 59467 + }, + { + "epoch": 1.52, + "learning_rate": 1.0224665181595118e-06, + "loss": 0.6084, + "step": 59468 + }, + { + "epoch": 1.52, + "learning_rate": 1.0224388546811535e-06, + "loss": 0.8203, + "step": 59469 + }, + { + "epoch": 1.52, + "learning_rate": 1.0224111911856143e-06, + "loss": 0.6143, + "step": 59470 + }, + { + "epoch": 1.52, + "learning_rate": 1.0223835276729167e-06, + "loss": 0.6846, + "step": 59471 + }, + { + "epoch": 1.52, + "learning_rate": 1.0223558641430803e-06, + "loss": 0.5864, + "step": 59472 + }, + { + "epoch": 1.52, + "learning_rate": 1.0223282005961276e-06, + "loss": 0.4028, + "step": 59473 + }, + { + "epoch": 1.52, + "learning_rate": 1.0223005370320787e-06, + "loss": 0.4946, + "step": 59474 + }, + { + "epoch": 1.52, + "learning_rate": 1.0222728734509556e-06, + "loss": 0.6558, + "step": 59475 + }, + { + "epoch": 1.52, + "learning_rate": 1.0222452098527791e-06, + "loss": 0.4904, + "step": 59476 + }, + { + "epoch": 1.52, + "learning_rate": 1.0222175462375703e-06, + "loss": 0.6416, + "step": 59477 + }, + { + "epoch": 1.52, + "learning_rate": 1.022189882605351e-06, + "loss": 0.7314, + "step": 59478 + }, + { + "epoch": 1.52, + "learning_rate": 1.0221622189561417e-06, + "loss": 0.6631, + "step": 59479 + }, + { + "epoch": 1.52, + "learning_rate": 1.0221345552899635e-06, + "loss": 0.8174, + "step": 59480 + }, + { + "epoch": 1.52, + "learning_rate": 1.0221068916068386e-06, + "loss": 0.4692, + "step": 59481 + }, + { + "epoch": 1.52, + "learning_rate": 1.022079227906787e-06, + "loss": 0.7334, + "step": 59482 + }, + { + "epoch": 1.52, + "learning_rate": 1.0220515641898302e-06, + "loss": 0.6162, + "step": 59483 + }, + { + "epoch": 1.52, + "learning_rate": 1.0220239004559896e-06, + "loss": 0.5435, + "step": 59484 + }, + { + "epoch": 1.52, + "learning_rate": 1.0219962367052862e-06, + "loss": 0.4768, + "step": 59485 + }, + { + "epoch": 1.52, + "learning_rate": 1.0219685729377422e-06, + "loss": 0.6367, + "step": 59486 + }, + { + "epoch": 1.52, + "learning_rate": 1.0219409091533769e-06, + "loss": 0.6924, + "step": 59487 + }, + { + "epoch": 1.52, + "learning_rate": 1.0219132453522128e-06, + "loss": 0.6646, + "step": 59488 + }, + { + "epoch": 1.52, + "learning_rate": 1.0218855815342707e-06, + "loss": 0.6934, + "step": 59489 + }, + { + "epoch": 1.52, + "learning_rate": 1.0218579176995715e-06, + "loss": 0.5806, + "step": 59490 + }, + { + "epoch": 1.52, + "learning_rate": 1.0218302538481373e-06, + "loss": 0.3357, + "step": 59491 + }, + { + "epoch": 1.52, + "learning_rate": 1.0218025899799884e-06, + "loss": 0.7119, + "step": 59492 + }, + { + "epoch": 1.52, + "learning_rate": 1.021774926095146e-06, + "loss": 0.5449, + "step": 59493 + }, + { + "epoch": 1.52, + "learning_rate": 1.021747262193632e-06, + "loss": 0.627, + "step": 59494 + }, + { + "epoch": 1.52, + "learning_rate": 1.0217195982754668e-06, + "loss": 0.6816, + "step": 59495 + }, + { + "epoch": 1.52, + "learning_rate": 1.021691934340672e-06, + "loss": 0.8057, + "step": 59496 + }, + { + "epoch": 1.52, + "learning_rate": 1.021664270389269e-06, + "loss": 0.5205, + "step": 59497 + }, + { + "epoch": 1.52, + "learning_rate": 1.0216366064212783e-06, + "loss": 0.6904, + "step": 59498 + }, + { + "epoch": 1.52, + "learning_rate": 1.0216089424367214e-06, + "loss": 0.751, + "step": 59499 + }, + { + "epoch": 1.53, + "learning_rate": 1.0215812784356195e-06, + "loss": 0.7119, + "step": 59500 + }, + { + "epoch": 1.53, + "learning_rate": 1.0215536144179942e-06, + "loss": 0.7061, + "step": 59501 + }, + { + "epoch": 1.53, + "learning_rate": 1.0215259503838658e-06, + "loss": 0.6826, + "step": 59502 + }, + { + "epoch": 1.53, + "learning_rate": 1.0214982863332562e-06, + "loss": 0.5996, + "step": 59503 + }, + { + "epoch": 1.53, + "learning_rate": 1.0214706222661863e-06, + "loss": 0.6587, + "step": 59504 + }, + { + "epoch": 1.53, + "learning_rate": 1.0214429581826773e-06, + "loss": 0.6758, + "step": 59505 + }, + { + "epoch": 1.53, + "learning_rate": 1.0214152940827505e-06, + "loss": 0.7812, + "step": 59506 + }, + { + "epoch": 1.53, + "learning_rate": 1.0213876299664273e-06, + "loss": 0.4482, + "step": 59507 + }, + { + "epoch": 1.53, + "learning_rate": 1.021359965833728e-06, + "loss": 0.5518, + "step": 59508 + }, + { + "epoch": 1.53, + "learning_rate": 1.0213323016846746e-06, + "loss": 0.4028, + "step": 59509 + }, + { + "epoch": 1.53, + "learning_rate": 1.021304637519288e-06, + "loss": 0.5471, + "step": 59510 + }, + { + "epoch": 1.53, + "learning_rate": 1.0212769733375897e-06, + "loss": 0.6533, + "step": 59511 + }, + { + "epoch": 1.53, + "learning_rate": 1.0212493091396002e-06, + "loss": 0.665, + "step": 59512 + }, + { + "epoch": 1.53, + "learning_rate": 1.0212216449253412e-06, + "loss": 0.6279, + "step": 59513 + }, + { + "epoch": 1.53, + "learning_rate": 1.0211939806948337e-06, + "loss": 0.502, + "step": 59514 + }, + { + "epoch": 1.53, + "learning_rate": 1.0211663164480993e-06, + "loss": 0.5435, + "step": 59515 + }, + { + "epoch": 1.53, + "learning_rate": 1.0211386521851585e-06, + "loss": 0.584, + "step": 59516 + }, + { + "epoch": 1.53, + "learning_rate": 1.021110987906033e-06, + "loss": 0.5996, + "step": 59517 + }, + { + "epoch": 1.53, + "learning_rate": 1.0210833236107434e-06, + "loss": 0.6211, + "step": 59518 + }, + { + "epoch": 1.53, + "learning_rate": 1.0210556592993118e-06, + "loss": 0.5725, + "step": 59519 + }, + { + "epoch": 1.53, + "learning_rate": 1.0210279949717585e-06, + "loss": 0.6899, + "step": 59520 + }, + { + "epoch": 1.53, + "learning_rate": 1.0210003306281052e-06, + "loss": 0.605, + "step": 59521 + }, + { + "epoch": 1.53, + "learning_rate": 1.0209726662683729e-06, + "loss": 0.7393, + "step": 59522 + }, + { + "epoch": 1.53, + "learning_rate": 1.0209450018925825e-06, + "loss": 0.6216, + "step": 59523 + }, + { + "epoch": 1.53, + "learning_rate": 1.0209173375007559e-06, + "loss": 0.6426, + "step": 59524 + }, + { + "epoch": 1.53, + "learning_rate": 1.0208896730929135e-06, + "loss": 0.5181, + "step": 59525 + }, + { + "epoch": 1.53, + "learning_rate": 1.0208620086690771e-06, + "loss": 0.6104, + "step": 59526 + }, + { + "epoch": 1.53, + "learning_rate": 1.0208343442292676e-06, + "loss": 0.7578, + "step": 59527 + }, + { + "epoch": 1.53, + "learning_rate": 1.020806679773506e-06, + "loss": 0.6069, + "step": 59528 + }, + { + "epoch": 1.53, + "learning_rate": 1.0207790153018135e-06, + "loss": 0.7246, + "step": 59529 + }, + { + "epoch": 1.53, + "learning_rate": 1.020751350814212e-06, + "loss": 0.4556, + "step": 59530 + }, + { + "epoch": 1.53, + "learning_rate": 1.020723686310722e-06, + "loss": 0.7207, + "step": 59531 + }, + { + "epoch": 1.53, + "learning_rate": 1.0206960217913648e-06, + "loss": 0.6396, + "step": 59532 + }, + { + "epoch": 1.53, + "learning_rate": 1.0206683572561613e-06, + "loss": 0.8232, + "step": 59533 + }, + { + "epoch": 1.53, + "learning_rate": 1.0206406927051334e-06, + "loss": 0.6265, + "step": 59534 + }, + { + "epoch": 1.53, + "learning_rate": 1.0206130281383017e-06, + "loss": 0.4194, + "step": 59535 + }, + { + "epoch": 1.53, + "learning_rate": 1.0205853635556877e-06, + "loss": 0.6382, + "step": 59536 + }, + { + "epoch": 1.53, + "learning_rate": 1.020557698957312e-06, + "loss": 0.5742, + "step": 59537 + }, + { + "epoch": 1.53, + "learning_rate": 1.0205300343431967e-06, + "loss": 0.7305, + "step": 59538 + }, + { + "epoch": 1.53, + "learning_rate": 1.020502369713362e-06, + "loss": 0.8447, + "step": 59539 + }, + { + "epoch": 1.53, + "learning_rate": 1.0204747050678302e-06, + "loss": 0.5732, + "step": 59540 + }, + { + "epoch": 1.53, + "learning_rate": 1.0204470404066215e-06, + "loss": 0.2485, + "step": 59541 + }, + { + "epoch": 1.53, + "learning_rate": 1.0204193757297575e-06, + "loss": 0.7246, + "step": 59542 + }, + { + "epoch": 1.53, + "learning_rate": 1.0203917110372594e-06, + "loss": 0.4927, + "step": 59543 + }, + { + "epoch": 1.53, + "learning_rate": 1.0203640463291481e-06, + "loss": 0.584, + "step": 59544 + }, + { + "epoch": 1.53, + "learning_rate": 1.0203363816054451e-06, + "loss": 0.6465, + "step": 59545 + }, + { + "epoch": 1.53, + "learning_rate": 1.0203087168661713e-06, + "loss": 0.5508, + "step": 59546 + }, + { + "epoch": 1.53, + "learning_rate": 1.0202810521113483e-06, + "loss": 0.7427, + "step": 59547 + }, + { + "epoch": 1.53, + "learning_rate": 1.0202533873409968e-06, + "loss": 0.5903, + "step": 59548 + }, + { + "epoch": 1.53, + "learning_rate": 1.0202257225551385e-06, + "loss": 0.6836, + "step": 59549 + }, + { + "epoch": 1.53, + "learning_rate": 1.0201980577537941e-06, + "loss": 0.7988, + "step": 59550 + }, + { + "epoch": 1.53, + "learning_rate": 1.020170392936985e-06, + "loss": 0.6416, + "step": 59551 + }, + { + "epoch": 1.53, + "learning_rate": 1.0201427281047324e-06, + "loss": 0.6216, + "step": 59552 + }, + { + "epoch": 1.53, + "learning_rate": 1.0201150632570574e-06, + "loss": 0.6187, + "step": 59553 + }, + { + "epoch": 1.53, + "learning_rate": 1.0200873983939813e-06, + "loss": 0.7246, + "step": 59554 + }, + { + "epoch": 1.53, + "learning_rate": 1.0200597335155251e-06, + "loss": 0.6973, + "step": 59555 + }, + { + "epoch": 1.53, + "learning_rate": 1.0200320686217102e-06, + "loss": 0.5332, + "step": 59556 + }, + { + "epoch": 1.53, + "learning_rate": 1.0200044037125577e-06, + "loss": 0.6069, + "step": 59557 + }, + { + "epoch": 1.53, + "learning_rate": 1.0199767387880884e-06, + "loss": 0.7842, + "step": 59558 + }, + { + "epoch": 1.53, + "learning_rate": 1.0199490738483242e-06, + "loss": 0.7617, + "step": 59559 + }, + { + "epoch": 1.53, + "learning_rate": 1.019921408893286e-06, + "loss": 0.6196, + "step": 59560 + }, + { + "epoch": 1.53, + "learning_rate": 1.0198937439229947e-06, + "loss": 0.3867, + "step": 59561 + }, + { + "epoch": 1.53, + "learning_rate": 1.0198660789374712e-06, + "loss": 0.6204, + "step": 59562 + }, + { + "epoch": 1.53, + "learning_rate": 1.019838413936738e-06, + "loss": 0.6826, + "step": 59563 + }, + { + "epoch": 1.53, + "learning_rate": 1.0198107489208148e-06, + "loss": 0.7256, + "step": 59564 + }, + { + "epoch": 1.53, + "learning_rate": 1.0197830838897237e-06, + "loss": 0.8037, + "step": 59565 + }, + { + "epoch": 1.53, + "learning_rate": 1.0197554188434856e-06, + "loss": 0.7007, + "step": 59566 + }, + { + "epoch": 1.53, + "learning_rate": 1.0197277537821216e-06, + "loss": 0.5283, + "step": 59567 + }, + { + "epoch": 1.53, + "learning_rate": 1.019700088705653e-06, + "loss": 0.791, + "step": 59568 + }, + { + "epoch": 1.53, + "learning_rate": 1.0196724236141008e-06, + "loss": 0.832, + "step": 59569 + }, + { + "epoch": 1.53, + "learning_rate": 1.0196447585074868e-06, + "loss": 0.8604, + "step": 59570 + }, + { + "epoch": 1.53, + "learning_rate": 1.0196170933858311e-06, + "loss": 0.75, + "step": 59571 + }, + { + "epoch": 1.53, + "learning_rate": 1.0195894282491561e-06, + "loss": 0.873, + "step": 59572 + }, + { + "epoch": 1.53, + "learning_rate": 1.0195617630974819e-06, + "loss": 0.7256, + "step": 59573 + }, + { + "epoch": 1.53, + "learning_rate": 1.0195340979308304e-06, + "loss": 0.5046, + "step": 59574 + }, + { + "epoch": 1.53, + "learning_rate": 1.0195064327492226e-06, + "loss": 0.6826, + "step": 59575 + }, + { + "epoch": 1.53, + "learning_rate": 1.0194787675526796e-06, + "loss": 0.4978, + "step": 59576 + }, + { + "epoch": 1.53, + "learning_rate": 1.0194511023412222e-06, + "loss": 0.6875, + "step": 59577 + }, + { + "epoch": 1.53, + "learning_rate": 1.0194234371148724e-06, + "loss": 0.5635, + "step": 59578 + }, + { + "epoch": 1.53, + "learning_rate": 1.0193957718736507e-06, + "loss": 0.7119, + "step": 59579 + }, + { + "epoch": 1.53, + "learning_rate": 1.019368106617579e-06, + "loss": 0.7246, + "step": 59580 + }, + { + "epoch": 1.53, + "learning_rate": 1.0193404413466774e-06, + "loss": 0.6084, + "step": 59581 + }, + { + "epoch": 1.53, + "learning_rate": 1.0193127760609683e-06, + "loss": 0.6738, + "step": 59582 + }, + { + "epoch": 1.53, + "learning_rate": 1.0192851107604718e-06, + "loss": 0.4426, + "step": 59583 + }, + { + "epoch": 1.53, + "learning_rate": 1.01925744544521e-06, + "loss": 0.3772, + "step": 59584 + }, + { + "epoch": 1.53, + "learning_rate": 1.0192297801152036e-06, + "loss": 0.6477, + "step": 59585 + }, + { + "epoch": 1.53, + "learning_rate": 1.0192021147704734e-06, + "loss": 0.4814, + "step": 59586 + }, + { + "epoch": 1.53, + "learning_rate": 1.0191744494110415e-06, + "loss": 0.469, + "step": 59587 + }, + { + "epoch": 1.53, + "learning_rate": 1.0191467840369285e-06, + "loss": 0.7178, + "step": 59588 + }, + { + "epoch": 1.53, + "learning_rate": 1.0191191186481556e-06, + "loss": 0.4893, + "step": 59589 + }, + { + "epoch": 1.53, + "learning_rate": 1.0190914532447442e-06, + "loss": 0.6135, + "step": 59590 + }, + { + "epoch": 1.53, + "learning_rate": 1.0190637878267151e-06, + "loss": 0.7891, + "step": 59591 + }, + { + "epoch": 1.53, + "learning_rate": 1.01903612239409e-06, + "loss": 0.6846, + "step": 59592 + }, + { + "epoch": 1.53, + "learning_rate": 1.0190084569468897e-06, + "loss": 0.665, + "step": 59593 + }, + { + "epoch": 1.53, + "learning_rate": 1.0189807914851354e-06, + "loss": 0.6333, + "step": 59594 + }, + { + "epoch": 1.53, + "learning_rate": 1.0189531260088489e-06, + "loss": 0.5837, + "step": 59595 + }, + { + "epoch": 1.53, + "learning_rate": 1.0189254605180501e-06, + "loss": 0.5918, + "step": 59596 + }, + { + "epoch": 1.53, + "learning_rate": 1.0188977950127614e-06, + "loss": 0.6289, + "step": 59597 + }, + { + "epoch": 1.53, + "learning_rate": 1.0188701294930033e-06, + "loss": 0.6973, + "step": 59598 + }, + { + "epoch": 1.53, + "learning_rate": 1.0188424639587973e-06, + "loss": 0.748, + "step": 59599 + }, + { + "epoch": 1.53, + "learning_rate": 1.0188147984101647e-06, + "loss": 0.71, + "step": 59600 + }, + { + "epoch": 1.53, + "learning_rate": 1.0187871328471265e-06, + "loss": 0.5713, + "step": 59601 + }, + { + "epoch": 1.53, + "learning_rate": 1.0187594672697033e-06, + "loss": 0.6904, + "step": 59602 + }, + { + "epoch": 1.53, + "learning_rate": 1.0187318016779175e-06, + "loss": 0.7158, + "step": 59603 + }, + { + "epoch": 1.53, + "learning_rate": 1.0187041360717889e-06, + "loss": 0.7744, + "step": 59604 + }, + { + "epoch": 1.53, + "learning_rate": 1.01867647045134e-06, + "loss": 0.7803, + "step": 59605 + }, + { + "epoch": 1.53, + "learning_rate": 1.0186488048165913e-06, + "loss": 0.7891, + "step": 59606 + }, + { + "epoch": 1.53, + "learning_rate": 1.018621139167564e-06, + "loss": 0.626, + "step": 59607 + }, + { + "epoch": 1.53, + "learning_rate": 1.0185934735042792e-06, + "loss": 0.7314, + "step": 59608 + }, + { + "epoch": 1.53, + "learning_rate": 1.0185658078267584e-06, + "loss": 0.8184, + "step": 59609 + }, + { + "epoch": 1.53, + "learning_rate": 1.0185381421350227e-06, + "loss": 0.6768, + "step": 59610 + }, + { + "epoch": 1.53, + "learning_rate": 1.0185104764290929e-06, + "loss": 0.668, + "step": 59611 + }, + { + "epoch": 1.53, + "learning_rate": 1.0184828107089907e-06, + "loss": 0.8281, + "step": 59612 + }, + { + "epoch": 1.53, + "learning_rate": 1.018455144974737e-06, + "loss": 0.7988, + "step": 59613 + }, + { + "epoch": 1.53, + "learning_rate": 1.018427479226353e-06, + "loss": 0.6074, + "step": 59614 + }, + { + "epoch": 1.53, + "learning_rate": 1.0183998134638601e-06, + "loss": 0.6897, + "step": 59615 + }, + { + "epoch": 1.53, + "learning_rate": 1.018372147687279e-06, + "loss": 0.6982, + "step": 59616 + }, + { + "epoch": 1.53, + "learning_rate": 1.0183444818966313e-06, + "loss": 0.6006, + "step": 59617 + }, + { + "epoch": 1.53, + "learning_rate": 1.0183168160919385e-06, + "loss": 0.574, + "step": 59618 + }, + { + "epoch": 1.53, + "learning_rate": 1.0182891502732207e-06, + "loss": 0.7051, + "step": 59619 + }, + { + "epoch": 1.53, + "learning_rate": 1.0182614844405004e-06, + "loss": 0.8018, + "step": 59620 + }, + { + "epoch": 1.53, + "learning_rate": 1.0182338185937975e-06, + "loss": 0.7773, + "step": 59621 + }, + { + "epoch": 1.53, + "learning_rate": 1.0182061527331343e-06, + "loss": 0.5901, + "step": 59622 + }, + { + "epoch": 1.53, + "learning_rate": 1.018178486858531e-06, + "loss": 0.2466, + "step": 59623 + }, + { + "epoch": 1.53, + "learning_rate": 1.0181508209700096e-06, + "loss": 0.4519, + "step": 59624 + }, + { + "epoch": 1.53, + "learning_rate": 1.0181231550675908e-06, + "loss": 0.5034, + "step": 59625 + }, + { + "epoch": 1.53, + "learning_rate": 1.0180954891512963e-06, + "loss": 0.7529, + "step": 59626 + }, + { + "epoch": 1.53, + "learning_rate": 1.0180678232211464e-06, + "loss": 0.5933, + "step": 59627 + }, + { + "epoch": 1.53, + "learning_rate": 1.018040157277163e-06, + "loss": 0.6064, + "step": 59628 + }, + { + "epoch": 1.53, + "learning_rate": 1.0180124913193671e-06, + "loss": 0.6836, + "step": 59629 + }, + { + "epoch": 1.53, + "learning_rate": 1.0179848253477798e-06, + "loss": 0.6172, + "step": 59630 + }, + { + "epoch": 1.53, + "learning_rate": 1.0179571593624225e-06, + "loss": 0.4814, + "step": 59631 + }, + { + "epoch": 1.53, + "learning_rate": 1.0179294933633163e-06, + "loss": 0.5737, + "step": 59632 + }, + { + "epoch": 1.53, + "learning_rate": 1.017901827350482e-06, + "loss": 0.5583, + "step": 59633 + }, + { + "epoch": 1.53, + "learning_rate": 1.0178741613239412e-06, + "loss": 0.5767, + "step": 59634 + }, + { + "epoch": 1.53, + "learning_rate": 1.0178464952837152e-06, + "loss": 0.5791, + "step": 59635 + }, + { + "epoch": 1.53, + "learning_rate": 1.0178188292298246e-06, + "loss": 0.5913, + "step": 59636 + }, + { + "epoch": 1.53, + "learning_rate": 1.0177911631622913e-06, + "loss": 0.568, + "step": 59637 + }, + { + "epoch": 1.53, + "learning_rate": 1.0177634970811357e-06, + "loss": 0.7061, + "step": 59638 + }, + { + "epoch": 1.53, + "learning_rate": 1.0177358309863798e-06, + "loss": 0.6616, + "step": 59639 + }, + { + "epoch": 1.53, + "learning_rate": 1.0177081648780443e-06, + "loss": 0.6987, + "step": 59640 + }, + { + "epoch": 1.53, + "learning_rate": 1.0176804987561505e-06, + "loss": 0.6089, + "step": 59641 + }, + { + "epoch": 1.53, + "learning_rate": 1.0176528326207193e-06, + "loss": 0.6577, + "step": 59642 + }, + { + "epoch": 1.53, + "learning_rate": 1.0176251664717724e-06, + "loss": 0.6943, + "step": 59643 + }, + { + "epoch": 1.53, + "learning_rate": 1.0175975003093305e-06, + "loss": 0.5161, + "step": 59644 + }, + { + "epoch": 1.53, + "learning_rate": 1.0175698341334154e-06, + "loss": 0.5854, + "step": 59645 + }, + { + "epoch": 1.53, + "learning_rate": 1.0175421679440474e-06, + "loss": 0.7207, + "step": 59646 + }, + { + "epoch": 1.53, + "learning_rate": 1.0175145017412485e-06, + "loss": 0.6895, + "step": 59647 + }, + { + "epoch": 1.53, + "learning_rate": 1.0174868355250393e-06, + "loss": 0.667, + "step": 59648 + }, + { + "epoch": 1.53, + "learning_rate": 1.0174591692954415e-06, + "loss": 0.5386, + "step": 59649 + }, + { + "epoch": 1.53, + "learning_rate": 1.017431503052476e-06, + "loss": 0.8076, + "step": 59650 + }, + { + "epoch": 1.53, + "learning_rate": 1.0174038367961639e-06, + "loss": 0.6631, + "step": 59651 + }, + { + "epoch": 1.53, + "learning_rate": 1.0173761705265262e-06, + "loss": 0.6372, + "step": 59652 + }, + { + "epoch": 1.53, + "learning_rate": 1.0173485042435848e-06, + "loss": 0.7939, + "step": 59653 + }, + { + "epoch": 1.53, + "learning_rate": 1.01732083794736e-06, + "loss": 0.7422, + "step": 59654 + }, + { + "epoch": 1.53, + "learning_rate": 1.017293171637874e-06, + "loss": 0.5459, + "step": 59655 + }, + { + "epoch": 1.53, + "learning_rate": 1.0172655053151472e-06, + "loss": 0.5664, + "step": 59656 + }, + { + "epoch": 1.53, + "learning_rate": 1.0172378389792006e-06, + "loss": 0.6099, + "step": 59657 + }, + { + "epoch": 1.53, + "learning_rate": 1.0172101726300564e-06, + "loss": 0.6689, + "step": 59658 + }, + { + "epoch": 1.53, + "learning_rate": 1.0171825062677347e-06, + "loss": 0.6982, + "step": 59659 + }, + { + "epoch": 1.53, + "learning_rate": 1.0171548398922577e-06, + "loss": 0.5051, + "step": 59660 + }, + { + "epoch": 1.53, + "learning_rate": 1.0171271735036453e-06, + "loss": 0.8027, + "step": 59661 + }, + { + "epoch": 1.53, + "learning_rate": 1.0170995071019199e-06, + "loss": 0.5928, + "step": 59662 + }, + { + "epoch": 1.53, + "learning_rate": 1.017071840687102e-06, + "loss": 0.6025, + "step": 59663 + }, + { + "epoch": 1.53, + "learning_rate": 1.0170441742592132e-06, + "loss": 0.5801, + "step": 59664 + }, + { + "epoch": 1.53, + "learning_rate": 1.0170165078182743e-06, + "loss": 0.5859, + "step": 59665 + }, + { + "epoch": 1.53, + "learning_rate": 1.0169888413643066e-06, + "loss": 0.7354, + "step": 59666 + }, + { + "epoch": 1.53, + "learning_rate": 1.0169611748973312e-06, + "loss": 0.6982, + "step": 59667 + }, + { + "epoch": 1.53, + "learning_rate": 1.0169335084173695e-06, + "loss": 0.5535, + "step": 59668 + }, + { + "epoch": 1.53, + "learning_rate": 1.0169058419244425e-06, + "loss": 0.6245, + "step": 59669 + }, + { + "epoch": 1.53, + "learning_rate": 1.016878175418572e-06, + "loss": 0.7188, + "step": 59670 + }, + { + "epoch": 1.53, + "learning_rate": 1.016850508899778e-06, + "loss": 0.6426, + "step": 59671 + }, + { + "epoch": 1.53, + "learning_rate": 1.0168228423680828e-06, + "loss": 0.7007, + "step": 59672 + }, + { + "epoch": 1.53, + "learning_rate": 1.0167951758235067e-06, + "loss": 0.6851, + "step": 59673 + }, + { + "epoch": 1.53, + "learning_rate": 1.0167675092660716e-06, + "loss": 0.5918, + "step": 59674 + }, + { + "epoch": 1.53, + "learning_rate": 1.0167398426957984e-06, + "loss": 0.6758, + "step": 59675 + }, + { + "epoch": 1.53, + "learning_rate": 1.0167121761127082e-06, + "loss": 0.7256, + "step": 59676 + }, + { + "epoch": 1.53, + "learning_rate": 1.0166845095168224e-06, + "loss": 0.7734, + "step": 59677 + }, + { + "epoch": 1.53, + "learning_rate": 1.016656842908162e-06, + "loss": 0.582, + "step": 59678 + }, + { + "epoch": 1.53, + "learning_rate": 1.0166291762867479e-06, + "loss": 0.7295, + "step": 59679 + }, + { + "epoch": 1.53, + "learning_rate": 1.016601509652602e-06, + "loss": 0.6436, + "step": 59680 + }, + { + "epoch": 1.53, + "learning_rate": 1.0165738430057448e-06, + "loss": 0.5828, + "step": 59681 + }, + { + "epoch": 1.53, + "learning_rate": 1.0165461763461978e-06, + "loss": 0.7002, + "step": 59682 + }, + { + "epoch": 1.53, + "learning_rate": 1.0165185096739823e-06, + "loss": 0.6626, + "step": 59683 + }, + { + "epoch": 1.53, + "learning_rate": 1.0164908429891193e-06, + "loss": 0.6611, + "step": 59684 + }, + { + "epoch": 1.53, + "learning_rate": 1.0164631762916302e-06, + "loss": 0.5142, + "step": 59685 + }, + { + "epoch": 1.53, + "learning_rate": 1.0164355095815356e-06, + "loss": 0.6558, + "step": 59686 + }, + { + "epoch": 1.53, + "learning_rate": 1.0164078428588573e-06, + "loss": 0.5786, + "step": 59687 + }, + { + "epoch": 1.53, + "learning_rate": 1.0163801761236162e-06, + "loss": 0.8125, + "step": 59688 + }, + { + "epoch": 1.53, + "learning_rate": 1.0163525093758335e-06, + "loss": 0.4976, + "step": 59689 + }, + { + "epoch": 1.53, + "learning_rate": 1.0163248426155308e-06, + "loss": 0.6621, + "step": 59690 + }, + { + "epoch": 1.53, + "learning_rate": 1.0162971758427287e-06, + "loss": 0.6069, + "step": 59691 + }, + { + "epoch": 1.53, + "learning_rate": 1.0162695090574485e-06, + "loss": 0.6006, + "step": 59692 + }, + { + "epoch": 1.53, + "learning_rate": 1.0162418422597116e-06, + "loss": 0.5327, + "step": 59693 + }, + { + "epoch": 1.53, + "learning_rate": 1.0162141754495388e-06, + "loss": 0.5908, + "step": 59694 + }, + { + "epoch": 1.53, + "learning_rate": 1.016186508626952e-06, + "loss": 0.7129, + "step": 59695 + }, + { + "epoch": 1.53, + "learning_rate": 1.0161588417919718e-06, + "loss": 0.7119, + "step": 59696 + }, + { + "epoch": 1.53, + "learning_rate": 1.0161311749446193e-06, + "loss": 0.5703, + "step": 59697 + }, + { + "epoch": 1.53, + "learning_rate": 1.016103508084916e-06, + "loss": 0.7002, + "step": 59698 + }, + { + "epoch": 1.53, + "learning_rate": 1.0160758412128831e-06, + "loss": 0.5029, + "step": 59699 + }, + { + "epoch": 1.53, + "learning_rate": 1.0160481743285416e-06, + "loss": 0.5327, + "step": 59700 + }, + { + "epoch": 1.53, + "learning_rate": 1.0160205074319125e-06, + "loss": 0.6978, + "step": 59701 + }, + { + "epoch": 1.53, + "learning_rate": 1.0159928405230176e-06, + "loss": 0.5752, + "step": 59702 + }, + { + "epoch": 1.53, + "learning_rate": 1.0159651736018775e-06, + "loss": 0.9062, + "step": 59703 + }, + { + "epoch": 1.53, + "learning_rate": 1.0159375066685135e-06, + "loss": 0.7871, + "step": 59704 + }, + { + "epoch": 1.53, + "learning_rate": 1.0159098397229474e-06, + "loss": 0.6123, + "step": 59705 + }, + { + "epoch": 1.53, + "learning_rate": 1.0158821727651996e-06, + "loss": 0.6631, + "step": 59706 + }, + { + "epoch": 1.53, + "learning_rate": 1.0158545057952912e-06, + "loss": 0.583, + "step": 59707 + }, + { + "epoch": 1.53, + "learning_rate": 1.015826838813244e-06, + "loss": 0.7139, + "step": 59708 + }, + { + "epoch": 1.53, + "learning_rate": 1.0157991718190789e-06, + "loss": 0.6738, + "step": 59709 + }, + { + "epoch": 1.53, + "learning_rate": 1.0157715048128175e-06, + "loss": 0.3671, + "step": 59710 + }, + { + "epoch": 1.53, + "learning_rate": 1.01574383779448e-06, + "loss": 0.5496, + "step": 59711 + }, + { + "epoch": 1.53, + "learning_rate": 1.0157161707640884e-06, + "loss": 0.5559, + "step": 59712 + }, + { + "epoch": 1.53, + "learning_rate": 1.0156885037216636e-06, + "loss": 0.6553, + "step": 59713 + }, + { + "epoch": 1.53, + "learning_rate": 1.015660836667227e-06, + "loss": 0.8184, + "step": 59714 + }, + { + "epoch": 1.53, + "learning_rate": 1.0156331696007994e-06, + "loss": 0.6992, + "step": 59715 + }, + { + "epoch": 1.53, + "learning_rate": 1.0156055025224024e-06, + "loss": 0.7246, + "step": 59716 + }, + { + "epoch": 1.53, + "learning_rate": 1.0155778354320567e-06, + "loss": 0.6328, + "step": 59717 + }, + { + "epoch": 1.53, + "learning_rate": 1.015550168329784e-06, + "loss": 0.6309, + "step": 59718 + }, + { + "epoch": 1.53, + "learning_rate": 1.015522501215605e-06, + "loss": 0.7539, + "step": 59719 + }, + { + "epoch": 1.53, + "learning_rate": 1.0154948340895415e-06, + "loss": 0.7178, + "step": 59720 + }, + { + "epoch": 1.53, + "learning_rate": 1.0154671669516142e-06, + "loss": 0.7031, + "step": 59721 + }, + { + "epoch": 1.53, + "learning_rate": 1.0154394998018445e-06, + "loss": 0.6943, + "step": 59722 + }, + { + "epoch": 1.53, + "learning_rate": 1.0154118326402531e-06, + "loss": 0.3767, + "step": 59723 + }, + { + "epoch": 1.53, + "learning_rate": 1.0153841654668618e-06, + "loss": 0.6299, + "step": 59724 + }, + { + "epoch": 1.53, + "learning_rate": 1.0153564982816918e-06, + "loss": 0.6982, + "step": 59725 + }, + { + "epoch": 1.53, + "learning_rate": 1.0153288310847636e-06, + "loss": 0.7754, + "step": 59726 + }, + { + "epoch": 1.53, + "learning_rate": 1.015301163876099e-06, + "loss": 0.9277, + "step": 59727 + }, + { + "epoch": 1.53, + "learning_rate": 1.0152734966557187e-06, + "loss": 0.6104, + "step": 59728 + }, + { + "epoch": 1.53, + "learning_rate": 1.0152458294236447e-06, + "loss": 0.6729, + "step": 59729 + }, + { + "epoch": 1.53, + "learning_rate": 1.0152181621798976e-06, + "loss": 0.4128, + "step": 59730 + }, + { + "epoch": 1.53, + "learning_rate": 1.0151904949244984e-06, + "loss": 0.7397, + "step": 59731 + }, + { + "epoch": 1.53, + "learning_rate": 1.0151628276574686e-06, + "loss": 0.7109, + "step": 59732 + }, + { + "epoch": 1.53, + "learning_rate": 1.0151351603788294e-06, + "loss": 0.8369, + "step": 59733 + }, + { + "epoch": 1.53, + "learning_rate": 1.015107493088602e-06, + "loss": 0.6445, + "step": 59734 + }, + { + "epoch": 1.53, + "learning_rate": 1.0150798257868074e-06, + "loss": 0.5894, + "step": 59735 + }, + { + "epoch": 1.53, + "learning_rate": 1.0150521584734668e-06, + "loss": 0.6914, + "step": 59736 + }, + { + "epoch": 1.53, + "learning_rate": 1.0150244911486014e-06, + "loss": 0.6133, + "step": 59737 + }, + { + "epoch": 1.53, + "learning_rate": 1.0149968238122326e-06, + "loss": 0.562, + "step": 59738 + }, + { + "epoch": 1.53, + "learning_rate": 1.0149691564643813e-06, + "loss": 0.5601, + "step": 59739 + }, + { + "epoch": 1.53, + "learning_rate": 1.014941489105069e-06, + "loss": 0.7881, + "step": 59740 + }, + { + "epoch": 1.53, + "learning_rate": 1.0149138217343164e-06, + "loss": 0.6475, + "step": 59741 + }, + { + "epoch": 1.53, + "learning_rate": 1.0148861543521452e-06, + "loss": 0.5596, + "step": 59742 + }, + { + "epoch": 1.53, + "learning_rate": 1.0148584869585764e-06, + "loss": 0.8262, + "step": 59743 + }, + { + "epoch": 1.53, + "learning_rate": 1.0148308195536308e-06, + "loss": 0.6982, + "step": 59744 + }, + { + "epoch": 1.53, + "learning_rate": 1.01480315213733e-06, + "loss": 0.6211, + "step": 59745 + }, + { + "epoch": 1.53, + "learning_rate": 1.0147754847096955e-06, + "loss": 0.7422, + "step": 59746 + }, + { + "epoch": 1.53, + "learning_rate": 1.0147478172707474e-06, + "loss": 0.5957, + "step": 59747 + }, + { + "epoch": 1.53, + "learning_rate": 1.0147201498205083e-06, + "loss": 0.542, + "step": 59748 + }, + { + "epoch": 1.53, + "learning_rate": 1.0146924823589982e-06, + "loss": 0.8447, + "step": 59749 + }, + { + "epoch": 1.53, + "learning_rate": 1.0146648148862392e-06, + "loss": 0.561, + "step": 59750 + }, + { + "epoch": 1.53, + "learning_rate": 1.0146371474022517e-06, + "loss": 0.5747, + "step": 59751 + }, + { + "epoch": 1.53, + "learning_rate": 1.0146094799070573e-06, + "loss": 0.5459, + "step": 59752 + }, + { + "epoch": 1.53, + "learning_rate": 1.014581812400677e-06, + "loss": 0.7822, + "step": 59753 + }, + { + "epoch": 1.53, + "learning_rate": 1.014554144883132e-06, + "loss": 0.4893, + "step": 59754 + }, + { + "epoch": 1.53, + "learning_rate": 1.0145264773544437e-06, + "loss": 0.7236, + "step": 59755 + }, + { + "epoch": 1.53, + "learning_rate": 1.0144988098146333e-06, + "loss": 0.6313, + "step": 59756 + }, + { + "epoch": 1.53, + "learning_rate": 1.0144711422637213e-06, + "loss": 0.7207, + "step": 59757 + }, + { + "epoch": 1.53, + "learning_rate": 1.0144434747017299e-06, + "loss": 0.6455, + "step": 59758 + }, + { + "epoch": 1.53, + "learning_rate": 1.0144158071286794e-06, + "loss": 0.7314, + "step": 59759 + }, + { + "epoch": 1.53, + "learning_rate": 1.014388139544592e-06, + "loss": 0.7783, + "step": 59760 + }, + { + "epoch": 1.53, + "learning_rate": 1.0143604719494878e-06, + "loss": 0.4931, + "step": 59761 + }, + { + "epoch": 1.53, + "learning_rate": 1.0143328043433886e-06, + "loss": 0.7004, + "step": 59762 + }, + { + "epoch": 1.53, + "learning_rate": 1.014305136726315e-06, + "loss": 0.623, + "step": 59763 + }, + { + "epoch": 1.53, + "learning_rate": 1.0142774690982894e-06, + "loss": 0.79, + "step": 59764 + }, + { + "epoch": 1.53, + "learning_rate": 1.0142498014593317e-06, + "loss": 0.5896, + "step": 59765 + }, + { + "epoch": 1.53, + "learning_rate": 1.0142221338094637e-06, + "loss": 0.6836, + "step": 59766 + }, + { + "epoch": 1.53, + "learning_rate": 1.0141944661487064e-06, + "loss": 0.7207, + "step": 59767 + }, + { + "epoch": 1.53, + "learning_rate": 1.0141667984770812e-06, + "loss": 0.605, + "step": 59768 + }, + { + "epoch": 1.53, + "learning_rate": 1.0141391307946088e-06, + "loss": 0.7715, + "step": 59769 + }, + { + "epoch": 1.53, + "learning_rate": 1.014111463101311e-06, + "loss": 0.5693, + "step": 59770 + }, + { + "epoch": 1.53, + "learning_rate": 1.0140837953972088e-06, + "loss": 0.6846, + "step": 59771 + }, + { + "epoch": 1.53, + "learning_rate": 1.0140561276823229e-06, + "loss": 0.6929, + "step": 59772 + }, + { + "epoch": 1.53, + "learning_rate": 1.0140284599566752e-06, + "loss": 0.6206, + "step": 59773 + }, + { + "epoch": 1.53, + "learning_rate": 1.0140007922202862e-06, + "loss": 0.5635, + "step": 59774 + }, + { + "epoch": 1.53, + "learning_rate": 1.0139731244731779e-06, + "loss": 0.5752, + "step": 59775 + }, + { + "epoch": 1.53, + "learning_rate": 1.0139454567153707e-06, + "loss": 0.7634, + "step": 59776 + }, + { + "epoch": 1.53, + "learning_rate": 1.0139177889468864e-06, + "loss": 0.7559, + "step": 59777 + }, + { + "epoch": 1.53, + "learning_rate": 1.0138901211677456e-06, + "loss": 0.8848, + "step": 59778 + }, + { + "epoch": 1.53, + "learning_rate": 1.0138624533779698e-06, + "loss": 0.7979, + "step": 59779 + }, + { + "epoch": 1.53, + "learning_rate": 1.0138347855775801e-06, + "loss": 0.7012, + "step": 59780 + }, + { + "epoch": 1.53, + "learning_rate": 1.013807117766598e-06, + "loss": 0.8018, + "step": 59781 + }, + { + "epoch": 1.53, + "learning_rate": 1.0137794499450442e-06, + "loss": 0.6499, + "step": 59782 + }, + { + "epoch": 1.53, + "learning_rate": 1.0137517821129403e-06, + "loss": 0.626, + "step": 59783 + }, + { + "epoch": 1.53, + "learning_rate": 1.013724114270307e-06, + "loss": 0.5959, + "step": 59784 + }, + { + "epoch": 1.53, + "learning_rate": 1.0136964464171662e-06, + "loss": 0.7441, + "step": 59785 + }, + { + "epoch": 1.53, + "learning_rate": 1.0136687785535385e-06, + "loss": 0.6196, + "step": 59786 + }, + { + "epoch": 1.53, + "learning_rate": 1.0136411106794451e-06, + "loss": 0.6689, + "step": 59787 + }, + { + "epoch": 1.53, + "learning_rate": 1.0136134427949071e-06, + "loss": 0.6826, + "step": 59788 + }, + { + "epoch": 1.53, + "learning_rate": 1.0135857748999467e-06, + "loss": 0.7354, + "step": 59789 + }, + { + "epoch": 1.53, + "learning_rate": 1.0135581069945837e-06, + "loss": 0.46, + "step": 59790 + }, + { + "epoch": 1.53, + "learning_rate": 1.0135304390788398e-06, + "loss": 0.7354, + "step": 59791 + }, + { + "epoch": 1.53, + "learning_rate": 1.0135027711527367e-06, + "loss": 0.5822, + "step": 59792 + }, + { + "epoch": 1.53, + "learning_rate": 1.0134751032162946e-06, + "loss": 0.6748, + "step": 59793 + }, + { + "epoch": 1.53, + "learning_rate": 1.0134474352695358e-06, + "loss": 0.5498, + "step": 59794 + }, + { + "epoch": 1.53, + "learning_rate": 1.0134197673124805e-06, + "loss": 0.4709, + "step": 59795 + }, + { + "epoch": 1.53, + "learning_rate": 1.0133920993451506e-06, + "loss": 0.5996, + "step": 59796 + }, + { + "epoch": 1.53, + "learning_rate": 1.0133644313675667e-06, + "loss": 0.7041, + "step": 59797 + }, + { + "epoch": 1.53, + "learning_rate": 1.0133367633797504e-06, + "loss": 0.6528, + "step": 59798 + }, + { + "epoch": 1.53, + "learning_rate": 1.0133090953817228e-06, + "loss": 0.6738, + "step": 59799 + }, + { + "epoch": 1.53, + "learning_rate": 1.013281427373505e-06, + "loss": 0.5791, + "step": 59800 + }, + { + "epoch": 1.53, + "learning_rate": 1.0132537593551183e-06, + "loss": 0.6064, + "step": 59801 + }, + { + "epoch": 1.53, + "learning_rate": 1.0132260913265837e-06, + "loss": 0.7129, + "step": 59802 + }, + { + "epoch": 1.53, + "learning_rate": 1.0131984232879226e-06, + "loss": 0.6121, + "step": 59803 + }, + { + "epoch": 1.53, + "learning_rate": 1.013170755239156e-06, + "loss": 0.4087, + "step": 59804 + }, + { + "epoch": 1.53, + "learning_rate": 1.0131430871803052e-06, + "loss": 0.4971, + "step": 59805 + }, + { + "epoch": 1.53, + "learning_rate": 1.0131154191113914e-06, + "loss": 0.6846, + "step": 59806 + }, + { + "epoch": 1.53, + "learning_rate": 1.0130877510324355e-06, + "loss": 0.7686, + "step": 59807 + }, + { + "epoch": 1.53, + "learning_rate": 1.013060082943459e-06, + "loss": 0.6592, + "step": 59808 + }, + { + "epoch": 1.53, + "learning_rate": 1.0130324148444829e-06, + "loss": 0.5713, + "step": 59809 + }, + { + "epoch": 1.53, + "learning_rate": 1.0130047467355286e-06, + "loss": 0.7764, + "step": 59810 + }, + { + "epoch": 1.53, + "learning_rate": 1.0129770786166173e-06, + "loss": 0.542, + "step": 59811 + }, + { + "epoch": 1.53, + "learning_rate": 1.01294941048777e-06, + "loss": 0.5562, + "step": 59812 + }, + { + "epoch": 1.53, + "learning_rate": 1.0129217423490078e-06, + "loss": 0.4797, + "step": 59813 + }, + { + "epoch": 1.53, + "learning_rate": 1.012894074200352e-06, + "loss": 0.8652, + "step": 59814 + }, + { + "epoch": 1.53, + "learning_rate": 1.012866406041824e-06, + "loss": 0.6631, + "step": 59815 + }, + { + "epoch": 1.53, + "learning_rate": 1.0128387378734444e-06, + "loss": 0.7598, + "step": 59816 + }, + { + "epoch": 1.53, + "learning_rate": 1.0128110696952352e-06, + "loss": 0.585, + "step": 59817 + }, + { + "epoch": 1.53, + "learning_rate": 1.0127834015072168e-06, + "loss": 0.5522, + "step": 59818 + }, + { + "epoch": 1.53, + "learning_rate": 1.012755733309411e-06, + "loss": 0.4041, + "step": 59819 + }, + { + "epoch": 1.53, + "learning_rate": 1.0127280651018387e-06, + "loss": 0.5005, + "step": 59820 + }, + { + "epoch": 1.53, + "learning_rate": 1.0127003968845212e-06, + "loss": 0.5854, + "step": 59821 + }, + { + "epoch": 1.53, + "learning_rate": 1.0126727286574793e-06, + "loss": 0.6631, + "step": 59822 + }, + { + "epoch": 1.53, + "learning_rate": 1.0126450604207346e-06, + "loss": 0.7656, + "step": 59823 + }, + { + "epoch": 1.53, + "learning_rate": 1.012617392174308e-06, + "loss": 0.4229, + "step": 59824 + }, + { + "epoch": 1.53, + "learning_rate": 1.0125897239182213e-06, + "loss": 0.6963, + "step": 59825 + }, + { + "epoch": 1.53, + "learning_rate": 1.0125620556524948e-06, + "loss": 0.8701, + "step": 59826 + }, + { + "epoch": 1.53, + "learning_rate": 1.01253438737715e-06, + "loss": 0.4637, + "step": 59827 + }, + { + "epoch": 1.53, + "learning_rate": 1.0125067190922086e-06, + "loss": 0.7129, + "step": 59828 + }, + { + "epoch": 1.53, + "learning_rate": 1.0124790507976912e-06, + "loss": 0.8867, + "step": 59829 + }, + { + "epoch": 1.53, + "learning_rate": 1.0124513824936193e-06, + "loss": 0.5278, + "step": 59830 + }, + { + "epoch": 1.53, + "learning_rate": 1.0124237141800139e-06, + "loss": 0.7588, + "step": 59831 + }, + { + "epoch": 1.53, + "learning_rate": 1.012396045856896e-06, + "loss": 0.5566, + "step": 59832 + }, + { + "epoch": 1.53, + "learning_rate": 1.0123683775242873e-06, + "loss": 0.6914, + "step": 59833 + }, + { + "epoch": 1.53, + "learning_rate": 1.0123407091822084e-06, + "loss": 0.6187, + "step": 59834 + }, + { + "epoch": 1.53, + "learning_rate": 1.012313040830681e-06, + "loss": 0.71, + "step": 59835 + }, + { + "epoch": 1.53, + "learning_rate": 1.0122853724697263e-06, + "loss": 0.5798, + "step": 59836 + }, + { + "epoch": 1.53, + "learning_rate": 1.0122577040993647e-06, + "loss": 0.4875, + "step": 59837 + }, + { + "epoch": 1.53, + "learning_rate": 1.0122300357196183e-06, + "loss": 0.8237, + "step": 59838 + }, + { + "epoch": 1.53, + "learning_rate": 1.012202367330508e-06, + "loss": 0.707, + "step": 59839 + }, + { + "epoch": 1.53, + "learning_rate": 1.0121746989320547e-06, + "loss": 0.6797, + "step": 59840 + }, + { + "epoch": 1.53, + "learning_rate": 1.0121470305242799e-06, + "loss": 0.5013, + "step": 59841 + }, + { + "epoch": 1.53, + "learning_rate": 1.0121193621072047e-06, + "loss": 0.574, + "step": 59842 + }, + { + "epoch": 1.53, + "learning_rate": 1.0120916936808498e-06, + "loss": 0.8086, + "step": 59843 + }, + { + "epoch": 1.53, + "learning_rate": 1.0120640252452377e-06, + "loss": 0.7354, + "step": 59844 + }, + { + "epoch": 1.53, + "learning_rate": 1.0120363568003883e-06, + "loss": 0.5576, + "step": 59845 + }, + { + "epoch": 1.53, + "learning_rate": 1.012008688346323e-06, + "loss": 0.5605, + "step": 59846 + }, + { + "epoch": 1.53, + "learning_rate": 1.0119810198830635e-06, + "loss": 0.7563, + "step": 59847 + }, + { + "epoch": 1.53, + "learning_rate": 1.0119533514106304e-06, + "loss": 0.6318, + "step": 59848 + }, + { + "epoch": 1.53, + "learning_rate": 1.0119256829290454e-06, + "loss": 0.5859, + "step": 59849 + }, + { + "epoch": 1.53, + "learning_rate": 1.0118980144383296e-06, + "loss": 0.6094, + "step": 59850 + }, + { + "epoch": 1.53, + "learning_rate": 1.0118703459385037e-06, + "loss": 0.6797, + "step": 59851 + }, + { + "epoch": 1.53, + "learning_rate": 1.0118426774295894e-06, + "loss": 0.5565, + "step": 59852 + }, + { + "epoch": 1.53, + "learning_rate": 1.0118150089116076e-06, + "loss": 0.5762, + "step": 59853 + }, + { + "epoch": 1.53, + "learning_rate": 1.0117873403845797e-06, + "loss": 0.6685, + "step": 59854 + }, + { + "epoch": 1.53, + "learning_rate": 1.0117596718485268e-06, + "loss": 0.71, + "step": 59855 + }, + { + "epoch": 1.53, + "learning_rate": 1.0117320033034698e-06, + "loss": 0.793, + "step": 59856 + }, + { + "epoch": 1.53, + "learning_rate": 1.0117043347494304e-06, + "loss": 0.6787, + "step": 59857 + }, + { + "epoch": 1.53, + "learning_rate": 1.0116766661864295e-06, + "loss": 0.7119, + "step": 59858 + }, + { + "epoch": 1.53, + "learning_rate": 1.0116489976144885e-06, + "loss": 0.5421, + "step": 59859 + }, + { + "epoch": 1.53, + "learning_rate": 1.011621329033628e-06, + "loss": 0.7754, + "step": 59860 + }, + { + "epoch": 1.53, + "learning_rate": 1.0115936604438697e-06, + "loss": 0.627, + "step": 59861 + }, + { + "epoch": 1.53, + "learning_rate": 1.0115659918452347e-06, + "loss": 0.6797, + "step": 59862 + }, + { + "epoch": 1.53, + "learning_rate": 1.0115383232377441e-06, + "loss": 0.6924, + "step": 59863 + }, + { + "epoch": 1.53, + "learning_rate": 1.0115106546214194e-06, + "loss": 0.7217, + "step": 59864 + }, + { + "epoch": 1.53, + "learning_rate": 1.0114829859962814e-06, + "loss": 0.4402, + "step": 59865 + }, + { + "epoch": 1.53, + "learning_rate": 1.0114553173623512e-06, + "loss": 0.5667, + "step": 59866 + }, + { + "epoch": 1.53, + "learning_rate": 1.0114276487196505e-06, + "loss": 0.3584, + "step": 59867 + }, + { + "epoch": 1.53, + "learning_rate": 1.0113999800681998e-06, + "loss": 0.554, + "step": 59868 + }, + { + "epoch": 1.53, + "learning_rate": 1.011372311408021e-06, + "loss": 0.7383, + "step": 59869 + }, + { + "epoch": 1.53, + "learning_rate": 1.0113446427391348e-06, + "loss": 0.8745, + "step": 59870 + }, + { + "epoch": 1.53, + "learning_rate": 1.0113169740615625e-06, + "loss": 0.5791, + "step": 59871 + }, + { + "epoch": 1.53, + "learning_rate": 1.0112893053753254e-06, + "loss": 0.748, + "step": 59872 + }, + { + "epoch": 1.53, + "learning_rate": 1.0112616366804446e-06, + "loss": 0.6719, + "step": 59873 + }, + { + "epoch": 1.53, + "learning_rate": 1.0112339679769414e-06, + "loss": 0.8779, + "step": 59874 + }, + { + "epoch": 1.53, + "learning_rate": 1.0112062992648365e-06, + "loss": 0.6069, + "step": 59875 + }, + { + "epoch": 1.53, + "learning_rate": 1.0111786305441517e-06, + "loss": 0.5693, + "step": 59876 + }, + { + "epoch": 1.53, + "learning_rate": 1.0111509618149078e-06, + "loss": 0.7559, + "step": 59877 + }, + { + "epoch": 1.53, + "learning_rate": 1.011123293077126e-06, + "loss": 0.6758, + "step": 59878 + }, + { + "epoch": 1.53, + "learning_rate": 1.011095624330828e-06, + "loss": 0.5947, + "step": 59879 + }, + { + "epoch": 1.53, + "learning_rate": 1.0110679555760343e-06, + "loss": 0.5295, + "step": 59880 + }, + { + "epoch": 1.53, + "learning_rate": 1.0110402868127666e-06, + "loss": 0.6553, + "step": 59881 + }, + { + "epoch": 1.53, + "learning_rate": 1.0110126180410457e-06, + "loss": 0.6274, + "step": 59882 + }, + { + "epoch": 1.53, + "learning_rate": 1.0109849492608928e-06, + "loss": 0.7808, + "step": 59883 + }, + { + "epoch": 1.53, + "learning_rate": 1.0109572804723297e-06, + "loss": 0.5605, + "step": 59884 + }, + { + "epoch": 1.53, + "learning_rate": 1.0109296116753767e-06, + "loss": 0.7705, + "step": 59885 + }, + { + "epoch": 1.53, + "learning_rate": 1.0109019428700555e-06, + "loss": 0.5918, + "step": 59886 + }, + { + "epoch": 1.53, + "learning_rate": 1.0108742740563872e-06, + "loss": 0.498, + "step": 59887 + }, + { + "epoch": 1.53, + "learning_rate": 1.0108466052343932e-06, + "loss": 0.6582, + "step": 59888 + }, + { + "epoch": 1.53, + "learning_rate": 1.0108189364040942e-06, + "loss": 0.7773, + "step": 59889 + }, + { + "epoch": 1.54, + "learning_rate": 1.0107912675655117e-06, + "loss": 0.7637, + "step": 59890 + }, + { + "epoch": 1.54, + "learning_rate": 1.0107635987186666e-06, + "loss": 0.6602, + "step": 59891 + }, + { + "epoch": 1.54, + "learning_rate": 1.0107359298635807e-06, + "loss": 0.6445, + "step": 59892 + }, + { + "epoch": 1.54, + "learning_rate": 1.0107082610002744e-06, + "loss": 0.7793, + "step": 59893 + }, + { + "epoch": 1.54, + "learning_rate": 1.0106805921287698e-06, + "loss": 0.5635, + "step": 59894 + }, + { + "epoch": 1.54, + "learning_rate": 1.0106529232490871e-06, + "loss": 0.7744, + "step": 59895 + }, + { + "epoch": 1.54, + "learning_rate": 1.0106252543612482e-06, + "loss": 0.6045, + "step": 59896 + }, + { + "epoch": 1.54, + "learning_rate": 1.0105975854652736e-06, + "loss": 0.6572, + "step": 59897 + }, + { + "epoch": 1.54, + "learning_rate": 1.0105699165611854e-06, + "loss": 0.6309, + "step": 59898 + }, + { + "epoch": 1.54, + "learning_rate": 1.0105422476490042e-06, + "loss": 0.8232, + "step": 59899 + }, + { + "epoch": 1.54, + "learning_rate": 1.010514578728751e-06, + "loss": 0.7803, + "step": 59900 + }, + { + "epoch": 1.54, + "learning_rate": 1.0104869098004476e-06, + "loss": 0.9287, + "step": 59901 + }, + { + "epoch": 1.54, + "learning_rate": 1.010459240864115e-06, + "loss": 0.6147, + "step": 59902 + }, + { + "epoch": 1.54, + "learning_rate": 1.0104315719197736e-06, + "loss": 0.668, + "step": 59903 + }, + { + "epoch": 1.54, + "learning_rate": 1.0104039029674455e-06, + "loss": 0.6719, + "step": 59904 + }, + { + "epoch": 1.54, + "learning_rate": 1.010376234007152e-06, + "loss": 0.5923, + "step": 59905 + }, + { + "epoch": 1.54, + "learning_rate": 1.0103485650389135e-06, + "loss": 0.6104, + "step": 59906 + }, + { + "epoch": 1.54, + "learning_rate": 1.0103208960627517e-06, + "loss": 0.4648, + "step": 59907 + }, + { + "epoch": 1.54, + "learning_rate": 1.0102932270786874e-06, + "loss": 0.5532, + "step": 59908 + }, + { + "epoch": 1.54, + "learning_rate": 1.0102655580867428e-06, + "loss": 0.792, + "step": 59909 + }, + { + "epoch": 1.54, + "learning_rate": 1.0102378890869375e-06, + "loss": 0.6943, + "step": 59910 + }, + { + "epoch": 1.54, + "learning_rate": 1.0102102200792938e-06, + "loss": 0.7305, + "step": 59911 + }, + { + "epoch": 1.54, + "learning_rate": 1.0101825510638326e-06, + "loss": 0.3728, + "step": 59912 + }, + { + "epoch": 1.54, + "learning_rate": 1.0101548820405753e-06, + "loss": 0.4618, + "step": 59913 + }, + { + "epoch": 1.54, + "learning_rate": 1.0101272130095429e-06, + "loss": 0.7852, + "step": 59914 + }, + { + "epoch": 1.54, + "learning_rate": 1.0100995439707565e-06, + "loss": 0.6309, + "step": 59915 + }, + { + "epoch": 1.54, + "learning_rate": 1.010071874924237e-06, + "loss": 0.5938, + "step": 59916 + }, + { + "epoch": 1.54, + "learning_rate": 1.0100442058700062e-06, + "loss": 0.6631, + "step": 59917 + }, + { + "epoch": 1.54, + "learning_rate": 1.0100165368080848e-06, + "loss": 0.502, + "step": 59918 + }, + { + "epoch": 1.54, + "learning_rate": 1.0099888677384944e-06, + "loss": 0.8232, + "step": 59919 + }, + { + "epoch": 1.54, + "learning_rate": 1.0099611986612559e-06, + "loss": 0.6885, + "step": 59920 + }, + { + "epoch": 1.54, + "learning_rate": 1.009933529576391e-06, + "loss": 0.4452, + "step": 59921 + }, + { + "epoch": 1.54, + "learning_rate": 1.0099058604839196e-06, + "loss": 0.5957, + "step": 59922 + }, + { + "epoch": 1.54, + "learning_rate": 1.0098781913838646e-06, + "loss": 0.7383, + "step": 59923 + }, + { + "epoch": 1.54, + "learning_rate": 1.009850522276246e-06, + "loss": 0.3878, + "step": 59924 + }, + { + "epoch": 1.54, + "learning_rate": 1.0098228531610848e-06, + "loss": 0.7441, + "step": 59925 + }, + { + "epoch": 1.54, + "learning_rate": 1.0097951840384034e-06, + "loss": 0.5552, + "step": 59926 + }, + { + "epoch": 1.54, + "learning_rate": 1.009767514908222e-06, + "loss": 0.79, + "step": 59927 + }, + { + "epoch": 1.54, + "learning_rate": 1.009739845770562e-06, + "loss": 0.7598, + "step": 59928 + }, + { + "epoch": 1.54, + "learning_rate": 1.0097121766254449e-06, + "loss": 0.6198, + "step": 59929 + }, + { + "epoch": 1.54, + "learning_rate": 1.0096845074728912e-06, + "loss": 0.7686, + "step": 59930 + }, + { + "epoch": 1.54, + "learning_rate": 1.0096568383129227e-06, + "loss": 0.6787, + "step": 59931 + }, + { + "epoch": 1.54, + "learning_rate": 1.0096291691455606e-06, + "loss": 0.5408, + "step": 59932 + }, + { + "epoch": 1.54, + "learning_rate": 1.0096014999708256e-06, + "loss": 0.6348, + "step": 59933 + }, + { + "epoch": 1.54, + "learning_rate": 1.0095738307887397e-06, + "loss": 0.6758, + "step": 59934 + }, + { + "epoch": 1.54, + "learning_rate": 1.0095461615993231e-06, + "loss": 0.6484, + "step": 59935 + }, + { + "epoch": 1.54, + "learning_rate": 1.0095184924025975e-06, + "loss": 0.7979, + "step": 59936 + }, + { + "epoch": 1.54, + "learning_rate": 1.009490823198584e-06, + "loss": 0.5439, + "step": 59937 + }, + { + "epoch": 1.54, + "learning_rate": 1.009463153987304e-06, + "loss": 0.5127, + "step": 59938 + }, + { + "epoch": 1.54, + "learning_rate": 1.0094354847687783e-06, + "loss": 0.5957, + "step": 59939 + }, + { + "epoch": 1.54, + "learning_rate": 1.0094078155430285e-06, + "loss": 0.6279, + "step": 59940 + }, + { + "epoch": 1.54, + "learning_rate": 1.0093801463100753e-06, + "loss": 0.751, + "step": 59941 + }, + { + "epoch": 1.54, + "learning_rate": 1.0093524770699403e-06, + "loss": 0.6191, + "step": 59942 + }, + { + "epoch": 1.54, + "learning_rate": 1.0093248078226444e-06, + "loss": 0.6719, + "step": 59943 + }, + { + "epoch": 1.54, + "learning_rate": 1.009297138568209e-06, + "loss": 0.6973, + "step": 59944 + }, + { + "epoch": 1.54, + "learning_rate": 1.0092694693066555e-06, + "loss": 0.6719, + "step": 59945 + }, + { + "epoch": 1.54, + "learning_rate": 1.0092418000380043e-06, + "loss": 0.5933, + "step": 59946 + }, + { + "epoch": 1.54, + "learning_rate": 1.0092141307622774e-06, + "loss": 0.7427, + "step": 59947 + }, + { + "epoch": 1.54, + "learning_rate": 1.0091864614794955e-06, + "loss": 0.7363, + "step": 59948 + }, + { + "epoch": 1.54, + "learning_rate": 1.0091587921896804e-06, + "loss": 0.6807, + "step": 59949 + }, + { + "epoch": 1.54, + "learning_rate": 1.0091311228928522e-06, + "loss": 0.6475, + "step": 59950 + }, + { + "epoch": 1.54, + "learning_rate": 1.009103453589033e-06, + "loss": 0.6187, + "step": 59951 + }, + { + "epoch": 1.54, + "learning_rate": 1.0090757842782436e-06, + "loss": 0.5903, + "step": 59952 + }, + { + "epoch": 1.54, + "learning_rate": 1.0090481149605055e-06, + "loss": 0.4103, + "step": 59953 + }, + { + "epoch": 1.54, + "learning_rate": 1.0090204456358396e-06, + "loss": 0.5996, + "step": 59954 + }, + { + "epoch": 1.54, + "learning_rate": 1.0089927763042672e-06, + "loss": 0.7881, + "step": 59955 + }, + { + "epoch": 1.54, + "learning_rate": 1.0089651069658093e-06, + "loss": 0.748, + "step": 59956 + }, + { + "epoch": 1.54, + "learning_rate": 1.0089374376204872e-06, + "loss": 0.5623, + "step": 59957 + }, + { + "epoch": 1.54, + "learning_rate": 1.008909768268322e-06, + "loss": 0.6899, + "step": 59958 + }, + { + "epoch": 1.54, + "learning_rate": 1.0088820989093357e-06, + "loss": 0.8389, + "step": 59959 + }, + { + "epoch": 1.54, + "learning_rate": 1.008854429543548e-06, + "loss": 0.5933, + "step": 59960 + }, + { + "epoch": 1.54, + "learning_rate": 1.0088267601709813e-06, + "loss": 0.6293, + "step": 59961 + }, + { + "epoch": 1.54, + "learning_rate": 1.008799090791656e-06, + "loss": 0.7607, + "step": 59962 + }, + { + "epoch": 1.54, + "learning_rate": 1.008771421405594e-06, + "loss": 0.5068, + "step": 59963 + }, + { + "epoch": 1.54, + "learning_rate": 1.008743752012816e-06, + "loss": 0.6787, + "step": 59964 + }, + { + "epoch": 1.54, + "learning_rate": 1.0087160826133434e-06, + "loss": 0.5649, + "step": 59965 + }, + { + "epoch": 1.54, + "learning_rate": 1.0086884132071972e-06, + "loss": 0.6338, + "step": 59966 + }, + { + "epoch": 1.54, + "learning_rate": 1.0086607437943985e-06, + "loss": 0.7261, + "step": 59967 + }, + { + "epoch": 1.54, + "learning_rate": 1.0086330743749687e-06, + "loss": 0.5742, + "step": 59968 + }, + { + "epoch": 1.54, + "learning_rate": 1.0086054049489292e-06, + "loss": 0.6279, + "step": 59969 + }, + { + "epoch": 1.54, + "learning_rate": 1.008577735516301e-06, + "loss": 0.5205, + "step": 59970 + }, + { + "epoch": 1.54, + "learning_rate": 1.0085500660771049e-06, + "loss": 0.5962, + "step": 59971 + }, + { + "epoch": 1.54, + "learning_rate": 1.0085223966313626e-06, + "loss": 0.7822, + "step": 59972 + }, + { + "epoch": 1.54, + "learning_rate": 1.008494727179095e-06, + "loss": 0.8594, + "step": 59973 + }, + { + "epoch": 1.54, + "learning_rate": 1.0084670577203236e-06, + "loss": 0.7695, + "step": 59974 + }, + { + "epoch": 1.54, + "learning_rate": 1.008439388255069e-06, + "loss": 0.6782, + "step": 59975 + }, + { + "epoch": 1.54, + "learning_rate": 1.008411718783353e-06, + "loss": 0.5991, + "step": 59976 + }, + { + "epoch": 1.54, + "learning_rate": 1.0083840493051964e-06, + "loss": 0.6533, + "step": 59977 + }, + { + "epoch": 1.54, + "learning_rate": 1.0083563798206206e-06, + "loss": 0.6826, + "step": 59978 + }, + { + "epoch": 1.54, + "learning_rate": 1.0083287103296467e-06, + "loss": 0.7334, + "step": 59979 + }, + { + "epoch": 1.54, + "learning_rate": 1.008301040832296e-06, + "loss": 0.6279, + "step": 59980 + }, + { + "epoch": 1.54, + "learning_rate": 1.0082733713285893e-06, + "loss": 0.6904, + "step": 59981 + }, + { + "epoch": 1.54, + "learning_rate": 1.0082457018185483e-06, + "loss": 0.5288, + "step": 59982 + }, + { + "epoch": 1.54, + "learning_rate": 1.0082180323021937e-06, + "loss": 0.5874, + "step": 59983 + }, + { + "epoch": 1.54, + "learning_rate": 1.0081903627795474e-06, + "loss": 0.6235, + "step": 59984 + }, + { + "epoch": 1.54, + "learning_rate": 1.0081626932506297e-06, + "loss": 0.5815, + "step": 59985 + }, + { + "epoch": 1.54, + "learning_rate": 1.0081350237154625e-06, + "loss": 0.7266, + "step": 59986 + }, + { + "epoch": 1.54, + "learning_rate": 1.0081073541740663e-06, + "loss": 0.5562, + "step": 59987 + }, + { + "epoch": 1.54, + "learning_rate": 1.008079684626463e-06, + "loss": 0.6802, + "step": 59988 + }, + { + "epoch": 1.54, + "learning_rate": 1.0080520150726731e-06, + "loss": 0.6147, + "step": 59989 + }, + { + "epoch": 1.54, + "learning_rate": 1.0080243455127184e-06, + "loss": 0.6729, + "step": 59990 + }, + { + "epoch": 1.54, + "learning_rate": 1.00799667594662e-06, + "loss": 0.625, + "step": 59991 + }, + { + "epoch": 1.54, + "learning_rate": 1.0079690063743984e-06, + "loss": 0.5186, + "step": 59992 + }, + { + "epoch": 1.54, + "learning_rate": 1.0079413367960756e-06, + "loss": 0.5469, + "step": 59993 + }, + { + "epoch": 1.54, + "learning_rate": 1.0079136672116725e-06, + "loss": 0.5332, + "step": 59994 + }, + { + "epoch": 1.54, + "learning_rate": 1.0078859976212106e-06, + "loss": 0.6523, + "step": 59995 + }, + { + "epoch": 1.54, + "learning_rate": 1.0078583280247102e-06, + "loss": 0.5415, + "step": 59996 + }, + { + "epoch": 1.54, + "learning_rate": 1.0078306584221934e-06, + "loss": 0.4824, + "step": 59997 + }, + { + "epoch": 1.54, + "learning_rate": 1.0078029888136808e-06, + "loss": 0.7109, + "step": 59998 + }, + { + "epoch": 1.54, + "learning_rate": 1.007775319199194e-06, + "loss": 0.6172, + "step": 59999 + }, + { + "epoch": 1.54, + "learning_rate": 1.0077476495787537e-06, + "loss": 0.7861, + "step": 60000 + }, + { + "epoch": 1.54, + "learning_rate": 1.0077199799523817e-06, + "loss": 0.6147, + "step": 60001 + }, + { + "epoch": 1.54, + "learning_rate": 1.0076923103200988e-06, + "loss": 0.6504, + "step": 60002 + }, + { + "epoch": 1.54, + "learning_rate": 1.007664640681926e-06, + "loss": 0.6758, + "step": 60003 + }, + { + "epoch": 1.54, + "learning_rate": 1.007636971037885e-06, + "loss": 0.646, + "step": 60004 + }, + { + "epoch": 1.54, + "learning_rate": 1.0076093013879966e-06, + "loss": 0.5085, + "step": 60005 + }, + { + "epoch": 1.54, + "learning_rate": 1.0075816317322823e-06, + "loss": 0.6406, + "step": 60006 + }, + { + "epoch": 1.54, + "learning_rate": 1.007553962070763e-06, + "loss": 0.5791, + "step": 60007 + }, + { + "epoch": 1.54, + "learning_rate": 1.0075262924034598e-06, + "loss": 0.5474, + "step": 60008 + }, + { + "epoch": 1.54, + "learning_rate": 1.0074986227303941e-06, + "loss": 0.5283, + "step": 60009 + }, + { + "epoch": 1.54, + "learning_rate": 1.0074709530515873e-06, + "loss": 0.5752, + "step": 60010 + }, + { + "epoch": 1.54, + "learning_rate": 1.0074432833670603e-06, + "loss": 0.7285, + "step": 60011 + }, + { + "epoch": 1.54, + "learning_rate": 1.0074156136768338e-06, + "loss": 0.6914, + "step": 60012 + }, + { + "epoch": 1.54, + "learning_rate": 1.00738794398093e-06, + "loss": 0.7441, + "step": 60013 + }, + { + "epoch": 1.54, + "learning_rate": 1.0073602742793697e-06, + "loss": 0.6746, + "step": 60014 + }, + { + "epoch": 1.54, + "learning_rate": 1.0073326045721735e-06, + "loss": 0.5845, + "step": 60015 + }, + { + "epoch": 1.54, + "learning_rate": 1.0073049348593634e-06, + "loss": 0.5962, + "step": 60016 + }, + { + "epoch": 1.54, + "learning_rate": 1.0072772651409601e-06, + "loss": 0.6367, + "step": 60017 + }, + { + "epoch": 1.54, + "learning_rate": 1.007249595416985e-06, + "loss": 0.4041, + "step": 60018 + }, + { + "epoch": 1.54, + "learning_rate": 1.0072219256874594e-06, + "loss": 0.6875, + "step": 60019 + }, + { + "epoch": 1.54, + "learning_rate": 1.0071942559524044e-06, + "loss": 0.5161, + "step": 60020 + }, + { + "epoch": 1.54, + "learning_rate": 1.0071665862118406e-06, + "loss": 0.7578, + "step": 60021 + }, + { + "epoch": 1.54, + "learning_rate": 1.0071389164657898e-06, + "loss": 0.6685, + "step": 60022 + }, + { + "epoch": 1.54, + "learning_rate": 1.007111246714273e-06, + "loss": 0.7705, + "step": 60023 + }, + { + "epoch": 1.54, + "learning_rate": 1.0070835769573118e-06, + "loss": 0.5806, + "step": 60024 + }, + { + "epoch": 1.54, + "learning_rate": 1.0070559071949267e-06, + "loss": 0.5693, + "step": 60025 + }, + { + "epoch": 1.54, + "learning_rate": 1.0070282374271395e-06, + "loss": 0.6201, + "step": 60026 + }, + { + "epoch": 1.54, + "learning_rate": 1.0070005676539707e-06, + "loss": 0.8076, + "step": 60027 + }, + { + "epoch": 1.54, + "learning_rate": 1.0069728978754423e-06, + "loss": 0.5425, + "step": 60028 + }, + { + "epoch": 1.54, + "learning_rate": 1.006945228091575e-06, + "loss": 0.7354, + "step": 60029 + }, + { + "epoch": 1.54, + "learning_rate": 1.0069175583023901e-06, + "loss": 0.6104, + "step": 60030 + }, + { + "epoch": 1.54, + "learning_rate": 1.0068898885079085e-06, + "loss": 0.5293, + "step": 60031 + }, + { + "epoch": 1.54, + "learning_rate": 1.0068622187081517e-06, + "loss": 0.5615, + "step": 60032 + }, + { + "epoch": 1.54, + "learning_rate": 1.0068345489031406e-06, + "loss": 0.5, + "step": 60033 + }, + { + "epoch": 1.54, + "learning_rate": 1.006806879092897e-06, + "loss": 0.5669, + "step": 60034 + }, + { + "epoch": 1.54, + "learning_rate": 1.0067792092774417e-06, + "loss": 0.6621, + "step": 60035 + }, + { + "epoch": 1.54, + "learning_rate": 1.0067515394567957e-06, + "loss": 0.6626, + "step": 60036 + }, + { + "epoch": 1.54, + "learning_rate": 1.0067238696309804e-06, + "loss": 0.7451, + "step": 60037 + }, + { + "epoch": 1.54, + "learning_rate": 1.006696199800017e-06, + "loss": 0.6069, + "step": 60038 + }, + { + "epoch": 1.54, + "learning_rate": 1.0066685299639264e-06, + "loss": 0.4805, + "step": 60039 + }, + { + "epoch": 1.54, + "learning_rate": 1.00664086012273e-06, + "loss": 0.7539, + "step": 60040 + }, + { + "epoch": 1.54, + "learning_rate": 1.0066131902764491e-06, + "loss": 0.7568, + "step": 60041 + }, + { + "epoch": 1.54, + "learning_rate": 1.0065855204251049e-06, + "loss": 0.5173, + "step": 60042 + }, + { + "epoch": 1.54, + "learning_rate": 1.0065578505687185e-06, + "loss": 0.6086, + "step": 60043 + }, + { + "epoch": 1.54, + "learning_rate": 1.006530180707311e-06, + "loss": 0.473, + "step": 60044 + }, + { + "epoch": 1.54, + "learning_rate": 1.0065025108409038e-06, + "loss": 0.6768, + "step": 60045 + }, + { + "epoch": 1.54, + "learning_rate": 1.0064748409695173e-06, + "loss": 0.605, + "step": 60046 + }, + { + "epoch": 1.54, + "learning_rate": 1.006447171093174e-06, + "loss": 0.627, + "step": 60047 + }, + { + "epoch": 1.54, + "learning_rate": 1.0064195012118939e-06, + "loss": 0.4822, + "step": 60048 + }, + { + "epoch": 1.54, + "learning_rate": 1.0063918313256991e-06, + "loss": 0.4761, + "step": 60049 + }, + { + "epoch": 1.54, + "learning_rate": 1.0063641614346102e-06, + "loss": 0.6006, + "step": 60050 + }, + { + "epoch": 1.54, + "learning_rate": 1.0063364915386485e-06, + "loss": 0.6597, + "step": 60051 + }, + { + "epoch": 1.54, + "learning_rate": 1.0063088216378352e-06, + "loss": 0.7993, + "step": 60052 + }, + { + "epoch": 1.54, + "learning_rate": 1.0062811517321917e-06, + "loss": 0.4128, + "step": 60053 + }, + { + "epoch": 1.54, + "learning_rate": 1.006253481821739e-06, + "loss": 0.5306, + "step": 60054 + }, + { + "epoch": 1.54, + "learning_rate": 1.0062258119064984e-06, + "loss": 0.6035, + "step": 60055 + }, + { + "epoch": 1.54, + "learning_rate": 1.0061981419864905e-06, + "loss": 0.6465, + "step": 60056 + }, + { + "epoch": 1.54, + "learning_rate": 1.0061704720617375e-06, + "loss": 0.6089, + "step": 60057 + }, + { + "epoch": 1.54, + "learning_rate": 1.0061428021322596e-06, + "loss": 0.6396, + "step": 60058 + }, + { + "epoch": 1.54, + "learning_rate": 1.0061151321980787e-06, + "loss": 0.6079, + "step": 60059 + }, + { + "epoch": 1.54, + "learning_rate": 1.0060874622592156e-06, + "loss": 0.6519, + "step": 60060 + }, + { + "epoch": 1.54, + "learning_rate": 1.0060597923156918e-06, + "loss": 0.7021, + "step": 60061 + }, + { + "epoch": 1.54, + "learning_rate": 1.006032122367528e-06, + "loss": 0.6455, + "step": 60062 + }, + { + "epoch": 1.54, + "learning_rate": 1.0060044524147457e-06, + "loss": 0.7363, + "step": 60063 + }, + { + "epoch": 1.54, + "learning_rate": 1.0059767824573667e-06, + "loss": 0.5117, + "step": 60064 + }, + { + "epoch": 1.54, + "learning_rate": 1.005949112495411e-06, + "loss": 0.4927, + "step": 60065 + }, + { + "epoch": 1.54, + "learning_rate": 1.0059214425289003e-06, + "loss": 0.7402, + "step": 60066 + }, + { + "epoch": 1.54, + "learning_rate": 1.0058937725578557e-06, + "loss": 0.7021, + "step": 60067 + }, + { + "epoch": 1.54, + "learning_rate": 1.005866102582299e-06, + "loss": 0.5708, + "step": 60068 + }, + { + "epoch": 1.54, + "learning_rate": 1.0058384326022506e-06, + "loss": 0.7539, + "step": 60069 + }, + { + "epoch": 1.54, + "learning_rate": 1.0058107626177323e-06, + "loss": 0.6787, + "step": 60070 + }, + { + "epoch": 1.54, + "learning_rate": 1.0057830926287645e-06, + "loss": 0.5649, + "step": 60071 + }, + { + "epoch": 1.54, + "learning_rate": 1.005755422635369e-06, + "loss": 0.6182, + "step": 60072 + }, + { + "epoch": 1.54, + "learning_rate": 1.0057277526375668e-06, + "loss": 0.6313, + "step": 60073 + }, + { + "epoch": 1.54, + "learning_rate": 1.0057000826353796e-06, + "loss": 0.6309, + "step": 60074 + }, + { + "epoch": 1.54, + "learning_rate": 1.0056724126288276e-06, + "loss": 0.5007, + "step": 60075 + }, + { + "epoch": 1.54, + "learning_rate": 1.0056447426179326e-06, + "loss": 0.7012, + "step": 60076 + }, + { + "epoch": 1.54, + "learning_rate": 1.0056170726027157e-06, + "loss": 0.6748, + "step": 60077 + }, + { + "epoch": 1.54, + "learning_rate": 1.005589402583198e-06, + "loss": 0.7627, + "step": 60078 + }, + { + "epoch": 1.54, + "learning_rate": 1.0055617325594007e-06, + "loss": 0.5957, + "step": 60079 + }, + { + "epoch": 1.54, + "learning_rate": 1.005534062531345e-06, + "loss": 0.7061, + "step": 60080 + }, + { + "epoch": 1.54, + "learning_rate": 1.0055063924990526e-06, + "loss": 0.5654, + "step": 60081 + }, + { + "epoch": 1.54, + "learning_rate": 1.0054787224625436e-06, + "loss": 0.5459, + "step": 60082 + }, + { + "epoch": 1.54, + "learning_rate": 1.0054510524218402e-06, + "loss": 0.7686, + "step": 60083 + }, + { + "epoch": 1.54, + "learning_rate": 1.0054233823769632e-06, + "loss": 0.6733, + "step": 60084 + }, + { + "epoch": 1.54, + "learning_rate": 1.0053957123279337e-06, + "loss": 0.7705, + "step": 60085 + }, + { + "epoch": 1.54, + "learning_rate": 1.0053680422747727e-06, + "loss": 0.6714, + "step": 60086 + }, + { + "epoch": 1.54, + "learning_rate": 1.0053403722175018e-06, + "loss": 0.4596, + "step": 60087 + }, + { + "epoch": 1.54, + "learning_rate": 1.005312702156142e-06, + "loss": 0.8486, + "step": 60088 + }, + { + "epoch": 1.54, + "learning_rate": 1.0052850320907147e-06, + "loss": 0.5015, + "step": 60089 + }, + { + "epoch": 1.54, + "learning_rate": 1.0052573620212405e-06, + "loss": 0.481, + "step": 60090 + }, + { + "epoch": 1.54, + "learning_rate": 1.0052296919477415e-06, + "loss": 0.5908, + "step": 60091 + }, + { + "epoch": 1.54, + "learning_rate": 1.005202021870238e-06, + "loss": 0.5354, + "step": 60092 + }, + { + "epoch": 1.54, + "learning_rate": 1.0051743517887517e-06, + "loss": 0.6914, + "step": 60093 + }, + { + "epoch": 1.54, + "learning_rate": 1.0051466817033035e-06, + "loss": 0.6006, + "step": 60094 + }, + { + "epoch": 1.54, + "learning_rate": 1.0051190116139148e-06, + "loss": 0.6738, + "step": 60095 + }, + { + "epoch": 1.54, + "learning_rate": 1.0050913415206065e-06, + "loss": 0.6233, + "step": 60096 + }, + { + "epoch": 1.54, + "learning_rate": 1.0050636714234004e-06, + "loss": 0.6709, + "step": 60097 + }, + { + "epoch": 1.54, + "learning_rate": 1.005036001322317e-06, + "loss": 0.5103, + "step": 60098 + }, + { + "epoch": 1.54, + "learning_rate": 1.0050083312173778e-06, + "loss": 0.6895, + "step": 60099 + }, + { + "epoch": 1.54, + "learning_rate": 1.004980661108604e-06, + "loss": 0.7451, + "step": 60100 + }, + { + "epoch": 1.54, + "learning_rate": 1.0049529909960168e-06, + "loss": 0.6064, + "step": 60101 + }, + { + "epoch": 1.54, + "learning_rate": 1.0049253208796372e-06, + "loss": 0.8926, + "step": 60102 + }, + { + "epoch": 1.54, + "learning_rate": 1.0048976507594866e-06, + "loss": 0.6123, + "step": 60103 + }, + { + "epoch": 1.54, + "learning_rate": 1.004869980635586e-06, + "loss": 0.6499, + "step": 60104 + }, + { + "epoch": 1.54, + "learning_rate": 1.0048423105079566e-06, + "loss": 0.6709, + "step": 60105 + }, + { + "epoch": 1.54, + "learning_rate": 1.00481464037662e-06, + "loss": 0.5034, + "step": 60106 + }, + { + "epoch": 1.54, + "learning_rate": 1.0047869702415967e-06, + "loss": 0.665, + "step": 60107 + }, + { + "epoch": 1.54, + "learning_rate": 1.0047593001029084e-06, + "loss": 0.6699, + "step": 60108 + }, + { + "epoch": 1.54, + "learning_rate": 1.0047316299605762e-06, + "loss": 0.7256, + "step": 60109 + }, + { + "epoch": 1.54, + "learning_rate": 1.0047039598146212e-06, + "loss": 0.7793, + "step": 60110 + }, + { + "epoch": 1.54, + "learning_rate": 1.0046762896650642e-06, + "loss": 0.79, + "step": 60111 + }, + { + "epoch": 1.54, + "learning_rate": 1.0046486195119272e-06, + "loss": 0.5295, + "step": 60112 + }, + { + "epoch": 1.54, + "learning_rate": 1.004620949355231e-06, + "loss": 0.6631, + "step": 60113 + }, + { + "epoch": 1.54, + "learning_rate": 1.0045932791949967e-06, + "loss": 0.6162, + "step": 60114 + }, + { + "epoch": 1.54, + "learning_rate": 1.0045656090312453e-06, + "loss": 0.6543, + "step": 60115 + }, + { + "epoch": 1.54, + "learning_rate": 1.0045379388639984e-06, + "loss": 0.7676, + "step": 60116 + }, + { + "epoch": 1.54, + "learning_rate": 1.0045102686932768e-06, + "loss": 0.4463, + "step": 60117 + }, + { + "epoch": 1.54, + "learning_rate": 1.004482598519102e-06, + "loss": 0.7959, + "step": 60118 + }, + { + "epoch": 1.54, + "learning_rate": 1.0044549283414954e-06, + "loss": 0.5361, + "step": 60119 + }, + { + "epoch": 1.54, + "learning_rate": 1.0044272581604779e-06, + "loss": 0.7056, + "step": 60120 + }, + { + "epoch": 1.54, + "learning_rate": 1.0043995879760701e-06, + "loss": 0.4377, + "step": 60121 + }, + { + "epoch": 1.54, + "learning_rate": 1.004371917788294e-06, + "loss": 0.5593, + "step": 60122 + }, + { + "epoch": 1.54, + "learning_rate": 1.0043442475971705e-06, + "loss": 0.7285, + "step": 60123 + }, + { + "epoch": 1.54, + "learning_rate": 1.0043165774027207e-06, + "loss": 0.5244, + "step": 60124 + }, + { + "epoch": 1.54, + "learning_rate": 1.0042889072049663e-06, + "loss": 0.5249, + "step": 60125 + }, + { + "epoch": 1.54, + "learning_rate": 1.0042612370039276e-06, + "loss": 0.5913, + "step": 60126 + }, + { + "epoch": 1.54, + "learning_rate": 1.0042335667996265e-06, + "loss": 0.5762, + "step": 60127 + }, + { + "epoch": 1.54, + "learning_rate": 1.0042058965920841e-06, + "loss": 0.5957, + "step": 60128 + }, + { + "epoch": 1.54, + "learning_rate": 1.0041782263813212e-06, + "loss": 0.7148, + "step": 60129 + }, + { + "epoch": 1.54, + "learning_rate": 1.0041505561673592e-06, + "loss": 0.6528, + "step": 60130 + }, + { + "epoch": 1.54, + "learning_rate": 1.0041228859502195e-06, + "loss": 0.5476, + "step": 60131 + }, + { + "epoch": 1.54, + "learning_rate": 1.0040952157299228e-06, + "loss": 0.6299, + "step": 60132 + }, + { + "epoch": 1.54, + "learning_rate": 1.0040675455064911e-06, + "loss": 0.5935, + "step": 60133 + }, + { + "epoch": 1.54, + "learning_rate": 1.0040398752799446e-06, + "loss": 0.5527, + "step": 60134 + }, + { + "epoch": 1.54, + "learning_rate": 1.0040122050503052e-06, + "loss": 0.5742, + "step": 60135 + }, + { + "epoch": 1.54, + "learning_rate": 1.0039845348175935e-06, + "loss": 0.4805, + "step": 60136 + }, + { + "epoch": 1.54, + "learning_rate": 1.0039568645818314e-06, + "loss": 0.52, + "step": 60137 + }, + { + "epoch": 1.54, + "learning_rate": 1.0039291943430397e-06, + "loss": 0.71, + "step": 60138 + }, + { + "epoch": 1.54, + "learning_rate": 1.0039015241012396e-06, + "loss": 0.5337, + "step": 60139 + }, + { + "epoch": 1.54, + "learning_rate": 1.003873853856452e-06, + "loss": 0.7881, + "step": 60140 + }, + { + "epoch": 1.54, + "learning_rate": 1.0038461836086984e-06, + "loss": 0.7461, + "step": 60141 + }, + { + "epoch": 1.54, + "learning_rate": 1.0038185133580001e-06, + "loss": 0.6104, + "step": 60142 + }, + { + "epoch": 1.54, + "learning_rate": 1.0037908431043781e-06, + "loss": 0.6396, + "step": 60143 + }, + { + "epoch": 1.54, + "learning_rate": 1.0037631728478538e-06, + "loss": 0.5122, + "step": 60144 + }, + { + "epoch": 1.54, + "learning_rate": 1.0037355025884482e-06, + "loss": 0.7124, + "step": 60145 + }, + { + "epoch": 1.54, + "learning_rate": 1.003707832326182e-06, + "loss": 0.5923, + "step": 60146 + }, + { + "epoch": 1.54, + "learning_rate": 1.0036801620610775e-06, + "loss": 0.6245, + "step": 60147 + }, + { + "epoch": 1.54, + "learning_rate": 1.003652491793155e-06, + "loss": 0.6582, + "step": 60148 + }, + { + "epoch": 1.54, + "learning_rate": 1.003624821522436e-06, + "loss": 0.707, + "step": 60149 + }, + { + "epoch": 1.54, + "learning_rate": 1.0035971512489414e-06, + "loss": 0.6826, + "step": 60150 + }, + { + "epoch": 1.54, + "learning_rate": 1.0035694809726927e-06, + "loss": 0.5928, + "step": 60151 + }, + { + "epoch": 1.54, + "learning_rate": 1.0035418106937111e-06, + "loss": 0.6904, + "step": 60152 + }, + { + "epoch": 1.54, + "learning_rate": 1.003514140412018e-06, + "loss": 0.6016, + "step": 60153 + }, + { + "epoch": 1.54, + "learning_rate": 1.003486470127634e-06, + "loss": 0.707, + "step": 60154 + }, + { + "epoch": 1.54, + "learning_rate": 1.0034587998405806e-06, + "loss": 0.7017, + "step": 60155 + }, + { + "epoch": 1.54, + "learning_rate": 1.003431129550879e-06, + "loss": 0.4719, + "step": 60156 + }, + { + "epoch": 1.54, + "learning_rate": 1.00340345925855e-06, + "loss": 0.6016, + "step": 60157 + }, + { + "epoch": 1.54, + "learning_rate": 1.0033757889636159e-06, + "loss": 0.6406, + "step": 60158 + }, + { + "epoch": 1.54, + "learning_rate": 1.0033481186660964e-06, + "loss": 0.5723, + "step": 60159 + }, + { + "epoch": 1.54, + "learning_rate": 1.0033204483660138e-06, + "loss": 0.7852, + "step": 60160 + }, + { + "epoch": 1.54, + "learning_rate": 1.0032927780633884e-06, + "loss": 0.7988, + "step": 60161 + }, + { + "epoch": 1.54, + "learning_rate": 1.0032651077582424e-06, + "loss": 0.5034, + "step": 60162 + }, + { + "epoch": 1.54, + "learning_rate": 1.0032374374505963e-06, + "loss": 0.5688, + "step": 60163 + }, + { + "epoch": 1.54, + "learning_rate": 1.0032097671404713e-06, + "loss": 0.5439, + "step": 60164 + }, + { + "epoch": 1.54, + "learning_rate": 1.0031820968278888e-06, + "loss": 0.6143, + "step": 60165 + }, + { + "epoch": 1.54, + "learning_rate": 1.00315442651287e-06, + "loss": 0.668, + "step": 60166 + }, + { + "epoch": 1.54, + "learning_rate": 1.0031267561954357e-06, + "loss": 0.7832, + "step": 60167 + }, + { + "epoch": 1.54, + "learning_rate": 1.003099085875608e-06, + "loss": 0.7334, + "step": 60168 + }, + { + "epoch": 1.54, + "learning_rate": 1.003071415553407e-06, + "loss": 0.8301, + "step": 60169 + }, + { + "epoch": 1.54, + "learning_rate": 1.0030437452288543e-06, + "loss": 0.6785, + "step": 60170 + }, + { + "epoch": 1.54, + "learning_rate": 1.0030160749019713e-06, + "loss": 0.5601, + "step": 60171 + }, + { + "epoch": 1.54, + "learning_rate": 1.002988404572779e-06, + "loss": 0.5518, + "step": 60172 + }, + { + "epoch": 1.54, + "learning_rate": 1.002960734241299e-06, + "loss": 0.6606, + "step": 60173 + }, + { + "epoch": 1.54, + "learning_rate": 1.0029330639075515e-06, + "loss": 0.7402, + "step": 60174 + }, + { + "epoch": 1.54, + "learning_rate": 1.0029053935715585e-06, + "loss": 0.6836, + "step": 60175 + }, + { + "epoch": 1.54, + "learning_rate": 1.002877723233341e-06, + "loss": 0.4028, + "step": 60176 + }, + { + "epoch": 1.54, + "learning_rate": 1.0028500528929201e-06, + "loss": 0.8057, + "step": 60177 + }, + { + "epoch": 1.54, + "learning_rate": 1.0028223825503173e-06, + "loss": 0.8066, + "step": 60178 + }, + { + "epoch": 1.54, + "learning_rate": 1.0027947122055533e-06, + "loss": 0.6768, + "step": 60179 + }, + { + "epoch": 1.54, + "learning_rate": 1.0027670418586493e-06, + "loss": 0.6699, + "step": 60180 + }, + { + "epoch": 1.54, + "learning_rate": 1.0027393715096273e-06, + "loss": 0.707, + "step": 60181 + }, + { + "epoch": 1.54, + "learning_rate": 1.0027117011585073e-06, + "loss": 0.625, + "step": 60182 + }, + { + "epoch": 1.54, + "learning_rate": 1.0026840308053115e-06, + "loss": 0.5796, + "step": 60183 + }, + { + "epoch": 1.54, + "learning_rate": 1.0026563604500604e-06, + "loss": 0.6001, + "step": 60184 + }, + { + "epoch": 1.54, + "learning_rate": 1.0026286900927756e-06, + "loss": 0.5295, + "step": 60185 + }, + { + "epoch": 1.54, + "learning_rate": 1.002601019733478e-06, + "loss": 0.688, + "step": 60186 + }, + { + "epoch": 1.54, + "learning_rate": 1.0025733493721892e-06, + "loss": 0.6338, + "step": 60187 + }, + { + "epoch": 1.54, + "learning_rate": 1.0025456790089298e-06, + "loss": 0.8564, + "step": 60188 + }, + { + "epoch": 1.54, + "learning_rate": 1.0025180086437214e-06, + "loss": 0.5303, + "step": 60189 + }, + { + "epoch": 1.54, + "learning_rate": 1.002490338276585e-06, + "loss": 0.5442, + "step": 60190 + }, + { + "epoch": 1.54, + "learning_rate": 1.002462667907542e-06, + "loss": 0.5757, + "step": 60191 + }, + { + "epoch": 1.54, + "learning_rate": 1.002434997536613e-06, + "loss": 0.6729, + "step": 60192 + }, + { + "epoch": 1.54, + "learning_rate": 1.0024073271638203e-06, + "loss": 0.5165, + "step": 60193 + }, + { + "epoch": 1.54, + "learning_rate": 1.0023796567891842e-06, + "loss": 0.5688, + "step": 60194 + }, + { + "epoch": 1.54, + "learning_rate": 1.002351986412726e-06, + "loss": 0.6377, + "step": 60195 + }, + { + "epoch": 1.54, + "learning_rate": 1.002324316034467e-06, + "loss": 0.6899, + "step": 60196 + }, + { + "epoch": 1.54, + "learning_rate": 1.0022966456544282e-06, + "loss": 0.7656, + "step": 60197 + }, + { + "epoch": 1.54, + "learning_rate": 1.0022689752726315e-06, + "loss": 0.6777, + "step": 60198 + }, + { + "epoch": 1.54, + "learning_rate": 1.002241304889097e-06, + "loss": 0.5797, + "step": 60199 + }, + { + "epoch": 1.54, + "learning_rate": 1.0022136345038468e-06, + "loss": 0.5132, + "step": 60200 + }, + { + "epoch": 1.54, + "learning_rate": 1.0021859641169012e-06, + "loss": 0.5386, + "step": 60201 + }, + { + "epoch": 1.54, + "learning_rate": 1.0021582937282824e-06, + "loss": 0.6709, + "step": 60202 + }, + { + "epoch": 1.54, + "learning_rate": 1.0021306233380112e-06, + "loss": 0.5337, + "step": 60203 + }, + { + "epoch": 1.54, + "learning_rate": 1.0021029529461085e-06, + "loss": 0.51, + "step": 60204 + }, + { + "epoch": 1.54, + "learning_rate": 1.0020752825525956e-06, + "loss": 0.748, + "step": 60205 + }, + { + "epoch": 1.54, + "learning_rate": 1.0020476121574937e-06, + "loss": 0.5137, + "step": 60206 + }, + { + "epoch": 1.54, + "learning_rate": 1.002019941760824e-06, + "loss": 0.6523, + "step": 60207 + }, + { + "epoch": 1.54, + "learning_rate": 1.0019922713626082e-06, + "loss": 0.6201, + "step": 60208 + }, + { + "epoch": 1.54, + "learning_rate": 1.0019646009628664e-06, + "loss": 0.7549, + "step": 60209 + }, + { + "epoch": 1.54, + "learning_rate": 1.0019369305616208e-06, + "loss": 0.5972, + "step": 60210 + }, + { + "epoch": 1.54, + "learning_rate": 1.0019092601588918e-06, + "loss": 0.6206, + "step": 60211 + }, + { + "epoch": 1.54, + "learning_rate": 1.0018815897547012e-06, + "loss": 0.6193, + "step": 60212 + }, + { + "epoch": 1.54, + "learning_rate": 1.00185391934907e-06, + "loss": 0.6025, + "step": 60213 + }, + { + "epoch": 1.54, + "learning_rate": 1.001826248942019e-06, + "loss": 0.7393, + "step": 60214 + }, + { + "epoch": 1.54, + "learning_rate": 1.0017985785335702e-06, + "loss": 0.6816, + "step": 60215 + }, + { + "epoch": 1.54, + "learning_rate": 1.001770908123744e-06, + "loss": 0.7607, + "step": 60216 + }, + { + "epoch": 1.54, + "learning_rate": 1.0017432377125621e-06, + "loss": 0.5811, + "step": 60217 + }, + { + "epoch": 1.54, + "learning_rate": 1.0017155673000454e-06, + "loss": 0.5757, + "step": 60218 + }, + { + "epoch": 1.54, + "learning_rate": 1.0016878968862152e-06, + "loss": 0.5703, + "step": 60219 + }, + { + "epoch": 1.54, + "learning_rate": 1.0016602264710924e-06, + "loss": 0.604, + "step": 60220 + }, + { + "epoch": 1.54, + "learning_rate": 1.001632556054699e-06, + "loss": 0.459, + "step": 60221 + }, + { + "epoch": 1.54, + "learning_rate": 1.0016048856370549e-06, + "loss": 0.7949, + "step": 60222 + }, + { + "epoch": 1.54, + "learning_rate": 1.0015772152181827e-06, + "loss": 0.8184, + "step": 60223 + }, + { + "epoch": 1.54, + "learning_rate": 1.0015495447981026e-06, + "loss": 0.5781, + "step": 60224 + }, + { + "epoch": 1.54, + "learning_rate": 1.001521874376836e-06, + "loss": 0.7134, + "step": 60225 + }, + { + "epoch": 1.54, + "learning_rate": 1.0014942039544042e-06, + "loss": 0.6992, + "step": 60226 + }, + { + "epoch": 1.54, + "learning_rate": 1.0014665335308285e-06, + "loss": 0.873, + "step": 60227 + }, + { + "epoch": 1.54, + "learning_rate": 1.00143886310613e-06, + "loss": 0.8086, + "step": 60228 + }, + { + "epoch": 1.54, + "learning_rate": 1.0014111926803297e-06, + "loss": 0.6494, + "step": 60229 + }, + { + "epoch": 1.54, + "learning_rate": 1.0013835222534488e-06, + "loss": 0.7881, + "step": 60230 + }, + { + "epoch": 1.54, + "learning_rate": 1.0013558518255087e-06, + "loss": 0.7275, + "step": 60231 + }, + { + "epoch": 1.54, + "learning_rate": 1.0013281813965303e-06, + "loss": 0.6042, + "step": 60232 + }, + { + "epoch": 1.54, + "learning_rate": 1.0013005109665353e-06, + "loss": 0.6392, + "step": 60233 + }, + { + "epoch": 1.54, + "learning_rate": 1.0012728405355444e-06, + "loss": 0.6592, + "step": 60234 + }, + { + "epoch": 1.54, + "learning_rate": 1.0012451701035792e-06, + "loss": 0.6455, + "step": 60235 + }, + { + "epoch": 1.54, + "learning_rate": 1.0012174996706602e-06, + "loss": 0.6794, + "step": 60236 + }, + { + "epoch": 1.54, + "learning_rate": 1.0011898292368093e-06, + "loss": 0.7324, + "step": 60237 + }, + { + "epoch": 1.54, + "learning_rate": 1.0011621588020474e-06, + "loss": 0.4565, + "step": 60238 + }, + { + "epoch": 1.54, + "learning_rate": 1.0011344883663953e-06, + "loss": 0.5864, + "step": 60239 + }, + { + "epoch": 1.54, + "learning_rate": 1.001106817929875e-06, + "loss": 0.5425, + "step": 60240 + }, + { + "epoch": 1.54, + "learning_rate": 1.001079147492507e-06, + "loss": 0.7979, + "step": 60241 + }, + { + "epoch": 1.54, + "learning_rate": 1.001051477054313e-06, + "loss": 0.7158, + "step": 60242 + }, + { + "epoch": 1.54, + "learning_rate": 1.0010238066153137e-06, + "loss": 0.9268, + "step": 60243 + }, + { + "epoch": 1.54, + "learning_rate": 1.0009961361755308e-06, + "loss": 0.7725, + "step": 60244 + }, + { + "epoch": 1.54, + "learning_rate": 1.0009684657349848e-06, + "loss": 0.627, + "step": 60245 + }, + { + "epoch": 1.54, + "learning_rate": 1.0009407952936978e-06, + "loss": 0.5664, + "step": 60246 + }, + { + "epoch": 1.54, + "learning_rate": 1.00091312485169e-06, + "loss": 0.6504, + "step": 60247 + }, + { + "epoch": 1.54, + "learning_rate": 1.0008854544089835e-06, + "loss": 0.5271, + "step": 60248 + }, + { + "epoch": 1.54, + "learning_rate": 1.0008577839655988e-06, + "loss": 0.6689, + "step": 60249 + }, + { + "epoch": 1.54, + "learning_rate": 1.0008301135215572e-06, + "loss": 0.5752, + "step": 60250 + }, + { + "epoch": 1.54, + "learning_rate": 1.00080244307688e-06, + "loss": 0.7422, + "step": 60251 + }, + { + "epoch": 1.54, + "learning_rate": 1.0007747726315886e-06, + "loss": 0.5908, + "step": 60252 + }, + { + "epoch": 1.54, + "learning_rate": 1.0007471021857041e-06, + "loss": 0.6245, + "step": 60253 + }, + { + "epoch": 1.54, + "learning_rate": 1.0007194317392475e-06, + "loss": 0.5303, + "step": 60254 + }, + { + "epoch": 1.54, + "learning_rate": 1.0006917612922398e-06, + "loss": 0.4619, + "step": 60255 + }, + { + "epoch": 1.54, + "learning_rate": 1.0006640908447027e-06, + "loss": 0.4778, + "step": 60256 + }, + { + "epoch": 1.54, + "learning_rate": 1.000636420396657e-06, + "loss": 0.6582, + "step": 60257 + }, + { + "epoch": 1.54, + "learning_rate": 1.0006087499481243e-06, + "loss": 0.7783, + "step": 60258 + }, + { + "epoch": 1.54, + "learning_rate": 1.0005810794991255e-06, + "loss": 0.5913, + "step": 60259 + }, + { + "epoch": 1.54, + "learning_rate": 1.0005534090496815e-06, + "loss": 0.7363, + "step": 60260 + }, + { + "epoch": 1.54, + "learning_rate": 1.0005257385998139e-06, + "loss": 0.626, + "step": 60261 + }, + { + "epoch": 1.54, + "learning_rate": 1.0004980681495436e-06, + "loss": 0.5239, + "step": 60262 + }, + { + "epoch": 1.54, + "learning_rate": 1.0004703976988925e-06, + "loss": 0.4545, + "step": 60263 + }, + { + "epoch": 1.54, + "learning_rate": 1.0004427272478807e-06, + "loss": 0.7773, + "step": 60264 + }, + { + "epoch": 1.54, + "learning_rate": 1.0004150567965298e-06, + "loss": 0.7275, + "step": 60265 + }, + { + "epoch": 1.54, + "learning_rate": 1.0003873863448616e-06, + "loss": 0.9746, + "step": 60266 + }, + { + "epoch": 1.54, + "learning_rate": 1.0003597158928965e-06, + "loss": 0.5538, + "step": 60267 + }, + { + "epoch": 1.54, + "learning_rate": 1.000332045440656e-06, + "loss": 0.6333, + "step": 60268 + }, + { + "epoch": 1.54, + "learning_rate": 1.0003043749881615e-06, + "loss": 0.5977, + "step": 60269 + }, + { + "epoch": 1.54, + "learning_rate": 1.0002767045354336e-06, + "loss": 0.4883, + "step": 60270 + }, + { + "epoch": 1.54, + "learning_rate": 1.0002490340824942e-06, + "loss": 0.5415, + "step": 60271 + }, + { + "epoch": 1.54, + "learning_rate": 1.0002213636293638e-06, + "loss": 0.6055, + "step": 60272 + }, + { + "epoch": 1.54, + "learning_rate": 1.0001936931760643e-06, + "loss": 0.8164, + "step": 60273 + }, + { + "epoch": 1.54, + "learning_rate": 1.000166022722616e-06, + "loss": 0.7295, + "step": 60274 + }, + { + "epoch": 1.54, + "learning_rate": 1.0001383522690411e-06, + "loss": 0.575, + "step": 60275 + }, + { + "epoch": 1.54, + "learning_rate": 1.00011068181536e-06, + "loss": 0.749, + "step": 60276 + }, + { + "epoch": 1.54, + "learning_rate": 1.0000830113615942e-06, + "loss": 0.4927, + "step": 60277 + }, + { + "epoch": 1.54, + "learning_rate": 1.0000553409077647e-06, + "loss": 0.5247, + "step": 60278 + }, + { + "epoch": 1.54, + "learning_rate": 1.0000276704538927e-06, + "loss": 0.7324, + "step": 60279 + }, + { + "epoch": 1.55, + "learning_rate": 1e-06, + "loss": 0.7705, + "step": 60280 + }, + { + "epoch": 1.55, + "learning_rate": 9.999723295461072e-07, + "loss": 0.7637, + "step": 60281 + }, + { + "epoch": 1.55, + "learning_rate": 9.999446590922352e-07, + "loss": 0.7344, + "step": 60282 + }, + { + "epoch": 1.55, + "learning_rate": 9.99916988638406e-07, + "loss": 0.7314, + "step": 60283 + }, + { + "epoch": 1.55, + "learning_rate": 9.9988931818464e-07, + "loss": 0.4971, + "step": 60284 + }, + { + "epoch": 1.55, + "learning_rate": 9.998616477309592e-07, + "loss": 0.668, + "step": 60285 + }, + { + "epoch": 1.55, + "learning_rate": 9.99833977277384e-07, + "loss": 0.6865, + "step": 60286 + }, + { + "epoch": 1.55, + "learning_rate": 9.998063068239358e-07, + "loss": 0.5713, + "step": 60287 + }, + { + "epoch": 1.55, + "learning_rate": 9.997786363706362e-07, + "loss": 0.5596, + "step": 60288 + }, + { + "epoch": 1.55, + "learning_rate": 9.99750965917506e-07, + "loss": 0.6802, + "step": 60289 + }, + { + "epoch": 1.55, + "learning_rate": 9.997232954645663e-07, + "loss": 0.6846, + "step": 60290 + }, + { + "epoch": 1.55, + "learning_rate": 9.996956250118384e-07, + "loss": 0.7295, + "step": 60291 + }, + { + "epoch": 1.55, + "learning_rate": 9.996679545593439e-07, + "loss": 0.6768, + "step": 60292 + }, + { + "epoch": 1.55, + "learning_rate": 9.996402841071032e-07, + "loss": 0.5918, + "step": 60293 + }, + { + "epoch": 1.55, + "learning_rate": 9.996126136551383e-07, + "loss": 0.8623, + "step": 60294 + }, + { + "epoch": 1.55, + "learning_rate": 9.995849432034703e-07, + "loss": 0.7861, + "step": 60295 + }, + { + "epoch": 1.55, + "learning_rate": 9.995572727521195e-07, + "loss": 0.6943, + "step": 60296 + }, + { + "epoch": 1.55, + "learning_rate": 9.995296023011079e-07, + "loss": 0.4783, + "step": 60297 + }, + { + "epoch": 1.55, + "learning_rate": 9.995019318504565e-07, + "loss": 0.5502, + "step": 60298 + }, + { + "epoch": 1.55, + "learning_rate": 9.994742614001863e-07, + "loss": 0.6118, + "step": 60299 + }, + { + "epoch": 1.55, + "learning_rate": 9.994465909503186e-07, + "loss": 0.7256, + "step": 60300 + }, + { + "epoch": 1.55, + "learning_rate": 9.994189205008747e-07, + "loss": 0.6523, + "step": 60301 + }, + { + "epoch": 1.55, + "learning_rate": 9.993912500518758e-07, + "loss": 0.7832, + "step": 60302 + }, + { + "epoch": 1.55, + "learning_rate": 9.993635796033427e-07, + "loss": 0.5573, + "step": 60303 + }, + { + "epoch": 1.55, + "learning_rate": 9.993359091552972e-07, + "loss": 0.4624, + "step": 60304 + }, + { + "epoch": 1.55, + "learning_rate": 9.993082387077603e-07, + "loss": 0.7188, + "step": 60305 + }, + { + "epoch": 1.55, + "learning_rate": 9.992805682607527e-07, + "loss": 0.7246, + "step": 60306 + }, + { + "epoch": 1.55, + "learning_rate": 9.992528978142962e-07, + "loss": 0.6367, + "step": 60307 + }, + { + "epoch": 1.55, + "learning_rate": 9.992252273684113e-07, + "loss": 0.6646, + "step": 60308 + }, + { + "epoch": 1.55, + "learning_rate": 9.9919755692312e-07, + "loss": 0.7266, + "step": 60309 + }, + { + "epoch": 1.55, + "learning_rate": 9.991698864784429e-07, + "loss": 0.5603, + "step": 60310 + }, + { + "epoch": 1.55, + "learning_rate": 9.991422160344013e-07, + "loss": 0.5034, + "step": 60311 + }, + { + "epoch": 1.55, + "learning_rate": 9.991145455910164e-07, + "loss": 0.563, + "step": 60312 + }, + { + "epoch": 1.55, + "learning_rate": 9.9908687514831e-07, + "loss": 0.749, + "step": 60313 + }, + { + "epoch": 1.55, + "learning_rate": 9.990592047063022e-07, + "loss": 0.8057, + "step": 60314 + }, + { + "epoch": 1.55, + "learning_rate": 9.990315342650154e-07, + "loss": 0.6445, + "step": 60315 + }, + { + "epoch": 1.55, + "learning_rate": 9.990038638244695e-07, + "loss": 0.5535, + "step": 60316 + }, + { + "epoch": 1.55, + "learning_rate": 9.989761933846864e-07, + "loss": 0.8467, + "step": 60317 + }, + { + "epoch": 1.55, + "learning_rate": 9.98948522945687e-07, + "loss": 0.6509, + "step": 60318 + }, + { + "epoch": 1.55, + "learning_rate": 9.98920852507493e-07, + "loss": 0.5624, + "step": 60319 + }, + { + "epoch": 1.55, + "learning_rate": 9.988931820701251e-07, + "loss": 0.6631, + "step": 60320 + }, + { + "epoch": 1.55, + "learning_rate": 9.988655116336046e-07, + "loss": 0.5481, + "step": 60321 + }, + { + "epoch": 1.55, + "learning_rate": 9.988378411979527e-07, + "loss": 0.5747, + "step": 60322 + }, + { + "epoch": 1.55, + "learning_rate": 9.988101707631908e-07, + "loss": 0.7188, + "step": 60323 + }, + { + "epoch": 1.55, + "learning_rate": 9.987825003293397e-07, + "loss": 0.7695, + "step": 60324 + }, + { + "epoch": 1.55, + "learning_rate": 9.987548298964211e-07, + "loss": 0.7036, + "step": 60325 + }, + { + "epoch": 1.55, + "learning_rate": 9.98727159464456e-07, + "loss": 0.6816, + "step": 60326 + }, + { + "epoch": 1.55, + "learning_rate": 9.986994890334648e-07, + "loss": 0.6533, + "step": 60327 + }, + { + "epoch": 1.55, + "learning_rate": 9.986718186034698e-07, + "loss": 0.7344, + "step": 60328 + }, + { + "epoch": 1.55, + "learning_rate": 9.986441481744912e-07, + "loss": 0.4391, + "step": 60329 + }, + { + "epoch": 1.55, + "learning_rate": 9.986164777465513e-07, + "loss": 0.5654, + "step": 60330 + }, + { + "epoch": 1.55, + "learning_rate": 9.985888073196702e-07, + "loss": 0.8242, + "step": 60331 + }, + { + "epoch": 1.55, + "learning_rate": 9.985611368938702e-07, + "loss": 0.577, + "step": 60332 + }, + { + "epoch": 1.55, + "learning_rate": 9.985334664691712e-07, + "loss": 0.5747, + "step": 60333 + }, + { + "epoch": 1.55, + "learning_rate": 9.985057960455957e-07, + "loss": 0.7734, + "step": 60334 + }, + { + "epoch": 1.55, + "learning_rate": 9.98478125623164e-07, + "loss": 0.7012, + "step": 60335 + }, + { + "epoch": 1.55, + "learning_rate": 9.984504552018977e-07, + "loss": 0.6101, + "step": 60336 + }, + { + "epoch": 1.55, + "learning_rate": 9.984227847818174e-07, + "loss": 0.7617, + "step": 60337 + }, + { + "epoch": 1.55, + "learning_rate": 9.98395114362945e-07, + "loss": 0.4521, + "step": 60338 + }, + { + "epoch": 1.55, + "learning_rate": 9.98367443945301e-07, + "loss": 0.7695, + "step": 60339 + }, + { + "epoch": 1.55, + "learning_rate": 9.983397735289075e-07, + "loss": 0.6626, + "step": 60340 + }, + { + "epoch": 1.55, + "learning_rate": 9.983121031137847e-07, + "loss": 0.585, + "step": 60341 + }, + { + "epoch": 1.55, + "learning_rate": 9.982844326999545e-07, + "loss": 0.6816, + "step": 60342 + }, + { + "epoch": 1.55, + "learning_rate": 9.982567622874378e-07, + "loss": 0.8237, + "step": 60343 + }, + { + "epoch": 1.55, + "learning_rate": 9.982290918762558e-07, + "loss": 0.7266, + "step": 60344 + }, + { + "epoch": 1.55, + "learning_rate": 9.982014214664301e-07, + "loss": 0.8037, + "step": 60345 + }, + { + "epoch": 1.55, + "learning_rate": 9.981737510579809e-07, + "loss": 0.707, + "step": 60346 + }, + { + "epoch": 1.55, + "learning_rate": 9.9814608065093e-07, + "loss": 0.6455, + "step": 60347 + }, + { + "epoch": 1.55, + "learning_rate": 9.98118410245299e-07, + "loss": 0.7744, + "step": 60348 + }, + { + "epoch": 1.55, + "learning_rate": 9.980907398411082e-07, + "loss": 0.7402, + "step": 60349 + }, + { + "epoch": 1.55, + "learning_rate": 9.980630694383794e-07, + "loss": 0.5732, + "step": 60350 + }, + { + "epoch": 1.55, + "learning_rate": 9.980353990371337e-07, + "loss": 0.8701, + "step": 60351 + }, + { + "epoch": 1.55, + "learning_rate": 9.98007728637392e-07, + "loss": 0.6528, + "step": 60352 + }, + { + "epoch": 1.55, + "learning_rate": 9.97980058239176e-07, + "loss": 0.6377, + "step": 60353 + }, + { + "epoch": 1.55, + "learning_rate": 9.979523878425064e-07, + "loss": 0.7041, + "step": 60354 + }, + { + "epoch": 1.55, + "learning_rate": 9.97924717447405e-07, + "loss": 0.6797, + "step": 60355 + }, + { + "epoch": 1.55, + "learning_rate": 9.978970470538918e-07, + "loss": 0.6431, + "step": 60356 + }, + { + "epoch": 1.55, + "learning_rate": 9.978693766619892e-07, + "loss": 0.5562, + "step": 60357 + }, + { + "epoch": 1.55, + "learning_rate": 9.978417062717175e-07, + "loss": 0.7607, + "step": 60358 + }, + { + "epoch": 1.55, + "learning_rate": 9.978140358830987e-07, + "loss": 0.6108, + "step": 60359 + }, + { + "epoch": 1.55, + "learning_rate": 9.977863654961533e-07, + "loss": 0.6836, + "step": 60360 + }, + { + "epoch": 1.55, + "learning_rate": 9.97758695110903e-07, + "loss": 0.6821, + "step": 60361 + }, + { + "epoch": 1.55, + "learning_rate": 9.977310247273687e-07, + "loss": 0.6553, + "step": 60362 + }, + { + "epoch": 1.55, + "learning_rate": 9.977033543455715e-07, + "loss": 0.7334, + "step": 60363 + }, + { + "epoch": 1.55, + "learning_rate": 9.976756839655328e-07, + "loss": 0.5081, + "step": 60364 + }, + { + "epoch": 1.55, + "learning_rate": 9.976480135872742e-07, + "loss": 0.5137, + "step": 60365 + }, + { + "epoch": 1.55, + "learning_rate": 9.976203432108161e-07, + "loss": 0.707, + "step": 60366 + }, + { + "epoch": 1.55, + "learning_rate": 9.975926728361798e-07, + "loss": 0.7207, + "step": 60367 + }, + { + "epoch": 1.55, + "learning_rate": 9.975650024633868e-07, + "loss": 0.5654, + "step": 60368 + }, + { + "epoch": 1.55, + "learning_rate": 9.97537332092458e-07, + "loss": 0.6362, + "step": 60369 + }, + { + "epoch": 1.55, + "learning_rate": 9.97509661723415e-07, + "loss": 0.4802, + "step": 60370 + }, + { + "epoch": 1.55, + "learning_rate": 9.974819913562788e-07, + "loss": 0.583, + "step": 60371 + }, + { + "epoch": 1.55, + "learning_rate": 9.974543209910701e-07, + "loss": 0.6748, + "step": 60372 + }, + { + "epoch": 1.55, + "learning_rate": 9.97426650627811e-07, + "loss": 0.7305, + "step": 60373 + }, + { + "epoch": 1.55, + "learning_rate": 9.973989802665218e-07, + "loss": 0.6777, + "step": 60374 + }, + { + "epoch": 1.55, + "learning_rate": 9.973713099072246e-07, + "loss": 0.5249, + "step": 60375 + }, + { + "epoch": 1.55, + "learning_rate": 9.9734363954994e-07, + "loss": 0.5957, + "step": 60376 + }, + { + "epoch": 1.55, + "learning_rate": 9.973159691946886e-07, + "loss": 0.791, + "step": 60377 + }, + { + "epoch": 1.55, + "learning_rate": 9.972882988414928e-07, + "loss": 0.6313, + "step": 60378 + }, + { + "epoch": 1.55, + "learning_rate": 9.972606284903729e-07, + "loss": 0.7393, + "step": 60379 + }, + { + "epoch": 1.55, + "learning_rate": 9.972329581413506e-07, + "loss": 0.6211, + "step": 60380 + }, + { + "epoch": 1.55, + "learning_rate": 9.972052877944468e-07, + "loss": 0.708, + "step": 60381 + }, + { + "epoch": 1.55, + "learning_rate": 9.971776174496828e-07, + "loss": 0.7686, + "step": 60382 + }, + { + "epoch": 1.55, + "learning_rate": 9.971499471070798e-07, + "loss": 0.6772, + "step": 60383 + }, + { + "epoch": 1.55, + "learning_rate": 9.97122276766659e-07, + "loss": 0.5923, + "step": 60384 + }, + { + "epoch": 1.55, + "learning_rate": 9.970946064284416e-07, + "loss": 0.8496, + "step": 60385 + }, + { + "epoch": 1.55, + "learning_rate": 9.970669360924486e-07, + "loss": 0.5586, + "step": 60386 + }, + { + "epoch": 1.55, + "learning_rate": 9.970392657587014e-07, + "loss": 0.5947, + "step": 60387 + }, + { + "epoch": 1.55, + "learning_rate": 9.970115954272212e-07, + "loss": 0.6265, + "step": 60388 + }, + { + "epoch": 1.55, + "learning_rate": 9.969839250980288e-07, + "loss": 0.749, + "step": 60389 + }, + { + "epoch": 1.55, + "learning_rate": 9.969562547711459e-07, + "loss": 0.5977, + "step": 60390 + }, + { + "epoch": 1.55, + "learning_rate": 9.969285844465931e-07, + "loss": 0.7051, + "step": 60391 + }, + { + "epoch": 1.55, + "learning_rate": 9.969009141243922e-07, + "loss": 0.7051, + "step": 60392 + }, + { + "epoch": 1.55, + "learning_rate": 9.968732438045642e-07, + "loss": 0.6692, + "step": 60393 + }, + { + "epoch": 1.55, + "learning_rate": 9.9684557348713e-07, + "loss": 0.2661, + "step": 60394 + }, + { + "epoch": 1.55, + "learning_rate": 9.968179031721116e-07, + "loss": 0.6196, + "step": 60395 + }, + { + "epoch": 1.55, + "learning_rate": 9.967902328595289e-07, + "loss": 0.5874, + "step": 60396 + }, + { + "epoch": 1.55, + "learning_rate": 9.967625625494038e-07, + "loss": 0.6836, + "step": 60397 + }, + { + "epoch": 1.55, + "learning_rate": 9.967348922417577e-07, + "loss": 0.6621, + "step": 60398 + }, + { + "epoch": 1.55, + "learning_rate": 9.967072219366115e-07, + "loss": 0.5674, + "step": 60399 + }, + { + "epoch": 1.55, + "learning_rate": 9.966795516339863e-07, + "loss": 0.5516, + "step": 60400 + }, + { + "epoch": 1.55, + "learning_rate": 9.966518813339037e-07, + "loss": 0.6528, + "step": 60401 + }, + { + "epoch": 1.55, + "learning_rate": 9.966242110363843e-07, + "loss": 0.5772, + "step": 60402 + }, + { + "epoch": 1.55, + "learning_rate": 9.965965407414497e-07, + "loss": 0.6558, + "step": 60403 + }, + { + "epoch": 1.55, + "learning_rate": 9.965688704491209e-07, + "loss": 0.5571, + "step": 60404 + }, + { + "epoch": 1.55, + "learning_rate": 9.965412001594197e-07, + "loss": 0.6665, + "step": 60405 + }, + { + "epoch": 1.55, + "learning_rate": 9.965135298723662e-07, + "loss": 0.7598, + "step": 60406 + }, + { + "epoch": 1.55, + "learning_rate": 9.964858595879823e-07, + "loss": 0.6738, + "step": 60407 + }, + { + "epoch": 1.55, + "learning_rate": 9.964581893062888e-07, + "loss": 0.5864, + "step": 60408 + }, + { + "epoch": 1.55, + "learning_rate": 9.964305190273072e-07, + "loss": 0.613, + "step": 60409 + }, + { + "epoch": 1.55, + "learning_rate": 9.964028487510585e-07, + "loss": 0.6123, + "step": 60410 + }, + { + "epoch": 1.55, + "learning_rate": 9.963751784775642e-07, + "loss": 0.6865, + "step": 60411 + }, + { + "epoch": 1.55, + "learning_rate": 9.96347508206845e-07, + "loss": 0.5181, + "step": 60412 + }, + { + "epoch": 1.55, + "learning_rate": 9.963198379389226e-07, + "loss": 0.5457, + "step": 60413 + }, + { + "epoch": 1.55, + "learning_rate": 9.962921676738178e-07, + "loss": 0.5444, + "step": 60414 + }, + { + "epoch": 1.55, + "learning_rate": 9.96264497411552e-07, + "loss": 0.7949, + "step": 60415 + }, + { + "epoch": 1.55, + "learning_rate": 9.962368271521466e-07, + "loss": 0.7764, + "step": 60416 + }, + { + "epoch": 1.55, + "learning_rate": 9.96209156895622e-07, + "loss": 0.5508, + "step": 60417 + }, + { + "epoch": 1.55, + "learning_rate": 9.96181486642e-07, + "loss": 0.457, + "step": 60418 + }, + { + "epoch": 1.55, + "learning_rate": 9.961538163913015e-07, + "loss": 0.5962, + "step": 60419 + }, + { + "epoch": 1.55, + "learning_rate": 9.96126146143548e-07, + "loss": 0.8086, + "step": 60420 + }, + { + "epoch": 1.55, + "learning_rate": 9.960984758987606e-07, + "loss": 0.6675, + "step": 60421 + }, + { + "epoch": 1.55, + "learning_rate": 9.960708056569604e-07, + "loss": 0.7178, + "step": 60422 + }, + { + "epoch": 1.55, + "learning_rate": 9.960431354181685e-07, + "loss": 0.5913, + "step": 60423 + }, + { + "epoch": 1.55, + "learning_rate": 9.960154651824062e-07, + "loss": 0.6714, + "step": 60424 + }, + { + "epoch": 1.55, + "learning_rate": 9.95987794949695e-07, + "loss": 0.4756, + "step": 60425 + }, + { + "epoch": 1.55, + "learning_rate": 9.959601247200556e-07, + "loss": 0.6289, + "step": 60426 + }, + { + "epoch": 1.55, + "learning_rate": 9.959324544935092e-07, + "loss": 0.5896, + "step": 60427 + }, + { + "epoch": 1.55, + "learning_rate": 9.959047842700772e-07, + "loss": 0.5957, + "step": 60428 + }, + { + "epoch": 1.55, + "learning_rate": 9.958771140497806e-07, + "loss": 0.7588, + "step": 60429 + }, + { + "epoch": 1.55, + "learning_rate": 9.958494438326408e-07, + "loss": 0.542, + "step": 60430 + }, + { + "epoch": 1.55, + "learning_rate": 9.958217736186787e-07, + "loss": 0.7695, + "step": 60431 + }, + { + "epoch": 1.55, + "learning_rate": 9.95794103407916e-07, + "loss": 0.7061, + "step": 60432 + }, + { + "epoch": 1.55, + "learning_rate": 9.957664332003734e-07, + "loss": 0.6426, + "step": 60433 + }, + { + "epoch": 1.55, + "learning_rate": 9.957387629960723e-07, + "loss": 0.6865, + "step": 60434 + }, + { + "epoch": 1.55, + "learning_rate": 9.95711092795034e-07, + "loss": 0.6455, + "step": 60435 + }, + { + "epoch": 1.55, + "learning_rate": 9.956834225972792e-07, + "loss": 0.5928, + "step": 60436 + }, + { + "epoch": 1.55, + "learning_rate": 9.956557524028297e-07, + "loss": 0.4871, + "step": 60437 + }, + { + "epoch": 1.55, + "learning_rate": 9.95628082211706e-07, + "loss": 0.6592, + "step": 60438 + }, + { + "epoch": 1.55, + "learning_rate": 9.9560041202393e-07, + "loss": 0.6533, + "step": 60439 + }, + { + "epoch": 1.55, + "learning_rate": 9.955727418395223e-07, + "loss": 0.5703, + "step": 60440 + }, + { + "epoch": 1.55, + "learning_rate": 9.955450716585048e-07, + "loss": 0.6157, + "step": 60441 + }, + { + "epoch": 1.55, + "learning_rate": 9.955174014808976e-07, + "loss": 0.7144, + "step": 60442 + }, + { + "epoch": 1.55, + "learning_rate": 9.95489731306723e-07, + "loss": 0.5686, + "step": 60443 + }, + { + "epoch": 1.55, + "learning_rate": 9.954620611360017e-07, + "loss": 0.707, + "step": 60444 + }, + { + "epoch": 1.55, + "learning_rate": 9.95434390968755e-07, + "loss": 0.624, + "step": 60445 + }, + { + "epoch": 1.55, + "learning_rate": 9.954067208050034e-07, + "loss": 0.6235, + "step": 60446 + }, + { + "epoch": 1.55, + "learning_rate": 9.953790506447692e-07, + "loss": 0.7422, + "step": 60447 + }, + { + "epoch": 1.55, + "learning_rate": 9.953513804880727e-07, + "loss": 0.665, + "step": 60448 + }, + { + "epoch": 1.55, + "learning_rate": 9.953237103349357e-07, + "loss": 0.5537, + "step": 60449 + }, + { + "epoch": 1.55, + "learning_rate": 9.952960401853787e-07, + "loss": 0.7295, + "step": 60450 + }, + { + "epoch": 1.55, + "learning_rate": 9.95268370039424e-07, + "loss": 0.5166, + "step": 60451 + }, + { + "epoch": 1.55, + "learning_rate": 9.952406998970913e-07, + "loss": 0.6851, + "step": 60452 + }, + { + "epoch": 1.55, + "learning_rate": 9.952130297584032e-07, + "loss": 0.5947, + "step": 60453 + }, + { + "epoch": 1.55, + "learning_rate": 9.9518535962338e-07, + "loss": 0.564, + "step": 60454 + }, + { + "epoch": 1.55, + "learning_rate": 9.951576894920433e-07, + "loss": 0.7627, + "step": 60455 + }, + { + "epoch": 1.55, + "learning_rate": 9.95130019364414e-07, + "loss": 0.5652, + "step": 60456 + }, + { + "epoch": 1.55, + "learning_rate": 9.951023492405135e-07, + "loss": 0.625, + "step": 60457 + }, + { + "epoch": 1.55, + "learning_rate": 9.95074679120363e-07, + "loss": 0.7637, + "step": 60458 + }, + { + "epoch": 1.55, + "learning_rate": 9.950470090039831e-07, + "loss": 0.6499, + "step": 60459 + }, + { + "epoch": 1.55, + "learning_rate": 9.95019338891396e-07, + "loss": 0.6465, + "step": 60460 + }, + { + "epoch": 1.55, + "learning_rate": 9.949916687826223e-07, + "loss": 0.71, + "step": 60461 + }, + { + "epoch": 1.55, + "learning_rate": 9.94963998677683e-07, + "loss": 0.4968, + "step": 60462 + }, + { + "epoch": 1.55, + "learning_rate": 9.949363285765997e-07, + "loss": 0.4373, + "step": 60463 + }, + { + "epoch": 1.55, + "learning_rate": 9.949086584793932e-07, + "loss": 0.8281, + "step": 60464 + }, + { + "epoch": 1.55, + "learning_rate": 9.948809883860853e-07, + "loss": 0.7627, + "step": 60465 + }, + { + "epoch": 1.55, + "learning_rate": 9.948533182966966e-07, + "loss": 0.7373, + "step": 60466 + }, + { + "epoch": 1.55, + "learning_rate": 9.948256482112484e-07, + "loss": 0.6328, + "step": 60467 + }, + { + "epoch": 1.55, + "learning_rate": 9.947979781297621e-07, + "loss": 0.75, + "step": 60468 + }, + { + "epoch": 1.55, + "learning_rate": 9.947703080522586e-07, + "loss": 0.6865, + "step": 60469 + }, + { + "epoch": 1.55, + "learning_rate": 9.947426379787594e-07, + "loss": 0.8193, + "step": 60470 + }, + { + "epoch": 1.55, + "learning_rate": 9.947149679092852e-07, + "loss": 0.6113, + "step": 60471 + }, + { + "epoch": 1.55, + "learning_rate": 9.946872978438578e-07, + "loss": 0.7549, + "step": 60472 + }, + { + "epoch": 1.55, + "learning_rate": 9.94659627782498e-07, + "loss": 0.8779, + "step": 60473 + }, + { + "epoch": 1.55, + "learning_rate": 9.94631957725227e-07, + "loss": 0.7422, + "step": 60474 + }, + { + "epoch": 1.55, + "learning_rate": 9.946042876720666e-07, + "loss": 0.6152, + "step": 60475 + }, + { + "epoch": 1.55, + "learning_rate": 9.94576617623037e-07, + "loss": 0.7129, + "step": 60476 + }, + { + "epoch": 1.55, + "learning_rate": 9.945489475781599e-07, + "loss": 0.6533, + "step": 60477 + }, + { + "epoch": 1.55, + "learning_rate": 9.945212775374563e-07, + "loss": 0.6885, + "step": 60478 + }, + { + "epoch": 1.55, + "learning_rate": 9.944936075009475e-07, + "loss": 0.6963, + "step": 60479 + }, + { + "epoch": 1.55, + "learning_rate": 9.944659374686548e-07, + "loss": 0.7026, + "step": 60480 + }, + { + "epoch": 1.55, + "learning_rate": 9.944382674405992e-07, + "loss": 0.594, + "step": 60481 + }, + { + "epoch": 1.55, + "learning_rate": 9.94410597416802e-07, + "loss": 0.7402, + "step": 60482 + }, + { + "epoch": 1.55, + "learning_rate": 9.943829273972843e-07, + "loss": 0.6196, + "step": 60483 + }, + { + "epoch": 1.55, + "learning_rate": 9.943552573820673e-07, + "loss": 0.6318, + "step": 60484 + }, + { + "epoch": 1.55, + "learning_rate": 9.943275873711728e-07, + "loss": 0.7109, + "step": 60485 + }, + { + "epoch": 1.55, + "learning_rate": 9.942999173646208e-07, + "loss": 0.6011, + "step": 60486 + }, + { + "epoch": 1.55, + "learning_rate": 9.942722473624333e-07, + "loss": 0.8623, + "step": 60487 + }, + { + "epoch": 1.55, + "learning_rate": 9.94244577364631e-07, + "loss": 0.665, + "step": 60488 + }, + { + "epoch": 1.55, + "learning_rate": 9.942169073712355e-07, + "loss": 0.7461, + "step": 60489 + }, + { + "epoch": 1.55, + "learning_rate": 9.941892373822678e-07, + "loss": 0.6675, + "step": 60490 + }, + { + "epoch": 1.55, + "learning_rate": 9.941615673977493e-07, + "loss": 0.5985, + "step": 60491 + }, + { + "epoch": 1.55, + "learning_rate": 9.941338974177007e-07, + "loss": 0.6045, + "step": 60492 + }, + { + "epoch": 1.55, + "learning_rate": 9.94106227442144e-07, + "loss": 0.5308, + "step": 60493 + }, + { + "epoch": 1.55, + "learning_rate": 9.940785574710994e-07, + "loss": 0.8789, + "step": 60494 + }, + { + "epoch": 1.55, + "learning_rate": 9.940508875045891e-07, + "loss": 0.6953, + "step": 60495 + }, + { + "epoch": 1.55, + "learning_rate": 9.940232175426336e-07, + "loss": 0.6416, + "step": 60496 + }, + { + "epoch": 1.55, + "learning_rate": 9.939955475852542e-07, + "loss": 0.7256, + "step": 60497 + }, + { + "epoch": 1.55, + "learning_rate": 9.939678776324719e-07, + "loss": 0.6294, + "step": 60498 + }, + { + "epoch": 1.55, + "learning_rate": 9.939402076843084e-07, + "loss": 0.6426, + "step": 60499 + }, + { + "epoch": 1.55, + "learning_rate": 9.939125377407843e-07, + "loss": 0.6499, + "step": 60500 + }, + { + "epoch": 1.55, + "learning_rate": 9.938848678019214e-07, + "loss": 0.6782, + "step": 60501 + }, + { + "epoch": 1.55, + "learning_rate": 9.938571978677403e-07, + "loss": 0.7051, + "step": 60502 + }, + { + "epoch": 1.55, + "learning_rate": 9.938295279382626e-07, + "loss": 0.8506, + "step": 60503 + }, + { + "epoch": 1.55, + "learning_rate": 9.938018580135092e-07, + "loss": 0.7344, + "step": 60504 + }, + { + "epoch": 1.55, + "learning_rate": 9.93774188093502e-07, + "loss": 0.5771, + "step": 60505 + }, + { + "epoch": 1.55, + "learning_rate": 9.937465181782613e-07, + "loss": 0.5654, + "step": 60506 + }, + { + "epoch": 1.55, + "learning_rate": 9.937188482678082e-07, + "loss": 0.7588, + "step": 60507 + }, + { + "epoch": 1.55, + "learning_rate": 9.936911783621647e-07, + "loss": 0.6196, + "step": 60508 + }, + { + "epoch": 1.55, + "learning_rate": 9.936635084613514e-07, + "loss": 0.7002, + "step": 60509 + }, + { + "epoch": 1.55, + "learning_rate": 9.9363583856539e-07, + "loss": 0.5679, + "step": 60510 + }, + { + "epoch": 1.55, + "learning_rate": 9.936081686743008e-07, + "loss": 0.5186, + "step": 60511 + }, + { + "epoch": 1.55, + "learning_rate": 9.935804987881058e-07, + "loss": 0.7295, + "step": 60512 + }, + { + "epoch": 1.55, + "learning_rate": 9.93552828906826e-07, + "loss": 0.6396, + "step": 60513 + }, + { + "epoch": 1.55, + "learning_rate": 9.935251590304824e-07, + "loss": 0.6719, + "step": 60514 + }, + { + "epoch": 1.55, + "learning_rate": 9.934974891590965e-07, + "loss": 0.543, + "step": 60515 + }, + { + "epoch": 1.55, + "learning_rate": 9.934698192926893e-07, + "loss": 0.7559, + "step": 60516 + }, + { + "epoch": 1.55, + "learning_rate": 9.934421494312816e-07, + "loss": 0.707, + "step": 60517 + }, + { + "epoch": 1.55, + "learning_rate": 9.93414479574895e-07, + "loss": 0.5161, + "step": 60518 + }, + { + "epoch": 1.55, + "learning_rate": 9.933868097235508e-07, + "loss": 0.4829, + "step": 60519 + }, + { + "epoch": 1.55, + "learning_rate": 9.9335913987727e-07, + "loss": 0.4512, + "step": 60520 + }, + { + "epoch": 1.55, + "learning_rate": 9.933314700360735e-07, + "loss": 0.584, + "step": 60521 + }, + { + "epoch": 1.55, + "learning_rate": 9.93303800199983e-07, + "loss": 0.5981, + "step": 60522 + }, + { + "epoch": 1.55, + "learning_rate": 9.932761303690195e-07, + "loss": 0.7036, + "step": 60523 + }, + { + "epoch": 1.55, + "learning_rate": 9.932484605432042e-07, + "loss": 0.7188, + "step": 60524 + }, + { + "epoch": 1.55, + "learning_rate": 9.932207907225586e-07, + "loss": 0.5693, + "step": 60525 + }, + { + "epoch": 1.55, + "learning_rate": 9.93193120907103e-07, + "loss": 0.2461, + "step": 60526 + }, + { + "epoch": 1.55, + "learning_rate": 9.931654510968593e-07, + "loss": 0.7266, + "step": 60527 + }, + { + "epoch": 1.55, + "learning_rate": 9.931377812918484e-07, + "loss": 0.6611, + "step": 60528 + }, + { + "epoch": 1.55, + "learning_rate": 9.931101114920916e-07, + "loss": 0.6899, + "step": 60529 + }, + { + "epoch": 1.55, + "learning_rate": 9.9308244169761e-07, + "loss": 0.6895, + "step": 60530 + }, + { + "epoch": 1.55, + "learning_rate": 9.93054771908425e-07, + "loss": 0.7344, + "step": 60531 + }, + { + "epoch": 1.55, + "learning_rate": 9.930271021245574e-07, + "loss": 0.6841, + "step": 60532 + }, + { + "epoch": 1.55, + "learning_rate": 9.92999432346029e-07, + "loss": 0.752, + "step": 60533 + }, + { + "epoch": 1.55, + "learning_rate": 9.929717625728606e-07, + "loss": 0.6299, + "step": 60534 + }, + { + "epoch": 1.55, + "learning_rate": 9.929440928050734e-07, + "loss": 0.6357, + "step": 60535 + }, + { + "epoch": 1.55, + "learning_rate": 9.929164230426884e-07, + "loss": 0.6592, + "step": 60536 + }, + { + "epoch": 1.55, + "learning_rate": 9.928887532857269e-07, + "loss": 0.5347, + "step": 60537 + }, + { + "epoch": 1.55, + "learning_rate": 9.928610835342101e-07, + "loss": 0.7705, + "step": 60538 + }, + { + "epoch": 1.55, + "learning_rate": 9.928334137881595e-07, + "loss": 0.748, + "step": 60539 + }, + { + "epoch": 1.55, + "learning_rate": 9.92805744047596e-07, + "loss": 0.5693, + "step": 60540 + }, + { + "epoch": 1.55, + "learning_rate": 9.927780743125407e-07, + "loss": 0.4807, + "step": 60541 + }, + { + "epoch": 1.55, + "learning_rate": 9.927504045830148e-07, + "loss": 0.5027, + "step": 60542 + }, + { + "epoch": 1.55, + "learning_rate": 9.927227348590398e-07, + "loss": 0.6377, + "step": 60543 + }, + { + "epoch": 1.55, + "learning_rate": 9.926950651406363e-07, + "loss": 0.7129, + "step": 60544 + }, + { + "epoch": 1.55, + "learning_rate": 9.926673954278264e-07, + "loss": 0.7529, + "step": 60545 + }, + { + "epoch": 1.55, + "learning_rate": 9.926397257206307e-07, + "loss": 0.6045, + "step": 60546 + }, + { + "epoch": 1.55, + "learning_rate": 9.9261205601907e-07, + "loss": 0.6016, + "step": 60547 + }, + { + "epoch": 1.55, + "learning_rate": 9.92584386323166e-07, + "loss": 0.7617, + "step": 60548 + }, + { + "epoch": 1.55, + "learning_rate": 9.925567166329398e-07, + "loss": 0.6133, + "step": 60549 + }, + { + "epoch": 1.55, + "learning_rate": 9.925290469484128e-07, + "loss": 0.5754, + "step": 60550 + }, + { + "epoch": 1.55, + "learning_rate": 9.92501377269606e-07, + "loss": 0.6406, + "step": 60551 + }, + { + "epoch": 1.55, + "learning_rate": 9.924737075965402e-07, + "loss": 0.6665, + "step": 60552 + }, + { + "epoch": 1.55, + "learning_rate": 9.924460379292371e-07, + "loss": 0.7891, + "step": 60553 + }, + { + "epoch": 1.55, + "learning_rate": 9.924183682677176e-07, + "loss": 0.79, + "step": 60554 + }, + { + "epoch": 1.55, + "learning_rate": 9.923906986120035e-07, + "loss": 0.5815, + "step": 60555 + }, + { + "epoch": 1.55, + "learning_rate": 9.923630289621152e-07, + "loss": 0.6855, + "step": 60556 + }, + { + "epoch": 1.55, + "learning_rate": 9.92335359318074e-07, + "loss": 0.6416, + "step": 60557 + }, + { + "epoch": 1.55, + "learning_rate": 9.923076896799013e-07, + "loss": 0.8984, + "step": 60558 + }, + { + "epoch": 1.55, + "learning_rate": 9.922800200476185e-07, + "loss": 0.8232, + "step": 60559 + }, + { + "epoch": 1.55, + "learning_rate": 9.922523504212462e-07, + "loss": 0.7285, + "step": 60560 + }, + { + "epoch": 1.55, + "learning_rate": 9.92224680800806e-07, + "loss": 0.5928, + "step": 60561 + }, + { + "epoch": 1.55, + "learning_rate": 9.921970111863192e-07, + "loss": 0.5542, + "step": 60562 + }, + { + "epoch": 1.55, + "learning_rate": 9.921693415778066e-07, + "loss": 0.5701, + "step": 60563 + }, + { + "epoch": 1.55, + "learning_rate": 9.921416719752897e-07, + "loss": 0.6665, + "step": 60564 + }, + { + "epoch": 1.55, + "learning_rate": 9.921140023787897e-07, + "loss": 0.708, + "step": 60565 + }, + { + "epoch": 1.55, + "learning_rate": 9.920863327883274e-07, + "loss": 0.6016, + "step": 60566 + }, + { + "epoch": 1.55, + "learning_rate": 9.920586632039243e-07, + "loss": 0.7227, + "step": 60567 + }, + { + "epoch": 1.55, + "learning_rate": 9.920309936256017e-07, + "loss": 0.5791, + "step": 60568 + }, + { + "epoch": 1.55, + "learning_rate": 9.920033240533802e-07, + "loss": 0.5645, + "step": 60569 + }, + { + "epoch": 1.55, + "learning_rate": 9.919756544872815e-07, + "loss": 1.0068, + "step": 60570 + }, + { + "epoch": 1.55, + "learning_rate": 9.919479849273268e-07, + "loss": 0.4917, + "step": 60571 + }, + { + "epoch": 1.55, + "learning_rate": 9.919203153735372e-07, + "loss": 0.7275, + "step": 60572 + }, + { + "epoch": 1.55, + "learning_rate": 9.918926458259337e-07, + "loss": 0.7656, + "step": 60573 + }, + { + "epoch": 1.55, + "learning_rate": 9.918649762845376e-07, + "loss": 0.6328, + "step": 60574 + }, + { + "epoch": 1.55, + "learning_rate": 9.918373067493705e-07, + "loss": 0.6147, + "step": 60575 + }, + { + "epoch": 1.55, + "learning_rate": 9.91809637220453e-07, + "loss": 0.6895, + "step": 60576 + }, + { + "epoch": 1.55, + "learning_rate": 9.917819676978064e-07, + "loss": 0.709, + "step": 60577 + }, + { + "epoch": 1.55, + "learning_rate": 9.917542981814518e-07, + "loss": 0.5693, + "step": 60578 + }, + { + "epoch": 1.55, + "learning_rate": 9.917266286714106e-07, + "loss": 0.8076, + "step": 60579 + }, + { + "epoch": 1.55, + "learning_rate": 9.91698959167704e-07, + "loss": 0.6758, + "step": 60580 + }, + { + "epoch": 1.55, + "learning_rate": 9.916712896703532e-07, + "loss": 0.5542, + "step": 60581 + }, + { + "epoch": 1.55, + "learning_rate": 9.916436201793791e-07, + "loss": 0.6694, + "step": 60582 + }, + { + "epoch": 1.55, + "learning_rate": 9.916159506948033e-07, + "loss": 0.6465, + "step": 60583 + }, + { + "epoch": 1.55, + "learning_rate": 9.915882812166472e-07, + "loss": 0.8535, + "step": 60584 + }, + { + "epoch": 1.55, + "learning_rate": 9.91560611744931e-07, + "loss": 0.6675, + "step": 60585 + }, + { + "epoch": 1.55, + "learning_rate": 9.915329422796767e-07, + "loss": 0.6006, + "step": 60586 + }, + { + "epoch": 1.55, + "learning_rate": 9.915052728209052e-07, + "loss": 0.7812, + "step": 60587 + }, + { + "epoch": 1.55, + "learning_rate": 9.914776033686375e-07, + "loss": 0.73, + "step": 60588 + }, + { + "epoch": 1.55, + "learning_rate": 9.914499339228953e-07, + "loss": 0.5088, + "step": 60589 + }, + { + "epoch": 1.55, + "learning_rate": 9.914222644836992e-07, + "loss": 0.6931, + "step": 60590 + }, + { + "epoch": 1.55, + "learning_rate": 9.913945950510707e-07, + "loss": 0.6152, + "step": 60591 + }, + { + "epoch": 1.55, + "learning_rate": 9.91366925625031e-07, + "loss": 0.5117, + "step": 60592 + }, + { + "epoch": 1.55, + "learning_rate": 9.913392562056014e-07, + "loss": 0.5791, + "step": 60593 + }, + { + "epoch": 1.55, + "learning_rate": 9.913115867928032e-07, + "loss": 0.5659, + "step": 60594 + }, + { + "epoch": 1.55, + "learning_rate": 9.91283917386657e-07, + "loss": 0.5684, + "step": 60595 + }, + { + "epoch": 1.55, + "learning_rate": 9.912562479871842e-07, + "loss": 0.5933, + "step": 60596 + }, + { + "epoch": 1.55, + "learning_rate": 9.91228578594406e-07, + "loss": 0.7979, + "step": 60597 + }, + { + "epoch": 1.55, + "learning_rate": 9.91200909208344e-07, + "loss": 0.7637, + "step": 60598 + }, + { + "epoch": 1.55, + "learning_rate": 9.911732398290188e-07, + "loss": 0.7344, + "step": 60599 + }, + { + "epoch": 1.55, + "learning_rate": 9.91145570456452e-07, + "loss": 0.6338, + "step": 60600 + }, + { + "epoch": 1.55, + "learning_rate": 9.911179010906645e-07, + "loss": 0.637, + "step": 60601 + }, + { + "epoch": 1.55, + "learning_rate": 9.910902317316778e-07, + "loss": 0.582, + "step": 60602 + }, + { + "epoch": 1.55, + "learning_rate": 9.910625623795125e-07, + "loss": 0.6821, + "step": 60603 + }, + { + "epoch": 1.55, + "learning_rate": 9.91034893034191e-07, + "loss": 0.6802, + "step": 60604 + }, + { + "epoch": 1.55, + "learning_rate": 9.910072236957331e-07, + "loss": 0.4978, + "step": 60605 + }, + { + "epoch": 1.55, + "learning_rate": 9.909795543641607e-07, + "loss": 0.6211, + "step": 60606 + }, + { + "epoch": 1.55, + "learning_rate": 9.909518850394946e-07, + "loss": 0.5867, + "step": 60607 + }, + { + "epoch": 1.55, + "learning_rate": 9.909242157217565e-07, + "loss": 0.5938, + "step": 60608 + }, + { + "epoch": 1.55, + "learning_rate": 9.90896546410967e-07, + "loss": 0.5732, + "step": 60609 + }, + { + "epoch": 1.55, + "learning_rate": 9.908688771071477e-07, + "loss": 0.5112, + "step": 60610 + }, + { + "epoch": 1.55, + "learning_rate": 9.908412078103198e-07, + "loss": 0.6118, + "step": 60611 + }, + { + "epoch": 1.55, + "learning_rate": 9.908135385205044e-07, + "loss": 0.6572, + "step": 60612 + }, + { + "epoch": 1.55, + "learning_rate": 9.907858692377225e-07, + "loss": 0.5695, + "step": 60613 + }, + { + "epoch": 1.55, + "learning_rate": 9.907581999619956e-07, + "loss": 0.6655, + "step": 60614 + }, + { + "epoch": 1.55, + "learning_rate": 9.907305306933448e-07, + "loss": 0.7793, + "step": 60615 + }, + { + "epoch": 1.55, + "learning_rate": 9.90702861431791e-07, + "loss": 0.5444, + "step": 60616 + }, + { + "epoch": 1.55, + "learning_rate": 9.906751921773557e-07, + "loss": 0.6816, + "step": 60617 + }, + { + "epoch": 1.55, + "learning_rate": 9.906475229300597e-07, + "loss": 0.7031, + "step": 60618 + }, + { + "epoch": 1.55, + "learning_rate": 9.906198536899249e-07, + "loss": 0.6333, + "step": 60619 + }, + { + "epoch": 1.55, + "learning_rate": 9.905921844569716e-07, + "loss": 0.5903, + "step": 60620 + }, + { + "epoch": 1.55, + "learning_rate": 9.905645152312218e-07, + "loss": 0.6431, + "step": 60621 + }, + { + "epoch": 1.55, + "learning_rate": 9.905368460126959e-07, + "loss": 0.488, + "step": 60622 + }, + { + "epoch": 1.55, + "learning_rate": 9.90509176801416e-07, + "loss": 0.6406, + "step": 60623 + }, + { + "epoch": 1.55, + "learning_rate": 9.904815075974028e-07, + "loss": 0.7051, + "step": 60624 + }, + { + "epoch": 1.55, + "learning_rate": 9.904538384006772e-07, + "loss": 0.5442, + "step": 60625 + }, + { + "epoch": 1.55, + "learning_rate": 9.904261692112606e-07, + "loss": 0.6787, + "step": 60626 + }, + { + "epoch": 1.55, + "learning_rate": 9.903985000291743e-07, + "loss": 0.6787, + "step": 60627 + }, + { + "epoch": 1.55, + "learning_rate": 9.903708308544393e-07, + "loss": 0.8682, + "step": 60628 + }, + { + "epoch": 1.55, + "learning_rate": 9.903431616870772e-07, + "loss": 0.7822, + "step": 60629 + }, + { + "epoch": 1.55, + "learning_rate": 9.903154925271088e-07, + "loss": 0.71, + "step": 60630 + }, + { + "epoch": 1.55, + "learning_rate": 9.902878233745553e-07, + "loss": 0.4467, + "step": 60631 + }, + { + "epoch": 1.55, + "learning_rate": 9.902601542294379e-07, + "loss": 0.4531, + "step": 60632 + }, + { + "epoch": 1.55, + "learning_rate": 9.90232485091778e-07, + "loss": 0.7158, + "step": 60633 + }, + { + "epoch": 1.55, + "learning_rate": 9.90204815961597e-07, + "loss": 0.7373, + "step": 60634 + }, + { + "epoch": 1.55, + "learning_rate": 9.901771468389152e-07, + "loss": 0.605, + "step": 60635 + }, + { + "epoch": 1.55, + "learning_rate": 9.901494777237544e-07, + "loss": 0.6533, + "step": 60636 + }, + { + "epoch": 1.55, + "learning_rate": 9.901218086161355e-07, + "loss": 0.9014, + "step": 60637 + }, + { + "epoch": 1.55, + "learning_rate": 9.900941395160803e-07, + "loss": 0.7305, + "step": 60638 + }, + { + "epoch": 1.55, + "learning_rate": 9.900664704236092e-07, + "loss": 0.583, + "step": 60639 + }, + { + "epoch": 1.55, + "learning_rate": 9.90038801338744e-07, + "loss": 0.6069, + "step": 60640 + }, + { + "epoch": 1.55, + "learning_rate": 9.900111322615055e-07, + "loss": 0.5979, + "step": 60641 + }, + { + "epoch": 1.55, + "learning_rate": 9.89983463191915e-07, + "loss": 0.5586, + "step": 60642 + }, + { + "epoch": 1.55, + "learning_rate": 9.89955794129994e-07, + "loss": 0.6514, + "step": 60643 + }, + { + "epoch": 1.55, + "learning_rate": 9.899281250757634e-07, + "loss": 0.6704, + "step": 60644 + }, + { + "epoch": 1.55, + "learning_rate": 9.899004560292438e-07, + "loss": 0.7222, + "step": 60645 + }, + { + "epoch": 1.55, + "learning_rate": 9.898727869904574e-07, + "loss": 0.4342, + "step": 60646 + }, + { + "epoch": 1.55, + "learning_rate": 9.898451179594248e-07, + "loss": 0.5474, + "step": 60647 + }, + { + "epoch": 1.55, + "learning_rate": 9.898174489361673e-07, + "loss": 0.6172, + "step": 60648 + }, + { + "epoch": 1.55, + "learning_rate": 9.89789779920706e-07, + "loss": 0.5228, + "step": 60649 + }, + { + "epoch": 1.55, + "learning_rate": 9.897621109130626e-07, + "loss": 0.7666, + "step": 60650 + }, + { + "epoch": 1.55, + "learning_rate": 9.897344419132573e-07, + "loss": 0.4736, + "step": 60651 + }, + { + "epoch": 1.55, + "learning_rate": 9.897067729213123e-07, + "loss": 0.6953, + "step": 60652 + }, + { + "epoch": 1.55, + "learning_rate": 9.896791039372482e-07, + "loss": 0.6416, + "step": 60653 + }, + { + "epoch": 1.55, + "learning_rate": 9.896514349610866e-07, + "loss": 0.7266, + "step": 60654 + }, + { + "epoch": 1.55, + "learning_rate": 9.896237659928483e-07, + "loss": 0.6826, + "step": 60655 + }, + { + "epoch": 1.55, + "learning_rate": 9.895960970325544e-07, + "loss": 0.5879, + "step": 60656 + }, + { + "epoch": 1.55, + "learning_rate": 9.895684280802264e-07, + "loss": 0.5605, + "step": 60657 + }, + { + "epoch": 1.55, + "learning_rate": 9.895407591358852e-07, + "loss": 0.6375, + "step": 60658 + }, + { + "epoch": 1.55, + "learning_rate": 9.895130901995526e-07, + "loss": 0.6621, + "step": 60659 + }, + { + "epoch": 1.55, + "learning_rate": 9.89485421271249e-07, + "loss": 0.7173, + "step": 60660 + }, + { + "epoch": 1.55, + "learning_rate": 9.89457752350996e-07, + "loss": 0.665, + "step": 60661 + }, + { + "epoch": 1.55, + "learning_rate": 9.894300834388147e-07, + "loss": 0.5425, + "step": 60662 + }, + { + "epoch": 1.55, + "learning_rate": 9.894024145347263e-07, + "loss": 0.6475, + "step": 60663 + }, + { + "epoch": 1.55, + "learning_rate": 9.893747456387522e-07, + "loss": 0.5139, + "step": 60664 + }, + { + "epoch": 1.55, + "learning_rate": 9.893470767509132e-07, + "loss": 0.5759, + "step": 60665 + }, + { + "epoch": 1.55, + "learning_rate": 9.893194078712305e-07, + "loss": 0.5042, + "step": 60666 + }, + { + "epoch": 1.55, + "learning_rate": 9.892917389997256e-07, + "loss": 0.749, + "step": 60667 + }, + { + "epoch": 1.55, + "learning_rate": 9.892640701364194e-07, + "loss": 0.6646, + "step": 60668 + }, + { + "epoch": 1.55, + "learning_rate": 9.892364012813333e-07, + "loss": 0.7021, + "step": 60669 + }, + { + "epoch": 1.56, + "learning_rate": 9.892087324344884e-07, + "loss": 0.604, + "step": 60670 + }, + { + "epoch": 1.56, + "learning_rate": 9.89181063595906e-07, + "loss": 0.7666, + "step": 60671 + }, + { + "epoch": 1.56, + "learning_rate": 9.891533947656067e-07, + "loss": 0.6675, + "step": 60672 + }, + { + "epoch": 1.56, + "learning_rate": 9.891257259436127e-07, + "loss": 0.748, + "step": 60673 + }, + { + "epoch": 1.56, + "learning_rate": 9.890980571299446e-07, + "loss": 0.7588, + "step": 60674 + }, + { + "epoch": 1.56, + "learning_rate": 9.890703883246234e-07, + "loss": 0.7588, + "step": 60675 + }, + { + "epoch": 1.56, + "learning_rate": 9.890427195276704e-07, + "loss": 0.6797, + "step": 60676 + }, + { + "epoch": 1.56, + "learning_rate": 9.890150507391071e-07, + "loss": 0.7549, + "step": 60677 + }, + { + "epoch": 1.56, + "learning_rate": 9.889873819589544e-07, + "loss": 0.5635, + "step": 60678 + }, + { + "epoch": 1.56, + "learning_rate": 9.889597131872335e-07, + "loss": 0.5991, + "step": 60679 + }, + { + "epoch": 1.56, + "learning_rate": 9.889320444239656e-07, + "loss": 0.6689, + "step": 60680 + }, + { + "epoch": 1.56, + "learning_rate": 9.88904375669172e-07, + "loss": 0.6748, + "step": 60681 + }, + { + "epoch": 1.56, + "learning_rate": 9.888767069228737e-07, + "loss": 0.5649, + "step": 60682 + }, + { + "epoch": 1.56, + "learning_rate": 9.888490381850923e-07, + "loss": 0.748, + "step": 60683 + }, + { + "epoch": 1.56, + "learning_rate": 9.888213694558486e-07, + "loss": 0.5127, + "step": 60684 + }, + { + "epoch": 1.56, + "learning_rate": 9.887937007351636e-07, + "loss": 0.6675, + "step": 60685 + }, + { + "epoch": 1.56, + "learning_rate": 9.887660320230592e-07, + "loss": 0.5952, + "step": 60686 + }, + { + "epoch": 1.56, + "learning_rate": 9.887383633195556e-07, + "loss": 0.5259, + "step": 60687 + }, + { + "epoch": 1.56, + "learning_rate": 9.887106946246747e-07, + "loss": 0.6699, + "step": 60688 + }, + { + "epoch": 1.56, + "learning_rate": 9.886830259384374e-07, + "loss": 0.4629, + "step": 60689 + }, + { + "epoch": 1.56, + "learning_rate": 9.886553572608653e-07, + "loss": 0.6309, + "step": 60690 + }, + { + "epoch": 1.56, + "learning_rate": 9.88627688591979e-07, + "loss": 0.7676, + "step": 60691 + }, + { + "epoch": 1.56, + "learning_rate": 9.886000199318e-07, + "loss": 0.7646, + "step": 60692 + }, + { + "epoch": 1.56, + "learning_rate": 9.885723512803494e-07, + "loss": 0.7842, + "step": 60693 + }, + { + "epoch": 1.56, + "learning_rate": 9.885446826376492e-07, + "loss": 0.6826, + "step": 60694 + }, + { + "epoch": 1.56, + "learning_rate": 9.88517014003719e-07, + "loss": 0.5723, + "step": 60695 + }, + { + "epoch": 1.56, + "learning_rate": 9.884893453785809e-07, + "loss": 0.6177, + "step": 60696 + }, + { + "epoch": 1.56, + "learning_rate": 9.884616767622558e-07, + "loss": 0.563, + "step": 60697 + }, + { + "epoch": 1.56, + "learning_rate": 9.884340081547655e-07, + "loss": 0.6418, + "step": 60698 + }, + { + "epoch": 1.56, + "learning_rate": 9.884063395561302e-07, + "loss": 0.5928, + "step": 60699 + }, + { + "epoch": 1.56, + "learning_rate": 9.883786709663721e-07, + "loss": 0.6182, + "step": 60700 + }, + { + "epoch": 1.56, + "learning_rate": 9.883510023855117e-07, + "loss": 0.5571, + "step": 60701 + }, + { + "epoch": 1.56, + "learning_rate": 9.883233338135705e-07, + "loss": 0.5728, + "step": 60702 + }, + { + "epoch": 1.56, + "learning_rate": 9.882956652505695e-07, + "loss": 0.3381, + "step": 60703 + }, + { + "epoch": 1.56, + "learning_rate": 9.882679966965303e-07, + "loss": 0.6675, + "step": 60704 + }, + { + "epoch": 1.56, + "learning_rate": 9.882403281514735e-07, + "loss": 0.6191, + "step": 60705 + }, + { + "epoch": 1.56, + "learning_rate": 9.882126596154202e-07, + "loss": 0.7852, + "step": 60706 + }, + { + "epoch": 1.56, + "learning_rate": 9.881849910883925e-07, + "loss": 0.47, + "step": 60707 + }, + { + "epoch": 1.56, + "learning_rate": 9.881573225704105e-07, + "loss": 0.5353, + "step": 60708 + }, + { + "epoch": 1.56, + "learning_rate": 9.881296540614964e-07, + "loss": 0.5688, + "step": 60709 + }, + { + "epoch": 1.56, + "learning_rate": 9.881019855616705e-07, + "loss": 0.6406, + "step": 60710 + }, + { + "epoch": 1.56, + "learning_rate": 9.880743170709545e-07, + "loss": 0.6504, + "step": 60711 + }, + { + "epoch": 1.56, + "learning_rate": 9.880466485893693e-07, + "loss": 0.6973, + "step": 60712 + }, + { + "epoch": 1.56, + "learning_rate": 9.880189801169364e-07, + "loss": 0.6289, + "step": 60713 + }, + { + "epoch": 1.56, + "learning_rate": 9.879913116536772e-07, + "loss": 0.6094, + "step": 60714 + }, + { + "epoch": 1.56, + "learning_rate": 9.87963643199612e-07, + "loss": 0.8193, + "step": 60715 + }, + { + "epoch": 1.56, + "learning_rate": 9.879359747547626e-07, + "loss": 0.644, + "step": 60716 + }, + { + "epoch": 1.56, + "learning_rate": 9.879083063191501e-07, + "loss": 0.4155, + "step": 60717 + }, + { + "epoch": 1.56, + "learning_rate": 9.878806378927954e-07, + "loss": 0.5391, + "step": 60718 + }, + { + "epoch": 1.56, + "learning_rate": 9.878529694757202e-07, + "loss": 0.4857, + "step": 60719 + }, + { + "epoch": 1.56, + "learning_rate": 9.878253010679453e-07, + "loss": 0.7021, + "step": 60720 + }, + { + "epoch": 1.56, + "learning_rate": 9.87797632669492e-07, + "loss": 0.583, + "step": 60721 + }, + { + "epoch": 1.56, + "learning_rate": 9.877699642803814e-07, + "loss": 0.53, + "step": 60722 + }, + { + "epoch": 1.56, + "learning_rate": 9.87742295900635e-07, + "loss": 0.6841, + "step": 60723 + }, + { + "epoch": 1.56, + "learning_rate": 9.87714627530274e-07, + "loss": 0.6748, + "step": 60724 + }, + { + "epoch": 1.56, + "learning_rate": 9.87686959169319e-07, + "loss": 0.7324, + "step": 60725 + }, + { + "epoch": 1.56, + "learning_rate": 9.876592908177917e-07, + "loss": 0.6982, + "step": 60726 + }, + { + "epoch": 1.56, + "learning_rate": 9.876316224757128e-07, + "loss": 0.6797, + "step": 60727 + }, + { + "epoch": 1.56, + "learning_rate": 9.876039541431041e-07, + "loss": 0.6694, + "step": 60728 + }, + { + "epoch": 1.56, + "learning_rate": 9.875762858199863e-07, + "loss": 0.5552, + "step": 60729 + }, + { + "epoch": 1.56, + "learning_rate": 9.875486175063808e-07, + "loss": 0.6475, + "step": 60730 + }, + { + "epoch": 1.56, + "learning_rate": 9.875209492023087e-07, + "loss": 0.6997, + "step": 60731 + }, + { + "epoch": 1.56, + "learning_rate": 9.874932809077913e-07, + "loss": 0.458, + "step": 60732 + }, + { + "epoch": 1.56, + "learning_rate": 9.874656126228499e-07, + "loss": 0.6084, + "step": 60733 + }, + { + "epoch": 1.56, + "learning_rate": 9.874379443475055e-07, + "loss": 0.5913, + "step": 60734 + }, + { + "epoch": 1.56, + "learning_rate": 9.87410276081779e-07, + "loss": 0.6626, + "step": 60735 + }, + { + "epoch": 1.56, + "learning_rate": 9.873826078256921e-07, + "loss": 0.606, + "step": 60736 + }, + { + "epoch": 1.56, + "learning_rate": 9.873549395792655e-07, + "loss": 0.6388, + "step": 60737 + }, + { + "epoch": 1.56, + "learning_rate": 9.873272713425208e-07, + "loss": 0.6406, + "step": 60738 + }, + { + "epoch": 1.56, + "learning_rate": 9.87299603115479e-07, + "loss": 0.7197, + "step": 60739 + }, + { + "epoch": 1.56, + "learning_rate": 9.872719348981614e-07, + "loss": 0.5583, + "step": 60740 + }, + { + "epoch": 1.56, + "learning_rate": 9.872442666905888e-07, + "loss": 0.6348, + "step": 60741 + }, + { + "epoch": 1.56, + "learning_rate": 9.872165984927831e-07, + "loss": 0.6738, + "step": 60742 + }, + { + "epoch": 1.56, + "learning_rate": 9.871889303047647e-07, + "loss": 0.6094, + "step": 60743 + }, + { + "epoch": 1.56, + "learning_rate": 9.871612621265555e-07, + "loss": 0.7002, + "step": 60744 + }, + { + "epoch": 1.56, + "learning_rate": 9.871335939581762e-07, + "loss": 0.624, + "step": 60745 + }, + { + "epoch": 1.56, + "learning_rate": 9.87105925799648e-07, + "loss": 0.6882, + "step": 60746 + }, + { + "epoch": 1.56, + "learning_rate": 9.870782576509923e-07, + "loss": 0.5571, + "step": 60747 + }, + { + "epoch": 1.56, + "learning_rate": 9.8705058951223e-07, + "loss": 0.7202, + "step": 60748 + }, + { + "epoch": 1.56, + "learning_rate": 9.870229213833826e-07, + "loss": 0.7295, + "step": 60749 + }, + { + "epoch": 1.56, + "learning_rate": 9.869952532644715e-07, + "loss": 0.5601, + "step": 60750 + }, + { + "epoch": 1.56, + "learning_rate": 9.86967585155517e-07, + "loss": 0.5586, + "step": 60751 + }, + { + "epoch": 1.56, + "learning_rate": 9.86939917056541e-07, + "loss": 0.6172, + "step": 60752 + }, + { + "epoch": 1.56, + "learning_rate": 9.869122489675645e-07, + "loss": 0.5552, + "step": 60753 + }, + { + "epoch": 1.56, + "learning_rate": 9.86884580888609e-07, + "loss": 0.7637, + "step": 60754 + }, + { + "epoch": 1.56, + "learning_rate": 9.868569128196952e-07, + "loss": 0.6436, + "step": 60755 + }, + { + "epoch": 1.56, + "learning_rate": 9.868292447608442e-07, + "loss": 0.6025, + "step": 60756 + }, + { + "epoch": 1.56, + "learning_rate": 9.868015767120775e-07, + "loss": 0.5936, + "step": 60757 + }, + { + "epoch": 1.56, + "learning_rate": 9.867739086734162e-07, + "loss": 0.7051, + "step": 60758 + }, + { + "epoch": 1.56, + "learning_rate": 9.867462406448818e-07, + "loss": 0.561, + "step": 60759 + }, + { + "epoch": 1.56, + "learning_rate": 9.867185726264948e-07, + "loss": 0.6196, + "step": 60760 + }, + { + "epoch": 1.56, + "learning_rate": 9.866909046182771e-07, + "loss": 0.7471, + "step": 60761 + }, + { + "epoch": 1.56, + "learning_rate": 9.866632366202493e-07, + "loss": 0.7998, + "step": 60762 + }, + { + "epoch": 1.56, + "learning_rate": 9.866355686324332e-07, + "loss": 0.7339, + "step": 60763 + }, + { + "epoch": 1.56, + "learning_rate": 9.866079006548497e-07, + "loss": 0.7197, + "step": 60764 + }, + { + "epoch": 1.56, + "learning_rate": 9.865802326875194e-07, + "loss": 0.8125, + "step": 60765 + }, + { + "epoch": 1.56, + "learning_rate": 9.865525647304644e-07, + "loss": 0.709, + "step": 60766 + }, + { + "epoch": 1.56, + "learning_rate": 9.865248967837055e-07, + "loss": 0.5068, + "step": 60767 + }, + { + "epoch": 1.56, + "learning_rate": 9.864972288472634e-07, + "loss": 0.5835, + "step": 60768 + }, + { + "epoch": 1.56, + "learning_rate": 9.8646956092116e-07, + "loss": 0.3438, + "step": 60769 + }, + { + "epoch": 1.56, + "learning_rate": 9.864418930054164e-07, + "loss": 0.793, + "step": 60770 + }, + { + "epoch": 1.56, + "learning_rate": 9.864142251000535e-07, + "loss": 0.7266, + "step": 60771 + }, + { + "epoch": 1.56, + "learning_rate": 9.863865572050925e-07, + "loss": 0.7617, + "step": 60772 + }, + { + "epoch": 1.56, + "learning_rate": 9.863588893205548e-07, + "loss": 0.585, + "step": 60773 + }, + { + "epoch": 1.56, + "learning_rate": 9.863312214464618e-07, + "loss": 0.7959, + "step": 60774 + }, + { + "epoch": 1.56, + "learning_rate": 9.86303553582834e-07, + "loss": 0.665, + "step": 60775 + }, + { + "epoch": 1.56, + "learning_rate": 9.86275885729693e-07, + "loss": 0.7383, + "step": 60776 + }, + { + "epoch": 1.56, + "learning_rate": 9.862482178870598e-07, + "loss": 0.6436, + "step": 60777 + }, + { + "epoch": 1.56, + "learning_rate": 9.862205500549557e-07, + "loss": 0.6738, + "step": 60778 + }, + { + "epoch": 1.56, + "learning_rate": 9.861928822334018e-07, + "loss": 0.6846, + "step": 60779 + }, + { + "epoch": 1.56, + "learning_rate": 9.861652144224198e-07, + "loss": 0.4863, + "step": 60780 + }, + { + "epoch": 1.56, + "learning_rate": 9.861375466220299e-07, + "loss": 0.7559, + "step": 60781 + }, + { + "epoch": 1.56, + "learning_rate": 9.861098788322544e-07, + "loss": 0.6362, + "step": 60782 + }, + { + "epoch": 1.56, + "learning_rate": 9.860822110531135e-07, + "loss": 0.48, + "step": 60783 + }, + { + "epoch": 1.56, + "learning_rate": 9.860545432846295e-07, + "loss": 0.6499, + "step": 60784 + }, + { + "epoch": 1.56, + "learning_rate": 9.860268755268222e-07, + "loss": 0.5376, + "step": 60785 + }, + { + "epoch": 1.56, + "learning_rate": 9.859992077797139e-07, + "loss": 0.6455, + "step": 60786 + }, + { + "epoch": 1.56, + "learning_rate": 9.85971540043325e-07, + "loss": 0.6973, + "step": 60787 + }, + { + "epoch": 1.56, + "learning_rate": 9.859438723176772e-07, + "loss": 0.6606, + "step": 60788 + }, + { + "epoch": 1.56, + "learning_rate": 9.859162046027913e-07, + "loss": 0.6411, + "step": 60789 + }, + { + "epoch": 1.56, + "learning_rate": 9.85888536898689e-07, + "loss": 0.8457, + "step": 60790 + }, + { + "epoch": 1.56, + "learning_rate": 9.85860869205391e-07, + "loss": 0.7627, + "step": 60791 + }, + { + "epoch": 1.56, + "learning_rate": 9.85833201522919e-07, + "loss": 0.5786, + "step": 60792 + }, + { + "epoch": 1.56, + "learning_rate": 9.858055338512935e-07, + "loss": 0.6172, + "step": 60793 + }, + { + "epoch": 1.56, + "learning_rate": 9.857778661905366e-07, + "loss": 0.6255, + "step": 60794 + }, + { + "epoch": 1.56, + "learning_rate": 9.857501985406685e-07, + "loss": 0.6504, + "step": 60795 + }, + { + "epoch": 1.56, + "learning_rate": 9.857225309017108e-07, + "loss": 0.6826, + "step": 60796 + }, + { + "epoch": 1.56, + "learning_rate": 9.856948632736849e-07, + "loss": 0.6787, + "step": 60797 + }, + { + "epoch": 1.56, + "learning_rate": 9.856671956566113e-07, + "loss": 0.625, + "step": 60798 + }, + { + "epoch": 1.56, + "learning_rate": 9.856395280505121e-07, + "loss": 0.7061, + "step": 60799 + }, + { + "epoch": 1.56, + "learning_rate": 9.85611860455408e-07, + "loss": 0.7451, + "step": 60800 + }, + { + "epoch": 1.56, + "learning_rate": 9.855841928713203e-07, + "loss": 0.5212, + "step": 60801 + }, + { + "epoch": 1.56, + "learning_rate": 9.8555652529827e-07, + "loss": 0.6992, + "step": 60802 + }, + { + "epoch": 1.56, + "learning_rate": 9.855288577362784e-07, + "loss": 0.6685, + "step": 60803 + }, + { + "epoch": 1.56, + "learning_rate": 9.85501190185367e-07, + "loss": 0.708, + "step": 60804 + }, + { + "epoch": 1.56, + "learning_rate": 9.854735226455564e-07, + "loss": 0.6108, + "step": 60805 + }, + { + "epoch": 1.56, + "learning_rate": 9.85445855116868e-07, + "loss": 0.7012, + "step": 60806 + }, + { + "epoch": 1.56, + "learning_rate": 9.854181875993232e-07, + "loss": 0.6895, + "step": 60807 + }, + { + "epoch": 1.56, + "learning_rate": 9.853905200929429e-07, + "loss": 0.8359, + "step": 60808 + }, + { + "epoch": 1.56, + "learning_rate": 9.853628525977485e-07, + "loss": 0.5256, + "step": 60809 + }, + { + "epoch": 1.56, + "learning_rate": 9.853351851137607e-07, + "loss": 0.7397, + "step": 60810 + }, + { + "epoch": 1.56, + "learning_rate": 9.853075176410017e-07, + "loss": 0.7256, + "step": 60811 + }, + { + "epoch": 1.56, + "learning_rate": 9.852798501794917e-07, + "loss": 0.5217, + "step": 60812 + }, + { + "epoch": 1.56, + "learning_rate": 9.85252182729252e-07, + "loss": 0.6836, + "step": 60813 + }, + { + "epoch": 1.56, + "learning_rate": 9.852245152903049e-07, + "loss": 0.6479, + "step": 60814 + }, + { + "epoch": 1.56, + "learning_rate": 9.851968478626698e-07, + "loss": 0.6162, + "step": 60815 + }, + { + "epoch": 1.56, + "learning_rate": 9.851691804463693e-07, + "loss": 0.6235, + "step": 60816 + }, + { + "epoch": 1.56, + "learning_rate": 9.851415130414238e-07, + "loss": 0.8105, + "step": 60817 + }, + { + "epoch": 1.56, + "learning_rate": 9.851138456478549e-07, + "loss": 0.7793, + "step": 60818 + }, + { + "epoch": 1.56, + "learning_rate": 9.850861782656835e-07, + "loss": 0.8496, + "step": 60819 + }, + { + "epoch": 1.56, + "learning_rate": 9.850585108949311e-07, + "loss": 0.7529, + "step": 60820 + }, + { + "epoch": 1.56, + "learning_rate": 9.850308435356186e-07, + "loss": 0.6758, + "step": 60821 + }, + { + "epoch": 1.56, + "learning_rate": 9.850031761877673e-07, + "loss": 0.7451, + "step": 60822 + }, + { + "epoch": 1.56, + "learning_rate": 9.849755088513985e-07, + "loss": 0.5602, + "step": 60823 + }, + { + "epoch": 1.56, + "learning_rate": 9.849478415265334e-07, + "loss": 0.4722, + "step": 60824 + }, + { + "epoch": 1.56, + "learning_rate": 9.849201742131927e-07, + "loss": 0.7061, + "step": 60825 + }, + { + "epoch": 1.56, + "learning_rate": 9.848925069113981e-07, + "loss": 0.8359, + "step": 60826 + }, + { + "epoch": 1.56, + "learning_rate": 9.848648396211705e-07, + "loss": 0.5546, + "step": 60827 + }, + { + "epoch": 1.56, + "learning_rate": 9.848371723425315e-07, + "loss": 0.5664, + "step": 60828 + }, + { + "epoch": 1.56, + "learning_rate": 9.848095050755015e-07, + "loss": 0.6211, + "step": 60829 + }, + { + "epoch": 1.56, + "learning_rate": 9.847818378201025e-07, + "loss": 0.563, + "step": 60830 + }, + { + "epoch": 1.56, + "learning_rate": 9.847541705763552e-07, + "loss": 0.6475, + "step": 60831 + }, + { + "epoch": 1.56, + "learning_rate": 9.84726503344281e-07, + "loss": 0.7334, + "step": 60832 + }, + { + "epoch": 1.56, + "learning_rate": 9.846988361239009e-07, + "loss": 0.5088, + "step": 60833 + }, + { + "epoch": 1.56, + "learning_rate": 9.846711689152366e-07, + "loss": 0.6567, + "step": 60834 + }, + { + "epoch": 1.56, + "learning_rate": 9.846435017183085e-07, + "loss": 0.668, + "step": 60835 + }, + { + "epoch": 1.56, + "learning_rate": 9.846158345331381e-07, + "loss": 0.5813, + "step": 60836 + }, + { + "epoch": 1.56, + "learning_rate": 9.84588167359747e-07, + "loss": 0.7031, + "step": 60837 + }, + { + "epoch": 1.56, + "learning_rate": 9.845605001981557e-07, + "loss": 0.5449, + "step": 60838 + }, + { + "epoch": 1.56, + "learning_rate": 9.84532833048386e-07, + "loss": 0.6978, + "step": 60839 + }, + { + "epoch": 1.56, + "learning_rate": 9.845051659104584e-07, + "loss": 0.6602, + "step": 60840 + }, + { + "epoch": 1.56, + "learning_rate": 9.844774987843946e-07, + "loss": 0.6191, + "step": 60841 + }, + { + "epoch": 1.56, + "learning_rate": 9.84449831670216e-07, + "loss": 0.6973, + "step": 60842 + }, + { + "epoch": 1.56, + "learning_rate": 9.84422164567943e-07, + "loss": 0.4824, + "step": 60843 + }, + { + "epoch": 1.56, + "learning_rate": 9.84394497477598e-07, + "loss": 0.5425, + "step": 60844 + }, + { + "epoch": 1.56, + "learning_rate": 9.843668303992007e-07, + "loss": 0.7871, + "step": 60845 + }, + { + "epoch": 1.56, + "learning_rate": 9.843391633327731e-07, + "loss": 0.5996, + "step": 60846 + }, + { + "epoch": 1.56, + "learning_rate": 9.843114962783363e-07, + "loss": 0.7021, + "step": 60847 + }, + { + "epoch": 1.56, + "learning_rate": 9.842838292359115e-07, + "loss": 0.6104, + "step": 60848 + }, + { + "epoch": 1.56, + "learning_rate": 9.842561622055199e-07, + "loss": 0.6758, + "step": 60849 + }, + { + "epoch": 1.56, + "learning_rate": 9.842284951871826e-07, + "loss": 0.5513, + "step": 60850 + }, + { + "epoch": 1.56, + "learning_rate": 9.842008281809208e-07, + "loss": 0.5596, + "step": 60851 + }, + { + "epoch": 1.56, + "learning_rate": 9.841731611867557e-07, + "loss": 0.4653, + "step": 60852 + }, + { + "epoch": 1.56, + "learning_rate": 9.841454942047087e-07, + "loss": 0.6558, + "step": 60853 + }, + { + "epoch": 1.56, + "learning_rate": 9.841178272348007e-07, + "loss": 0.6738, + "step": 60854 + }, + { + "epoch": 1.56, + "learning_rate": 9.840901602770527e-07, + "loss": 0.6777, + "step": 60855 + }, + { + "epoch": 1.56, + "learning_rate": 9.840624933314864e-07, + "loss": 0.7256, + "step": 60856 + }, + { + "epoch": 1.56, + "learning_rate": 9.840348263981226e-07, + "loss": 0.6201, + "step": 60857 + }, + { + "epoch": 1.56, + "learning_rate": 9.840071594769825e-07, + "loss": 0.6753, + "step": 60858 + }, + { + "epoch": 1.56, + "learning_rate": 9.839794925680874e-07, + "loss": 0.7007, + "step": 60859 + }, + { + "epoch": 1.56, + "learning_rate": 9.839518256714583e-07, + "loss": 0.5044, + "step": 60860 + }, + { + "epoch": 1.56, + "learning_rate": 9.83924158787117e-07, + "loss": 0.8047, + "step": 60861 + }, + { + "epoch": 1.56, + "learning_rate": 9.838964919150839e-07, + "loss": 0.583, + "step": 60862 + }, + { + "epoch": 1.56, + "learning_rate": 9.838688250553806e-07, + "loss": 0.6885, + "step": 60863 + }, + { + "epoch": 1.56, + "learning_rate": 9.838411582080286e-07, + "loss": 0.6973, + "step": 60864 + }, + { + "epoch": 1.56, + "learning_rate": 9.83813491373048e-07, + "loss": 0.6914, + "step": 60865 + }, + { + "epoch": 1.56, + "learning_rate": 9.837858245504611e-07, + "loss": 0.6553, + "step": 60866 + }, + { + "epoch": 1.56, + "learning_rate": 9.837581577402885e-07, + "loss": 0.7246, + "step": 60867 + }, + { + "epoch": 1.56, + "learning_rate": 9.837304909425516e-07, + "loss": 0.6143, + "step": 60868 + }, + { + "epoch": 1.56, + "learning_rate": 9.837028241572712e-07, + "loss": 0.6182, + "step": 60869 + }, + { + "epoch": 1.56, + "learning_rate": 9.83675157384469e-07, + "loss": 0.5664, + "step": 60870 + }, + { + "epoch": 1.56, + "learning_rate": 9.83647490624166e-07, + "loss": 0.4873, + "step": 60871 + }, + { + "epoch": 1.56, + "learning_rate": 9.836198238763835e-07, + "loss": 0.5488, + "step": 60872 + }, + { + "epoch": 1.56, + "learning_rate": 9.835921571411428e-07, + "loss": 0.7588, + "step": 60873 + }, + { + "epoch": 1.56, + "learning_rate": 9.835644904184645e-07, + "loss": 0.7666, + "step": 60874 + }, + { + "epoch": 1.56, + "learning_rate": 9.8353682370837e-07, + "loss": 0.5935, + "step": 60875 + }, + { + "epoch": 1.56, + "learning_rate": 9.835091570108808e-07, + "loss": 0.6777, + "step": 60876 + }, + { + "epoch": 1.56, + "learning_rate": 9.834814903260177e-07, + "loss": 0.6758, + "step": 60877 + }, + { + "epoch": 1.56, + "learning_rate": 9.834538236538022e-07, + "loss": 0.6621, + "step": 60878 + }, + { + "epoch": 1.56, + "learning_rate": 9.83426156994255e-07, + "loss": 0.6001, + "step": 60879 + }, + { + "epoch": 1.56, + "learning_rate": 9.83398490347398e-07, + "loss": 0.7686, + "step": 60880 + }, + { + "epoch": 1.56, + "learning_rate": 9.833708237132518e-07, + "loss": 0.5254, + "step": 60881 + }, + { + "epoch": 1.56, + "learning_rate": 9.833431570918382e-07, + "loss": 0.6748, + "step": 60882 + }, + { + "epoch": 1.56, + "learning_rate": 9.83315490483178e-07, + "loss": 0.5039, + "step": 60883 + }, + { + "epoch": 1.56, + "learning_rate": 9.832878238872917e-07, + "loss": 0.5809, + "step": 60884 + }, + { + "epoch": 1.56, + "learning_rate": 9.832601573042017e-07, + "loss": 0.7783, + "step": 60885 + }, + { + "epoch": 1.56, + "learning_rate": 9.832324907339283e-07, + "loss": 0.4893, + "step": 60886 + }, + { + "epoch": 1.56, + "learning_rate": 9.832048241764932e-07, + "loss": 0.6372, + "step": 60887 + }, + { + "epoch": 1.56, + "learning_rate": 9.831771576319173e-07, + "loss": 0.665, + "step": 60888 + }, + { + "epoch": 1.56, + "learning_rate": 9.83149491100222e-07, + "loss": 0.6758, + "step": 60889 + }, + { + "epoch": 1.56, + "learning_rate": 9.83121824581428e-07, + "loss": 0.6777, + "step": 60890 + }, + { + "epoch": 1.56, + "learning_rate": 9.830941580755572e-07, + "loss": 0.7393, + "step": 60891 + }, + { + "epoch": 1.56, + "learning_rate": 9.830664915826302e-07, + "loss": 0.6082, + "step": 60892 + }, + { + "epoch": 1.56, + "learning_rate": 9.830388251026691e-07, + "loss": 0.6504, + "step": 60893 + }, + { + "epoch": 1.56, + "learning_rate": 9.830111586356938e-07, + "loss": 0.8008, + "step": 60894 + }, + { + "epoch": 1.56, + "learning_rate": 9.829834921817263e-07, + "loss": 0.6108, + "step": 60895 + }, + { + "epoch": 1.56, + "learning_rate": 9.82955825740787e-07, + "loss": 0.6143, + "step": 60896 + }, + { + "epoch": 1.56, + "learning_rate": 9.829281593128981e-07, + "loss": 0.6064, + "step": 60897 + }, + { + "epoch": 1.56, + "learning_rate": 9.829004928980803e-07, + "loss": 0.6073, + "step": 60898 + }, + { + "epoch": 1.56, + "learning_rate": 9.828728264963546e-07, + "loss": 0.6914, + "step": 60899 + }, + { + "epoch": 1.56, + "learning_rate": 9.828451601077424e-07, + "loss": 0.707, + "step": 60900 + }, + { + "epoch": 1.56, + "learning_rate": 9.828174937322652e-07, + "loss": 0.6021, + "step": 60901 + }, + { + "epoch": 1.56, + "learning_rate": 9.827898273699435e-07, + "loss": 0.6313, + "step": 60902 + }, + { + "epoch": 1.56, + "learning_rate": 9.827621610207993e-07, + "loss": 0.7539, + "step": 60903 + }, + { + "epoch": 1.56, + "learning_rate": 9.82734494684853e-07, + "loss": 0.6353, + "step": 60904 + }, + { + "epoch": 1.56, + "learning_rate": 9.82706828362126e-07, + "loss": 0.6714, + "step": 60905 + }, + { + "epoch": 1.56, + "learning_rate": 9.826791620526399e-07, + "loss": 0.6538, + "step": 60906 + }, + { + "epoch": 1.56, + "learning_rate": 9.82651495756415e-07, + "loss": 0.5698, + "step": 60907 + }, + { + "epoch": 1.56, + "learning_rate": 9.826238294734737e-07, + "loss": 0.5266, + "step": 60908 + }, + { + "epoch": 1.56, + "learning_rate": 9.82596163203836e-07, + "loss": 0.5205, + "step": 60909 + }, + { + "epoch": 1.56, + "learning_rate": 9.82568496947524e-07, + "loss": 0.6328, + "step": 60910 + }, + { + "epoch": 1.56, + "learning_rate": 9.825408307045582e-07, + "loss": 0.6758, + "step": 60911 + }, + { + "epoch": 1.56, + "learning_rate": 9.825131644749604e-07, + "loss": 0.7178, + "step": 60912 + }, + { + "epoch": 1.56, + "learning_rate": 9.824854982587517e-07, + "loss": 0.5781, + "step": 60913 + }, + { + "epoch": 1.56, + "learning_rate": 9.824578320559527e-07, + "loss": 0.751, + "step": 60914 + }, + { + "epoch": 1.56, + "learning_rate": 9.82430165866585e-07, + "loss": 0.646, + "step": 60915 + }, + { + "epoch": 1.56, + "learning_rate": 9.824024996906696e-07, + "loss": 0.7461, + "step": 60916 + }, + { + "epoch": 1.56, + "learning_rate": 9.823748335282275e-07, + "loss": 0.5369, + "step": 60917 + }, + { + "epoch": 1.56, + "learning_rate": 9.823471673792806e-07, + "loss": 0.5518, + "step": 60918 + }, + { + "epoch": 1.56, + "learning_rate": 9.823195012438496e-07, + "loss": 0.499, + "step": 60919 + }, + { + "epoch": 1.56, + "learning_rate": 9.822918351219558e-07, + "loss": 0.6523, + "step": 60920 + }, + { + "epoch": 1.56, + "learning_rate": 9.822641690136201e-07, + "loss": 0.5681, + "step": 60921 + }, + { + "epoch": 1.56, + "learning_rate": 9.82236502918864e-07, + "loss": 0.7588, + "step": 60922 + }, + { + "epoch": 1.56, + "learning_rate": 9.82208836837709e-07, + "loss": 0.6572, + "step": 60923 + }, + { + "epoch": 1.56, + "learning_rate": 9.821811707701753e-07, + "loss": 0.509, + "step": 60924 + }, + { + "epoch": 1.56, + "learning_rate": 9.82153504716285e-07, + "loss": 0.7373, + "step": 60925 + }, + { + "epoch": 1.56, + "learning_rate": 9.821258386760587e-07, + "loss": 0.5264, + "step": 60926 + }, + { + "epoch": 1.56, + "learning_rate": 9.82098172649518e-07, + "loss": 0.4202, + "step": 60927 + }, + { + "epoch": 1.56, + "learning_rate": 9.820705066366838e-07, + "loss": 0.5679, + "step": 60928 + }, + { + "epoch": 1.56, + "learning_rate": 9.820428406375774e-07, + "loss": 0.667, + "step": 60929 + }, + { + "epoch": 1.56, + "learning_rate": 9.8201517465222e-07, + "loss": 0.6709, + "step": 60930 + }, + { + "epoch": 1.56, + "learning_rate": 9.819875086806328e-07, + "loss": 0.562, + "step": 60931 + }, + { + "epoch": 1.56, + "learning_rate": 9.819598427228368e-07, + "loss": 0.6655, + "step": 60932 + }, + { + "epoch": 1.56, + "learning_rate": 9.81932176778854e-07, + "loss": 0.7803, + "step": 60933 + }, + { + "epoch": 1.56, + "learning_rate": 9.81904510848704e-07, + "loss": 0.668, + "step": 60934 + }, + { + "epoch": 1.56, + "learning_rate": 9.818768449324094e-07, + "loss": 0.5349, + "step": 60935 + }, + { + "epoch": 1.56, + "learning_rate": 9.818491790299905e-07, + "loss": 0.585, + "step": 60936 + }, + { + "epoch": 1.56, + "learning_rate": 9.81821513141469e-07, + "loss": 0.6289, + "step": 60937 + }, + { + "epoch": 1.56, + "learning_rate": 9.817938472668659e-07, + "loss": 0.4854, + "step": 60938 + }, + { + "epoch": 1.56, + "learning_rate": 9.817661814062026e-07, + "loss": 0.6514, + "step": 60939 + }, + { + "epoch": 1.56, + "learning_rate": 9.817385155594997e-07, + "loss": 0.5459, + "step": 60940 + }, + { + "epoch": 1.56, + "learning_rate": 9.817108497267792e-07, + "loss": 0.4534, + "step": 60941 + }, + { + "epoch": 1.56, + "learning_rate": 9.816831839080614e-07, + "loss": 0.5558, + "step": 60942 + }, + { + "epoch": 1.56, + "learning_rate": 9.816555181033686e-07, + "loss": 0.6206, + "step": 60943 + }, + { + "epoch": 1.56, + "learning_rate": 9.81627852312721e-07, + "loss": 0.5386, + "step": 60944 + }, + { + "epoch": 1.56, + "learning_rate": 9.8160018653614e-07, + "loss": 0.4768, + "step": 60945 + }, + { + "epoch": 1.56, + "learning_rate": 9.81572520773647e-07, + "loss": 0.6357, + "step": 60946 + }, + { + "epoch": 1.56, + "learning_rate": 9.815448550252632e-07, + "loss": 0.6245, + "step": 60947 + }, + { + "epoch": 1.56, + "learning_rate": 9.815171892910094e-07, + "loss": 0.6973, + "step": 60948 + }, + { + "epoch": 1.56, + "learning_rate": 9.814895235709072e-07, + "loss": 0.5933, + "step": 60949 + }, + { + "epoch": 1.56, + "learning_rate": 9.814618578649774e-07, + "loss": 0.6523, + "step": 60950 + }, + { + "epoch": 1.56, + "learning_rate": 9.814341921732417e-07, + "loss": 0.6982, + "step": 60951 + }, + { + "epoch": 1.56, + "learning_rate": 9.814065264957207e-07, + "loss": 0.6826, + "step": 60952 + }, + { + "epoch": 1.56, + "learning_rate": 9.813788608324363e-07, + "loss": 0.7104, + "step": 60953 + }, + { + "epoch": 1.56, + "learning_rate": 9.813511951834088e-07, + "loss": 0.5635, + "step": 60954 + }, + { + "epoch": 1.56, + "learning_rate": 9.8132352954866e-07, + "loss": 0.6567, + "step": 60955 + }, + { + "epoch": 1.56, + "learning_rate": 9.81295863928211e-07, + "loss": 0.6738, + "step": 60956 + }, + { + "epoch": 1.56, + "learning_rate": 9.812681983220827e-07, + "loss": 0.4839, + "step": 60957 + }, + { + "epoch": 1.56, + "learning_rate": 9.812405327302967e-07, + "loss": 0.709, + "step": 60958 + }, + { + "epoch": 1.56, + "learning_rate": 9.812128671528736e-07, + "loss": 0.7783, + "step": 60959 + }, + { + "epoch": 1.56, + "learning_rate": 9.811852015898352e-07, + "loss": 0.519, + "step": 60960 + }, + { + "epoch": 1.56, + "learning_rate": 9.811575360412024e-07, + "loss": 0.8018, + "step": 60961 + }, + { + "epoch": 1.56, + "learning_rate": 9.811298705069964e-07, + "loss": 0.7393, + "step": 60962 + }, + { + "epoch": 1.56, + "learning_rate": 9.811022049872389e-07, + "loss": 0.5239, + "step": 60963 + }, + { + "epoch": 1.56, + "learning_rate": 9.8107453948195e-07, + "loss": 0.7334, + "step": 60964 + }, + { + "epoch": 1.56, + "learning_rate": 9.810468739911515e-07, + "loss": 0.4501, + "step": 60965 + }, + { + "epoch": 1.56, + "learning_rate": 9.810192085148645e-07, + "loss": 0.6562, + "step": 60966 + }, + { + "epoch": 1.56, + "learning_rate": 9.809915430531102e-07, + "loss": 0.6348, + "step": 60967 + }, + { + "epoch": 1.56, + "learning_rate": 9.809638776059101e-07, + "loss": 0.6357, + "step": 60968 + }, + { + "epoch": 1.56, + "learning_rate": 9.809362121732848e-07, + "loss": 0.3662, + "step": 60969 + }, + { + "epoch": 1.56, + "learning_rate": 9.80908546755256e-07, + "loss": 0.6577, + "step": 60970 + }, + { + "epoch": 1.56, + "learning_rate": 9.808808813518441e-07, + "loss": 0.4836, + "step": 60971 + }, + { + "epoch": 1.56, + "learning_rate": 9.808532159630714e-07, + "loss": 0.5376, + "step": 60972 + }, + { + "epoch": 1.56, + "learning_rate": 9.808255505889587e-07, + "loss": 0.6257, + "step": 60973 + }, + { + "epoch": 1.56, + "learning_rate": 9.807978852295265e-07, + "loss": 0.6123, + "step": 60974 + }, + { + "epoch": 1.56, + "learning_rate": 9.807702198847967e-07, + "loss": 0.4752, + "step": 60975 + }, + { + "epoch": 1.56, + "learning_rate": 9.8074255455479e-07, + "loss": 0.5537, + "step": 60976 + }, + { + "epoch": 1.56, + "learning_rate": 9.80714889239528e-07, + "loss": 0.623, + "step": 60977 + }, + { + "epoch": 1.56, + "learning_rate": 9.806872239390316e-07, + "loss": 0.5981, + "step": 60978 + }, + { + "epoch": 1.56, + "learning_rate": 9.806595586533225e-07, + "loss": 0.572, + "step": 60979 + }, + { + "epoch": 1.56, + "learning_rate": 9.80631893382421e-07, + "loss": 0.6846, + "step": 60980 + }, + { + "epoch": 1.56, + "learning_rate": 9.80604228126349e-07, + "loss": 0.5056, + "step": 60981 + }, + { + "epoch": 1.56, + "learning_rate": 9.805765628851273e-07, + "loss": 0.6396, + "step": 60982 + }, + { + "epoch": 1.56, + "learning_rate": 9.80548897658778e-07, + "loss": 0.376, + "step": 60983 + }, + { + "epoch": 1.56, + "learning_rate": 9.805212324473208e-07, + "loss": 0.5879, + "step": 60984 + }, + { + "epoch": 1.56, + "learning_rate": 9.804935672507777e-07, + "loss": 0.5342, + "step": 60985 + }, + { + "epoch": 1.56, + "learning_rate": 9.804659020691695e-07, + "loss": 0.6406, + "step": 60986 + }, + { + "epoch": 1.56, + "learning_rate": 9.804382369025182e-07, + "loss": 0.6035, + "step": 60987 + }, + { + "epoch": 1.56, + "learning_rate": 9.80410571750844e-07, + "loss": 0.6343, + "step": 60988 + }, + { + "epoch": 1.56, + "learning_rate": 9.803829066141688e-07, + "loss": 0.5669, + "step": 60989 + }, + { + "epoch": 1.56, + "learning_rate": 9.803552414925132e-07, + "loss": 0.666, + "step": 60990 + }, + { + "epoch": 1.56, + "learning_rate": 9.80327576385899e-07, + "loss": 0.5042, + "step": 60991 + }, + { + "epoch": 1.56, + "learning_rate": 9.802999112943467e-07, + "loss": 0.624, + "step": 60992 + }, + { + "epoch": 1.56, + "learning_rate": 9.802722462178785e-07, + "loss": 0.6748, + "step": 60993 + }, + { + "epoch": 1.56, + "learning_rate": 9.802445811565147e-07, + "loss": 0.675, + "step": 60994 + }, + { + "epoch": 1.56, + "learning_rate": 9.802169161102764e-07, + "loss": 0.6743, + "step": 60995 + }, + { + "epoch": 1.56, + "learning_rate": 9.801892510791853e-07, + "loss": 0.7734, + "step": 60996 + }, + { + "epoch": 1.56, + "learning_rate": 9.80161586063262e-07, + "loss": 0.7871, + "step": 60997 + }, + { + "epoch": 1.56, + "learning_rate": 9.801339210625287e-07, + "loss": 0.7598, + "step": 60998 + }, + { + "epoch": 1.56, + "learning_rate": 9.801062560770054e-07, + "loss": 0.668, + "step": 60999 + }, + { + "epoch": 1.56, + "learning_rate": 9.800785911067142e-07, + "loss": 0.6389, + "step": 61000 + }, + { + "epoch": 1.56, + "learning_rate": 9.800509261516757e-07, + "loss": 0.7178, + "step": 61001 + }, + { + "epoch": 1.56, + "learning_rate": 9.800232612119113e-07, + "loss": 0.4868, + "step": 61002 + }, + { + "epoch": 1.56, + "learning_rate": 9.799955962874426e-07, + "loss": 0.5591, + "step": 61003 + }, + { + "epoch": 1.56, + "learning_rate": 9.7996793137829e-07, + "loss": 0.4751, + "step": 61004 + }, + { + "epoch": 1.56, + "learning_rate": 9.79940266484475e-07, + "loss": 0.4846, + "step": 61005 + }, + { + "epoch": 1.56, + "learning_rate": 9.799126016060188e-07, + "loss": 0.5884, + "step": 61006 + }, + { + "epoch": 1.56, + "learning_rate": 9.798849367429427e-07, + "loss": 0.6509, + "step": 61007 + }, + { + "epoch": 1.56, + "learning_rate": 9.798572718952677e-07, + "loss": 0.6855, + "step": 61008 + }, + { + "epoch": 1.56, + "learning_rate": 9.798296070630149e-07, + "loss": 0.7063, + "step": 61009 + }, + { + "epoch": 1.56, + "learning_rate": 9.798019422462058e-07, + "loss": 0.6851, + "step": 61010 + }, + { + "epoch": 1.56, + "learning_rate": 9.797742774448614e-07, + "loss": 0.7529, + "step": 61011 + }, + { + "epoch": 1.56, + "learning_rate": 9.797466126590029e-07, + "loss": 0.4448, + "step": 61012 + }, + { + "epoch": 1.56, + "learning_rate": 9.79718947888652e-07, + "loss": 0.5659, + "step": 61013 + }, + { + "epoch": 1.56, + "learning_rate": 9.796912831338286e-07, + "loss": 0.6465, + "step": 61014 + }, + { + "epoch": 1.56, + "learning_rate": 9.796636183945552e-07, + "loss": 0.5288, + "step": 61015 + }, + { + "epoch": 1.56, + "learning_rate": 9.79635953670852e-07, + "loss": 0.5364, + "step": 61016 + }, + { + "epoch": 1.56, + "learning_rate": 9.79608288962741e-07, + "loss": 0.7461, + "step": 61017 + }, + { + "epoch": 1.56, + "learning_rate": 9.795806242702424e-07, + "loss": 0.7017, + "step": 61018 + }, + { + "epoch": 1.56, + "learning_rate": 9.795529595933786e-07, + "loss": 0.5864, + "step": 61019 + }, + { + "epoch": 1.56, + "learning_rate": 9.795252949321699e-07, + "loss": 0.5273, + "step": 61020 + }, + { + "epoch": 1.56, + "learning_rate": 9.794976302866376e-07, + "loss": 0.625, + "step": 61021 + }, + { + "epoch": 1.56, + "learning_rate": 9.794699656568032e-07, + "loss": 0.7383, + "step": 61022 + }, + { + "epoch": 1.56, + "learning_rate": 9.79442301042688e-07, + "loss": 0.708, + "step": 61023 + }, + { + "epoch": 1.56, + "learning_rate": 9.794146364443124e-07, + "loss": 0.7085, + "step": 61024 + }, + { + "epoch": 1.56, + "learning_rate": 9.793869718616984e-07, + "loss": 0.7451, + "step": 61025 + }, + { + "epoch": 1.56, + "learning_rate": 9.793593072948665e-07, + "loss": 0.6572, + "step": 61026 + }, + { + "epoch": 1.56, + "learning_rate": 9.793316427438386e-07, + "loss": 0.6572, + "step": 61027 + }, + { + "epoch": 1.56, + "learning_rate": 9.793039782086351e-07, + "loss": 0.4731, + "step": 61028 + }, + { + "epoch": 1.56, + "learning_rate": 9.792763136892782e-07, + "loss": 0.5835, + "step": 61029 + }, + { + "epoch": 1.56, + "learning_rate": 9.792486491857878e-07, + "loss": 0.7178, + "step": 61030 + }, + { + "epoch": 1.56, + "learning_rate": 9.792209846981861e-07, + "loss": 0.6665, + "step": 61031 + }, + { + "epoch": 1.56, + "learning_rate": 9.791933202264939e-07, + "loss": 0.5322, + "step": 61032 + }, + { + "epoch": 1.56, + "learning_rate": 9.791656557707326e-07, + "loss": 0.7832, + "step": 61033 + }, + { + "epoch": 1.56, + "learning_rate": 9.791379913309232e-07, + "loss": 0.6182, + "step": 61034 + }, + { + "epoch": 1.56, + "learning_rate": 9.791103269070864e-07, + "loss": 0.7373, + "step": 61035 + }, + { + "epoch": 1.56, + "learning_rate": 9.790826624992443e-07, + "loss": 0.7178, + "step": 61036 + }, + { + "epoch": 1.56, + "learning_rate": 9.790549981074176e-07, + "loss": 0.7422, + "step": 61037 + }, + { + "epoch": 1.56, + "learning_rate": 9.790273337316273e-07, + "loss": 0.5347, + "step": 61038 + }, + { + "epoch": 1.56, + "learning_rate": 9.78999669371895e-07, + "loss": 0.9043, + "step": 61039 + }, + { + "epoch": 1.56, + "learning_rate": 9.789720050282414e-07, + "loss": 0.6631, + "step": 61040 + }, + { + "epoch": 1.56, + "learning_rate": 9.789443407006883e-07, + "loss": 0.7734, + "step": 61041 + }, + { + "epoch": 1.56, + "learning_rate": 9.789166763892563e-07, + "loss": 0.7373, + "step": 61042 + }, + { + "epoch": 1.56, + "learning_rate": 9.788890120939673e-07, + "loss": 0.5139, + "step": 61043 + }, + { + "epoch": 1.56, + "learning_rate": 9.788613478148416e-07, + "loss": 0.709, + "step": 61044 + }, + { + "epoch": 1.56, + "learning_rate": 9.788336835519008e-07, + "loss": 0.7236, + "step": 61045 + }, + { + "epoch": 1.56, + "learning_rate": 9.788060193051663e-07, + "loss": 0.4851, + "step": 61046 + }, + { + "epoch": 1.56, + "learning_rate": 9.787783550746587e-07, + "loss": 0.6436, + "step": 61047 + }, + { + "epoch": 1.56, + "learning_rate": 9.787506908603999e-07, + "loss": 0.5546, + "step": 61048 + }, + { + "epoch": 1.56, + "learning_rate": 9.787230266624104e-07, + "loss": 0.6592, + "step": 61049 + }, + { + "epoch": 1.56, + "learning_rate": 9.78695362480712e-07, + "loss": 0.5291, + "step": 61050 + }, + { + "epoch": 1.56, + "learning_rate": 9.786676983153251e-07, + "loss": 0.3342, + "step": 61051 + }, + { + "epoch": 1.56, + "learning_rate": 9.78640034166272e-07, + "loss": 0.6543, + "step": 61052 + }, + { + "epoch": 1.56, + "learning_rate": 9.78612370033573e-07, + "loss": 0.667, + "step": 61053 + }, + { + "epoch": 1.56, + "learning_rate": 9.785847059172496e-07, + "loss": 0.752, + "step": 61054 + }, + { + "epoch": 1.56, + "learning_rate": 9.785570418173226e-07, + "loss": 0.6006, + "step": 61055 + }, + { + "epoch": 1.56, + "learning_rate": 9.785293777338138e-07, + "loss": 0.6289, + "step": 61056 + }, + { + "epoch": 1.56, + "learning_rate": 9.785017136667439e-07, + "loss": 0.6416, + "step": 61057 + }, + { + "epoch": 1.56, + "learning_rate": 9.784740496161343e-07, + "loss": 0.6387, + "step": 61058 + }, + { + "epoch": 1.56, + "learning_rate": 9.78446385582006e-07, + "loss": 0.6836, + "step": 61059 + }, + { + "epoch": 1.56, + "learning_rate": 9.784187215643804e-07, + "loss": 0.6641, + "step": 61060 + }, + { + "epoch": 1.57, + "learning_rate": 9.783910575632785e-07, + "loss": 0.5264, + "step": 61061 + }, + { + "epoch": 1.57, + "learning_rate": 9.783633935787218e-07, + "loss": 0.5344, + "step": 61062 + }, + { + "epoch": 1.57, + "learning_rate": 9.783357296107314e-07, + "loss": 0.6777, + "step": 61063 + }, + { + "epoch": 1.57, + "learning_rate": 9.78308065659328e-07, + "loss": 0.8232, + "step": 61064 + }, + { + "epoch": 1.57, + "learning_rate": 9.782804017245333e-07, + "loss": 0.6436, + "step": 61065 + }, + { + "epoch": 1.57, + "learning_rate": 9.782527378063682e-07, + "loss": 0.6348, + "step": 61066 + }, + { + "epoch": 1.57, + "learning_rate": 9.78225073904854e-07, + "loss": 0.6187, + "step": 61067 + }, + { + "epoch": 1.57, + "learning_rate": 9.781974100200115e-07, + "loss": 0.6494, + "step": 61068 + }, + { + "epoch": 1.57, + "learning_rate": 9.781697461518628e-07, + "loss": 0.5181, + "step": 61069 + }, + { + "epoch": 1.57, + "learning_rate": 9.78142082300428e-07, + "loss": 0.6221, + "step": 61070 + }, + { + "epoch": 1.57, + "learning_rate": 9.781144184657292e-07, + "loss": 0.5933, + "step": 61071 + }, + { + "epoch": 1.57, + "learning_rate": 9.78086754647787e-07, + "loss": 0.8154, + "step": 61072 + }, + { + "epoch": 1.57, + "learning_rate": 9.780590908466235e-07, + "loss": 0.6748, + "step": 61073 + }, + { + "epoch": 1.57, + "learning_rate": 9.780314270622584e-07, + "loss": 0.7158, + "step": 61074 + }, + { + "epoch": 1.57, + "learning_rate": 9.780037632947137e-07, + "loss": 0.5032, + "step": 61075 + }, + { + "epoch": 1.57, + "learning_rate": 9.779760995440103e-07, + "loss": 0.7285, + "step": 61076 + }, + { + "epoch": 1.57, + "learning_rate": 9.7794843581017e-07, + "loss": 0.5964, + "step": 61077 + }, + { + "epoch": 1.57, + "learning_rate": 9.779207720932132e-07, + "loss": 0.5481, + "step": 61078 + }, + { + "epoch": 1.57, + "learning_rate": 9.778931083931615e-07, + "loss": 0.6431, + "step": 61079 + }, + { + "epoch": 1.57, + "learning_rate": 9.778654447100362e-07, + "loss": 0.5439, + "step": 61080 + }, + { + "epoch": 1.57, + "learning_rate": 9.778377810438582e-07, + "loss": 0.5151, + "step": 61081 + }, + { + "epoch": 1.57, + "learning_rate": 9.77810117394649e-07, + "loss": 0.5405, + "step": 61082 + }, + { + "epoch": 1.57, + "learning_rate": 9.777824537624296e-07, + "loss": 0.7686, + "step": 61083 + }, + { + "epoch": 1.57, + "learning_rate": 9.77754790147221e-07, + "loss": 0.6885, + "step": 61084 + }, + { + "epoch": 1.57, + "learning_rate": 9.777271265490443e-07, + "loss": 0.6611, + "step": 61085 + }, + { + "epoch": 1.57, + "learning_rate": 9.776994629679214e-07, + "loss": 0.498, + "step": 61086 + }, + { + "epoch": 1.57, + "learning_rate": 9.776717994038726e-07, + "loss": 0.4708, + "step": 61087 + }, + { + "epoch": 1.57, + "learning_rate": 9.776441358569196e-07, + "loss": 0.5017, + "step": 61088 + }, + { + "epoch": 1.57, + "learning_rate": 9.776164723270833e-07, + "loss": 0.582, + "step": 61089 + }, + { + "epoch": 1.57, + "learning_rate": 9.775888088143854e-07, + "loss": 0.5513, + "step": 61090 + }, + { + "epoch": 1.57, + "learning_rate": 9.775611453188464e-07, + "loss": 0.5508, + "step": 61091 + }, + { + "epoch": 1.57, + "learning_rate": 9.775334818404879e-07, + "loss": 0.7207, + "step": 61092 + }, + { + "epoch": 1.57, + "learning_rate": 9.775058183793313e-07, + "loss": 0.7578, + "step": 61093 + }, + { + "epoch": 1.57, + "learning_rate": 9.774781549353972e-07, + "loss": 0.6309, + "step": 61094 + }, + { + "epoch": 1.57, + "learning_rate": 9.774504915087069e-07, + "loss": 0.7803, + "step": 61095 + }, + { + "epoch": 1.57, + "learning_rate": 9.77422828099282e-07, + "loss": 0.5283, + "step": 61096 + }, + { + "epoch": 1.57, + "learning_rate": 9.77395164707143e-07, + "loss": 0.5811, + "step": 61097 + }, + { + "epoch": 1.57, + "learning_rate": 9.773675013323119e-07, + "loss": 0.8672, + "step": 61098 + }, + { + "epoch": 1.57, + "learning_rate": 9.77339837974809e-07, + "loss": 0.6992, + "step": 61099 + }, + { + "epoch": 1.57, + "learning_rate": 9.773121746346564e-07, + "loss": 0.7041, + "step": 61100 + }, + { + "epoch": 1.57, + "learning_rate": 9.772845113118745e-07, + "loss": 0.5869, + "step": 61101 + }, + { + "epoch": 1.57, + "learning_rate": 9.77256848006485e-07, + "loss": 0.7275, + "step": 61102 + }, + { + "epoch": 1.57, + "learning_rate": 9.772291847185092e-07, + "loss": 0.7285, + "step": 61103 + }, + { + "epoch": 1.57, + "learning_rate": 9.772015214479674e-07, + "loss": 0.6445, + "step": 61104 + }, + { + "epoch": 1.57, + "learning_rate": 9.771738581948817e-07, + "loss": 0.595, + "step": 61105 + }, + { + "epoch": 1.57, + "learning_rate": 9.771461949592726e-07, + "loss": 0.4692, + "step": 61106 + }, + { + "epoch": 1.57, + "learning_rate": 9.771185317411618e-07, + "loss": 0.7607, + "step": 61107 + }, + { + "epoch": 1.57, + "learning_rate": 9.770908685405701e-07, + "loss": 0.6152, + "step": 61108 + }, + { + "epoch": 1.57, + "learning_rate": 9.770632053575192e-07, + "loss": 0.543, + "step": 61109 + }, + { + "epoch": 1.57, + "learning_rate": 9.770355421920299e-07, + "loss": 0.4549, + "step": 61110 + }, + { + "epoch": 1.57, + "learning_rate": 9.770078790441232e-07, + "loss": 0.6572, + "step": 61111 + }, + { + "epoch": 1.57, + "learning_rate": 9.769802159138207e-07, + "loss": 0.6265, + "step": 61112 + }, + { + "epoch": 1.57, + "learning_rate": 9.769525528011436e-07, + "loss": 0.7202, + "step": 61113 + }, + { + "epoch": 1.57, + "learning_rate": 9.769248897061124e-07, + "loss": 0.687, + "step": 61114 + }, + { + "epoch": 1.57, + "learning_rate": 9.76897226628749e-07, + "loss": 0.7354, + "step": 61115 + }, + { + "epoch": 1.57, + "learning_rate": 9.768695635690742e-07, + "loss": 0.5244, + "step": 61116 + }, + { + "epoch": 1.57, + "learning_rate": 9.768419005271095e-07, + "loss": 0.6982, + "step": 61117 + }, + { + "epoch": 1.57, + "learning_rate": 9.768142375028756e-07, + "loss": 0.6953, + "step": 61118 + }, + { + "epoch": 1.57, + "learning_rate": 9.767865744963942e-07, + "loss": 0.6489, + "step": 61119 + }, + { + "epoch": 1.57, + "learning_rate": 9.767589115076862e-07, + "loss": 0.5972, + "step": 61120 + }, + { + "epoch": 1.57, + "learning_rate": 9.767312485367728e-07, + "loss": 0.5928, + "step": 61121 + }, + { + "epoch": 1.57, + "learning_rate": 9.767035855836752e-07, + "loss": 0.5491, + "step": 61122 + }, + { + "epoch": 1.57, + "learning_rate": 9.766759226484147e-07, + "loss": 0.729, + "step": 61123 + }, + { + "epoch": 1.57, + "learning_rate": 9.766482597310124e-07, + "loss": 0.4917, + "step": 61124 + }, + { + "epoch": 1.57, + "learning_rate": 9.766205968314893e-07, + "loss": 0.5488, + "step": 61125 + }, + { + "epoch": 1.57, + "learning_rate": 9.76592933949867e-07, + "loss": 0.6235, + "step": 61126 + }, + { + "epoch": 1.57, + "learning_rate": 9.765652710861663e-07, + "loss": 0.625, + "step": 61127 + }, + { + "epoch": 1.57, + "learning_rate": 9.765376082404082e-07, + "loss": 0.5513, + "step": 61128 + }, + { + "epoch": 1.57, + "learning_rate": 9.765099454126144e-07, + "loss": 0.5452, + "step": 61129 + }, + { + "epoch": 1.57, + "learning_rate": 9.764822826028058e-07, + "loss": 0.6479, + "step": 61130 + }, + { + "epoch": 1.57, + "learning_rate": 9.764546198110037e-07, + "loss": 0.5557, + "step": 61131 + }, + { + "epoch": 1.57, + "learning_rate": 9.764269570372292e-07, + "loss": 0.7354, + "step": 61132 + }, + { + "epoch": 1.57, + "learning_rate": 9.763992942815036e-07, + "loss": 0.5225, + "step": 61133 + }, + { + "epoch": 1.57, + "learning_rate": 9.76371631543848e-07, + "loss": 0.6885, + "step": 61134 + }, + { + "epoch": 1.57, + "learning_rate": 9.763439688242832e-07, + "loss": 0.5327, + "step": 61135 + }, + { + "epoch": 1.57, + "learning_rate": 9.763163061228311e-07, + "loss": 0.6816, + "step": 61136 + }, + { + "epoch": 1.57, + "learning_rate": 9.762886434395121e-07, + "loss": 0.5806, + "step": 61137 + }, + { + "epoch": 1.57, + "learning_rate": 9.762609807743482e-07, + "loss": 0.7373, + "step": 61138 + }, + { + "epoch": 1.57, + "learning_rate": 9.762333181273599e-07, + "loss": 0.6548, + "step": 61139 + }, + { + "epoch": 1.57, + "learning_rate": 9.762056554985688e-07, + "loss": 0.6309, + "step": 61140 + }, + { + "epoch": 1.57, + "learning_rate": 9.76177992887996e-07, + "loss": 0.563, + "step": 61141 + }, + { + "epoch": 1.57, + "learning_rate": 9.761503302956625e-07, + "loss": 0.5972, + "step": 61142 + }, + { + "epoch": 1.57, + "learning_rate": 9.7612266772159e-07, + "loss": 0.5762, + "step": 61143 + }, + { + "epoch": 1.57, + "learning_rate": 9.76095005165799e-07, + "loss": 0.6587, + "step": 61144 + }, + { + "epoch": 1.57, + "learning_rate": 9.760673426283108e-07, + "loss": 0.4727, + "step": 61145 + }, + { + "epoch": 1.57, + "learning_rate": 9.760396801091468e-07, + "loss": 0.8438, + "step": 61146 + }, + { + "epoch": 1.57, + "learning_rate": 9.76012017608328e-07, + "loss": 0.6328, + "step": 61147 + }, + { + "epoch": 1.57, + "learning_rate": 9.759843551258758e-07, + "loss": 0.478, + "step": 61148 + }, + { + "epoch": 1.57, + "learning_rate": 9.759566926618113e-07, + "loss": 0.624, + "step": 61149 + }, + { + "epoch": 1.57, + "learning_rate": 9.759290302161557e-07, + "loss": 0.6934, + "step": 61150 + }, + { + "epoch": 1.57, + "learning_rate": 9.7590136778893e-07, + "loss": 0.7373, + "step": 61151 + }, + { + "epoch": 1.57, + "learning_rate": 9.758737053801556e-07, + "loss": 0.5991, + "step": 61152 + }, + { + "epoch": 1.57, + "learning_rate": 9.75846042989854e-07, + "loss": 0.6699, + "step": 61153 + }, + { + "epoch": 1.57, + "learning_rate": 9.758183806180454e-07, + "loss": 0.6343, + "step": 61154 + }, + { + "epoch": 1.57, + "learning_rate": 9.757907182647516e-07, + "loss": 0.6455, + "step": 61155 + }, + { + "epoch": 1.57, + "learning_rate": 9.757630559299936e-07, + "loss": 0.7007, + "step": 61156 + }, + { + "epoch": 1.57, + "learning_rate": 9.75735393613793e-07, + "loss": 0.6865, + "step": 61157 + }, + { + "epoch": 1.57, + "learning_rate": 9.757077313161707e-07, + "loss": 0.6003, + "step": 61158 + }, + { + "epoch": 1.57, + "learning_rate": 9.75680069037148e-07, + "loss": 0.6299, + "step": 61159 + }, + { + "epoch": 1.57, + "learning_rate": 9.756524067767457e-07, + "loss": 0.6992, + "step": 61160 + }, + { + "epoch": 1.57, + "learning_rate": 9.756247445349854e-07, + "loss": 0.6143, + "step": 61161 + }, + { + "epoch": 1.57, + "learning_rate": 9.755970823118877e-07, + "loss": 0.6025, + "step": 61162 + }, + { + "epoch": 1.57, + "learning_rate": 9.755694201074752e-07, + "loss": 0.5796, + "step": 61163 + }, + { + "epoch": 1.57, + "learning_rate": 9.755417579217673e-07, + "loss": 0.6943, + "step": 61164 + }, + { + "epoch": 1.57, + "learning_rate": 9.75514095754786e-07, + "loss": 0.8027, + "step": 61165 + }, + { + "epoch": 1.57, + "learning_rate": 9.754864336065523e-07, + "loss": 0.707, + "step": 61166 + }, + { + "epoch": 1.57, + "learning_rate": 9.754587714770878e-07, + "loss": 0.5803, + "step": 61167 + }, + { + "epoch": 1.57, + "learning_rate": 9.754311093664132e-07, + "loss": 0.5264, + "step": 61168 + }, + { + "epoch": 1.57, + "learning_rate": 9.7540344727455e-07, + "loss": 0.6128, + "step": 61169 + }, + { + "epoch": 1.57, + "learning_rate": 9.75375785201519e-07, + "loss": 0.4795, + "step": 61170 + }, + { + "epoch": 1.57, + "learning_rate": 9.75348123147342e-07, + "loss": 0.6289, + "step": 61171 + }, + { + "epoch": 1.57, + "learning_rate": 9.7532046111204e-07, + "loss": 0.7197, + "step": 61172 + }, + { + "epoch": 1.57, + "learning_rate": 9.752927990956332e-07, + "loss": 0.6367, + "step": 61173 + }, + { + "epoch": 1.57, + "learning_rate": 9.75265137098144e-07, + "loss": 0.6484, + "step": 61174 + }, + { + "epoch": 1.57, + "learning_rate": 9.75237475119593e-07, + "loss": 0.481, + "step": 61175 + }, + { + "epoch": 1.57, + "learning_rate": 9.75209813160002e-07, + "loss": 0.9219, + "step": 61176 + }, + { + "epoch": 1.57, + "learning_rate": 9.751821512193912e-07, + "loss": 0.6172, + "step": 61177 + }, + { + "epoch": 1.57, + "learning_rate": 9.751544892977825e-07, + "loss": 0.7021, + "step": 61178 + }, + { + "epoch": 1.57, + "learning_rate": 9.751268273951968e-07, + "loss": 0.499, + "step": 61179 + }, + { + "epoch": 1.57, + "learning_rate": 9.750991655116554e-07, + "loss": 0.6621, + "step": 61180 + }, + { + "epoch": 1.57, + "learning_rate": 9.750715036471792e-07, + "loss": 0.7007, + "step": 61181 + }, + { + "epoch": 1.57, + "learning_rate": 9.750438418017903e-07, + "loss": 0.7246, + "step": 61182 + }, + { + "epoch": 1.57, + "learning_rate": 9.750161799755085e-07, + "loss": 0.3639, + "step": 61183 + }, + { + "epoch": 1.57, + "learning_rate": 9.749885181683559e-07, + "loss": 0.6255, + "step": 61184 + }, + { + "epoch": 1.57, + "learning_rate": 9.749608563803532e-07, + "loss": 0.6025, + "step": 61185 + }, + { + "epoch": 1.57, + "learning_rate": 9.749331946115221e-07, + "loss": 0.8447, + "step": 61186 + }, + { + "epoch": 1.57, + "learning_rate": 9.749055328618835e-07, + "loss": 0.6929, + "step": 61187 + }, + { + "epoch": 1.57, + "learning_rate": 9.748778711314583e-07, + "loss": 0.4937, + "step": 61188 + }, + { + "epoch": 1.57, + "learning_rate": 9.74850209420268e-07, + "loss": 0.6328, + "step": 61189 + }, + { + "epoch": 1.57, + "learning_rate": 9.748225477283341e-07, + "loss": 0.5112, + "step": 61190 + }, + { + "epoch": 1.57, + "learning_rate": 9.74794886055677e-07, + "loss": 0.5508, + "step": 61191 + }, + { + "epoch": 1.57, + "learning_rate": 9.747672244023187e-07, + "loss": 0.6028, + "step": 61192 + }, + { + "epoch": 1.57, + "learning_rate": 9.7473956276828e-07, + "loss": 0.7549, + "step": 61193 + }, + { + "epoch": 1.57, + "learning_rate": 9.747119011535815e-07, + "loss": 0.7725, + "step": 61194 + }, + { + "epoch": 1.57, + "learning_rate": 9.746842395582454e-07, + "loss": 0.7485, + "step": 61195 + }, + { + "epoch": 1.57, + "learning_rate": 9.746565779822921e-07, + "loss": 0.5923, + "step": 61196 + }, + { + "epoch": 1.57, + "learning_rate": 9.746289164257433e-07, + "loss": 0.5752, + "step": 61197 + }, + { + "epoch": 1.57, + "learning_rate": 9.746012548886198e-07, + "loss": 0.8032, + "step": 61198 + }, + { + "epoch": 1.57, + "learning_rate": 9.745735933709432e-07, + "loss": 0.7559, + "step": 61199 + }, + { + "epoch": 1.57, + "learning_rate": 9.745459318727345e-07, + "loss": 0.6602, + "step": 61200 + }, + { + "epoch": 1.57, + "learning_rate": 9.745182703940145e-07, + "loss": 0.6562, + "step": 61201 + }, + { + "epoch": 1.57, + "learning_rate": 9.74490608934805e-07, + "loss": 0.7461, + "step": 61202 + }, + { + "epoch": 1.57, + "learning_rate": 9.744629474951269e-07, + "loss": 0.6406, + "step": 61203 + }, + { + "epoch": 1.57, + "learning_rate": 9.74435286075001e-07, + "loss": 0.7373, + "step": 61204 + }, + { + "epoch": 1.57, + "learning_rate": 9.74407624674449e-07, + "loss": 0.6152, + "step": 61205 + }, + { + "epoch": 1.57, + "learning_rate": 9.743799632934916e-07, + "loss": 0.6846, + "step": 61206 + }, + { + "epoch": 1.57, + "learning_rate": 9.743523019321507e-07, + "loss": 0.5527, + "step": 61207 + }, + { + "epoch": 1.57, + "learning_rate": 9.743246405904467e-07, + "loss": 0.531, + "step": 61208 + }, + { + "epoch": 1.57, + "learning_rate": 9.742969792684015e-07, + "loss": 0.6958, + "step": 61209 + }, + { + "epoch": 1.57, + "learning_rate": 9.742693179660357e-07, + "loss": 0.6729, + "step": 61210 + }, + { + "epoch": 1.57, + "learning_rate": 9.742416566833708e-07, + "loss": 0.5466, + "step": 61211 + }, + { + "epoch": 1.57, + "learning_rate": 9.742139954204282e-07, + "loss": 0.4937, + "step": 61212 + }, + { + "epoch": 1.57, + "learning_rate": 9.741863341772282e-07, + "loss": 0.7285, + "step": 61213 + }, + { + "epoch": 1.57, + "learning_rate": 9.74158672953793e-07, + "loss": 0.7842, + "step": 61214 + }, + { + "epoch": 1.57, + "learning_rate": 9.741310117501428e-07, + "loss": 0.7002, + "step": 61215 + }, + { + "epoch": 1.57, + "learning_rate": 9.741033505662995e-07, + "loss": 0.8623, + "step": 61216 + }, + { + "epoch": 1.57, + "learning_rate": 9.740756894022842e-07, + "loss": 0.7393, + "step": 61217 + }, + { + "epoch": 1.57, + "learning_rate": 9.74048028258118e-07, + "loss": 0.748, + "step": 61218 + }, + { + "epoch": 1.57, + "learning_rate": 9.740203671338219e-07, + "loss": 0.5308, + "step": 61219 + }, + { + "epoch": 1.57, + "learning_rate": 9.73992706029417e-07, + "loss": 0.751, + "step": 61220 + }, + { + "epoch": 1.57, + "learning_rate": 9.739650449449251e-07, + "loss": 0.7197, + "step": 61221 + }, + { + "epoch": 1.57, + "learning_rate": 9.73937383880367e-07, + "loss": 0.6367, + "step": 61222 + }, + { + "epoch": 1.57, + "learning_rate": 9.739097228357634e-07, + "loss": 0.7871, + "step": 61223 + }, + { + "epoch": 1.57, + "learning_rate": 9.738820618111363e-07, + "loss": 0.5142, + "step": 61224 + }, + { + "epoch": 1.57, + "learning_rate": 9.73854400806506e-07, + "loss": 0.4839, + "step": 61225 + }, + { + "epoch": 1.57, + "learning_rate": 9.738267398218947e-07, + "loss": 0.7192, + "step": 61226 + }, + { + "epoch": 1.57, + "learning_rate": 9.737990788573229e-07, + "loss": 0.7119, + "step": 61227 + }, + { + "epoch": 1.57, + "learning_rate": 9.737714179128121e-07, + "loss": 0.6826, + "step": 61228 + }, + { + "epoch": 1.57, + "learning_rate": 9.73743756988383e-07, + "loss": 0.6504, + "step": 61229 + }, + { + "epoch": 1.57, + "learning_rate": 9.737160960840573e-07, + "loss": 0.6621, + "step": 61230 + }, + { + "epoch": 1.57, + "learning_rate": 9.736884351998557e-07, + "loss": 0.4495, + "step": 61231 + }, + { + "epoch": 1.57, + "learning_rate": 9.736607743358004e-07, + "loss": 0.6963, + "step": 61232 + }, + { + "epoch": 1.57, + "learning_rate": 9.736331134919112e-07, + "loss": 0.6284, + "step": 61233 + }, + { + "epoch": 1.57, + "learning_rate": 9.7360545266821e-07, + "loss": 0.8301, + "step": 61234 + }, + { + "epoch": 1.57, + "learning_rate": 9.73577791864718e-07, + "loss": 0.6338, + "step": 61235 + }, + { + "epoch": 1.57, + "learning_rate": 9.735501310814563e-07, + "loss": 0.5437, + "step": 61236 + }, + { + "epoch": 1.57, + "learning_rate": 9.73522470318446e-07, + "loss": 0.7275, + "step": 61237 + }, + { + "epoch": 1.57, + "learning_rate": 9.734948095757082e-07, + "loss": 0.6233, + "step": 61238 + }, + { + "epoch": 1.57, + "learning_rate": 9.73467148853264e-07, + "loss": 0.5801, + "step": 61239 + }, + { + "epoch": 1.57, + "learning_rate": 9.734394881511352e-07, + "loss": 0.7861, + "step": 61240 + }, + { + "epoch": 1.57, + "learning_rate": 9.734118274693423e-07, + "loss": 0.5747, + "step": 61241 + }, + { + "epoch": 1.57, + "learning_rate": 9.73384166807907e-07, + "loss": 0.835, + "step": 61242 + }, + { + "epoch": 1.57, + "learning_rate": 9.733565061668503e-07, + "loss": 0.7695, + "step": 61243 + }, + { + "epoch": 1.57, + "learning_rate": 9.73328845546193e-07, + "loss": 0.5195, + "step": 61244 + }, + { + "epoch": 1.57, + "learning_rate": 9.733011849459568e-07, + "loss": 0.667, + "step": 61245 + }, + { + "epoch": 1.57, + "learning_rate": 9.732735243661623e-07, + "loss": 0.5278, + "step": 61246 + }, + { + "epoch": 1.57, + "learning_rate": 9.732458638068314e-07, + "loss": 0.7461, + "step": 61247 + }, + { + "epoch": 1.57, + "learning_rate": 9.732182032679846e-07, + "loss": 0.5159, + "step": 61248 + }, + { + "epoch": 1.57, + "learning_rate": 9.731905427496437e-07, + "loss": 0.5, + "step": 61249 + }, + { + "epoch": 1.57, + "learning_rate": 9.731628822518291e-07, + "loss": 0.6387, + "step": 61250 + }, + { + "epoch": 1.57, + "learning_rate": 9.73135221774563e-07, + "loss": 0.7695, + "step": 61251 + }, + { + "epoch": 1.57, + "learning_rate": 9.73107561317866e-07, + "loss": 0.6426, + "step": 61252 + }, + { + "epoch": 1.57, + "learning_rate": 9.730799008817592e-07, + "loss": 0.3396, + "step": 61253 + }, + { + "epoch": 1.57, + "learning_rate": 9.730522404662637e-07, + "loss": 0.6338, + "step": 61254 + }, + { + "epoch": 1.57, + "learning_rate": 9.73024580071401e-07, + "loss": 0.6045, + "step": 61255 + }, + { + "epoch": 1.57, + "learning_rate": 9.72996919697192e-07, + "loss": 0.7871, + "step": 61256 + }, + { + "epoch": 1.57, + "learning_rate": 9.72969259343658e-07, + "loss": 0.4629, + "step": 61257 + }, + { + "epoch": 1.57, + "learning_rate": 9.729415990108203e-07, + "loss": 0.6562, + "step": 61258 + }, + { + "epoch": 1.57, + "learning_rate": 9.729139386986999e-07, + "loss": 0.5967, + "step": 61259 + }, + { + "epoch": 1.57, + "learning_rate": 9.72886278407318e-07, + "loss": 0.6279, + "step": 61260 + }, + { + "epoch": 1.57, + "learning_rate": 9.72858618136696e-07, + "loss": 0.8145, + "step": 61261 + }, + { + "epoch": 1.57, + "learning_rate": 9.728309578868551e-07, + "loss": 0.6533, + "step": 61262 + }, + { + "epoch": 1.57, + "learning_rate": 9.72803297657816e-07, + "loss": 0.7471, + "step": 61263 + }, + { + "epoch": 1.57, + "learning_rate": 9.727756374496003e-07, + "loss": 0.5056, + "step": 61264 + }, + { + "epoch": 1.57, + "learning_rate": 9.727479772622288e-07, + "loss": 0.5708, + "step": 61265 + }, + { + "epoch": 1.57, + "learning_rate": 9.727203170957231e-07, + "loss": 0.6851, + "step": 61266 + }, + { + "epoch": 1.57, + "learning_rate": 9.72692656950104e-07, + "loss": 0.5996, + "step": 61267 + }, + { + "epoch": 1.57, + "learning_rate": 9.726649968253933e-07, + "loss": 0.5793, + "step": 61268 + }, + { + "epoch": 1.57, + "learning_rate": 9.726373367216112e-07, + "loss": 0.7139, + "step": 61269 + }, + { + "epoch": 1.57, + "learning_rate": 9.7260967663878e-07, + "loss": 0.668, + "step": 61270 + }, + { + "epoch": 1.57, + "learning_rate": 9.725820165769196e-07, + "loss": 0.6963, + "step": 61271 + }, + { + "epoch": 1.57, + "learning_rate": 9.72554356536053e-07, + "loss": 0.4697, + "step": 61272 + }, + { + "epoch": 1.57, + "learning_rate": 9.725266965161995e-07, + "loss": 0.6597, + "step": 61273 + }, + { + "epoch": 1.57, + "learning_rate": 9.724990365173812e-07, + "loss": 0.6875, + "step": 61274 + }, + { + "epoch": 1.57, + "learning_rate": 9.72471376539619e-07, + "loss": 0.5327, + "step": 61275 + }, + { + "epoch": 1.57, + "learning_rate": 9.724437165829344e-07, + "loss": 0.7529, + "step": 61276 + }, + { + "epoch": 1.57, + "learning_rate": 9.724160566473481e-07, + "loss": 0.5229, + "step": 61277 + }, + { + "epoch": 1.57, + "learning_rate": 9.723883967328818e-07, + "loss": 0.7334, + "step": 61278 + }, + { + "epoch": 1.57, + "learning_rate": 9.72360736839556e-07, + "loss": 0.5879, + "step": 61279 + }, + { + "epoch": 1.57, + "learning_rate": 9.723330769673928e-07, + "loss": 0.6602, + "step": 61280 + }, + { + "epoch": 1.57, + "learning_rate": 9.723054171164127e-07, + "loss": 0.5977, + "step": 61281 + }, + { + "epoch": 1.57, + "learning_rate": 9.722777572866373e-07, + "loss": 0.7861, + "step": 61282 + }, + { + "epoch": 1.57, + "learning_rate": 9.722500974780875e-07, + "loss": 0.6875, + "step": 61283 + }, + { + "epoch": 1.57, + "learning_rate": 9.722224376907843e-07, + "loss": 0.3678, + "step": 61284 + }, + { + "epoch": 1.57, + "learning_rate": 9.721947779247493e-07, + "loss": 0.6919, + "step": 61285 + }, + { + "epoch": 1.57, + "learning_rate": 9.721671181800031e-07, + "loss": 0.7148, + "step": 61286 + }, + { + "epoch": 1.57, + "learning_rate": 9.721394584565677e-07, + "loss": 0.5737, + "step": 61287 + }, + { + "epoch": 1.57, + "learning_rate": 9.721117987544635e-07, + "loss": 0.7188, + "step": 61288 + }, + { + "epoch": 1.57, + "learning_rate": 9.720841390737121e-07, + "loss": 0.5781, + "step": 61289 + }, + { + "epoch": 1.57, + "learning_rate": 9.720564794143348e-07, + "loss": 0.6826, + "step": 61290 + }, + { + "epoch": 1.57, + "learning_rate": 9.720288197763523e-07, + "loss": 0.5381, + "step": 61291 + }, + { + "epoch": 1.57, + "learning_rate": 9.720011601597866e-07, + "loss": 0.7666, + "step": 61292 + }, + { + "epoch": 1.57, + "learning_rate": 9.71973500564658e-07, + "loss": 0.7207, + "step": 61293 + }, + { + "epoch": 1.57, + "learning_rate": 9.719458409909877e-07, + "loss": 0.6191, + "step": 61294 + }, + { + "epoch": 1.57, + "learning_rate": 9.719181814387975e-07, + "loss": 0.6934, + "step": 61295 + }, + { + "epoch": 1.57, + "learning_rate": 9.71890521908108e-07, + "loss": 0.4392, + "step": 61296 + }, + { + "epoch": 1.57, + "learning_rate": 9.718628623989408e-07, + "loss": 0.7109, + "step": 61297 + }, + { + "epoch": 1.57, + "learning_rate": 9.718352029113168e-07, + "loss": 0.48, + "step": 61298 + }, + { + "epoch": 1.57, + "learning_rate": 9.718075434452574e-07, + "loss": 0.5203, + "step": 61299 + }, + { + "epoch": 1.57, + "learning_rate": 9.717798840007835e-07, + "loss": 0.8047, + "step": 61300 + }, + { + "epoch": 1.57, + "learning_rate": 9.717522245779167e-07, + "loss": 0.5278, + "step": 61301 + }, + { + "epoch": 1.57, + "learning_rate": 9.717245651766782e-07, + "loss": 0.6538, + "step": 61302 + }, + { + "epoch": 1.57, + "learning_rate": 9.716969057970883e-07, + "loss": 0.6343, + "step": 61303 + }, + { + "epoch": 1.57, + "learning_rate": 9.71669246439169e-07, + "loss": 0.5679, + "step": 61304 + }, + { + "epoch": 1.57, + "learning_rate": 9.71641587102941e-07, + "loss": 0.4775, + "step": 61305 + }, + { + "epoch": 1.57, + "learning_rate": 9.716139277884263e-07, + "loss": 0.7761, + "step": 61306 + }, + { + "epoch": 1.57, + "learning_rate": 9.715862684956452e-07, + "loss": 0.5243, + "step": 61307 + }, + { + "epoch": 1.57, + "learning_rate": 9.71558609224619e-07, + "loss": 0.8184, + "step": 61308 + }, + { + "epoch": 1.57, + "learning_rate": 9.715309499753695e-07, + "loss": 0.4261, + "step": 61309 + }, + { + "epoch": 1.57, + "learning_rate": 9.71503290747917e-07, + "loss": 0.5771, + "step": 61310 + }, + { + "epoch": 1.57, + "learning_rate": 9.714756315422834e-07, + "loss": 0.5815, + "step": 61311 + }, + { + "epoch": 1.57, + "learning_rate": 9.714479723584898e-07, + "loss": 0.7476, + "step": 61312 + }, + { + "epoch": 1.57, + "learning_rate": 9.714203131965568e-07, + "loss": 0.6558, + "step": 61313 + }, + { + "epoch": 1.57, + "learning_rate": 9.71392654056506e-07, + "loss": 0.6445, + "step": 61314 + }, + { + "epoch": 1.57, + "learning_rate": 9.713649949383583e-07, + "loss": 0.5718, + "step": 61315 + }, + { + "epoch": 1.57, + "learning_rate": 9.713373358421355e-07, + "loss": 0.6431, + "step": 61316 + }, + { + "epoch": 1.57, + "learning_rate": 9.71309676767858e-07, + "loss": 0.6919, + "step": 61317 + }, + { + "epoch": 1.57, + "learning_rate": 9.712820177155478e-07, + "loss": 0.5109, + "step": 61318 + }, + { + "epoch": 1.57, + "learning_rate": 9.712543586852252e-07, + "loss": 0.3787, + "step": 61319 + }, + { + "epoch": 1.57, + "learning_rate": 9.712266996769122e-07, + "loss": 0.668, + "step": 61320 + }, + { + "epoch": 1.57, + "learning_rate": 9.711990406906294e-07, + "loss": 0.4607, + "step": 61321 + }, + { + "epoch": 1.57, + "learning_rate": 9.711713817263985e-07, + "loss": 0.6758, + "step": 61322 + }, + { + "epoch": 1.57, + "learning_rate": 9.711437227842404e-07, + "loss": 0.9092, + "step": 61323 + }, + { + "epoch": 1.57, + "learning_rate": 9.711160638641759e-07, + "loss": 0.5404, + "step": 61324 + }, + { + "epoch": 1.57, + "learning_rate": 9.710884049662263e-07, + "loss": 0.5874, + "step": 61325 + }, + { + "epoch": 1.57, + "learning_rate": 9.710607460904132e-07, + "loss": 0.4418, + "step": 61326 + }, + { + "epoch": 1.57, + "learning_rate": 9.710330872367575e-07, + "loss": 0.6337, + "step": 61327 + }, + { + "epoch": 1.57, + "learning_rate": 9.710054284052806e-07, + "loss": 0.7334, + "step": 61328 + }, + { + "epoch": 1.57, + "learning_rate": 9.709777695960031e-07, + "loss": 0.8887, + "step": 61329 + }, + { + "epoch": 1.57, + "learning_rate": 9.70950110808947e-07, + "loss": 0.626, + "step": 61330 + }, + { + "epoch": 1.57, + "learning_rate": 9.709224520441328e-07, + "loss": 0.6738, + "step": 61331 + }, + { + "epoch": 1.57, + "learning_rate": 9.708947933015824e-07, + "loss": 0.6128, + "step": 61332 + }, + { + "epoch": 1.57, + "learning_rate": 9.708671345813163e-07, + "loss": 0.7705, + "step": 61333 + }, + { + "epoch": 1.57, + "learning_rate": 9.708394758833557e-07, + "loss": 0.5479, + "step": 61334 + }, + { + "epoch": 1.57, + "learning_rate": 9.70811817207722e-07, + "loss": 0.6245, + "step": 61335 + }, + { + "epoch": 1.57, + "learning_rate": 9.707841585544362e-07, + "loss": 0.6533, + "step": 61336 + }, + { + "epoch": 1.57, + "learning_rate": 9.7075649992352e-07, + "loss": 0.4175, + "step": 61337 + }, + { + "epoch": 1.57, + "learning_rate": 9.70728841314994e-07, + "loss": 0.7471, + "step": 61338 + }, + { + "epoch": 1.57, + "learning_rate": 9.707011827288796e-07, + "loss": 0.5356, + "step": 61339 + }, + { + "epoch": 1.57, + "learning_rate": 9.706735241651979e-07, + "loss": 0.5884, + "step": 61340 + }, + { + "epoch": 1.57, + "learning_rate": 9.706458656239701e-07, + "loss": 0.4736, + "step": 61341 + }, + { + "epoch": 1.57, + "learning_rate": 9.70618207105218e-07, + "loss": 0.6338, + "step": 61342 + }, + { + "epoch": 1.57, + "learning_rate": 9.70590548608962e-07, + "loss": 0.7061, + "step": 61343 + }, + { + "epoch": 1.57, + "learning_rate": 9.705628901352228e-07, + "loss": 0.7148, + "step": 61344 + }, + { + "epoch": 1.57, + "learning_rate": 9.705352316840228e-07, + "loss": 0.5459, + "step": 61345 + }, + { + "epoch": 1.57, + "learning_rate": 9.705075732553822e-07, + "loss": 0.687, + "step": 61346 + }, + { + "epoch": 1.57, + "learning_rate": 9.70479914849323e-07, + "loss": 0.7656, + "step": 61347 + }, + { + "epoch": 1.57, + "learning_rate": 9.704522564658657e-07, + "loss": 0.532, + "step": 61348 + }, + { + "epoch": 1.57, + "learning_rate": 9.704245981050318e-07, + "loss": 0.6973, + "step": 61349 + }, + { + "epoch": 1.57, + "learning_rate": 9.703969397668423e-07, + "loss": 0.7783, + "step": 61350 + }, + { + "epoch": 1.57, + "learning_rate": 9.703692814513188e-07, + "loss": 0.8232, + "step": 61351 + }, + { + "epoch": 1.57, + "learning_rate": 9.703416231584824e-07, + "loss": 0.6631, + "step": 61352 + }, + { + "epoch": 1.57, + "learning_rate": 9.703139648883536e-07, + "loss": 0.6689, + "step": 61353 + }, + { + "epoch": 1.57, + "learning_rate": 9.702863066409542e-07, + "loss": 0.6094, + "step": 61354 + }, + { + "epoch": 1.57, + "learning_rate": 9.70258648416305e-07, + "loss": 0.5381, + "step": 61355 + }, + { + "epoch": 1.57, + "learning_rate": 9.702309902144277e-07, + "loss": 0.626, + "step": 61356 + }, + { + "epoch": 1.57, + "learning_rate": 9.702033320353427e-07, + "loss": 0.6299, + "step": 61357 + }, + { + "epoch": 1.57, + "learning_rate": 9.70175673879072e-07, + "loss": 0.7236, + "step": 61358 + }, + { + "epoch": 1.57, + "learning_rate": 9.701480157456364e-07, + "loss": 0.7324, + "step": 61359 + }, + { + "epoch": 1.57, + "learning_rate": 9.701203576350571e-07, + "loss": 0.5066, + "step": 61360 + }, + { + "epoch": 1.57, + "learning_rate": 9.700926995473551e-07, + "loss": 0.5635, + "step": 61361 + }, + { + "epoch": 1.57, + "learning_rate": 9.700650414825523e-07, + "loss": 0.5811, + "step": 61362 + }, + { + "epoch": 1.57, + "learning_rate": 9.700373834406687e-07, + "loss": 0.6113, + "step": 61363 + }, + { + "epoch": 1.57, + "learning_rate": 9.700097254217265e-07, + "loss": 0.7056, + "step": 61364 + }, + { + "epoch": 1.57, + "learning_rate": 9.699820674257462e-07, + "loss": 0.6553, + "step": 61365 + }, + { + "epoch": 1.57, + "learning_rate": 9.699544094527492e-07, + "loss": 0.7065, + "step": 61366 + }, + { + "epoch": 1.57, + "learning_rate": 9.699267515027568e-07, + "loss": 0.6191, + "step": 61367 + }, + { + "epoch": 1.57, + "learning_rate": 9.698990935757901e-07, + "loss": 0.6338, + "step": 61368 + }, + { + "epoch": 1.57, + "learning_rate": 9.698714356718702e-07, + "loss": 0.7632, + "step": 61369 + }, + { + "epoch": 1.57, + "learning_rate": 9.698437777910185e-07, + "loss": 0.3727, + "step": 61370 + }, + { + "epoch": 1.57, + "learning_rate": 9.698161199332558e-07, + "loss": 0.4746, + "step": 61371 + }, + { + "epoch": 1.57, + "learning_rate": 9.69788462098604e-07, + "loss": 0.7109, + "step": 61372 + }, + { + "epoch": 1.57, + "learning_rate": 9.697608042870837e-07, + "loss": 0.5916, + "step": 61373 + }, + { + "epoch": 1.57, + "learning_rate": 9.697331464987158e-07, + "loss": 0.623, + "step": 61374 + }, + { + "epoch": 1.57, + "learning_rate": 9.69705488733522e-07, + "loss": 0.6772, + "step": 61375 + }, + { + "epoch": 1.57, + "learning_rate": 9.696778309915233e-07, + "loss": 0.4282, + "step": 61376 + }, + { + "epoch": 1.57, + "learning_rate": 9.69650173272741e-07, + "loss": 0.6616, + "step": 61377 + }, + { + "epoch": 1.57, + "learning_rate": 9.696225155771958e-07, + "loss": 0.7104, + "step": 61378 + }, + { + "epoch": 1.57, + "learning_rate": 9.695948579049097e-07, + "loss": 0.5989, + "step": 61379 + }, + { + "epoch": 1.57, + "learning_rate": 9.695672002559033e-07, + "loss": 0.707, + "step": 61380 + }, + { + "epoch": 1.57, + "learning_rate": 9.695395426301977e-07, + "loss": 0.6816, + "step": 61381 + }, + { + "epoch": 1.57, + "learning_rate": 9.695118850278147e-07, + "loss": 0.7188, + "step": 61382 + }, + { + "epoch": 1.57, + "learning_rate": 9.694842274487748e-07, + "loss": 0.645, + "step": 61383 + }, + { + "epoch": 1.57, + "learning_rate": 9.694565698930991e-07, + "loss": 0.6968, + "step": 61384 + }, + { + "epoch": 1.57, + "learning_rate": 9.694289123608096e-07, + "loss": 0.6338, + "step": 61385 + }, + { + "epoch": 1.57, + "learning_rate": 9.694012548519266e-07, + "loss": 0.4893, + "step": 61386 + }, + { + "epoch": 1.57, + "learning_rate": 9.693735973664718e-07, + "loss": 0.6978, + "step": 61387 + }, + { + "epoch": 1.57, + "learning_rate": 9.69345939904466e-07, + "loss": 0.5757, + "step": 61388 + }, + { + "epoch": 1.57, + "learning_rate": 9.69318282465931e-07, + "loss": 0.6553, + "step": 61389 + }, + { + "epoch": 1.57, + "learning_rate": 9.692906250508874e-07, + "loss": 0.6753, + "step": 61390 + }, + { + "epoch": 1.57, + "learning_rate": 9.692629676593565e-07, + "loss": 0.7529, + "step": 61391 + }, + { + "epoch": 1.57, + "learning_rate": 9.6923531029136e-07, + "loss": 0.689, + "step": 61392 + }, + { + "epoch": 1.57, + "learning_rate": 9.69207652946918e-07, + "loss": 0.6729, + "step": 61393 + }, + { + "epoch": 1.57, + "learning_rate": 9.691799956260528e-07, + "loss": 0.666, + "step": 61394 + }, + { + "epoch": 1.57, + "learning_rate": 9.691523383287844e-07, + "loss": 0.4927, + "step": 61395 + }, + { + "epoch": 1.57, + "learning_rate": 9.69124681055135e-07, + "loss": 0.6689, + "step": 61396 + }, + { + "epoch": 1.57, + "learning_rate": 9.690970238051256e-07, + "loss": 0.5488, + "step": 61397 + }, + { + "epoch": 1.57, + "learning_rate": 9.690693665787768e-07, + "loss": 0.5833, + "step": 61398 + }, + { + "epoch": 1.57, + "learning_rate": 9.690417093761105e-07, + "loss": 0.5627, + "step": 61399 + }, + { + "epoch": 1.57, + "learning_rate": 9.690140521971472e-07, + "loss": 0.6191, + "step": 61400 + }, + { + "epoch": 1.57, + "learning_rate": 9.689863950419087e-07, + "loss": 0.6641, + "step": 61401 + }, + { + "epoch": 1.57, + "learning_rate": 9.68958737910416e-07, + "loss": 0.7344, + "step": 61402 + }, + { + "epoch": 1.57, + "learning_rate": 9.6893108080269e-07, + "loss": 0.5315, + "step": 61403 + }, + { + "epoch": 1.57, + "learning_rate": 9.68903423718752e-07, + "loss": 0.7529, + "step": 61404 + }, + { + "epoch": 1.57, + "learning_rate": 9.68875766658623e-07, + "loss": 0.5244, + "step": 61405 + }, + { + "epoch": 1.57, + "learning_rate": 9.68848109622325e-07, + "loss": 0.6318, + "step": 61406 + }, + { + "epoch": 1.57, + "learning_rate": 9.68820452609878e-07, + "loss": 0.8496, + "step": 61407 + }, + { + "epoch": 1.57, + "learning_rate": 9.68792795621304e-07, + "loss": 0.6558, + "step": 61408 + }, + { + "epoch": 1.57, + "learning_rate": 9.687651386566237e-07, + "loss": 0.5947, + "step": 61409 + }, + { + "epoch": 1.57, + "learning_rate": 9.687374817158587e-07, + "loss": 0.4824, + "step": 61410 + }, + { + "epoch": 1.57, + "learning_rate": 9.687098247990297e-07, + "loss": 0.7266, + "step": 61411 + }, + { + "epoch": 1.57, + "learning_rate": 9.686821679061587e-07, + "loss": 0.5688, + "step": 61412 + }, + { + "epoch": 1.57, + "learning_rate": 9.68654511037266e-07, + "loss": 0.7139, + "step": 61413 + }, + { + "epoch": 1.57, + "learning_rate": 9.686268541923732e-07, + "loss": 0.7393, + "step": 61414 + }, + { + "epoch": 1.57, + "learning_rate": 9.685991973715011e-07, + "loss": 0.4573, + "step": 61415 + }, + { + "epoch": 1.57, + "learning_rate": 9.685715405746714e-07, + "loss": 0.8174, + "step": 61416 + }, + { + "epoch": 1.57, + "learning_rate": 9.68543883801905e-07, + "loss": 0.5273, + "step": 61417 + }, + { + "epoch": 1.57, + "learning_rate": 9.685162270532231e-07, + "loss": 0.5737, + "step": 61418 + }, + { + "epoch": 1.57, + "learning_rate": 9.684885703286466e-07, + "loss": 0.8008, + "step": 61419 + }, + { + "epoch": 1.57, + "learning_rate": 9.684609136281974e-07, + "loss": 0.7734, + "step": 61420 + }, + { + "epoch": 1.57, + "learning_rate": 9.684332569518959e-07, + "loss": 0.5747, + "step": 61421 + }, + { + "epoch": 1.57, + "learning_rate": 9.68405600299764e-07, + "loss": 0.7275, + "step": 61422 + }, + { + "epoch": 1.57, + "learning_rate": 9.683779436718223e-07, + "loss": 0.6953, + "step": 61423 + }, + { + "epoch": 1.57, + "learning_rate": 9.683502870680918e-07, + "loss": 0.6111, + "step": 61424 + }, + { + "epoch": 1.57, + "learning_rate": 9.683226304885945e-07, + "loss": 0.5342, + "step": 61425 + }, + { + "epoch": 1.57, + "learning_rate": 9.682949739333507e-07, + "loss": 0.6631, + "step": 61426 + }, + { + "epoch": 1.57, + "learning_rate": 9.682673174023822e-07, + "loss": 0.4697, + "step": 61427 + }, + { + "epoch": 1.57, + "learning_rate": 9.682396608957098e-07, + "loss": 0.5684, + "step": 61428 + }, + { + "epoch": 1.57, + "learning_rate": 9.68212004413355e-07, + "loss": 0.6826, + "step": 61429 + }, + { + "epoch": 1.57, + "learning_rate": 9.681843479553386e-07, + "loss": 0.3916, + "step": 61430 + }, + { + "epoch": 1.57, + "learning_rate": 9.681566915216823e-07, + "loss": 0.8154, + "step": 61431 + }, + { + "epoch": 1.57, + "learning_rate": 9.68129035112407e-07, + "loss": 0.6865, + "step": 61432 + }, + { + "epoch": 1.57, + "learning_rate": 9.681013787275338e-07, + "loss": 0.543, + "step": 61433 + }, + { + "epoch": 1.57, + "learning_rate": 9.680737223670836e-07, + "loss": 0.6641, + "step": 61434 + }, + { + "epoch": 1.57, + "learning_rate": 9.680460660310782e-07, + "loss": 0.6367, + "step": 61435 + }, + { + "epoch": 1.57, + "learning_rate": 9.68018409719538e-07, + "loss": 0.8086, + "step": 61436 + }, + { + "epoch": 1.57, + "learning_rate": 9.67990753432485e-07, + "loss": 0.5693, + "step": 61437 + }, + { + "epoch": 1.57, + "learning_rate": 9.679630971699397e-07, + "loss": 0.6348, + "step": 61438 + }, + { + "epoch": 1.57, + "learning_rate": 9.67935440931924e-07, + "loss": 0.7715, + "step": 61439 + }, + { + "epoch": 1.57, + "learning_rate": 9.679077847184582e-07, + "loss": 0.728, + "step": 61440 + }, + { + "epoch": 1.57, + "learning_rate": 9.678801285295644e-07, + "loss": 0.5024, + "step": 61441 + }, + { + "epoch": 1.57, + "learning_rate": 9.678524723652633e-07, + "loss": 0.8652, + "step": 61442 + }, + { + "epoch": 1.57, + "learning_rate": 9.67824816225576e-07, + "loss": 0.5698, + "step": 61443 + }, + { + "epoch": 1.57, + "learning_rate": 9.677971601105236e-07, + "loss": 0.6313, + "step": 61444 + }, + { + "epoch": 1.57, + "learning_rate": 9.677695040201272e-07, + "loss": 0.6001, + "step": 61445 + }, + { + "epoch": 1.57, + "learning_rate": 9.677418479544087e-07, + "loss": 0.688, + "step": 61446 + }, + { + "epoch": 1.57, + "learning_rate": 9.677141919133884e-07, + "loss": 0.6963, + "step": 61447 + }, + { + "epoch": 1.57, + "learning_rate": 9.676865358970882e-07, + "loss": 0.7524, + "step": 61448 + }, + { + "epoch": 1.57, + "learning_rate": 9.676588799055285e-07, + "loss": 0.6592, + "step": 61449 + }, + { + "epoch": 1.57, + "learning_rate": 9.676312239387314e-07, + "loss": 0.5669, + "step": 61450 + }, + { + "epoch": 1.58, + "learning_rate": 9.676035679967172e-07, + "loss": 0.626, + "step": 61451 + }, + { + "epoch": 1.58, + "learning_rate": 9.675759120795082e-07, + "loss": 0.532, + "step": 61452 + }, + { + "epoch": 1.58, + "learning_rate": 9.67548256187124e-07, + "loss": 0.5752, + "step": 61453 + }, + { + "epoch": 1.58, + "learning_rate": 9.675206003195868e-07, + "loss": 0.6494, + "step": 61454 + }, + { + "epoch": 1.58, + "learning_rate": 9.674929444769177e-07, + "loss": 0.6631, + "step": 61455 + }, + { + "epoch": 1.58, + "learning_rate": 9.674652886591377e-07, + "loss": 0.3945, + "step": 61456 + }, + { + "epoch": 1.58, + "learning_rate": 9.67437632866268e-07, + "loss": 0.6235, + "step": 61457 + }, + { + "epoch": 1.58, + "learning_rate": 9.674099770983299e-07, + "loss": 0.6758, + "step": 61458 + }, + { + "epoch": 1.58, + "learning_rate": 9.67382321355344e-07, + "loss": 0.6416, + "step": 61459 + }, + { + "epoch": 1.58, + "learning_rate": 9.673546656373326e-07, + "loss": 0.5869, + "step": 61460 + }, + { + "epoch": 1.58, + "learning_rate": 9.67327009944316e-07, + "loss": 0.606, + "step": 61461 + }, + { + "epoch": 1.58, + "learning_rate": 9.672993542763157e-07, + "loss": 0.7891, + "step": 61462 + }, + { + "epoch": 1.58, + "learning_rate": 9.672716986333529e-07, + "loss": 0.5386, + "step": 61463 + }, + { + "epoch": 1.58, + "learning_rate": 9.672440430154484e-07, + "loss": 0.6724, + "step": 61464 + }, + { + "epoch": 1.58, + "learning_rate": 9.672163874226238e-07, + "loss": 0.752, + "step": 61465 + }, + { + "epoch": 1.58, + "learning_rate": 9.671887318548997e-07, + "loss": 0.7051, + "step": 61466 + }, + { + "epoch": 1.58, + "learning_rate": 9.67161076312298e-07, + "loss": 0.6143, + "step": 61467 + }, + { + "epoch": 1.58, + "learning_rate": 9.671334207948395e-07, + "loss": 0.7905, + "step": 61468 + }, + { + "epoch": 1.58, + "learning_rate": 9.671057653025454e-07, + "loss": 0.5875, + "step": 61469 + }, + { + "epoch": 1.58, + "learning_rate": 9.670781098354372e-07, + "loss": 0.6733, + "step": 61470 + }, + { + "epoch": 1.58, + "learning_rate": 9.670504543935358e-07, + "loss": 0.5986, + "step": 61471 + }, + { + "epoch": 1.58, + "learning_rate": 9.670227989768618e-07, + "loss": 0.5327, + "step": 61472 + }, + { + "epoch": 1.58, + "learning_rate": 9.669951435854375e-07, + "loss": 0.6768, + "step": 61473 + }, + { + "epoch": 1.58, + "learning_rate": 9.669674882192829e-07, + "loss": 0.5241, + "step": 61474 + }, + { + "epoch": 1.58, + "learning_rate": 9.669398328784203e-07, + "loss": 0.6724, + "step": 61475 + }, + { + "epoch": 1.58, + "learning_rate": 9.6691217756287e-07, + "loss": 0.6289, + "step": 61476 + }, + { + "epoch": 1.58, + "learning_rate": 9.668845222726535e-07, + "loss": 0.7441, + "step": 61477 + }, + { + "epoch": 1.58, + "learning_rate": 9.668568670077922e-07, + "loss": 0.4766, + "step": 61478 + }, + { + "epoch": 1.58, + "learning_rate": 9.668292117683071e-07, + "loss": 0.8262, + "step": 61479 + }, + { + "epoch": 1.58, + "learning_rate": 9.66801556554219e-07, + "loss": 0.3895, + "step": 61480 + }, + { + "epoch": 1.58, + "learning_rate": 9.6677390136555e-07, + "loss": 0.748, + "step": 61481 + }, + { + "epoch": 1.58, + "learning_rate": 9.667462462023206e-07, + "loss": 0.606, + "step": 61482 + }, + { + "epoch": 1.58, + "learning_rate": 9.667185910645517e-07, + "loss": 0.5337, + "step": 61483 + }, + { + "epoch": 1.58, + "learning_rate": 9.666909359522652e-07, + "loss": 0.6504, + "step": 61484 + }, + { + "epoch": 1.58, + "learning_rate": 9.666632808654815e-07, + "loss": 0.6855, + "step": 61485 + }, + { + "epoch": 1.58, + "learning_rate": 9.666356258042226e-07, + "loss": 0.8535, + "step": 61486 + }, + { + "epoch": 1.58, + "learning_rate": 9.66607970768509e-07, + "loss": 0.4211, + "step": 61487 + }, + { + "epoch": 1.58, + "learning_rate": 9.665803157583622e-07, + "loss": 0.668, + "step": 61488 + }, + { + "epoch": 1.58, + "learning_rate": 9.665526607738033e-07, + "loss": 0.5232, + "step": 61489 + }, + { + "epoch": 1.58, + "learning_rate": 9.665250058148535e-07, + "loss": 0.5203, + "step": 61490 + }, + { + "epoch": 1.58, + "learning_rate": 9.664973508815342e-07, + "loss": 0.6318, + "step": 61491 + }, + { + "epoch": 1.58, + "learning_rate": 9.664696959738662e-07, + "loss": 0.6006, + "step": 61492 + }, + { + "epoch": 1.58, + "learning_rate": 9.664420410918706e-07, + "loss": 0.7705, + "step": 61493 + }, + { + "epoch": 1.58, + "learning_rate": 9.664143862355692e-07, + "loss": 0.623, + "step": 61494 + }, + { + "epoch": 1.58, + "learning_rate": 9.663867314049823e-07, + "loss": 0.519, + "step": 61495 + }, + { + "epoch": 1.58, + "learning_rate": 9.663590766001317e-07, + "loss": 0.6226, + "step": 61496 + }, + { + "epoch": 1.58, + "learning_rate": 9.663314218210383e-07, + "loss": 0.5669, + "step": 61497 + }, + { + "epoch": 1.58, + "learning_rate": 9.663037670677236e-07, + "loss": 0.7393, + "step": 61498 + }, + { + "epoch": 1.58, + "learning_rate": 9.662761123402084e-07, + "loss": 0.6797, + "step": 61499 + }, + { + "epoch": 1.58, + "learning_rate": 9.66248457638514e-07, + "loss": 0.792, + "step": 61500 + }, + { + "epoch": 1.58, + "learning_rate": 9.66220802962662e-07, + "loss": 0.5913, + "step": 61501 + }, + { + "epoch": 1.58, + "learning_rate": 9.66193148312673e-07, + "loss": 0.6099, + "step": 61502 + }, + { + "epoch": 1.58, + "learning_rate": 9.661654936885682e-07, + "loss": 0.6172, + "step": 61503 + }, + { + "epoch": 1.58, + "learning_rate": 9.66137839090369e-07, + "loss": 0.666, + "step": 61504 + }, + { + "epoch": 1.58, + "learning_rate": 9.661101845180964e-07, + "loss": 0.6431, + "step": 61505 + }, + { + "epoch": 1.58, + "learning_rate": 9.660825299717719e-07, + "loss": 0.7227, + "step": 61506 + }, + { + "epoch": 1.58, + "learning_rate": 9.66054875451416e-07, + "loss": 0.5049, + "step": 61507 + }, + { + "epoch": 1.58, + "learning_rate": 9.660272209570509e-07, + "loss": 0.6392, + "step": 61508 + }, + { + "epoch": 1.58, + "learning_rate": 9.659995664886966e-07, + "loss": 0.7334, + "step": 61509 + }, + { + "epoch": 1.58, + "learning_rate": 9.659719120463754e-07, + "loss": 0.6226, + "step": 61510 + }, + { + "epoch": 1.58, + "learning_rate": 9.659442576301079e-07, + "loss": 0.4514, + "step": 61511 + }, + { + "epoch": 1.58, + "learning_rate": 9.65916603239915e-07, + "loss": 0.3894, + "step": 61512 + }, + { + "epoch": 1.58, + "learning_rate": 9.658889488758184e-07, + "loss": 0.5908, + "step": 61513 + }, + { + "epoch": 1.58, + "learning_rate": 9.658612945378387e-07, + "loss": 0.583, + "step": 61514 + }, + { + "epoch": 1.58, + "learning_rate": 9.65833640225998e-07, + "loss": 0.5947, + "step": 61515 + }, + { + "epoch": 1.58, + "learning_rate": 9.658059859403164e-07, + "loss": 0.72, + "step": 61516 + }, + { + "epoch": 1.58, + "learning_rate": 9.657783316808159e-07, + "loss": 0.6455, + "step": 61517 + }, + { + "epoch": 1.58, + "learning_rate": 9.657506774475172e-07, + "loss": 0.6572, + "step": 61518 + }, + { + "epoch": 1.58, + "learning_rate": 9.657230232404418e-07, + "loss": 0.71, + "step": 61519 + }, + { + "epoch": 1.58, + "learning_rate": 9.656953690596103e-07, + "loss": 0.7461, + "step": 61520 + }, + { + "epoch": 1.58, + "learning_rate": 9.656677149050449e-07, + "loss": 0.7432, + "step": 61521 + }, + { + "epoch": 1.58, + "learning_rate": 9.65640060776766e-07, + "loss": 0.751, + "step": 61522 + }, + { + "epoch": 1.58, + "learning_rate": 9.656124066747947e-07, + "loss": 0.8052, + "step": 61523 + }, + { + "epoch": 1.58, + "learning_rate": 9.655847525991524e-07, + "loss": 0.6025, + "step": 61524 + }, + { + "epoch": 1.58, + "learning_rate": 9.655570985498605e-07, + "loss": 0.6826, + "step": 61525 + }, + { + "epoch": 1.58, + "learning_rate": 9.655294445269396e-07, + "loss": 0.8037, + "step": 61526 + }, + { + "epoch": 1.58, + "learning_rate": 9.655017905304114e-07, + "loss": 0.7534, + "step": 61527 + }, + { + "epoch": 1.58, + "learning_rate": 9.65474136560297e-07, + "loss": 0.5708, + "step": 61528 + }, + { + "epoch": 1.58, + "learning_rate": 9.654464826166173e-07, + "loss": 0.6426, + "step": 61529 + }, + { + "epoch": 1.58, + "learning_rate": 9.654188286993936e-07, + "loss": 0.5266, + "step": 61530 + }, + { + "epoch": 1.58, + "learning_rate": 9.653911748086476e-07, + "loss": 0.7598, + "step": 61531 + }, + { + "epoch": 1.58, + "learning_rate": 9.653635209443995e-07, + "loss": 0.4529, + "step": 61532 + }, + { + "epoch": 1.58, + "learning_rate": 9.65335867106671e-07, + "loss": 0.584, + "step": 61533 + }, + { + "epoch": 1.58, + "learning_rate": 9.653082132954833e-07, + "loss": 0.5776, + "step": 61534 + }, + { + "epoch": 1.58, + "learning_rate": 9.652805595108574e-07, + "loss": 0.5928, + "step": 61535 + }, + { + "epoch": 1.58, + "learning_rate": 9.652529057528148e-07, + "loss": 0.6641, + "step": 61536 + }, + { + "epoch": 1.58, + "learning_rate": 9.652252520213762e-07, + "loss": 0.6611, + "step": 61537 + }, + { + "epoch": 1.58, + "learning_rate": 9.651975983165632e-07, + "loss": 0.667, + "step": 61538 + }, + { + "epoch": 1.58, + "learning_rate": 9.651699446383966e-07, + "loss": 0.5239, + "step": 61539 + }, + { + "epoch": 1.58, + "learning_rate": 9.65142290986898e-07, + "loss": 0.5981, + "step": 61540 + }, + { + "epoch": 1.58, + "learning_rate": 9.651146373620885e-07, + "loss": 0.5908, + "step": 61541 + }, + { + "epoch": 1.58, + "learning_rate": 9.65086983763989e-07, + "loss": 0.6006, + "step": 61542 + }, + { + "epoch": 1.58, + "learning_rate": 9.650593301926205e-07, + "loss": 0.7246, + "step": 61543 + }, + { + "epoch": 1.58, + "learning_rate": 9.650316766480048e-07, + "loss": 0.5771, + "step": 61544 + }, + { + "epoch": 1.58, + "learning_rate": 9.650040231301624e-07, + "loss": 0.7637, + "step": 61545 + }, + { + "epoch": 1.58, + "learning_rate": 9.649763696391152e-07, + "loss": 0.6987, + "step": 61546 + }, + { + "epoch": 1.58, + "learning_rate": 9.649487161748835e-07, + "loss": 0.5962, + "step": 61547 + }, + { + "epoch": 1.58, + "learning_rate": 9.649210627374894e-07, + "loss": 0.7358, + "step": 61548 + }, + { + "epoch": 1.58, + "learning_rate": 9.648934093269532e-07, + "loss": 0.7666, + "step": 61549 + }, + { + "epoch": 1.58, + "learning_rate": 9.648657559432968e-07, + "loss": 0.6001, + "step": 61550 + }, + { + "epoch": 1.58, + "learning_rate": 9.648381025865415e-07, + "loss": 0.6558, + "step": 61551 + }, + { + "epoch": 1.58, + "learning_rate": 9.648104492567075e-07, + "loss": 0.4612, + "step": 61552 + }, + { + "epoch": 1.58, + "learning_rate": 9.647827959538167e-07, + "loss": 0.5488, + "step": 61553 + }, + { + "epoch": 1.58, + "learning_rate": 9.647551426778898e-07, + "loss": 0.499, + "step": 61554 + }, + { + "epoch": 1.58, + "learning_rate": 9.647274894289484e-07, + "loss": 0.6182, + "step": 61555 + }, + { + "epoch": 1.58, + "learning_rate": 9.646998362070135e-07, + "loss": 0.4961, + "step": 61556 + }, + { + "epoch": 1.58, + "learning_rate": 9.646721830121065e-07, + "loss": 0.6816, + "step": 61557 + }, + { + "epoch": 1.58, + "learning_rate": 9.646445298442482e-07, + "loss": 0.8066, + "step": 61558 + }, + { + "epoch": 1.58, + "learning_rate": 9.6461687670346e-07, + "loss": 0.4504, + "step": 61559 + }, + { + "epoch": 1.58, + "learning_rate": 9.645892235897632e-07, + "loss": 0.6934, + "step": 61560 + }, + { + "epoch": 1.58, + "learning_rate": 9.64561570503179e-07, + "loss": 0.6758, + "step": 61561 + }, + { + "epoch": 1.58, + "learning_rate": 9.64533917443728e-07, + "loss": 0.6602, + "step": 61562 + }, + { + "epoch": 1.58, + "learning_rate": 9.64506264411432e-07, + "loss": 0.7773, + "step": 61563 + }, + { + "epoch": 1.58, + "learning_rate": 9.644786114063114e-07, + "loss": 0.7202, + "step": 61564 + }, + { + "epoch": 1.58, + "learning_rate": 9.644509584283884e-07, + "loss": 0.7129, + "step": 61565 + }, + { + "epoch": 1.58, + "learning_rate": 9.644233054776834e-07, + "loss": 0.6699, + "step": 61566 + }, + { + "epoch": 1.58, + "learning_rate": 9.64395652554218e-07, + "loss": 0.4277, + "step": 61567 + }, + { + "epoch": 1.58, + "learning_rate": 9.64367999658013e-07, + "loss": 0.6021, + "step": 61568 + }, + { + "epoch": 1.58, + "learning_rate": 9.6434034678909e-07, + "loss": 0.4104, + "step": 61569 + }, + { + "epoch": 1.58, + "learning_rate": 9.643126939474699e-07, + "loss": 0.7109, + "step": 61570 + }, + { + "epoch": 1.58, + "learning_rate": 9.642850411331742e-07, + "loss": 0.6235, + "step": 61571 + }, + { + "epoch": 1.58, + "learning_rate": 9.642573883462235e-07, + "loss": 0.7227, + "step": 61572 + }, + { + "epoch": 1.58, + "learning_rate": 9.642297355866391e-07, + "loss": 0.7471, + "step": 61573 + }, + { + "epoch": 1.58, + "learning_rate": 9.642020828544427e-07, + "loss": 0.6836, + "step": 61574 + }, + { + "epoch": 1.58, + "learning_rate": 9.641744301496549e-07, + "loss": 0.6895, + "step": 61575 + }, + { + "epoch": 1.58, + "learning_rate": 9.64146777472297e-07, + "loss": 0.5042, + "step": 61576 + }, + { + "epoch": 1.58, + "learning_rate": 9.641191248223904e-07, + "loss": 0.4296, + "step": 61577 + }, + { + "epoch": 1.58, + "learning_rate": 9.640914721999563e-07, + "loss": 0.5493, + "step": 61578 + }, + { + "epoch": 1.58, + "learning_rate": 9.640638196050157e-07, + "loss": 0.4976, + "step": 61579 + }, + { + "epoch": 1.58, + "learning_rate": 9.640361670375894e-07, + "loss": 0.6367, + "step": 61580 + }, + { + "epoch": 1.58, + "learning_rate": 9.640085144976996e-07, + "loss": 0.5991, + "step": 61581 + }, + { + "epoch": 1.58, + "learning_rate": 9.639808619853665e-07, + "loss": 0.4822, + "step": 61582 + }, + { + "epoch": 1.58, + "learning_rate": 9.639532095006113e-07, + "loss": 0.6357, + "step": 61583 + }, + { + "epoch": 1.58, + "learning_rate": 9.639255570434558e-07, + "loss": 0.7324, + "step": 61584 + }, + { + "epoch": 1.58, + "learning_rate": 9.638979046139206e-07, + "loss": 0.7715, + "step": 61585 + }, + { + "epoch": 1.58, + "learning_rate": 9.638702522120273e-07, + "loss": 0.7334, + "step": 61586 + }, + { + "epoch": 1.58, + "learning_rate": 9.638425998377967e-07, + "loss": 0.668, + "step": 61587 + }, + { + "epoch": 1.58, + "learning_rate": 9.638149474912504e-07, + "loss": 0.4666, + "step": 61588 + }, + { + "epoch": 1.58, + "learning_rate": 9.63787295172409e-07, + "loss": 0.4268, + "step": 61589 + }, + { + "epoch": 1.58, + "learning_rate": 9.637596428812943e-07, + "loss": 0.5122, + "step": 61590 + }, + { + "epoch": 1.58, + "learning_rate": 9.637319906179275e-07, + "loss": 0.7166, + "step": 61591 + }, + { + "epoch": 1.58, + "learning_rate": 9.63704338382329e-07, + "loss": 0.5332, + "step": 61592 + }, + { + "epoch": 1.58, + "learning_rate": 9.636766861745205e-07, + "loss": 0.7178, + "step": 61593 + }, + { + "epoch": 1.58, + "learning_rate": 9.636490339945228e-07, + "loss": 0.6064, + "step": 61594 + }, + { + "epoch": 1.58, + "learning_rate": 9.636213818423577e-07, + "loss": 0.7207, + "step": 61595 + }, + { + "epoch": 1.58, + "learning_rate": 9.635937297180461e-07, + "loss": 0.791, + "step": 61596 + }, + { + "epoch": 1.58, + "learning_rate": 9.635660776216087e-07, + "loss": 0.7354, + "step": 61597 + }, + { + "epoch": 1.58, + "learning_rate": 9.635384255530675e-07, + "loss": 0.585, + "step": 61598 + }, + { + "epoch": 1.58, + "learning_rate": 9.63510773512443e-07, + "loss": 0.4575, + "step": 61599 + }, + { + "epoch": 1.58, + "learning_rate": 9.634831214997567e-07, + "loss": 0.5488, + "step": 61600 + }, + { + "epoch": 1.58, + "learning_rate": 9.6345546951503e-07, + "loss": 0.5718, + "step": 61601 + }, + { + "epoch": 1.58, + "learning_rate": 9.634278175582834e-07, + "loss": 0.7061, + "step": 61602 + }, + { + "epoch": 1.58, + "learning_rate": 9.634001656295386e-07, + "loss": 0.6543, + "step": 61603 + }, + { + "epoch": 1.58, + "learning_rate": 9.633725137288165e-07, + "loss": 0.6357, + "step": 61604 + }, + { + "epoch": 1.58, + "learning_rate": 9.633448618561383e-07, + "loss": 0.3599, + "step": 61605 + }, + { + "epoch": 1.58, + "learning_rate": 9.633172100115253e-07, + "loss": 0.6982, + "step": 61606 + }, + { + "epoch": 1.58, + "learning_rate": 9.632895581949988e-07, + "loss": 0.6558, + "step": 61607 + }, + { + "epoch": 1.58, + "learning_rate": 9.632619064065795e-07, + "loss": 0.5283, + "step": 61608 + }, + { + "epoch": 1.58, + "learning_rate": 9.632342546462892e-07, + "loss": 0.583, + "step": 61609 + }, + { + "epoch": 1.58, + "learning_rate": 9.632066029141484e-07, + "loss": 0.626, + "step": 61610 + }, + { + "epoch": 1.58, + "learning_rate": 9.63178951210179e-07, + "loss": 0.7715, + "step": 61611 + }, + { + "epoch": 1.58, + "learning_rate": 9.631512995344018e-07, + "loss": 0.6133, + "step": 61612 + }, + { + "epoch": 1.58, + "learning_rate": 9.631236478868378e-07, + "loss": 0.603, + "step": 61613 + }, + { + "epoch": 1.58, + "learning_rate": 9.63095996267508e-07, + "loss": 0.624, + "step": 61614 + }, + { + "epoch": 1.58, + "learning_rate": 9.630683446764345e-07, + "loss": 0.5068, + "step": 61615 + }, + { + "epoch": 1.58, + "learning_rate": 9.630406931136374e-07, + "loss": 0.748, + "step": 61616 + }, + { + "epoch": 1.58, + "learning_rate": 9.630130415791386e-07, + "loss": 0.7637, + "step": 61617 + }, + { + "epoch": 1.58, + "learning_rate": 9.629853900729586e-07, + "loss": 0.5967, + "step": 61618 + }, + { + "epoch": 1.58, + "learning_rate": 9.629577385951194e-07, + "loss": 0.6772, + "step": 61619 + }, + { + "epoch": 1.58, + "learning_rate": 9.629300871456415e-07, + "loss": 0.7686, + "step": 61620 + }, + { + "epoch": 1.58, + "learning_rate": 9.629024357245469e-07, + "loss": 0.708, + "step": 61621 + }, + { + "epoch": 1.58, + "learning_rate": 9.628747843318558e-07, + "loss": 0.5854, + "step": 61622 + }, + { + "epoch": 1.58, + "learning_rate": 9.628471329675897e-07, + "loss": 0.6411, + "step": 61623 + }, + { + "epoch": 1.58, + "learning_rate": 9.628194816317699e-07, + "loss": 0.7197, + "step": 61624 + }, + { + "epoch": 1.58, + "learning_rate": 9.627918303244171e-07, + "loss": 0.6763, + "step": 61625 + }, + { + "epoch": 1.58, + "learning_rate": 9.627641790455535e-07, + "loss": 0.449, + "step": 61626 + }, + { + "epoch": 1.58, + "learning_rate": 9.627365277951994e-07, + "loss": 0.666, + "step": 61627 + }, + { + "epoch": 1.58, + "learning_rate": 9.627088765733762e-07, + "loss": 0.6499, + "step": 61628 + }, + { + "epoch": 1.58, + "learning_rate": 9.62681225380105e-07, + "loss": 0.625, + "step": 61629 + }, + { + "epoch": 1.58, + "learning_rate": 9.626535742154073e-07, + "loss": 0.7422, + "step": 61630 + }, + { + "epoch": 1.58, + "learning_rate": 9.626259230793043e-07, + "loss": 0.6523, + "step": 61631 + }, + { + "epoch": 1.58, + "learning_rate": 9.625982719718167e-07, + "loss": 0.7988, + "step": 61632 + }, + { + "epoch": 1.58, + "learning_rate": 9.625706208929657e-07, + "loss": 0.668, + "step": 61633 + }, + { + "epoch": 1.58, + "learning_rate": 9.625429698427728e-07, + "loss": 0.7236, + "step": 61634 + }, + { + "epoch": 1.58, + "learning_rate": 9.625153188212588e-07, + "loss": 0.8213, + "step": 61635 + }, + { + "epoch": 1.58, + "learning_rate": 9.624876678284452e-07, + "loss": 0.6543, + "step": 61636 + }, + { + "epoch": 1.58, + "learning_rate": 9.62460016864353e-07, + "loss": 0.6577, + "step": 61637 + }, + { + "epoch": 1.58, + "learning_rate": 9.624323659290036e-07, + "loss": 0.4976, + "step": 61638 + }, + { + "epoch": 1.58, + "learning_rate": 9.62404715022418e-07, + "loss": 0.6416, + "step": 61639 + }, + { + "epoch": 1.58, + "learning_rate": 9.623770641446172e-07, + "loss": 0.493, + "step": 61640 + }, + { + "epoch": 1.58, + "learning_rate": 9.62349413295623e-07, + "loss": 0.5718, + "step": 61641 + }, + { + "epoch": 1.58, + "learning_rate": 9.623217624754557e-07, + "loss": 0.5129, + "step": 61642 + }, + { + "epoch": 1.58, + "learning_rate": 9.622941116841373e-07, + "loss": 0.6313, + "step": 61643 + }, + { + "epoch": 1.58, + "learning_rate": 9.62266460921688e-07, + "loss": 0.6543, + "step": 61644 + }, + { + "epoch": 1.58, + "learning_rate": 9.622388101881299e-07, + "loss": 0.6338, + "step": 61645 + }, + { + "epoch": 1.58, + "learning_rate": 9.622111594834837e-07, + "loss": 0.4424, + "step": 61646 + }, + { + "epoch": 1.58, + "learning_rate": 9.621835088077706e-07, + "loss": 0.7803, + "step": 61647 + }, + { + "epoch": 1.58, + "learning_rate": 9.62155858161012e-07, + "loss": 0.6421, + "step": 61648 + }, + { + "epoch": 1.58, + "learning_rate": 9.621282075432287e-07, + "loss": 0.5938, + "step": 61649 + }, + { + "epoch": 1.58, + "learning_rate": 9.621005569544424e-07, + "loss": 0.5356, + "step": 61650 + }, + { + "epoch": 1.58, + "learning_rate": 9.620729063946742e-07, + "loss": 0.6865, + "step": 61651 + }, + { + "epoch": 1.58, + "learning_rate": 9.620452558639444e-07, + "loss": 0.7227, + "step": 61652 + }, + { + "epoch": 1.58, + "learning_rate": 9.620176053622752e-07, + "loss": 0.6963, + "step": 61653 + }, + { + "epoch": 1.58, + "learning_rate": 9.61989954889687e-07, + "loss": 0.626, + "step": 61654 + }, + { + "epoch": 1.58, + "learning_rate": 9.619623044462018e-07, + "loss": 0.552, + "step": 61655 + }, + { + "epoch": 1.58, + "learning_rate": 9.619346540318397e-07, + "loss": 0.6086, + "step": 61656 + }, + { + "epoch": 1.58, + "learning_rate": 9.619070036466232e-07, + "loss": 0.6138, + "step": 61657 + }, + { + "epoch": 1.58, + "learning_rate": 9.618793532905723e-07, + "loss": 0.6689, + "step": 61658 + }, + { + "epoch": 1.58, + "learning_rate": 9.618517029637088e-07, + "loss": 0.3191, + "step": 61659 + }, + { + "epoch": 1.58, + "learning_rate": 9.618240526660534e-07, + "loss": 0.708, + "step": 61660 + }, + { + "epoch": 1.58, + "learning_rate": 9.61796402397628e-07, + "loss": 0.5283, + "step": 61661 + }, + { + "epoch": 1.58, + "learning_rate": 9.617687521584534e-07, + "loss": 0.7788, + "step": 61662 + }, + { + "epoch": 1.58, + "learning_rate": 9.617411019485502e-07, + "loss": 0.5762, + "step": 61663 + }, + { + "epoch": 1.58, + "learning_rate": 9.617134517679404e-07, + "loss": 0.5405, + "step": 61664 + }, + { + "epoch": 1.58, + "learning_rate": 9.616858016166447e-07, + "loss": 0.6821, + "step": 61665 + }, + { + "epoch": 1.58, + "learning_rate": 9.616581514946846e-07, + "loss": 0.7852, + "step": 61666 + }, + { + "epoch": 1.58, + "learning_rate": 9.616305014020809e-07, + "loss": 0.7432, + "step": 61667 + }, + { + "epoch": 1.58, + "learning_rate": 9.61602851338855e-07, + "loss": 0.5564, + "step": 61668 + }, + { + "epoch": 1.58, + "learning_rate": 9.615752013050284e-07, + "loss": 0.5366, + "step": 61669 + }, + { + "epoch": 1.58, + "learning_rate": 9.615475513006214e-07, + "loss": 0.5908, + "step": 61670 + }, + { + "epoch": 1.58, + "learning_rate": 9.615199013256561e-07, + "loss": 0.5171, + "step": 61671 + }, + { + "epoch": 1.58, + "learning_rate": 9.61492251380153e-07, + "loss": 0.6504, + "step": 61672 + }, + { + "epoch": 1.58, + "learning_rate": 9.614646014641334e-07, + "loss": 0.5913, + "step": 61673 + }, + { + "epoch": 1.58, + "learning_rate": 9.614369515776188e-07, + "loss": 0.5981, + "step": 61674 + }, + { + "epoch": 1.58, + "learning_rate": 9.6140930172063e-07, + "loss": 0.7939, + "step": 61675 + }, + { + "epoch": 1.58, + "learning_rate": 9.613816518931885e-07, + "loss": 0.5391, + "step": 61676 + }, + { + "epoch": 1.58, + "learning_rate": 9.61354002095315e-07, + "loss": 0.5908, + "step": 61677 + }, + { + "epoch": 1.58, + "learning_rate": 9.613263523270313e-07, + "loss": 0.7393, + "step": 61678 + }, + { + "epoch": 1.58, + "learning_rate": 9.612987025883577e-07, + "loss": 0.6558, + "step": 61679 + }, + { + "epoch": 1.58, + "learning_rate": 9.612710528793164e-07, + "loss": 0.5732, + "step": 61680 + }, + { + "epoch": 1.58, + "learning_rate": 9.612434031999282e-07, + "loss": 0.4714, + "step": 61681 + }, + { + "epoch": 1.58, + "learning_rate": 9.612157535502138e-07, + "loss": 0.6475, + "step": 61682 + }, + { + "epoch": 1.58, + "learning_rate": 9.611881039301948e-07, + "loss": 0.6528, + "step": 61683 + }, + { + "epoch": 1.58, + "learning_rate": 9.611604543398922e-07, + "loss": 0.6367, + "step": 61684 + }, + { + "epoch": 1.58, + "learning_rate": 9.611328047793275e-07, + "loss": 0.6543, + "step": 61685 + }, + { + "epoch": 1.58, + "learning_rate": 9.611051552485215e-07, + "loss": 0.7236, + "step": 61686 + }, + { + "epoch": 1.58, + "learning_rate": 9.610775057474954e-07, + "loss": 0.6006, + "step": 61687 + }, + { + "epoch": 1.58, + "learning_rate": 9.610498562762706e-07, + "loss": 0.7607, + "step": 61688 + }, + { + "epoch": 1.58, + "learning_rate": 9.61022206834868e-07, + "loss": 0.5713, + "step": 61689 + }, + { + "epoch": 1.58, + "learning_rate": 9.60994557423309e-07, + "loss": 0.7646, + "step": 61690 + }, + { + "epoch": 1.58, + "learning_rate": 9.609669080416147e-07, + "loss": 0.6387, + "step": 61691 + }, + { + "epoch": 1.58, + "learning_rate": 9.609392586898061e-07, + "loss": 0.3875, + "step": 61692 + }, + { + "epoch": 1.58, + "learning_rate": 9.609116093679048e-07, + "loss": 0.6592, + "step": 61693 + }, + { + "epoch": 1.58, + "learning_rate": 9.608839600759312e-07, + "loss": 0.5747, + "step": 61694 + }, + { + "epoch": 1.58, + "learning_rate": 9.608563108139073e-07, + "loss": 0.6855, + "step": 61695 + }, + { + "epoch": 1.58, + "learning_rate": 9.60828661581854e-07, + "loss": 0.4943, + "step": 61696 + }, + { + "epoch": 1.58, + "learning_rate": 9.608010123797923e-07, + "loss": 0.5142, + "step": 61697 + }, + { + "epoch": 1.58, + "learning_rate": 9.60773363207743e-07, + "loss": 0.6509, + "step": 61698 + }, + { + "epoch": 1.58, + "learning_rate": 9.607457140657283e-07, + "loss": 0.7314, + "step": 61699 + }, + { + "epoch": 1.58, + "learning_rate": 9.607180649537685e-07, + "loss": 0.8223, + "step": 61700 + }, + { + "epoch": 1.58, + "learning_rate": 9.606904158718856e-07, + "loss": 0.6401, + "step": 61701 + }, + { + "epoch": 1.58, + "learning_rate": 9.606627668200998e-07, + "loss": 0.6157, + "step": 61702 + }, + { + "epoch": 1.58, + "learning_rate": 9.60635117798433e-07, + "loss": 0.5398, + "step": 61703 + }, + { + "epoch": 1.58, + "learning_rate": 9.606074688069058e-07, + "loss": 0.4568, + "step": 61704 + }, + { + "epoch": 1.58, + "learning_rate": 9.605798198455395e-07, + "loss": 0.7295, + "step": 61705 + }, + { + "epoch": 1.58, + "learning_rate": 9.605521709143556e-07, + "loss": 0.6626, + "step": 61706 + }, + { + "epoch": 1.58, + "learning_rate": 9.605245220133753e-07, + "loss": 0.6523, + "step": 61707 + }, + { + "epoch": 1.58, + "learning_rate": 9.604968731426191e-07, + "loss": 0.625, + "step": 61708 + }, + { + "epoch": 1.58, + "learning_rate": 9.60469224302109e-07, + "loss": 0.6641, + "step": 61709 + }, + { + "epoch": 1.58, + "learning_rate": 9.604415754918656e-07, + "loss": 0.699, + "step": 61710 + }, + { + "epoch": 1.58, + "learning_rate": 9.604139267119105e-07, + "loss": 0.6641, + "step": 61711 + }, + { + "epoch": 1.58, + "learning_rate": 9.603862779622646e-07, + "loss": 0.6709, + "step": 61712 + }, + { + "epoch": 1.58, + "learning_rate": 9.603586292429489e-07, + "loss": 0.5723, + "step": 61713 + }, + { + "epoch": 1.58, + "learning_rate": 9.60330980553985e-07, + "loss": 0.5786, + "step": 61714 + }, + { + "epoch": 1.58, + "learning_rate": 9.603033318953935e-07, + "loss": 0.5415, + "step": 61715 + }, + { + "epoch": 1.58, + "learning_rate": 9.602756832671963e-07, + "loss": 0.5161, + "step": 61716 + }, + { + "epoch": 1.58, + "learning_rate": 9.602480346694136e-07, + "loss": 0.7588, + "step": 61717 + }, + { + "epoch": 1.58, + "learning_rate": 9.602203861020679e-07, + "loss": 0.616, + "step": 61718 + }, + { + "epoch": 1.58, + "learning_rate": 9.60192737565179e-07, + "loss": 0.6826, + "step": 61719 + }, + { + "epoch": 1.58, + "learning_rate": 9.60165089058769e-07, + "loss": 0.4333, + "step": 61720 + }, + { + "epoch": 1.58, + "learning_rate": 9.601374405828593e-07, + "loss": 0.7559, + "step": 61721 + }, + { + "epoch": 1.58, + "learning_rate": 9.6010979213747e-07, + "loss": 0.6172, + "step": 61722 + }, + { + "epoch": 1.58, + "learning_rate": 9.600821437226225e-07, + "loss": 0.6594, + "step": 61723 + }, + { + "epoch": 1.58, + "learning_rate": 9.600544953383385e-07, + "loss": 0.4338, + "step": 61724 + }, + { + "epoch": 1.58, + "learning_rate": 9.60026846984639e-07, + "loss": 0.7109, + "step": 61725 + }, + { + "epoch": 1.58, + "learning_rate": 9.599991986615452e-07, + "loss": 0.5352, + "step": 61726 + }, + { + "epoch": 1.58, + "learning_rate": 9.59971550369078e-07, + "loss": 0.6411, + "step": 61727 + }, + { + "epoch": 1.58, + "learning_rate": 9.599439021072586e-07, + "loss": 0.7729, + "step": 61728 + }, + { + "epoch": 1.58, + "learning_rate": 9.599162538761085e-07, + "loss": 0.4937, + "step": 61729 + }, + { + "epoch": 1.58, + "learning_rate": 9.598886056756487e-07, + "loss": 0.7261, + "step": 61730 + }, + { + "epoch": 1.58, + "learning_rate": 9.598609575059006e-07, + "loss": 0.407, + "step": 61731 + }, + { + "epoch": 1.58, + "learning_rate": 9.598333093668846e-07, + "loss": 0.5642, + "step": 61732 + }, + { + "epoch": 1.58, + "learning_rate": 9.598056612586229e-07, + "loss": 0.6699, + "step": 61733 + }, + { + "epoch": 1.58, + "learning_rate": 9.597780131811357e-07, + "loss": 0.5316, + "step": 61734 + }, + { + "epoch": 1.58, + "learning_rate": 9.597503651344448e-07, + "loss": 0.6543, + "step": 61735 + }, + { + "epoch": 1.58, + "learning_rate": 9.59722717118571e-07, + "loss": 0.6758, + "step": 61736 + }, + { + "epoch": 1.58, + "learning_rate": 9.596950691335361e-07, + "loss": 0.6465, + "step": 61737 + }, + { + "epoch": 1.58, + "learning_rate": 9.596674211793605e-07, + "loss": 0.7178, + "step": 61738 + }, + { + "epoch": 1.58, + "learning_rate": 9.59639773256066e-07, + "loss": 0.4648, + "step": 61739 + }, + { + "epoch": 1.58, + "learning_rate": 9.596121253636729e-07, + "loss": 0.6577, + "step": 61740 + }, + { + "epoch": 1.58, + "learning_rate": 9.59584477502204e-07, + "loss": 0.6787, + "step": 61741 + }, + { + "epoch": 1.58, + "learning_rate": 9.595568296716786e-07, + "loss": 0.5386, + "step": 61742 + }, + { + "epoch": 1.58, + "learning_rate": 9.595291818721188e-07, + "loss": 0.7666, + "step": 61743 + }, + { + "epoch": 1.58, + "learning_rate": 9.595015341035455e-07, + "loss": 0.5469, + "step": 61744 + }, + { + "epoch": 1.58, + "learning_rate": 9.594738863659803e-07, + "loss": 0.4487, + "step": 61745 + }, + { + "epoch": 1.58, + "learning_rate": 9.594462386594438e-07, + "loss": 0.5015, + "step": 61746 + }, + { + "epoch": 1.58, + "learning_rate": 9.594185909839577e-07, + "loss": 0.7354, + "step": 61747 + }, + { + "epoch": 1.58, + "learning_rate": 9.593909433395426e-07, + "loss": 0.5073, + "step": 61748 + }, + { + "epoch": 1.58, + "learning_rate": 9.593632957262202e-07, + "loss": 0.6333, + "step": 61749 + }, + { + "epoch": 1.58, + "learning_rate": 9.593356481440115e-07, + "loss": 0.6377, + "step": 61750 + }, + { + "epoch": 1.58, + "learning_rate": 9.593080005929378e-07, + "loss": 0.551, + "step": 61751 + }, + { + "epoch": 1.58, + "learning_rate": 9.5928035307302e-07, + "loss": 0.7295, + "step": 61752 + }, + { + "epoch": 1.58, + "learning_rate": 9.59252705584279e-07, + "loss": 0.7734, + "step": 61753 + }, + { + "epoch": 1.58, + "learning_rate": 9.592250581267368e-07, + "loss": 0.5841, + "step": 61754 + }, + { + "epoch": 1.58, + "learning_rate": 9.591974107004136e-07, + "loss": 0.8115, + "step": 61755 + }, + { + "epoch": 1.58, + "learning_rate": 9.591697633053314e-07, + "loss": 0.6025, + "step": 61756 + }, + { + "epoch": 1.58, + "learning_rate": 9.591421159415108e-07, + "loss": 0.6475, + "step": 61757 + }, + { + "epoch": 1.58, + "learning_rate": 9.591144686089735e-07, + "loss": 0.6084, + "step": 61758 + }, + { + "epoch": 1.58, + "learning_rate": 9.590868213077404e-07, + "loss": 0.8398, + "step": 61759 + }, + { + "epoch": 1.58, + "learning_rate": 9.590591740378327e-07, + "loss": 0.7686, + "step": 61760 + }, + { + "epoch": 1.58, + "learning_rate": 9.590315267992712e-07, + "loss": 0.7637, + "step": 61761 + }, + { + "epoch": 1.58, + "learning_rate": 9.590038795920776e-07, + "loss": 0.5205, + "step": 61762 + }, + { + "epoch": 1.58, + "learning_rate": 9.589762324162725e-07, + "loss": 0.6836, + "step": 61763 + }, + { + "epoch": 1.58, + "learning_rate": 9.589485852718777e-07, + "loss": 0.5947, + "step": 61764 + }, + { + "epoch": 1.58, + "learning_rate": 9.58920938158914e-07, + "loss": 0.6777, + "step": 61765 + }, + { + "epoch": 1.58, + "learning_rate": 9.588932910774027e-07, + "loss": 0.6719, + "step": 61766 + }, + { + "epoch": 1.58, + "learning_rate": 9.588656440273646e-07, + "loss": 0.6113, + "step": 61767 + }, + { + "epoch": 1.58, + "learning_rate": 9.588379970088215e-07, + "loss": 0.5601, + "step": 61768 + }, + { + "epoch": 1.58, + "learning_rate": 9.58810350021794e-07, + "loss": 0.5659, + "step": 61769 + }, + { + "epoch": 1.58, + "learning_rate": 9.587827030663041e-07, + "loss": 0.6865, + "step": 61770 + }, + { + "epoch": 1.58, + "learning_rate": 9.587550561423721e-07, + "loss": 0.7402, + "step": 61771 + }, + { + "epoch": 1.58, + "learning_rate": 9.587274092500192e-07, + "loss": 0.603, + "step": 61772 + }, + { + "epoch": 1.58, + "learning_rate": 9.586997623892671e-07, + "loss": 0.7227, + "step": 61773 + }, + { + "epoch": 1.58, + "learning_rate": 9.586721155601363e-07, + "loss": 0.6846, + "step": 61774 + }, + { + "epoch": 1.58, + "learning_rate": 9.586444687626487e-07, + "loss": 0.5178, + "step": 61775 + }, + { + "epoch": 1.58, + "learning_rate": 9.586168219968254e-07, + "loss": 0.5518, + "step": 61776 + }, + { + "epoch": 1.58, + "learning_rate": 9.585891752626868e-07, + "loss": 0.7695, + "step": 61777 + }, + { + "epoch": 1.58, + "learning_rate": 9.585615285602547e-07, + "loss": 0.4602, + "step": 61778 + }, + { + "epoch": 1.58, + "learning_rate": 9.585338818895502e-07, + "loss": 0.6343, + "step": 61779 + }, + { + "epoch": 1.58, + "learning_rate": 9.585062352505946e-07, + "loss": 0.624, + "step": 61780 + }, + { + "epoch": 1.58, + "learning_rate": 9.584785886434086e-07, + "loss": 0.6294, + "step": 61781 + }, + { + "epoch": 1.58, + "learning_rate": 9.584509420680135e-07, + "loss": 0.6719, + "step": 61782 + }, + { + "epoch": 1.58, + "learning_rate": 9.58423295524431e-07, + "loss": 0.7002, + "step": 61783 + }, + { + "epoch": 1.58, + "learning_rate": 9.583956490126814e-07, + "loss": 0.5298, + "step": 61784 + }, + { + "epoch": 1.58, + "learning_rate": 9.583680025327867e-07, + "loss": 0.7588, + "step": 61785 + }, + { + "epoch": 1.58, + "learning_rate": 9.583403560847675e-07, + "loss": 0.4594, + "step": 61786 + }, + { + "epoch": 1.58, + "learning_rate": 9.583127096686453e-07, + "loss": 0.5571, + "step": 61787 + }, + { + "epoch": 1.58, + "learning_rate": 9.58285063284441e-07, + "loss": 0.6982, + "step": 61788 + }, + { + "epoch": 1.58, + "learning_rate": 9.582574169321762e-07, + "loss": 0.5469, + "step": 61789 + }, + { + "epoch": 1.58, + "learning_rate": 9.582297706118718e-07, + "loss": 0.6074, + "step": 61790 + }, + { + "epoch": 1.58, + "learning_rate": 9.582021243235487e-07, + "loss": 0.6289, + "step": 61791 + }, + { + "epoch": 1.58, + "learning_rate": 9.581744780672283e-07, + "loss": 0.7227, + "step": 61792 + }, + { + "epoch": 1.58, + "learning_rate": 9.58146831842932e-07, + "loss": 0.6914, + "step": 61793 + }, + { + "epoch": 1.58, + "learning_rate": 9.581191856506803e-07, + "loss": 0.7246, + "step": 61794 + }, + { + "epoch": 1.58, + "learning_rate": 9.580915394904953e-07, + "loss": 0.7705, + "step": 61795 + }, + { + "epoch": 1.58, + "learning_rate": 9.580638933623973e-07, + "loss": 0.5115, + "step": 61796 + }, + { + "epoch": 1.58, + "learning_rate": 9.58036247266408e-07, + "loss": 0.5595, + "step": 61797 + }, + { + "epoch": 1.58, + "learning_rate": 9.580086012025484e-07, + "loss": 0.6753, + "step": 61798 + }, + { + "epoch": 1.58, + "learning_rate": 9.579809551708398e-07, + "loss": 0.6929, + "step": 61799 + }, + { + "epoch": 1.58, + "learning_rate": 9.579533091713034e-07, + "loss": 0.5366, + "step": 61800 + }, + { + "epoch": 1.58, + "learning_rate": 9.579256632039598e-07, + "loss": 0.7832, + "step": 61801 + }, + { + "epoch": 1.58, + "learning_rate": 9.57898017268831e-07, + "loss": 0.5342, + "step": 61802 + }, + { + "epoch": 1.58, + "learning_rate": 9.578703713659372e-07, + "loss": 0.6895, + "step": 61803 + }, + { + "epoch": 1.58, + "learning_rate": 9.578427254953007e-07, + "loss": 0.751, + "step": 61804 + }, + { + "epoch": 1.58, + "learning_rate": 9.578150796569417e-07, + "loss": 0.8105, + "step": 61805 + }, + { + "epoch": 1.58, + "learning_rate": 9.577874338508819e-07, + "loss": 0.7588, + "step": 61806 + }, + { + "epoch": 1.58, + "learning_rate": 9.57759788077142e-07, + "loss": 0.7549, + "step": 61807 + }, + { + "epoch": 1.58, + "learning_rate": 9.57732142335744e-07, + "loss": 0.6409, + "step": 61808 + }, + { + "epoch": 1.58, + "learning_rate": 9.577044966267082e-07, + "loss": 0.877, + "step": 61809 + }, + { + "epoch": 1.58, + "learning_rate": 9.576768509500568e-07, + "loss": 0.7119, + "step": 61810 + }, + { + "epoch": 1.58, + "learning_rate": 9.576492053058096e-07, + "loss": 0.6133, + "step": 61811 + }, + { + "epoch": 1.58, + "learning_rate": 9.576215596939888e-07, + "loss": 0.5669, + "step": 61812 + }, + { + "epoch": 1.58, + "learning_rate": 9.575939141146147e-07, + "loss": 0.7559, + "step": 61813 + }, + { + "epoch": 1.58, + "learning_rate": 9.575662685677094e-07, + "loss": 0.7998, + "step": 61814 + }, + { + "epoch": 1.58, + "learning_rate": 9.575386230532936e-07, + "loss": 0.791, + "step": 61815 + }, + { + "epoch": 1.58, + "learning_rate": 9.575109775713886e-07, + "loss": 0.5601, + "step": 61816 + }, + { + "epoch": 1.58, + "learning_rate": 9.574833321220151e-07, + "loss": 0.6387, + "step": 61817 + }, + { + "epoch": 1.58, + "learning_rate": 9.57455686705195e-07, + "loss": 0.4011, + "step": 61818 + }, + { + "epoch": 1.58, + "learning_rate": 9.57428041320949e-07, + "loss": 0.5176, + "step": 61819 + }, + { + "epoch": 1.58, + "learning_rate": 9.57400395969299e-07, + "loss": 0.6084, + "step": 61820 + }, + { + "epoch": 1.58, + "learning_rate": 9.573727506502648e-07, + "loss": 0.4901, + "step": 61821 + }, + { + "epoch": 1.58, + "learning_rate": 9.573451053638686e-07, + "loss": 0.6396, + "step": 61822 + }, + { + "epoch": 1.58, + "learning_rate": 9.573174601101312e-07, + "loss": 0.4089, + "step": 61823 + }, + { + "epoch": 1.58, + "learning_rate": 9.57289814889074e-07, + "loss": 0.6084, + "step": 61824 + }, + { + "epoch": 1.58, + "learning_rate": 9.572621697007178e-07, + "loss": 0.6411, + "step": 61825 + }, + { + "epoch": 1.58, + "learning_rate": 9.572345245450841e-07, + "loss": 0.7266, + "step": 61826 + }, + { + "epoch": 1.58, + "learning_rate": 9.57206879422194e-07, + "loss": 0.6025, + "step": 61827 + }, + { + "epoch": 1.58, + "learning_rate": 9.571792343320684e-07, + "loss": 0.7378, + "step": 61828 + }, + { + "epoch": 1.58, + "learning_rate": 9.57151589274729e-07, + "loss": 0.6797, + "step": 61829 + }, + { + "epoch": 1.58, + "learning_rate": 9.57123944250197e-07, + "loss": 0.5596, + "step": 61830 + }, + { + "epoch": 1.58, + "learning_rate": 9.570962992584928e-07, + "loss": 0.6904, + "step": 61831 + }, + { + "epoch": 1.58, + "learning_rate": 9.570686542996378e-07, + "loss": 0.5645, + "step": 61832 + }, + { + "epoch": 1.58, + "learning_rate": 9.570410093736537e-07, + "loss": 0.572, + "step": 61833 + }, + { + "epoch": 1.58, + "learning_rate": 9.570133644805609e-07, + "loss": 0.5603, + "step": 61834 + }, + { + "epoch": 1.58, + "learning_rate": 9.569857196203814e-07, + "loss": 0.5615, + "step": 61835 + }, + { + "epoch": 1.58, + "learning_rate": 9.569580747931357e-07, + "loss": 0.7715, + "step": 61836 + }, + { + "epoch": 1.58, + "learning_rate": 9.569304299988452e-07, + "loss": 0.5496, + "step": 61837 + }, + { + "epoch": 1.58, + "learning_rate": 9.56902785237531e-07, + "loss": 0.5205, + "step": 61838 + }, + { + "epoch": 1.58, + "learning_rate": 9.568751405092147e-07, + "loss": 0.6841, + "step": 61839 + }, + { + "epoch": 1.58, + "learning_rate": 9.568474958139173e-07, + "loss": 0.793, + "step": 61840 + }, + { + "epoch": 1.59, + "learning_rate": 9.568198511516593e-07, + "loss": 0.606, + "step": 61841 + }, + { + "epoch": 1.59, + "learning_rate": 9.567922065224628e-07, + "loss": 0.6963, + "step": 61842 + }, + { + "epoch": 1.59, + "learning_rate": 9.56764561926348e-07, + "loss": 0.6299, + "step": 61843 + }, + { + "epoch": 1.59, + "learning_rate": 9.56736917363337e-07, + "loss": 0.7305, + "step": 61844 + }, + { + "epoch": 1.59, + "learning_rate": 9.567092728334502e-07, + "loss": 0.665, + "step": 61845 + }, + { + "epoch": 1.59, + "learning_rate": 9.566816283367093e-07, + "loss": 0.5249, + "step": 61846 + }, + { + "epoch": 1.59, + "learning_rate": 9.566539838731352e-07, + "loss": 0.4888, + "step": 61847 + }, + { + "epoch": 1.59, + "learning_rate": 9.566263394427494e-07, + "loss": 0.5615, + "step": 61848 + }, + { + "epoch": 1.59, + "learning_rate": 9.565986950455726e-07, + "loss": 0.5494, + "step": 61849 + }, + { + "epoch": 1.59, + "learning_rate": 9.565710506816268e-07, + "loss": 0.4373, + "step": 61850 + }, + { + "epoch": 1.59, + "learning_rate": 9.565434063509317e-07, + "loss": 0.8018, + "step": 61851 + }, + { + "epoch": 1.59, + "learning_rate": 9.565157620535097e-07, + "loss": 0.3726, + "step": 61852 + }, + { + "epoch": 1.59, + "learning_rate": 9.564881177893814e-07, + "loss": 0.5945, + "step": 61853 + }, + { + "epoch": 1.59, + "learning_rate": 9.564604735585682e-07, + "loss": 0.6575, + "step": 61854 + }, + { + "epoch": 1.59, + "learning_rate": 9.564328293610912e-07, + "loss": 0.6228, + "step": 61855 + }, + { + "epoch": 1.59, + "learning_rate": 9.564051851969717e-07, + "loss": 0.6484, + "step": 61856 + }, + { + "epoch": 1.59, + "learning_rate": 9.563775410662304e-07, + "loss": 0.79, + "step": 61857 + }, + { + "epoch": 1.59, + "learning_rate": 9.563498969688894e-07, + "loss": 0.6689, + "step": 61858 + }, + { + "epoch": 1.59, + "learning_rate": 9.563222529049686e-07, + "loss": 0.6902, + "step": 61859 + }, + { + "epoch": 1.59, + "learning_rate": 9.562946088744906e-07, + "loss": 0.6621, + "step": 61860 + }, + { + "epoch": 1.59, + "learning_rate": 9.562669648774754e-07, + "loss": 0.6572, + "step": 61861 + }, + { + "epoch": 1.59, + "learning_rate": 9.562393209139445e-07, + "loss": 0.8711, + "step": 61862 + }, + { + "epoch": 1.59, + "learning_rate": 9.562116769839195e-07, + "loss": 0.6069, + "step": 61863 + }, + { + "epoch": 1.59, + "learning_rate": 9.561840330874206e-07, + "loss": 0.6543, + "step": 61864 + }, + { + "epoch": 1.59, + "learning_rate": 9.5615638922447e-07, + "loss": 0.7744, + "step": 61865 + }, + { + "epoch": 1.59, + "learning_rate": 9.561287453950884e-07, + "loss": 0.533, + "step": 61866 + }, + { + "epoch": 1.59, + "learning_rate": 9.56101101599297e-07, + "loss": 0.6519, + "step": 61867 + }, + { + "epoch": 1.59, + "learning_rate": 9.56073457837117e-07, + "loss": 0.5522, + "step": 61868 + }, + { + "epoch": 1.59, + "learning_rate": 9.560458141085693e-07, + "loss": 0.6201, + "step": 61869 + }, + { + "epoch": 1.59, + "learning_rate": 9.560181704136755e-07, + "loss": 0.6836, + "step": 61870 + }, + { + "epoch": 1.59, + "learning_rate": 9.559905267524568e-07, + "loss": 0.6719, + "step": 61871 + }, + { + "epoch": 1.59, + "learning_rate": 9.559628831249337e-07, + "loss": 0.6816, + "step": 61872 + }, + { + "epoch": 1.59, + "learning_rate": 9.55935239531128e-07, + "loss": 0.5591, + "step": 61873 + }, + { + "epoch": 1.59, + "learning_rate": 9.559075959710603e-07, + "loss": 0.4646, + "step": 61874 + }, + { + "epoch": 1.59, + "learning_rate": 9.558799524447526e-07, + "loss": 0.6104, + "step": 61875 + }, + { + "epoch": 1.59, + "learning_rate": 9.558523089522254e-07, + "loss": 0.668, + "step": 61876 + }, + { + "epoch": 1.59, + "learning_rate": 9.558246654935e-07, + "loss": 0.6963, + "step": 61877 + }, + { + "epoch": 1.59, + "learning_rate": 9.557970220685976e-07, + "loss": 0.7432, + "step": 61878 + }, + { + "epoch": 1.59, + "learning_rate": 9.557693786775397e-07, + "loss": 0.541, + "step": 61879 + }, + { + "epoch": 1.59, + "learning_rate": 9.557417353203471e-07, + "loss": 0.6079, + "step": 61880 + }, + { + "epoch": 1.59, + "learning_rate": 9.557140919970408e-07, + "loss": 0.4531, + "step": 61881 + }, + { + "epoch": 1.59, + "learning_rate": 9.556864487076422e-07, + "loss": 0.6499, + "step": 61882 + }, + { + "epoch": 1.59, + "learning_rate": 9.556588054521726e-07, + "loss": 0.5444, + "step": 61883 + }, + { + "epoch": 1.59, + "learning_rate": 9.556311622306528e-07, + "loss": 0.6714, + "step": 61884 + }, + { + "epoch": 1.59, + "learning_rate": 9.556035190431044e-07, + "loss": 0.5049, + "step": 61885 + }, + { + "epoch": 1.59, + "learning_rate": 9.555758758895481e-07, + "loss": 0.7695, + "step": 61886 + }, + { + "epoch": 1.59, + "learning_rate": 9.555482327700053e-07, + "loss": 0.4585, + "step": 61887 + }, + { + "epoch": 1.59, + "learning_rate": 9.555205896844973e-07, + "loss": 0.748, + "step": 61888 + }, + { + "epoch": 1.59, + "learning_rate": 9.554929466330454e-07, + "loss": 0.7432, + "step": 61889 + }, + { + "epoch": 1.59, + "learning_rate": 9.554653036156704e-07, + "loss": 0.6494, + "step": 61890 + }, + { + "epoch": 1.59, + "learning_rate": 9.554376606323933e-07, + "loss": 0.4958, + "step": 61891 + }, + { + "epoch": 1.59, + "learning_rate": 9.554100176832356e-07, + "loss": 0.6357, + "step": 61892 + }, + { + "epoch": 1.59, + "learning_rate": 9.553823747682184e-07, + "loss": 0.7529, + "step": 61893 + }, + { + "epoch": 1.59, + "learning_rate": 9.55354731887363e-07, + "loss": 0.7178, + "step": 61894 + }, + { + "epoch": 1.59, + "learning_rate": 9.553270890406903e-07, + "loss": 0.4391, + "step": 61895 + }, + { + "epoch": 1.59, + "learning_rate": 9.552994462282217e-07, + "loss": 0.7012, + "step": 61896 + }, + { + "epoch": 1.59, + "learning_rate": 9.55271803449978e-07, + "loss": 0.5161, + "step": 61897 + }, + { + "epoch": 1.59, + "learning_rate": 9.552441607059809e-07, + "loss": 0.6562, + "step": 61898 + }, + { + "epoch": 1.59, + "learning_rate": 9.55216517996251e-07, + "loss": 0.6904, + "step": 61899 + }, + { + "epoch": 1.59, + "learning_rate": 9.551888753208105e-07, + "loss": 0.5854, + "step": 61900 + }, + { + "epoch": 1.59, + "learning_rate": 9.55161232679679e-07, + "loss": 0.6338, + "step": 61901 + }, + { + "epoch": 1.59, + "learning_rate": 9.55133590072879e-07, + "loss": 0.5752, + "step": 61902 + }, + { + "epoch": 1.59, + "learning_rate": 9.55105947500431e-07, + "loss": 0.583, + "step": 61903 + }, + { + "epoch": 1.59, + "learning_rate": 9.55078304962356e-07, + "loss": 0.6204, + "step": 61904 + }, + { + "epoch": 1.59, + "learning_rate": 9.550506624586757e-07, + "loss": 0.7412, + "step": 61905 + }, + { + "epoch": 1.59, + "learning_rate": 9.55023019989411e-07, + "loss": 0.6504, + "step": 61906 + }, + { + "epoch": 1.59, + "learning_rate": 9.549953775545832e-07, + "loss": 0.7695, + "step": 61907 + }, + { + "epoch": 1.59, + "learning_rate": 9.549677351542133e-07, + "loss": 0.5449, + "step": 61908 + }, + { + "epoch": 1.59, + "learning_rate": 9.549400927883225e-07, + "loss": 0.4722, + "step": 61909 + }, + { + "epoch": 1.59, + "learning_rate": 9.549124504569321e-07, + "loss": 0.5757, + "step": 61910 + }, + { + "epoch": 1.59, + "learning_rate": 9.548848081600633e-07, + "loss": 0.7598, + "step": 61911 + }, + { + "epoch": 1.59, + "learning_rate": 9.548571658977369e-07, + "loss": 0.5757, + "step": 61912 + }, + { + "epoch": 1.59, + "learning_rate": 9.548295236699745e-07, + "loss": 0.6338, + "step": 61913 + }, + { + "epoch": 1.59, + "learning_rate": 9.548018814767966e-07, + "loss": 0.4045, + "step": 61914 + }, + { + "epoch": 1.59, + "learning_rate": 9.547742393182252e-07, + "loss": 0.5967, + "step": 61915 + }, + { + "epoch": 1.59, + "learning_rate": 9.547465971942809e-07, + "loss": 0.7109, + "step": 61916 + }, + { + "epoch": 1.59, + "learning_rate": 9.547189551049853e-07, + "loss": 0.7559, + "step": 61917 + }, + { + "epoch": 1.59, + "learning_rate": 9.54691313050359e-07, + "loss": 0.5425, + "step": 61918 + }, + { + "epoch": 1.59, + "learning_rate": 9.546636710304237e-07, + "loss": 0.6348, + "step": 61919 + }, + { + "epoch": 1.59, + "learning_rate": 9.546360290452005e-07, + "loss": 0.667, + "step": 61920 + }, + { + "epoch": 1.59, + "learning_rate": 9.546083870947103e-07, + "loss": 0.5874, + "step": 61921 + }, + { + "epoch": 1.59, + "learning_rate": 9.545807451789741e-07, + "loss": 0.6689, + "step": 61922 + }, + { + "epoch": 1.59, + "learning_rate": 9.545531032980135e-07, + "loss": 0.6738, + "step": 61923 + }, + { + "epoch": 1.59, + "learning_rate": 9.545254614518494e-07, + "loss": 0.6274, + "step": 61924 + }, + { + "epoch": 1.59, + "learning_rate": 9.544978196405032e-07, + "loss": 0.5903, + "step": 61925 + }, + { + "epoch": 1.59, + "learning_rate": 9.544701778639957e-07, + "loss": 0.772, + "step": 61926 + }, + { + "epoch": 1.59, + "learning_rate": 9.544425361223487e-07, + "loss": 0.5024, + "step": 61927 + }, + { + "epoch": 1.59, + "learning_rate": 9.544148944155825e-07, + "loss": 0.6436, + "step": 61928 + }, + { + "epoch": 1.59, + "learning_rate": 9.54387252743719e-07, + "loss": 0.4553, + "step": 61929 + }, + { + "epoch": 1.59, + "learning_rate": 9.543596111067794e-07, + "loss": 0.751, + "step": 61930 + }, + { + "epoch": 1.59, + "learning_rate": 9.54331969504784e-07, + "loss": 0.6943, + "step": 61931 + }, + { + "epoch": 1.59, + "learning_rate": 9.543043279377549e-07, + "loss": 0.6914, + "step": 61932 + }, + { + "epoch": 1.59, + "learning_rate": 9.542766864057125e-07, + "loss": 0.8125, + "step": 61933 + }, + { + "epoch": 1.59, + "learning_rate": 9.542490449086785e-07, + "loss": 0.5635, + "step": 61934 + }, + { + "epoch": 1.59, + "learning_rate": 9.542214034466739e-07, + "loss": 0.8135, + "step": 61935 + }, + { + "epoch": 1.59, + "learning_rate": 9.541937620197197e-07, + "loss": 0.6279, + "step": 61936 + }, + { + "epoch": 1.59, + "learning_rate": 9.541661206278374e-07, + "loss": 0.6494, + "step": 61937 + }, + { + "epoch": 1.59, + "learning_rate": 9.54138479271048e-07, + "loss": 0.707, + "step": 61938 + }, + { + "epoch": 1.59, + "learning_rate": 9.541108379493727e-07, + "loss": 0.6792, + "step": 61939 + }, + { + "epoch": 1.59, + "learning_rate": 9.54083196662833e-07, + "loss": 0.5474, + "step": 61940 + }, + { + "epoch": 1.59, + "learning_rate": 9.540555554114491e-07, + "loss": 0.5957, + "step": 61941 + }, + { + "epoch": 1.59, + "learning_rate": 9.54027914195243e-07, + "loss": 0.5557, + "step": 61942 + }, + { + "epoch": 1.59, + "learning_rate": 9.540002730142354e-07, + "loss": 0.6719, + "step": 61943 + }, + { + "epoch": 1.59, + "learning_rate": 9.539726318684479e-07, + "loss": 0.5684, + "step": 61944 + }, + { + "epoch": 1.59, + "learning_rate": 9.539449907579012e-07, + "loss": 0.5581, + "step": 61945 + }, + { + "epoch": 1.59, + "learning_rate": 9.539173496826169e-07, + "loss": 0.4077, + "step": 61946 + }, + { + "epoch": 1.59, + "learning_rate": 9.538897086426158e-07, + "loss": 0.6055, + "step": 61947 + }, + { + "epoch": 1.59, + "learning_rate": 9.538620676379194e-07, + "loss": 0.7637, + "step": 61948 + }, + { + "epoch": 1.59, + "learning_rate": 9.538344266685483e-07, + "loss": 0.7617, + "step": 61949 + }, + { + "epoch": 1.59, + "learning_rate": 9.538067857345248e-07, + "loss": 0.5361, + "step": 61950 + }, + { + "epoch": 1.59, + "learning_rate": 9.537791448358689e-07, + "loss": 0.7031, + "step": 61951 + }, + { + "epoch": 1.59, + "learning_rate": 9.537515039726022e-07, + "loss": 0.6865, + "step": 61952 + }, + { + "epoch": 1.59, + "learning_rate": 9.537238631447458e-07, + "loss": 0.8125, + "step": 61953 + }, + { + "epoch": 1.59, + "learning_rate": 9.536962223523207e-07, + "loss": 0.5786, + "step": 61954 + }, + { + "epoch": 1.59, + "learning_rate": 9.536685815953488e-07, + "loss": 0.7129, + "step": 61955 + }, + { + "epoch": 1.59, + "learning_rate": 9.536409408738505e-07, + "loss": 0.6855, + "step": 61956 + }, + { + "epoch": 1.59, + "learning_rate": 9.536133001878471e-07, + "loss": 0.7051, + "step": 61957 + }, + { + "epoch": 1.59, + "learning_rate": 9.5358565953736e-07, + "loss": 0.7417, + "step": 61958 + }, + { + "epoch": 1.59, + "learning_rate": 9.535580189224099e-07, + "loss": 0.439, + "step": 61959 + }, + { + "epoch": 1.59, + "learning_rate": 9.535303783430188e-07, + "loss": 0.522, + "step": 61960 + }, + { + "epoch": 1.59, + "learning_rate": 9.535027377992072e-07, + "loss": 0.636, + "step": 61961 + }, + { + "epoch": 1.59, + "learning_rate": 9.534750972909962e-07, + "loss": 0.6343, + "step": 61962 + }, + { + "epoch": 1.59, + "learning_rate": 9.534474568184073e-07, + "loss": 0.5181, + "step": 61963 + }, + { + "epoch": 1.59, + "learning_rate": 9.534198163814614e-07, + "loss": 0.4386, + "step": 61964 + }, + { + "epoch": 1.59, + "learning_rate": 9.533921759801801e-07, + "loss": 0.7871, + "step": 61965 + }, + { + "epoch": 1.59, + "learning_rate": 9.53364535614584e-07, + "loss": 0.6021, + "step": 61966 + }, + { + "epoch": 1.59, + "learning_rate": 9.533368952846946e-07, + "loss": 0.7139, + "step": 61967 + }, + { + "epoch": 1.59, + "learning_rate": 9.53309254990533e-07, + "loss": 0.8203, + "step": 61968 + }, + { + "epoch": 1.59, + "learning_rate": 9.532816147321203e-07, + "loss": 0.7188, + "step": 61969 + }, + { + "epoch": 1.59, + "learning_rate": 9.532539745094782e-07, + "loss": 0.5815, + "step": 61970 + }, + { + "epoch": 1.59, + "learning_rate": 9.532263343226268e-07, + "loss": 0.7373, + "step": 61971 + }, + { + "epoch": 1.59, + "learning_rate": 9.531986941715882e-07, + "loss": 0.5698, + "step": 61972 + }, + { + "epoch": 1.59, + "learning_rate": 9.53171054056383e-07, + "loss": 0.6641, + "step": 61973 + }, + { + "epoch": 1.59, + "learning_rate": 9.531434139770325e-07, + "loss": 0.6514, + "step": 61974 + }, + { + "epoch": 1.59, + "learning_rate": 9.531157739335582e-07, + "loss": 0.6436, + "step": 61975 + }, + { + "epoch": 1.59, + "learning_rate": 9.530881339259806e-07, + "loss": 0.7969, + "step": 61976 + }, + { + "epoch": 1.59, + "learning_rate": 9.530604939543215e-07, + "loss": 0.7363, + "step": 61977 + }, + { + "epoch": 1.59, + "learning_rate": 9.530328540186018e-07, + "loss": 0.605, + "step": 61978 + }, + { + "epoch": 1.59, + "learning_rate": 9.530052141188427e-07, + "loss": 0.6494, + "step": 61979 + }, + { + "epoch": 1.59, + "learning_rate": 9.529775742550656e-07, + "loss": 0.7627, + "step": 61980 + }, + { + "epoch": 1.59, + "learning_rate": 9.529499344272911e-07, + "loss": 0.5078, + "step": 61981 + }, + { + "epoch": 1.59, + "learning_rate": 9.529222946355408e-07, + "loss": 0.4312, + "step": 61982 + }, + { + "epoch": 1.59, + "learning_rate": 9.528946548798356e-07, + "loss": 0.6235, + "step": 61983 + }, + { + "epoch": 1.59, + "learning_rate": 9.528670151601968e-07, + "loss": 0.8359, + "step": 61984 + }, + { + "epoch": 1.59, + "learning_rate": 9.528393754766455e-07, + "loss": 0.7617, + "step": 61985 + }, + { + "epoch": 1.59, + "learning_rate": 9.528117358292031e-07, + "loss": 0.4795, + "step": 61986 + }, + { + "epoch": 1.59, + "learning_rate": 9.527840962178904e-07, + "loss": 0.6157, + "step": 61987 + }, + { + "epoch": 1.59, + "learning_rate": 9.527564566427289e-07, + "loss": 0.5508, + "step": 61988 + }, + { + "epoch": 1.59, + "learning_rate": 9.527288171037395e-07, + "loss": 0.6047, + "step": 61989 + }, + { + "epoch": 1.59, + "learning_rate": 9.527011776009441e-07, + "loss": 0.752, + "step": 61990 + }, + { + "epoch": 1.59, + "learning_rate": 9.526735381343624e-07, + "loss": 0.5918, + "step": 61991 + }, + { + "epoch": 1.59, + "learning_rate": 9.526458987040169e-07, + "loss": 0.6865, + "step": 61992 + }, + { + "epoch": 1.59, + "learning_rate": 9.526182593099279e-07, + "loss": 0.6367, + "step": 61993 + }, + { + "epoch": 1.59, + "learning_rate": 9.525906199521171e-07, + "loss": 0.667, + "step": 61994 + }, + { + "epoch": 1.59, + "learning_rate": 9.525629806306053e-07, + "loss": 0.6484, + "step": 61995 + }, + { + "epoch": 1.59, + "learning_rate": 9.525353413454141e-07, + "loss": 0.5154, + "step": 61996 + }, + { + "epoch": 1.59, + "learning_rate": 9.525077020965641e-07, + "loss": 0.5786, + "step": 61997 + }, + { + "epoch": 1.59, + "learning_rate": 9.52480062884077e-07, + "loss": 0.4736, + "step": 61998 + }, + { + "epoch": 1.59, + "learning_rate": 9.524524237079736e-07, + "loss": 0.624, + "step": 61999 + }, + { + "epoch": 1.59, + "learning_rate": 9.524247845682756e-07, + "loss": 0.604, + "step": 62000 + }, + { + "epoch": 1.59, + "learning_rate": 9.523971454650035e-07, + "loss": 0.7588, + "step": 62001 + }, + { + "epoch": 1.59, + "learning_rate": 9.523695063981784e-07, + "loss": 0.6621, + "step": 62002 + }, + { + "epoch": 1.59, + "learning_rate": 9.523418673678222e-07, + "loss": 0.3718, + "step": 62003 + }, + { + "epoch": 1.59, + "learning_rate": 9.523142283739553e-07, + "loss": 0.4351, + "step": 62004 + }, + { + "epoch": 1.59, + "learning_rate": 9.522865894165994e-07, + "loss": 0.5708, + "step": 62005 + }, + { + "epoch": 1.59, + "learning_rate": 9.522589504957754e-07, + "loss": 0.626, + "step": 62006 + }, + { + "epoch": 1.59, + "learning_rate": 9.522313116115046e-07, + "loss": 0.6748, + "step": 62007 + }, + { + "epoch": 1.59, + "learning_rate": 9.52203672763808e-07, + "loss": 0.5635, + "step": 62008 + }, + { + "epoch": 1.59, + "learning_rate": 9.521760339527069e-07, + "loss": 0.5776, + "step": 62009 + }, + { + "epoch": 1.59, + "learning_rate": 9.521483951782228e-07, + "loss": 0.5581, + "step": 62010 + }, + { + "epoch": 1.59, + "learning_rate": 9.521207564403761e-07, + "loss": 0.7393, + "step": 62011 + }, + { + "epoch": 1.59, + "learning_rate": 9.520931177391883e-07, + "loss": 0.5786, + "step": 62012 + }, + { + "epoch": 1.59, + "learning_rate": 9.520654790746806e-07, + "loss": 0.8105, + "step": 62013 + }, + { + "epoch": 1.59, + "learning_rate": 9.52037840446874e-07, + "loss": 0.6504, + "step": 62014 + }, + { + "epoch": 1.59, + "learning_rate": 9.520102018557902e-07, + "loss": 0.5103, + "step": 62015 + }, + { + "epoch": 1.59, + "learning_rate": 9.519825633014495e-07, + "loss": 0.7295, + "step": 62016 + }, + { + "epoch": 1.59, + "learning_rate": 9.51954924783874e-07, + "loss": 0.7275, + "step": 62017 + }, + { + "epoch": 1.59, + "learning_rate": 9.519272863030841e-07, + "loss": 0.7217, + "step": 62018 + }, + { + "epoch": 1.59, + "learning_rate": 9.518996478591015e-07, + "loss": 0.4031, + "step": 62019 + }, + { + "epoch": 1.59, + "learning_rate": 9.518720094519472e-07, + "loss": 0.4856, + "step": 62020 + }, + { + "epoch": 1.59, + "learning_rate": 9.518443710816421e-07, + "loss": 0.5181, + "step": 62021 + }, + { + "epoch": 1.59, + "learning_rate": 9.518167327482077e-07, + "loss": 0.7529, + "step": 62022 + }, + { + "epoch": 1.59, + "learning_rate": 9.517890944516646e-07, + "loss": 0.6865, + "step": 62023 + }, + { + "epoch": 1.59, + "learning_rate": 9.517614561920347e-07, + "loss": 0.752, + "step": 62024 + }, + { + "epoch": 1.59, + "learning_rate": 9.517338179693387e-07, + "loss": 0.7417, + "step": 62025 + }, + { + "epoch": 1.59, + "learning_rate": 9.51706179783598e-07, + "loss": 0.6826, + "step": 62026 + }, + { + "epoch": 1.59, + "learning_rate": 9.516785416348335e-07, + "loss": 0.6216, + "step": 62027 + }, + { + "epoch": 1.59, + "learning_rate": 9.516509035230668e-07, + "loss": 0.6602, + "step": 62028 + }, + { + "epoch": 1.59, + "learning_rate": 9.516232654483187e-07, + "loss": 0.5713, + "step": 62029 + }, + { + "epoch": 1.59, + "learning_rate": 9.515956274106107e-07, + "loss": 0.7285, + "step": 62030 + }, + { + "epoch": 1.59, + "learning_rate": 9.515679894099633e-07, + "loss": 0.5693, + "step": 62031 + }, + { + "epoch": 1.59, + "learning_rate": 9.515403514463982e-07, + "loss": 0.5225, + "step": 62032 + }, + { + "epoch": 1.59, + "learning_rate": 9.515127135199362e-07, + "loss": 0.7168, + "step": 62033 + }, + { + "epoch": 1.59, + "learning_rate": 9.51485075630599e-07, + "loss": 0.5249, + "step": 62034 + }, + { + "epoch": 1.59, + "learning_rate": 9.514574377784072e-07, + "loss": 0.4597, + "step": 62035 + }, + { + "epoch": 1.59, + "learning_rate": 9.514297999633822e-07, + "loss": 0.665, + "step": 62036 + }, + { + "epoch": 1.59, + "learning_rate": 9.514021621855452e-07, + "loss": 0.4883, + "step": 62037 + }, + { + "epoch": 1.59, + "learning_rate": 9.513745244449175e-07, + "loss": 0.6348, + "step": 62038 + }, + { + "epoch": 1.59, + "learning_rate": 9.513468867415199e-07, + "loss": 0.6064, + "step": 62039 + }, + { + "epoch": 1.59, + "learning_rate": 9.513192490753741e-07, + "loss": 0.4253, + "step": 62040 + }, + { + "epoch": 1.59, + "learning_rate": 9.512916114465009e-07, + "loss": 0.7183, + "step": 62041 + }, + { + "epoch": 1.59, + "learning_rate": 9.51263973854921e-07, + "loss": 0.5698, + "step": 62042 + }, + { + "epoch": 1.59, + "learning_rate": 9.512363363006563e-07, + "loss": 0.6777, + "step": 62043 + }, + { + "epoch": 1.59, + "learning_rate": 9.512086987837276e-07, + "loss": 0.7793, + "step": 62044 + }, + { + "epoch": 1.59, + "learning_rate": 9.511810613041562e-07, + "loss": 0.7285, + "step": 62045 + }, + { + "epoch": 1.59, + "learning_rate": 9.511534238619634e-07, + "loss": 0.6299, + "step": 62046 + }, + { + "epoch": 1.59, + "learning_rate": 9.511257864571699e-07, + "loss": 0.7017, + "step": 62047 + }, + { + "epoch": 1.59, + "learning_rate": 9.510981490897973e-07, + "loss": 0.6729, + "step": 62048 + }, + { + "epoch": 1.59, + "learning_rate": 9.510705117598664e-07, + "loss": 0.644, + "step": 62049 + }, + { + "epoch": 1.59, + "learning_rate": 9.510428744673991e-07, + "loss": 0.4419, + "step": 62050 + }, + { + "epoch": 1.59, + "learning_rate": 9.510152372124156e-07, + "loss": 0.5234, + "step": 62051 + }, + { + "epoch": 1.59, + "learning_rate": 9.509875999949374e-07, + "loss": 0.4214, + "step": 62052 + }, + { + "epoch": 1.59, + "learning_rate": 9.509599628149859e-07, + "loss": 0.7002, + "step": 62053 + }, + { + "epoch": 1.59, + "learning_rate": 9.50932325672582e-07, + "loss": 0.7891, + "step": 62054 + }, + { + "epoch": 1.59, + "learning_rate": 9.509046885677471e-07, + "loss": 0.6855, + "step": 62055 + }, + { + "epoch": 1.59, + "learning_rate": 9.508770515005019e-07, + "loss": 0.5908, + "step": 62056 + }, + { + "epoch": 1.59, + "learning_rate": 9.508494144708683e-07, + "loss": 0.6172, + "step": 62057 + }, + { + "epoch": 1.59, + "learning_rate": 9.508217774788667e-07, + "loss": 0.8174, + "step": 62058 + }, + { + "epoch": 1.59, + "learning_rate": 9.50794140524519e-07, + "loss": 0.6216, + "step": 62059 + }, + { + "epoch": 1.59, + "learning_rate": 9.507665036078458e-07, + "loss": 0.7432, + "step": 62060 + }, + { + "epoch": 1.59, + "learning_rate": 9.507388667288683e-07, + "loss": 0.6499, + "step": 62061 + }, + { + "epoch": 1.59, + "learning_rate": 9.507112298876079e-07, + "loss": 0.657, + "step": 62062 + }, + { + "epoch": 1.59, + "learning_rate": 9.506835930840856e-07, + "loss": 0.6641, + "step": 62063 + }, + { + "epoch": 1.59, + "learning_rate": 9.506559563183226e-07, + "loss": 0.7412, + "step": 62064 + }, + { + "epoch": 1.59, + "learning_rate": 9.506283195903401e-07, + "loss": 0.6216, + "step": 62065 + }, + { + "epoch": 1.59, + "learning_rate": 9.506006829001591e-07, + "loss": 0.7539, + "step": 62066 + }, + { + "epoch": 1.59, + "learning_rate": 9.50573046247801e-07, + "loss": 0.7598, + "step": 62067 + }, + { + "epoch": 1.59, + "learning_rate": 9.505454096332866e-07, + "loss": 0.4873, + "step": 62068 + }, + { + "epoch": 1.59, + "learning_rate": 9.505177730566378e-07, + "loss": 0.5879, + "step": 62069 + }, + { + "epoch": 1.59, + "learning_rate": 9.504901365178751e-07, + "loss": 0.7422, + "step": 62070 + }, + { + "epoch": 1.59, + "learning_rate": 9.504625000170195e-07, + "loss": 0.6348, + "step": 62071 + }, + { + "epoch": 1.59, + "learning_rate": 9.504348635540928e-07, + "loss": 0.7539, + "step": 62072 + }, + { + "epoch": 1.59, + "learning_rate": 9.504072271291157e-07, + "loss": 0.4907, + "step": 62073 + }, + { + "epoch": 1.59, + "learning_rate": 9.503795907421096e-07, + "loss": 0.6641, + "step": 62074 + }, + { + "epoch": 1.59, + "learning_rate": 9.503519543930953e-07, + "loss": 0.5186, + "step": 62075 + }, + { + "epoch": 1.59, + "learning_rate": 9.503243180820946e-07, + "loss": 0.876, + "step": 62076 + }, + { + "epoch": 1.59, + "learning_rate": 9.502966818091281e-07, + "loss": 0.5786, + "step": 62077 + }, + { + "epoch": 1.59, + "learning_rate": 9.502690455742172e-07, + "loss": 0.5942, + "step": 62078 + }, + { + "epoch": 1.59, + "learning_rate": 9.502414093773832e-07, + "loss": 0.5503, + "step": 62079 + }, + { + "epoch": 1.59, + "learning_rate": 9.502137732186467e-07, + "loss": 0.4368, + "step": 62080 + }, + { + "epoch": 1.59, + "learning_rate": 9.501861370980295e-07, + "loss": 0.6499, + "step": 62081 + }, + { + "epoch": 1.59, + "learning_rate": 9.501585010155524e-07, + "loss": 0.5222, + "step": 62082 + }, + { + "epoch": 1.59, + "learning_rate": 9.501308649712365e-07, + "loss": 0.5591, + "step": 62083 + }, + { + "epoch": 1.59, + "learning_rate": 9.501032289651033e-07, + "loss": 0.5967, + "step": 62084 + }, + { + "epoch": 1.59, + "learning_rate": 9.500755929971734e-07, + "loss": 0.8379, + "step": 62085 + }, + { + "epoch": 1.59, + "learning_rate": 9.500479570674687e-07, + "loss": 0.7114, + "step": 62086 + }, + { + "epoch": 1.59, + "learning_rate": 9.500203211760099e-07, + "loss": 0.7212, + "step": 62087 + }, + { + "epoch": 1.59, + "learning_rate": 9.499926853228182e-07, + "loss": 0.6475, + "step": 62088 + }, + { + "epoch": 1.59, + "learning_rate": 9.499650495079151e-07, + "loss": 0.6152, + "step": 62089 + }, + { + "epoch": 1.59, + "learning_rate": 9.499374137313209e-07, + "loss": 0.7656, + "step": 62090 + }, + { + "epoch": 1.59, + "learning_rate": 9.499097779930578e-07, + "loss": 0.604, + "step": 62091 + }, + { + "epoch": 1.59, + "learning_rate": 9.498821422931462e-07, + "loss": 0.5112, + "step": 62092 + }, + { + "epoch": 1.59, + "learning_rate": 9.498545066316076e-07, + "loss": 0.5586, + "step": 62093 + }, + { + "epoch": 1.59, + "learning_rate": 9.498268710084631e-07, + "loss": 0.4924, + "step": 62094 + }, + { + "epoch": 1.59, + "learning_rate": 9.497992354237338e-07, + "loss": 0.5645, + "step": 62095 + }, + { + "epoch": 1.59, + "learning_rate": 9.497715998774409e-07, + "loss": 0.6113, + "step": 62096 + }, + { + "epoch": 1.59, + "learning_rate": 9.497439643696057e-07, + "loss": 0.6035, + "step": 62097 + }, + { + "epoch": 1.59, + "learning_rate": 9.497163289002491e-07, + "loss": 0.7219, + "step": 62098 + }, + { + "epoch": 1.59, + "learning_rate": 9.49688693469393e-07, + "loss": 0.7056, + "step": 62099 + }, + { + "epoch": 1.59, + "learning_rate": 9.496610580770573e-07, + "loss": 0.8398, + "step": 62100 + }, + { + "epoch": 1.59, + "learning_rate": 9.496334227232641e-07, + "loss": 0.4678, + "step": 62101 + }, + { + "epoch": 1.59, + "learning_rate": 9.496057874080339e-07, + "loss": 0.6689, + "step": 62102 + }, + { + "epoch": 1.59, + "learning_rate": 9.495781521313886e-07, + "loss": 0.7041, + "step": 62103 + }, + { + "epoch": 1.59, + "learning_rate": 9.495505168933487e-07, + "loss": 0.5391, + "step": 62104 + }, + { + "epoch": 1.59, + "learning_rate": 9.495228816939359e-07, + "loss": 0.6069, + "step": 62105 + }, + { + "epoch": 1.59, + "learning_rate": 9.494952465331708e-07, + "loss": 0.6572, + "step": 62106 + }, + { + "epoch": 1.59, + "learning_rate": 9.494676114110753e-07, + "loss": 0.6106, + "step": 62107 + }, + { + "epoch": 1.59, + "learning_rate": 9.494399763276697e-07, + "loss": 0.5853, + "step": 62108 + }, + { + "epoch": 1.59, + "learning_rate": 9.494123412829761e-07, + "loss": 0.5288, + "step": 62109 + }, + { + "epoch": 1.59, + "learning_rate": 9.493847062770148e-07, + "loss": 0.7861, + "step": 62110 + }, + { + "epoch": 1.59, + "learning_rate": 9.493570713098073e-07, + "loss": 0.5864, + "step": 62111 + }, + { + "epoch": 1.59, + "learning_rate": 9.493294363813749e-07, + "loss": 0.6741, + "step": 62112 + }, + { + "epoch": 1.59, + "learning_rate": 9.493018014917383e-07, + "loss": 0.5498, + "step": 62113 + }, + { + "epoch": 1.59, + "learning_rate": 9.492741666409193e-07, + "loss": 0.376, + "step": 62114 + }, + { + "epoch": 1.59, + "learning_rate": 9.492465318289386e-07, + "loss": 0.7656, + "step": 62115 + }, + { + "epoch": 1.59, + "learning_rate": 9.492188970558175e-07, + "loss": 0.666, + "step": 62116 + }, + { + "epoch": 1.59, + "learning_rate": 9.491912623215771e-07, + "loss": 0.6953, + "step": 62117 + }, + { + "epoch": 1.59, + "learning_rate": 9.491636276262388e-07, + "loss": 0.7178, + "step": 62118 + }, + { + "epoch": 1.59, + "learning_rate": 9.491359929698237e-07, + "loss": 0.4448, + "step": 62119 + }, + { + "epoch": 1.59, + "learning_rate": 9.491083583523527e-07, + "loss": 0.7173, + "step": 62120 + }, + { + "epoch": 1.59, + "learning_rate": 9.49080723773847e-07, + "loss": 0.6177, + "step": 62121 + }, + { + "epoch": 1.59, + "learning_rate": 9.490530892343278e-07, + "loss": 0.6191, + "step": 62122 + }, + { + "epoch": 1.59, + "learning_rate": 9.490254547338162e-07, + "loss": 0.425, + "step": 62123 + }, + { + "epoch": 1.59, + "learning_rate": 9.489978202723338e-07, + "loss": 0.5879, + "step": 62124 + }, + { + "epoch": 1.59, + "learning_rate": 9.489701858499011e-07, + "loss": 0.6875, + "step": 62125 + }, + { + "epoch": 1.59, + "learning_rate": 9.489425514665398e-07, + "loss": 0.707, + "step": 62126 + }, + { + "epoch": 1.59, + "learning_rate": 9.489149171222705e-07, + "loss": 0.4863, + "step": 62127 + }, + { + "epoch": 1.59, + "learning_rate": 9.488872828171152e-07, + "loss": 0.7061, + "step": 62128 + }, + { + "epoch": 1.59, + "learning_rate": 9.488596485510945e-07, + "loss": 0.6055, + "step": 62129 + }, + { + "epoch": 1.59, + "learning_rate": 9.488320143242293e-07, + "loss": 0.3149, + "step": 62130 + }, + { + "epoch": 1.59, + "learning_rate": 9.488043801365413e-07, + "loss": 0.6509, + "step": 62131 + }, + { + "epoch": 1.59, + "learning_rate": 9.487767459880513e-07, + "loss": 0.6338, + "step": 62132 + }, + { + "epoch": 1.59, + "learning_rate": 9.487491118787807e-07, + "loss": 0.7109, + "step": 62133 + }, + { + "epoch": 1.59, + "learning_rate": 9.487214778087503e-07, + "loss": 0.5107, + "step": 62134 + }, + { + "epoch": 1.59, + "learning_rate": 9.486938437779818e-07, + "loss": 0.6108, + "step": 62135 + }, + { + "epoch": 1.59, + "learning_rate": 9.486662097864961e-07, + "loss": 0.6392, + "step": 62136 + }, + { + "epoch": 1.59, + "learning_rate": 9.48638575834314e-07, + "loss": 0.6436, + "step": 62137 + }, + { + "epoch": 1.59, + "learning_rate": 9.486109419214572e-07, + "loss": 0.5251, + "step": 62138 + }, + { + "epoch": 1.59, + "learning_rate": 9.485833080479469e-07, + "loss": 0.4761, + "step": 62139 + }, + { + "epoch": 1.59, + "learning_rate": 9.485556742138036e-07, + "loss": 0.6616, + "step": 62140 + }, + { + "epoch": 1.59, + "learning_rate": 9.48528040419049e-07, + "loss": 0.6074, + "step": 62141 + }, + { + "epoch": 1.59, + "learning_rate": 9.485004066637039e-07, + "loss": 0.6045, + "step": 62142 + }, + { + "epoch": 1.59, + "learning_rate": 9.4847277294779e-07, + "loss": 0.6763, + "step": 62143 + }, + { + "epoch": 1.59, + "learning_rate": 9.484451392713278e-07, + "loss": 0.5664, + "step": 62144 + }, + { + "epoch": 1.59, + "learning_rate": 9.48417505634339e-07, + "loss": 0.5552, + "step": 62145 + }, + { + "epoch": 1.59, + "learning_rate": 9.483898720368442e-07, + "loss": 0.7441, + "step": 62146 + }, + { + "epoch": 1.59, + "learning_rate": 9.483622384788654e-07, + "loss": 0.7002, + "step": 62147 + }, + { + "epoch": 1.59, + "learning_rate": 9.483346049604229e-07, + "loss": 0.6262, + "step": 62148 + }, + { + "epoch": 1.59, + "learning_rate": 9.483069714815387e-07, + "loss": 0.5972, + "step": 62149 + }, + { + "epoch": 1.59, + "learning_rate": 9.482793380422332e-07, + "loss": 0.7285, + "step": 62150 + }, + { + "epoch": 1.59, + "learning_rate": 9.482517046425276e-07, + "loss": 0.5947, + "step": 62151 + }, + { + "epoch": 1.59, + "learning_rate": 9.482240712824435e-07, + "loss": 0.6187, + "step": 62152 + }, + { + "epoch": 1.59, + "learning_rate": 9.48196437962002e-07, + "loss": 0.6123, + "step": 62153 + }, + { + "epoch": 1.59, + "learning_rate": 9.481688046812237e-07, + "loss": 0.5947, + "step": 62154 + }, + { + "epoch": 1.59, + "learning_rate": 9.481411714401305e-07, + "loss": 0.6333, + "step": 62155 + }, + { + "epoch": 1.59, + "learning_rate": 9.48113538238743e-07, + "loss": 0.7129, + "step": 62156 + }, + { + "epoch": 1.59, + "learning_rate": 9.480859050770827e-07, + "loss": 0.6699, + "step": 62157 + }, + { + "epoch": 1.59, + "learning_rate": 9.480582719551705e-07, + "loss": 0.8203, + "step": 62158 + }, + { + "epoch": 1.59, + "learning_rate": 9.480306388730281e-07, + "loss": 0.4741, + "step": 62159 + }, + { + "epoch": 1.59, + "learning_rate": 9.480030058306761e-07, + "loss": 0.6353, + "step": 62160 + }, + { + "epoch": 1.59, + "learning_rate": 9.479753728281355e-07, + "loss": 0.5079, + "step": 62161 + }, + { + "epoch": 1.59, + "learning_rate": 9.47947739865428e-07, + "loss": 0.6914, + "step": 62162 + }, + { + "epoch": 1.59, + "learning_rate": 9.479201069425743e-07, + "loss": 0.5161, + "step": 62163 + }, + { + "epoch": 1.59, + "learning_rate": 9.47892474059596e-07, + "loss": 0.6543, + "step": 62164 + }, + { + "epoch": 1.59, + "learning_rate": 9.478648412165139e-07, + "loss": 0.7803, + "step": 62165 + }, + { + "epoch": 1.59, + "learning_rate": 9.478372084133495e-07, + "loss": 0.6807, + "step": 62166 + }, + { + "epoch": 1.59, + "learning_rate": 9.478095756501235e-07, + "loss": 0.7363, + "step": 62167 + }, + { + "epoch": 1.59, + "learning_rate": 9.477819429268574e-07, + "loss": 0.7637, + "step": 62168 + }, + { + "epoch": 1.59, + "learning_rate": 9.477543102435726e-07, + "loss": 0.5029, + "step": 62169 + }, + { + "epoch": 1.59, + "learning_rate": 9.477266776002894e-07, + "loss": 0.6733, + "step": 62170 + }, + { + "epoch": 1.59, + "learning_rate": 9.476990449970297e-07, + "loss": 0.7148, + "step": 62171 + }, + { + "epoch": 1.59, + "learning_rate": 9.476714124338147e-07, + "loss": 0.708, + "step": 62172 + }, + { + "epoch": 1.59, + "learning_rate": 9.476437799106648e-07, + "loss": 0.6548, + "step": 62173 + }, + { + "epoch": 1.59, + "learning_rate": 9.47616147427602e-07, + "loss": 0.79, + "step": 62174 + }, + { + "epoch": 1.59, + "learning_rate": 9.475885149846469e-07, + "loss": 0.5215, + "step": 62175 + }, + { + "epoch": 1.59, + "learning_rate": 9.47560882581821e-07, + "loss": 0.6704, + "step": 62176 + }, + { + "epoch": 1.59, + "learning_rate": 9.47533250219145e-07, + "loss": 0.5735, + "step": 62177 + }, + { + "epoch": 1.59, + "learning_rate": 9.475056178966408e-07, + "loss": 0.5908, + "step": 62178 + }, + { + "epoch": 1.59, + "learning_rate": 9.474779856143292e-07, + "loss": 0.5645, + "step": 62179 + }, + { + "epoch": 1.59, + "learning_rate": 9.47450353372231e-07, + "loss": 0.6006, + "step": 62180 + }, + { + "epoch": 1.59, + "learning_rate": 9.474227211703678e-07, + "loss": 0.6216, + "step": 62181 + }, + { + "epoch": 1.59, + "learning_rate": 9.473950890087604e-07, + "loss": 0.5889, + "step": 62182 + }, + { + "epoch": 1.59, + "learning_rate": 9.473674568874304e-07, + "loss": 0.6094, + "step": 62183 + }, + { + "epoch": 1.59, + "learning_rate": 9.473398248063984e-07, + "loss": 0.6523, + "step": 62184 + }, + { + "epoch": 1.59, + "learning_rate": 9.473121927656862e-07, + "loss": 0.6118, + "step": 62185 + }, + { + "epoch": 1.59, + "learning_rate": 9.472845607653144e-07, + "loss": 0.5469, + "step": 62186 + }, + { + "epoch": 1.59, + "learning_rate": 9.472569288053045e-07, + "loss": 0.5233, + "step": 62187 + }, + { + "epoch": 1.59, + "learning_rate": 9.472292968856774e-07, + "loss": 0.6924, + "step": 62188 + }, + { + "epoch": 1.59, + "learning_rate": 9.47201665006455e-07, + "loss": 0.7363, + "step": 62189 + }, + { + "epoch": 1.59, + "learning_rate": 9.471740331676573e-07, + "loss": 0.6577, + "step": 62190 + }, + { + "epoch": 1.59, + "learning_rate": 9.471464013693062e-07, + "loss": 0.6621, + "step": 62191 + }, + { + "epoch": 1.59, + "learning_rate": 9.471187696114225e-07, + "loss": 0.5979, + "step": 62192 + }, + { + "epoch": 1.59, + "learning_rate": 9.470911378940276e-07, + "loss": 0.6504, + "step": 62193 + }, + { + "epoch": 1.59, + "learning_rate": 9.470635062171425e-07, + "loss": 0.7129, + "step": 62194 + }, + { + "epoch": 1.59, + "learning_rate": 9.470358745807886e-07, + "loss": 0.6553, + "step": 62195 + }, + { + "epoch": 1.59, + "learning_rate": 9.470082429849867e-07, + "loss": 0.7246, + "step": 62196 + }, + { + "epoch": 1.59, + "learning_rate": 9.469806114297583e-07, + "loss": 0.516, + "step": 62197 + }, + { + "epoch": 1.59, + "learning_rate": 9.469529799151243e-07, + "loss": 0.5913, + "step": 62198 + }, + { + "epoch": 1.59, + "learning_rate": 9.469253484411064e-07, + "loss": 0.6587, + "step": 62199 + }, + { + "epoch": 1.59, + "learning_rate": 9.46897717007725e-07, + "loss": 0.7559, + "step": 62200 + }, + { + "epoch": 1.59, + "learning_rate": 9.468700856150014e-07, + "loss": 0.5911, + "step": 62201 + }, + { + "epoch": 1.59, + "learning_rate": 9.468424542629572e-07, + "loss": 0.519, + "step": 62202 + }, + { + "epoch": 1.59, + "learning_rate": 9.46814822951613e-07, + "loss": 0.6729, + "step": 62203 + }, + { + "epoch": 1.59, + "learning_rate": 9.467871916809906e-07, + "loss": 0.6777, + "step": 62204 + }, + { + "epoch": 1.59, + "learning_rate": 9.467595604511104e-07, + "loss": 0.6719, + "step": 62205 + }, + { + "epoch": 1.59, + "learning_rate": 9.467319292619941e-07, + "loss": 0.7734, + "step": 62206 + }, + { + "epoch": 1.59, + "learning_rate": 9.467042981136627e-07, + "loss": 0.6387, + "step": 62207 + }, + { + "epoch": 1.59, + "learning_rate": 9.466766670061375e-07, + "loss": 0.6836, + "step": 62208 + }, + { + "epoch": 1.59, + "learning_rate": 9.466490359394399e-07, + "loss": 0.6221, + "step": 62209 + }, + { + "epoch": 1.59, + "learning_rate": 9.466214049135904e-07, + "loss": 0.8076, + "step": 62210 + }, + { + "epoch": 1.59, + "learning_rate": 9.465937739286101e-07, + "loss": 0.6211, + "step": 62211 + }, + { + "epoch": 1.59, + "learning_rate": 9.465661429845207e-07, + "loss": 0.4642, + "step": 62212 + }, + { + "epoch": 1.59, + "learning_rate": 9.465385120813429e-07, + "loss": 0.6885, + "step": 62213 + }, + { + "epoch": 1.59, + "learning_rate": 9.465108812190985e-07, + "loss": 0.6548, + "step": 62214 + }, + { + "epoch": 1.59, + "learning_rate": 9.464832503978079e-07, + "loss": 0.3291, + "step": 62215 + }, + { + "epoch": 1.59, + "learning_rate": 9.464556196174929e-07, + "loss": 0.5129, + "step": 62216 + }, + { + "epoch": 1.59, + "learning_rate": 9.464279888781741e-07, + "loss": 0.5498, + "step": 62217 + }, + { + "epoch": 1.59, + "learning_rate": 9.464003581798731e-07, + "loss": 0.751, + "step": 62218 + }, + { + "epoch": 1.59, + "learning_rate": 9.463727275226113e-07, + "loss": 0.6016, + "step": 62219 + }, + { + "epoch": 1.59, + "learning_rate": 9.463450969064088e-07, + "loss": 0.6738, + "step": 62220 + }, + { + "epoch": 1.59, + "learning_rate": 9.463174663312878e-07, + "loss": 0.7598, + "step": 62221 + }, + { + "epoch": 1.59, + "learning_rate": 9.462898357972687e-07, + "loss": 0.6841, + "step": 62222 + }, + { + "epoch": 1.59, + "learning_rate": 9.462622053043733e-07, + "loss": 0.5264, + "step": 62223 + }, + { + "epoch": 1.59, + "learning_rate": 9.462345748526222e-07, + "loss": 0.5146, + "step": 62224 + }, + { + "epoch": 1.59, + "learning_rate": 9.46206944442037e-07, + "loss": 0.4814, + "step": 62225 + }, + { + "epoch": 1.59, + "learning_rate": 9.461793140726387e-07, + "loss": 0.7461, + "step": 62226 + }, + { + "epoch": 1.59, + "learning_rate": 9.46151683744448e-07, + "loss": 0.6582, + "step": 62227 + }, + { + "epoch": 1.59, + "learning_rate": 9.46124053457487e-07, + "loss": 0.7559, + "step": 62228 + }, + { + "epoch": 1.59, + "learning_rate": 9.460964232117764e-07, + "loss": 0.5396, + "step": 62229 + }, + { + "epoch": 1.59, + "learning_rate": 9.460687930073369e-07, + "loss": 0.44, + "step": 62230 + }, + { + "epoch": 1.6, + "learning_rate": 9.460411628441904e-07, + "loss": 0.5938, + "step": 62231 + }, + { + "epoch": 1.6, + "learning_rate": 9.460135327223573e-07, + "loss": 0.7402, + "step": 62232 + }, + { + "epoch": 1.6, + "learning_rate": 9.459859026418593e-07, + "loss": 0.4114, + "step": 62233 + }, + { + "epoch": 1.6, + "learning_rate": 9.459582726027174e-07, + "loss": 0.6602, + "step": 62234 + }, + { + "epoch": 1.6, + "learning_rate": 9.459306426049528e-07, + "loss": 0.7427, + "step": 62235 + }, + { + "epoch": 1.6, + "learning_rate": 9.459030126485865e-07, + "loss": 0.6016, + "step": 62236 + }, + { + "epoch": 1.6, + "learning_rate": 9.4587538273364e-07, + "loss": 0.6504, + "step": 62237 + }, + { + "epoch": 1.6, + "learning_rate": 9.458477528601339e-07, + "loss": 0.7285, + "step": 62238 + }, + { + "epoch": 1.6, + "learning_rate": 9.458201230280903e-07, + "loss": 0.5547, + "step": 62239 + }, + { + "epoch": 1.6, + "learning_rate": 9.457924932375295e-07, + "loss": 0.4927, + "step": 62240 + }, + { + "epoch": 1.6, + "learning_rate": 9.457648634884726e-07, + "loss": 0.7529, + "step": 62241 + }, + { + "epoch": 1.6, + "learning_rate": 9.457372337809413e-07, + "loss": 0.5869, + "step": 62242 + }, + { + "epoch": 1.6, + "learning_rate": 9.457096041149562e-07, + "loss": 0.5132, + "step": 62243 + }, + { + "epoch": 1.6, + "learning_rate": 9.456819744905391e-07, + "loss": 0.8008, + "step": 62244 + }, + { + "epoch": 1.6, + "learning_rate": 9.456543449077108e-07, + "loss": 0.7197, + "step": 62245 + }, + { + "epoch": 1.6, + "learning_rate": 9.456267153664922e-07, + "loss": 0.668, + "step": 62246 + }, + { + "epoch": 1.6, + "learning_rate": 9.455990858669049e-07, + "loss": 0.6802, + "step": 62247 + }, + { + "epoch": 1.6, + "learning_rate": 9.455714564089697e-07, + "loss": 0.7568, + "step": 62248 + }, + { + "epoch": 1.6, + "learning_rate": 9.455438269927085e-07, + "loss": 0.5898, + "step": 62249 + }, + { + "epoch": 1.6, + "learning_rate": 9.455161976181415e-07, + "loss": 0.582, + "step": 62250 + }, + { + "epoch": 1.6, + "learning_rate": 9.454885682852901e-07, + "loss": 0.7129, + "step": 62251 + }, + { + "epoch": 1.6, + "learning_rate": 9.454609389941758e-07, + "loss": 0.5752, + "step": 62252 + }, + { + "epoch": 1.6, + "learning_rate": 9.454333097448194e-07, + "loss": 0.7539, + "step": 62253 + }, + { + "epoch": 1.6, + "learning_rate": 9.454056805372423e-07, + "loss": 0.7549, + "step": 62254 + }, + { + "epoch": 1.6, + "learning_rate": 9.453780513714654e-07, + "loss": 0.494, + "step": 62255 + }, + { + "epoch": 1.6, + "learning_rate": 9.453504222475103e-07, + "loss": 0.5854, + "step": 62256 + }, + { + "epoch": 1.6, + "learning_rate": 9.453227931653975e-07, + "loss": 0.5444, + "step": 62257 + }, + { + "epoch": 1.6, + "learning_rate": 9.452951641251489e-07, + "loss": 0.6299, + "step": 62258 + }, + { + "epoch": 1.6, + "learning_rate": 9.452675351267853e-07, + "loss": 0.667, + "step": 62259 + }, + { + "epoch": 1.6, + "learning_rate": 9.452399061703275e-07, + "loss": 0.8516, + "step": 62260 + }, + { + "epoch": 1.6, + "learning_rate": 9.452122772557973e-07, + "loss": 0.9287, + "step": 62261 + }, + { + "epoch": 1.6, + "learning_rate": 9.451846483832155e-07, + "loss": 0.564, + "step": 62262 + }, + { + "epoch": 1.6, + "learning_rate": 9.451570195526029e-07, + "loss": 0.5381, + "step": 62263 + }, + { + "epoch": 1.6, + "learning_rate": 9.451293907639814e-07, + "loss": 0.5542, + "step": 62264 + }, + { + "epoch": 1.6, + "learning_rate": 9.451017620173717e-07, + "loss": 0.5717, + "step": 62265 + }, + { + "epoch": 1.6, + "learning_rate": 9.450741333127951e-07, + "loss": 0.6484, + "step": 62266 + }, + { + "epoch": 1.6, + "learning_rate": 9.450465046502726e-07, + "loss": 0.4825, + "step": 62267 + }, + { + "epoch": 1.6, + "learning_rate": 9.450188760298256e-07, + "loss": 0.6038, + "step": 62268 + }, + { + "epoch": 1.6, + "learning_rate": 9.449912474514754e-07, + "loss": 0.3607, + "step": 62269 + }, + { + "epoch": 1.6, + "learning_rate": 9.449636189152425e-07, + "loss": 0.5649, + "step": 62270 + }, + { + "epoch": 1.6, + "learning_rate": 9.449359904211484e-07, + "loss": 0.6152, + "step": 62271 + }, + { + "epoch": 1.6, + "learning_rate": 9.449083619692143e-07, + "loss": 0.6211, + "step": 62272 + }, + { + "epoch": 1.6, + "learning_rate": 9.448807335594614e-07, + "loss": 0.7266, + "step": 62273 + }, + { + "epoch": 1.6, + "learning_rate": 9.448531051919106e-07, + "loss": 0.5273, + "step": 62274 + }, + { + "epoch": 1.6, + "learning_rate": 9.448254768665836e-07, + "loss": 0.7275, + "step": 62275 + }, + { + "epoch": 1.6, + "learning_rate": 9.447978485835008e-07, + "loss": 0.7976, + "step": 62276 + }, + { + "epoch": 1.6, + "learning_rate": 9.44770220342684e-07, + "loss": 0.8037, + "step": 62277 + }, + { + "epoch": 1.6, + "learning_rate": 9.44742592144154e-07, + "loss": 0.5215, + "step": 62278 + }, + { + "epoch": 1.6, + "learning_rate": 9.447149639879326e-07, + "loss": 0.7197, + "step": 62279 + }, + { + "epoch": 1.6, + "learning_rate": 9.446873358740398e-07, + "loss": 0.4393, + "step": 62280 + }, + { + "epoch": 1.6, + "learning_rate": 9.446597078024976e-07, + "loss": 0.4438, + "step": 62281 + }, + { + "epoch": 1.6, + "learning_rate": 9.446320797733267e-07, + "loss": 0.5527, + "step": 62282 + }, + { + "epoch": 1.6, + "learning_rate": 9.446044517865487e-07, + "loss": 0.6274, + "step": 62283 + }, + { + "epoch": 1.6, + "learning_rate": 9.445768238421841e-07, + "loss": 0.8359, + "step": 62284 + }, + { + "epoch": 1.6, + "learning_rate": 9.445491959402549e-07, + "loss": 0.7295, + "step": 62285 + }, + { + "epoch": 1.6, + "learning_rate": 9.445215680807817e-07, + "loss": 0.7061, + "step": 62286 + }, + { + "epoch": 1.6, + "learning_rate": 9.444939402637858e-07, + "loss": 0.7432, + "step": 62287 + }, + { + "epoch": 1.6, + "learning_rate": 9.444663124892882e-07, + "loss": 0.6855, + "step": 62288 + }, + { + "epoch": 1.6, + "learning_rate": 9.444386847573107e-07, + "loss": 0.457, + "step": 62289 + }, + { + "epoch": 1.6, + "learning_rate": 9.444110570678736e-07, + "loss": 0.6562, + "step": 62290 + }, + { + "epoch": 1.6, + "learning_rate": 9.443834294209983e-07, + "loss": 0.6138, + "step": 62291 + }, + { + "epoch": 1.6, + "learning_rate": 9.443558018167062e-07, + "loss": 0.6313, + "step": 62292 + }, + { + "epoch": 1.6, + "learning_rate": 9.443281742550179e-07, + "loss": 0.4912, + "step": 62293 + }, + { + "epoch": 1.6, + "learning_rate": 9.443005467359555e-07, + "loss": 0.4243, + "step": 62294 + }, + { + "epoch": 1.6, + "learning_rate": 9.442729192595392e-07, + "loss": 0.5923, + "step": 62295 + }, + { + "epoch": 1.6, + "learning_rate": 9.442452918257908e-07, + "loss": 0.4585, + "step": 62296 + }, + { + "epoch": 1.6, + "learning_rate": 9.442176644347311e-07, + "loss": 0.7324, + "step": 62297 + }, + { + "epoch": 1.6, + "learning_rate": 9.441900370863815e-07, + "loss": 0.6387, + "step": 62298 + }, + { + "epoch": 1.6, + "learning_rate": 9.441624097807632e-07, + "loss": 0.6152, + "step": 62299 + }, + { + "epoch": 1.6, + "learning_rate": 9.441347825178972e-07, + "loss": 0.8389, + "step": 62300 + }, + { + "epoch": 1.6, + "learning_rate": 9.441071552978042e-07, + "loss": 0.6826, + "step": 62301 + }, + { + "epoch": 1.6, + "learning_rate": 9.44079528120506e-07, + "loss": 0.687, + "step": 62302 + }, + { + "epoch": 1.6, + "learning_rate": 9.440519009860233e-07, + "loss": 0.6333, + "step": 62303 + }, + { + "epoch": 1.6, + "learning_rate": 9.440242738943778e-07, + "loss": 0.5781, + "step": 62304 + }, + { + "epoch": 1.6, + "learning_rate": 9.4399664684559e-07, + "loss": 0.666, + "step": 62305 + }, + { + "epoch": 1.6, + "learning_rate": 9.439690198396817e-07, + "loss": 0.5825, + "step": 62306 + }, + { + "epoch": 1.6, + "learning_rate": 9.439413928766735e-07, + "loss": 0.666, + "step": 62307 + }, + { + "epoch": 1.6, + "learning_rate": 9.43913765956587e-07, + "loss": 0.6118, + "step": 62308 + }, + { + "epoch": 1.6, + "learning_rate": 9.438861390794434e-07, + "loss": 0.5776, + "step": 62309 + }, + { + "epoch": 1.6, + "learning_rate": 9.438585122452631e-07, + "loss": 0.6328, + "step": 62310 + }, + { + "epoch": 1.6, + "learning_rate": 9.438308854540681e-07, + "loss": 0.4883, + "step": 62311 + }, + { + "epoch": 1.6, + "learning_rate": 9.43803258705879e-07, + "loss": 0.5649, + "step": 62312 + }, + { + "epoch": 1.6, + "learning_rate": 9.437756320007172e-07, + "loss": 0.6807, + "step": 62313 + }, + { + "epoch": 1.6, + "learning_rate": 9.437480053386038e-07, + "loss": 0.4487, + "step": 62314 + }, + { + "epoch": 1.6, + "learning_rate": 9.4372037871956e-07, + "loss": 0.5539, + "step": 62315 + }, + { + "epoch": 1.6, + "learning_rate": 9.43692752143607e-07, + "loss": 0.5591, + "step": 62316 + }, + { + "epoch": 1.6, + "learning_rate": 9.436651256107656e-07, + "loss": 0.7109, + "step": 62317 + }, + { + "epoch": 1.6, + "learning_rate": 9.436374991210575e-07, + "loss": 0.5071, + "step": 62318 + }, + { + "epoch": 1.6, + "learning_rate": 9.436098726745039e-07, + "loss": 0.4346, + "step": 62319 + }, + { + "epoch": 1.6, + "learning_rate": 9.43582246271125e-07, + "loss": 0.6816, + "step": 62320 + }, + { + "epoch": 1.6, + "learning_rate": 9.435546199109428e-07, + "loss": 0.686, + "step": 62321 + }, + { + "epoch": 1.6, + "learning_rate": 9.435269935939782e-07, + "loss": 0.5586, + "step": 62322 + }, + { + "epoch": 1.6, + "learning_rate": 9.434993673202524e-07, + "loss": 0.5476, + "step": 62323 + }, + { + "epoch": 1.6, + "learning_rate": 9.434717410897865e-07, + "loss": 0.5679, + "step": 62324 + }, + { + "epoch": 1.6, + "learning_rate": 9.434441149026018e-07, + "loss": 0.6875, + "step": 62325 + }, + { + "epoch": 1.6, + "learning_rate": 9.434164887587191e-07, + "loss": 0.7256, + "step": 62326 + }, + { + "epoch": 1.6, + "learning_rate": 9.4338886265816e-07, + "loss": 0.6401, + "step": 62327 + }, + { + "epoch": 1.6, + "learning_rate": 9.433612366009453e-07, + "loss": 0.5649, + "step": 62328 + }, + { + "epoch": 1.6, + "learning_rate": 9.433336105870968e-07, + "loss": 0.6753, + "step": 62329 + }, + { + "epoch": 1.6, + "learning_rate": 9.433059846166348e-07, + "loss": 0.613, + "step": 62330 + }, + { + "epoch": 1.6, + "learning_rate": 9.432783586895806e-07, + "loss": 0.6064, + "step": 62331 + }, + { + "epoch": 1.6, + "learning_rate": 9.432507328059558e-07, + "loss": 0.5549, + "step": 62332 + }, + { + "epoch": 1.6, + "learning_rate": 9.432231069657811e-07, + "loss": 0.7334, + "step": 62333 + }, + { + "epoch": 1.6, + "learning_rate": 9.431954811690781e-07, + "loss": 0.5986, + "step": 62334 + }, + { + "epoch": 1.6, + "learning_rate": 9.431678554158677e-07, + "loss": 0.6904, + "step": 62335 + }, + { + "epoch": 1.6, + "learning_rate": 9.431402297061707e-07, + "loss": 0.5833, + "step": 62336 + }, + { + "epoch": 1.6, + "learning_rate": 9.43112604040009e-07, + "loss": 0.5358, + "step": 62337 + }, + { + "epoch": 1.6, + "learning_rate": 9.430849784174031e-07, + "loss": 0.4495, + "step": 62338 + }, + { + "epoch": 1.6, + "learning_rate": 9.430573528383747e-07, + "loss": 0.7246, + "step": 62339 + }, + { + "epoch": 1.6, + "learning_rate": 9.430297273029446e-07, + "loss": 0.7539, + "step": 62340 + }, + { + "epoch": 1.6, + "learning_rate": 9.430021018111338e-07, + "loss": 0.6914, + "step": 62341 + }, + { + "epoch": 1.6, + "learning_rate": 9.429744763629639e-07, + "loss": 0.6294, + "step": 62342 + }, + { + "epoch": 1.6, + "learning_rate": 9.429468509584556e-07, + "loss": 0.6187, + "step": 62343 + }, + { + "epoch": 1.6, + "learning_rate": 9.429192255976304e-07, + "loss": 0.6436, + "step": 62344 + }, + { + "epoch": 1.6, + "learning_rate": 9.428916002805092e-07, + "loss": 0.6167, + "step": 62345 + }, + { + "epoch": 1.6, + "learning_rate": 9.428639750071135e-07, + "loss": 0.478, + "step": 62346 + }, + { + "epoch": 1.6, + "learning_rate": 9.428363497774639e-07, + "loss": 0.7715, + "step": 62347 + }, + { + "epoch": 1.6, + "learning_rate": 9.428087245915822e-07, + "loss": 0.4993, + "step": 62348 + }, + { + "epoch": 1.6, + "learning_rate": 9.427810994494894e-07, + "loss": 0.6816, + "step": 62349 + }, + { + "epoch": 1.6, + "learning_rate": 9.427534743512061e-07, + "loss": 0.7061, + "step": 62350 + }, + { + "epoch": 1.6, + "learning_rate": 9.42725849296754e-07, + "loss": 0.6714, + "step": 62351 + }, + { + "epoch": 1.6, + "learning_rate": 9.426982242861541e-07, + "loss": 0.6143, + "step": 62352 + }, + { + "epoch": 1.6, + "learning_rate": 9.426705993194273e-07, + "loss": 0.6787, + "step": 62353 + }, + { + "epoch": 1.6, + "learning_rate": 9.426429743965952e-07, + "loss": 0.6621, + "step": 62354 + }, + { + "epoch": 1.6, + "learning_rate": 9.426153495176786e-07, + "loss": 0.3123, + "step": 62355 + }, + { + "epoch": 1.6, + "learning_rate": 9.425877246826988e-07, + "loss": 0.605, + "step": 62356 + }, + { + "epoch": 1.6, + "learning_rate": 9.42560099891677e-07, + "loss": 0.6187, + "step": 62357 + }, + { + "epoch": 1.6, + "learning_rate": 9.425324751446345e-07, + "loss": 0.8174, + "step": 62358 + }, + { + "epoch": 1.6, + "learning_rate": 9.425048504415922e-07, + "loss": 0.6304, + "step": 62359 + }, + { + "epoch": 1.6, + "learning_rate": 9.424772257825709e-07, + "loss": 0.4212, + "step": 62360 + }, + { + "epoch": 1.6, + "learning_rate": 9.424496011675925e-07, + "loss": 0.6738, + "step": 62361 + }, + { + "epoch": 1.6, + "learning_rate": 9.424219765966774e-07, + "loss": 0.6631, + "step": 62362 + }, + { + "epoch": 1.6, + "learning_rate": 9.423943520698476e-07, + "loss": 0.4971, + "step": 62363 + }, + { + "epoch": 1.6, + "learning_rate": 9.423667275871234e-07, + "loss": 0.4692, + "step": 62364 + }, + { + "epoch": 1.6, + "learning_rate": 9.423391031485267e-07, + "loss": 0.6416, + "step": 62365 + }, + { + "epoch": 1.6, + "learning_rate": 9.423114787540781e-07, + "loss": 0.6026, + "step": 62366 + }, + { + "epoch": 1.6, + "learning_rate": 9.42283854403799e-07, + "loss": 0.7383, + "step": 62367 + }, + { + "epoch": 1.6, + "learning_rate": 9.422562300977108e-07, + "loss": 0.6016, + "step": 62368 + }, + { + "epoch": 1.6, + "learning_rate": 9.422286058358341e-07, + "loss": 0.6807, + "step": 62369 + }, + { + "epoch": 1.6, + "learning_rate": 9.422009816181901e-07, + "loss": 0.5537, + "step": 62370 + }, + { + "epoch": 1.6, + "learning_rate": 9.421733574448003e-07, + "loss": 0.6035, + "step": 62371 + }, + { + "epoch": 1.6, + "learning_rate": 9.421457333156856e-07, + "loss": 0.3418, + "step": 62372 + }, + { + "epoch": 1.6, + "learning_rate": 9.421181092308674e-07, + "loss": 0.4365, + "step": 62373 + }, + { + "epoch": 1.6, + "learning_rate": 9.420904851903665e-07, + "loss": 0.5728, + "step": 62374 + }, + { + "epoch": 1.6, + "learning_rate": 9.420628611942045e-07, + "loss": 0.6885, + "step": 62375 + }, + { + "epoch": 1.6, + "learning_rate": 9.420352372424021e-07, + "loss": 0.5122, + "step": 62376 + }, + { + "epoch": 1.6, + "learning_rate": 9.420076133349808e-07, + "loss": 0.4312, + "step": 62377 + }, + { + "epoch": 1.6, + "learning_rate": 9.419799894719619e-07, + "loss": 0.6689, + "step": 62378 + }, + { + "epoch": 1.6, + "learning_rate": 9.419523656533658e-07, + "loss": 0.5518, + "step": 62379 + }, + { + "epoch": 1.6, + "learning_rate": 9.419247418792143e-07, + "loss": 0.6021, + "step": 62380 + }, + { + "epoch": 1.6, + "learning_rate": 9.418971181495281e-07, + "loss": 0.4268, + "step": 62381 + }, + { + "epoch": 1.6, + "learning_rate": 9.418694944643289e-07, + "loss": 0.71, + "step": 62382 + }, + { + "epoch": 1.6, + "learning_rate": 9.418418708236373e-07, + "loss": 0.6699, + "step": 62383 + }, + { + "epoch": 1.6, + "learning_rate": 9.418142472274749e-07, + "loss": 0.6133, + "step": 62384 + }, + { + "epoch": 1.6, + "learning_rate": 9.417866236758625e-07, + "loss": 0.7559, + "step": 62385 + }, + { + "epoch": 1.6, + "learning_rate": 9.417590001688215e-07, + "loss": 0.6699, + "step": 62386 + }, + { + "epoch": 1.6, + "learning_rate": 9.417313767063728e-07, + "loss": 0.6064, + "step": 62387 + }, + { + "epoch": 1.6, + "learning_rate": 9.417037532885385e-07, + "loss": 0.4929, + "step": 62388 + }, + { + "epoch": 1.6, + "learning_rate": 9.41676129915338e-07, + "loss": 0.6895, + "step": 62389 + }, + { + "epoch": 1.6, + "learning_rate": 9.416485065867939e-07, + "loss": 0.6719, + "step": 62390 + }, + { + "epoch": 1.6, + "learning_rate": 9.416208833029266e-07, + "loss": 0.4021, + "step": 62391 + }, + { + "epoch": 1.6, + "learning_rate": 9.415932600637576e-07, + "loss": 0.5247, + "step": 62392 + }, + { + "epoch": 1.6, + "learning_rate": 9.415656368693078e-07, + "loss": 0.7705, + "step": 62393 + }, + { + "epoch": 1.6, + "learning_rate": 9.415380137195987e-07, + "loss": 0.5725, + "step": 62394 + }, + { + "epoch": 1.6, + "learning_rate": 9.41510390614651e-07, + "loss": 0.644, + "step": 62395 + }, + { + "epoch": 1.6, + "learning_rate": 9.414827675544865e-07, + "loss": 0.5498, + "step": 62396 + }, + { + "epoch": 1.6, + "learning_rate": 9.414551445391256e-07, + "loss": 0.7432, + "step": 62397 + }, + { + "epoch": 1.6, + "learning_rate": 9.414275215685903e-07, + "loss": 0.749, + "step": 62398 + }, + { + "epoch": 1.6, + "learning_rate": 9.413998986429009e-07, + "loss": 0.6328, + "step": 62399 + }, + { + "epoch": 1.6, + "learning_rate": 9.413722757620789e-07, + "loss": 0.6904, + "step": 62400 + }, + { + "epoch": 1.6, + "learning_rate": 9.413446529261455e-07, + "loss": 0.6855, + "step": 62401 + }, + { + "epoch": 1.6, + "learning_rate": 9.413170301351217e-07, + "loss": 0.5386, + "step": 62402 + }, + { + "epoch": 1.6, + "learning_rate": 9.412894073890289e-07, + "loss": 0.6606, + "step": 62403 + }, + { + "epoch": 1.6, + "learning_rate": 9.412617846878879e-07, + "loss": 0.6729, + "step": 62404 + }, + { + "epoch": 1.6, + "learning_rate": 9.412341620317201e-07, + "loss": 0.7998, + "step": 62405 + }, + { + "epoch": 1.6, + "learning_rate": 9.412065394205467e-07, + "loss": 0.7598, + "step": 62406 + }, + { + "epoch": 1.6, + "learning_rate": 9.411789168543887e-07, + "loss": 0.5032, + "step": 62407 + }, + { + "epoch": 1.6, + "learning_rate": 9.411512943332677e-07, + "loss": 0.6104, + "step": 62408 + }, + { + "epoch": 1.6, + "learning_rate": 9.411236718572041e-07, + "loss": 0.7578, + "step": 62409 + }, + { + "epoch": 1.6, + "learning_rate": 9.410960494262192e-07, + "loss": 0.5389, + "step": 62410 + }, + { + "epoch": 1.6, + "learning_rate": 9.410684270403347e-07, + "loss": 0.7188, + "step": 62411 + }, + { + "epoch": 1.6, + "learning_rate": 9.41040804699571e-07, + "loss": 0.7129, + "step": 62412 + }, + { + "epoch": 1.6, + "learning_rate": 9.4101318240395e-07, + "loss": 0.6357, + "step": 62413 + }, + { + "epoch": 1.6, + "learning_rate": 9.409855601534922e-07, + "loss": 0.666, + "step": 62414 + }, + { + "epoch": 1.6, + "learning_rate": 9.409579379482192e-07, + "loss": 0.584, + "step": 62415 + }, + { + "epoch": 1.6, + "learning_rate": 9.409303157881519e-07, + "loss": 0.791, + "step": 62416 + }, + { + "epoch": 1.6, + "learning_rate": 9.409026936733117e-07, + "loss": 0.6216, + "step": 62417 + }, + { + "epoch": 1.6, + "learning_rate": 9.408750716037198e-07, + "loss": 0.4746, + "step": 62418 + }, + { + "epoch": 1.6, + "learning_rate": 9.408474495793968e-07, + "loss": 0.7046, + "step": 62419 + }, + { + "epoch": 1.6, + "learning_rate": 9.408198276003642e-07, + "loss": 0.7314, + "step": 62420 + }, + { + "epoch": 1.6, + "learning_rate": 9.40792205666643e-07, + "loss": 0.562, + "step": 62421 + }, + { + "epoch": 1.6, + "learning_rate": 9.407645837782548e-07, + "loss": 0.627, + "step": 62422 + }, + { + "epoch": 1.6, + "learning_rate": 9.407369619352203e-07, + "loss": 0.6211, + "step": 62423 + }, + { + "epoch": 1.6, + "learning_rate": 9.407093401375607e-07, + "loss": 0.8408, + "step": 62424 + }, + { + "epoch": 1.6, + "learning_rate": 9.406817183852975e-07, + "loss": 0.6602, + "step": 62425 + }, + { + "epoch": 1.6, + "learning_rate": 9.406540966784512e-07, + "loss": 0.6953, + "step": 62426 + }, + { + "epoch": 1.6, + "learning_rate": 9.406264750170436e-07, + "loss": 0.5596, + "step": 62427 + }, + { + "epoch": 1.6, + "learning_rate": 9.405988534010958e-07, + "loss": 0.6699, + "step": 62428 + }, + { + "epoch": 1.6, + "learning_rate": 9.405712318306283e-07, + "loss": 0.6392, + "step": 62429 + }, + { + "epoch": 1.6, + "learning_rate": 9.40543610305663e-07, + "loss": 0.6182, + "step": 62430 + }, + { + "epoch": 1.6, + "learning_rate": 9.405159888262203e-07, + "loss": 0.6357, + "step": 62431 + }, + { + "epoch": 1.6, + "learning_rate": 9.40488367392322e-07, + "loss": 0.6846, + "step": 62432 + }, + { + "epoch": 1.6, + "learning_rate": 9.404607460039889e-07, + "loss": 0.5879, + "step": 62433 + }, + { + "epoch": 1.6, + "learning_rate": 9.404331246612425e-07, + "loss": 0.582, + "step": 62434 + }, + { + "epoch": 1.6, + "learning_rate": 9.404055033641036e-07, + "loss": 0.3972, + "step": 62435 + }, + { + "epoch": 1.6, + "learning_rate": 9.403778821125935e-07, + "loss": 0.6475, + "step": 62436 + }, + { + "epoch": 1.6, + "learning_rate": 9.403502609067331e-07, + "loss": 0.4285, + "step": 62437 + }, + { + "epoch": 1.6, + "learning_rate": 9.403226397465442e-07, + "loss": 0.5962, + "step": 62438 + }, + { + "epoch": 1.6, + "learning_rate": 9.402950186320474e-07, + "loss": 0.4026, + "step": 62439 + }, + { + "epoch": 1.6, + "learning_rate": 9.402673975632637e-07, + "loss": 0.7041, + "step": 62440 + }, + { + "epoch": 1.6, + "learning_rate": 9.402397765402147e-07, + "loss": 0.5796, + "step": 62441 + }, + { + "epoch": 1.6, + "learning_rate": 9.402121555629214e-07, + "loss": 0.6147, + "step": 62442 + }, + { + "epoch": 1.6, + "learning_rate": 9.401845346314046e-07, + "loss": 0.6128, + "step": 62443 + }, + { + "epoch": 1.6, + "learning_rate": 9.401569137456861e-07, + "loss": 0.7412, + "step": 62444 + }, + { + "epoch": 1.6, + "learning_rate": 9.401292929057864e-07, + "loss": 0.6597, + "step": 62445 + }, + { + "epoch": 1.6, + "learning_rate": 9.401016721117271e-07, + "loss": 0.5869, + "step": 62446 + }, + { + "epoch": 1.6, + "learning_rate": 9.40074051363529e-07, + "loss": 0.6069, + "step": 62447 + }, + { + "epoch": 1.6, + "learning_rate": 9.40046430661214e-07, + "loss": 0.708, + "step": 62448 + }, + { + "epoch": 1.6, + "learning_rate": 9.400188100048024e-07, + "loss": 0.3684, + "step": 62449 + }, + { + "epoch": 1.6, + "learning_rate": 9.399911893943154e-07, + "loss": 0.5663, + "step": 62450 + }, + { + "epoch": 1.6, + "learning_rate": 9.399635688297746e-07, + "loss": 0.5349, + "step": 62451 + }, + { + "epoch": 1.6, + "learning_rate": 9.399359483112008e-07, + "loss": 0.4644, + "step": 62452 + }, + { + "epoch": 1.6, + "learning_rate": 9.399083278386154e-07, + "loss": 0.7056, + "step": 62453 + }, + { + "epoch": 1.6, + "learning_rate": 9.398807074120393e-07, + "loss": 0.3629, + "step": 62454 + }, + { + "epoch": 1.6, + "learning_rate": 9.398530870314939e-07, + "loss": 0.6465, + "step": 62455 + }, + { + "epoch": 1.6, + "learning_rate": 9.39825466697e-07, + "loss": 0.7393, + "step": 62456 + }, + { + "epoch": 1.6, + "learning_rate": 9.397978464085793e-07, + "loss": 0.605, + "step": 62457 + }, + { + "epoch": 1.6, + "learning_rate": 9.397702261662527e-07, + "loss": 0.5293, + "step": 62458 + }, + { + "epoch": 1.6, + "learning_rate": 9.397426059700412e-07, + "loss": 0.4128, + "step": 62459 + }, + { + "epoch": 1.6, + "learning_rate": 9.397149858199658e-07, + "loss": 0.5996, + "step": 62460 + }, + { + "epoch": 1.6, + "learning_rate": 9.39687365716048e-07, + "loss": 0.6099, + "step": 62461 + }, + { + "epoch": 1.6, + "learning_rate": 9.396597456583087e-07, + "loss": 0.7441, + "step": 62462 + }, + { + "epoch": 1.6, + "learning_rate": 9.396321256467692e-07, + "loss": 0.5566, + "step": 62463 + }, + { + "epoch": 1.6, + "learning_rate": 9.396045056814504e-07, + "loss": 0.5537, + "step": 62464 + }, + { + "epoch": 1.6, + "learning_rate": 9.39576885762374e-07, + "loss": 0.4681, + "step": 62465 + }, + { + "epoch": 1.6, + "learning_rate": 9.395492658895605e-07, + "loss": 0.5273, + "step": 62466 + }, + { + "epoch": 1.6, + "learning_rate": 9.395216460630317e-07, + "loss": 0.7822, + "step": 62467 + }, + { + "epoch": 1.6, + "learning_rate": 9.394940262828084e-07, + "loss": 0.7217, + "step": 62468 + }, + { + "epoch": 1.6, + "learning_rate": 9.394664065489114e-07, + "loss": 0.6436, + "step": 62469 + }, + { + "epoch": 1.6, + "learning_rate": 9.394387868613625e-07, + "loss": 0.5035, + "step": 62470 + }, + { + "epoch": 1.6, + "learning_rate": 9.394111672201822e-07, + "loss": 0.8418, + "step": 62471 + }, + { + "epoch": 1.6, + "learning_rate": 9.393835476253922e-07, + "loss": 0.6084, + "step": 62472 + }, + { + "epoch": 1.6, + "learning_rate": 9.393559280770133e-07, + "loss": 0.5776, + "step": 62473 + }, + { + "epoch": 1.6, + "learning_rate": 9.393283085750669e-07, + "loss": 0.709, + "step": 62474 + }, + { + "epoch": 1.6, + "learning_rate": 9.393006891195739e-07, + "loss": 0.7578, + "step": 62475 + }, + { + "epoch": 1.6, + "learning_rate": 9.392730697105558e-07, + "loss": 0.5972, + "step": 62476 + }, + { + "epoch": 1.6, + "learning_rate": 9.392454503480332e-07, + "loss": 0.7529, + "step": 62477 + }, + { + "epoch": 1.6, + "learning_rate": 9.392178310320283e-07, + "loss": 0.7344, + "step": 62478 + }, + { + "epoch": 1.6, + "learning_rate": 9.391902117625608e-07, + "loss": 0.4397, + "step": 62479 + }, + { + "epoch": 1.6, + "learning_rate": 9.391625925396527e-07, + "loss": 0.5405, + "step": 62480 + }, + { + "epoch": 1.6, + "learning_rate": 9.391349733633249e-07, + "loss": 0.7588, + "step": 62481 + }, + { + "epoch": 1.6, + "learning_rate": 9.391073542335989e-07, + "loss": 0.6133, + "step": 62482 + }, + { + "epoch": 1.6, + "learning_rate": 9.390797351504953e-07, + "loss": 0.4644, + "step": 62483 + }, + { + "epoch": 1.6, + "learning_rate": 9.390521161140358e-07, + "loss": 0.5037, + "step": 62484 + }, + { + "epoch": 1.6, + "learning_rate": 9.390244971242411e-07, + "loss": 0.6484, + "step": 62485 + }, + { + "epoch": 1.6, + "learning_rate": 9.389968781811327e-07, + "loss": 0.5459, + "step": 62486 + }, + { + "epoch": 1.6, + "learning_rate": 9.389692592847314e-07, + "loss": 0.6768, + "step": 62487 + }, + { + "epoch": 1.6, + "learning_rate": 9.38941640435059e-07, + "loss": 0.6689, + "step": 62488 + }, + { + "epoch": 1.6, + "learning_rate": 9.389140216321359e-07, + "loss": 0.6777, + "step": 62489 + }, + { + "epoch": 1.6, + "learning_rate": 9.388864028759833e-07, + "loss": 0.6616, + "step": 62490 + }, + { + "epoch": 1.6, + "learning_rate": 9.388587841666228e-07, + "loss": 0.4568, + "step": 62491 + }, + { + "epoch": 1.6, + "learning_rate": 9.388311655040751e-07, + "loss": 0.5425, + "step": 62492 + }, + { + "epoch": 1.6, + "learning_rate": 9.388035468883619e-07, + "loss": 0.7109, + "step": 62493 + }, + { + "epoch": 1.6, + "learning_rate": 9.387759283195036e-07, + "loss": 0.5532, + "step": 62494 + }, + { + "epoch": 1.6, + "learning_rate": 9.387483097975221e-07, + "loss": 0.6431, + "step": 62495 + }, + { + "epoch": 1.6, + "learning_rate": 9.387206913224379e-07, + "loss": 0.5234, + "step": 62496 + }, + { + "epoch": 1.6, + "learning_rate": 9.386930728942728e-07, + "loss": 0.5605, + "step": 62497 + }, + { + "epoch": 1.6, + "learning_rate": 9.386654545130477e-07, + "loss": 0.646, + "step": 62498 + }, + { + "epoch": 1.6, + "learning_rate": 9.386378361787835e-07, + "loss": 0.5356, + "step": 62499 + }, + { + "epoch": 1.6, + "learning_rate": 9.386102178915012e-07, + "loss": 0.6792, + "step": 62500 + }, + { + "epoch": 1.6, + "learning_rate": 9.385825996512224e-07, + "loss": 0.6943, + "step": 62501 + }, + { + "epoch": 1.6, + "learning_rate": 9.38554981457968e-07, + "loss": 0.5645, + "step": 62502 + }, + { + "epoch": 1.6, + "learning_rate": 9.385273633117594e-07, + "loss": 0.6304, + "step": 62503 + }, + { + "epoch": 1.6, + "learning_rate": 9.384997452126174e-07, + "loss": 0.6113, + "step": 62504 + }, + { + "epoch": 1.6, + "learning_rate": 9.384721271605634e-07, + "loss": 0.6309, + "step": 62505 + }, + { + "epoch": 1.6, + "learning_rate": 9.384445091556184e-07, + "loss": 0.5864, + "step": 62506 + }, + { + "epoch": 1.6, + "learning_rate": 9.384168911978036e-07, + "loss": 0.676, + "step": 62507 + }, + { + "epoch": 1.6, + "learning_rate": 9.383892732871406e-07, + "loss": 0.4158, + "step": 62508 + }, + { + "epoch": 1.6, + "learning_rate": 9.383616554236496e-07, + "loss": 0.7144, + "step": 62509 + }, + { + "epoch": 1.6, + "learning_rate": 9.383340376073524e-07, + "loss": 0.5322, + "step": 62510 + }, + { + "epoch": 1.6, + "learning_rate": 9.383064198382697e-07, + "loss": 0.6182, + "step": 62511 + }, + { + "epoch": 1.6, + "learning_rate": 9.382788021164234e-07, + "loss": 0.5981, + "step": 62512 + }, + { + "epoch": 1.6, + "learning_rate": 9.382511844418338e-07, + "loss": 0.5715, + "step": 62513 + }, + { + "epoch": 1.6, + "learning_rate": 9.382235668145227e-07, + "loss": 0.7935, + "step": 62514 + }, + { + "epoch": 1.6, + "learning_rate": 9.381959492345109e-07, + "loss": 0.6465, + "step": 62515 + }, + { + "epoch": 1.6, + "learning_rate": 9.381683317018195e-07, + "loss": 0.6553, + "step": 62516 + }, + { + "epoch": 1.6, + "learning_rate": 9.381407142164699e-07, + "loss": 0.6301, + "step": 62517 + }, + { + "epoch": 1.6, + "learning_rate": 9.381130967784833e-07, + "loss": 0.6284, + "step": 62518 + }, + { + "epoch": 1.6, + "learning_rate": 9.380854793878804e-07, + "loss": 0.5215, + "step": 62519 + }, + { + "epoch": 1.6, + "learning_rate": 9.380578620446828e-07, + "loss": 0.4424, + "step": 62520 + }, + { + "epoch": 1.6, + "learning_rate": 9.380302447489111e-07, + "loss": 0.6348, + "step": 62521 + }, + { + "epoch": 1.6, + "learning_rate": 9.38002627500587e-07, + "loss": 0.606, + "step": 62522 + }, + { + "epoch": 1.6, + "learning_rate": 9.379750102997312e-07, + "loss": 0.6421, + "step": 62523 + }, + { + "epoch": 1.6, + "learning_rate": 9.379473931463655e-07, + "loss": 0.53, + "step": 62524 + }, + { + "epoch": 1.6, + "learning_rate": 9.379197760405102e-07, + "loss": 0.6221, + "step": 62525 + }, + { + "epoch": 1.6, + "learning_rate": 9.378921589821872e-07, + "loss": 0.4111, + "step": 62526 + }, + { + "epoch": 1.6, + "learning_rate": 9.37864541971417e-07, + "loss": 0.6475, + "step": 62527 + }, + { + "epoch": 1.6, + "learning_rate": 9.378369250082217e-07, + "loss": 0.7695, + "step": 62528 + }, + { + "epoch": 1.6, + "learning_rate": 9.378093080926215e-07, + "loss": 0.5835, + "step": 62529 + }, + { + "epoch": 1.6, + "learning_rate": 9.377816912246376e-07, + "loss": 0.6328, + "step": 62530 + }, + { + "epoch": 1.6, + "learning_rate": 9.377540744042916e-07, + "loss": 0.5903, + "step": 62531 + }, + { + "epoch": 1.6, + "learning_rate": 9.377264576316044e-07, + "loss": 0.8008, + "step": 62532 + }, + { + "epoch": 1.6, + "learning_rate": 9.37698840906597e-07, + "loss": 0.6807, + "step": 62533 + }, + { + "epoch": 1.6, + "learning_rate": 9.37671224229291e-07, + "loss": 0.4851, + "step": 62534 + }, + { + "epoch": 1.6, + "learning_rate": 9.376436075997071e-07, + "loss": 0.5444, + "step": 62535 + }, + { + "epoch": 1.6, + "learning_rate": 9.376159910178667e-07, + "loss": 0.5239, + "step": 62536 + }, + { + "epoch": 1.6, + "learning_rate": 9.375883744837907e-07, + "loss": 0.5977, + "step": 62537 + }, + { + "epoch": 1.6, + "learning_rate": 9.375607579975009e-07, + "loss": 0.623, + "step": 62538 + }, + { + "epoch": 1.6, + "learning_rate": 9.375331415590178e-07, + "loss": 0.4878, + "step": 62539 + }, + { + "epoch": 1.6, + "learning_rate": 9.375055251683624e-07, + "loss": 0.5181, + "step": 62540 + }, + { + "epoch": 1.6, + "learning_rate": 9.374779088255564e-07, + "loss": 0.6689, + "step": 62541 + }, + { + "epoch": 1.6, + "learning_rate": 9.374502925306203e-07, + "loss": 0.5703, + "step": 62542 + }, + { + "epoch": 1.6, + "learning_rate": 9.374226762835759e-07, + "loss": 0.47, + "step": 62543 + }, + { + "epoch": 1.6, + "learning_rate": 9.37395060084444e-07, + "loss": 0.7549, + "step": 62544 + }, + { + "epoch": 1.6, + "learning_rate": 9.37367443933246e-07, + "loss": 0.6943, + "step": 62545 + }, + { + "epoch": 1.6, + "learning_rate": 9.373398278300027e-07, + "loss": 0.7412, + "step": 62546 + }, + { + "epoch": 1.6, + "learning_rate": 9.373122117747356e-07, + "loss": 0.6158, + "step": 62547 + }, + { + "epoch": 1.6, + "learning_rate": 9.372845957674658e-07, + "loss": 0.4146, + "step": 62548 + }, + { + "epoch": 1.6, + "learning_rate": 9.372569798082142e-07, + "loss": 0.6045, + "step": 62549 + }, + { + "epoch": 1.6, + "learning_rate": 9.372293638970016e-07, + "loss": 0.5801, + "step": 62550 + }, + { + "epoch": 1.6, + "learning_rate": 9.3720174803385e-07, + "loss": 0.7646, + "step": 62551 + }, + { + "epoch": 1.6, + "learning_rate": 9.371741322187799e-07, + "loss": 0.541, + "step": 62552 + }, + { + "epoch": 1.6, + "learning_rate": 9.371465164518128e-07, + "loss": 0.5508, + "step": 62553 + }, + { + "epoch": 1.6, + "learning_rate": 9.371189007329696e-07, + "loss": 0.7441, + "step": 62554 + }, + { + "epoch": 1.6, + "learning_rate": 9.370912850622719e-07, + "loss": 0.8262, + "step": 62555 + }, + { + "epoch": 1.6, + "learning_rate": 9.370636694397401e-07, + "loss": 0.5229, + "step": 62556 + }, + { + "epoch": 1.6, + "learning_rate": 9.370360538653961e-07, + "loss": 0.6157, + "step": 62557 + }, + { + "epoch": 1.6, + "learning_rate": 9.370084383392608e-07, + "loss": 0.6113, + "step": 62558 + }, + { + "epoch": 1.6, + "learning_rate": 9.369808228613548e-07, + "loss": 0.5513, + "step": 62559 + }, + { + "epoch": 1.6, + "learning_rate": 9.369532074316999e-07, + "loss": 0.4302, + "step": 62560 + }, + { + "epoch": 1.6, + "learning_rate": 9.36925592050317e-07, + "loss": 0.6509, + "step": 62561 + }, + { + "epoch": 1.6, + "learning_rate": 9.368979767172272e-07, + "loss": 0.8359, + "step": 62562 + }, + { + "epoch": 1.6, + "learning_rate": 9.368703614324518e-07, + "loss": 0.752, + "step": 62563 + }, + { + "epoch": 1.6, + "learning_rate": 9.368427461960119e-07, + "loss": 0.4971, + "step": 62564 + }, + { + "epoch": 1.6, + "learning_rate": 9.368151310079285e-07, + "loss": 0.791, + "step": 62565 + }, + { + "epoch": 1.6, + "learning_rate": 9.36787515868223e-07, + "loss": 0.6934, + "step": 62566 + }, + { + "epoch": 1.6, + "learning_rate": 9.367599007769161e-07, + "loss": 0.6992, + "step": 62567 + }, + { + "epoch": 1.6, + "learning_rate": 9.367322857340299e-07, + "loss": 0.8164, + "step": 62568 + }, + { + "epoch": 1.6, + "learning_rate": 9.367046707395843e-07, + "loss": 0.5947, + "step": 62569 + }, + { + "epoch": 1.6, + "learning_rate": 9.366770557936012e-07, + "loss": 0.6045, + "step": 62570 + }, + { + "epoch": 1.6, + "learning_rate": 9.366494408961014e-07, + "loss": 0.6265, + "step": 62571 + }, + { + "epoch": 1.6, + "learning_rate": 9.366218260471064e-07, + "loss": 0.7871, + "step": 62572 + }, + { + "epoch": 1.6, + "learning_rate": 9.36594211246637e-07, + "loss": 0.749, + "step": 62573 + }, + { + "epoch": 1.6, + "learning_rate": 9.365665964947146e-07, + "loss": 0.5723, + "step": 62574 + }, + { + "epoch": 1.6, + "learning_rate": 9.3653898179136e-07, + "loss": 0.5381, + "step": 62575 + }, + { + "epoch": 1.6, + "learning_rate": 9.36511367136595e-07, + "loss": 0.6265, + "step": 62576 + }, + { + "epoch": 1.6, + "learning_rate": 9.3648375253044e-07, + "loss": 0.6387, + "step": 62577 + }, + { + "epoch": 1.6, + "learning_rate": 9.364561379729167e-07, + "loss": 0.7891, + "step": 62578 + }, + { + "epoch": 1.6, + "learning_rate": 9.364285234640461e-07, + "loss": 0.6294, + "step": 62579 + }, + { + "epoch": 1.6, + "learning_rate": 9.36400909003849e-07, + "loss": 0.5088, + "step": 62580 + }, + { + "epoch": 1.6, + "learning_rate": 9.363732945923469e-07, + "loss": 0.5864, + "step": 62581 + }, + { + "epoch": 1.6, + "learning_rate": 9.363456802295606e-07, + "loss": 0.5786, + "step": 62582 + }, + { + "epoch": 1.6, + "learning_rate": 9.363180659155119e-07, + "loss": 0.6416, + "step": 62583 + }, + { + "epoch": 1.6, + "learning_rate": 9.362904516502212e-07, + "loss": 0.564, + "step": 62584 + }, + { + "epoch": 1.6, + "learning_rate": 9.3626283743371e-07, + "loss": 0.7695, + "step": 62585 + }, + { + "epoch": 1.6, + "learning_rate": 9.362352232659995e-07, + "loss": 0.5354, + "step": 62586 + }, + { + "epoch": 1.6, + "learning_rate": 9.362076091471109e-07, + "loss": 0.6841, + "step": 62587 + }, + { + "epoch": 1.6, + "learning_rate": 9.361799950770653e-07, + "loss": 0.5435, + "step": 62588 + }, + { + "epoch": 1.6, + "learning_rate": 9.361523810558836e-07, + "loss": 0.7139, + "step": 62589 + }, + { + "epoch": 1.6, + "learning_rate": 9.361247670835868e-07, + "loss": 0.5889, + "step": 62590 + }, + { + "epoch": 1.6, + "learning_rate": 9.360971531601967e-07, + "loss": 0.6133, + "step": 62591 + }, + { + "epoch": 1.6, + "learning_rate": 9.360695392857336e-07, + "loss": 0.3765, + "step": 62592 + }, + { + "epoch": 1.6, + "learning_rate": 9.360419254602195e-07, + "loss": 0.6992, + "step": 62593 + }, + { + "epoch": 1.6, + "learning_rate": 9.36014311683675e-07, + "loss": 0.5952, + "step": 62594 + }, + { + "epoch": 1.6, + "learning_rate": 9.359866979561215e-07, + "loss": 0.6895, + "step": 62595 + }, + { + "epoch": 1.6, + "learning_rate": 9.359590842775798e-07, + "loss": 0.6899, + "step": 62596 + }, + { + "epoch": 1.6, + "learning_rate": 9.359314706480716e-07, + "loss": 0.708, + "step": 62597 + }, + { + "epoch": 1.6, + "learning_rate": 9.35903857067618e-07, + "loss": 0.4442, + "step": 62598 + }, + { + "epoch": 1.6, + "learning_rate": 9.358762435362393e-07, + "loss": 0.6421, + "step": 62599 + }, + { + "epoch": 1.6, + "learning_rate": 9.358486300539575e-07, + "loss": 0.4393, + "step": 62600 + }, + { + "epoch": 1.6, + "learning_rate": 9.358210166207932e-07, + "loss": 0.7256, + "step": 62601 + }, + { + "epoch": 1.6, + "learning_rate": 9.35793403236768e-07, + "loss": 0.6309, + "step": 62602 + }, + { + "epoch": 1.6, + "learning_rate": 9.357657899019027e-07, + "loss": 0.7549, + "step": 62603 + }, + { + "epoch": 1.6, + "learning_rate": 9.357381766162187e-07, + "loss": 0.6938, + "step": 62604 + }, + { + "epoch": 1.6, + "learning_rate": 9.357105633797371e-07, + "loss": 0.6895, + "step": 62605 + }, + { + "epoch": 1.6, + "learning_rate": 9.356829501924788e-07, + "loss": 0.521, + "step": 62606 + }, + { + "epoch": 1.6, + "learning_rate": 9.356553370544653e-07, + "loss": 0.7261, + "step": 62607 + }, + { + "epoch": 1.6, + "learning_rate": 9.356277239657176e-07, + "loss": 0.7461, + "step": 62608 + }, + { + "epoch": 1.6, + "learning_rate": 9.356001109262564e-07, + "loss": 0.4991, + "step": 62609 + }, + { + "epoch": 1.6, + "learning_rate": 9.355724979361036e-07, + "loss": 0.6528, + "step": 62610 + }, + { + "epoch": 1.6, + "learning_rate": 9.355448849952797e-07, + "loss": 0.6743, + "step": 62611 + }, + { + "epoch": 1.6, + "learning_rate": 9.355172721038063e-07, + "loss": 0.3672, + "step": 62612 + }, + { + "epoch": 1.6, + "learning_rate": 9.354896592617041e-07, + "loss": 0.7217, + "step": 62613 + }, + { + "epoch": 1.6, + "learning_rate": 9.354620464689949e-07, + "loss": 0.6743, + "step": 62614 + }, + { + "epoch": 1.6, + "learning_rate": 9.35434433725699e-07, + "loss": 0.8545, + "step": 62615 + }, + { + "epoch": 1.6, + "learning_rate": 9.354068210318383e-07, + "loss": 0.6543, + "step": 62616 + }, + { + "epoch": 1.6, + "learning_rate": 9.353792083874334e-07, + "loss": 0.4402, + "step": 62617 + }, + { + "epoch": 1.6, + "learning_rate": 9.353515957925061e-07, + "loss": 0.6963, + "step": 62618 + }, + { + "epoch": 1.6, + "learning_rate": 9.35323983247077e-07, + "loss": 0.5459, + "step": 62619 + }, + { + "epoch": 1.6, + "learning_rate": 9.35296370751167e-07, + "loss": 0.666, + "step": 62620 + }, + { + "epoch": 1.61, + "learning_rate": 9.352687583047978e-07, + "loss": 0.8037, + "step": 62621 + }, + { + "epoch": 1.61, + "learning_rate": 9.352411459079904e-07, + "loss": 0.6914, + "step": 62622 + }, + { + "epoch": 1.61, + "learning_rate": 9.352135335607657e-07, + "loss": 0.48, + "step": 62623 + }, + { + "epoch": 1.61, + "learning_rate": 9.351859212631452e-07, + "loss": 0.6001, + "step": 62624 + }, + { + "epoch": 1.61, + "learning_rate": 9.351583090151496e-07, + "loss": 0.6316, + "step": 62625 + }, + { + "epoch": 1.61, + "learning_rate": 9.351306968168006e-07, + "loss": 0.6533, + "step": 62626 + }, + { + "epoch": 1.61, + "learning_rate": 9.351030846681187e-07, + "loss": 0.5764, + "step": 62627 + }, + { + "epoch": 1.61, + "learning_rate": 9.350754725691259e-07, + "loss": 0.7617, + "step": 62628 + }, + { + "epoch": 1.61, + "learning_rate": 9.350478605198427e-07, + "loss": 0.749, + "step": 62629 + }, + { + "epoch": 1.61, + "learning_rate": 9.3502024852029e-07, + "loss": 0.7041, + "step": 62630 + }, + { + "epoch": 1.61, + "learning_rate": 9.349926365704895e-07, + "loss": 0.6895, + "step": 62631 + }, + { + "epoch": 1.61, + "learning_rate": 9.349650246704622e-07, + "loss": 0.5076, + "step": 62632 + }, + { + "epoch": 1.61, + "learning_rate": 9.349374128202291e-07, + "loss": 0.6187, + "step": 62633 + }, + { + "epoch": 1.61, + "learning_rate": 9.349098010198113e-07, + "loss": 0.647, + "step": 62634 + }, + { + "epoch": 1.61, + "learning_rate": 9.348821892692304e-07, + "loss": 0.4836, + "step": 62635 + }, + { + "epoch": 1.61, + "learning_rate": 9.348545775685068e-07, + "loss": 0.6357, + "step": 62636 + }, + { + "epoch": 1.61, + "learning_rate": 9.348269659176624e-07, + "loss": 0.5806, + "step": 62637 + }, + { + "epoch": 1.61, + "learning_rate": 9.347993543167182e-07, + "loss": 0.4961, + "step": 62638 + }, + { + "epoch": 1.61, + "learning_rate": 9.347717427656949e-07, + "loss": 0.5923, + "step": 62639 + }, + { + "epoch": 1.61, + "learning_rate": 9.347441312646137e-07, + "loss": 0.4724, + "step": 62640 + }, + { + "epoch": 1.61, + "learning_rate": 9.347165198134961e-07, + "loss": 0.7021, + "step": 62641 + }, + { + "epoch": 1.61, + "learning_rate": 9.346889084123629e-07, + "loss": 0.5493, + "step": 62642 + }, + { + "epoch": 1.61, + "learning_rate": 9.346612970612355e-07, + "loss": 0.6558, + "step": 62643 + }, + { + "epoch": 1.61, + "learning_rate": 9.346336857601349e-07, + "loss": 0.6484, + "step": 62644 + }, + { + "epoch": 1.61, + "learning_rate": 9.346060745090824e-07, + "loss": 0.5571, + "step": 62645 + }, + { + "epoch": 1.61, + "learning_rate": 9.345784633080987e-07, + "loss": 0.6675, + "step": 62646 + }, + { + "epoch": 1.61, + "learning_rate": 9.345508521572059e-07, + "loss": 0.4613, + "step": 62647 + }, + { + "epoch": 1.61, + "learning_rate": 9.345232410564241e-07, + "loss": 0.7056, + "step": 62648 + }, + { + "epoch": 1.61, + "learning_rate": 9.344956300057747e-07, + "loss": 0.4182, + "step": 62649 + }, + { + "epoch": 1.61, + "learning_rate": 9.344680190052793e-07, + "loss": 0.5493, + "step": 62650 + }, + { + "epoch": 1.61, + "learning_rate": 9.344404080549584e-07, + "loss": 0.6792, + "step": 62651 + }, + { + "epoch": 1.61, + "learning_rate": 9.344127971548336e-07, + "loss": 0.7104, + "step": 62652 + }, + { + "epoch": 1.61, + "learning_rate": 9.343851863049259e-07, + "loss": 0.519, + "step": 62653 + }, + { + "epoch": 1.61, + "learning_rate": 9.343575755052565e-07, + "loss": 0.4983, + "step": 62654 + }, + { + "epoch": 1.61, + "learning_rate": 9.343299647558463e-07, + "loss": 0.7021, + "step": 62655 + }, + { + "epoch": 1.61, + "learning_rate": 9.343023540567169e-07, + "loss": 0.6777, + "step": 62656 + }, + { + "epoch": 1.61, + "learning_rate": 9.342747434078894e-07, + "loss": 0.6206, + "step": 62657 + }, + { + "epoch": 1.61, + "learning_rate": 9.342471328093844e-07, + "loss": 0.6729, + "step": 62658 + }, + { + "epoch": 1.61, + "learning_rate": 9.342195222612231e-07, + "loss": 0.7607, + "step": 62659 + }, + { + "epoch": 1.61, + "learning_rate": 9.341919117634272e-07, + "loss": 0.7656, + "step": 62660 + }, + { + "epoch": 1.61, + "learning_rate": 9.341643013160173e-07, + "loss": 0.7715, + "step": 62661 + }, + { + "epoch": 1.61, + "learning_rate": 9.34136690919015e-07, + "loss": 0.6606, + "step": 62662 + }, + { + "epoch": 1.61, + "learning_rate": 9.341090805724408e-07, + "loss": 0.5261, + "step": 62663 + }, + { + "epoch": 1.61, + "learning_rate": 9.340814702763166e-07, + "loss": 0.3267, + "step": 62664 + }, + { + "epoch": 1.61, + "learning_rate": 9.340538600306631e-07, + "loss": 0.5103, + "step": 62665 + }, + { + "epoch": 1.61, + "learning_rate": 9.340262498355016e-07, + "loss": 0.6133, + "step": 62666 + }, + { + "epoch": 1.61, + "learning_rate": 9.339986396908534e-07, + "loss": 0.5127, + "step": 62667 + }, + { + "epoch": 1.61, + "learning_rate": 9.33971029596739e-07, + "loss": 0.6108, + "step": 62668 + }, + { + "epoch": 1.61, + "learning_rate": 9.339434195531802e-07, + "loss": 0.5061, + "step": 62669 + }, + { + "epoch": 1.61, + "learning_rate": 9.339158095601977e-07, + "loss": 0.624, + "step": 62670 + }, + { + "epoch": 1.61, + "learning_rate": 9.33888199617813e-07, + "loss": 0.624, + "step": 62671 + }, + { + "epoch": 1.61, + "learning_rate": 9.338605897260467e-07, + "loss": 0.7139, + "step": 62672 + }, + { + "epoch": 1.61, + "learning_rate": 9.338329798849207e-07, + "loss": 0.6592, + "step": 62673 + }, + { + "epoch": 1.61, + "learning_rate": 9.338053700944554e-07, + "loss": 0.707, + "step": 62674 + }, + { + "epoch": 1.61, + "learning_rate": 9.337777603546726e-07, + "loss": 0.6606, + "step": 62675 + }, + { + "epoch": 1.61, + "learning_rate": 9.337501506655928e-07, + "loss": 0.6621, + "step": 62676 + }, + { + "epoch": 1.61, + "learning_rate": 9.337225410272382e-07, + "loss": 0.623, + "step": 62677 + }, + { + "epoch": 1.61, + "learning_rate": 9.336949314396286e-07, + "loss": 0.5532, + "step": 62678 + }, + { + "epoch": 1.61, + "learning_rate": 9.336673219027858e-07, + "loss": 0.5476, + "step": 62679 + }, + { + "epoch": 1.61, + "learning_rate": 9.336397124167309e-07, + "loss": 0.4976, + "step": 62680 + }, + { + "epoch": 1.61, + "learning_rate": 9.33612102981485e-07, + "loss": 0.7046, + "step": 62681 + }, + { + "epoch": 1.61, + "learning_rate": 9.335844935970691e-07, + "loss": 0.7236, + "step": 62682 + }, + { + "epoch": 1.61, + "learning_rate": 9.335568842635049e-07, + "loss": 0.6846, + "step": 62683 + }, + { + "epoch": 1.61, + "learning_rate": 9.335292749808127e-07, + "loss": 0.8428, + "step": 62684 + }, + { + "epoch": 1.61, + "learning_rate": 9.335016657490144e-07, + "loss": 0.6055, + "step": 62685 + }, + { + "epoch": 1.61, + "learning_rate": 9.334740565681306e-07, + "loss": 0.6953, + "step": 62686 + }, + { + "epoch": 1.61, + "learning_rate": 9.33446447438183e-07, + "loss": 0.4355, + "step": 62687 + }, + { + "epoch": 1.61, + "learning_rate": 9.334188383591923e-07, + "loss": 0.561, + "step": 62688 + }, + { + "epoch": 1.61, + "learning_rate": 9.333912293311794e-07, + "loss": 0.6611, + "step": 62689 + }, + { + "epoch": 1.61, + "learning_rate": 9.333636203541662e-07, + "loss": 0.6826, + "step": 62690 + }, + { + "epoch": 1.61, + "learning_rate": 9.333360114281729e-07, + "loss": 0.6401, + "step": 62691 + }, + { + "epoch": 1.61, + "learning_rate": 9.333084025532216e-07, + "loss": 0.6318, + "step": 62692 + }, + { + "epoch": 1.61, + "learning_rate": 9.332807937293327e-07, + "loss": 0.4622, + "step": 62693 + }, + { + "epoch": 1.61, + "learning_rate": 9.332531849565279e-07, + "loss": 0.5474, + "step": 62694 + }, + { + "epoch": 1.61, + "learning_rate": 9.332255762348279e-07, + "loss": 0.7715, + "step": 62695 + }, + { + "epoch": 1.61, + "learning_rate": 9.331979675642538e-07, + "loss": 0.4868, + "step": 62696 + }, + { + "epoch": 1.61, + "learning_rate": 9.331703589448275e-07, + "loss": 0.6294, + "step": 62697 + }, + { + "epoch": 1.61, + "learning_rate": 9.331427503765694e-07, + "loss": 0.5947, + "step": 62698 + }, + { + "epoch": 1.61, + "learning_rate": 9.331151418595005e-07, + "loss": 0.7324, + "step": 62699 + }, + { + "epoch": 1.61, + "learning_rate": 9.330875333936426e-07, + "loss": 0.7217, + "step": 62700 + }, + { + "epoch": 1.61, + "learning_rate": 9.33059924979016e-07, + "loss": 0.6509, + "step": 62701 + }, + { + "epoch": 1.61, + "learning_rate": 9.330323166156428e-07, + "loss": 0.7227, + "step": 62702 + }, + { + "epoch": 1.61, + "learning_rate": 9.330047083035435e-07, + "loss": 0.6133, + "step": 62703 + }, + { + "epoch": 1.61, + "learning_rate": 9.329771000427395e-07, + "loss": 0.6133, + "step": 62704 + }, + { + "epoch": 1.61, + "learning_rate": 9.329494918332517e-07, + "loss": 0.6953, + "step": 62705 + }, + { + "epoch": 1.61, + "learning_rate": 9.329218836751016e-07, + "loss": 0.5986, + "step": 62706 + }, + { + "epoch": 1.61, + "learning_rate": 9.328942755683104e-07, + "loss": 0.5952, + "step": 62707 + }, + { + "epoch": 1.61, + "learning_rate": 9.328666675128985e-07, + "loss": 0.686, + "step": 62708 + }, + { + "epoch": 1.61, + "learning_rate": 9.328390595088877e-07, + "loss": 0.6445, + "step": 62709 + }, + { + "epoch": 1.61, + "learning_rate": 9.328114515562985e-07, + "loss": 0.5703, + "step": 62710 + }, + { + "epoch": 1.61, + "learning_rate": 9.32783843655153e-07, + "loss": 0.5803, + "step": 62711 + }, + { + "epoch": 1.61, + "learning_rate": 9.327562358054718e-07, + "loss": 0.5894, + "step": 62712 + }, + { + "epoch": 1.61, + "learning_rate": 9.327286280072757e-07, + "loss": 0.4177, + "step": 62713 + }, + { + "epoch": 1.61, + "learning_rate": 9.327010202605865e-07, + "loss": 0.6885, + "step": 62714 + }, + { + "epoch": 1.61, + "learning_rate": 9.326734125654249e-07, + "loss": 0.8569, + "step": 62715 + }, + { + "epoch": 1.61, + "learning_rate": 9.326458049218122e-07, + "loss": 0.814, + "step": 62716 + }, + { + "epoch": 1.61, + "learning_rate": 9.326181973297699e-07, + "loss": 0.7646, + "step": 62717 + }, + { + "epoch": 1.61, + "learning_rate": 9.325905897893182e-07, + "loss": 0.4868, + "step": 62718 + }, + { + "epoch": 1.61, + "learning_rate": 9.325629823004791e-07, + "loss": 0.6797, + "step": 62719 + }, + { + "epoch": 1.61, + "learning_rate": 9.325353748632731e-07, + "loss": 0.6084, + "step": 62720 + }, + { + "epoch": 1.61, + "learning_rate": 9.325077674777219e-07, + "loss": 0.6533, + "step": 62721 + }, + { + "epoch": 1.61, + "learning_rate": 9.324801601438462e-07, + "loss": 0.6963, + "step": 62722 + }, + { + "epoch": 1.61, + "learning_rate": 9.324525528616676e-07, + "loss": 0.5962, + "step": 62723 + }, + { + "epoch": 1.61, + "learning_rate": 9.324249456312066e-07, + "loss": 0.6626, + "step": 62724 + }, + { + "epoch": 1.61, + "learning_rate": 9.323973384524851e-07, + "loss": 0.542, + "step": 62725 + }, + { + "epoch": 1.61, + "learning_rate": 9.323697313255236e-07, + "loss": 0.5181, + "step": 62726 + }, + { + "epoch": 1.61, + "learning_rate": 9.32342124250344e-07, + "loss": 0.4622, + "step": 62727 + }, + { + "epoch": 1.61, + "learning_rate": 9.323145172269665e-07, + "loss": 0.6348, + "step": 62728 + }, + { + "epoch": 1.61, + "learning_rate": 9.322869102554128e-07, + "loss": 0.6245, + "step": 62729 + }, + { + "epoch": 1.61, + "learning_rate": 9.322593033357036e-07, + "loss": 0.6611, + "step": 62730 + }, + { + "epoch": 1.61, + "learning_rate": 9.322316964678607e-07, + "loss": 0.6553, + "step": 62731 + }, + { + "epoch": 1.61, + "learning_rate": 9.322040896519046e-07, + "loss": 0.5811, + "step": 62732 + }, + { + "epoch": 1.61, + "learning_rate": 9.321764828878567e-07, + "loss": 0.6284, + "step": 62733 + }, + { + "epoch": 1.61, + "learning_rate": 9.321488761757383e-07, + "loss": 0.627, + "step": 62734 + }, + { + "epoch": 1.61, + "learning_rate": 9.321212695155703e-07, + "loss": 0.7861, + "step": 62735 + }, + { + "epoch": 1.61, + "learning_rate": 9.320936629073739e-07, + "loss": 0.5027, + "step": 62736 + }, + { + "epoch": 1.61, + "learning_rate": 9.320660563511706e-07, + "loss": 0.7061, + "step": 62737 + }, + { + "epoch": 1.61, + "learning_rate": 9.32038449846981e-07, + "loss": 0.7041, + "step": 62738 + }, + { + "epoch": 1.61, + "learning_rate": 9.320108433948263e-07, + "loss": 0.5557, + "step": 62739 + }, + { + "epoch": 1.61, + "learning_rate": 9.319832369947279e-07, + "loss": 0.7275, + "step": 62740 + }, + { + "epoch": 1.61, + "learning_rate": 9.319556306467066e-07, + "loss": 0.5786, + "step": 62741 + }, + { + "epoch": 1.61, + "learning_rate": 9.319280243507839e-07, + "loss": 0.7295, + "step": 62742 + }, + { + "epoch": 1.61, + "learning_rate": 9.319004181069806e-07, + "loss": 0.668, + "step": 62743 + }, + { + "epoch": 1.61, + "learning_rate": 9.318728119153183e-07, + "loss": 0.6895, + "step": 62744 + }, + { + "epoch": 1.61, + "learning_rate": 9.318452057758176e-07, + "loss": 0.6226, + "step": 62745 + }, + { + "epoch": 1.61, + "learning_rate": 9.318175996885002e-07, + "loss": 0.791, + "step": 62746 + }, + { + "epoch": 1.61, + "learning_rate": 9.31789993653387e-07, + "loss": 0.5972, + "step": 62747 + }, + { + "epoch": 1.61, + "learning_rate": 9.317623876704988e-07, + "loss": 0.6533, + "step": 62748 + }, + { + "epoch": 1.61, + "learning_rate": 9.31734781739857e-07, + "loss": 0.6074, + "step": 62749 + }, + { + "epoch": 1.61, + "learning_rate": 9.317071758614828e-07, + "loss": 0.8213, + "step": 62750 + }, + { + "epoch": 1.61, + "learning_rate": 9.316795700353971e-07, + "loss": 0.4839, + "step": 62751 + }, + { + "epoch": 1.61, + "learning_rate": 9.316519642616214e-07, + "loss": 0.7002, + "step": 62752 + }, + { + "epoch": 1.61, + "learning_rate": 9.316243585401765e-07, + "loss": 0.7627, + "step": 62753 + }, + { + "epoch": 1.61, + "learning_rate": 9.315967528710839e-07, + "loss": 0.7822, + "step": 62754 + }, + { + "epoch": 1.61, + "learning_rate": 9.315691472543642e-07, + "loss": 0.5444, + "step": 62755 + }, + { + "epoch": 1.61, + "learning_rate": 9.315415416900392e-07, + "loss": 0.5405, + "step": 62756 + }, + { + "epoch": 1.61, + "learning_rate": 9.315139361781299e-07, + "loss": 0.6357, + "step": 62757 + }, + { + "epoch": 1.61, + "learning_rate": 9.314863307186567e-07, + "loss": 0.5566, + "step": 62758 + }, + { + "epoch": 1.61, + "learning_rate": 9.314587253116415e-07, + "loss": 0.6279, + "step": 62759 + }, + { + "epoch": 1.61, + "learning_rate": 9.31431119957105e-07, + "loss": 0.5298, + "step": 62760 + }, + { + "epoch": 1.61, + "learning_rate": 9.314035146550688e-07, + "loss": 0.6621, + "step": 62761 + }, + { + "epoch": 1.61, + "learning_rate": 9.313759094055535e-07, + "loss": 0.6465, + "step": 62762 + }, + { + "epoch": 1.61, + "learning_rate": 9.313483042085808e-07, + "loss": 0.6582, + "step": 62763 + }, + { + "epoch": 1.61, + "learning_rate": 9.313206990641713e-07, + "loss": 0.425, + "step": 62764 + }, + { + "epoch": 1.61, + "learning_rate": 9.312930939723465e-07, + "loss": 0.6097, + "step": 62765 + }, + { + "epoch": 1.61, + "learning_rate": 9.312654889331274e-07, + "loss": 0.5688, + "step": 62766 + }, + { + "epoch": 1.61, + "learning_rate": 9.312378839465357e-07, + "loss": 0.4829, + "step": 62767 + }, + { + "epoch": 1.61, + "learning_rate": 9.312102790125913e-07, + "loss": 0.8828, + "step": 62768 + }, + { + "epoch": 1.61, + "learning_rate": 9.311826741313164e-07, + "loss": 0.5918, + "step": 62769 + }, + { + "epoch": 1.61, + "learning_rate": 9.311550693027313e-07, + "loss": 0.7158, + "step": 62770 + }, + { + "epoch": 1.61, + "learning_rate": 9.311274645268579e-07, + "loss": 0.5869, + "step": 62771 + }, + { + "epoch": 1.61, + "learning_rate": 9.310998598037169e-07, + "loss": 0.6724, + "step": 62772 + }, + { + "epoch": 1.61, + "learning_rate": 9.310722551333298e-07, + "loss": 0.5237, + "step": 62773 + }, + { + "epoch": 1.61, + "learning_rate": 9.310446505157172e-07, + "loss": 0.6641, + "step": 62774 + }, + { + "epoch": 1.61, + "learning_rate": 9.310170459509008e-07, + "loss": 0.5486, + "step": 62775 + }, + { + "epoch": 1.61, + "learning_rate": 9.309894414389012e-07, + "loss": 0.7314, + "step": 62776 + }, + { + "epoch": 1.61, + "learning_rate": 9.309618369797403e-07, + "loss": 0.7148, + "step": 62777 + }, + { + "epoch": 1.61, + "learning_rate": 9.309342325734385e-07, + "loss": 0.5, + "step": 62778 + }, + { + "epoch": 1.61, + "learning_rate": 9.309066282200171e-07, + "loss": 0.5605, + "step": 62779 + }, + { + "epoch": 1.61, + "learning_rate": 9.308790239194973e-07, + "loss": 0.5811, + "step": 62780 + }, + { + "epoch": 1.61, + "learning_rate": 9.308514196719002e-07, + "loss": 0.625, + "step": 62781 + }, + { + "epoch": 1.61, + "learning_rate": 9.308238154772472e-07, + "loss": 0.7158, + "step": 62782 + }, + { + "epoch": 1.61, + "learning_rate": 9.30796211335559e-07, + "loss": 0.6465, + "step": 62783 + }, + { + "epoch": 1.61, + "learning_rate": 9.307686072468572e-07, + "loss": 0.5649, + "step": 62784 + }, + { + "epoch": 1.61, + "learning_rate": 9.307410032111626e-07, + "loss": 0.5021, + "step": 62785 + }, + { + "epoch": 1.61, + "learning_rate": 9.307133992284962e-07, + "loss": 0.5332, + "step": 62786 + }, + { + "epoch": 1.61, + "learning_rate": 9.306857952988798e-07, + "loss": 0.5291, + "step": 62787 + }, + { + "epoch": 1.61, + "learning_rate": 9.306581914223339e-07, + "loss": 0.7285, + "step": 62788 + }, + { + "epoch": 1.61, + "learning_rate": 9.306305875988796e-07, + "loss": 0.7666, + "step": 62789 + }, + { + "epoch": 1.61, + "learning_rate": 9.306029838285387e-07, + "loss": 0.5466, + "step": 62790 + }, + { + "epoch": 1.61, + "learning_rate": 9.305753801113316e-07, + "loss": 0.6294, + "step": 62791 + }, + { + "epoch": 1.61, + "learning_rate": 9.305477764472798e-07, + "loss": 0.7861, + "step": 62792 + }, + { + "epoch": 1.61, + "learning_rate": 9.305201728364042e-07, + "loss": 0.5547, + "step": 62793 + }, + { + "epoch": 1.61, + "learning_rate": 9.304925692787264e-07, + "loss": 0.4888, + "step": 62794 + }, + { + "epoch": 1.61, + "learning_rate": 9.304649657742669e-07, + "loss": 0.7021, + "step": 62795 + }, + { + "epoch": 1.61, + "learning_rate": 9.304373623230476e-07, + "loss": 0.5435, + "step": 62796 + }, + { + "epoch": 1.61, + "learning_rate": 9.304097589250892e-07, + "loss": 0.7344, + "step": 62797 + }, + { + "epoch": 1.61, + "learning_rate": 9.303821555804126e-07, + "loss": 0.8164, + "step": 62798 + }, + { + "epoch": 1.61, + "learning_rate": 9.303545522890393e-07, + "loss": 0.3901, + "step": 62799 + }, + { + "epoch": 1.61, + "learning_rate": 9.303269490509902e-07, + "loss": 0.6064, + "step": 62800 + }, + { + "epoch": 1.61, + "learning_rate": 9.302993458662867e-07, + "loss": 0.3881, + "step": 62801 + }, + { + "epoch": 1.61, + "learning_rate": 9.302717427349498e-07, + "loss": 0.5884, + "step": 62802 + }, + { + "epoch": 1.61, + "learning_rate": 9.302441396570003e-07, + "loss": 0.6885, + "step": 62803 + }, + { + "epoch": 1.61, + "learning_rate": 9.3021653663246e-07, + "loss": 0.7324, + "step": 62804 + }, + { + "epoch": 1.61, + "learning_rate": 9.301889336613494e-07, + "loss": 0.665, + "step": 62805 + }, + { + "epoch": 1.61, + "learning_rate": 9.301613307436902e-07, + "loss": 0.8252, + "step": 62806 + }, + { + "epoch": 1.61, + "learning_rate": 9.301337278795034e-07, + "loss": 0.5444, + "step": 62807 + }, + { + "epoch": 1.61, + "learning_rate": 9.301061250688095e-07, + "loss": 0.6904, + "step": 62808 + }, + { + "epoch": 1.61, + "learning_rate": 9.300785223116305e-07, + "loss": 0.6807, + "step": 62809 + }, + { + "epoch": 1.61, + "learning_rate": 9.30050919607987e-07, + "loss": 0.6445, + "step": 62810 + }, + { + "epoch": 1.61, + "learning_rate": 9.300233169579003e-07, + "loss": 0.5439, + "step": 62811 + }, + { + "epoch": 1.61, + "learning_rate": 9.299957143613915e-07, + "loss": 0.7393, + "step": 62812 + }, + { + "epoch": 1.61, + "learning_rate": 9.299681118184819e-07, + "loss": 0.3955, + "step": 62813 + }, + { + "epoch": 1.61, + "learning_rate": 9.299405093291922e-07, + "loss": 0.6914, + "step": 62814 + }, + { + "epoch": 1.61, + "learning_rate": 9.299129068935442e-07, + "loss": 0.6841, + "step": 62815 + }, + { + "epoch": 1.61, + "learning_rate": 9.298853045115584e-07, + "loss": 0.6318, + "step": 62816 + }, + { + "epoch": 1.61, + "learning_rate": 9.298577021832565e-07, + "loss": 0.7598, + "step": 62817 + }, + { + "epoch": 1.61, + "learning_rate": 9.298300999086593e-07, + "loss": 0.7402, + "step": 62818 + }, + { + "epoch": 1.61, + "learning_rate": 9.298024976877878e-07, + "loss": 0.6787, + "step": 62819 + }, + { + "epoch": 1.61, + "learning_rate": 9.297748955206633e-07, + "loss": 0.6504, + "step": 62820 + }, + { + "epoch": 1.61, + "learning_rate": 9.297472934073069e-07, + "loss": 0.5303, + "step": 62821 + }, + { + "epoch": 1.61, + "learning_rate": 9.297196913477397e-07, + "loss": 0.6973, + "step": 62822 + }, + { + "epoch": 1.61, + "learning_rate": 9.296920893419831e-07, + "loss": 0.6787, + "step": 62823 + }, + { + "epoch": 1.61, + "learning_rate": 9.296644873900577e-07, + "loss": 0.5786, + "step": 62824 + }, + { + "epoch": 1.61, + "learning_rate": 9.296368854919854e-07, + "loss": 0.6553, + "step": 62825 + }, + { + "epoch": 1.61, + "learning_rate": 9.296092836477865e-07, + "loss": 0.5815, + "step": 62826 + }, + { + "epoch": 1.61, + "learning_rate": 9.295816818574831e-07, + "loss": 0.606, + "step": 62827 + }, + { + "epoch": 1.61, + "learning_rate": 9.295540801210955e-07, + "loss": 0.6377, + "step": 62828 + }, + { + "epoch": 1.61, + "learning_rate": 9.295264784386449e-07, + "loss": 0.6152, + "step": 62829 + }, + { + "epoch": 1.61, + "learning_rate": 9.294988768101528e-07, + "loss": 0.7744, + "step": 62830 + }, + { + "epoch": 1.61, + "learning_rate": 9.2947127523564e-07, + "loss": 0.5483, + "step": 62831 + }, + { + "epoch": 1.61, + "learning_rate": 9.294436737151279e-07, + "loss": 0.6763, + "step": 62832 + }, + { + "epoch": 1.61, + "learning_rate": 9.294160722486375e-07, + "loss": 0.7373, + "step": 62833 + }, + { + "epoch": 1.61, + "learning_rate": 9.293884708361901e-07, + "loss": 0.615, + "step": 62834 + }, + { + "epoch": 1.61, + "learning_rate": 9.293608694778065e-07, + "loss": 0.7974, + "step": 62835 + }, + { + "epoch": 1.61, + "learning_rate": 9.293332681735083e-07, + "loss": 0.604, + "step": 62836 + }, + { + "epoch": 1.61, + "learning_rate": 9.293056669233164e-07, + "loss": 0.6279, + "step": 62837 + }, + { + "epoch": 1.61, + "learning_rate": 9.292780657272518e-07, + "loss": 0.6533, + "step": 62838 + }, + { + "epoch": 1.61, + "learning_rate": 9.292504645853355e-07, + "loss": 0.6855, + "step": 62839 + }, + { + "epoch": 1.61, + "learning_rate": 9.292228634975891e-07, + "loss": 0.5459, + "step": 62840 + }, + { + "epoch": 1.61, + "learning_rate": 9.291952624640333e-07, + "loss": 0.4248, + "step": 62841 + }, + { + "epoch": 1.61, + "learning_rate": 9.291676614846897e-07, + "loss": 0.5444, + "step": 62842 + }, + { + "epoch": 1.61, + "learning_rate": 9.291400605595788e-07, + "loss": 0.6719, + "step": 62843 + }, + { + "epoch": 1.61, + "learning_rate": 9.291124596887224e-07, + "loss": 0.6963, + "step": 62844 + }, + { + "epoch": 1.61, + "learning_rate": 9.290848588721412e-07, + "loss": 0.6562, + "step": 62845 + }, + { + "epoch": 1.61, + "learning_rate": 9.290572581098565e-07, + "loss": 0.5859, + "step": 62846 + }, + { + "epoch": 1.61, + "learning_rate": 9.290296574018896e-07, + "loss": 0.6064, + "step": 62847 + }, + { + "epoch": 1.61, + "learning_rate": 9.290020567482611e-07, + "loss": 0.5522, + "step": 62848 + }, + { + "epoch": 1.61, + "learning_rate": 9.289744561489927e-07, + "loss": 0.6885, + "step": 62849 + }, + { + "epoch": 1.61, + "learning_rate": 9.289468556041051e-07, + "loss": 0.5974, + "step": 62850 + }, + { + "epoch": 1.61, + "learning_rate": 9.289192551136198e-07, + "loss": 0.8018, + "step": 62851 + }, + { + "epoch": 1.61, + "learning_rate": 9.288916546775576e-07, + "loss": 0.5747, + "step": 62852 + }, + { + "epoch": 1.61, + "learning_rate": 9.288640542959398e-07, + "loss": 0.7441, + "step": 62853 + }, + { + "epoch": 1.61, + "learning_rate": 9.288364539687875e-07, + "loss": 0.5137, + "step": 62854 + }, + { + "epoch": 1.61, + "learning_rate": 9.288088536961221e-07, + "loss": 0.8545, + "step": 62855 + }, + { + "epoch": 1.61, + "learning_rate": 9.287812534779642e-07, + "loss": 0.575, + "step": 62856 + }, + { + "epoch": 1.61, + "learning_rate": 9.287536533143357e-07, + "loss": 0.3889, + "step": 62857 + }, + { + "epoch": 1.61, + "learning_rate": 9.287260532052569e-07, + "loss": 0.6279, + "step": 62858 + }, + { + "epoch": 1.61, + "learning_rate": 9.286984531507493e-07, + "loss": 0.5254, + "step": 62859 + }, + { + "epoch": 1.61, + "learning_rate": 9.286708531508338e-07, + "loss": 0.7559, + "step": 62860 + }, + { + "epoch": 1.61, + "learning_rate": 9.286432532055321e-07, + "loss": 0.3954, + "step": 62861 + }, + { + "epoch": 1.61, + "learning_rate": 9.286156533148647e-07, + "loss": 0.7529, + "step": 62862 + }, + { + "epoch": 1.61, + "learning_rate": 9.285880534788532e-07, + "loss": 0.7227, + "step": 62863 + }, + { + "epoch": 1.61, + "learning_rate": 9.285604536975183e-07, + "loss": 0.7168, + "step": 62864 + }, + { + "epoch": 1.61, + "learning_rate": 9.285328539708817e-07, + "loss": 0.7109, + "step": 62865 + }, + { + "epoch": 1.61, + "learning_rate": 9.285052542989639e-07, + "loss": 0.6973, + "step": 62866 + }, + { + "epoch": 1.61, + "learning_rate": 9.284776546817867e-07, + "loss": 0.6299, + "step": 62867 + }, + { + "epoch": 1.61, + "learning_rate": 9.284500551193708e-07, + "loss": 0.5991, + "step": 62868 + }, + { + "epoch": 1.61, + "learning_rate": 9.284224556117372e-07, + "loss": 0.7197, + "step": 62869 + }, + { + "epoch": 1.61, + "learning_rate": 9.283948561589074e-07, + "loss": 0.7119, + "step": 62870 + }, + { + "epoch": 1.61, + "learning_rate": 9.283672567609021e-07, + "loss": 0.6221, + "step": 62871 + }, + { + "epoch": 1.61, + "learning_rate": 9.283396574177429e-07, + "loss": 0.4966, + "step": 62872 + }, + { + "epoch": 1.61, + "learning_rate": 9.283120581294505e-07, + "loss": 0.7617, + "step": 62873 + }, + { + "epoch": 1.61, + "learning_rate": 9.282844588960466e-07, + "loss": 0.6304, + "step": 62874 + }, + { + "epoch": 1.61, + "learning_rate": 9.28256859717552e-07, + "loss": 0.6621, + "step": 62875 + }, + { + "epoch": 1.61, + "learning_rate": 9.282292605939876e-07, + "loss": 0.7656, + "step": 62876 + }, + { + "epoch": 1.61, + "learning_rate": 9.28201661525375e-07, + "loss": 0.6113, + "step": 62877 + }, + { + "epoch": 1.61, + "learning_rate": 9.281740625117351e-07, + "loss": 0.4568, + "step": 62878 + }, + { + "epoch": 1.61, + "learning_rate": 9.281464635530886e-07, + "loss": 0.7588, + "step": 62879 + }, + { + "epoch": 1.61, + "learning_rate": 9.281188646494574e-07, + "loss": 0.521, + "step": 62880 + }, + { + "epoch": 1.61, + "learning_rate": 9.280912658008621e-07, + "loss": 0.6758, + "step": 62881 + }, + { + "epoch": 1.61, + "learning_rate": 9.280636670073241e-07, + "loss": 0.6353, + "step": 62882 + }, + { + "epoch": 1.61, + "learning_rate": 9.280360682688643e-07, + "loss": 0.7617, + "step": 62883 + }, + { + "epoch": 1.61, + "learning_rate": 9.280084695855042e-07, + "loss": 0.573, + "step": 62884 + }, + { + "epoch": 1.61, + "learning_rate": 9.279808709572644e-07, + "loss": 0.6782, + "step": 62885 + }, + { + "epoch": 1.61, + "learning_rate": 9.279532723841667e-07, + "loss": 0.6132, + "step": 62886 + }, + { + "epoch": 1.61, + "learning_rate": 9.27925673866232e-07, + "loss": 0.8027, + "step": 62887 + }, + { + "epoch": 1.61, + "learning_rate": 9.278980754034807e-07, + "loss": 0.4673, + "step": 62888 + }, + { + "epoch": 1.61, + "learning_rate": 9.27870476995935e-07, + "loss": 0.6514, + "step": 62889 + }, + { + "epoch": 1.61, + "learning_rate": 9.278428786436152e-07, + "loss": 0.5732, + "step": 62890 + }, + { + "epoch": 1.61, + "learning_rate": 9.278152803465431e-07, + "loss": 0.6963, + "step": 62891 + }, + { + "epoch": 1.61, + "learning_rate": 9.277876821047395e-07, + "loss": 0.7188, + "step": 62892 + }, + { + "epoch": 1.61, + "learning_rate": 9.277600839182252e-07, + "loss": 0.4927, + "step": 62893 + }, + { + "epoch": 1.61, + "learning_rate": 9.277324857870222e-07, + "loss": 0.7822, + "step": 62894 + }, + { + "epoch": 1.61, + "learning_rate": 9.277048877111506e-07, + "loss": 0.626, + "step": 62895 + }, + { + "epoch": 1.61, + "learning_rate": 9.276772896906325e-07, + "loss": 0.5361, + "step": 62896 + }, + { + "epoch": 1.61, + "learning_rate": 9.276496917254886e-07, + "loss": 0.8057, + "step": 62897 + }, + { + "epoch": 1.61, + "learning_rate": 9.276220938157395e-07, + "loss": 0.6309, + "step": 62898 + }, + { + "epoch": 1.61, + "learning_rate": 9.275944959614072e-07, + "loss": 0.2593, + "step": 62899 + }, + { + "epoch": 1.61, + "learning_rate": 9.275668981625122e-07, + "loss": 0.5708, + "step": 62900 + }, + { + "epoch": 1.61, + "learning_rate": 9.275393004190763e-07, + "loss": 0.6748, + "step": 62901 + }, + { + "epoch": 1.61, + "learning_rate": 9.275117027311198e-07, + "loss": 0.5981, + "step": 62902 + }, + { + "epoch": 1.61, + "learning_rate": 9.274841050986645e-07, + "loss": 0.6196, + "step": 62903 + }, + { + "epoch": 1.61, + "learning_rate": 9.274565075217311e-07, + "loss": 0.7085, + "step": 62904 + }, + { + "epoch": 1.61, + "learning_rate": 9.274289100003411e-07, + "loss": 0.8379, + "step": 62905 + }, + { + "epoch": 1.61, + "learning_rate": 9.274013125345153e-07, + "loss": 0.5479, + "step": 62906 + }, + { + "epoch": 1.61, + "learning_rate": 9.273737151242754e-07, + "loss": 0.5952, + "step": 62907 + }, + { + "epoch": 1.61, + "learning_rate": 9.273461177696418e-07, + "loss": 0.6133, + "step": 62908 + }, + { + "epoch": 1.61, + "learning_rate": 9.27318520470636e-07, + "loss": 0.5339, + "step": 62909 + }, + { + "epoch": 1.61, + "learning_rate": 9.272909232272787e-07, + "loss": 0.5056, + "step": 62910 + }, + { + "epoch": 1.61, + "learning_rate": 9.272633260395919e-07, + "loss": 0.8418, + "step": 62911 + }, + { + "epoch": 1.61, + "learning_rate": 9.272357289075958e-07, + "loss": 0.6807, + "step": 62912 + }, + { + "epoch": 1.61, + "learning_rate": 9.272081318313123e-07, + "loss": 0.624, + "step": 62913 + }, + { + "epoch": 1.61, + "learning_rate": 9.271805348107618e-07, + "loss": 0.686, + "step": 62914 + }, + { + "epoch": 1.61, + "learning_rate": 9.271529378459662e-07, + "loss": 0.7163, + "step": 62915 + }, + { + "epoch": 1.61, + "learning_rate": 9.271253409369459e-07, + "loss": 0.6626, + "step": 62916 + }, + { + "epoch": 1.61, + "learning_rate": 9.27097744083723e-07, + "loss": 0.5771, + "step": 62917 + }, + { + "epoch": 1.61, + "learning_rate": 9.270701472863176e-07, + "loss": 0.7139, + "step": 62918 + }, + { + "epoch": 1.61, + "learning_rate": 9.270425505447511e-07, + "loss": 0.6719, + "step": 62919 + }, + { + "epoch": 1.61, + "learning_rate": 9.270149538590449e-07, + "loss": 0.6992, + "step": 62920 + }, + { + "epoch": 1.61, + "learning_rate": 9.2698735722922e-07, + "loss": 0.6465, + "step": 62921 + }, + { + "epoch": 1.61, + "learning_rate": 9.269597606552974e-07, + "loss": 0.5657, + "step": 62922 + }, + { + "epoch": 1.61, + "learning_rate": 9.269321641372985e-07, + "loss": 0.7202, + "step": 62923 + }, + { + "epoch": 1.61, + "learning_rate": 9.269045676752443e-07, + "loss": 0.5654, + "step": 62924 + }, + { + "epoch": 1.61, + "learning_rate": 9.268769712691557e-07, + "loss": 0.7783, + "step": 62925 + }, + { + "epoch": 1.61, + "learning_rate": 9.268493749190543e-07, + "loss": 0.7412, + "step": 62926 + }, + { + "epoch": 1.61, + "learning_rate": 9.268217786249611e-07, + "loss": 0.6416, + "step": 62927 + }, + { + "epoch": 1.61, + "learning_rate": 9.267941823868969e-07, + "loss": 0.5996, + "step": 62928 + }, + { + "epoch": 1.61, + "learning_rate": 9.267665862048829e-07, + "loss": 0.7783, + "step": 62929 + }, + { + "epoch": 1.61, + "learning_rate": 9.267389900789405e-07, + "loss": 0.6748, + "step": 62930 + }, + { + "epoch": 1.61, + "learning_rate": 9.267113940090905e-07, + "loss": 0.7588, + "step": 62931 + }, + { + "epoch": 1.61, + "learning_rate": 9.266837979953545e-07, + "loss": 0.6836, + "step": 62932 + }, + { + "epoch": 1.61, + "learning_rate": 9.26656202037753e-07, + "loss": 0.5437, + "step": 62933 + }, + { + "epoch": 1.61, + "learning_rate": 9.266286061363078e-07, + "loss": 0.5068, + "step": 62934 + }, + { + "epoch": 1.61, + "learning_rate": 9.266010102910394e-07, + "loss": 0.4402, + "step": 62935 + }, + { + "epoch": 1.61, + "learning_rate": 9.265734145019695e-07, + "loss": 0.5616, + "step": 62936 + }, + { + "epoch": 1.61, + "learning_rate": 9.265458187691191e-07, + "loss": 0.5713, + "step": 62937 + }, + { + "epoch": 1.61, + "learning_rate": 9.265182230925088e-07, + "loss": 0.7217, + "step": 62938 + }, + { + "epoch": 1.61, + "learning_rate": 9.264906274721603e-07, + "loss": 0.8945, + "step": 62939 + }, + { + "epoch": 1.61, + "learning_rate": 9.264630319080945e-07, + "loss": 0.6807, + "step": 62940 + }, + { + "epoch": 1.61, + "learning_rate": 9.264354364003326e-07, + "loss": 0.668, + "step": 62941 + }, + { + "epoch": 1.61, + "learning_rate": 9.264078409488955e-07, + "loss": 0.5361, + "step": 62942 + }, + { + "epoch": 1.61, + "learning_rate": 9.263802455538049e-07, + "loss": 0.7012, + "step": 62943 + }, + { + "epoch": 1.61, + "learning_rate": 9.263526502150813e-07, + "loss": 0.7764, + "step": 62944 + }, + { + "epoch": 1.61, + "learning_rate": 9.263250549327462e-07, + "loss": 0.5166, + "step": 62945 + }, + { + "epoch": 1.61, + "learning_rate": 9.26297459706821e-07, + "loss": 0.6367, + "step": 62946 + }, + { + "epoch": 1.61, + "learning_rate": 9.26269864537326e-07, + "loss": 0.6367, + "step": 62947 + }, + { + "epoch": 1.61, + "learning_rate": 9.262422694242827e-07, + "loss": 0.7236, + "step": 62948 + }, + { + "epoch": 1.61, + "learning_rate": 9.262146743677125e-07, + "loss": 0.75, + "step": 62949 + }, + { + "epoch": 1.61, + "learning_rate": 9.261870793676361e-07, + "loss": 0.6094, + "step": 62950 + }, + { + "epoch": 1.61, + "learning_rate": 9.261594844240751e-07, + "loss": 0.835, + "step": 62951 + }, + { + "epoch": 1.61, + "learning_rate": 9.261318895370501e-07, + "loss": 0.6719, + "step": 62952 + }, + { + "epoch": 1.61, + "learning_rate": 9.261042947065828e-07, + "loss": 0.4995, + "step": 62953 + }, + { + "epoch": 1.61, + "learning_rate": 9.260766999326939e-07, + "loss": 0.7158, + "step": 62954 + }, + { + "epoch": 1.61, + "learning_rate": 9.260491052154048e-07, + "loss": 0.6289, + "step": 62955 + }, + { + "epoch": 1.61, + "learning_rate": 9.260215105547367e-07, + "loss": 0.4543, + "step": 62956 + }, + { + "epoch": 1.61, + "learning_rate": 9.259939159507101e-07, + "loss": 0.359, + "step": 62957 + }, + { + "epoch": 1.61, + "learning_rate": 9.259663214033468e-07, + "loss": 0.5796, + "step": 62958 + }, + { + "epoch": 1.61, + "learning_rate": 9.259387269126675e-07, + "loss": 0.4028, + "step": 62959 + }, + { + "epoch": 1.61, + "learning_rate": 9.259111324786937e-07, + "loss": 0.6938, + "step": 62960 + }, + { + "epoch": 1.61, + "learning_rate": 9.258835381014461e-07, + "loss": 0.6904, + "step": 62961 + }, + { + "epoch": 1.61, + "learning_rate": 9.258559437809462e-07, + "loss": 0.6646, + "step": 62962 + }, + { + "epoch": 1.61, + "learning_rate": 9.258283495172149e-07, + "loss": 0.7744, + "step": 62963 + }, + { + "epoch": 1.61, + "learning_rate": 9.258007553102735e-07, + "loss": 0.668, + "step": 62964 + }, + { + "epoch": 1.61, + "learning_rate": 9.257731611601433e-07, + "loss": 0.6172, + "step": 62965 + }, + { + "epoch": 1.61, + "learning_rate": 9.257455670668453e-07, + "loss": 0.6572, + "step": 62966 + }, + { + "epoch": 1.61, + "learning_rate": 9.257179730303999e-07, + "loss": 0.748, + "step": 62967 + }, + { + "epoch": 1.61, + "learning_rate": 9.256903790508292e-07, + "loss": 0.79, + "step": 62968 + }, + { + "epoch": 1.61, + "learning_rate": 9.256627851281537e-07, + "loss": 0.635, + "step": 62969 + }, + { + "epoch": 1.61, + "learning_rate": 9.256351912623951e-07, + "loss": 0.6279, + "step": 62970 + }, + { + "epoch": 1.61, + "learning_rate": 9.256075974535739e-07, + "loss": 0.7051, + "step": 62971 + }, + { + "epoch": 1.61, + "learning_rate": 9.255800037017117e-07, + "loss": 0.4048, + "step": 62972 + }, + { + "epoch": 1.61, + "learning_rate": 9.255524100068293e-07, + "loss": 0.7134, + "step": 62973 + }, + { + "epoch": 1.61, + "learning_rate": 9.255248163689483e-07, + "loss": 0.7559, + "step": 62974 + }, + { + "epoch": 1.61, + "learning_rate": 9.254972227880893e-07, + "loss": 0.6155, + "step": 62975 + }, + { + "epoch": 1.61, + "learning_rate": 9.25469629264274e-07, + "loss": 0.6934, + "step": 62976 + }, + { + "epoch": 1.61, + "learning_rate": 9.25442035797523e-07, + "loss": 0.5825, + "step": 62977 + }, + { + "epoch": 1.61, + "learning_rate": 9.254144423878574e-07, + "loss": 0.5576, + "step": 62978 + }, + { + "epoch": 1.61, + "learning_rate": 9.253868490352987e-07, + "loss": 0.6973, + "step": 62979 + }, + { + "epoch": 1.61, + "learning_rate": 9.253592557398677e-07, + "loss": 0.7832, + "step": 62980 + }, + { + "epoch": 1.61, + "learning_rate": 9.25331662501586e-07, + "loss": 0.481, + "step": 62981 + }, + { + "epoch": 1.61, + "learning_rate": 9.253040693204741e-07, + "loss": 0.6987, + "step": 62982 + }, + { + "epoch": 1.61, + "learning_rate": 9.252764761965534e-07, + "loss": 0.8145, + "step": 62983 + }, + { + "epoch": 1.61, + "learning_rate": 9.252488831298454e-07, + "loss": 0.5916, + "step": 62984 + }, + { + "epoch": 1.61, + "learning_rate": 9.252212901203706e-07, + "loss": 0.6489, + "step": 62985 + }, + { + "epoch": 1.61, + "learning_rate": 9.251936971681508e-07, + "loss": 0.584, + "step": 62986 + }, + { + "epoch": 1.61, + "learning_rate": 9.251661042732065e-07, + "loss": 0.6641, + "step": 62987 + }, + { + "epoch": 1.61, + "learning_rate": 9.251385114355589e-07, + "loss": 0.564, + "step": 62988 + }, + { + "epoch": 1.61, + "learning_rate": 9.251109186552295e-07, + "loss": 0.6934, + "step": 62989 + }, + { + "epoch": 1.61, + "learning_rate": 9.250833259322391e-07, + "loss": 0.9033, + "step": 62990 + }, + { + "epoch": 1.61, + "learning_rate": 9.250557332666091e-07, + "loss": 0.6904, + "step": 62991 + }, + { + "epoch": 1.61, + "learning_rate": 9.250281406583602e-07, + "loss": 0.6416, + "step": 62992 + }, + { + "epoch": 1.61, + "learning_rate": 9.250005481075141e-07, + "loss": 0.7646, + "step": 62993 + }, + { + "epoch": 1.61, + "learning_rate": 9.249729556140915e-07, + "loss": 0.7515, + "step": 62994 + }, + { + "epoch": 1.61, + "learning_rate": 9.249453631781138e-07, + "loss": 0.6416, + "step": 62995 + }, + { + "epoch": 1.61, + "learning_rate": 9.249177707996021e-07, + "loss": 0.6499, + "step": 62996 + }, + { + "epoch": 1.61, + "learning_rate": 9.248901784785771e-07, + "loss": 0.5967, + "step": 62997 + }, + { + "epoch": 1.61, + "learning_rate": 9.248625862150604e-07, + "loss": 0.7407, + "step": 62998 + }, + { + "epoch": 1.61, + "learning_rate": 9.248349940090727e-07, + "loss": 0.6904, + "step": 62999 + }, + { + "epoch": 1.61, + "learning_rate": 9.248074018606356e-07, + "loss": 0.7148, + "step": 63000 + }, + { + "epoch": 1.61, + "learning_rate": 9.247798097697702e-07, + "loss": 0.606, + "step": 63001 + }, + { + "epoch": 1.61, + "learning_rate": 9.247522177364971e-07, + "loss": 0.6689, + "step": 63002 + }, + { + "epoch": 1.61, + "learning_rate": 9.24724625760838e-07, + "loss": 0.6719, + "step": 63003 + }, + { + "epoch": 1.61, + "learning_rate": 9.246970338428135e-07, + "loss": 0.6641, + "step": 63004 + }, + { + "epoch": 1.61, + "learning_rate": 9.246694419824454e-07, + "loss": 0.666, + "step": 63005 + }, + { + "epoch": 1.61, + "learning_rate": 9.246418501797545e-07, + "loss": 0.5254, + "step": 63006 + }, + { + "epoch": 1.61, + "learning_rate": 9.246142584347615e-07, + "loss": 0.583, + "step": 63007 + }, + { + "epoch": 1.61, + "learning_rate": 9.245866667474881e-07, + "loss": 0.5634, + "step": 63008 + }, + { + "epoch": 1.61, + "learning_rate": 9.24559075117955e-07, + "loss": 0.6753, + "step": 63009 + }, + { + "epoch": 1.61, + "learning_rate": 9.245314835461839e-07, + "loss": 0.6978, + "step": 63010 + }, + { + "epoch": 1.62, + "learning_rate": 9.245038920321951e-07, + "loss": 0.7334, + "step": 63011 + }, + { + "epoch": 1.62, + "learning_rate": 9.244763005760106e-07, + "loss": 0.6738, + "step": 63012 + }, + { + "epoch": 1.62, + "learning_rate": 9.244487091776508e-07, + "loss": 0.7285, + "step": 63013 + }, + { + "epoch": 1.62, + "learning_rate": 9.244211178371375e-07, + "loss": 0.6084, + "step": 63014 + }, + { + "epoch": 1.62, + "learning_rate": 9.243935265544911e-07, + "loss": 0.7275, + "step": 63015 + }, + { + "epoch": 1.62, + "learning_rate": 9.243659353297336e-07, + "loss": 0.6318, + "step": 63016 + }, + { + "epoch": 1.62, + "learning_rate": 9.243383441628854e-07, + "loss": 0.7236, + "step": 63017 + }, + { + "epoch": 1.62, + "learning_rate": 9.24310753053968e-07, + "loss": 0.6582, + "step": 63018 + }, + { + "epoch": 1.62, + "learning_rate": 9.24283162003002e-07, + "loss": 0.7441, + "step": 63019 + }, + { + "epoch": 1.62, + "learning_rate": 9.24255571010009e-07, + "loss": 0.5457, + "step": 63020 + }, + { + "epoch": 1.62, + "learning_rate": 9.242279800750101e-07, + "loss": 0.79, + "step": 63021 + }, + { + "epoch": 1.62, + "learning_rate": 9.242003891980264e-07, + "loss": 0.7207, + "step": 63022 + }, + { + "epoch": 1.62, + "learning_rate": 9.241727983790788e-07, + "loss": 0.5303, + "step": 63023 + }, + { + "epoch": 1.62, + "learning_rate": 9.241452076181888e-07, + "loss": 0.5952, + "step": 63024 + }, + { + "epoch": 1.62, + "learning_rate": 9.241176169153772e-07, + "loss": 0.6094, + "step": 63025 + }, + { + "epoch": 1.62, + "learning_rate": 9.240900262706655e-07, + "loss": 0.6138, + "step": 63026 + }, + { + "epoch": 1.62, + "learning_rate": 9.240624356840745e-07, + "loss": 0.6631, + "step": 63027 + }, + { + "epoch": 1.62, + "learning_rate": 9.240348451556251e-07, + "loss": 0.7373, + "step": 63028 + }, + { + "epoch": 1.62, + "learning_rate": 9.24007254685339e-07, + "loss": 0.6211, + "step": 63029 + }, + { + "epoch": 1.62, + "learning_rate": 9.239796642732368e-07, + "loss": 0.7432, + "step": 63030 + }, + { + "epoch": 1.62, + "learning_rate": 9.239520739193402e-07, + "loss": 0.8301, + "step": 63031 + }, + { + "epoch": 1.62, + "learning_rate": 9.239244836236697e-07, + "loss": 0.8047, + "step": 63032 + }, + { + "epoch": 1.62, + "learning_rate": 9.238968933862468e-07, + "loss": 0.6309, + "step": 63033 + }, + { + "epoch": 1.62, + "learning_rate": 9.238693032070926e-07, + "loss": 0.6626, + "step": 63034 + }, + { + "epoch": 1.62, + "learning_rate": 9.238417130862282e-07, + "loss": 0.5801, + "step": 63035 + }, + { + "epoch": 1.62, + "learning_rate": 9.23814123023675e-07, + "loss": 0.5128, + "step": 63036 + }, + { + "epoch": 1.62, + "learning_rate": 9.237865330194536e-07, + "loss": 0.6538, + "step": 63037 + }, + { + "epoch": 1.62, + "learning_rate": 9.237589430735851e-07, + "loss": 0.6294, + "step": 63038 + }, + { + "epoch": 1.62, + "learning_rate": 9.237313531860911e-07, + "loss": 0.5007, + "step": 63039 + }, + { + "epoch": 1.62, + "learning_rate": 9.237037633569923e-07, + "loss": 0.5439, + "step": 63040 + }, + { + "epoch": 1.62, + "learning_rate": 9.236761735863102e-07, + "loss": 0.5742, + "step": 63041 + }, + { + "epoch": 1.62, + "learning_rate": 9.236485838740656e-07, + "loss": 0.7871, + "step": 63042 + }, + { + "epoch": 1.62, + "learning_rate": 9.2362099422028e-07, + "loss": 0.5112, + "step": 63043 + }, + { + "epoch": 1.62, + "learning_rate": 9.235934046249739e-07, + "loss": 0.3789, + "step": 63044 + }, + { + "epoch": 1.62, + "learning_rate": 9.235658150881692e-07, + "loss": 0.4921, + "step": 63045 + }, + { + "epoch": 1.62, + "learning_rate": 9.235382256098867e-07, + "loss": 0.5559, + "step": 63046 + }, + { + "epoch": 1.62, + "learning_rate": 9.235106361901472e-07, + "loss": 0.5046, + "step": 63047 + }, + { + "epoch": 1.62, + "learning_rate": 9.234830468289722e-07, + "loss": 0.7236, + "step": 63048 + }, + { + "epoch": 1.62, + "learning_rate": 9.234554575263825e-07, + "loss": 0.6548, + "step": 63049 + }, + { + "epoch": 1.62, + "learning_rate": 9.234278682823997e-07, + "loss": 0.5308, + "step": 63050 + }, + { + "epoch": 1.62, + "learning_rate": 9.234002790970444e-07, + "loss": 0.5898, + "step": 63051 + }, + { + "epoch": 1.62, + "learning_rate": 9.233726899703382e-07, + "loss": 0.6582, + "step": 63052 + }, + { + "epoch": 1.62, + "learning_rate": 9.233451009023019e-07, + "loss": 0.8799, + "step": 63053 + }, + { + "epoch": 1.62, + "learning_rate": 9.23317511892957e-07, + "loss": 0.6084, + "step": 63054 + }, + { + "epoch": 1.62, + "learning_rate": 9.232899229423241e-07, + "loss": 0.6768, + "step": 63055 + }, + { + "epoch": 1.62, + "learning_rate": 9.23262334050425e-07, + "loss": 0.7334, + "step": 63056 + }, + { + "epoch": 1.62, + "learning_rate": 9.232347452172799e-07, + "loss": 0.7393, + "step": 63057 + }, + { + "epoch": 1.62, + "learning_rate": 9.232071564429106e-07, + "loss": 0.6758, + "step": 63058 + }, + { + "epoch": 1.62, + "learning_rate": 9.231795677273379e-07, + "loss": 0.5254, + "step": 63059 + }, + { + "epoch": 1.62, + "learning_rate": 9.231519790705831e-07, + "loss": 0.6738, + "step": 63060 + }, + { + "epoch": 1.62, + "learning_rate": 9.231243904726673e-07, + "loss": 0.7305, + "step": 63061 + }, + { + "epoch": 1.62, + "learning_rate": 9.230968019336118e-07, + "loss": 0.7109, + "step": 63062 + }, + { + "epoch": 1.62, + "learning_rate": 9.230692134534372e-07, + "loss": 0.3699, + "step": 63063 + }, + { + "epoch": 1.62, + "learning_rate": 9.230416250321653e-07, + "loss": 0.5045, + "step": 63064 + }, + { + "epoch": 1.62, + "learning_rate": 9.230140366698167e-07, + "loss": 0.4692, + "step": 63065 + }, + { + "epoch": 1.62, + "learning_rate": 9.229864483664132e-07, + "loss": 0.4692, + "step": 63066 + }, + { + "epoch": 1.62, + "learning_rate": 9.22958860121975e-07, + "loss": 0.6001, + "step": 63067 + }, + { + "epoch": 1.62, + "learning_rate": 9.229312719365235e-07, + "loss": 0.7363, + "step": 63068 + }, + { + "epoch": 1.62, + "learning_rate": 9.229036838100803e-07, + "loss": 0.479, + "step": 63069 + }, + { + "epoch": 1.62, + "learning_rate": 9.22876095742666e-07, + "loss": 0.7617, + "step": 63070 + }, + { + "epoch": 1.62, + "learning_rate": 9.22848507734302e-07, + "loss": 0.6401, + "step": 63071 + }, + { + "epoch": 1.62, + "learning_rate": 9.228209197850095e-07, + "loss": 0.7627, + "step": 63072 + }, + { + "epoch": 1.62, + "learning_rate": 9.227933318948092e-07, + "loss": 0.6807, + "step": 63073 + }, + { + "epoch": 1.62, + "learning_rate": 9.227657440637226e-07, + "loss": 0.6597, + "step": 63074 + }, + { + "epoch": 1.62, + "learning_rate": 9.227381562917707e-07, + "loss": 0.6689, + "step": 63075 + }, + { + "epoch": 1.62, + "learning_rate": 9.22710568578975e-07, + "loss": 0.6309, + "step": 63076 + }, + { + "epoch": 1.62, + "learning_rate": 9.22682980925356e-07, + "loss": 0.8418, + "step": 63077 + }, + { + "epoch": 1.62, + "learning_rate": 9.226553933309349e-07, + "loss": 0.5718, + "step": 63078 + }, + { + "epoch": 1.62, + "learning_rate": 9.226278057957333e-07, + "loss": 0.6865, + "step": 63079 + }, + { + "epoch": 1.62, + "learning_rate": 9.226002183197717e-07, + "loss": 0.437, + "step": 63080 + }, + { + "epoch": 1.62, + "learning_rate": 9.225726309030718e-07, + "loss": 0.6191, + "step": 63081 + }, + { + "epoch": 1.62, + "learning_rate": 9.225450435456543e-07, + "loss": 0.7705, + "step": 63082 + }, + { + "epoch": 1.62, + "learning_rate": 9.225174562475406e-07, + "loss": 0.4085, + "step": 63083 + }, + { + "epoch": 1.62, + "learning_rate": 9.224898690087516e-07, + "loss": 0.6333, + "step": 63084 + }, + { + "epoch": 1.62, + "learning_rate": 9.224622818293087e-07, + "loss": 0.6455, + "step": 63085 + }, + { + "epoch": 1.62, + "learning_rate": 9.224346947092332e-07, + "loss": 0.6572, + "step": 63086 + }, + { + "epoch": 1.62, + "learning_rate": 9.224071076485454e-07, + "loss": 0.6108, + "step": 63087 + }, + { + "epoch": 1.62, + "learning_rate": 9.223795206472671e-07, + "loss": 0.7158, + "step": 63088 + }, + { + "epoch": 1.62, + "learning_rate": 9.223519337054191e-07, + "loss": 0.4478, + "step": 63089 + }, + { + "epoch": 1.62, + "learning_rate": 9.223243468230227e-07, + "loss": 0.4315, + "step": 63090 + }, + { + "epoch": 1.62, + "learning_rate": 9.22296760000099e-07, + "loss": 0.6646, + "step": 63091 + }, + { + "epoch": 1.62, + "learning_rate": 9.222691732366691e-07, + "loss": 0.5991, + "step": 63092 + }, + { + "epoch": 1.62, + "learning_rate": 9.222415865327542e-07, + "loss": 0.6348, + "step": 63093 + }, + { + "epoch": 1.62, + "learning_rate": 9.222139998883751e-07, + "loss": 0.5974, + "step": 63094 + }, + { + "epoch": 1.62, + "learning_rate": 9.221864133035534e-07, + "loss": 0.5981, + "step": 63095 + }, + { + "epoch": 1.62, + "learning_rate": 9.221588267783102e-07, + "loss": 0.6865, + "step": 63096 + }, + { + "epoch": 1.62, + "learning_rate": 9.22131240312666e-07, + "loss": 0.6123, + "step": 63097 + }, + { + "epoch": 1.62, + "learning_rate": 9.221036539066425e-07, + "loss": 0.7188, + "step": 63098 + }, + { + "epoch": 1.62, + "learning_rate": 9.220760675602603e-07, + "loss": 0.6738, + "step": 63099 + }, + { + "epoch": 1.62, + "learning_rate": 9.220484812735414e-07, + "loss": 0.5415, + "step": 63100 + }, + { + "epoch": 1.62, + "learning_rate": 9.220208950465059e-07, + "loss": 0.6875, + "step": 63101 + }, + { + "epoch": 1.62, + "learning_rate": 9.219933088791758e-07, + "loss": 0.5979, + "step": 63102 + }, + { + "epoch": 1.62, + "learning_rate": 9.219657227715716e-07, + "loss": 0.5676, + "step": 63103 + }, + { + "epoch": 1.62, + "learning_rate": 9.219381367237148e-07, + "loss": 0.6543, + "step": 63104 + }, + { + "epoch": 1.62, + "learning_rate": 9.219105507356262e-07, + "loss": 0.5234, + "step": 63105 + }, + { + "epoch": 1.62, + "learning_rate": 9.218829648073275e-07, + "loss": 0.3706, + "step": 63106 + }, + { + "epoch": 1.62, + "learning_rate": 9.218553789388394e-07, + "loss": 0.71, + "step": 63107 + }, + { + "epoch": 1.62, + "learning_rate": 9.218277931301827e-07, + "loss": 0.3783, + "step": 63108 + }, + { + "epoch": 1.62, + "learning_rate": 9.218002073813789e-07, + "loss": 0.5596, + "step": 63109 + }, + { + "epoch": 1.62, + "learning_rate": 9.217726216924493e-07, + "loss": 0.6514, + "step": 63110 + }, + { + "epoch": 1.62, + "learning_rate": 9.217450360634145e-07, + "loss": 0.6455, + "step": 63111 + }, + { + "epoch": 1.62, + "learning_rate": 9.217174504942961e-07, + "loss": 0.6115, + "step": 63112 + }, + { + "epoch": 1.62, + "learning_rate": 9.216898649851151e-07, + "loss": 0.7754, + "step": 63113 + }, + { + "epoch": 1.62, + "learning_rate": 9.216622795358925e-07, + "loss": 0.6655, + "step": 63114 + }, + { + "epoch": 1.62, + "learning_rate": 9.216346941466493e-07, + "loss": 0.606, + "step": 63115 + }, + { + "epoch": 1.62, + "learning_rate": 9.216071088174073e-07, + "loss": 0.5518, + "step": 63116 + }, + { + "epoch": 1.62, + "learning_rate": 9.215795235481871e-07, + "loss": 0.6084, + "step": 63117 + }, + { + "epoch": 1.62, + "learning_rate": 9.215519383390093e-07, + "loss": 0.6787, + "step": 63118 + }, + { + "epoch": 1.62, + "learning_rate": 9.215243531898959e-07, + "loss": 0.7266, + "step": 63119 + }, + { + "epoch": 1.62, + "learning_rate": 9.214967681008677e-07, + "loss": 0.7832, + "step": 63120 + }, + { + "epoch": 1.62, + "learning_rate": 9.214691830719457e-07, + "loss": 0.8086, + "step": 63121 + }, + { + "epoch": 1.62, + "learning_rate": 9.214415981031511e-07, + "loss": 0.4722, + "step": 63122 + }, + { + "epoch": 1.62, + "learning_rate": 9.214140131945053e-07, + "loss": 0.6797, + "step": 63123 + }, + { + "epoch": 1.62, + "learning_rate": 9.213864283460288e-07, + "loss": 0.7646, + "step": 63124 + }, + { + "epoch": 1.62, + "learning_rate": 9.213588435577435e-07, + "loss": 0.5674, + "step": 63125 + }, + { + "epoch": 1.62, + "learning_rate": 9.213312588296703e-07, + "loss": 0.8311, + "step": 63126 + }, + { + "epoch": 1.62, + "learning_rate": 9.213036741618298e-07, + "loss": 1.0, + "step": 63127 + }, + { + "epoch": 1.62, + "learning_rate": 9.212760895542434e-07, + "loss": 0.6826, + "step": 63128 + }, + { + "epoch": 1.62, + "learning_rate": 9.212485050069324e-07, + "loss": 0.4392, + "step": 63129 + }, + { + "epoch": 1.62, + "learning_rate": 9.212209205199177e-07, + "loss": 0.6387, + "step": 63130 + }, + { + "epoch": 1.62, + "learning_rate": 9.211933360932206e-07, + "loss": 0.5635, + "step": 63131 + }, + { + "epoch": 1.62, + "learning_rate": 9.21165751726862e-07, + "loss": 0.5898, + "step": 63132 + }, + { + "epoch": 1.62, + "learning_rate": 9.211381674208633e-07, + "loss": 0.6699, + "step": 63133 + }, + { + "epoch": 1.62, + "learning_rate": 9.211105831752453e-07, + "loss": 0.3584, + "step": 63134 + }, + { + "epoch": 1.62, + "learning_rate": 9.210829989900295e-07, + "loss": 0.6211, + "step": 63135 + }, + { + "epoch": 1.62, + "learning_rate": 9.21055414865237e-07, + "loss": 0.585, + "step": 63136 + }, + { + "epoch": 1.62, + "learning_rate": 9.210278308008883e-07, + "loss": 0.6548, + "step": 63137 + }, + { + "epoch": 1.62, + "learning_rate": 9.210002467970053e-07, + "loss": 0.7471, + "step": 63138 + }, + { + "epoch": 1.62, + "learning_rate": 9.209726628536086e-07, + "loss": 0.6396, + "step": 63139 + }, + { + "epoch": 1.62, + "learning_rate": 9.209450789707195e-07, + "loss": 0.6279, + "step": 63140 + }, + { + "epoch": 1.62, + "learning_rate": 9.209174951483591e-07, + "loss": 0.7402, + "step": 63141 + }, + { + "epoch": 1.62, + "learning_rate": 9.208899113865485e-07, + "loss": 0.5732, + "step": 63142 + }, + { + "epoch": 1.62, + "learning_rate": 9.208623276853088e-07, + "loss": 0.6865, + "step": 63143 + }, + { + "epoch": 1.62, + "learning_rate": 9.208347440446615e-07, + "loss": 0.6482, + "step": 63144 + }, + { + "epoch": 1.62, + "learning_rate": 9.208071604646273e-07, + "loss": 0.7695, + "step": 63145 + }, + { + "epoch": 1.62, + "learning_rate": 9.207795769452275e-07, + "loss": 0.5576, + "step": 63146 + }, + { + "epoch": 1.62, + "learning_rate": 9.20751993486483e-07, + "loss": 0.79, + "step": 63147 + }, + { + "epoch": 1.62, + "learning_rate": 9.20724410088415e-07, + "loss": 0.571, + "step": 63148 + }, + { + "epoch": 1.62, + "learning_rate": 9.206968267510446e-07, + "loss": 0.6431, + "step": 63149 + }, + { + "epoch": 1.62, + "learning_rate": 9.206692434743931e-07, + "loss": 0.728, + "step": 63150 + }, + { + "epoch": 1.62, + "learning_rate": 9.206416602584814e-07, + "loss": 0.7646, + "step": 63151 + }, + { + "epoch": 1.62, + "learning_rate": 9.206140771033309e-07, + "loss": 0.6768, + "step": 63152 + }, + { + "epoch": 1.62, + "learning_rate": 9.205864940089623e-07, + "loss": 0.6479, + "step": 63153 + }, + { + "epoch": 1.62, + "learning_rate": 9.205589109753972e-07, + "loss": 0.7578, + "step": 63154 + }, + { + "epoch": 1.62, + "learning_rate": 9.205313280026563e-07, + "loss": 0.6465, + "step": 63155 + }, + { + "epoch": 1.62, + "learning_rate": 9.205037450907613e-07, + "loss": 0.6592, + "step": 63156 + }, + { + "epoch": 1.62, + "learning_rate": 9.204761622397328e-07, + "loss": 0.5596, + "step": 63157 + }, + { + "epoch": 1.62, + "learning_rate": 9.204485794495919e-07, + "loss": 0.6475, + "step": 63158 + }, + { + "epoch": 1.62, + "learning_rate": 9.204209967203599e-07, + "loss": 0.6914, + "step": 63159 + }, + { + "epoch": 1.62, + "learning_rate": 9.203934140520577e-07, + "loss": 0.8281, + "step": 63160 + }, + { + "epoch": 1.62, + "learning_rate": 9.20365831444707e-07, + "loss": 0.4509, + "step": 63161 + }, + { + "epoch": 1.62, + "learning_rate": 9.20338248898328e-07, + "loss": 0.6211, + "step": 63162 + }, + { + "epoch": 1.62, + "learning_rate": 9.203106664129428e-07, + "loss": 0.6787, + "step": 63163 + }, + { + "epoch": 1.62, + "learning_rate": 9.202830839885719e-07, + "loss": 0.7021, + "step": 63164 + }, + { + "epoch": 1.62, + "learning_rate": 9.202555016252365e-07, + "loss": 0.5879, + "step": 63165 + }, + { + "epoch": 1.62, + "learning_rate": 9.20227919322958e-07, + "loss": 0.7456, + "step": 63166 + }, + { + "epoch": 1.62, + "learning_rate": 9.202003370817574e-07, + "loss": 0.543, + "step": 63167 + }, + { + "epoch": 1.62, + "learning_rate": 9.201727549016554e-07, + "loss": 0.5957, + "step": 63168 + }, + { + "epoch": 1.62, + "learning_rate": 9.201451727826735e-07, + "loss": 0.5046, + "step": 63169 + }, + { + "epoch": 1.62, + "learning_rate": 9.201175907248327e-07, + "loss": 0.6199, + "step": 63170 + }, + { + "epoch": 1.62, + "learning_rate": 9.200900087281545e-07, + "loss": 0.5623, + "step": 63171 + }, + { + "epoch": 1.62, + "learning_rate": 9.200624267926593e-07, + "loss": 0.5432, + "step": 63172 + }, + { + "epoch": 1.62, + "learning_rate": 9.200348449183691e-07, + "loss": 0.7344, + "step": 63173 + }, + { + "epoch": 1.62, + "learning_rate": 9.20007263105304e-07, + "loss": 0.6689, + "step": 63174 + }, + { + "epoch": 1.62, + "learning_rate": 9.19979681353486e-07, + "loss": 0.752, + "step": 63175 + }, + { + "epoch": 1.62, + "learning_rate": 9.199520996629362e-07, + "loss": 0.624, + "step": 63176 + }, + { + "epoch": 1.62, + "learning_rate": 9.199245180336748e-07, + "loss": 0.5308, + "step": 63177 + }, + { + "epoch": 1.62, + "learning_rate": 9.198969364657239e-07, + "loss": 0.7139, + "step": 63178 + }, + { + "epoch": 1.62, + "learning_rate": 9.198693549591039e-07, + "loss": 0.6016, + "step": 63179 + }, + { + "epoch": 1.62, + "learning_rate": 9.198417735138365e-07, + "loss": 0.6274, + "step": 63180 + }, + { + "epoch": 1.62, + "learning_rate": 9.198141921299426e-07, + "loss": 0.6953, + "step": 63181 + }, + { + "epoch": 1.62, + "learning_rate": 9.19786610807443e-07, + "loss": 0.4951, + "step": 63182 + }, + { + "epoch": 1.62, + "learning_rate": 9.197590295463594e-07, + "loss": 0.6475, + "step": 63183 + }, + { + "epoch": 1.62, + "learning_rate": 9.197314483467124e-07, + "loss": 0.7158, + "step": 63184 + }, + { + "epoch": 1.62, + "learning_rate": 9.197038672085235e-07, + "loss": 0.918, + "step": 63185 + }, + { + "epoch": 1.62, + "learning_rate": 9.196762861318139e-07, + "loss": 0.6885, + "step": 63186 + }, + { + "epoch": 1.62, + "learning_rate": 9.196487051166041e-07, + "loss": 0.4902, + "step": 63187 + }, + { + "epoch": 1.62, + "learning_rate": 9.196211241629157e-07, + "loss": 0.7686, + "step": 63188 + }, + { + "epoch": 1.62, + "learning_rate": 9.195935432707696e-07, + "loss": 0.6002, + "step": 63189 + }, + { + "epoch": 1.62, + "learning_rate": 9.195659624401872e-07, + "loss": 0.6611, + "step": 63190 + }, + { + "epoch": 1.62, + "learning_rate": 9.195383816711892e-07, + "loss": 0.5886, + "step": 63191 + }, + { + "epoch": 1.62, + "learning_rate": 9.195108009637971e-07, + "loss": 0.6904, + "step": 63192 + }, + { + "epoch": 1.62, + "learning_rate": 9.194832203180317e-07, + "loss": 0.7285, + "step": 63193 + }, + { + "epoch": 1.62, + "learning_rate": 9.194556397339146e-07, + "loss": 0.6758, + "step": 63194 + }, + { + "epoch": 1.62, + "learning_rate": 9.194280592114664e-07, + "loss": 0.7139, + "step": 63195 + }, + { + "epoch": 1.62, + "learning_rate": 9.194004787507088e-07, + "loss": 0.5449, + "step": 63196 + }, + { + "epoch": 1.62, + "learning_rate": 9.193728983516623e-07, + "loss": 0.6963, + "step": 63197 + }, + { + "epoch": 1.62, + "learning_rate": 9.193453180143483e-07, + "loss": 0.646, + "step": 63198 + }, + { + "epoch": 1.62, + "learning_rate": 9.193177377387877e-07, + "loss": 0.6787, + "step": 63199 + }, + { + "epoch": 1.62, + "learning_rate": 9.19290157525002e-07, + "loss": 0.7256, + "step": 63200 + }, + { + "epoch": 1.62, + "learning_rate": 9.192625773730119e-07, + "loss": 0.6396, + "step": 63201 + }, + { + "epoch": 1.62, + "learning_rate": 9.192349972828389e-07, + "loss": 0.5254, + "step": 63202 + }, + { + "epoch": 1.62, + "learning_rate": 9.192074172545039e-07, + "loss": 0.6787, + "step": 63203 + }, + { + "epoch": 1.62, + "learning_rate": 9.191798372880281e-07, + "loss": 0.6934, + "step": 63204 + }, + { + "epoch": 1.62, + "learning_rate": 9.191522573834324e-07, + "loss": 0.6377, + "step": 63205 + }, + { + "epoch": 1.62, + "learning_rate": 9.191246775407386e-07, + "loss": 0.7139, + "step": 63206 + }, + { + "epoch": 1.62, + "learning_rate": 9.19097097759967e-07, + "loss": 0.5137, + "step": 63207 + }, + { + "epoch": 1.62, + "learning_rate": 9.19069518041139e-07, + "loss": 0.7227, + "step": 63208 + }, + { + "epoch": 1.62, + "learning_rate": 9.190419383842758e-07, + "loss": 0.5347, + "step": 63209 + }, + { + "epoch": 1.62, + "learning_rate": 9.190143587893983e-07, + "loss": 0.5488, + "step": 63210 + }, + { + "epoch": 1.62, + "learning_rate": 9.189867792565279e-07, + "loss": 0.6201, + "step": 63211 + }, + { + "epoch": 1.62, + "learning_rate": 9.189591997856854e-07, + "loss": 0.564, + "step": 63212 + }, + { + "epoch": 1.62, + "learning_rate": 9.189316203768924e-07, + "loss": 0.6343, + "step": 63213 + }, + { + "epoch": 1.62, + "learning_rate": 9.189040410301696e-07, + "loss": 0.6045, + "step": 63214 + }, + { + "epoch": 1.62, + "learning_rate": 9.188764617455383e-07, + "loss": 0.4961, + "step": 63215 + }, + { + "epoch": 1.62, + "learning_rate": 9.188488825230199e-07, + "loss": 0.8291, + "step": 63216 + }, + { + "epoch": 1.62, + "learning_rate": 9.18821303362635e-07, + "loss": 0.5664, + "step": 63217 + }, + { + "epoch": 1.62, + "learning_rate": 9.187937242644045e-07, + "loss": 0.6812, + "step": 63218 + }, + { + "epoch": 1.62, + "learning_rate": 9.187661452283502e-07, + "loss": 0.4111, + "step": 63219 + }, + { + "epoch": 1.62, + "learning_rate": 9.187385662544928e-07, + "loss": 0.5933, + "step": 63220 + }, + { + "epoch": 1.62, + "learning_rate": 9.187109873428537e-07, + "loss": 0.6055, + "step": 63221 + }, + { + "epoch": 1.62, + "learning_rate": 9.186834084934536e-07, + "loss": 0.6504, + "step": 63222 + }, + { + "epoch": 1.62, + "learning_rate": 9.186558297063142e-07, + "loss": 0.6436, + "step": 63223 + }, + { + "epoch": 1.62, + "learning_rate": 9.186282509814559e-07, + "loss": 0.7246, + "step": 63224 + }, + { + "epoch": 1.62, + "learning_rate": 9.186006723189006e-07, + "loss": 0.4796, + "step": 63225 + }, + { + "epoch": 1.62, + "learning_rate": 9.185730937186691e-07, + "loss": 0.5303, + "step": 63226 + }, + { + "epoch": 1.62, + "learning_rate": 9.18545515180782e-07, + "loss": 0.6116, + "step": 63227 + }, + { + "epoch": 1.62, + "learning_rate": 9.185179367052613e-07, + "loss": 0.5449, + "step": 63228 + }, + { + "epoch": 1.62, + "learning_rate": 9.184903582921272e-07, + "loss": 0.6802, + "step": 63229 + }, + { + "epoch": 1.62, + "learning_rate": 9.184627799414017e-07, + "loss": 0.6465, + "step": 63230 + }, + { + "epoch": 1.62, + "learning_rate": 9.18435201653105e-07, + "loss": 0.5786, + "step": 63231 + }, + { + "epoch": 1.62, + "learning_rate": 9.184076234272592e-07, + "loss": 0.7676, + "step": 63232 + }, + { + "epoch": 1.62, + "learning_rate": 9.183800452638845e-07, + "loss": 0.6865, + "step": 63233 + }, + { + "epoch": 1.62, + "learning_rate": 9.183524671630029e-07, + "loss": 0.6016, + "step": 63234 + }, + { + "epoch": 1.62, + "learning_rate": 9.183248891246349e-07, + "loss": 0.4863, + "step": 63235 + }, + { + "epoch": 1.62, + "learning_rate": 9.182973111488021e-07, + "loss": 0.6689, + "step": 63236 + }, + { + "epoch": 1.62, + "learning_rate": 9.182697332355248e-07, + "loss": 0.589, + "step": 63237 + }, + { + "epoch": 1.62, + "learning_rate": 9.182421553848248e-07, + "loss": 0.3691, + "step": 63238 + }, + { + "epoch": 1.62, + "learning_rate": 9.182145775967228e-07, + "loss": 0.7217, + "step": 63239 + }, + { + "epoch": 1.62, + "learning_rate": 9.181869998712404e-07, + "loss": 0.6416, + "step": 63240 + }, + { + "epoch": 1.62, + "learning_rate": 9.181594222083983e-07, + "loss": 0.8184, + "step": 63241 + }, + { + "epoch": 1.62, + "learning_rate": 9.181318446082178e-07, + "loss": 0.6069, + "step": 63242 + }, + { + "epoch": 1.62, + "learning_rate": 9.1810426707072e-07, + "loss": 0.6758, + "step": 63243 + }, + { + "epoch": 1.62, + "learning_rate": 9.18076689595926e-07, + "loss": 0.4662, + "step": 63244 + }, + { + "epoch": 1.62, + "learning_rate": 9.180491121838572e-07, + "loss": 0.6992, + "step": 63245 + }, + { + "epoch": 1.62, + "learning_rate": 9.18021534834534e-07, + "loss": 0.709, + "step": 63246 + }, + { + "epoch": 1.62, + "learning_rate": 9.179939575479782e-07, + "loss": 0.8076, + "step": 63247 + }, + { + "epoch": 1.62, + "learning_rate": 9.179663803242104e-07, + "loss": 0.6108, + "step": 63248 + }, + { + "epoch": 1.62, + "learning_rate": 9.179388031632522e-07, + "loss": 0.6357, + "step": 63249 + }, + { + "epoch": 1.62, + "learning_rate": 9.179112260651242e-07, + "loss": 0.6255, + "step": 63250 + }, + { + "epoch": 1.62, + "learning_rate": 9.178836490298481e-07, + "loss": 0.6475, + "step": 63251 + }, + { + "epoch": 1.62, + "learning_rate": 9.178560720574444e-07, + "loss": 0.6255, + "step": 63252 + }, + { + "epoch": 1.62, + "learning_rate": 9.178284951479349e-07, + "loss": 0.6006, + "step": 63253 + }, + { + "epoch": 1.62, + "learning_rate": 9.178009183013402e-07, + "loss": 0.5796, + "step": 63254 + }, + { + "epoch": 1.62, + "learning_rate": 9.17773341517682e-07, + "loss": 0.6914, + "step": 63255 + }, + { + "epoch": 1.62, + "learning_rate": 9.177457647969803e-07, + "loss": 0.6191, + "step": 63256 + }, + { + "epoch": 1.62, + "learning_rate": 9.177181881392571e-07, + "loss": 0.7212, + "step": 63257 + }, + { + "epoch": 1.62, + "learning_rate": 9.176906115445332e-07, + "loss": 0.5073, + "step": 63258 + }, + { + "epoch": 1.62, + "learning_rate": 9.1766303501283e-07, + "loss": 0.5996, + "step": 63259 + }, + { + "epoch": 1.62, + "learning_rate": 9.176354585441682e-07, + "loss": 0.7373, + "step": 63260 + }, + { + "epoch": 1.62, + "learning_rate": 9.176078821385693e-07, + "loss": 0.6943, + "step": 63261 + }, + { + "epoch": 1.62, + "learning_rate": 9.175803057960541e-07, + "loss": 0.6538, + "step": 63262 + }, + { + "epoch": 1.62, + "learning_rate": 9.175527295166441e-07, + "loss": 0.7617, + "step": 63263 + }, + { + "epoch": 1.62, + "learning_rate": 9.1752515330036e-07, + "loss": 0.5801, + "step": 63264 + }, + { + "epoch": 1.62, + "learning_rate": 9.174975771472234e-07, + "loss": 0.7422, + "step": 63265 + }, + { + "epoch": 1.62, + "learning_rate": 9.17470001057255e-07, + "loss": 0.5435, + "step": 63266 + }, + { + "epoch": 1.62, + "learning_rate": 9.174424250304758e-07, + "loss": 0.6016, + "step": 63267 + }, + { + "epoch": 1.62, + "learning_rate": 9.174148490669073e-07, + "loss": 0.6396, + "step": 63268 + }, + { + "epoch": 1.62, + "learning_rate": 9.173872731665703e-07, + "loss": 0.7471, + "step": 63269 + }, + { + "epoch": 1.62, + "learning_rate": 9.173596973294863e-07, + "loss": 0.4133, + "step": 63270 + }, + { + "epoch": 1.62, + "learning_rate": 9.173321215556761e-07, + "loss": 0.7256, + "step": 63271 + }, + { + "epoch": 1.62, + "learning_rate": 9.173045458451608e-07, + "loss": 0.6655, + "step": 63272 + }, + { + "epoch": 1.62, + "learning_rate": 9.172769701979616e-07, + "loss": 0.6836, + "step": 63273 + }, + { + "epoch": 1.62, + "learning_rate": 9.172493946140995e-07, + "loss": 0.7295, + "step": 63274 + }, + { + "epoch": 1.62, + "learning_rate": 9.172218190935963e-07, + "loss": 0.5166, + "step": 63275 + }, + { + "epoch": 1.62, + "learning_rate": 9.171942436364723e-07, + "loss": 0.4756, + "step": 63276 + }, + { + "epoch": 1.62, + "learning_rate": 9.171666682427486e-07, + "loss": 0.6255, + "step": 63277 + }, + { + "epoch": 1.62, + "learning_rate": 9.171390929124468e-07, + "loss": 0.7314, + "step": 63278 + }, + { + "epoch": 1.62, + "learning_rate": 9.171115176455875e-07, + "loss": 0.6108, + "step": 63279 + }, + { + "epoch": 1.62, + "learning_rate": 9.170839424421923e-07, + "loss": 0.6099, + "step": 63280 + }, + { + "epoch": 1.62, + "learning_rate": 9.17056367302282e-07, + "loss": 0.522, + "step": 63281 + }, + { + "epoch": 1.62, + "learning_rate": 9.170287922258781e-07, + "loss": 0.5967, + "step": 63282 + }, + { + "epoch": 1.62, + "learning_rate": 9.170012172130011e-07, + "loss": 0.7871, + "step": 63283 + }, + { + "epoch": 1.62, + "learning_rate": 9.169736422636725e-07, + "loss": 0.6313, + "step": 63284 + }, + { + "epoch": 1.62, + "learning_rate": 9.169460673779139e-07, + "loss": 0.5791, + "step": 63285 + }, + { + "epoch": 1.62, + "learning_rate": 9.169184925557453e-07, + "loss": 0.5885, + "step": 63286 + }, + { + "epoch": 1.62, + "learning_rate": 9.168909177971886e-07, + "loss": 0.5977, + "step": 63287 + }, + { + "epoch": 1.62, + "learning_rate": 9.168633431022648e-07, + "loss": 0.5537, + "step": 63288 + }, + { + "epoch": 1.62, + "learning_rate": 9.168357684709946e-07, + "loss": 0.7217, + "step": 63289 + }, + { + "epoch": 1.62, + "learning_rate": 9.168081939033996e-07, + "loss": 0.6191, + "step": 63290 + }, + { + "epoch": 1.62, + "learning_rate": 9.167806193995006e-07, + "loss": 0.5798, + "step": 63291 + }, + { + "epoch": 1.62, + "learning_rate": 9.16753044959319e-07, + "loss": 0.834, + "step": 63292 + }, + { + "epoch": 1.62, + "learning_rate": 9.167254705828758e-07, + "loss": 0.6582, + "step": 63293 + }, + { + "epoch": 1.62, + "learning_rate": 9.16697896270192e-07, + "loss": 0.7666, + "step": 63294 + }, + { + "epoch": 1.62, + "learning_rate": 9.166703220212892e-07, + "loss": 0.6328, + "step": 63295 + }, + { + "epoch": 1.62, + "learning_rate": 9.166427478361875e-07, + "loss": 0.554, + "step": 63296 + }, + { + "epoch": 1.62, + "learning_rate": 9.16615173714909e-07, + "loss": 0.5942, + "step": 63297 + }, + { + "epoch": 1.62, + "learning_rate": 9.16587599657474e-07, + "loss": 0.7236, + "step": 63298 + }, + { + "epoch": 1.62, + "learning_rate": 9.165600256639044e-07, + "loss": 0.6475, + "step": 63299 + }, + { + "epoch": 1.62, + "learning_rate": 9.165324517342208e-07, + "loss": 0.6621, + "step": 63300 + }, + { + "epoch": 1.62, + "learning_rate": 9.165048778684445e-07, + "loss": 0.5791, + "step": 63301 + }, + { + "epoch": 1.62, + "learning_rate": 9.164773040665966e-07, + "loss": 0.644, + "step": 63302 + }, + { + "epoch": 1.62, + "learning_rate": 9.164497303286981e-07, + "loss": 0.6943, + "step": 63303 + }, + { + "epoch": 1.62, + "learning_rate": 9.164221566547702e-07, + "loss": 0.7227, + "step": 63304 + }, + { + "epoch": 1.62, + "learning_rate": 9.163945830448346e-07, + "loss": 0.5947, + "step": 63305 + }, + { + "epoch": 1.62, + "learning_rate": 9.163670094989112e-07, + "loss": 0.6543, + "step": 63306 + }, + { + "epoch": 1.62, + "learning_rate": 9.163394360170219e-07, + "loss": 0.6113, + "step": 63307 + }, + { + "epoch": 1.62, + "learning_rate": 9.163118625991875e-07, + "loss": 0.5557, + "step": 63308 + }, + { + "epoch": 1.62, + "learning_rate": 9.162842892454295e-07, + "loss": 0.6301, + "step": 63309 + }, + { + "epoch": 1.62, + "learning_rate": 9.162567159557684e-07, + "loss": 0.7549, + "step": 63310 + }, + { + "epoch": 1.62, + "learning_rate": 9.16229142730226e-07, + "loss": 0.6934, + "step": 63311 + }, + { + "epoch": 1.62, + "learning_rate": 9.162015695688228e-07, + "loss": 0.5815, + "step": 63312 + }, + { + "epoch": 1.62, + "learning_rate": 9.161739964715805e-07, + "loss": 0.6284, + "step": 63313 + }, + { + "epoch": 1.62, + "learning_rate": 9.161464234385197e-07, + "loss": 0.7266, + "step": 63314 + }, + { + "epoch": 1.62, + "learning_rate": 9.161188504696622e-07, + "loss": 0.7256, + "step": 63315 + }, + { + "epoch": 1.62, + "learning_rate": 9.160912775650284e-07, + "loss": 0.6108, + "step": 63316 + }, + { + "epoch": 1.62, + "learning_rate": 9.160637047246394e-07, + "loss": 0.6592, + "step": 63317 + }, + { + "epoch": 1.62, + "learning_rate": 9.160361319485167e-07, + "loss": 0.6641, + "step": 63318 + }, + { + "epoch": 1.62, + "learning_rate": 9.160085592366811e-07, + "loss": 0.728, + "step": 63319 + }, + { + "epoch": 1.62, + "learning_rate": 9.159809865891542e-07, + "loss": 0.5393, + "step": 63320 + }, + { + "epoch": 1.62, + "learning_rate": 9.159534140059565e-07, + "loss": 0.5809, + "step": 63321 + }, + { + "epoch": 1.62, + "learning_rate": 9.159258414871096e-07, + "loss": 0.5581, + "step": 63322 + }, + { + "epoch": 1.62, + "learning_rate": 9.158982690326343e-07, + "loss": 0.5393, + "step": 63323 + }, + { + "epoch": 1.62, + "learning_rate": 9.15870696642552e-07, + "loss": 0.6143, + "step": 63324 + }, + { + "epoch": 1.62, + "learning_rate": 9.158431243168838e-07, + "loss": 0.6279, + "step": 63325 + }, + { + "epoch": 1.62, + "learning_rate": 9.158155520556506e-07, + "loss": 0.709, + "step": 63326 + }, + { + "epoch": 1.62, + "learning_rate": 9.157879798588731e-07, + "loss": 0.5687, + "step": 63327 + }, + { + "epoch": 1.62, + "learning_rate": 9.157604077265733e-07, + "loss": 0.71, + "step": 63328 + }, + { + "epoch": 1.62, + "learning_rate": 9.157328356587715e-07, + "loss": 0.423, + "step": 63329 + }, + { + "epoch": 1.62, + "learning_rate": 9.157052636554895e-07, + "loss": 0.6772, + "step": 63330 + }, + { + "epoch": 1.62, + "learning_rate": 9.156776917167479e-07, + "loss": 0.7695, + "step": 63331 + }, + { + "epoch": 1.62, + "learning_rate": 9.156501198425681e-07, + "loss": 0.5206, + "step": 63332 + }, + { + "epoch": 1.62, + "learning_rate": 9.156225480329711e-07, + "loss": 0.7744, + "step": 63333 + }, + { + "epoch": 1.62, + "learning_rate": 9.155949762879781e-07, + "loss": 0.749, + "step": 63334 + }, + { + "epoch": 1.62, + "learning_rate": 9.155674046076105e-07, + "loss": 0.6992, + "step": 63335 + }, + { + "epoch": 1.62, + "learning_rate": 9.155398329918885e-07, + "loss": 0.5908, + "step": 63336 + }, + { + "epoch": 1.62, + "learning_rate": 9.15512261440834e-07, + "loss": 0.6553, + "step": 63337 + }, + { + "epoch": 1.62, + "learning_rate": 9.154846899544678e-07, + "loss": 0.583, + "step": 63338 + }, + { + "epoch": 1.62, + "learning_rate": 9.154571185328112e-07, + "loss": 0.7939, + "step": 63339 + }, + { + "epoch": 1.62, + "learning_rate": 9.154295471758849e-07, + "loss": 0.7061, + "step": 63340 + }, + { + "epoch": 1.62, + "learning_rate": 9.154019758837106e-07, + "loss": 0.6084, + "step": 63341 + }, + { + "epoch": 1.62, + "learning_rate": 9.153744046563089e-07, + "loss": 0.5168, + "step": 63342 + }, + { + "epoch": 1.62, + "learning_rate": 9.153468334937013e-07, + "loss": 0.6758, + "step": 63343 + }, + { + "epoch": 1.62, + "learning_rate": 9.153192623959089e-07, + "loss": 0.5801, + "step": 63344 + }, + { + "epoch": 1.62, + "learning_rate": 9.152916913629527e-07, + "loss": 0.5552, + "step": 63345 + }, + { + "epoch": 1.62, + "learning_rate": 9.152641203948533e-07, + "loss": 0.6553, + "step": 63346 + }, + { + "epoch": 1.62, + "learning_rate": 9.152365494916325e-07, + "loss": 0.5718, + "step": 63347 + }, + { + "epoch": 1.62, + "learning_rate": 9.15208978653311e-07, + "loss": 0.6799, + "step": 63348 + }, + { + "epoch": 1.62, + "learning_rate": 9.151814078799104e-07, + "loss": 0.6089, + "step": 63349 + }, + { + "epoch": 1.62, + "learning_rate": 9.151538371714512e-07, + "loss": 0.7148, + "step": 63350 + }, + { + "epoch": 1.62, + "learning_rate": 9.15126266527955e-07, + "loss": 0.8633, + "step": 63351 + }, + { + "epoch": 1.62, + "learning_rate": 9.150986959494426e-07, + "loss": 0.6602, + "step": 63352 + }, + { + "epoch": 1.62, + "learning_rate": 9.150711254359353e-07, + "loss": 0.5615, + "step": 63353 + }, + { + "epoch": 1.62, + "learning_rate": 9.150435549874539e-07, + "loss": 0.6001, + "step": 63354 + }, + { + "epoch": 1.62, + "learning_rate": 9.150159846040203e-07, + "loss": 0.6475, + "step": 63355 + }, + { + "epoch": 1.62, + "learning_rate": 9.149884142856548e-07, + "loss": 0.5898, + "step": 63356 + }, + { + "epoch": 1.62, + "learning_rate": 9.149608440323785e-07, + "loss": 0.6797, + "step": 63357 + }, + { + "epoch": 1.62, + "learning_rate": 9.149332738442131e-07, + "loss": 0.7402, + "step": 63358 + }, + { + "epoch": 1.62, + "learning_rate": 9.149057037211791e-07, + "loss": 0.413, + "step": 63359 + }, + { + "epoch": 1.62, + "learning_rate": 9.148781336632981e-07, + "loss": 0.6895, + "step": 63360 + }, + { + "epoch": 1.62, + "learning_rate": 9.148505636705908e-07, + "loss": 0.5342, + "step": 63361 + }, + { + "epoch": 1.62, + "learning_rate": 9.148229937430786e-07, + "loss": 0.7588, + "step": 63362 + }, + { + "epoch": 1.62, + "learning_rate": 9.147954238807826e-07, + "loss": 0.7168, + "step": 63363 + }, + { + "epoch": 1.62, + "learning_rate": 9.147678540837236e-07, + "loss": 0.7412, + "step": 63364 + }, + { + "epoch": 1.62, + "learning_rate": 9.147402843519234e-07, + "loss": 0.7393, + "step": 63365 + }, + { + "epoch": 1.62, + "learning_rate": 9.147127146854023e-07, + "loss": 0.3306, + "step": 63366 + }, + { + "epoch": 1.62, + "learning_rate": 9.146851450841817e-07, + "loss": 0.7275, + "step": 63367 + }, + { + "epoch": 1.62, + "learning_rate": 9.14657575548283e-07, + "loss": 0.6641, + "step": 63368 + }, + { + "epoch": 1.62, + "learning_rate": 9.146300060777268e-07, + "loss": 0.7217, + "step": 63369 + }, + { + "epoch": 1.62, + "learning_rate": 9.146024366725347e-07, + "loss": 0.7959, + "step": 63370 + }, + { + "epoch": 1.62, + "learning_rate": 9.145748673327272e-07, + "loss": 0.5571, + "step": 63371 + }, + { + "epoch": 1.62, + "learning_rate": 9.145472980583263e-07, + "loss": 0.5235, + "step": 63372 + }, + { + "epoch": 1.62, + "learning_rate": 9.145197288493522e-07, + "loss": 0.7368, + "step": 63373 + }, + { + "epoch": 1.62, + "learning_rate": 9.144921597058268e-07, + "loss": 0.7461, + "step": 63374 + }, + { + "epoch": 1.62, + "learning_rate": 9.144645906277708e-07, + "loss": 0.6338, + "step": 63375 + }, + { + "epoch": 1.62, + "learning_rate": 9.144370216152051e-07, + "loss": 0.7842, + "step": 63376 + }, + { + "epoch": 1.62, + "learning_rate": 9.144094526681512e-07, + "loss": 0.7246, + "step": 63377 + }, + { + "epoch": 1.62, + "learning_rate": 9.1438188378663e-07, + "loss": 0.5549, + "step": 63378 + }, + { + "epoch": 1.62, + "learning_rate": 9.143543149706624e-07, + "loss": 0.5574, + "step": 63379 + }, + { + "epoch": 1.62, + "learning_rate": 9.143267462202701e-07, + "loss": 0.7144, + "step": 63380 + }, + { + "epoch": 1.62, + "learning_rate": 9.142991775354734e-07, + "loss": 0.5879, + "step": 63381 + }, + { + "epoch": 1.62, + "learning_rate": 9.142716089162944e-07, + "loss": 0.7256, + "step": 63382 + }, + { + "epoch": 1.62, + "learning_rate": 9.142440403627534e-07, + "loss": 0.6108, + "step": 63383 + }, + { + "epoch": 1.62, + "learning_rate": 9.14216471874872e-07, + "loss": 0.5352, + "step": 63384 + }, + { + "epoch": 1.62, + "learning_rate": 9.141889034526712e-07, + "loss": 0.708, + "step": 63385 + }, + { + "epoch": 1.62, + "learning_rate": 9.141613350961717e-07, + "loss": 0.6172, + "step": 63386 + }, + { + "epoch": 1.62, + "learning_rate": 9.141337668053951e-07, + "loss": 0.6978, + "step": 63387 + }, + { + "epoch": 1.62, + "learning_rate": 9.141061985803621e-07, + "loss": 0.5046, + "step": 63388 + }, + { + "epoch": 1.62, + "learning_rate": 9.140786304210942e-07, + "loss": 0.426, + "step": 63389 + }, + { + "epoch": 1.62, + "learning_rate": 9.140510623276123e-07, + "loss": 0.4487, + "step": 63390 + }, + { + "epoch": 1.62, + "learning_rate": 9.140234942999376e-07, + "loss": 0.6538, + "step": 63391 + }, + { + "epoch": 1.62, + "learning_rate": 9.13995926338091e-07, + "loss": 0.7676, + "step": 63392 + }, + { + "epoch": 1.62, + "learning_rate": 9.13968358442094e-07, + "loss": 0.6274, + "step": 63393 + }, + { + "epoch": 1.62, + "learning_rate": 9.139407906119671e-07, + "loss": 0.562, + "step": 63394 + }, + { + "epoch": 1.62, + "learning_rate": 9.139132228477326e-07, + "loss": 0.6348, + "step": 63395 + }, + { + "epoch": 1.62, + "learning_rate": 9.138856551494102e-07, + "loss": 0.5869, + "step": 63396 + }, + { + "epoch": 1.62, + "learning_rate": 9.138580875170217e-07, + "loss": 0.6157, + "step": 63397 + }, + { + "epoch": 1.62, + "learning_rate": 9.138305199505879e-07, + "loss": 0.6172, + "step": 63398 + }, + { + "epoch": 1.62, + "learning_rate": 9.138029524501303e-07, + "loss": 0.5864, + "step": 63399 + }, + { + "epoch": 1.62, + "learning_rate": 9.137753850156697e-07, + "loss": 0.5913, + "step": 63400 + }, + { + "epoch": 1.62, + "learning_rate": 9.137478176472275e-07, + "loss": 0.5623, + "step": 63401 + }, + { + "epoch": 1.63, + "learning_rate": 9.137202503448243e-07, + "loss": 0.4895, + "step": 63402 + }, + { + "epoch": 1.63, + "learning_rate": 9.136926831084818e-07, + "loss": 0.498, + "step": 63403 + }, + { + "epoch": 1.63, + "learning_rate": 9.136651159382206e-07, + "loss": 0.6411, + "step": 63404 + }, + { + "epoch": 1.63, + "learning_rate": 9.136375488340625e-07, + "loss": 0.5068, + "step": 63405 + }, + { + "epoch": 1.63, + "learning_rate": 9.13609981796028e-07, + "loss": 0.4407, + "step": 63406 + }, + { + "epoch": 1.63, + "learning_rate": 9.135824148241382e-07, + "loss": 0.6038, + "step": 63407 + }, + { + "epoch": 1.63, + "learning_rate": 9.135548479184146e-07, + "loss": 0.6064, + "step": 63408 + }, + { + "epoch": 1.63, + "learning_rate": 9.135272810788777e-07, + "loss": 0.5159, + "step": 63409 + }, + { + "epoch": 1.63, + "learning_rate": 9.134997143055492e-07, + "loss": 0.6187, + "step": 63410 + }, + { + "epoch": 1.63, + "learning_rate": 9.134721475984499e-07, + "loss": 0.4857, + "step": 63411 + }, + { + "epoch": 1.63, + "learning_rate": 9.134445809576011e-07, + "loss": 0.6465, + "step": 63412 + }, + { + "epoch": 1.63, + "learning_rate": 9.134170143830236e-07, + "loss": 0.5845, + "step": 63413 + }, + { + "epoch": 1.63, + "learning_rate": 9.13389447874739e-07, + "loss": 0.6582, + "step": 63414 + }, + { + "epoch": 1.63, + "learning_rate": 9.133618814327684e-07, + "loss": 0.5811, + "step": 63415 + }, + { + "epoch": 1.63, + "learning_rate": 9.133343150571323e-07, + "loss": 0.5197, + "step": 63416 + }, + { + "epoch": 1.63, + "learning_rate": 9.13306748747852e-07, + "loss": 0.6528, + "step": 63417 + }, + { + "epoch": 1.63, + "learning_rate": 9.132791825049488e-07, + "loss": 0.7705, + "step": 63418 + }, + { + "epoch": 1.63, + "learning_rate": 9.132516163284436e-07, + "loss": 0.6245, + "step": 63419 + }, + { + "epoch": 1.63, + "learning_rate": 9.132240502183579e-07, + "loss": 0.5698, + "step": 63420 + }, + { + "epoch": 1.63, + "learning_rate": 9.131964841747124e-07, + "loss": 0.6431, + "step": 63421 + }, + { + "epoch": 1.63, + "learning_rate": 9.131689181975284e-07, + "loss": 0.4824, + "step": 63422 + }, + { + "epoch": 1.63, + "learning_rate": 9.131413522868269e-07, + "loss": 0.7334, + "step": 63423 + }, + { + "epoch": 1.63, + "learning_rate": 9.131137864426293e-07, + "loss": 0.5278, + "step": 63424 + }, + { + "epoch": 1.63, + "learning_rate": 9.130862206649565e-07, + "loss": 0.708, + "step": 63425 + }, + { + "epoch": 1.63, + "learning_rate": 9.130586549538292e-07, + "loss": 0.4844, + "step": 63426 + }, + { + "epoch": 1.63, + "learning_rate": 9.130310893092693e-07, + "loss": 0.7041, + "step": 63427 + }, + { + "epoch": 1.63, + "learning_rate": 9.130035237312972e-07, + "loss": 0.5552, + "step": 63428 + }, + { + "epoch": 1.63, + "learning_rate": 9.129759582199344e-07, + "loss": 0.7129, + "step": 63429 + }, + { + "epoch": 1.63, + "learning_rate": 9.129483927752019e-07, + "loss": 0.6304, + "step": 63430 + }, + { + "epoch": 1.63, + "learning_rate": 9.129208273971208e-07, + "loss": 0.603, + "step": 63431 + }, + { + "epoch": 1.63, + "learning_rate": 9.128932620857122e-07, + "loss": 0.583, + "step": 63432 + }, + { + "epoch": 1.63, + "learning_rate": 9.128656968409974e-07, + "loss": 0.7402, + "step": 63433 + }, + { + "epoch": 1.63, + "learning_rate": 9.128381316629972e-07, + "loss": 0.6885, + "step": 63434 + }, + { + "epoch": 1.63, + "learning_rate": 9.128105665517332e-07, + "loss": 0.6973, + "step": 63435 + }, + { + "epoch": 1.63, + "learning_rate": 9.127830015072255e-07, + "loss": 0.6851, + "step": 63436 + }, + { + "epoch": 1.63, + "learning_rate": 9.127554365294963e-07, + "loss": 0.7471, + "step": 63437 + }, + { + "epoch": 1.63, + "learning_rate": 9.127278716185659e-07, + "loss": 0.7139, + "step": 63438 + }, + { + "epoch": 1.63, + "learning_rate": 9.12700306774456e-07, + "loss": 0.666, + "step": 63439 + }, + { + "epoch": 1.63, + "learning_rate": 9.126727419971873e-07, + "loss": 0.5776, + "step": 63440 + }, + { + "epoch": 1.63, + "learning_rate": 9.126451772867811e-07, + "loss": 0.8916, + "step": 63441 + }, + { + "epoch": 1.63, + "learning_rate": 9.126176126432584e-07, + "loss": 0.5806, + "step": 63442 + }, + { + "epoch": 1.63, + "learning_rate": 9.125900480666406e-07, + "loss": 0.749, + "step": 63443 + }, + { + "epoch": 1.63, + "learning_rate": 9.125624835569483e-07, + "loss": 0.5957, + "step": 63444 + }, + { + "epoch": 1.63, + "learning_rate": 9.125349191142034e-07, + "loss": 0.6963, + "step": 63445 + }, + { + "epoch": 1.63, + "learning_rate": 9.125073547384263e-07, + "loss": 0.469, + "step": 63446 + }, + { + "epoch": 1.63, + "learning_rate": 9.12479790429638e-07, + "loss": 0.5454, + "step": 63447 + }, + { + "epoch": 1.63, + "learning_rate": 9.124522261878601e-07, + "loss": 0.627, + "step": 63448 + }, + { + "epoch": 1.63, + "learning_rate": 9.124246620131133e-07, + "loss": 0.4619, + "step": 63449 + }, + { + "epoch": 1.63, + "learning_rate": 9.123970979054192e-07, + "loss": 0.5345, + "step": 63450 + }, + { + "epoch": 1.63, + "learning_rate": 9.123695338647986e-07, + "loss": 0.6499, + "step": 63451 + }, + { + "epoch": 1.63, + "learning_rate": 9.123419698912723e-07, + "loss": 0.666, + "step": 63452 + }, + { + "epoch": 1.63, + "learning_rate": 9.12314405984862e-07, + "loss": 0.5283, + "step": 63453 + }, + { + "epoch": 1.63, + "learning_rate": 9.122868421455883e-07, + "loss": 0.6519, + "step": 63454 + }, + { + "epoch": 1.63, + "learning_rate": 9.12259278373473e-07, + "loss": 0.6743, + "step": 63455 + }, + { + "epoch": 1.63, + "learning_rate": 9.122317146685365e-07, + "loss": 0.6973, + "step": 63456 + }, + { + "epoch": 1.63, + "learning_rate": 9.122041510308e-07, + "loss": 0.5337, + "step": 63457 + }, + { + "epoch": 1.63, + "learning_rate": 9.121765874602848e-07, + "loss": 0.4929, + "step": 63458 + }, + { + "epoch": 1.63, + "learning_rate": 9.121490239570118e-07, + "loss": 0.6621, + "step": 63459 + }, + { + "epoch": 1.63, + "learning_rate": 9.121214605210025e-07, + "loss": 0.5649, + "step": 63460 + }, + { + "epoch": 1.63, + "learning_rate": 9.120938971522775e-07, + "loss": 0.585, + "step": 63461 + }, + { + "epoch": 1.63, + "learning_rate": 9.120663338508584e-07, + "loss": 0.6768, + "step": 63462 + }, + { + "epoch": 1.63, + "learning_rate": 9.120387706167658e-07, + "loss": 0.5425, + "step": 63463 + }, + { + "epoch": 1.63, + "learning_rate": 9.120112074500213e-07, + "loss": 0.5596, + "step": 63464 + }, + { + "epoch": 1.63, + "learning_rate": 9.119836443506461e-07, + "loss": 0.5022, + "step": 63465 + }, + { + "epoch": 1.63, + "learning_rate": 9.119560813186605e-07, + "loss": 0.4922, + "step": 63466 + }, + { + "epoch": 1.63, + "learning_rate": 9.119285183540863e-07, + "loss": 0.626, + "step": 63467 + }, + { + "epoch": 1.63, + "learning_rate": 9.119009554569444e-07, + "loss": 0.5327, + "step": 63468 + }, + { + "epoch": 1.63, + "learning_rate": 9.118733926272555e-07, + "loss": 0.5015, + "step": 63469 + }, + { + "epoch": 1.63, + "learning_rate": 9.118458298650414e-07, + "loss": 0.8525, + "step": 63470 + }, + { + "epoch": 1.63, + "learning_rate": 9.118182671703227e-07, + "loss": 0.5869, + "step": 63471 + }, + { + "epoch": 1.63, + "learning_rate": 9.11790704543121e-07, + "loss": 0.6387, + "step": 63472 + }, + { + "epoch": 1.63, + "learning_rate": 9.117631419834568e-07, + "loss": 0.7471, + "step": 63473 + }, + { + "epoch": 1.63, + "learning_rate": 9.117355794913517e-07, + "loss": 0.5596, + "step": 63474 + }, + { + "epoch": 1.63, + "learning_rate": 9.117080170668268e-07, + "loss": 0.6191, + "step": 63475 + }, + { + "epoch": 1.63, + "learning_rate": 9.116804547099026e-07, + "loss": 0.668, + "step": 63476 + }, + { + "epoch": 1.63, + "learning_rate": 9.11652892420601e-07, + "loss": 0.5161, + "step": 63477 + }, + { + "epoch": 1.63, + "learning_rate": 9.116253301989423e-07, + "loss": 0.6816, + "step": 63478 + }, + { + "epoch": 1.63, + "learning_rate": 9.115977680449483e-07, + "loss": 0.6895, + "step": 63479 + }, + { + "epoch": 1.63, + "learning_rate": 9.115702059586396e-07, + "loss": 0.7754, + "step": 63480 + }, + { + "epoch": 1.63, + "learning_rate": 9.115426439400378e-07, + "loss": 0.5796, + "step": 63481 + }, + { + "epoch": 1.63, + "learning_rate": 9.115150819891634e-07, + "loss": 0.6152, + "step": 63482 + }, + { + "epoch": 1.63, + "learning_rate": 9.114875201060382e-07, + "loss": 0.499, + "step": 63483 + }, + { + "epoch": 1.63, + "learning_rate": 9.114599582906825e-07, + "loss": 0.6973, + "step": 63484 + }, + { + "epoch": 1.63, + "learning_rate": 9.114323965431186e-07, + "loss": 0.6577, + "step": 63485 + }, + { + "epoch": 1.63, + "learning_rate": 9.114048348633663e-07, + "loss": 0.7007, + "step": 63486 + }, + { + "epoch": 1.63, + "learning_rate": 9.113772732514475e-07, + "loss": 0.5317, + "step": 63487 + }, + { + "epoch": 1.63, + "learning_rate": 9.113497117073826e-07, + "loss": 0.4019, + "step": 63488 + }, + { + "epoch": 1.63, + "learning_rate": 9.113221502311935e-07, + "loss": 0.5679, + "step": 63489 + }, + { + "epoch": 1.63, + "learning_rate": 9.112945888229007e-07, + "loss": 0.5903, + "step": 63490 + }, + { + "epoch": 1.63, + "learning_rate": 9.112670274825258e-07, + "loss": 0.5242, + "step": 63491 + }, + { + "epoch": 1.63, + "learning_rate": 9.112394662100893e-07, + "loss": 0.6162, + "step": 63492 + }, + { + "epoch": 1.63, + "learning_rate": 9.11211905005613e-07, + "loss": 0.5225, + "step": 63493 + }, + { + "epoch": 1.63, + "learning_rate": 9.111843438691174e-07, + "loss": 0.6787, + "step": 63494 + }, + { + "epoch": 1.63, + "learning_rate": 9.111567828006244e-07, + "loss": 0.6489, + "step": 63495 + }, + { + "epoch": 1.63, + "learning_rate": 9.111292218001543e-07, + "loss": 0.582, + "step": 63496 + }, + { + "epoch": 1.63, + "learning_rate": 9.111016608677282e-07, + "loss": 0.7744, + "step": 63497 + }, + { + "epoch": 1.63, + "learning_rate": 9.110741000033678e-07, + "loss": 0.4829, + "step": 63498 + }, + { + "epoch": 1.63, + "learning_rate": 9.110465392070935e-07, + "loss": 0.645, + "step": 63499 + }, + { + "epoch": 1.63, + "learning_rate": 9.110189784789272e-07, + "loss": 0.5054, + "step": 63500 + }, + { + "epoch": 1.63, + "learning_rate": 9.109914178188892e-07, + "loss": 0.6665, + "step": 63501 + }, + { + "epoch": 1.63, + "learning_rate": 9.109638572270012e-07, + "loss": 0.6611, + "step": 63502 + }, + { + "epoch": 1.63, + "learning_rate": 9.109362967032838e-07, + "loss": 0.6284, + "step": 63503 + }, + { + "epoch": 1.63, + "learning_rate": 9.109087362477588e-07, + "loss": 0.8359, + "step": 63504 + }, + { + "epoch": 1.63, + "learning_rate": 9.10881175860447e-07, + "loss": 0.5688, + "step": 63505 + }, + { + "epoch": 1.63, + "learning_rate": 9.108536155413691e-07, + "loss": 0.6245, + "step": 63506 + }, + { + "epoch": 1.63, + "learning_rate": 9.108260552905464e-07, + "loss": 0.625, + "step": 63507 + }, + { + "epoch": 1.63, + "learning_rate": 9.107984951080003e-07, + "loss": 0.6011, + "step": 63508 + }, + { + "epoch": 1.63, + "learning_rate": 9.107709349937514e-07, + "loss": 0.666, + "step": 63509 + }, + { + "epoch": 1.63, + "learning_rate": 9.107433749478213e-07, + "loss": 0.6655, + "step": 63510 + }, + { + "epoch": 1.63, + "learning_rate": 9.107158149702306e-07, + "loss": 0.7676, + "step": 63511 + }, + { + "epoch": 1.63, + "learning_rate": 9.10688255061001e-07, + "loss": 0.5791, + "step": 63512 + }, + { + "epoch": 1.63, + "learning_rate": 9.106606952201531e-07, + "loss": 0.5762, + "step": 63513 + }, + { + "epoch": 1.63, + "learning_rate": 9.106331354477084e-07, + "loss": 0.647, + "step": 63514 + }, + { + "epoch": 1.63, + "learning_rate": 9.106055757436881e-07, + "loss": 0.6494, + "step": 63515 + }, + { + "epoch": 1.63, + "learning_rate": 9.105780161081124e-07, + "loss": 0.6133, + "step": 63516 + }, + { + "epoch": 1.63, + "learning_rate": 9.105504565410034e-07, + "loss": 0.5435, + "step": 63517 + }, + { + "epoch": 1.63, + "learning_rate": 9.105228970423813e-07, + "loss": 0.6338, + "step": 63518 + }, + { + "epoch": 1.63, + "learning_rate": 9.104953376122683e-07, + "loss": 0.6365, + "step": 63519 + }, + { + "epoch": 1.63, + "learning_rate": 9.104677782506844e-07, + "loss": 0.6338, + "step": 63520 + }, + { + "epoch": 1.63, + "learning_rate": 9.104402189576515e-07, + "loss": 0.6016, + "step": 63521 + }, + { + "epoch": 1.63, + "learning_rate": 9.104126597331902e-07, + "loss": 0.6768, + "step": 63522 + }, + { + "epoch": 1.63, + "learning_rate": 9.103851005773221e-07, + "loss": 0.4993, + "step": 63523 + }, + { + "epoch": 1.63, + "learning_rate": 9.103575414900679e-07, + "loss": 0.5659, + "step": 63524 + }, + { + "epoch": 1.63, + "learning_rate": 9.103299824714491e-07, + "loss": 0.5432, + "step": 63525 + }, + { + "epoch": 1.63, + "learning_rate": 9.10302423521486e-07, + "loss": 0.5483, + "step": 63526 + }, + { + "epoch": 1.63, + "learning_rate": 9.102748646402005e-07, + "loss": 0.6475, + "step": 63527 + }, + { + "epoch": 1.63, + "learning_rate": 9.102473058276132e-07, + "loss": 0.708, + "step": 63528 + }, + { + "epoch": 1.63, + "learning_rate": 9.102197470837456e-07, + "loss": 0.6333, + "step": 63529 + }, + { + "epoch": 1.63, + "learning_rate": 9.101921884086184e-07, + "loss": 0.6333, + "step": 63530 + }, + { + "epoch": 1.63, + "learning_rate": 9.101646298022531e-07, + "loss": 0.6187, + "step": 63531 + }, + { + "epoch": 1.63, + "learning_rate": 9.101370712646704e-07, + "loss": 0.7349, + "step": 63532 + }, + { + "epoch": 1.63, + "learning_rate": 9.101095127958918e-07, + "loss": 0.7441, + "step": 63533 + }, + { + "epoch": 1.63, + "learning_rate": 9.100819543959385e-07, + "loss": 0.6191, + "step": 63534 + }, + { + "epoch": 1.63, + "learning_rate": 9.100543960648308e-07, + "loss": 0.5898, + "step": 63535 + }, + { + "epoch": 1.63, + "learning_rate": 9.100268378025906e-07, + "loss": 0.6885, + "step": 63536 + }, + { + "epoch": 1.63, + "learning_rate": 9.099992796092385e-07, + "loss": 0.5376, + "step": 63537 + }, + { + "epoch": 1.63, + "learning_rate": 9.099717214847959e-07, + "loss": 0.666, + "step": 63538 + }, + { + "epoch": 1.63, + "learning_rate": 9.099441634292837e-07, + "loss": 0.6641, + "step": 63539 + }, + { + "epoch": 1.63, + "learning_rate": 9.099166054427234e-07, + "loss": 0.5845, + "step": 63540 + }, + { + "epoch": 1.63, + "learning_rate": 9.098890475251357e-07, + "loss": 1.0518, + "step": 63541 + }, + { + "epoch": 1.63, + "learning_rate": 9.098614896765417e-07, + "loss": 0.7686, + "step": 63542 + }, + { + "epoch": 1.63, + "learning_rate": 9.098339318969628e-07, + "loss": 0.6851, + "step": 63543 + }, + { + "epoch": 1.63, + "learning_rate": 9.0980637418642e-07, + "loss": 0.668, + "step": 63544 + }, + { + "epoch": 1.63, + "learning_rate": 9.097788165449341e-07, + "loss": 0.7637, + "step": 63545 + }, + { + "epoch": 1.63, + "learning_rate": 9.097512589725265e-07, + "loss": 0.5757, + "step": 63546 + }, + { + "epoch": 1.63, + "learning_rate": 9.09723701469218e-07, + "loss": 0.6763, + "step": 63547 + }, + { + "epoch": 1.63, + "learning_rate": 9.0969614403503e-07, + "loss": 0.4348, + "step": 63548 + }, + { + "epoch": 1.63, + "learning_rate": 9.096685866699835e-07, + "loss": 0.6001, + "step": 63549 + }, + { + "epoch": 1.63, + "learning_rate": 9.096410293740997e-07, + "loss": 0.5483, + "step": 63550 + }, + { + "epoch": 1.63, + "learning_rate": 9.096134721473995e-07, + "loss": 0.4819, + "step": 63551 + }, + { + "epoch": 1.63, + "learning_rate": 9.095859149899042e-07, + "loss": 0.5515, + "step": 63552 + }, + { + "epoch": 1.63, + "learning_rate": 9.095583579016347e-07, + "loss": 0.6152, + "step": 63553 + }, + { + "epoch": 1.63, + "learning_rate": 9.095308008826126e-07, + "loss": 0.646, + "step": 63554 + }, + { + "epoch": 1.63, + "learning_rate": 9.095032439328584e-07, + "loss": 0.7393, + "step": 63555 + }, + { + "epoch": 1.63, + "learning_rate": 9.09475687052393e-07, + "loss": 0.5239, + "step": 63556 + }, + { + "epoch": 1.63, + "learning_rate": 9.094481302412385e-07, + "loss": 0.6943, + "step": 63557 + }, + { + "epoch": 1.63, + "learning_rate": 9.094205734994152e-07, + "loss": 0.6709, + "step": 63558 + }, + { + "epoch": 1.63, + "learning_rate": 9.093930168269442e-07, + "loss": 0.564, + "step": 63559 + }, + { + "epoch": 1.63, + "learning_rate": 9.093654602238469e-07, + "loss": 0.6104, + "step": 63560 + }, + { + "epoch": 1.63, + "learning_rate": 9.093379036901442e-07, + "loss": 0.6323, + "step": 63561 + }, + { + "epoch": 1.63, + "learning_rate": 9.093103472258574e-07, + "loss": 0.5659, + "step": 63562 + }, + { + "epoch": 1.63, + "learning_rate": 9.092827908310075e-07, + "loss": 0.623, + "step": 63563 + }, + { + "epoch": 1.63, + "learning_rate": 9.092552345056159e-07, + "loss": 0.8389, + "step": 63564 + }, + { + "epoch": 1.63, + "learning_rate": 9.092276782497031e-07, + "loss": 0.53, + "step": 63565 + }, + { + "epoch": 1.63, + "learning_rate": 9.092001220632904e-07, + "loss": 0.5442, + "step": 63566 + }, + { + "epoch": 1.63, + "learning_rate": 9.091725659463991e-07, + "loss": 0.6387, + "step": 63567 + }, + { + "epoch": 1.63, + "learning_rate": 9.091450098990501e-07, + "loss": 0.5161, + "step": 63568 + }, + { + "epoch": 1.63, + "learning_rate": 9.091174539212647e-07, + "loss": 0.6509, + "step": 63569 + }, + { + "epoch": 1.63, + "learning_rate": 9.090898980130638e-07, + "loss": 0.5659, + "step": 63570 + }, + { + "epoch": 1.63, + "learning_rate": 9.090623421744688e-07, + "loss": 0.542, + "step": 63571 + }, + { + "epoch": 1.63, + "learning_rate": 9.090347864055002e-07, + "loss": 0.5771, + "step": 63572 + }, + { + "epoch": 1.63, + "learning_rate": 9.090072307061798e-07, + "loss": 0.5469, + "step": 63573 + }, + { + "epoch": 1.63, + "learning_rate": 9.089796750765285e-07, + "loss": 0.7383, + "step": 63574 + }, + { + "epoch": 1.63, + "learning_rate": 9.089521195165671e-07, + "loss": 0.5996, + "step": 63575 + }, + { + "epoch": 1.63, + "learning_rate": 9.089245640263168e-07, + "loss": 0.6279, + "step": 63576 + }, + { + "epoch": 1.63, + "learning_rate": 9.088970086057989e-07, + "loss": 0.4722, + "step": 63577 + }, + { + "epoch": 1.63, + "learning_rate": 9.08869453255034e-07, + "loss": 0.5889, + "step": 63578 + }, + { + "epoch": 1.63, + "learning_rate": 9.088418979740441e-07, + "loss": 0.5247, + "step": 63579 + }, + { + "epoch": 1.63, + "learning_rate": 9.088143427628493e-07, + "loss": 0.7061, + "step": 63580 + }, + { + "epoch": 1.63, + "learning_rate": 9.087867876214715e-07, + "loss": 0.7515, + "step": 63581 + }, + { + "epoch": 1.63, + "learning_rate": 9.087592325499312e-07, + "loss": 0.6924, + "step": 63582 + }, + { + "epoch": 1.63, + "learning_rate": 9.0873167754825e-07, + "loss": 0.6953, + "step": 63583 + }, + { + "epoch": 1.63, + "learning_rate": 9.087041226164489e-07, + "loss": 0.7979, + "step": 63584 + }, + { + "epoch": 1.63, + "learning_rate": 9.086765677545485e-07, + "loss": 0.6543, + "step": 63585 + }, + { + "epoch": 1.63, + "learning_rate": 9.086490129625705e-07, + "loss": 0.5566, + "step": 63586 + }, + { + "epoch": 1.63, + "learning_rate": 9.086214582405355e-07, + "loss": 0.7373, + "step": 63587 + }, + { + "epoch": 1.63, + "learning_rate": 9.08593903588465e-07, + "loss": 0.5405, + "step": 63588 + }, + { + "epoch": 1.63, + "learning_rate": 9.085663490063797e-07, + "loss": 0.7754, + "step": 63589 + }, + { + "epoch": 1.63, + "learning_rate": 9.085387944943013e-07, + "loss": 0.5991, + "step": 63590 + }, + { + "epoch": 1.63, + "learning_rate": 9.085112400522504e-07, + "loss": 0.7441, + "step": 63591 + }, + { + "epoch": 1.63, + "learning_rate": 9.084836856802482e-07, + "loss": 0.6396, + "step": 63592 + }, + { + "epoch": 1.63, + "learning_rate": 9.084561313783157e-07, + "loss": 0.4316, + "step": 63593 + }, + { + "epoch": 1.63, + "learning_rate": 9.084285771464748e-07, + "loss": 0.5278, + "step": 63594 + }, + { + "epoch": 1.63, + "learning_rate": 9.084010229847453e-07, + "loss": 0.6699, + "step": 63595 + }, + { + "epoch": 1.63, + "learning_rate": 9.083734688931492e-07, + "loss": 0.8525, + "step": 63596 + }, + { + "epoch": 1.63, + "learning_rate": 9.08345914871707e-07, + "loss": 0.6313, + "step": 63597 + }, + { + "epoch": 1.63, + "learning_rate": 9.083183609204404e-07, + "loss": 0.6494, + "step": 63598 + }, + { + "epoch": 1.63, + "learning_rate": 9.082908070393699e-07, + "loss": 0.7109, + "step": 63599 + }, + { + "epoch": 1.63, + "learning_rate": 9.082632532285173e-07, + "loss": 0.6421, + "step": 63600 + }, + { + "epoch": 1.63, + "learning_rate": 9.082356994879029e-07, + "loss": 0.4519, + "step": 63601 + }, + { + "epoch": 1.63, + "learning_rate": 9.082081458175485e-07, + "loss": 0.5977, + "step": 63602 + }, + { + "epoch": 1.63, + "learning_rate": 9.081805922174747e-07, + "loss": 0.4744, + "step": 63603 + }, + { + "epoch": 1.63, + "learning_rate": 9.081530386877032e-07, + "loss": 0.6533, + "step": 63604 + }, + { + "epoch": 1.63, + "learning_rate": 9.081254852282546e-07, + "loss": 0.4424, + "step": 63605 + }, + { + "epoch": 1.63, + "learning_rate": 9.080979318391498e-07, + "loss": 0.627, + "step": 63606 + }, + { + "epoch": 1.63, + "learning_rate": 9.080703785204103e-07, + "loss": 0.7627, + "step": 63607 + }, + { + "epoch": 1.63, + "learning_rate": 9.08042825272057e-07, + "loss": 0.6174, + "step": 63608 + }, + { + "epoch": 1.63, + "learning_rate": 9.080152720941112e-07, + "loss": 0.6729, + "step": 63609 + }, + { + "epoch": 1.63, + "learning_rate": 9.079877189865937e-07, + "loss": 0.5878, + "step": 63610 + }, + { + "epoch": 1.63, + "learning_rate": 9.079601659495261e-07, + "loss": 0.6836, + "step": 63611 + }, + { + "epoch": 1.63, + "learning_rate": 9.079326129829287e-07, + "loss": 0.7471, + "step": 63612 + }, + { + "epoch": 1.63, + "learning_rate": 9.079050600868236e-07, + "loss": 0.666, + "step": 63613 + }, + { + "epoch": 1.63, + "learning_rate": 9.078775072612314e-07, + "loss": 0.6309, + "step": 63614 + }, + { + "epoch": 1.63, + "learning_rate": 9.078499545061729e-07, + "loss": 0.7744, + "step": 63615 + }, + { + "epoch": 1.63, + "learning_rate": 9.078224018216692e-07, + "loss": 0.6479, + "step": 63616 + }, + { + "epoch": 1.63, + "learning_rate": 9.077948492077421e-07, + "loss": 0.6914, + "step": 63617 + }, + { + "epoch": 1.63, + "learning_rate": 9.077672966644119e-07, + "loss": 0.6172, + "step": 63618 + }, + { + "epoch": 1.63, + "learning_rate": 9.077397441917002e-07, + "loss": 0.8525, + "step": 63619 + }, + { + "epoch": 1.63, + "learning_rate": 9.077121917896278e-07, + "loss": 0.5234, + "step": 63620 + }, + { + "epoch": 1.63, + "learning_rate": 9.07684639458216e-07, + "loss": 0.5488, + "step": 63621 + }, + { + "epoch": 1.63, + "learning_rate": 9.076570871974858e-07, + "loss": 0.7246, + "step": 63622 + }, + { + "epoch": 1.63, + "learning_rate": 9.076295350074584e-07, + "loss": 0.5869, + "step": 63623 + }, + { + "epoch": 1.63, + "learning_rate": 9.076019828881551e-07, + "loss": 0.6324, + "step": 63624 + }, + { + "epoch": 1.63, + "learning_rate": 9.075744308395963e-07, + "loss": 0.6357, + "step": 63625 + }, + { + "epoch": 1.63, + "learning_rate": 9.075468788618037e-07, + "loss": 0.4751, + "step": 63626 + }, + { + "epoch": 1.63, + "learning_rate": 9.075193269547979e-07, + "loss": 0.6133, + "step": 63627 + }, + { + "epoch": 1.63, + "learning_rate": 9.074917751186006e-07, + "loss": 0.6846, + "step": 63628 + }, + { + "epoch": 1.63, + "learning_rate": 9.074642233532323e-07, + "loss": 0.7275, + "step": 63629 + }, + { + "epoch": 1.63, + "learning_rate": 9.074366716587148e-07, + "loss": 0.7622, + "step": 63630 + }, + { + "epoch": 1.63, + "learning_rate": 9.074091200350687e-07, + "loss": 0.7393, + "step": 63631 + }, + { + "epoch": 1.63, + "learning_rate": 9.073815684823149e-07, + "loss": 0.5361, + "step": 63632 + }, + { + "epoch": 1.63, + "learning_rate": 9.07354017000475e-07, + "loss": 0.6558, + "step": 63633 + }, + { + "epoch": 1.63, + "learning_rate": 9.0732646558957e-07, + "loss": 0.709, + "step": 63634 + }, + { + "epoch": 1.63, + "learning_rate": 9.072989142496206e-07, + "loss": 0.6543, + "step": 63635 + }, + { + "epoch": 1.63, + "learning_rate": 9.072713629806483e-07, + "loss": 0.6729, + "step": 63636 + }, + { + "epoch": 1.63, + "learning_rate": 9.072438117826739e-07, + "loss": 0.6504, + "step": 63637 + }, + { + "epoch": 1.63, + "learning_rate": 9.072162606557188e-07, + "loss": 0.426, + "step": 63638 + }, + { + "epoch": 1.63, + "learning_rate": 9.071887095998037e-07, + "loss": 0.6426, + "step": 63639 + }, + { + "epoch": 1.63, + "learning_rate": 9.071611586149503e-07, + "loss": 0.4778, + "step": 63640 + }, + { + "epoch": 1.63, + "learning_rate": 9.071336077011789e-07, + "loss": 0.6567, + "step": 63641 + }, + { + "epoch": 1.63, + "learning_rate": 9.071060568585114e-07, + "loss": 0.7056, + "step": 63642 + }, + { + "epoch": 1.63, + "learning_rate": 9.070785060869682e-07, + "loss": 0.7744, + "step": 63643 + }, + { + "epoch": 1.63, + "learning_rate": 9.070509553865713e-07, + "loss": 0.5459, + "step": 63644 + }, + { + "epoch": 1.63, + "learning_rate": 9.070234047573409e-07, + "loss": 0.7285, + "step": 63645 + }, + { + "epoch": 1.63, + "learning_rate": 9.069958541992981e-07, + "loss": 0.5336, + "step": 63646 + }, + { + "epoch": 1.63, + "learning_rate": 9.069683037124646e-07, + "loss": 0.79, + "step": 63647 + }, + { + "epoch": 1.63, + "learning_rate": 9.069407532968612e-07, + "loss": 0.7871, + "step": 63648 + }, + { + "epoch": 1.63, + "learning_rate": 9.069132029525088e-07, + "loss": 0.521, + "step": 63649 + }, + { + "epoch": 1.63, + "learning_rate": 9.068856526794288e-07, + "loss": 0.6611, + "step": 63650 + }, + { + "epoch": 1.63, + "learning_rate": 9.068581024776421e-07, + "loss": 0.7817, + "step": 63651 + }, + { + "epoch": 1.63, + "learning_rate": 9.0683055234717e-07, + "loss": 0.7637, + "step": 63652 + }, + { + "epoch": 1.63, + "learning_rate": 9.068030022880332e-07, + "loss": 0.4767, + "step": 63653 + }, + { + "epoch": 1.63, + "learning_rate": 9.067754523002535e-07, + "loss": 0.6196, + "step": 63654 + }, + { + "epoch": 1.63, + "learning_rate": 9.067479023838514e-07, + "loss": 0.7783, + "step": 63655 + }, + { + "epoch": 1.63, + "learning_rate": 9.067203525388478e-07, + "loss": 0.4922, + "step": 63656 + }, + { + "epoch": 1.63, + "learning_rate": 9.066928027652645e-07, + "loss": 0.4611, + "step": 63657 + }, + { + "epoch": 1.63, + "learning_rate": 9.06665253063122e-07, + "loss": 0.6729, + "step": 63658 + }, + { + "epoch": 1.63, + "learning_rate": 9.066377034324418e-07, + "loss": 0.5918, + "step": 63659 + }, + { + "epoch": 1.63, + "learning_rate": 9.066101538732446e-07, + "loss": 0.8525, + "step": 63660 + }, + { + "epoch": 1.63, + "learning_rate": 9.065826043855519e-07, + "loss": 0.6592, + "step": 63661 + }, + { + "epoch": 1.63, + "learning_rate": 9.065550549693845e-07, + "loss": 0.707, + "step": 63662 + }, + { + "epoch": 1.63, + "learning_rate": 9.065275056247636e-07, + "loss": 0.5781, + "step": 63663 + }, + { + "epoch": 1.63, + "learning_rate": 9.064999563517107e-07, + "loss": 0.7285, + "step": 63664 + }, + { + "epoch": 1.63, + "learning_rate": 9.06472407150246e-07, + "loss": 0.5989, + "step": 63665 + }, + { + "epoch": 1.63, + "learning_rate": 9.064448580203913e-07, + "loss": 0.5488, + "step": 63666 + }, + { + "epoch": 1.63, + "learning_rate": 9.064173089621674e-07, + "loss": 0.6709, + "step": 63667 + }, + { + "epoch": 1.63, + "learning_rate": 9.063897599755953e-07, + "loss": 0.6504, + "step": 63668 + }, + { + "epoch": 1.63, + "learning_rate": 9.063622110606965e-07, + "loss": 0.626, + "step": 63669 + }, + { + "epoch": 1.63, + "learning_rate": 9.063346622174917e-07, + "loss": 0.6089, + "step": 63670 + }, + { + "epoch": 1.63, + "learning_rate": 9.063071134460022e-07, + "loss": 0.6943, + "step": 63671 + }, + { + "epoch": 1.63, + "learning_rate": 9.062795647462489e-07, + "loss": 0.6631, + "step": 63672 + }, + { + "epoch": 1.63, + "learning_rate": 9.062520161182532e-07, + "loss": 0.5422, + "step": 63673 + }, + { + "epoch": 1.63, + "learning_rate": 9.062244675620362e-07, + "loss": 0.7529, + "step": 63674 + }, + { + "epoch": 1.63, + "learning_rate": 9.061969190776185e-07, + "loss": 0.7178, + "step": 63675 + }, + { + "epoch": 1.63, + "learning_rate": 9.061693706650216e-07, + "loss": 0.6064, + "step": 63676 + }, + { + "epoch": 1.63, + "learning_rate": 9.061418223242664e-07, + "loss": 0.7715, + "step": 63677 + }, + { + "epoch": 1.63, + "learning_rate": 9.061142740553742e-07, + "loss": 0.6367, + "step": 63678 + }, + { + "epoch": 1.63, + "learning_rate": 9.060867258583658e-07, + "loss": 0.6367, + "step": 63679 + }, + { + "epoch": 1.63, + "learning_rate": 9.060591777332628e-07, + "loss": 0.6221, + "step": 63680 + }, + { + "epoch": 1.63, + "learning_rate": 9.060316296800858e-07, + "loss": 0.8096, + "step": 63681 + }, + { + "epoch": 1.63, + "learning_rate": 9.06004081698856e-07, + "loss": 0.5537, + "step": 63682 + }, + { + "epoch": 1.63, + "learning_rate": 9.059765337895945e-07, + "loss": 0.7656, + "step": 63683 + }, + { + "epoch": 1.63, + "learning_rate": 9.059489859523231e-07, + "loss": 0.8555, + "step": 63684 + }, + { + "epoch": 1.63, + "learning_rate": 9.059214381870615e-07, + "loss": 0.5864, + "step": 63685 + }, + { + "epoch": 1.63, + "learning_rate": 9.058938904938319e-07, + "loss": 0.6187, + "step": 63686 + }, + { + "epoch": 1.63, + "learning_rate": 9.058663428726547e-07, + "loss": 0.5947, + "step": 63687 + }, + { + "epoch": 1.63, + "learning_rate": 9.058387953235515e-07, + "loss": 0.623, + "step": 63688 + }, + { + "epoch": 1.63, + "learning_rate": 9.05811247846543e-07, + "loss": 0.6436, + "step": 63689 + }, + { + "epoch": 1.63, + "learning_rate": 9.057837004416507e-07, + "loss": 0.6826, + "step": 63690 + }, + { + "epoch": 1.63, + "learning_rate": 9.057561531088955e-07, + "loss": 0.5107, + "step": 63691 + }, + { + "epoch": 1.63, + "learning_rate": 9.057286058482985e-07, + "loss": 0.6487, + "step": 63692 + }, + { + "epoch": 1.63, + "learning_rate": 9.057010586598805e-07, + "loss": 0.666, + "step": 63693 + }, + { + "epoch": 1.63, + "learning_rate": 9.056735115436633e-07, + "loss": 0.5491, + "step": 63694 + }, + { + "epoch": 1.63, + "learning_rate": 9.056459644996674e-07, + "loss": 0.6885, + "step": 63695 + }, + { + "epoch": 1.63, + "learning_rate": 9.056184175279139e-07, + "loss": 0.5332, + "step": 63696 + }, + { + "epoch": 1.63, + "learning_rate": 9.055908706284242e-07, + "loss": 0.7437, + "step": 63697 + }, + { + "epoch": 1.63, + "learning_rate": 9.055633238012191e-07, + "loss": 0.5122, + "step": 63698 + }, + { + "epoch": 1.63, + "learning_rate": 9.055357770463198e-07, + "loss": 0.6489, + "step": 63699 + }, + { + "epoch": 1.63, + "learning_rate": 9.055082303637473e-07, + "loss": 0.7812, + "step": 63700 + }, + { + "epoch": 1.63, + "learning_rate": 9.054806837535231e-07, + "loss": 0.6279, + "step": 63701 + }, + { + "epoch": 1.63, + "learning_rate": 9.054531372156677e-07, + "loss": 0.4487, + "step": 63702 + }, + { + "epoch": 1.63, + "learning_rate": 9.054255907502027e-07, + "loss": 0.5356, + "step": 63703 + }, + { + "epoch": 1.63, + "learning_rate": 9.053980443571493e-07, + "loss": 0.6543, + "step": 63704 + }, + { + "epoch": 1.63, + "learning_rate": 9.053704980365279e-07, + "loss": 0.6494, + "step": 63705 + }, + { + "epoch": 1.63, + "learning_rate": 9.053429517883598e-07, + "loss": 0.5447, + "step": 63706 + }, + { + "epoch": 1.63, + "learning_rate": 9.053154056126666e-07, + "loss": 0.7441, + "step": 63707 + }, + { + "epoch": 1.63, + "learning_rate": 9.052878595094687e-07, + "loss": 0.7861, + "step": 63708 + }, + { + "epoch": 1.63, + "learning_rate": 9.052603134787878e-07, + "loss": 0.6216, + "step": 63709 + }, + { + "epoch": 1.63, + "learning_rate": 9.052327675206444e-07, + "loss": 0.7031, + "step": 63710 + }, + { + "epoch": 1.63, + "learning_rate": 9.052052216350602e-07, + "loss": 0.4858, + "step": 63711 + }, + { + "epoch": 1.63, + "learning_rate": 9.051776758220557e-07, + "loss": 0.748, + "step": 63712 + }, + { + "epoch": 1.63, + "learning_rate": 9.051501300816527e-07, + "loss": 0.4192, + "step": 63713 + }, + { + "epoch": 1.63, + "learning_rate": 9.051225844138719e-07, + "loss": 0.478, + "step": 63714 + }, + { + "epoch": 1.63, + "learning_rate": 9.05095038818734e-07, + "loss": 0.8457, + "step": 63715 + }, + { + "epoch": 1.63, + "learning_rate": 9.050674932962607e-07, + "loss": 0.5327, + "step": 63716 + }, + { + "epoch": 1.63, + "learning_rate": 9.050399478464727e-07, + "loss": 0.666, + "step": 63717 + }, + { + "epoch": 1.63, + "learning_rate": 9.050124024693915e-07, + "loss": 0.7812, + "step": 63718 + }, + { + "epoch": 1.63, + "learning_rate": 9.049848571650376e-07, + "loss": 0.6943, + "step": 63719 + }, + { + "epoch": 1.63, + "learning_rate": 9.049573119334326e-07, + "loss": 0.7031, + "step": 63720 + }, + { + "epoch": 1.63, + "learning_rate": 9.049297667745975e-07, + "loss": 0.5212, + "step": 63721 + }, + { + "epoch": 1.63, + "learning_rate": 9.049022216885531e-07, + "loss": 0.6328, + "step": 63722 + }, + { + "epoch": 1.63, + "learning_rate": 9.048746766753209e-07, + "loss": 0.5703, + "step": 63723 + }, + { + "epoch": 1.63, + "learning_rate": 9.04847131734922e-07, + "loss": 0.5627, + "step": 63724 + }, + { + "epoch": 1.63, + "learning_rate": 9.048195868673768e-07, + "loss": 0.4658, + "step": 63725 + }, + { + "epoch": 1.63, + "learning_rate": 9.047920420727071e-07, + "loss": 0.666, + "step": 63726 + }, + { + "epoch": 1.63, + "learning_rate": 9.047644973509337e-07, + "loss": 0.3472, + "step": 63727 + }, + { + "epoch": 1.63, + "learning_rate": 9.047369527020778e-07, + "loss": 0.7822, + "step": 63728 + }, + { + "epoch": 1.63, + "learning_rate": 9.047094081261602e-07, + "loss": 0.7363, + "step": 63729 + }, + { + "epoch": 1.63, + "learning_rate": 9.046818636232024e-07, + "loss": 0.6377, + "step": 63730 + }, + { + "epoch": 1.63, + "learning_rate": 9.046543191932252e-07, + "loss": 0.6167, + "step": 63731 + }, + { + "epoch": 1.63, + "learning_rate": 9.0462677483625e-07, + "loss": 0.6602, + "step": 63732 + }, + { + "epoch": 1.63, + "learning_rate": 9.045992305522975e-07, + "loss": 0.6201, + "step": 63733 + }, + { + "epoch": 1.63, + "learning_rate": 9.045716863413894e-07, + "loss": 0.6274, + "step": 63734 + }, + { + "epoch": 1.63, + "learning_rate": 9.045441422035462e-07, + "loss": 0.5591, + "step": 63735 + }, + { + "epoch": 1.63, + "learning_rate": 9.045165981387887e-07, + "loss": 0.6309, + "step": 63736 + }, + { + "epoch": 1.63, + "learning_rate": 9.044890541471389e-07, + "loss": 0.6904, + "step": 63737 + }, + { + "epoch": 1.63, + "learning_rate": 9.044615102286175e-07, + "loss": 0.6738, + "step": 63738 + }, + { + "epoch": 1.63, + "learning_rate": 9.044339663832452e-07, + "loss": 0.8018, + "step": 63739 + }, + { + "epoch": 1.63, + "learning_rate": 9.044064226110436e-07, + "loss": 0.6079, + "step": 63740 + }, + { + "epoch": 1.63, + "learning_rate": 9.043788789120334e-07, + "loss": 0.5459, + "step": 63741 + }, + { + "epoch": 1.63, + "learning_rate": 9.043513352862362e-07, + "loss": 0.6704, + "step": 63742 + }, + { + "epoch": 1.63, + "learning_rate": 9.043237917336725e-07, + "loss": 0.5972, + "step": 63743 + }, + { + "epoch": 1.63, + "learning_rate": 9.042962482543641e-07, + "loss": 0.5538, + "step": 63744 + }, + { + "epoch": 1.63, + "learning_rate": 9.042687048483315e-07, + "loss": 0.6719, + "step": 63745 + }, + { + "epoch": 1.63, + "learning_rate": 9.042411615155957e-07, + "loss": 0.667, + "step": 63746 + }, + { + "epoch": 1.63, + "learning_rate": 9.042136182561782e-07, + "loss": 0.6011, + "step": 63747 + }, + { + "epoch": 1.63, + "learning_rate": 9.041860750700998e-07, + "loss": 0.446, + "step": 63748 + }, + { + "epoch": 1.63, + "learning_rate": 9.04158531957382e-07, + "loss": 0.5063, + "step": 63749 + }, + { + "epoch": 1.63, + "learning_rate": 9.041309889180451e-07, + "loss": 0.8076, + "step": 63750 + }, + { + "epoch": 1.63, + "learning_rate": 9.041034459521111e-07, + "loss": 0.5957, + "step": 63751 + }, + { + "epoch": 1.63, + "learning_rate": 9.040759030596006e-07, + "loss": 0.6237, + "step": 63752 + }, + { + "epoch": 1.63, + "learning_rate": 9.040483602405347e-07, + "loss": 0.7173, + "step": 63753 + }, + { + "epoch": 1.63, + "learning_rate": 9.04020817494935e-07, + "loss": 0.5112, + "step": 63754 + }, + { + "epoch": 1.63, + "learning_rate": 9.039932748228216e-07, + "loss": 0.6797, + "step": 63755 + }, + { + "epoch": 1.63, + "learning_rate": 9.039657322242164e-07, + "loss": 0.5942, + "step": 63756 + }, + { + "epoch": 1.63, + "learning_rate": 9.039381896991402e-07, + "loss": 0.6914, + "step": 63757 + }, + { + "epoch": 1.63, + "learning_rate": 9.03910647247614e-07, + "loss": 0.6084, + "step": 63758 + }, + { + "epoch": 1.63, + "learning_rate": 9.038831048696592e-07, + "loss": 0.667, + "step": 63759 + }, + { + "epoch": 1.63, + "learning_rate": 9.038555625652962e-07, + "loss": 0.427, + "step": 63760 + }, + { + "epoch": 1.63, + "learning_rate": 9.038280203345471e-07, + "loss": 0.5708, + "step": 63761 + }, + { + "epoch": 1.63, + "learning_rate": 9.038004781774321e-07, + "loss": 0.728, + "step": 63762 + }, + { + "epoch": 1.63, + "learning_rate": 9.037729360939729e-07, + "loss": 0.7344, + "step": 63763 + }, + { + "epoch": 1.63, + "learning_rate": 9.037453940841906e-07, + "loss": 0.5962, + "step": 63764 + }, + { + "epoch": 1.63, + "learning_rate": 9.037178521481055e-07, + "loss": 0.7949, + "step": 63765 + }, + { + "epoch": 1.63, + "learning_rate": 9.036903102857395e-07, + "loss": 0.6768, + "step": 63766 + }, + { + "epoch": 1.63, + "learning_rate": 9.036627684971132e-07, + "loss": 0.5679, + "step": 63767 + }, + { + "epoch": 1.63, + "learning_rate": 9.036352267822481e-07, + "loss": 0.5454, + "step": 63768 + }, + { + "epoch": 1.63, + "learning_rate": 9.036076851411647e-07, + "loss": 0.5884, + "step": 63769 + }, + { + "epoch": 1.63, + "learning_rate": 9.035801435738848e-07, + "loss": 0.6582, + "step": 63770 + }, + { + "epoch": 1.63, + "learning_rate": 9.03552602080429e-07, + "loss": 0.6436, + "step": 63771 + }, + { + "epoch": 1.63, + "learning_rate": 9.035250606608186e-07, + "loss": 0.5815, + "step": 63772 + }, + { + "epoch": 1.63, + "learning_rate": 9.034975193150746e-07, + "loss": 0.4535, + "step": 63773 + }, + { + "epoch": 1.63, + "learning_rate": 9.034699780432186e-07, + "loss": 0.7441, + "step": 63774 + }, + { + "epoch": 1.63, + "learning_rate": 9.034424368452707e-07, + "loss": 0.5923, + "step": 63775 + }, + { + "epoch": 1.63, + "learning_rate": 9.034148957212526e-07, + "loss": 0.7266, + "step": 63776 + }, + { + "epoch": 1.63, + "learning_rate": 9.03387354671185e-07, + "loss": 0.5205, + "step": 63777 + }, + { + "epoch": 1.63, + "learning_rate": 9.033598136950897e-07, + "loss": 0.71, + "step": 63778 + }, + { + "epoch": 1.63, + "learning_rate": 9.033322727929868e-07, + "loss": 0.7617, + "step": 63779 + }, + { + "epoch": 1.63, + "learning_rate": 9.033047319648984e-07, + "loss": 0.5615, + "step": 63780 + }, + { + "epoch": 1.63, + "learning_rate": 9.032771912108448e-07, + "loss": 0.623, + "step": 63781 + }, + { + "epoch": 1.63, + "learning_rate": 9.032496505308477e-07, + "loss": 0.6431, + "step": 63782 + }, + { + "epoch": 1.63, + "learning_rate": 9.032221099249276e-07, + "loss": 0.4873, + "step": 63783 + }, + { + "epoch": 1.63, + "learning_rate": 9.031945693931064e-07, + "loss": 0.6226, + "step": 63784 + }, + { + "epoch": 1.63, + "learning_rate": 9.031670289354044e-07, + "loss": 0.6641, + "step": 63785 + }, + { + "epoch": 1.63, + "learning_rate": 9.031394885518428e-07, + "loss": 0.7158, + "step": 63786 + }, + { + "epoch": 1.63, + "learning_rate": 9.03111948242443e-07, + "loss": 0.5234, + "step": 63787 + }, + { + "epoch": 1.63, + "learning_rate": 9.030844080072257e-07, + "loss": 0.6006, + "step": 63788 + }, + { + "epoch": 1.63, + "learning_rate": 9.030568678462124e-07, + "loss": 0.563, + "step": 63789 + }, + { + "epoch": 1.63, + "learning_rate": 9.030293277594237e-07, + "loss": 0.7695, + "step": 63790 + }, + { + "epoch": 1.63, + "learning_rate": 9.030017877468814e-07, + "loss": 0.6914, + "step": 63791 + }, + { + "epoch": 1.64, + "learning_rate": 9.029742478086059e-07, + "loss": 0.6816, + "step": 63792 + }, + { + "epoch": 1.64, + "learning_rate": 9.029467079446186e-07, + "loss": 0.6172, + "step": 63793 + }, + { + "epoch": 1.64, + "learning_rate": 9.02919168154941e-07, + "loss": 0.707, + "step": 63794 + }, + { + "epoch": 1.64, + "learning_rate": 9.028916284395935e-07, + "loss": 0.7188, + "step": 63795 + }, + { + "epoch": 1.64, + "learning_rate": 9.02864088798597e-07, + "loss": 0.7998, + "step": 63796 + }, + { + "epoch": 1.64, + "learning_rate": 9.028365492319734e-07, + "loss": 0.5599, + "step": 63797 + }, + { + "epoch": 1.64, + "learning_rate": 9.02809009739743e-07, + "loss": 0.45, + "step": 63798 + }, + { + "epoch": 1.64, + "learning_rate": 9.027814703219277e-07, + "loss": 0.7871, + "step": 63799 + }, + { + "epoch": 1.64, + "learning_rate": 9.027539309785478e-07, + "loss": 0.7646, + "step": 63800 + }, + { + "epoch": 1.64, + "learning_rate": 9.027263917096249e-07, + "loss": 0.5845, + "step": 63801 + }, + { + "epoch": 1.64, + "learning_rate": 9.026988525151799e-07, + "loss": 0.7861, + "step": 63802 + }, + { + "epoch": 1.64, + "learning_rate": 9.026713133952339e-07, + "loss": 0.7705, + "step": 63803 + }, + { + "epoch": 1.64, + "learning_rate": 9.026437743498084e-07, + "loss": 0.6523, + "step": 63804 + }, + { + "epoch": 1.64, + "learning_rate": 9.026162353789236e-07, + "loss": 0.6035, + "step": 63805 + }, + { + "epoch": 1.64, + "learning_rate": 9.025886964826014e-07, + "loss": 0.5809, + "step": 63806 + }, + { + "epoch": 1.64, + "learning_rate": 9.025611576608622e-07, + "loss": 0.5859, + "step": 63807 + }, + { + "epoch": 1.64, + "learning_rate": 9.025336189137277e-07, + "loss": 0.8203, + "step": 63808 + }, + { + "epoch": 1.64, + "learning_rate": 9.025060802412184e-07, + "loss": 0.7422, + "step": 63809 + }, + { + "epoch": 1.64, + "learning_rate": 9.024785416433562e-07, + "loss": 0.5503, + "step": 63810 + }, + { + "epoch": 1.64, + "learning_rate": 9.024510031201614e-07, + "loss": 0.6787, + "step": 63811 + }, + { + "epoch": 1.64, + "learning_rate": 9.024234646716553e-07, + "loss": 0.5605, + "step": 63812 + }, + { + "epoch": 1.64, + "learning_rate": 9.023959262978593e-07, + "loss": 0.5737, + "step": 63813 + }, + { + "epoch": 1.64, + "learning_rate": 9.023683879987945e-07, + "loss": 0.7773, + "step": 63814 + }, + { + "epoch": 1.64, + "learning_rate": 9.023408497744813e-07, + "loss": 0.644, + "step": 63815 + }, + { + "epoch": 1.64, + "learning_rate": 9.023133116249413e-07, + "loss": 0.8066, + "step": 63816 + }, + { + "epoch": 1.64, + "learning_rate": 9.022857735501953e-07, + "loss": 0.7021, + "step": 63817 + }, + { + "epoch": 1.64, + "learning_rate": 9.022582355502649e-07, + "loss": 0.6091, + "step": 63818 + }, + { + "epoch": 1.64, + "learning_rate": 9.022306976251705e-07, + "loss": 0.6855, + "step": 63819 + }, + { + "epoch": 1.64, + "learning_rate": 9.02203159774934e-07, + "loss": 0.6265, + "step": 63820 + }, + { + "epoch": 1.64, + "learning_rate": 9.021756219995757e-07, + "loss": 0.6504, + "step": 63821 + }, + { + "epoch": 1.64, + "learning_rate": 9.021480842991174e-07, + "loss": 0.7217, + "step": 63822 + }, + { + "epoch": 1.64, + "learning_rate": 9.021205466735794e-07, + "loss": 0.6279, + "step": 63823 + }, + { + "epoch": 1.64, + "learning_rate": 9.020930091229837e-07, + "loss": 0.6611, + "step": 63824 + }, + { + "epoch": 1.64, + "learning_rate": 9.020654716473507e-07, + "loss": 0.6069, + "step": 63825 + }, + { + "epoch": 1.64, + "learning_rate": 9.020379342467014e-07, + "loss": 0.7598, + "step": 63826 + }, + { + "epoch": 1.64, + "learning_rate": 9.020103969210574e-07, + "loss": 0.5703, + "step": 63827 + }, + { + "epoch": 1.64, + "learning_rate": 9.019828596704393e-07, + "loss": 0.6221, + "step": 63828 + }, + { + "epoch": 1.64, + "learning_rate": 9.019553224948687e-07, + "loss": 0.7285, + "step": 63829 + }, + { + "epoch": 1.64, + "learning_rate": 9.019277853943664e-07, + "loss": 0.7627, + "step": 63830 + }, + { + "epoch": 1.64, + "learning_rate": 9.019002483689531e-07, + "loss": 0.6641, + "step": 63831 + }, + { + "epoch": 1.64, + "learning_rate": 9.018727114186506e-07, + "loss": 0.7617, + "step": 63832 + }, + { + "epoch": 1.64, + "learning_rate": 9.018451745434799e-07, + "loss": 0.6797, + "step": 63833 + }, + { + "epoch": 1.64, + "learning_rate": 9.018176377434613e-07, + "loss": 0.6226, + "step": 63834 + }, + { + "epoch": 1.64, + "learning_rate": 9.017901010186167e-07, + "loss": 0.5962, + "step": 63835 + }, + { + "epoch": 1.64, + "learning_rate": 9.017625643689667e-07, + "loss": 0.5962, + "step": 63836 + }, + { + "epoch": 1.64, + "learning_rate": 9.017350277945328e-07, + "loss": 0.6489, + "step": 63837 + }, + { + "epoch": 1.64, + "learning_rate": 9.017074912953357e-07, + "loss": 0.6943, + "step": 63838 + }, + { + "epoch": 1.64, + "learning_rate": 9.016799548713968e-07, + "loss": 0.6113, + "step": 63839 + }, + { + "epoch": 1.64, + "learning_rate": 9.016524185227368e-07, + "loss": 0.7598, + "step": 63840 + }, + { + "epoch": 1.64, + "learning_rate": 9.016248822493773e-07, + "loss": 0.665, + "step": 63841 + }, + { + "epoch": 1.64, + "learning_rate": 9.015973460513389e-07, + "loss": 0.6284, + "step": 63842 + }, + { + "epoch": 1.64, + "learning_rate": 9.015698099286432e-07, + "loss": 0.7939, + "step": 63843 + }, + { + "epoch": 1.64, + "learning_rate": 9.015422738813109e-07, + "loss": 0.6455, + "step": 63844 + }, + { + "epoch": 1.64, + "learning_rate": 9.015147379093629e-07, + "loss": 0.6797, + "step": 63845 + }, + { + "epoch": 1.64, + "learning_rate": 9.014872020128207e-07, + "loss": 0.637, + "step": 63846 + }, + { + "epoch": 1.64, + "learning_rate": 9.014596661917052e-07, + "loss": 0.5396, + "step": 63847 + }, + { + "epoch": 1.64, + "learning_rate": 9.014321304460374e-07, + "loss": 0.6484, + "step": 63848 + }, + { + "epoch": 1.64, + "learning_rate": 9.014045947758387e-07, + "loss": 0.6035, + "step": 63849 + }, + { + "epoch": 1.64, + "learning_rate": 9.013770591811296e-07, + "loss": 0.5537, + "step": 63850 + }, + { + "epoch": 1.64, + "learning_rate": 9.013495236619318e-07, + "loss": 0.6665, + "step": 63851 + }, + { + "epoch": 1.64, + "learning_rate": 9.01321988218266e-07, + "loss": 0.665, + "step": 63852 + }, + { + "epoch": 1.64, + "learning_rate": 9.012944528501538e-07, + "loss": 0.6162, + "step": 63853 + }, + { + "epoch": 1.64, + "learning_rate": 9.012669175576158e-07, + "loss": 0.9404, + "step": 63854 + }, + { + "epoch": 1.64, + "learning_rate": 9.012393823406728e-07, + "loss": 0.6621, + "step": 63855 + }, + { + "epoch": 1.64, + "learning_rate": 9.012118471993466e-07, + "loss": 0.5562, + "step": 63856 + }, + { + "epoch": 1.64, + "learning_rate": 9.011843121336577e-07, + "loss": 0.5503, + "step": 63857 + }, + { + "epoch": 1.64, + "learning_rate": 9.011567771436276e-07, + "loss": 0.4727, + "step": 63858 + }, + { + "epoch": 1.64, + "learning_rate": 9.01129242229277e-07, + "loss": 0.6187, + "step": 63859 + }, + { + "epoch": 1.64, + "learning_rate": 9.011017073906274e-07, + "loss": 0.6006, + "step": 63860 + }, + { + "epoch": 1.64, + "learning_rate": 9.010741726276994e-07, + "loss": 0.6436, + "step": 63861 + }, + { + "epoch": 1.64, + "learning_rate": 9.010466379405148e-07, + "loss": 0.6611, + "step": 63862 + }, + { + "epoch": 1.64, + "learning_rate": 9.010191033290943e-07, + "loss": 0.7578, + "step": 63863 + }, + { + "epoch": 1.64, + "learning_rate": 9.009915687934587e-07, + "loss": 0.6758, + "step": 63864 + }, + { + "epoch": 1.64, + "learning_rate": 9.009640343336291e-07, + "loss": 0.7939, + "step": 63865 + }, + { + "epoch": 1.64, + "learning_rate": 9.00936499949627e-07, + "loss": 0.5532, + "step": 63866 + }, + { + "epoch": 1.64, + "learning_rate": 9.009089656414731e-07, + "loss": 0.5952, + "step": 63867 + }, + { + "epoch": 1.64, + "learning_rate": 9.008814314091888e-07, + "loss": 0.6465, + "step": 63868 + }, + { + "epoch": 1.64, + "learning_rate": 9.008538972527948e-07, + "loss": 0.665, + "step": 63869 + }, + { + "epoch": 1.64, + "learning_rate": 9.008263631723128e-07, + "loss": 0.5276, + "step": 63870 + }, + { + "epoch": 1.64, + "learning_rate": 9.00798829167763e-07, + "loss": 0.5967, + "step": 63871 + }, + { + "epoch": 1.64, + "learning_rate": 9.007712952391673e-07, + "loss": 0.7051, + "step": 63872 + }, + { + "epoch": 1.64, + "learning_rate": 9.007437613865468e-07, + "loss": 0.5972, + "step": 63873 + }, + { + "epoch": 1.64, + "learning_rate": 9.007162276099218e-07, + "loss": 0.6846, + "step": 63874 + }, + { + "epoch": 1.64, + "learning_rate": 9.006886939093139e-07, + "loss": 0.5796, + "step": 63875 + }, + { + "epoch": 1.64, + "learning_rate": 9.006611602847439e-07, + "loss": 0.6035, + "step": 63876 + }, + { + "epoch": 1.64, + "learning_rate": 9.006336267362333e-07, + "loss": 0.5186, + "step": 63877 + }, + { + "epoch": 1.64, + "learning_rate": 9.006060932638029e-07, + "loss": 0.5596, + "step": 63878 + }, + { + "epoch": 1.64, + "learning_rate": 9.005785598674739e-07, + "loss": 0.5447, + "step": 63879 + }, + { + "epoch": 1.64, + "learning_rate": 9.005510265472672e-07, + "loss": 0.5308, + "step": 63880 + }, + { + "epoch": 1.64, + "learning_rate": 9.005234933032041e-07, + "loss": 0.6943, + "step": 63881 + }, + { + "epoch": 1.64, + "learning_rate": 9.004959601353055e-07, + "loss": 0.5474, + "step": 63882 + }, + { + "epoch": 1.64, + "learning_rate": 9.004684270435931e-07, + "loss": 0.5088, + "step": 63883 + }, + { + "epoch": 1.64, + "learning_rate": 9.004408940280869e-07, + "loss": 0.5674, + "step": 63884 + }, + { + "epoch": 1.64, + "learning_rate": 9.004133610888087e-07, + "loss": 0.6499, + "step": 63885 + }, + { + "epoch": 1.64, + "learning_rate": 9.003858282257791e-07, + "loss": 0.5171, + "step": 63886 + }, + { + "epoch": 1.64, + "learning_rate": 9.003582954390198e-07, + "loss": 0.3039, + "step": 63887 + }, + { + "epoch": 1.64, + "learning_rate": 9.003307627285514e-07, + "loss": 0.5312, + "step": 63888 + }, + { + "epoch": 1.64, + "learning_rate": 9.003032300943953e-07, + "loss": 0.6367, + "step": 63889 + }, + { + "epoch": 1.64, + "learning_rate": 9.002756975365723e-07, + "loss": 0.5566, + "step": 63890 + }, + { + "epoch": 1.64, + "learning_rate": 9.002481650551038e-07, + "loss": 0.6392, + "step": 63891 + }, + { + "epoch": 1.64, + "learning_rate": 9.002206326500105e-07, + "loss": 0.7275, + "step": 63892 + }, + { + "epoch": 1.64, + "learning_rate": 9.00193100321314e-07, + "loss": 0.7354, + "step": 63893 + }, + { + "epoch": 1.64, + "learning_rate": 9.001655680690349e-07, + "loss": 0.6743, + "step": 63894 + }, + { + "epoch": 1.64, + "learning_rate": 9.001380358931942e-07, + "loss": 0.6304, + "step": 63895 + }, + { + "epoch": 1.64, + "learning_rate": 9.001105037938135e-07, + "loss": 0.6245, + "step": 63896 + }, + { + "epoch": 1.64, + "learning_rate": 9.000829717709133e-07, + "loss": 0.8574, + "step": 63897 + }, + { + "epoch": 1.64, + "learning_rate": 9.000554398245152e-07, + "loss": 0.6406, + "step": 63898 + }, + { + "epoch": 1.64, + "learning_rate": 9.000279079546399e-07, + "loss": 0.7842, + "step": 63899 + }, + { + "epoch": 1.64, + "learning_rate": 9.000003761613088e-07, + "loss": 0.4658, + "step": 63900 + }, + { + "epoch": 1.64, + "learning_rate": 8.999728444445428e-07, + "loss": 0.5344, + "step": 63901 + }, + { + "epoch": 1.64, + "learning_rate": 8.999453128043628e-07, + "loss": 0.7422, + "step": 63902 + }, + { + "epoch": 1.64, + "learning_rate": 8.999177812407905e-07, + "loss": 0.5435, + "step": 63903 + }, + { + "epoch": 1.64, + "learning_rate": 8.998902497538463e-07, + "loss": 0.6914, + "step": 63904 + }, + { + "epoch": 1.64, + "learning_rate": 8.998627183435513e-07, + "loss": 0.7168, + "step": 63905 + }, + { + "epoch": 1.64, + "learning_rate": 8.998351870099271e-07, + "loss": 0.7236, + "step": 63906 + }, + { + "epoch": 1.64, + "learning_rate": 8.998076557529944e-07, + "loss": 0.5005, + "step": 63907 + }, + { + "epoch": 1.64, + "learning_rate": 8.997801245727743e-07, + "loss": 0.6982, + "step": 63908 + }, + { + "epoch": 1.64, + "learning_rate": 8.997525934692879e-07, + "loss": 0.5491, + "step": 63909 + }, + { + "epoch": 1.64, + "learning_rate": 8.997250624425565e-07, + "loss": 0.5903, + "step": 63910 + }, + { + "epoch": 1.64, + "learning_rate": 8.996975314926009e-07, + "loss": 0.5674, + "step": 63911 + }, + { + "epoch": 1.64, + "learning_rate": 8.996700006194425e-07, + "loss": 0.7031, + "step": 63912 + }, + { + "epoch": 1.64, + "learning_rate": 8.996424698231022e-07, + "loss": 0.626, + "step": 63913 + }, + { + "epoch": 1.64, + "learning_rate": 8.996149391036006e-07, + "loss": 0.5356, + "step": 63914 + }, + { + "epoch": 1.64, + "learning_rate": 8.995874084609596e-07, + "loss": 0.5581, + "step": 63915 + }, + { + "epoch": 1.64, + "learning_rate": 8.995598778951998e-07, + "loss": 0.6875, + "step": 63916 + }, + { + "epoch": 1.64, + "learning_rate": 8.995323474063423e-07, + "loss": 0.5723, + "step": 63917 + }, + { + "epoch": 1.64, + "learning_rate": 8.995048169944082e-07, + "loss": 0.4263, + "step": 63918 + }, + { + "epoch": 1.64, + "learning_rate": 8.994772866594189e-07, + "loss": 0.6509, + "step": 63919 + }, + { + "epoch": 1.64, + "learning_rate": 8.994497564013952e-07, + "loss": 0.6313, + "step": 63920 + }, + { + "epoch": 1.64, + "learning_rate": 8.994222262203579e-07, + "loss": 0.4771, + "step": 63921 + }, + { + "epoch": 1.64, + "learning_rate": 8.993946961163287e-07, + "loss": 0.647, + "step": 63922 + }, + { + "epoch": 1.64, + "learning_rate": 8.993671660893285e-07, + "loss": 0.6069, + "step": 63923 + }, + { + "epoch": 1.64, + "learning_rate": 8.993396361393778e-07, + "loss": 0.7505, + "step": 63924 + }, + { + "epoch": 1.64, + "learning_rate": 8.993121062664984e-07, + "loss": 0.5249, + "step": 63925 + }, + { + "epoch": 1.64, + "learning_rate": 8.992845764707108e-07, + "loss": 0.6436, + "step": 63926 + }, + { + "epoch": 1.64, + "learning_rate": 8.992570467520366e-07, + "loss": 0.5654, + "step": 63927 + }, + { + "epoch": 1.64, + "learning_rate": 8.992295171104963e-07, + "loss": 0.5493, + "step": 63928 + }, + { + "epoch": 1.64, + "learning_rate": 8.992019875461118e-07, + "loss": 0.5474, + "step": 63929 + }, + { + "epoch": 1.64, + "learning_rate": 8.991744580589033e-07, + "loss": 0.5715, + "step": 63930 + }, + { + "epoch": 1.64, + "learning_rate": 8.991469286488926e-07, + "loss": 0.6504, + "step": 63931 + }, + { + "epoch": 1.64, + "learning_rate": 8.991193993161002e-07, + "loss": 0.7217, + "step": 63932 + }, + { + "epoch": 1.64, + "learning_rate": 8.990918700605479e-07, + "loss": 0.8125, + "step": 63933 + }, + { + "epoch": 1.64, + "learning_rate": 8.99064340882256e-07, + "loss": 0.6333, + "step": 63934 + }, + { + "epoch": 1.64, + "learning_rate": 8.990368117812458e-07, + "loss": 0.6226, + "step": 63935 + }, + { + "epoch": 1.64, + "learning_rate": 8.990092827575386e-07, + "loss": 0.876, + "step": 63936 + }, + { + "epoch": 1.64, + "learning_rate": 8.989817538111554e-07, + "loss": 0.5942, + "step": 63937 + }, + { + "epoch": 1.64, + "learning_rate": 8.98954224942117e-07, + "loss": 0.7773, + "step": 63938 + }, + { + "epoch": 1.64, + "learning_rate": 8.98926696150445e-07, + "loss": 0.4991, + "step": 63939 + }, + { + "epoch": 1.64, + "learning_rate": 8.988991674361597e-07, + "loss": 0.5283, + "step": 63940 + }, + { + "epoch": 1.64, + "learning_rate": 8.988716387992832e-07, + "loss": 0.6343, + "step": 63941 + }, + { + "epoch": 1.64, + "learning_rate": 8.988441102398357e-07, + "loss": 0.6636, + "step": 63942 + }, + { + "epoch": 1.64, + "learning_rate": 8.988165817578389e-07, + "loss": 0.6313, + "step": 63943 + }, + { + "epoch": 1.64, + "learning_rate": 8.987890533533136e-07, + "loss": 0.5869, + "step": 63944 + }, + { + "epoch": 1.64, + "learning_rate": 8.987615250262804e-07, + "loss": 0.5586, + "step": 63945 + }, + { + "epoch": 1.64, + "learning_rate": 8.987339967767613e-07, + "loss": 0.5781, + "step": 63946 + }, + { + "epoch": 1.64, + "learning_rate": 8.987064686047766e-07, + "loss": 0.7852, + "step": 63947 + }, + { + "epoch": 1.64, + "learning_rate": 8.986789405103478e-07, + "loss": 0.416, + "step": 63948 + }, + { + "epoch": 1.64, + "learning_rate": 8.98651412493496e-07, + "loss": 0.6514, + "step": 63949 + }, + { + "epoch": 1.64, + "learning_rate": 8.986238845542421e-07, + "loss": 0.6572, + "step": 63950 + }, + { + "epoch": 1.64, + "learning_rate": 8.985963566926071e-07, + "loss": 0.5825, + "step": 63951 + }, + { + "epoch": 1.64, + "learning_rate": 8.985688289086124e-07, + "loss": 0.7168, + "step": 63952 + }, + { + "epoch": 1.64, + "learning_rate": 8.985413012022791e-07, + "loss": 0.5059, + "step": 63953 + }, + { + "epoch": 1.64, + "learning_rate": 8.985137735736278e-07, + "loss": 0.7246, + "step": 63954 + }, + { + "epoch": 1.64, + "learning_rate": 8.984862460226797e-07, + "loss": 0.5205, + "step": 63955 + }, + { + "epoch": 1.64, + "learning_rate": 8.984587185494561e-07, + "loss": 0.6182, + "step": 63956 + }, + { + "epoch": 1.64, + "learning_rate": 8.984311911539779e-07, + "loss": 0.5645, + "step": 63957 + }, + { + "epoch": 1.64, + "learning_rate": 8.984036638362664e-07, + "loss": 0.6206, + "step": 63958 + }, + { + "epoch": 1.64, + "learning_rate": 8.983761365963425e-07, + "loss": 0.5078, + "step": 63959 + }, + { + "epoch": 1.64, + "learning_rate": 8.983486094342273e-07, + "loss": 0.6982, + "step": 63960 + }, + { + "epoch": 1.64, + "learning_rate": 8.983210823499419e-07, + "loss": 0.6338, + "step": 63961 + }, + { + "epoch": 1.64, + "learning_rate": 8.982935553435074e-07, + "loss": 0.7295, + "step": 63962 + }, + { + "epoch": 1.64, + "learning_rate": 8.982660284149452e-07, + "loss": 0.8184, + "step": 63963 + }, + { + "epoch": 1.64, + "learning_rate": 8.982385015642755e-07, + "loss": 0.5718, + "step": 63964 + }, + { + "epoch": 1.64, + "learning_rate": 8.982109747915202e-07, + "loss": 0.5825, + "step": 63965 + }, + { + "epoch": 1.64, + "learning_rate": 8.981834480966997e-07, + "loss": 0.7061, + "step": 63966 + }, + { + "epoch": 1.64, + "learning_rate": 8.981559214798359e-07, + "loss": 0.6318, + "step": 63967 + }, + { + "epoch": 1.64, + "learning_rate": 8.98128394940949e-07, + "loss": 0.533, + "step": 63968 + }, + { + "epoch": 1.64, + "learning_rate": 8.981008684800608e-07, + "loss": 0.6655, + "step": 63969 + }, + { + "epoch": 1.64, + "learning_rate": 8.980733420971918e-07, + "loss": 0.5571, + "step": 63970 + }, + { + "epoch": 1.64, + "learning_rate": 8.980458157923638e-07, + "loss": 0.7246, + "step": 63971 + }, + { + "epoch": 1.64, + "learning_rate": 8.98018289565597e-07, + "loss": 0.7178, + "step": 63972 + }, + { + "epoch": 1.64, + "learning_rate": 8.979907634169137e-07, + "loss": 0.6777, + "step": 63973 + }, + { + "epoch": 1.64, + "learning_rate": 8.979632373463334e-07, + "loss": 0.6934, + "step": 63974 + }, + { + "epoch": 1.64, + "learning_rate": 8.979357113538783e-07, + "loss": 0.4824, + "step": 63975 + }, + { + "epoch": 1.64, + "learning_rate": 8.979081854395687e-07, + "loss": 0.6562, + "step": 63976 + }, + { + "epoch": 1.64, + "learning_rate": 8.978806596034265e-07, + "loss": 0.5078, + "step": 63977 + }, + { + "epoch": 1.64, + "learning_rate": 8.978531338454721e-07, + "loss": 0.5422, + "step": 63978 + }, + { + "epoch": 1.64, + "learning_rate": 8.978256081657271e-07, + "loss": 0.5895, + "step": 63979 + }, + { + "epoch": 1.64, + "learning_rate": 8.977980825642122e-07, + "loss": 0.7598, + "step": 63980 + }, + { + "epoch": 1.64, + "learning_rate": 8.977705570409487e-07, + "loss": 0.6758, + "step": 63981 + }, + { + "epoch": 1.64, + "learning_rate": 8.977430315959575e-07, + "loss": 0.3647, + "step": 63982 + }, + { + "epoch": 1.64, + "learning_rate": 8.977155062292601e-07, + "loss": 0.6128, + "step": 63983 + }, + { + "epoch": 1.64, + "learning_rate": 8.976879809408769e-07, + "loss": 0.6387, + "step": 63984 + }, + { + "epoch": 1.64, + "learning_rate": 8.976604557308293e-07, + "loss": 0.6353, + "step": 63985 + }, + { + "epoch": 1.64, + "learning_rate": 8.976329305991385e-07, + "loss": 0.6592, + "step": 63986 + }, + { + "epoch": 1.64, + "learning_rate": 8.976054055458253e-07, + "loss": 0.8291, + "step": 63987 + }, + { + "epoch": 1.64, + "learning_rate": 8.975778805709111e-07, + "loss": 0.5171, + "step": 63988 + }, + { + "epoch": 1.64, + "learning_rate": 8.975503556744166e-07, + "loss": 0.4854, + "step": 63989 + }, + { + "epoch": 1.64, + "learning_rate": 8.975228308563632e-07, + "loss": 0.6802, + "step": 63990 + }, + { + "epoch": 1.64, + "learning_rate": 8.974953061167721e-07, + "loss": 0.6953, + "step": 63991 + }, + { + "epoch": 1.64, + "learning_rate": 8.974677814556637e-07, + "loss": 0.6167, + "step": 63992 + }, + { + "epoch": 1.64, + "learning_rate": 8.9744025687306e-07, + "loss": 0.792, + "step": 63993 + }, + { + "epoch": 1.64, + "learning_rate": 8.974127323689814e-07, + "loss": 0.5854, + "step": 63994 + }, + { + "epoch": 1.64, + "learning_rate": 8.973852079434489e-07, + "loss": 0.5908, + "step": 63995 + }, + { + "epoch": 1.64, + "learning_rate": 8.97357683596484e-07, + "loss": 0.7305, + "step": 63996 + }, + { + "epoch": 1.64, + "learning_rate": 8.973301593281075e-07, + "loss": 0.6284, + "step": 63997 + }, + { + "epoch": 1.64, + "learning_rate": 8.973026351383407e-07, + "loss": 0.6572, + "step": 63998 + }, + { + "epoch": 1.64, + "learning_rate": 8.972751110272044e-07, + "loss": 0.6748, + "step": 63999 + }, + { + "epoch": 1.64, + "learning_rate": 8.972475869947199e-07, + "loss": 0.6167, + "step": 64000 + }, + { + "epoch": 1.64, + "learning_rate": 8.972200630409081e-07, + "loss": 0.3369, + "step": 64001 + }, + { + "epoch": 1.64, + "learning_rate": 8.971925391657904e-07, + "loss": 0.6929, + "step": 64002 + }, + { + "epoch": 1.64, + "learning_rate": 8.971650153693878e-07, + "loss": 0.647, + "step": 64003 + }, + { + "epoch": 1.64, + "learning_rate": 8.971374916517209e-07, + "loss": 0.5615, + "step": 64004 + }, + { + "epoch": 1.64, + "learning_rate": 8.971099680128113e-07, + "loss": 0.5139, + "step": 64005 + }, + { + "epoch": 1.64, + "learning_rate": 8.970824444526794e-07, + "loss": 0.6807, + "step": 64006 + }, + { + "epoch": 1.64, + "learning_rate": 8.970549209713471e-07, + "loss": 0.6763, + "step": 64007 + }, + { + "epoch": 1.64, + "learning_rate": 8.97027397568835e-07, + "loss": 0.7441, + "step": 64008 + }, + { + "epoch": 1.64, + "learning_rate": 8.969998742451645e-07, + "loss": 0.6377, + "step": 64009 + }, + { + "epoch": 1.64, + "learning_rate": 8.969723510003564e-07, + "loss": 0.626, + "step": 64010 + }, + { + "epoch": 1.64, + "learning_rate": 8.969448278344316e-07, + "loss": 0.5349, + "step": 64011 + }, + { + "epoch": 1.64, + "learning_rate": 8.969173047474116e-07, + "loss": 0.6553, + "step": 64012 + }, + { + "epoch": 1.64, + "learning_rate": 8.968897817393176e-07, + "loss": 0.5186, + "step": 64013 + }, + { + "epoch": 1.64, + "learning_rate": 8.968622588101699e-07, + "loss": 0.7119, + "step": 64014 + }, + { + "epoch": 1.64, + "learning_rate": 8.968347359599901e-07, + "loss": 0.6562, + "step": 64015 + }, + { + "epoch": 1.64, + "learning_rate": 8.968072131887991e-07, + "loss": 0.7881, + "step": 64016 + }, + { + "epoch": 1.64, + "learning_rate": 8.967796904966183e-07, + "loss": 0.6475, + "step": 64017 + }, + { + "epoch": 1.64, + "learning_rate": 8.967521678834683e-07, + "loss": 0.6299, + "step": 64018 + }, + { + "epoch": 1.64, + "learning_rate": 8.967246453493707e-07, + "loss": 0.6152, + "step": 64019 + }, + { + "epoch": 1.64, + "learning_rate": 8.966971228943458e-07, + "loss": 0.7607, + "step": 64020 + }, + { + "epoch": 1.64, + "learning_rate": 8.966696005184157e-07, + "loss": 0.4971, + "step": 64021 + }, + { + "epoch": 1.64, + "learning_rate": 8.966420782216006e-07, + "loss": 0.4658, + "step": 64022 + }, + { + "epoch": 1.64, + "learning_rate": 8.966145560039223e-07, + "loss": 0.624, + "step": 64023 + }, + { + "epoch": 1.64, + "learning_rate": 8.965870338654014e-07, + "loss": 0.4866, + "step": 64024 + }, + { + "epoch": 1.64, + "learning_rate": 8.965595118060587e-07, + "loss": 0.8252, + "step": 64025 + }, + { + "epoch": 1.64, + "learning_rate": 8.965319898259158e-07, + "loss": 0.7305, + "step": 64026 + }, + { + "epoch": 1.64, + "learning_rate": 8.965044679249938e-07, + "loss": 0.667, + "step": 64027 + }, + { + "epoch": 1.64, + "learning_rate": 8.964769461033133e-07, + "loss": 0.6377, + "step": 64028 + }, + { + "epoch": 1.64, + "learning_rate": 8.964494243608957e-07, + "loss": 0.6602, + "step": 64029 + }, + { + "epoch": 1.64, + "learning_rate": 8.964219026977619e-07, + "loss": 0.5317, + "step": 64030 + }, + { + "epoch": 1.64, + "learning_rate": 8.963943811139333e-07, + "loss": 0.8564, + "step": 64031 + }, + { + "epoch": 1.64, + "learning_rate": 8.963668596094305e-07, + "loss": 0.5049, + "step": 64032 + }, + { + "epoch": 1.64, + "learning_rate": 8.963393381842753e-07, + "loss": 0.6021, + "step": 64033 + }, + { + "epoch": 1.64, + "learning_rate": 8.963118168384881e-07, + "loss": 0.5139, + "step": 64034 + }, + { + "epoch": 1.64, + "learning_rate": 8.9628429557209e-07, + "loss": 0.561, + "step": 64035 + }, + { + "epoch": 1.64, + "learning_rate": 8.962567743851024e-07, + "loss": 0.6816, + "step": 64036 + }, + { + "epoch": 1.64, + "learning_rate": 8.962292532775459e-07, + "loss": 0.708, + "step": 64037 + }, + { + "epoch": 1.64, + "learning_rate": 8.962017322494423e-07, + "loss": 0.7695, + "step": 64038 + }, + { + "epoch": 1.64, + "learning_rate": 8.961742113008119e-07, + "loss": 0.6396, + "step": 64039 + }, + { + "epoch": 1.64, + "learning_rate": 8.961466904316764e-07, + "loss": 0.5635, + "step": 64040 + }, + { + "epoch": 1.64, + "learning_rate": 8.961191696420564e-07, + "loss": 0.6279, + "step": 64041 + }, + { + "epoch": 1.64, + "learning_rate": 8.960916489319734e-07, + "loss": 0.6844, + "step": 64042 + }, + { + "epoch": 1.64, + "learning_rate": 8.960641283014485e-07, + "loss": 0.7622, + "step": 64043 + }, + { + "epoch": 1.64, + "learning_rate": 8.960366077505023e-07, + "loss": 0.5918, + "step": 64044 + }, + { + "epoch": 1.64, + "learning_rate": 8.960090872791558e-07, + "loss": 0.6865, + "step": 64045 + }, + { + "epoch": 1.64, + "learning_rate": 8.959815668874305e-07, + "loss": 0.4868, + "step": 64046 + }, + { + "epoch": 1.64, + "learning_rate": 8.959540465753474e-07, + "loss": 0.6025, + "step": 64047 + }, + { + "epoch": 1.64, + "learning_rate": 8.959265263429274e-07, + "loss": 0.5195, + "step": 64048 + }, + { + "epoch": 1.64, + "learning_rate": 8.958990061901917e-07, + "loss": 0.5862, + "step": 64049 + }, + { + "epoch": 1.64, + "learning_rate": 8.958714861171614e-07, + "loss": 0.7705, + "step": 64050 + }, + { + "epoch": 1.64, + "learning_rate": 8.958439661238573e-07, + "loss": 0.6484, + "step": 64051 + }, + { + "epoch": 1.64, + "learning_rate": 8.958164462103009e-07, + "loss": 0.666, + "step": 64052 + }, + { + "epoch": 1.64, + "learning_rate": 8.957889263765134e-07, + "loss": 0.7217, + "step": 64053 + }, + { + "epoch": 1.64, + "learning_rate": 8.957614066225149e-07, + "loss": 0.6484, + "step": 64054 + }, + { + "epoch": 1.64, + "learning_rate": 8.957338869483276e-07, + "loss": 0.6514, + "step": 64055 + }, + { + "epoch": 1.64, + "learning_rate": 8.957063673539716e-07, + "loss": 0.7354, + "step": 64056 + }, + { + "epoch": 1.64, + "learning_rate": 8.956788478394688e-07, + "loss": 0.6914, + "step": 64057 + }, + { + "epoch": 1.64, + "learning_rate": 8.956513284048396e-07, + "loss": 0.583, + "step": 64058 + }, + { + "epoch": 1.64, + "learning_rate": 8.956238090501057e-07, + "loss": 0.7979, + "step": 64059 + }, + { + "epoch": 1.64, + "learning_rate": 8.955962897752876e-07, + "loss": 0.6321, + "step": 64060 + }, + { + "epoch": 1.64, + "learning_rate": 8.955687705804067e-07, + "loss": 0.6553, + "step": 64061 + }, + { + "epoch": 1.64, + "learning_rate": 8.955412514654839e-07, + "loss": 0.6294, + "step": 64062 + }, + { + "epoch": 1.64, + "learning_rate": 8.955137324305409e-07, + "loss": 0.6377, + "step": 64063 + }, + { + "epoch": 1.64, + "learning_rate": 8.954862134755978e-07, + "loss": 0.6841, + "step": 64064 + }, + { + "epoch": 1.64, + "learning_rate": 8.954586946006761e-07, + "loss": 0.7783, + "step": 64065 + }, + { + "epoch": 1.64, + "learning_rate": 8.954311758057969e-07, + "loss": 0.7637, + "step": 64066 + }, + { + "epoch": 1.64, + "learning_rate": 8.954036570909813e-07, + "loss": 0.4819, + "step": 64067 + }, + { + "epoch": 1.64, + "learning_rate": 8.953761384562499e-07, + "loss": 0.604, + "step": 64068 + }, + { + "epoch": 1.64, + "learning_rate": 8.953486199016246e-07, + "loss": 0.8096, + "step": 64069 + }, + { + "epoch": 1.64, + "learning_rate": 8.953211014271259e-07, + "loss": 0.5562, + "step": 64070 + }, + { + "epoch": 1.64, + "learning_rate": 8.952935830327751e-07, + "loss": 0.5811, + "step": 64071 + }, + { + "epoch": 1.64, + "learning_rate": 8.95266064718593e-07, + "loss": 0.6108, + "step": 64072 + }, + { + "epoch": 1.64, + "learning_rate": 8.952385464846014e-07, + "loss": 0.5188, + "step": 64073 + }, + { + "epoch": 1.64, + "learning_rate": 8.952110283308205e-07, + "loss": 0.7266, + "step": 64074 + }, + { + "epoch": 1.64, + "learning_rate": 8.951835102572716e-07, + "loss": 0.7285, + "step": 64075 + }, + { + "epoch": 1.64, + "learning_rate": 8.95155992263976e-07, + "loss": 0.566, + "step": 64076 + }, + { + "epoch": 1.64, + "learning_rate": 8.951284743509544e-07, + "loss": 0.5835, + "step": 64077 + }, + { + "epoch": 1.64, + "learning_rate": 8.951009565182283e-07, + "loss": 0.875, + "step": 64078 + }, + { + "epoch": 1.64, + "learning_rate": 8.950734387658183e-07, + "loss": 0.6562, + "step": 64079 + }, + { + "epoch": 1.64, + "learning_rate": 8.950459210937462e-07, + "loss": 0.4822, + "step": 64080 + }, + { + "epoch": 1.64, + "learning_rate": 8.950184035020321e-07, + "loss": 0.6792, + "step": 64081 + }, + { + "epoch": 1.64, + "learning_rate": 8.949908859906981e-07, + "loss": 0.7402, + "step": 64082 + }, + { + "epoch": 1.64, + "learning_rate": 8.949633685597647e-07, + "loss": 0.3672, + "step": 64083 + }, + { + "epoch": 1.64, + "learning_rate": 8.94935851209253e-07, + "loss": 0.6992, + "step": 64084 + }, + { + "epoch": 1.64, + "learning_rate": 8.949083339391837e-07, + "loss": 0.6172, + "step": 64085 + }, + { + "epoch": 1.64, + "learning_rate": 8.948808167495786e-07, + "loss": 0.5605, + "step": 64086 + }, + { + "epoch": 1.64, + "learning_rate": 8.948532996404582e-07, + "loss": 0.6904, + "step": 64087 + }, + { + "epoch": 1.64, + "learning_rate": 8.948257826118439e-07, + "loss": 0.7588, + "step": 64088 + }, + { + "epoch": 1.64, + "learning_rate": 8.947982656637566e-07, + "loss": 0.6611, + "step": 64089 + }, + { + "epoch": 1.64, + "learning_rate": 8.947707487962175e-07, + "loss": 0.6895, + "step": 64090 + }, + { + "epoch": 1.64, + "learning_rate": 8.947432320092475e-07, + "loss": 0.5669, + "step": 64091 + }, + { + "epoch": 1.64, + "learning_rate": 8.94715715302868e-07, + "loss": 0.6787, + "step": 64092 + }, + { + "epoch": 1.64, + "learning_rate": 8.946881986771e-07, + "loss": 0.6885, + "step": 64093 + }, + { + "epoch": 1.64, + "learning_rate": 8.946606821319639e-07, + "loss": 0.5078, + "step": 64094 + }, + { + "epoch": 1.64, + "learning_rate": 8.946331656674816e-07, + "loss": 0.4719, + "step": 64095 + }, + { + "epoch": 1.64, + "learning_rate": 8.946056492836736e-07, + "loss": 0.4592, + "step": 64096 + }, + { + "epoch": 1.64, + "learning_rate": 8.945781329805613e-07, + "loss": 0.6174, + "step": 64097 + }, + { + "epoch": 1.64, + "learning_rate": 8.945506167581655e-07, + "loss": 0.6177, + "step": 64098 + }, + { + "epoch": 1.64, + "learning_rate": 8.945231006165079e-07, + "loss": 0.7754, + "step": 64099 + }, + { + "epoch": 1.64, + "learning_rate": 8.944955845556088e-07, + "loss": 0.6758, + "step": 64100 + }, + { + "epoch": 1.64, + "learning_rate": 8.944680685754895e-07, + "loss": 0.3979, + "step": 64101 + }, + { + "epoch": 1.64, + "learning_rate": 8.944405526761714e-07, + "loss": 0.5977, + "step": 64102 + }, + { + "epoch": 1.64, + "learning_rate": 8.944130368576754e-07, + "loss": 0.6465, + "step": 64103 + }, + { + "epoch": 1.64, + "learning_rate": 8.943855211200222e-07, + "loss": 0.5957, + "step": 64104 + }, + { + "epoch": 1.64, + "learning_rate": 8.943580054632334e-07, + "loss": 0.5347, + "step": 64105 + }, + { + "epoch": 1.64, + "learning_rate": 8.943304898873294e-07, + "loss": 0.3381, + "step": 64106 + }, + { + "epoch": 1.64, + "learning_rate": 8.94302974392332e-07, + "loss": 0.4387, + "step": 64107 + }, + { + "epoch": 1.64, + "learning_rate": 8.942754589782617e-07, + "loss": 0.6094, + "step": 64108 + }, + { + "epoch": 1.64, + "learning_rate": 8.942479436451401e-07, + "loss": 0.667, + "step": 64109 + }, + { + "epoch": 1.64, + "learning_rate": 8.942204283929879e-07, + "loss": 0.3755, + "step": 64110 + }, + { + "epoch": 1.64, + "learning_rate": 8.941929132218262e-07, + "loss": 0.6562, + "step": 64111 + }, + { + "epoch": 1.64, + "learning_rate": 8.94165398131676e-07, + "loss": 0.625, + "step": 64112 + }, + { + "epoch": 1.64, + "learning_rate": 8.94137883122559e-07, + "loss": 0.4338, + "step": 64113 + }, + { + "epoch": 1.64, + "learning_rate": 8.941103681944955e-07, + "loss": 0.4849, + "step": 64114 + }, + { + "epoch": 1.64, + "learning_rate": 8.940828533475066e-07, + "loss": 0.6377, + "step": 64115 + }, + { + "epoch": 1.64, + "learning_rate": 8.940553385816137e-07, + "loss": 0.6841, + "step": 64116 + }, + { + "epoch": 1.64, + "learning_rate": 8.940278238968379e-07, + "loss": 0.6523, + "step": 64117 + }, + { + "epoch": 1.64, + "learning_rate": 8.940003092931999e-07, + "loss": 0.6245, + "step": 64118 + }, + { + "epoch": 1.64, + "learning_rate": 8.939727947707212e-07, + "loss": 0.6763, + "step": 64119 + }, + { + "epoch": 1.64, + "learning_rate": 8.939452803294224e-07, + "loss": 0.6467, + "step": 64120 + }, + { + "epoch": 1.64, + "learning_rate": 8.93917765969325e-07, + "loss": 0.4954, + "step": 64121 + }, + { + "epoch": 1.64, + "learning_rate": 8.938902516904497e-07, + "loss": 0.5308, + "step": 64122 + }, + { + "epoch": 1.64, + "learning_rate": 8.938627374928182e-07, + "loss": 0.6987, + "step": 64123 + }, + { + "epoch": 1.64, + "learning_rate": 8.938352233764509e-07, + "loss": 0.5625, + "step": 64124 + }, + { + "epoch": 1.64, + "learning_rate": 8.938077093413689e-07, + "loss": 0.7109, + "step": 64125 + }, + { + "epoch": 1.64, + "learning_rate": 8.937801953875937e-07, + "loss": 0.4004, + "step": 64126 + }, + { + "epoch": 1.64, + "learning_rate": 8.937526815151459e-07, + "loss": 0.4854, + "step": 64127 + }, + { + "epoch": 1.64, + "learning_rate": 8.937251677240469e-07, + "loss": 0.7344, + "step": 64128 + }, + { + "epoch": 1.64, + "learning_rate": 8.936976540143175e-07, + "loss": 0.624, + "step": 64129 + }, + { + "epoch": 1.64, + "learning_rate": 8.936701403859791e-07, + "loss": 0.5906, + "step": 64130 + }, + { + "epoch": 1.64, + "learning_rate": 8.936426268390524e-07, + "loss": 0.5288, + "step": 64131 + }, + { + "epoch": 1.64, + "learning_rate": 8.936151133735591e-07, + "loss": 0.552, + "step": 64132 + }, + { + "epoch": 1.64, + "learning_rate": 8.935875999895195e-07, + "loss": 0.4695, + "step": 64133 + }, + { + "epoch": 1.64, + "learning_rate": 8.935600866869551e-07, + "loss": 0.7627, + "step": 64134 + }, + { + "epoch": 1.64, + "learning_rate": 8.935325734658866e-07, + "loss": 0.4861, + "step": 64135 + }, + { + "epoch": 1.64, + "learning_rate": 8.935050603263356e-07, + "loss": 0.5415, + "step": 64136 + }, + { + "epoch": 1.64, + "learning_rate": 8.934775472683224e-07, + "loss": 0.5728, + "step": 64137 + }, + { + "epoch": 1.64, + "learning_rate": 8.93450034291869e-07, + "loss": 0.4638, + "step": 64138 + }, + { + "epoch": 1.64, + "learning_rate": 8.934225213969958e-07, + "loss": 0.792, + "step": 64139 + }, + { + "epoch": 1.64, + "learning_rate": 8.933950085837242e-07, + "loss": 0.7021, + "step": 64140 + }, + { + "epoch": 1.64, + "learning_rate": 8.933674958520749e-07, + "loss": 0.4536, + "step": 64141 + }, + { + "epoch": 1.64, + "learning_rate": 8.933399832020697e-07, + "loss": 0.5796, + "step": 64142 + }, + { + "epoch": 1.64, + "learning_rate": 8.93312470633729e-07, + "loss": 0.6562, + "step": 64143 + }, + { + "epoch": 1.64, + "learning_rate": 8.932849581470737e-07, + "loss": 0.6323, + "step": 64144 + }, + { + "epoch": 1.64, + "learning_rate": 8.932574457421256e-07, + "loss": 0.7617, + "step": 64145 + }, + { + "epoch": 1.64, + "learning_rate": 8.932299334189049e-07, + "loss": 0.6265, + "step": 64146 + }, + { + "epoch": 1.64, + "learning_rate": 8.932024211774335e-07, + "loss": 0.6416, + "step": 64147 + }, + { + "epoch": 1.64, + "learning_rate": 8.931749090177318e-07, + "loss": 0.6011, + "step": 64148 + }, + { + "epoch": 1.64, + "learning_rate": 8.931473969398215e-07, + "loss": 0.3865, + "step": 64149 + }, + { + "epoch": 1.64, + "learning_rate": 8.93119884943723e-07, + "loss": 0.6321, + "step": 64150 + }, + { + "epoch": 1.64, + "learning_rate": 8.93092373029458e-07, + "loss": 0.6714, + "step": 64151 + }, + { + "epoch": 1.64, + "learning_rate": 8.930648611970475e-07, + "loss": 0.5581, + "step": 64152 + }, + { + "epoch": 1.64, + "learning_rate": 8.93037349446512e-07, + "loss": 0.5833, + "step": 64153 + }, + { + "epoch": 1.64, + "learning_rate": 8.930098377778727e-07, + "loss": 0.564, + "step": 64154 + }, + { + "epoch": 1.64, + "learning_rate": 8.92982326191151e-07, + "loss": 0.5591, + "step": 64155 + }, + { + "epoch": 1.64, + "learning_rate": 8.929548146863677e-07, + "loss": 0.5513, + "step": 64156 + }, + { + "epoch": 1.64, + "learning_rate": 8.92927303263544e-07, + "loss": 0.6982, + "step": 64157 + }, + { + "epoch": 1.64, + "learning_rate": 8.928997919227009e-07, + "loss": 0.752, + "step": 64158 + }, + { + "epoch": 1.64, + "learning_rate": 8.928722806638597e-07, + "loss": 0.5358, + "step": 64159 + }, + { + "epoch": 1.64, + "learning_rate": 8.92844769487041e-07, + "loss": 0.5693, + "step": 64160 + }, + { + "epoch": 1.64, + "learning_rate": 8.928172583922664e-07, + "loss": 0.6895, + "step": 64161 + }, + { + "epoch": 1.64, + "learning_rate": 8.92789747379557e-07, + "loss": 0.5068, + "step": 64162 + }, + { + "epoch": 1.64, + "learning_rate": 8.92762236448933e-07, + "loss": 0.6602, + "step": 64163 + }, + { + "epoch": 1.64, + "learning_rate": 8.927347256004162e-07, + "loss": 0.749, + "step": 64164 + }, + { + "epoch": 1.64, + "learning_rate": 8.927072148340273e-07, + "loss": 0.6113, + "step": 64165 + }, + { + "epoch": 1.64, + "learning_rate": 8.926797041497878e-07, + "loss": 0.4634, + "step": 64166 + }, + { + "epoch": 1.64, + "learning_rate": 8.926521935477183e-07, + "loss": 0.7598, + "step": 64167 + }, + { + "epoch": 1.64, + "learning_rate": 8.926246830278403e-07, + "loss": 0.604, + "step": 64168 + }, + { + "epoch": 1.64, + "learning_rate": 8.925971725901745e-07, + "loss": 0.6914, + "step": 64169 + }, + { + "epoch": 1.64, + "learning_rate": 8.925696622347423e-07, + "loss": 0.4893, + "step": 64170 + }, + { + "epoch": 1.64, + "learning_rate": 8.925421519615642e-07, + "loss": 0.6309, + "step": 64171 + }, + { + "epoch": 1.64, + "learning_rate": 8.925146417706625e-07, + "loss": 0.5732, + "step": 64172 + }, + { + "epoch": 1.64, + "learning_rate": 8.924871316620566e-07, + "loss": 0.5649, + "step": 64173 + }, + { + "epoch": 1.64, + "learning_rate": 8.924596216357686e-07, + "loss": 0.6758, + "step": 64174 + }, + { + "epoch": 1.64, + "learning_rate": 8.924321116918191e-07, + "loss": 0.6416, + "step": 64175 + }, + { + "epoch": 1.64, + "learning_rate": 8.924046018302297e-07, + "loss": 0.5967, + "step": 64176 + }, + { + "epoch": 1.64, + "learning_rate": 8.923770920510209e-07, + "loss": 0.7236, + "step": 64177 + }, + { + "epoch": 1.64, + "learning_rate": 8.923495823542141e-07, + "loss": 0.5542, + "step": 64178 + }, + { + "epoch": 1.64, + "learning_rate": 8.923220727398302e-07, + "loss": 0.4839, + "step": 64179 + }, + { + "epoch": 1.64, + "learning_rate": 8.922945632078905e-07, + "loss": 0.5649, + "step": 64180 + }, + { + "epoch": 1.64, + "learning_rate": 8.922670537584156e-07, + "loss": 0.7295, + "step": 64181 + }, + { + "epoch": 1.65, + "learning_rate": 8.922395443914274e-07, + "loss": 0.6328, + "step": 64182 + }, + { + "epoch": 1.65, + "learning_rate": 8.922120351069462e-07, + "loss": 0.4889, + "step": 64183 + }, + { + "epoch": 1.65, + "learning_rate": 8.921845259049931e-07, + "loss": 0.4729, + "step": 64184 + }, + { + "epoch": 1.65, + "learning_rate": 8.921570167855894e-07, + "loss": 0.7119, + "step": 64185 + }, + { + "epoch": 1.65, + "learning_rate": 8.92129507748756e-07, + "loss": 0.7549, + "step": 64186 + }, + { + "epoch": 1.65, + "learning_rate": 8.921019987945144e-07, + "loss": 0.6333, + "step": 64187 + }, + { + "epoch": 1.65, + "learning_rate": 8.920744899228851e-07, + "loss": 0.7715, + "step": 64188 + }, + { + "epoch": 1.65, + "learning_rate": 8.920469811338894e-07, + "loss": 0.4742, + "step": 64189 + }, + { + "epoch": 1.65, + "learning_rate": 8.920194724275486e-07, + "loss": 0.6445, + "step": 64190 + }, + { + "epoch": 1.65, + "learning_rate": 8.919919638038832e-07, + "loss": 0.6528, + "step": 64191 + }, + { + "epoch": 1.65, + "learning_rate": 8.919644552629151e-07, + "loss": 0.5908, + "step": 64192 + }, + { + "epoch": 1.65, + "learning_rate": 8.919369468046644e-07, + "loss": 0.7314, + "step": 64193 + }, + { + "epoch": 1.65, + "learning_rate": 8.919094384291527e-07, + "loss": 0.6196, + "step": 64194 + }, + { + "epoch": 1.65, + "learning_rate": 8.918819301364011e-07, + "loss": 0.6582, + "step": 64195 + }, + { + "epoch": 1.65, + "learning_rate": 8.918544219264302e-07, + "loss": 0.7529, + "step": 64196 + }, + { + "epoch": 1.65, + "learning_rate": 8.918269137992618e-07, + "loss": 0.6548, + "step": 64197 + }, + { + "epoch": 1.65, + "learning_rate": 8.917994057549161e-07, + "loss": 0.6729, + "step": 64198 + }, + { + "epoch": 1.65, + "learning_rate": 8.91771897793415e-07, + "loss": 0.6196, + "step": 64199 + }, + { + "epoch": 1.65, + "learning_rate": 8.917443899147789e-07, + "loss": 0.4061, + "step": 64200 + }, + { + "epoch": 1.65, + "learning_rate": 8.917168821190295e-07, + "loss": 0.6445, + "step": 64201 + }, + { + "epoch": 1.65, + "learning_rate": 8.916893744061875e-07, + "loss": 0.5581, + "step": 64202 + }, + { + "epoch": 1.65, + "learning_rate": 8.916618667762737e-07, + "loss": 0.7109, + "step": 64203 + }, + { + "epoch": 1.65, + "learning_rate": 8.916343592293096e-07, + "loss": 0.8086, + "step": 64204 + }, + { + "epoch": 1.65, + "learning_rate": 8.916068517653159e-07, + "loss": 0.7803, + "step": 64205 + }, + { + "epoch": 1.65, + "learning_rate": 8.91579344384314e-07, + "loss": 0.751, + "step": 64206 + }, + { + "epoch": 1.65, + "learning_rate": 8.915518370863249e-07, + "loss": 0.5835, + "step": 64207 + }, + { + "epoch": 1.65, + "learning_rate": 8.915243298713693e-07, + "loss": 0.6299, + "step": 64208 + }, + { + "epoch": 1.65, + "learning_rate": 8.914968227394687e-07, + "loss": 0.5532, + "step": 64209 + }, + { + "epoch": 1.65, + "learning_rate": 8.914693156906438e-07, + "loss": 0.6816, + "step": 64210 + }, + { + "epoch": 1.65, + "learning_rate": 8.91441808724916e-07, + "loss": 0.7549, + "step": 64211 + }, + { + "epoch": 1.65, + "learning_rate": 8.914143018423066e-07, + "loss": 0.5947, + "step": 64212 + }, + { + "epoch": 1.65, + "learning_rate": 8.913867950428357e-07, + "loss": 0.6523, + "step": 64213 + }, + { + "epoch": 1.65, + "learning_rate": 8.913592883265253e-07, + "loss": 0.6357, + "step": 64214 + }, + { + "epoch": 1.65, + "learning_rate": 8.913317816933958e-07, + "loss": 0.6646, + "step": 64215 + }, + { + "epoch": 1.65, + "learning_rate": 8.913042751434687e-07, + "loss": 0.5974, + "step": 64216 + }, + { + "epoch": 1.65, + "learning_rate": 8.912767686767649e-07, + "loss": 0.7281, + "step": 64217 + }, + { + "epoch": 1.65, + "learning_rate": 8.912492622933055e-07, + "loss": 0.6797, + "step": 64218 + }, + { + "epoch": 1.65, + "learning_rate": 8.912217559931115e-07, + "loss": 0.6055, + "step": 64219 + }, + { + "epoch": 1.65, + "learning_rate": 8.911942497762041e-07, + "loss": 0.7021, + "step": 64220 + }, + { + "epoch": 1.65, + "learning_rate": 8.91166743642604e-07, + "loss": 0.6138, + "step": 64221 + }, + { + "epoch": 1.65, + "learning_rate": 8.91139237592333e-07, + "loss": 0.6184, + "step": 64222 + }, + { + "epoch": 1.65, + "learning_rate": 8.911117316254115e-07, + "loss": 0.4824, + "step": 64223 + }, + { + "epoch": 1.65, + "learning_rate": 8.910842257418607e-07, + "loss": 0.6831, + "step": 64224 + }, + { + "epoch": 1.65, + "learning_rate": 8.910567199417015e-07, + "loss": 0.5986, + "step": 64225 + }, + { + "epoch": 1.65, + "learning_rate": 8.910292142249553e-07, + "loss": 0.7095, + "step": 64226 + }, + { + "epoch": 1.65, + "learning_rate": 8.91001708591643e-07, + "loss": 0.559, + "step": 64227 + }, + { + "epoch": 1.65, + "learning_rate": 8.909742030417858e-07, + "loss": 0.627, + "step": 64228 + }, + { + "epoch": 1.65, + "learning_rate": 8.909466975754043e-07, + "loss": 0.5103, + "step": 64229 + }, + { + "epoch": 1.65, + "learning_rate": 8.909191921925202e-07, + "loss": 0.6436, + "step": 64230 + }, + { + "epoch": 1.65, + "learning_rate": 8.90891686893154e-07, + "loss": 0.7031, + "step": 64231 + }, + { + "epoch": 1.65, + "learning_rate": 8.908641816773276e-07, + "loss": 0.751, + "step": 64232 + }, + { + "epoch": 1.65, + "learning_rate": 8.908366765450611e-07, + "loss": 0.6929, + "step": 64233 + }, + { + "epoch": 1.65, + "learning_rate": 8.908091714963758e-07, + "loss": 0.6738, + "step": 64234 + }, + { + "epoch": 1.65, + "learning_rate": 8.907816665312932e-07, + "loss": 0.445, + "step": 64235 + }, + { + "epoch": 1.65, + "learning_rate": 8.907541616498337e-07, + "loss": 0.6289, + "step": 64236 + }, + { + "epoch": 1.65, + "learning_rate": 8.907266568520189e-07, + "loss": 0.427, + "step": 64237 + }, + { + "epoch": 1.65, + "learning_rate": 8.906991521378696e-07, + "loss": 0.5642, + "step": 64238 + }, + { + "epoch": 1.65, + "learning_rate": 8.906716475074071e-07, + "loss": 0.5898, + "step": 64239 + }, + { + "epoch": 1.65, + "learning_rate": 8.906441429606521e-07, + "loss": 0.7402, + "step": 64240 + }, + { + "epoch": 1.65, + "learning_rate": 8.906166384976259e-07, + "loss": 0.5366, + "step": 64241 + }, + { + "epoch": 1.65, + "learning_rate": 8.9058913411835e-07, + "loss": 0.7432, + "step": 64242 + }, + { + "epoch": 1.65, + "learning_rate": 8.905616298228445e-07, + "loss": 0.9053, + "step": 64243 + }, + { + "epoch": 1.65, + "learning_rate": 8.905341256111309e-07, + "loss": 0.6709, + "step": 64244 + }, + { + "epoch": 1.65, + "learning_rate": 8.905066214832303e-07, + "loss": 0.6077, + "step": 64245 + }, + { + "epoch": 1.65, + "learning_rate": 8.904791174391638e-07, + "loss": 0.6211, + "step": 64246 + }, + { + "epoch": 1.65, + "learning_rate": 8.904516134789524e-07, + "loss": 0.4768, + "step": 64247 + }, + { + "epoch": 1.65, + "learning_rate": 8.904241096026169e-07, + "loss": 0.4883, + "step": 64248 + }, + { + "epoch": 1.65, + "learning_rate": 8.903966058101789e-07, + "loss": 0.6611, + "step": 64249 + }, + { + "epoch": 1.65, + "learning_rate": 8.90369102101659e-07, + "loss": 0.6445, + "step": 64250 + }, + { + "epoch": 1.65, + "learning_rate": 8.903415984770788e-07, + "loss": 0.6726, + "step": 64251 + }, + { + "epoch": 1.65, + "learning_rate": 8.90314094936459e-07, + "loss": 0.7441, + "step": 64252 + }, + { + "epoch": 1.65, + "learning_rate": 8.902865914798204e-07, + "loss": 0.7324, + "step": 64253 + }, + { + "epoch": 1.65, + "learning_rate": 8.902590881071844e-07, + "loss": 0.7041, + "step": 64254 + }, + { + "epoch": 1.65, + "learning_rate": 8.902315848185718e-07, + "loss": 0.6265, + "step": 64255 + }, + { + "epoch": 1.65, + "learning_rate": 8.90204081614004e-07, + "loss": 0.6865, + "step": 64256 + }, + { + "epoch": 1.65, + "learning_rate": 8.901765784935017e-07, + "loss": 0.6045, + "step": 64257 + }, + { + "epoch": 1.65, + "learning_rate": 8.901490754570864e-07, + "loss": 0.8145, + "step": 64258 + }, + { + "epoch": 1.65, + "learning_rate": 8.901215725047786e-07, + "loss": 0.7373, + "step": 64259 + }, + { + "epoch": 1.65, + "learning_rate": 8.900940696365999e-07, + "loss": 0.6353, + "step": 64260 + }, + { + "epoch": 1.65, + "learning_rate": 8.900665668525709e-07, + "loss": 0.5864, + "step": 64261 + }, + { + "epoch": 1.65, + "learning_rate": 8.900390641527136e-07, + "loss": 0.6846, + "step": 64262 + }, + { + "epoch": 1.65, + "learning_rate": 8.900115615370476e-07, + "loss": 0.6572, + "step": 64263 + }, + { + "epoch": 1.65, + "learning_rate": 8.899840590055949e-07, + "loss": 0.636, + "step": 64264 + }, + { + "epoch": 1.65, + "learning_rate": 8.899565565583762e-07, + "loss": 0.7578, + "step": 64265 + }, + { + "epoch": 1.65, + "learning_rate": 8.899290541954128e-07, + "loss": 0.5474, + "step": 64266 + }, + { + "epoch": 1.65, + "learning_rate": 8.899015519167257e-07, + "loss": 0.688, + "step": 64267 + }, + { + "epoch": 1.65, + "learning_rate": 8.89874049722336e-07, + "loss": 0.6155, + "step": 64268 + }, + { + "epoch": 1.65, + "learning_rate": 8.898465476122643e-07, + "loss": 0.6377, + "step": 64269 + }, + { + "epoch": 1.65, + "learning_rate": 8.898190455865324e-07, + "loss": 0.6738, + "step": 64270 + }, + { + "epoch": 1.65, + "learning_rate": 8.897915436451607e-07, + "loss": 0.7451, + "step": 64271 + }, + { + "epoch": 1.65, + "learning_rate": 8.897640417881711e-07, + "loss": 0.5156, + "step": 64272 + }, + { + "epoch": 1.65, + "learning_rate": 8.897365400155838e-07, + "loss": 0.7012, + "step": 64273 + }, + { + "epoch": 1.65, + "learning_rate": 8.897090383274199e-07, + "loss": 0.6382, + "step": 64274 + }, + { + "epoch": 1.65, + "learning_rate": 8.89681536723701e-07, + "loss": 0.4492, + "step": 64275 + }, + { + "epoch": 1.65, + "learning_rate": 8.896540352044477e-07, + "loss": 0.5923, + "step": 64276 + }, + { + "epoch": 1.65, + "learning_rate": 8.896265337696814e-07, + "loss": 0.52, + "step": 64277 + }, + { + "epoch": 1.65, + "learning_rate": 8.895990324194228e-07, + "loss": 0.7461, + "step": 64278 + }, + { + "epoch": 1.65, + "learning_rate": 8.895715311536934e-07, + "loss": 0.5879, + "step": 64279 + }, + { + "epoch": 1.65, + "learning_rate": 8.895440299725139e-07, + "loss": 0.6035, + "step": 64280 + }, + { + "epoch": 1.65, + "learning_rate": 8.895165288759053e-07, + "loss": 0.6011, + "step": 64281 + }, + { + "epoch": 1.65, + "learning_rate": 8.894890278638891e-07, + "loss": 0.5771, + "step": 64282 + }, + { + "epoch": 1.65, + "learning_rate": 8.89461526936486e-07, + "loss": 0.6948, + "step": 64283 + }, + { + "epoch": 1.65, + "learning_rate": 8.89434026093717e-07, + "loss": 0.7422, + "step": 64284 + }, + { + "epoch": 1.65, + "learning_rate": 8.894065253356033e-07, + "loss": 0.584, + "step": 64285 + }, + { + "epoch": 1.65, + "learning_rate": 8.893790246621658e-07, + "loss": 0.7578, + "step": 64286 + }, + { + "epoch": 1.65, + "learning_rate": 8.893515240734259e-07, + "loss": 0.5342, + "step": 64287 + }, + { + "epoch": 1.65, + "learning_rate": 8.893240235694042e-07, + "loss": 0.6448, + "step": 64288 + }, + { + "epoch": 1.65, + "learning_rate": 8.892965231501224e-07, + "loss": 0.606, + "step": 64289 + }, + { + "epoch": 1.65, + "learning_rate": 8.892690228156008e-07, + "loss": 0.6597, + "step": 64290 + }, + { + "epoch": 1.65, + "learning_rate": 8.89241522565861e-07, + "loss": 0.5464, + "step": 64291 + }, + { + "epoch": 1.65, + "learning_rate": 8.892140224009242e-07, + "loss": 0.7246, + "step": 64292 + }, + { + "epoch": 1.65, + "learning_rate": 8.891865223208107e-07, + "loss": 0.5444, + "step": 64293 + }, + { + "epoch": 1.65, + "learning_rate": 8.891590223255421e-07, + "loss": 0.6841, + "step": 64294 + }, + { + "epoch": 1.65, + "learning_rate": 8.891315224151392e-07, + "loss": 0.5674, + "step": 64295 + }, + { + "epoch": 1.65, + "learning_rate": 8.891040225896234e-07, + "loss": 0.4468, + "step": 64296 + }, + { + "epoch": 1.65, + "learning_rate": 8.890765228490155e-07, + "loss": 0.5742, + "step": 64297 + }, + { + "epoch": 1.65, + "learning_rate": 8.890490231933364e-07, + "loss": 0.6611, + "step": 64298 + }, + { + "epoch": 1.65, + "learning_rate": 8.890215236226077e-07, + "loss": 0.6348, + "step": 64299 + }, + { + "epoch": 1.65, + "learning_rate": 8.889940241368496e-07, + "loss": 0.6494, + "step": 64300 + }, + { + "epoch": 1.65, + "learning_rate": 8.889665247360841e-07, + "loss": 0.7012, + "step": 64301 + }, + { + "epoch": 1.65, + "learning_rate": 8.889390254203321e-07, + "loss": 0.6396, + "step": 64302 + }, + { + "epoch": 1.65, + "learning_rate": 8.889115261896139e-07, + "loss": 0.6558, + "step": 64303 + }, + { + "epoch": 1.65, + "learning_rate": 8.888840270439512e-07, + "loss": 0.5552, + "step": 64304 + }, + { + "epoch": 1.65, + "learning_rate": 8.888565279833647e-07, + "loss": 0.6558, + "step": 64305 + }, + { + "epoch": 1.65, + "learning_rate": 8.88829029007876e-07, + "loss": 0.7695, + "step": 64306 + }, + { + "epoch": 1.65, + "learning_rate": 8.888015301175054e-07, + "loss": 0.5601, + "step": 64307 + }, + { + "epoch": 1.65, + "learning_rate": 8.887740313122746e-07, + "loss": 0.5164, + "step": 64308 + }, + { + "epoch": 1.65, + "learning_rate": 8.887465325922041e-07, + "loss": 0.7559, + "step": 64309 + }, + { + "epoch": 1.65, + "learning_rate": 8.887190339573157e-07, + "loss": 0.7227, + "step": 64310 + }, + { + "epoch": 1.65, + "learning_rate": 8.886915354076297e-07, + "loss": 0.7031, + "step": 64311 + }, + { + "epoch": 1.65, + "learning_rate": 8.886640369431678e-07, + "loss": 0.6104, + "step": 64312 + }, + { + "epoch": 1.65, + "learning_rate": 8.886365385639508e-07, + "loss": 0.6353, + "step": 64313 + }, + { + "epoch": 1.65, + "learning_rate": 8.886090402699994e-07, + "loss": 0.5659, + "step": 64314 + }, + { + "epoch": 1.65, + "learning_rate": 8.885815420613348e-07, + "loss": 0.7275, + "step": 64315 + }, + { + "epoch": 1.65, + "learning_rate": 8.885540439379783e-07, + "loss": 0.7197, + "step": 64316 + }, + { + "epoch": 1.65, + "learning_rate": 8.885265458999509e-07, + "loss": 0.7129, + "step": 64317 + }, + { + "epoch": 1.65, + "learning_rate": 8.884990479472736e-07, + "loss": 0.4475, + "step": 64318 + }, + { + "epoch": 1.65, + "learning_rate": 8.884715500799673e-07, + "loss": 0.6479, + "step": 64319 + }, + { + "epoch": 1.65, + "learning_rate": 8.884440522980534e-07, + "loss": 0.5615, + "step": 64320 + }, + { + "epoch": 1.65, + "learning_rate": 8.884165546015526e-07, + "loss": 0.4993, + "step": 64321 + }, + { + "epoch": 1.65, + "learning_rate": 8.883890569904866e-07, + "loss": 0.5938, + "step": 64322 + }, + { + "epoch": 1.65, + "learning_rate": 8.883615594648756e-07, + "loss": 0.5513, + "step": 64323 + }, + { + "epoch": 1.65, + "learning_rate": 8.883340620247409e-07, + "loss": 0.583, + "step": 64324 + }, + { + "epoch": 1.65, + "learning_rate": 8.883065646701039e-07, + "loss": 0.6401, + "step": 64325 + }, + { + "epoch": 1.65, + "learning_rate": 8.882790674009851e-07, + "loss": 0.6426, + "step": 64326 + }, + { + "epoch": 1.65, + "learning_rate": 8.882515702174062e-07, + "loss": 0.6836, + "step": 64327 + }, + { + "epoch": 1.65, + "learning_rate": 8.882240731193876e-07, + "loss": 0.5796, + "step": 64328 + }, + { + "epoch": 1.65, + "learning_rate": 8.881965761069511e-07, + "loss": 0.6248, + "step": 64329 + }, + { + "epoch": 1.65, + "learning_rate": 8.88169079180117e-07, + "loss": 0.7939, + "step": 64330 + }, + { + "epoch": 1.65, + "learning_rate": 8.881415823389069e-07, + "loss": 0.5032, + "step": 64331 + }, + { + "epoch": 1.65, + "learning_rate": 8.881140855833419e-07, + "loss": 0.6592, + "step": 64332 + }, + { + "epoch": 1.65, + "learning_rate": 8.880865889134425e-07, + "loss": 0.7773, + "step": 64333 + }, + { + "epoch": 1.65, + "learning_rate": 8.880590923292299e-07, + "loss": 0.6514, + "step": 64334 + }, + { + "epoch": 1.65, + "learning_rate": 8.880315958307256e-07, + "loss": 0.5369, + "step": 64335 + }, + { + "epoch": 1.65, + "learning_rate": 8.8800409941795e-07, + "loss": 0.7148, + "step": 64336 + }, + { + "epoch": 1.65, + "learning_rate": 8.879766030909249e-07, + "loss": 0.5385, + "step": 64337 + }, + { + "epoch": 1.65, + "learning_rate": 8.879491068496707e-07, + "loss": 0.665, + "step": 64338 + }, + { + "epoch": 1.65, + "learning_rate": 8.879216106942088e-07, + "loss": 0.6699, + "step": 64339 + }, + { + "epoch": 1.65, + "learning_rate": 8.8789411462456e-07, + "loss": 0.5664, + "step": 64340 + }, + { + "epoch": 1.65, + "learning_rate": 8.878666186407458e-07, + "loss": 0.6445, + "step": 64341 + }, + { + "epoch": 1.65, + "learning_rate": 8.878391227427872e-07, + "loss": 0.4833, + "step": 64342 + }, + { + "epoch": 1.65, + "learning_rate": 8.878116269307046e-07, + "loss": 0.8066, + "step": 64343 + }, + { + "epoch": 1.65, + "learning_rate": 8.877841312045195e-07, + "loss": 0.4019, + "step": 64344 + }, + { + "epoch": 1.65, + "learning_rate": 8.877566355642529e-07, + "loss": 0.5435, + "step": 64345 + }, + { + "epoch": 1.65, + "learning_rate": 8.877291400099262e-07, + "loss": 0.6035, + "step": 64346 + }, + { + "epoch": 1.65, + "learning_rate": 8.877016445415597e-07, + "loss": 0.4995, + "step": 64347 + }, + { + "epoch": 1.65, + "learning_rate": 8.876741491591752e-07, + "loss": 0.7939, + "step": 64348 + }, + { + "epoch": 1.65, + "learning_rate": 8.876466538627932e-07, + "loss": 0.7891, + "step": 64349 + }, + { + "epoch": 1.65, + "learning_rate": 8.876191586524352e-07, + "loss": 0.6846, + "step": 64350 + }, + { + "epoch": 1.65, + "learning_rate": 8.875916635281219e-07, + "loss": 0.6072, + "step": 64351 + }, + { + "epoch": 1.65, + "learning_rate": 8.875641684898751e-07, + "loss": 0.8018, + "step": 64352 + }, + { + "epoch": 1.65, + "learning_rate": 8.875366735377145e-07, + "loss": 0.4006, + "step": 64353 + }, + { + "epoch": 1.65, + "learning_rate": 8.875091786716622e-07, + "loss": 0.7607, + "step": 64354 + }, + { + "epoch": 1.65, + "learning_rate": 8.874816838917387e-07, + "loss": 0.7578, + "step": 64355 + }, + { + "epoch": 1.65, + "learning_rate": 8.874541891979657e-07, + "loss": 0.7295, + "step": 64356 + }, + { + "epoch": 1.65, + "learning_rate": 8.874266945903635e-07, + "loss": 0.5474, + "step": 64357 + }, + { + "epoch": 1.65, + "learning_rate": 8.873992000689536e-07, + "loss": 0.6904, + "step": 64358 + }, + { + "epoch": 1.65, + "learning_rate": 8.873717056337569e-07, + "loss": 0.3857, + "step": 64359 + }, + { + "epoch": 1.65, + "learning_rate": 8.873442112847946e-07, + "loss": 0.6172, + "step": 64360 + }, + { + "epoch": 1.65, + "learning_rate": 8.873167170220876e-07, + "loss": 0.7754, + "step": 64361 + }, + { + "epoch": 1.65, + "learning_rate": 8.872892228456573e-07, + "loss": 0.6772, + "step": 64362 + }, + { + "epoch": 1.65, + "learning_rate": 8.872617287555243e-07, + "loss": 0.6411, + "step": 64363 + }, + { + "epoch": 1.65, + "learning_rate": 8.872342347517096e-07, + "loss": 0.4902, + "step": 64364 + }, + { + "epoch": 1.65, + "learning_rate": 8.872067408342346e-07, + "loss": 0.7363, + "step": 64365 + }, + { + "epoch": 1.65, + "learning_rate": 8.871792470031201e-07, + "loss": 0.6689, + "step": 64366 + }, + { + "epoch": 1.65, + "learning_rate": 8.871517532583875e-07, + "loss": 0.7764, + "step": 64367 + }, + { + "epoch": 1.65, + "learning_rate": 8.871242596000573e-07, + "loss": 0.6768, + "step": 64368 + }, + { + "epoch": 1.65, + "learning_rate": 8.870967660281511e-07, + "loss": 0.6826, + "step": 64369 + }, + { + "epoch": 1.65, + "learning_rate": 8.870692725426897e-07, + "loss": 0.6611, + "step": 64370 + }, + { + "epoch": 1.65, + "learning_rate": 8.870417791436939e-07, + "loss": 0.7402, + "step": 64371 + }, + { + "epoch": 1.65, + "learning_rate": 8.870142858311857e-07, + "loss": 0.666, + "step": 64372 + }, + { + "epoch": 1.65, + "learning_rate": 8.86986792605185e-07, + "loss": 0.6421, + "step": 64373 + }, + { + "epoch": 1.65, + "learning_rate": 8.869592994657131e-07, + "loss": 0.6006, + "step": 64374 + }, + { + "epoch": 1.65, + "learning_rate": 8.869318064127917e-07, + "loss": 0.5552, + "step": 64375 + }, + { + "epoch": 1.65, + "learning_rate": 8.86904313446441e-07, + "loss": 0.6055, + "step": 64376 + }, + { + "epoch": 1.65, + "learning_rate": 8.868768205666827e-07, + "loss": 0.6218, + "step": 64377 + }, + { + "epoch": 1.65, + "learning_rate": 8.868493277735375e-07, + "loss": 0.5474, + "step": 64378 + }, + { + "epoch": 1.65, + "learning_rate": 8.868218350670267e-07, + "loss": 0.6157, + "step": 64379 + }, + { + "epoch": 1.65, + "learning_rate": 8.867943424471711e-07, + "loss": 0.4735, + "step": 64380 + }, + { + "epoch": 1.65, + "learning_rate": 8.86766849913992e-07, + "loss": 0.4414, + "step": 64381 + }, + { + "epoch": 1.65, + "learning_rate": 8.867393574675105e-07, + "loss": 0.5229, + "step": 64382 + }, + { + "epoch": 1.65, + "learning_rate": 8.867118651077471e-07, + "loss": 0.7988, + "step": 64383 + }, + { + "epoch": 1.65, + "learning_rate": 8.866843728347234e-07, + "loss": 0.6504, + "step": 64384 + }, + { + "epoch": 1.65, + "learning_rate": 8.8665688064846e-07, + "loss": 0.7773, + "step": 64385 + }, + { + "epoch": 1.65, + "learning_rate": 8.866293885489786e-07, + "loss": 0.5527, + "step": 64386 + }, + { + "epoch": 1.65, + "learning_rate": 8.866018965362997e-07, + "loss": 0.6895, + "step": 64387 + }, + { + "epoch": 1.65, + "learning_rate": 8.865744046104444e-07, + "loss": 0.6865, + "step": 64388 + }, + { + "epoch": 1.65, + "learning_rate": 8.86546912771434e-07, + "loss": 0.6504, + "step": 64389 + }, + { + "epoch": 1.65, + "learning_rate": 8.865194210192892e-07, + "loss": 0.7432, + "step": 64390 + }, + { + "epoch": 1.65, + "learning_rate": 8.864919293540315e-07, + "loss": 0.7012, + "step": 64391 + }, + { + "epoch": 1.65, + "learning_rate": 8.86464437775682e-07, + "loss": 0.6611, + "step": 64392 + }, + { + "epoch": 1.65, + "learning_rate": 8.86436946284261e-07, + "loss": 0.6699, + "step": 64393 + }, + { + "epoch": 1.65, + "learning_rate": 8.864094548797901e-07, + "loss": 0.6904, + "step": 64394 + }, + { + "epoch": 1.65, + "learning_rate": 8.863819635622901e-07, + "loss": 0.5076, + "step": 64395 + }, + { + "epoch": 1.65, + "learning_rate": 8.863544723317825e-07, + "loss": 0.6782, + "step": 64396 + }, + { + "epoch": 1.65, + "learning_rate": 8.863269811882877e-07, + "loss": 0.5107, + "step": 64397 + }, + { + "epoch": 1.65, + "learning_rate": 8.862994901318275e-07, + "loss": 0.5908, + "step": 64398 + }, + { + "epoch": 1.65, + "learning_rate": 8.862719991624222e-07, + "loss": 0.6562, + "step": 64399 + }, + { + "epoch": 1.65, + "learning_rate": 8.862445082800934e-07, + "loss": 0.5686, + "step": 64400 + }, + { + "epoch": 1.65, + "learning_rate": 8.862170174848619e-07, + "loss": 0.6479, + "step": 64401 + }, + { + "epoch": 1.65, + "learning_rate": 8.861895267767491e-07, + "loss": 0.6479, + "step": 64402 + }, + { + "epoch": 1.65, + "learning_rate": 8.861620361557755e-07, + "loss": 0.7197, + "step": 64403 + }, + { + "epoch": 1.65, + "learning_rate": 8.861345456219626e-07, + "loss": 0.6396, + "step": 64404 + }, + { + "epoch": 1.65, + "learning_rate": 8.861070551753308e-07, + "loss": 0.6631, + "step": 64405 + }, + { + "epoch": 1.65, + "learning_rate": 8.860795648159018e-07, + "loss": 0.6387, + "step": 64406 + }, + { + "epoch": 1.65, + "learning_rate": 8.860520745436963e-07, + "loss": 0.5039, + "step": 64407 + }, + { + "epoch": 1.65, + "learning_rate": 8.860245843587357e-07, + "loss": 0.5752, + "step": 64408 + }, + { + "epoch": 1.65, + "learning_rate": 8.859970942610406e-07, + "loss": 0.6157, + "step": 64409 + }, + { + "epoch": 1.65, + "learning_rate": 8.859696042506326e-07, + "loss": 0.689, + "step": 64410 + }, + { + "epoch": 1.65, + "learning_rate": 8.859421143275322e-07, + "loss": 0.5781, + "step": 64411 + }, + { + "epoch": 1.65, + "learning_rate": 8.85914624491761e-07, + "loss": 0.7012, + "step": 64412 + }, + { + "epoch": 1.65, + "learning_rate": 8.858871347433396e-07, + "loss": 0.6064, + "step": 64413 + }, + { + "epoch": 1.65, + "learning_rate": 8.858596450822888e-07, + "loss": 0.5151, + "step": 64414 + }, + { + "epoch": 1.65, + "learning_rate": 8.858321555086305e-07, + "loss": 0.623, + "step": 64415 + }, + { + "epoch": 1.65, + "learning_rate": 8.858046660223848e-07, + "loss": 0.8018, + "step": 64416 + }, + { + "epoch": 1.65, + "learning_rate": 8.857771766235735e-07, + "loss": 0.7188, + "step": 64417 + }, + { + "epoch": 1.65, + "learning_rate": 8.857496873122174e-07, + "loss": 0.4678, + "step": 64418 + }, + { + "epoch": 1.65, + "learning_rate": 8.857221980883374e-07, + "loss": 0.8018, + "step": 64419 + }, + { + "epoch": 1.65, + "learning_rate": 8.856947089519545e-07, + "loss": 0.6611, + "step": 64420 + }, + { + "epoch": 1.65, + "learning_rate": 8.856672199030905e-07, + "loss": 0.6104, + "step": 64421 + }, + { + "epoch": 1.65, + "learning_rate": 8.856397309417655e-07, + "loss": 0.7739, + "step": 64422 + }, + { + "epoch": 1.65, + "learning_rate": 8.856122420680008e-07, + "loss": 0.6807, + "step": 64423 + }, + { + "epoch": 1.65, + "learning_rate": 8.855847532818176e-07, + "loss": 0.7007, + "step": 64424 + }, + { + "epoch": 1.65, + "learning_rate": 8.85557264583237e-07, + "loss": 0.6719, + "step": 64425 + }, + { + "epoch": 1.65, + "learning_rate": 8.855297759722796e-07, + "loss": 0.6494, + "step": 64426 + }, + { + "epoch": 1.65, + "learning_rate": 8.855022874489671e-07, + "loss": 0.6514, + "step": 64427 + }, + { + "epoch": 1.65, + "learning_rate": 8.854747990133201e-07, + "loss": 0.5884, + "step": 64428 + }, + { + "epoch": 1.65, + "learning_rate": 8.8544731066536e-07, + "loss": 0.707, + "step": 64429 + }, + { + "epoch": 1.65, + "learning_rate": 8.854198224051073e-07, + "loss": 0.5247, + "step": 64430 + }, + { + "epoch": 1.65, + "learning_rate": 8.853923342325838e-07, + "loss": 0.6084, + "step": 64431 + }, + { + "epoch": 1.65, + "learning_rate": 8.853648461478099e-07, + "loss": 0.6606, + "step": 64432 + }, + { + "epoch": 1.65, + "learning_rate": 8.853373581508067e-07, + "loss": 0.584, + "step": 64433 + }, + { + "epoch": 1.65, + "learning_rate": 8.853098702415955e-07, + "loss": 0.7324, + "step": 64434 + }, + { + "epoch": 1.65, + "learning_rate": 8.852823824201972e-07, + "loss": 0.7393, + "step": 64435 + }, + { + "epoch": 1.65, + "learning_rate": 8.852548946866332e-07, + "loss": 0.6479, + "step": 64436 + }, + { + "epoch": 1.65, + "learning_rate": 8.852274070409238e-07, + "loss": 0.6821, + "step": 64437 + }, + { + "epoch": 1.65, + "learning_rate": 8.851999194830908e-07, + "loss": 0.5144, + "step": 64438 + }, + { + "epoch": 1.65, + "learning_rate": 8.851724320131548e-07, + "loss": 0.584, + "step": 64439 + }, + { + "epoch": 1.65, + "learning_rate": 8.851449446311372e-07, + "loss": 0.5913, + "step": 64440 + }, + { + "epoch": 1.65, + "learning_rate": 8.85117457337059e-07, + "loss": 0.8652, + "step": 64441 + }, + { + "epoch": 1.65, + "learning_rate": 8.850899701309409e-07, + "loss": 0.6517, + "step": 64442 + }, + { + "epoch": 1.65, + "learning_rate": 8.850624830128038e-07, + "loss": 0.6084, + "step": 64443 + }, + { + "epoch": 1.65, + "learning_rate": 8.850349959826694e-07, + "loss": 0.687, + "step": 64444 + }, + { + "epoch": 1.65, + "learning_rate": 8.850075090405582e-07, + "loss": 0.7686, + "step": 64445 + }, + { + "epoch": 1.65, + "learning_rate": 8.849800221864916e-07, + "loss": 0.6621, + "step": 64446 + }, + { + "epoch": 1.65, + "learning_rate": 8.849525354204903e-07, + "loss": 0.6675, + "step": 64447 + }, + { + "epoch": 1.65, + "learning_rate": 8.849250487425759e-07, + "loss": 0.5974, + "step": 64448 + }, + { + "epoch": 1.65, + "learning_rate": 8.848975621527688e-07, + "loss": 0.5737, + "step": 64449 + }, + { + "epoch": 1.65, + "learning_rate": 8.848700756510905e-07, + "loss": 0.4956, + "step": 64450 + }, + { + "epoch": 1.65, + "learning_rate": 8.848425892375621e-07, + "loss": 0.6709, + "step": 64451 + }, + { + "epoch": 1.65, + "learning_rate": 8.848151029122042e-07, + "loss": 0.6309, + "step": 64452 + }, + { + "epoch": 1.65, + "learning_rate": 8.847876166750381e-07, + "loss": 0.6021, + "step": 64453 + }, + { + "epoch": 1.65, + "learning_rate": 8.847601305260846e-07, + "loss": 0.5864, + "step": 64454 + }, + { + "epoch": 1.65, + "learning_rate": 8.847326444653653e-07, + "loss": 0.7607, + "step": 64455 + }, + { + "epoch": 1.65, + "learning_rate": 8.847051584929006e-07, + "loss": 0.6455, + "step": 64456 + }, + { + "epoch": 1.65, + "learning_rate": 8.846776726087122e-07, + "loss": 0.7891, + "step": 64457 + }, + { + "epoch": 1.65, + "learning_rate": 8.846501868128204e-07, + "loss": 0.5425, + "step": 64458 + }, + { + "epoch": 1.65, + "learning_rate": 8.846227011052471e-07, + "loss": 0.6504, + "step": 64459 + }, + { + "epoch": 1.65, + "learning_rate": 8.845952154860128e-07, + "loss": 0.6006, + "step": 64460 + }, + { + "epoch": 1.65, + "learning_rate": 8.845677299551387e-07, + "loss": 0.4795, + "step": 64461 + }, + { + "epoch": 1.65, + "learning_rate": 8.845402445126456e-07, + "loss": 0.5769, + "step": 64462 + }, + { + "epoch": 1.65, + "learning_rate": 8.845127591585547e-07, + "loss": 0.4531, + "step": 64463 + }, + { + "epoch": 1.65, + "learning_rate": 8.84485273892887e-07, + "loss": 0.5498, + "step": 64464 + }, + { + "epoch": 1.65, + "learning_rate": 8.844577887156638e-07, + "loss": 0.6172, + "step": 64465 + }, + { + "epoch": 1.65, + "learning_rate": 8.844303036269058e-07, + "loss": 0.6274, + "step": 64466 + }, + { + "epoch": 1.65, + "learning_rate": 8.844028186266343e-07, + "loss": 0.6777, + "step": 64467 + }, + { + "epoch": 1.65, + "learning_rate": 8.8437533371487e-07, + "loss": 0.6807, + "step": 64468 + }, + { + "epoch": 1.65, + "learning_rate": 8.843478488916346e-07, + "loss": 0.6172, + "step": 64469 + }, + { + "epoch": 1.65, + "learning_rate": 8.843203641569484e-07, + "loss": 0.7012, + "step": 64470 + }, + { + "epoch": 1.65, + "learning_rate": 8.842928795108332e-07, + "loss": 0.5315, + "step": 64471 + }, + { + "epoch": 1.65, + "learning_rate": 8.842653949533094e-07, + "loss": 0.6445, + "step": 64472 + }, + { + "epoch": 1.65, + "learning_rate": 8.842379104843982e-07, + "loss": 0.5386, + "step": 64473 + }, + { + "epoch": 1.65, + "learning_rate": 8.842104261041207e-07, + "loss": 0.6689, + "step": 64474 + }, + { + "epoch": 1.65, + "learning_rate": 8.841829418124978e-07, + "loss": 0.5591, + "step": 64475 + }, + { + "epoch": 1.65, + "learning_rate": 8.84155457609551e-07, + "loss": 0.5234, + "step": 64476 + }, + { + "epoch": 1.65, + "learning_rate": 8.84127973495301e-07, + "loss": 0.6665, + "step": 64477 + }, + { + "epoch": 1.65, + "learning_rate": 8.841004894697687e-07, + "loss": 0.5962, + "step": 64478 + }, + { + "epoch": 1.65, + "learning_rate": 8.840730055329755e-07, + "loss": 0.6367, + "step": 64479 + }, + { + "epoch": 1.65, + "learning_rate": 8.840455216849421e-07, + "loss": 0.6221, + "step": 64480 + }, + { + "epoch": 1.65, + "learning_rate": 8.8401803792569e-07, + "loss": 0.8145, + "step": 64481 + }, + { + "epoch": 1.65, + "learning_rate": 8.839905542552398e-07, + "loss": 0.6992, + "step": 64482 + }, + { + "epoch": 1.65, + "learning_rate": 8.839630706736125e-07, + "loss": 0.7236, + "step": 64483 + }, + { + "epoch": 1.65, + "learning_rate": 8.839355871808296e-07, + "loss": 0.6758, + "step": 64484 + }, + { + "epoch": 1.65, + "learning_rate": 8.839081037769117e-07, + "loss": 0.4636, + "step": 64485 + }, + { + "epoch": 1.65, + "learning_rate": 8.838806204618802e-07, + "loss": 0.8213, + "step": 64486 + }, + { + "epoch": 1.65, + "learning_rate": 8.838531372357557e-07, + "loss": 0.5645, + "step": 64487 + }, + { + "epoch": 1.65, + "learning_rate": 8.838256540985598e-07, + "loss": 0.7227, + "step": 64488 + }, + { + "epoch": 1.65, + "learning_rate": 8.83798171050313e-07, + "loss": 0.6934, + "step": 64489 + }, + { + "epoch": 1.65, + "learning_rate": 8.837706880910369e-07, + "loss": 0.6064, + "step": 64490 + }, + { + "epoch": 1.65, + "learning_rate": 8.837432052207523e-07, + "loss": 0.7676, + "step": 64491 + }, + { + "epoch": 1.65, + "learning_rate": 8.837157224394797e-07, + "loss": 0.5625, + "step": 64492 + }, + { + "epoch": 1.65, + "learning_rate": 8.836882397472411e-07, + "loss": 0.7031, + "step": 64493 + }, + { + "epoch": 1.65, + "learning_rate": 8.83660757144057e-07, + "loss": 0.5654, + "step": 64494 + }, + { + "epoch": 1.65, + "learning_rate": 8.836332746299481e-07, + "loss": 0.5637, + "step": 64495 + }, + { + "epoch": 1.65, + "learning_rate": 8.836057922049363e-07, + "loss": 0.7339, + "step": 64496 + }, + { + "epoch": 1.65, + "learning_rate": 8.835783098690418e-07, + "loss": 0.5134, + "step": 64497 + }, + { + "epoch": 1.65, + "learning_rate": 8.835508276222863e-07, + "loss": 0.792, + "step": 64498 + }, + { + "epoch": 1.65, + "learning_rate": 8.835233454646904e-07, + "loss": 0.5835, + "step": 64499 + }, + { + "epoch": 1.65, + "learning_rate": 8.834958633962756e-07, + "loss": 0.5259, + "step": 64500 + }, + { + "epoch": 1.65, + "learning_rate": 8.834683814170627e-07, + "loss": 0.7305, + "step": 64501 + }, + { + "epoch": 1.65, + "learning_rate": 8.834408995270725e-07, + "loss": 0.6826, + "step": 64502 + }, + { + "epoch": 1.65, + "learning_rate": 8.834134177263263e-07, + "loss": 0.6455, + "step": 64503 + }, + { + "epoch": 1.65, + "learning_rate": 8.833859360148448e-07, + "loss": 0.8037, + "step": 64504 + }, + { + "epoch": 1.65, + "learning_rate": 8.833584543926497e-07, + "loss": 0.5952, + "step": 64505 + }, + { + "epoch": 1.65, + "learning_rate": 8.833309728597613e-07, + "loss": 0.8604, + "step": 64506 + }, + { + "epoch": 1.65, + "learning_rate": 8.833034914162014e-07, + "loss": 0.6094, + "step": 64507 + }, + { + "epoch": 1.65, + "learning_rate": 8.832760100619903e-07, + "loss": 0.709, + "step": 64508 + }, + { + "epoch": 1.65, + "learning_rate": 8.832485287971496e-07, + "loss": 0.6328, + "step": 64509 + }, + { + "epoch": 1.65, + "learning_rate": 8.832210476217e-07, + "loss": 0.5293, + "step": 64510 + }, + { + "epoch": 1.65, + "learning_rate": 8.831935665356631e-07, + "loss": 0.5386, + "step": 64511 + }, + { + "epoch": 1.65, + "learning_rate": 8.831660855390593e-07, + "loss": 0.7529, + "step": 64512 + }, + { + "epoch": 1.65, + "learning_rate": 8.831386046319098e-07, + "loss": 0.6479, + "step": 64513 + }, + { + "epoch": 1.65, + "learning_rate": 8.831111238142356e-07, + "loss": 0.7026, + "step": 64514 + }, + { + "epoch": 1.65, + "learning_rate": 8.830836430860579e-07, + "loss": 0.6367, + "step": 64515 + }, + { + "epoch": 1.65, + "learning_rate": 8.830561624473976e-07, + "loss": 0.667, + "step": 64516 + }, + { + "epoch": 1.65, + "learning_rate": 8.830286818982759e-07, + "loss": 0.7119, + "step": 64517 + }, + { + "epoch": 1.65, + "learning_rate": 8.830012014387136e-07, + "loss": 0.7227, + "step": 64518 + }, + { + "epoch": 1.65, + "learning_rate": 8.829737210687321e-07, + "loss": 0.6582, + "step": 64519 + }, + { + "epoch": 1.65, + "learning_rate": 8.829462407883522e-07, + "loss": 0.7959, + "step": 64520 + }, + { + "epoch": 1.65, + "learning_rate": 8.829187605975952e-07, + "loss": 0.7412, + "step": 64521 + }, + { + "epoch": 1.65, + "learning_rate": 8.828912804964818e-07, + "loss": 0.5151, + "step": 64522 + }, + { + "epoch": 1.65, + "learning_rate": 8.828638004850328e-07, + "loss": 0.7344, + "step": 64523 + }, + { + "epoch": 1.65, + "learning_rate": 8.828363205632701e-07, + "loss": 0.6768, + "step": 64524 + }, + { + "epoch": 1.65, + "learning_rate": 8.828088407312137e-07, + "loss": 0.5542, + "step": 64525 + }, + { + "epoch": 1.65, + "learning_rate": 8.827813609888856e-07, + "loss": 0.584, + "step": 64526 + }, + { + "epoch": 1.65, + "learning_rate": 8.827538813363062e-07, + "loss": 0.8418, + "step": 64527 + }, + { + "epoch": 1.65, + "learning_rate": 8.827264017734969e-07, + "loss": 0.5063, + "step": 64528 + }, + { + "epoch": 1.65, + "learning_rate": 8.826989223004785e-07, + "loss": 0.6602, + "step": 64529 + }, + { + "epoch": 1.65, + "learning_rate": 8.826714429172723e-07, + "loss": 0.7344, + "step": 64530 + }, + { + "epoch": 1.65, + "learning_rate": 8.826439636238993e-07, + "loss": 0.623, + "step": 64531 + }, + { + "epoch": 1.65, + "learning_rate": 8.826164844203802e-07, + "loss": 0.7437, + "step": 64532 + }, + { + "epoch": 1.65, + "learning_rate": 8.825890053067362e-07, + "loss": 0.4678, + "step": 64533 + }, + { + "epoch": 1.65, + "learning_rate": 8.825615262829886e-07, + "loss": 0.7021, + "step": 64534 + }, + { + "epoch": 1.65, + "learning_rate": 8.82534047349158e-07, + "loss": 0.7007, + "step": 64535 + }, + { + "epoch": 1.65, + "learning_rate": 8.825065685052659e-07, + "loss": 0.6826, + "step": 64536 + }, + { + "epoch": 1.65, + "learning_rate": 8.824790897513328e-07, + "loss": 0.6377, + "step": 64537 + }, + { + "epoch": 1.65, + "learning_rate": 8.824516110873803e-07, + "loss": 0.7622, + "step": 64538 + }, + { + "epoch": 1.65, + "learning_rate": 8.824241325134291e-07, + "loss": 0.7158, + "step": 64539 + }, + { + "epoch": 1.65, + "learning_rate": 8.823966540295005e-07, + "loss": 0.5776, + "step": 64540 + }, + { + "epoch": 1.65, + "learning_rate": 8.823691756356155e-07, + "loss": 0.6079, + "step": 64541 + }, + { + "epoch": 1.65, + "learning_rate": 8.823416973317946e-07, + "loss": 0.6592, + "step": 64542 + }, + { + "epoch": 1.65, + "learning_rate": 8.823142191180596e-07, + "loss": 0.4427, + "step": 64543 + }, + { + "epoch": 1.65, + "learning_rate": 8.82286740994431e-07, + "loss": 0.6006, + "step": 64544 + }, + { + "epoch": 1.65, + "learning_rate": 8.8225926296093e-07, + "loss": 0.6797, + "step": 64545 + }, + { + "epoch": 1.65, + "learning_rate": 8.822317850175775e-07, + "loss": 0.6963, + "step": 64546 + }, + { + "epoch": 1.65, + "learning_rate": 8.822043071643951e-07, + "loss": 0.6113, + "step": 64547 + }, + { + "epoch": 1.65, + "learning_rate": 8.821768294014031e-07, + "loss": 0.4442, + "step": 64548 + }, + { + "epoch": 1.65, + "learning_rate": 8.821493517286231e-07, + "loss": 0.4866, + "step": 64549 + }, + { + "epoch": 1.65, + "learning_rate": 8.821218741460761e-07, + "loss": 0.6367, + "step": 64550 + }, + { + "epoch": 1.65, + "learning_rate": 8.820943966537829e-07, + "loss": 0.6245, + "step": 64551 + }, + { + "epoch": 1.65, + "learning_rate": 8.820669192517644e-07, + "loss": 0.7168, + "step": 64552 + }, + { + "epoch": 1.65, + "learning_rate": 8.820394419400418e-07, + "loss": 0.6421, + "step": 64553 + }, + { + "epoch": 1.65, + "learning_rate": 8.820119647186363e-07, + "loss": 0.4469, + "step": 64554 + }, + { + "epoch": 1.65, + "learning_rate": 8.819844875875688e-07, + "loss": 0.8711, + "step": 64555 + }, + { + "epoch": 1.65, + "learning_rate": 8.819570105468602e-07, + "loss": 0.5873, + "step": 64556 + }, + { + "epoch": 1.65, + "learning_rate": 8.819295335965319e-07, + "loss": 0.8535, + "step": 64557 + }, + { + "epoch": 1.65, + "learning_rate": 8.819020567366044e-07, + "loss": 0.7153, + "step": 64558 + }, + { + "epoch": 1.65, + "learning_rate": 8.818745799670994e-07, + "loss": 0.6021, + "step": 64559 + }, + { + "epoch": 1.65, + "learning_rate": 8.818471032880374e-07, + "loss": 0.606, + "step": 64560 + }, + { + "epoch": 1.65, + "learning_rate": 8.818196266994401e-07, + "loss": 0.665, + "step": 64561 + }, + { + "epoch": 1.65, + "learning_rate": 8.817921502013278e-07, + "loss": 0.7119, + "step": 64562 + }, + { + "epoch": 1.65, + "learning_rate": 8.817646737937216e-07, + "loss": 0.6299, + "step": 64563 + }, + { + "epoch": 1.65, + "learning_rate": 8.81737197476643e-07, + "loss": 0.4985, + "step": 64564 + }, + { + "epoch": 1.65, + "learning_rate": 8.817097212501125e-07, + "loss": 0.6445, + "step": 64565 + }, + { + "epoch": 1.65, + "learning_rate": 8.816822451141517e-07, + "loss": 0.8154, + "step": 64566 + }, + { + "epoch": 1.65, + "learning_rate": 8.816547690687813e-07, + "loss": 0.6455, + "step": 64567 + }, + { + "epoch": 1.65, + "learning_rate": 8.816272931140222e-07, + "loss": 0.6562, + "step": 64568 + }, + { + "epoch": 1.65, + "learning_rate": 8.815998172498959e-07, + "loss": 0.498, + "step": 64569 + }, + { + "epoch": 1.65, + "learning_rate": 8.81572341476423e-07, + "loss": 0.7256, + "step": 64570 + }, + { + "epoch": 1.65, + "learning_rate": 8.81544865793625e-07, + "loss": 0.4746, + "step": 64571 + }, + { + "epoch": 1.66, + "learning_rate": 8.815173902015226e-07, + "loss": 0.5016, + "step": 64572 + }, + { + "epoch": 1.66, + "learning_rate": 8.814899147001367e-07, + "loss": 0.7197, + "step": 64573 + }, + { + "epoch": 1.66, + "learning_rate": 8.814624392894886e-07, + "loss": 0.4905, + "step": 64574 + }, + { + "epoch": 1.66, + "learning_rate": 8.814349639695991e-07, + "loss": 0.6182, + "step": 64575 + }, + { + "epoch": 1.66, + "learning_rate": 8.814074887404895e-07, + "loss": 0.8154, + "step": 64576 + }, + { + "epoch": 1.66, + "learning_rate": 8.813800136021806e-07, + "loss": 0.541, + "step": 64577 + }, + { + "epoch": 1.66, + "learning_rate": 8.813525385546939e-07, + "loss": 0.5288, + "step": 64578 + }, + { + "epoch": 1.66, + "learning_rate": 8.813250635980497e-07, + "loss": 0.6631, + "step": 64579 + }, + { + "epoch": 1.66, + "learning_rate": 8.812975887322698e-07, + "loss": 0.6528, + "step": 64580 + }, + { + "epoch": 1.66, + "learning_rate": 8.81270113957375e-07, + "loss": 0.665, + "step": 64581 + }, + { + "epoch": 1.66, + "learning_rate": 8.812426392733858e-07, + "loss": 0.6895, + "step": 64582 + }, + { + "epoch": 1.66, + "learning_rate": 8.812151646803238e-07, + "loss": 0.5654, + "step": 64583 + }, + { + "epoch": 1.66, + "learning_rate": 8.811876901782099e-07, + "loss": 0.4512, + "step": 64584 + }, + { + "epoch": 1.66, + "learning_rate": 8.811602157670652e-07, + "loss": 0.4785, + "step": 64585 + }, + { + "epoch": 1.66, + "learning_rate": 8.811327414469107e-07, + "loss": 0.6406, + "step": 64586 + }, + { + "epoch": 1.66, + "learning_rate": 8.81105267217767e-07, + "loss": 0.5967, + "step": 64587 + }, + { + "epoch": 1.66, + "learning_rate": 8.810777930796559e-07, + "loss": 0.8525, + "step": 64588 + }, + { + "epoch": 1.66, + "learning_rate": 8.810503190325979e-07, + "loss": 0.7949, + "step": 64589 + }, + { + "epoch": 1.66, + "learning_rate": 8.810228450766143e-07, + "loss": 0.5654, + "step": 64590 + }, + { + "epoch": 1.66, + "learning_rate": 8.809953712117263e-07, + "loss": 0.7178, + "step": 64591 + }, + { + "epoch": 1.66, + "learning_rate": 8.809678974379543e-07, + "loss": 0.6147, + "step": 64592 + }, + { + "epoch": 1.66, + "learning_rate": 8.809404237553198e-07, + "loss": 0.6973, + "step": 64593 + }, + { + "epoch": 1.66, + "learning_rate": 8.809129501638436e-07, + "loss": 0.6782, + "step": 64594 + }, + { + "epoch": 1.66, + "learning_rate": 8.80885476663547e-07, + "loss": 0.6357, + "step": 64595 + }, + { + "epoch": 1.66, + "learning_rate": 8.808580032544509e-07, + "loss": 0.7822, + "step": 64596 + }, + { + "epoch": 1.66, + "learning_rate": 8.808305299365765e-07, + "loss": 0.5864, + "step": 64597 + }, + { + "epoch": 1.66, + "learning_rate": 8.808030567099443e-07, + "loss": 0.7568, + "step": 64598 + }, + { + "epoch": 1.66, + "learning_rate": 8.807755835745761e-07, + "loss": 0.6318, + "step": 64599 + }, + { + "epoch": 1.66, + "learning_rate": 8.807481105304922e-07, + "loss": 0.5959, + "step": 64600 + }, + { + "epoch": 1.66, + "learning_rate": 8.807206375777146e-07, + "loss": 0.6152, + "step": 64601 + }, + { + "epoch": 1.66, + "learning_rate": 8.806931647162634e-07, + "loss": 0.8203, + "step": 64602 + }, + { + "epoch": 1.66, + "learning_rate": 8.806656919461599e-07, + "loss": 0.5337, + "step": 64603 + }, + { + "epoch": 1.66, + "learning_rate": 8.806382192674251e-07, + "loss": 0.6216, + "step": 64604 + }, + { + "epoch": 1.66, + "learning_rate": 8.806107466800803e-07, + "loss": 0.5352, + "step": 64605 + }, + { + "epoch": 1.66, + "learning_rate": 8.805832741841461e-07, + "loss": 0.6406, + "step": 64606 + }, + { + "epoch": 1.66, + "learning_rate": 8.80555801779644e-07, + "loss": 0.7422, + "step": 64607 + }, + { + "epoch": 1.66, + "learning_rate": 8.805283294665947e-07, + "loss": 0.5474, + "step": 64608 + }, + { + "epoch": 1.66, + "learning_rate": 8.805008572450196e-07, + "loss": 0.5938, + "step": 64609 + }, + { + "epoch": 1.66, + "learning_rate": 8.804733851149392e-07, + "loss": 0.5269, + "step": 64610 + }, + { + "epoch": 1.66, + "learning_rate": 8.804459130763752e-07, + "loss": 0.5679, + "step": 64611 + }, + { + "epoch": 1.66, + "learning_rate": 8.804184411293482e-07, + "loss": 0.5244, + "step": 64612 + }, + { + "epoch": 1.66, + "learning_rate": 8.803909692738791e-07, + "loss": 0.6543, + "step": 64613 + }, + { + "epoch": 1.66, + "learning_rate": 8.803634975099893e-07, + "loss": 0.6001, + "step": 64614 + }, + { + "epoch": 1.66, + "learning_rate": 8.803360258376994e-07, + "loss": 0.7441, + "step": 64615 + }, + { + "epoch": 1.66, + "learning_rate": 8.80308554257031e-07, + "loss": 0.7402, + "step": 64616 + }, + { + "epoch": 1.66, + "learning_rate": 8.802810827680045e-07, + "loss": 0.5742, + "step": 64617 + }, + { + "epoch": 1.66, + "learning_rate": 8.802536113706415e-07, + "loss": 0.6152, + "step": 64618 + }, + { + "epoch": 1.66, + "learning_rate": 8.802261400649628e-07, + "loss": 0.7852, + "step": 64619 + }, + { + "epoch": 1.66, + "learning_rate": 8.801986688509894e-07, + "loss": 0.5312, + "step": 64620 + }, + { + "epoch": 1.66, + "learning_rate": 8.801711977287428e-07, + "loss": 0.4028, + "step": 64621 + }, + { + "epoch": 1.66, + "learning_rate": 8.801437266982432e-07, + "loss": 0.5176, + "step": 64622 + }, + { + "epoch": 1.66, + "learning_rate": 8.801162557595118e-07, + "loss": 0.5791, + "step": 64623 + }, + { + "epoch": 1.66, + "learning_rate": 8.800887849125702e-07, + "loss": 0.6016, + "step": 64624 + }, + { + "epoch": 1.66, + "learning_rate": 8.800613141574389e-07, + "loss": 0.8672, + "step": 64625 + }, + { + "epoch": 1.66, + "learning_rate": 8.800338434941393e-07, + "loss": 0.8735, + "step": 64626 + }, + { + "epoch": 1.66, + "learning_rate": 8.800063729226921e-07, + "loss": 0.7822, + "step": 64627 + }, + { + "epoch": 1.66, + "learning_rate": 8.799789024431188e-07, + "loss": 0.438, + "step": 64628 + }, + { + "epoch": 1.66, + "learning_rate": 8.799514320554397e-07, + "loss": 0.7451, + "step": 64629 + }, + { + "epoch": 1.66, + "learning_rate": 8.799239617596767e-07, + "loss": 0.6553, + "step": 64630 + }, + { + "epoch": 1.66, + "learning_rate": 8.798964915558505e-07, + "loss": 0.6846, + "step": 64631 + }, + { + "epoch": 1.66, + "learning_rate": 8.798690214439815e-07, + "loss": 0.8926, + "step": 64632 + }, + { + "epoch": 1.66, + "learning_rate": 8.798415514240917e-07, + "loss": 0.604, + "step": 64633 + }, + { + "epoch": 1.66, + "learning_rate": 8.798140814962014e-07, + "loss": 0.8232, + "step": 64634 + }, + { + "epoch": 1.66, + "learning_rate": 8.797866116603321e-07, + "loss": 0.6855, + "step": 64635 + }, + { + "epoch": 1.66, + "learning_rate": 8.797591419165045e-07, + "loss": 0.6152, + "step": 64636 + }, + { + "epoch": 1.66, + "learning_rate": 8.7973167226474e-07, + "loss": 0.6694, + "step": 64637 + }, + { + "epoch": 1.66, + "learning_rate": 8.797042027050592e-07, + "loss": 0.4227, + "step": 64638 + }, + { + "epoch": 1.66, + "learning_rate": 8.796767332374835e-07, + "loss": 0.6387, + "step": 64639 + }, + { + "epoch": 1.66, + "learning_rate": 8.796492638620339e-07, + "loss": 0.5159, + "step": 64640 + }, + { + "epoch": 1.66, + "learning_rate": 8.796217945787315e-07, + "loss": 0.5269, + "step": 64641 + }, + { + "epoch": 1.66, + "learning_rate": 8.795943253875968e-07, + "loss": 0.6025, + "step": 64642 + }, + { + "epoch": 1.66, + "learning_rate": 8.795668562886513e-07, + "loss": 0.6035, + "step": 64643 + }, + { + "epoch": 1.66, + "learning_rate": 8.795393872819158e-07, + "loss": 0.665, + "step": 64644 + }, + { + "epoch": 1.66, + "learning_rate": 8.795119183674116e-07, + "loss": 0.6104, + "step": 64645 + }, + { + "epoch": 1.66, + "learning_rate": 8.794844495451593e-07, + "loss": 0.6631, + "step": 64646 + }, + { + "epoch": 1.66, + "learning_rate": 8.794569808151806e-07, + "loss": 0.6714, + "step": 64647 + }, + { + "epoch": 1.66, + "learning_rate": 8.794295121774959e-07, + "loss": 0.5908, + "step": 64648 + }, + { + "epoch": 1.66, + "learning_rate": 8.794020436321266e-07, + "loss": 0.7031, + "step": 64649 + }, + { + "epoch": 1.66, + "learning_rate": 8.793745751790935e-07, + "loss": 0.6753, + "step": 64650 + }, + { + "epoch": 1.66, + "learning_rate": 8.793471068184179e-07, + "loss": 0.6235, + "step": 64651 + }, + { + "epoch": 1.66, + "learning_rate": 8.793196385501208e-07, + "loss": 0.5659, + "step": 64652 + }, + { + "epoch": 1.66, + "learning_rate": 8.792921703742227e-07, + "loss": 0.6201, + "step": 64653 + }, + { + "epoch": 1.66, + "learning_rate": 8.792647022907454e-07, + "loss": 0.8359, + "step": 64654 + }, + { + "epoch": 1.66, + "learning_rate": 8.792372342997092e-07, + "loss": 0.7305, + "step": 64655 + }, + { + "epoch": 1.66, + "learning_rate": 8.792097664011358e-07, + "loss": 0.6533, + "step": 64656 + }, + { + "epoch": 1.66, + "learning_rate": 8.791822985950459e-07, + "loss": 0.4971, + "step": 64657 + }, + { + "epoch": 1.66, + "learning_rate": 8.791548308814602e-07, + "loss": 0.707, + "step": 64658 + }, + { + "epoch": 1.66, + "learning_rate": 8.791273632604005e-07, + "loss": 0.5859, + "step": 64659 + }, + { + "epoch": 1.66, + "learning_rate": 8.790998957318871e-07, + "loss": 0.6233, + "step": 64660 + }, + { + "epoch": 1.66, + "learning_rate": 8.790724282959419e-07, + "loss": 0.7207, + "step": 64661 + }, + { + "epoch": 1.66, + "learning_rate": 8.790449609525851e-07, + "loss": 0.668, + "step": 64662 + }, + { + "epoch": 1.66, + "learning_rate": 8.790174937018377e-07, + "loss": 0.55, + "step": 64663 + }, + { + "epoch": 1.66, + "learning_rate": 8.789900265437215e-07, + "loss": 0.8936, + "step": 64664 + }, + { + "epoch": 1.66, + "learning_rate": 8.789625594782566e-07, + "loss": 0.6064, + "step": 64665 + }, + { + "epoch": 1.66, + "learning_rate": 8.789350925054648e-07, + "loss": 0.75, + "step": 64666 + }, + { + "epoch": 1.66, + "learning_rate": 8.789076256253666e-07, + "loss": 0.5903, + "step": 64667 + }, + { + "epoch": 1.66, + "learning_rate": 8.788801588379837e-07, + "loss": 0.7656, + "step": 64668 + }, + { + "epoch": 1.66, + "learning_rate": 8.788526921433363e-07, + "loss": 0.7266, + "step": 64669 + }, + { + "epoch": 1.66, + "learning_rate": 8.788252255414459e-07, + "loss": 0.6958, + "step": 64670 + }, + { + "epoch": 1.66, + "learning_rate": 8.787977590323339e-07, + "loss": 0.7393, + "step": 64671 + }, + { + "epoch": 1.66, + "learning_rate": 8.787702926160204e-07, + "loss": 0.7441, + "step": 64672 + }, + { + "epoch": 1.66, + "learning_rate": 8.787428262925269e-07, + "loss": 0.6038, + "step": 64673 + }, + { + "epoch": 1.66, + "learning_rate": 8.787153600618746e-07, + "loss": 0.666, + "step": 64674 + }, + { + "epoch": 1.66, + "learning_rate": 8.786878939240842e-07, + "loss": 0.7266, + "step": 64675 + }, + { + "epoch": 1.66, + "learning_rate": 8.786604278791772e-07, + "loss": 0.6924, + "step": 64676 + }, + { + "epoch": 1.66, + "learning_rate": 8.78632961927174e-07, + "loss": 0.5327, + "step": 64677 + }, + { + "epoch": 1.66, + "learning_rate": 8.786054960680962e-07, + "loss": 0.79, + "step": 64678 + }, + { + "epoch": 1.66, + "learning_rate": 8.785780303019644e-07, + "loss": 0.5894, + "step": 64679 + }, + { + "epoch": 1.66, + "learning_rate": 8.785505646288e-07, + "loss": 0.5684, + "step": 64680 + }, + { + "epoch": 1.66, + "learning_rate": 8.78523099048624e-07, + "loss": 0.5732, + "step": 64681 + }, + { + "epoch": 1.66, + "learning_rate": 8.784956335614569e-07, + "loss": 0.509, + "step": 64682 + }, + { + "epoch": 1.66, + "learning_rate": 8.784681681673204e-07, + "loss": 0.8623, + "step": 64683 + }, + { + "epoch": 1.66, + "learning_rate": 8.78440702866235e-07, + "loss": 0.604, + "step": 64684 + }, + { + "epoch": 1.66, + "learning_rate": 8.784132376582221e-07, + "loss": 0.5679, + "step": 64685 + }, + { + "epoch": 1.66, + "learning_rate": 8.783857725433024e-07, + "loss": 0.7988, + "step": 64686 + }, + { + "epoch": 1.66, + "learning_rate": 8.783583075214973e-07, + "loss": 0.6387, + "step": 64687 + }, + { + "epoch": 1.66, + "learning_rate": 8.783308425928275e-07, + "loss": 0.5669, + "step": 64688 + }, + { + "epoch": 1.66, + "learning_rate": 8.783033777573144e-07, + "loss": 0.5225, + "step": 64689 + }, + { + "epoch": 1.66, + "learning_rate": 8.782759130149785e-07, + "loss": 0.79, + "step": 64690 + }, + { + "epoch": 1.66, + "learning_rate": 8.782484483658417e-07, + "loss": 0.6465, + "step": 64691 + }, + { + "epoch": 1.66, + "learning_rate": 8.782209838099241e-07, + "loss": 0.6528, + "step": 64692 + }, + { + "epoch": 1.66, + "learning_rate": 8.781935193472473e-07, + "loss": 0.4194, + "step": 64693 + }, + { + "epoch": 1.66, + "learning_rate": 8.781660549778317e-07, + "loss": 0.7422, + "step": 64694 + }, + { + "epoch": 1.66, + "learning_rate": 8.781385907016991e-07, + "loss": 0.5317, + "step": 64695 + }, + { + "epoch": 1.66, + "learning_rate": 8.781111265188699e-07, + "loss": 0.6064, + "step": 64696 + }, + { + "epoch": 1.66, + "learning_rate": 8.780836624293656e-07, + "loss": 0.606, + "step": 64697 + }, + { + "epoch": 1.66, + "learning_rate": 8.780561984332069e-07, + "loss": 0.6011, + "step": 64698 + }, + { + "epoch": 1.66, + "learning_rate": 8.780287345304151e-07, + "loss": 0.6279, + "step": 64699 + }, + { + "epoch": 1.66, + "learning_rate": 8.780012707210109e-07, + "loss": 0.7178, + "step": 64700 + }, + { + "epoch": 1.66, + "learning_rate": 8.77973807005016e-07, + "loss": 0.6729, + "step": 64701 + }, + { + "epoch": 1.66, + "learning_rate": 8.779463433824507e-07, + "loss": 0.5908, + "step": 64702 + }, + { + "epoch": 1.66, + "learning_rate": 8.77918879853336e-07, + "loss": 0.7832, + "step": 64703 + }, + { + "epoch": 1.66, + "learning_rate": 8.778914164176934e-07, + "loss": 0.6108, + "step": 64704 + }, + { + "epoch": 1.66, + "learning_rate": 8.778639530755436e-07, + "loss": 0.6738, + "step": 64705 + }, + { + "epoch": 1.66, + "learning_rate": 8.77836489826908e-07, + "loss": 0.6973, + "step": 64706 + }, + { + "epoch": 1.66, + "learning_rate": 8.77809026671807e-07, + "loss": 0.8076, + "step": 64707 + }, + { + "epoch": 1.66, + "learning_rate": 8.777815636102624e-07, + "loss": 0.6641, + "step": 64708 + }, + { + "epoch": 1.66, + "learning_rate": 8.777541006422945e-07, + "loss": 0.6711, + "step": 64709 + }, + { + "epoch": 1.66, + "learning_rate": 8.77726637767925e-07, + "loss": 0.5757, + "step": 64710 + }, + { + "epoch": 1.66, + "learning_rate": 8.776991749871747e-07, + "loss": 0.542, + "step": 64711 + }, + { + "epoch": 1.66, + "learning_rate": 8.776717123000643e-07, + "loss": 0.4817, + "step": 64712 + }, + { + "epoch": 1.66, + "learning_rate": 8.776442497066149e-07, + "loss": 0.7422, + "step": 64713 + }, + { + "epoch": 1.66, + "learning_rate": 8.776167872068479e-07, + "loss": 0.7734, + "step": 64714 + }, + { + "epoch": 1.66, + "learning_rate": 8.775893248007839e-07, + "loss": 0.5913, + "step": 64715 + }, + { + "epoch": 1.66, + "learning_rate": 8.775618624884442e-07, + "loss": 0.7686, + "step": 64716 + }, + { + "epoch": 1.66, + "learning_rate": 8.775344002698496e-07, + "loss": 0.571, + "step": 64717 + }, + { + "epoch": 1.66, + "learning_rate": 8.775069381450215e-07, + "loss": 0.6309, + "step": 64718 + }, + { + "epoch": 1.66, + "learning_rate": 8.774794761139805e-07, + "loss": 0.6846, + "step": 64719 + }, + { + "epoch": 1.66, + "learning_rate": 8.774520141767483e-07, + "loss": 0.707, + "step": 64720 + }, + { + "epoch": 1.66, + "learning_rate": 8.774245523333452e-07, + "loss": 0.543, + "step": 64721 + }, + { + "epoch": 1.66, + "learning_rate": 8.773970905837922e-07, + "loss": 0.645, + "step": 64722 + }, + { + "epoch": 1.66, + "learning_rate": 8.773696289281109e-07, + "loss": 0.6519, + "step": 64723 + }, + { + "epoch": 1.66, + "learning_rate": 8.77342167366322e-07, + "loss": 0.6689, + "step": 64724 + }, + { + "epoch": 1.66, + "learning_rate": 8.773147058984465e-07, + "loss": 0.834, + "step": 64725 + }, + { + "epoch": 1.66, + "learning_rate": 8.772872445245053e-07, + "loss": 0.6748, + "step": 64726 + }, + { + "epoch": 1.66, + "learning_rate": 8.7725978324452e-07, + "loss": 0.646, + "step": 64727 + }, + { + "epoch": 1.66, + "learning_rate": 8.772323220585108e-07, + "loss": 0.6982, + "step": 64728 + }, + { + "epoch": 1.66, + "learning_rate": 8.772048609664996e-07, + "loss": 0.5708, + "step": 64729 + }, + { + "epoch": 1.66, + "learning_rate": 8.771773999685071e-07, + "loss": 0.7002, + "step": 64730 + }, + { + "epoch": 1.66, + "learning_rate": 8.77149939064554e-07, + "loss": 0.6548, + "step": 64731 + }, + { + "epoch": 1.66, + "learning_rate": 8.771224782546614e-07, + "loss": 0.5254, + "step": 64732 + }, + { + "epoch": 1.66, + "learning_rate": 8.770950175388507e-07, + "loss": 0.6733, + "step": 64733 + }, + { + "epoch": 1.66, + "learning_rate": 8.770675569171423e-07, + "loss": 0.5479, + "step": 64734 + }, + { + "epoch": 1.66, + "learning_rate": 8.770400963895579e-07, + "loss": 0.599, + "step": 64735 + }, + { + "epoch": 1.66, + "learning_rate": 8.770126359561181e-07, + "loss": 0.6641, + "step": 64736 + }, + { + "epoch": 1.66, + "learning_rate": 8.769851756168443e-07, + "loss": 0.5369, + "step": 64737 + }, + { + "epoch": 1.66, + "learning_rate": 8.76957715371757e-07, + "loss": 0.5126, + "step": 64738 + }, + { + "epoch": 1.66, + "learning_rate": 8.769302552208778e-07, + "loss": 0.6172, + "step": 64739 + }, + { + "epoch": 1.66, + "learning_rate": 8.769027951642276e-07, + "loss": 0.7061, + "step": 64740 + }, + { + "epoch": 1.66, + "learning_rate": 8.768753352018269e-07, + "loss": 0.646, + "step": 64741 + }, + { + "epoch": 1.66, + "learning_rate": 8.768478753336974e-07, + "loss": 0.5479, + "step": 64742 + }, + { + "epoch": 1.66, + "learning_rate": 8.768204155598593e-07, + "loss": 0.6938, + "step": 64743 + }, + { + "epoch": 1.66, + "learning_rate": 8.767929558803347e-07, + "loss": 0.6611, + "step": 64744 + }, + { + "epoch": 1.66, + "learning_rate": 8.767654962951437e-07, + "loss": 0.6299, + "step": 64745 + }, + { + "epoch": 1.66, + "learning_rate": 8.767380368043078e-07, + "loss": 0.481, + "step": 64746 + }, + { + "epoch": 1.66, + "learning_rate": 8.767105774078478e-07, + "loss": 0.5928, + "step": 64747 + }, + { + "epoch": 1.66, + "learning_rate": 8.76683118105785e-07, + "loss": 0.7998, + "step": 64748 + }, + { + "epoch": 1.66, + "learning_rate": 8.766556588981404e-07, + "loss": 0.6904, + "step": 64749 + }, + { + "epoch": 1.66, + "learning_rate": 8.76628199784935e-07, + "loss": 0.6528, + "step": 64750 + }, + { + "epoch": 1.66, + "learning_rate": 8.766007407661893e-07, + "loss": 0.626, + "step": 64751 + }, + { + "epoch": 1.66, + "learning_rate": 8.76573281841925e-07, + "loss": 0.7012, + "step": 64752 + }, + { + "epoch": 1.66, + "learning_rate": 8.765458230121626e-07, + "loss": 0.6953, + "step": 64753 + }, + { + "epoch": 1.66, + "learning_rate": 8.765183642769236e-07, + "loss": 0.4121, + "step": 64754 + }, + { + "epoch": 1.66, + "learning_rate": 8.764909056362286e-07, + "loss": 0.5435, + "step": 64755 + }, + { + "epoch": 1.66, + "learning_rate": 8.764634470900991e-07, + "loss": 0.7656, + "step": 64756 + }, + { + "epoch": 1.66, + "learning_rate": 8.764359886385556e-07, + "loss": 0.5903, + "step": 64757 + }, + { + "epoch": 1.66, + "learning_rate": 8.764085302816196e-07, + "loss": 0.5957, + "step": 64758 + }, + { + "epoch": 1.66, + "learning_rate": 8.763810720193118e-07, + "loss": 0.6963, + "step": 64759 + }, + { + "epoch": 1.66, + "learning_rate": 8.763536138516536e-07, + "loss": 0.4824, + "step": 64760 + }, + { + "epoch": 1.66, + "learning_rate": 8.763261557786656e-07, + "loss": 0.6372, + "step": 64761 + }, + { + "epoch": 1.66, + "learning_rate": 8.762986978003688e-07, + "loss": 0.6387, + "step": 64762 + }, + { + "epoch": 1.66, + "learning_rate": 8.762712399167846e-07, + "loss": 0.8613, + "step": 64763 + }, + { + "epoch": 1.66, + "learning_rate": 8.762437821279335e-07, + "loss": 0.6968, + "step": 64764 + }, + { + "epoch": 1.66, + "learning_rate": 8.762163244338371e-07, + "loss": 0.6895, + "step": 64765 + }, + { + "epoch": 1.66, + "learning_rate": 8.761888668345162e-07, + "loss": 0.7383, + "step": 64766 + }, + { + "epoch": 1.66, + "learning_rate": 8.761614093299916e-07, + "loss": 0.7446, + "step": 64767 + }, + { + "epoch": 1.66, + "learning_rate": 8.761339519202848e-07, + "loss": 0.5527, + "step": 64768 + }, + { + "epoch": 1.66, + "learning_rate": 8.761064946054162e-07, + "loss": 0.625, + "step": 64769 + }, + { + "epoch": 1.66, + "learning_rate": 8.760790373854076e-07, + "loss": 0.5068, + "step": 64770 + }, + { + "epoch": 1.66, + "learning_rate": 8.760515802602793e-07, + "loss": 0.6309, + "step": 64771 + }, + { + "epoch": 1.66, + "learning_rate": 8.760241232300526e-07, + "loss": 0.6582, + "step": 64772 + }, + { + "epoch": 1.66, + "learning_rate": 8.759966662947487e-07, + "loss": 0.5605, + "step": 64773 + }, + { + "epoch": 1.66, + "learning_rate": 8.75969209454388e-07, + "loss": 0.6401, + "step": 64774 + }, + { + "epoch": 1.66, + "learning_rate": 8.759417527089924e-07, + "loss": 0.4548, + "step": 64775 + }, + { + "epoch": 1.66, + "learning_rate": 8.759142960585822e-07, + "loss": 0.5903, + "step": 64776 + }, + { + "epoch": 1.66, + "learning_rate": 8.75886839503179e-07, + "loss": 0.626, + "step": 64777 + }, + { + "epoch": 1.66, + "learning_rate": 8.758593830428032e-07, + "loss": 0.7236, + "step": 64778 + }, + { + "epoch": 1.66, + "learning_rate": 8.758319266774766e-07, + "loss": 0.6587, + "step": 64779 + }, + { + "epoch": 1.66, + "learning_rate": 8.758044704072198e-07, + "loss": 0.6802, + "step": 64780 + }, + { + "epoch": 1.66, + "learning_rate": 8.757770142320536e-07, + "loss": 0.6128, + "step": 64781 + }, + { + "epoch": 1.66, + "learning_rate": 8.757495581519991e-07, + "loss": 0.6929, + "step": 64782 + }, + { + "epoch": 1.66, + "learning_rate": 8.757221021670777e-07, + "loss": 0.6836, + "step": 64783 + }, + { + "epoch": 1.66, + "learning_rate": 8.756946462773099e-07, + "loss": 0.6973, + "step": 64784 + }, + { + "epoch": 1.66, + "learning_rate": 8.756671904827172e-07, + "loss": 0.6108, + "step": 64785 + }, + { + "epoch": 1.66, + "learning_rate": 8.756397347833203e-07, + "loss": 0.5938, + "step": 64786 + }, + { + "epoch": 1.66, + "learning_rate": 8.756122791791404e-07, + "loss": 0.6353, + "step": 64787 + }, + { + "epoch": 1.66, + "learning_rate": 8.755848236701982e-07, + "loss": 0.5803, + "step": 64788 + }, + { + "epoch": 1.66, + "learning_rate": 8.755573682565154e-07, + "loss": 0.5701, + "step": 64789 + }, + { + "epoch": 1.66, + "learning_rate": 8.755299129381126e-07, + "loss": 0.5869, + "step": 64790 + }, + { + "epoch": 1.66, + "learning_rate": 8.755024577150105e-07, + "loss": 0.6328, + "step": 64791 + }, + { + "epoch": 1.66, + "learning_rate": 8.754750025872308e-07, + "loss": 0.6943, + "step": 64792 + }, + { + "epoch": 1.66, + "learning_rate": 8.754475475547937e-07, + "loss": 0.7832, + "step": 64793 + }, + { + "epoch": 1.66, + "learning_rate": 8.75420092617721e-07, + "loss": 0.7295, + "step": 64794 + }, + { + "epoch": 1.66, + "learning_rate": 8.753926377760333e-07, + "loss": 0.4084, + "step": 64795 + }, + { + "epoch": 1.66, + "learning_rate": 8.753651830297517e-07, + "loss": 0.5603, + "step": 64796 + }, + { + "epoch": 1.66, + "learning_rate": 8.753377283788972e-07, + "loss": 0.6162, + "step": 64797 + }, + { + "epoch": 1.66, + "learning_rate": 8.75310273823491e-07, + "loss": 0.593, + "step": 64798 + }, + { + "epoch": 1.66, + "learning_rate": 8.75282819363554e-07, + "loss": 0.688, + "step": 64799 + }, + { + "epoch": 1.66, + "learning_rate": 8.752553649991076e-07, + "loss": 0.5508, + "step": 64800 + }, + { + "epoch": 1.66, + "learning_rate": 8.752279107301719e-07, + "loss": 0.666, + "step": 64801 + }, + { + "epoch": 1.66, + "learning_rate": 8.752004565567687e-07, + "loss": 0.877, + "step": 64802 + }, + { + "epoch": 1.66, + "learning_rate": 8.751730024789185e-07, + "loss": 0.5889, + "step": 64803 + }, + { + "epoch": 1.66, + "learning_rate": 8.751455484966428e-07, + "loss": 0.6016, + "step": 64804 + }, + { + "epoch": 1.66, + "learning_rate": 8.751180946099621e-07, + "loss": 0.502, + "step": 64805 + }, + { + "epoch": 1.66, + "learning_rate": 8.750906408188981e-07, + "loss": 0.5509, + "step": 64806 + }, + { + "epoch": 1.66, + "learning_rate": 8.750631871234712e-07, + "loss": 0.5557, + "step": 64807 + }, + { + "epoch": 1.66, + "learning_rate": 8.750357335237029e-07, + "loss": 0.4956, + "step": 64808 + }, + { + "epoch": 1.66, + "learning_rate": 8.750082800196138e-07, + "loss": 0.6191, + "step": 64809 + }, + { + "epoch": 1.66, + "learning_rate": 8.749808266112255e-07, + "loss": 0.5967, + "step": 64810 + }, + { + "epoch": 1.66, + "learning_rate": 8.749533732985583e-07, + "loss": 0.6904, + "step": 64811 + }, + { + "epoch": 1.66, + "learning_rate": 8.749259200816335e-07, + "loss": 0.6914, + "step": 64812 + }, + { + "epoch": 1.66, + "learning_rate": 8.748984669604724e-07, + "loss": 0.7124, + "step": 64813 + }, + { + "epoch": 1.66, + "learning_rate": 8.748710139350954e-07, + "loss": 0.5244, + "step": 64814 + }, + { + "epoch": 1.66, + "learning_rate": 8.748435610055244e-07, + "loss": 0.6772, + "step": 64815 + }, + { + "epoch": 1.66, + "learning_rate": 8.748161081717795e-07, + "loss": 0.7432, + "step": 64816 + }, + { + "epoch": 1.66, + "learning_rate": 8.747886554338824e-07, + "loss": 0.6431, + "step": 64817 + }, + { + "epoch": 1.66, + "learning_rate": 8.747612027918537e-07, + "loss": 0.5659, + "step": 64818 + }, + { + "epoch": 1.66, + "learning_rate": 8.747337502457148e-07, + "loss": 0.8506, + "step": 64819 + }, + { + "epoch": 1.66, + "learning_rate": 8.747062977954867e-07, + "loss": 0.6836, + "step": 64820 + }, + { + "epoch": 1.66, + "learning_rate": 8.7467884544119e-07, + "loss": 0.6567, + "step": 64821 + }, + { + "epoch": 1.66, + "learning_rate": 8.746513931828458e-07, + "loss": 0.5664, + "step": 64822 + }, + { + "epoch": 1.66, + "learning_rate": 8.746239410204754e-07, + "loss": 0.6426, + "step": 64823 + }, + { + "epoch": 1.66, + "learning_rate": 8.745964889540995e-07, + "loss": 0.6812, + "step": 64824 + }, + { + "epoch": 1.66, + "learning_rate": 8.745690369837395e-07, + "loss": 0.6787, + "step": 64825 + }, + { + "epoch": 1.66, + "learning_rate": 8.74541585109416e-07, + "loss": 0.6807, + "step": 64826 + }, + { + "epoch": 1.66, + "learning_rate": 8.745141333311506e-07, + "loss": 0.6714, + "step": 64827 + }, + { + "epoch": 1.66, + "learning_rate": 8.744866816489635e-07, + "loss": 0.792, + "step": 64828 + }, + { + "epoch": 1.66, + "learning_rate": 8.744592300628765e-07, + "loss": 0.6196, + "step": 64829 + }, + { + "epoch": 1.66, + "learning_rate": 8.744317785729106e-07, + "loss": 0.5586, + "step": 64830 + }, + { + "epoch": 1.66, + "learning_rate": 8.744043271790859e-07, + "loss": 0.5668, + "step": 64831 + }, + { + "epoch": 1.66, + "learning_rate": 8.743768758814244e-07, + "loss": 0.6836, + "step": 64832 + }, + { + "epoch": 1.66, + "learning_rate": 8.743494246799465e-07, + "loss": 0.7861, + "step": 64833 + }, + { + "epoch": 1.66, + "learning_rate": 8.743219735746737e-07, + "loss": 0.519, + "step": 64834 + }, + { + "epoch": 1.66, + "learning_rate": 8.742945225656264e-07, + "loss": 0.8115, + "step": 64835 + }, + { + "epoch": 1.66, + "learning_rate": 8.742670716528264e-07, + "loss": 0.7007, + "step": 64836 + }, + { + "epoch": 1.66, + "learning_rate": 8.742396208362941e-07, + "loss": 0.6006, + "step": 64837 + }, + { + "epoch": 1.66, + "learning_rate": 8.742121701160508e-07, + "loss": 0.6733, + "step": 64838 + }, + { + "epoch": 1.66, + "learning_rate": 8.741847194921176e-07, + "loss": 0.6514, + "step": 64839 + }, + { + "epoch": 1.66, + "learning_rate": 8.741572689645156e-07, + "loss": 0.665, + "step": 64840 + }, + { + "epoch": 1.66, + "learning_rate": 8.741298185332651e-07, + "loss": 0.6499, + "step": 64841 + }, + { + "epoch": 1.66, + "learning_rate": 8.741023681983879e-07, + "loss": 0.7451, + "step": 64842 + }, + { + "epoch": 1.66, + "learning_rate": 8.740749179599045e-07, + "loss": 0.5413, + "step": 64843 + }, + { + "epoch": 1.66, + "learning_rate": 8.740474678178363e-07, + "loss": 0.6914, + "step": 64844 + }, + { + "epoch": 1.66, + "learning_rate": 8.740200177722039e-07, + "loss": 0.6304, + "step": 64845 + }, + { + "epoch": 1.66, + "learning_rate": 8.739925678230288e-07, + "loss": 0.5542, + "step": 64846 + }, + { + "epoch": 1.66, + "learning_rate": 8.739651179703318e-07, + "loss": 0.5459, + "step": 64847 + }, + { + "epoch": 1.66, + "learning_rate": 8.739376682141339e-07, + "loss": 0.5928, + "step": 64848 + }, + { + "epoch": 1.66, + "learning_rate": 8.73910218554456e-07, + "loss": 0.5957, + "step": 64849 + }, + { + "epoch": 1.66, + "learning_rate": 8.738827689913198e-07, + "loss": 0.6357, + "step": 64850 + }, + { + "epoch": 1.66, + "learning_rate": 8.738553195247453e-07, + "loss": 0.7656, + "step": 64851 + }, + { + "epoch": 1.66, + "learning_rate": 8.738278701547539e-07, + "loss": 0.6094, + "step": 64852 + }, + { + "epoch": 1.66, + "learning_rate": 8.738004208813669e-07, + "loss": 0.6196, + "step": 64853 + }, + { + "epoch": 1.66, + "learning_rate": 8.73772971704605e-07, + "loss": 0.6528, + "step": 64854 + }, + { + "epoch": 1.66, + "learning_rate": 8.737455226244894e-07, + "loss": 0.6128, + "step": 64855 + }, + { + "epoch": 1.66, + "learning_rate": 8.737180736410411e-07, + "loss": 0.6211, + "step": 64856 + }, + { + "epoch": 1.66, + "learning_rate": 8.736906247542808e-07, + "loss": 0.5396, + "step": 64857 + }, + { + "epoch": 1.66, + "learning_rate": 8.736631759642302e-07, + "loss": 0.5283, + "step": 64858 + }, + { + "epoch": 1.66, + "learning_rate": 8.736357272709094e-07, + "loss": 0.6238, + "step": 64859 + }, + { + "epoch": 1.66, + "learning_rate": 8.736082786743405e-07, + "loss": 0.5254, + "step": 64860 + }, + { + "epoch": 1.66, + "learning_rate": 8.735808301745436e-07, + "loss": 0.5708, + "step": 64861 + }, + { + "epoch": 1.66, + "learning_rate": 8.735533817715399e-07, + "loss": 0.7793, + "step": 64862 + }, + { + "epoch": 1.66, + "learning_rate": 8.735259334653508e-07, + "loss": 0.7021, + "step": 64863 + }, + { + "epoch": 1.66, + "learning_rate": 8.734984852559969e-07, + "loss": 0.6036, + "step": 64864 + }, + { + "epoch": 1.66, + "learning_rate": 8.734710371434996e-07, + "loss": 0.6382, + "step": 64865 + }, + { + "epoch": 1.66, + "learning_rate": 8.734435891278794e-07, + "loss": 0.4995, + "step": 64866 + }, + { + "epoch": 1.66, + "learning_rate": 8.734161412091578e-07, + "loss": 0.54, + "step": 64867 + }, + { + "epoch": 1.66, + "learning_rate": 8.733886933873556e-07, + "loss": 0.4243, + "step": 64868 + }, + { + "epoch": 1.66, + "learning_rate": 8.73361245662494e-07, + "loss": 0.6582, + "step": 64869 + }, + { + "epoch": 1.66, + "learning_rate": 8.733337980345941e-07, + "loss": 0.7686, + "step": 64870 + }, + { + "epoch": 1.66, + "learning_rate": 8.733063505036762e-07, + "loss": 0.4672, + "step": 64871 + }, + { + "epoch": 1.66, + "learning_rate": 8.73278903069762e-07, + "loss": 0.7109, + "step": 64872 + }, + { + "epoch": 1.66, + "learning_rate": 8.732514557328725e-07, + "loss": 0.5977, + "step": 64873 + }, + { + "epoch": 1.66, + "learning_rate": 8.732240084930281e-07, + "loss": 0.5366, + "step": 64874 + }, + { + "epoch": 1.66, + "learning_rate": 8.731965613502505e-07, + "loss": 0.5513, + "step": 64875 + }, + { + "epoch": 1.66, + "learning_rate": 8.731691143045603e-07, + "loss": 0.4143, + "step": 64876 + }, + { + "epoch": 1.66, + "learning_rate": 8.731416673559789e-07, + "loss": 0.5508, + "step": 64877 + }, + { + "epoch": 1.66, + "learning_rate": 8.731142205045269e-07, + "loss": 0.603, + "step": 64878 + }, + { + "epoch": 1.66, + "learning_rate": 8.730867737502257e-07, + "loss": 0.5713, + "step": 64879 + }, + { + "epoch": 1.66, + "learning_rate": 8.730593270930963e-07, + "loss": 0.6333, + "step": 64880 + }, + { + "epoch": 1.66, + "learning_rate": 8.730318805331591e-07, + "loss": 0.7119, + "step": 64881 + }, + { + "epoch": 1.66, + "learning_rate": 8.730044340704359e-07, + "loss": 0.666, + "step": 64882 + }, + { + "epoch": 1.66, + "learning_rate": 8.72976987704947e-07, + "loss": 0.6436, + "step": 64883 + }, + { + "epoch": 1.66, + "learning_rate": 8.729495414367141e-07, + "loss": 0.7324, + "step": 64884 + }, + { + "epoch": 1.66, + "learning_rate": 8.729220952657576e-07, + "loss": 0.8232, + "step": 64885 + }, + { + "epoch": 1.66, + "learning_rate": 8.72894649192099e-07, + "loss": 0.6504, + "step": 64886 + }, + { + "epoch": 1.66, + "learning_rate": 8.72867203215759e-07, + "loss": 0.5979, + "step": 64887 + }, + { + "epoch": 1.66, + "learning_rate": 8.728397573367589e-07, + "loss": 0.6152, + "step": 64888 + }, + { + "epoch": 1.66, + "learning_rate": 8.728123115551193e-07, + "loss": 0.5151, + "step": 64889 + }, + { + "epoch": 1.66, + "learning_rate": 8.727848658708621e-07, + "loss": 0.6826, + "step": 64890 + }, + { + "epoch": 1.66, + "learning_rate": 8.727574202840071e-07, + "loss": 0.5446, + "step": 64891 + }, + { + "epoch": 1.66, + "learning_rate": 8.727299747945761e-07, + "loss": 0.603, + "step": 64892 + }, + { + "epoch": 1.66, + "learning_rate": 8.727025294025896e-07, + "loss": 0.6221, + "step": 64893 + }, + { + "epoch": 1.66, + "learning_rate": 8.726750841080692e-07, + "loss": 0.5811, + "step": 64894 + }, + { + "epoch": 1.66, + "learning_rate": 8.726476389110355e-07, + "loss": 0.5493, + "step": 64895 + }, + { + "epoch": 1.66, + "learning_rate": 8.726201938115098e-07, + "loss": 0.603, + "step": 64896 + }, + { + "epoch": 1.66, + "learning_rate": 8.725927488095127e-07, + "loss": 0.6357, + "step": 64897 + }, + { + "epoch": 1.66, + "learning_rate": 8.725653039050658e-07, + "loss": 0.5764, + "step": 64898 + }, + { + "epoch": 1.66, + "learning_rate": 8.725378590981895e-07, + "loss": 0.6079, + "step": 64899 + }, + { + "epoch": 1.66, + "learning_rate": 8.725104143889055e-07, + "loss": 0.6934, + "step": 64900 + }, + { + "epoch": 1.66, + "learning_rate": 8.724829697772342e-07, + "loss": 0.6001, + "step": 64901 + }, + { + "epoch": 1.66, + "learning_rate": 8.724555252631967e-07, + "loss": 0.6665, + "step": 64902 + }, + { + "epoch": 1.66, + "learning_rate": 8.724280808468143e-07, + "loss": 0.4741, + "step": 64903 + }, + { + "epoch": 1.66, + "learning_rate": 8.724006365281076e-07, + "loss": 0.7178, + "step": 64904 + }, + { + "epoch": 1.66, + "learning_rate": 8.72373192307098e-07, + "loss": 0.6738, + "step": 64905 + }, + { + "epoch": 1.66, + "learning_rate": 8.723457481838064e-07, + "loss": 0.5212, + "step": 64906 + }, + { + "epoch": 1.66, + "learning_rate": 8.723183041582538e-07, + "loss": 0.7393, + "step": 64907 + }, + { + "epoch": 1.66, + "learning_rate": 8.72290860230461e-07, + "loss": 0.5016, + "step": 64908 + }, + { + "epoch": 1.66, + "learning_rate": 8.722634164004496e-07, + "loss": 0.5996, + "step": 64909 + }, + { + "epoch": 1.66, + "learning_rate": 8.722359726682403e-07, + "loss": 0.4175, + "step": 64910 + }, + { + "epoch": 1.66, + "learning_rate": 8.722085290338539e-07, + "loss": 0.5913, + "step": 64911 + }, + { + "epoch": 1.66, + "learning_rate": 8.721810854973112e-07, + "loss": 0.6748, + "step": 64912 + }, + { + "epoch": 1.66, + "learning_rate": 8.72153642058634e-07, + "loss": 0.647, + "step": 64913 + }, + { + "epoch": 1.66, + "learning_rate": 8.721261987178426e-07, + "loss": 0.6211, + "step": 64914 + }, + { + "epoch": 1.66, + "learning_rate": 8.720987554749585e-07, + "loss": 0.6201, + "step": 64915 + }, + { + "epoch": 1.66, + "learning_rate": 8.720713123300022e-07, + "loss": 0.3367, + "step": 64916 + }, + { + "epoch": 1.66, + "learning_rate": 8.720438692829953e-07, + "loss": 0.6606, + "step": 64917 + }, + { + "epoch": 1.66, + "learning_rate": 8.720164263339583e-07, + "loss": 0.708, + "step": 64918 + }, + { + "epoch": 1.66, + "learning_rate": 8.719889834829126e-07, + "loss": 0.3324, + "step": 64919 + }, + { + "epoch": 1.66, + "learning_rate": 8.719615407298793e-07, + "loss": 0.5801, + "step": 64920 + }, + { + "epoch": 1.66, + "learning_rate": 8.719340980748788e-07, + "loss": 0.8564, + "step": 64921 + }, + { + "epoch": 1.66, + "learning_rate": 8.719066555179326e-07, + "loss": 0.604, + "step": 64922 + }, + { + "epoch": 1.66, + "learning_rate": 8.718792130590613e-07, + "loss": 0.7402, + "step": 64923 + }, + { + "epoch": 1.66, + "learning_rate": 8.718517706982865e-07, + "loss": 0.5396, + "step": 64924 + }, + { + "epoch": 1.66, + "learning_rate": 8.718243284356287e-07, + "loss": 0.6582, + "step": 64925 + }, + { + "epoch": 1.66, + "learning_rate": 8.717968862711094e-07, + "loss": 0.6216, + "step": 64926 + }, + { + "epoch": 1.66, + "learning_rate": 8.71769444204749e-07, + "loss": 0.6904, + "step": 64927 + }, + { + "epoch": 1.66, + "learning_rate": 8.717420022365692e-07, + "loss": 0.5234, + "step": 64928 + }, + { + "epoch": 1.66, + "learning_rate": 8.717145603665904e-07, + "loss": 0.5747, + "step": 64929 + }, + { + "epoch": 1.66, + "learning_rate": 8.716871185948342e-07, + "loss": 0.6279, + "step": 64930 + }, + { + "epoch": 1.66, + "learning_rate": 8.716596769213209e-07, + "loss": 0.6641, + "step": 64931 + }, + { + "epoch": 1.66, + "learning_rate": 8.716322353460721e-07, + "loss": 0.6982, + "step": 64932 + }, + { + "epoch": 1.66, + "learning_rate": 8.716047938691084e-07, + "loss": 0.6792, + "step": 64933 + }, + { + "epoch": 1.66, + "learning_rate": 8.715773524904511e-07, + "loss": 0.667, + "step": 64934 + }, + { + "epoch": 1.66, + "learning_rate": 8.71549911210121e-07, + "loss": 0.6504, + "step": 64935 + }, + { + "epoch": 1.66, + "learning_rate": 8.715224700281394e-07, + "loss": 0.5967, + "step": 64936 + }, + { + "epoch": 1.66, + "learning_rate": 8.714950289445269e-07, + "loss": 0.4773, + "step": 64937 + }, + { + "epoch": 1.66, + "learning_rate": 8.714675879593049e-07, + "loss": 0.7803, + "step": 64938 + }, + { + "epoch": 1.66, + "learning_rate": 8.714401470724942e-07, + "loss": 0.5513, + "step": 64939 + }, + { + "epoch": 1.66, + "learning_rate": 8.714127062841162e-07, + "loss": 0.6121, + "step": 64940 + }, + { + "epoch": 1.66, + "learning_rate": 8.713852655941914e-07, + "loss": 0.4902, + "step": 64941 + }, + { + "epoch": 1.66, + "learning_rate": 8.713578250027408e-07, + "loss": 0.6885, + "step": 64942 + }, + { + "epoch": 1.66, + "learning_rate": 8.713303845097859e-07, + "loss": 0.6748, + "step": 64943 + }, + { + "epoch": 1.66, + "learning_rate": 8.71302944115347e-07, + "loss": 0.4602, + "step": 64944 + }, + { + "epoch": 1.66, + "learning_rate": 8.712755038194458e-07, + "loss": 0.3499, + "step": 64945 + }, + { + "epoch": 1.66, + "learning_rate": 8.71248063622103e-07, + "loss": 0.75, + "step": 64946 + }, + { + "epoch": 1.66, + "learning_rate": 8.712206235233395e-07, + "loss": 0.5879, + "step": 64947 + }, + { + "epoch": 1.66, + "learning_rate": 8.711931835231766e-07, + "loss": 0.4783, + "step": 64948 + }, + { + "epoch": 1.66, + "learning_rate": 8.71165743621635e-07, + "loss": 0.6665, + "step": 64949 + }, + { + "epoch": 1.66, + "learning_rate": 8.711383038187362e-07, + "loss": 0.6826, + "step": 64950 + }, + { + "epoch": 1.66, + "learning_rate": 8.711108641145008e-07, + "loss": 0.8467, + "step": 64951 + }, + { + "epoch": 1.66, + "learning_rate": 8.710834245089495e-07, + "loss": 0.8262, + "step": 64952 + }, + { + "epoch": 1.66, + "learning_rate": 8.71055985002104e-07, + "loss": 0.5732, + "step": 64953 + }, + { + "epoch": 1.66, + "learning_rate": 8.710285455939848e-07, + "loss": 0.605, + "step": 64954 + }, + { + "epoch": 1.66, + "learning_rate": 8.710011062846133e-07, + "loss": 0.6064, + "step": 64955 + }, + { + "epoch": 1.66, + "learning_rate": 8.709736670740102e-07, + "loss": 0.7109, + "step": 64956 + }, + { + "epoch": 1.66, + "learning_rate": 8.709462279621968e-07, + "loss": 0.5942, + "step": 64957 + }, + { + "epoch": 1.66, + "learning_rate": 8.709187889491936e-07, + "loss": 0.603, + "step": 64958 + }, + { + "epoch": 1.66, + "learning_rate": 8.708913500350223e-07, + "loss": 0.6611, + "step": 64959 + }, + { + "epoch": 1.66, + "learning_rate": 8.708639112197037e-07, + "loss": 0.7061, + "step": 64960 + }, + { + "epoch": 1.66, + "learning_rate": 8.708364725032583e-07, + "loss": 0.6426, + "step": 64961 + }, + { + "epoch": 1.67, + "learning_rate": 8.708090338857076e-07, + "loss": 0.5288, + "step": 64962 + }, + { + "epoch": 1.67, + "learning_rate": 8.707815953670726e-07, + "loss": 0.5923, + "step": 64963 + }, + { + "epoch": 1.67, + "learning_rate": 8.707541569473739e-07, + "loss": 0.6875, + "step": 64964 + }, + { + "epoch": 1.67, + "learning_rate": 8.70726718626633e-07, + "loss": 0.2667, + "step": 64965 + }, + { + "epoch": 1.67, + "learning_rate": 8.706992804048705e-07, + "loss": 0.6123, + "step": 64966 + }, + { + "epoch": 1.67, + "learning_rate": 8.706718422821079e-07, + "loss": 0.7188, + "step": 64967 + }, + { + "epoch": 1.67, + "learning_rate": 8.706444042583656e-07, + "loss": 0.5947, + "step": 64968 + }, + { + "epoch": 1.67, + "learning_rate": 8.706169663336652e-07, + "loss": 0.6455, + "step": 64969 + }, + { + "epoch": 1.67, + "learning_rate": 8.705895285080277e-07, + "loss": 0.6711, + "step": 64970 + }, + { + "epoch": 1.67, + "learning_rate": 8.705620907814733e-07, + "loss": 0.626, + "step": 64971 + }, + { + "epoch": 1.67, + "learning_rate": 8.705346531540238e-07, + "loss": 0.7764, + "step": 64972 + }, + { + "epoch": 1.67, + "learning_rate": 8.705072156256998e-07, + "loss": 0.6333, + "step": 64973 + }, + { + "epoch": 1.67, + "learning_rate": 8.704797781965227e-07, + "loss": 0.4651, + "step": 64974 + }, + { + "epoch": 1.67, + "learning_rate": 8.704523408665131e-07, + "loss": 0.7539, + "step": 64975 + }, + { + "epoch": 1.67, + "learning_rate": 8.704249036356923e-07, + "loss": 0.5554, + "step": 64976 + }, + { + "epoch": 1.67, + "learning_rate": 8.70397466504081e-07, + "loss": 0.7031, + "step": 64977 + }, + { + "epoch": 1.67, + "learning_rate": 8.703700294717007e-07, + "loss": 0.6997, + "step": 64978 + }, + { + "epoch": 1.67, + "learning_rate": 8.703425925385718e-07, + "loss": 0.751, + "step": 64979 + }, + { + "epoch": 1.67, + "learning_rate": 8.703151557047164e-07, + "loss": 0.6592, + "step": 64980 + }, + { + "epoch": 1.67, + "learning_rate": 8.702877189701538e-07, + "loss": 0.7393, + "step": 64981 + }, + { + "epoch": 1.67, + "learning_rate": 8.702602823349063e-07, + "loss": 0.6362, + "step": 64982 + }, + { + "epoch": 1.67, + "learning_rate": 8.702328457989945e-07, + "loss": 0.52, + "step": 64983 + }, + { + "epoch": 1.67, + "learning_rate": 8.702054093624393e-07, + "loss": 0.6196, + "step": 64984 + }, + { + "epoch": 1.67, + "learning_rate": 8.701779730252619e-07, + "loss": 0.6123, + "step": 64985 + }, + { + "epoch": 1.67, + "learning_rate": 8.701505367874834e-07, + "loss": 0.4768, + "step": 64986 + }, + { + "epoch": 1.67, + "learning_rate": 8.701231006491245e-07, + "loss": 0.7158, + "step": 64987 + }, + { + "epoch": 1.67, + "learning_rate": 8.700956646102064e-07, + "loss": 0.7373, + "step": 64988 + }, + { + "epoch": 1.67, + "learning_rate": 8.700682286707501e-07, + "loss": 0.4431, + "step": 64989 + }, + { + "epoch": 1.67, + "learning_rate": 8.700407928307769e-07, + "loss": 0.6196, + "step": 64990 + }, + { + "epoch": 1.67, + "learning_rate": 8.700133570903073e-07, + "loss": 0.7451, + "step": 64991 + }, + { + "epoch": 1.67, + "learning_rate": 8.699859214493622e-07, + "loss": 0.7812, + "step": 64992 + }, + { + "epoch": 1.67, + "learning_rate": 8.699584859079632e-07, + "loss": 0.573, + "step": 64993 + }, + { + "epoch": 1.67, + "learning_rate": 8.699310504661308e-07, + "loss": 0.4912, + "step": 64994 + }, + { + "epoch": 1.67, + "learning_rate": 8.699036151238863e-07, + "loss": 0.6177, + "step": 64995 + }, + { + "epoch": 1.67, + "learning_rate": 8.698761798812507e-07, + "loss": 0.7803, + "step": 64996 + }, + { + "epoch": 1.67, + "learning_rate": 8.698487447382447e-07, + "loss": 0.6924, + "step": 64997 + }, + { + "epoch": 1.67, + "learning_rate": 8.698213096948897e-07, + "loss": 0.7012, + "step": 64998 + }, + { + "epoch": 1.67, + "learning_rate": 8.697938747512066e-07, + "loss": 0.7021, + "step": 64999 + }, + { + "epoch": 1.67, + "learning_rate": 8.697664399072166e-07, + "loss": 0.6416, + "step": 65000 + }, + { + "epoch": 1.67, + "learning_rate": 8.697390051629402e-07, + "loss": 0.647, + "step": 65001 + }, + { + "epoch": 1.67, + "learning_rate": 8.697115705183984e-07, + "loss": 0.5986, + "step": 65002 + }, + { + "epoch": 1.67, + "learning_rate": 8.696841359736127e-07, + "loss": 0.6035, + "step": 65003 + }, + { + "epoch": 1.67, + "learning_rate": 8.696567015286037e-07, + "loss": 0.6846, + "step": 65004 + }, + { + "epoch": 1.67, + "learning_rate": 8.696292671833927e-07, + "loss": 0.5737, + "step": 65005 + }, + { + "epoch": 1.67, + "learning_rate": 8.696018329380003e-07, + "loss": 0.6299, + "step": 65006 + }, + { + "epoch": 1.67, + "learning_rate": 8.695743987924482e-07, + "loss": 0.6592, + "step": 65007 + }, + { + "epoch": 1.67, + "learning_rate": 8.695469647467567e-07, + "loss": 0.6426, + "step": 65008 + }, + { + "epoch": 1.67, + "learning_rate": 8.695195308009473e-07, + "loss": 0.6465, + "step": 65009 + }, + { + "epoch": 1.67, + "learning_rate": 8.69492096955041e-07, + "loss": 0.6621, + "step": 65010 + }, + { + "epoch": 1.67, + "learning_rate": 8.694646632090582e-07, + "loss": 0.6924, + "step": 65011 + }, + { + "epoch": 1.67, + "learning_rate": 8.694372295630204e-07, + "loss": 0.7881, + "step": 65012 + }, + { + "epoch": 1.67, + "learning_rate": 8.694097960169484e-07, + "loss": 0.7549, + "step": 65013 + }, + { + "epoch": 1.67, + "learning_rate": 8.693823625708636e-07, + "loss": 0.5713, + "step": 65014 + }, + { + "epoch": 1.67, + "learning_rate": 8.693549292247864e-07, + "loss": 0.6377, + "step": 65015 + }, + { + "epoch": 1.67, + "learning_rate": 8.693274959787383e-07, + "loss": 0.6455, + "step": 65016 + }, + { + "epoch": 1.67, + "learning_rate": 8.6930006283274e-07, + "loss": 0.6494, + "step": 65017 + }, + { + "epoch": 1.67, + "learning_rate": 8.692726297868128e-07, + "loss": 0.5, + "step": 65018 + }, + { + "epoch": 1.67, + "learning_rate": 8.692451968409777e-07, + "loss": 0.7271, + "step": 65019 + }, + { + "epoch": 1.67, + "learning_rate": 8.692177639952555e-07, + "loss": 0.6025, + "step": 65020 + }, + { + "epoch": 1.67, + "learning_rate": 8.691903312496669e-07, + "loss": 0.519, + "step": 65021 + }, + { + "epoch": 1.67, + "learning_rate": 8.691628986042335e-07, + "loss": 0.7061, + "step": 65022 + }, + { + "epoch": 1.67, + "learning_rate": 8.691354660589758e-07, + "loss": 0.5186, + "step": 65023 + }, + { + "epoch": 1.67, + "learning_rate": 8.691080336139153e-07, + "loss": 0.6206, + "step": 65024 + }, + { + "epoch": 1.67, + "learning_rate": 8.690806012690725e-07, + "loss": 0.7734, + "step": 65025 + }, + { + "epoch": 1.67, + "learning_rate": 8.690531690244689e-07, + "loss": 0.4861, + "step": 65026 + }, + { + "epoch": 1.67, + "learning_rate": 8.690257368801251e-07, + "loss": 0.4944, + "step": 65027 + }, + { + "epoch": 1.67, + "learning_rate": 8.689983048360625e-07, + "loss": 0.7686, + "step": 65028 + }, + { + "epoch": 1.67, + "learning_rate": 8.68970872892302e-07, + "loss": 0.668, + "step": 65029 + }, + { + "epoch": 1.67, + "learning_rate": 8.68943441048864e-07, + "loss": 0.5969, + "step": 65030 + }, + { + "epoch": 1.67, + "learning_rate": 8.689160093057703e-07, + "loss": 0.751, + "step": 65031 + }, + { + "epoch": 1.67, + "learning_rate": 8.688885776630414e-07, + "loss": 0.5332, + "step": 65032 + }, + { + "epoch": 1.67, + "learning_rate": 8.688611461206987e-07, + "loss": 0.4998, + "step": 65033 + }, + { + "epoch": 1.67, + "learning_rate": 8.688337146787628e-07, + "loss": 0.7998, + "step": 65034 + }, + { + "epoch": 1.67, + "learning_rate": 8.688062833372549e-07, + "loss": 0.5742, + "step": 65035 + }, + { + "epoch": 1.67, + "learning_rate": 8.687788520961961e-07, + "loss": 0.5532, + "step": 65036 + }, + { + "epoch": 1.67, + "learning_rate": 8.687514209556072e-07, + "loss": 0.4434, + "step": 65037 + }, + { + "epoch": 1.67, + "learning_rate": 8.687239899155095e-07, + "loss": 0.6855, + "step": 65038 + }, + { + "epoch": 1.67, + "learning_rate": 8.68696558975924e-07, + "loss": 0.5771, + "step": 65039 + }, + { + "epoch": 1.67, + "learning_rate": 8.68669128136871e-07, + "loss": 0.71, + "step": 65040 + }, + { + "epoch": 1.67, + "learning_rate": 8.686416973983722e-07, + "loss": 0.6445, + "step": 65041 + }, + { + "epoch": 1.67, + "learning_rate": 8.686142667604484e-07, + "loss": 0.6973, + "step": 65042 + }, + { + "epoch": 1.67, + "learning_rate": 8.685868362231206e-07, + "loss": 0.5564, + "step": 65043 + }, + { + "epoch": 1.67, + "learning_rate": 8.685594057864096e-07, + "loss": 0.6377, + "step": 65044 + }, + { + "epoch": 1.67, + "learning_rate": 8.68531975450337e-07, + "loss": 0.7119, + "step": 65045 + }, + { + "epoch": 1.67, + "learning_rate": 8.685045452149231e-07, + "loss": 0.5596, + "step": 65046 + }, + { + "epoch": 1.67, + "learning_rate": 8.684771150801895e-07, + "loss": 0.54, + "step": 65047 + }, + { + "epoch": 1.67, + "learning_rate": 8.684496850461567e-07, + "loss": 0.8135, + "step": 65048 + }, + { + "epoch": 1.67, + "learning_rate": 8.684222551128464e-07, + "loss": 0.707, + "step": 65049 + }, + { + "epoch": 1.67, + "learning_rate": 8.683948252802787e-07, + "loss": 0.6523, + "step": 65050 + }, + { + "epoch": 1.67, + "learning_rate": 8.68367395548475e-07, + "loss": 0.6992, + "step": 65051 + }, + { + "epoch": 1.67, + "learning_rate": 8.683399659174566e-07, + "loss": 0.604, + "step": 65052 + }, + { + "epoch": 1.67, + "learning_rate": 8.683125363872442e-07, + "loss": 0.7021, + "step": 65053 + }, + { + "epoch": 1.67, + "learning_rate": 8.682851069578585e-07, + "loss": 0.6807, + "step": 65054 + }, + { + "epoch": 1.67, + "learning_rate": 8.682576776293211e-07, + "loss": 0.6987, + "step": 65055 + }, + { + "epoch": 1.67, + "learning_rate": 8.682302484016526e-07, + "loss": 0.8018, + "step": 65056 + }, + { + "epoch": 1.67, + "learning_rate": 8.682028192748742e-07, + "loss": 0.5146, + "step": 65057 + }, + { + "epoch": 1.67, + "learning_rate": 8.681753902490068e-07, + "loss": 0.625, + "step": 65058 + }, + { + "epoch": 1.67, + "learning_rate": 8.681479613240718e-07, + "loss": 0.6196, + "step": 65059 + }, + { + "epoch": 1.67, + "learning_rate": 8.681205325000896e-07, + "loss": 0.6797, + "step": 65060 + }, + { + "epoch": 1.67, + "learning_rate": 8.680931037770812e-07, + "loss": 0.5229, + "step": 65061 + }, + { + "epoch": 1.67, + "learning_rate": 8.680656751550681e-07, + "loss": 0.6504, + "step": 65062 + }, + { + "epoch": 1.67, + "learning_rate": 8.68038246634071e-07, + "loss": 0.6572, + "step": 65063 + }, + { + "epoch": 1.67, + "learning_rate": 8.680108182141109e-07, + "loss": 0.7393, + "step": 65064 + }, + { + "epoch": 1.67, + "learning_rate": 8.679833898952088e-07, + "loss": 0.4739, + "step": 65065 + }, + { + "epoch": 1.67, + "learning_rate": 8.679559616773859e-07, + "loss": 0.6016, + "step": 65066 + }, + { + "epoch": 1.67, + "learning_rate": 8.679285335606628e-07, + "loss": 0.7754, + "step": 65067 + }, + { + "epoch": 1.67, + "learning_rate": 8.67901105545061e-07, + "loss": 0.6621, + "step": 65068 + }, + { + "epoch": 1.67, + "learning_rate": 8.678736776306015e-07, + "loss": 0.7822, + "step": 65069 + }, + { + "epoch": 1.67, + "learning_rate": 8.678462498173048e-07, + "loss": 0.7734, + "step": 65070 + }, + { + "epoch": 1.67, + "learning_rate": 8.678188221051919e-07, + "loss": 0.6855, + "step": 65071 + }, + { + "epoch": 1.67, + "learning_rate": 8.677913944942843e-07, + "loss": 0.5786, + "step": 65072 + }, + { + "epoch": 1.67, + "learning_rate": 8.677639669846027e-07, + "loss": 0.7646, + "step": 65073 + }, + { + "epoch": 1.67, + "learning_rate": 8.677365395761681e-07, + "loss": 0.7256, + "step": 65074 + }, + { + "epoch": 1.67, + "learning_rate": 8.677091122690015e-07, + "loss": 0.7383, + "step": 65075 + }, + { + "epoch": 1.67, + "learning_rate": 8.67681685063124e-07, + "loss": 0.5359, + "step": 65076 + }, + { + "epoch": 1.67, + "learning_rate": 8.676542579585564e-07, + "loss": 0.626, + "step": 65077 + }, + { + "epoch": 1.67, + "learning_rate": 8.676268309553202e-07, + "loss": 0.7495, + "step": 65078 + }, + { + "epoch": 1.67, + "learning_rate": 8.675994040534362e-07, + "loss": 0.6885, + "step": 65079 + }, + { + "epoch": 1.67, + "learning_rate": 8.675719772529247e-07, + "loss": 0.752, + "step": 65080 + }, + { + "epoch": 1.67, + "learning_rate": 8.675445505538076e-07, + "loss": 0.627, + "step": 65081 + }, + { + "epoch": 1.67, + "learning_rate": 8.675171239561052e-07, + "loss": 0.6758, + "step": 65082 + }, + { + "epoch": 1.67, + "learning_rate": 8.674896974598391e-07, + "loss": 0.4558, + "step": 65083 + }, + { + "epoch": 1.67, + "learning_rate": 8.674622710650299e-07, + "loss": 0.793, + "step": 65084 + }, + { + "epoch": 1.67, + "learning_rate": 8.67434844771699e-07, + "loss": 0.6367, + "step": 65085 + }, + { + "epoch": 1.67, + "learning_rate": 8.674074185798668e-07, + "loss": 0.5898, + "step": 65086 + }, + { + "epoch": 1.67, + "learning_rate": 8.67379992489555e-07, + "loss": 0.6394, + "step": 65087 + }, + { + "epoch": 1.67, + "learning_rate": 8.673525665007839e-07, + "loss": 0.7124, + "step": 65088 + }, + { + "epoch": 1.67, + "learning_rate": 8.673251406135755e-07, + "loss": 0.6362, + "step": 65089 + }, + { + "epoch": 1.67, + "learning_rate": 8.672977148279495e-07, + "loss": 0.6646, + "step": 65090 + }, + { + "epoch": 1.67, + "learning_rate": 8.672702891439279e-07, + "loss": 0.5166, + "step": 65091 + }, + { + "epoch": 1.67, + "learning_rate": 8.67242863561531e-07, + "loss": 0.502, + "step": 65092 + }, + { + "epoch": 1.67, + "learning_rate": 8.672154380807804e-07, + "loss": 0.7412, + "step": 65093 + }, + { + "epoch": 1.67, + "learning_rate": 8.671880127016963e-07, + "loss": 0.8213, + "step": 65094 + }, + { + "epoch": 1.67, + "learning_rate": 8.671605874243008e-07, + "loss": 0.5532, + "step": 65095 + }, + { + "epoch": 1.67, + "learning_rate": 8.671331622486141e-07, + "loss": 0.8242, + "step": 65096 + }, + { + "epoch": 1.67, + "learning_rate": 8.671057371746575e-07, + "loss": 0.6904, + "step": 65097 + }, + { + "epoch": 1.67, + "learning_rate": 8.670783122024519e-07, + "loss": 0.6758, + "step": 65098 + }, + { + "epoch": 1.67, + "learning_rate": 8.670508873320186e-07, + "loss": 0.7324, + "step": 65099 + }, + { + "epoch": 1.67, + "learning_rate": 8.670234625633781e-07, + "loss": 0.7812, + "step": 65100 + }, + { + "epoch": 1.67, + "learning_rate": 8.669960378965515e-07, + "loss": 0.6357, + "step": 65101 + }, + { + "epoch": 1.67, + "learning_rate": 8.669686133315601e-07, + "loss": 0.7598, + "step": 65102 + }, + { + "epoch": 1.67, + "learning_rate": 8.669411888684244e-07, + "loss": 0.5481, + "step": 65103 + }, + { + "epoch": 1.67, + "learning_rate": 8.66913764507166e-07, + "loss": 0.5483, + "step": 65104 + }, + { + "epoch": 1.67, + "learning_rate": 8.668863402478055e-07, + "loss": 0.5106, + "step": 65105 + }, + { + "epoch": 1.67, + "learning_rate": 8.668589160903641e-07, + "loss": 0.6562, + "step": 65106 + }, + { + "epoch": 1.67, + "learning_rate": 8.668314920348625e-07, + "loss": 0.6611, + "step": 65107 + }, + { + "epoch": 1.67, + "learning_rate": 8.668040680813222e-07, + "loss": 0.4812, + "step": 65108 + }, + { + "epoch": 1.67, + "learning_rate": 8.66776644229764e-07, + "loss": 0.6494, + "step": 65109 + }, + { + "epoch": 1.67, + "learning_rate": 8.667492204802087e-07, + "loss": 0.7021, + "step": 65110 + }, + { + "epoch": 1.67, + "learning_rate": 8.667217968326771e-07, + "loss": 0.4702, + "step": 65111 + }, + { + "epoch": 1.67, + "learning_rate": 8.666943732871908e-07, + "loss": 0.5146, + "step": 65112 + }, + { + "epoch": 1.67, + "learning_rate": 8.666669498437701e-07, + "loss": 0.6704, + "step": 65113 + }, + { + "epoch": 1.67, + "learning_rate": 8.666395265024367e-07, + "loss": 0.7109, + "step": 65114 + }, + { + "epoch": 1.67, + "learning_rate": 8.666121032632111e-07, + "loss": 0.708, + "step": 65115 + }, + { + "epoch": 1.67, + "learning_rate": 8.665846801261146e-07, + "loss": 0.5938, + "step": 65116 + }, + { + "epoch": 1.67, + "learning_rate": 8.66557257091168e-07, + "loss": 0.5854, + "step": 65117 + }, + { + "epoch": 1.67, + "learning_rate": 8.665298341583924e-07, + "loss": 0.7012, + "step": 65118 + }, + { + "epoch": 1.67, + "learning_rate": 8.665024113278092e-07, + "loss": 0.6592, + "step": 65119 + }, + { + "epoch": 1.67, + "learning_rate": 8.664749885994384e-07, + "loss": 0.6338, + "step": 65120 + }, + { + "epoch": 1.67, + "learning_rate": 8.664475659733018e-07, + "loss": 0.6338, + "step": 65121 + }, + { + "epoch": 1.67, + "learning_rate": 8.664201434494199e-07, + "loss": 0.6558, + "step": 65122 + }, + { + "epoch": 1.67, + "learning_rate": 8.663927210278144e-07, + "loss": 0.5688, + "step": 65123 + }, + { + "epoch": 1.67, + "learning_rate": 8.663652987085052e-07, + "loss": 0.4788, + "step": 65124 + }, + { + "epoch": 1.67, + "learning_rate": 8.663378764915146e-07, + "loss": 0.6821, + "step": 65125 + }, + { + "epoch": 1.67, + "learning_rate": 8.663104543768626e-07, + "loss": 0.613, + "step": 65126 + }, + { + "epoch": 1.67, + "learning_rate": 8.662830323645705e-07, + "loss": 0.5601, + "step": 65127 + }, + { + "epoch": 1.67, + "learning_rate": 8.662556104546596e-07, + "loss": 0.6318, + "step": 65128 + }, + { + "epoch": 1.67, + "learning_rate": 8.662281886471508e-07, + "loss": 0.6504, + "step": 65129 + }, + { + "epoch": 1.67, + "learning_rate": 8.662007669420644e-07, + "loss": 0.6865, + "step": 65130 + }, + { + "epoch": 1.67, + "learning_rate": 8.661733453394222e-07, + "loss": 0.5979, + "step": 65131 + }, + { + "epoch": 1.67, + "learning_rate": 8.661459238392448e-07, + "loss": 0.4546, + "step": 65132 + }, + { + "epoch": 1.67, + "learning_rate": 8.661185024415533e-07, + "loss": 0.5518, + "step": 65133 + }, + { + "epoch": 1.67, + "learning_rate": 8.660910811463688e-07, + "loss": 0.6738, + "step": 65134 + }, + { + "epoch": 1.67, + "learning_rate": 8.660636599537121e-07, + "loss": 0.5977, + "step": 65135 + }, + { + "epoch": 1.67, + "learning_rate": 8.660362388636042e-07, + "loss": 0.749, + "step": 65136 + }, + { + "epoch": 1.67, + "learning_rate": 8.660088178760665e-07, + "loss": 0.6206, + "step": 65137 + }, + { + "epoch": 1.67, + "learning_rate": 8.659813969911194e-07, + "loss": 0.5498, + "step": 65138 + }, + { + "epoch": 1.67, + "learning_rate": 8.659539762087846e-07, + "loss": 0.6797, + "step": 65139 + }, + { + "epoch": 1.67, + "learning_rate": 8.659265555290824e-07, + "loss": 0.584, + "step": 65140 + }, + { + "epoch": 1.67, + "learning_rate": 8.658991349520341e-07, + "loss": 0.5933, + "step": 65141 + }, + { + "epoch": 1.67, + "learning_rate": 8.658717144776607e-07, + "loss": 0.7451, + "step": 65142 + }, + { + "epoch": 1.67, + "learning_rate": 8.658442941059832e-07, + "loss": 0.7539, + "step": 65143 + }, + { + "epoch": 1.67, + "learning_rate": 8.658168738370222e-07, + "loss": 0.5215, + "step": 65144 + }, + { + "epoch": 1.67, + "learning_rate": 8.657894536707995e-07, + "loss": 0.6162, + "step": 65145 + }, + { + "epoch": 1.67, + "learning_rate": 8.657620336073353e-07, + "loss": 0.6748, + "step": 65146 + }, + { + "epoch": 1.67, + "learning_rate": 8.65734613646651e-07, + "loss": 0.5461, + "step": 65147 + }, + { + "epoch": 1.67, + "learning_rate": 8.657071937887675e-07, + "loss": 0.6191, + "step": 65148 + }, + { + "epoch": 1.67, + "learning_rate": 8.656797740337063e-07, + "loss": 0.5245, + "step": 65149 + }, + { + "epoch": 1.67, + "learning_rate": 8.656523543814876e-07, + "loss": 0.5347, + "step": 65150 + }, + { + "epoch": 1.67, + "learning_rate": 8.656249348321325e-07, + "loss": 0.7627, + "step": 65151 + }, + { + "epoch": 1.67, + "learning_rate": 8.655975153856625e-07, + "loss": 0.5513, + "step": 65152 + }, + { + "epoch": 1.67, + "learning_rate": 8.65570096042098e-07, + "loss": 0.6758, + "step": 65153 + }, + { + "epoch": 1.67, + "learning_rate": 8.655426768014607e-07, + "loss": 0.7998, + "step": 65154 + }, + { + "epoch": 1.67, + "learning_rate": 8.655152576637708e-07, + "loss": 0.6963, + "step": 65155 + }, + { + "epoch": 1.67, + "learning_rate": 8.654878386290499e-07, + "loss": 0.4182, + "step": 65156 + }, + { + "epoch": 1.67, + "learning_rate": 8.654604196973186e-07, + "loss": 0.5981, + "step": 65157 + }, + { + "epoch": 1.67, + "learning_rate": 8.654330008685983e-07, + "loss": 0.667, + "step": 65158 + }, + { + "epoch": 1.67, + "learning_rate": 8.654055821429101e-07, + "loss": 0.792, + "step": 65159 + }, + { + "epoch": 1.67, + "learning_rate": 8.653781635202742e-07, + "loss": 0.6313, + "step": 65160 + }, + { + "epoch": 1.67, + "learning_rate": 8.653507450007119e-07, + "loss": 0.6348, + "step": 65161 + }, + { + "epoch": 1.67, + "learning_rate": 8.653233265842446e-07, + "loss": 0.7285, + "step": 65162 + }, + { + "epoch": 1.67, + "learning_rate": 8.652959082708929e-07, + "loss": 0.6797, + "step": 65163 + }, + { + "epoch": 1.67, + "learning_rate": 8.652684900606779e-07, + "loss": 0.5225, + "step": 65164 + }, + { + "epoch": 1.67, + "learning_rate": 8.652410719536207e-07, + "loss": 0.5396, + "step": 65165 + }, + { + "epoch": 1.67, + "learning_rate": 8.652136539497423e-07, + "loss": 0.7949, + "step": 65166 + }, + { + "epoch": 1.67, + "learning_rate": 8.651862360490634e-07, + "loss": 0.6836, + "step": 65167 + }, + { + "epoch": 1.67, + "learning_rate": 8.651588182516054e-07, + "loss": 0.7949, + "step": 65168 + }, + { + "epoch": 1.67, + "learning_rate": 8.651314005573894e-07, + "loss": 0.5884, + "step": 65169 + }, + { + "epoch": 1.67, + "learning_rate": 8.651039829664355e-07, + "loss": 0.6816, + "step": 65170 + }, + { + "epoch": 1.67, + "learning_rate": 8.650765654787655e-07, + "loss": 0.6299, + "step": 65171 + }, + { + "epoch": 1.67, + "learning_rate": 8.650491480944e-07, + "loss": 0.5454, + "step": 65172 + }, + { + "epoch": 1.67, + "learning_rate": 8.650217308133603e-07, + "loss": 0.6494, + "step": 65173 + }, + { + "epoch": 1.67, + "learning_rate": 8.649943136356672e-07, + "loss": 0.6953, + "step": 65174 + }, + { + "epoch": 1.67, + "learning_rate": 8.649668965613419e-07, + "loss": 0.6172, + "step": 65175 + }, + { + "epoch": 1.67, + "learning_rate": 8.649394795904051e-07, + "loss": 0.6685, + "step": 65176 + }, + { + "epoch": 1.67, + "learning_rate": 8.649120627228781e-07, + "loss": 0.6006, + "step": 65177 + }, + { + "epoch": 1.67, + "learning_rate": 8.648846459587814e-07, + "loss": 0.6562, + "step": 65178 + }, + { + "epoch": 1.67, + "learning_rate": 8.648572292981371e-07, + "loss": 0.6436, + "step": 65179 + }, + { + "epoch": 1.67, + "learning_rate": 8.648298127409646e-07, + "loss": 0.5664, + "step": 65180 + }, + { + "epoch": 1.67, + "learning_rate": 8.64802396287286e-07, + "loss": 0.6416, + "step": 65181 + }, + { + "epoch": 1.67, + "learning_rate": 8.647749799371218e-07, + "loss": 0.7295, + "step": 65182 + }, + { + "epoch": 1.67, + "learning_rate": 8.647475636904934e-07, + "loss": 0.7363, + "step": 65183 + }, + { + "epoch": 1.67, + "learning_rate": 8.647201475474213e-07, + "loss": 0.6265, + "step": 65184 + }, + { + "epoch": 1.67, + "learning_rate": 8.64692731507927e-07, + "loss": 0.7588, + "step": 65185 + }, + { + "epoch": 1.67, + "learning_rate": 8.64665315572031e-07, + "loss": 0.6455, + "step": 65186 + }, + { + "epoch": 1.67, + "learning_rate": 8.646378997397548e-07, + "loss": 0.7744, + "step": 65187 + }, + { + "epoch": 1.67, + "learning_rate": 8.646104840111191e-07, + "loss": 0.5938, + "step": 65188 + }, + { + "epoch": 1.67, + "learning_rate": 8.64583068386145e-07, + "loss": 0.6831, + "step": 65189 + }, + { + "epoch": 1.67, + "learning_rate": 8.645556528648535e-07, + "loss": 0.5388, + "step": 65190 + }, + { + "epoch": 1.67, + "learning_rate": 8.645282374472651e-07, + "loss": 0.6543, + "step": 65191 + }, + { + "epoch": 1.67, + "learning_rate": 8.645008221334016e-07, + "loss": 0.7549, + "step": 65192 + }, + { + "epoch": 1.67, + "learning_rate": 8.644734069232832e-07, + "loss": 0.6777, + "step": 65193 + }, + { + "epoch": 1.67, + "learning_rate": 8.644459918169315e-07, + "loss": 0.7578, + "step": 65194 + }, + { + "epoch": 1.67, + "learning_rate": 8.644185768143671e-07, + "loss": 0.5239, + "step": 65195 + }, + { + "epoch": 1.67, + "learning_rate": 8.643911619156114e-07, + "loss": 0.8271, + "step": 65196 + }, + { + "epoch": 1.67, + "learning_rate": 8.643637471206851e-07, + "loss": 0.7207, + "step": 65197 + }, + { + "epoch": 1.67, + "learning_rate": 8.643363324296091e-07, + "loss": 0.4932, + "step": 65198 + }, + { + "epoch": 1.67, + "learning_rate": 8.643089178424051e-07, + "loss": 0.5, + "step": 65199 + }, + { + "epoch": 1.67, + "learning_rate": 8.642815033590931e-07, + "loss": 0.6396, + "step": 65200 + }, + { + "epoch": 1.67, + "learning_rate": 8.642540889796943e-07, + "loss": 0.7061, + "step": 65201 + }, + { + "epoch": 1.67, + "learning_rate": 8.642266747042302e-07, + "loss": 0.8193, + "step": 65202 + }, + { + "epoch": 1.67, + "learning_rate": 8.641992605327211e-07, + "loss": 0.6973, + "step": 65203 + }, + { + "epoch": 1.67, + "learning_rate": 8.641718464651888e-07, + "loss": 0.4221, + "step": 65204 + }, + { + "epoch": 1.67, + "learning_rate": 8.641444325016536e-07, + "loss": 0.5898, + "step": 65205 + }, + { + "epoch": 1.67, + "learning_rate": 8.641170186421371e-07, + "loss": 0.6011, + "step": 65206 + }, + { + "epoch": 1.67, + "learning_rate": 8.640896048866595e-07, + "loss": 0.6167, + "step": 65207 + }, + { + "epoch": 1.67, + "learning_rate": 8.640621912352426e-07, + "loss": 0.6934, + "step": 65208 + }, + { + "epoch": 1.67, + "learning_rate": 8.640347776879071e-07, + "loss": 0.4792, + "step": 65209 + }, + { + "epoch": 1.67, + "learning_rate": 8.640073642446737e-07, + "loss": 0.749, + "step": 65210 + }, + { + "epoch": 1.67, + "learning_rate": 8.639799509055637e-07, + "loss": 0.7188, + "step": 65211 + }, + { + "epoch": 1.67, + "learning_rate": 8.639525376705979e-07, + "loss": 0.6855, + "step": 65212 + }, + { + "epoch": 1.67, + "learning_rate": 8.639251245397973e-07, + "loss": 0.5947, + "step": 65213 + }, + { + "epoch": 1.67, + "learning_rate": 8.63897711513183e-07, + "loss": 0.6045, + "step": 65214 + }, + { + "epoch": 1.67, + "learning_rate": 8.638702985907762e-07, + "loss": 0.5991, + "step": 65215 + }, + { + "epoch": 1.67, + "learning_rate": 8.638428857725975e-07, + "loss": 0.7754, + "step": 65216 + }, + { + "epoch": 1.67, + "learning_rate": 8.638154730586679e-07, + "loss": 0.6201, + "step": 65217 + }, + { + "epoch": 1.67, + "learning_rate": 8.637880604490089e-07, + "loss": 0.6968, + "step": 65218 + }, + { + "epoch": 1.67, + "learning_rate": 8.637606479436411e-07, + "loss": 0.7612, + "step": 65219 + }, + { + "epoch": 1.67, + "learning_rate": 8.637332355425852e-07, + "loss": 0.6118, + "step": 65220 + }, + { + "epoch": 1.67, + "learning_rate": 8.637058232458627e-07, + "loss": 0.7383, + "step": 65221 + }, + { + "epoch": 1.67, + "learning_rate": 8.636784110534942e-07, + "loss": 0.7021, + "step": 65222 + }, + { + "epoch": 1.67, + "learning_rate": 8.63650998965501e-07, + "loss": 0.71, + "step": 65223 + }, + { + "epoch": 1.67, + "learning_rate": 8.636235869819038e-07, + "loss": 0.6348, + "step": 65224 + }, + { + "epoch": 1.67, + "learning_rate": 8.635961751027239e-07, + "loss": 0.5669, + "step": 65225 + }, + { + "epoch": 1.67, + "learning_rate": 8.63568763327982e-07, + "loss": 0.7119, + "step": 65226 + }, + { + "epoch": 1.67, + "learning_rate": 8.635413516576995e-07, + "loss": 0.6523, + "step": 65227 + }, + { + "epoch": 1.67, + "learning_rate": 8.635139400918968e-07, + "loss": 0.748, + "step": 65228 + }, + { + "epoch": 1.67, + "learning_rate": 8.634865286305956e-07, + "loss": 0.6934, + "step": 65229 + }, + { + "epoch": 1.67, + "learning_rate": 8.634591172738162e-07, + "loss": 0.6367, + "step": 65230 + }, + { + "epoch": 1.67, + "learning_rate": 8.634317060215798e-07, + "loss": 0.6682, + "step": 65231 + }, + { + "epoch": 1.67, + "learning_rate": 8.634042948739078e-07, + "loss": 0.5786, + "step": 65232 + }, + { + "epoch": 1.67, + "learning_rate": 8.633768838308206e-07, + "loss": 0.4668, + "step": 65233 + }, + { + "epoch": 1.67, + "learning_rate": 8.633494728923394e-07, + "loss": 0.752, + "step": 65234 + }, + { + "epoch": 1.67, + "learning_rate": 8.633220620584853e-07, + "loss": 0.4934, + "step": 65235 + }, + { + "epoch": 1.67, + "learning_rate": 8.63294651329279e-07, + "loss": 0.5688, + "step": 65236 + }, + { + "epoch": 1.67, + "learning_rate": 8.63267240704742e-07, + "loss": 0.5431, + "step": 65237 + }, + { + "epoch": 1.67, + "learning_rate": 8.632398301848948e-07, + "loss": 0.7705, + "step": 65238 + }, + { + "epoch": 1.67, + "learning_rate": 8.63212419769759e-07, + "loss": 0.6812, + "step": 65239 + }, + { + "epoch": 1.67, + "learning_rate": 8.631850094593547e-07, + "loss": 0.6982, + "step": 65240 + }, + { + "epoch": 1.67, + "learning_rate": 8.631575992537035e-07, + "loss": 0.6572, + "step": 65241 + }, + { + "epoch": 1.67, + "learning_rate": 8.631301891528262e-07, + "loss": 0.6113, + "step": 65242 + }, + { + "epoch": 1.67, + "learning_rate": 8.631027791567438e-07, + "loss": 0.6807, + "step": 65243 + }, + { + "epoch": 1.67, + "learning_rate": 8.630753692654773e-07, + "loss": 0.6548, + "step": 65244 + }, + { + "epoch": 1.67, + "learning_rate": 8.630479594790476e-07, + "loss": 0.562, + "step": 65245 + }, + { + "epoch": 1.67, + "learning_rate": 8.63020549797476e-07, + "loss": 0.5793, + "step": 65246 + }, + { + "epoch": 1.67, + "learning_rate": 8.629931402207831e-07, + "loss": 0.5708, + "step": 65247 + }, + { + "epoch": 1.67, + "learning_rate": 8.629657307489902e-07, + "loss": 0.5752, + "step": 65248 + }, + { + "epoch": 1.67, + "learning_rate": 8.629383213821183e-07, + "loss": 0.5757, + "step": 65249 + }, + { + "epoch": 1.67, + "learning_rate": 8.629109121201881e-07, + "loss": 0.4954, + "step": 65250 + }, + { + "epoch": 1.67, + "learning_rate": 8.628835029632205e-07, + "loss": 0.6523, + "step": 65251 + }, + { + "epoch": 1.67, + "learning_rate": 8.628560939112368e-07, + "loss": 0.6333, + "step": 65252 + }, + { + "epoch": 1.67, + "learning_rate": 8.628286849642577e-07, + "loss": 0.5276, + "step": 65253 + }, + { + "epoch": 1.67, + "learning_rate": 8.628012761223047e-07, + "loss": 0.7168, + "step": 65254 + }, + { + "epoch": 1.67, + "learning_rate": 8.627738673853982e-07, + "loss": 0.748, + "step": 65255 + }, + { + "epoch": 1.67, + "learning_rate": 8.627464587535596e-07, + "loss": 0.7236, + "step": 65256 + }, + { + "epoch": 1.67, + "learning_rate": 8.627190502268095e-07, + "loss": 0.7734, + "step": 65257 + }, + { + "epoch": 1.67, + "learning_rate": 8.626916418051693e-07, + "loss": 0.5679, + "step": 65258 + }, + { + "epoch": 1.67, + "learning_rate": 8.626642334886602e-07, + "loss": 0.7119, + "step": 65259 + }, + { + "epoch": 1.67, + "learning_rate": 8.62636825277302e-07, + "loss": 0.667, + "step": 65260 + }, + { + "epoch": 1.67, + "learning_rate": 8.62609417171117e-07, + "loss": 0.6523, + "step": 65261 + }, + { + "epoch": 1.67, + "learning_rate": 8.625820091701254e-07, + "loss": 0.5962, + "step": 65262 + }, + { + "epoch": 1.67, + "learning_rate": 8.625546012743485e-07, + "loss": 0.7051, + "step": 65263 + }, + { + "epoch": 1.67, + "learning_rate": 8.625271934838071e-07, + "loss": 0.6091, + "step": 65264 + }, + { + "epoch": 1.67, + "learning_rate": 8.624997857985226e-07, + "loss": 0.6602, + "step": 65265 + }, + { + "epoch": 1.67, + "learning_rate": 8.624723782185153e-07, + "loss": 0.6533, + "step": 65266 + }, + { + "epoch": 1.67, + "learning_rate": 8.624449707438069e-07, + "loss": 0.6973, + "step": 65267 + }, + { + "epoch": 1.67, + "learning_rate": 8.624175633744179e-07, + "loss": 0.6582, + "step": 65268 + }, + { + "epoch": 1.67, + "learning_rate": 8.623901561103699e-07, + "loss": 0.561, + "step": 65269 + }, + { + "epoch": 1.67, + "learning_rate": 8.623627489516829e-07, + "loss": 0.5933, + "step": 65270 + }, + { + "epoch": 1.67, + "learning_rate": 8.623353418983788e-07, + "loss": 0.6504, + "step": 65271 + }, + { + "epoch": 1.67, + "learning_rate": 8.623079349504777e-07, + "loss": 0.5825, + "step": 65272 + }, + { + "epoch": 1.67, + "learning_rate": 8.622805281080014e-07, + "loss": 0.6533, + "step": 65273 + }, + { + "epoch": 1.67, + "learning_rate": 8.622531213709704e-07, + "loss": 0.709, + "step": 65274 + }, + { + "epoch": 1.67, + "learning_rate": 8.622257147394061e-07, + "loss": 0.6533, + "step": 65275 + }, + { + "epoch": 1.67, + "learning_rate": 8.621983082133288e-07, + "loss": 0.7188, + "step": 65276 + }, + { + "epoch": 1.67, + "learning_rate": 8.621709017927605e-07, + "loss": 0.5627, + "step": 65277 + }, + { + "epoch": 1.67, + "learning_rate": 8.621434954777212e-07, + "loss": 0.6826, + "step": 65278 + }, + { + "epoch": 1.67, + "learning_rate": 8.621160892682326e-07, + "loss": 0.5017, + "step": 65279 + }, + { + "epoch": 1.67, + "learning_rate": 8.620886831643153e-07, + "loss": 0.4847, + "step": 65280 + }, + { + "epoch": 1.67, + "learning_rate": 8.6206127716599e-07, + "loss": 0.7085, + "step": 65281 + }, + { + "epoch": 1.67, + "learning_rate": 8.620338712732785e-07, + "loss": 0.7461, + "step": 65282 + }, + { + "epoch": 1.67, + "learning_rate": 8.620064654862008e-07, + "loss": 0.521, + "step": 65283 + }, + { + "epoch": 1.67, + "learning_rate": 8.619790598047788e-07, + "loss": 0.6172, + "step": 65284 + }, + { + "epoch": 1.67, + "learning_rate": 8.619516542290329e-07, + "loss": 0.7109, + "step": 65285 + }, + { + "epoch": 1.67, + "learning_rate": 8.619242487589844e-07, + "loss": 0.7832, + "step": 65286 + }, + { + "epoch": 1.67, + "learning_rate": 8.618968433946539e-07, + "loss": 0.7979, + "step": 65287 + }, + { + "epoch": 1.67, + "learning_rate": 8.61869438136063e-07, + "loss": 0.6309, + "step": 65288 + }, + { + "epoch": 1.67, + "learning_rate": 8.618420329832323e-07, + "loss": 0.6533, + "step": 65289 + }, + { + "epoch": 1.67, + "learning_rate": 8.618146279361829e-07, + "loss": 0.6279, + "step": 65290 + }, + { + "epoch": 1.67, + "learning_rate": 8.617872229949352e-07, + "loss": 0.5122, + "step": 65291 + }, + { + "epoch": 1.67, + "learning_rate": 8.61759818159511e-07, + "loss": 0.4038, + "step": 65292 + }, + { + "epoch": 1.67, + "learning_rate": 8.617324134299307e-07, + "loss": 0.6504, + "step": 65293 + }, + { + "epoch": 1.67, + "learning_rate": 8.617050088062158e-07, + "loss": 0.4727, + "step": 65294 + }, + { + "epoch": 1.67, + "learning_rate": 8.616776042883868e-07, + "loss": 0.8057, + "step": 65295 + }, + { + "epoch": 1.67, + "learning_rate": 8.61650199876465e-07, + "loss": 0.6465, + "step": 65296 + }, + { + "epoch": 1.67, + "learning_rate": 8.616227955704712e-07, + "loss": 0.5759, + "step": 65297 + }, + { + "epoch": 1.67, + "learning_rate": 8.615953913704267e-07, + "loss": 0.7354, + "step": 65298 + }, + { + "epoch": 1.67, + "learning_rate": 8.615679872763524e-07, + "loss": 0.5568, + "step": 65299 + }, + { + "epoch": 1.67, + "learning_rate": 8.615405832882686e-07, + "loss": 0.7588, + "step": 65300 + }, + { + "epoch": 1.67, + "learning_rate": 8.615131794061972e-07, + "loss": 0.7354, + "step": 65301 + }, + { + "epoch": 1.67, + "learning_rate": 8.614857756301584e-07, + "loss": 0.7783, + "step": 65302 + }, + { + "epoch": 1.67, + "learning_rate": 8.614583719601739e-07, + "loss": 0.6035, + "step": 65303 + }, + { + "epoch": 1.67, + "learning_rate": 8.614309683962642e-07, + "loss": 0.6885, + "step": 65304 + }, + { + "epoch": 1.67, + "learning_rate": 8.614035649384506e-07, + "loss": 0.665, + "step": 65305 + }, + { + "epoch": 1.67, + "learning_rate": 8.613761615867539e-07, + "loss": 0.6147, + "step": 65306 + }, + { + "epoch": 1.67, + "learning_rate": 8.613487583411947e-07, + "loss": 0.4941, + "step": 65307 + }, + { + "epoch": 1.67, + "learning_rate": 8.613213552017951e-07, + "loss": 0.5933, + "step": 65308 + }, + { + "epoch": 1.67, + "learning_rate": 8.612939521685749e-07, + "loss": 0.5742, + "step": 65309 + }, + { + "epoch": 1.67, + "learning_rate": 8.612665492415555e-07, + "loss": 0.7861, + "step": 65310 + }, + { + "epoch": 1.67, + "learning_rate": 8.612391464207581e-07, + "loss": 0.564, + "step": 65311 + }, + { + "epoch": 1.67, + "learning_rate": 8.612117437062033e-07, + "loss": 0.6299, + "step": 65312 + }, + { + "epoch": 1.67, + "learning_rate": 8.611843410979125e-07, + "loss": 0.6465, + "step": 65313 + }, + { + "epoch": 1.67, + "learning_rate": 8.611569385959062e-07, + "loss": 0.5488, + "step": 65314 + }, + { + "epoch": 1.67, + "learning_rate": 8.611295362002059e-07, + "loss": 0.4443, + "step": 65315 + }, + { + "epoch": 1.67, + "learning_rate": 8.611021339108321e-07, + "loss": 0.4495, + "step": 65316 + }, + { + "epoch": 1.67, + "learning_rate": 8.610747317278062e-07, + "loss": 0.6211, + "step": 65317 + }, + { + "epoch": 1.67, + "learning_rate": 8.610473296511493e-07, + "loss": 0.7051, + "step": 65318 + }, + { + "epoch": 1.67, + "learning_rate": 8.610199276808816e-07, + "loss": 0.7061, + "step": 65319 + }, + { + "epoch": 1.67, + "learning_rate": 8.609925258170248e-07, + "loss": 0.5918, + "step": 65320 + }, + { + "epoch": 1.67, + "learning_rate": 8.609651240595994e-07, + "loss": 0.4585, + "step": 65321 + }, + { + "epoch": 1.67, + "learning_rate": 8.609377224086267e-07, + "loss": 0.6392, + "step": 65322 + }, + { + "epoch": 1.67, + "learning_rate": 8.609103208641277e-07, + "loss": 0.6768, + "step": 65323 + }, + { + "epoch": 1.67, + "learning_rate": 8.60882919426123e-07, + "loss": 0.6111, + "step": 65324 + }, + { + "epoch": 1.67, + "learning_rate": 8.608555180946341e-07, + "loss": 0.6221, + "step": 65325 + }, + { + "epoch": 1.67, + "learning_rate": 8.608281168696816e-07, + "loss": 0.6895, + "step": 65326 + }, + { + "epoch": 1.67, + "learning_rate": 8.608007157512867e-07, + "loss": 0.5298, + "step": 65327 + }, + { + "epoch": 1.67, + "learning_rate": 8.607733147394706e-07, + "loss": 0.6528, + "step": 65328 + }, + { + "epoch": 1.67, + "learning_rate": 8.607459138342534e-07, + "loss": 0.5713, + "step": 65329 + }, + { + "epoch": 1.67, + "learning_rate": 8.60718513035657e-07, + "loss": 0.7168, + "step": 65330 + }, + { + "epoch": 1.67, + "learning_rate": 8.606911123437017e-07, + "loss": 0.5977, + "step": 65331 + }, + { + "epoch": 1.67, + "learning_rate": 8.606637117584092e-07, + "loss": 0.3945, + "step": 65332 + }, + { + "epoch": 1.67, + "learning_rate": 8.606363112797997e-07, + "loss": 0.4766, + "step": 65333 + }, + { + "epoch": 1.67, + "learning_rate": 8.606089109078949e-07, + "loss": 0.7148, + "step": 65334 + }, + { + "epoch": 1.67, + "learning_rate": 8.605815106427152e-07, + "loss": 0.5747, + "step": 65335 + }, + { + "epoch": 1.67, + "learning_rate": 8.60554110484282e-07, + "loss": 0.7578, + "step": 65336 + }, + { + "epoch": 1.67, + "learning_rate": 8.605267104326159e-07, + "loss": 0.4846, + "step": 65337 + }, + { + "epoch": 1.67, + "learning_rate": 8.604993104877386e-07, + "loss": 0.5859, + "step": 65338 + }, + { + "epoch": 1.67, + "learning_rate": 8.604719106496703e-07, + "loss": 0.5474, + "step": 65339 + }, + { + "epoch": 1.67, + "learning_rate": 8.60444510918432e-07, + "loss": 0.7422, + "step": 65340 + }, + { + "epoch": 1.67, + "learning_rate": 8.604171112940451e-07, + "loss": 0.7119, + "step": 65341 + }, + { + "epoch": 1.67, + "learning_rate": 8.603897117765305e-07, + "loss": 0.4556, + "step": 65342 + }, + { + "epoch": 1.67, + "learning_rate": 8.603623123659088e-07, + "loss": 0.6006, + "step": 65343 + }, + { + "epoch": 1.67, + "learning_rate": 8.603349130622015e-07, + "loss": 0.5962, + "step": 65344 + }, + { + "epoch": 1.67, + "learning_rate": 8.603075138654291e-07, + "loss": 0.6353, + "step": 65345 + }, + { + "epoch": 1.67, + "learning_rate": 8.602801147756132e-07, + "loss": 0.8916, + "step": 65346 + }, + { + "epoch": 1.67, + "learning_rate": 8.60252715792774e-07, + "loss": 0.6556, + "step": 65347 + }, + { + "epoch": 1.67, + "learning_rate": 8.602253169169333e-07, + "loss": 0.5037, + "step": 65348 + }, + { + "epoch": 1.67, + "learning_rate": 8.601979181481113e-07, + "loss": 0.6631, + "step": 65349 + }, + { + "epoch": 1.67, + "learning_rate": 8.601705194863294e-07, + "loss": 0.5537, + "step": 65350 + }, + { + "epoch": 1.67, + "learning_rate": 8.601431209316084e-07, + "loss": 0.6846, + "step": 65351 + }, + { + "epoch": 1.68, + "learning_rate": 8.601157224839694e-07, + "loss": 0.6045, + "step": 65352 + }, + { + "epoch": 1.68, + "learning_rate": 8.600883241434336e-07, + "loss": 0.5967, + "step": 65353 + }, + { + "epoch": 1.68, + "learning_rate": 8.600609259100213e-07, + "loss": 0.6196, + "step": 65354 + }, + { + "epoch": 1.68, + "learning_rate": 8.600335277837543e-07, + "loss": 0.5154, + "step": 65355 + }, + { + "epoch": 1.68, + "learning_rate": 8.60006129764653e-07, + "loss": 0.5449, + "step": 65356 + }, + { + "epoch": 1.68, + "learning_rate": 8.599787318527387e-07, + "loss": 0.6411, + "step": 65357 + }, + { + "epoch": 1.68, + "learning_rate": 8.599513340480325e-07, + "loss": 0.51, + "step": 65358 + }, + { + "epoch": 1.68, + "learning_rate": 8.599239363505548e-07, + "loss": 0.5151, + "step": 65359 + }, + { + "epoch": 1.68, + "learning_rate": 8.598965387603269e-07, + "loss": 0.7236, + "step": 65360 + }, + { + "epoch": 1.68, + "learning_rate": 8.598691412773698e-07, + "loss": 0.7295, + "step": 65361 + }, + { + "epoch": 1.68, + "learning_rate": 8.598417439017044e-07, + "loss": 0.8066, + "step": 65362 + }, + { + "epoch": 1.68, + "learning_rate": 8.598143466333518e-07, + "loss": 0.6221, + "step": 65363 + }, + { + "epoch": 1.68, + "learning_rate": 8.597869494723328e-07, + "loss": 0.7002, + "step": 65364 + }, + { + "epoch": 1.68, + "learning_rate": 8.597595524186687e-07, + "loss": 0.6245, + "step": 65365 + }, + { + "epoch": 1.68, + "learning_rate": 8.5973215547238e-07, + "loss": 0.748, + "step": 65366 + }, + { + "epoch": 1.68, + "learning_rate": 8.597047586334881e-07, + "loss": 0.6409, + "step": 65367 + }, + { + "epoch": 1.68, + "learning_rate": 8.596773619020141e-07, + "loss": 0.5007, + "step": 65368 + }, + { + "epoch": 1.68, + "learning_rate": 8.596499652779783e-07, + "loss": 0.5303, + "step": 65369 + }, + { + "epoch": 1.68, + "learning_rate": 8.596225687614022e-07, + "loss": 0.7129, + "step": 65370 + }, + { + "epoch": 1.68, + "learning_rate": 8.595951723523065e-07, + "loss": 0.4945, + "step": 65371 + }, + { + "epoch": 1.68, + "learning_rate": 8.595677760507125e-07, + "loss": 0.7383, + "step": 65372 + }, + { + "epoch": 1.68, + "learning_rate": 8.595403798566408e-07, + "loss": 0.5996, + "step": 65373 + }, + { + "epoch": 1.68, + "learning_rate": 8.595129837701127e-07, + "loss": 0.7178, + "step": 65374 + }, + { + "epoch": 1.68, + "learning_rate": 8.594855877911489e-07, + "loss": 0.5396, + "step": 65375 + }, + { + "epoch": 1.68, + "learning_rate": 8.594581919197708e-07, + "loss": 0.5659, + "step": 65376 + }, + { + "epoch": 1.68, + "learning_rate": 8.594307961559988e-07, + "loss": 0.7314, + "step": 65377 + }, + { + "epoch": 1.68, + "learning_rate": 8.594034004998548e-07, + "loss": 0.9614, + "step": 65378 + }, + { + "epoch": 1.68, + "learning_rate": 8.593760049513586e-07, + "loss": 0.5249, + "step": 65379 + }, + { + "epoch": 1.68, + "learning_rate": 8.593486095105319e-07, + "loss": 0.6865, + "step": 65380 + }, + { + "epoch": 1.68, + "learning_rate": 8.593212141773952e-07, + "loss": 0.5312, + "step": 65381 + }, + { + "epoch": 1.68, + "learning_rate": 8.592938189519702e-07, + "loss": 0.6665, + "step": 65382 + }, + { + "epoch": 1.68, + "learning_rate": 8.592664238342771e-07, + "loss": 0.5269, + "step": 65383 + }, + { + "epoch": 1.68, + "learning_rate": 8.592390288243374e-07, + "loss": 0.665, + "step": 65384 + }, + { + "epoch": 1.68, + "learning_rate": 8.592116339221718e-07, + "loss": 0.6904, + "step": 65385 + }, + { + "epoch": 1.68, + "learning_rate": 8.591842391278015e-07, + "loss": 0.4327, + "step": 65386 + }, + { + "epoch": 1.68, + "learning_rate": 8.591568444412471e-07, + "loss": 0.6377, + "step": 65387 + }, + { + "epoch": 1.68, + "learning_rate": 8.591294498625304e-07, + "loss": 0.6973, + "step": 65388 + }, + { + "epoch": 1.68, + "learning_rate": 8.591020553916715e-07, + "loss": 0.5996, + "step": 65389 + }, + { + "epoch": 1.68, + "learning_rate": 8.590746610286915e-07, + "loss": 0.6611, + "step": 65390 + }, + { + "epoch": 1.68, + "learning_rate": 8.590472667736117e-07, + "loss": 0.6924, + "step": 65391 + }, + { + "epoch": 1.68, + "learning_rate": 8.590198726264528e-07, + "loss": 0.5288, + "step": 65392 + }, + { + "epoch": 1.68, + "learning_rate": 8.589924785872361e-07, + "loss": 0.6597, + "step": 65393 + }, + { + "epoch": 1.68, + "learning_rate": 8.589650846559822e-07, + "loss": 0.571, + "step": 65394 + }, + { + "epoch": 1.68, + "learning_rate": 8.589376908327123e-07, + "loss": 0.6338, + "step": 65395 + }, + { + "epoch": 1.68, + "learning_rate": 8.589102971174476e-07, + "loss": 0.6013, + "step": 65396 + }, + { + "epoch": 1.68, + "learning_rate": 8.588829035102084e-07, + "loss": 0.4756, + "step": 65397 + }, + { + "epoch": 1.68, + "learning_rate": 8.588555100110164e-07, + "loss": 0.5566, + "step": 65398 + }, + { + "epoch": 1.68, + "learning_rate": 8.588281166198921e-07, + "loss": 0.5303, + "step": 65399 + }, + { + "epoch": 1.68, + "learning_rate": 8.588007233368564e-07, + "loss": 0.4475, + "step": 65400 + }, + { + "epoch": 1.68, + "learning_rate": 8.587733301619309e-07, + "loss": 0.7129, + "step": 65401 + }, + { + "epoch": 1.68, + "learning_rate": 8.587459370951358e-07, + "loss": 0.4858, + "step": 65402 + }, + { + "epoch": 1.68, + "learning_rate": 8.587185441364927e-07, + "loss": 0.6675, + "step": 65403 + }, + { + "epoch": 1.68, + "learning_rate": 8.58691151286022e-07, + "loss": 0.5747, + "step": 65404 + }, + { + "epoch": 1.68, + "learning_rate": 8.586637585437452e-07, + "loss": 0.7744, + "step": 65405 + }, + { + "epoch": 1.68, + "learning_rate": 8.58636365909683e-07, + "loss": 0.6279, + "step": 65406 + }, + { + "epoch": 1.68, + "learning_rate": 8.586089733838567e-07, + "loss": 0.5269, + "step": 65407 + }, + { + "epoch": 1.68, + "learning_rate": 8.585815809662869e-07, + "loss": 0.5266, + "step": 65408 + }, + { + "epoch": 1.68, + "learning_rate": 8.585541886569945e-07, + "loss": 0.5752, + "step": 65409 + }, + { + "epoch": 1.68, + "learning_rate": 8.585267964560007e-07, + "loss": 0.6187, + "step": 65410 + }, + { + "epoch": 1.68, + "learning_rate": 8.584994043633265e-07, + "loss": 0.6729, + "step": 65411 + }, + { + "epoch": 1.68, + "learning_rate": 8.584720123789929e-07, + "loss": 0.5024, + "step": 65412 + }, + { + "epoch": 1.68, + "learning_rate": 8.584446205030206e-07, + "loss": 0.6924, + "step": 65413 + }, + { + "epoch": 1.68, + "learning_rate": 8.584172287354307e-07, + "loss": 0.5498, + "step": 65414 + }, + { + "epoch": 1.68, + "learning_rate": 8.583898370762444e-07, + "loss": 0.5116, + "step": 65415 + }, + { + "epoch": 1.68, + "learning_rate": 8.583624455254821e-07, + "loss": 0.627, + "step": 65416 + }, + { + "epoch": 1.68, + "learning_rate": 8.583350540831655e-07, + "loss": 0.6758, + "step": 65417 + }, + { + "epoch": 1.68, + "learning_rate": 8.583076627493156e-07, + "loss": 0.6211, + "step": 65418 + }, + { + "epoch": 1.68, + "learning_rate": 8.582802715239524e-07, + "loss": 0.6504, + "step": 65419 + }, + { + "epoch": 1.68, + "learning_rate": 8.582528804070978e-07, + "loss": 0.7959, + "step": 65420 + }, + { + "epoch": 1.68, + "learning_rate": 8.582254893987721e-07, + "loss": 0.3722, + "step": 65421 + }, + { + "epoch": 1.68, + "learning_rate": 8.581980984989969e-07, + "loss": 0.6511, + "step": 65422 + }, + { + "epoch": 1.68, + "learning_rate": 8.581707077077927e-07, + "loss": 0.5479, + "step": 65423 + }, + { + "epoch": 1.68, + "learning_rate": 8.581433170251809e-07, + "loss": 0.7783, + "step": 65424 + }, + { + "epoch": 1.68, + "learning_rate": 8.58115926451182e-07, + "loss": 0.7773, + "step": 65425 + }, + { + "epoch": 1.68, + "learning_rate": 8.580885359858174e-07, + "loss": 0.6553, + "step": 65426 + }, + { + "epoch": 1.68, + "learning_rate": 8.580611456291079e-07, + "loss": 0.8027, + "step": 65427 + }, + { + "epoch": 1.68, + "learning_rate": 8.580337553810745e-07, + "loss": 0.543, + "step": 65428 + }, + { + "epoch": 1.68, + "learning_rate": 8.580063652417382e-07, + "loss": 0.6484, + "step": 65429 + }, + { + "epoch": 1.68, + "learning_rate": 8.579789752111195e-07, + "loss": 0.6211, + "step": 65430 + }, + { + "epoch": 1.68, + "learning_rate": 8.579515852892401e-07, + "loss": 0.6846, + "step": 65431 + }, + { + "epoch": 1.68, + "learning_rate": 8.579241954761206e-07, + "loss": 0.4543, + "step": 65432 + }, + { + "epoch": 1.68, + "learning_rate": 8.578968057717818e-07, + "loss": 0.7607, + "step": 65433 + }, + { + "epoch": 1.68, + "learning_rate": 8.578694161762451e-07, + "loss": 0.6494, + "step": 65434 + }, + { + "epoch": 1.68, + "learning_rate": 8.57842026689531e-07, + "loss": 0.5728, + "step": 65435 + }, + { + "epoch": 1.68, + "learning_rate": 8.57814637311661e-07, + "loss": 0.6543, + "step": 65436 + }, + { + "epoch": 1.68, + "learning_rate": 8.577872480426556e-07, + "loss": 0.6318, + "step": 65437 + }, + { + "epoch": 1.68, + "learning_rate": 8.577598588825364e-07, + "loss": 0.5293, + "step": 65438 + }, + { + "epoch": 1.68, + "learning_rate": 8.577324698313236e-07, + "loss": 0.5244, + "step": 65439 + }, + { + "epoch": 1.68, + "learning_rate": 8.577050808890383e-07, + "loss": 0.6953, + "step": 65440 + }, + { + "epoch": 1.68, + "learning_rate": 8.57677692055702e-07, + "loss": 0.6816, + "step": 65441 + }, + { + "epoch": 1.68, + "learning_rate": 8.57650303331335e-07, + "loss": 0.7148, + "step": 65442 + }, + { + "epoch": 1.68, + "learning_rate": 8.57622914715959e-07, + "loss": 0.5825, + "step": 65443 + }, + { + "epoch": 1.68, + "learning_rate": 8.575955262095943e-07, + "loss": 0.6392, + "step": 65444 + }, + { + "epoch": 1.68, + "learning_rate": 8.575681378122623e-07, + "loss": 0.6826, + "step": 65445 + }, + { + "epoch": 1.68, + "learning_rate": 8.575407495239837e-07, + "loss": 0.4434, + "step": 65446 + }, + { + "epoch": 1.68, + "learning_rate": 8.575133613447798e-07, + "loss": 0.6025, + "step": 65447 + }, + { + "epoch": 1.68, + "learning_rate": 8.574859732746715e-07, + "loss": 0.5632, + "step": 65448 + }, + { + "epoch": 1.68, + "learning_rate": 8.574585853136795e-07, + "loss": 0.5796, + "step": 65449 + }, + { + "epoch": 1.68, + "learning_rate": 8.574311974618247e-07, + "loss": 0.5713, + "step": 65450 + }, + { + "epoch": 1.68, + "learning_rate": 8.574038097191285e-07, + "loss": 0.5786, + "step": 65451 + }, + { + "epoch": 1.68, + "learning_rate": 8.573764220856115e-07, + "loss": 0.8379, + "step": 65452 + }, + { + "epoch": 1.68, + "learning_rate": 8.573490345612948e-07, + "loss": 0.624, + "step": 65453 + }, + { + "epoch": 1.68, + "learning_rate": 8.573216471461994e-07, + "loss": 0.6504, + "step": 65454 + }, + { + "epoch": 1.68, + "learning_rate": 8.572942598403463e-07, + "loss": 0.71, + "step": 65455 + }, + { + "epoch": 1.68, + "learning_rate": 8.572668726437563e-07, + "loss": 0.6909, + "step": 65456 + }, + { + "epoch": 1.68, + "learning_rate": 8.572394855564507e-07, + "loss": 0.6982, + "step": 65457 + }, + { + "epoch": 1.68, + "learning_rate": 8.572120985784504e-07, + "loss": 0.6182, + "step": 65458 + }, + { + "epoch": 1.68, + "learning_rate": 8.571847117097759e-07, + "loss": 0.6431, + "step": 65459 + }, + { + "epoch": 1.68, + "learning_rate": 8.571573249504487e-07, + "loss": 0.4893, + "step": 65460 + }, + { + "epoch": 1.68, + "learning_rate": 8.571299383004893e-07, + "loss": 0.5732, + "step": 65461 + }, + { + "epoch": 1.68, + "learning_rate": 8.571025517599193e-07, + "loss": 0.4791, + "step": 65462 + }, + { + "epoch": 1.68, + "learning_rate": 8.570751653287589e-07, + "loss": 0.8975, + "step": 65463 + }, + { + "epoch": 1.68, + "learning_rate": 8.570477790070297e-07, + "loss": 0.6787, + "step": 65464 + }, + { + "epoch": 1.68, + "learning_rate": 8.570203927947524e-07, + "loss": 0.5728, + "step": 65465 + }, + { + "epoch": 1.68, + "learning_rate": 8.56993006691948e-07, + "loss": 0.6082, + "step": 65466 + }, + { + "epoch": 1.68, + "learning_rate": 8.569656206986376e-07, + "loss": 0.5669, + "step": 65467 + }, + { + "epoch": 1.68, + "learning_rate": 8.569382348148424e-07, + "loss": 0.6953, + "step": 65468 + }, + { + "epoch": 1.68, + "learning_rate": 8.569108490405824e-07, + "loss": 0.6489, + "step": 65469 + }, + { + "epoch": 1.68, + "learning_rate": 8.568834633758795e-07, + "loss": 0.416, + "step": 65470 + }, + { + "epoch": 1.68, + "learning_rate": 8.568560778207541e-07, + "loss": 0.7061, + "step": 65471 + }, + { + "epoch": 1.68, + "learning_rate": 8.568286923752274e-07, + "loss": 0.5879, + "step": 65472 + }, + { + "epoch": 1.68, + "learning_rate": 8.568013070393205e-07, + "loss": 0.5801, + "step": 65473 + }, + { + "epoch": 1.68, + "learning_rate": 8.567739218130544e-07, + "loss": 0.7969, + "step": 65474 + }, + { + "epoch": 1.68, + "learning_rate": 8.567465366964497e-07, + "loss": 0.5161, + "step": 65475 + }, + { + "epoch": 1.68, + "learning_rate": 8.567191516895277e-07, + "loss": 0.4927, + "step": 65476 + }, + { + "epoch": 1.68, + "learning_rate": 8.566917667923092e-07, + "loss": 0.6865, + "step": 65477 + }, + { + "epoch": 1.68, + "learning_rate": 8.566643820048156e-07, + "loss": 0.6445, + "step": 65478 + }, + { + "epoch": 1.68, + "learning_rate": 8.566369973270672e-07, + "loss": 0.6875, + "step": 65479 + }, + { + "epoch": 1.68, + "learning_rate": 8.566096127590851e-07, + "loss": 0.6353, + "step": 65480 + }, + { + "epoch": 1.68, + "learning_rate": 8.565822283008906e-07, + "loss": 0.5498, + "step": 65481 + }, + { + "epoch": 1.68, + "learning_rate": 8.565548439525043e-07, + "loss": 0.5438, + "step": 65482 + }, + { + "epoch": 1.68, + "learning_rate": 8.565274597139476e-07, + "loss": 0.5098, + "step": 65483 + }, + { + "epoch": 1.68, + "learning_rate": 8.565000755852409e-07, + "loss": 0.6582, + "step": 65484 + }, + { + "epoch": 1.68, + "learning_rate": 8.564726915664059e-07, + "loss": 0.6221, + "step": 65485 + }, + { + "epoch": 1.68, + "learning_rate": 8.56445307657463e-07, + "loss": 0.6147, + "step": 65486 + }, + { + "epoch": 1.68, + "learning_rate": 8.564179238584332e-07, + "loss": 0.5881, + "step": 65487 + }, + { + "epoch": 1.68, + "learning_rate": 8.563905401693379e-07, + "loss": 0.7588, + "step": 65488 + }, + { + "epoch": 1.68, + "learning_rate": 8.563631565901978e-07, + "loss": 0.7305, + "step": 65489 + }, + { + "epoch": 1.68, + "learning_rate": 8.563357731210334e-07, + "loss": 0.7246, + "step": 65490 + }, + { + "epoch": 1.68, + "learning_rate": 8.563083897618663e-07, + "loss": 0.5483, + "step": 65491 + }, + { + "epoch": 1.68, + "learning_rate": 8.562810065127172e-07, + "loss": 0.6714, + "step": 65492 + }, + { + "epoch": 1.68, + "learning_rate": 8.562536233736071e-07, + "loss": 0.8213, + "step": 65493 + }, + { + "epoch": 1.68, + "learning_rate": 8.562262403445571e-07, + "loss": 0.6626, + "step": 65494 + }, + { + "epoch": 1.68, + "learning_rate": 8.56198857425588e-07, + "loss": 0.6953, + "step": 65495 + }, + { + "epoch": 1.68, + "learning_rate": 8.561714746167208e-07, + "loss": 0.5601, + "step": 65496 + }, + { + "epoch": 1.68, + "learning_rate": 8.561440919179765e-07, + "loss": 0.6108, + "step": 65497 + }, + { + "epoch": 1.68, + "learning_rate": 8.561167093293764e-07, + "loss": 0.7461, + "step": 65498 + }, + { + "epoch": 1.68, + "learning_rate": 8.560893268509407e-07, + "loss": 0.7148, + "step": 65499 + }, + { + "epoch": 1.68, + "learning_rate": 8.56061944482691e-07, + "loss": 0.4834, + "step": 65500 + }, + { + "epoch": 1.68, + "learning_rate": 8.560345622246478e-07, + "loss": 0.6143, + "step": 65501 + }, + { + "epoch": 1.68, + "learning_rate": 8.560071800768325e-07, + "loss": 0.7119, + "step": 65502 + }, + { + "epoch": 1.68, + "learning_rate": 8.559797980392657e-07, + "loss": 0.623, + "step": 65503 + }, + { + "epoch": 1.68, + "learning_rate": 8.559524161119688e-07, + "loss": 0.8037, + "step": 65504 + }, + { + "epoch": 1.68, + "learning_rate": 8.559250342949624e-07, + "loss": 0.543, + "step": 65505 + }, + { + "epoch": 1.68, + "learning_rate": 8.558976525882675e-07, + "loss": 0.6289, + "step": 65506 + }, + { + "epoch": 1.68, + "learning_rate": 8.558702709919052e-07, + "loss": 0.7314, + "step": 65507 + }, + { + "epoch": 1.68, + "learning_rate": 8.558428895058967e-07, + "loss": 0.6084, + "step": 65508 + }, + { + "epoch": 1.68, + "learning_rate": 8.558155081302623e-07, + "loss": 0.6011, + "step": 65509 + }, + { + "epoch": 1.68, + "learning_rate": 8.557881268650236e-07, + "loss": 0.6862, + "step": 65510 + }, + { + "epoch": 1.68, + "learning_rate": 8.55760745710201e-07, + "loss": 0.6943, + "step": 65511 + }, + { + "epoch": 1.68, + "learning_rate": 8.557333646658158e-07, + "loss": 0.3956, + "step": 65512 + }, + { + "epoch": 1.68, + "learning_rate": 8.55705983731889e-07, + "loss": 0.6123, + "step": 65513 + }, + { + "epoch": 1.68, + "learning_rate": 8.556786029084415e-07, + "loss": 0.6821, + "step": 65514 + }, + { + "epoch": 1.68, + "learning_rate": 8.556512221954941e-07, + "loss": 0.6865, + "step": 65515 + }, + { + "epoch": 1.68, + "learning_rate": 8.556238415930682e-07, + "loss": 0.7334, + "step": 65516 + }, + { + "epoch": 1.68, + "learning_rate": 8.555964611011843e-07, + "loss": 0.6904, + "step": 65517 + }, + { + "epoch": 1.68, + "learning_rate": 8.555690807198638e-07, + "loss": 0.572, + "step": 65518 + }, + { + "epoch": 1.68, + "learning_rate": 8.555417004491274e-07, + "loss": 0.6602, + "step": 65519 + }, + { + "epoch": 1.68, + "learning_rate": 8.555143202889959e-07, + "loss": 0.6182, + "step": 65520 + }, + { + "epoch": 1.68, + "learning_rate": 8.554869402394904e-07, + "loss": 0.6714, + "step": 65521 + }, + { + "epoch": 1.68, + "learning_rate": 8.554595603006321e-07, + "loss": 0.6445, + "step": 65522 + }, + { + "epoch": 1.68, + "learning_rate": 8.554321804724415e-07, + "loss": 0.6143, + "step": 65523 + }, + { + "epoch": 1.68, + "learning_rate": 8.554048007549401e-07, + "loss": 0.6008, + "step": 65524 + }, + { + "epoch": 1.68, + "learning_rate": 8.553774211481482e-07, + "loss": 0.4453, + "step": 65525 + }, + { + "epoch": 1.68, + "learning_rate": 8.553500416520876e-07, + "loss": 0.7305, + "step": 65526 + }, + { + "epoch": 1.68, + "learning_rate": 8.553226622667784e-07, + "loss": 0.6875, + "step": 65527 + }, + { + "epoch": 1.68, + "learning_rate": 8.552952829922426e-07, + "loss": 0.7051, + "step": 65528 + }, + { + "epoch": 1.68, + "learning_rate": 8.552679038285002e-07, + "loss": 0.7412, + "step": 65529 + }, + { + "epoch": 1.68, + "learning_rate": 8.552405247755724e-07, + "loss": 0.8369, + "step": 65530 + }, + { + "epoch": 1.68, + "learning_rate": 8.552131458334803e-07, + "loss": 0.7559, + "step": 65531 + }, + { + "epoch": 1.68, + "learning_rate": 8.551857670022449e-07, + "loss": 0.6709, + "step": 65532 + }, + { + "epoch": 1.68, + "learning_rate": 8.551583882818872e-07, + "loss": 0.7305, + "step": 65533 + }, + { + "epoch": 1.68, + "learning_rate": 8.551310096724278e-07, + "loss": 0.5571, + "step": 65534 + }, + { + "epoch": 1.68, + "learning_rate": 8.551036311738882e-07, + "loss": 0.5283, + "step": 65535 + }, + { + "epoch": 1.68, + "learning_rate": 8.550762527862887e-07, + "loss": 0.5432, + "step": 65536 + }, + { + "epoch": 1.68, + "learning_rate": 8.550488745096512e-07, + "loss": 0.4685, + "step": 65537 + }, + { + "epoch": 1.68, + "learning_rate": 8.55021496343996e-07, + "loss": 0.6431, + "step": 65538 + }, + { + "epoch": 1.68, + "learning_rate": 8.549941182893441e-07, + "loss": 0.7139, + "step": 65539 + }, + { + "epoch": 1.68, + "learning_rate": 8.549667403457163e-07, + "loss": 0.5513, + "step": 65540 + }, + { + "epoch": 1.68, + "learning_rate": 8.549393625131341e-07, + "loss": 0.5947, + "step": 65541 + }, + { + "epoch": 1.68, + "learning_rate": 8.549119847916177e-07, + "loss": 0.6807, + "step": 65542 + }, + { + "epoch": 1.68, + "learning_rate": 8.54884607181189e-07, + "loss": 0.6104, + "step": 65543 + }, + { + "epoch": 1.68, + "learning_rate": 8.548572296818681e-07, + "loss": 0.5947, + "step": 65544 + }, + { + "epoch": 1.68, + "learning_rate": 8.548298522936766e-07, + "loss": 0.3641, + "step": 65545 + }, + { + "epoch": 1.68, + "learning_rate": 8.54802475016635e-07, + "loss": 0.5718, + "step": 65546 + }, + { + "epoch": 1.68, + "learning_rate": 8.547750978507647e-07, + "loss": 0.6123, + "step": 65547 + }, + { + "epoch": 1.68, + "learning_rate": 8.547477207960867e-07, + "loss": 0.7046, + "step": 65548 + }, + { + "epoch": 1.68, + "learning_rate": 8.547203438526213e-07, + "loss": 0.605, + "step": 65549 + }, + { + "epoch": 1.68, + "learning_rate": 8.546929670203899e-07, + "loss": 0.7061, + "step": 65550 + }, + { + "epoch": 1.68, + "learning_rate": 8.546655902994133e-07, + "loss": 0.4492, + "step": 65551 + }, + { + "epoch": 1.68, + "learning_rate": 8.546382136897127e-07, + "loss": 0.5557, + "step": 65552 + }, + { + "epoch": 1.68, + "learning_rate": 8.546108371913089e-07, + "loss": 0.4873, + "step": 65553 + }, + { + "epoch": 1.68, + "learning_rate": 8.545834608042229e-07, + "loss": 0.5664, + "step": 65554 + }, + { + "epoch": 1.68, + "learning_rate": 8.545560845284756e-07, + "loss": 0.5605, + "step": 65555 + }, + { + "epoch": 1.68, + "learning_rate": 8.545287083640882e-07, + "loss": 0.8115, + "step": 65556 + }, + { + "epoch": 1.68, + "learning_rate": 8.545013323110812e-07, + "loss": 0.5542, + "step": 65557 + }, + { + "epoch": 1.68, + "learning_rate": 8.544739563694765e-07, + "loss": 0.3495, + "step": 65558 + }, + { + "epoch": 1.68, + "learning_rate": 8.544465805392937e-07, + "loss": 0.6758, + "step": 65559 + }, + { + "epoch": 1.68, + "learning_rate": 8.544192048205548e-07, + "loss": 0.4863, + "step": 65560 + }, + { + "epoch": 1.68, + "learning_rate": 8.543918292132803e-07, + "loss": 0.6279, + "step": 65561 + }, + { + "epoch": 1.68, + "learning_rate": 8.543644537174913e-07, + "loss": 0.5916, + "step": 65562 + }, + { + "epoch": 1.68, + "learning_rate": 8.543370783332085e-07, + "loss": 0.387, + "step": 65563 + }, + { + "epoch": 1.68, + "learning_rate": 8.543097030604534e-07, + "loss": 0.6704, + "step": 65564 + }, + { + "epoch": 1.68, + "learning_rate": 8.542823278992465e-07, + "loss": 0.7988, + "step": 65565 + }, + { + "epoch": 1.68, + "learning_rate": 8.542549528496091e-07, + "loss": 0.5358, + "step": 65566 + }, + { + "epoch": 1.68, + "learning_rate": 8.542275779115617e-07, + "loss": 0.5364, + "step": 65567 + }, + { + "epoch": 1.68, + "learning_rate": 8.542002030851261e-07, + "loss": 0.6299, + "step": 65568 + }, + { + "epoch": 1.68, + "learning_rate": 8.541728283703223e-07, + "loss": 0.7822, + "step": 65569 + }, + { + "epoch": 1.68, + "learning_rate": 8.541454537671716e-07, + "loss": 0.6885, + "step": 65570 + }, + { + "epoch": 1.68, + "learning_rate": 8.541180792756952e-07, + "loss": 0.6216, + "step": 65571 + }, + { + "epoch": 1.68, + "learning_rate": 8.540907048959136e-07, + "loss": 0.7305, + "step": 65572 + }, + { + "epoch": 1.68, + "learning_rate": 8.540633306278484e-07, + "loss": 0.687, + "step": 65573 + }, + { + "epoch": 1.68, + "learning_rate": 8.540359564715198e-07, + "loss": 0.6689, + "step": 65574 + }, + { + "epoch": 1.68, + "learning_rate": 8.540085824269495e-07, + "loss": 0.5029, + "step": 65575 + }, + { + "epoch": 1.68, + "learning_rate": 8.53981208494158e-07, + "loss": 0.4651, + "step": 65576 + }, + { + "epoch": 1.68, + "learning_rate": 8.539538346731663e-07, + "loss": 0.6792, + "step": 65577 + }, + { + "epoch": 1.68, + "learning_rate": 8.539264609639958e-07, + "loss": 0.6035, + "step": 65578 + }, + { + "epoch": 1.68, + "learning_rate": 8.538990873666669e-07, + "loss": 0.6362, + "step": 65579 + }, + { + "epoch": 1.68, + "learning_rate": 8.538717138812004e-07, + "loss": 0.4749, + "step": 65580 + }, + { + "epoch": 1.68, + "learning_rate": 8.53844340507618e-07, + "loss": 0.5825, + "step": 65581 + }, + { + "epoch": 1.68, + "learning_rate": 8.5381696724594e-07, + "loss": 0.5264, + "step": 65582 + }, + { + "epoch": 1.68, + "learning_rate": 8.537895940961878e-07, + "loss": 0.6372, + "step": 65583 + }, + { + "epoch": 1.68, + "learning_rate": 8.537622210583819e-07, + "loss": 0.5732, + "step": 65584 + }, + { + "epoch": 1.68, + "learning_rate": 8.537348481325439e-07, + "loss": 0.5913, + "step": 65585 + }, + { + "epoch": 1.68, + "learning_rate": 8.537074753186941e-07, + "loss": 0.6738, + "step": 65586 + }, + { + "epoch": 1.68, + "learning_rate": 8.536801026168541e-07, + "loss": 0.6982, + "step": 65587 + }, + { + "epoch": 1.68, + "learning_rate": 8.536527300270446e-07, + "loss": 0.5977, + "step": 65588 + }, + { + "epoch": 1.68, + "learning_rate": 8.536253575492861e-07, + "loss": 0.7109, + "step": 65589 + }, + { + "epoch": 1.68, + "learning_rate": 8.535979851836002e-07, + "loss": 0.8467, + "step": 65590 + }, + { + "epoch": 1.68, + "learning_rate": 8.535706129300073e-07, + "loss": 0.6719, + "step": 65591 + }, + { + "epoch": 1.68, + "learning_rate": 8.535432407885289e-07, + "loss": 0.6826, + "step": 65592 + }, + { + "epoch": 1.68, + "learning_rate": 8.535158687591855e-07, + "loss": 0.6279, + "step": 65593 + }, + { + "epoch": 1.68, + "learning_rate": 8.534884968419984e-07, + "loss": 0.5757, + "step": 65594 + }, + { + "epoch": 1.68, + "learning_rate": 8.534611250369885e-07, + "loss": 0.7764, + "step": 65595 + }, + { + "epoch": 1.68, + "learning_rate": 8.534337533441765e-07, + "loss": 0.561, + "step": 65596 + }, + { + "epoch": 1.68, + "learning_rate": 8.534063817635836e-07, + "loss": 0.604, + "step": 65597 + }, + { + "epoch": 1.68, + "learning_rate": 8.533790102952309e-07, + "loss": 0.4473, + "step": 65598 + }, + { + "epoch": 1.68, + "learning_rate": 8.533516389391388e-07, + "loss": 0.7051, + "step": 65599 + }, + { + "epoch": 1.68, + "learning_rate": 8.533242676953289e-07, + "loss": 0.6455, + "step": 65600 + }, + { + "epoch": 1.68, + "learning_rate": 8.532968965638217e-07, + "loss": 0.5713, + "step": 65601 + }, + { + "epoch": 1.68, + "learning_rate": 8.532695255446383e-07, + "loss": 0.5649, + "step": 65602 + }, + { + "epoch": 1.68, + "learning_rate": 8.532421546377996e-07, + "loss": 0.6924, + "step": 65603 + }, + { + "epoch": 1.68, + "learning_rate": 8.532147838433267e-07, + "loss": 0.8027, + "step": 65604 + }, + { + "epoch": 1.68, + "learning_rate": 8.531874131612406e-07, + "loss": 0.7021, + "step": 65605 + }, + { + "epoch": 1.68, + "learning_rate": 8.531600425915621e-07, + "loss": 0.5129, + "step": 65606 + }, + { + "epoch": 1.68, + "learning_rate": 8.531326721343125e-07, + "loss": 0.5364, + "step": 65607 + }, + { + "epoch": 1.68, + "learning_rate": 8.53105301789512e-07, + "loss": 0.6992, + "step": 65608 + }, + { + "epoch": 1.68, + "learning_rate": 8.530779315571823e-07, + "loss": 0.5879, + "step": 65609 + }, + { + "epoch": 1.68, + "learning_rate": 8.530505614373438e-07, + "loss": 0.625, + "step": 65610 + }, + { + "epoch": 1.68, + "learning_rate": 8.530231914300179e-07, + "loss": 0.6357, + "step": 65611 + }, + { + "epoch": 1.68, + "learning_rate": 8.529958215352255e-07, + "loss": 0.6733, + "step": 65612 + }, + { + "epoch": 1.68, + "learning_rate": 8.529684517529871e-07, + "loss": 0.6333, + "step": 65613 + }, + { + "epoch": 1.68, + "learning_rate": 8.529410820833243e-07, + "loss": 0.5618, + "step": 65614 + }, + { + "epoch": 1.68, + "learning_rate": 8.529137125262575e-07, + "loss": 0.6436, + "step": 65615 + }, + { + "epoch": 1.68, + "learning_rate": 8.528863430818081e-07, + "loss": 0.6416, + "step": 65616 + }, + { + "epoch": 1.68, + "learning_rate": 8.528589737499971e-07, + "loss": 0.6396, + "step": 65617 + }, + { + "epoch": 1.68, + "learning_rate": 8.528316045308447e-07, + "loss": 0.7676, + "step": 65618 + }, + { + "epoch": 1.68, + "learning_rate": 8.528042354243727e-07, + "loss": 0.6899, + "step": 65619 + }, + { + "epoch": 1.68, + "learning_rate": 8.527768664306016e-07, + "loss": 0.5659, + "step": 65620 + }, + { + "epoch": 1.68, + "learning_rate": 8.527494975495526e-07, + "loss": 0.7754, + "step": 65621 + }, + { + "epoch": 1.68, + "learning_rate": 8.527221287812462e-07, + "loss": 0.5343, + "step": 65622 + }, + { + "epoch": 1.68, + "learning_rate": 8.526947601257042e-07, + "loss": 0.6855, + "step": 65623 + }, + { + "epoch": 1.68, + "learning_rate": 8.526673915829466e-07, + "loss": 0.4601, + "step": 65624 + }, + { + "epoch": 1.68, + "learning_rate": 8.526400231529951e-07, + "loss": 0.7324, + "step": 65625 + }, + { + "epoch": 1.68, + "learning_rate": 8.526126548358701e-07, + "loss": 0.7041, + "step": 65626 + }, + { + "epoch": 1.68, + "learning_rate": 8.525852866315933e-07, + "loss": 0.7217, + "step": 65627 + }, + { + "epoch": 1.68, + "learning_rate": 8.525579185401849e-07, + "loss": 0.8193, + "step": 65628 + }, + { + "epoch": 1.68, + "learning_rate": 8.525305505616661e-07, + "loss": 0.6572, + "step": 65629 + }, + { + "epoch": 1.68, + "learning_rate": 8.525031826960577e-07, + "loss": 0.6064, + "step": 65630 + }, + { + "epoch": 1.68, + "learning_rate": 8.524758149433811e-07, + "loss": 0.4502, + "step": 65631 + }, + { + "epoch": 1.68, + "learning_rate": 8.524484473036567e-07, + "loss": 0.7617, + "step": 65632 + }, + { + "epoch": 1.68, + "learning_rate": 8.52421079776906e-07, + "loss": 0.6831, + "step": 65633 + }, + { + "epoch": 1.68, + "learning_rate": 8.523937123631494e-07, + "loss": 0.5571, + "step": 65634 + }, + { + "epoch": 1.68, + "learning_rate": 8.523663450624084e-07, + "loss": 0.6543, + "step": 65635 + }, + { + "epoch": 1.68, + "learning_rate": 8.523389778747035e-07, + "loss": 0.5029, + "step": 65636 + }, + { + "epoch": 1.68, + "learning_rate": 8.523116108000563e-07, + "loss": 0.627, + "step": 65637 + }, + { + "epoch": 1.68, + "learning_rate": 8.522842438384872e-07, + "loss": 0.6348, + "step": 65638 + }, + { + "epoch": 1.68, + "learning_rate": 8.522568769900168e-07, + "loss": 0.6143, + "step": 65639 + }, + { + "epoch": 1.68, + "learning_rate": 8.522295102546668e-07, + "loss": 0.7305, + "step": 65640 + }, + { + "epoch": 1.68, + "learning_rate": 8.522021436324578e-07, + "loss": 0.7803, + "step": 65641 + }, + { + "epoch": 1.68, + "learning_rate": 8.521747771234109e-07, + "loss": 0.6895, + "step": 65642 + }, + { + "epoch": 1.68, + "learning_rate": 8.521474107275468e-07, + "loss": 0.5796, + "step": 65643 + }, + { + "epoch": 1.68, + "learning_rate": 8.521200444448869e-07, + "loss": 0.4736, + "step": 65644 + }, + { + "epoch": 1.68, + "learning_rate": 8.520926782754516e-07, + "loss": 0.5659, + "step": 65645 + }, + { + "epoch": 1.68, + "learning_rate": 8.520653122192624e-07, + "loss": 0.6426, + "step": 65646 + }, + { + "epoch": 1.68, + "learning_rate": 8.520379462763402e-07, + "loss": 0.5715, + "step": 65647 + }, + { + "epoch": 1.68, + "learning_rate": 8.520105804467055e-07, + "loss": 0.5625, + "step": 65648 + }, + { + "epoch": 1.68, + "learning_rate": 8.519832147303793e-07, + "loss": 0.7227, + "step": 65649 + }, + { + "epoch": 1.68, + "learning_rate": 8.519558491273829e-07, + "loss": 0.6523, + "step": 65650 + }, + { + "epoch": 1.68, + "learning_rate": 8.51928483637737e-07, + "loss": 0.6392, + "step": 65651 + }, + { + "epoch": 1.68, + "learning_rate": 8.519011182614627e-07, + "loss": 0.667, + "step": 65652 + }, + { + "epoch": 1.68, + "learning_rate": 8.518737529985808e-07, + "loss": 0.6299, + "step": 65653 + }, + { + "epoch": 1.68, + "learning_rate": 8.518463878491126e-07, + "loss": 0.6396, + "step": 65654 + }, + { + "epoch": 1.68, + "learning_rate": 8.518190228130785e-07, + "loss": 0.748, + "step": 65655 + }, + { + "epoch": 1.68, + "learning_rate": 8.517916578905e-07, + "loss": 0.708, + "step": 65656 + }, + { + "epoch": 1.68, + "learning_rate": 8.517642930813981e-07, + "loss": 0.6792, + "step": 65657 + }, + { + "epoch": 1.68, + "learning_rate": 8.51736928385793e-07, + "loss": 0.502, + "step": 65658 + }, + { + "epoch": 1.68, + "learning_rate": 8.517095638037063e-07, + "loss": 0.7568, + "step": 65659 + }, + { + "epoch": 1.68, + "learning_rate": 8.516821993351586e-07, + "loss": 0.7358, + "step": 65660 + }, + { + "epoch": 1.68, + "learning_rate": 8.516548349801711e-07, + "loss": 0.6797, + "step": 65661 + }, + { + "epoch": 1.68, + "learning_rate": 8.516274707387646e-07, + "loss": 0.6123, + "step": 65662 + }, + { + "epoch": 1.68, + "learning_rate": 8.516001066109604e-07, + "loss": 0.8477, + "step": 65663 + }, + { + "epoch": 1.68, + "learning_rate": 8.515727425967788e-07, + "loss": 0.5391, + "step": 65664 + }, + { + "epoch": 1.68, + "learning_rate": 8.515453786962415e-07, + "loss": 0.8867, + "step": 65665 + }, + { + "epoch": 1.68, + "learning_rate": 8.515180149093686e-07, + "loss": 0.5217, + "step": 65666 + }, + { + "epoch": 1.68, + "learning_rate": 8.514906512361823e-07, + "loss": 0.8174, + "step": 65667 + }, + { + "epoch": 1.68, + "learning_rate": 8.514632876767023e-07, + "loss": 0.5137, + "step": 65668 + }, + { + "epoch": 1.68, + "learning_rate": 8.514359242309501e-07, + "loss": 0.665, + "step": 65669 + }, + { + "epoch": 1.68, + "learning_rate": 8.514085608989463e-07, + "loss": 0.7578, + "step": 65670 + }, + { + "epoch": 1.68, + "learning_rate": 8.513811976807125e-07, + "loss": 0.6357, + "step": 65671 + }, + { + "epoch": 1.68, + "learning_rate": 8.51353834576269e-07, + "loss": 0.686, + "step": 65672 + }, + { + "epoch": 1.68, + "learning_rate": 8.513264715856372e-07, + "loss": 0.7549, + "step": 65673 + }, + { + "epoch": 1.68, + "learning_rate": 8.512991087088377e-07, + "loss": 0.6445, + "step": 65674 + }, + { + "epoch": 1.68, + "learning_rate": 8.512717459458919e-07, + "loss": 0.5786, + "step": 65675 + }, + { + "epoch": 1.68, + "learning_rate": 8.512443832968202e-07, + "loss": 0.6152, + "step": 65676 + }, + { + "epoch": 1.68, + "learning_rate": 8.512170207616444e-07, + "loss": 0.7627, + "step": 65677 + }, + { + "epoch": 1.68, + "learning_rate": 8.511896583403846e-07, + "loss": 0.5471, + "step": 65678 + }, + { + "epoch": 1.68, + "learning_rate": 8.511622960330617e-07, + "loss": 0.6943, + "step": 65679 + }, + { + "epoch": 1.68, + "learning_rate": 8.511349338396974e-07, + "loss": 0.6348, + "step": 65680 + }, + { + "epoch": 1.68, + "learning_rate": 8.511075717603117e-07, + "loss": 0.7188, + "step": 65681 + }, + { + "epoch": 1.68, + "learning_rate": 8.510802097949266e-07, + "loss": 0.6738, + "step": 65682 + }, + { + "epoch": 1.68, + "learning_rate": 8.510528479435623e-07, + "loss": 0.7314, + "step": 65683 + }, + { + "epoch": 1.68, + "learning_rate": 8.510254862062401e-07, + "loss": 0.5681, + "step": 65684 + }, + { + "epoch": 1.68, + "learning_rate": 8.50998124582981e-07, + "loss": 0.5032, + "step": 65685 + }, + { + "epoch": 1.68, + "learning_rate": 8.509707630738053e-07, + "loss": 0.793, + "step": 65686 + }, + { + "epoch": 1.68, + "learning_rate": 8.509434016787351e-07, + "loss": 0.7231, + "step": 65687 + }, + { + "epoch": 1.68, + "learning_rate": 8.509160403977904e-07, + "loss": 0.6035, + "step": 65688 + }, + { + "epoch": 1.68, + "learning_rate": 8.508886792309921e-07, + "loss": 0.6367, + "step": 65689 + }, + { + "epoch": 1.68, + "learning_rate": 8.508613181783618e-07, + "loss": 0.7822, + "step": 65690 + }, + { + "epoch": 1.68, + "learning_rate": 8.508339572399199e-07, + "loss": 0.8281, + "step": 65691 + }, + { + "epoch": 1.68, + "learning_rate": 8.508065964156878e-07, + "loss": 0.6826, + "step": 65692 + }, + { + "epoch": 1.68, + "learning_rate": 8.507792357056862e-07, + "loss": 0.7715, + "step": 65693 + }, + { + "epoch": 1.68, + "learning_rate": 8.50751875109936e-07, + "loss": 0.5767, + "step": 65694 + }, + { + "epoch": 1.68, + "learning_rate": 8.507245146284581e-07, + "loss": 0.4414, + "step": 65695 + }, + { + "epoch": 1.68, + "learning_rate": 8.506971542612738e-07, + "loss": 0.6846, + "step": 65696 + }, + { + "epoch": 1.68, + "learning_rate": 8.506697940084041e-07, + "loss": 0.5933, + "step": 65697 + }, + { + "epoch": 1.68, + "learning_rate": 8.506424338698692e-07, + "loss": 0.6855, + "step": 65698 + }, + { + "epoch": 1.68, + "learning_rate": 8.506150738456907e-07, + "loss": 0.5044, + "step": 65699 + }, + { + "epoch": 1.68, + "learning_rate": 8.505877139358892e-07, + "loss": 0.5564, + "step": 65700 + }, + { + "epoch": 1.68, + "learning_rate": 8.50560354140486e-07, + "loss": 0.6382, + "step": 65701 + }, + { + "epoch": 1.68, + "learning_rate": 8.505329944595019e-07, + "loss": 0.7695, + "step": 65702 + }, + { + "epoch": 1.68, + "learning_rate": 8.505056348929575e-07, + "loss": 0.6475, + "step": 65703 + }, + { + "epoch": 1.68, + "learning_rate": 8.504782754408743e-07, + "loss": 0.7002, + "step": 65704 + }, + { + "epoch": 1.68, + "learning_rate": 8.504509161032729e-07, + "loss": 0.6143, + "step": 65705 + }, + { + "epoch": 1.68, + "learning_rate": 8.504235568801745e-07, + "loss": 0.6655, + "step": 65706 + }, + { + "epoch": 1.68, + "learning_rate": 8.503961977716002e-07, + "loss": 0.9082, + "step": 65707 + }, + { + "epoch": 1.68, + "learning_rate": 8.503688387775703e-07, + "loss": 0.7812, + "step": 65708 + }, + { + "epoch": 1.68, + "learning_rate": 8.503414798981061e-07, + "loss": 0.6719, + "step": 65709 + }, + { + "epoch": 1.68, + "learning_rate": 8.503141211332285e-07, + "loss": 0.3951, + "step": 65710 + }, + { + "epoch": 1.68, + "learning_rate": 8.502867624829585e-07, + "loss": 0.6562, + "step": 65711 + }, + { + "epoch": 1.68, + "learning_rate": 8.50259403947317e-07, + "loss": 0.917, + "step": 65712 + }, + { + "epoch": 1.68, + "learning_rate": 8.502320455263251e-07, + "loss": 0.6733, + "step": 65713 + }, + { + "epoch": 1.68, + "learning_rate": 8.502046872200035e-07, + "loss": 0.6543, + "step": 65714 + }, + { + "epoch": 1.68, + "learning_rate": 8.501773290283734e-07, + "loss": 0.6597, + "step": 65715 + }, + { + "epoch": 1.68, + "learning_rate": 8.501499709514556e-07, + "loss": 0.5615, + "step": 65716 + }, + { + "epoch": 1.68, + "learning_rate": 8.501226129892714e-07, + "loss": 0.6213, + "step": 65717 + }, + { + "epoch": 1.68, + "learning_rate": 8.500952551418412e-07, + "loss": 0.5127, + "step": 65718 + }, + { + "epoch": 1.68, + "learning_rate": 8.500678974091862e-07, + "loss": 0.501, + "step": 65719 + }, + { + "epoch": 1.68, + "learning_rate": 8.500405397913271e-07, + "loss": 0.6943, + "step": 65720 + }, + { + "epoch": 1.68, + "learning_rate": 8.500131822882852e-07, + "loss": 0.5752, + "step": 65721 + }, + { + "epoch": 1.68, + "learning_rate": 8.499858249000811e-07, + "loss": 0.6191, + "step": 65722 + }, + { + "epoch": 1.68, + "learning_rate": 8.499584676267362e-07, + "loss": 0.6233, + "step": 65723 + }, + { + "epoch": 1.68, + "learning_rate": 8.49931110468271e-07, + "loss": 0.9092, + "step": 65724 + }, + { + "epoch": 1.68, + "learning_rate": 8.499037534247068e-07, + "loss": 0.6777, + "step": 65725 + }, + { + "epoch": 1.68, + "learning_rate": 8.498763964960644e-07, + "loss": 0.7246, + "step": 65726 + }, + { + "epoch": 1.68, + "learning_rate": 8.49849039682365e-07, + "loss": 0.645, + "step": 65727 + }, + { + "epoch": 1.68, + "learning_rate": 8.498216829836291e-07, + "loss": 0.5859, + "step": 65728 + }, + { + "epoch": 1.68, + "learning_rate": 8.497943263998775e-07, + "loss": 0.5981, + "step": 65729 + }, + { + "epoch": 1.68, + "learning_rate": 8.497669699311318e-07, + "loss": 0.6299, + "step": 65730 + }, + { + "epoch": 1.68, + "learning_rate": 8.497396135774125e-07, + "loss": 0.687, + "step": 65731 + }, + { + "epoch": 1.68, + "learning_rate": 8.497122573387407e-07, + "loss": 0.6606, + "step": 65732 + }, + { + "epoch": 1.68, + "learning_rate": 8.496849012151372e-07, + "loss": 0.5479, + "step": 65733 + }, + { + "epoch": 1.68, + "learning_rate": 8.496575452066234e-07, + "loss": 0.7656, + "step": 65734 + }, + { + "epoch": 1.68, + "learning_rate": 8.496301893132195e-07, + "loss": 0.3424, + "step": 65735 + }, + { + "epoch": 1.68, + "learning_rate": 8.496028335349471e-07, + "loss": 0.6836, + "step": 65736 + }, + { + "epoch": 1.68, + "learning_rate": 8.495754778718272e-07, + "loss": 0.5796, + "step": 65737 + }, + { + "epoch": 1.68, + "learning_rate": 8.4954812232388e-07, + "loss": 0.8076, + "step": 65738 + }, + { + "epoch": 1.68, + "learning_rate": 8.49520766891127e-07, + "loss": 0.5713, + "step": 65739 + }, + { + "epoch": 1.68, + "learning_rate": 8.49493411573589e-07, + "loss": 0.6582, + "step": 65740 + }, + { + "epoch": 1.68, + "learning_rate": 8.494660563712869e-07, + "loss": 0.6177, + "step": 65741 + }, + { + "epoch": 1.69, + "learning_rate": 8.494387012842418e-07, + "loss": 0.7397, + "step": 65742 + }, + { + "epoch": 1.69, + "learning_rate": 8.494113463124743e-07, + "loss": 0.4883, + "step": 65743 + }, + { + "epoch": 1.69, + "learning_rate": 8.49383991456006e-07, + "loss": 0.6221, + "step": 65744 + }, + { + "epoch": 1.69, + "learning_rate": 8.493566367148573e-07, + "loss": 0.6016, + "step": 65745 + }, + { + "epoch": 1.69, + "learning_rate": 8.493292820890493e-07, + "loss": 0.6245, + "step": 65746 + }, + { + "epoch": 1.69, + "learning_rate": 8.493019275786033e-07, + "loss": 0.7891, + "step": 65747 + }, + { + "epoch": 1.69, + "learning_rate": 8.492745731835394e-07, + "loss": 0.5923, + "step": 65748 + }, + { + "epoch": 1.69, + "learning_rate": 8.492472189038792e-07, + "loss": 0.6826, + "step": 65749 + }, + { + "epoch": 1.69, + "learning_rate": 8.492198647396433e-07, + "loss": 0.6387, + "step": 65750 + }, + { + "epoch": 1.69, + "learning_rate": 8.491925106908531e-07, + "loss": 0.7275, + "step": 65751 + }, + { + "epoch": 1.69, + "learning_rate": 8.491651567575289e-07, + "loss": 0.832, + "step": 65752 + }, + { + "epoch": 1.69, + "learning_rate": 8.491378029396923e-07, + "loss": 0.3721, + "step": 65753 + }, + { + "epoch": 1.69, + "learning_rate": 8.491104492373638e-07, + "loss": 0.7461, + "step": 65754 + }, + { + "epoch": 1.69, + "learning_rate": 8.490830956505645e-07, + "loss": 0.6357, + "step": 65755 + }, + { + "epoch": 1.69, + "learning_rate": 8.490557421793153e-07, + "loss": 0.6133, + "step": 65756 + }, + { + "epoch": 1.69, + "learning_rate": 8.490283888236378e-07, + "loss": 0.5947, + "step": 65757 + }, + { + "epoch": 1.69, + "learning_rate": 8.490010355835516e-07, + "loss": 0.5068, + "step": 65758 + }, + { + "epoch": 1.69, + "learning_rate": 8.489736824590786e-07, + "loss": 0.6885, + "step": 65759 + }, + { + "epoch": 1.69, + "learning_rate": 8.489463294502394e-07, + "loss": 0.8184, + "step": 65760 + }, + { + "epoch": 1.69, + "learning_rate": 8.489189765570551e-07, + "loss": 0.707, + "step": 65761 + }, + { + "epoch": 1.69, + "learning_rate": 8.488916237795465e-07, + "loss": 0.8125, + "step": 65762 + }, + { + "epoch": 1.69, + "learning_rate": 8.488642711177347e-07, + "loss": 0.5701, + "step": 65763 + }, + { + "epoch": 1.69, + "learning_rate": 8.488369185716405e-07, + "loss": 0.5371, + "step": 65764 + }, + { + "epoch": 1.69, + "learning_rate": 8.488095661412852e-07, + "loss": 0.7168, + "step": 65765 + }, + { + "epoch": 1.69, + "learning_rate": 8.487822138266891e-07, + "loss": 0.6265, + "step": 65766 + }, + { + "epoch": 1.69, + "learning_rate": 8.487548616278741e-07, + "loss": 0.46, + "step": 65767 + }, + { + "epoch": 1.69, + "learning_rate": 8.487275095448602e-07, + "loss": 0.5259, + "step": 65768 + }, + { + "epoch": 1.69, + "learning_rate": 8.487001575776685e-07, + "loss": 0.8232, + "step": 65769 + }, + { + "epoch": 1.69, + "learning_rate": 8.486728057263203e-07, + "loss": 0.6543, + "step": 65770 + }, + { + "epoch": 1.69, + "learning_rate": 8.486454539908362e-07, + "loss": 0.6768, + "step": 65771 + }, + { + "epoch": 1.69, + "learning_rate": 8.486181023712375e-07, + "loss": 0.5343, + "step": 65772 + }, + { + "epoch": 1.69, + "learning_rate": 8.485907508675448e-07, + "loss": 0.6372, + "step": 65773 + }, + { + "epoch": 1.69, + "learning_rate": 8.485633994797794e-07, + "loss": 0.8125, + "step": 65774 + }, + { + "epoch": 1.69, + "learning_rate": 8.485360482079621e-07, + "loss": 0.6606, + "step": 65775 + }, + { + "epoch": 1.69, + "learning_rate": 8.485086970521135e-07, + "loss": 0.5942, + "step": 65776 + }, + { + "epoch": 1.69, + "learning_rate": 8.484813460122553e-07, + "loss": 0.4692, + "step": 65777 + }, + { + "epoch": 1.69, + "learning_rate": 8.484539950884077e-07, + "loss": 0.6426, + "step": 65778 + }, + { + "epoch": 1.69, + "learning_rate": 8.484266442805916e-07, + "loss": 0.6533, + "step": 65779 + }, + { + "epoch": 1.69, + "learning_rate": 8.483992935888287e-07, + "loss": 0.5964, + "step": 65780 + }, + { + "epoch": 1.69, + "learning_rate": 8.48371943013139e-07, + "loss": 0.5068, + "step": 65781 + }, + { + "epoch": 1.69, + "learning_rate": 8.483445925535444e-07, + "loss": 0.6855, + "step": 65782 + }, + { + "epoch": 1.69, + "learning_rate": 8.483172422100651e-07, + "loss": 0.5957, + "step": 65783 + }, + { + "epoch": 1.69, + "learning_rate": 8.482898919827224e-07, + "loss": 0.4897, + "step": 65784 + }, + { + "epoch": 1.69, + "learning_rate": 8.48262541871537e-07, + "loss": 0.7129, + "step": 65785 + }, + { + "epoch": 1.69, + "learning_rate": 8.482351918765303e-07, + "loss": 0.457, + "step": 65786 + }, + { + "epoch": 1.69, + "learning_rate": 8.48207841997723e-07, + "loss": 0.6646, + "step": 65787 + }, + { + "epoch": 1.69, + "learning_rate": 8.481804922351357e-07, + "loss": 0.7295, + "step": 65788 + }, + { + "epoch": 1.69, + "learning_rate": 8.481531425887898e-07, + "loss": 0.6733, + "step": 65789 + }, + { + "epoch": 1.69, + "learning_rate": 8.481257930587058e-07, + "loss": 0.6631, + "step": 65790 + }, + { + "epoch": 1.69, + "learning_rate": 8.48098443644905e-07, + "loss": 0.7627, + "step": 65791 + }, + { + "epoch": 1.69, + "learning_rate": 8.480710943474084e-07, + "loss": 0.6816, + "step": 65792 + }, + { + "epoch": 1.69, + "learning_rate": 8.480437451662365e-07, + "loss": 0.7012, + "step": 65793 + }, + { + "epoch": 1.69, + "learning_rate": 8.480163961014108e-07, + "loss": 0.7454, + "step": 65794 + }, + { + "epoch": 1.69, + "learning_rate": 8.479890471529516e-07, + "loss": 0.7319, + "step": 65795 + }, + { + "epoch": 1.69, + "learning_rate": 8.479616983208805e-07, + "loss": 0.4592, + "step": 65796 + }, + { + "epoch": 1.69, + "learning_rate": 8.479343496052183e-07, + "loss": 0.5879, + "step": 65797 + }, + { + "epoch": 1.69, + "learning_rate": 8.479070010059854e-07, + "loss": 0.7861, + "step": 65798 + }, + { + "epoch": 1.69, + "learning_rate": 8.478796525232034e-07, + "loss": 0.7061, + "step": 65799 + }, + { + "epoch": 1.69, + "learning_rate": 8.478523041568926e-07, + "loss": 0.6807, + "step": 65800 + }, + { + "epoch": 1.69, + "learning_rate": 8.478249559070746e-07, + "loss": 0.6729, + "step": 65801 + }, + { + "epoch": 1.69, + "learning_rate": 8.477976077737698e-07, + "loss": 0.6299, + "step": 65802 + }, + { + "epoch": 1.69, + "learning_rate": 8.477702597569996e-07, + "loss": 0.7627, + "step": 65803 + }, + { + "epoch": 1.69, + "learning_rate": 8.477429118567845e-07, + "loss": 0.6201, + "step": 65804 + }, + { + "epoch": 1.69, + "learning_rate": 8.477155640731458e-07, + "loss": 0.5421, + "step": 65805 + }, + { + "epoch": 1.69, + "learning_rate": 8.476882164061041e-07, + "loss": 0.6455, + "step": 65806 + }, + { + "epoch": 1.69, + "learning_rate": 8.47660868855681e-07, + "loss": 0.7451, + "step": 65807 + }, + { + "epoch": 1.69, + "learning_rate": 8.476335214218967e-07, + "loss": 0.6064, + "step": 65808 + }, + { + "epoch": 1.69, + "learning_rate": 8.476061741047725e-07, + "loss": 0.71, + "step": 65809 + }, + { + "epoch": 1.69, + "learning_rate": 8.475788269043289e-07, + "loss": 0.6836, + "step": 65810 + }, + { + "epoch": 1.69, + "learning_rate": 8.475514798205875e-07, + "loss": 0.5649, + "step": 65811 + }, + { + "epoch": 1.69, + "learning_rate": 8.475241328535687e-07, + "loss": 0.6572, + "step": 65812 + }, + { + "epoch": 1.69, + "learning_rate": 8.474967860032938e-07, + "loss": 0.8047, + "step": 65813 + }, + { + "epoch": 1.69, + "learning_rate": 8.474694392697834e-07, + "loss": 0.5486, + "step": 65814 + }, + { + "epoch": 1.69, + "learning_rate": 8.47442092653059e-07, + "loss": 0.8057, + "step": 65815 + }, + { + "epoch": 1.69, + "learning_rate": 8.474147461531408e-07, + "loss": 0.7227, + "step": 65816 + }, + { + "epoch": 1.69, + "learning_rate": 8.473873997700506e-07, + "loss": 0.6875, + "step": 65817 + }, + { + "epoch": 1.69, + "learning_rate": 8.473600535038086e-07, + "loss": 0.562, + "step": 65818 + }, + { + "epoch": 1.69, + "learning_rate": 8.473327073544358e-07, + "loss": 0.48, + "step": 65819 + }, + { + "epoch": 1.69, + "learning_rate": 8.473053613219535e-07, + "loss": 0.8115, + "step": 65820 + }, + { + "epoch": 1.69, + "learning_rate": 8.472780154063824e-07, + "loss": 0.6079, + "step": 65821 + }, + { + "epoch": 1.69, + "learning_rate": 8.472506696077435e-07, + "loss": 0.7256, + "step": 65822 + }, + { + "epoch": 1.69, + "learning_rate": 8.472233239260576e-07, + "loss": 0.3335, + "step": 65823 + }, + { + "epoch": 1.69, + "learning_rate": 8.471959783613461e-07, + "loss": 0.7129, + "step": 65824 + }, + { + "epoch": 1.69, + "learning_rate": 8.471686329136293e-07, + "loss": 0.7266, + "step": 65825 + }, + { + "epoch": 1.69, + "learning_rate": 8.471412875829287e-07, + "loss": 0.7212, + "step": 65826 + }, + { + "epoch": 1.69, + "learning_rate": 8.471139423692652e-07, + "loss": 0.6304, + "step": 65827 + }, + { + "epoch": 1.69, + "learning_rate": 8.470865972726593e-07, + "loss": 0.7144, + "step": 65828 + }, + { + "epoch": 1.69, + "learning_rate": 8.47059252293132e-07, + "loss": 0.8047, + "step": 65829 + }, + { + "epoch": 1.69, + "learning_rate": 8.470319074307044e-07, + "loss": 0.6807, + "step": 65830 + }, + { + "epoch": 1.69, + "learning_rate": 8.470045626853974e-07, + "loss": 0.5903, + "step": 65831 + }, + { + "epoch": 1.69, + "learning_rate": 8.469772180572322e-07, + "loss": 0.6826, + "step": 65832 + }, + { + "epoch": 1.69, + "learning_rate": 8.469498735462293e-07, + "loss": 0.7783, + "step": 65833 + }, + { + "epoch": 1.69, + "learning_rate": 8.469225291524099e-07, + "loss": 0.6826, + "step": 65834 + }, + { + "epoch": 1.69, + "learning_rate": 8.468951848757948e-07, + "loss": 0.7026, + "step": 65835 + }, + { + "epoch": 1.69, + "learning_rate": 8.468678407164052e-07, + "loss": 0.6343, + "step": 65836 + }, + { + "epoch": 1.69, + "learning_rate": 8.468404966742622e-07, + "loss": 0.5322, + "step": 65837 + }, + { + "epoch": 1.69, + "learning_rate": 8.468131527493858e-07, + "loss": 0.7344, + "step": 65838 + }, + { + "epoch": 1.69, + "learning_rate": 8.467858089417978e-07, + "loss": 0.5209, + "step": 65839 + }, + { + "epoch": 1.69, + "learning_rate": 8.467584652515185e-07, + "loss": 0.6013, + "step": 65840 + }, + { + "epoch": 1.69, + "learning_rate": 8.467311216785695e-07, + "loss": 0.6602, + "step": 65841 + }, + { + "epoch": 1.69, + "learning_rate": 8.467037782229714e-07, + "loss": 0.5405, + "step": 65842 + }, + { + "epoch": 1.69, + "learning_rate": 8.466764348847451e-07, + "loss": 0.8154, + "step": 65843 + }, + { + "epoch": 1.69, + "learning_rate": 8.466490916639116e-07, + "loss": 0.6768, + "step": 65844 + }, + { + "epoch": 1.69, + "learning_rate": 8.46621748560492e-07, + "loss": 0.7129, + "step": 65845 + }, + { + "epoch": 1.69, + "learning_rate": 8.465944055745068e-07, + "loss": 0.7412, + "step": 65846 + }, + { + "epoch": 1.69, + "learning_rate": 8.465670627059778e-07, + "loss": 0.4684, + "step": 65847 + }, + { + "epoch": 1.69, + "learning_rate": 8.465397199549249e-07, + "loss": 0.5708, + "step": 65848 + }, + { + "epoch": 1.69, + "learning_rate": 8.465123773213696e-07, + "loss": 0.519, + "step": 65849 + }, + { + "epoch": 1.69, + "learning_rate": 8.464850348053326e-07, + "loss": 0.7178, + "step": 65850 + }, + { + "epoch": 1.69, + "learning_rate": 8.464576924068349e-07, + "loss": 0.7012, + "step": 65851 + }, + { + "epoch": 1.69, + "learning_rate": 8.464303501258975e-07, + "loss": 0.5361, + "step": 65852 + }, + { + "epoch": 1.69, + "learning_rate": 8.464030079625414e-07, + "loss": 0.5293, + "step": 65853 + }, + { + "epoch": 1.69, + "learning_rate": 8.463756659167874e-07, + "loss": 0.7793, + "step": 65854 + }, + { + "epoch": 1.69, + "learning_rate": 8.463483239886565e-07, + "loss": 0.5889, + "step": 65855 + }, + { + "epoch": 1.69, + "learning_rate": 8.463209821781695e-07, + "loss": 0.6807, + "step": 65856 + }, + { + "epoch": 1.69, + "learning_rate": 8.462936404853479e-07, + "loss": 0.6089, + "step": 65857 + }, + { + "epoch": 1.69, + "learning_rate": 8.462662989102121e-07, + "loss": 0.5347, + "step": 65858 + }, + { + "epoch": 1.69, + "learning_rate": 8.462389574527826e-07, + "loss": 0.7021, + "step": 65859 + }, + { + "epoch": 1.69, + "learning_rate": 8.462116161130814e-07, + "loss": 0.688, + "step": 65860 + }, + { + "epoch": 1.69, + "learning_rate": 8.461842748911285e-07, + "loss": 0.6167, + "step": 65861 + }, + { + "epoch": 1.69, + "learning_rate": 8.461569337869454e-07, + "loss": 0.8242, + "step": 65862 + }, + { + "epoch": 1.69, + "learning_rate": 8.461295928005528e-07, + "loss": 0.6328, + "step": 65863 + }, + { + "epoch": 1.69, + "learning_rate": 8.461022519319719e-07, + "loss": 0.6709, + "step": 65864 + }, + { + "epoch": 1.69, + "learning_rate": 8.460749111812233e-07, + "loss": 0.6533, + "step": 65865 + }, + { + "epoch": 1.69, + "learning_rate": 8.460475705483278e-07, + "loss": 0.6709, + "step": 65866 + }, + { + "epoch": 1.69, + "learning_rate": 8.460202300333073e-07, + "loss": 0.4055, + "step": 65867 + }, + { + "epoch": 1.69, + "learning_rate": 8.459928896361816e-07, + "loss": 0.4274, + "step": 65868 + }, + { + "epoch": 1.69, + "learning_rate": 8.45965549356972e-07, + "loss": 0.5371, + "step": 65869 + }, + { + "epoch": 1.69, + "learning_rate": 8.459382091956996e-07, + "loss": 0.533, + "step": 65870 + }, + { + "epoch": 1.69, + "learning_rate": 8.45910869152385e-07, + "loss": 0.5486, + "step": 65871 + }, + { + "epoch": 1.69, + "learning_rate": 8.458835292270496e-07, + "loss": 0.6455, + "step": 65872 + }, + { + "epoch": 1.69, + "learning_rate": 8.458561894197138e-07, + "loss": 0.7168, + "step": 65873 + }, + { + "epoch": 1.69, + "learning_rate": 8.458288497303992e-07, + "loss": 0.6631, + "step": 65874 + }, + { + "epoch": 1.69, + "learning_rate": 8.45801510159126e-07, + "loss": 0.5669, + "step": 65875 + }, + { + "epoch": 1.69, + "learning_rate": 8.457741707059158e-07, + "loss": 0.7261, + "step": 65876 + }, + { + "epoch": 1.69, + "learning_rate": 8.457468313707895e-07, + "loss": 0.4729, + "step": 65877 + }, + { + "epoch": 1.69, + "learning_rate": 8.457194921537673e-07, + "loss": 0.6562, + "step": 65878 + }, + { + "epoch": 1.69, + "learning_rate": 8.456921530548707e-07, + "loss": 0.6934, + "step": 65879 + }, + { + "epoch": 1.69, + "learning_rate": 8.456648140741204e-07, + "loss": 0.4998, + "step": 65880 + }, + { + "epoch": 1.69, + "learning_rate": 8.456374752115376e-07, + "loss": 0.7197, + "step": 65881 + }, + { + "epoch": 1.69, + "learning_rate": 8.456101364671431e-07, + "loss": 0.397, + "step": 65882 + }, + { + "epoch": 1.69, + "learning_rate": 8.455827978409578e-07, + "loss": 0.7109, + "step": 65883 + }, + { + "epoch": 1.69, + "learning_rate": 8.455554593330025e-07, + "loss": 0.7432, + "step": 65884 + }, + { + "epoch": 1.69, + "learning_rate": 8.455281209432984e-07, + "loss": 0.7656, + "step": 65885 + }, + { + "epoch": 1.69, + "learning_rate": 8.455007826718663e-07, + "loss": 0.6316, + "step": 65886 + }, + { + "epoch": 1.69, + "learning_rate": 8.454734445187274e-07, + "loss": 0.5894, + "step": 65887 + }, + { + "epoch": 1.69, + "learning_rate": 8.454461064839021e-07, + "loss": 0.6636, + "step": 65888 + }, + { + "epoch": 1.69, + "learning_rate": 8.454187685674118e-07, + "loss": 0.7104, + "step": 65889 + }, + { + "epoch": 1.69, + "learning_rate": 8.453914307692768e-07, + "loss": 0.689, + "step": 65890 + }, + { + "epoch": 1.69, + "learning_rate": 8.45364093089519e-07, + "loss": 0.6587, + "step": 65891 + }, + { + "epoch": 1.69, + "learning_rate": 8.453367555281584e-07, + "loss": 0.7256, + "step": 65892 + }, + { + "epoch": 1.69, + "learning_rate": 8.453094180852166e-07, + "loss": 0.5913, + "step": 65893 + }, + { + "epoch": 1.69, + "learning_rate": 8.452820807607139e-07, + "loss": 0.6611, + "step": 65894 + }, + { + "epoch": 1.69, + "learning_rate": 8.45254743554672e-07, + "loss": 0.6387, + "step": 65895 + }, + { + "epoch": 1.69, + "learning_rate": 8.452274064671112e-07, + "loss": 0.5737, + "step": 65896 + }, + { + "epoch": 1.69, + "learning_rate": 8.452000694980531e-07, + "loss": 0.645, + "step": 65897 + }, + { + "epoch": 1.69, + "learning_rate": 8.451727326475179e-07, + "loss": 0.5923, + "step": 65898 + }, + { + "epoch": 1.69, + "learning_rate": 8.451453959155268e-07, + "loss": 0.5029, + "step": 65899 + }, + { + "epoch": 1.69, + "learning_rate": 8.451180593021006e-07, + "loss": 0.6602, + "step": 65900 + }, + { + "epoch": 1.69, + "learning_rate": 8.450907228072606e-07, + "loss": 0.749, + "step": 65901 + }, + { + "epoch": 1.69, + "learning_rate": 8.450633864310272e-07, + "loss": 0.6133, + "step": 65902 + }, + { + "epoch": 1.69, + "learning_rate": 8.450360501734219e-07, + "loss": 0.5879, + "step": 65903 + }, + { + "epoch": 1.69, + "learning_rate": 8.450087140344653e-07, + "loss": 0.6436, + "step": 65904 + }, + { + "epoch": 1.69, + "learning_rate": 8.449813780141784e-07, + "loss": 0.6641, + "step": 65905 + }, + { + "epoch": 1.69, + "learning_rate": 8.449540421125824e-07, + "loss": 0.6038, + "step": 65906 + }, + { + "epoch": 1.69, + "learning_rate": 8.449267063296977e-07, + "loss": 0.5698, + "step": 65907 + }, + { + "epoch": 1.69, + "learning_rate": 8.448993706655455e-07, + "loss": 0.6953, + "step": 65908 + }, + { + "epoch": 1.69, + "learning_rate": 8.448720351201466e-07, + "loss": 0.5757, + "step": 65909 + }, + { + "epoch": 1.69, + "learning_rate": 8.448446996935222e-07, + "loss": 0.6079, + "step": 65910 + }, + { + "epoch": 1.69, + "learning_rate": 8.44817364385693e-07, + "loss": 0.6514, + "step": 65911 + }, + { + "epoch": 1.69, + "learning_rate": 8.447900291966801e-07, + "loss": 0.467, + "step": 65912 + }, + { + "epoch": 1.69, + "learning_rate": 8.447626941265041e-07, + "loss": 0.6265, + "step": 65913 + }, + { + "epoch": 1.69, + "learning_rate": 8.447353591751865e-07, + "loss": 0.6084, + "step": 65914 + }, + { + "epoch": 1.69, + "learning_rate": 8.447080243427476e-07, + "loss": 0.7295, + "step": 65915 + }, + { + "epoch": 1.69, + "learning_rate": 8.446806896292094e-07, + "loss": 0.7178, + "step": 65916 + }, + { + "epoch": 1.69, + "learning_rate": 8.446533550345912e-07, + "loss": 0.6299, + "step": 65917 + }, + { + "epoch": 1.69, + "learning_rate": 8.446260205589151e-07, + "loss": 0.7373, + "step": 65918 + }, + { + "epoch": 1.69, + "learning_rate": 8.445986862022014e-07, + "loss": 0.5796, + "step": 65919 + }, + { + "epoch": 1.69, + "learning_rate": 8.445713519644717e-07, + "loss": 0.6152, + "step": 65920 + }, + { + "epoch": 1.69, + "learning_rate": 8.445440178457463e-07, + "loss": 0.7344, + "step": 65921 + }, + { + "epoch": 1.69, + "learning_rate": 8.445166838460467e-07, + "loss": 0.8486, + "step": 65922 + }, + { + "epoch": 1.69, + "learning_rate": 8.444893499653931e-07, + "loss": 0.7109, + "step": 65923 + }, + { + "epoch": 1.69, + "learning_rate": 8.444620162038073e-07, + "loss": 0.665, + "step": 65924 + }, + { + "epoch": 1.69, + "learning_rate": 8.444346825613094e-07, + "loss": 0.6753, + "step": 65925 + }, + { + "epoch": 1.69, + "learning_rate": 8.444073490379212e-07, + "loss": 0.8916, + "step": 65926 + }, + { + "epoch": 1.69, + "learning_rate": 8.443800156336629e-07, + "loss": 0.6406, + "step": 65927 + }, + { + "epoch": 1.69, + "learning_rate": 8.443526823485555e-07, + "loss": 0.873, + "step": 65928 + }, + { + "epoch": 1.69, + "learning_rate": 8.443253491826204e-07, + "loss": 0.4657, + "step": 65929 + }, + { + "epoch": 1.69, + "learning_rate": 8.442980161358779e-07, + "loss": 0.6357, + "step": 65930 + }, + { + "epoch": 1.69, + "learning_rate": 8.442706832083494e-07, + "loss": 0.6914, + "step": 65931 + }, + { + "epoch": 1.69, + "learning_rate": 8.442433504000555e-07, + "loss": 0.5171, + "step": 65932 + }, + { + "epoch": 1.69, + "learning_rate": 8.442160177110175e-07, + "loss": 0.7236, + "step": 65933 + }, + { + "epoch": 1.69, + "learning_rate": 8.441886851412559e-07, + "loss": 0.5576, + "step": 65934 + }, + { + "epoch": 1.69, + "learning_rate": 8.441613526907922e-07, + "loss": 0.6636, + "step": 65935 + }, + { + "epoch": 1.69, + "learning_rate": 8.441340203596472e-07, + "loss": 0.3677, + "step": 65936 + }, + { + "epoch": 1.69, + "learning_rate": 8.441066881478414e-07, + "loss": 0.5791, + "step": 65937 + }, + { + "epoch": 1.69, + "learning_rate": 8.440793560553956e-07, + "loss": 0.5996, + "step": 65938 + }, + { + "epoch": 1.69, + "learning_rate": 8.440520240823313e-07, + "loss": 0.6567, + "step": 65939 + }, + { + "epoch": 1.69, + "learning_rate": 8.44024692228669e-07, + "loss": 0.4696, + "step": 65940 + }, + { + "epoch": 1.69, + "learning_rate": 8.4399736049443e-07, + "loss": 0.7158, + "step": 65941 + }, + { + "epoch": 1.69, + "learning_rate": 8.439700288796349e-07, + "loss": 0.6396, + "step": 65942 + }, + { + "epoch": 1.69, + "learning_rate": 8.439426973843051e-07, + "loss": 0.5474, + "step": 65943 + }, + { + "epoch": 1.69, + "learning_rate": 8.439153660084608e-07, + "loss": 0.6758, + "step": 65944 + }, + { + "epoch": 1.69, + "learning_rate": 8.438880347521235e-07, + "loss": 0.917, + "step": 65945 + }, + { + "epoch": 1.69, + "learning_rate": 8.438607036153143e-07, + "loss": 0.6865, + "step": 65946 + }, + { + "epoch": 1.69, + "learning_rate": 8.438333725980534e-07, + "loss": 0.7637, + "step": 65947 + }, + { + "epoch": 1.69, + "learning_rate": 8.438060417003623e-07, + "loss": 0.5361, + "step": 65948 + }, + { + "epoch": 1.69, + "learning_rate": 8.437787109222614e-07, + "loss": 0.667, + "step": 65949 + }, + { + "epoch": 1.69, + "learning_rate": 8.437513802637722e-07, + "loss": 0.8057, + "step": 65950 + }, + { + "epoch": 1.69, + "learning_rate": 8.437240497249153e-07, + "loss": 0.4927, + "step": 65951 + }, + { + "epoch": 1.69, + "learning_rate": 8.436967193057118e-07, + "loss": 0.6924, + "step": 65952 + }, + { + "epoch": 1.69, + "learning_rate": 8.436693890061824e-07, + "loss": 0.6826, + "step": 65953 + }, + { + "epoch": 1.69, + "learning_rate": 8.436420588263484e-07, + "loss": 0.5601, + "step": 65954 + }, + { + "epoch": 1.69, + "learning_rate": 8.436147287662303e-07, + "loss": 0.5735, + "step": 65955 + }, + { + "epoch": 1.69, + "learning_rate": 8.435873988258495e-07, + "loss": 0.6855, + "step": 65956 + }, + { + "epoch": 1.69, + "learning_rate": 8.435600690052262e-07, + "loss": 0.5713, + "step": 65957 + }, + { + "epoch": 1.69, + "learning_rate": 8.43532739304382e-07, + "loss": 0.8066, + "step": 65958 + }, + { + "epoch": 1.69, + "learning_rate": 8.435054097233375e-07, + "loss": 0.6001, + "step": 65959 + }, + { + "epoch": 1.69, + "learning_rate": 8.434780802621138e-07, + "loss": 0.5854, + "step": 65960 + }, + { + "epoch": 1.69, + "learning_rate": 8.434507509207316e-07, + "loss": 0.5854, + "step": 65961 + }, + { + "epoch": 1.69, + "learning_rate": 8.434234216992121e-07, + "loss": 0.6191, + "step": 65962 + }, + { + "epoch": 1.69, + "learning_rate": 8.433960925975759e-07, + "loss": 0.7012, + "step": 65963 + }, + { + "epoch": 1.69, + "learning_rate": 8.433687636158443e-07, + "loss": 0.8008, + "step": 65964 + }, + { + "epoch": 1.69, + "learning_rate": 8.433414347540378e-07, + "loss": 0.6216, + "step": 65965 + }, + { + "epoch": 1.69, + "learning_rate": 8.43314106012178e-07, + "loss": 0.6094, + "step": 65966 + }, + { + "epoch": 1.69, + "learning_rate": 8.432867773902852e-07, + "loss": 0.5339, + "step": 65967 + }, + { + "epoch": 1.69, + "learning_rate": 8.432594488883803e-07, + "loss": 0.5676, + "step": 65968 + }, + { + "epoch": 1.69, + "learning_rate": 8.432321205064847e-07, + "loss": 0.4907, + "step": 65969 + }, + { + "epoch": 1.69, + "learning_rate": 8.432047922446187e-07, + "loss": 0.7432, + "step": 65970 + }, + { + "epoch": 1.69, + "learning_rate": 8.431774641028039e-07, + "loss": 0.8018, + "step": 65971 + }, + { + "epoch": 1.69, + "learning_rate": 8.431501360810609e-07, + "loss": 0.6226, + "step": 65972 + }, + { + "epoch": 1.69, + "learning_rate": 8.431228081794104e-07, + "loss": 0.6348, + "step": 65973 + }, + { + "epoch": 1.69, + "learning_rate": 8.430954803978739e-07, + "loss": 0.6611, + "step": 65974 + }, + { + "epoch": 1.69, + "learning_rate": 8.430681527364714e-07, + "loss": 0.4231, + "step": 65975 + }, + { + "epoch": 1.69, + "learning_rate": 8.430408251952251e-07, + "loss": 0.834, + "step": 65976 + }, + { + "epoch": 1.69, + "learning_rate": 8.430134977741549e-07, + "loss": 0.5742, + "step": 65977 + }, + { + "epoch": 1.69, + "learning_rate": 8.42986170473282e-07, + "loss": 0.3323, + "step": 65978 + }, + { + "epoch": 1.69, + "learning_rate": 8.429588432926274e-07, + "loss": 0.4312, + "step": 65979 + }, + { + "epoch": 1.69, + "learning_rate": 8.42931516232212e-07, + "loss": 0.7266, + "step": 65980 + }, + { + "epoch": 1.69, + "learning_rate": 8.429041892920567e-07, + "loss": 0.644, + "step": 65981 + }, + { + "epoch": 1.69, + "learning_rate": 8.428768624721823e-07, + "loss": 0.5713, + "step": 65982 + }, + { + "epoch": 1.69, + "learning_rate": 8.428495357726101e-07, + "loss": 0.6748, + "step": 65983 + }, + { + "epoch": 1.69, + "learning_rate": 8.428222091933606e-07, + "loss": 0.6143, + "step": 65984 + }, + { + "epoch": 1.69, + "learning_rate": 8.427948827344549e-07, + "loss": 0.7437, + "step": 65985 + }, + { + "epoch": 1.69, + "learning_rate": 8.427675563959145e-07, + "loss": 0.5461, + "step": 65986 + }, + { + "epoch": 1.69, + "learning_rate": 8.427402301777591e-07, + "loss": 0.6492, + "step": 65987 + }, + { + "epoch": 1.69, + "learning_rate": 8.427129040800105e-07, + "loss": 0.5713, + "step": 65988 + }, + { + "epoch": 1.69, + "learning_rate": 8.426855781026895e-07, + "loss": 0.7061, + "step": 65989 + }, + { + "epoch": 1.69, + "learning_rate": 8.426582522458165e-07, + "loss": 0.5791, + "step": 65990 + }, + { + "epoch": 1.69, + "learning_rate": 8.426309265094133e-07, + "loss": 0.7354, + "step": 65991 + }, + { + "epoch": 1.69, + "learning_rate": 8.426036008935e-07, + "loss": 0.6318, + "step": 65992 + }, + { + "epoch": 1.69, + "learning_rate": 8.425762753980982e-07, + "loss": 0.6929, + "step": 65993 + }, + { + "epoch": 1.69, + "learning_rate": 8.425489500232283e-07, + "loss": 0.7354, + "step": 65994 + }, + { + "epoch": 1.69, + "learning_rate": 8.425216247689115e-07, + "loss": 0.6606, + "step": 65995 + }, + { + "epoch": 1.69, + "learning_rate": 8.42494299635169e-07, + "loss": 0.6494, + "step": 65996 + }, + { + "epoch": 1.69, + "learning_rate": 8.424669746220208e-07, + "loss": 0.7563, + "step": 65997 + }, + { + "epoch": 1.69, + "learning_rate": 8.424396497294887e-07, + "loss": 0.7139, + "step": 65998 + }, + { + "epoch": 1.69, + "learning_rate": 8.424123249575931e-07, + "loss": 0.7549, + "step": 65999 + }, + { + "epoch": 1.69, + "learning_rate": 8.423850003063553e-07, + "loss": 0.7969, + "step": 66000 + }, + { + "epoch": 1.69, + "learning_rate": 8.42357675775796e-07, + "loss": 0.5791, + "step": 66001 + }, + { + "epoch": 1.69, + "learning_rate": 8.423303513659362e-07, + "loss": 0.7388, + "step": 66002 + }, + { + "epoch": 1.69, + "learning_rate": 8.423030270767967e-07, + "loss": 0.5034, + "step": 66003 + }, + { + "epoch": 1.69, + "learning_rate": 8.422757029083987e-07, + "loss": 0.4434, + "step": 66004 + }, + { + "epoch": 1.69, + "learning_rate": 8.422483788607627e-07, + "loss": 0.6104, + "step": 66005 + }, + { + "epoch": 1.69, + "learning_rate": 8.422210549339104e-07, + "loss": 0.6357, + "step": 66006 + }, + { + "epoch": 1.69, + "learning_rate": 8.421937311278618e-07, + "loss": 0.5605, + "step": 66007 + }, + { + "epoch": 1.69, + "learning_rate": 8.421664074426383e-07, + "loss": 0.5095, + "step": 66008 + }, + { + "epoch": 1.69, + "learning_rate": 8.421390838782605e-07, + "loss": 0.6338, + "step": 66009 + }, + { + "epoch": 1.69, + "learning_rate": 8.421117604347499e-07, + "loss": 0.6089, + "step": 66010 + }, + { + "epoch": 1.69, + "learning_rate": 8.420844371121267e-07, + "loss": 0.5093, + "step": 66011 + }, + { + "epoch": 1.69, + "learning_rate": 8.420571139104123e-07, + "loss": 0.5938, + "step": 66012 + }, + { + "epoch": 1.69, + "learning_rate": 8.420297908296275e-07, + "loss": 0.501, + "step": 66013 + }, + { + "epoch": 1.69, + "learning_rate": 8.420024678697932e-07, + "loss": 0.6057, + "step": 66014 + }, + { + "epoch": 1.69, + "learning_rate": 8.419751450309304e-07, + "loss": 0.6611, + "step": 66015 + }, + { + "epoch": 1.69, + "learning_rate": 8.419478223130603e-07, + "loss": 0.7593, + "step": 66016 + }, + { + "epoch": 1.69, + "learning_rate": 8.419204997162032e-07, + "loss": 0.6162, + "step": 66017 + }, + { + "epoch": 1.69, + "learning_rate": 8.418931772403801e-07, + "loss": 0.7637, + "step": 66018 + }, + { + "epoch": 1.69, + "learning_rate": 8.418658548856124e-07, + "loss": 0.6479, + "step": 66019 + }, + { + "epoch": 1.69, + "learning_rate": 8.418385326519205e-07, + "loss": 0.7754, + "step": 66020 + }, + { + "epoch": 1.69, + "learning_rate": 8.418112105393258e-07, + "loss": 0.5217, + "step": 66021 + }, + { + "epoch": 1.69, + "learning_rate": 8.417838885478488e-07, + "loss": 0.7217, + "step": 66022 + }, + { + "epoch": 1.69, + "learning_rate": 8.417565666775108e-07, + "loss": 0.5674, + "step": 66023 + }, + { + "epoch": 1.69, + "learning_rate": 8.417292449283322e-07, + "loss": 0.5073, + "step": 66024 + }, + { + "epoch": 1.69, + "learning_rate": 8.417019233003344e-07, + "loss": 0.7095, + "step": 66025 + }, + { + "epoch": 1.69, + "learning_rate": 8.416746017935386e-07, + "loss": 0.5786, + "step": 66026 + }, + { + "epoch": 1.69, + "learning_rate": 8.41647280407965e-07, + "loss": 0.6226, + "step": 66027 + }, + { + "epoch": 1.69, + "learning_rate": 8.416199591436344e-07, + "loss": 0.7871, + "step": 66028 + }, + { + "epoch": 1.69, + "learning_rate": 8.415926380005686e-07, + "loss": 0.5569, + "step": 66029 + }, + { + "epoch": 1.69, + "learning_rate": 8.415653169787876e-07, + "loss": 0.6582, + "step": 66030 + }, + { + "epoch": 1.69, + "learning_rate": 8.415379960783131e-07, + "loss": 0.6318, + "step": 66031 + }, + { + "epoch": 1.69, + "learning_rate": 8.415106752991655e-07, + "loss": 0.834, + "step": 66032 + }, + { + "epoch": 1.69, + "learning_rate": 8.414833546413659e-07, + "loss": 0.6475, + "step": 66033 + }, + { + "epoch": 1.69, + "learning_rate": 8.414560341049351e-07, + "loss": 0.5002, + "step": 66034 + }, + { + "epoch": 1.69, + "learning_rate": 8.414287136898943e-07, + "loss": 0.7021, + "step": 66035 + }, + { + "epoch": 1.69, + "learning_rate": 8.414013933962645e-07, + "loss": 0.7158, + "step": 66036 + }, + { + "epoch": 1.69, + "learning_rate": 8.413740732240659e-07, + "loss": 0.8291, + "step": 66037 + }, + { + "epoch": 1.69, + "learning_rate": 8.413467531733203e-07, + "loss": 0.8701, + "step": 66038 + }, + { + "epoch": 1.69, + "learning_rate": 8.413194332440477e-07, + "loss": 0.8115, + "step": 66039 + }, + { + "epoch": 1.69, + "learning_rate": 8.412921134362698e-07, + "loss": 0.5533, + "step": 66040 + }, + { + "epoch": 1.69, + "learning_rate": 8.412647937500071e-07, + "loss": 0.7354, + "step": 66041 + }, + { + "epoch": 1.69, + "learning_rate": 8.412374741852808e-07, + "loss": 0.6123, + "step": 66042 + }, + { + "epoch": 1.69, + "learning_rate": 8.412101547421116e-07, + "loss": 0.5691, + "step": 66043 + }, + { + "epoch": 1.69, + "learning_rate": 8.411828354205205e-07, + "loss": 0.4631, + "step": 66044 + }, + { + "epoch": 1.69, + "learning_rate": 8.411555162205284e-07, + "loss": 0.7295, + "step": 66045 + }, + { + "epoch": 1.69, + "learning_rate": 8.411281971421566e-07, + "loss": 0.624, + "step": 66046 + }, + { + "epoch": 1.69, + "learning_rate": 8.411008781854249e-07, + "loss": 0.7725, + "step": 66047 + }, + { + "epoch": 1.69, + "learning_rate": 8.410735593503555e-07, + "loss": 0.5879, + "step": 66048 + }, + { + "epoch": 1.69, + "learning_rate": 8.410462406369683e-07, + "loss": 0.585, + "step": 66049 + }, + { + "epoch": 1.69, + "learning_rate": 8.410189220452851e-07, + "loss": 0.6143, + "step": 66050 + }, + { + "epoch": 1.69, + "learning_rate": 8.409916035753262e-07, + "loss": 0.5781, + "step": 66051 + }, + { + "epoch": 1.69, + "learning_rate": 8.409642852271128e-07, + "loss": 0.667, + "step": 66052 + }, + { + "epoch": 1.69, + "learning_rate": 8.409369670006655e-07, + "loss": 0.627, + "step": 66053 + }, + { + "epoch": 1.69, + "learning_rate": 8.409096488960058e-07, + "loss": 0.6431, + "step": 66054 + }, + { + "epoch": 1.69, + "learning_rate": 8.40882330913154e-07, + "loss": 0.5371, + "step": 66055 + }, + { + "epoch": 1.69, + "learning_rate": 8.408550130521316e-07, + "loss": 0.5312, + "step": 66056 + }, + { + "epoch": 1.69, + "learning_rate": 8.408276953129591e-07, + "loss": 0.6001, + "step": 66057 + }, + { + "epoch": 1.69, + "learning_rate": 8.408003776956573e-07, + "loss": 0.542, + "step": 66058 + }, + { + "epoch": 1.69, + "learning_rate": 8.407730602002475e-07, + "loss": 0.7197, + "step": 66059 + }, + { + "epoch": 1.69, + "learning_rate": 8.407457428267503e-07, + "loss": 0.5889, + "step": 66060 + }, + { + "epoch": 1.69, + "learning_rate": 8.407184255751869e-07, + "loss": 0.5576, + "step": 66061 + }, + { + "epoch": 1.69, + "learning_rate": 8.406911084455781e-07, + "loss": 0.7285, + "step": 66062 + }, + { + "epoch": 1.69, + "learning_rate": 8.406637914379445e-07, + "loss": 0.5215, + "step": 66063 + }, + { + "epoch": 1.69, + "learning_rate": 8.406364745523076e-07, + "loss": 0.5459, + "step": 66064 + }, + { + "epoch": 1.69, + "learning_rate": 8.406091577886879e-07, + "loss": 0.6438, + "step": 66065 + }, + { + "epoch": 1.69, + "learning_rate": 8.405818411471067e-07, + "loss": 0.7832, + "step": 66066 + }, + { + "epoch": 1.69, + "learning_rate": 8.405545246275845e-07, + "loss": 0.6777, + "step": 66067 + }, + { + "epoch": 1.69, + "learning_rate": 8.405272082301422e-07, + "loss": 0.6025, + "step": 66068 + }, + { + "epoch": 1.69, + "learning_rate": 8.404998919548012e-07, + "loss": 0.6206, + "step": 66069 + }, + { + "epoch": 1.69, + "learning_rate": 8.404725758015817e-07, + "loss": 0.563, + "step": 66070 + }, + { + "epoch": 1.69, + "learning_rate": 8.404452597705053e-07, + "loss": 0.6172, + "step": 66071 + }, + { + "epoch": 1.69, + "learning_rate": 8.404179438615924e-07, + "loss": 0.5684, + "step": 66072 + }, + { + "epoch": 1.69, + "learning_rate": 8.403906280748643e-07, + "loss": 0.7031, + "step": 66073 + }, + { + "epoch": 1.69, + "learning_rate": 8.403633124103417e-07, + "loss": 0.6899, + "step": 66074 + }, + { + "epoch": 1.69, + "learning_rate": 8.403359968680457e-07, + "loss": 0.5874, + "step": 66075 + }, + { + "epoch": 1.69, + "learning_rate": 8.403086814479972e-07, + "loss": 0.5771, + "step": 66076 + }, + { + "epoch": 1.69, + "learning_rate": 8.402813661502166e-07, + "loss": 0.6836, + "step": 66077 + }, + { + "epoch": 1.69, + "learning_rate": 8.402540509747256e-07, + "loss": 0.6426, + "step": 66078 + }, + { + "epoch": 1.69, + "learning_rate": 8.402267359215445e-07, + "loss": 0.627, + "step": 66079 + }, + { + "epoch": 1.69, + "learning_rate": 8.401994209906944e-07, + "loss": 0.6416, + "step": 66080 + }, + { + "epoch": 1.69, + "learning_rate": 8.401721061821965e-07, + "loss": 0.6777, + "step": 66081 + }, + { + "epoch": 1.69, + "learning_rate": 8.401447914960711e-07, + "loss": 0.5054, + "step": 66082 + }, + { + "epoch": 1.69, + "learning_rate": 8.401174769323398e-07, + "loss": 0.5032, + "step": 66083 + }, + { + "epoch": 1.69, + "learning_rate": 8.400901624910228e-07, + "loss": 0.8281, + "step": 66084 + }, + { + "epoch": 1.69, + "learning_rate": 8.400628481721419e-07, + "loss": 0.5892, + "step": 66085 + }, + { + "epoch": 1.69, + "learning_rate": 8.400355339757176e-07, + "loss": 0.6904, + "step": 66086 + }, + { + "epoch": 1.69, + "learning_rate": 8.400082199017703e-07, + "loss": 0.5845, + "step": 66087 + }, + { + "epoch": 1.69, + "learning_rate": 8.399809059503216e-07, + "loss": 0.6016, + "step": 66088 + }, + { + "epoch": 1.69, + "learning_rate": 8.399535921213918e-07, + "loss": 0.8779, + "step": 66089 + }, + { + "epoch": 1.69, + "learning_rate": 8.399262784150027e-07, + "loss": 0.6318, + "step": 66090 + }, + { + "epoch": 1.69, + "learning_rate": 8.398989648311742e-07, + "loss": 0.7192, + "step": 66091 + }, + { + "epoch": 1.69, + "learning_rate": 8.39871651369928e-07, + "loss": 0.6133, + "step": 66092 + }, + { + "epoch": 1.69, + "learning_rate": 8.398443380312845e-07, + "loss": 0.6372, + "step": 66093 + }, + { + "epoch": 1.69, + "learning_rate": 8.398170248152651e-07, + "loss": 0.8135, + "step": 66094 + }, + { + "epoch": 1.69, + "learning_rate": 8.397897117218902e-07, + "loss": 0.5625, + "step": 66095 + }, + { + "epoch": 1.69, + "learning_rate": 8.397623987511813e-07, + "loss": 0.5361, + "step": 66096 + }, + { + "epoch": 1.69, + "learning_rate": 8.397350859031588e-07, + "loss": 0.7041, + "step": 66097 + }, + { + "epoch": 1.69, + "learning_rate": 8.397077731778437e-07, + "loss": 0.6562, + "step": 66098 + }, + { + "epoch": 1.69, + "learning_rate": 8.396804605752569e-07, + "loss": 0.75, + "step": 66099 + }, + { + "epoch": 1.69, + "learning_rate": 8.396531480954195e-07, + "loss": 0.5483, + "step": 66100 + }, + { + "epoch": 1.69, + "learning_rate": 8.396258357383523e-07, + "loss": 0.5396, + "step": 66101 + }, + { + "epoch": 1.69, + "learning_rate": 8.395985235040762e-07, + "loss": 0.7368, + "step": 66102 + }, + { + "epoch": 1.69, + "learning_rate": 8.39571211392612e-07, + "loss": 0.584, + "step": 66103 + }, + { + "epoch": 1.69, + "learning_rate": 8.39543899403981e-07, + "loss": 0.6904, + "step": 66104 + }, + { + "epoch": 1.69, + "learning_rate": 8.395165875382036e-07, + "loss": 0.6787, + "step": 66105 + }, + { + "epoch": 1.69, + "learning_rate": 8.394892757953014e-07, + "loss": 0.667, + "step": 66106 + }, + { + "epoch": 1.69, + "learning_rate": 8.394619641752947e-07, + "loss": 0.7773, + "step": 66107 + }, + { + "epoch": 1.69, + "learning_rate": 8.394346526782043e-07, + "loss": 0.446, + "step": 66108 + }, + { + "epoch": 1.69, + "learning_rate": 8.394073413040518e-07, + "loss": 0.6357, + "step": 66109 + }, + { + "epoch": 1.69, + "learning_rate": 8.393800300528573e-07, + "loss": 0.4493, + "step": 66110 + }, + { + "epoch": 1.69, + "learning_rate": 8.393527189246424e-07, + "loss": 0.6094, + "step": 66111 + }, + { + "epoch": 1.69, + "learning_rate": 8.393254079194276e-07, + "loss": 0.2987, + "step": 66112 + }, + { + "epoch": 1.69, + "learning_rate": 8.392980970372341e-07, + "loss": 0.4878, + "step": 66113 + }, + { + "epoch": 1.69, + "learning_rate": 8.392707862780825e-07, + "loss": 0.3899, + "step": 66114 + }, + { + "epoch": 1.69, + "learning_rate": 8.392434756419939e-07, + "loss": 0.9658, + "step": 66115 + }, + { + "epoch": 1.69, + "learning_rate": 8.392161651289896e-07, + "loss": 0.6318, + "step": 66116 + }, + { + "epoch": 1.69, + "learning_rate": 8.391888547390899e-07, + "loss": 0.6523, + "step": 66117 + }, + { + "epoch": 1.69, + "learning_rate": 8.391615444723154e-07, + "loss": 0.6841, + "step": 66118 + }, + { + "epoch": 1.69, + "learning_rate": 8.39134234328688e-07, + "loss": 0.2665, + "step": 66119 + }, + { + "epoch": 1.69, + "learning_rate": 8.391069243082278e-07, + "loss": 0.627, + "step": 66120 + }, + { + "epoch": 1.69, + "learning_rate": 8.390796144109563e-07, + "loss": 0.6099, + "step": 66121 + }, + { + "epoch": 1.69, + "learning_rate": 8.390523046368938e-07, + "loss": 0.5317, + "step": 66122 + }, + { + "epoch": 1.69, + "learning_rate": 8.390249949860619e-07, + "loss": 0.625, + "step": 66123 + }, + { + "epoch": 1.69, + "learning_rate": 8.389976854584809e-07, + "loss": 0.6812, + "step": 66124 + }, + { + "epoch": 1.69, + "learning_rate": 8.389703760541722e-07, + "loss": 0.6311, + "step": 66125 + }, + { + "epoch": 1.69, + "learning_rate": 8.389430667731566e-07, + "loss": 0.6553, + "step": 66126 + }, + { + "epoch": 1.69, + "learning_rate": 8.389157576154547e-07, + "loss": 0.5874, + "step": 66127 + }, + { + "epoch": 1.69, + "learning_rate": 8.388884485810875e-07, + "loss": 0.5151, + "step": 66128 + }, + { + "epoch": 1.69, + "learning_rate": 8.38861139670076e-07, + "loss": 0.6777, + "step": 66129 + }, + { + "epoch": 1.69, + "learning_rate": 8.388338308824412e-07, + "loss": 0.5867, + "step": 66130 + }, + { + "epoch": 1.69, + "learning_rate": 8.388065222182038e-07, + "loss": 0.528, + "step": 66131 + }, + { + "epoch": 1.69, + "learning_rate": 8.387792136773851e-07, + "loss": 0.5457, + "step": 66132 + }, + { + "epoch": 1.7, + "learning_rate": 8.387519052600054e-07, + "loss": 0.7285, + "step": 66133 + }, + { + "epoch": 1.7, + "learning_rate": 8.387245969660863e-07, + "loss": 0.5693, + "step": 66134 + }, + { + "epoch": 1.7, + "learning_rate": 8.386972887956481e-07, + "loss": 0.6587, + "step": 66135 + }, + { + "epoch": 1.7, + "learning_rate": 8.386699807487124e-07, + "loss": 0.6113, + "step": 66136 + }, + { + "epoch": 1.7, + "learning_rate": 8.386426728252994e-07, + "loss": 0.5913, + "step": 66137 + }, + { + "epoch": 1.7, + "learning_rate": 8.386153650254302e-07, + "loss": 0.5908, + "step": 66138 + }, + { + "epoch": 1.7, + "learning_rate": 8.385880573491257e-07, + "loss": 0.6157, + "step": 66139 + }, + { + "epoch": 1.7, + "learning_rate": 8.385607497964071e-07, + "loss": 0.5874, + "step": 66140 + }, + { + "epoch": 1.7, + "learning_rate": 8.385334423672948e-07, + "loss": 0.7627, + "step": 66141 + }, + { + "epoch": 1.7, + "learning_rate": 8.385061350618104e-07, + "loss": 0.7139, + "step": 66142 + }, + { + "epoch": 1.7, + "learning_rate": 8.384788278799741e-07, + "loss": 0.4014, + "step": 66143 + }, + { + "epoch": 1.7, + "learning_rate": 8.384515208218075e-07, + "loss": 0.6377, + "step": 66144 + }, + { + "epoch": 1.7, + "learning_rate": 8.384242138873308e-07, + "loss": 0.6016, + "step": 66145 + }, + { + "epoch": 1.7, + "learning_rate": 8.383969070765657e-07, + "loss": 0.5752, + "step": 66146 + }, + { + "epoch": 1.7, + "learning_rate": 8.383696003895324e-07, + "loss": 0.4167, + "step": 66147 + }, + { + "epoch": 1.7, + "learning_rate": 8.383422938262519e-07, + "loss": 0.6504, + "step": 66148 + }, + { + "epoch": 1.7, + "learning_rate": 8.383149873867455e-07, + "loss": 0.7451, + "step": 66149 + }, + { + "epoch": 1.7, + "learning_rate": 8.382876810710336e-07, + "loss": 0.8438, + "step": 66150 + }, + { + "epoch": 1.7, + "learning_rate": 8.382603748791377e-07, + "loss": 0.5781, + "step": 66151 + }, + { + "epoch": 1.7, + "learning_rate": 8.382330688110784e-07, + "loss": 0.6553, + "step": 66152 + }, + { + "epoch": 1.7, + "learning_rate": 8.382057628668763e-07, + "loss": 0.3699, + "step": 66153 + }, + { + "epoch": 1.7, + "learning_rate": 8.381784570465529e-07, + "loss": 0.5273, + "step": 66154 + }, + { + "epoch": 1.7, + "learning_rate": 8.381511513501285e-07, + "loss": 0.7139, + "step": 66155 + }, + { + "epoch": 1.7, + "learning_rate": 8.381238457776248e-07, + "loss": 0.6323, + "step": 66156 + }, + { + "epoch": 1.7, + "learning_rate": 8.38096540329062e-07, + "loss": 0.7036, + "step": 66157 + }, + { + "epoch": 1.7, + "learning_rate": 8.380692350044612e-07, + "loss": 0.6826, + "step": 66158 + }, + { + "epoch": 1.7, + "learning_rate": 8.380419298038433e-07, + "loss": 0.6895, + "step": 66159 + }, + { + "epoch": 1.7, + "learning_rate": 8.380146247272291e-07, + "loss": 0.7539, + "step": 66160 + }, + { + "epoch": 1.7, + "learning_rate": 8.379873197746399e-07, + "loss": 0.7383, + "step": 66161 + }, + { + "epoch": 1.7, + "learning_rate": 8.379600149460962e-07, + "loss": 0.6455, + "step": 66162 + }, + { + "epoch": 1.7, + "learning_rate": 8.379327102416191e-07, + "loss": 0.7148, + "step": 66163 + }, + { + "epoch": 1.7, + "learning_rate": 8.379054056612295e-07, + "loss": 0.6001, + "step": 66164 + }, + { + "epoch": 1.7, + "learning_rate": 8.378781012049483e-07, + "loss": 0.5344, + "step": 66165 + }, + { + "epoch": 1.7, + "learning_rate": 8.378507968727967e-07, + "loss": 0.4023, + "step": 66166 + }, + { + "epoch": 1.7, + "learning_rate": 8.378234926647948e-07, + "loss": 0.6943, + "step": 66167 + }, + { + "epoch": 1.7, + "learning_rate": 8.377961885809642e-07, + "loss": 0.6016, + "step": 66168 + }, + { + "epoch": 1.7, + "learning_rate": 8.377688846213256e-07, + "loss": 0.428, + "step": 66169 + }, + { + "epoch": 1.7, + "learning_rate": 8.377415807858998e-07, + "loss": 0.4912, + "step": 66170 + }, + { + "epoch": 1.7, + "learning_rate": 8.377142770747079e-07, + "loss": 0.5151, + "step": 66171 + }, + { + "epoch": 1.7, + "learning_rate": 8.376869734877706e-07, + "loss": 0.709, + "step": 66172 + }, + { + "epoch": 1.7, + "learning_rate": 8.376596700251092e-07, + "loss": 0.5737, + "step": 66173 + }, + { + "epoch": 1.7, + "learning_rate": 8.37632366686744e-07, + "loss": 0.6118, + "step": 66174 + }, + { + "epoch": 1.7, + "learning_rate": 8.376050634726964e-07, + "loss": 0.5527, + "step": 66175 + }, + { + "epoch": 1.7, + "learning_rate": 8.375777603829875e-07, + "loss": 0.5674, + "step": 66176 + }, + { + "epoch": 1.7, + "learning_rate": 8.375504574176372e-07, + "loss": 0.707, + "step": 66177 + }, + { + "epoch": 1.7, + "learning_rate": 8.375231545766674e-07, + "loss": 0.4482, + "step": 66178 + }, + { + "epoch": 1.7, + "learning_rate": 8.374958518600984e-07, + "loss": 0.6357, + "step": 66179 + }, + { + "epoch": 1.7, + "learning_rate": 8.374685492679515e-07, + "loss": 0.5498, + "step": 66180 + }, + { + "epoch": 1.7, + "learning_rate": 8.374412468002474e-07, + "loss": 0.4805, + "step": 66181 + }, + { + "epoch": 1.7, + "learning_rate": 8.374139444570072e-07, + "loss": 0.6133, + "step": 66182 + }, + { + "epoch": 1.7, + "learning_rate": 8.373866422382514e-07, + "loss": 0.3939, + "step": 66183 + }, + { + "epoch": 1.7, + "learning_rate": 8.373593401440014e-07, + "loss": 0.5399, + "step": 66184 + }, + { + "epoch": 1.7, + "learning_rate": 8.373320381742777e-07, + "loss": 0.6865, + "step": 66185 + }, + { + "epoch": 1.7, + "learning_rate": 8.373047363291018e-07, + "loss": 0.6992, + "step": 66186 + }, + { + "epoch": 1.7, + "learning_rate": 8.37277434608494e-07, + "loss": 0.6079, + "step": 66187 + }, + { + "epoch": 1.7, + "learning_rate": 8.372501330124754e-07, + "loss": 0.5, + "step": 66188 + }, + { + "epoch": 1.7, + "learning_rate": 8.372228315410666e-07, + "loss": 0.6904, + "step": 66189 + }, + { + "epoch": 1.7, + "learning_rate": 8.37195530194289e-07, + "loss": 0.6973, + "step": 66190 + }, + { + "epoch": 1.7, + "learning_rate": 8.371682289721631e-07, + "loss": 0.6562, + "step": 66191 + }, + { + "epoch": 1.7, + "learning_rate": 8.371409278747104e-07, + "loss": 0.4868, + "step": 66192 + }, + { + "epoch": 1.7, + "learning_rate": 8.371136269019509e-07, + "loss": 0.7241, + "step": 66193 + }, + { + "epoch": 1.7, + "learning_rate": 8.370863260539064e-07, + "loss": 0.6909, + "step": 66194 + }, + { + "epoch": 1.7, + "learning_rate": 8.370590253305976e-07, + "loss": 0.7188, + "step": 66195 + }, + { + "epoch": 1.7, + "learning_rate": 8.370317247320446e-07, + "loss": 0.6763, + "step": 66196 + }, + { + "epoch": 1.7, + "learning_rate": 8.370044242582693e-07, + "loss": 0.792, + "step": 66197 + }, + { + "epoch": 1.7, + "learning_rate": 8.36977123909292e-07, + "loss": 0.5811, + "step": 66198 + }, + { + "epoch": 1.7, + "learning_rate": 8.36949823685134e-07, + "loss": 0.6299, + "step": 66199 + }, + { + "epoch": 1.7, + "learning_rate": 8.36922523585816e-07, + "loss": 0.7861, + "step": 66200 + }, + { + "epoch": 1.7, + "learning_rate": 8.368952236113589e-07, + "loss": 0.5474, + "step": 66201 + }, + { + "epoch": 1.7, + "learning_rate": 8.368679237617834e-07, + "loss": 0.6196, + "step": 66202 + }, + { + "epoch": 1.7, + "learning_rate": 8.36840624037111e-07, + "loss": 0.624, + "step": 66203 + }, + { + "epoch": 1.7, + "learning_rate": 8.368133244373619e-07, + "loss": 0.5334, + "step": 66204 + }, + { + "epoch": 1.7, + "learning_rate": 8.36786024962558e-07, + "loss": 0.6543, + "step": 66205 + }, + { + "epoch": 1.7, + "learning_rate": 8.367587256127188e-07, + "loss": 0.6738, + "step": 66206 + }, + { + "epoch": 1.7, + "learning_rate": 8.367314263878664e-07, + "loss": 0.688, + "step": 66207 + }, + { + "epoch": 1.7, + "learning_rate": 8.367041272880209e-07, + "loss": 0.5875, + "step": 66208 + }, + { + "epoch": 1.7, + "learning_rate": 8.366768283132038e-07, + "loss": 0.6357, + "step": 66209 + }, + { + "epoch": 1.7, + "learning_rate": 8.366495294634354e-07, + "loss": 0.4175, + "step": 66210 + }, + { + "epoch": 1.7, + "learning_rate": 8.366222307387372e-07, + "loss": 0.5835, + "step": 66211 + }, + { + "epoch": 1.7, + "learning_rate": 8.365949321391297e-07, + "loss": 0.8076, + "step": 66212 + }, + { + "epoch": 1.7, + "learning_rate": 8.365676336646341e-07, + "loss": 0.6172, + "step": 66213 + }, + { + "epoch": 1.7, + "learning_rate": 8.365403353152709e-07, + "loss": 0.6924, + "step": 66214 + }, + { + "epoch": 1.7, + "learning_rate": 8.365130370910618e-07, + "loss": 0.6973, + "step": 66215 + }, + { + "epoch": 1.7, + "learning_rate": 8.364857389920268e-07, + "loss": 0.6299, + "step": 66216 + }, + { + "epoch": 1.7, + "learning_rate": 8.36458441018187e-07, + "loss": 0.4888, + "step": 66217 + }, + { + "epoch": 1.7, + "learning_rate": 8.364311431695638e-07, + "loss": 0.5034, + "step": 66218 + }, + { + "epoch": 1.7, + "learning_rate": 8.364038454461774e-07, + "loss": 0.5669, + "step": 66219 + }, + { + "epoch": 1.7, + "learning_rate": 8.363765478480493e-07, + "loss": 0.6279, + "step": 66220 + }, + { + "epoch": 1.7, + "learning_rate": 8.363492503751999e-07, + "loss": 0.5352, + "step": 66221 + }, + { + "epoch": 1.7, + "learning_rate": 8.363219530276505e-07, + "loss": 0.5723, + "step": 66222 + }, + { + "epoch": 1.7, + "learning_rate": 8.362946558054218e-07, + "loss": 0.8125, + "step": 66223 + }, + { + "epoch": 1.7, + "learning_rate": 8.362673587085348e-07, + "loss": 0.554, + "step": 66224 + }, + { + "epoch": 1.7, + "learning_rate": 8.362400617370107e-07, + "loss": 0.7314, + "step": 66225 + }, + { + "epoch": 1.7, + "learning_rate": 8.362127648908698e-07, + "loss": 0.624, + "step": 66226 + }, + { + "epoch": 1.7, + "learning_rate": 8.361854681701331e-07, + "loss": 0.8184, + "step": 66227 + }, + { + "epoch": 1.7, + "learning_rate": 8.361581715748218e-07, + "loss": 0.6016, + "step": 66228 + }, + { + "epoch": 1.7, + "learning_rate": 8.361308751049565e-07, + "loss": 0.5256, + "step": 66229 + }, + { + "epoch": 1.7, + "learning_rate": 8.361035787605584e-07, + "loss": 0.7012, + "step": 66230 + }, + { + "epoch": 1.7, + "learning_rate": 8.360762825416481e-07, + "loss": 0.5896, + "step": 66231 + }, + { + "epoch": 1.7, + "learning_rate": 8.360489864482467e-07, + "loss": 0.6606, + "step": 66232 + }, + { + "epoch": 1.7, + "learning_rate": 8.36021690480375e-07, + "loss": 0.6348, + "step": 66233 + }, + { + "epoch": 1.7, + "learning_rate": 8.35994394638054e-07, + "loss": 0.6406, + "step": 66234 + }, + { + "epoch": 1.7, + "learning_rate": 8.35967098921305e-07, + "loss": 0.6343, + "step": 66235 + }, + { + "epoch": 1.7, + "learning_rate": 8.359398033301479e-07, + "loss": 0.6494, + "step": 66236 + }, + { + "epoch": 1.7, + "learning_rate": 8.359125078646044e-07, + "loss": 0.8096, + "step": 66237 + }, + { + "epoch": 1.7, + "learning_rate": 8.358852125246949e-07, + "loss": 0.6108, + "step": 66238 + }, + { + "epoch": 1.7, + "learning_rate": 8.358579173104409e-07, + "loss": 0.4963, + "step": 66239 + }, + { + "epoch": 1.7, + "learning_rate": 8.358306222218625e-07, + "loss": 0.5952, + "step": 66240 + }, + { + "epoch": 1.7, + "learning_rate": 8.358033272589814e-07, + "loss": 0.7305, + "step": 66241 + }, + { + "epoch": 1.7, + "learning_rate": 8.357760324218182e-07, + "loss": 0.8154, + "step": 66242 + }, + { + "epoch": 1.7, + "learning_rate": 8.357487377103934e-07, + "loss": 0.6494, + "step": 66243 + }, + { + "epoch": 1.7, + "learning_rate": 8.357214431247285e-07, + "loss": 0.5806, + "step": 66244 + }, + { + "epoch": 1.7, + "learning_rate": 8.356941486648444e-07, + "loss": 0.5718, + "step": 66245 + }, + { + "epoch": 1.7, + "learning_rate": 8.356668543307611e-07, + "loss": 0.6252, + "step": 66246 + }, + { + "epoch": 1.7, + "learning_rate": 8.356395601225006e-07, + "loss": 0.5527, + "step": 66247 + }, + { + "epoch": 1.7, + "learning_rate": 8.35612266040083e-07, + "loss": 0.4946, + "step": 66248 + }, + { + "epoch": 1.7, + "learning_rate": 8.355849720835297e-07, + "loss": 0.5352, + "step": 66249 + }, + { + "epoch": 1.7, + "learning_rate": 8.355576782528612e-07, + "loss": 0.7646, + "step": 66250 + }, + { + "epoch": 1.7, + "learning_rate": 8.35530384548099e-07, + "loss": 0.6499, + "step": 66251 + }, + { + "epoch": 1.7, + "learning_rate": 8.355030909692633e-07, + "loss": 0.6445, + "step": 66252 + }, + { + "epoch": 1.7, + "learning_rate": 8.354757975163755e-07, + "loss": 0.7334, + "step": 66253 + }, + { + "epoch": 1.7, + "learning_rate": 8.354485041894562e-07, + "loss": 0.8311, + "step": 66254 + }, + { + "epoch": 1.7, + "learning_rate": 8.354212109885268e-07, + "loss": 0.6309, + "step": 66255 + }, + { + "epoch": 1.7, + "learning_rate": 8.353939179136076e-07, + "loss": 0.6069, + "step": 66256 + }, + { + "epoch": 1.7, + "learning_rate": 8.353666249647194e-07, + "loss": 0.7393, + "step": 66257 + }, + { + "epoch": 1.7, + "learning_rate": 8.353393321418838e-07, + "loss": 0.6104, + "step": 66258 + }, + { + "epoch": 1.7, + "learning_rate": 8.353120394451209e-07, + "loss": 0.5737, + "step": 66259 + }, + { + "epoch": 1.7, + "learning_rate": 8.352847468744524e-07, + "loss": 0.4868, + "step": 66260 + }, + { + "epoch": 1.7, + "learning_rate": 8.352574544298987e-07, + "loss": 0.6143, + "step": 66261 + }, + { + "epoch": 1.7, + "learning_rate": 8.352301621114805e-07, + "loss": 0.5557, + "step": 66262 + }, + { + "epoch": 1.7, + "learning_rate": 8.352028699192193e-07, + "loss": 0.6235, + "step": 66263 + }, + { + "epoch": 1.7, + "learning_rate": 8.351755778531355e-07, + "loss": 0.4688, + "step": 66264 + }, + { + "epoch": 1.7, + "learning_rate": 8.351482859132506e-07, + "loss": 0.624, + "step": 66265 + }, + { + "epoch": 1.7, + "learning_rate": 8.351209940995848e-07, + "loss": 0.6343, + "step": 66266 + }, + { + "epoch": 1.7, + "learning_rate": 8.35093702412159e-07, + "loss": 0.6494, + "step": 66267 + }, + { + "epoch": 1.7, + "learning_rate": 8.350664108509947e-07, + "loss": 0.6431, + "step": 66268 + }, + { + "epoch": 1.7, + "learning_rate": 8.350391194161123e-07, + "loss": 0.6875, + "step": 66269 + }, + { + "epoch": 1.7, + "learning_rate": 8.350118281075329e-07, + "loss": 0.7568, + "step": 66270 + }, + { + "epoch": 1.7, + "learning_rate": 8.349845369252773e-07, + "loss": 0.6353, + "step": 66271 + }, + { + "epoch": 1.7, + "learning_rate": 8.349572458693665e-07, + "loss": 0.6216, + "step": 66272 + }, + { + "epoch": 1.7, + "learning_rate": 8.349299549398213e-07, + "loss": 0.6387, + "step": 66273 + }, + { + "epoch": 1.7, + "learning_rate": 8.349026641366628e-07, + "loss": 0.7324, + "step": 66274 + }, + { + "epoch": 1.7, + "learning_rate": 8.34875373459912e-07, + "loss": 0.5933, + "step": 66275 + }, + { + "epoch": 1.7, + "learning_rate": 8.348480829095889e-07, + "loss": 0.5137, + "step": 66276 + }, + { + "epoch": 1.7, + "learning_rate": 8.348207924857154e-07, + "loss": 0.7432, + "step": 66277 + }, + { + "epoch": 1.7, + "learning_rate": 8.347935021883121e-07, + "loss": 0.4852, + "step": 66278 + }, + { + "epoch": 1.7, + "learning_rate": 8.347662120173995e-07, + "loss": 0.6484, + "step": 66279 + }, + { + "epoch": 1.7, + "learning_rate": 8.347389219729991e-07, + "loss": 0.6514, + "step": 66280 + }, + { + "epoch": 1.7, + "learning_rate": 8.347116320551312e-07, + "loss": 0.5781, + "step": 66281 + }, + { + "epoch": 1.7, + "learning_rate": 8.346843422638174e-07, + "loss": 0.5386, + "step": 66282 + }, + { + "epoch": 1.7, + "learning_rate": 8.346570525990777e-07, + "loss": 0.6934, + "step": 66283 + }, + { + "epoch": 1.7, + "learning_rate": 8.34629763060934e-07, + "loss": 0.7178, + "step": 66284 + }, + { + "epoch": 1.7, + "learning_rate": 8.346024736494066e-07, + "loss": 0.6553, + "step": 66285 + }, + { + "epoch": 1.7, + "learning_rate": 8.345751843645164e-07, + "loss": 0.5767, + "step": 66286 + }, + { + "epoch": 1.7, + "learning_rate": 8.345478952062843e-07, + "loss": 0.7129, + "step": 66287 + }, + { + "epoch": 1.7, + "learning_rate": 8.345206061747312e-07, + "loss": 0.6299, + "step": 66288 + }, + { + "epoch": 1.7, + "learning_rate": 8.344933172698782e-07, + "loss": 0.6724, + "step": 66289 + }, + { + "epoch": 1.7, + "learning_rate": 8.344660284917458e-07, + "loss": 0.5493, + "step": 66290 + }, + { + "epoch": 1.7, + "learning_rate": 8.344387398403554e-07, + "loss": 0.79, + "step": 66291 + }, + { + "epoch": 1.7, + "learning_rate": 8.344114513157275e-07, + "loss": 0.6855, + "step": 66292 + }, + { + "epoch": 1.7, + "learning_rate": 8.343841629178834e-07, + "loss": 0.834, + "step": 66293 + }, + { + "epoch": 1.7, + "learning_rate": 8.343568746468433e-07, + "loss": 0.7441, + "step": 66294 + }, + { + "epoch": 1.7, + "learning_rate": 8.343295865026294e-07, + "loss": 0.7393, + "step": 66295 + }, + { + "epoch": 1.7, + "learning_rate": 8.34302298485261e-07, + "loss": 0.6689, + "step": 66296 + }, + { + "epoch": 1.7, + "learning_rate": 8.342750105947599e-07, + "loss": 0.6396, + "step": 66297 + }, + { + "epoch": 1.7, + "learning_rate": 8.342477228311465e-07, + "loss": 0.6846, + "step": 66298 + }, + { + "epoch": 1.7, + "learning_rate": 8.342204351944425e-07, + "loss": 0.7529, + "step": 66299 + }, + { + "epoch": 1.7, + "learning_rate": 8.341931476846678e-07, + "loss": 0.5918, + "step": 66300 + }, + { + "epoch": 1.7, + "learning_rate": 8.34165860301844e-07, + "loss": 0.6221, + "step": 66301 + }, + { + "epoch": 1.7, + "learning_rate": 8.341385730459917e-07, + "loss": 0.6562, + "step": 66302 + }, + { + "epoch": 1.7, + "learning_rate": 8.34111285917132e-07, + "loss": 0.4323, + "step": 66303 + }, + { + "epoch": 1.7, + "learning_rate": 8.340839989152854e-07, + "loss": 0.6274, + "step": 66304 + }, + { + "epoch": 1.7, + "learning_rate": 8.340567120404735e-07, + "loss": 0.6318, + "step": 66305 + }, + { + "epoch": 1.7, + "learning_rate": 8.340294252927167e-07, + "loss": 0.7021, + "step": 66306 + }, + { + "epoch": 1.7, + "learning_rate": 8.340021386720356e-07, + "loss": 0.6611, + "step": 66307 + }, + { + "epoch": 1.7, + "learning_rate": 8.339748521784517e-07, + "loss": 0.6562, + "step": 66308 + }, + { + "epoch": 1.7, + "learning_rate": 8.339475658119852e-07, + "loss": 0.5732, + "step": 66309 + }, + { + "epoch": 1.7, + "learning_rate": 8.339202795726579e-07, + "loss": 0.7158, + "step": 66310 + }, + { + "epoch": 1.7, + "learning_rate": 8.338929934604898e-07, + "loss": 0.6367, + "step": 66311 + }, + { + "epoch": 1.7, + "learning_rate": 8.338657074755026e-07, + "loss": 0.6416, + "step": 66312 + }, + { + "epoch": 1.7, + "learning_rate": 8.338384216177163e-07, + "loss": 0.7451, + "step": 66313 + }, + { + "epoch": 1.7, + "learning_rate": 8.338111358871527e-07, + "loss": 0.6152, + "step": 66314 + }, + { + "epoch": 1.7, + "learning_rate": 8.337838502838325e-07, + "loss": 0.5271, + "step": 66315 + }, + { + "epoch": 1.7, + "learning_rate": 8.33756564807776e-07, + "loss": 0.6099, + "step": 66316 + }, + { + "epoch": 1.7, + "learning_rate": 8.337292794590044e-07, + "loss": 0.6309, + "step": 66317 + }, + { + "epoch": 1.7, + "learning_rate": 8.337019942375387e-07, + "loss": 0.615, + "step": 66318 + }, + { + "epoch": 1.7, + "learning_rate": 8.336747091433996e-07, + "loss": 0.6055, + "step": 66319 + }, + { + "epoch": 1.7, + "learning_rate": 8.336474241766085e-07, + "loss": 0.7173, + "step": 66320 + }, + { + "epoch": 1.7, + "learning_rate": 8.336201393371855e-07, + "loss": 0.5469, + "step": 66321 + }, + { + "epoch": 1.7, + "learning_rate": 8.335928546251522e-07, + "loss": 0.5815, + "step": 66322 + }, + { + "epoch": 1.7, + "learning_rate": 8.335655700405289e-07, + "loss": 0.5942, + "step": 66323 + }, + { + "epoch": 1.7, + "learning_rate": 8.335382855833371e-07, + "loss": 0.4219, + "step": 66324 + }, + { + "epoch": 1.7, + "learning_rate": 8.335110012535976e-07, + "loss": 0.5732, + "step": 66325 + }, + { + "epoch": 1.7, + "learning_rate": 8.334837170513306e-07, + "loss": 0.5283, + "step": 66326 + }, + { + "epoch": 1.7, + "learning_rate": 8.334564329765577e-07, + "loss": 0.6157, + "step": 66327 + }, + { + "epoch": 1.7, + "learning_rate": 8.334291490292993e-07, + "loss": 0.6704, + "step": 66328 + }, + { + "epoch": 1.7, + "learning_rate": 8.334018652095767e-07, + "loss": 0.7344, + "step": 66329 + }, + { + "epoch": 1.7, + "learning_rate": 8.333745815174106e-07, + "loss": 0.6963, + "step": 66330 + }, + { + "epoch": 1.7, + "learning_rate": 8.33347297952822e-07, + "loss": 0.7842, + "step": 66331 + }, + { + "epoch": 1.7, + "learning_rate": 8.333200145158314e-07, + "loss": 0.6211, + "step": 66332 + }, + { + "epoch": 1.7, + "learning_rate": 8.332927312064604e-07, + "loss": 0.5425, + "step": 66333 + }, + { + "epoch": 1.7, + "learning_rate": 8.332654480247294e-07, + "loss": 0.582, + "step": 66334 + }, + { + "epoch": 1.7, + "learning_rate": 8.332381649706597e-07, + "loss": 0.6138, + "step": 66335 + }, + { + "epoch": 1.7, + "learning_rate": 8.332108820442713e-07, + "loss": 0.5532, + "step": 66336 + }, + { + "epoch": 1.7, + "learning_rate": 8.33183599245586e-07, + "loss": 0.6396, + "step": 66337 + }, + { + "epoch": 1.7, + "learning_rate": 8.33156316574624e-07, + "loss": 0.6182, + "step": 66338 + }, + { + "epoch": 1.7, + "learning_rate": 8.331290340314069e-07, + "loss": 0.6199, + "step": 66339 + }, + { + "epoch": 1.7, + "learning_rate": 8.331017516159549e-07, + "loss": 0.5896, + "step": 66340 + }, + { + "epoch": 1.7, + "learning_rate": 8.330744693282895e-07, + "loss": 0.7666, + "step": 66341 + }, + { + "epoch": 1.7, + "learning_rate": 8.33047187168431e-07, + "loss": 0.5298, + "step": 66342 + }, + { + "epoch": 1.7, + "learning_rate": 8.330199051364009e-07, + "loss": 0.6885, + "step": 66343 + }, + { + "epoch": 1.7, + "learning_rate": 8.329926232322195e-07, + "loss": 0.5991, + "step": 66344 + }, + { + "epoch": 1.7, + "learning_rate": 8.329653414559085e-07, + "loss": 0.6113, + "step": 66345 + }, + { + "epoch": 1.7, + "learning_rate": 8.329380598074878e-07, + "loss": 0.6963, + "step": 66346 + }, + { + "epoch": 1.7, + "learning_rate": 8.329107782869787e-07, + "loss": 0.6895, + "step": 66347 + }, + { + "epoch": 1.7, + "learning_rate": 8.328834968944024e-07, + "loss": 0.751, + "step": 66348 + }, + { + "epoch": 1.7, + "learning_rate": 8.328562156297793e-07, + "loss": 0.7109, + "step": 66349 + }, + { + "epoch": 1.7, + "learning_rate": 8.328289344931306e-07, + "loss": 0.6396, + "step": 66350 + }, + { + "epoch": 1.7, + "learning_rate": 8.328016534844773e-07, + "loss": 0.4336, + "step": 66351 + }, + { + "epoch": 1.7, + "learning_rate": 8.327743726038396e-07, + "loss": 0.5508, + "step": 66352 + }, + { + "epoch": 1.7, + "learning_rate": 8.327470918512393e-07, + "loss": 0.4797, + "step": 66353 + }, + { + "epoch": 1.7, + "learning_rate": 8.327198112266967e-07, + "loss": 0.6216, + "step": 66354 + }, + { + "epoch": 1.7, + "learning_rate": 8.32692530730233e-07, + "loss": 0.6318, + "step": 66355 + }, + { + "epoch": 1.7, + "learning_rate": 8.326652503618689e-07, + "loss": 0.9189, + "step": 66356 + }, + { + "epoch": 1.7, + "learning_rate": 8.326379701216251e-07, + "loss": 0.5366, + "step": 66357 + }, + { + "epoch": 1.7, + "learning_rate": 8.326106900095229e-07, + "loss": 0.7793, + "step": 66358 + }, + { + "epoch": 1.7, + "learning_rate": 8.325834100255829e-07, + "loss": 0.7358, + "step": 66359 + }, + { + "epoch": 1.7, + "learning_rate": 8.325561301698262e-07, + "loss": 0.5986, + "step": 66360 + }, + { + "epoch": 1.7, + "learning_rate": 8.325288504422733e-07, + "loss": 0.6514, + "step": 66361 + }, + { + "epoch": 1.7, + "learning_rate": 8.325015708429455e-07, + "loss": 0.8203, + "step": 66362 + }, + { + "epoch": 1.7, + "learning_rate": 8.324742913718637e-07, + "loss": 0.667, + "step": 66363 + }, + { + "epoch": 1.7, + "learning_rate": 8.324470120290485e-07, + "loss": 0.4736, + "step": 66364 + }, + { + "epoch": 1.7, + "learning_rate": 8.324197328145212e-07, + "loss": 0.387, + "step": 66365 + }, + { + "epoch": 1.7, + "learning_rate": 8.32392453728302e-07, + "loss": 0.7422, + "step": 66366 + }, + { + "epoch": 1.7, + "learning_rate": 8.323651747704124e-07, + "loss": 0.7949, + "step": 66367 + }, + { + "epoch": 1.7, + "learning_rate": 8.323378959408731e-07, + "loss": 0.6748, + "step": 66368 + }, + { + "epoch": 1.7, + "learning_rate": 8.323106172397047e-07, + "loss": 0.6816, + "step": 66369 + }, + { + "epoch": 1.7, + "learning_rate": 8.322833386669288e-07, + "loss": 0.6084, + "step": 66370 + }, + { + "epoch": 1.7, + "learning_rate": 8.322560602225653e-07, + "loss": 0.4545, + "step": 66371 + }, + { + "epoch": 1.7, + "learning_rate": 8.322287819066361e-07, + "loss": 0.7266, + "step": 66372 + }, + { + "epoch": 1.7, + "learning_rate": 8.322015037191613e-07, + "loss": 0.6416, + "step": 66373 + }, + { + "epoch": 1.7, + "learning_rate": 8.321742256601622e-07, + "loss": 0.6245, + "step": 66374 + }, + { + "epoch": 1.7, + "learning_rate": 8.321469477296599e-07, + "loss": 0.5356, + "step": 66375 + }, + { + "epoch": 1.7, + "learning_rate": 8.321196699276744e-07, + "loss": 0.6157, + "step": 66376 + }, + { + "epoch": 1.7, + "learning_rate": 8.320923922542275e-07, + "loss": 0.5261, + "step": 66377 + }, + { + "epoch": 1.7, + "learning_rate": 8.320651147093395e-07, + "loss": 0.6143, + "step": 66378 + }, + { + "epoch": 1.7, + "learning_rate": 8.320378372930317e-07, + "loss": 0.5, + "step": 66379 + }, + { + "epoch": 1.7, + "learning_rate": 8.320105600053246e-07, + "loss": 0.5952, + "step": 66380 + }, + { + "epoch": 1.7, + "learning_rate": 8.319832828462396e-07, + "loss": 0.5396, + "step": 66381 + }, + { + "epoch": 1.7, + "learning_rate": 8.319560058157968e-07, + "loss": 0.5544, + "step": 66382 + }, + { + "epoch": 1.7, + "learning_rate": 8.31928728914018e-07, + "loss": 0.6484, + "step": 66383 + }, + { + "epoch": 1.7, + "learning_rate": 8.319014521409233e-07, + "loss": 0.668, + "step": 66384 + }, + { + "epoch": 1.7, + "learning_rate": 8.318741754965347e-07, + "loss": 0.6416, + "step": 66385 + }, + { + "epoch": 1.7, + "learning_rate": 8.318468989808717e-07, + "loss": 0.5928, + "step": 66386 + }, + { + "epoch": 1.7, + "learning_rate": 8.318196225939559e-07, + "loss": 0.6772, + "step": 66387 + }, + { + "epoch": 1.7, + "learning_rate": 8.317923463358079e-07, + "loss": 0.6274, + "step": 66388 + }, + { + "epoch": 1.7, + "learning_rate": 8.317650702064489e-07, + "loss": 0.6953, + "step": 66389 + }, + { + "epoch": 1.7, + "learning_rate": 8.317377942058996e-07, + "loss": 0.7598, + "step": 66390 + }, + { + "epoch": 1.7, + "learning_rate": 8.31710518334181e-07, + "loss": 0.7148, + "step": 66391 + }, + { + "epoch": 1.7, + "learning_rate": 8.316832425913138e-07, + "loss": 0.4584, + "step": 66392 + }, + { + "epoch": 1.7, + "learning_rate": 8.316559669773192e-07, + "loss": 0.5938, + "step": 66393 + }, + { + "epoch": 1.7, + "learning_rate": 8.316286914922176e-07, + "loss": 0.6943, + "step": 66394 + }, + { + "epoch": 1.7, + "learning_rate": 8.316014161360307e-07, + "loss": 0.5215, + "step": 66395 + }, + { + "epoch": 1.7, + "learning_rate": 8.315741409087785e-07, + "loss": 0.7598, + "step": 66396 + }, + { + "epoch": 1.7, + "learning_rate": 8.315468658104822e-07, + "loss": 0.834, + "step": 66397 + }, + { + "epoch": 1.7, + "learning_rate": 8.315195908411628e-07, + "loss": 0.5508, + "step": 66398 + }, + { + "epoch": 1.7, + "learning_rate": 8.314923160008409e-07, + "loss": 0.5664, + "step": 66399 + }, + { + "epoch": 1.7, + "learning_rate": 8.314650412895379e-07, + "loss": 0.5879, + "step": 66400 + }, + { + "epoch": 1.7, + "learning_rate": 8.314377667072741e-07, + "loss": 0.6631, + "step": 66401 + }, + { + "epoch": 1.7, + "learning_rate": 8.314104922540708e-07, + "loss": 0.6462, + "step": 66402 + }, + { + "epoch": 1.7, + "learning_rate": 8.313832179299486e-07, + "loss": 0.6719, + "step": 66403 + }, + { + "epoch": 1.7, + "learning_rate": 8.313559437349287e-07, + "loss": 0.626, + "step": 66404 + }, + { + "epoch": 1.7, + "learning_rate": 8.313286696690321e-07, + "loss": 0.6172, + "step": 66405 + }, + { + "epoch": 1.7, + "learning_rate": 8.31301395732279e-07, + "loss": 0.6035, + "step": 66406 + }, + { + "epoch": 1.7, + "learning_rate": 8.312741219246904e-07, + "loss": 0.8047, + "step": 66407 + }, + { + "epoch": 1.7, + "learning_rate": 8.312468482462878e-07, + "loss": 0.6348, + "step": 66408 + }, + { + "epoch": 1.7, + "learning_rate": 8.312195746970915e-07, + "loss": 0.709, + "step": 66409 + }, + { + "epoch": 1.7, + "learning_rate": 8.311923012771229e-07, + "loss": 0.4673, + "step": 66410 + }, + { + "epoch": 1.7, + "learning_rate": 8.311650279864024e-07, + "loss": 0.6836, + "step": 66411 + }, + { + "epoch": 1.7, + "learning_rate": 8.311377548249511e-07, + "loss": 0.6592, + "step": 66412 + }, + { + "epoch": 1.7, + "learning_rate": 8.311104817927899e-07, + "loss": 0.7109, + "step": 66413 + }, + { + "epoch": 1.7, + "learning_rate": 8.310832088899396e-07, + "loss": 0.7207, + "step": 66414 + }, + { + "epoch": 1.7, + "learning_rate": 8.310559361164214e-07, + "loss": 0.5381, + "step": 66415 + }, + { + "epoch": 1.7, + "learning_rate": 8.310286634722556e-07, + "loss": 0.5063, + "step": 66416 + }, + { + "epoch": 1.7, + "learning_rate": 8.310013909574634e-07, + "loss": 0.6045, + "step": 66417 + }, + { + "epoch": 1.7, + "learning_rate": 8.309741185720656e-07, + "loss": 0.7134, + "step": 66418 + }, + { + "epoch": 1.7, + "learning_rate": 8.309468463160833e-07, + "loss": 0.7598, + "step": 66419 + }, + { + "epoch": 1.7, + "learning_rate": 8.30919574189537e-07, + "loss": 0.4785, + "step": 66420 + }, + { + "epoch": 1.7, + "learning_rate": 8.308923021924481e-07, + "loss": 0.448, + "step": 66421 + }, + { + "epoch": 1.7, + "learning_rate": 8.308650303248369e-07, + "loss": 0.519, + "step": 66422 + }, + { + "epoch": 1.7, + "learning_rate": 8.308377585867248e-07, + "loss": 0.7393, + "step": 66423 + }, + { + "epoch": 1.7, + "learning_rate": 8.308104869781324e-07, + "loss": 0.5415, + "step": 66424 + }, + { + "epoch": 1.7, + "learning_rate": 8.30783215499081e-07, + "loss": 0.5303, + "step": 66425 + }, + { + "epoch": 1.7, + "learning_rate": 8.307559441495905e-07, + "loss": 0.6846, + "step": 66426 + }, + { + "epoch": 1.7, + "learning_rate": 8.307286729296827e-07, + "loss": 0.4192, + "step": 66427 + }, + { + "epoch": 1.7, + "learning_rate": 8.307014018393778e-07, + "loss": 0.6143, + "step": 66428 + }, + { + "epoch": 1.7, + "learning_rate": 8.306741308786975e-07, + "loss": 0.5312, + "step": 66429 + }, + { + "epoch": 1.7, + "learning_rate": 8.306468600476619e-07, + "loss": 0.6826, + "step": 66430 + }, + { + "epoch": 1.7, + "learning_rate": 8.306195893462925e-07, + "loss": 0.6367, + "step": 66431 + }, + { + "epoch": 1.7, + "learning_rate": 8.305923187746096e-07, + "loss": 0.5889, + "step": 66432 + }, + { + "epoch": 1.7, + "learning_rate": 8.305650483326346e-07, + "loss": 0.689, + "step": 66433 + }, + { + "epoch": 1.7, + "learning_rate": 8.30537778020388e-07, + "loss": 0.7246, + "step": 66434 + }, + { + "epoch": 1.7, + "learning_rate": 8.305105078378913e-07, + "loss": 0.7607, + "step": 66435 + }, + { + "epoch": 1.7, + "learning_rate": 8.304832377851645e-07, + "loss": 0.7002, + "step": 66436 + }, + { + "epoch": 1.7, + "learning_rate": 8.304559678622288e-07, + "loss": 0.7349, + "step": 66437 + }, + { + "epoch": 1.7, + "learning_rate": 8.304286980691054e-07, + "loss": 0.5635, + "step": 66438 + }, + { + "epoch": 1.7, + "learning_rate": 8.304014284058148e-07, + "loss": 0.7656, + "step": 66439 + }, + { + "epoch": 1.7, + "learning_rate": 8.303741588723781e-07, + "loss": 0.7656, + "step": 66440 + }, + { + "epoch": 1.7, + "learning_rate": 8.303468894688162e-07, + "loss": 0.585, + "step": 66441 + }, + { + "epoch": 1.7, + "learning_rate": 8.303196201951495e-07, + "loss": 0.6655, + "step": 66442 + }, + { + "epoch": 1.7, + "learning_rate": 8.302923510513996e-07, + "loss": 0.5771, + "step": 66443 + }, + { + "epoch": 1.7, + "learning_rate": 8.30265082037587e-07, + "loss": 0.7119, + "step": 66444 + }, + { + "epoch": 1.7, + "learning_rate": 8.302378131537327e-07, + "loss": 0.6582, + "step": 66445 + }, + { + "epoch": 1.7, + "learning_rate": 8.302105443998575e-07, + "loss": 0.4797, + "step": 66446 + }, + { + "epoch": 1.7, + "learning_rate": 8.301832757759821e-07, + "loss": 0.5923, + "step": 66447 + }, + { + "epoch": 1.7, + "learning_rate": 8.301560072821276e-07, + "loss": 0.5674, + "step": 66448 + }, + { + "epoch": 1.7, + "learning_rate": 8.301287389183149e-07, + "loss": 0.6797, + "step": 66449 + }, + { + "epoch": 1.7, + "learning_rate": 8.301014706845649e-07, + "loss": 0.6182, + "step": 66450 + }, + { + "epoch": 1.7, + "learning_rate": 8.30074202580898e-07, + "loss": 0.4524, + "step": 66451 + }, + { + "epoch": 1.7, + "learning_rate": 8.300469346073357e-07, + "loss": 0.5962, + "step": 66452 + }, + { + "epoch": 1.7, + "learning_rate": 8.300196667638986e-07, + "loss": 0.665, + "step": 66453 + }, + { + "epoch": 1.7, + "learning_rate": 8.299923990506079e-07, + "loss": 0.7139, + "step": 66454 + }, + { + "epoch": 1.7, + "learning_rate": 8.299651314674843e-07, + "loss": 0.7793, + "step": 66455 + }, + { + "epoch": 1.7, + "learning_rate": 8.299378640145481e-07, + "loss": 0.6309, + "step": 66456 + }, + { + "epoch": 1.7, + "learning_rate": 8.299105966918209e-07, + "loss": 0.7725, + "step": 66457 + }, + { + "epoch": 1.7, + "learning_rate": 8.298833294993235e-07, + "loss": 0.8096, + "step": 66458 + }, + { + "epoch": 1.7, + "learning_rate": 8.298560624370762e-07, + "loss": 0.6924, + "step": 66459 + }, + { + "epoch": 1.7, + "learning_rate": 8.298287955051005e-07, + "loss": 0.5662, + "step": 66460 + }, + { + "epoch": 1.7, + "learning_rate": 8.29801528703417e-07, + "loss": 0.5518, + "step": 66461 + }, + { + "epoch": 1.7, + "learning_rate": 8.297742620320468e-07, + "loss": 0.5962, + "step": 66462 + }, + { + "epoch": 1.7, + "learning_rate": 8.297469954910104e-07, + "loss": 0.5391, + "step": 66463 + }, + { + "epoch": 1.7, + "learning_rate": 8.297197290803291e-07, + "loss": 0.6069, + "step": 66464 + }, + { + "epoch": 1.7, + "learning_rate": 8.296924628000237e-07, + "loss": 0.5216, + "step": 66465 + }, + { + "epoch": 1.7, + "learning_rate": 8.296651966501147e-07, + "loss": 0.729, + "step": 66466 + }, + { + "epoch": 1.7, + "learning_rate": 8.296379306306232e-07, + "loss": 0.4922, + "step": 66467 + }, + { + "epoch": 1.7, + "learning_rate": 8.296106647415701e-07, + "loss": 0.626, + "step": 66468 + }, + { + "epoch": 1.7, + "learning_rate": 8.295833989829764e-07, + "loss": 0.625, + "step": 66469 + }, + { + "epoch": 1.7, + "learning_rate": 8.295561333548627e-07, + "loss": 0.5503, + "step": 66470 + }, + { + "epoch": 1.7, + "learning_rate": 8.295288678572502e-07, + "loss": 0.7422, + "step": 66471 + }, + { + "epoch": 1.7, + "learning_rate": 8.295016024901595e-07, + "loss": 0.522, + "step": 66472 + }, + { + "epoch": 1.7, + "learning_rate": 8.294743372536118e-07, + "loss": 0.6387, + "step": 66473 + }, + { + "epoch": 1.7, + "learning_rate": 8.294470721476273e-07, + "loss": 0.4585, + "step": 66474 + }, + { + "epoch": 1.7, + "learning_rate": 8.294198071722282e-07, + "loss": 0.522, + "step": 66475 + }, + { + "epoch": 1.7, + "learning_rate": 8.293925423274337e-07, + "loss": 0.5989, + "step": 66476 + }, + { + "epoch": 1.7, + "learning_rate": 8.293652776132658e-07, + "loss": 0.7544, + "step": 66477 + }, + { + "epoch": 1.7, + "learning_rate": 8.293380130297449e-07, + "loss": 0.7021, + "step": 66478 + }, + { + "epoch": 1.7, + "learning_rate": 8.293107485768922e-07, + "loss": 0.488, + "step": 66479 + }, + { + "epoch": 1.7, + "learning_rate": 8.292834842547282e-07, + "loss": 0.7559, + "step": 66480 + }, + { + "epoch": 1.7, + "learning_rate": 8.292562200632742e-07, + "loss": 0.7275, + "step": 66481 + }, + { + "epoch": 1.7, + "learning_rate": 8.292289560025506e-07, + "loss": 0.6504, + "step": 66482 + }, + { + "epoch": 1.7, + "learning_rate": 8.292016920725788e-07, + "loss": 0.7041, + "step": 66483 + }, + { + "epoch": 1.7, + "learning_rate": 8.291744282733792e-07, + "loss": 0.5798, + "step": 66484 + }, + { + "epoch": 1.7, + "learning_rate": 8.291471646049733e-07, + "loss": 0.5444, + "step": 66485 + }, + { + "epoch": 1.7, + "learning_rate": 8.291199010673813e-07, + "loss": 0.6514, + "step": 66486 + }, + { + "epoch": 1.7, + "learning_rate": 8.290926376606242e-07, + "loss": 0.4392, + "step": 66487 + }, + { + "epoch": 1.7, + "learning_rate": 8.290653743847231e-07, + "loss": 0.5269, + "step": 66488 + }, + { + "epoch": 1.7, + "learning_rate": 8.290381112396987e-07, + "loss": 0.6562, + "step": 66489 + }, + { + "epoch": 1.7, + "learning_rate": 8.290108482255722e-07, + "loss": 0.6709, + "step": 66490 + }, + { + "epoch": 1.7, + "learning_rate": 8.289835853423639e-07, + "loss": 0.4834, + "step": 66491 + }, + { + "epoch": 1.7, + "learning_rate": 8.289563225900953e-07, + "loss": 0.667, + "step": 66492 + }, + { + "epoch": 1.7, + "learning_rate": 8.289290599687867e-07, + "loss": 0.7275, + "step": 66493 + }, + { + "epoch": 1.7, + "learning_rate": 8.289017974784599e-07, + "loss": 0.7402, + "step": 66494 + }, + { + "epoch": 1.7, + "learning_rate": 8.288745351191345e-07, + "loss": 0.5195, + "step": 66495 + }, + { + "epoch": 1.7, + "learning_rate": 8.288472728908322e-07, + "loss": 0.7114, + "step": 66496 + }, + { + "epoch": 1.7, + "learning_rate": 8.288200107935736e-07, + "loss": 0.5796, + "step": 66497 + }, + { + "epoch": 1.7, + "learning_rate": 8.287927488273797e-07, + "loss": 0.5781, + "step": 66498 + }, + { + "epoch": 1.7, + "learning_rate": 8.287654869922711e-07, + "loss": 0.6318, + "step": 66499 + }, + { + "epoch": 1.7, + "learning_rate": 8.287382252882692e-07, + "loss": 0.7935, + "step": 66500 + }, + { + "epoch": 1.7, + "learning_rate": 8.287109637153942e-07, + "loss": 0.3816, + "step": 66501 + }, + { + "epoch": 1.7, + "learning_rate": 8.286837022736678e-07, + "loss": 0.6562, + "step": 66502 + }, + { + "epoch": 1.7, + "learning_rate": 8.286564409631101e-07, + "loss": 0.5605, + "step": 66503 + }, + { + "epoch": 1.7, + "learning_rate": 8.286291797837426e-07, + "loss": 0.5269, + "step": 66504 + }, + { + "epoch": 1.7, + "learning_rate": 8.286019187355857e-07, + "loss": 0.6279, + "step": 66505 + }, + { + "epoch": 1.7, + "learning_rate": 8.285746578186602e-07, + "loss": 0.6162, + "step": 66506 + }, + { + "epoch": 1.7, + "learning_rate": 8.285473970329875e-07, + "loss": 0.603, + "step": 66507 + }, + { + "epoch": 1.7, + "learning_rate": 8.285201363785879e-07, + "loss": 0.7646, + "step": 66508 + }, + { + "epoch": 1.7, + "learning_rate": 8.284928758554828e-07, + "loss": 0.563, + "step": 66509 + }, + { + "epoch": 1.7, + "learning_rate": 8.284656154636925e-07, + "loss": 0.6841, + "step": 66510 + }, + { + "epoch": 1.7, + "learning_rate": 8.284383552032386e-07, + "loss": 0.7178, + "step": 66511 + }, + { + "epoch": 1.7, + "learning_rate": 8.284110950741411e-07, + "loss": 0.4133, + "step": 66512 + }, + { + "epoch": 1.7, + "learning_rate": 8.283838350764217e-07, + "loss": 0.7461, + "step": 66513 + }, + { + "epoch": 1.7, + "learning_rate": 8.283565752101011e-07, + "loss": 0.8242, + "step": 66514 + }, + { + "epoch": 1.7, + "learning_rate": 8.283293154751998e-07, + "loss": 0.6777, + "step": 66515 + }, + { + "epoch": 1.7, + "learning_rate": 8.283020558717386e-07, + "loss": 0.6211, + "step": 66516 + }, + { + "epoch": 1.7, + "learning_rate": 8.282747963997387e-07, + "loss": 0.6533, + "step": 66517 + }, + { + "epoch": 1.7, + "learning_rate": 8.282475370592209e-07, + "loss": 0.479, + "step": 66518 + }, + { + "epoch": 1.7, + "learning_rate": 8.282202778502062e-07, + "loss": 0.5439, + "step": 66519 + }, + { + "epoch": 1.7, + "learning_rate": 8.281930187727151e-07, + "loss": 0.5776, + "step": 66520 + }, + { + "epoch": 1.7, + "learning_rate": 8.281657598267689e-07, + "loss": 0.5366, + "step": 66521 + }, + { + "epoch": 1.7, + "learning_rate": 8.281385010123881e-07, + "loss": 0.6738, + "step": 66522 + }, + { + "epoch": 1.71, + "learning_rate": 8.281112423295939e-07, + "loss": 0.541, + "step": 66523 + }, + { + "epoch": 1.71, + "learning_rate": 8.280839837784074e-07, + "loss": 0.6006, + "step": 66524 + }, + { + "epoch": 1.71, + "learning_rate": 8.280567253588485e-07, + "loss": 0.6113, + "step": 66525 + }, + { + "epoch": 1.71, + "learning_rate": 8.280294670709389e-07, + "loss": 0.583, + "step": 66526 + }, + { + "epoch": 1.71, + "learning_rate": 8.280022089146989e-07, + "loss": 0.5581, + "step": 66527 + }, + { + "epoch": 1.71, + "learning_rate": 8.279749508901501e-07, + "loss": 0.582, + "step": 66528 + }, + { + "epoch": 1.71, + "learning_rate": 8.279476929973128e-07, + "loss": 0.6934, + "step": 66529 + }, + { + "epoch": 1.71, + "learning_rate": 8.279204352362081e-07, + "loss": 0.4775, + "step": 66530 + }, + { + "epoch": 1.71, + "learning_rate": 8.278931776068569e-07, + "loss": 0.6709, + "step": 66531 + }, + { + "epoch": 1.71, + "learning_rate": 8.278659201092797e-07, + "loss": 0.5078, + "step": 66532 + }, + { + "epoch": 1.71, + "learning_rate": 8.278386627434979e-07, + "loss": 0.6162, + "step": 66533 + }, + { + "epoch": 1.71, + "learning_rate": 8.278114055095324e-07, + "loss": 0.7607, + "step": 66534 + }, + { + "epoch": 1.71, + "learning_rate": 8.277841484074033e-07, + "loss": 0.5205, + "step": 66535 + }, + { + "epoch": 1.71, + "learning_rate": 8.277568914371322e-07, + "loss": 0.666, + "step": 66536 + }, + { + "epoch": 1.71, + "learning_rate": 8.277296345987395e-07, + "loss": 0.8135, + "step": 66537 + }, + { + "epoch": 1.71, + "learning_rate": 8.277023778922464e-07, + "loss": 0.6646, + "step": 66538 + }, + { + "epoch": 1.71, + "learning_rate": 8.276751213176736e-07, + "loss": 0.4399, + "step": 66539 + }, + { + "epoch": 1.71, + "learning_rate": 8.276478648750421e-07, + "loss": 0.4668, + "step": 66540 + }, + { + "epoch": 1.71, + "learning_rate": 8.276206085643727e-07, + "loss": 0.7637, + "step": 66541 + }, + { + "epoch": 1.71, + "learning_rate": 8.275933523856862e-07, + "loss": 0.7617, + "step": 66542 + }, + { + "epoch": 1.71, + "learning_rate": 8.275660963390035e-07, + "loss": 0.6863, + "step": 66543 + }, + { + "epoch": 1.71, + "learning_rate": 8.275388404243459e-07, + "loss": 0.7061, + "step": 66544 + }, + { + "epoch": 1.71, + "learning_rate": 8.275115846417338e-07, + "loss": 0.7988, + "step": 66545 + }, + { + "epoch": 1.71, + "learning_rate": 8.274843289911879e-07, + "loss": 0.6421, + "step": 66546 + }, + { + "epoch": 1.71, + "learning_rate": 8.274570734727295e-07, + "loss": 0.7441, + "step": 66547 + }, + { + "epoch": 1.71, + "learning_rate": 8.274298180863792e-07, + "loss": 0.6084, + "step": 66548 + }, + { + "epoch": 1.71, + "learning_rate": 8.274025628321578e-07, + "loss": 0.6113, + "step": 66549 + }, + { + "epoch": 1.71, + "learning_rate": 8.273753077100865e-07, + "loss": 0.5215, + "step": 66550 + }, + { + "epoch": 1.71, + "learning_rate": 8.273480527201858e-07, + "loss": 0.709, + "step": 66551 + }, + { + "epoch": 1.71, + "learning_rate": 8.27320797862477e-07, + "loss": 0.7383, + "step": 66552 + }, + { + "epoch": 1.71, + "learning_rate": 8.272935431369806e-07, + "loss": 0.7168, + "step": 66553 + }, + { + "epoch": 1.71, + "learning_rate": 8.272662885437179e-07, + "loss": 0.7568, + "step": 66554 + }, + { + "epoch": 1.71, + "learning_rate": 8.272390340827091e-07, + "loss": 0.7119, + "step": 66555 + }, + { + "epoch": 1.71, + "learning_rate": 8.272117797539755e-07, + "loss": 0.7026, + "step": 66556 + }, + { + "epoch": 1.71, + "learning_rate": 8.271845255575379e-07, + "loss": 0.6758, + "step": 66557 + }, + { + "epoch": 1.71, + "learning_rate": 8.27157271493417e-07, + "loss": 0.6641, + "step": 66558 + }, + { + "epoch": 1.71, + "learning_rate": 8.271300175616341e-07, + "loss": 0.4893, + "step": 66559 + }, + { + "epoch": 1.71, + "learning_rate": 8.271027637622095e-07, + "loss": 0.7344, + "step": 66560 + }, + { + "epoch": 1.71, + "learning_rate": 8.270755100951648e-07, + "loss": 0.5344, + "step": 66561 + }, + { + "epoch": 1.71, + "learning_rate": 8.270482565605199e-07, + "loss": 0.6572, + "step": 66562 + }, + { + "epoch": 1.71, + "learning_rate": 8.270210031582966e-07, + "loss": 0.624, + "step": 66563 + }, + { + "epoch": 1.71, + "learning_rate": 8.269937498885156e-07, + "loss": 0.6357, + "step": 66564 + }, + { + "epoch": 1.71, + "learning_rate": 8.269664967511972e-07, + "loss": 0.75, + "step": 66565 + }, + { + "epoch": 1.71, + "learning_rate": 8.269392437463625e-07, + "loss": 0.5015, + "step": 66566 + }, + { + "epoch": 1.71, + "learning_rate": 8.269119908740325e-07, + "loss": 0.5134, + "step": 66567 + }, + { + "epoch": 1.71, + "learning_rate": 8.26884738134228e-07, + "loss": 0.5486, + "step": 66568 + }, + { + "epoch": 1.71, + "learning_rate": 8.2685748552697e-07, + "loss": 0.7236, + "step": 66569 + }, + { + "epoch": 1.71, + "learning_rate": 8.268302330522791e-07, + "loss": 0.6216, + "step": 66570 + }, + { + "epoch": 1.71, + "learning_rate": 8.268029807101765e-07, + "loss": 0.5798, + "step": 66571 + }, + { + "epoch": 1.71, + "learning_rate": 8.267757285006828e-07, + "loss": 0.7036, + "step": 66572 + }, + { + "epoch": 1.71, + "learning_rate": 8.26748476423819e-07, + "loss": 0.5229, + "step": 66573 + }, + { + "epoch": 1.71, + "learning_rate": 8.267212244796062e-07, + "loss": 0.7134, + "step": 66574 + }, + { + "epoch": 1.71, + "learning_rate": 8.266939726680646e-07, + "loss": 0.5781, + "step": 66575 + }, + { + "epoch": 1.71, + "learning_rate": 8.266667209892157e-07, + "loss": 0.6748, + "step": 66576 + }, + { + "epoch": 1.71, + "learning_rate": 8.266394694430798e-07, + "loss": 0.6724, + "step": 66577 + }, + { + "epoch": 1.71, + "learning_rate": 8.266122180296784e-07, + "loss": 0.7158, + "step": 66578 + }, + { + "epoch": 1.71, + "learning_rate": 8.265849667490319e-07, + "loss": 0.6975, + "step": 66579 + }, + { + "epoch": 1.71, + "learning_rate": 8.265577156011614e-07, + "loss": 0.6836, + "step": 66580 + }, + { + "epoch": 1.71, + "learning_rate": 8.265304645860874e-07, + "loss": 0.6187, + "step": 66581 + }, + { + "epoch": 1.71, + "learning_rate": 8.265032137038315e-07, + "loss": 0.584, + "step": 66582 + }, + { + "epoch": 1.71, + "learning_rate": 8.264759629544136e-07, + "loss": 0.5518, + "step": 66583 + }, + { + "epoch": 1.71, + "learning_rate": 8.26448712337856e-07, + "loss": 0.4969, + "step": 66584 + }, + { + "epoch": 1.71, + "learning_rate": 8.264214618541778e-07, + "loss": 0.6348, + "step": 66585 + }, + { + "epoch": 1.71, + "learning_rate": 8.26394211503401e-07, + "loss": 0.7974, + "step": 66586 + }, + { + "epoch": 1.71, + "learning_rate": 8.26366961285546e-07, + "loss": 0.5469, + "step": 66587 + }, + { + "epoch": 1.71, + "learning_rate": 8.26339711200634e-07, + "loss": 0.7725, + "step": 66588 + }, + { + "epoch": 1.71, + "learning_rate": 8.263124612486855e-07, + "loss": 0.6924, + "step": 66589 + }, + { + "epoch": 1.71, + "learning_rate": 8.262852114297217e-07, + "loss": 0.7285, + "step": 66590 + }, + { + "epoch": 1.71, + "learning_rate": 8.262579617437633e-07, + "loss": 0.6294, + "step": 66591 + }, + { + "epoch": 1.71, + "learning_rate": 8.262307121908312e-07, + "loss": 0.6104, + "step": 66592 + }, + { + "epoch": 1.71, + "learning_rate": 8.262034627709461e-07, + "loss": 0.5181, + "step": 66593 + }, + { + "epoch": 1.71, + "learning_rate": 8.261762134841294e-07, + "loss": 0.4778, + "step": 66594 + }, + { + "epoch": 1.71, + "learning_rate": 8.261489643304015e-07, + "loss": 0.5908, + "step": 66595 + }, + { + "epoch": 1.71, + "learning_rate": 8.26121715309783e-07, + "loss": 0.646, + "step": 66596 + }, + { + "epoch": 1.71, + "learning_rate": 8.260944664222955e-07, + "loss": 0.7471, + "step": 66597 + }, + { + "epoch": 1.71, + "learning_rate": 8.260672176679591e-07, + "loss": 0.6362, + "step": 66598 + }, + { + "epoch": 1.71, + "learning_rate": 8.260399690467953e-07, + "loss": 0.6685, + "step": 66599 + }, + { + "epoch": 1.71, + "learning_rate": 8.260127205588245e-07, + "loss": 0.7036, + "step": 66600 + }, + { + "epoch": 1.71, + "learning_rate": 8.259854722040679e-07, + "loss": 0.4072, + "step": 66601 + }, + { + "epoch": 1.71, + "learning_rate": 8.25958223982546e-07, + "loss": 0.5415, + "step": 66602 + }, + { + "epoch": 1.71, + "learning_rate": 8.259309758942802e-07, + "loss": 0.3787, + "step": 66603 + }, + { + "epoch": 1.71, + "learning_rate": 8.259037279392912e-07, + "loss": 0.5298, + "step": 66604 + }, + { + "epoch": 1.71, + "learning_rate": 8.258764801175994e-07, + "loss": 0.7158, + "step": 66605 + }, + { + "epoch": 1.71, + "learning_rate": 8.25849232429226e-07, + "loss": 0.7261, + "step": 66606 + }, + { + "epoch": 1.71, + "learning_rate": 8.258219848741918e-07, + "loss": 0.5869, + "step": 66607 + }, + { + "epoch": 1.71, + "learning_rate": 8.257947374525177e-07, + "loss": 0.6973, + "step": 66608 + }, + { + "epoch": 1.71, + "learning_rate": 8.257674901642247e-07, + "loss": 0.7041, + "step": 66609 + }, + { + "epoch": 1.71, + "learning_rate": 8.257402430093332e-07, + "loss": 0.6133, + "step": 66610 + }, + { + "epoch": 1.71, + "learning_rate": 8.257129959878647e-07, + "loss": 0.6406, + "step": 66611 + }, + { + "epoch": 1.71, + "learning_rate": 8.256857490998394e-07, + "loss": 0.366, + "step": 66612 + }, + { + "epoch": 1.71, + "learning_rate": 8.256585023452789e-07, + "loss": 0.6006, + "step": 66613 + }, + { + "epoch": 1.71, + "learning_rate": 8.256312557242039e-07, + "loss": 0.4707, + "step": 66614 + }, + { + "epoch": 1.71, + "learning_rate": 8.256040092366344e-07, + "loss": 0.4553, + "step": 66615 + }, + { + "epoch": 1.71, + "learning_rate": 8.255767628825923e-07, + "loss": 0.5859, + "step": 66616 + }, + { + "epoch": 1.71, + "learning_rate": 8.255495166620977e-07, + "loss": 0.8188, + "step": 66617 + }, + { + "epoch": 1.71, + "learning_rate": 8.255222705751721e-07, + "loss": 0.5381, + "step": 66618 + }, + { + "epoch": 1.71, + "learning_rate": 8.254950246218358e-07, + "loss": 0.4536, + "step": 66619 + }, + { + "epoch": 1.71, + "learning_rate": 8.254677788021103e-07, + "loss": 0.5439, + "step": 66620 + }, + { + "epoch": 1.71, + "learning_rate": 8.254405331160159e-07, + "loss": 0.5396, + "step": 66621 + }, + { + "epoch": 1.71, + "learning_rate": 8.254132875635736e-07, + "loss": 0.6279, + "step": 66622 + }, + { + "epoch": 1.71, + "learning_rate": 8.253860421448045e-07, + "loss": 0.6914, + "step": 66623 + }, + { + "epoch": 1.71, + "learning_rate": 8.253587968597294e-07, + "loss": 0.7085, + "step": 66624 + }, + { + "epoch": 1.71, + "learning_rate": 8.253315517083686e-07, + "loss": 0.8008, + "step": 66625 + }, + { + "epoch": 1.71, + "learning_rate": 8.253043066907438e-07, + "loss": 0.7219, + "step": 66626 + }, + { + "epoch": 1.71, + "learning_rate": 8.252770618068751e-07, + "loss": 0.6328, + "step": 66627 + }, + { + "epoch": 1.71, + "learning_rate": 8.25249817056784e-07, + "loss": 0.6553, + "step": 66628 + }, + { + "epoch": 1.71, + "learning_rate": 8.252225724404908e-07, + "loss": 0.6802, + "step": 66629 + }, + { + "epoch": 1.71, + "learning_rate": 8.251953279580169e-07, + "loss": 0.5757, + "step": 66630 + }, + { + "epoch": 1.71, + "learning_rate": 8.251680836093826e-07, + "loss": 0.5845, + "step": 66631 + }, + { + "epoch": 1.71, + "learning_rate": 8.251408393946093e-07, + "loss": 0.6719, + "step": 66632 + }, + { + "epoch": 1.71, + "learning_rate": 8.251135953137175e-07, + "loss": 0.5365, + "step": 66633 + }, + { + "epoch": 1.71, + "learning_rate": 8.250863513667285e-07, + "loss": 0.6514, + "step": 66634 + }, + { + "epoch": 1.71, + "learning_rate": 8.250591075536628e-07, + "loss": 0.6523, + "step": 66635 + }, + { + "epoch": 1.71, + "learning_rate": 8.25031863874541e-07, + "loss": 0.7061, + "step": 66636 + }, + { + "epoch": 1.71, + "learning_rate": 8.250046203293843e-07, + "loss": 0.4697, + "step": 66637 + }, + { + "epoch": 1.71, + "learning_rate": 8.249773769182137e-07, + "loss": 0.6494, + "step": 66638 + }, + { + "epoch": 1.71, + "learning_rate": 8.249501336410496e-07, + "loss": 0.7119, + "step": 66639 + }, + { + "epoch": 1.71, + "learning_rate": 8.249228904979133e-07, + "loss": 0.5352, + "step": 66640 + }, + { + "epoch": 1.71, + "learning_rate": 8.248956474888254e-07, + "loss": 0.7998, + "step": 66641 + }, + { + "epoch": 1.71, + "learning_rate": 8.248684046138071e-07, + "loss": 0.3916, + "step": 66642 + }, + { + "epoch": 1.71, + "learning_rate": 8.248411618728785e-07, + "loss": 0.6357, + "step": 66643 + }, + { + "epoch": 1.71, + "learning_rate": 8.248139192660617e-07, + "loss": 0.71, + "step": 66644 + }, + { + "epoch": 1.71, + "learning_rate": 8.247866767933765e-07, + "loss": 0.5171, + "step": 66645 + }, + { + "epoch": 1.71, + "learning_rate": 8.247594344548438e-07, + "loss": 0.7236, + "step": 66646 + }, + { + "epoch": 1.71, + "learning_rate": 8.24732192250485e-07, + "loss": 0.627, + "step": 66647 + }, + { + "epoch": 1.71, + "learning_rate": 8.247049501803206e-07, + "loss": 0.6299, + "step": 66648 + }, + { + "epoch": 1.71, + "learning_rate": 8.246777082443717e-07, + "loss": 0.6289, + "step": 66649 + }, + { + "epoch": 1.71, + "learning_rate": 8.246504664426588e-07, + "loss": 0.5405, + "step": 66650 + }, + { + "epoch": 1.71, + "learning_rate": 8.246232247752032e-07, + "loss": 0.7432, + "step": 66651 + }, + { + "epoch": 1.71, + "learning_rate": 8.245959832420253e-07, + "loss": 0.7686, + "step": 66652 + }, + { + "epoch": 1.71, + "learning_rate": 8.245687418431464e-07, + "loss": 0.7275, + "step": 66653 + }, + { + "epoch": 1.71, + "learning_rate": 8.245415005785874e-07, + "loss": 0.8096, + "step": 66654 + }, + { + "epoch": 1.71, + "learning_rate": 8.245142594483686e-07, + "loss": 0.6074, + "step": 66655 + }, + { + "epoch": 1.71, + "learning_rate": 8.24487018452511e-07, + "loss": 0.6777, + "step": 66656 + }, + { + "epoch": 1.71, + "learning_rate": 8.244597775910358e-07, + "loss": 0.5847, + "step": 66657 + }, + { + "epoch": 1.71, + "learning_rate": 8.244325368639635e-07, + "loss": 0.71, + "step": 66658 + }, + { + "epoch": 1.71, + "learning_rate": 8.244052962713154e-07, + "loss": 0.7314, + "step": 66659 + }, + { + "epoch": 1.71, + "learning_rate": 8.243780558131118e-07, + "loss": 0.7354, + "step": 66660 + }, + { + "epoch": 1.71, + "learning_rate": 8.243508154893741e-07, + "loss": 0.6992, + "step": 66661 + }, + { + "epoch": 1.71, + "learning_rate": 8.243235753001228e-07, + "loss": 0.7275, + "step": 66662 + }, + { + "epoch": 1.71, + "learning_rate": 8.242963352453789e-07, + "loss": 0.4755, + "step": 66663 + }, + { + "epoch": 1.71, + "learning_rate": 8.242690953251635e-07, + "loss": 0.7808, + "step": 66664 + }, + { + "epoch": 1.71, + "learning_rate": 8.242418555394967e-07, + "loss": 0.7324, + "step": 66665 + }, + { + "epoch": 1.71, + "learning_rate": 8.242146158884e-07, + "loss": 0.6245, + "step": 66666 + }, + { + "epoch": 1.71, + "learning_rate": 8.241873763718941e-07, + "loss": 0.5977, + "step": 66667 + }, + { + "epoch": 1.71, + "learning_rate": 8.241601369899997e-07, + "loss": 0.5747, + "step": 66668 + }, + { + "epoch": 1.71, + "learning_rate": 8.24132897742738e-07, + "loss": 0.5684, + "step": 66669 + }, + { + "epoch": 1.71, + "learning_rate": 8.241056586301296e-07, + "loss": 0.5166, + "step": 66670 + }, + { + "epoch": 1.71, + "learning_rate": 8.240784196521953e-07, + "loss": 0.5947, + "step": 66671 + }, + { + "epoch": 1.71, + "learning_rate": 8.240511808089561e-07, + "loss": 0.5654, + "step": 66672 + }, + { + "epoch": 1.71, + "learning_rate": 8.240239421004328e-07, + "loss": 0.668, + "step": 66673 + }, + { + "epoch": 1.71, + "learning_rate": 8.239967035266468e-07, + "loss": 0.7041, + "step": 66674 + }, + { + "epoch": 1.71, + "learning_rate": 8.239694650876179e-07, + "loss": 0.6797, + "step": 66675 + }, + { + "epoch": 1.71, + "learning_rate": 8.239422267833677e-07, + "loss": 0.6836, + "step": 66676 + }, + { + "epoch": 1.71, + "learning_rate": 8.239149886139165e-07, + "loss": 0.6313, + "step": 66677 + }, + { + "epoch": 1.71, + "learning_rate": 8.238877505792858e-07, + "loss": 0.5322, + "step": 66678 + }, + { + "epoch": 1.71, + "learning_rate": 8.238605126794958e-07, + "loss": 0.6426, + "step": 66679 + }, + { + "epoch": 1.71, + "learning_rate": 8.238332749145681e-07, + "loss": 0.6582, + "step": 66680 + }, + { + "epoch": 1.71, + "learning_rate": 8.23806037284523e-07, + "loss": 0.5493, + "step": 66681 + }, + { + "epoch": 1.71, + "learning_rate": 8.237787997893815e-07, + "loss": 0.5679, + "step": 66682 + }, + { + "epoch": 1.71, + "learning_rate": 8.237515624291644e-07, + "loss": 0.5725, + "step": 66683 + }, + { + "epoch": 1.71, + "learning_rate": 8.23724325203893e-07, + "loss": 0.7227, + "step": 66684 + }, + { + "epoch": 1.71, + "learning_rate": 8.236970881135876e-07, + "loss": 0.7852, + "step": 66685 + }, + { + "epoch": 1.71, + "learning_rate": 8.23669851158269e-07, + "loss": 0.5476, + "step": 66686 + }, + { + "epoch": 1.71, + "learning_rate": 8.236426143379586e-07, + "loss": 0.5879, + "step": 66687 + }, + { + "epoch": 1.71, + "learning_rate": 8.236153776526766e-07, + "loss": 0.5928, + "step": 66688 + }, + { + "epoch": 1.71, + "learning_rate": 8.235881411024444e-07, + "loss": 0.4468, + "step": 66689 + }, + { + "epoch": 1.71, + "learning_rate": 8.235609046872824e-07, + "loss": 0.6772, + "step": 66690 + }, + { + "epoch": 1.71, + "learning_rate": 8.23533668407212e-07, + "loss": 0.603, + "step": 66691 + }, + { + "epoch": 1.71, + "learning_rate": 8.235064322622535e-07, + "loss": 0.6982, + "step": 66692 + }, + { + "epoch": 1.71, + "learning_rate": 8.234791962524284e-07, + "loss": 0.583, + "step": 66693 + }, + { + "epoch": 1.71, + "learning_rate": 8.234519603777573e-07, + "loss": 0.6577, + "step": 66694 + }, + { + "epoch": 1.71, + "learning_rate": 8.234247246382606e-07, + "loss": 0.6323, + "step": 66695 + }, + { + "epoch": 1.71, + "learning_rate": 8.233974890339593e-07, + "loss": 0.6304, + "step": 66696 + }, + { + "epoch": 1.71, + "learning_rate": 8.233702535648745e-07, + "loss": 0.5853, + "step": 66697 + }, + { + "epoch": 1.71, + "learning_rate": 8.233430182310271e-07, + "loss": 0.6348, + "step": 66698 + }, + { + "epoch": 1.71, + "learning_rate": 8.233157830324378e-07, + "loss": 0.6631, + "step": 66699 + }, + { + "epoch": 1.71, + "learning_rate": 8.232885479691273e-07, + "loss": 0.5715, + "step": 66700 + }, + { + "epoch": 1.71, + "learning_rate": 8.232613130411168e-07, + "loss": 0.532, + "step": 66701 + }, + { + "epoch": 1.71, + "learning_rate": 8.232340782484268e-07, + "loss": 0.7266, + "step": 66702 + }, + { + "epoch": 1.71, + "learning_rate": 8.232068435910786e-07, + "loss": 0.71, + "step": 66703 + }, + { + "epoch": 1.71, + "learning_rate": 8.23179609069093e-07, + "loss": 0.707, + "step": 66704 + }, + { + "epoch": 1.71, + "learning_rate": 8.231523746824902e-07, + "loss": 0.6699, + "step": 66705 + }, + { + "epoch": 1.71, + "learning_rate": 8.231251404312916e-07, + "loss": 0.7466, + "step": 66706 + }, + { + "epoch": 1.71, + "learning_rate": 8.230979063155179e-07, + "loss": 0.4719, + "step": 66707 + }, + { + "epoch": 1.71, + "learning_rate": 8.230706723351901e-07, + "loss": 0.5874, + "step": 66708 + }, + { + "epoch": 1.71, + "learning_rate": 8.230434384903289e-07, + "loss": 0.5615, + "step": 66709 + }, + { + "epoch": 1.71, + "learning_rate": 8.230162047809553e-07, + "loss": 0.5078, + "step": 66710 + }, + { + "epoch": 1.71, + "learning_rate": 8.2298897120709e-07, + "loss": 0.666, + "step": 66711 + }, + { + "epoch": 1.71, + "learning_rate": 8.229617377687538e-07, + "loss": 0.4598, + "step": 66712 + }, + { + "epoch": 1.71, + "learning_rate": 8.229345044659678e-07, + "loss": 0.5581, + "step": 66713 + }, + { + "epoch": 1.71, + "learning_rate": 8.22907271298753e-07, + "loss": 0.3634, + "step": 66714 + }, + { + "epoch": 1.71, + "learning_rate": 8.228800382671294e-07, + "loss": 0.707, + "step": 66715 + }, + { + "epoch": 1.71, + "learning_rate": 8.228528053711187e-07, + "loss": 0.71, + "step": 66716 + }, + { + "epoch": 1.71, + "learning_rate": 8.228255726107412e-07, + "loss": 0.6416, + "step": 66717 + }, + { + "epoch": 1.71, + "learning_rate": 8.227983399860183e-07, + "loss": 0.7188, + "step": 66718 + }, + { + "epoch": 1.71, + "learning_rate": 8.227711074969703e-07, + "loss": 0.6123, + "step": 66719 + }, + { + "epoch": 1.71, + "learning_rate": 8.227438751436186e-07, + "loss": 0.5505, + "step": 66720 + }, + { + "epoch": 1.71, + "learning_rate": 8.227166429259835e-07, + "loss": 0.5903, + "step": 66721 + }, + { + "epoch": 1.71, + "learning_rate": 8.226894108440863e-07, + "loss": 0.6113, + "step": 66722 + }, + { + "epoch": 1.71, + "learning_rate": 8.226621788979476e-07, + "loss": 0.4746, + "step": 66723 + }, + { + "epoch": 1.71, + "learning_rate": 8.226349470875885e-07, + "loss": 0.8701, + "step": 66724 + }, + { + "epoch": 1.71, + "learning_rate": 8.226077154130296e-07, + "loss": 0.6455, + "step": 66725 + }, + { + "epoch": 1.71, + "learning_rate": 8.225804838742915e-07, + "loss": 0.7197, + "step": 66726 + }, + { + "epoch": 1.71, + "learning_rate": 8.225532524713958e-07, + "loss": 0.6006, + "step": 66727 + }, + { + "epoch": 1.71, + "learning_rate": 8.225260212043627e-07, + "loss": 0.7148, + "step": 66728 + }, + { + "epoch": 1.71, + "learning_rate": 8.224987900732131e-07, + "loss": 0.5728, + "step": 66729 + }, + { + "epoch": 1.71, + "learning_rate": 8.224715590779682e-07, + "loss": 0.6924, + "step": 66730 + }, + { + "epoch": 1.71, + "learning_rate": 8.224443282186486e-07, + "loss": 0.5381, + "step": 66731 + }, + { + "epoch": 1.71, + "learning_rate": 8.224170974952753e-07, + "loss": 0.6729, + "step": 66732 + }, + { + "epoch": 1.71, + "learning_rate": 8.223898669078688e-07, + "loss": 0.7998, + "step": 66733 + }, + { + "epoch": 1.71, + "learning_rate": 8.223626364564507e-07, + "loss": 0.5562, + "step": 66734 + }, + { + "epoch": 1.71, + "learning_rate": 8.223354061410412e-07, + "loss": 0.499, + "step": 66735 + }, + { + "epoch": 1.71, + "learning_rate": 8.22308175961661e-07, + "loss": 0.7344, + "step": 66736 + }, + { + "epoch": 1.71, + "learning_rate": 8.222809459183316e-07, + "loss": 0.6338, + "step": 66737 + }, + { + "epoch": 1.71, + "learning_rate": 8.222537160110732e-07, + "loss": 0.7178, + "step": 66738 + }, + { + "epoch": 1.71, + "learning_rate": 8.222264862399072e-07, + "loss": 0.6689, + "step": 66739 + }, + { + "epoch": 1.71, + "learning_rate": 8.22199256604854e-07, + "loss": 0.7822, + "step": 66740 + }, + { + "epoch": 1.71, + "learning_rate": 8.221720271059349e-07, + "loss": 0.4966, + "step": 66741 + }, + { + "epoch": 1.71, + "learning_rate": 8.221447977431702e-07, + "loss": 0.4877, + "step": 66742 + }, + { + "epoch": 1.71, + "learning_rate": 8.221175685165813e-07, + "loss": 0.469, + "step": 66743 + }, + { + "epoch": 1.71, + "learning_rate": 8.220903394261891e-07, + "loss": 0.8154, + "step": 66744 + }, + { + "epoch": 1.71, + "learning_rate": 8.220631104720138e-07, + "loss": 0.6616, + "step": 66745 + }, + { + "epoch": 1.71, + "learning_rate": 8.220358816540765e-07, + "loss": 0.6021, + "step": 66746 + }, + { + "epoch": 1.71, + "learning_rate": 8.220086529723982e-07, + "loss": 0.8105, + "step": 66747 + }, + { + "epoch": 1.71, + "learning_rate": 8.219814244269996e-07, + "loss": 0.7095, + "step": 66748 + }, + { + "epoch": 1.71, + "learning_rate": 8.219541960179018e-07, + "loss": 0.6128, + "step": 66749 + }, + { + "epoch": 1.71, + "learning_rate": 8.219269677451253e-07, + "loss": 0.6328, + "step": 66750 + }, + { + "epoch": 1.71, + "learning_rate": 8.218997396086913e-07, + "loss": 0.6592, + "step": 66751 + }, + { + "epoch": 1.71, + "learning_rate": 8.218725116086203e-07, + "loss": 0.5786, + "step": 66752 + }, + { + "epoch": 1.71, + "learning_rate": 8.218452837449337e-07, + "loss": 0.6973, + "step": 66753 + }, + { + "epoch": 1.71, + "learning_rate": 8.218180560176519e-07, + "loss": 0.6904, + "step": 66754 + }, + { + "epoch": 1.71, + "learning_rate": 8.217908284267955e-07, + "loss": 0.4648, + "step": 66755 + }, + { + "epoch": 1.71, + "learning_rate": 8.21763600972386e-07, + "loss": 0.6982, + "step": 66756 + }, + { + "epoch": 1.71, + "learning_rate": 8.217363736544436e-07, + "loss": 0.7109, + "step": 66757 + }, + { + "epoch": 1.71, + "learning_rate": 8.217091464729897e-07, + "loss": 0.7822, + "step": 66758 + }, + { + "epoch": 1.71, + "learning_rate": 8.216819194280447e-07, + "loss": 0.7031, + "step": 66759 + }, + { + "epoch": 1.71, + "learning_rate": 8.216546925196298e-07, + "loss": 0.7383, + "step": 66760 + }, + { + "epoch": 1.71, + "learning_rate": 8.216274657477656e-07, + "loss": 0.5874, + "step": 66761 + }, + { + "epoch": 1.71, + "learning_rate": 8.216002391124731e-07, + "loss": 0.7007, + "step": 66762 + }, + { + "epoch": 1.71, + "learning_rate": 8.21573012613773e-07, + "loss": 0.7129, + "step": 66763 + }, + { + "epoch": 1.71, + "learning_rate": 8.215457862516869e-07, + "loss": 0.5435, + "step": 66764 + }, + { + "epoch": 1.71, + "learning_rate": 8.215185600262343e-07, + "loss": 0.6572, + "step": 66765 + }, + { + "epoch": 1.71, + "learning_rate": 8.21491333937437e-07, + "loss": 0.5276, + "step": 66766 + }, + { + "epoch": 1.71, + "learning_rate": 8.214641079853153e-07, + "loss": 0.5742, + "step": 66767 + }, + { + "epoch": 1.71, + "learning_rate": 8.214368821698905e-07, + "loss": 0.5078, + "step": 66768 + }, + { + "epoch": 1.71, + "learning_rate": 8.214096564911831e-07, + "loss": 0.7695, + "step": 66769 + }, + { + "epoch": 1.71, + "learning_rate": 8.213824309492143e-07, + "loss": 0.4634, + "step": 66770 + }, + { + "epoch": 1.71, + "learning_rate": 8.213552055440046e-07, + "loss": 0.7451, + "step": 66771 + }, + { + "epoch": 1.71, + "learning_rate": 8.213279802755752e-07, + "loss": 0.7412, + "step": 66772 + }, + { + "epoch": 1.71, + "learning_rate": 8.213007551439465e-07, + "loss": 0.6191, + "step": 66773 + }, + { + "epoch": 1.71, + "learning_rate": 8.212735301491401e-07, + "loss": 0.6514, + "step": 66774 + }, + { + "epoch": 1.71, + "learning_rate": 8.212463052911761e-07, + "loss": 0.5518, + "step": 66775 + }, + { + "epoch": 1.71, + "learning_rate": 8.212190805700753e-07, + "loss": 0.6685, + "step": 66776 + }, + { + "epoch": 1.71, + "learning_rate": 8.211918559858592e-07, + "loss": 0.667, + "step": 66777 + }, + { + "epoch": 1.71, + "learning_rate": 8.211646315385479e-07, + "loss": 0.6689, + "step": 66778 + }, + { + "epoch": 1.71, + "learning_rate": 8.21137407228163e-07, + "loss": 0.4761, + "step": 66779 + }, + { + "epoch": 1.71, + "learning_rate": 8.211101830547245e-07, + "loss": 0.5122, + "step": 66780 + }, + { + "epoch": 1.71, + "learning_rate": 8.210829590182541e-07, + "loss": 0.5859, + "step": 66781 + }, + { + "epoch": 1.71, + "learning_rate": 8.21055735118772e-07, + "loss": 0.6602, + "step": 66782 + }, + { + "epoch": 1.71, + "learning_rate": 8.210285113562995e-07, + "loss": 0.5464, + "step": 66783 + }, + { + "epoch": 1.71, + "learning_rate": 8.210012877308574e-07, + "loss": 0.6587, + "step": 66784 + }, + { + "epoch": 1.71, + "learning_rate": 8.209740642424662e-07, + "loss": 0.6777, + "step": 66785 + }, + { + "epoch": 1.71, + "learning_rate": 8.209468408911469e-07, + "loss": 0.594, + "step": 66786 + }, + { + "epoch": 1.71, + "learning_rate": 8.209196176769204e-07, + "loss": 0.6953, + "step": 66787 + }, + { + "epoch": 1.71, + "learning_rate": 8.208923945998073e-07, + "loss": 0.6001, + "step": 66788 + }, + { + "epoch": 1.71, + "learning_rate": 8.20865171659829e-07, + "loss": 0.6504, + "step": 66789 + }, + { + "epoch": 1.71, + "learning_rate": 8.208379488570057e-07, + "loss": 0.5636, + "step": 66790 + }, + { + "epoch": 1.71, + "learning_rate": 8.208107261913586e-07, + "loss": 0.7686, + "step": 66791 + }, + { + "epoch": 1.71, + "learning_rate": 8.207835036629084e-07, + "loss": 0.6118, + "step": 66792 + }, + { + "epoch": 1.71, + "learning_rate": 8.207562812716766e-07, + "loss": 0.645, + "step": 66793 + }, + { + "epoch": 1.71, + "learning_rate": 8.207290590176831e-07, + "loss": 0.5962, + "step": 66794 + }, + { + "epoch": 1.71, + "learning_rate": 8.207018369009488e-07, + "loss": 0.6396, + "step": 66795 + }, + { + "epoch": 1.71, + "learning_rate": 8.206746149214954e-07, + "loss": 0.7129, + "step": 66796 + }, + { + "epoch": 1.71, + "learning_rate": 8.206473930793427e-07, + "loss": 0.6167, + "step": 66797 + }, + { + "epoch": 1.71, + "learning_rate": 8.206201713745125e-07, + "loss": 0.6934, + "step": 66798 + }, + { + "epoch": 1.71, + "learning_rate": 8.205929498070248e-07, + "loss": 0.6001, + "step": 66799 + }, + { + "epoch": 1.71, + "learning_rate": 8.20565728376901e-07, + "loss": 0.5522, + "step": 66800 + }, + { + "epoch": 1.71, + "learning_rate": 8.205385070841619e-07, + "loss": 0.7451, + "step": 66801 + }, + { + "epoch": 1.71, + "learning_rate": 8.205112859288279e-07, + "loss": 0.3633, + "step": 66802 + }, + { + "epoch": 1.71, + "learning_rate": 8.204840649109206e-07, + "loss": 0.6943, + "step": 66803 + }, + { + "epoch": 1.71, + "learning_rate": 8.204568440304602e-07, + "loss": 0.6396, + "step": 66804 + }, + { + "epoch": 1.71, + "learning_rate": 8.204296232874675e-07, + "loss": 0.7578, + "step": 66805 + }, + { + "epoch": 1.71, + "learning_rate": 8.20402402681964e-07, + "loss": 0.7041, + "step": 66806 + }, + { + "epoch": 1.71, + "learning_rate": 8.203751822139696e-07, + "loss": 0.6597, + "step": 66807 + }, + { + "epoch": 1.71, + "learning_rate": 8.203479618835061e-07, + "loss": 0.792, + "step": 66808 + }, + { + "epoch": 1.71, + "learning_rate": 8.203207416905935e-07, + "loss": 0.6479, + "step": 66809 + }, + { + "epoch": 1.71, + "learning_rate": 8.202935216352534e-07, + "loss": 0.5869, + "step": 66810 + }, + { + "epoch": 1.71, + "learning_rate": 8.202663017175061e-07, + "loss": 0.5635, + "step": 66811 + }, + { + "epoch": 1.71, + "learning_rate": 8.202390819373728e-07, + "loss": 0.5381, + "step": 66812 + }, + { + "epoch": 1.71, + "learning_rate": 8.202118622948743e-07, + "loss": 0.6992, + "step": 66813 + }, + { + "epoch": 1.71, + "learning_rate": 8.20184642790031e-07, + "loss": 0.8086, + "step": 66814 + }, + { + "epoch": 1.71, + "learning_rate": 8.201574234228642e-07, + "loss": 0.6567, + "step": 66815 + }, + { + "epoch": 1.71, + "learning_rate": 8.201302041933944e-07, + "loss": 0.7764, + "step": 66816 + }, + { + "epoch": 1.71, + "learning_rate": 8.201029851016428e-07, + "loss": 0.4706, + "step": 66817 + }, + { + "epoch": 1.71, + "learning_rate": 8.200757661476302e-07, + "loss": 0.6421, + "step": 66818 + }, + { + "epoch": 1.71, + "learning_rate": 8.20048547331377e-07, + "loss": 0.5469, + "step": 66819 + }, + { + "epoch": 1.71, + "learning_rate": 8.200213286529045e-07, + "loss": 0.792, + "step": 66820 + }, + { + "epoch": 1.71, + "learning_rate": 8.199941101122332e-07, + "loss": 0.5647, + "step": 66821 + }, + { + "epoch": 1.71, + "learning_rate": 8.199668917093845e-07, + "loss": 0.6602, + "step": 66822 + }, + { + "epoch": 1.71, + "learning_rate": 8.19939673444379e-07, + "loss": 0.542, + "step": 66823 + }, + { + "epoch": 1.71, + "learning_rate": 8.19912455317237e-07, + "loss": 0.7876, + "step": 66824 + }, + { + "epoch": 1.71, + "learning_rate": 8.198852373279798e-07, + "loss": 0.6055, + "step": 66825 + }, + { + "epoch": 1.71, + "learning_rate": 8.198580194766282e-07, + "loss": 0.6382, + "step": 66826 + }, + { + "epoch": 1.71, + "learning_rate": 8.198308017632032e-07, + "loss": 0.6216, + "step": 66827 + }, + { + "epoch": 1.71, + "learning_rate": 8.198035841877252e-07, + "loss": 0.749, + "step": 66828 + }, + { + "epoch": 1.71, + "learning_rate": 8.197763667502156e-07, + "loss": 0.4946, + "step": 66829 + }, + { + "epoch": 1.71, + "learning_rate": 8.197491494506946e-07, + "loss": 0.7461, + "step": 66830 + }, + { + "epoch": 1.71, + "learning_rate": 8.197219322891837e-07, + "loss": 0.8701, + "step": 66831 + }, + { + "epoch": 1.71, + "learning_rate": 8.196947152657032e-07, + "loss": 0.7314, + "step": 66832 + }, + { + "epoch": 1.71, + "learning_rate": 8.196674983802746e-07, + "loss": 0.6895, + "step": 66833 + }, + { + "epoch": 1.71, + "learning_rate": 8.196402816329181e-07, + "loss": 0.6357, + "step": 66834 + }, + { + "epoch": 1.71, + "learning_rate": 8.196130650236547e-07, + "loss": 0.4448, + "step": 66835 + }, + { + "epoch": 1.71, + "learning_rate": 8.195858485525052e-07, + "loss": 0.7188, + "step": 66836 + }, + { + "epoch": 1.71, + "learning_rate": 8.195586322194905e-07, + "loss": 0.6436, + "step": 66837 + }, + { + "epoch": 1.71, + "learning_rate": 8.195314160246314e-07, + "loss": 0.6362, + "step": 66838 + }, + { + "epoch": 1.71, + "learning_rate": 8.19504199967949e-07, + "loss": 0.6875, + "step": 66839 + }, + { + "epoch": 1.71, + "learning_rate": 8.194769840494636e-07, + "loss": 0.5757, + "step": 66840 + }, + { + "epoch": 1.71, + "learning_rate": 8.194497682691968e-07, + "loss": 0.6255, + "step": 66841 + }, + { + "epoch": 1.71, + "learning_rate": 8.194225526271686e-07, + "loss": 0.6172, + "step": 66842 + }, + { + "epoch": 1.71, + "learning_rate": 8.193953371234008e-07, + "loss": 0.8545, + "step": 66843 + }, + { + "epoch": 1.71, + "learning_rate": 8.193681217579134e-07, + "loss": 0.7012, + "step": 66844 + }, + { + "epoch": 1.71, + "learning_rate": 8.193409065307273e-07, + "loss": 0.6621, + "step": 66845 + }, + { + "epoch": 1.71, + "learning_rate": 8.193136914418639e-07, + "loss": 0.6309, + "step": 66846 + }, + { + "epoch": 1.71, + "learning_rate": 8.192864764913434e-07, + "loss": 0.6179, + "step": 66847 + }, + { + "epoch": 1.71, + "learning_rate": 8.192592616791871e-07, + "loss": 0.6113, + "step": 66848 + }, + { + "epoch": 1.71, + "learning_rate": 8.192320470054155e-07, + "loss": 0.6509, + "step": 66849 + }, + { + "epoch": 1.71, + "learning_rate": 8.192048324700499e-07, + "loss": 0.5776, + "step": 66850 + }, + { + "epoch": 1.71, + "learning_rate": 8.191776180731104e-07, + "loss": 0.6123, + "step": 66851 + }, + { + "epoch": 1.71, + "learning_rate": 8.191504038146188e-07, + "loss": 0.71, + "step": 66852 + }, + { + "epoch": 1.71, + "learning_rate": 8.191231896945955e-07, + "loss": 0.7549, + "step": 66853 + }, + { + "epoch": 1.71, + "learning_rate": 8.19095975713061e-07, + "loss": 0.7451, + "step": 66854 + }, + { + "epoch": 1.71, + "learning_rate": 8.190687618700362e-07, + "loss": 0.6846, + "step": 66855 + }, + { + "epoch": 1.71, + "learning_rate": 8.190415481655424e-07, + "loss": 0.6606, + "step": 66856 + }, + { + "epoch": 1.71, + "learning_rate": 8.190143345995999e-07, + "loss": 0.5161, + "step": 66857 + }, + { + "epoch": 1.71, + "learning_rate": 8.189871211722301e-07, + "loss": 0.7041, + "step": 66858 + }, + { + "epoch": 1.71, + "learning_rate": 8.189599078834533e-07, + "loss": 0.7686, + "step": 66859 + }, + { + "epoch": 1.71, + "learning_rate": 8.189326947332906e-07, + "loss": 0.6655, + "step": 66860 + }, + { + "epoch": 1.71, + "learning_rate": 8.189054817217628e-07, + "loss": 0.5386, + "step": 66861 + }, + { + "epoch": 1.71, + "learning_rate": 8.188782688488909e-07, + "loss": 0.6777, + "step": 66862 + }, + { + "epoch": 1.71, + "learning_rate": 8.188510561146957e-07, + "loss": 0.5889, + "step": 66863 + }, + { + "epoch": 1.71, + "learning_rate": 8.188238435191976e-07, + "loss": 0.7036, + "step": 66864 + }, + { + "epoch": 1.71, + "learning_rate": 8.18796631062418e-07, + "loss": 0.5801, + "step": 66865 + }, + { + "epoch": 1.71, + "learning_rate": 8.187694187443772e-07, + "loss": 0.6865, + "step": 66866 + }, + { + "epoch": 1.71, + "learning_rate": 8.187422065650966e-07, + "loss": 0.75, + "step": 66867 + }, + { + "epoch": 1.71, + "learning_rate": 8.187149945245965e-07, + "loss": 0.6636, + "step": 66868 + }, + { + "epoch": 1.71, + "learning_rate": 8.186877826228982e-07, + "loss": 0.6953, + "step": 66869 + }, + { + "epoch": 1.71, + "learning_rate": 8.186605708600221e-07, + "loss": 0.6709, + "step": 66870 + }, + { + "epoch": 1.71, + "learning_rate": 8.186333592359895e-07, + "loss": 0.5591, + "step": 66871 + }, + { + "epoch": 1.71, + "learning_rate": 8.186061477508209e-07, + "loss": 0.6816, + "step": 66872 + }, + { + "epoch": 1.71, + "learning_rate": 8.185789364045377e-07, + "loss": 0.7373, + "step": 66873 + }, + { + "epoch": 1.71, + "learning_rate": 8.185517251971596e-07, + "loss": 0.52, + "step": 66874 + }, + { + "epoch": 1.71, + "learning_rate": 8.185245141287085e-07, + "loss": 0.6875, + "step": 66875 + }, + { + "epoch": 1.71, + "learning_rate": 8.184973031992044e-07, + "loss": 0.7871, + "step": 66876 + }, + { + "epoch": 1.71, + "learning_rate": 8.18470092408669e-07, + "loss": 0.6108, + "step": 66877 + }, + { + "epoch": 1.71, + "learning_rate": 8.184428817571223e-07, + "loss": 0.7012, + "step": 66878 + }, + { + "epoch": 1.71, + "learning_rate": 8.184156712445859e-07, + "loss": 0.6851, + "step": 66879 + }, + { + "epoch": 1.71, + "learning_rate": 8.1838846087108e-07, + "loss": 0.6426, + "step": 66880 + }, + { + "epoch": 1.71, + "learning_rate": 8.183612506366258e-07, + "loss": 0.709, + "step": 66881 + }, + { + "epoch": 1.71, + "learning_rate": 8.18334040541244e-07, + "loss": 0.7803, + "step": 66882 + }, + { + "epoch": 1.71, + "learning_rate": 8.183068305849558e-07, + "loss": 0.6021, + "step": 66883 + }, + { + "epoch": 1.71, + "learning_rate": 8.182796207677815e-07, + "loss": 0.7754, + "step": 66884 + }, + { + "epoch": 1.71, + "learning_rate": 8.182524110897421e-07, + "loss": 0.7734, + "step": 66885 + }, + { + "epoch": 1.71, + "learning_rate": 8.182252015508585e-07, + "loss": 0.7158, + "step": 66886 + }, + { + "epoch": 1.71, + "learning_rate": 8.181979921511514e-07, + "loss": 0.6064, + "step": 66887 + }, + { + "epoch": 1.71, + "learning_rate": 8.181707828906419e-07, + "loss": 0.6279, + "step": 66888 + }, + { + "epoch": 1.71, + "learning_rate": 8.181435737693504e-07, + "loss": 0.7734, + "step": 66889 + }, + { + "epoch": 1.71, + "learning_rate": 8.181163647872982e-07, + "loss": 0.5959, + "step": 66890 + }, + { + "epoch": 1.71, + "learning_rate": 8.18089155944506e-07, + "loss": 0.6538, + "step": 66891 + }, + { + "epoch": 1.71, + "learning_rate": 8.180619472409944e-07, + "loss": 0.7266, + "step": 66892 + }, + { + "epoch": 1.71, + "learning_rate": 8.180347386767848e-07, + "loss": 0.5791, + "step": 66893 + }, + { + "epoch": 1.71, + "learning_rate": 8.180075302518974e-07, + "loss": 0.6318, + "step": 66894 + }, + { + "epoch": 1.71, + "learning_rate": 8.17980321966353e-07, + "loss": 0.4624, + "step": 66895 + }, + { + "epoch": 1.71, + "learning_rate": 8.17953113820173e-07, + "loss": 0.7148, + "step": 66896 + }, + { + "epoch": 1.71, + "learning_rate": 8.179259058133776e-07, + "loss": 0.7002, + "step": 66897 + }, + { + "epoch": 1.71, + "learning_rate": 8.178986979459883e-07, + "loss": 0.6514, + "step": 66898 + }, + { + "epoch": 1.71, + "learning_rate": 8.178714902180254e-07, + "loss": 0.8896, + "step": 66899 + }, + { + "epoch": 1.71, + "learning_rate": 8.1784428262951e-07, + "loss": 0.7251, + "step": 66900 + }, + { + "epoch": 1.71, + "learning_rate": 8.178170751804627e-07, + "loss": 0.48, + "step": 66901 + }, + { + "epoch": 1.71, + "learning_rate": 8.177898678709048e-07, + "loss": 0.7285, + "step": 66902 + }, + { + "epoch": 1.71, + "learning_rate": 8.17762660700857e-07, + "loss": 0.5581, + "step": 66903 + }, + { + "epoch": 1.71, + "learning_rate": 8.177354536703393e-07, + "loss": 0.71, + "step": 66904 + }, + { + "epoch": 1.71, + "learning_rate": 8.177082467793736e-07, + "loss": 0.6519, + "step": 66905 + }, + { + "epoch": 1.71, + "learning_rate": 8.176810400279801e-07, + "loss": 0.5188, + "step": 66906 + }, + { + "epoch": 1.71, + "learning_rate": 8.176538334161801e-07, + "loss": 0.6338, + "step": 66907 + }, + { + "epoch": 1.71, + "learning_rate": 8.176266269439941e-07, + "loss": 0.5786, + "step": 66908 + }, + { + "epoch": 1.71, + "learning_rate": 8.175994206114428e-07, + "loss": 0.7295, + "step": 66909 + }, + { + "epoch": 1.71, + "learning_rate": 8.175722144185475e-07, + "loss": 0.7656, + "step": 66910 + }, + { + "epoch": 1.71, + "learning_rate": 8.175450083653285e-07, + "loss": 0.582, + "step": 66911 + }, + { + "epoch": 1.71, + "learning_rate": 8.175178024518071e-07, + "loss": 0.7256, + "step": 66912 + }, + { + "epoch": 1.72, + "learning_rate": 8.174905966780041e-07, + "loss": 0.4478, + "step": 66913 + }, + { + "epoch": 1.72, + "learning_rate": 8.174633910439398e-07, + "loss": 0.7725, + "step": 66914 + }, + { + "epoch": 1.72, + "learning_rate": 8.174361855496356e-07, + "loss": 0.7607, + "step": 66915 + }, + { + "epoch": 1.72, + "learning_rate": 8.174089801951119e-07, + "loss": 0.8369, + "step": 66916 + }, + { + "epoch": 1.72, + "learning_rate": 8.1738177498039e-07, + "loss": 0.7158, + "step": 66917 + }, + { + "epoch": 1.72, + "learning_rate": 8.173545699054902e-07, + "loss": 0.5967, + "step": 66918 + }, + { + "epoch": 1.72, + "learning_rate": 8.173273649704337e-07, + "loss": 0.5933, + "step": 66919 + }, + { + "epoch": 1.72, + "learning_rate": 8.173001601752413e-07, + "loss": 0.4891, + "step": 66920 + }, + { + "epoch": 1.72, + "learning_rate": 8.172729555199338e-07, + "loss": 0.564, + "step": 66921 + }, + { + "epoch": 1.72, + "learning_rate": 8.172457510045319e-07, + "loss": 0.6831, + "step": 66922 + }, + { + "epoch": 1.72, + "learning_rate": 8.172185466290569e-07, + "loss": 0.5967, + "step": 66923 + }, + { + "epoch": 1.72, + "learning_rate": 8.171913423935289e-07, + "loss": 0.6447, + "step": 66924 + }, + { + "epoch": 1.72, + "learning_rate": 8.171641382979691e-07, + "loss": 0.626, + "step": 66925 + }, + { + "epoch": 1.72, + "learning_rate": 8.171369343423984e-07, + "loss": 0.6074, + "step": 66926 + }, + { + "epoch": 1.72, + "learning_rate": 8.171097305268375e-07, + "loss": 0.6084, + "step": 66927 + }, + { + "epoch": 1.72, + "learning_rate": 8.170825268513071e-07, + "loss": 0.7871, + "step": 66928 + }, + { + "epoch": 1.72, + "learning_rate": 8.170553233158285e-07, + "loss": 0.5977, + "step": 66929 + }, + { + "epoch": 1.72, + "learning_rate": 8.170281199204219e-07, + "loss": 0.5239, + "step": 66930 + }, + { + "epoch": 1.72, + "learning_rate": 8.170009166651087e-07, + "loss": 0.6362, + "step": 66931 + }, + { + "epoch": 1.72, + "learning_rate": 8.169737135499093e-07, + "loss": 0.6279, + "step": 66932 + }, + { + "epoch": 1.72, + "learning_rate": 8.169465105748451e-07, + "loss": 0.7061, + "step": 66933 + }, + { + "epoch": 1.72, + "learning_rate": 8.169193077399363e-07, + "loss": 0.6748, + "step": 66934 + }, + { + "epoch": 1.72, + "learning_rate": 8.168921050452037e-07, + "loss": 0.71, + "step": 66935 + }, + { + "epoch": 1.72, + "learning_rate": 8.168649024906688e-07, + "loss": 0.7656, + "step": 66936 + }, + { + "epoch": 1.72, + "learning_rate": 8.168377000763518e-07, + "loss": 0.7495, + "step": 66937 + }, + { + "epoch": 1.72, + "learning_rate": 8.168104978022738e-07, + "loss": 0.415, + "step": 66938 + }, + { + "epoch": 1.72, + "learning_rate": 8.167832956684555e-07, + "loss": 0.7344, + "step": 66939 + }, + { + "epoch": 1.72, + "learning_rate": 8.167560936749179e-07, + "loss": 0.4961, + "step": 66940 + }, + { + "epoch": 1.72, + "learning_rate": 8.167288918216816e-07, + "loss": 0.8472, + "step": 66941 + }, + { + "epoch": 1.72, + "learning_rate": 8.167016901087678e-07, + "loss": 0.7002, + "step": 66942 + }, + { + "epoch": 1.72, + "learning_rate": 8.166744885361972e-07, + "loss": 0.5854, + "step": 66943 + }, + { + "epoch": 1.72, + "learning_rate": 8.166472871039904e-07, + "loss": 0.7461, + "step": 66944 + }, + { + "epoch": 1.72, + "learning_rate": 8.166200858121681e-07, + "loss": 0.7402, + "step": 66945 + }, + { + "epoch": 1.72, + "learning_rate": 8.165928846607516e-07, + "loss": 0.6187, + "step": 66946 + }, + { + "epoch": 1.72, + "learning_rate": 8.165656836497612e-07, + "loss": 0.6641, + "step": 66947 + }, + { + "epoch": 1.72, + "learning_rate": 8.165384827792183e-07, + "loss": 0.6436, + "step": 66948 + }, + { + "epoch": 1.72, + "learning_rate": 8.165112820491433e-07, + "loss": 0.623, + "step": 66949 + }, + { + "epoch": 1.72, + "learning_rate": 8.164840814595573e-07, + "loss": 0.5371, + "step": 66950 + }, + { + "epoch": 1.72, + "learning_rate": 8.164568810104807e-07, + "loss": 0.5464, + "step": 66951 + }, + { + "epoch": 1.72, + "learning_rate": 8.16429680701935e-07, + "loss": 0.4688, + "step": 66952 + }, + { + "epoch": 1.72, + "learning_rate": 8.164024805339408e-07, + "loss": 0.7891, + "step": 66953 + }, + { + "epoch": 1.72, + "learning_rate": 8.163752805065182e-07, + "loss": 0.5732, + "step": 66954 + }, + { + "epoch": 1.72, + "learning_rate": 8.16348080619689e-07, + "loss": 0.3974, + "step": 66955 + }, + { + "epoch": 1.72, + "learning_rate": 8.163208808734735e-07, + "loss": 0.8438, + "step": 66956 + }, + { + "epoch": 1.72, + "learning_rate": 8.162936812678928e-07, + "loss": 0.7188, + "step": 66957 + }, + { + "epoch": 1.72, + "learning_rate": 8.162664818029673e-07, + "loss": 0.533, + "step": 66958 + }, + { + "epoch": 1.72, + "learning_rate": 8.162392824787184e-07, + "loss": 0.5977, + "step": 66959 + }, + { + "epoch": 1.72, + "learning_rate": 8.162120832951662e-07, + "loss": 0.7969, + "step": 66960 + }, + { + "epoch": 1.72, + "learning_rate": 8.161848842523324e-07, + "loss": 0.6685, + "step": 66961 + }, + { + "epoch": 1.72, + "learning_rate": 8.16157685350237e-07, + "loss": 0.7227, + "step": 66962 + }, + { + "epoch": 1.72, + "learning_rate": 8.16130486588902e-07, + "loss": 0.6982, + "step": 66963 + }, + { + "epoch": 1.72, + "learning_rate": 8.161032879683468e-07, + "loss": 0.6885, + "step": 66964 + }, + { + "epoch": 1.72, + "learning_rate": 8.16076089488593e-07, + "loss": 0.48, + "step": 66965 + }, + { + "epoch": 1.72, + "learning_rate": 8.160488911496611e-07, + "loss": 0.6953, + "step": 66966 + }, + { + "epoch": 1.72, + "learning_rate": 8.160216929515723e-07, + "loss": 0.6963, + "step": 66967 + }, + { + "epoch": 1.72, + "learning_rate": 8.15994494894347e-07, + "loss": 0.4879, + "step": 66968 + }, + { + "epoch": 1.72, + "learning_rate": 8.159672969780065e-07, + "loss": 0.7334, + "step": 66969 + }, + { + "epoch": 1.72, + "learning_rate": 8.159400992025711e-07, + "loss": 0.8311, + "step": 66970 + }, + { + "epoch": 1.72, + "learning_rate": 8.159129015680622e-07, + "loss": 0.6057, + "step": 66971 + }, + { + "epoch": 1.72, + "learning_rate": 8.158857040745001e-07, + "loss": 0.3887, + "step": 66972 + }, + { + "epoch": 1.72, + "learning_rate": 8.158585067219063e-07, + "loss": 0.7178, + "step": 66973 + }, + { + "epoch": 1.72, + "learning_rate": 8.158313095103009e-07, + "loss": 0.7305, + "step": 66974 + }, + { + "epoch": 1.72, + "learning_rate": 8.158041124397048e-07, + "loss": 0.4568, + "step": 66975 + }, + { + "epoch": 1.72, + "learning_rate": 8.157769155101392e-07, + "loss": 0.7168, + "step": 66976 + }, + { + "epoch": 1.72, + "learning_rate": 8.157497187216245e-07, + "loss": 0.5933, + "step": 66977 + }, + { + "epoch": 1.72, + "learning_rate": 8.157225220741821e-07, + "loss": 0.6592, + "step": 66978 + }, + { + "epoch": 1.72, + "learning_rate": 8.156953255678323e-07, + "loss": 0.7012, + "step": 66979 + }, + { + "epoch": 1.72, + "learning_rate": 8.156681292025962e-07, + "loss": 0.7656, + "step": 66980 + }, + { + "epoch": 1.72, + "learning_rate": 8.156409329784946e-07, + "loss": 0.6743, + "step": 66981 + }, + { + "epoch": 1.72, + "learning_rate": 8.156137368955481e-07, + "loss": 0.6055, + "step": 66982 + }, + { + "epoch": 1.72, + "learning_rate": 8.15586540953778e-07, + "loss": 0.7324, + "step": 66983 + }, + { + "epoch": 1.72, + "learning_rate": 8.155593451532046e-07, + "loss": 0.6289, + "step": 66984 + }, + { + "epoch": 1.72, + "learning_rate": 8.155321494938488e-07, + "loss": 0.6885, + "step": 66985 + }, + { + "epoch": 1.72, + "learning_rate": 8.155049539757317e-07, + "loss": 0.6558, + "step": 66986 + }, + { + "epoch": 1.72, + "learning_rate": 8.154777585988737e-07, + "loss": 0.6963, + "step": 66987 + }, + { + "epoch": 1.72, + "learning_rate": 8.154505633632963e-07, + "loss": 0.5708, + "step": 66988 + }, + { + "epoch": 1.72, + "learning_rate": 8.154233682690196e-07, + "loss": 0.6284, + "step": 66989 + }, + { + "epoch": 1.72, + "learning_rate": 8.15396173316065e-07, + "loss": 0.4614, + "step": 66990 + }, + { + "epoch": 1.72, + "learning_rate": 8.153689785044528e-07, + "loss": 0.6768, + "step": 66991 + }, + { + "epoch": 1.72, + "learning_rate": 8.153417838342043e-07, + "loss": 0.7744, + "step": 66992 + }, + { + "epoch": 1.72, + "learning_rate": 8.153145893053403e-07, + "loss": 0.6621, + "step": 66993 + }, + { + "epoch": 1.72, + "learning_rate": 8.15287394917881e-07, + "loss": 0.5576, + "step": 66994 + }, + { + "epoch": 1.72, + "learning_rate": 8.152602006718479e-07, + "loss": 0.6406, + "step": 66995 + }, + { + "epoch": 1.72, + "learning_rate": 8.152330065672613e-07, + "loss": 0.6592, + "step": 66996 + }, + { + "epoch": 1.72, + "learning_rate": 8.152058126041426e-07, + "loss": 0.6162, + "step": 66997 + }, + { + "epoch": 1.72, + "learning_rate": 8.151786187825121e-07, + "loss": 0.5449, + "step": 66998 + }, + { + "epoch": 1.72, + "learning_rate": 8.151514251023908e-07, + "loss": 0.627, + "step": 66999 + }, + { + "epoch": 1.72, + "learning_rate": 8.151242315637998e-07, + "loss": 0.5801, + "step": 67000 + }, + { + "epoch": 1.72, + "learning_rate": 8.150970381667595e-07, + "loss": 0.6587, + "step": 67001 + }, + { + "epoch": 1.72, + "learning_rate": 8.150698449112909e-07, + "loss": 0.6768, + "step": 67002 + }, + { + "epoch": 1.72, + "learning_rate": 8.150426517974152e-07, + "loss": 0.6714, + "step": 67003 + }, + { + "epoch": 1.72, + "learning_rate": 8.150154588251523e-07, + "loss": 0.7109, + "step": 67004 + }, + { + "epoch": 1.72, + "learning_rate": 8.149882659945238e-07, + "loss": 0.4888, + "step": 67005 + }, + { + "epoch": 1.72, + "learning_rate": 8.1496107330555e-07, + "loss": 0.6089, + "step": 67006 + }, + { + "epoch": 1.72, + "learning_rate": 8.149338807582525e-07, + "loss": 0.5518, + "step": 67007 + }, + { + "epoch": 1.72, + "learning_rate": 8.149066883526511e-07, + "loss": 0.6416, + "step": 67008 + }, + { + "epoch": 1.72, + "learning_rate": 8.148794960887675e-07, + "loss": 0.7129, + "step": 67009 + }, + { + "epoch": 1.72, + "learning_rate": 8.148523039666218e-07, + "loss": 0.7559, + "step": 67010 + }, + { + "epoch": 1.72, + "learning_rate": 8.148251119862355e-07, + "loss": 0.6641, + "step": 67011 + }, + { + "epoch": 1.72, + "learning_rate": 8.147979201476289e-07, + "loss": 0.5396, + "step": 67012 + }, + { + "epoch": 1.72, + "learning_rate": 8.147707284508234e-07, + "loss": 0.6597, + "step": 67013 + }, + { + "epoch": 1.72, + "learning_rate": 8.147435368958392e-07, + "loss": 0.7441, + "step": 67014 + }, + { + "epoch": 1.72, + "learning_rate": 8.147163454826972e-07, + "loss": 0.6611, + "step": 67015 + }, + { + "epoch": 1.72, + "learning_rate": 8.146891542114186e-07, + "loss": 0.4202, + "step": 67016 + }, + { + "epoch": 1.72, + "learning_rate": 8.146619630820239e-07, + "loss": 0.6299, + "step": 67017 + }, + { + "epoch": 1.72, + "learning_rate": 8.146347720945339e-07, + "loss": 0.7334, + "step": 67018 + }, + { + "epoch": 1.72, + "learning_rate": 8.146075812489696e-07, + "loss": 0.7734, + "step": 67019 + }, + { + "epoch": 1.72, + "learning_rate": 8.145803905453518e-07, + "loss": 0.7227, + "step": 67020 + }, + { + "epoch": 1.72, + "learning_rate": 8.145531999837012e-07, + "loss": 0.708, + "step": 67021 + }, + { + "epoch": 1.72, + "learning_rate": 8.145260095640387e-07, + "loss": 0.4767, + "step": 67022 + }, + { + "epoch": 1.72, + "learning_rate": 8.144988192863854e-07, + "loss": 0.5752, + "step": 67023 + }, + { + "epoch": 1.72, + "learning_rate": 8.144716291507616e-07, + "loss": 0.5938, + "step": 67024 + }, + { + "epoch": 1.72, + "learning_rate": 8.144444391571882e-07, + "loss": 0.6321, + "step": 67025 + }, + { + "epoch": 1.72, + "learning_rate": 8.144172493056863e-07, + "loss": 0.6758, + "step": 67026 + }, + { + "epoch": 1.72, + "learning_rate": 8.143900595962765e-07, + "loss": 0.5029, + "step": 67027 + }, + { + "epoch": 1.72, + "learning_rate": 8.143628700289797e-07, + "loss": 0.5747, + "step": 67028 + }, + { + "epoch": 1.72, + "learning_rate": 8.143356806038167e-07, + "loss": 0.5928, + "step": 67029 + }, + { + "epoch": 1.72, + "learning_rate": 8.143084913208085e-07, + "loss": 0.6167, + "step": 67030 + }, + { + "epoch": 1.72, + "learning_rate": 8.142813021799755e-07, + "loss": 0.6592, + "step": 67031 + }, + { + "epoch": 1.72, + "learning_rate": 8.142541131813389e-07, + "loss": 0.7324, + "step": 67032 + }, + { + "epoch": 1.72, + "learning_rate": 8.142269243249198e-07, + "loss": 0.6929, + "step": 67033 + }, + { + "epoch": 1.72, + "learning_rate": 8.141997356107381e-07, + "loss": 0.6494, + "step": 67034 + }, + { + "epoch": 1.72, + "learning_rate": 8.141725470388152e-07, + "loss": 0.572, + "step": 67035 + }, + { + "epoch": 1.72, + "learning_rate": 8.141453586091719e-07, + "loss": 0.6003, + "step": 67036 + }, + { + "epoch": 1.72, + "learning_rate": 8.141181703218287e-07, + "loss": 0.6431, + "step": 67037 + }, + { + "epoch": 1.72, + "learning_rate": 8.140909821768071e-07, + "loss": 0.6323, + "step": 67038 + }, + { + "epoch": 1.72, + "learning_rate": 8.14063794174127e-07, + "loss": 0.668, + "step": 67039 + }, + { + "epoch": 1.72, + "learning_rate": 8.140366063138101e-07, + "loss": 0.4912, + "step": 67040 + }, + { + "epoch": 1.72, + "learning_rate": 8.140094185958766e-07, + "loss": 0.585, + "step": 67041 + }, + { + "epoch": 1.72, + "learning_rate": 8.139822310203477e-07, + "loss": 0.7305, + "step": 67042 + }, + { + "epoch": 1.72, + "learning_rate": 8.139550435872442e-07, + "loss": 0.6367, + "step": 67043 + }, + { + "epoch": 1.72, + "learning_rate": 8.139278562965865e-07, + "loss": 0.6094, + "step": 67044 + }, + { + "epoch": 1.72, + "learning_rate": 8.139006691483958e-07, + "loss": 0.5125, + "step": 67045 + }, + { + "epoch": 1.72, + "learning_rate": 8.138734821426924e-07, + "loss": 0.5737, + "step": 67046 + }, + { + "epoch": 1.72, + "learning_rate": 8.13846295279498e-07, + "loss": 0.4315, + "step": 67047 + }, + { + "epoch": 1.72, + "learning_rate": 8.138191085588326e-07, + "loss": 0.7988, + "step": 67048 + }, + { + "epoch": 1.72, + "learning_rate": 8.137919219807177e-07, + "loss": 0.5742, + "step": 67049 + }, + { + "epoch": 1.72, + "learning_rate": 8.137647355451733e-07, + "loss": 0.6196, + "step": 67050 + }, + { + "epoch": 1.72, + "learning_rate": 8.137375492522212e-07, + "loss": 0.561, + "step": 67051 + }, + { + "epoch": 1.72, + "learning_rate": 8.137103631018813e-07, + "loss": 0.7603, + "step": 67052 + }, + { + "epoch": 1.72, + "learning_rate": 8.136831770941755e-07, + "loss": 0.7041, + "step": 67053 + }, + { + "epoch": 1.72, + "learning_rate": 8.136559912291232e-07, + "loss": 0.5718, + "step": 67054 + }, + { + "epoch": 1.72, + "learning_rate": 8.136288055067462e-07, + "loss": 0.3956, + "step": 67055 + }, + { + "epoch": 1.72, + "learning_rate": 8.136016199270647e-07, + "loss": 0.7715, + "step": 67056 + }, + { + "epoch": 1.72, + "learning_rate": 8.135744344901003e-07, + "loss": 0.5977, + "step": 67057 + }, + { + "epoch": 1.72, + "learning_rate": 8.135472491958732e-07, + "loss": 0.6689, + "step": 67058 + }, + { + "epoch": 1.72, + "learning_rate": 8.135200640444044e-07, + "loss": 0.6777, + "step": 67059 + }, + { + "epoch": 1.72, + "learning_rate": 8.134928790357147e-07, + "loss": 0.6465, + "step": 67060 + }, + { + "epoch": 1.72, + "learning_rate": 8.13465694169825e-07, + "loss": 0.6089, + "step": 67061 + }, + { + "epoch": 1.72, + "learning_rate": 8.134385094467559e-07, + "loss": 0.5898, + "step": 67062 + }, + { + "epoch": 1.72, + "learning_rate": 8.134113248665287e-07, + "loss": 0.605, + "step": 67063 + }, + { + "epoch": 1.72, + "learning_rate": 8.133841404291638e-07, + "loss": 0.5358, + "step": 67064 + }, + { + "epoch": 1.72, + "learning_rate": 8.133569561346818e-07, + "loss": 0.7559, + "step": 67065 + }, + { + "epoch": 1.72, + "learning_rate": 8.13329771983104e-07, + "loss": 0.6797, + "step": 67066 + }, + { + "epoch": 1.72, + "learning_rate": 8.133025879744507e-07, + "loss": 0.8164, + "step": 67067 + }, + { + "epoch": 1.72, + "learning_rate": 8.132754041087434e-07, + "loss": 0.7295, + "step": 67068 + }, + { + "epoch": 1.72, + "learning_rate": 8.132482203860022e-07, + "loss": 0.6143, + "step": 67069 + }, + { + "epoch": 1.72, + "learning_rate": 8.132210368062485e-07, + "loss": 0.6729, + "step": 67070 + }, + { + "epoch": 1.72, + "learning_rate": 8.131938533695029e-07, + "loss": 0.8203, + "step": 67071 + }, + { + "epoch": 1.72, + "learning_rate": 8.13166670075786e-07, + "loss": 0.5679, + "step": 67072 + }, + { + "epoch": 1.72, + "learning_rate": 8.131394869251191e-07, + "loss": 0.5535, + "step": 67073 + }, + { + "epoch": 1.72, + "learning_rate": 8.131123039175227e-07, + "loss": 0.7002, + "step": 67074 + }, + { + "epoch": 1.72, + "learning_rate": 8.130851210530172e-07, + "loss": 0.5103, + "step": 67075 + }, + { + "epoch": 1.72, + "learning_rate": 8.130579383316241e-07, + "loss": 0.5376, + "step": 67076 + }, + { + "epoch": 1.72, + "learning_rate": 8.130307557533637e-07, + "loss": 0.6587, + "step": 67077 + }, + { + "epoch": 1.72, + "learning_rate": 8.130035733182572e-07, + "loss": 0.5244, + "step": 67078 + }, + { + "epoch": 1.72, + "learning_rate": 8.129763910263252e-07, + "loss": 0.5835, + "step": 67079 + }, + { + "epoch": 1.72, + "learning_rate": 8.129492088775887e-07, + "loss": 0.6157, + "step": 67080 + }, + { + "epoch": 1.72, + "learning_rate": 8.129220268720682e-07, + "loss": 0.5898, + "step": 67081 + }, + { + "epoch": 1.72, + "learning_rate": 8.128948450097853e-07, + "loss": 0.4208, + "step": 67082 + }, + { + "epoch": 1.72, + "learning_rate": 8.128676632907597e-07, + "loss": 0.532, + "step": 67083 + }, + { + "epoch": 1.72, + "learning_rate": 8.128404817150127e-07, + "loss": 0.3574, + "step": 67084 + }, + { + "epoch": 1.72, + "learning_rate": 8.128133002825653e-07, + "loss": 0.52, + "step": 67085 + }, + { + "epoch": 1.72, + "learning_rate": 8.127861189934378e-07, + "loss": 0.5186, + "step": 67086 + }, + { + "epoch": 1.72, + "learning_rate": 8.127589378476518e-07, + "loss": 0.6592, + "step": 67087 + }, + { + "epoch": 1.72, + "learning_rate": 8.127317568452274e-07, + "loss": 0.6299, + "step": 67088 + }, + { + "epoch": 1.72, + "learning_rate": 8.127045759861858e-07, + "loss": 0.4712, + "step": 67089 + }, + { + "epoch": 1.72, + "learning_rate": 8.126773952705477e-07, + "loss": 0.5652, + "step": 67090 + }, + { + "epoch": 1.72, + "learning_rate": 8.126502146983339e-07, + "loss": 0.7114, + "step": 67091 + }, + { + "epoch": 1.72, + "learning_rate": 8.126230342695655e-07, + "loss": 0.7051, + "step": 67092 + }, + { + "epoch": 1.72, + "learning_rate": 8.125958539842628e-07, + "loss": 0.7383, + "step": 67093 + }, + { + "epoch": 1.72, + "learning_rate": 8.125686738424465e-07, + "loss": 0.6914, + "step": 67094 + }, + { + "epoch": 1.72, + "learning_rate": 8.125414938441381e-07, + "loss": 0.6523, + "step": 67095 + }, + { + "epoch": 1.72, + "learning_rate": 8.125143139893579e-07, + "loss": 0.7256, + "step": 67096 + }, + { + "epoch": 1.72, + "learning_rate": 8.124871342781269e-07, + "loss": 0.4692, + "step": 67097 + }, + { + "epoch": 1.72, + "learning_rate": 8.124599547104659e-07, + "loss": 0.6392, + "step": 67098 + }, + { + "epoch": 1.72, + "learning_rate": 8.124327752863957e-07, + "loss": 0.6436, + "step": 67099 + }, + { + "epoch": 1.72, + "learning_rate": 8.124055960059371e-07, + "loss": 0.5273, + "step": 67100 + }, + { + "epoch": 1.72, + "learning_rate": 8.12378416869111e-07, + "loss": 0.5059, + "step": 67101 + }, + { + "epoch": 1.72, + "learning_rate": 8.123512378759382e-07, + "loss": 0.6367, + "step": 67102 + }, + { + "epoch": 1.72, + "learning_rate": 8.123240590264391e-07, + "loss": 0.5151, + "step": 67103 + }, + { + "epoch": 1.72, + "learning_rate": 8.122968803206352e-07, + "loss": 0.6592, + "step": 67104 + }, + { + "epoch": 1.72, + "learning_rate": 8.122697017585466e-07, + "loss": 0.5312, + "step": 67105 + }, + { + "epoch": 1.72, + "learning_rate": 8.122425233401947e-07, + "loss": 0.6201, + "step": 67106 + }, + { + "epoch": 1.72, + "learning_rate": 8.122153450656001e-07, + "loss": 0.7061, + "step": 67107 + }, + { + "epoch": 1.72, + "learning_rate": 8.121881669347832e-07, + "loss": 0.5344, + "step": 67108 + }, + { + "epoch": 1.72, + "learning_rate": 8.121609889477657e-07, + "loss": 0.5271, + "step": 67109 + }, + { + "epoch": 1.72, + "learning_rate": 8.121338111045673e-07, + "loss": 0.5928, + "step": 67110 + }, + { + "epoch": 1.72, + "learning_rate": 8.121066334052099e-07, + "loss": 0.4517, + "step": 67111 + }, + { + "epoch": 1.72, + "learning_rate": 8.12079455849714e-07, + "loss": 0.8369, + "step": 67112 + }, + { + "epoch": 1.72, + "learning_rate": 8.120522784380997e-07, + "loss": 0.6338, + "step": 67113 + }, + { + "epoch": 1.72, + "learning_rate": 8.120251011703884e-07, + "loss": 0.5581, + "step": 67114 + }, + { + "epoch": 1.72, + "learning_rate": 8.119979240466009e-07, + "loss": 0.6792, + "step": 67115 + }, + { + "epoch": 1.72, + "learning_rate": 8.11970747066758e-07, + "loss": 0.5381, + "step": 67116 + }, + { + "epoch": 1.72, + "learning_rate": 8.119435702308803e-07, + "loss": 0.666, + "step": 67117 + }, + { + "epoch": 1.72, + "learning_rate": 8.11916393538989e-07, + "loss": 0.6033, + "step": 67118 + }, + { + "epoch": 1.72, + "learning_rate": 8.118892169911044e-07, + "loss": 0.5986, + "step": 67119 + }, + { + "epoch": 1.72, + "learning_rate": 8.118620405872478e-07, + "loss": 0.519, + "step": 67120 + }, + { + "epoch": 1.72, + "learning_rate": 8.118348643274396e-07, + "loss": 0.6484, + "step": 67121 + }, + { + "epoch": 1.72, + "learning_rate": 8.118076882117013e-07, + "loss": 0.6226, + "step": 67122 + }, + { + "epoch": 1.72, + "learning_rate": 8.117805122400529e-07, + "loss": 0.5857, + "step": 67123 + }, + { + "epoch": 1.72, + "learning_rate": 8.117533364125155e-07, + "loss": 0.7031, + "step": 67124 + }, + { + "epoch": 1.72, + "learning_rate": 8.117261607291097e-07, + "loss": 0.5903, + "step": 67125 + }, + { + "epoch": 1.72, + "learning_rate": 8.116989851898567e-07, + "loss": 0.5437, + "step": 67126 + }, + { + "epoch": 1.72, + "learning_rate": 8.116718097947769e-07, + "loss": 0.8486, + "step": 67127 + }, + { + "epoch": 1.72, + "learning_rate": 8.116446345438916e-07, + "loss": 0.5854, + "step": 67128 + }, + { + "epoch": 1.72, + "learning_rate": 8.116174594372212e-07, + "loss": 0.4541, + "step": 67129 + }, + { + "epoch": 1.72, + "learning_rate": 8.115902844747867e-07, + "loss": 0.6865, + "step": 67130 + }, + { + "epoch": 1.72, + "learning_rate": 8.115631096566088e-07, + "loss": 0.5015, + "step": 67131 + }, + { + "epoch": 1.72, + "learning_rate": 8.115359349827087e-07, + "loss": 0.6367, + "step": 67132 + }, + { + "epoch": 1.72, + "learning_rate": 8.115087604531067e-07, + "loss": 0.5146, + "step": 67133 + }, + { + "epoch": 1.72, + "learning_rate": 8.114815860678235e-07, + "loss": 0.5054, + "step": 67134 + }, + { + "epoch": 1.72, + "learning_rate": 8.114544118268804e-07, + "loss": 0.5898, + "step": 67135 + }, + { + "epoch": 1.72, + "learning_rate": 8.114272377302978e-07, + "loss": 0.7959, + "step": 67136 + }, + { + "epoch": 1.72, + "learning_rate": 8.11400063778097e-07, + "loss": 0.668, + "step": 67137 + }, + { + "epoch": 1.72, + "learning_rate": 8.113728899702981e-07, + "loss": 0.6416, + "step": 67138 + }, + { + "epoch": 1.72, + "learning_rate": 8.113457163069226e-07, + "loss": 0.6904, + "step": 67139 + }, + { + "epoch": 1.72, + "learning_rate": 8.113185427879909e-07, + "loss": 0.4801, + "step": 67140 + }, + { + "epoch": 1.72, + "learning_rate": 8.11291369413524e-07, + "loss": 0.7158, + "step": 67141 + }, + { + "epoch": 1.72, + "learning_rate": 8.112641961835429e-07, + "loss": 0.6797, + "step": 67142 + }, + { + "epoch": 1.72, + "learning_rate": 8.112370230980679e-07, + "loss": 0.5879, + "step": 67143 + }, + { + "epoch": 1.72, + "learning_rate": 8.112098501571199e-07, + "loss": 0.5945, + "step": 67144 + }, + { + "epoch": 1.72, + "learning_rate": 8.111826773607199e-07, + "loss": 0.7344, + "step": 67145 + }, + { + "epoch": 1.72, + "learning_rate": 8.111555047088885e-07, + "loss": 0.6304, + "step": 67146 + }, + { + "epoch": 1.72, + "learning_rate": 8.111283322016468e-07, + "loss": 0.7246, + "step": 67147 + }, + { + "epoch": 1.72, + "learning_rate": 8.111011598390153e-07, + "loss": 0.5879, + "step": 67148 + }, + { + "epoch": 1.72, + "learning_rate": 8.11073987621015e-07, + "loss": 0.7749, + "step": 67149 + }, + { + "epoch": 1.72, + "learning_rate": 8.110468155476668e-07, + "loss": 0.666, + "step": 67150 + }, + { + "epoch": 1.72, + "learning_rate": 8.110196436189913e-07, + "loss": 0.6152, + "step": 67151 + }, + { + "epoch": 1.72, + "learning_rate": 8.109924718350097e-07, + "loss": 0.6138, + "step": 67152 + }, + { + "epoch": 1.72, + "learning_rate": 8.109653001957421e-07, + "loss": 0.6602, + "step": 67153 + }, + { + "epoch": 1.72, + "learning_rate": 8.109381287012097e-07, + "loss": 0.7603, + "step": 67154 + }, + { + "epoch": 1.72, + "learning_rate": 8.109109573514332e-07, + "loss": 0.6465, + "step": 67155 + }, + { + "epoch": 1.72, + "learning_rate": 8.108837861464337e-07, + "loss": 0.4375, + "step": 67156 + }, + { + "epoch": 1.72, + "learning_rate": 8.108566150862314e-07, + "loss": 0.6895, + "step": 67157 + }, + { + "epoch": 1.72, + "learning_rate": 8.108294441708479e-07, + "loss": 0.6135, + "step": 67158 + }, + { + "epoch": 1.72, + "learning_rate": 8.108022734003033e-07, + "loss": 0.541, + "step": 67159 + }, + { + "epoch": 1.72, + "learning_rate": 8.107751027746191e-07, + "loss": 0.8047, + "step": 67160 + }, + { + "epoch": 1.72, + "learning_rate": 8.107479322938156e-07, + "loss": 0.6543, + "step": 67161 + }, + { + "epoch": 1.72, + "learning_rate": 8.107207619579137e-07, + "loss": 0.7188, + "step": 67162 + }, + { + "epoch": 1.72, + "learning_rate": 8.10693591766934e-07, + "loss": 0.5762, + "step": 67163 + }, + { + "epoch": 1.72, + "learning_rate": 8.106664217208978e-07, + "loss": 0.6797, + "step": 67164 + }, + { + "epoch": 1.72, + "learning_rate": 8.106392518198252e-07, + "loss": 0.6582, + "step": 67165 + }, + { + "epoch": 1.72, + "learning_rate": 8.106120820637377e-07, + "loss": 0.7402, + "step": 67166 + }, + { + "epoch": 1.72, + "learning_rate": 8.105849124526556e-07, + "loss": 0.5186, + "step": 67167 + }, + { + "epoch": 1.72, + "learning_rate": 8.105577429866002e-07, + "loss": 0.7891, + "step": 67168 + }, + { + "epoch": 1.72, + "learning_rate": 8.105305736655918e-07, + "loss": 0.5044, + "step": 67169 + }, + { + "epoch": 1.72, + "learning_rate": 8.105034044896515e-07, + "loss": 0.6499, + "step": 67170 + }, + { + "epoch": 1.72, + "learning_rate": 8.104762354587999e-07, + "loss": 0.6758, + "step": 67171 + }, + { + "epoch": 1.72, + "learning_rate": 8.104490665730585e-07, + "loss": 0.6133, + "step": 67172 + }, + { + "epoch": 1.72, + "learning_rate": 8.104218978324472e-07, + "loss": 0.4756, + "step": 67173 + }, + { + "epoch": 1.72, + "learning_rate": 8.103947292369868e-07, + "loss": 0.667, + "step": 67174 + }, + { + "epoch": 1.72, + "learning_rate": 8.103675607866989e-07, + "loss": 0.5161, + "step": 67175 + }, + { + "epoch": 1.72, + "learning_rate": 8.103403924816034e-07, + "loss": 0.6909, + "step": 67176 + }, + { + "epoch": 1.72, + "learning_rate": 8.103132243217219e-07, + "loss": 0.6938, + "step": 67177 + }, + { + "epoch": 1.72, + "learning_rate": 8.102860563070746e-07, + "loss": 0.7148, + "step": 67178 + }, + { + "epoch": 1.72, + "learning_rate": 8.102588884376827e-07, + "loss": 0.6709, + "step": 67179 + }, + { + "epoch": 1.72, + "learning_rate": 8.10231720713567e-07, + "loss": 0.5718, + "step": 67180 + }, + { + "epoch": 1.72, + "learning_rate": 8.102045531347478e-07, + "loss": 0.6445, + "step": 67181 + }, + { + "epoch": 1.72, + "learning_rate": 8.101773857012466e-07, + "loss": 0.6328, + "step": 67182 + }, + { + "epoch": 1.72, + "learning_rate": 8.101502184130837e-07, + "loss": 0.6343, + "step": 67183 + }, + { + "epoch": 1.72, + "learning_rate": 8.101230512702799e-07, + "loss": 0.6958, + "step": 67184 + }, + { + "epoch": 1.72, + "learning_rate": 8.100958842728564e-07, + "loss": 0.5537, + "step": 67185 + }, + { + "epoch": 1.72, + "learning_rate": 8.100687174208334e-07, + "loss": 0.7271, + "step": 67186 + }, + { + "epoch": 1.72, + "learning_rate": 8.100415507142323e-07, + "loss": 0.7402, + "step": 67187 + }, + { + "epoch": 1.72, + "learning_rate": 8.100143841530735e-07, + "loss": 0.6299, + "step": 67188 + }, + { + "epoch": 1.72, + "learning_rate": 8.09987217737378e-07, + "loss": 0.6289, + "step": 67189 + }, + { + "epoch": 1.72, + "learning_rate": 8.099600514671666e-07, + "loss": 0.7529, + "step": 67190 + }, + { + "epoch": 1.72, + "learning_rate": 8.099328853424601e-07, + "loss": 0.6714, + "step": 67191 + }, + { + "epoch": 1.72, + "learning_rate": 8.099057193632795e-07, + "loss": 0.6523, + "step": 67192 + }, + { + "epoch": 1.72, + "learning_rate": 8.098785535296448e-07, + "loss": 0.7676, + "step": 67193 + }, + { + "epoch": 1.72, + "learning_rate": 8.098513878415778e-07, + "loss": 0.7251, + "step": 67194 + }, + { + "epoch": 1.72, + "learning_rate": 8.098242222990985e-07, + "loss": 0.6372, + "step": 67195 + }, + { + "epoch": 1.72, + "learning_rate": 8.097970569022283e-07, + "loss": 0.5283, + "step": 67196 + }, + { + "epoch": 1.72, + "learning_rate": 8.097698916509876e-07, + "loss": 0.5391, + "step": 67197 + }, + { + "epoch": 1.72, + "learning_rate": 8.097427265453974e-07, + "loss": 0.6289, + "step": 67198 + }, + { + "epoch": 1.72, + "learning_rate": 8.097155615854785e-07, + "loss": 0.6538, + "step": 67199 + }, + { + "epoch": 1.72, + "learning_rate": 8.096883967712513e-07, + "loss": 0.583, + "step": 67200 + }, + { + "epoch": 1.72, + "learning_rate": 8.096612321027374e-07, + "loss": 0.667, + "step": 67201 + }, + { + "epoch": 1.72, + "learning_rate": 8.096340675799572e-07, + "loss": 0.8018, + "step": 67202 + }, + { + "epoch": 1.72, + "learning_rate": 8.096069032029311e-07, + "loss": 0.6558, + "step": 67203 + }, + { + "epoch": 1.72, + "learning_rate": 8.095797389716804e-07, + "loss": 0.582, + "step": 67204 + }, + { + "epoch": 1.72, + "learning_rate": 8.095525748862257e-07, + "loss": 0.55, + "step": 67205 + }, + { + "epoch": 1.72, + "learning_rate": 8.095254109465878e-07, + "loss": 0.6768, + "step": 67206 + }, + { + "epoch": 1.72, + "learning_rate": 8.094982471527873e-07, + "loss": 0.6543, + "step": 67207 + }, + { + "epoch": 1.72, + "learning_rate": 8.094710835048457e-07, + "loss": 0.5894, + "step": 67208 + }, + { + "epoch": 1.72, + "learning_rate": 8.094439200027829e-07, + "loss": 0.5983, + "step": 67209 + }, + { + "epoch": 1.72, + "learning_rate": 8.094167566466204e-07, + "loss": 0.6875, + "step": 67210 + }, + { + "epoch": 1.72, + "learning_rate": 8.093895934363785e-07, + "loss": 0.6426, + "step": 67211 + }, + { + "epoch": 1.72, + "learning_rate": 8.093624303720788e-07, + "loss": 0.749, + "step": 67212 + }, + { + "epoch": 1.72, + "learning_rate": 8.093352674537412e-07, + "loss": 0.3982, + "step": 67213 + }, + { + "epoch": 1.72, + "learning_rate": 8.093081046813868e-07, + "loss": 0.8145, + "step": 67214 + }, + { + "epoch": 1.72, + "learning_rate": 8.092809420550363e-07, + "loss": 0.6963, + "step": 67215 + }, + { + "epoch": 1.72, + "learning_rate": 8.092537795747108e-07, + "loss": 0.605, + "step": 67216 + }, + { + "epoch": 1.72, + "learning_rate": 8.092266172404305e-07, + "loss": 0.605, + "step": 67217 + }, + { + "epoch": 1.72, + "learning_rate": 8.09199455052217e-07, + "loss": 0.5007, + "step": 67218 + }, + { + "epoch": 1.72, + "learning_rate": 8.091722930100904e-07, + "loss": 0.554, + "step": 67219 + }, + { + "epoch": 1.72, + "learning_rate": 8.091451311140721e-07, + "loss": 0.4814, + "step": 67220 + }, + { + "epoch": 1.72, + "learning_rate": 8.091179693641823e-07, + "loss": 0.5942, + "step": 67221 + }, + { + "epoch": 1.72, + "learning_rate": 8.090908077604426e-07, + "loss": 0.5781, + "step": 67222 + }, + { + "epoch": 1.72, + "learning_rate": 8.09063646302873e-07, + "loss": 0.5117, + "step": 67223 + }, + { + "epoch": 1.72, + "learning_rate": 8.090364849914945e-07, + "loss": 0.6523, + "step": 67224 + }, + { + "epoch": 1.72, + "learning_rate": 8.090093238263281e-07, + "loss": 0.5786, + "step": 67225 + }, + { + "epoch": 1.72, + "learning_rate": 8.089821628073943e-07, + "loss": 0.5698, + "step": 67226 + }, + { + "epoch": 1.72, + "learning_rate": 8.089550019347142e-07, + "loss": 0.4849, + "step": 67227 + }, + { + "epoch": 1.72, + "learning_rate": 8.089278412083084e-07, + "loss": 0.6943, + "step": 67228 + }, + { + "epoch": 1.72, + "learning_rate": 8.08900680628198e-07, + "loss": 0.6348, + "step": 67229 + }, + { + "epoch": 1.72, + "learning_rate": 8.088735201944031e-07, + "loss": 0.5815, + "step": 67230 + }, + { + "epoch": 1.72, + "learning_rate": 8.088463599069454e-07, + "loss": 0.6934, + "step": 67231 + }, + { + "epoch": 1.72, + "learning_rate": 8.088191997658453e-07, + "loss": 0.5996, + "step": 67232 + }, + { + "epoch": 1.72, + "learning_rate": 8.087920397711236e-07, + "loss": 0.6885, + "step": 67233 + }, + { + "epoch": 1.72, + "learning_rate": 8.087648799228006e-07, + "loss": 0.6309, + "step": 67234 + }, + { + "epoch": 1.72, + "learning_rate": 8.087377202208978e-07, + "loss": 0.7129, + "step": 67235 + }, + { + "epoch": 1.72, + "learning_rate": 8.087105606654355e-07, + "loss": 0.6807, + "step": 67236 + }, + { + "epoch": 1.72, + "learning_rate": 8.08683401256435e-07, + "loss": 0.8564, + "step": 67237 + }, + { + "epoch": 1.72, + "learning_rate": 8.086562419939166e-07, + "loss": 0.4568, + "step": 67238 + }, + { + "epoch": 1.72, + "learning_rate": 8.086290828779015e-07, + "loss": 0.6782, + "step": 67239 + }, + { + "epoch": 1.72, + "learning_rate": 8.086019239084101e-07, + "loss": 0.4985, + "step": 67240 + }, + { + "epoch": 1.72, + "learning_rate": 8.085747650854636e-07, + "loss": 0.4873, + "step": 67241 + }, + { + "epoch": 1.72, + "learning_rate": 8.085476064090828e-07, + "loss": 0.7422, + "step": 67242 + }, + { + "epoch": 1.72, + "learning_rate": 8.08520447879288e-07, + "loss": 0.4656, + "step": 67243 + }, + { + "epoch": 1.72, + "learning_rate": 8.084932894961004e-07, + "loss": 0.6011, + "step": 67244 + }, + { + "epoch": 1.72, + "learning_rate": 8.084661312595405e-07, + "loss": 0.4176, + "step": 67245 + }, + { + "epoch": 1.72, + "learning_rate": 8.084389731696295e-07, + "loss": 0.6631, + "step": 67246 + }, + { + "epoch": 1.72, + "learning_rate": 8.084118152263877e-07, + "loss": 0.6807, + "step": 67247 + }, + { + "epoch": 1.72, + "learning_rate": 8.083846574298363e-07, + "loss": 0.6885, + "step": 67248 + }, + { + "epoch": 1.72, + "learning_rate": 8.083574997799958e-07, + "loss": 0.6421, + "step": 67249 + }, + { + "epoch": 1.72, + "learning_rate": 8.083303422768875e-07, + "loss": 0.6226, + "step": 67250 + }, + { + "epoch": 1.72, + "learning_rate": 8.083031849205315e-07, + "loss": 0.5991, + "step": 67251 + }, + { + "epoch": 1.72, + "learning_rate": 8.082760277109497e-07, + "loss": 0.4849, + "step": 67252 + }, + { + "epoch": 1.72, + "learning_rate": 8.082488706481613e-07, + "loss": 0.6357, + "step": 67253 + }, + { + "epoch": 1.72, + "learning_rate": 8.082217137321882e-07, + "loss": 0.8027, + "step": 67254 + }, + { + "epoch": 1.72, + "learning_rate": 8.081945569630508e-07, + "loss": 0.7461, + "step": 67255 + }, + { + "epoch": 1.72, + "learning_rate": 8.081674003407702e-07, + "loss": 0.7144, + "step": 67256 + }, + { + "epoch": 1.72, + "learning_rate": 8.081402438653668e-07, + "loss": 0.6914, + "step": 67257 + }, + { + "epoch": 1.72, + "learning_rate": 8.081130875368618e-07, + "loss": 0.573, + "step": 67258 + }, + { + "epoch": 1.72, + "learning_rate": 8.080859313552755e-07, + "loss": 0.7197, + "step": 67259 + }, + { + "epoch": 1.72, + "learning_rate": 8.080587753206293e-07, + "loss": 0.3683, + "step": 67260 + }, + { + "epoch": 1.72, + "learning_rate": 8.080316194329433e-07, + "loss": 0.5571, + "step": 67261 + }, + { + "epoch": 1.72, + "learning_rate": 8.080044636922392e-07, + "loss": 0.6733, + "step": 67262 + }, + { + "epoch": 1.72, + "learning_rate": 8.07977308098537e-07, + "loss": 0.6914, + "step": 67263 + }, + { + "epoch": 1.72, + "learning_rate": 8.079501526518576e-07, + "loss": 0.5298, + "step": 67264 + }, + { + "epoch": 1.72, + "learning_rate": 8.07922997352222e-07, + "loss": 0.6191, + "step": 67265 + }, + { + "epoch": 1.72, + "learning_rate": 8.078958421996509e-07, + "loss": 0.478, + "step": 67266 + }, + { + "epoch": 1.72, + "learning_rate": 8.078686871941652e-07, + "loss": 0.5864, + "step": 67267 + }, + { + "epoch": 1.72, + "learning_rate": 8.078415323357855e-07, + "loss": 0.5752, + "step": 67268 + }, + { + "epoch": 1.72, + "learning_rate": 8.078143776245327e-07, + "loss": 0.457, + "step": 67269 + }, + { + "epoch": 1.72, + "learning_rate": 8.077872230604279e-07, + "loss": 0.6807, + "step": 67270 + }, + { + "epoch": 1.72, + "learning_rate": 8.077600686434913e-07, + "loss": 0.6025, + "step": 67271 + }, + { + "epoch": 1.72, + "learning_rate": 8.077329143737443e-07, + "loss": 0.6729, + "step": 67272 + }, + { + "epoch": 1.72, + "learning_rate": 8.07705760251207e-07, + "loss": 0.7681, + "step": 67273 + }, + { + "epoch": 1.72, + "learning_rate": 8.076786062759007e-07, + "loss": 0.4907, + "step": 67274 + }, + { + "epoch": 1.72, + "learning_rate": 8.076514524478461e-07, + "loss": 0.3872, + "step": 67275 + }, + { + "epoch": 1.72, + "learning_rate": 8.076242987670637e-07, + "loss": 0.7061, + "step": 67276 + }, + { + "epoch": 1.72, + "learning_rate": 8.075971452335747e-07, + "loss": 0.6213, + "step": 67277 + }, + { + "epoch": 1.72, + "learning_rate": 8.075699918473995e-07, + "loss": 0.5381, + "step": 67278 + }, + { + "epoch": 1.72, + "learning_rate": 8.075428386085595e-07, + "loss": 0.8379, + "step": 67279 + }, + { + "epoch": 1.72, + "learning_rate": 8.075156855170747e-07, + "loss": 0.5547, + "step": 67280 + }, + { + "epoch": 1.72, + "learning_rate": 8.074885325729666e-07, + "loss": 0.6133, + "step": 67281 + }, + { + "epoch": 1.72, + "learning_rate": 8.074613797762558e-07, + "loss": 0.5542, + "step": 67282 + }, + { + "epoch": 1.72, + "learning_rate": 8.074342271269627e-07, + "loss": 0.5728, + "step": 67283 + }, + { + "epoch": 1.72, + "learning_rate": 8.074070746251083e-07, + "loss": 0.6455, + "step": 67284 + }, + { + "epoch": 1.72, + "learning_rate": 8.073799222707135e-07, + "loss": 0.5552, + "step": 67285 + }, + { + "epoch": 1.72, + "learning_rate": 8.073527700637992e-07, + "loss": 0.5295, + "step": 67286 + }, + { + "epoch": 1.72, + "learning_rate": 8.073256180043859e-07, + "loss": 0.7324, + "step": 67287 + }, + { + "epoch": 1.72, + "learning_rate": 8.072984660924944e-07, + "loss": 0.3894, + "step": 67288 + }, + { + "epoch": 1.72, + "learning_rate": 8.072713143281459e-07, + "loss": 0.6426, + "step": 67289 + }, + { + "epoch": 1.72, + "learning_rate": 8.072441627113605e-07, + "loss": 0.709, + "step": 67290 + }, + { + "epoch": 1.72, + "learning_rate": 8.072170112421597e-07, + "loss": 0.6465, + "step": 67291 + }, + { + "epoch": 1.72, + "learning_rate": 8.071898599205642e-07, + "loss": 0.625, + "step": 67292 + }, + { + "epoch": 1.72, + "learning_rate": 8.071627087465941e-07, + "loss": 0.606, + "step": 67293 + }, + { + "epoch": 1.72, + "learning_rate": 8.071355577202709e-07, + "loss": 0.6973, + "step": 67294 + }, + { + "epoch": 1.72, + "learning_rate": 8.071084068416149e-07, + "loss": 0.71, + "step": 67295 + }, + { + "epoch": 1.72, + "learning_rate": 8.070812561106472e-07, + "loss": 0.584, + "step": 67296 + }, + { + "epoch": 1.72, + "learning_rate": 8.070541055273884e-07, + "loss": 0.5654, + "step": 67297 + }, + { + "epoch": 1.72, + "learning_rate": 8.070269550918597e-07, + "loss": 0.6147, + "step": 67298 + }, + { + "epoch": 1.72, + "learning_rate": 8.069998048040813e-07, + "loss": 0.6528, + "step": 67299 + }, + { + "epoch": 1.72, + "learning_rate": 8.069726546640745e-07, + "loss": 0.6543, + "step": 67300 + }, + { + "epoch": 1.72, + "learning_rate": 8.069455046718596e-07, + "loss": 0.6719, + "step": 67301 + }, + { + "epoch": 1.72, + "learning_rate": 8.069183548274581e-07, + "loss": 0.6328, + "step": 67302 + }, + { + "epoch": 1.73, + "learning_rate": 8.068912051308901e-07, + "loss": 0.4861, + "step": 67303 + }, + { + "epoch": 1.73, + "learning_rate": 8.068640555821768e-07, + "loss": 0.7256, + "step": 67304 + }, + { + "epoch": 1.73, + "learning_rate": 8.068369061813384e-07, + "loss": 0.4995, + "step": 67305 + }, + { + "epoch": 1.73, + "learning_rate": 8.068097569283964e-07, + "loss": 0.5869, + "step": 67306 + }, + { + "epoch": 1.73, + "learning_rate": 8.06782607823371e-07, + "loss": 0.583, + "step": 67307 + }, + { + "epoch": 1.73, + "learning_rate": 8.067554588662835e-07, + "loss": 0.7461, + "step": 67308 + }, + { + "epoch": 1.73, + "learning_rate": 8.067283100571542e-07, + "loss": 0.6616, + "step": 67309 + }, + { + "epoch": 1.73, + "learning_rate": 8.067011613960045e-07, + "loss": 0.6924, + "step": 67310 + }, + { + "epoch": 1.73, + "learning_rate": 8.066740128828546e-07, + "loss": 0.5754, + "step": 67311 + }, + { + "epoch": 1.73, + "learning_rate": 8.066468645177259e-07, + "loss": 0.6133, + "step": 67312 + }, + { + "epoch": 1.73, + "learning_rate": 8.066197163006386e-07, + "loss": 0.7256, + "step": 67313 + }, + { + "epoch": 1.73, + "learning_rate": 8.065925682316135e-07, + "loss": 0.4976, + "step": 67314 + }, + { + "epoch": 1.73, + "learning_rate": 8.065654203106717e-07, + "loss": 0.6689, + "step": 67315 + }, + { + "epoch": 1.73, + "learning_rate": 8.065382725378337e-07, + "loss": 0.7178, + "step": 67316 + }, + { + "epoch": 1.73, + "learning_rate": 8.065111249131207e-07, + "loss": 0.4836, + "step": 67317 + }, + { + "epoch": 1.73, + "learning_rate": 8.064839774365531e-07, + "loss": 0.7109, + "step": 67318 + }, + { + "epoch": 1.73, + "learning_rate": 8.064568301081518e-07, + "loss": 0.6826, + "step": 67319 + }, + { + "epoch": 1.73, + "learning_rate": 8.064296829279375e-07, + "loss": 0.6787, + "step": 67320 + }, + { + "epoch": 1.73, + "learning_rate": 8.064025358959314e-07, + "loss": 0.5874, + "step": 67321 + }, + { + "epoch": 1.73, + "learning_rate": 8.063753890121541e-07, + "loss": 0.6748, + "step": 67322 + }, + { + "epoch": 1.73, + "learning_rate": 8.063482422766261e-07, + "loss": 0.5542, + "step": 67323 + }, + { + "epoch": 1.73, + "learning_rate": 8.06321095689368e-07, + "loss": 0.7432, + "step": 67324 + }, + { + "epoch": 1.73, + "learning_rate": 8.062939492504012e-07, + "loss": 0.71, + "step": 67325 + }, + { + "epoch": 1.73, + "learning_rate": 8.062668029597461e-07, + "loss": 0.7021, + "step": 67326 + }, + { + "epoch": 1.73, + "learning_rate": 8.062396568174238e-07, + "loss": 0.6309, + "step": 67327 + }, + { + "epoch": 1.73, + "learning_rate": 8.062125108234547e-07, + "loss": 0.5254, + "step": 67328 + }, + { + "epoch": 1.73, + "learning_rate": 8.061853649778598e-07, + "loss": 0.7178, + "step": 67329 + }, + { + "epoch": 1.73, + "learning_rate": 8.061582192806599e-07, + "loss": 0.5605, + "step": 67330 + }, + { + "epoch": 1.73, + "learning_rate": 8.061310737318757e-07, + "loss": 0.5708, + "step": 67331 + }, + { + "epoch": 1.73, + "learning_rate": 8.061039283315284e-07, + "loss": 0.4834, + "step": 67332 + }, + { + "epoch": 1.73, + "learning_rate": 8.060767830796379e-07, + "loss": 0.6562, + "step": 67333 + }, + { + "epoch": 1.73, + "learning_rate": 8.060496379762257e-07, + "loss": 0.7812, + "step": 67334 + }, + { + "epoch": 1.73, + "learning_rate": 8.060224930213121e-07, + "loss": 0.6865, + "step": 67335 + }, + { + "epoch": 1.73, + "learning_rate": 8.059953482149186e-07, + "loss": 0.7568, + "step": 67336 + }, + { + "epoch": 1.73, + "learning_rate": 8.059682035570651e-07, + "loss": 0.6802, + "step": 67337 + }, + { + "epoch": 1.73, + "learning_rate": 8.059410590477732e-07, + "loss": 0.6934, + "step": 67338 + }, + { + "epoch": 1.73, + "learning_rate": 8.05913914687063e-07, + "loss": 0.6948, + "step": 67339 + }, + { + "epoch": 1.73, + "learning_rate": 8.058867704749559e-07, + "loss": 0.6367, + "step": 67340 + }, + { + "epoch": 1.73, + "learning_rate": 8.058596264114719e-07, + "loss": 0.6057, + "step": 67341 + }, + { + "epoch": 1.73, + "learning_rate": 8.058324824966332e-07, + "loss": 0.7129, + "step": 67342 + }, + { + "epoch": 1.73, + "learning_rate": 8.058053387304588e-07, + "loss": 0.6555, + "step": 67343 + }, + { + "epoch": 1.73, + "learning_rate": 8.057781951129708e-07, + "loss": 0.7451, + "step": 67344 + }, + { + "epoch": 1.73, + "learning_rate": 8.05751051644189e-07, + "loss": 0.6758, + "step": 67345 + }, + { + "epoch": 1.73, + "learning_rate": 8.05723908324135e-07, + "loss": 0.5957, + "step": 67346 + }, + { + "epoch": 1.73, + "learning_rate": 8.056967651528292e-07, + "loss": 0.5088, + "step": 67347 + }, + { + "epoch": 1.73, + "learning_rate": 8.056696221302924e-07, + "loss": 0.5767, + "step": 67348 + }, + { + "epoch": 1.73, + "learning_rate": 8.056424792565454e-07, + "loss": 0.5483, + "step": 67349 + }, + { + "epoch": 1.73, + "learning_rate": 8.056153365316092e-07, + "loss": 0.4844, + "step": 67350 + }, + { + "epoch": 1.73, + "learning_rate": 8.055881939555041e-07, + "loss": 0.8154, + "step": 67351 + }, + { + "epoch": 1.73, + "learning_rate": 8.055610515282517e-07, + "loss": 0.6553, + "step": 67352 + }, + { + "epoch": 1.73, + "learning_rate": 8.055339092498721e-07, + "loss": 0.573, + "step": 67353 + }, + { + "epoch": 1.73, + "learning_rate": 8.055067671203859e-07, + "loss": 0.6807, + "step": 67354 + }, + { + "epoch": 1.73, + "learning_rate": 8.054796251398145e-07, + "loss": 0.626, + "step": 67355 + }, + { + "epoch": 1.73, + "learning_rate": 8.054524833081782e-07, + "loss": 0.6348, + "step": 67356 + }, + { + "epoch": 1.73, + "learning_rate": 8.054253416254982e-07, + "loss": 0.8086, + "step": 67357 + }, + { + "epoch": 1.73, + "learning_rate": 8.053982000917948e-07, + "loss": 0.5753, + "step": 67358 + }, + { + "epoch": 1.73, + "learning_rate": 8.053710587070894e-07, + "loss": 0.6294, + "step": 67359 + }, + { + "epoch": 1.73, + "learning_rate": 8.053439174714023e-07, + "loss": 0.6084, + "step": 67360 + }, + { + "epoch": 1.73, + "learning_rate": 8.053167763847543e-07, + "loss": 0.6323, + "step": 67361 + }, + { + "epoch": 1.73, + "learning_rate": 8.052896354471666e-07, + "loss": 0.3367, + "step": 67362 + }, + { + "epoch": 1.73, + "learning_rate": 8.052624946586595e-07, + "loss": 0.6353, + "step": 67363 + }, + { + "epoch": 1.73, + "learning_rate": 8.052353540192538e-07, + "loss": 0.6611, + "step": 67364 + }, + { + "epoch": 1.73, + "learning_rate": 8.052082135289706e-07, + "loss": 0.6333, + "step": 67365 + }, + { + "epoch": 1.73, + "learning_rate": 8.051810731878304e-07, + "loss": 0.8057, + "step": 67366 + }, + { + "epoch": 1.73, + "learning_rate": 8.051539329958541e-07, + "loss": 0.583, + "step": 67367 + }, + { + "epoch": 1.73, + "learning_rate": 8.051267929530624e-07, + "loss": 0.7012, + "step": 67368 + }, + { + "epoch": 1.73, + "learning_rate": 8.050996530594764e-07, + "loss": 0.8379, + "step": 67369 + }, + { + "epoch": 1.73, + "learning_rate": 8.050725133151164e-07, + "loss": 0.4436, + "step": 67370 + }, + { + "epoch": 1.73, + "learning_rate": 8.050453737200036e-07, + "loss": 0.4143, + "step": 67371 + }, + { + "epoch": 1.73, + "learning_rate": 8.050182342741587e-07, + "loss": 0.7363, + "step": 67372 + }, + { + "epoch": 1.73, + "learning_rate": 8.049910949776021e-07, + "loss": 0.6924, + "step": 67373 + }, + { + "epoch": 1.73, + "learning_rate": 8.049639558303549e-07, + "loss": 0.707, + "step": 67374 + }, + { + "epoch": 1.73, + "learning_rate": 8.049368168324378e-07, + "loss": 0.6904, + "step": 67375 + }, + { + "epoch": 1.73, + "learning_rate": 8.049096779838717e-07, + "loss": 0.4886, + "step": 67376 + }, + { + "epoch": 1.73, + "learning_rate": 8.048825392846774e-07, + "loss": 0.7627, + "step": 67377 + }, + { + "epoch": 1.73, + "learning_rate": 8.048554007348753e-07, + "loss": 0.604, + "step": 67378 + }, + { + "epoch": 1.73, + "learning_rate": 8.048282623344867e-07, + "loss": 0.4971, + "step": 67379 + }, + { + "epoch": 1.73, + "learning_rate": 8.048011240835318e-07, + "loss": 0.6152, + "step": 67380 + }, + { + "epoch": 1.73, + "learning_rate": 8.047739859820322e-07, + "loss": 0.5339, + "step": 67381 + }, + { + "epoch": 1.73, + "learning_rate": 8.04746848030008e-07, + "loss": 0.4279, + "step": 67382 + }, + { + "epoch": 1.73, + "learning_rate": 8.047197102274798e-07, + "loss": 0.6011, + "step": 67383 + }, + { + "epoch": 1.73, + "learning_rate": 8.046925725744692e-07, + "loss": 0.7471, + "step": 67384 + }, + { + "epoch": 1.73, + "learning_rate": 8.046654350709962e-07, + "loss": 0.9062, + "step": 67385 + }, + { + "epoch": 1.73, + "learning_rate": 8.04638297717082e-07, + "loss": 0.623, + "step": 67386 + }, + { + "epoch": 1.73, + "learning_rate": 8.046111605127471e-07, + "loss": 0.6226, + "step": 67387 + }, + { + "epoch": 1.73, + "learning_rate": 8.045840234580128e-07, + "loss": 0.6816, + "step": 67388 + }, + { + "epoch": 1.73, + "learning_rate": 8.045568865528991e-07, + "loss": 0.7783, + "step": 67389 + }, + { + "epoch": 1.73, + "learning_rate": 8.045297497974276e-07, + "loss": 0.5479, + "step": 67390 + }, + { + "epoch": 1.73, + "learning_rate": 8.045026131916188e-07, + "loss": 0.7842, + "step": 67391 + }, + { + "epoch": 1.73, + "learning_rate": 8.04475476735493e-07, + "loss": 0.3367, + "step": 67392 + }, + { + "epoch": 1.73, + "learning_rate": 8.044483404290715e-07, + "loss": 0.5977, + "step": 67393 + }, + { + "epoch": 1.73, + "learning_rate": 8.044212042723749e-07, + "loss": 0.5278, + "step": 67394 + }, + { + "epoch": 1.73, + "learning_rate": 8.043940682654238e-07, + "loss": 0.6599, + "step": 67395 + }, + { + "epoch": 1.73, + "learning_rate": 8.043669324082394e-07, + "loss": 0.7969, + "step": 67396 + }, + { + "epoch": 1.73, + "learning_rate": 8.043397967008421e-07, + "loss": 0.6118, + "step": 67397 + }, + { + "epoch": 1.73, + "learning_rate": 8.043126611432529e-07, + "loss": 0.5859, + "step": 67398 + }, + { + "epoch": 1.73, + "learning_rate": 8.042855257354923e-07, + "loss": 0.6763, + "step": 67399 + }, + { + "epoch": 1.73, + "learning_rate": 8.042583904775814e-07, + "loss": 0.7725, + "step": 67400 + }, + { + "epoch": 1.73, + "learning_rate": 8.042312553695414e-07, + "loss": 0.731, + "step": 67401 + }, + { + "epoch": 1.73, + "learning_rate": 8.042041204113918e-07, + "loss": 0.5996, + "step": 67402 + }, + { + "epoch": 1.73, + "learning_rate": 8.041769856031544e-07, + "loss": 0.5591, + "step": 67403 + }, + { + "epoch": 1.73, + "learning_rate": 8.041498509448494e-07, + "loss": 0.6494, + "step": 67404 + }, + { + "epoch": 1.73, + "learning_rate": 8.041227164364982e-07, + "loss": 0.6689, + "step": 67405 + }, + { + "epoch": 1.73, + "learning_rate": 8.04095582078121e-07, + "loss": 0.5938, + "step": 67406 + }, + { + "epoch": 1.73, + "learning_rate": 8.040684478697389e-07, + "loss": 0.4883, + "step": 67407 + }, + { + "epoch": 1.73, + "learning_rate": 8.040413138113724e-07, + "loss": 0.6348, + "step": 67408 + }, + { + "epoch": 1.73, + "learning_rate": 8.040141799030428e-07, + "loss": 0.5781, + "step": 67409 + }, + { + "epoch": 1.73, + "learning_rate": 8.039870461447702e-07, + "loss": 0.5762, + "step": 67410 + }, + { + "epoch": 1.73, + "learning_rate": 8.039599125365763e-07, + "loss": 0.5586, + "step": 67411 + }, + { + "epoch": 1.73, + "learning_rate": 8.039327790784808e-07, + "loss": 0.7075, + "step": 67412 + }, + { + "epoch": 1.73, + "learning_rate": 8.03905645770505e-07, + "loss": 0.6221, + "step": 67413 + }, + { + "epoch": 1.73, + "learning_rate": 8.038785126126694e-07, + "loss": 0.6953, + "step": 67414 + }, + { + "epoch": 1.73, + "learning_rate": 8.038513796049954e-07, + "loss": 0.6646, + "step": 67415 + }, + { + "epoch": 1.73, + "learning_rate": 8.038242467475032e-07, + "loss": 0.7314, + "step": 67416 + }, + { + "epoch": 1.73, + "learning_rate": 8.037971140402138e-07, + "loss": 0.7227, + "step": 67417 + }, + { + "epoch": 1.73, + "learning_rate": 8.037699814831477e-07, + "loss": 0.7344, + "step": 67418 + }, + { + "epoch": 1.73, + "learning_rate": 8.037428490763262e-07, + "loss": 0.4812, + "step": 67419 + }, + { + "epoch": 1.73, + "learning_rate": 8.037157168197695e-07, + "loss": 0.6021, + "step": 67420 + }, + { + "epoch": 1.73, + "learning_rate": 8.036885847134991e-07, + "loss": 0.4878, + "step": 67421 + }, + { + "epoch": 1.73, + "learning_rate": 8.036614527575352e-07, + "loss": 0.6641, + "step": 67422 + }, + { + "epoch": 1.73, + "learning_rate": 8.036343209518983e-07, + "loss": 0.5728, + "step": 67423 + }, + { + "epoch": 1.73, + "learning_rate": 8.0360718929661e-07, + "loss": 0.6543, + "step": 67424 + }, + { + "epoch": 1.73, + "learning_rate": 8.035800577916902e-07, + "loss": 0.5686, + "step": 67425 + }, + { + "epoch": 1.73, + "learning_rate": 8.035529264371605e-07, + "loss": 0.8232, + "step": 67426 + }, + { + "epoch": 1.73, + "learning_rate": 8.035257952330411e-07, + "loss": 0.8418, + "step": 67427 + }, + { + "epoch": 1.73, + "learning_rate": 8.034986641793531e-07, + "loss": 0.6274, + "step": 67428 + }, + { + "epoch": 1.73, + "learning_rate": 8.03471533276117e-07, + "loss": 0.4644, + "step": 67429 + }, + { + "epoch": 1.73, + "learning_rate": 8.034444025233537e-07, + "loss": 0.6318, + "step": 67430 + }, + { + "epoch": 1.73, + "learning_rate": 8.034172719210845e-07, + "loss": 0.7207, + "step": 67431 + }, + { + "epoch": 1.73, + "learning_rate": 8.033901414693292e-07, + "loss": 0.571, + "step": 67432 + }, + { + "epoch": 1.73, + "learning_rate": 8.033630111681089e-07, + "loss": 0.4241, + "step": 67433 + }, + { + "epoch": 1.73, + "learning_rate": 8.033358810174448e-07, + "loss": 0.5487, + "step": 67434 + }, + { + "epoch": 1.73, + "learning_rate": 8.033087510173571e-07, + "loss": 0.5913, + "step": 67435 + }, + { + "epoch": 1.73, + "learning_rate": 8.03281621167867e-07, + "loss": 0.5078, + "step": 67436 + }, + { + "epoch": 1.73, + "learning_rate": 8.032544914689949e-07, + "loss": 0.5947, + "step": 67437 + }, + { + "epoch": 1.73, + "learning_rate": 8.032273619207621e-07, + "loss": 0.6436, + "step": 67438 + }, + { + "epoch": 1.73, + "learning_rate": 8.032002325231888e-07, + "loss": 0.4116, + "step": 67439 + }, + { + "epoch": 1.73, + "learning_rate": 8.031731032762963e-07, + "loss": 0.6934, + "step": 67440 + }, + { + "epoch": 1.73, + "learning_rate": 8.031459741801052e-07, + "loss": 0.7266, + "step": 67441 + }, + { + "epoch": 1.73, + "learning_rate": 8.031188452346358e-07, + "loss": 0.6289, + "step": 67442 + }, + { + "epoch": 1.73, + "learning_rate": 8.030917164399094e-07, + "loss": 0.7231, + "step": 67443 + }, + { + "epoch": 1.73, + "learning_rate": 8.030645877959465e-07, + "loss": 0.6055, + "step": 67444 + }, + { + "epoch": 1.73, + "learning_rate": 8.030374593027682e-07, + "loss": 0.5977, + "step": 67445 + }, + { + "epoch": 1.73, + "learning_rate": 8.030103309603948e-07, + "loss": 0.7568, + "step": 67446 + }, + { + "epoch": 1.73, + "learning_rate": 8.029832027688477e-07, + "loss": 0.5901, + "step": 67447 + }, + { + "epoch": 1.73, + "learning_rate": 8.02956074728147e-07, + "loss": 0.7124, + "step": 67448 + }, + { + "epoch": 1.73, + "learning_rate": 8.02928946838314e-07, + "loss": 0.5063, + "step": 67449 + }, + { + "epoch": 1.73, + "learning_rate": 8.02901819099369e-07, + "loss": 0.54, + "step": 67450 + }, + { + "epoch": 1.73, + "learning_rate": 8.028746915113336e-07, + "loss": 0.5132, + "step": 67451 + }, + { + "epoch": 1.73, + "learning_rate": 8.028475640742273e-07, + "loss": 0.4878, + "step": 67452 + }, + { + "epoch": 1.73, + "learning_rate": 8.028204367880719e-07, + "loss": 0.5352, + "step": 67453 + }, + { + "epoch": 1.73, + "learning_rate": 8.027933096528875e-07, + "loss": 0.8701, + "step": 67454 + }, + { + "epoch": 1.73, + "learning_rate": 8.027661826686955e-07, + "loss": 0.666, + "step": 67455 + }, + { + "epoch": 1.73, + "learning_rate": 8.02739055835516e-07, + "loss": 0.4695, + "step": 67456 + }, + { + "epoch": 1.73, + "learning_rate": 8.027119291533706e-07, + "loss": 0.5449, + "step": 67457 + }, + { + "epoch": 1.73, + "learning_rate": 8.026848026222792e-07, + "loss": 0.7236, + "step": 67458 + }, + { + "epoch": 1.73, + "learning_rate": 8.026576762422632e-07, + "loss": 0.4275, + "step": 67459 + }, + { + "epoch": 1.73, + "learning_rate": 8.02630550013343e-07, + "loss": 0.5635, + "step": 67460 + }, + { + "epoch": 1.73, + "learning_rate": 8.026034239355399e-07, + "loss": 0.6182, + "step": 67461 + }, + { + "epoch": 1.73, + "learning_rate": 8.025762980088742e-07, + "loss": 0.5767, + "step": 67462 + }, + { + "epoch": 1.73, + "learning_rate": 8.025491722333664e-07, + "loss": 0.686, + "step": 67463 + }, + { + "epoch": 1.73, + "learning_rate": 8.025220466090378e-07, + "loss": 0.7314, + "step": 67464 + }, + { + "epoch": 1.73, + "learning_rate": 8.024949211359089e-07, + "loss": 0.5415, + "step": 67465 + }, + { + "epoch": 1.73, + "learning_rate": 8.024677958140007e-07, + "loss": 0.5811, + "step": 67466 + }, + { + "epoch": 1.73, + "learning_rate": 8.024406706433338e-07, + "loss": 0.6416, + "step": 67467 + }, + { + "epoch": 1.73, + "learning_rate": 8.024135456239289e-07, + "loss": 0.6714, + "step": 67468 + }, + { + "epoch": 1.73, + "learning_rate": 8.023864207558069e-07, + "loss": 0.4604, + "step": 67469 + }, + { + "epoch": 1.73, + "learning_rate": 8.023592960389884e-07, + "loss": 0.7656, + "step": 67470 + }, + { + "epoch": 1.73, + "learning_rate": 8.023321714734948e-07, + "loss": 0.542, + "step": 67471 + }, + { + "epoch": 1.73, + "learning_rate": 8.02305047059346e-07, + "loss": 0.7188, + "step": 67472 + }, + { + "epoch": 1.73, + "learning_rate": 8.02277922796563e-07, + "loss": 0.5049, + "step": 67473 + }, + { + "epoch": 1.73, + "learning_rate": 8.022507986851669e-07, + "loss": 0.562, + "step": 67474 + }, + { + "epoch": 1.73, + "learning_rate": 8.022236747251781e-07, + "loss": 0.7773, + "step": 67475 + }, + { + "epoch": 1.73, + "learning_rate": 8.021965509166178e-07, + "loss": 0.5591, + "step": 67476 + }, + { + "epoch": 1.73, + "learning_rate": 8.021694272595061e-07, + "loss": 0.7456, + "step": 67477 + }, + { + "epoch": 1.73, + "learning_rate": 8.021423037538646e-07, + "loss": 0.5835, + "step": 67478 + }, + { + "epoch": 1.73, + "learning_rate": 8.021151803997133e-07, + "loss": 0.4683, + "step": 67479 + }, + { + "epoch": 1.73, + "learning_rate": 8.020880571970735e-07, + "loss": 0.4727, + "step": 67480 + }, + { + "epoch": 1.73, + "learning_rate": 8.020609341459661e-07, + "loss": 0.5549, + "step": 67481 + }, + { + "epoch": 1.73, + "learning_rate": 8.02033811246411e-07, + "loss": 0.5894, + "step": 67482 + }, + { + "epoch": 1.73, + "learning_rate": 8.020066884984298e-07, + "loss": 0.6357, + "step": 67483 + }, + { + "epoch": 1.73, + "learning_rate": 8.01979565902043e-07, + "loss": 0.4526, + "step": 67484 + }, + { + "epoch": 1.73, + "learning_rate": 8.019524434572711e-07, + "loss": 0.7129, + "step": 67485 + }, + { + "epoch": 1.73, + "learning_rate": 8.019253211641352e-07, + "loss": 0.7285, + "step": 67486 + }, + { + "epoch": 1.73, + "learning_rate": 8.018981990226558e-07, + "loss": 0.4316, + "step": 67487 + }, + { + "epoch": 1.73, + "learning_rate": 8.018710770328543e-07, + "loss": 0.7773, + "step": 67488 + }, + { + "epoch": 1.73, + "learning_rate": 8.018439551947505e-07, + "loss": 0.6846, + "step": 67489 + }, + { + "epoch": 1.73, + "learning_rate": 8.018168335083661e-07, + "loss": 0.6416, + "step": 67490 + }, + { + "epoch": 1.73, + "learning_rate": 8.017897119737215e-07, + "loss": 0.5835, + "step": 67491 + }, + { + "epoch": 1.73, + "learning_rate": 8.01762590590837e-07, + "loss": 0.7207, + "step": 67492 + }, + { + "epoch": 1.73, + "learning_rate": 8.01735469359734e-07, + "loss": 0.748, + "step": 67493 + }, + { + "epoch": 1.73, + "learning_rate": 8.017083482804329e-07, + "loss": 0.5449, + "step": 67494 + }, + { + "epoch": 1.73, + "learning_rate": 8.016812273529548e-07, + "loss": 0.6038, + "step": 67495 + }, + { + "epoch": 1.73, + "learning_rate": 8.016541065773199e-07, + "loss": 0.6987, + "step": 67496 + }, + { + "epoch": 1.73, + "learning_rate": 8.016269859535496e-07, + "loss": 0.7598, + "step": 67497 + }, + { + "epoch": 1.73, + "learning_rate": 8.015998654816642e-07, + "loss": 0.6709, + "step": 67498 + }, + { + "epoch": 1.73, + "learning_rate": 8.015727451616849e-07, + "loss": 0.6611, + "step": 67499 + }, + { + "epoch": 1.73, + "learning_rate": 8.01545624993632e-07, + "loss": 0.5483, + "step": 67500 + }, + { + "epoch": 1.73, + "learning_rate": 8.015185049775271e-07, + "loss": 0.6421, + "step": 67501 + }, + { + "epoch": 1.73, + "learning_rate": 8.014913851133897e-07, + "loss": 0.6069, + "step": 67502 + }, + { + "epoch": 1.73, + "learning_rate": 8.014642654012416e-07, + "loss": 0.708, + "step": 67503 + }, + { + "epoch": 1.73, + "learning_rate": 8.014371458411029e-07, + "loss": 0.5278, + "step": 67504 + }, + { + "epoch": 1.73, + "learning_rate": 8.014100264329947e-07, + "loss": 0.6445, + "step": 67505 + }, + { + "epoch": 1.73, + "learning_rate": 8.013829071769377e-07, + "loss": 0.7119, + "step": 67506 + }, + { + "epoch": 1.73, + "learning_rate": 8.013557880729528e-07, + "loss": 0.6279, + "step": 67507 + }, + { + "epoch": 1.73, + "learning_rate": 8.013286691210604e-07, + "loss": 0.606, + "step": 67508 + }, + { + "epoch": 1.73, + "learning_rate": 8.013015503212817e-07, + "loss": 0.792, + "step": 67509 + }, + { + "epoch": 1.73, + "learning_rate": 8.012744316736371e-07, + "loss": 0.5869, + "step": 67510 + }, + { + "epoch": 1.73, + "learning_rate": 8.01247313178148e-07, + "loss": 0.7354, + "step": 67511 + }, + { + "epoch": 1.73, + "learning_rate": 8.012201948348343e-07, + "loss": 0.3353, + "step": 67512 + }, + { + "epoch": 1.73, + "learning_rate": 8.011930766437171e-07, + "loss": 0.5918, + "step": 67513 + }, + { + "epoch": 1.73, + "learning_rate": 8.011659586048174e-07, + "loss": 0.5688, + "step": 67514 + }, + { + "epoch": 1.73, + "learning_rate": 8.011388407181556e-07, + "loss": 0.6455, + "step": 67515 + }, + { + "epoch": 1.73, + "learning_rate": 8.011117229837529e-07, + "loss": 0.5164, + "step": 67516 + }, + { + "epoch": 1.73, + "learning_rate": 8.010846054016295e-07, + "loss": 0.6621, + "step": 67517 + }, + { + "epoch": 1.73, + "learning_rate": 8.010574879718067e-07, + "loss": 0.6221, + "step": 67518 + }, + { + "epoch": 1.73, + "learning_rate": 8.01030370694305e-07, + "loss": 0.5723, + "step": 67519 + }, + { + "epoch": 1.73, + "learning_rate": 8.010032535691451e-07, + "loss": 0.6338, + "step": 67520 + }, + { + "epoch": 1.73, + "learning_rate": 8.009761365963482e-07, + "loss": 0.6167, + "step": 67521 + }, + { + "epoch": 1.73, + "learning_rate": 8.009490197759346e-07, + "loss": 0.7109, + "step": 67522 + }, + { + "epoch": 1.73, + "learning_rate": 8.009219031079249e-07, + "loss": 0.5815, + "step": 67523 + }, + { + "epoch": 1.73, + "learning_rate": 8.008947865923404e-07, + "loss": 0.6147, + "step": 67524 + }, + { + "epoch": 1.73, + "learning_rate": 8.008676702292013e-07, + "loss": 0.5303, + "step": 67525 + }, + { + "epoch": 1.73, + "learning_rate": 8.008405540185288e-07, + "loss": 0.7676, + "step": 67526 + }, + { + "epoch": 1.73, + "learning_rate": 8.008134379603435e-07, + "loss": 0.6509, + "step": 67527 + }, + { + "epoch": 1.73, + "learning_rate": 8.007863220546663e-07, + "loss": 0.6758, + "step": 67528 + }, + { + "epoch": 1.73, + "learning_rate": 8.007592063015177e-07, + "loss": 0.4158, + "step": 67529 + }, + { + "epoch": 1.73, + "learning_rate": 8.007320907009189e-07, + "loss": 0.6396, + "step": 67530 + }, + { + "epoch": 1.73, + "learning_rate": 8.007049752528905e-07, + "loss": 0.6245, + "step": 67531 + }, + { + "epoch": 1.73, + "learning_rate": 8.006778599574526e-07, + "loss": 0.6536, + "step": 67532 + }, + { + "epoch": 1.73, + "learning_rate": 8.006507448146269e-07, + "loss": 0.7998, + "step": 67533 + }, + { + "epoch": 1.73, + "learning_rate": 8.006236298244334e-07, + "loss": 0.687, + "step": 67534 + }, + { + "epoch": 1.73, + "learning_rate": 8.005965149868935e-07, + "loss": 0.6875, + "step": 67535 + }, + { + "epoch": 1.73, + "learning_rate": 8.005694003020276e-07, + "loss": 0.6787, + "step": 67536 + }, + { + "epoch": 1.73, + "learning_rate": 8.005422857698565e-07, + "loss": 0.7549, + "step": 67537 + }, + { + "epoch": 1.73, + "learning_rate": 8.00515171390401e-07, + "loss": 0.6606, + "step": 67538 + }, + { + "epoch": 1.73, + "learning_rate": 8.004880571636819e-07, + "loss": 0.5142, + "step": 67539 + }, + { + "epoch": 1.73, + "learning_rate": 8.0046094308972e-07, + "loss": 0.627, + "step": 67540 + }, + { + "epoch": 1.73, + "learning_rate": 8.004338291685362e-07, + "loss": 0.7715, + "step": 67541 + }, + { + "epoch": 1.73, + "learning_rate": 8.004067154001505e-07, + "loss": 0.7861, + "step": 67542 + }, + { + "epoch": 1.73, + "learning_rate": 8.003796017845847e-07, + "loss": 0.4829, + "step": 67543 + }, + { + "epoch": 1.73, + "learning_rate": 8.003524883218587e-07, + "loss": 0.5298, + "step": 67544 + }, + { + "epoch": 1.73, + "learning_rate": 8.003253750119938e-07, + "loss": 0.564, + "step": 67545 + }, + { + "epoch": 1.73, + "learning_rate": 8.002982618550103e-07, + "loss": 0.7021, + "step": 67546 + }, + { + "epoch": 1.73, + "learning_rate": 8.002711488509296e-07, + "loss": 0.6533, + "step": 67547 + }, + { + "epoch": 1.73, + "learning_rate": 8.002440359997718e-07, + "loss": 0.5146, + "step": 67548 + }, + { + "epoch": 1.73, + "learning_rate": 8.002169233015581e-07, + "loss": 0.5996, + "step": 67549 + }, + { + "epoch": 1.73, + "learning_rate": 8.00189810756309e-07, + "loss": 0.7646, + "step": 67550 + }, + { + "epoch": 1.73, + "learning_rate": 8.001626983640458e-07, + "loss": 0.7207, + "step": 67551 + }, + { + "epoch": 1.73, + "learning_rate": 8.001355861247886e-07, + "loss": 0.6064, + "step": 67552 + }, + { + "epoch": 1.73, + "learning_rate": 8.001084740385582e-07, + "loss": 0.6885, + "step": 67553 + }, + { + "epoch": 1.73, + "learning_rate": 8.000813621053757e-07, + "loss": 0.6357, + "step": 67554 + }, + { + "epoch": 1.73, + "learning_rate": 8.000542503252616e-07, + "loss": 0.7012, + "step": 67555 + }, + { + "epoch": 1.73, + "learning_rate": 8.000271386982369e-07, + "loss": 0.6089, + "step": 67556 + }, + { + "epoch": 1.73, + "learning_rate": 8.000000272243222e-07, + "loss": 0.6572, + "step": 67557 + }, + { + "epoch": 1.73, + "learning_rate": 7.999729159035381e-07, + "loss": 0.6414, + "step": 67558 + }, + { + "epoch": 1.73, + "learning_rate": 7.999458047359058e-07, + "loss": 0.5249, + "step": 67559 + }, + { + "epoch": 1.73, + "learning_rate": 7.999186937214456e-07, + "loss": 0.6426, + "step": 67560 + }, + { + "epoch": 1.73, + "learning_rate": 7.998915828601788e-07, + "loss": 0.5781, + "step": 67561 + }, + { + "epoch": 1.73, + "learning_rate": 7.998644721521256e-07, + "loss": 0.665, + "step": 67562 + }, + { + "epoch": 1.73, + "learning_rate": 7.998373615973068e-07, + "loss": 0.554, + "step": 67563 + }, + { + "epoch": 1.73, + "learning_rate": 7.998102511957437e-07, + "loss": 0.4762, + "step": 67564 + }, + { + "epoch": 1.73, + "learning_rate": 7.997831409474561e-07, + "loss": 0.6538, + "step": 67565 + }, + { + "epoch": 1.73, + "learning_rate": 7.997560308524658e-07, + "loss": 0.5576, + "step": 67566 + }, + { + "epoch": 1.73, + "learning_rate": 7.99728920910793e-07, + "loss": 0.5884, + "step": 67567 + }, + { + "epoch": 1.73, + "learning_rate": 7.997018111224585e-07, + "loss": 0.6821, + "step": 67568 + }, + { + "epoch": 1.73, + "learning_rate": 7.996747014874831e-07, + "loss": 0.4702, + "step": 67569 + }, + { + "epoch": 1.73, + "learning_rate": 7.996475920058876e-07, + "loss": 0.5903, + "step": 67570 + }, + { + "epoch": 1.73, + "learning_rate": 7.996204826776931e-07, + "loss": 0.4473, + "step": 67571 + }, + { + "epoch": 1.73, + "learning_rate": 7.995933735029195e-07, + "loss": 0.6333, + "step": 67572 + }, + { + "epoch": 1.73, + "learning_rate": 7.995662644815883e-07, + "loss": 0.5273, + "step": 67573 + }, + { + "epoch": 1.73, + "learning_rate": 7.995391556137199e-07, + "loss": 0.8408, + "step": 67574 + }, + { + "epoch": 1.73, + "learning_rate": 7.995120468993349e-07, + "loss": 0.5513, + "step": 67575 + }, + { + "epoch": 1.73, + "learning_rate": 7.994849383384547e-07, + "loss": 0.8018, + "step": 67576 + }, + { + "epoch": 1.73, + "learning_rate": 7.994578299310993e-07, + "loss": 0.6494, + "step": 67577 + }, + { + "epoch": 1.73, + "learning_rate": 7.994307216772901e-07, + "loss": 0.7251, + "step": 67578 + }, + { + "epoch": 1.73, + "learning_rate": 7.994036135770473e-07, + "loss": 0.6807, + "step": 67579 + }, + { + "epoch": 1.73, + "learning_rate": 7.993765056303922e-07, + "loss": 0.7046, + "step": 67580 + }, + { + "epoch": 1.73, + "learning_rate": 7.993493978373456e-07, + "loss": 0.5537, + "step": 67581 + }, + { + "epoch": 1.73, + "learning_rate": 7.993222901979273e-07, + "loss": 0.4634, + "step": 67582 + }, + { + "epoch": 1.73, + "learning_rate": 7.992951827121591e-07, + "loss": 0.666, + "step": 67583 + }, + { + "epoch": 1.73, + "learning_rate": 7.992680753800609e-07, + "loss": 0.6602, + "step": 67584 + }, + { + "epoch": 1.73, + "learning_rate": 7.992409682016544e-07, + "loss": 0.6543, + "step": 67585 + }, + { + "epoch": 1.73, + "learning_rate": 7.992138611769595e-07, + "loss": 0.6309, + "step": 67586 + }, + { + "epoch": 1.73, + "learning_rate": 7.991867543059975e-07, + "loss": 0.7441, + "step": 67587 + }, + { + "epoch": 1.73, + "learning_rate": 7.991596475887888e-07, + "loss": 0.7139, + "step": 67588 + }, + { + "epoch": 1.73, + "learning_rate": 7.991325410253545e-07, + "loss": 0.6343, + "step": 67589 + }, + { + "epoch": 1.73, + "learning_rate": 7.99105434615715e-07, + "loss": 0.5298, + "step": 67590 + }, + { + "epoch": 1.73, + "learning_rate": 7.990783283598916e-07, + "loss": 0.4927, + "step": 67591 + }, + { + "epoch": 1.73, + "learning_rate": 7.990512222579046e-07, + "loss": 0.7363, + "step": 67592 + }, + { + "epoch": 1.73, + "learning_rate": 7.990241163097747e-07, + "loss": 0.6017, + "step": 67593 + }, + { + "epoch": 1.73, + "learning_rate": 7.989970105155227e-07, + "loss": 0.6602, + "step": 67594 + }, + { + "epoch": 1.73, + "learning_rate": 7.989699048751696e-07, + "loss": 0.5469, + "step": 67595 + }, + { + "epoch": 1.73, + "learning_rate": 7.989427993887357e-07, + "loss": 0.5591, + "step": 67596 + }, + { + "epoch": 1.73, + "learning_rate": 7.989156940562425e-07, + "loss": 0.707, + "step": 67597 + }, + { + "epoch": 1.73, + "learning_rate": 7.988885888777099e-07, + "loss": 0.604, + "step": 67598 + }, + { + "epoch": 1.73, + "learning_rate": 7.988614838531594e-07, + "loss": 0.5923, + "step": 67599 + }, + { + "epoch": 1.73, + "learning_rate": 7.988343789826111e-07, + "loss": 0.665, + "step": 67600 + }, + { + "epoch": 1.73, + "learning_rate": 7.988072742660864e-07, + "loss": 0.6543, + "step": 67601 + }, + { + "epoch": 1.73, + "learning_rate": 7.987801697036056e-07, + "loss": 0.6084, + "step": 67602 + }, + { + "epoch": 1.73, + "learning_rate": 7.987530652951895e-07, + "loss": 0.8154, + "step": 67603 + }, + { + "epoch": 1.73, + "learning_rate": 7.98725961040859e-07, + "loss": 0.6318, + "step": 67604 + }, + { + "epoch": 1.73, + "learning_rate": 7.986988569406346e-07, + "loss": 0.7764, + "step": 67605 + }, + { + "epoch": 1.73, + "learning_rate": 7.986717529945374e-07, + "loss": 0.5825, + "step": 67606 + }, + { + "epoch": 1.73, + "learning_rate": 7.986446492025878e-07, + "loss": 0.5791, + "step": 67607 + }, + { + "epoch": 1.73, + "learning_rate": 7.986175455648068e-07, + "loss": 0.6134, + "step": 67608 + }, + { + "epoch": 1.73, + "learning_rate": 7.98590442081215e-07, + "loss": 0.7637, + "step": 67609 + }, + { + "epoch": 1.73, + "learning_rate": 7.985633387518336e-07, + "loss": 0.7388, + "step": 67610 + }, + { + "epoch": 1.73, + "learning_rate": 7.98536235576683e-07, + "loss": 0.6099, + "step": 67611 + }, + { + "epoch": 1.73, + "learning_rate": 7.985091325557838e-07, + "loss": 0.5703, + "step": 67612 + }, + { + "epoch": 1.73, + "learning_rate": 7.984820296891567e-07, + "loss": 0.6006, + "step": 67613 + }, + { + "epoch": 1.73, + "learning_rate": 7.984549269768228e-07, + "loss": 0.6484, + "step": 67614 + }, + { + "epoch": 1.73, + "learning_rate": 7.984278244188025e-07, + "loss": 0.6328, + "step": 67615 + }, + { + "epoch": 1.73, + "learning_rate": 7.98400722015117e-07, + "loss": 0.5173, + "step": 67616 + }, + { + "epoch": 1.73, + "learning_rate": 7.983736197657866e-07, + "loss": 0.6592, + "step": 67617 + }, + { + "epoch": 1.73, + "learning_rate": 7.983465176708324e-07, + "loss": 0.7324, + "step": 67618 + }, + { + "epoch": 1.73, + "learning_rate": 7.983194157302747e-07, + "loss": 0.7178, + "step": 67619 + }, + { + "epoch": 1.73, + "learning_rate": 7.982923139441349e-07, + "loss": 0.5845, + "step": 67620 + }, + { + "epoch": 1.73, + "learning_rate": 7.982652123124336e-07, + "loss": 0.5518, + "step": 67621 + }, + { + "epoch": 1.73, + "learning_rate": 7.982381108351909e-07, + "loss": 0.6587, + "step": 67622 + }, + { + "epoch": 1.73, + "learning_rate": 7.982110095124282e-07, + "loss": 0.7666, + "step": 67623 + }, + { + "epoch": 1.73, + "learning_rate": 7.981839083441659e-07, + "loss": 0.502, + "step": 67624 + }, + { + "epoch": 1.73, + "learning_rate": 7.98156807330425e-07, + "loss": 0.6592, + "step": 67625 + }, + { + "epoch": 1.73, + "learning_rate": 7.98129706471226e-07, + "loss": 0.6431, + "step": 67626 + }, + { + "epoch": 1.73, + "learning_rate": 7.981026057665901e-07, + "loss": 0.6602, + "step": 67627 + }, + { + "epoch": 1.73, + "learning_rate": 7.980755052165374e-07, + "loss": 0.8125, + "step": 67628 + }, + { + "epoch": 1.73, + "learning_rate": 7.980484048210892e-07, + "loss": 0.5322, + "step": 67629 + }, + { + "epoch": 1.73, + "learning_rate": 7.980213045802662e-07, + "loss": 0.5957, + "step": 67630 + }, + { + "epoch": 1.73, + "learning_rate": 7.979942044940892e-07, + "loss": 0.6348, + "step": 67631 + }, + { + "epoch": 1.73, + "learning_rate": 7.979671045625782e-07, + "loss": 0.5986, + "step": 67632 + }, + { + "epoch": 1.73, + "learning_rate": 7.979400047857547e-07, + "loss": 0.6719, + "step": 67633 + }, + { + "epoch": 1.73, + "learning_rate": 7.979129051636392e-07, + "loss": 0.4277, + "step": 67634 + }, + { + "epoch": 1.73, + "learning_rate": 7.978858056962526e-07, + "loss": 0.5127, + "step": 67635 + }, + { + "epoch": 1.73, + "learning_rate": 7.978587063836153e-07, + "loss": 0.562, + "step": 67636 + }, + { + "epoch": 1.73, + "learning_rate": 7.978316072257486e-07, + "loss": 0.8027, + "step": 67637 + }, + { + "epoch": 1.73, + "learning_rate": 7.978045082226727e-07, + "loss": 0.6255, + "step": 67638 + }, + { + "epoch": 1.73, + "learning_rate": 7.977774093744087e-07, + "loss": 0.7217, + "step": 67639 + }, + { + "epoch": 1.73, + "learning_rate": 7.977503106809772e-07, + "loss": 0.4811, + "step": 67640 + }, + { + "epoch": 1.73, + "learning_rate": 7.977232121423994e-07, + "loss": 0.252, + "step": 67641 + }, + { + "epoch": 1.73, + "learning_rate": 7.976961137586952e-07, + "loss": 0.5956, + "step": 67642 + }, + { + "epoch": 1.73, + "learning_rate": 7.976690155298858e-07, + "loss": 0.7139, + "step": 67643 + }, + { + "epoch": 1.73, + "learning_rate": 7.97641917455992e-07, + "loss": 0.6357, + "step": 67644 + }, + { + "epoch": 1.73, + "learning_rate": 7.976148195370344e-07, + "loss": 0.6562, + "step": 67645 + }, + { + "epoch": 1.73, + "learning_rate": 7.975877217730341e-07, + "loss": 0.7168, + "step": 67646 + }, + { + "epoch": 1.73, + "learning_rate": 7.975606241640114e-07, + "loss": 0.6157, + "step": 67647 + }, + { + "epoch": 1.73, + "learning_rate": 7.97533526709987e-07, + "loss": 0.7598, + "step": 67648 + }, + { + "epoch": 1.73, + "learning_rate": 7.975064294109821e-07, + "loss": 0.5596, + "step": 67649 + }, + { + "epoch": 1.73, + "learning_rate": 7.974793322670171e-07, + "loss": 0.6992, + "step": 67650 + }, + { + "epoch": 1.73, + "learning_rate": 7.974522352781133e-07, + "loss": 0.6758, + "step": 67651 + }, + { + "epoch": 1.73, + "learning_rate": 7.974251384442906e-07, + "loss": 0.675, + "step": 67652 + }, + { + "epoch": 1.73, + "learning_rate": 7.973980417655702e-07, + "loss": 0.5532, + "step": 67653 + }, + { + "epoch": 1.73, + "learning_rate": 7.973709452419728e-07, + "loss": 0.623, + "step": 67654 + }, + { + "epoch": 1.73, + "learning_rate": 7.97343848873519e-07, + "loss": 0.7275, + "step": 67655 + }, + { + "epoch": 1.73, + "learning_rate": 7.973167526602299e-07, + "loss": 0.7549, + "step": 67656 + }, + { + "epoch": 1.73, + "learning_rate": 7.972896566021259e-07, + "loss": 0.4897, + "step": 67657 + }, + { + "epoch": 1.73, + "learning_rate": 7.97262560699228e-07, + "loss": 0.6299, + "step": 67658 + }, + { + "epoch": 1.73, + "learning_rate": 7.972354649515567e-07, + "loss": 0.4449, + "step": 67659 + }, + { + "epoch": 1.73, + "learning_rate": 7.972083693591331e-07, + "loss": 0.5293, + "step": 67660 + }, + { + "epoch": 1.73, + "learning_rate": 7.971812739219779e-07, + "loss": 0.6719, + "step": 67661 + }, + { + "epoch": 1.73, + "learning_rate": 7.971541786401112e-07, + "loss": 0.71, + "step": 67662 + }, + { + "epoch": 1.73, + "learning_rate": 7.971270835135546e-07, + "loss": 0.7344, + "step": 67663 + }, + { + "epoch": 1.73, + "learning_rate": 7.970999885423284e-07, + "loss": 0.4392, + "step": 67664 + }, + { + "epoch": 1.73, + "learning_rate": 7.970728937264531e-07, + "loss": 0.6655, + "step": 67665 + }, + { + "epoch": 1.73, + "learning_rate": 7.9704579906595e-07, + "loss": 0.4204, + "step": 67666 + }, + { + "epoch": 1.73, + "learning_rate": 7.970187045608394e-07, + "loss": 0.665, + "step": 67667 + }, + { + "epoch": 1.73, + "learning_rate": 7.969916102111425e-07, + "loss": 0.6924, + "step": 67668 + }, + { + "epoch": 1.73, + "learning_rate": 7.969645160168795e-07, + "loss": 0.8125, + "step": 67669 + }, + { + "epoch": 1.73, + "learning_rate": 7.969374219780718e-07, + "loss": 0.5566, + "step": 67670 + }, + { + "epoch": 1.73, + "learning_rate": 7.969103280947398e-07, + "loss": 0.6963, + "step": 67671 + }, + { + "epoch": 1.73, + "learning_rate": 7.96883234366904e-07, + "loss": 0.4714, + "step": 67672 + }, + { + "epoch": 1.73, + "learning_rate": 7.968561407945854e-07, + "loss": 0.6084, + "step": 67673 + }, + { + "epoch": 1.73, + "learning_rate": 7.968290473778045e-07, + "loss": 0.6755, + "step": 67674 + }, + { + "epoch": 1.73, + "learning_rate": 7.968019541165826e-07, + "loss": 0.8301, + "step": 67675 + }, + { + "epoch": 1.73, + "learning_rate": 7.967748610109399e-07, + "loss": 0.7207, + "step": 67676 + }, + { + "epoch": 1.73, + "learning_rate": 7.967477680608974e-07, + "loss": 0.519, + "step": 67677 + }, + { + "epoch": 1.73, + "learning_rate": 7.967206752664757e-07, + "loss": 0.5576, + "step": 67678 + }, + { + "epoch": 1.73, + "learning_rate": 7.966935826276957e-07, + "loss": 0.6885, + "step": 67679 + }, + { + "epoch": 1.73, + "learning_rate": 7.966664901445784e-07, + "loss": 0.6592, + "step": 67680 + }, + { + "epoch": 1.73, + "learning_rate": 7.966393978171438e-07, + "loss": 0.583, + "step": 67681 + }, + { + "epoch": 1.73, + "learning_rate": 7.966123056454133e-07, + "loss": 0.7627, + "step": 67682 + }, + { + "epoch": 1.73, + "learning_rate": 7.965852136294074e-07, + "loss": 0.5996, + "step": 67683 + }, + { + "epoch": 1.73, + "learning_rate": 7.965581217691465e-07, + "loss": 0.6785, + "step": 67684 + }, + { + "epoch": 1.73, + "learning_rate": 7.96531030064652e-07, + "loss": 0.6045, + "step": 67685 + }, + { + "epoch": 1.73, + "learning_rate": 7.965039385159441e-07, + "loss": 0.5142, + "step": 67686 + }, + { + "epoch": 1.73, + "learning_rate": 7.964768471230441e-07, + "loss": 0.5967, + "step": 67687 + }, + { + "epoch": 1.73, + "learning_rate": 7.964497558859721e-07, + "loss": 0.6279, + "step": 67688 + }, + { + "epoch": 1.73, + "learning_rate": 7.964226648047494e-07, + "loss": 0.7417, + "step": 67689 + }, + { + "epoch": 1.73, + "learning_rate": 7.963955738793967e-07, + "loss": 0.7451, + "step": 67690 + }, + { + "epoch": 1.73, + "learning_rate": 7.963684831099341e-07, + "loss": 0.5527, + "step": 67691 + }, + { + "epoch": 1.73, + "learning_rate": 7.963413924963831e-07, + "loss": 0.7861, + "step": 67692 + }, + { + "epoch": 1.74, + "learning_rate": 7.963143020387638e-07, + "loss": 0.6802, + "step": 67693 + }, + { + "epoch": 1.74, + "learning_rate": 7.962872117370976e-07, + "loss": 0.4609, + "step": 67694 + }, + { + "epoch": 1.74, + "learning_rate": 7.962601215914046e-07, + "loss": 0.8662, + "step": 67695 + }, + { + "epoch": 1.74, + "learning_rate": 7.962330316017061e-07, + "loss": 0.7295, + "step": 67696 + }, + { + "epoch": 1.74, + "learning_rate": 7.962059417680224e-07, + "loss": 0.6099, + "step": 67697 + }, + { + "epoch": 1.74, + "learning_rate": 7.961788520903746e-07, + "loss": 0.415, + "step": 67698 + }, + { + "epoch": 1.74, + "learning_rate": 7.961517625687832e-07, + "loss": 0.6934, + "step": 67699 + }, + { + "epoch": 1.74, + "learning_rate": 7.961246732032696e-07, + "loss": 0.7012, + "step": 67700 + }, + { + "epoch": 1.74, + "learning_rate": 7.960975839938533e-07, + "loss": 0.7109, + "step": 67701 + }, + { + "epoch": 1.74, + "learning_rate": 7.960704949405559e-07, + "loss": 0.6567, + "step": 67702 + }, + { + "epoch": 1.74, + "learning_rate": 7.960434060433977e-07, + "loss": 0.6465, + "step": 67703 + }, + { + "epoch": 1.74, + "learning_rate": 7.960163173024e-07, + "loss": 0.6138, + "step": 67704 + }, + { + "epoch": 1.74, + "learning_rate": 7.959892287175829e-07, + "loss": 0.8516, + "step": 67705 + }, + { + "epoch": 1.74, + "learning_rate": 7.959621402889678e-07, + "loss": 0.6182, + "step": 67706 + }, + { + "epoch": 1.74, + "learning_rate": 7.959350520165748e-07, + "loss": 0.5649, + "step": 67707 + }, + { + "epoch": 1.74, + "learning_rate": 7.959079639004252e-07, + "loss": 0.6602, + "step": 67708 + }, + { + "epoch": 1.74, + "learning_rate": 7.958808759405393e-07, + "loss": 0.6323, + "step": 67709 + }, + { + "epoch": 1.74, + "learning_rate": 7.958537881369385e-07, + "loss": 0.4602, + "step": 67710 + }, + { + "epoch": 1.74, + "learning_rate": 7.958267004896427e-07, + "loss": 0.7002, + "step": 67711 + }, + { + "epoch": 1.74, + "learning_rate": 7.957996129986728e-07, + "loss": 0.5657, + "step": 67712 + }, + { + "epoch": 1.74, + "learning_rate": 7.957725256640502e-07, + "loss": 0.6895, + "step": 67713 + }, + { + "epoch": 1.74, + "learning_rate": 7.957454384857947e-07, + "loss": 0.5066, + "step": 67714 + }, + { + "epoch": 1.74, + "learning_rate": 7.957183514639278e-07, + "loss": 0.537, + "step": 67715 + }, + { + "epoch": 1.74, + "learning_rate": 7.956912645984699e-07, + "loss": 0.6533, + "step": 67716 + }, + { + "epoch": 1.74, + "learning_rate": 7.956641778894419e-07, + "loss": 0.71, + "step": 67717 + }, + { + "epoch": 1.74, + "learning_rate": 7.956370913368642e-07, + "loss": 0.4661, + "step": 67718 + }, + { + "epoch": 1.74, + "learning_rate": 7.956100049407581e-07, + "loss": 0.5464, + "step": 67719 + }, + { + "epoch": 1.74, + "learning_rate": 7.955829187011442e-07, + "loss": 0.7129, + "step": 67720 + }, + { + "epoch": 1.74, + "learning_rate": 7.955558326180428e-07, + "loss": 0.634, + "step": 67721 + }, + { + "epoch": 1.74, + "learning_rate": 7.955287466914747e-07, + "loss": 0.7236, + "step": 67722 + }, + { + "epoch": 1.74, + "learning_rate": 7.955016609214611e-07, + "loss": 0.623, + "step": 67723 + }, + { + "epoch": 1.74, + "learning_rate": 7.954745753080222e-07, + "loss": 0.533, + "step": 67724 + }, + { + "epoch": 1.74, + "learning_rate": 7.954474898511792e-07, + "loss": 0.6846, + "step": 67725 + }, + { + "epoch": 1.74, + "learning_rate": 7.954204045509525e-07, + "loss": 0.5844, + "step": 67726 + }, + { + "epoch": 1.74, + "learning_rate": 7.953933194073632e-07, + "loss": 0.6738, + "step": 67727 + }, + { + "epoch": 1.74, + "learning_rate": 7.953662344204316e-07, + "loss": 0.7104, + "step": 67728 + }, + { + "epoch": 1.74, + "learning_rate": 7.953391495901788e-07, + "loss": 0.7021, + "step": 67729 + }, + { + "epoch": 1.74, + "learning_rate": 7.953120649166259e-07, + "loss": 0.666, + "step": 67730 + }, + { + "epoch": 1.74, + "learning_rate": 7.952849803997924e-07, + "loss": 0.5464, + "step": 67731 + }, + { + "epoch": 1.74, + "learning_rate": 7.952578960397001e-07, + "loss": 0.6572, + "step": 67732 + }, + { + "epoch": 1.74, + "learning_rate": 7.952308118363692e-07, + "loss": 0.6895, + "step": 67733 + }, + { + "epoch": 1.74, + "learning_rate": 7.95203727789821e-07, + "loss": 0.6523, + "step": 67734 + }, + { + "epoch": 1.74, + "learning_rate": 7.951766439000754e-07, + "loss": 0.5728, + "step": 67735 + }, + { + "epoch": 1.74, + "learning_rate": 7.95149560167154e-07, + "loss": 0.447, + "step": 67736 + }, + { + "epoch": 1.74, + "learning_rate": 7.951224765910771e-07, + "loss": 0.7002, + "step": 67737 + }, + { + "epoch": 1.74, + "learning_rate": 7.950953931718654e-07, + "loss": 0.6855, + "step": 67738 + }, + { + "epoch": 1.74, + "learning_rate": 7.950683099095399e-07, + "loss": 0.752, + "step": 67739 + }, + { + "epoch": 1.74, + "learning_rate": 7.950412268041214e-07, + "loss": 0.5386, + "step": 67740 + }, + { + "epoch": 1.74, + "learning_rate": 7.9501414385563e-07, + "loss": 0.7178, + "step": 67741 + }, + { + "epoch": 1.74, + "learning_rate": 7.949870610640868e-07, + "loss": 0.5203, + "step": 67742 + }, + { + "epoch": 1.74, + "learning_rate": 7.949599784295127e-07, + "loss": 0.6475, + "step": 67743 + }, + { + "epoch": 1.74, + "learning_rate": 7.949328959519283e-07, + "loss": 0.5183, + "step": 67744 + }, + { + "epoch": 1.74, + "learning_rate": 7.949058136313543e-07, + "loss": 0.4617, + "step": 67745 + }, + { + "epoch": 1.74, + "learning_rate": 7.948787314678116e-07, + "loss": 0.4321, + "step": 67746 + }, + { + "epoch": 1.74, + "learning_rate": 7.948516494613207e-07, + "loss": 0.6135, + "step": 67747 + }, + { + "epoch": 1.74, + "learning_rate": 7.948245676119026e-07, + "loss": 0.8008, + "step": 67748 + }, + { + "epoch": 1.74, + "learning_rate": 7.947974859195777e-07, + "loss": 0.624, + "step": 67749 + }, + { + "epoch": 1.74, + "learning_rate": 7.947704043843674e-07, + "loss": 0.6335, + "step": 67750 + }, + { + "epoch": 1.74, + "learning_rate": 7.947433230062918e-07, + "loss": 0.627, + "step": 67751 + }, + { + "epoch": 1.74, + "learning_rate": 7.947162417853714e-07, + "loss": 0.6816, + "step": 67752 + }, + { + "epoch": 1.74, + "learning_rate": 7.946891607216278e-07, + "loss": 0.8389, + "step": 67753 + }, + { + "epoch": 1.74, + "learning_rate": 7.946620798150807e-07, + "loss": 0.6035, + "step": 67754 + }, + { + "epoch": 1.74, + "learning_rate": 7.94634999065752e-07, + "loss": 0.3752, + "step": 67755 + }, + { + "epoch": 1.74, + "learning_rate": 7.946079184736616e-07, + "loss": 0.6836, + "step": 67756 + }, + { + "epoch": 1.74, + "learning_rate": 7.945808380388302e-07, + "loss": 0.6772, + "step": 67757 + }, + { + "epoch": 1.74, + "learning_rate": 7.945537577612792e-07, + "loss": 0.5991, + "step": 67758 + }, + { + "epoch": 1.74, + "learning_rate": 7.945266776410287e-07, + "loss": 0.5872, + "step": 67759 + }, + { + "epoch": 1.74, + "learning_rate": 7.944995976781001e-07, + "loss": 0.5854, + "step": 67760 + }, + { + "epoch": 1.74, + "learning_rate": 7.944725178725134e-07, + "loss": 0.7236, + "step": 67761 + }, + { + "epoch": 1.74, + "learning_rate": 7.944454382242896e-07, + "loss": 0.4858, + "step": 67762 + }, + { + "epoch": 1.74, + "learning_rate": 7.944183587334495e-07, + "loss": 0.4695, + "step": 67763 + }, + { + "epoch": 1.74, + "learning_rate": 7.943912794000137e-07, + "loss": 0.6318, + "step": 67764 + }, + { + "epoch": 1.74, + "learning_rate": 7.943642002240032e-07, + "loss": 0.6895, + "step": 67765 + }, + { + "epoch": 1.74, + "learning_rate": 7.943371212054384e-07, + "loss": 0.6025, + "step": 67766 + }, + { + "epoch": 1.74, + "learning_rate": 7.943100423443404e-07, + "loss": 0.6846, + "step": 67767 + }, + { + "epoch": 1.74, + "learning_rate": 7.942829636407296e-07, + "loss": 0.6436, + "step": 67768 + }, + { + "epoch": 1.74, + "learning_rate": 7.94255885094627e-07, + "loss": 0.7148, + "step": 67769 + }, + { + "epoch": 1.74, + "learning_rate": 7.942288067060536e-07, + "loss": 0.6187, + "step": 67770 + }, + { + "epoch": 1.74, + "learning_rate": 7.942017284750291e-07, + "loss": 0.7285, + "step": 67771 + }, + { + "epoch": 1.74, + "learning_rate": 7.941746504015751e-07, + "loss": 0.6504, + "step": 67772 + }, + { + "epoch": 1.74, + "learning_rate": 7.941475724857122e-07, + "loss": 0.7549, + "step": 67773 + }, + { + "epoch": 1.74, + "learning_rate": 7.941204947274608e-07, + "loss": 0.573, + "step": 67774 + }, + { + "epoch": 1.74, + "learning_rate": 7.940934171268421e-07, + "loss": 0.8271, + "step": 67775 + }, + { + "epoch": 1.74, + "learning_rate": 7.940663396838764e-07, + "loss": 0.6255, + "step": 67776 + }, + { + "epoch": 1.74, + "learning_rate": 7.940392623985848e-07, + "loss": 0.3284, + "step": 67777 + }, + { + "epoch": 1.74, + "learning_rate": 7.940121852709875e-07, + "loss": 0.6875, + "step": 67778 + }, + { + "epoch": 1.74, + "learning_rate": 7.939851083011062e-07, + "loss": 0.6416, + "step": 67779 + }, + { + "epoch": 1.74, + "learning_rate": 7.939580314889609e-07, + "loss": 0.71, + "step": 67780 + }, + { + "epoch": 1.74, + "learning_rate": 7.939309548345722e-07, + "loss": 0.5747, + "step": 67781 + }, + { + "epoch": 1.74, + "learning_rate": 7.939038783379612e-07, + "loss": 0.6016, + "step": 67782 + }, + { + "epoch": 1.74, + "learning_rate": 7.938768019991484e-07, + "loss": 0.7734, + "step": 67783 + }, + { + "epoch": 1.74, + "learning_rate": 7.938497258181549e-07, + "loss": 0.6553, + "step": 67784 + }, + { + "epoch": 1.74, + "learning_rate": 7.938226497950009e-07, + "loss": 0.708, + "step": 67785 + }, + { + "epoch": 1.74, + "learning_rate": 7.937955739297077e-07, + "loss": 0.6504, + "step": 67786 + }, + { + "epoch": 1.74, + "learning_rate": 7.937684982222954e-07, + "loss": 0.6934, + "step": 67787 + }, + { + "epoch": 1.74, + "learning_rate": 7.937414226727854e-07, + "loss": 0.6406, + "step": 67788 + }, + { + "epoch": 1.74, + "learning_rate": 7.937143472811978e-07, + "loss": 0.3868, + "step": 67789 + }, + { + "epoch": 1.74, + "learning_rate": 7.936872720475545e-07, + "loss": 0.4309, + "step": 67790 + }, + { + "epoch": 1.74, + "learning_rate": 7.936601969718744e-07, + "loss": 0.5439, + "step": 67791 + }, + { + "epoch": 1.74, + "learning_rate": 7.936331220541796e-07, + "loss": 0.7354, + "step": 67792 + }, + { + "epoch": 1.74, + "learning_rate": 7.936060472944903e-07, + "loss": 0.604, + "step": 67793 + }, + { + "epoch": 1.74, + "learning_rate": 7.935789726928275e-07, + "loss": 0.6362, + "step": 67794 + }, + { + "epoch": 1.74, + "learning_rate": 7.935518982492115e-07, + "loss": 0.5615, + "step": 67795 + }, + { + "epoch": 1.74, + "learning_rate": 7.935248239636636e-07, + "loss": 0.6143, + "step": 67796 + }, + { + "epoch": 1.74, + "learning_rate": 7.934977498362039e-07, + "loss": 0.375, + "step": 67797 + }, + { + "epoch": 1.74, + "learning_rate": 7.934706758668539e-07, + "loss": 0.5376, + "step": 67798 + }, + { + "epoch": 1.74, + "learning_rate": 7.934436020556336e-07, + "loss": 0.5312, + "step": 67799 + }, + { + "epoch": 1.74, + "learning_rate": 7.934165284025645e-07, + "loss": 0.6016, + "step": 67800 + }, + { + "epoch": 1.74, + "learning_rate": 7.933894549076666e-07, + "loss": 0.6572, + "step": 67801 + }, + { + "epoch": 1.74, + "learning_rate": 7.933623815709607e-07, + "loss": 0.7334, + "step": 67802 + }, + { + "epoch": 1.74, + "learning_rate": 7.93335308392468e-07, + "loss": 0.5815, + "step": 67803 + }, + { + "epoch": 1.74, + "learning_rate": 7.933082353722086e-07, + "loss": 0.627, + "step": 67804 + }, + { + "epoch": 1.74, + "learning_rate": 7.932811625102038e-07, + "loss": 0.5542, + "step": 67805 + }, + { + "epoch": 1.74, + "learning_rate": 7.93254089806474e-07, + "loss": 0.5728, + "step": 67806 + }, + { + "epoch": 1.74, + "learning_rate": 7.932270172610403e-07, + "loss": 0.7939, + "step": 67807 + }, + { + "epoch": 1.74, + "learning_rate": 7.931999448739228e-07, + "loss": 0.6963, + "step": 67808 + }, + { + "epoch": 1.74, + "learning_rate": 7.931728726451429e-07, + "loss": 0.6226, + "step": 67809 + }, + { + "epoch": 1.74, + "learning_rate": 7.931458005747213e-07, + "loss": 0.5237, + "step": 67810 + }, + { + "epoch": 1.74, + "learning_rate": 7.931187286626781e-07, + "loss": 0.623, + "step": 67811 + }, + { + "epoch": 1.74, + "learning_rate": 7.930916569090342e-07, + "loss": 0.645, + "step": 67812 + }, + { + "epoch": 1.74, + "learning_rate": 7.930645853138107e-07, + "loss": 0.6294, + "step": 67813 + }, + { + "epoch": 1.74, + "learning_rate": 7.93037513877028e-07, + "loss": 0.6797, + "step": 67814 + }, + { + "epoch": 1.74, + "learning_rate": 7.930104425987071e-07, + "loss": 0.6572, + "step": 67815 + }, + { + "epoch": 1.74, + "learning_rate": 7.929833714788683e-07, + "loss": 0.606, + "step": 67816 + }, + { + "epoch": 1.74, + "learning_rate": 7.92956300517533e-07, + "loss": 0.4856, + "step": 67817 + }, + { + "epoch": 1.74, + "learning_rate": 7.929292297147212e-07, + "loss": 0.6177, + "step": 67818 + }, + { + "epoch": 1.74, + "learning_rate": 7.929021590704543e-07, + "loss": 0.5403, + "step": 67819 + }, + { + "epoch": 1.74, + "learning_rate": 7.928750885847527e-07, + "loss": 0.6963, + "step": 67820 + }, + { + "epoch": 1.74, + "learning_rate": 7.928480182576369e-07, + "loss": 0.8545, + "step": 67821 + }, + { + "epoch": 1.74, + "learning_rate": 7.928209480891279e-07, + "loss": 0.6768, + "step": 67822 + }, + { + "epoch": 1.74, + "learning_rate": 7.927938780792463e-07, + "loss": 0.5874, + "step": 67823 + }, + { + "epoch": 1.74, + "learning_rate": 7.92766808228013e-07, + "loss": 0.6172, + "step": 67824 + }, + { + "epoch": 1.74, + "learning_rate": 7.927397385354485e-07, + "loss": 0.7207, + "step": 67825 + }, + { + "epoch": 1.74, + "learning_rate": 7.927126690015738e-07, + "loss": 0.6353, + "step": 67826 + }, + { + "epoch": 1.74, + "learning_rate": 7.926855996264096e-07, + "loss": 0.468, + "step": 67827 + }, + { + "epoch": 1.74, + "learning_rate": 7.926585304099762e-07, + "loss": 0.7275, + "step": 67828 + }, + { + "epoch": 1.74, + "learning_rate": 7.926314613522949e-07, + "loss": 0.6802, + "step": 67829 + }, + { + "epoch": 1.74, + "learning_rate": 7.926043924533862e-07, + "loss": 0.6401, + "step": 67830 + }, + { + "epoch": 1.74, + "learning_rate": 7.925773237132705e-07, + "loss": 0.7842, + "step": 67831 + }, + { + "epoch": 1.74, + "learning_rate": 7.92550255131969e-07, + "loss": 0.7559, + "step": 67832 + }, + { + "epoch": 1.74, + "learning_rate": 7.92523186709502e-07, + "loss": 0.6484, + "step": 67833 + }, + { + "epoch": 1.74, + "learning_rate": 7.924961184458907e-07, + "loss": 0.6235, + "step": 67834 + }, + { + "epoch": 1.74, + "learning_rate": 7.924690503411553e-07, + "loss": 0.4771, + "step": 67835 + }, + { + "epoch": 1.74, + "learning_rate": 7.924419823953171e-07, + "loss": 0.8535, + "step": 67836 + }, + { + "epoch": 1.74, + "learning_rate": 7.924149146083963e-07, + "loss": 0.7539, + "step": 67837 + }, + { + "epoch": 1.74, + "learning_rate": 7.92387846980414e-07, + "loss": 0.4558, + "step": 67838 + }, + { + "epoch": 1.74, + "learning_rate": 7.923607795113907e-07, + "loss": 0.7139, + "step": 67839 + }, + { + "epoch": 1.74, + "learning_rate": 7.923337122013475e-07, + "loss": 0.6636, + "step": 67840 + }, + { + "epoch": 1.74, + "learning_rate": 7.923066450503046e-07, + "loss": 0.8125, + "step": 67841 + }, + { + "epoch": 1.74, + "learning_rate": 7.922795780582828e-07, + "loss": 0.625, + "step": 67842 + }, + { + "epoch": 1.74, + "learning_rate": 7.922525112253033e-07, + "loss": 0.8184, + "step": 67843 + }, + { + "epoch": 1.74, + "learning_rate": 7.92225444551386e-07, + "loss": 0.4097, + "step": 67844 + }, + { + "epoch": 1.74, + "learning_rate": 7.921983780365526e-07, + "loss": 0.668, + "step": 67845 + }, + { + "epoch": 1.74, + "learning_rate": 7.921713116808233e-07, + "loss": 0.6499, + "step": 67846 + }, + { + "epoch": 1.74, + "learning_rate": 7.921442454842187e-07, + "loss": 0.6836, + "step": 67847 + }, + { + "epoch": 1.74, + "learning_rate": 7.921171794467598e-07, + "loss": 0.6904, + "step": 67848 + }, + { + "epoch": 1.74, + "learning_rate": 7.92090113568467e-07, + "loss": 0.6812, + "step": 67849 + }, + { + "epoch": 1.74, + "learning_rate": 7.920630478493617e-07, + "loss": 0.6328, + "step": 67850 + }, + { + "epoch": 1.74, + "learning_rate": 7.920359822894638e-07, + "loss": 0.7104, + "step": 67851 + }, + { + "epoch": 1.74, + "learning_rate": 7.920089168887945e-07, + "loss": 0.7354, + "step": 67852 + }, + { + "epoch": 1.74, + "learning_rate": 7.919818516473743e-07, + "loss": 0.5811, + "step": 67853 + }, + { + "epoch": 1.74, + "learning_rate": 7.919547865652239e-07, + "loss": 0.6865, + "step": 67854 + }, + { + "epoch": 1.74, + "learning_rate": 7.919277216423646e-07, + "loss": 1.0908, + "step": 67855 + }, + { + "epoch": 1.74, + "learning_rate": 7.919006568788162e-07, + "loss": 0.7319, + "step": 67856 + }, + { + "epoch": 1.74, + "learning_rate": 7.918735922746002e-07, + "loss": 0.5308, + "step": 67857 + }, + { + "epoch": 1.74, + "learning_rate": 7.918465278297368e-07, + "loss": 0.6011, + "step": 67858 + }, + { + "epoch": 1.74, + "learning_rate": 7.918194635442471e-07, + "loss": 0.7998, + "step": 67859 + }, + { + "epoch": 1.74, + "learning_rate": 7.91792399418152e-07, + "loss": 0.4629, + "step": 67860 + }, + { + "epoch": 1.74, + "learning_rate": 7.917653354514714e-07, + "loss": 0.6553, + "step": 67861 + }, + { + "epoch": 1.74, + "learning_rate": 7.917382716442267e-07, + "loss": 0.7129, + "step": 67862 + }, + { + "epoch": 1.74, + "learning_rate": 7.917112079964384e-07, + "loss": 0.5737, + "step": 67863 + }, + { + "epoch": 1.74, + "learning_rate": 7.916841445081272e-07, + "loss": 0.6396, + "step": 67864 + }, + { + "epoch": 1.74, + "learning_rate": 7.916570811793138e-07, + "loss": 0.7041, + "step": 67865 + }, + { + "epoch": 1.74, + "learning_rate": 7.91630018010019e-07, + "loss": 0.6338, + "step": 67866 + }, + { + "epoch": 1.74, + "learning_rate": 7.916029550002636e-07, + "loss": 0.6636, + "step": 67867 + }, + { + "epoch": 1.74, + "learning_rate": 7.915758921500682e-07, + "loss": 0.4731, + "step": 67868 + }, + { + "epoch": 1.74, + "learning_rate": 7.915488294594537e-07, + "loss": 0.5718, + "step": 67869 + }, + { + "epoch": 1.74, + "learning_rate": 7.915217669284409e-07, + "loss": 0.6055, + "step": 67870 + }, + { + "epoch": 1.74, + "learning_rate": 7.914947045570496e-07, + "loss": 0.6455, + "step": 67871 + }, + { + "epoch": 1.74, + "learning_rate": 7.914676423453019e-07, + "loss": 0.6963, + "step": 67872 + }, + { + "epoch": 1.74, + "learning_rate": 7.914405802932173e-07, + "loss": 0.6475, + "step": 67873 + }, + { + "epoch": 1.74, + "learning_rate": 7.914135184008173e-07, + "loss": 0.6836, + "step": 67874 + }, + { + "epoch": 1.74, + "learning_rate": 7.913864566681223e-07, + "loss": 0.7598, + "step": 67875 + }, + { + "epoch": 1.74, + "learning_rate": 7.913593950951532e-07, + "loss": 0.79, + "step": 67876 + }, + { + "epoch": 1.74, + "learning_rate": 7.913323336819304e-07, + "loss": 0.5923, + "step": 67877 + }, + { + "epoch": 1.74, + "learning_rate": 7.913052724284751e-07, + "loss": 0.7446, + "step": 67878 + }, + { + "epoch": 1.74, + "learning_rate": 7.912782113348076e-07, + "loss": 0.7402, + "step": 67879 + }, + { + "epoch": 1.74, + "learning_rate": 7.912511504009493e-07, + "loss": 0.6152, + "step": 67880 + }, + { + "epoch": 1.74, + "learning_rate": 7.912240896269198e-07, + "loss": 0.6602, + "step": 67881 + }, + { + "epoch": 1.74, + "learning_rate": 7.911970290127405e-07, + "loss": 0.7363, + "step": 67882 + }, + { + "epoch": 1.74, + "learning_rate": 7.911699685584321e-07, + "loss": 0.5771, + "step": 67883 + }, + { + "epoch": 1.74, + "learning_rate": 7.911429082640153e-07, + "loss": 0.5977, + "step": 67884 + }, + { + "epoch": 1.74, + "learning_rate": 7.911158481295106e-07, + "loss": 0.7061, + "step": 67885 + }, + { + "epoch": 1.74, + "learning_rate": 7.910887881549391e-07, + "loss": 0.6387, + "step": 67886 + }, + { + "epoch": 1.74, + "learning_rate": 7.910617283403209e-07, + "loss": 0.6885, + "step": 67887 + }, + { + "epoch": 1.74, + "learning_rate": 7.910346686856776e-07, + "loss": 0.6484, + "step": 67888 + }, + { + "epoch": 1.74, + "learning_rate": 7.910076091910291e-07, + "loss": 0.71, + "step": 67889 + }, + { + "epoch": 1.74, + "learning_rate": 7.90980549856397e-07, + "loss": 0.6885, + "step": 67890 + }, + { + "epoch": 1.74, + "learning_rate": 7.909534906818012e-07, + "loss": 0.7637, + "step": 67891 + }, + { + "epoch": 1.74, + "learning_rate": 7.909264316672625e-07, + "loss": 0.427, + "step": 67892 + }, + { + "epoch": 1.74, + "learning_rate": 7.90899372812802e-07, + "loss": 0.5176, + "step": 67893 + }, + { + "epoch": 1.74, + "learning_rate": 7.9087231411844e-07, + "loss": 0.5967, + "step": 67894 + }, + { + "epoch": 1.74, + "learning_rate": 7.908452555841978e-07, + "loss": 0.7861, + "step": 67895 + }, + { + "epoch": 1.74, + "learning_rate": 7.908181972100954e-07, + "loss": 0.5781, + "step": 67896 + }, + { + "epoch": 1.74, + "learning_rate": 7.907911389961541e-07, + "loss": 0.6318, + "step": 67897 + }, + { + "epoch": 1.74, + "learning_rate": 7.907640809423943e-07, + "loss": 0.7344, + "step": 67898 + }, + { + "epoch": 1.74, + "learning_rate": 7.90737023048837e-07, + "loss": 0.541, + "step": 67899 + }, + { + "epoch": 1.74, + "learning_rate": 7.90709965315503e-07, + "loss": 0.5767, + "step": 67900 + }, + { + "epoch": 1.74, + "learning_rate": 7.906829077424125e-07, + "loss": 0.6112, + "step": 67901 + }, + { + "epoch": 1.74, + "learning_rate": 7.906558503295863e-07, + "loss": 0.7959, + "step": 67902 + }, + { + "epoch": 1.74, + "learning_rate": 7.906287930770454e-07, + "loss": 0.6348, + "step": 67903 + }, + { + "epoch": 1.74, + "learning_rate": 7.906017359848103e-07, + "loss": 0.8193, + "step": 67904 + }, + { + "epoch": 1.74, + "learning_rate": 7.905746790529019e-07, + "loss": 0.6011, + "step": 67905 + }, + { + "epoch": 1.74, + "learning_rate": 7.905476222813408e-07, + "loss": 0.5478, + "step": 67906 + }, + { + "epoch": 1.74, + "learning_rate": 7.905205656701478e-07, + "loss": 0.7168, + "step": 67907 + }, + { + "epoch": 1.74, + "learning_rate": 7.904935092193435e-07, + "loss": 0.7432, + "step": 67908 + }, + { + "epoch": 1.74, + "learning_rate": 7.904664529289487e-07, + "loss": 0.5874, + "step": 67909 + }, + { + "epoch": 1.74, + "learning_rate": 7.904393967989845e-07, + "loss": 0.6001, + "step": 67910 + }, + { + "epoch": 1.74, + "learning_rate": 7.904123408294707e-07, + "loss": 0.6787, + "step": 67911 + }, + { + "epoch": 1.74, + "learning_rate": 7.903852850204289e-07, + "loss": 0.6519, + "step": 67912 + }, + { + "epoch": 1.74, + "learning_rate": 7.90358229371879e-07, + "loss": 0.6943, + "step": 67913 + }, + { + "epoch": 1.74, + "learning_rate": 7.903311738838425e-07, + "loss": 0.6094, + "step": 67914 + }, + { + "epoch": 1.74, + "learning_rate": 7.903041185563396e-07, + "loss": 0.6138, + "step": 67915 + }, + { + "epoch": 1.74, + "learning_rate": 7.902770633893914e-07, + "loss": 0.6323, + "step": 67916 + }, + { + "epoch": 1.74, + "learning_rate": 7.902500083830181e-07, + "loss": 0.7002, + "step": 67917 + }, + { + "epoch": 1.74, + "learning_rate": 7.902229535372411e-07, + "loss": 0.6655, + "step": 67918 + }, + { + "epoch": 1.74, + "learning_rate": 7.901958988520806e-07, + "loss": 0.6328, + "step": 67919 + }, + { + "epoch": 1.74, + "learning_rate": 7.901688443275577e-07, + "loss": 0.7627, + "step": 67920 + }, + { + "epoch": 1.74, + "learning_rate": 7.901417899636925e-07, + "loss": 0.4741, + "step": 67921 + }, + { + "epoch": 1.74, + "learning_rate": 7.901147357605063e-07, + "loss": 0.5591, + "step": 67922 + }, + { + "epoch": 1.74, + "learning_rate": 7.900876817180193e-07, + "loss": 0.5547, + "step": 67923 + }, + { + "epoch": 1.74, + "learning_rate": 7.900606278362527e-07, + "loss": 0.6318, + "step": 67924 + }, + { + "epoch": 1.74, + "learning_rate": 7.900335741152269e-07, + "loss": 0.7256, + "step": 67925 + }, + { + "epoch": 1.74, + "learning_rate": 7.900065205549629e-07, + "loss": 0.7222, + "step": 67926 + }, + { + "epoch": 1.74, + "learning_rate": 7.899794671554811e-07, + "loss": 0.6821, + "step": 67927 + }, + { + "epoch": 1.74, + "learning_rate": 7.899524139168024e-07, + "loss": 0.6064, + "step": 67928 + }, + { + "epoch": 1.74, + "learning_rate": 7.899253608389474e-07, + "loss": 0.5879, + "step": 67929 + }, + { + "epoch": 1.74, + "learning_rate": 7.898983079219375e-07, + "loss": 0.4756, + "step": 67930 + }, + { + "epoch": 1.74, + "learning_rate": 7.898712551657924e-07, + "loss": 0.6572, + "step": 67931 + }, + { + "epoch": 1.74, + "learning_rate": 7.89844202570533e-07, + "loss": 0.5518, + "step": 67932 + }, + { + "epoch": 1.74, + "learning_rate": 7.898171501361803e-07, + "loss": 0.6504, + "step": 67933 + }, + { + "epoch": 1.74, + "learning_rate": 7.89790097862755e-07, + "loss": 0.7275, + "step": 67934 + }, + { + "epoch": 1.74, + "learning_rate": 7.897630457502779e-07, + "loss": 0.5737, + "step": 67935 + }, + { + "epoch": 1.74, + "learning_rate": 7.897359937987694e-07, + "loss": 0.6396, + "step": 67936 + }, + { + "epoch": 1.74, + "learning_rate": 7.897089420082503e-07, + "loss": 0.7153, + "step": 67937 + }, + { + "epoch": 1.74, + "learning_rate": 7.896818903787417e-07, + "loss": 0.6626, + "step": 67938 + }, + { + "epoch": 1.74, + "learning_rate": 7.896548389102636e-07, + "loss": 0.6582, + "step": 67939 + }, + { + "epoch": 1.74, + "learning_rate": 7.896277876028376e-07, + "loss": 0.5659, + "step": 67940 + }, + { + "epoch": 1.74, + "learning_rate": 7.896007364564838e-07, + "loss": 0.5718, + "step": 67941 + }, + { + "epoch": 1.74, + "learning_rate": 7.895736854712228e-07, + "loss": 0.521, + "step": 67942 + }, + { + "epoch": 1.74, + "learning_rate": 7.895466346470758e-07, + "loss": 0.481, + "step": 67943 + }, + { + "epoch": 1.74, + "learning_rate": 7.895195839840629e-07, + "loss": 0.5703, + "step": 67944 + }, + { + "epoch": 1.74, + "learning_rate": 7.894925334822055e-07, + "loss": 0.6797, + "step": 67945 + }, + { + "epoch": 1.74, + "learning_rate": 7.894654831415238e-07, + "loss": 0.7227, + "step": 67946 + }, + { + "epoch": 1.74, + "learning_rate": 7.894384329620389e-07, + "loss": 0.5488, + "step": 67947 + }, + { + "epoch": 1.74, + "learning_rate": 7.894113829437711e-07, + "loss": 0.8799, + "step": 67948 + }, + { + "epoch": 1.74, + "learning_rate": 7.893843330867415e-07, + "loss": 0.7471, + "step": 67949 + }, + { + "epoch": 1.74, + "learning_rate": 7.893572833909709e-07, + "loss": 0.667, + "step": 67950 + }, + { + "epoch": 1.74, + "learning_rate": 7.893302338564793e-07, + "loss": 0.7812, + "step": 67951 + }, + { + "epoch": 1.74, + "learning_rate": 7.893031844832879e-07, + "loss": 0.5312, + "step": 67952 + }, + { + "epoch": 1.74, + "learning_rate": 7.892761352714176e-07, + "loss": 0.7744, + "step": 67953 + }, + { + "epoch": 1.74, + "learning_rate": 7.892490862208885e-07, + "loss": 0.5073, + "step": 67954 + }, + { + "epoch": 1.74, + "learning_rate": 7.89222037331722e-07, + "loss": 0.5698, + "step": 67955 + }, + { + "epoch": 1.74, + "learning_rate": 7.891949886039382e-07, + "loss": 0.5693, + "step": 67956 + }, + { + "epoch": 1.74, + "learning_rate": 7.891679400375584e-07, + "loss": 0.6553, + "step": 67957 + }, + { + "epoch": 1.74, + "learning_rate": 7.891408916326026e-07, + "loss": 0.5183, + "step": 67958 + }, + { + "epoch": 1.74, + "learning_rate": 7.891138433890923e-07, + "loss": 0.7471, + "step": 67959 + }, + { + "epoch": 1.74, + "learning_rate": 7.890867953070481e-07, + "loss": 0.6328, + "step": 67960 + }, + { + "epoch": 1.74, + "learning_rate": 7.8905974738649e-07, + "loss": 0.6597, + "step": 67961 + }, + { + "epoch": 1.74, + "learning_rate": 7.890326996274394e-07, + "loss": 0.7549, + "step": 67962 + }, + { + "epoch": 1.74, + "learning_rate": 7.890056520299164e-07, + "loss": 0.5337, + "step": 67963 + }, + { + "epoch": 1.74, + "learning_rate": 7.889786045939423e-07, + "loss": 0.6572, + "step": 67964 + }, + { + "epoch": 1.74, + "learning_rate": 7.889515573195375e-07, + "loss": 0.7441, + "step": 67965 + }, + { + "epoch": 1.74, + "learning_rate": 7.889245102067229e-07, + "loss": 0.6416, + "step": 67966 + }, + { + "epoch": 1.74, + "learning_rate": 7.888974632555189e-07, + "loss": 0.603, + "step": 67967 + }, + { + "epoch": 1.74, + "learning_rate": 7.888704164659465e-07, + "loss": 0.6787, + "step": 67968 + }, + { + "epoch": 1.74, + "learning_rate": 7.888433698380268e-07, + "loss": 0.5093, + "step": 67969 + }, + { + "epoch": 1.74, + "learning_rate": 7.888163233717796e-07, + "loss": 0.6392, + "step": 67970 + }, + { + "epoch": 1.74, + "learning_rate": 7.887892770672259e-07, + "loss": 0.7178, + "step": 67971 + }, + { + "epoch": 1.74, + "learning_rate": 7.887622309243867e-07, + "loss": 0.6035, + "step": 67972 + }, + { + "epoch": 1.74, + "learning_rate": 7.887351849432824e-07, + "loss": 0.6523, + "step": 67973 + }, + { + "epoch": 1.74, + "learning_rate": 7.887081391239341e-07, + "loss": 0.8076, + "step": 67974 + }, + { + "epoch": 1.74, + "learning_rate": 7.886810934663619e-07, + "loss": 0.644, + "step": 67975 + }, + { + "epoch": 1.74, + "learning_rate": 7.886540479705872e-07, + "loss": 0.531, + "step": 67976 + }, + { + "epoch": 1.74, + "learning_rate": 7.8862700263663e-07, + "loss": 0.6074, + "step": 67977 + }, + { + "epoch": 1.74, + "learning_rate": 7.885999574645118e-07, + "loss": 0.6582, + "step": 67978 + }, + { + "epoch": 1.74, + "learning_rate": 7.88572912454253e-07, + "loss": 0.4626, + "step": 67979 + }, + { + "epoch": 1.74, + "learning_rate": 7.885458676058739e-07, + "loss": 0.6582, + "step": 67980 + }, + { + "epoch": 1.74, + "learning_rate": 7.885188229193955e-07, + "loss": 0.5044, + "step": 67981 + }, + { + "epoch": 1.74, + "learning_rate": 7.884917783948385e-07, + "loss": 0.5811, + "step": 67982 + }, + { + "epoch": 1.74, + "learning_rate": 7.884647340322237e-07, + "loss": 0.5825, + "step": 67983 + }, + { + "epoch": 1.74, + "learning_rate": 7.884376898315717e-07, + "loss": 0.668, + "step": 67984 + }, + { + "epoch": 1.74, + "learning_rate": 7.884106457929032e-07, + "loss": 0.7217, + "step": 67985 + }, + { + "epoch": 1.74, + "learning_rate": 7.883836019162389e-07, + "loss": 0.583, + "step": 67986 + }, + { + "epoch": 1.74, + "learning_rate": 7.883565582015997e-07, + "loss": 0.71, + "step": 67987 + }, + { + "epoch": 1.74, + "learning_rate": 7.883295146490059e-07, + "loss": 0.5361, + "step": 67988 + }, + { + "epoch": 1.74, + "learning_rate": 7.883024712584792e-07, + "loss": 0.8213, + "step": 67989 + }, + { + "epoch": 1.74, + "learning_rate": 7.882754280300388e-07, + "loss": 0.6499, + "step": 67990 + }, + { + "epoch": 1.74, + "learning_rate": 7.882483849637065e-07, + "loss": 0.6914, + "step": 67991 + }, + { + "epoch": 1.74, + "learning_rate": 7.882213420595023e-07, + "loss": 0.6045, + "step": 67992 + }, + { + "epoch": 1.74, + "learning_rate": 7.881942993174477e-07, + "loss": 0.4005, + "step": 67993 + }, + { + "epoch": 1.74, + "learning_rate": 7.881672567375627e-07, + "loss": 0.5811, + "step": 67994 + }, + { + "epoch": 1.74, + "learning_rate": 7.881402143198684e-07, + "loss": 0.6016, + "step": 67995 + }, + { + "epoch": 1.74, + "learning_rate": 7.881131720643853e-07, + "loss": 0.6465, + "step": 67996 + }, + { + "epoch": 1.74, + "learning_rate": 7.880861299711343e-07, + "loss": 0.6206, + "step": 67997 + }, + { + "epoch": 1.74, + "learning_rate": 7.880590880401359e-07, + "loss": 0.7178, + "step": 67998 + }, + { + "epoch": 1.74, + "learning_rate": 7.880320462714113e-07, + "loss": 0.6631, + "step": 67999 + }, + { + "epoch": 1.74, + "learning_rate": 7.880050046649806e-07, + "loss": 0.5186, + "step": 68000 + }, + { + "epoch": 1.74, + "learning_rate": 7.879779632208645e-07, + "loss": 0.6104, + "step": 68001 + }, + { + "epoch": 1.74, + "learning_rate": 7.879509219390842e-07, + "loss": 0.7109, + "step": 68002 + }, + { + "epoch": 1.74, + "learning_rate": 7.879238808196598e-07, + "loss": 0.5667, + "step": 68003 + }, + { + "epoch": 1.74, + "learning_rate": 7.878968398626127e-07, + "loss": 0.6494, + "step": 68004 + }, + { + "epoch": 1.74, + "learning_rate": 7.878697990679629e-07, + "loss": 0.5898, + "step": 68005 + }, + { + "epoch": 1.74, + "learning_rate": 7.878427584357316e-07, + "loss": 0.5396, + "step": 68006 + }, + { + "epoch": 1.74, + "learning_rate": 7.878157179659393e-07, + "loss": 0.6377, + "step": 68007 + }, + { + "epoch": 1.74, + "learning_rate": 7.877886776586069e-07, + "loss": 0.7852, + "step": 68008 + }, + { + "epoch": 1.74, + "learning_rate": 7.877616375137551e-07, + "loss": 0.626, + "step": 68009 + }, + { + "epoch": 1.74, + "learning_rate": 7.877345975314044e-07, + "loss": 0.688, + "step": 68010 + }, + { + "epoch": 1.74, + "learning_rate": 7.877075577115751e-07, + "loss": 0.604, + "step": 68011 + }, + { + "epoch": 1.74, + "learning_rate": 7.876805180542888e-07, + "loss": 0.5244, + "step": 68012 + }, + { + "epoch": 1.74, + "learning_rate": 7.876534785595654e-07, + "loss": 0.5737, + "step": 68013 + }, + { + "epoch": 1.74, + "learning_rate": 7.876264392274263e-07, + "loss": 0.5537, + "step": 68014 + }, + { + "epoch": 1.74, + "learning_rate": 7.875994000578916e-07, + "loss": 0.6567, + "step": 68015 + }, + { + "epoch": 1.74, + "learning_rate": 7.875723610509825e-07, + "loss": 0.583, + "step": 68016 + }, + { + "epoch": 1.74, + "learning_rate": 7.875453222067192e-07, + "loss": 0.6035, + "step": 68017 + }, + { + "epoch": 1.74, + "learning_rate": 7.87518283525123e-07, + "loss": 0.5454, + "step": 68018 + }, + { + "epoch": 1.74, + "learning_rate": 7.874912450062145e-07, + "loss": 0.7573, + "step": 68019 + }, + { + "epoch": 1.74, + "learning_rate": 7.874642066500137e-07, + "loss": 0.7012, + "step": 68020 + }, + { + "epoch": 1.74, + "learning_rate": 7.87437168456542e-07, + "loss": 0.6426, + "step": 68021 + }, + { + "epoch": 1.74, + "learning_rate": 7.874101304258196e-07, + "loss": 0.6284, + "step": 68022 + }, + { + "epoch": 1.74, + "learning_rate": 7.873830925578677e-07, + "loss": 0.6377, + "step": 68023 + }, + { + "epoch": 1.74, + "learning_rate": 7.873560548527066e-07, + "loss": 0.5635, + "step": 68024 + }, + { + "epoch": 1.74, + "learning_rate": 7.873290173103575e-07, + "loss": 0.8652, + "step": 68025 + }, + { + "epoch": 1.74, + "learning_rate": 7.873019799308407e-07, + "loss": 0.7598, + "step": 68026 + }, + { + "epoch": 1.74, + "learning_rate": 7.872749427141768e-07, + "loss": 0.6621, + "step": 68027 + }, + { + "epoch": 1.74, + "learning_rate": 7.872479056603869e-07, + "loss": 0.7764, + "step": 68028 + }, + { + "epoch": 1.74, + "learning_rate": 7.872208687694918e-07, + "loss": 0.5459, + "step": 68029 + }, + { + "epoch": 1.74, + "learning_rate": 7.871938320415114e-07, + "loss": 0.345, + "step": 68030 + }, + { + "epoch": 1.74, + "learning_rate": 7.871667954764671e-07, + "loss": 0.5024, + "step": 68031 + }, + { + "epoch": 1.74, + "learning_rate": 7.871397590743792e-07, + "loss": 0.6045, + "step": 68032 + }, + { + "epoch": 1.74, + "learning_rate": 7.871127228352689e-07, + "loss": 0.7168, + "step": 68033 + }, + { + "epoch": 1.74, + "learning_rate": 7.870856867591563e-07, + "loss": 0.6377, + "step": 68034 + }, + { + "epoch": 1.74, + "learning_rate": 7.870586508460627e-07, + "loss": 0.686, + "step": 68035 + }, + { + "epoch": 1.74, + "learning_rate": 7.87031615096008e-07, + "loss": 0.6069, + "step": 68036 + }, + { + "epoch": 1.74, + "learning_rate": 7.870045795090139e-07, + "loss": 0.6335, + "step": 68037 + }, + { + "epoch": 1.74, + "learning_rate": 7.869775440851002e-07, + "loss": 0.5981, + "step": 68038 + }, + { + "epoch": 1.74, + "learning_rate": 7.869505088242886e-07, + "loss": 0.5811, + "step": 68039 + }, + { + "epoch": 1.74, + "learning_rate": 7.869234737265988e-07, + "loss": 0.5469, + "step": 68040 + }, + { + "epoch": 1.74, + "learning_rate": 7.868964387920519e-07, + "loss": 0.665, + "step": 68041 + }, + { + "epoch": 1.74, + "learning_rate": 7.868694040206687e-07, + "loss": 0.6914, + "step": 68042 + }, + { + "epoch": 1.74, + "learning_rate": 7.868423694124698e-07, + "loss": 0.7334, + "step": 68043 + }, + { + "epoch": 1.74, + "learning_rate": 7.868153349674757e-07, + "loss": 0.6328, + "step": 68044 + }, + { + "epoch": 1.74, + "learning_rate": 7.867883006857074e-07, + "loss": 0.6191, + "step": 68045 + }, + { + "epoch": 1.74, + "learning_rate": 7.867612665671855e-07, + "loss": 0.3959, + "step": 68046 + }, + { + "epoch": 1.74, + "learning_rate": 7.867342326119307e-07, + "loss": 0.6914, + "step": 68047 + }, + { + "epoch": 1.74, + "learning_rate": 7.867071988199637e-07, + "loss": 0.7129, + "step": 68048 + }, + { + "epoch": 1.74, + "learning_rate": 7.866801651913053e-07, + "loss": 0.7109, + "step": 68049 + }, + { + "epoch": 1.74, + "learning_rate": 7.866531317259761e-07, + "loss": 0.6885, + "step": 68050 + }, + { + "epoch": 1.74, + "learning_rate": 7.866260984239966e-07, + "loss": 0.6396, + "step": 68051 + }, + { + "epoch": 1.74, + "learning_rate": 7.865990652853878e-07, + "loss": 0.7266, + "step": 68052 + }, + { + "epoch": 1.74, + "learning_rate": 7.8657203231017e-07, + "loss": 0.5115, + "step": 68053 + }, + { + "epoch": 1.74, + "learning_rate": 7.865449994983645e-07, + "loss": 0.7041, + "step": 68054 + }, + { + "epoch": 1.74, + "learning_rate": 7.865179668499915e-07, + "loss": 0.6846, + "step": 68055 + }, + { + "epoch": 1.74, + "learning_rate": 7.864909343650721e-07, + "loss": 0.6919, + "step": 68056 + }, + { + "epoch": 1.74, + "learning_rate": 7.864639020436265e-07, + "loss": 0.6562, + "step": 68057 + }, + { + "epoch": 1.74, + "learning_rate": 7.864368698856758e-07, + "loss": 0.6621, + "step": 68058 + }, + { + "epoch": 1.74, + "learning_rate": 7.86409837891241e-07, + "loss": 0.6099, + "step": 68059 + }, + { + "epoch": 1.74, + "learning_rate": 7.863828060603419e-07, + "loss": 0.4417, + "step": 68060 + }, + { + "epoch": 1.74, + "learning_rate": 7.863557743929997e-07, + "loss": 0.7803, + "step": 68061 + }, + { + "epoch": 1.74, + "learning_rate": 7.863287428892351e-07, + "loss": 0.4756, + "step": 68062 + }, + { + "epoch": 1.74, + "learning_rate": 7.863017115490685e-07, + "loss": 0.7402, + "step": 68063 + }, + { + "epoch": 1.74, + "learning_rate": 7.862746803725212e-07, + "loss": 0.6719, + "step": 68064 + }, + { + "epoch": 1.74, + "learning_rate": 7.862476493596133e-07, + "loss": 0.5491, + "step": 68065 + }, + { + "epoch": 1.74, + "learning_rate": 7.86220618510366e-07, + "loss": 0.4438, + "step": 68066 + }, + { + "epoch": 1.74, + "learning_rate": 7.861935878247994e-07, + "loss": 0.6963, + "step": 68067 + }, + { + "epoch": 1.74, + "learning_rate": 7.861665573029348e-07, + "loss": 0.5903, + "step": 68068 + }, + { + "epoch": 1.74, + "learning_rate": 7.86139526944793e-07, + "loss": 0.4945, + "step": 68069 + }, + { + "epoch": 1.74, + "learning_rate": 7.861124967503937e-07, + "loss": 0.5811, + "step": 68070 + }, + { + "epoch": 1.74, + "learning_rate": 7.860854667197585e-07, + "loss": 0.4714, + "step": 68071 + }, + { + "epoch": 1.74, + "learning_rate": 7.860584368529077e-07, + "loss": 0.8369, + "step": 68072 + }, + { + "epoch": 1.74, + "learning_rate": 7.860314071498622e-07, + "loss": 0.5137, + "step": 68073 + }, + { + "epoch": 1.74, + "learning_rate": 7.860043776106425e-07, + "loss": 0.6396, + "step": 68074 + }, + { + "epoch": 1.74, + "learning_rate": 7.859773482352696e-07, + "loss": 0.707, + "step": 68075 + }, + { + "epoch": 1.74, + "learning_rate": 7.859503190237638e-07, + "loss": 0.8359, + "step": 68076 + }, + { + "epoch": 1.74, + "learning_rate": 7.859232899761462e-07, + "loss": 0.5977, + "step": 68077 + }, + { + "epoch": 1.74, + "learning_rate": 7.858962610924371e-07, + "loss": 0.6343, + "step": 68078 + }, + { + "epoch": 1.74, + "learning_rate": 7.85869232372658e-07, + "loss": 0.751, + "step": 68079 + }, + { + "epoch": 1.74, + "learning_rate": 7.858422038168283e-07, + "loss": 0.5752, + "step": 68080 + }, + { + "epoch": 1.74, + "learning_rate": 7.858151754249697e-07, + "loss": 0.6309, + "step": 68081 + }, + { + "epoch": 1.74, + "learning_rate": 7.857881471971022e-07, + "loss": 0.6885, + "step": 68082 + }, + { + "epoch": 1.75, + "learning_rate": 7.857611191332471e-07, + "loss": 0.7949, + "step": 68083 + }, + { + "epoch": 1.75, + "learning_rate": 7.857340912334249e-07, + "loss": 0.6909, + "step": 68084 + }, + { + "epoch": 1.75, + "learning_rate": 7.857070634976562e-07, + "loss": 0.561, + "step": 68085 + }, + { + "epoch": 1.75, + "learning_rate": 7.856800359259616e-07, + "loss": 0.5364, + "step": 68086 + }, + { + "epoch": 1.75, + "learning_rate": 7.856530085183621e-07, + "loss": 0.7686, + "step": 68087 + }, + { + "epoch": 1.75, + "learning_rate": 7.856259812748782e-07, + "loss": 0.5889, + "step": 68088 + }, + { + "epoch": 1.75, + "learning_rate": 7.85598954195531e-07, + "loss": 0.6255, + "step": 68089 + }, + { + "epoch": 1.75, + "learning_rate": 7.855719272803404e-07, + "loss": 0.6816, + "step": 68090 + }, + { + "epoch": 1.75, + "learning_rate": 7.855449005293276e-07, + "loss": 0.5381, + "step": 68091 + }, + { + "epoch": 1.75, + "learning_rate": 7.855178739425132e-07, + "loss": 0.5723, + "step": 68092 + }, + { + "epoch": 1.75, + "learning_rate": 7.854908475199178e-07, + "loss": 0.7227, + "step": 68093 + }, + { + "epoch": 1.75, + "learning_rate": 7.854638212615624e-07, + "loss": 0.75, + "step": 68094 + }, + { + "epoch": 1.75, + "learning_rate": 7.854367951674673e-07, + "loss": 0.7041, + "step": 68095 + }, + { + "epoch": 1.75, + "learning_rate": 7.854097692376535e-07, + "loss": 0.623, + "step": 68096 + }, + { + "epoch": 1.75, + "learning_rate": 7.853827434721414e-07, + "loss": 0.6855, + "step": 68097 + }, + { + "epoch": 1.75, + "learning_rate": 7.853557178709521e-07, + "loss": 0.689, + "step": 68098 + }, + { + "epoch": 1.75, + "learning_rate": 7.853286924341063e-07, + "loss": 0.6841, + "step": 68099 + }, + { + "epoch": 1.75, + "learning_rate": 7.853016671616242e-07, + "loss": 0.6802, + "step": 68100 + }, + { + "epoch": 1.75, + "learning_rate": 7.852746420535265e-07, + "loss": 0.5791, + "step": 68101 + }, + { + "epoch": 1.75, + "learning_rate": 7.852476171098343e-07, + "loss": 0.6465, + "step": 68102 + }, + { + "epoch": 1.75, + "learning_rate": 7.85220592330568e-07, + "loss": 0.6733, + "step": 68103 + }, + { + "epoch": 1.75, + "learning_rate": 7.851935677157486e-07, + "loss": 0.583, + "step": 68104 + }, + { + "epoch": 1.75, + "learning_rate": 7.851665432653965e-07, + "loss": 0.7285, + "step": 68105 + }, + { + "epoch": 1.75, + "learning_rate": 7.851395189795326e-07, + "loss": 0.6992, + "step": 68106 + }, + { + "epoch": 1.75, + "learning_rate": 7.851124948581773e-07, + "loss": 0.4077, + "step": 68107 + }, + { + "epoch": 1.75, + "learning_rate": 7.850854709013517e-07, + "loss": 0.5283, + "step": 68108 + }, + { + "epoch": 1.75, + "learning_rate": 7.850584471090764e-07, + "loss": 0.4645, + "step": 68109 + }, + { + "epoch": 1.75, + "learning_rate": 7.850314234813716e-07, + "loss": 0.709, + "step": 68110 + }, + { + "epoch": 1.75, + "learning_rate": 7.850044000182586e-07, + "loss": 0.5969, + "step": 68111 + }, + { + "epoch": 1.75, + "learning_rate": 7.849773767197577e-07, + "loss": 0.5864, + "step": 68112 + }, + { + "epoch": 1.75, + "learning_rate": 7.849503535858898e-07, + "loss": 0.5864, + "step": 68113 + }, + { + "epoch": 1.75, + "learning_rate": 7.849233306166754e-07, + "loss": 0.6587, + "step": 68114 + }, + { + "epoch": 1.75, + "learning_rate": 7.848963078121354e-07, + "loss": 0.6829, + "step": 68115 + }, + { + "epoch": 1.75, + "learning_rate": 7.848692851722906e-07, + "loss": 0.6641, + "step": 68116 + }, + { + "epoch": 1.75, + "learning_rate": 7.848422626971611e-07, + "loss": 0.5522, + "step": 68117 + }, + { + "epoch": 1.75, + "learning_rate": 7.848152403867684e-07, + "loss": 0.5552, + "step": 68118 + }, + { + "epoch": 1.75, + "learning_rate": 7.847882182411328e-07, + "loss": 0.7305, + "step": 68119 + }, + { + "epoch": 1.75, + "learning_rate": 7.847611962602747e-07, + "loss": 0.6162, + "step": 68120 + }, + { + "epoch": 1.75, + "learning_rate": 7.847341744442152e-07, + "loss": 0.5938, + "step": 68121 + }, + { + "epoch": 1.75, + "learning_rate": 7.847071527929747e-07, + "loss": 0.8057, + "step": 68122 + }, + { + "epoch": 1.75, + "learning_rate": 7.846801313065741e-07, + "loss": 0.5981, + "step": 68123 + }, + { + "epoch": 1.75, + "learning_rate": 7.846531099850338e-07, + "loss": 0.4714, + "step": 68124 + }, + { + "epoch": 1.75, + "learning_rate": 7.84626088828375e-07, + "loss": 0.6084, + "step": 68125 + }, + { + "epoch": 1.75, + "learning_rate": 7.845990678366179e-07, + "loss": 0.6523, + "step": 68126 + }, + { + "epoch": 1.75, + "learning_rate": 7.845720470097837e-07, + "loss": 0.665, + "step": 68127 + }, + { + "epoch": 1.75, + "learning_rate": 7.845450263478923e-07, + "loss": 0.6431, + "step": 68128 + }, + { + "epoch": 1.75, + "learning_rate": 7.845180058509655e-07, + "loss": 0.7139, + "step": 68129 + }, + { + "epoch": 1.75, + "learning_rate": 7.844909855190231e-07, + "loss": 0.6089, + "step": 68130 + }, + { + "epoch": 1.75, + "learning_rate": 7.844639653520858e-07, + "loss": 0.5869, + "step": 68131 + }, + { + "epoch": 1.75, + "learning_rate": 7.844369453501748e-07, + "loss": 0.492, + "step": 68132 + }, + { + "epoch": 1.75, + "learning_rate": 7.844099255133105e-07, + "loss": 0.6753, + "step": 68133 + }, + { + "epoch": 1.75, + "learning_rate": 7.843829058415134e-07, + "loss": 0.644, + "step": 68134 + }, + { + "epoch": 1.75, + "learning_rate": 7.843558863348045e-07, + "loss": 0.6504, + "step": 68135 + }, + { + "epoch": 1.75, + "learning_rate": 7.843288669932043e-07, + "loss": 0.6504, + "step": 68136 + }, + { + "epoch": 1.75, + "learning_rate": 7.843018478167338e-07, + "loss": 0.6694, + "step": 68137 + }, + { + "epoch": 1.75, + "learning_rate": 7.84274828805413e-07, + "loss": 0.6128, + "step": 68138 + }, + { + "epoch": 1.75, + "learning_rate": 7.842478099592638e-07, + "loss": 0.3174, + "step": 68139 + }, + { + "epoch": 1.75, + "learning_rate": 7.842207912783058e-07, + "loss": 0.5105, + "step": 68140 + }, + { + "epoch": 1.75, + "learning_rate": 7.841937727625597e-07, + "loss": 0.6016, + "step": 68141 + }, + { + "epoch": 1.75, + "learning_rate": 7.841667544120468e-07, + "loss": 0.5889, + "step": 68142 + }, + { + "epoch": 1.75, + "learning_rate": 7.841397362267873e-07, + "loss": 0.5166, + "step": 68143 + }, + { + "epoch": 1.75, + "learning_rate": 7.841127182068023e-07, + "loss": 0.4692, + "step": 68144 + }, + { + "epoch": 1.75, + "learning_rate": 7.84085700352112e-07, + "loss": 0.5498, + "step": 68145 + }, + { + "epoch": 1.75, + "learning_rate": 7.840586826627375e-07, + "loss": 0.6562, + "step": 68146 + }, + { + "epoch": 1.75, + "learning_rate": 7.840316651386992e-07, + "loss": 0.6309, + "step": 68147 + }, + { + "epoch": 1.75, + "learning_rate": 7.840046477800182e-07, + "loss": 0.7202, + "step": 68148 + }, + { + "epoch": 1.75, + "learning_rate": 7.83977630586715e-07, + "loss": 0.8574, + "step": 68149 + }, + { + "epoch": 1.75, + "learning_rate": 7.839506135588101e-07, + "loss": 0.707, + "step": 68150 + }, + { + "epoch": 1.75, + "learning_rate": 7.83923596696324e-07, + "loss": 0.7227, + "step": 68151 + }, + { + "epoch": 1.75, + "learning_rate": 7.838965799992779e-07, + "loss": 0.6016, + "step": 68152 + }, + { + "epoch": 1.75, + "learning_rate": 7.83869563467692e-07, + "loss": 0.8447, + "step": 68153 + }, + { + "epoch": 1.75, + "learning_rate": 7.838425471015875e-07, + "loss": 0.4248, + "step": 68154 + }, + { + "epoch": 1.75, + "learning_rate": 7.838155309009846e-07, + "loss": 0.7051, + "step": 68155 + }, + { + "epoch": 1.75, + "learning_rate": 7.837885148659045e-07, + "loss": 0.4003, + "step": 68156 + }, + { + "epoch": 1.75, + "learning_rate": 7.837614989963672e-07, + "loss": 0.6201, + "step": 68157 + }, + { + "epoch": 1.75, + "learning_rate": 7.837344832923941e-07, + "loss": 0.6118, + "step": 68158 + }, + { + "epoch": 1.75, + "learning_rate": 7.837074677540057e-07, + "loss": 0.4536, + "step": 68159 + }, + { + "epoch": 1.75, + "learning_rate": 7.836804523812223e-07, + "loss": 0.5183, + "step": 68160 + }, + { + "epoch": 1.75, + "learning_rate": 7.836534371740648e-07, + "loss": 0.6338, + "step": 68161 + }, + { + "epoch": 1.75, + "learning_rate": 7.836264221325539e-07, + "loss": 0.6328, + "step": 68162 + }, + { + "epoch": 1.75, + "learning_rate": 7.835994072567105e-07, + "loss": 0.6807, + "step": 68163 + }, + { + "epoch": 1.75, + "learning_rate": 7.835723925465547e-07, + "loss": 0.7041, + "step": 68164 + }, + { + "epoch": 1.75, + "learning_rate": 7.835453780021079e-07, + "loss": 0.5674, + "step": 68165 + }, + { + "epoch": 1.75, + "learning_rate": 7.835183636233903e-07, + "loss": 0.6104, + "step": 68166 + }, + { + "epoch": 1.75, + "learning_rate": 7.834913494104228e-07, + "loss": 0.6709, + "step": 68167 + }, + { + "epoch": 1.75, + "learning_rate": 7.834643353632259e-07, + "loss": 0.6816, + "step": 68168 + }, + { + "epoch": 1.75, + "learning_rate": 7.834373214818211e-07, + "loss": 0.7207, + "step": 68169 + }, + { + "epoch": 1.75, + "learning_rate": 7.834103077662276e-07, + "loss": 0.6968, + "step": 68170 + }, + { + "epoch": 1.75, + "learning_rate": 7.833832942164672e-07, + "loss": 0.6348, + "step": 68171 + }, + { + "epoch": 1.75, + "learning_rate": 7.8335628083256e-07, + "loss": 0.5542, + "step": 68172 + }, + { + "epoch": 1.75, + "learning_rate": 7.833292676145271e-07, + "loss": 0.5869, + "step": 68173 + }, + { + "epoch": 1.75, + "learning_rate": 7.833022545623889e-07, + "loss": 0.5481, + "step": 68174 + }, + { + "epoch": 1.75, + "learning_rate": 7.832752416761663e-07, + "loss": 0.7207, + "step": 68175 + }, + { + "epoch": 1.75, + "learning_rate": 7.832482289558798e-07, + "loss": 0.5957, + "step": 68176 + }, + { + "epoch": 1.75, + "learning_rate": 7.832212164015501e-07, + "loss": 0.5664, + "step": 68177 + }, + { + "epoch": 1.75, + "learning_rate": 7.831942040131981e-07, + "loss": 0.8555, + "step": 68178 + }, + { + "epoch": 1.75, + "learning_rate": 7.831671917908445e-07, + "loss": 0.5308, + "step": 68179 + }, + { + "epoch": 1.75, + "learning_rate": 7.831401797345096e-07, + "loss": 0.6807, + "step": 68180 + }, + { + "epoch": 1.75, + "learning_rate": 7.831131678442142e-07, + "loss": 0.7178, + "step": 68181 + }, + { + "epoch": 1.75, + "learning_rate": 7.830861561199793e-07, + "loss": 0.7119, + "step": 68182 + }, + { + "epoch": 1.75, + "learning_rate": 7.830591445618251e-07, + "loss": 0.7598, + "step": 68183 + }, + { + "epoch": 1.75, + "learning_rate": 7.830321331697727e-07, + "loss": 0.5439, + "step": 68184 + }, + { + "epoch": 1.75, + "learning_rate": 7.830051219438425e-07, + "loss": 0.8105, + "step": 68185 + }, + { + "epoch": 1.75, + "learning_rate": 7.829781108840554e-07, + "loss": 0.6992, + "step": 68186 + }, + { + "epoch": 1.75, + "learning_rate": 7.829510999904318e-07, + "loss": 0.6885, + "step": 68187 + }, + { + "epoch": 1.75, + "learning_rate": 7.829240892629929e-07, + "loss": 0.7681, + "step": 68188 + }, + { + "epoch": 1.75, + "learning_rate": 7.828970787017591e-07, + "loss": 0.4771, + "step": 68189 + }, + { + "epoch": 1.75, + "learning_rate": 7.82870068306751e-07, + "loss": 0.543, + "step": 68190 + }, + { + "epoch": 1.75, + "learning_rate": 7.828430580779889e-07, + "loss": 0.6592, + "step": 68191 + }, + { + "epoch": 1.75, + "learning_rate": 7.828160480154942e-07, + "loss": 0.6592, + "step": 68192 + }, + { + "epoch": 1.75, + "learning_rate": 7.82789038119287e-07, + "loss": 0.583, + "step": 68193 + }, + { + "epoch": 1.75, + "learning_rate": 7.827620283893885e-07, + "loss": 0.5742, + "step": 68194 + }, + { + "epoch": 1.75, + "learning_rate": 7.827350188258188e-07, + "loss": 0.7373, + "step": 68195 + }, + { + "epoch": 1.75, + "learning_rate": 7.827080094285993e-07, + "loss": 0.5669, + "step": 68196 + }, + { + "epoch": 1.75, + "learning_rate": 7.826810001977499e-07, + "loss": 0.5103, + "step": 68197 + }, + { + "epoch": 1.75, + "learning_rate": 7.82653991133292e-07, + "loss": 0.6616, + "step": 68198 + }, + { + "epoch": 1.75, + "learning_rate": 7.826269822352461e-07, + "loss": 0.6396, + "step": 68199 + }, + { + "epoch": 1.75, + "learning_rate": 7.825999735036324e-07, + "loss": 0.563, + "step": 68200 + }, + { + "epoch": 1.75, + "learning_rate": 7.825729649384721e-07, + "loss": 0.5472, + "step": 68201 + }, + { + "epoch": 1.75, + "learning_rate": 7.825459565397853e-07, + "loss": 0.687, + "step": 68202 + }, + { + "epoch": 1.75, + "learning_rate": 7.825189483075934e-07, + "loss": 0.7207, + "step": 68203 + }, + { + "epoch": 1.75, + "learning_rate": 7.824919402419165e-07, + "loss": 0.4476, + "step": 68204 + }, + { + "epoch": 1.75, + "learning_rate": 7.824649323427758e-07, + "loss": 0.748, + "step": 68205 + }, + { + "epoch": 1.75, + "learning_rate": 7.824379246101916e-07, + "loss": 0.5908, + "step": 68206 + }, + { + "epoch": 1.75, + "learning_rate": 7.824109170441845e-07, + "loss": 0.5562, + "step": 68207 + }, + { + "epoch": 1.75, + "learning_rate": 7.823839096447755e-07, + "loss": 0.5332, + "step": 68208 + }, + { + "epoch": 1.75, + "learning_rate": 7.823569024119855e-07, + "loss": 0.6729, + "step": 68209 + }, + { + "epoch": 1.75, + "learning_rate": 7.823298953458343e-07, + "loss": 0.6772, + "step": 68210 + }, + { + "epoch": 1.75, + "learning_rate": 7.823028884463433e-07, + "loss": 0.6113, + "step": 68211 + }, + { + "epoch": 1.75, + "learning_rate": 7.822758817135328e-07, + "loss": 0.7334, + "step": 68212 + }, + { + "epoch": 1.75, + "learning_rate": 7.822488751474239e-07, + "loss": 0.7144, + "step": 68213 + }, + { + "epoch": 1.75, + "learning_rate": 7.822218687480366e-07, + "loss": 0.6479, + "step": 68214 + }, + { + "epoch": 1.75, + "learning_rate": 7.821948625153924e-07, + "loss": 0.7354, + "step": 68215 + }, + { + "epoch": 1.75, + "learning_rate": 7.821678564495114e-07, + "loss": 0.7207, + "step": 68216 + }, + { + "epoch": 1.75, + "learning_rate": 7.821408505504146e-07, + "loss": 0.6772, + "step": 68217 + }, + { + "epoch": 1.75, + "learning_rate": 7.821138448181222e-07, + "loss": 0.6611, + "step": 68218 + }, + { + "epoch": 1.75, + "learning_rate": 7.820868392526557e-07, + "loss": 0.8555, + "step": 68219 + }, + { + "epoch": 1.75, + "learning_rate": 7.820598338540351e-07, + "loss": 0.6133, + "step": 68220 + }, + { + "epoch": 1.75, + "learning_rate": 7.820328286222812e-07, + "loss": 0.7725, + "step": 68221 + }, + { + "epoch": 1.75, + "learning_rate": 7.820058235574147e-07, + "loss": 0.5161, + "step": 68222 + }, + { + "epoch": 1.75, + "learning_rate": 7.819788186594565e-07, + "loss": 0.6245, + "step": 68223 + }, + { + "epoch": 1.75, + "learning_rate": 7.819518139284268e-07, + "loss": 0.6196, + "step": 68224 + }, + { + "epoch": 1.75, + "learning_rate": 7.819248093643468e-07, + "loss": 0.6121, + "step": 68225 + }, + { + "epoch": 1.75, + "learning_rate": 7.818978049672368e-07, + "loss": 0.707, + "step": 68226 + }, + { + "epoch": 1.75, + "learning_rate": 7.818708007371178e-07, + "loss": 0.5996, + "step": 68227 + }, + { + "epoch": 1.75, + "learning_rate": 7.8184379667401e-07, + "loss": 0.8438, + "step": 68228 + }, + { + "epoch": 1.75, + "learning_rate": 7.818167927779349e-07, + "loss": 0.6211, + "step": 68229 + }, + { + "epoch": 1.75, + "learning_rate": 7.817897890489123e-07, + "loss": 0.6709, + "step": 68230 + }, + { + "epoch": 1.75, + "learning_rate": 7.817627854869631e-07, + "loss": 0.6362, + "step": 68231 + }, + { + "epoch": 1.75, + "learning_rate": 7.817357820921083e-07, + "loss": 0.601, + "step": 68232 + }, + { + "epoch": 1.75, + "learning_rate": 7.817087788643683e-07, + "loss": 0.7339, + "step": 68233 + }, + { + "epoch": 1.75, + "learning_rate": 7.816817758037639e-07, + "loss": 0.6357, + "step": 68234 + }, + { + "epoch": 1.75, + "learning_rate": 7.816547729103155e-07, + "loss": 0.4135, + "step": 68235 + }, + { + "epoch": 1.75, + "learning_rate": 7.816277701840444e-07, + "loss": 0.6069, + "step": 68236 + }, + { + "epoch": 1.75, + "learning_rate": 7.816007676249704e-07, + "loss": 0.7012, + "step": 68237 + }, + { + "epoch": 1.75, + "learning_rate": 7.81573765233115e-07, + "loss": 0.6396, + "step": 68238 + }, + { + "epoch": 1.75, + "learning_rate": 7.815467630084988e-07, + "loss": 0.7627, + "step": 68239 + }, + { + "epoch": 1.75, + "learning_rate": 7.815197609511419e-07, + "loss": 0.4907, + "step": 68240 + }, + { + "epoch": 1.75, + "learning_rate": 7.814927590610651e-07, + "loss": 0.502, + "step": 68241 + }, + { + "epoch": 1.75, + "learning_rate": 7.814657573382894e-07, + "loss": 0.7959, + "step": 68242 + }, + { + "epoch": 1.75, + "learning_rate": 7.814387557828352e-07, + "loss": 0.6279, + "step": 68243 + }, + { + "epoch": 1.75, + "learning_rate": 7.814117543947234e-07, + "loss": 0.6895, + "step": 68244 + }, + { + "epoch": 1.75, + "learning_rate": 7.813847531739744e-07, + "loss": 0.5688, + "step": 68245 + }, + { + "epoch": 1.75, + "learning_rate": 7.813577521206092e-07, + "loss": 0.4875, + "step": 68246 + }, + { + "epoch": 1.75, + "learning_rate": 7.813307512346483e-07, + "loss": 0.6187, + "step": 68247 + }, + { + "epoch": 1.75, + "learning_rate": 7.813037505161124e-07, + "loss": 0.5996, + "step": 68248 + }, + { + "epoch": 1.75, + "learning_rate": 7.812767499650225e-07, + "loss": 0.7197, + "step": 68249 + }, + { + "epoch": 1.75, + "learning_rate": 7.812497495813984e-07, + "loss": 0.6675, + "step": 68250 + }, + { + "epoch": 1.75, + "learning_rate": 7.812227493652616e-07, + "loss": 0.6201, + "step": 68251 + }, + { + "epoch": 1.75, + "learning_rate": 7.811957493166322e-07, + "loss": 0.5942, + "step": 68252 + }, + { + "epoch": 1.75, + "learning_rate": 7.811687494355315e-07, + "loss": 0.5859, + "step": 68253 + }, + { + "epoch": 1.75, + "learning_rate": 7.811417497219794e-07, + "loss": 0.6558, + "step": 68254 + }, + { + "epoch": 1.75, + "learning_rate": 7.811147501759974e-07, + "loss": 0.5127, + "step": 68255 + }, + { + "epoch": 1.75, + "learning_rate": 7.810877507976055e-07, + "loss": 0.7168, + "step": 68256 + }, + { + "epoch": 1.75, + "learning_rate": 7.810607515868248e-07, + "loss": 0.7295, + "step": 68257 + }, + { + "epoch": 1.75, + "learning_rate": 7.810337525436758e-07, + "loss": 0.3813, + "step": 68258 + }, + { + "epoch": 1.75, + "learning_rate": 7.810067536681796e-07, + "loss": 0.5516, + "step": 68259 + }, + { + "epoch": 1.75, + "learning_rate": 7.80979754960356e-07, + "loss": 0.6631, + "step": 68260 + }, + { + "epoch": 1.75, + "learning_rate": 7.809527564202261e-07, + "loss": 0.5303, + "step": 68261 + }, + { + "epoch": 1.75, + "learning_rate": 7.809257580478106e-07, + "loss": 0.6118, + "step": 68262 + }, + { + "epoch": 1.75, + "learning_rate": 7.808987598431302e-07, + "loss": 0.7227, + "step": 68263 + }, + { + "epoch": 1.75, + "learning_rate": 7.808717618062055e-07, + "loss": 0.8096, + "step": 68264 + }, + { + "epoch": 1.75, + "learning_rate": 7.808447639370575e-07, + "loss": 0.5527, + "step": 68265 + }, + { + "epoch": 1.75, + "learning_rate": 7.808177662357062e-07, + "loss": 0.5879, + "step": 68266 + }, + { + "epoch": 1.75, + "learning_rate": 7.80790768702173e-07, + "loss": 0.7275, + "step": 68267 + }, + { + "epoch": 1.75, + "learning_rate": 7.807637713364783e-07, + "loss": 0.6421, + "step": 68268 + }, + { + "epoch": 1.75, + "learning_rate": 7.807367741386423e-07, + "loss": 0.7393, + "step": 68269 + }, + { + "epoch": 1.75, + "learning_rate": 7.807097771086864e-07, + "loss": 0.5476, + "step": 68270 + }, + { + "epoch": 1.75, + "learning_rate": 7.806827802466306e-07, + "loss": 0.6787, + "step": 68271 + }, + { + "epoch": 1.75, + "learning_rate": 7.806557835524962e-07, + "loss": 0.7422, + "step": 68272 + }, + { + "epoch": 1.75, + "learning_rate": 7.806287870263034e-07, + "loss": 0.4905, + "step": 68273 + }, + { + "epoch": 1.75, + "learning_rate": 7.806017906680732e-07, + "loss": 0.6553, + "step": 68274 + }, + { + "epoch": 1.75, + "learning_rate": 7.805747944778258e-07, + "loss": 0.5889, + "step": 68275 + }, + { + "epoch": 1.75, + "learning_rate": 7.805477984555826e-07, + "loss": 0.5552, + "step": 68276 + }, + { + "epoch": 1.75, + "learning_rate": 7.805208026013636e-07, + "loss": 0.7104, + "step": 68277 + }, + { + "epoch": 1.75, + "learning_rate": 7.804938069151903e-07, + "loss": 0.6284, + "step": 68278 + }, + { + "epoch": 1.75, + "learning_rate": 7.804668113970822e-07, + "loss": 0.6123, + "step": 68279 + }, + { + "epoch": 1.75, + "learning_rate": 7.804398160470608e-07, + "loss": 0.8096, + "step": 68280 + }, + { + "epoch": 1.75, + "learning_rate": 7.804128208651462e-07, + "loss": 0.6104, + "step": 68281 + }, + { + "epoch": 1.75, + "learning_rate": 7.803858258513598e-07, + "loss": 0.6494, + "step": 68282 + }, + { + "epoch": 1.75, + "learning_rate": 7.803588310057216e-07, + "loss": 0.6484, + "step": 68283 + }, + { + "epoch": 1.75, + "learning_rate": 7.803318363282527e-07, + "loss": 0.5962, + "step": 68284 + }, + { + "epoch": 1.75, + "learning_rate": 7.803048418189734e-07, + "loss": 0.7168, + "step": 68285 + }, + { + "epoch": 1.75, + "learning_rate": 7.802778474779049e-07, + "loss": 0.625, + "step": 68286 + }, + { + "epoch": 1.75, + "learning_rate": 7.802508533050673e-07, + "loss": 0.7275, + "step": 68287 + }, + { + "epoch": 1.75, + "learning_rate": 7.802238593004819e-07, + "loss": 0.6875, + "step": 68288 + }, + { + "epoch": 1.75, + "learning_rate": 7.801968654641688e-07, + "loss": 0.562, + "step": 68289 + }, + { + "epoch": 1.75, + "learning_rate": 7.801698717961485e-07, + "loss": 0.6885, + "step": 68290 + }, + { + "epoch": 1.75, + "learning_rate": 7.801428782964424e-07, + "loss": 0.5723, + "step": 68291 + }, + { + "epoch": 1.75, + "learning_rate": 7.801158849650706e-07, + "loss": 0.626, + "step": 68292 + }, + { + "epoch": 1.75, + "learning_rate": 7.80088891802054e-07, + "loss": 0.8223, + "step": 68293 + }, + { + "epoch": 1.75, + "learning_rate": 7.800618988074132e-07, + "loss": 0.6973, + "step": 68294 + }, + { + "epoch": 1.75, + "learning_rate": 7.80034905981169e-07, + "loss": 0.7285, + "step": 68295 + }, + { + "epoch": 1.75, + "learning_rate": 7.80007913323342e-07, + "loss": 0.5414, + "step": 68296 + }, + { + "epoch": 1.75, + "learning_rate": 7.799809208339525e-07, + "loss": 0.6592, + "step": 68297 + }, + { + "epoch": 1.75, + "learning_rate": 7.799539285130221e-07, + "loss": 0.7637, + "step": 68298 + }, + { + "epoch": 1.75, + "learning_rate": 7.799269363605705e-07, + "loss": 0.7119, + "step": 68299 + }, + { + "epoch": 1.75, + "learning_rate": 7.798999443766185e-07, + "loss": 0.5776, + "step": 68300 + }, + { + "epoch": 1.75, + "learning_rate": 7.798729525611874e-07, + "loss": 0.561, + "step": 68301 + }, + { + "epoch": 1.75, + "learning_rate": 7.798459609142971e-07, + "loss": 0.5859, + "step": 68302 + }, + { + "epoch": 1.75, + "learning_rate": 7.798189694359688e-07, + "loss": 0.666, + "step": 68303 + }, + { + "epoch": 1.75, + "learning_rate": 7.797919781262229e-07, + "loss": 0.5781, + "step": 68304 + }, + { + "epoch": 1.75, + "learning_rate": 7.797649869850802e-07, + "loss": 0.7363, + "step": 68305 + }, + { + "epoch": 1.75, + "learning_rate": 7.797379960125613e-07, + "loss": 0.5952, + "step": 68306 + }, + { + "epoch": 1.75, + "learning_rate": 7.79711005208687e-07, + "loss": 0.667, + "step": 68307 + }, + { + "epoch": 1.75, + "learning_rate": 7.796840145734781e-07, + "loss": 0.7256, + "step": 68308 + }, + { + "epoch": 1.75, + "learning_rate": 7.796570241069545e-07, + "loss": 0.5245, + "step": 68309 + }, + { + "epoch": 1.75, + "learning_rate": 7.796300338091378e-07, + "loss": 0.6509, + "step": 68310 + }, + { + "epoch": 1.75, + "learning_rate": 7.796030436800479e-07, + "loss": 0.7451, + "step": 68311 + }, + { + "epoch": 1.75, + "learning_rate": 7.795760537197059e-07, + "loss": 0.6636, + "step": 68312 + }, + { + "epoch": 1.75, + "learning_rate": 7.795490639281325e-07, + "loss": 0.4402, + "step": 68313 + }, + { + "epoch": 1.75, + "learning_rate": 7.795220743053481e-07, + "loss": 0.7646, + "step": 68314 + }, + { + "epoch": 1.75, + "learning_rate": 7.794950848513737e-07, + "loss": 0.6086, + "step": 68315 + }, + { + "epoch": 1.75, + "learning_rate": 7.794680955662295e-07, + "loss": 0.6392, + "step": 68316 + }, + { + "epoch": 1.75, + "learning_rate": 7.794411064499366e-07, + "loss": 0.5845, + "step": 68317 + }, + { + "epoch": 1.75, + "learning_rate": 7.794141175025159e-07, + "loss": 0.7002, + "step": 68318 + }, + { + "epoch": 1.75, + "learning_rate": 7.793871287239871e-07, + "loss": 0.6851, + "step": 68319 + }, + { + "epoch": 1.75, + "learning_rate": 7.793601401143717e-07, + "loss": 0.5508, + "step": 68320 + }, + { + "epoch": 1.75, + "learning_rate": 7.793331516736899e-07, + "loss": 0.6938, + "step": 68321 + }, + { + "epoch": 1.75, + "learning_rate": 7.793061634019628e-07, + "loss": 0.7471, + "step": 68322 + }, + { + "epoch": 1.75, + "learning_rate": 7.792791752992105e-07, + "loss": 0.6738, + "step": 68323 + }, + { + "epoch": 1.75, + "learning_rate": 7.792521873654543e-07, + "loss": 0.6689, + "step": 68324 + }, + { + "epoch": 1.75, + "learning_rate": 7.792251996007142e-07, + "loss": 0.6855, + "step": 68325 + }, + { + "epoch": 1.75, + "learning_rate": 7.791982120050115e-07, + "loss": 0.5479, + "step": 68326 + }, + { + "epoch": 1.75, + "learning_rate": 7.791712245783664e-07, + "loss": 0.5898, + "step": 68327 + }, + { + "epoch": 1.75, + "learning_rate": 7.791442373208001e-07, + "loss": 0.6953, + "step": 68328 + }, + { + "epoch": 1.75, + "learning_rate": 7.791172502323329e-07, + "loss": 0.5791, + "step": 68329 + }, + { + "epoch": 1.75, + "learning_rate": 7.790902633129853e-07, + "loss": 0.5342, + "step": 68330 + }, + { + "epoch": 1.75, + "learning_rate": 7.790632765627779e-07, + "loss": 0.7295, + "step": 68331 + }, + { + "epoch": 1.75, + "learning_rate": 7.790362899817317e-07, + "loss": 0.7012, + "step": 68332 + }, + { + "epoch": 1.75, + "learning_rate": 7.790093035698672e-07, + "loss": 0.5608, + "step": 68333 + }, + { + "epoch": 1.75, + "learning_rate": 7.789823173272053e-07, + "loss": 0.6606, + "step": 68334 + }, + { + "epoch": 1.75, + "learning_rate": 7.789553312537662e-07, + "loss": 0.4453, + "step": 68335 + }, + { + "epoch": 1.75, + "learning_rate": 7.789283453495712e-07, + "loss": 0.5164, + "step": 68336 + }, + { + "epoch": 1.75, + "learning_rate": 7.789013596146402e-07, + "loss": 0.6108, + "step": 68337 + }, + { + "epoch": 1.75, + "learning_rate": 7.788743740489948e-07, + "loss": 0.5283, + "step": 68338 + }, + { + "epoch": 1.75, + "learning_rate": 7.788473886526549e-07, + "loss": 0.6841, + "step": 68339 + }, + { + "epoch": 1.75, + "learning_rate": 7.788204034256411e-07, + "loss": 0.6611, + "step": 68340 + }, + { + "epoch": 1.75, + "learning_rate": 7.787934183679746e-07, + "loss": 0.6162, + "step": 68341 + }, + { + "epoch": 1.75, + "learning_rate": 7.787664334796757e-07, + "loss": 0.5381, + "step": 68342 + }, + { + "epoch": 1.75, + "learning_rate": 7.787394487607653e-07, + "loss": 0.4832, + "step": 68343 + }, + { + "epoch": 1.75, + "learning_rate": 7.787124642112637e-07, + "loss": 0.6152, + "step": 68344 + }, + { + "epoch": 1.75, + "learning_rate": 7.786854798311921e-07, + "loss": 0.7998, + "step": 68345 + }, + { + "epoch": 1.75, + "learning_rate": 7.786584956205704e-07, + "loss": 0.4814, + "step": 68346 + }, + { + "epoch": 1.75, + "learning_rate": 7.786315115794202e-07, + "loss": 0.6318, + "step": 68347 + }, + { + "epoch": 1.75, + "learning_rate": 7.786045277077617e-07, + "loss": 0.6514, + "step": 68348 + }, + { + "epoch": 1.75, + "learning_rate": 7.785775440056154e-07, + "loss": 0.5554, + "step": 68349 + }, + { + "epoch": 1.75, + "learning_rate": 7.785505604730018e-07, + "loss": 0.6201, + "step": 68350 + }, + { + "epoch": 1.75, + "learning_rate": 7.785235771099422e-07, + "loss": 0.4951, + "step": 68351 + }, + { + "epoch": 1.75, + "learning_rate": 7.784965939164566e-07, + "loss": 0.6858, + "step": 68352 + }, + { + "epoch": 1.75, + "learning_rate": 7.784696108925663e-07, + "loss": 0.6284, + "step": 68353 + }, + { + "epoch": 1.75, + "learning_rate": 7.784426280382913e-07, + "loss": 0.6982, + "step": 68354 + }, + { + "epoch": 1.75, + "learning_rate": 7.784156453536528e-07, + "loss": 0.5186, + "step": 68355 + }, + { + "epoch": 1.75, + "learning_rate": 7.783886628386711e-07, + "loss": 0.4883, + "step": 68356 + }, + { + "epoch": 1.75, + "learning_rate": 7.783616804933673e-07, + "loss": 0.6211, + "step": 68357 + }, + { + "epoch": 1.75, + "learning_rate": 7.783346983177619e-07, + "loss": 0.5693, + "step": 68358 + }, + { + "epoch": 1.75, + "learning_rate": 7.78307716311875e-07, + "loss": 0.7383, + "step": 68359 + }, + { + "epoch": 1.75, + "learning_rate": 7.782807344757278e-07, + "loss": 0.8438, + "step": 68360 + }, + { + "epoch": 1.75, + "learning_rate": 7.782537528093407e-07, + "loss": 0.5786, + "step": 68361 + }, + { + "epoch": 1.75, + "learning_rate": 7.782267713127349e-07, + "loss": 0.6323, + "step": 68362 + }, + { + "epoch": 1.75, + "learning_rate": 7.781997899859301e-07, + "loss": 0.5576, + "step": 68363 + }, + { + "epoch": 1.75, + "learning_rate": 7.781728088289481e-07, + "loss": 0.6763, + "step": 68364 + }, + { + "epoch": 1.75, + "learning_rate": 7.781458278418085e-07, + "loss": 0.8428, + "step": 68365 + }, + { + "epoch": 1.75, + "learning_rate": 7.781188470245328e-07, + "loss": 0.541, + "step": 68366 + }, + { + "epoch": 1.75, + "learning_rate": 7.780918663771409e-07, + "loss": 0.6938, + "step": 68367 + }, + { + "epoch": 1.75, + "learning_rate": 7.780648858996548e-07, + "loss": 0.5234, + "step": 68368 + }, + { + "epoch": 1.75, + "learning_rate": 7.780379055920934e-07, + "loss": 0.6323, + "step": 68369 + }, + { + "epoch": 1.75, + "learning_rate": 7.780109254544783e-07, + "loss": 0.52, + "step": 68370 + }, + { + "epoch": 1.75, + "learning_rate": 7.7798394548683e-07, + "loss": 0.8574, + "step": 68371 + }, + { + "epoch": 1.75, + "learning_rate": 7.779569656891693e-07, + "loss": 0.792, + "step": 68372 + }, + { + "epoch": 1.75, + "learning_rate": 7.779299860615165e-07, + "loss": 0.6543, + "step": 68373 + }, + { + "epoch": 1.75, + "learning_rate": 7.779030066038928e-07, + "loss": 0.7212, + "step": 68374 + }, + { + "epoch": 1.75, + "learning_rate": 7.778760273163182e-07, + "loss": 0.8467, + "step": 68375 + }, + { + "epoch": 1.75, + "learning_rate": 7.77849048198814e-07, + "loss": 0.6455, + "step": 68376 + }, + { + "epoch": 1.75, + "learning_rate": 7.778220692514003e-07, + "loss": 0.7656, + "step": 68377 + }, + { + "epoch": 1.75, + "learning_rate": 7.777950904740985e-07, + "loss": 0.6016, + "step": 68378 + }, + { + "epoch": 1.75, + "learning_rate": 7.777681118669286e-07, + "loss": 0.6846, + "step": 68379 + }, + { + "epoch": 1.75, + "learning_rate": 7.777411334299113e-07, + "loss": 0.6768, + "step": 68380 + }, + { + "epoch": 1.75, + "learning_rate": 7.777141551630675e-07, + "loss": 0.7412, + "step": 68381 + }, + { + "epoch": 1.75, + "learning_rate": 7.776871770664175e-07, + "loss": 0.7158, + "step": 68382 + }, + { + "epoch": 1.75, + "learning_rate": 7.776601991399825e-07, + "loss": 0.665, + "step": 68383 + }, + { + "epoch": 1.75, + "learning_rate": 7.776332213837826e-07, + "loss": 0.6797, + "step": 68384 + }, + { + "epoch": 1.75, + "learning_rate": 7.776062437978389e-07, + "loss": 0.6904, + "step": 68385 + }, + { + "epoch": 1.75, + "learning_rate": 7.77579266382172e-07, + "loss": 0.6182, + "step": 68386 + }, + { + "epoch": 1.75, + "learning_rate": 7.775522891368021e-07, + "loss": 0.6357, + "step": 68387 + }, + { + "epoch": 1.75, + "learning_rate": 7.775253120617506e-07, + "loss": 0.5457, + "step": 68388 + }, + { + "epoch": 1.75, + "learning_rate": 7.774983351570376e-07, + "loss": 0.6377, + "step": 68389 + }, + { + "epoch": 1.75, + "learning_rate": 7.774713584226838e-07, + "loss": 0.709, + "step": 68390 + }, + { + "epoch": 1.75, + "learning_rate": 7.774443818587098e-07, + "loss": 0.7764, + "step": 68391 + }, + { + "epoch": 1.75, + "learning_rate": 7.774174054651366e-07, + "loss": 0.7256, + "step": 68392 + }, + { + "epoch": 1.75, + "learning_rate": 7.773904292419846e-07, + "loss": 0.5327, + "step": 68393 + }, + { + "epoch": 1.75, + "learning_rate": 7.773634531892743e-07, + "loss": 0.4839, + "step": 68394 + }, + { + "epoch": 1.75, + "learning_rate": 7.773364773070269e-07, + "loss": 0.5215, + "step": 68395 + }, + { + "epoch": 1.75, + "learning_rate": 7.773095015952625e-07, + "loss": 0.7676, + "step": 68396 + }, + { + "epoch": 1.75, + "learning_rate": 7.772825260540021e-07, + "loss": 0.4886, + "step": 68397 + }, + { + "epoch": 1.75, + "learning_rate": 7.772555506832665e-07, + "loss": 0.5508, + "step": 68398 + }, + { + "epoch": 1.75, + "learning_rate": 7.772285754830756e-07, + "loss": 0.7354, + "step": 68399 + }, + { + "epoch": 1.75, + "learning_rate": 7.77201600453451e-07, + "loss": 0.4409, + "step": 68400 + }, + { + "epoch": 1.75, + "learning_rate": 7.771746255944124e-07, + "loss": 0.5747, + "step": 68401 + }, + { + "epoch": 1.75, + "learning_rate": 7.771476509059812e-07, + "loss": 0.4113, + "step": 68402 + }, + { + "epoch": 1.75, + "learning_rate": 7.771206763881779e-07, + "loss": 0.5767, + "step": 68403 + }, + { + "epoch": 1.75, + "learning_rate": 7.770937020410226e-07, + "loss": 0.5342, + "step": 68404 + }, + { + "epoch": 1.75, + "learning_rate": 7.770667278645368e-07, + "loss": 0.6182, + "step": 68405 + }, + { + "epoch": 1.75, + "learning_rate": 7.770397538587407e-07, + "loss": 0.6143, + "step": 68406 + }, + { + "epoch": 1.75, + "learning_rate": 7.77012780023655e-07, + "loss": 0.4905, + "step": 68407 + }, + { + "epoch": 1.75, + "learning_rate": 7.769858063593007e-07, + "loss": 0.5015, + "step": 68408 + }, + { + "epoch": 1.75, + "learning_rate": 7.769588328656975e-07, + "loss": 0.7246, + "step": 68409 + }, + { + "epoch": 1.75, + "learning_rate": 7.76931859542867e-07, + "loss": 0.6299, + "step": 68410 + }, + { + "epoch": 1.75, + "learning_rate": 7.769048863908293e-07, + "loss": 0.5203, + "step": 68411 + }, + { + "epoch": 1.75, + "learning_rate": 7.768779134096055e-07, + "loss": 0.6934, + "step": 68412 + }, + { + "epoch": 1.75, + "learning_rate": 7.768509405992157e-07, + "loss": 0.6216, + "step": 68413 + }, + { + "epoch": 1.75, + "learning_rate": 7.768239679596812e-07, + "loss": 0.6433, + "step": 68414 + }, + { + "epoch": 1.75, + "learning_rate": 7.767969954910221e-07, + "loss": 0.6426, + "step": 68415 + }, + { + "epoch": 1.75, + "learning_rate": 7.767700231932595e-07, + "loss": 0.6133, + "step": 68416 + }, + { + "epoch": 1.75, + "learning_rate": 7.767430510664135e-07, + "loss": 0.4834, + "step": 68417 + }, + { + "epoch": 1.75, + "learning_rate": 7.767160791105056e-07, + "loss": 0.52, + "step": 68418 + }, + { + "epoch": 1.75, + "learning_rate": 7.766891073255558e-07, + "loss": 0.5486, + "step": 68419 + }, + { + "epoch": 1.75, + "learning_rate": 7.766621357115847e-07, + "loss": 0.6865, + "step": 68420 + }, + { + "epoch": 1.75, + "learning_rate": 7.766351642686131e-07, + "loss": 0.6743, + "step": 68421 + }, + { + "epoch": 1.75, + "learning_rate": 7.766081929966619e-07, + "loss": 0.5977, + "step": 68422 + }, + { + "epoch": 1.75, + "learning_rate": 7.765812218957513e-07, + "loss": 0.6167, + "step": 68423 + }, + { + "epoch": 1.75, + "learning_rate": 7.765542509659022e-07, + "loss": 0.5986, + "step": 68424 + }, + { + "epoch": 1.75, + "learning_rate": 7.765272802071352e-07, + "loss": 0.7686, + "step": 68425 + }, + { + "epoch": 1.75, + "learning_rate": 7.765003096194711e-07, + "loss": 0.3273, + "step": 68426 + }, + { + "epoch": 1.75, + "learning_rate": 7.764733392029303e-07, + "loss": 0.5986, + "step": 68427 + }, + { + "epoch": 1.75, + "learning_rate": 7.764463689575341e-07, + "loss": 0.5876, + "step": 68428 + }, + { + "epoch": 1.75, + "learning_rate": 7.764193988833022e-07, + "loss": 0.5791, + "step": 68429 + }, + { + "epoch": 1.75, + "learning_rate": 7.763924289802557e-07, + "loss": 0.5312, + "step": 68430 + }, + { + "epoch": 1.75, + "learning_rate": 7.763654592484152e-07, + "loss": 0.562, + "step": 68431 + }, + { + "epoch": 1.75, + "learning_rate": 7.763384896878014e-07, + "loss": 0.6992, + "step": 68432 + }, + { + "epoch": 1.75, + "learning_rate": 7.763115202984351e-07, + "loss": 0.5603, + "step": 68433 + }, + { + "epoch": 1.75, + "learning_rate": 7.762845510803364e-07, + "loss": 0.6426, + "step": 68434 + }, + { + "epoch": 1.75, + "learning_rate": 7.762575820335268e-07, + "loss": 0.4414, + "step": 68435 + }, + { + "epoch": 1.75, + "learning_rate": 7.76230613158026e-07, + "loss": 0.5571, + "step": 68436 + }, + { + "epoch": 1.75, + "learning_rate": 7.762036444538556e-07, + "loss": 0.6206, + "step": 68437 + }, + { + "epoch": 1.75, + "learning_rate": 7.761766759210358e-07, + "loss": 0.6001, + "step": 68438 + }, + { + "epoch": 1.75, + "learning_rate": 7.761497075595872e-07, + "loss": 0.6289, + "step": 68439 + }, + { + "epoch": 1.75, + "learning_rate": 7.761227393695301e-07, + "loss": 0.6924, + "step": 68440 + }, + { + "epoch": 1.75, + "learning_rate": 7.760957713508858e-07, + "loss": 0.7832, + "step": 68441 + }, + { + "epoch": 1.75, + "learning_rate": 7.760688035036745e-07, + "loss": 0.6013, + "step": 68442 + }, + { + "epoch": 1.75, + "learning_rate": 7.760418358279172e-07, + "loss": 0.6182, + "step": 68443 + }, + { + "epoch": 1.75, + "learning_rate": 7.76014868323634e-07, + "loss": 0.6772, + "step": 68444 + }, + { + "epoch": 1.75, + "learning_rate": 7.759879009908463e-07, + "loss": 0.5093, + "step": 68445 + }, + { + "epoch": 1.75, + "learning_rate": 7.759609338295741e-07, + "loss": 0.625, + "step": 68446 + }, + { + "epoch": 1.75, + "learning_rate": 7.759339668398386e-07, + "loss": 0.7437, + "step": 68447 + }, + { + "epoch": 1.75, + "learning_rate": 7.759070000216604e-07, + "loss": 0.5723, + "step": 68448 + }, + { + "epoch": 1.75, + "learning_rate": 7.758800333750594e-07, + "loss": 0.6255, + "step": 68449 + }, + { + "epoch": 1.75, + "learning_rate": 7.75853066900057e-07, + "loss": 0.5967, + "step": 68450 + }, + { + "epoch": 1.75, + "learning_rate": 7.758261005966733e-07, + "loss": 0.7109, + "step": 68451 + }, + { + "epoch": 1.75, + "learning_rate": 7.757991344649295e-07, + "loss": 0.6597, + "step": 68452 + }, + { + "epoch": 1.75, + "learning_rate": 7.757721685048457e-07, + "loss": 0.5859, + "step": 68453 + }, + { + "epoch": 1.75, + "learning_rate": 7.757452027164431e-07, + "loss": 0.4956, + "step": 68454 + }, + { + "epoch": 1.75, + "learning_rate": 7.757182370997421e-07, + "loss": 0.6785, + "step": 68455 + }, + { + "epoch": 1.75, + "learning_rate": 7.756912716547632e-07, + "loss": 0.522, + "step": 68456 + }, + { + "epoch": 1.75, + "learning_rate": 7.756643063815272e-07, + "loss": 0.6562, + "step": 68457 + }, + { + "epoch": 1.75, + "learning_rate": 7.756373412800553e-07, + "loss": 0.4312, + "step": 68458 + }, + { + "epoch": 1.75, + "learning_rate": 7.75610376350367e-07, + "loss": 0.7158, + "step": 68459 + }, + { + "epoch": 1.75, + "learning_rate": 7.755834115924837e-07, + "loss": 0.7227, + "step": 68460 + }, + { + "epoch": 1.75, + "learning_rate": 7.755564470064255e-07, + "loss": 0.7871, + "step": 68461 + }, + { + "epoch": 1.75, + "learning_rate": 7.755294825922137e-07, + "loss": 0.8496, + "step": 68462 + }, + { + "epoch": 1.75, + "learning_rate": 7.755025183498685e-07, + "loss": 0.5986, + "step": 68463 + }, + { + "epoch": 1.75, + "learning_rate": 7.754755542794109e-07, + "loss": 0.6572, + "step": 68464 + }, + { + "epoch": 1.75, + "learning_rate": 7.75448590380861e-07, + "loss": 0.4089, + "step": 68465 + }, + { + "epoch": 1.75, + "learning_rate": 7.754216266542401e-07, + "loss": 0.6069, + "step": 68466 + }, + { + "epoch": 1.75, + "learning_rate": 7.753946630995684e-07, + "loss": 0.5342, + "step": 68467 + }, + { + "epoch": 1.75, + "learning_rate": 7.753676997168671e-07, + "loss": 0.6133, + "step": 68468 + }, + { + "epoch": 1.75, + "learning_rate": 7.753407365061562e-07, + "loss": 0.7705, + "step": 68469 + }, + { + "epoch": 1.75, + "learning_rate": 7.753137734674563e-07, + "loss": 0.4678, + "step": 68470 + }, + { + "epoch": 1.75, + "learning_rate": 7.752868106007885e-07, + "loss": 0.7144, + "step": 68471 + }, + { + "epoch": 1.75, + "learning_rate": 7.75259847906173e-07, + "loss": 0.5518, + "step": 68472 + }, + { + "epoch": 1.75, + "learning_rate": 7.75232885383631e-07, + "loss": 0.6426, + "step": 68473 + }, + { + "epoch": 1.76, + "learning_rate": 7.752059230331826e-07, + "loss": 0.8447, + "step": 68474 + }, + { + "epoch": 1.76, + "learning_rate": 7.75178960854849e-07, + "loss": 0.533, + "step": 68475 + }, + { + "epoch": 1.76, + "learning_rate": 7.751519988486504e-07, + "loss": 0.5693, + "step": 68476 + }, + { + "epoch": 1.76, + "learning_rate": 7.751250370146074e-07, + "loss": 0.5815, + "step": 68477 + }, + { + "epoch": 1.76, + "learning_rate": 7.750980753527413e-07, + "loss": 0.6733, + "step": 68478 + }, + { + "epoch": 1.76, + "learning_rate": 7.750711138630721e-07, + "loss": 0.5713, + "step": 68479 + }, + { + "epoch": 1.76, + "learning_rate": 7.750441525456203e-07, + "loss": 0.8271, + "step": 68480 + }, + { + "epoch": 1.76, + "learning_rate": 7.75017191400407e-07, + "loss": 0.6704, + "step": 68481 + }, + { + "epoch": 1.76, + "learning_rate": 7.749902304274526e-07, + "loss": 0.5469, + "step": 68482 + }, + { + "epoch": 1.76, + "learning_rate": 7.74963269626778e-07, + "loss": 0.6138, + "step": 68483 + }, + { + "epoch": 1.76, + "learning_rate": 7.749363089984033e-07, + "loss": 0.5859, + "step": 68484 + }, + { + "epoch": 1.76, + "learning_rate": 7.7490934854235e-07, + "loss": 0.5728, + "step": 68485 + }, + { + "epoch": 1.76, + "learning_rate": 7.74882388258638e-07, + "loss": 0.5774, + "step": 68486 + }, + { + "epoch": 1.76, + "learning_rate": 7.748554281472883e-07, + "loss": 0.6318, + "step": 68487 + }, + { + "epoch": 1.76, + "learning_rate": 7.748284682083217e-07, + "loss": 0.7554, + "step": 68488 + }, + { + "epoch": 1.76, + "learning_rate": 7.748015084417582e-07, + "loss": 0.7266, + "step": 68489 + }, + { + "epoch": 1.76, + "learning_rate": 7.74774548847619e-07, + "loss": 0.6758, + "step": 68490 + }, + { + "epoch": 1.76, + "learning_rate": 7.747475894259243e-07, + "loss": 0.6328, + "step": 68491 + }, + { + "epoch": 1.76, + "learning_rate": 7.747206301766955e-07, + "loss": 0.4814, + "step": 68492 + }, + { + "epoch": 1.76, + "learning_rate": 7.746936710999524e-07, + "loss": 0.5305, + "step": 68493 + }, + { + "epoch": 1.76, + "learning_rate": 7.74666712195716e-07, + "loss": 0.5405, + "step": 68494 + }, + { + "epoch": 1.76, + "learning_rate": 7.746397534640071e-07, + "loss": 0.6377, + "step": 68495 + }, + { + "epoch": 1.76, + "learning_rate": 7.74612794904846e-07, + "loss": 0.5796, + "step": 68496 + }, + { + "epoch": 1.76, + "learning_rate": 7.745858365182535e-07, + "loss": 0.6104, + "step": 68497 + }, + { + "epoch": 1.76, + "learning_rate": 7.745588783042508e-07, + "loss": 0.5522, + "step": 68498 + }, + { + "epoch": 1.76, + "learning_rate": 7.745319202628574e-07, + "loss": 0.6934, + "step": 68499 + }, + { + "epoch": 1.76, + "learning_rate": 7.745049623940948e-07, + "loss": 0.626, + "step": 68500 + }, + { + "epoch": 1.76, + "learning_rate": 7.744780046979832e-07, + "loss": 0.6519, + "step": 68501 + }, + { + "epoch": 1.76, + "learning_rate": 7.744510471745436e-07, + "loss": 0.5952, + "step": 68502 + }, + { + "epoch": 1.76, + "learning_rate": 7.744240898237963e-07, + "loss": 0.7129, + "step": 68503 + }, + { + "epoch": 1.76, + "learning_rate": 7.743971326457622e-07, + "loss": 0.6621, + "step": 68504 + }, + { + "epoch": 1.76, + "learning_rate": 7.743701756404617e-07, + "loss": 0.5605, + "step": 68505 + }, + { + "epoch": 1.76, + "learning_rate": 7.743432188079157e-07, + "loss": 0.5171, + "step": 68506 + }, + { + "epoch": 1.76, + "learning_rate": 7.743162621481447e-07, + "loss": 0.6543, + "step": 68507 + }, + { + "epoch": 1.76, + "learning_rate": 7.742893056611697e-07, + "loss": 0.5278, + "step": 68508 + }, + { + "epoch": 1.76, + "learning_rate": 7.742623493470107e-07, + "loss": 0.5859, + "step": 68509 + }, + { + "epoch": 1.76, + "learning_rate": 7.742353932056885e-07, + "loss": 0.4253, + "step": 68510 + }, + { + "epoch": 1.76, + "learning_rate": 7.742084372372241e-07, + "loss": 0.7432, + "step": 68511 + }, + { + "epoch": 1.76, + "learning_rate": 7.741814814416379e-07, + "loss": 0.4819, + "step": 68512 + }, + { + "epoch": 1.76, + "learning_rate": 7.741545258189503e-07, + "loss": 0.6035, + "step": 68513 + }, + { + "epoch": 1.76, + "learning_rate": 7.741275703691826e-07, + "loss": 0.4594, + "step": 68514 + }, + { + "epoch": 1.76, + "learning_rate": 7.741006150923546e-07, + "loss": 0.6592, + "step": 68515 + }, + { + "epoch": 1.76, + "learning_rate": 7.740736599884876e-07, + "loss": 0.6475, + "step": 68516 + }, + { + "epoch": 1.76, + "learning_rate": 7.740467050576019e-07, + "loss": 0.7832, + "step": 68517 + }, + { + "epoch": 1.76, + "learning_rate": 7.740197502997186e-07, + "loss": 0.6426, + "step": 68518 + }, + { + "epoch": 1.76, + "learning_rate": 7.739927957148577e-07, + "loss": 0.6494, + "step": 68519 + }, + { + "epoch": 1.76, + "learning_rate": 7.739658413030401e-07, + "loss": 0.5435, + "step": 68520 + }, + { + "epoch": 1.76, + "learning_rate": 7.739388870642867e-07, + "loss": 0.6865, + "step": 68521 + }, + { + "epoch": 1.76, + "learning_rate": 7.739119329986174e-07, + "loss": 0.3762, + "step": 68522 + }, + { + "epoch": 1.76, + "learning_rate": 7.738849791060538e-07, + "loss": 0.458, + "step": 68523 + }, + { + "epoch": 1.76, + "learning_rate": 7.738580253866158e-07, + "loss": 0.7446, + "step": 68524 + }, + { + "epoch": 1.76, + "learning_rate": 7.738310718403245e-07, + "loss": 0.5679, + "step": 68525 + }, + { + "epoch": 1.76, + "learning_rate": 7.738041184672002e-07, + "loss": 0.6758, + "step": 68526 + }, + { + "epoch": 1.76, + "learning_rate": 7.737771652672637e-07, + "loss": 0.8613, + "step": 68527 + }, + { + "epoch": 1.76, + "learning_rate": 7.737502122405362e-07, + "loss": 0.6943, + "step": 68528 + }, + { + "epoch": 1.76, + "learning_rate": 7.737232593870372e-07, + "loss": 0.5479, + "step": 68529 + }, + { + "epoch": 1.76, + "learning_rate": 7.736963067067878e-07, + "loss": 0.4258, + "step": 68530 + }, + { + "epoch": 1.76, + "learning_rate": 7.736693541998089e-07, + "loss": 0.6787, + "step": 68531 + }, + { + "epoch": 1.76, + "learning_rate": 7.73642401866121e-07, + "loss": 0.6311, + "step": 68532 + }, + { + "epoch": 1.76, + "learning_rate": 7.736154497057447e-07, + "loss": 0.6299, + "step": 68533 + }, + { + "epoch": 1.76, + "learning_rate": 7.735884977187003e-07, + "loss": 0.5732, + "step": 68534 + }, + { + "epoch": 1.76, + "learning_rate": 7.735615459050092e-07, + "loss": 0.6084, + "step": 68535 + }, + { + "epoch": 1.76, + "learning_rate": 7.735345942646913e-07, + "loss": 0.6846, + "step": 68536 + }, + { + "epoch": 1.76, + "learning_rate": 7.735076427977679e-07, + "loss": 0.6455, + "step": 68537 + }, + { + "epoch": 1.76, + "learning_rate": 7.734806915042594e-07, + "loss": 0.627, + "step": 68538 + }, + { + "epoch": 1.76, + "learning_rate": 7.734537403841859e-07, + "loss": 0.6641, + "step": 68539 + }, + { + "epoch": 1.76, + "learning_rate": 7.734267894375687e-07, + "loss": 0.6553, + "step": 68540 + }, + { + "epoch": 1.76, + "learning_rate": 7.733998386644279e-07, + "loss": 0.5498, + "step": 68541 + }, + { + "epoch": 1.76, + "learning_rate": 7.733728880647848e-07, + "loss": 0.5483, + "step": 68542 + }, + { + "epoch": 1.76, + "learning_rate": 7.733459376386592e-07, + "loss": 0.6909, + "step": 68543 + }, + { + "epoch": 1.76, + "learning_rate": 7.733189873860726e-07, + "loss": 0.5625, + "step": 68544 + }, + { + "epoch": 1.76, + "learning_rate": 7.732920373070449e-07, + "loss": 0.6982, + "step": 68545 + }, + { + "epoch": 1.76, + "learning_rate": 7.732650874015973e-07, + "loss": 0.8184, + "step": 68546 + }, + { + "epoch": 1.76, + "learning_rate": 7.7323813766975e-07, + "loss": 0.7666, + "step": 68547 + }, + { + "epoch": 1.76, + "learning_rate": 7.732111881115245e-07, + "loss": 0.3745, + "step": 68548 + }, + { + "epoch": 1.76, + "learning_rate": 7.7318423872694e-07, + "loss": 0.4338, + "step": 68549 + }, + { + "epoch": 1.76, + "learning_rate": 7.731572895160183e-07, + "loss": 0.5056, + "step": 68550 + }, + { + "epoch": 1.76, + "learning_rate": 7.731303404787793e-07, + "loss": 0.5531, + "step": 68551 + }, + { + "epoch": 1.76, + "learning_rate": 7.731033916152443e-07, + "loss": 0.707, + "step": 68552 + }, + { + "epoch": 1.76, + "learning_rate": 7.730764429254333e-07, + "loss": 0.7012, + "step": 68553 + }, + { + "epoch": 1.76, + "learning_rate": 7.730494944093674e-07, + "loss": 0.6631, + "step": 68554 + }, + { + "epoch": 1.76, + "learning_rate": 7.73022546067067e-07, + "loss": 0.5859, + "step": 68555 + }, + { + "epoch": 1.76, + "learning_rate": 7.729955978985528e-07, + "loss": 0.6499, + "step": 68556 + }, + { + "epoch": 1.76, + "learning_rate": 7.729686499038454e-07, + "loss": 0.6406, + "step": 68557 + }, + { + "epoch": 1.76, + "learning_rate": 7.729417020829658e-07, + "loss": 0.6455, + "step": 68558 + }, + { + "epoch": 1.76, + "learning_rate": 7.729147544359341e-07, + "loss": 0.6377, + "step": 68559 + }, + { + "epoch": 1.76, + "learning_rate": 7.728878069627709e-07, + "loss": 0.6992, + "step": 68560 + }, + { + "epoch": 1.76, + "learning_rate": 7.728608596634974e-07, + "loss": 0.6191, + "step": 68561 + }, + { + "epoch": 1.76, + "learning_rate": 7.728339125381336e-07, + "loss": 0.7705, + "step": 68562 + }, + { + "epoch": 1.76, + "learning_rate": 7.728069655867005e-07, + "loss": 0.7715, + "step": 68563 + }, + { + "epoch": 1.76, + "learning_rate": 7.727800188092186e-07, + "loss": 0.4717, + "step": 68564 + }, + { + "epoch": 1.76, + "learning_rate": 7.727530722057087e-07, + "loss": 0.6255, + "step": 68565 + }, + { + "epoch": 1.76, + "learning_rate": 7.727261257761915e-07, + "loss": 0.6592, + "step": 68566 + }, + { + "epoch": 1.76, + "learning_rate": 7.726991795206877e-07, + "loss": 0.5859, + "step": 68567 + }, + { + "epoch": 1.76, + "learning_rate": 7.726722334392171e-07, + "loss": 0.7017, + "step": 68568 + }, + { + "epoch": 1.76, + "learning_rate": 7.72645287531801e-07, + "loss": 0.6543, + "step": 68569 + }, + { + "epoch": 1.76, + "learning_rate": 7.7261834179846e-07, + "loss": 0.3845, + "step": 68570 + }, + { + "epoch": 1.76, + "learning_rate": 7.725913962392148e-07, + "loss": 0.6401, + "step": 68571 + }, + { + "epoch": 1.76, + "learning_rate": 7.725644508540856e-07, + "loss": 0.6145, + "step": 68572 + }, + { + "epoch": 1.76, + "learning_rate": 7.725375056430937e-07, + "loss": 0.6357, + "step": 68573 + }, + { + "epoch": 1.76, + "learning_rate": 7.725105606062591e-07, + "loss": 0.4558, + "step": 68574 + }, + { + "epoch": 1.76, + "learning_rate": 7.72483615743603e-07, + "loss": 0.667, + "step": 68575 + }, + { + "epoch": 1.76, + "learning_rate": 7.724566710551453e-07, + "loss": 0.5669, + "step": 68576 + }, + { + "epoch": 1.76, + "learning_rate": 7.724297265409077e-07, + "loss": 0.7012, + "step": 68577 + }, + { + "epoch": 1.76, + "learning_rate": 7.724027822009099e-07, + "loss": 0.6074, + "step": 68578 + }, + { + "epoch": 1.76, + "learning_rate": 7.723758380351725e-07, + "loss": 0.6035, + "step": 68579 + }, + { + "epoch": 1.76, + "learning_rate": 7.72348894043717e-07, + "loss": 0.7583, + "step": 68580 + }, + { + "epoch": 1.76, + "learning_rate": 7.72321950226563e-07, + "loss": 0.6841, + "step": 68581 + }, + { + "epoch": 1.76, + "learning_rate": 7.722950065837319e-07, + "loss": 0.6516, + "step": 68582 + }, + { + "epoch": 1.76, + "learning_rate": 7.722680631152441e-07, + "loss": 0.5718, + "step": 68583 + }, + { + "epoch": 1.76, + "learning_rate": 7.722411198211198e-07, + "loss": 0.6387, + "step": 68584 + }, + { + "epoch": 1.76, + "learning_rate": 7.722141767013803e-07, + "loss": 0.5488, + "step": 68585 + }, + { + "epoch": 1.76, + "learning_rate": 7.721872337560458e-07, + "loss": 0.5635, + "step": 68586 + }, + { + "epoch": 1.76, + "learning_rate": 7.721602909851375e-07, + "loss": 0.4854, + "step": 68587 + }, + { + "epoch": 1.76, + "learning_rate": 7.721333483886752e-07, + "loss": 0.6875, + "step": 68588 + }, + { + "epoch": 1.76, + "learning_rate": 7.721064059666798e-07, + "loss": 0.583, + "step": 68589 + }, + { + "epoch": 1.76, + "learning_rate": 7.720794637191722e-07, + "loss": 0.5898, + "step": 68590 + }, + { + "epoch": 1.76, + "learning_rate": 7.720525216461728e-07, + "loss": 0.6729, + "step": 68591 + }, + { + "epoch": 1.76, + "learning_rate": 7.720255797477025e-07, + "loss": 0.6904, + "step": 68592 + }, + { + "epoch": 1.76, + "learning_rate": 7.719986380237813e-07, + "loss": 0.7798, + "step": 68593 + }, + { + "epoch": 1.76, + "learning_rate": 7.719716964744306e-07, + "loss": 0.7002, + "step": 68594 + }, + { + "epoch": 1.76, + "learning_rate": 7.719447550996705e-07, + "loss": 0.666, + "step": 68595 + }, + { + "epoch": 1.76, + "learning_rate": 7.71917813899522e-07, + "loss": 0.5898, + "step": 68596 + }, + { + "epoch": 1.76, + "learning_rate": 7.718908728740059e-07, + "loss": 0.6836, + "step": 68597 + }, + { + "epoch": 1.76, + "learning_rate": 7.718639320231419e-07, + "loss": 0.6758, + "step": 68598 + }, + { + "epoch": 1.76, + "learning_rate": 7.718369913469514e-07, + "loss": 0.7051, + "step": 68599 + }, + { + "epoch": 1.76, + "learning_rate": 7.718100508454546e-07, + "loss": 0.627, + "step": 68600 + }, + { + "epoch": 1.76, + "learning_rate": 7.717831105186726e-07, + "loss": 0.5747, + "step": 68601 + }, + { + "epoch": 1.76, + "learning_rate": 7.717561703666259e-07, + "loss": 0.7549, + "step": 68602 + }, + { + "epoch": 1.76, + "learning_rate": 7.717292303893346e-07, + "loss": 0.6143, + "step": 68603 + }, + { + "epoch": 1.76, + "learning_rate": 7.7170229058682e-07, + "loss": 0.6514, + "step": 68604 + }, + { + "epoch": 1.76, + "learning_rate": 7.716753509591023e-07, + "loss": 0.6816, + "step": 68605 + }, + { + "epoch": 1.76, + "learning_rate": 7.716484115062026e-07, + "loss": 0.5532, + "step": 68606 + }, + { + "epoch": 1.76, + "learning_rate": 7.716214722281412e-07, + "loss": 0.8662, + "step": 68607 + }, + { + "epoch": 1.76, + "learning_rate": 7.715945331249383e-07, + "loss": 0.6709, + "step": 68608 + }, + { + "epoch": 1.76, + "learning_rate": 7.715675941966153e-07, + "loss": 0.8389, + "step": 68609 + }, + { + "epoch": 1.76, + "learning_rate": 7.715406554431923e-07, + "loss": 0.6787, + "step": 68610 + }, + { + "epoch": 1.76, + "learning_rate": 7.715137168646903e-07, + "loss": 0.6777, + "step": 68611 + }, + { + "epoch": 1.76, + "learning_rate": 7.714867784611295e-07, + "loss": 0.582, + "step": 68612 + }, + { + "epoch": 1.76, + "learning_rate": 7.714598402325309e-07, + "loss": 0.7314, + "step": 68613 + }, + { + "epoch": 1.76, + "learning_rate": 7.71432902178915e-07, + "loss": 0.5732, + "step": 68614 + }, + { + "epoch": 1.76, + "learning_rate": 7.714059643003025e-07, + "loss": 0.6165, + "step": 68615 + }, + { + "epoch": 1.76, + "learning_rate": 7.713790265967137e-07, + "loss": 0.5608, + "step": 68616 + }, + { + "epoch": 1.76, + "learning_rate": 7.713520890681699e-07, + "loss": 0.4237, + "step": 68617 + }, + { + "epoch": 1.76, + "learning_rate": 7.713251517146911e-07, + "loss": 0.8184, + "step": 68618 + }, + { + "epoch": 1.76, + "learning_rate": 7.712982145362982e-07, + "loss": 0.6187, + "step": 68619 + }, + { + "epoch": 1.76, + "learning_rate": 7.712712775330115e-07, + "loss": 0.5562, + "step": 68620 + }, + { + "epoch": 1.76, + "learning_rate": 7.712443407048519e-07, + "loss": 0.4248, + "step": 68621 + }, + { + "epoch": 1.76, + "learning_rate": 7.7121740405184e-07, + "loss": 0.6973, + "step": 68622 + }, + { + "epoch": 1.76, + "learning_rate": 7.711904675739965e-07, + "loss": 0.6328, + "step": 68623 + }, + { + "epoch": 1.76, + "learning_rate": 7.711635312713417e-07, + "loss": 0.6836, + "step": 68624 + }, + { + "epoch": 1.76, + "learning_rate": 7.711365951438968e-07, + "loss": 0.6123, + "step": 68625 + }, + { + "epoch": 1.76, + "learning_rate": 7.711096591916818e-07, + "loss": 0.5569, + "step": 68626 + }, + { + "epoch": 1.76, + "learning_rate": 7.71082723414718e-07, + "loss": 0.6304, + "step": 68627 + }, + { + "epoch": 1.76, + "learning_rate": 7.710557878130255e-07, + "loss": 0.4595, + "step": 68628 + }, + { + "epoch": 1.76, + "learning_rate": 7.710288523866248e-07, + "loss": 0.7393, + "step": 68629 + }, + { + "epoch": 1.76, + "learning_rate": 7.71001917135537e-07, + "loss": 0.5415, + "step": 68630 + }, + { + "epoch": 1.76, + "learning_rate": 7.709749820597823e-07, + "loss": 0.5737, + "step": 68631 + }, + { + "epoch": 1.76, + "learning_rate": 7.709480471593817e-07, + "loss": 0.6445, + "step": 68632 + }, + { + "epoch": 1.76, + "learning_rate": 7.709211124343555e-07, + "loss": 0.7168, + "step": 68633 + }, + { + "epoch": 1.76, + "learning_rate": 7.708941778847246e-07, + "loss": 0.6992, + "step": 68634 + }, + { + "epoch": 1.76, + "learning_rate": 7.708672435105093e-07, + "loss": 0.5391, + "step": 68635 + }, + { + "epoch": 1.76, + "learning_rate": 7.708403093117306e-07, + "loss": 0.7168, + "step": 68636 + }, + { + "epoch": 1.76, + "learning_rate": 7.708133752884093e-07, + "loss": 0.7002, + "step": 68637 + }, + { + "epoch": 1.76, + "learning_rate": 7.707864414405654e-07, + "loss": 0.6138, + "step": 68638 + }, + { + "epoch": 1.76, + "learning_rate": 7.707595077682195e-07, + "loss": 0.7041, + "step": 68639 + }, + { + "epoch": 1.76, + "learning_rate": 7.707325742713926e-07, + "loss": 0.7373, + "step": 68640 + }, + { + "epoch": 1.76, + "learning_rate": 7.707056409501051e-07, + "loss": 0.6216, + "step": 68641 + }, + { + "epoch": 1.76, + "learning_rate": 7.706787078043782e-07, + "loss": 0.6035, + "step": 68642 + }, + { + "epoch": 1.76, + "learning_rate": 7.706517748342316e-07, + "loss": 0.9268, + "step": 68643 + }, + { + "epoch": 1.76, + "learning_rate": 7.706248420396866e-07, + "loss": 0.4668, + "step": 68644 + }, + { + "epoch": 1.76, + "learning_rate": 7.705979094207635e-07, + "loss": 0.6489, + "step": 68645 + }, + { + "epoch": 1.76, + "learning_rate": 7.705709769774832e-07, + "loss": 0.7021, + "step": 68646 + }, + { + "epoch": 1.76, + "learning_rate": 7.705440447098663e-07, + "loss": 0.7852, + "step": 68647 + }, + { + "epoch": 1.76, + "learning_rate": 7.705171126179331e-07, + "loss": 0.6924, + "step": 68648 + }, + { + "epoch": 1.76, + "learning_rate": 7.704901807017044e-07, + "loss": 0.6316, + "step": 68649 + }, + { + "epoch": 1.76, + "learning_rate": 7.704632489612007e-07, + "loss": 0.6279, + "step": 68650 + }, + { + "epoch": 1.76, + "learning_rate": 7.704363173964427e-07, + "loss": 0.6177, + "step": 68651 + }, + { + "epoch": 1.76, + "learning_rate": 7.704093860074511e-07, + "loss": 0.5581, + "step": 68652 + }, + { + "epoch": 1.76, + "learning_rate": 7.703824547942465e-07, + "loss": 0.6514, + "step": 68653 + }, + { + "epoch": 1.76, + "learning_rate": 7.703555237568495e-07, + "loss": 0.6787, + "step": 68654 + }, + { + "epoch": 1.76, + "learning_rate": 7.703285928952808e-07, + "loss": 0.7129, + "step": 68655 + }, + { + "epoch": 1.76, + "learning_rate": 7.703016622095611e-07, + "loss": 0.8242, + "step": 68656 + }, + { + "epoch": 1.76, + "learning_rate": 7.702747316997109e-07, + "loss": 0.7539, + "step": 68657 + }, + { + "epoch": 1.76, + "learning_rate": 7.702478013657503e-07, + "loss": 0.4314, + "step": 68658 + }, + { + "epoch": 1.76, + "learning_rate": 7.702208712077007e-07, + "loss": 0.5981, + "step": 68659 + }, + { + "epoch": 1.76, + "learning_rate": 7.701939412255822e-07, + "loss": 0.4202, + "step": 68660 + }, + { + "epoch": 1.76, + "learning_rate": 7.701670114194159e-07, + "loss": 0.7969, + "step": 68661 + }, + { + "epoch": 1.76, + "learning_rate": 7.701400817892219e-07, + "loss": 0.7686, + "step": 68662 + }, + { + "epoch": 1.76, + "learning_rate": 7.701131523350211e-07, + "loss": 0.5254, + "step": 68663 + }, + { + "epoch": 1.76, + "learning_rate": 7.700862230568342e-07, + "loss": 0.8223, + "step": 68664 + }, + { + "epoch": 1.76, + "learning_rate": 7.700592939546817e-07, + "loss": 0.5889, + "step": 68665 + }, + { + "epoch": 1.76, + "learning_rate": 7.70032365028584e-07, + "loss": 0.6211, + "step": 68666 + }, + { + "epoch": 1.76, + "learning_rate": 7.700054362785625e-07, + "loss": 0.512, + "step": 68667 + }, + { + "epoch": 1.76, + "learning_rate": 7.69978507704637e-07, + "loss": 0.6206, + "step": 68668 + }, + { + "epoch": 1.76, + "learning_rate": 7.699515793068281e-07, + "loss": 0.668, + "step": 68669 + }, + { + "epoch": 1.76, + "learning_rate": 7.699246510851571e-07, + "loss": 0.6992, + "step": 68670 + }, + { + "epoch": 1.76, + "learning_rate": 7.698977230396437e-07, + "loss": 0.6318, + "step": 68671 + }, + { + "epoch": 1.76, + "learning_rate": 7.698707951703095e-07, + "loss": 0.5571, + "step": 68672 + }, + { + "epoch": 1.76, + "learning_rate": 7.698438674771743e-07, + "loss": 0.6426, + "step": 68673 + }, + { + "epoch": 1.76, + "learning_rate": 7.698169399602593e-07, + "loss": 0.5186, + "step": 68674 + }, + { + "epoch": 1.76, + "learning_rate": 7.69790012619585e-07, + "loss": 0.5703, + "step": 68675 + }, + { + "epoch": 1.76, + "learning_rate": 7.697630854551715e-07, + "loss": 0.6733, + "step": 68676 + }, + { + "epoch": 1.76, + "learning_rate": 7.697361584670404e-07, + "loss": 0.8164, + "step": 68677 + }, + { + "epoch": 1.76, + "learning_rate": 7.697092316552115e-07, + "loss": 0.7031, + "step": 68678 + }, + { + "epoch": 1.76, + "learning_rate": 7.696823050197055e-07, + "loss": 0.7295, + "step": 68679 + }, + { + "epoch": 1.76, + "learning_rate": 7.696553785605432e-07, + "loss": 0.6992, + "step": 68680 + }, + { + "epoch": 1.76, + "learning_rate": 7.696284522777451e-07, + "loss": 0.6113, + "step": 68681 + }, + { + "epoch": 1.76, + "learning_rate": 7.69601526171332e-07, + "loss": 0.7471, + "step": 68682 + }, + { + "epoch": 1.76, + "learning_rate": 7.695746002413243e-07, + "loss": 0.6606, + "step": 68683 + }, + { + "epoch": 1.76, + "learning_rate": 7.695476744877429e-07, + "loss": 0.6953, + "step": 68684 + }, + { + "epoch": 1.76, + "learning_rate": 7.695207489106082e-07, + "loss": 0.6494, + "step": 68685 + }, + { + "epoch": 1.76, + "learning_rate": 7.694938235099409e-07, + "loss": 0.7119, + "step": 68686 + }, + { + "epoch": 1.76, + "learning_rate": 7.694668982857618e-07, + "loss": 0.4263, + "step": 68687 + }, + { + "epoch": 1.76, + "learning_rate": 7.69439973238091e-07, + "loss": 0.7529, + "step": 68688 + }, + { + "epoch": 1.76, + "learning_rate": 7.694130483669494e-07, + "loss": 0.5435, + "step": 68689 + }, + { + "epoch": 1.76, + "learning_rate": 7.693861236723575e-07, + "loss": 0.6357, + "step": 68690 + }, + { + "epoch": 1.76, + "learning_rate": 7.693591991543364e-07, + "loss": 0.7549, + "step": 68691 + }, + { + "epoch": 1.76, + "learning_rate": 7.693322748129063e-07, + "loss": 0.5151, + "step": 68692 + }, + { + "epoch": 1.76, + "learning_rate": 7.693053506480876e-07, + "loss": 0.6162, + "step": 68693 + }, + { + "epoch": 1.76, + "learning_rate": 7.692784266599014e-07, + "loss": 0.6187, + "step": 68694 + }, + { + "epoch": 1.76, + "learning_rate": 7.692515028483679e-07, + "loss": 0.4042, + "step": 68695 + }, + { + "epoch": 1.76, + "learning_rate": 7.692245792135081e-07, + "loss": 0.791, + "step": 68696 + }, + { + "epoch": 1.76, + "learning_rate": 7.691976557553426e-07, + "loss": 0.7119, + "step": 68697 + }, + { + "epoch": 1.76, + "learning_rate": 7.691707324738915e-07, + "loss": 0.8232, + "step": 68698 + }, + { + "epoch": 1.76, + "learning_rate": 7.69143809369176e-07, + "loss": 0.6064, + "step": 68699 + }, + { + "epoch": 1.76, + "learning_rate": 7.691168864412162e-07, + "loss": 0.4612, + "step": 68700 + }, + { + "epoch": 1.76, + "learning_rate": 7.690899636900333e-07, + "loss": 0.6689, + "step": 68701 + }, + { + "epoch": 1.76, + "learning_rate": 7.690630411156473e-07, + "loss": 0.5688, + "step": 68702 + }, + { + "epoch": 1.76, + "learning_rate": 7.690361187180792e-07, + "loss": 0.6357, + "step": 68703 + }, + { + "epoch": 1.76, + "learning_rate": 7.690091964973494e-07, + "loss": 0.582, + "step": 68704 + }, + { + "epoch": 1.76, + "learning_rate": 7.689822744534789e-07, + "loss": 0.5586, + "step": 68705 + }, + { + "epoch": 1.76, + "learning_rate": 7.689553525864878e-07, + "loss": 0.5869, + "step": 68706 + }, + { + "epoch": 1.76, + "learning_rate": 7.689284308963975e-07, + "loss": 0.9199, + "step": 68707 + }, + { + "epoch": 1.76, + "learning_rate": 7.689015093832277e-07, + "loss": 0.749, + "step": 68708 + }, + { + "epoch": 1.76, + "learning_rate": 7.688745880469994e-07, + "loss": 0.6611, + "step": 68709 + }, + { + "epoch": 1.76, + "learning_rate": 7.68847666887733e-07, + "loss": 0.7881, + "step": 68710 + }, + { + "epoch": 1.76, + "learning_rate": 7.688207459054497e-07, + "loss": 0.5322, + "step": 68711 + }, + { + "epoch": 1.76, + "learning_rate": 7.687938251001694e-07, + "loss": 0.6479, + "step": 68712 + }, + { + "epoch": 1.76, + "learning_rate": 7.687669044719131e-07, + "loss": 0.5002, + "step": 68713 + }, + { + "epoch": 1.76, + "learning_rate": 7.687399840207014e-07, + "loss": 0.4712, + "step": 68714 + }, + { + "epoch": 1.76, + "learning_rate": 7.687130637465548e-07, + "loss": 0.5239, + "step": 68715 + }, + { + "epoch": 1.76, + "learning_rate": 7.68686143649494e-07, + "loss": 0.8369, + "step": 68716 + }, + { + "epoch": 1.76, + "learning_rate": 7.686592237295399e-07, + "loss": 0.7666, + "step": 68717 + }, + { + "epoch": 1.76, + "learning_rate": 7.686323039867125e-07, + "loss": 0.7271, + "step": 68718 + }, + { + "epoch": 1.76, + "learning_rate": 7.686053844210326e-07, + "loss": 0.7056, + "step": 68719 + }, + { + "epoch": 1.76, + "learning_rate": 7.685784650325211e-07, + "loss": 0.4459, + "step": 68720 + }, + { + "epoch": 1.76, + "learning_rate": 7.685515458211983e-07, + "loss": 0.7568, + "step": 68721 + }, + { + "epoch": 1.76, + "learning_rate": 7.68524626787085e-07, + "loss": 0.6504, + "step": 68722 + }, + { + "epoch": 1.76, + "learning_rate": 7.684977079302016e-07, + "loss": 0.7383, + "step": 68723 + }, + { + "epoch": 1.76, + "learning_rate": 7.684707892505692e-07, + "loss": 0.6611, + "step": 68724 + }, + { + "epoch": 1.76, + "learning_rate": 7.684438707482077e-07, + "loss": 0.4934, + "step": 68725 + }, + { + "epoch": 1.76, + "learning_rate": 7.684169524231383e-07, + "loss": 0.6445, + "step": 68726 + }, + { + "epoch": 1.76, + "learning_rate": 7.683900342753817e-07, + "loss": 0.5857, + "step": 68727 + }, + { + "epoch": 1.76, + "learning_rate": 7.68363116304958e-07, + "loss": 0.5432, + "step": 68728 + }, + { + "epoch": 1.76, + "learning_rate": 7.683361985118877e-07, + "loss": 0.8389, + "step": 68729 + }, + { + "epoch": 1.76, + "learning_rate": 7.68309280896192e-07, + "loss": 0.5479, + "step": 68730 + }, + { + "epoch": 1.76, + "learning_rate": 7.682823634578909e-07, + "loss": 0.6372, + "step": 68731 + }, + { + "epoch": 1.76, + "learning_rate": 7.682554461970056e-07, + "loss": 0.6533, + "step": 68732 + }, + { + "epoch": 1.76, + "learning_rate": 7.682285291135563e-07, + "loss": 0.3787, + "step": 68733 + }, + { + "epoch": 1.76, + "learning_rate": 7.68201612207564e-07, + "loss": 0.6455, + "step": 68734 + }, + { + "epoch": 1.76, + "learning_rate": 7.681746954790487e-07, + "loss": 0.7402, + "step": 68735 + }, + { + "epoch": 1.76, + "learning_rate": 7.681477789280317e-07, + "loss": 0.5518, + "step": 68736 + }, + { + "epoch": 1.76, + "learning_rate": 7.681208625545335e-07, + "loss": 0.6465, + "step": 68737 + }, + { + "epoch": 1.76, + "learning_rate": 7.680939463585741e-07, + "loss": 0.7783, + "step": 68738 + }, + { + "epoch": 1.76, + "learning_rate": 7.680670303401746e-07, + "loss": 0.7734, + "step": 68739 + }, + { + "epoch": 1.76, + "learning_rate": 7.680401144993554e-07, + "loss": 0.7539, + "step": 68740 + }, + { + "epoch": 1.76, + "learning_rate": 7.680131988361374e-07, + "loss": 0.6924, + "step": 68741 + }, + { + "epoch": 1.76, + "learning_rate": 7.679862833505409e-07, + "loss": 0.54, + "step": 68742 + }, + { + "epoch": 1.76, + "learning_rate": 7.679593680425867e-07, + "loss": 0.6738, + "step": 68743 + }, + { + "epoch": 1.76, + "learning_rate": 7.679324529122951e-07, + "loss": 0.603, + "step": 68744 + }, + { + "epoch": 1.76, + "learning_rate": 7.679055379596872e-07, + "loss": 0.7527, + "step": 68745 + }, + { + "epoch": 1.76, + "learning_rate": 7.678786231847835e-07, + "loss": 0.7695, + "step": 68746 + }, + { + "epoch": 1.76, + "learning_rate": 7.678517085876045e-07, + "loss": 0.6165, + "step": 68747 + }, + { + "epoch": 1.76, + "learning_rate": 7.678247941681705e-07, + "loss": 0.6504, + "step": 68748 + }, + { + "epoch": 1.76, + "learning_rate": 7.677978799265024e-07, + "loss": 0.6748, + "step": 68749 + }, + { + "epoch": 1.76, + "learning_rate": 7.677709658626208e-07, + "loss": 0.6826, + "step": 68750 + }, + { + "epoch": 1.76, + "learning_rate": 7.677440519765464e-07, + "loss": 0.707, + "step": 68751 + }, + { + "epoch": 1.76, + "learning_rate": 7.677171382682995e-07, + "loss": 0.6851, + "step": 68752 + }, + { + "epoch": 1.76, + "learning_rate": 7.676902247379011e-07, + "loss": 0.7148, + "step": 68753 + }, + { + "epoch": 1.76, + "learning_rate": 7.676633113853715e-07, + "loss": 0.6592, + "step": 68754 + }, + { + "epoch": 1.76, + "learning_rate": 7.676363982107315e-07, + "loss": 0.7148, + "step": 68755 + }, + { + "epoch": 1.76, + "learning_rate": 7.676094852140014e-07, + "loss": 0.7158, + "step": 68756 + }, + { + "epoch": 1.76, + "learning_rate": 7.675825723952026e-07, + "loss": 0.5674, + "step": 68757 + }, + { + "epoch": 1.76, + "learning_rate": 7.675556597543548e-07, + "loss": 0.7266, + "step": 68758 + }, + { + "epoch": 1.76, + "learning_rate": 7.675287472914787e-07, + "loss": 0.6758, + "step": 68759 + }, + { + "epoch": 1.76, + "learning_rate": 7.675018350065954e-07, + "loss": 0.5114, + "step": 68760 + }, + { + "epoch": 1.76, + "learning_rate": 7.67474922899725e-07, + "loss": 0.6973, + "step": 68761 + }, + { + "epoch": 1.76, + "learning_rate": 7.674480109708887e-07, + "loss": 0.6914, + "step": 68762 + }, + { + "epoch": 1.76, + "learning_rate": 7.674210992201064e-07, + "loss": 0.5151, + "step": 68763 + }, + { + "epoch": 1.76, + "learning_rate": 7.673941876473995e-07, + "loss": 0.7041, + "step": 68764 + }, + { + "epoch": 1.76, + "learning_rate": 7.67367276252788e-07, + "loss": 0.7578, + "step": 68765 + }, + { + "epoch": 1.76, + "learning_rate": 7.673403650362927e-07, + "loss": 0.5702, + "step": 68766 + }, + { + "epoch": 1.76, + "learning_rate": 7.673134539979342e-07, + "loss": 0.6641, + "step": 68767 + }, + { + "epoch": 1.76, + "learning_rate": 7.672865431377332e-07, + "loss": 0.5894, + "step": 68768 + }, + { + "epoch": 1.76, + "learning_rate": 7.672596324557099e-07, + "loss": 0.7158, + "step": 68769 + }, + { + "epoch": 1.76, + "learning_rate": 7.672327219518854e-07, + "loss": 0.499, + "step": 68770 + }, + { + "epoch": 1.76, + "learning_rate": 7.672058116262798e-07, + "loss": 0.7295, + "step": 68771 + }, + { + "epoch": 1.76, + "learning_rate": 7.671789014789144e-07, + "loss": 0.4697, + "step": 68772 + }, + { + "epoch": 1.76, + "learning_rate": 7.671519915098091e-07, + "loss": 0.6445, + "step": 68773 + }, + { + "epoch": 1.76, + "learning_rate": 7.671250817189849e-07, + "loss": 0.6348, + "step": 68774 + }, + { + "epoch": 1.76, + "learning_rate": 7.670981721064624e-07, + "loss": 0.6279, + "step": 68775 + }, + { + "epoch": 1.76, + "learning_rate": 7.670712626722621e-07, + "loss": 0.5273, + "step": 68776 + }, + { + "epoch": 1.76, + "learning_rate": 7.670443534164049e-07, + "loss": 0.6636, + "step": 68777 + }, + { + "epoch": 1.76, + "learning_rate": 7.670174443389107e-07, + "loss": 0.5444, + "step": 68778 + }, + { + "epoch": 1.76, + "learning_rate": 7.669905354398008e-07, + "loss": 0.6143, + "step": 68779 + }, + { + "epoch": 1.76, + "learning_rate": 7.669636267190952e-07, + "loss": 0.6807, + "step": 68780 + }, + { + "epoch": 1.76, + "learning_rate": 7.669367181768152e-07, + "loss": 0.4927, + "step": 68781 + }, + { + "epoch": 1.76, + "learning_rate": 7.669098098129809e-07, + "loss": 0.6431, + "step": 68782 + }, + { + "epoch": 1.76, + "learning_rate": 7.668829016276128e-07, + "loss": 0.7749, + "step": 68783 + }, + { + "epoch": 1.76, + "learning_rate": 7.66855993620732e-07, + "loss": 0.4912, + "step": 68784 + }, + { + "epoch": 1.76, + "learning_rate": 7.668290857923587e-07, + "loss": 0.8145, + "step": 68785 + }, + { + "epoch": 1.76, + "learning_rate": 7.668021781425138e-07, + "loss": 0.5093, + "step": 68786 + }, + { + "epoch": 1.76, + "learning_rate": 7.66775270671218e-07, + "loss": 0.7275, + "step": 68787 + }, + { + "epoch": 1.76, + "learning_rate": 7.667483633784913e-07, + "loss": 0.5884, + "step": 68788 + }, + { + "epoch": 1.76, + "learning_rate": 7.667214562643547e-07, + "loss": 0.5278, + "step": 68789 + }, + { + "epoch": 1.76, + "learning_rate": 7.666945493288287e-07, + "loss": 0.8076, + "step": 68790 + }, + { + "epoch": 1.76, + "learning_rate": 7.666676425719341e-07, + "loss": 0.6621, + "step": 68791 + }, + { + "epoch": 1.76, + "learning_rate": 7.66640735993691e-07, + "loss": 0.6289, + "step": 68792 + }, + { + "epoch": 1.76, + "learning_rate": 7.666138295941208e-07, + "loss": 0.5774, + "step": 68793 + }, + { + "epoch": 1.76, + "learning_rate": 7.665869233732434e-07, + "loss": 0.7188, + "step": 68794 + }, + { + "epoch": 1.76, + "learning_rate": 7.665600173310798e-07, + "loss": 0.5205, + "step": 68795 + }, + { + "epoch": 1.76, + "learning_rate": 7.665331114676503e-07, + "loss": 0.3379, + "step": 68796 + }, + { + "epoch": 1.76, + "learning_rate": 7.665062057829761e-07, + "loss": 0.7168, + "step": 68797 + }, + { + "epoch": 1.76, + "learning_rate": 7.66479300277077e-07, + "loss": 0.6348, + "step": 68798 + }, + { + "epoch": 1.76, + "learning_rate": 7.664523949499741e-07, + "loss": 0.6387, + "step": 68799 + }, + { + "epoch": 1.76, + "learning_rate": 7.664254898016877e-07, + "loss": 0.6841, + "step": 68800 + }, + { + "epoch": 1.76, + "learning_rate": 7.663985848322386e-07, + "loss": 0.6719, + "step": 68801 + }, + { + "epoch": 1.76, + "learning_rate": 7.663716800416473e-07, + "loss": 0.6768, + "step": 68802 + }, + { + "epoch": 1.76, + "learning_rate": 7.663447754299346e-07, + "loss": 0.4719, + "step": 68803 + }, + { + "epoch": 1.76, + "learning_rate": 7.663178709971207e-07, + "loss": 0.5439, + "step": 68804 + }, + { + "epoch": 1.76, + "learning_rate": 7.662909667432268e-07, + "loss": 0.5427, + "step": 68805 + }, + { + "epoch": 1.76, + "learning_rate": 7.662640626682729e-07, + "loss": 0.4548, + "step": 68806 + }, + { + "epoch": 1.76, + "learning_rate": 7.662371587722804e-07, + "loss": 0.5173, + "step": 68807 + }, + { + "epoch": 1.76, + "learning_rate": 7.662102550552689e-07, + "loss": 0.6318, + "step": 68808 + }, + { + "epoch": 1.76, + "learning_rate": 7.661833515172594e-07, + "loss": 0.6211, + "step": 68809 + }, + { + "epoch": 1.76, + "learning_rate": 7.661564481582727e-07, + "loss": 0.6245, + "step": 68810 + }, + { + "epoch": 1.76, + "learning_rate": 7.661295449783292e-07, + "loss": 0.4683, + "step": 68811 + }, + { + "epoch": 1.76, + "learning_rate": 7.661026419774496e-07, + "loss": 0.6685, + "step": 68812 + }, + { + "epoch": 1.76, + "learning_rate": 7.660757391556543e-07, + "loss": 0.7129, + "step": 68813 + }, + { + "epoch": 1.76, + "learning_rate": 7.660488365129643e-07, + "loss": 0.5461, + "step": 68814 + }, + { + "epoch": 1.76, + "learning_rate": 7.660219340493996e-07, + "loss": 0.6455, + "step": 68815 + }, + { + "epoch": 1.76, + "learning_rate": 7.659950317649815e-07, + "loss": 0.7578, + "step": 68816 + }, + { + "epoch": 1.76, + "learning_rate": 7.659681296597303e-07, + "loss": 0.6782, + "step": 68817 + }, + { + "epoch": 1.76, + "learning_rate": 7.659412277336666e-07, + "loss": 0.6895, + "step": 68818 + }, + { + "epoch": 1.76, + "learning_rate": 7.659143259868104e-07, + "loss": 0.541, + "step": 68819 + }, + { + "epoch": 1.76, + "learning_rate": 7.658874244191833e-07, + "loss": 0.6299, + "step": 68820 + }, + { + "epoch": 1.76, + "learning_rate": 7.658605230308051e-07, + "loss": 0.832, + "step": 68821 + }, + { + "epoch": 1.76, + "learning_rate": 7.65833621821697e-07, + "loss": 0.8594, + "step": 68822 + }, + { + "epoch": 1.76, + "learning_rate": 7.65806720791879e-07, + "loss": 0.6064, + "step": 68823 + }, + { + "epoch": 1.76, + "learning_rate": 7.657798199413724e-07, + "loss": 0.6528, + "step": 68824 + }, + { + "epoch": 1.76, + "learning_rate": 7.657529192701971e-07, + "loss": 0.5586, + "step": 68825 + }, + { + "epoch": 1.76, + "learning_rate": 7.657260187783743e-07, + "loss": 0.6221, + "step": 68826 + }, + { + "epoch": 1.76, + "learning_rate": 7.656991184659245e-07, + "loss": 0.6465, + "step": 68827 + }, + { + "epoch": 1.76, + "learning_rate": 7.656722183328677e-07, + "loss": 0.4785, + "step": 68828 + }, + { + "epoch": 1.76, + "learning_rate": 7.656453183792251e-07, + "loss": 0.6245, + "step": 68829 + }, + { + "epoch": 1.76, + "learning_rate": 7.656184186050168e-07, + "loss": 0.7324, + "step": 68830 + }, + { + "epoch": 1.76, + "learning_rate": 7.655915190102641e-07, + "loss": 0.6499, + "step": 68831 + }, + { + "epoch": 1.76, + "learning_rate": 7.655646195949869e-07, + "loss": 0.6582, + "step": 68832 + }, + { + "epoch": 1.76, + "learning_rate": 7.655377203592063e-07, + "loss": 0.6074, + "step": 68833 + }, + { + "epoch": 1.76, + "learning_rate": 7.655108213029424e-07, + "loss": 0.585, + "step": 68834 + }, + { + "epoch": 1.76, + "learning_rate": 7.654839224262164e-07, + "loss": 0.5488, + "step": 68835 + }, + { + "epoch": 1.76, + "learning_rate": 7.654570237290483e-07, + "loss": 0.5938, + "step": 68836 + }, + { + "epoch": 1.76, + "learning_rate": 7.654301252114597e-07, + "loss": 0.7793, + "step": 68837 + }, + { + "epoch": 1.76, + "learning_rate": 7.654032268734697e-07, + "loss": 0.5283, + "step": 68838 + }, + { + "epoch": 1.76, + "learning_rate": 7.653763287151e-07, + "loss": 0.5774, + "step": 68839 + }, + { + "epoch": 1.76, + "learning_rate": 7.653494307363706e-07, + "loss": 0.7344, + "step": 68840 + }, + { + "epoch": 1.76, + "learning_rate": 7.653225329373025e-07, + "loss": 0.6748, + "step": 68841 + }, + { + "epoch": 1.76, + "learning_rate": 7.65295635317916e-07, + "loss": 0.5664, + "step": 68842 + }, + { + "epoch": 1.76, + "learning_rate": 7.652687378782321e-07, + "loss": 0.542, + "step": 68843 + }, + { + "epoch": 1.76, + "learning_rate": 7.652418406182708e-07, + "loss": 0.7061, + "step": 68844 + }, + { + "epoch": 1.76, + "learning_rate": 7.652149435380533e-07, + "loss": 0.5107, + "step": 68845 + }, + { + "epoch": 1.76, + "learning_rate": 7.651880466375998e-07, + "loss": 0.4658, + "step": 68846 + }, + { + "epoch": 1.76, + "learning_rate": 7.651611499169313e-07, + "loss": 0.5398, + "step": 68847 + }, + { + "epoch": 1.76, + "learning_rate": 7.651342533760679e-07, + "loss": 0.6709, + "step": 68848 + }, + { + "epoch": 1.76, + "learning_rate": 7.651073570150303e-07, + "loss": 0.6006, + "step": 68849 + }, + { + "epoch": 1.76, + "learning_rate": 7.650804608338393e-07, + "loss": 0.7051, + "step": 68850 + }, + { + "epoch": 1.76, + "learning_rate": 7.650535648325151e-07, + "loss": 0.6865, + "step": 68851 + }, + { + "epoch": 1.76, + "learning_rate": 7.65026669011079e-07, + "loss": 0.4832, + "step": 68852 + }, + { + "epoch": 1.76, + "learning_rate": 7.64999773369551e-07, + "loss": 0.7261, + "step": 68853 + }, + { + "epoch": 1.76, + "learning_rate": 7.649728779079518e-07, + "loss": 0.8027, + "step": 68854 + }, + { + "epoch": 1.76, + "learning_rate": 7.649459826263023e-07, + "loss": 0.7578, + "step": 68855 + }, + { + "epoch": 1.76, + "learning_rate": 7.64919087524623e-07, + "loss": 0.7227, + "step": 68856 + }, + { + "epoch": 1.76, + "learning_rate": 7.64892192602934e-07, + "loss": 0.7773, + "step": 68857 + }, + { + "epoch": 1.76, + "learning_rate": 7.648652978612562e-07, + "loss": 0.6963, + "step": 68858 + }, + { + "epoch": 1.76, + "learning_rate": 7.648384032996102e-07, + "loss": 0.6245, + "step": 68859 + }, + { + "epoch": 1.76, + "learning_rate": 7.648115089180168e-07, + "loss": 0.5286, + "step": 68860 + }, + { + "epoch": 1.76, + "learning_rate": 7.647846147164962e-07, + "loss": 0.7422, + "step": 68861 + }, + { + "epoch": 1.76, + "learning_rate": 7.647577206950694e-07, + "loss": 0.6042, + "step": 68862 + }, + { + "epoch": 1.76, + "learning_rate": 7.647308268537567e-07, + "loss": 0.5801, + "step": 68863 + }, + { + "epoch": 1.77, + "learning_rate": 7.647039331925789e-07, + "loss": 0.7646, + "step": 68864 + }, + { + "epoch": 1.77, + "learning_rate": 7.646770397115563e-07, + "loss": 0.8799, + "step": 68865 + }, + { + "epoch": 1.77, + "learning_rate": 7.6465014641071e-07, + "loss": 0.6572, + "step": 68866 + }, + { + "epoch": 1.77, + "learning_rate": 7.646232532900601e-07, + "loss": 0.8604, + "step": 68867 + }, + { + "epoch": 1.77, + "learning_rate": 7.645963603496271e-07, + "loss": 0.623, + "step": 68868 + }, + { + "epoch": 1.77, + "learning_rate": 7.645694675894322e-07, + "loss": 0.5879, + "step": 68869 + }, + { + "epoch": 1.77, + "learning_rate": 7.645425750094954e-07, + "loss": 0.4858, + "step": 68870 + }, + { + "epoch": 1.77, + "learning_rate": 7.645156826098375e-07, + "loss": 0.6426, + "step": 68871 + }, + { + "epoch": 1.77, + "learning_rate": 7.644887903904794e-07, + "loss": 0.6924, + "step": 68872 + }, + { + "epoch": 1.77, + "learning_rate": 7.644618983514411e-07, + "loss": 0.6665, + "step": 68873 + }, + { + "epoch": 1.77, + "learning_rate": 7.644350064927436e-07, + "loss": 0.791, + "step": 68874 + }, + { + "epoch": 1.77, + "learning_rate": 7.644081148144073e-07, + "loss": 0.79, + "step": 68875 + }, + { + "epoch": 1.77, + "learning_rate": 7.643812233164533e-07, + "loss": 0.5044, + "step": 68876 + }, + { + "epoch": 1.77, + "learning_rate": 7.643543319989014e-07, + "loss": 0.5596, + "step": 68877 + }, + { + "epoch": 1.77, + "learning_rate": 7.643274408617724e-07, + "loss": 0.6465, + "step": 68878 + }, + { + "epoch": 1.77, + "learning_rate": 7.643005499050874e-07, + "loss": 0.7432, + "step": 68879 + }, + { + "epoch": 1.77, + "learning_rate": 7.642736591288663e-07, + "loss": 0.7393, + "step": 68880 + }, + { + "epoch": 1.77, + "learning_rate": 7.642467685331303e-07, + "loss": 0.522, + "step": 68881 + }, + { + "epoch": 1.77, + "learning_rate": 7.642198781178995e-07, + "loss": 0.752, + "step": 68882 + }, + { + "epoch": 1.77, + "learning_rate": 7.641929878831948e-07, + "loss": 0.7451, + "step": 68883 + }, + { + "epoch": 1.77, + "learning_rate": 7.641660978290365e-07, + "loss": 0.7236, + "step": 68884 + }, + { + "epoch": 1.77, + "learning_rate": 7.641392079554456e-07, + "loss": 0.4626, + "step": 68885 + }, + { + "epoch": 1.77, + "learning_rate": 7.641123182624427e-07, + "loss": 0.6997, + "step": 68886 + }, + { + "epoch": 1.77, + "learning_rate": 7.640854287500478e-07, + "loss": 0.7158, + "step": 68887 + }, + { + "epoch": 1.77, + "learning_rate": 7.640585394182819e-07, + "loss": 0.6104, + "step": 68888 + }, + { + "epoch": 1.77, + "learning_rate": 7.640316502671657e-07, + "loss": 0.4883, + "step": 68889 + }, + { + "epoch": 1.77, + "learning_rate": 7.640047612967192e-07, + "loss": 0.6982, + "step": 68890 + }, + { + "epoch": 1.77, + "learning_rate": 7.639778725069637e-07, + "loss": 0.6113, + "step": 68891 + }, + { + "epoch": 1.77, + "learning_rate": 7.639509838979194e-07, + "loss": 0.5195, + "step": 68892 + }, + { + "epoch": 1.77, + "learning_rate": 7.63924095469607e-07, + "loss": 0.616, + "step": 68893 + }, + { + "epoch": 1.77, + "learning_rate": 7.63897207222047e-07, + "loss": 0.7734, + "step": 68894 + }, + { + "epoch": 1.77, + "learning_rate": 7.638703191552602e-07, + "loss": 0.8438, + "step": 68895 + }, + { + "epoch": 1.77, + "learning_rate": 7.638434312692672e-07, + "loss": 0.5371, + "step": 68896 + }, + { + "epoch": 1.77, + "learning_rate": 7.638165435640881e-07, + "loss": 0.6689, + "step": 68897 + }, + { + "epoch": 1.77, + "learning_rate": 7.63789656039744e-07, + "loss": 0.6758, + "step": 68898 + }, + { + "epoch": 1.77, + "learning_rate": 7.637627686962551e-07, + "loss": 0.6738, + "step": 68899 + }, + { + "epoch": 1.77, + "learning_rate": 7.637358815336423e-07, + "loss": 0.8086, + "step": 68900 + }, + { + "epoch": 1.77, + "learning_rate": 7.637089945519259e-07, + "loss": 0.8418, + "step": 68901 + }, + { + "epoch": 1.77, + "learning_rate": 7.63682107751127e-07, + "loss": 0.6445, + "step": 68902 + }, + { + "epoch": 1.77, + "learning_rate": 7.636552211312654e-07, + "loss": 0.7236, + "step": 68903 + }, + { + "epoch": 1.77, + "learning_rate": 7.636283346923626e-07, + "loss": 0.6177, + "step": 68904 + }, + { + "epoch": 1.77, + "learning_rate": 7.636014484344383e-07, + "loss": 0.6099, + "step": 68905 + }, + { + "epoch": 1.77, + "learning_rate": 7.635745623575143e-07, + "loss": 0.564, + "step": 68906 + }, + { + "epoch": 1.77, + "learning_rate": 7.635476764616096e-07, + "loss": 0.6118, + "step": 68907 + }, + { + "epoch": 1.77, + "learning_rate": 7.635207907467458e-07, + "loss": 0.8359, + "step": 68908 + }, + { + "epoch": 1.77, + "learning_rate": 7.634939052129431e-07, + "loss": 0.6504, + "step": 68909 + }, + { + "epoch": 1.77, + "learning_rate": 7.634670198602224e-07, + "loss": 0.6758, + "step": 68910 + }, + { + "epoch": 1.77, + "learning_rate": 7.63440134688604e-07, + "loss": 0.6992, + "step": 68911 + }, + { + "epoch": 1.77, + "learning_rate": 7.634132496981088e-07, + "loss": 0.7998, + "step": 68912 + }, + { + "epoch": 1.77, + "learning_rate": 7.63386364888757e-07, + "loss": 0.7539, + "step": 68913 + }, + { + "epoch": 1.77, + "learning_rate": 7.633594802605696e-07, + "loss": 0.5776, + "step": 68914 + }, + { + "epoch": 1.77, + "learning_rate": 7.633325958135667e-07, + "loss": 0.4922, + "step": 68915 + }, + { + "epoch": 1.77, + "learning_rate": 7.633057115477696e-07, + "loss": 0.564, + "step": 68916 + }, + { + "epoch": 1.77, + "learning_rate": 7.632788274631982e-07, + "loss": 0.7051, + "step": 68917 + }, + { + "epoch": 1.77, + "learning_rate": 7.632519435598731e-07, + "loss": 0.7705, + "step": 68918 + }, + { + "epoch": 1.77, + "learning_rate": 7.632250598378152e-07, + "loss": 0.583, + "step": 68919 + }, + { + "epoch": 1.77, + "learning_rate": 7.631981762970449e-07, + "loss": 0.625, + "step": 68920 + }, + { + "epoch": 1.77, + "learning_rate": 7.631712929375832e-07, + "loss": 0.6494, + "step": 68921 + }, + { + "epoch": 1.77, + "learning_rate": 7.6314440975945e-07, + "loss": 0.728, + "step": 68922 + }, + { + "epoch": 1.77, + "learning_rate": 7.631175267626663e-07, + "loss": 0.5249, + "step": 68923 + }, + { + "epoch": 1.77, + "learning_rate": 7.630906439472527e-07, + "loss": 0.6162, + "step": 68924 + }, + { + "epoch": 1.77, + "learning_rate": 7.630637613132298e-07, + "loss": 0.5815, + "step": 68925 + }, + { + "epoch": 1.77, + "learning_rate": 7.630368788606183e-07, + "loss": 0.666, + "step": 68926 + }, + { + "epoch": 1.77, + "learning_rate": 7.630099965894384e-07, + "loss": 0.7432, + "step": 68927 + }, + { + "epoch": 1.77, + "learning_rate": 7.629831144997106e-07, + "loss": 0.729, + "step": 68928 + }, + { + "epoch": 1.77, + "learning_rate": 7.629562325914558e-07, + "loss": 0.7363, + "step": 68929 + }, + { + "epoch": 1.77, + "learning_rate": 7.629293508646943e-07, + "loss": 0.6455, + "step": 68930 + }, + { + "epoch": 1.77, + "learning_rate": 7.629024693194474e-07, + "loss": 0.6086, + "step": 68931 + }, + { + "epoch": 1.77, + "learning_rate": 7.628755879557347e-07, + "loss": 0.6709, + "step": 68932 + }, + { + "epoch": 1.77, + "learning_rate": 7.628487067735776e-07, + "loss": 0.6953, + "step": 68933 + }, + { + "epoch": 1.77, + "learning_rate": 7.62821825772996e-07, + "loss": 0.5273, + "step": 68934 + }, + { + "epoch": 1.77, + "learning_rate": 7.627949449540112e-07, + "loss": 0.707, + "step": 68935 + }, + { + "epoch": 1.77, + "learning_rate": 7.627680643166436e-07, + "loss": 0.584, + "step": 68936 + }, + { + "epoch": 1.77, + "learning_rate": 7.62741183860913e-07, + "loss": 0.563, + "step": 68937 + }, + { + "epoch": 1.77, + "learning_rate": 7.627143035868409e-07, + "loss": 0.4648, + "step": 68938 + }, + { + "epoch": 1.77, + "learning_rate": 7.626874234944473e-07, + "loss": 0.6865, + "step": 68939 + }, + { + "epoch": 1.77, + "learning_rate": 7.626605435837532e-07, + "loss": 0.5532, + "step": 68940 + }, + { + "epoch": 1.77, + "learning_rate": 7.626336638547789e-07, + "loss": 0.6904, + "step": 68941 + }, + { + "epoch": 1.77, + "learning_rate": 7.626067843075452e-07, + "loss": 0.4216, + "step": 68942 + }, + { + "epoch": 1.77, + "learning_rate": 7.625799049420724e-07, + "loss": 0.709, + "step": 68943 + }, + { + "epoch": 1.77, + "learning_rate": 7.625530257583814e-07, + "loss": 0.7285, + "step": 68944 + }, + { + "epoch": 1.77, + "learning_rate": 7.625261467564927e-07, + "loss": 0.5896, + "step": 68945 + }, + { + "epoch": 1.77, + "learning_rate": 7.62499267936427e-07, + "loss": 0.5911, + "step": 68946 + }, + { + "epoch": 1.77, + "learning_rate": 7.624723892982043e-07, + "loss": 0.6406, + "step": 68947 + }, + { + "epoch": 1.77, + "learning_rate": 7.624455108418458e-07, + "loss": 0.7891, + "step": 68948 + }, + { + "epoch": 1.77, + "learning_rate": 7.624186325673716e-07, + "loss": 0.4708, + "step": 68949 + }, + { + "epoch": 1.77, + "learning_rate": 7.623917544748028e-07, + "loss": 0.6343, + "step": 68950 + }, + { + "epoch": 1.77, + "learning_rate": 7.623648765641594e-07, + "loss": 0.5139, + "step": 68951 + }, + { + "epoch": 1.77, + "learning_rate": 7.623379988354626e-07, + "loss": 0.6182, + "step": 68952 + }, + { + "epoch": 1.77, + "learning_rate": 7.623111212887323e-07, + "loss": 0.5928, + "step": 68953 + }, + { + "epoch": 1.77, + "learning_rate": 7.622842439239898e-07, + "loss": 0.6685, + "step": 68954 + }, + { + "epoch": 1.77, + "learning_rate": 7.622573667412551e-07, + "loss": 0.6221, + "step": 68955 + }, + { + "epoch": 1.77, + "learning_rate": 7.622304897405494e-07, + "loss": 0.5781, + "step": 68956 + }, + { + "epoch": 1.77, + "learning_rate": 7.622036129218926e-07, + "loss": 0.7134, + "step": 68957 + }, + { + "epoch": 1.77, + "learning_rate": 7.621767362853055e-07, + "loss": 0.5174, + "step": 68958 + }, + { + "epoch": 1.77, + "learning_rate": 7.621498598308087e-07, + "loss": 0.8086, + "step": 68959 + }, + { + "epoch": 1.77, + "learning_rate": 7.621229835584229e-07, + "loss": 0.6885, + "step": 68960 + }, + { + "epoch": 1.77, + "learning_rate": 7.620961074681686e-07, + "loss": 0.5757, + "step": 68961 + }, + { + "epoch": 1.77, + "learning_rate": 7.620692315600664e-07, + "loss": 0.6699, + "step": 68962 + }, + { + "epoch": 1.77, + "learning_rate": 7.620423558341366e-07, + "loss": 0.5781, + "step": 68963 + }, + { + "epoch": 1.77, + "learning_rate": 7.620154802904004e-07, + "loss": 0.5349, + "step": 68964 + }, + { + "epoch": 1.77, + "learning_rate": 7.619886049288777e-07, + "loss": 0.8184, + "step": 68965 + }, + { + "epoch": 1.77, + "learning_rate": 7.619617297495898e-07, + "loss": 0.6484, + "step": 68966 + }, + { + "epoch": 1.77, + "learning_rate": 7.619348547525567e-07, + "loss": 0.5598, + "step": 68967 + }, + { + "epoch": 1.77, + "learning_rate": 7.619079799377989e-07, + "loss": 0.6758, + "step": 68968 + }, + { + "epoch": 1.77, + "learning_rate": 7.618811053053373e-07, + "loss": 0.5195, + "step": 68969 + }, + { + "epoch": 1.77, + "learning_rate": 7.618542308551923e-07, + "loss": 0.5928, + "step": 68970 + }, + { + "epoch": 1.77, + "learning_rate": 7.618273565873847e-07, + "loss": 0.708, + "step": 68971 + }, + { + "epoch": 1.77, + "learning_rate": 7.618004825019349e-07, + "loss": 0.5918, + "step": 68972 + }, + { + "epoch": 1.77, + "learning_rate": 7.617736085988636e-07, + "loss": 0.5825, + "step": 68973 + }, + { + "epoch": 1.77, + "learning_rate": 7.617467348781911e-07, + "loss": 0.375, + "step": 68974 + }, + { + "epoch": 1.77, + "learning_rate": 7.617198613399383e-07, + "loss": 0.6704, + "step": 68975 + }, + { + "epoch": 1.77, + "learning_rate": 7.61692987984126e-07, + "loss": 0.6323, + "step": 68976 + }, + { + "epoch": 1.77, + "learning_rate": 7.61666114810774e-07, + "loss": 0.6157, + "step": 68977 + }, + { + "epoch": 1.77, + "learning_rate": 7.616392418199033e-07, + "loss": 0.6582, + "step": 68978 + }, + { + "epoch": 1.77, + "learning_rate": 7.616123690115347e-07, + "loss": 0.6313, + "step": 68979 + }, + { + "epoch": 1.77, + "learning_rate": 7.615854963856882e-07, + "loss": 0.6118, + "step": 68980 + }, + { + "epoch": 1.77, + "learning_rate": 7.61558623942385e-07, + "loss": 0.5625, + "step": 68981 + }, + { + "epoch": 1.77, + "learning_rate": 7.615317516816452e-07, + "loss": 0.5947, + "step": 68982 + }, + { + "epoch": 1.77, + "learning_rate": 7.615048796034897e-07, + "loss": 0.5654, + "step": 68983 + }, + { + "epoch": 1.77, + "learning_rate": 7.614780077079388e-07, + "loss": 0.5198, + "step": 68984 + }, + { + "epoch": 1.77, + "learning_rate": 7.614511359950134e-07, + "loss": 0.6035, + "step": 68985 + }, + { + "epoch": 1.77, + "learning_rate": 7.614242644647342e-07, + "loss": 0.5048, + "step": 68986 + }, + { + "epoch": 1.77, + "learning_rate": 7.613973931171209e-07, + "loss": 0.6846, + "step": 68987 + }, + { + "epoch": 1.77, + "learning_rate": 7.61370521952195e-07, + "loss": 0.5288, + "step": 68988 + }, + { + "epoch": 1.77, + "learning_rate": 7.613436509699765e-07, + "loss": 0.6719, + "step": 68989 + }, + { + "epoch": 1.77, + "learning_rate": 7.613167801704862e-07, + "loss": 0.5337, + "step": 68990 + }, + { + "epoch": 1.77, + "learning_rate": 7.612899095537448e-07, + "loss": 0.5757, + "step": 68991 + }, + { + "epoch": 1.77, + "learning_rate": 7.612630391197727e-07, + "loss": 0.5913, + "step": 68992 + }, + { + "epoch": 1.77, + "learning_rate": 7.612361688685903e-07, + "loss": 0.666, + "step": 68993 + }, + { + "epoch": 1.77, + "learning_rate": 7.612092988002187e-07, + "loss": 0.5007, + "step": 68994 + }, + { + "epoch": 1.77, + "learning_rate": 7.611824289146779e-07, + "loss": 0.6484, + "step": 68995 + }, + { + "epoch": 1.77, + "learning_rate": 7.611555592119893e-07, + "loss": 0.5757, + "step": 68996 + }, + { + "epoch": 1.77, + "learning_rate": 7.611286896921723e-07, + "loss": 0.7345, + "step": 68997 + }, + { + "epoch": 1.77, + "learning_rate": 7.611018203552484e-07, + "loss": 0.6045, + "step": 68998 + }, + { + "epoch": 1.77, + "learning_rate": 7.610749512012375e-07, + "loss": 0.5424, + "step": 68999 + }, + { + "epoch": 1.77, + "learning_rate": 7.610480822301609e-07, + "loss": 0.5547, + "step": 69000 + }, + { + "epoch": 1.77, + "learning_rate": 7.610212134420385e-07, + "loss": 0.6401, + "step": 69001 + }, + { + "epoch": 1.77, + "learning_rate": 7.609943448368914e-07, + "loss": 0.6836, + "step": 69002 + }, + { + "epoch": 1.77, + "learning_rate": 7.609674764147397e-07, + "loss": 0.499, + "step": 69003 + }, + { + "epoch": 1.77, + "learning_rate": 7.609406081756045e-07, + "loss": 0.4883, + "step": 69004 + }, + { + "epoch": 1.77, + "learning_rate": 7.609137401195057e-07, + "loss": 0.7266, + "step": 69005 + }, + { + "epoch": 1.77, + "learning_rate": 7.608868722464648e-07, + "loss": 0.6357, + "step": 69006 + }, + { + "epoch": 1.77, + "learning_rate": 7.608600045565016e-07, + "loss": 0.6318, + "step": 69007 + }, + { + "epoch": 1.77, + "learning_rate": 7.608331370496367e-07, + "loss": 0.7744, + "step": 69008 + }, + { + "epoch": 1.77, + "learning_rate": 7.60806269725891e-07, + "loss": 0.6846, + "step": 69009 + }, + { + "epoch": 1.77, + "learning_rate": 7.607794025852849e-07, + "loss": 0.7397, + "step": 69010 + }, + { + "epoch": 1.77, + "learning_rate": 7.60752535627839e-07, + "loss": 0.7368, + "step": 69011 + }, + { + "epoch": 1.77, + "learning_rate": 7.607256688535739e-07, + "loss": 0.6289, + "step": 69012 + }, + { + "epoch": 1.77, + "learning_rate": 7.606988022625102e-07, + "loss": 0.6387, + "step": 69013 + }, + { + "epoch": 1.77, + "learning_rate": 7.606719358546682e-07, + "loss": 0.6731, + "step": 69014 + }, + { + "epoch": 1.77, + "learning_rate": 7.60645069630069e-07, + "loss": 0.7158, + "step": 69015 + }, + { + "epoch": 1.77, + "learning_rate": 7.606182035887329e-07, + "loss": 0.6768, + "step": 69016 + }, + { + "epoch": 1.77, + "learning_rate": 7.605913377306805e-07, + "loss": 0.7832, + "step": 69017 + }, + { + "epoch": 1.77, + "learning_rate": 7.60564472055932e-07, + "loss": 0.6074, + "step": 69018 + }, + { + "epoch": 1.77, + "learning_rate": 7.605376065645084e-07, + "loss": 0.5796, + "step": 69019 + }, + { + "epoch": 1.77, + "learning_rate": 7.6051074125643e-07, + "loss": 0.3811, + "step": 69020 + }, + { + "epoch": 1.77, + "learning_rate": 7.604838761317177e-07, + "loss": 0.5669, + "step": 69021 + }, + { + "epoch": 1.77, + "learning_rate": 7.604570111903916e-07, + "loss": 0.6709, + "step": 69022 + }, + { + "epoch": 1.77, + "learning_rate": 7.604301464324729e-07, + "loss": 0.7065, + "step": 69023 + }, + { + "epoch": 1.77, + "learning_rate": 7.604032818579815e-07, + "loss": 0.6543, + "step": 69024 + }, + { + "epoch": 1.77, + "learning_rate": 7.603764174669386e-07, + "loss": 0.7314, + "step": 69025 + }, + { + "epoch": 1.77, + "learning_rate": 7.603495532593647e-07, + "loss": 0.75, + "step": 69026 + }, + { + "epoch": 1.77, + "learning_rate": 7.603226892352796e-07, + "loss": 0.5715, + "step": 69027 + }, + { + "epoch": 1.77, + "learning_rate": 7.602958253947045e-07, + "loss": 0.5273, + "step": 69028 + }, + { + "epoch": 1.77, + "learning_rate": 7.602689617376598e-07, + "loss": 0.6094, + "step": 69029 + }, + { + "epoch": 1.77, + "learning_rate": 7.602420982641664e-07, + "loss": 0.6064, + "step": 69030 + }, + { + "epoch": 1.77, + "learning_rate": 7.602152349742443e-07, + "loss": 0.6514, + "step": 69031 + }, + { + "epoch": 1.77, + "learning_rate": 7.601883718679146e-07, + "loss": 0.5957, + "step": 69032 + }, + { + "epoch": 1.77, + "learning_rate": 7.601615089451974e-07, + "loss": 0.6152, + "step": 69033 + }, + { + "epoch": 1.77, + "learning_rate": 7.601346462061138e-07, + "loss": 0.6123, + "step": 69034 + }, + { + "epoch": 1.77, + "learning_rate": 7.601077836506839e-07, + "loss": 0.502, + "step": 69035 + }, + { + "epoch": 1.77, + "learning_rate": 7.600809212789289e-07, + "loss": 0.6628, + "step": 69036 + }, + { + "epoch": 1.77, + "learning_rate": 7.600540590908683e-07, + "loss": 0.5791, + "step": 69037 + }, + { + "epoch": 1.77, + "learning_rate": 7.600271970865235e-07, + "loss": 0.6699, + "step": 69038 + }, + { + "epoch": 1.77, + "learning_rate": 7.600003352659146e-07, + "loss": 0.4398, + "step": 69039 + }, + { + "epoch": 1.77, + "learning_rate": 7.599734736290627e-07, + "loss": 0.6248, + "step": 69040 + }, + { + "epoch": 1.77, + "learning_rate": 7.599466121759878e-07, + "loss": 0.6914, + "step": 69041 + }, + { + "epoch": 1.77, + "learning_rate": 7.599197509067112e-07, + "loss": 0.689, + "step": 69042 + }, + { + "epoch": 1.77, + "learning_rate": 7.598928898212524e-07, + "loss": 0.8286, + "step": 69043 + }, + { + "epoch": 1.77, + "learning_rate": 7.59866028919633e-07, + "loss": 0.6436, + "step": 69044 + }, + { + "epoch": 1.77, + "learning_rate": 7.598391682018729e-07, + "loss": 0.5264, + "step": 69045 + }, + { + "epoch": 1.77, + "learning_rate": 7.598123076679935e-07, + "loss": 0.7334, + "step": 69046 + }, + { + "epoch": 1.77, + "learning_rate": 7.597854473180143e-07, + "loss": 0.6519, + "step": 69047 + }, + { + "epoch": 1.77, + "learning_rate": 7.597585871519563e-07, + "loss": 0.5552, + "step": 69048 + }, + { + "epoch": 1.77, + "learning_rate": 7.597317271698402e-07, + "loss": 0.7871, + "step": 69049 + }, + { + "epoch": 1.77, + "learning_rate": 7.597048673716863e-07, + "loss": 0.4691, + "step": 69050 + }, + { + "epoch": 1.77, + "learning_rate": 7.596780077575156e-07, + "loss": 0.6787, + "step": 69051 + }, + { + "epoch": 1.77, + "learning_rate": 7.596511483273482e-07, + "loss": 0.582, + "step": 69052 + }, + { + "epoch": 1.77, + "learning_rate": 7.596242890812047e-07, + "loss": 0.6782, + "step": 69053 + }, + { + "epoch": 1.77, + "learning_rate": 7.595974300191063e-07, + "loss": 0.6025, + "step": 69054 + }, + { + "epoch": 1.77, + "learning_rate": 7.595705711410727e-07, + "loss": 0.7036, + "step": 69055 + }, + { + "epoch": 1.77, + "learning_rate": 7.595437124471253e-07, + "loss": 0.582, + "step": 69056 + }, + { + "epoch": 1.77, + "learning_rate": 7.59516853937284e-07, + "loss": 0.6797, + "step": 69057 + }, + { + "epoch": 1.77, + "learning_rate": 7.594899956115693e-07, + "loss": 0.7451, + "step": 69058 + }, + { + "epoch": 1.77, + "learning_rate": 7.594631374700025e-07, + "loss": 0.5752, + "step": 69059 + }, + { + "epoch": 1.77, + "learning_rate": 7.594362795126032e-07, + "loss": 0.7178, + "step": 69060 + }, + { + "epoch": 1.77, + "learning_rate": 7.594094217393929e-07, + "loss": 0.6333, + "step": 69061 + }, + { + "epoch": 1.77, + "learning_rate": 7.593825641503915e-07, + "loss": 0.6626, + "step": 69062 + }, + { + "epoch": 1.77, + "learning_rate": 7.5935570674562e-07, + "loss": 0.8037, + "step": 69063 + }, + { + "epoch": 1.77, + "learning_rate": 7.593288495250985e-07, + "loss": 0.541, + "step": 69064 + }, + { + "epoch": 1.77, + "learning_rate": 7.593019924888481e-07, + "loss": 0.5703, + "step": 69065 + }, + { + "epoch": 1.77, + "learning_rate": 7.592751356368892e-07, + "loss": 0.6934, + "step": 69066 + }, + { + "epoch": 1.77, + "learning_rate": 7.59248278969242e-07, + "loss": 0.4214, + "step": 69067 + }, + { + "epoch": 1.77, + "learning_rate": 7.592214224859275e-07, + "loss": 0.7051, + "step": 69068 + }, + { + "epoch": 1.77, + "learning_rate": 7.591945661869661e-07, + "loss": 0.5923, + "step": 69069 + }, + { + "epoch": 1.77, + "learning_rate": 7.591677100723782e-07, + "loss": 0.6357, + "step": 69070 + }, + { + "epoch": 1.77, + "learning_rate": 7.591408541421845e-07, + "loss": 0.8467, + "step": 69071 + }, + { + "epoch": 1.77, + "learning_rate": 7.591139983964054e-07, + "loss": 0.6084, + "step": 69072 + }, + { + "epoch": 1.77, + "learning_rate": 7.590871428350621e-07, + "loss": 0.644, + "step": 69073 + }, + { + "epoch": 1.77, + "learning_rate": 7.590602874581742e-07, + "loss": 0.7842, + "step": 69074 + }, + { + "epoch": 1.77, + "learning_rate": 7.590334322657631e-07, + "loss": 0.6982, + "step": 69075 + }, + { + "epoch": 1.77, + "learning_rate": 7.590065772578492e-07, + "loss": 0.5361, + "step": 69076 + }, + { + "epoch": 1.77, + "learning_rate": 7.589797224344525e-07, + "loss": 0.7383, + "step": 69077 + }, + { + "epoch": 1.77, + "learning_rate": 7.589528677955941e-07, + "loss": 0.5981, + "step": 69078 + }, + { + "epoch": 1.77, + "learning_rate": 7.589260133412942e-07, + "loss": 0.5029, + "step": 69079 + }, + { + "epoch": 1.77, + "learning_rate": 7.588991590715738e-07, + "loss": 0.7021, + "step": 69080 + }, + { + "epoch": 1.77, + "learning_rate": 7.58872304986453e-07, + "loss": 0.916, + "step": 69081 + }, + { + "epoch": 1.77, + "learning_rate": 7.588454510859528e-07, + "loss": 0.7705, + "step": 69082 + }, + { + "epoch": 1.77, + "learning_rate": 7.588185973700934e-07, + "loss": 0.7441, + "step": 69083 + }, + { + "epoch": 1.77, + "learning_rate": 7.587917438388958e-07, + "loss": 0.5654, + "step": 69084 + }, + { + "epoch": 1.77, + "learning_rate": 7.587648904923798e-07, + "loss": 0.6484, + "step": 69085 + }, + { + "epoch": 1.77, + "learning_rate": 7.587380373305673e-07, + "loss": 0.5898, + "step": 69086 + }, + { + "epoch": 1.77, + "learning_rate": 7.587111843534773e-07, + "loss": 0.5596, + "step": 69087 + }, + { + "epoch": 1.77, + "learning_rate": 7.586843315611311e-07, + "loss": 0.6118, + "step": 69088 + }, + { + "epoch": 1.77, + "learning_rate": 7.586574789535492e-07, + "loss": 0.6191, + "step": 69089 + }, + { + "epoch": 1.77, + "learning_rate": 7.586306265307523e-07, + "loss": 0.6606, + "step": 69090 + }, + { + "epoch": 1.77, + "learning_rate": 7.586037742927606e-07, + "loss": 0.5703, + "step": 69091 + }, + { + "epoch": 1.77, + "learning_rate": 7.585769222395951e-07, + "loss": 0.5137, + "step": 69092 + }, + { + "epoch": 1.77, + "learning_rate": 7.585500703712759e-07, + "loss": 0.6406, + "step": 69093 + }, + { + "epoch": 1.77, + "learning_rate": 7.585232186878242e-07, + "loss": 0.5991, + "step": 69094 + }, + { + "epoch": 1.77, + "learning_rate": 7.584963671892598e-07, + "loss": 0.6265, + "step": 69095 + }, + { + "epoch": 1.77, + "learning_rate": 7.584695158756042e-07, + "loss": 0.5806, + "step": 69096 + }, + { + "epoch": 1.77, + "learning_rate": 7.58442664746877e-07, + "loss": 0.561, + "step": 69097 + }, + { + "epoch": 1.77, + "learning_rate": 7.584158138030989e-07, + "loss": 0.7441, + "step": 69098 + }, + { + "epoch": 1.77, + "learning_rate": 7.583889630442911e-07, + "loss": 0.6895, + "step": 69099 + }, + { + "epoch": 1.77, + "learning_rate": 7.583621124704734e-07, + "loss": 0.708, + "step": 69100 + }, + { + "epoch": 1.77, + "learning_rate": 7.58335262081667e-07, + "loss": 0.6865, + "step": 69101 + }, + { + "epoch": 1.77, + "learning_rate": 7.58308411877892e-07, + "loss": 0.501, + "step": 69102 + }, + { + "epoch": 1.77, + "learning_rate": 7.582815618591694e-07, + "loss": 0.7549, + "step": 69103 + }, + { + "epoch": 1.77, + "learning_rate": 7.582547120255191e-07, + "loss": 0.6279, + "step": 69104 + }, + { + "epoch": 1.77, + "learning_rate": 7.582278623769623e-07, + "loss": 0.6611, + "step": 69105 + }, + { + "epoch": 1.77, + "learning_rate": 7.582010129135197e-07, + "loss": 0.6621, + "step": 69106 + }, + { + "epoch": 1.77, + "learning_rate": 7.581741636352111e-07, + "loss": 0.5605, + "step": 69107 + }, + { + "epoch": 1.77, + "learning_rate": 7.581473145420571e-07, + "loss": 0.6729, + "step": 69108 + }, + { + "epoch": 1.77, + "learning_rate": 7.58120465634079e-07, + "loss": 0.5723, + "step": 69109 + }, + { + "epoch": 1.77, + "learning_rate": 7.580936169112967e-07, + "loss": 0.6028, + "step": 69110 + }, + { + "epoch": 1.77, + "learning_rate": 7.580667683737312e-07, + "loss": 0.7568, + "step": 69111 + }, + { + "epoch": 1.77, + "learning_rate": 7.580399200214026e-07, + "loss": 0.4736, + "step": 69112 + }, + { + "epoch": 1.77, + "learning_rate": 7.580130718543318e-07, + "loss": 0.5376, + "step": 69113 + }, + { + "epoch": 1.77, + "learning_rate": 7.579862238725393e-07, + "loss": 0.564, + "step": 69114 + }, + { + "epoch": 1.77, + "learning_rate": 7.579593760760457e-07, + "loss": 0.6929, + "step": 69115 + }, + { + "epoch": 1.77, + "learning_rate": 7.579325284648716e-07, + "loss": 0.6094, + "step": 69116 + }, + { + "epoch": 1.77, + "learning_rate": 7.579056810390371e-07, + "loss": 0.7656, + "step": 69117 + }, + { + "epoch": 1.77, + "learning_rate": 7.578788337985633e-07, + "loss": 0.6675, + "step": 69118 + }, + { + "epoch": 1.77, + "learning_rate": 7.578519867434704e-07, + "loss": 0.604, + "step": 69119 + }, + { + "epoch": 1.77, + "learning_rate": 7.578251398737793e-07, + "loss": 0.542, + "step": 69120 + }, + { + "epoch": 1.77, + "learning_rate": 7.577982931895101e-07, + "loss": 0.6084, + "step": 69121 + }, + { + "epoch": 1.77, + "learning_rate": 7.577714466906837e-07, + "loss": 0.6924, + "step": 69122 + }, + { + "epoch": 1.77, + "learning_rate": 7.577446003773204e-07, + "loss": 0.6523, + "step": 69123 + }, + { + "epoch": 1.77, + "learning_rate": 7.577177542494412e-07, + "loss": 0.6963, + "step": 69124 + }, + { + "epoch": 1.77, + "learning_rate": 7.576909083070665e-07, + "loss": 0.8154, + "step": 69125 + }, + { + "epoch": 1.77, + "learning_rate": 7.576640625502169e-07, + "loss": 0.7988, + "step": 69126 + }, + { + "epoch": 1.77, + "learning_rate": 7.576372169789122e-07, + "loss": 0.6128, + "step": 69127 + }, + { + "epoch": 1.77, + "learning_rate": 7.576103715931739e-07, + "loss": 0.7549, + "step": 69128 + }, + { + "epoch": 1.77, + "learning_rate": 7.575835263930218e-07, + "loss": 0.4854, + "step": 69129 + }, + { + "epoch": 1.77, + "learning_rate": 7.575566813784771e-07, + "loss": 0.4802, + "step": 69130 + }, + { + "epoch": 1.77, + "learning_rate": 7.5752983654956e-07, + "loss": 0.6045, + "step": 69131 + }, + { + "epoch": 1.77, + "learning_rate": 7.575029919062914e-07, + "loss": 0.4613, + "step": 69132 + }, + { + "epoch": 1.77, + "learning_rate": 7.574761474486913e-07, + "loss": 0.6079, + "step": 69133 + }, + { + "epoch": 1.77, + "learning_rate": 7.574493031767808e-07, + "loss": 0.5361, + "step": 69134 + }, + { + "epoch": 1.77, + "learning_rate": 7.5742245909058e-07, + "loss": 0.6885, + "step": 69135 + }, + { + "epoch": 1.77, + "learning_rate": 7.573956151901101e-07, + "loss": 0.7388, + "step": 69136 + }, + { + "epoch": 1.77, + "learning_rate": 7.57368771475391e-07, + "loss": 0.4663, + "step": 69137 + }, + { + "epoch": 1.77, + "learning_rate": 7.573419279464433e-07, + "loss": 0.6182, + "step": 69138 + }, + { + "epoch": 1.77, + "learning_rate": 7.573150846032879e-07, + "loss": 0.5903, + "step": 69139 + }, + { + "epoch": 1.77, + "learning_rate": 7.572882414459449e-07, + "loss": 0.4796, + "step": 69140 + }, + { + "epoch": 1.77, + "learning_rate": 7.572613984744355e-07, + "loss": 0.7686, + "step": 69141 + }, + { + "epoch": 1.77, + "learning_rate": 7.572345556887798e-07, + "loss": 0.8164, + "step": 69142 + }, + { + "epoch": 1.77, + "learning_rate": 7.572077130889982e-07, + "loss": 0.6621, + "step": 69143 + }, + { + "epoch": 1.77, + "learning_rate": 7.571808706751117e-07, + "loss": 0.499, + "step": 69144 + }, + { + "epoch": 1.77, + "learning_rate": 7.571540284471405e-07, + "loss": 0.582, + "step": 69145 + }, + { + "epoch": 1.77, + "learning_rate": 7.571271864051056e-07, + "loss": 0.4155, + "step": 69146 + }, + { + "epoch": 1.77, + "learning_rate": 7.571003445490272e-07, + "loss": 0.7173, + "step": 69147 + }, + { + "epoch": 1.77, + "learning_rate": 7.570735028789256e-07, + "loss": 0.7725, + "step": 69148 + }, + { + "epoch": 1.77, + "learning_rate": 7.570466613948218e-07, + "loss": 0.4927, + "step": 69149 + }, + { + "epoch": 1.77, + "learning_rate": 7.570198200967362e-07, + "loss": 0.54, + "step": 69150 + }, + { + "epoch": 1.77, + "learning_rate": 7.569929789846893e-07, + "loss": 0.5552, + "step": 69151 + }, + { + "epoch": 1.77, + "learning_rate": 7.569661380587016e-07, + "loss": 0.8271, + "step": 69152 + }, + { + "epoch": 1.77, + "learning_rate": 7.56939297318794e-07, + "loss": 0.6982, + "step": 69153 + }, + { + "epoch": 1.77, + "learning_rate": 7.569124567649865e-07, + "loss": 0.5654, + "step": 69154 + }, + { + "epoch": 1.77, + "learning_rate": 7.568856163973005e-07, + "loss": 0.5459, + "step": 69155 + }, + { + "epoch": 1.77, + "learning_rate": 7.568587762157557e-07, + "loss": 0.6846, + "step": 69156 + }, + { + "epoch": 1.77, + "learning_rate": 7.568319362203728e-07, + "loss": 0.5898, + "step": 69157 + }, + { + "epoch": 1.77, + "learning_rate": 7.568050964111727e-07, + "loss": 0.793, + "step": 69158 + }, + { + "epoch": 1.77, + "learning_rate": 7.567782567881757e-07, + "loss": 0.4506, + "step": 69159 + }, + { + "epoch": 1.77, + "learning_rate": 7.567514173514023e-07, + "loss": 0.4351, + "step": 69160 + }, + { + "epoch": 1.77, + "learning_rate": 7.567245781008734e-07, + "loss": 0.729, + "step": 69161 + }, + { + "epoch": 1.77, + "learning_rate": 7.566977390366088e-07, + "loss": 0.6372, + "step": 69162 + }, + { + "epoch": 1.77, + "learning_rate": 7.5667090015863e-07, + "loss": 0.5887, + "step": 69163 + }, + { + "epoch": 1.77, + "learning_rate": 7.566440614669569e-07, + "loss": 0.6436, + "step": 69164 + }, + { + "epoch": 1.77, + "learning_rate": 7.566172229616106e-07, + "loss": 0.4547, + "step": 69165 + }, + { + "epoch": 1.77, + "learning_rate": 7.565903846426111e-07, + "loss": 0.4746, + "step": 69166 + }, + { + "epoch": 1.77, + "learning_rate": 7.56563546509979e-07, + "loss": 0.6543, + "step": 69167 + }, + { + "epoch": 1.77, + "learning_rate": 7.565367085637352e-07, + "loss": 0.668, + "step": 69168 + }, + { + "epoch": 1.77, + "learning_rate": 7.565098708038997e-07, + "loss": 0.6899, + "step": 69169 + }, + { + "epoch": 1.77, + "learning_rate": 7.564830332304938e-07, + "loss": 0.8311, + "step": 69170 + }, + { + "epoch": 1.77, + "learning_rate": 7.564561958435373e-07, + "loss": 0.7422, + "step": 69171 + }, + { + "epoch": 1.77, + "learning_rate": 7.564293586430514e-07, + "loss": 0.6812, + "step": 69172 + }, + { + "epoch": 1.77, + "learning_rate": 7.56402521629056e-07, + "loss": 0.623, + "step": 69173 + }, + { + "epoch": 1.77, + "learning_rate": 7.563756848015723e-07, + "loss": 0.6704, + "step": 69174 + }, + { + "epoch": 1.77, + "learning_rate": 7.563488481606209e-07, + "loss": 0.5903, + "step": 69175 + }, + { + "epoch": 1.77, + "learning_rate": 7.563220117062212e-07, + "loss": 0.7266, + "step": 69176 + }, + { + "epoch": 1.77, + "learning_rate": 7.562951754383951e-07, + "loss": 0.6372, + "step": 69177 + }, + { + "epoch": 1.77, + "learning_rate": 7.562683393571622e-07, + "loss": 0.5547, + "step": 69178 + }, + { + "epoch": 1.77, + "learning_rate": 7.562415034625436e-07, + "loss": 0.749, + "step": 69179 + }, + { + "epoch": 1.77, + "learning_rate": 7.562146677545596e-07, + "loss": 0.6953, + "step": 69180 + }, + { + "epoch": 1.77, + "learning_rate": 7.561878322332307e-07, + "loss": 0.5498, + "step": 69181 + }, + { + "epoch": 1.77, + "learning_rate": 7.561609968985778e-07, + "loss": 0.645, + "step": 69182 + }, + { + "epoch": 1.77, + "learning_rate": 7.561341617506211e-07, + "loss": 0.6582, + "step": 69183 + }, + { + "epoch": 1.77, + "learning_rate": 7.561073267893813e-07, + "loss": 0.6514, + "step": 69184 + }, + { + "epoch": 1.77, + "learning_rate": 7.560804920148792e-07, + "loss": 0.6885, + "step": 69185 + }, + { + "epoch": 1.77, + "learning_rate": 7.560536574271345e-07, + "loss": 0.7515, + "step": 69186 + }, + { + "epoch": 1.77, + "learning_rate": 7.560268230261687e-07, + "loss": 0.5889, + "step": 69187 + }, + { + "epoch": 1.77, + "learning_rate": 7.559999888120017e-07, + "loss": 0.4897, + "step": 69188 + }, + { + "epoch": 1.77, + "learning_rate": 7.559731547846544e-07, + "loss": 0.6128, + "step": 69189 + }, + { + "epoch": 1.77, + "learning_rate": 7.559463209441471e-07, + "loss": 0.623, + "step": 69190 + }, + { + "epoch": 1.77, + "learning_rate": 7.559194872905005e-07, + "loss": 0.6782, + "step": 69191 + }, + { + "epoch": 1.77, + "learning_rate": 7.558926538237353e-07, + "loss": 0.6777, + "step": 69192 + }, + { + "epoch": 1.77, + "learning_rate": 7.558658205438718e-07, + "loss": 0.4617, + "step": 69193 + }, + { + "epoch": 1.77, + "learning_rate": 7.558389874509305e-07, + "loss": 0.5347, + "step": 69194 + }, + { + "epoch": 1.77, + "learning_rate": 7.558121545449327e-07, + "loss": 0.4531, + "step": 69195 + }, + { + "epoch": 1.77, + "learning_rate": 7.557853218258976e-07, + "loss": 0.6504, + "step": 69196 + }, + { + "epoch": 1.77, + "learning_rate": 7.557584892938466e-07, + "loss": 0.7432, + "step": 69197 + }, + { + "epoch": 1.77, + "learning_rate": 7.557316569488e-07, + "loss": 0.6211, + "step": 69198 + }, + { + "epoch": 1.77, + "learning_rate": 7.557048247907787e-07, + "loss": 0.6326, + "step": 69199 + }, + { + "epoch": 1.77, + "learning_rate": 7.556779928198027e-07, + "loss": 0.5432, + "step": 69200 + }, + { + "epoch": 1.77, + "learning_rate": 7.55651161035893e-07, + "loss": 0.7031, + "step": 69201 + }, + { + "epoch": 1.77, + "learning_rate": 7.556243294390699e-07, + "loss": 0.6167, + "step": 69202 + }, + { + "epoch": 1.77, + "learning_rate": 7.55597498029354e-07, + "loss": 0.4595, + "step": 69203 + }, + { + "epoch": 1.77, + "learning_rate": 7.555706668067658e-07, + "loss": 0.6367, + "step": 69204 + }, + { + "epoch": 1.77, + "learning_rate": 7.555438357713262e-07, + "loss": 0.7324, + "step": 69205 + }, + { + "epoch": 1.77, + "learning_rate": 7.555170049230554e-07, + "loss": 0.5688, + "step": 69206 + }, + { + "epoch": 1.77, + "learning_rate": 7.554901742619737e-07, + "loss": 0.6958, + "step": 69207 + }, + { + "epoch": 1.77, + "learning_rate": 7.554633437881021e-07, + "loss": 0.6328, + "step": 69208 + }, + { + "epoch": 1.77, + "learning_rate": 7.554365135014609e-07, + "loss": 0.791, + "step": 69209 + }, + { + "epoch": 1.77, + "learning_rate": 7.554096834020707e-07, + "loss": 0.6782, + "step": 69210 + }, + { + "epoch": 1.77, + "learning_rate": 7.55382853489952e-07, + "loss": 0.5142, + "step": 69211 + }, + { + "epoch": 1.77, + "learning_rate": 7.553560237651256e-07, + "loss": 0.7373, + "step": 69212 + }, + { + "epoch": 1.77, + "learning_rate": 7.553291942276116e-07, + "loss": 0.6875, + "step": 69213 + }, + { + "epoch": 1.77, + "learning_rate": 7.55302364877431e-07, + "loss": 0.552, + "step": 69214 + }, + { + "epoch": 1.77, + "learning_rate": 7.552755357146044e-07, + "loss": 0.5933, + "step": 69215 + }, + { + "epoch": 1.77, + "learning_rate": 7.552487067391518e-07, + "loss": 0.7246, + "step": 69216 + }, + { + "epoch": 1.77, + "learning_rate": 7.55221877951094e-07, + "loss": 0.8877, + "step": 69217 + }, + { + "epoch": 1.77, + "learning_rate": 7.551950493504514e-07, + "loss": 0.4077, + "step": 69218 + }, + { + "epoch": 1.77, + "learning_rate": 7.551682209372447e-07, + "loss": 0.644, + "step": 69219 + }, + { + "epoch": 1.77, + "learning_rate": 7.551413927114946e-07, + "loss": 0.6133, + "step": 69220 + }, + { + "epoch": 1.77, + "learning_rate": 7.551145646732213e-07, + "loss": 0.7183, + "step": 69221 + }, + { + "epoch": 1.77, + "learning_rate": 7.550877368224458e-07, + "loss": 0.6895, + "step": 69222 + }, + { + "epoch": 1.77, + "learning_rate": 7.550609091591879e-07, + "loss": 0.6416, + "step": 69223 + }, + { + "epoch": 1.77, + "learning_rate": 7.55034081683469e-07, + "loss": 0.6885, + "step": 69224 + }, + { + "epoch": 1.77, + "learning_rate": 7.550072543953095e-07, + "loss": 0.6719, + "step": 69225 + }, + { + "epoch": 1.77, + "learning_rate": 7.549804272947292e-07, + "loss": 0.6058, + "step": 69226 + }, + { + "epoch": 1.77, + "learning_rate": 7.549536003817493e-07, + "loss": 0.5225, + "step": 69227 + }, + { + "epoch": 1.77, + "learning_rate": 7.549267736563899e-07, + "loss": 0.7031, + "step": 69228 + }, + { + "epoch": 1.77, + "learning_rate": 7.548999471186722e-07, + "loss": 0.6216, + "step": 69229 + }, + { + "epoch": 1.77, + "learning_rate": 7.548731207686159e-07, + "loss": 0.6543, + "step": 69230 + }, + { + "epoch": 1.77, + "learning_rate": 7.548462946062423e-07, + "loss": 0.5562, + "step": 69231 + }, + { + "epoch": 1.77, + "learning_rate": 7.548194686315715e-07, + "loss": 0.7451, + "step": 69232 + }, + { + "epoch": 1.77, + "learning_rate": 7.54792642844624e-07, + "loss": 0.8564, + "step": 69233 + }, + { + "epoch": 1.77, + "learning_rate": 7.547658172454209e-07, + "loss": 0.5991, + "step": 69234 + }, + { + "epoch": 1.77, + "learning_rate": 7.547389918339823e-07, + "loss": 0.5151, + "step": 69235 + }, + { + "epoch": 1.77, + "learning_rate": 7.547121666103286e-07, + "loss": 0.5918, + "step": 69236 + }, + { + "epoch": 1.77, + "learning_rate": 7.546853415744805e-07, + "loss": 0.7773, + "step": 69237 + }, + { + "epoch": 1.77, + "learning_rate": 7.546585167264586e-07, + "loss": 0.6021, + "step": 69238 + }, + { + "epoch": 1.77, + "learning_rate": 7.546316920662833e-07, + "loss": 0.6836, + "step": 69239 + }, + { + "epoch": 1.77, + "learning_rate": 7.546048675939751e-07, + "loss": 0.4785, + "step": 69240 + }, + { + "epoch": 1.77, + "learning_rate": 7.54578043309555e-07, + "loss": 0.6699, + "step": 69241 + }, + { + "epoch": 1.77, + "learning_rate": 7.54551219213043e-07, + "loss": 0.7314, + "step": 69242 + }, + { + "epoch": 1.77, + "learning_rate": 7.5452439530446e-07, + "loss": 0.5371, + "step": 69243 + }, + { + "epoch": 1.77, + "learning_rate": 7.54497571583826e-07, + "loss": 0.6566, + "step": 69244 + }, + { + "epoch": 1.77, + "learning_rate": 7.544707480511626e-07, + "loss": 0.5835, + "step": 69245 + }, + { + "epoch": 1.77, + "learning_rate": 7.544439247064893e-07, + "loss": 0.7744, + "step": 69246 + }, + { + "epoch": 1.77, + "learning_rate": 7.54417101549827e-07, + "loss": 0.6162, + "step": 69247 + }, + { + "epoch": 1.77, + "learning_rate": 7.543902785811962e-07, + "loss": 0.6006, + "step": 69248 + }, + { + "epoch": 1.77, + "learning_rate": 7.543634558006176e-07, + "loss": 0.6523, + "step": 69249 + }, + { + "epoch": 1.77, + "learning_rate": 7.543366332081114e-07, + "loss": 0.7559, + "step": 69250 + }, + { + "epoch": 1.77, + "learning_rate": 7.543098108036985e-07, + "loss": 0.5723, + "step": 69251 + }, + { + "epoch": 1.77, + "learning_rate": 7.542829885873991e-07, + "loss": 0.478, + "step": 69252 + }, + { + "epoch": 1.77, + "learning_rate": 7.54256166559234e-07, + "loss": 0.7534, + "step": 69253 + }, + { + "epoch": 1.78, + "learning_rate": 7.542293447192236e-07, + "loss": 0.5527, + "step": 69254 + }, + { + "epoch": 1.78, + "learning_rate": 7.542025230673888e-07, + "loss": 0.4822, + "step": 69255 + }, + { + "epoch": 1.78, + "learning_rate": 7.541757016037497e-07, + "loss": 0.5962, + "step": 69256 + }, + { + "epoch": 1.78, + "learning_rate": 7.541488803283267e-07, + "loss": 0.5624, + "step": 69257 + }, + { + "epoch": 1.78, + "learning_rate": 7.541220592411408e-07, + "loss": 0.4399, + "step": 69258 + }, + { + "epoch": 1.78, + "learning_rate": 7.540952383422122e-07, + "loss": 0.6147, + "step": 69259 + }, + { + "epoch": 1.78, + "learning_rate": 7.540684176315617e-07, + "loss": 0.5352, + "step": 69260 + }, + { + "epoch": 1.78, + "learning_rate": 7.540415971092096e-07, + "loss": 0.6631, + "step": 69261 + }, + { + "epoch": 1.78, + "learning_rate": 7.540147767751766e-07, + "loss": 0.6431, + "step": 69262 + }, + { + "epoch": 1.78, + "learning_rate": 7.539879566294832e-07, + "loss": 0.4443, + "step": 69263 + }, + { + "epoch": 1.78, + "learning_rate": 7.539611366721499e-07, + "loss": 0.7104, + "step": 69264 + }, + { + "epoch": 1.78, + "learning_rate": 7.539343169031975e-07, + "loss": 0.5862, + "step": 69265 + }, + { + "epoch": 1.78, + "learning_rate": 7.539074973226459e-07, + "loss": 0.4834, + "step": 69266 + }, + { + "epoch": 1.78, + "learning_rate": 7.538806779305162e-07, + "loss": 0.5742, + "step": 69267 + }, + { + "epoch": 1.78, + "learning_rate": 7.538538587268287e-07, + "loss": 0.5747, + "step": 69268 + }, + { + "epoch": 1.78, + "learning_rate": 7.538270397116038e-07, + "loss": 0.6401, + "step": 69269 + }, + { + "epoch": 1.78, + "learning_rate": 7.538002208848625e-07, + "loss": 0.6348, + "step": 69270 + }, + { + "epoch": 1.78, + "learning_rate": 7.537734022466248e-07, + "loss": 0.6758, + "step": 69271 + }, + { + "epoch": 1.78, + "learning_rate": 7.537465837969117e-07, + "loss": 0.4912, + "step": 69272 + }, + { + "epoch": 1.78, + "learning_rate": 7.537197655357433e-07, + "loss": 0.5435, + "step": 69273 + }, + { + "epoch": 1.78, + "learning_rate": 7.536929474631405e-07, + "loss": 0.7734, + "step": 69274 + }, + { + "epoch": 1.78, + "learning_rate": 7.53666129579124e-07, + "loss": 0.7441, + "step": 69275 + }, + { + "epoch": 1.78, + "learning_rate": 7.536393118837136e-07, + "loss": 0.8574, + "step": 69276 + }, + { + "epoch": 1.78, + "learning_rate": 7.536124943769303e-07, + "loss": 0.52, + "step": 69277 + }, + { + "epoch": 1.78, + "learning_rate": 7.535856770587945e-07, + "loss": 0.6689, + "step": 69278 + }, + { + "epoch": 1.78, + "learning_rate": 7.53558859929327e-07, + "loss": 0.6533, + "step": 69279 + }, + { + "epoch": 1.78, + "learning_rate": 7.535320429885478e-07, + "loss": 0.4573, + "step": 69280 + }, + { + "epoch": 1.78, + "learning_rate": 7.535052262364782e-07, + "loss": 0.5977, + "step": 69281 + }, + { + "epoch": 1.78, + "learning_rate": 7.534784096731381e-07, + "loss": 0.7471, + "step": 69282 + }, + { + "epoch": 1.78, + "learning_rate": 7.534515932985484e-07, + "loss": 0.5576, + "step": 69283 + }, + { + "epoch": 1.78, + "learning_rate": 7.534247771127293e-07, + "loss": 0.7188, + "step": 69284 + }, + { + "epoch": 1.78, + "learning_rate": 7.533979611157021e-07, + "loss": 0.6089, + "step": 69285 + }, + { + "epoch": 1.78, + "learning_rate": 7.533711453074861e-07, + "loss": 0.6372, + "step": 69286 + }, + { + "epoch": 1.78, + "learning_rate": 7.533443296881028e-07, + "loss": 0.7109, + "step": 69287 + }, + { + "epoch": 1.78, + "learning_rate": 7.533175142575721e-07, + "loss": 0.6079, + "step": 69288 + }, + { + "epoch": 1.78, + "learning_rate": 7.532906990159149e-07, + "loss": 0.7129, + "step": 69289 + }, + { + "epoch": 1.78, + "learning_rate": 7.532638839631516e-07, + "loss": 0.6763, + "step": 69290 + }, + { + "epoch": 1.78, + "learning_rate": 7.532370690993031e-07, + "loss": 0.5933, + "step": 69291 + }, + { + "epoch": 1.78, + "learning_rate": 7.532102544243893e-07, + "loss": 0.6416, + "step": 69292 + }, + { + "epoch": 1.78, + "learning_rate": 7.531834399384314e-07, + "loss": 0.6699, + "step": 69293 + }, + { + "epoch": 1.78, + "learning_rate": 7.531566256414492e-07, + "loss": 0.5094, + "step": 69294 + }, + { + "epoch": 1.78, + "learning_rate": 7.531298115334641e-07, + "loss": 0.499, + "step": 69295 + }, + { + "epoch": 1.78, + "learning_rate": 7.53102997614496e-07, + "loss": 0.5391, + "step": 69296 + }, + { + "epoch": 1.78, + "learning_rate": 7.530761838845653e-07, + "loss": 0.6602, + "step": 69297 + }, + { + "epoch": 1.78, + "learning_rate": 7.530493703436931e-07, + "loss": 0.6953, + "step": 69298 + }, + { + "epoch": 1.78, + "learning_rate": 7.530225569918993e-07, + "loss": 0.5165, + "step": 69299 + }, + { + "epoch": 1.78, + "learning_rate": 7.529957438292052e-07, + "loss": 0.5049, + "step": 69300 + }, + { + "epoch": 1.78, + "learning_rate": 7.529689308556305e-07, + "loss": 0.4843, + "step": 69301 + }, + { + "epoch": 1.78, + "learning_rate": 7.529421180711964e-07, + "loss": 0.6182, + "step": 69302 + }, + { + "epoch": 1.78, + "learning_rate": 7.52915305475923e-07, + "loss": 0.8311, + "step": 69303 + }, + { + "epoch": 1.78, + "learning_rate": 7.528884930698312e-07, + "loss": 0.5791, + "step": 69304 + }, + { + "epoch": 1.78, + "learning_rate": 7.528616808529415e-07, + "loss": 0.7334, + "step": 69305 + }, + { + "epoch": 1.78, + "learning_rate": 7.528348688252739e-07, + "loss": 0.6223, + "step": 69306 + }, + { + "epoch": 1.78, + "learning_rate": 7.528080569868492e-07, + "loss": 0.5408, + "step": 69307 + }, + { + "epoch": 1.78, + "learning_rate": 7.527812453376883e-07, + "loss": 0.6777, + "step": 69308 + }, + { + "epoch": 1.78, + "learning_rate": 7.527544338778112e-07, + "loss": 0.625, + "step": 69309 + }, + { + "epoch": 1.78, + "learning_rate": 7.527276226072386e-07, + "loss": 0.8169, + "step": 69310 + }, + { + "epoch": 1.78, + "learning_rate": 7.527008115259911e-07, + "loss": 0.6484, + "step": 69311 + }, + { + "epoch": 1.78, + "learning_rate": 7.526740006340894e-07, + "loss": 0.5552, + "step": 69312 + }, + { + "epoch": 1.78, + "learning_rate": 7.526471899315537e-07, + "loss": 0.5886, + "step": 69313 + }, + { + "epoch": 1.78, + "learning_rate": 7.526203794184048e-07, + "loss": 0.4897, + "step": 69314 + }, + { + "epoch": 1.78, + "learning_rate": 7.525935690946633e-07, + "loss": 0.792, + "step": 69315 + }, + { + "epoch": 1.78, + "learning_rate": 7.525667589603491e-07, + "loss": 0.791, + "step": 69316 + }, + { + "epoch": 1.78, + "learning_rate": 7.525399490154834e-07, + "loss": 0.7402, + "step": 69317 + }, + { + "epoch": 1.78, + "learning_rate": 7.525131392600863e-07, + "loss": 0.5674, + "step": 69318 + }, + { + "epoch": 1.78, + "learning_rate": 7.524863296941788e-07, + "loss": 0.791, + "step": 69319 + }, + { + "epoch": 1.78, + "learning_rate": 7.524595203177808e-07, + "loss": 0.6455, + "step": 69320 + }, + { + "epoch": 1.78, + "learning_rate": 7.524327111309135e-07, + "loss": 0.6926, + "step": 69321 + }, + { + "epoch": 1.78, + "learning_rate": 7.524059021335969e-07, + "loss": 0.7578, + "step": 69322 + }, + { + "epoch": 1.78, + "learning_rate": 7.523790933258516e-07, + "loss": 0.5894, + "step": 69323 + }, + { + "epoch": 1.78, + "learning_rate": 7.523522847076984e-07, + "loss": 0.709, + "step": 69324 + }, + { + "epoch": 1.78, + "learning_rate": 7.52325476279158e-07, + "loss": 0.5425, + "step": 69325 + }, + { + "epoch": 1.78, + "learning_rate": 7.5229866804025e-07, + "loss": 0.6335, + "step": 69326 + }, + { + "epoch": 1.78, + "learning_rate": 7.522718599909958e-07, + "loss": 0.5415, + "step": 69327 + }, + { + "epoch": 1.78, + "learning_rate": 7.522450521314155e-07, + "loss": 0.5469, + "step": 69328 + }, + { + "epoch": 1.78, + "learning_rate": 7.522182444615299e-07, + "loss": 0.6108, + "step": 69329 + }, + { + "epoch": 1.78, + "learning_rate": 7.521914369813594e-07, + "loss": 0.5757, + "step": 69330 + }, + { + "epoch": 1.78, + "learning_rate": 7.521646296909244e-07, + "loss": 0.6484, + "step": 69331 + }, + { + "epoch": 1.78, + "learning_rate": 7.521378225902455e-07, + "loss": 0.5439, + "step": 69332 + }, + { + "epoch": 1.78, + "learning_rate": 7.521110156793435e-07, + "loss": 0.4326, + "step": 69333 + }, + { + "epoch": 1.78, + "learning_rate": 7.520842089582386e-07, + "loss": 0.7725, + "step": 69334 + }, + { + "epoch": 1.78, + "learning_rate": 7.520574024269517e-07, + "loss": 0.4594, + "step": 69335 + }, + { + "epoch": 1.78, + "learning_rate": 7.520305960855028e-07, + "loss": 0.5566, + "step": 69336 + }, + { + "epoch": 1.78, + "learning_rate": 7.520037899339124e-07, + "loss": 0.6135, + "step": 69337 + }, + { + "epoch": 1.78, + "learning_rate": 7.519769839722017e-07, + "loss": 0.6006, + "step": 69338 + }, + { + "epoch": 1.78, + "learning_rate": 7.519501782003905e-07, + "loss": 0.7637, + "step": 69339 + }, + { + "epoch": 1.78, + "learning_rate": 7.519233726184999e-07, + "loss": 0.6533, + "step": 69340 + }, + { + "epoch": 1.78, + "learning_rate": 7.518965672265502e-07, + "loss": 0.5884, + "step": 69341 + }, + { + "epoch": 1.78, + "learning_rate": 7.518697620245616e-07, + "loss": 0.6533, + "step": 69342 + }, + { + "epoch": 1.78, + "learning_rate": 7.518429570125551e-07, + "loss": 0.6406, + "step": 69343 + }, + { + "epoch": 1.78, + "learning_rate": 7.51816152190551e-07, + "loss": 0.7539, + "step": 69344 + }, + { + "epoch": 1.78, + "learning_rate": 7.5178934755857e-07, + "loss": 0.5403, + "step": 69345 + }, + { + "epoch": 1.78, + "learning_rate": 7.517625431166325e-07, + "loss": 0.5488, + "step": 69346 + }, + { + "epoch": 1.78, + "learning_rate": 7.517357388647587e-07, + "loss": 0.6499, + "step": 69347 + }, + { + "epoch": 1.78, + "learning_rate": 7.517089348029697e-07, + "loss": 0.7188, + "step": 69348 + }, + { + "epoch": 1.78, + "learning_rate": 7.516821309312855e-07, + "loss": 0.6621, + "step": 69349 + }, + { + "epoch": 1.78, + "learning_rate": 7.51655327249727e-07, + "loss": 0.6626, + "step": 69350 + }, + { + "epoch": 1.78, + "learning_rate": 7.516285237583146e-07, + "loss": 0.644, + "step": 69351 + }, + { + "epoch": 1.78, + "learning_rate": 7.516017204570689e-07, + "loss": 0.6919, + "step": 69352 + }, + { + "epoch": 1.78, + "learning_rate": 7.515749173460101e-07, + "loss": 0.5918, + "step": 69353 + }, + { + "epoch": 1.78, + "learning_rate": 7.515481144251592e-07, + "loss": 0.7178, + "step": 69354 + }, + { + "epoch": 1.78, + "learning_rate": 7.515213116945367e-07, + "loss": 0.5212, + "step": 69355 + }, + { + "epoch": 1.78, + "learning_rate": 7.514945091541624e-07, + "loss": 0.6382, + "step": 69356 + }, + { + "epoch": 1.78, + "learning_rate": 7.514677068040578e-07, + "loss": 0.7197, + "step": 69357 + }, + { + "epoch": 1.78, + "learning_rate": 7.514409046442427e-07, + "loss": 0.5444, + "step": 69358 + }, + { + "epoch": 1.78, + "learning_rate": 7.514141026747378e-07, + "loss": 0.5752, + "step": 69359 + }, + { + "epoch": 1.78, + "learning_rate": 7.513873008955638e-07, + "loss": 0.6548, + "step": 69360 + }, + { + "epoch": 1.78, + "learning_rate": 7.513604993067409e-07, + "loss": 0.5918, + "step": 69361 + }, + { + "epoch": 1.78, + "learning_rate": 7.513336979082901e-07, + "loss": 0.6338, + "step": 69362 + }, + { + "epoch": 1.78, + "learning_rate": 7.513068967002314e-07, + "loss": 0.499, + "step": 69363 + }, + { + "epoch": 1.78, + "learning_rate": 7.512800956825859e-07, + "loss": 0.5188, + "step": 69364 + }, + { + "epoch": 1.78, + "learning_rate": 7.512532948553739e-07, + "loss": 0.689, + "step": 69365 + }, + { + "epoch": 1.78, + "learning_rate": 7.512264942186154e-07, + "loss": 0.5815, + "step": 69366 + }, + { + "epoch": 1.78, + "learning_rate": 7.511996937723316e-07, + "loss": 0.4506, + "step": 69367 + }, + { + "epoch": 1.78, + "learning_rate": 7.511728935165424e-07, + "loss": 0.7266, + "step": 69368 + }, + { + "epoch": 1.78, + "learning_rate": 7.51146093451269e-07, + "loss": 0.5508, + "step": 69369 + }, + { + "epoch": 1.78, + "learning_rate": 7.511192935765314e-07, + "loss": 0.709, + "step": 69370 + }, + { + "epoch": 1.78, + "learning_rate": 7.510924938923506e-07, + "loss": 0.5825, + "step": 69371 + }, + { + "epoch": 1.78, + "learning_rate": 7.510656943987464e-07, + "loss": 0.5972, + "step": 69372 + }, + { + "epoch": 1.78, + "learning_rate": 7.510388950957401e-07, + "loss": 0.7363, + "step": 69373 + }, + { + "epoch": 1.78, + "learning_rate": 7.510120959833517e-07, + "loss": 0.5283, + "step": 69374 + }, + { + "epoch": 1.78, + "learning_rate": 7.509852970616024e-07, + "loss": 0.5718, + "step": 69375 + }, + { + "epoch": 1.78, + "learning_rate": 7.509584983305116e-07, + "loss": 0.6924, + "step": 69376 + }, + { + "epoch": 1.78, + "learning_rate": 7.509316997901008e-07, + "loss": 0.604, + "step": 69377 + }, + { + "epoch": 1.78, + "learning_rate": 7.509049014403897e-07, + "loss": 0.7085, + "step": 69378 + }, + { + "epoch": 1.78, + "learning_rate": 7.508781032813996e-07, + "loss": 0.6475, + "step": 69379 + }, + { + "epoch": 1.78, + "learning_rate": 7.508513053131505e-07, + "loss": 0.377, + "step": 69380 + }, + { + "epoch": 1.78, + "learning_rate": 7.508245075356631e-07, + "loss": 0.624, + "step": 69381 + }, + { + "epoch": 1.78, + "learning_rate": 7.507977099489579e-07, + "loss": 0.6675, + "step": 69382 + }, + { + "epoch": 1.78, + "learning_rate": 7.507709125530557e-07, + "loss": 0.6582, + "step": 69383 + }, + { + "epoch": 1.78, + "learning_rate": 7.507441153479764e-07, + "loss": 0.5747, + "step": 69384 + }, + { + "epoch": 1.78, + "learning_rate": 7.507173183337415e-07, + "loss": 0.6729, + "step": 69385 + }, + { + "epoch": 1.78, + "learning_rate": 7.506905215103704e-07, + "loss": 0.5215, + "step": 69386 + }, + { + "epoch": 1.78, + "learning_rate": 7.50663724877884e-07, + "loss": 0.4514, + "step": 69387 + }, + { + "epoch": 1.78, + "learning_rate": 7.506369284363032e-07, + "loss": 0.5298, + "step": 69388 + }, + { + "epoch": 1.78, + "learning_rate": 7.50610132185648e-07, + "loss": 0.6348, + "step": 69389 + }, + { + "epoch": 1.78, + "learning_rate": 7.505833361259393e-07, + "loss": 0.6602, + "step": 69390 + }, + { + "epoch": 1.78, + "learning_rate": 7.505565402571973e-07, + "loss": 0.6816, + "step": 69391 + }, + { + "epoch": 1.78, + "learning_rate": 7.505297445794428e-07, + "loss": 0.7412, + "step": 69392 + }, + { + "epoch": 1.78, + "learning_rate": 7.505029490926962e-07, + "loss": 0.7227, + "step": 69393 + }, + { + "epoch": 1.78, + "learning_rate": 7.50476153796978e-07, + "loss": 0.6079, + "step": 69394 + }, + { + "epoch": 1.78, + "learning_rate": 7.504493586923091e-07, + "loss": 0.6592, + "step": 69395 + }, + { + "epoch": 1.78, + "learning_rate": 7.504225637787094e-07, + "loss": 0.7051, + "step": 69396 + }, + { + "epoch": 1.78, + "learning_rate": 7.503957690561995e-07, + "loss": 0.6592, + "step": 69397 + }, + { + "epoch": 1.78, + "learning_rate": 7.503689745248003e-07, + "loss": 0.6919, + "step": 69398 + }, + { + "epoch": 1.78, + "learning_rate": 7.503421801845318e-07, + "loss": 0.6523, + "step": 69399 + }, + { + "epoch": 1.78, + "learning_rate": 7.50315386035415e-07, + "loss": 0.5913, + "step": 69400 + }, + { + "epoch": 1.78, + "learning_rate": 7.502885920774702e-07, + "loss": 0.7422, + "step": 69401 + }, + { + "epoch": 1.78, + "learning_rate": 7.50261798310718e-07, + "loss": 0.7202, + "step": 69402 + }, + { + "epoch": 1.78, + "learning_rate": 7.502350047351786e-07, + "loss": 0.6016, + "step": 69403 + }, + { + "epoch": 1.78, + "learning_rate": 7.502082113508732e-07, + "loss": 0.7979, + "step": 69404 + }, + { + "epoch": 1.78, + "learning_rate": 7.501814181578219e-07, + "loss": 0.6836, + "step": 69405 + }, + { + "epoch": 1.78, + "learning_rate": 7.501546251560449e-07, + "loss": 0.6318, + "step": 69406 + }, + { + "epoch": 1.78, + "learning_rate": 7.501278323455631e-07, + "loss": 0.7832, + "step": 69407 + }, + { + "epoch": 1.78, + "learning_rate": 7.501010397263968e-07, + "loss": 0.686, + "step": 69408 + }, + { + "epoch": 1.78, + "learning_rate": 7.500742472985668e-07, + "loss": 0.689, + "step": 69409 + }, + { + "epoch": 1.78, + "learning_rate": 7.500474550620933e-07, + "loss": 0.6182, + "step": 69410 + }, + { + "epoch": 1.78, + "learning_rate": 7.500206630169972e-07, + "loss": 0.6128, + "step": 69411 + }, + { + "epoch": 1.78, + "learning_rate": 7.499938711632987e-07, + "loss": 0.5088, + "step": 69412 + }, + { + "epoch": 1.78, + "learning_rate": 7.499670795010183e-07, + "loss": 0.5361, + "step": 69413 + }, + { + "epoch": 1.78, + "learning_rate": 7.499402880301769e-07, + "loss": 0.5708, + "step": 69414 + }, + { + "epoch": 1.78, + "learning_rate": 7.499134967507947e-07, + "loss": 0.686, + "step": 69415 + }, + { + "epoch": 1.78, + "learning_rate": 7.49886705662892e-07, + "loss": 0.4614, + "step": 69416 + }, + { + "epoch": 1.78, + "learning_rate": 7.498599147664896e-07, + "loss": 0.6465, + "step": 69417 + }, + { + "epoch": 1.78, + "learning_rate": 7.498331240616078e-07, + "loss": 0.6357, + "step": 69418 + }, + { + "epoch": 1.78, + "learning_rate": 7.498063335482675e-07, + "loss": 0.6743, + "step": 69419 + }, + { + "epoch": 1.78, + "learning_rate": 7.497795432264888e-07, + "loss": 0.4443, + "step": 69420 + }, + { + "epoch": 1.78, + "learning_rate": 7.497527530962926e-07, + "loss": 0.4478, + "step": 69421 + }, + { + "epoch": 1.78, + "learning_rate": 7.49725963157699e-07, + "loss": 0.3788, + "step": 69422 + }, + { + "epoch": 1.78, + "learning_rate": 7.49699173410729e-07, + "loss": 0.5432, + "step": 69423 + }, + { + "epoch": 1.78, + "learning_rate": 7.496723838554025e-07, + "loss": 0.6426, + "step": 69424 + }, + { + "epoch": 1.78, + "learning_rate": 7.496455944917408e-07, + "loss": 0.5784, + "step": 69425 + }, + { + "epoch": 1.78, + "learning_rate": 7.496188053197637e-07, + "loss": 0.5796, + "step": 69426 + }, + { + "epoch": 1.78, + "learning_rate": 7.495920163394918e-07, + "loss": 0.5518, + "step": 69427 + }, + { + "epoch": 1.78, + "learning_rate": 7.495652275509461e-07, + "loss": 0.6045, + "step": 69428 + }, + { + "epoch": 1.78, + "learning_rate": 7.495384389541464e-07, + "loss": 0.5386, + "step": 69429 + }, + { + "epoch": 1.78, + "learning_rate": 7.495116505491139e-07, + "loss": 0.707, + "step": 69430 + }, + { + "epoch": 1.78, + "learning_rate": 7.494848623358688e-07, + "loss": 0.6523, + "step": 69431 + }, + { + "epoch": 1.78, + "learning_rate": 7.494580743144314e-07, + "loss": 0.4976, + "step": 69432 + }, + { + "epoch": 1.78, + "learning_rate": 7.494312864848227e-07, + "loss": 0.6377, + "step": 69433 + }, + { + "epoch": 1.78, + "learning_rate": 7.494044988470627e-07, + "loss": 0.6855, + "step": 69434 + }, + { + "epoch": 1.78, + "learning_rate": 7.493777114011726e-07, + "loss": 0.7578, + "step": 69435 + }, + { + "epoch": 1.78, + "learning_rate": 7.493509241471722e-07, + "loss": 0.6128, + "step": 69436 + }, + { + "epoch": 1.78, + "learning_rate": 7.49324137085082e-07, + "loss": 0.4553, + "step": 69437 + }, + { + "epoch": 1.78, + "learning_rate": 7.492973502149232e-07, + "loss": 0.5942, + "step": 69438 + }, + { + "epoch": 1.78, + "learning_rate": 7.492705635367156e-07, + "loss": 0.5952, + "step": 69439 + }, + { + "epoch": 1.78, + "learning_rate": 7.4924377705048e-07, + "loss": 0.5647, + "step": 69440 + }, + { + "epoch": 1.78, + "learning_rate": 7.492169907562369e-07, + "loss": 0.7783, + "step": 69441 + }, + { + "epoch": 1.78, + "learning_rate": 7.491902046540071e-07, + "loss": 0.6314, + "step": 69442 + }, + { + "epoch": 1.78, + "learning_rate": 7.491634187438105e-07, + "loss": 0.6611, + "step": 69443 + }, + { + "epoch": 1.78, + "learning_rate": 7.491366330256681e-07, + "loss": 0.5591, + "step": 69444 + }, + { + "epoch": 1.78, + "learning_rate": 7.491098474996005e-07, + "loss": 0.6494, + "step": 69445 + }, + { + "epoch": 1.78, + "learning_rate": 7.490830621656277e-07, + "loss": 0.6035, + "step": 69446 + }, + { + "epoch": 1.78, + "learning_rate": 7.490562770237703e-07, + "loss": 0.5444, + "step": 69447 + }, + { + "epoch": 1.78, + "learning_rate": 7.490294920740493e-07, + "loss": 0.6426, + "step": 69448 + }, + { + "epoch": 1.78, + "learning_rate": 7.490027073164847e-07, + "loss": 0.7026, + "step": 69449 + }, + { + "epoch": 1.78, + "learning_rate": 7.489759227510971e-07, + "loss": 0.5305, + "step": 69450 + }, + { + "epoch": 1.78, + "learning_rate": 7.489491383779071e-07, + "loss": 0.5166, + "step": 69451 + }, + { + "epoch": 1.78, + "learning_rate": 7.489223541969353e-07, + "loss": 0.7754, + "step": 69452 + }, + { + "epoch": 1.78, + "learning_rate": 7.488955702082019e-07, + "loss": 0.6807, + "step": 69453 + }, + { + "epoch": 1.78, + "learning_rate": 7.488687864117281e-07, + "loss": 0.5241, + "step": 69454 + }, + { + "epoch": 1.78, + "learning_rate": 7.488420028075337e-07, + "loss": 0.6387, + "step": 69455 + }, + { + "epoch": 1.78, + "learning_rate": 7.488152193956392e-07, + "loss": 0.6709, + "step": 69456 + }, + { + "epoch": 1.78, + "learning_rate": 7.487884361760657e-07, + "loss": 0.4626, + "step": 69457 + }, + { + "epoch": 1.78, + "learning_rate": 7.487616531488329e-07, + "loss": 0.6162, + "step": 69458 + }, + { + "epoch": 1.78, + "learning_rate": 7.48734870313962e-07, + "loss": 0.5728, + "step": 69459 + }, + { + "epoch": 1.78, + "learning_rate": 7.487080876714731e-07, + "loss": 0.6704, + "step": 69460 + }, + { + "epoch": 1.78, + "learning_rate": 7.486813052213872e-07, + "loss": 0.6924, + "step": 69461 + }, + { + "epoch": 1.78, + "learning_rate": 7.48654522963724e-07, + "loss": 0.7783, + "step": 69462 + }, + { + "epoch": 1.78, + "learning_rate": 7.486277408985049e-07, + "loss": 0.5234, + "step": 69463 + }, + { + "epoch": 1.78, + "learning_rate": 7.4860095902575e-07, + "loss": 0.6235, + "step": 69464 + }, + { + "epoch": 1.78, + "learning_rate": 7.485741773454798e-07, + "loss": 0.5244, + "step": 69465 + }, + { + "epoch": 1.78, + "learning_rate": 7.485473958577144e-07, + "loss": 0.5369, + "step": 69466 + }, + { + "epoch": 1.78, + "learning_rate": 7.485206145624749e-07, + "loss": 0.707, + "step": 69467 + }, + { + "epoch": 1.78, + "learning_rate": 7.484938334597815e-07, + "loss": 0.6963, + "step": 69468 + }, + { + "epoch": 1.78, + "learning_rate": 7.484670525496551e-07, + "loss": 0.6963, + "step": 69469 + }, + { + "epoch": 1.78, + "learning_rate": 7.484402718321155e-07, + "loss": 0.5732, + "step": 69470 + }, + { + "epoch": 1.78, + "learning_rate": 7.48413491307184e-07, + "loss": 0.5557, + "step": 69471 + }, + { + "epoch": 1.78, + "learning_rate": 7.483867109748804e-07, + "loss": 0.5649, + "step": 69472 + }, + { + "epoch": 1.78, + "learning_rate": 7.483599308352258e-07, + "loss": 0.5557, + "step": 69473 + }, + { + "epoch": 1.78, + "learning_rate": 7.483331508882405e-07, + "loss": 0.7041, + "step": 69474 + }, + { + "epoch": 1.78, + "learning_rate": 7.483063711339446e-07, + "loss": 0.4834, + "step": 69475 + }, + { + "epoch": 1.78, + "learning_rate": 7.482795915723592e-07, + "loss": 0.4556, + "step": 69476 + }, + { + "epoch": 1.78, + "learning_rate": 7.482528122035044e-07, + "loss": 0.6719, + "step": 69477 + }, + { + "epoch": 1.78, + "learning_rate": 7.482260330274009e-07, + "loss": 0.7637, + "step": 69478 + }, + { + "epoch": 1.78, + "learning_rate": 7.481992540440689e-07, + "loss": 0.6465, + "step": 69479 + }, + { + "epoch": 1.78, + "learning_rate": 7.481724752535294e-07, + "loss": 0.4971, + "step": 69480 + }, + { + "epoch": 1.78, + "learning_rate": 7.481456966558026e-07, + "loss": 0.6094, + "step": 69481 + }, + { + "epoch": 1.78, + "learning_rate": 7.481189182509092e-07, + "loss": 0.5626, + "step": 69482 + }, + { + "epoch": 1.78, + "learning_rate": 7.480921400388693e-07, + "loss": 0.7881, + "step": 69483 + }, + { + "epoch": 1.78, + "learning_rate": 7.480653620197044e-07, + "loss": 0.5217, + "step": 69484 + }, + { + "epoch": 1.78, + "learning_rate": 7.480385841934335e-07, + "loss": 0.3916, + "step": 69485 + }, + { + "epoch": 1.78, + "learning_rate": 7.480118065600781e-07, + "loss": 0.5977, + "step": 69486 + }, + { + "epoch": 1.78, + "learning_rate": 7.479850291196583e-07, + "loss": 0.5146, + "step": 69487 + }, + { + "epoch": 1.78, + "learning_rate": 7.47958251872195e-07, + "loss": 0.7373, + "step": 69488 + }, + { + "epoch": 1.78, + "learning_rate": 7.479314748177082e-07, + "loss": 0.7178, + "step": 69489 + }, + { + "epoch": 1.78, + "learning_rate": 7.47904697956219e-07, + "loss": 0.6289, + "step": 69490 + }, + { + "epoch": 1.78, + "learning_rate": 7.478779212877473e-07, + "loss": 0.6567, + "step": 69491 + }, + { + "epoch": 1.78, + "learning_rate": 7.478511448123141e-07, + "loss": 0.5845, + "step": 69492 + }, + { + "epoch": 1.78, + "learning_rate": 7.478243685299394e-07, + "loss": 0.6282, + "step": 69493 + }, + { + "epoch": 1.78, + "learning_rate": 7.477975924406446e-07, + "loss": 0.7314, + "step": 69494 + }, + { + "epoch": 1.78, + "learning_rate": 7.477708165444491e-07, + "loss": 0.5942, + "step": 69495 + }, + { + "epoch": 1.78, + "learning_rate": 7.47744040841374e-07, + "loss": 0.6846, + "step": 69496 + }, + { + "epoch": 1.78, + "learning_rate": 7.477172653314397e-07, + "loss": 0.5874, + "step": 69497 + }, + { + "epoch": 1.78, + "learning_rate": 7.476904900146666e-07, + "loss": 0.7734, + "step": 69498 + }, + { + "epoch": 1.78, + "learning_rate": 7.476637148910754e-07, + "loss": 0.5942, + "step": 69499 + }, + { + "epoch": 1.78, + "learning_rate": 7.476369399606862e-07, + "loss": 0.6162, + "step": 69500 + }, + { + "epoch": 1.78, + "learning_rate": 7.4761016522352e-07, + "loss": 0.5073, + "step": 69501 + }, + { + "epoch": 1.78, + "learning_rate": 7.475833906795972e-07, + "loss": 0.6299, + "step": 69502 + }, + { + "epoch": 1.78, + "learning_rate": 7.475566163289381e-07, + "loss": 0.6255, + "step": 69503 + }, + { + "epoch": 1.78, + "learning_rate": 7.475298421715635e-07, + "loss": 0.5303, + "step": 69504 + }, + { + "epoch": 1.78, + "learning_rate": 7.475030682074937e-07, + "loss": 0.6074, + "step": 69505 + }, + { + "epoch": 1.78, + "learning_rate": 7.474762944367487e-07, + "loss": 0.7451, + "step": 69506 + }, + { + "epoch": 1.78, + "learning_rate": 7.474495208593499e-07, + "loss": 0.7568, + "step": 69507 + }, + { + "epoch": 1.78, + "learning_rate": 7.474227474753172e-07, + "loss": 0.6338, + "step": 69508 + }, + { + "epoch": 1.78, + "learning_rate": 7.473959742846714e-07, + "loss": 0.5903, + "step": 69509 + }, + { + "epoch": 1.78, + "learning_rate": 7.473692012874326e-07, + "loss": 0.7812, + "step": 69510 + }, + { + "epoch": 1.78, + "learning_rate": 7.47342428483622e-07, + "loss": 0.688, + "step": 69511 + }, + { + "epoch": 1.78, + "learning_rate": 7.473156558732594e-07, + "loss": 0.665, + "step": 69512 + }, + { + "epoch": 1.78, + "learning_rate": 7.472888834563657e-07, + "loss": 0.6572, + "step": 69513 + }, + { + "epoch": 1.78, + "learning_rate": 7.472621112329616e-07, + "loss": 0.7217, + "step": 69514 + }, + { + "epoch": 1.78, + "learning_rate": 7.472353392030668e-07, + "loss": 0.6289, + "step": 69515 + }, + { + "epoch": 1.78, + "learning_rate": 7.472085673667026e-07, + "loss": 0.6489, + "step": 69516 + }, + { + "epoch": 1.78, + "learning_rate": 7.471817957238888e-07, + "loss": 0.5703, + "step": 69517 + }, + { + "epoch": 1.78, + "learning_rate": 7.471550242746465e-07, + "loss": 0.6914, + "step": 69518 + }, + { + "epoch": 1.78, + "learning_rate": 7.471282530189959e-07, + "loss": 0.4622, + "step": 69519 + }, + { + "epoch": 1.78, + "learning_rate": 7.471014819569577e-07, + "loss": 0.6704, + "step": 69520 + }, + { + "epoch": 1.78, + "learning_rate": 7.470747110885523e-07, + "loss": 0.7432, + "step": 69521 + }, + { + "epoch": 1.78, + "learning_rate": 7.470479404137998e-07, + "loss": 0.624, + "step": 69522 + }, + { + "epoch": 1.78, + "learning_rate": 7.470211699327214e-07, + "loss": 0.4297, + "step": 69523 + }, + { + "epoch": 1.78, + "learning_rate": 7.469943996453375e-07, + "loss": 0.5068, + "step": 69524 + }, + { + "epoch": 1.78, + "learning_rate": 7.469676295516678e-07, + "loss": 0.6357, + "step": 69525 + }, + { + "epoch": 1.78, + "learning_rate": 7.469408596517337e-07, + "loss": 0.5137, + "step": 69526 + }, + { + "epoch": 1.78, + "learning_rate": 7.46914089945555e-07, + "loss": 0.7783, + "step": 69527 + }, + { + "epoch": 1.78, + "learning_rate": 7.468873204331529e-07, + "loss": 0.5311, + "step": 69528 + }, + { + "epoch": 1.78, + "learning_rate": 7.468605511145474e-07, + "loss": 0.6616, + "step": 69529 + }, + { + "epoch": 1.78, + "learning_rate": 7.468337819897592e-07, + "loss": 0.6855, + "step": 69530 + }, + { + "epoch": 1.78, + "learning_rate": 7.468070130588085e-07, + "loss": 0.6172, + "step": 69531 + }, + { + "epoch": 1.78, + "learning_rate": 7.467802443217162e-07, + "loss": 0.5469, + "step": 69532 + }, + { + "epoch": 1.78, + "learning_rate": 7.467534757785026e-07, + "loss": 0.5703, + "step": 69533 + }, + { + "epoch": 1.78, + "learning_rate": 7.467267074291885e-07, + "loss": 0.7061, + "step": 69534 + }, + { + "epoch": 1.78, + "learning_rate": 7.46699939273794e-07, + "loss": 0.7168, + "step": 69535 + }, + { + "epoch": 1.78, + "learning_rate": 7.466731713123393e-07, + "loss": 0.7568, + "step": 69536 + }, + { + "epoch": 1.78, + "learning_rate": 7.466464035448457e-07, + "loss": 0.7749, + "step": 69537 + }, + { + "epoch": 1.78, + "learning_rate": 7.466196359713333e-07, + "loss": 0.7041, + "step": 69538 + }, + { + "epoch": 1.78, + "learning_rate": 7.465928685918224e-07, + "loss": 0.623, + "step": 69539 + }, + { + "epoch": 1.78, + "learning_rate": 7.465661014063338e-07, + "loss": 0.373, + "step": 69540 + }, + { + "epoch": 1.78, + "learning_rate": 7.465393344148876e-07, + "loss": 0.6738, + "step": 69541 + }, + { + "epoch": 1.78, + "learning_rate": 7.46512567617505e-07, + "loss": 0.7031, + "step": 69542 + }, + { + "epoch": 1.78, + "learning_rate": 7.464858010142056e-07, + "loss": 0.666, + "step": 69543 + }, + { + "epoch": 1.78, + "learning_rate": 7.46459034605011e-07, + "loss": 0.6445, + "step": 69544 + }, + { + "epoch": 1.78, + "learning_rate": 7.464322683899408e-07, + "loss": 0.4788, + "step": 69545 + }, + { + "epoch": 1.78, + "learning_rate": 7.464055023690155e-07, + "loss": 0.6016, + "step": 69546 + }, + { + "epoch": 1.78, + "learning_rate": 7.463787365422562e-07, + "loss": 0.7979, + "step": 69547 + }, + { + "epoch": 1.78, + "learning_rate": 7.463519709096826e-07, + "loss": 0.6431, + "step": 69548 + }, + { + "epoch": 1.78, + "learning_rate": 7.46325205471316e-07, + "loss": 0.751, + "step": 69549 + }, + { + "epoch": 1.78, + "learning_rate": 7.462984402271764e-07, + "loss": 0.6064, + "step": 69550 + }, + { + "epoch": 1.78, + "learning_rate": 7.462716751772844e-07, + "loss": 0.405, + "step": 69551 + }, + { + "epoch": 1.78, + "learning_rate": 7.462449103216604e-07, + "loss": 0.688, + "step": 69552 + }, + { + "epoch": 1.78, + "learning_rate": 7.462181456603253e-07, + "loss": 0.7593, + "step": 69553 + }, + { + "epoch": 1.78, + "learning_rate": 7.461913811932994e-07, + "loss": 0.7271, + "step": 69554 + }, + { + "epoch": 1.78, + "learning_rate": 7.461646169206029e-07, + "loss": 0.625, + "step": 69555 + }, + { + "epoch": 1.78, + "learning_rate": 7.461378528422562e-07, + "loss": 0.5596, + "step": 69556 + }, + { + "epoch": 1.78, + "learning_rate": 7.461110889582805e-07, + "loss": 0.7065, + "step": 69557 + }, + { + "epoch": 1.78, + "learning_rate": 7.460843252686955e-07, + "loss": 0.6504, + "step": 69558 + }, + { + "epoch": 1.78, + "learning_rate": 7.460575617735223e-07, + "loss": 0.666, + "step": 69559 + }, + { + "epoch": 1.78, + "learning_rate": 7.460307984727809e-07, + "loss": 0.6782, + "step": 69560 + }, + { + "epoch": 1.78, + "learning_rate": 7.460040353664923e-07, + "loss": 0.3838, + "step": 69561 + }, + { + "epoch": 1.78, + "learning_rate": 7.459772724546765e-07, + "loss": 0.5693, + "step": 69562 + }, + { + "epoch": 1.78, + "learning_rate": 7.459505097373544e-07, + "loss": 0.5801, + "step": 69563 + }, + { + "epoch": 1.78, + "learning_rate": 7.459237472145465e-07, + "loss": 0.7021, + "step": 69564 + }, + { + "epoch": 1.78, + "learning_rate": 7.458969848862727e-07, + "loss": 0.6836, + "step": 69565 + }, + { + "epoch": 1.78, + "learning_rate": 7.458702227525542e-07, + "loss": 0.75, + "step": 69566 + }, + { + "epoch": 1.78, + "learning_rate": 7.458434608134108e-07, + "loss": 0.6738, + "step": 69567 + }, + { + "epoch": 1.78, + "learning_rate": 7.458166990688638e-07, + "loss": 0.8369, + "step": 69568 + }, + { + "epoch": 1.78, + "learning_rate": 7.45789937518933e-07, + "loss": 0.5017, + "step": 69569 + }, + { + "epoch": 1.78, + "learning_rate": 7.457631761636393e-07, + "loss": 0.6016, + "step": 69570 + }, + { + "epoch": 1.78, + "learning_rate": 7.457364150030028e-07, + "loss": 0.6631, + "step": 69571 + }, + { + "epoch": 1.78, + "learning_rate": 7.457096540370444e-07, + "loss": 0.532, + "step": 69572 + }, + { + "epoch": 1.78, + "learning_rate": 7.456828932657843e-07, + "loss": 0.6631, + "step": 69573 + }, + { + "epoch": 1.78, + "learning_rate": 7.456561326892439e-07, + "loss": 0.6565, + "step": 69574 + }, + { + "epoch": 1.78, + "learning_rate": 7.456293723074421e-07, + "loss": 0.6689, + "step": 69575 + }, + { + "epoch": 1.78, + "learning_rate": 7.456026121204004e-07, + "loss": 0.6763, + "step": 69576 + }, + { + "epoch": 1.78, + "learning_rate": 7.45575852128139e-07, + "loss": 0.6807, + "step": 69577 + }, + { + "epoch": 1.78, + "learning_rate": 7.455490923306787e-07, + "loss": 0.6904, + "step": 69578 + }, + { + "epoch": 1.78, + "learning_rate": 7.455223327280393e-07, + "loss": 0.7334, + "step": 69579 + }, + { + "epoch": 1.78, + "learning_rate": 7.454955733202421e-07, + "loss": 0.7266, + "step": 69580 + }, + { + "epoch": 1.78, + "learning_rate": 7.454688141073071e-07, + "loss": 0.6743, + "step": 69581 + }, + { + "epoch": 1.78, + "learning_rate": 7.45442055089255e-07, + "loss": 0.6528, + "step": 69582 + }, + { + "epoch": 1.78, + "learning_rate": 7.45415296266106e-07, + "loss": 0.7168, + "step": 69583 + }, + { + "epoch": 1.78, + "learning_rate": 7.453885376378815e-07, + "loss": 0.6025, + "step": 69584 + }, + { + "epoch": 1.78, + "learning_rate": 7.453617792046007e-07, + "loss": 0.6133, + "step": 69585 + }, + { + "epoch": 1.78, + "learning_rate": 7.453350209662848e-07, + "loss": 0.6943, + "step": 69586 + }, + { + "epoch": 1.78, + "learning_rate": 7.453082629229541e-07, + "loss": 0.6553, + "step": 69587 + }, + { + "epoch": 1.78, + "learning_rate": 7.45281505074629e-07, + "loss": 0.5625, + "step": 69588 + }, + { + "epoch": 1.78, + "learning_rate": 7.452547474213304e-07, + "loss": 0.6533, + "step": 69589 + }, + { + "epoch": 1.78, + "learning_rate": 7.452279899630783e-07, + "loss": 0.7109, + "step": 69590 + }, + { + "epoch": 1.78, + "learning_rate": 7.452012326998938e-07, + "loss": 0.5679, + "step": 69591 + }, + { + "epoch": 1.78, + "learning_rate": 7.451744756317966e-07, + "loss": 0.7852, + "step": 69592 + }, + { + "epoch": 1.78, + "learning_rate": 7.451477187588077e-07, + "loss": 0.4087, + "step": 69593 + }, + { + "epoch": 1.78, + "learning_rate": 7.451209620809479e-07, + "loss": 0.6182, + "step": 69594 + }, + { + "epoch": 1.78, + "learning_rate": 7.450942055982369e-07, + "loss": 0.7578, + "step": 69595 + }, + { + "epoch": 1.78, + "learning_rate": 7.450674493106954e-07, + "loss": 0.5991, + "step": 69596 + }, + { + "epoch": 1.78, + "learning_rate": 7.450406932183443e-07, + "loss": 0.5474, + "step": 69597 + }, + { + "epoch": 1.78, + "learning_rate": 7.450139373212035e-07, + "loss": 0.6567, + "step": 69598 + }, + { + "epoch": 1.78, + "learning_rate": 7.449871816192941e-07, + "loss": 0.6865, + "step": 69599 + }, + { + "epoch": 1.78, + "learning_rate": 7.449604261126361e-07, + "loss": 0.5366, + "step": 69600 + }, + { + "epoch": 1.78, + "learning_rate": 7.449336708012503e-07, + "loss": 0.6421, + "step": 69601 + }, + { + "epoch": 1.78, + "learning_rate": 7.449069156851568e-07, + "loss": 0.6375, + "step": 69602 + }, + { + "epoch": 1.78, + "learning_rate": 7.448801607643767e-07, + "loss": 0.7256, + "step": 69603 + }, + { + "epoch": 1.78, + "learning_rate": 7.448534060389302e-07, + "loss": 0.6162, + "step": 69604 + }, + { + "epoch": 1.78, + "learning_rate": 7.448266515088374e-07, + "loss": 0.6401, + "step": 69605 + }, + { + "epoch": 1.78, + "learning_rate": 7.447998971741193e-07, + "loss": 0.6836, + "step": 69606 + }, + { + "epoch": 1.78, + "learning_rate": 7.447731430347958e-07, + "loss": 0.6758, + "step": 69607 + }, + { + "epoch": 1.78, + "learning_rate": 7.447463890908883e-07, + "loss": 0.8271, + "step": 69608 + }, + { + "epoch": 1.78, + "learning_rate": 7.447196353424164e-07, + "loss": 0.6045, + "step": 69609 + }, + { + "epoch": 1.78, + "learning_rate": 7.446928817894011e-07, + "loss": 0.5291, + "step": 69610 + }, + { + "epoch": 1.78, + "learning_rate": 7.446661284318627e-07, + "loss": 0.4719, + "step": 69611 + }, + { + "epoch": 1.78, + "learning_rate": 7.446393752698214e-07, + "loss": 0.7036, + "step": 69612 + }, + { + "epoch": 1.78, + "learning_rate": 7.446126223032984e-07, + "loss": 0.6279, + "step": 69613 + }, + { + "epoch": 1.78, + "learning_rate": 7.44585869532314e-07, + "loss": 0.8853, + "step": 69614 + }, + { + "epoch": 1.78, + "learning_rate": 7.445591169568879e-07, + "loss": 0.5464, + "step": 69615 + }, + { + "epoch": 1.78, + "learning_rate": 7.445323645770414e-07, + "loss": 0.5088, + "step": 69616 + }, + { + "epoch": 1.78, + "learning_rate": 7.445056123927945e-07, + "loss": 0.5398, + "step": 69617 + }, + { + "epoch": 1.78, + "learning_rate": 7.444788604041681e-07, + "loss": 0.5713, + "step": 69618 + }, + { + "epoch": 1.78, + "learning_rate": 7.444521086111824e-07, + "loss": 0.6182, + "step": 69619 + }, + { + "epoch": 1.78, + "learning_rate": 7.44425357013858e-07, + "loss": 0.4998, + "step": 69620 + }, + { + "epoch": 1.78, + "learning_rate": 7.443986056122152e-07, + "loss": 0.4751, + "step": 69621 + }, + { + "epoch": 1.78, + "learning_rate": 7.443718544062749e-07, + "loss": 0.3971, + "step": 69622 + }, + { + "epoch": 1.78, + "learning_rate": 7.443451033960571e-07, + "loss": 0.6816, + "step": 69623 + }, + { + "epoch": 1.78, + "learning_rate": 7.443183525815829e-07, + "loss": 0.709, + "step": 69624 + }, + { + "epoch": 1.78, + "learning_rate": 7.442916019628723e-07, + "loss": 0.5659, + "step": 69625 + }, + { + "epoch": 1.78, + "learning_rate": 7.442648515399455e-07, + "loss": 0.7266, + "step": 69626 + }, + { + "epoch": 1.78, + "learning_rate": 7.442381013128234e-07, + "loss": 0.3699, + "step": 69627 + }, + { + "epoch": 1.78, + "learning_rate": 7.442113512815266e-07, + "loss": 0.532, + "step": 69628 + }, + { + "epoch": 1.78, + "learning_rate": 7.441846014460753e-07, + "loss": 0.7358, + "step": 69629 + }, + { + "epoch": 1.78, + "learning_rate": 7.441578518064901e-07, + "loss": 0.7266, + "step": 69630 + }, + { + "epoch": 1.78, + "learning_rate": 7.441311023627915e-07, + "loss": 0.7061, + "step": 69631 + }, + { + "epoch": 1.78, + "learning_rate": 7.44104353115e-07, + "loss": 0.5933, + "step": 69632 + }, + { + "epoch": 1.78, + "learning_rate": 7.440776040631358e-07, + "loss": 0.709, + "step": 69633 + }, + { + "epoch": 1.78, + "learning_rate": 7.4405085520722e-07, + "loss": 0.5674, + "step": 69634 + }, + { + "epoch": 1.78, + "learning_rate": 7.440241065472725e-07, + "loss": 0.5835, + "step": 69635 + }, + { + "epoch": 1.78, + "learning_rate": 7.439973580833139e-07, + "loss": 0.667, + "step": 69636 + }, + { + "epoch": 1.78, + "learning_rate": 7.439706098153648e-07, + "loss": 0.7607, + "step": 69637 + }, + { + "epoch": 1.78, + "learning_rate": 7.439438617434454e-07, + "loss": 0.478, + "step": 69638 + }, + { + "epoch": 1.78, + "learning_rate": 7.439171138675768e-07, + "loss": 0.6069, + "step": 69639 + }, + { + "epoch": 1.78, + "learning_rate": 7.438903661877788e-07, + "loss": 0.6113, + "step": 69640 + }, + { + "epoch": 1.78, + "learning_rate": 7.438636187040724e-07, + "loss": 0.5547, + "step": 69641 + }, + { + "epoch": 1.78, + "learning_rate": 7.438368714164775e-07, + "loss": 0.7256, + "step": 69642 + }, + { + "epoch": 1.78, + "learning_rate": 7.438101243250153e-07, + "loss": 0.5911, + "step": 69643 + }, + { + "epoch": 1.79, + "learning_rate": 7.437833774297061e-07, + "loss": 0.5815, + "step": 69644 + }, + { + "epoch": 1.79, + "learning_rate": 7.4375663073057e-07, + "loss": 0.4531, + "step": 69645 + }, + { + "epoch": 1.79, + "learning_rate": 7.437298842276274e-07, + "loss": 0.7778, + "step": 69646 + }, + { + "epoch": 1.79, + "learning_rate": 7.437031379208992e-07, + "loss": 0.7021, + "step": 69647 + }, + { + "epoch": 1.79, + "learning_rate": 7.436763918104056e-07, + "loss": 0.6475, + "step": 69648 + }, + { + "epoch": 1.79, + "learning_rate": 7.436496458961674e-07, + "loss": 0.6621, + "step": 69649 + }, + { + "epoch": 1.79, + "learning_rate": 7.436229001782046e-07, + "loss": 0.5505, + "step": 69650 + }, + { + "epoch": 1.79, + "learning_rate": 7.435961546565383e-07, + "loss": 0.6938, + "step": 69651 + }, + { + "epoch": 1.79, + "learning_rate": 7.435694093311882e-07, + "loss": 0.6333, + "step": 69652 + }, + { + "epoch": 1.79, + "learning_rate": 7.435426642021756e-07, + "loss": 0.7217, + "step": 69653 + }, + { + "epoch": 1.79, + "learning_rate": 7.435159192695208e-07, + "loss": 0.5347, + "step": 69654 + }, + { + "epoch": 1.79, + "learning_rate": 7.434891745332436e-07, + "loss": 0.8574, + "step": 69655 + }, + { + "epoch": 1.79, + "learning_rate": 7.434624299933651e-07, + "loss": 0.7578, + "step": 69656 + }, + { + "epoch": 1.79, + "learning_rate": 7.434356856499055e-07, + "loss": 0.6455, + "step": 69657 + }, + { + "epoch": 1.79, + "learning_rate": 7.434089415028857e-07, + "loss": 0.7109, + "step": 69658 + }, + { + "epoch": 1.79, + "learning_rate": 7.433821975523255e-07, + "loss": 0.6514, + "step": 69659 + }, + { + "epoch": 1.79, + "learning_rate": 7.43355453798246e-07, + "loss": 0.5278, + "step": 69660 + }, + { + "epoch": 1.79, + "learning_rate": 7.433287102406672e-07, + "loss": 0.5117, + "step": 69661 + }, + { + "epoch": 1.79, + "learning_rate": 7.433019668796101e-07, + "loss": 0.8408, + "step": 69662 + }, + { + "epoch": 1.79, + "learning_rate": 7.432752237150945e-07, + "loss": 0.6821, + "step": 69663 + }, + { + "epoch": 1.79, + "learning_rate": 7.432484807471421e-07, + "loss": 0.7324, + "step": 69664 + }, + { + "epoch": 1.79, + "learning_rate": 7.432217379757717e-07, + "loss": 0.5972, + "step": 69665 + }, + { + "epoch": 1.79, + "learning_rate": 7.431949954010051e-07, + "loss": 0.5532, + "step": 69666 + }, + { + "epoch": 1.79, + "learning_rate": 7.431682530228618e-07, + "loss": 0.7715, + "step": 69667 + }, + { + "epoch": 1.79, + "learning_rate": 7.43141510841363e-07, + "loss": 0.7295, + "step": 69668 + }, + { + "epoch": 1.79, + "learning_rate": 7.431147688565288e-07, + "loss": 0.8525, + "step": 69669 + }, + { + "epoch": 1.79, + "learning_rate": 7.4308802706838e-07, + "loss": 0.71, + "step": 69670 + }, + { + "epoch": 1.79, + "learning_rate": 7.430612854769367e-07, + "loss": 0.7744, + "step": 69671 + }, + { + "epoch": 1.79, + "learning_rate": 7.430345440822198e-07, + "loss": 0.7031, + "step": 69672 + }, + { + "epoch": 1.79, + "learning_rate": 7.430078028842492e-07, + "loss": 0.5488, + "step": 69673 + }, + { + "epoch": 1.79, + "learning_rate": 7.429810618830462e-07, + "loss": 0.5269, + "step": 69674 + }, + { + "epoch": 1.79, + "learning_rate": 7.429543210786306e-07, + "loss": 0.5859, + "step": 69675 + }, + { + "epoch": 1.79, + "learning_rate": 7.429275804710229e-07, + "loss": 0.6079, + "step": 69676 + }, + { + "epoch": 1.79, + "learning_rate": 7.429008400602438e-07, + "loss": 0.5975, + "step": 69677 + }, + { + "epoch": 1.79, + "learning_rate": 7.428740998463136e-07, + "loss": 0.6494, + "step": 69678 + }, + { + "epoch": 1.79, + "learning_rate": 7.42847359829253e-07, + "loss": 0.5933, + "step": 69679 + }, + { + "epoch": 1.79, + "learning_rate": 7.428206200090822e-07, + "loss": 0.6082, + "step": 69680 + }, + { + "epoch": 1.79, + "learning_rate": 7.427938803858221e-07, + "loss": 0.4421, + "step": 69681 + }, + { + "epoch": 1.79, + "learning_rate": 7.427671409594926e-07, + "loss": 0.665, + "step": 69682 + }, + { + "epoch": 1.79, + "learning_rate": 7.427404017301147e-07, + "loss": 0.6885, + "step": 69683 + }, + { + "epoch": 1.79, + "learning_rate": 7.427136626977089e-07, + "loss": 0.6162, + "step": 69684 + }, + { + "epoch": 1.79, + "learning_rate": 7.42686923862295e-07, + "loss": 0.7178, + "step": 69685 + }, + { + "epoch": 1.79, + "learning_rate": 7.426601852238939e-07, + "loss": 0.5908, + "step": 69686 + }, + { + "epoch": 1.79, + "learning_rate": 7.426334467825262e-07, + "loss": 0.6631, + "step": 69687 + }, + { + "epoch": 1.79, + "learning_rate": 7.42606708538212e-07, + "loss": 0.6426, + "step": 69688 + }, + { + "epoch": 1.79, + "learning_rate": 7.425799704909723e-07, + "loss": 0.4897, + "step": 69689 + }, + { + "epoch": 1.79, + "learning_rate": 7.425532326408271e-07, + "loss": 0.8359, + "step": 69690 + }, + { + "epoch": 1.79, + "learning_rate": 7.425264949877972e-07, + "loss": 0.7012, + "step": 69691 + }, + { + "epoch": 1.79, + "learning_rate": 7.424997575319027e-07, + "loss": 0.6172, + "step": 69692 + }, + { + "epoch": 1.79, + "learning_rate": 7.424730202731644e-07, + "loss": 0.7188, + "step": 69693 + }, + { + "epoch": 1.79, + "learning_rate": 7.42446283211603e-07, + "loss": 0.7666, + "step": 69694 + }, + { + "epoch": 1.79, + "learning_rate": 7.424195463472382e-07, + "loss": 0.5156, + "step": 69695 + }, + { + "epoch": 1.79, + "learning_rate": 7.423928096800911e-07, + "loss": 0.7158, + "step": 69696 + }, + { + "epoch": 1.79, + "learning_rate": 7.423660732101818e-07, + "loss": 0.7012, + "step": 69697 + }, + { + "epoch": 1.79, + "learning_rate": 7.423393369375313e-07, + "loss": 0.6162, + "step": 69698 + }, + { + "epoch": 1.79, + "learning_rate": 7.423126008621593e-07, + "loss": 0.7588, + "step": 69699 + }, + { + "epoch": 1.79, + "learning_rate": 7.422858649840869e-07, + "loss": 0.5928, + "step": 69700 + }, + { + "epoch": 1.79, + "learning_rate": 7.422591293033344e-07, + "loss": 0.5461, + "step": 69701 + }, + { + "epoch": 1.79, + "learning_rate": 7.422323938199222e-07, + "loss": 0.79, + "step": 69702 + }, + { + "epoch": 1.79, + "learning_rate": 7.422056585338708e-07, + "loss": 0.6067, + "step": 69703 + }, + { + "epoch": 1.79, + "learning_rate": 7.42178923445201e-07, + "loss": 0.4937, + "step": 69704 + }, + { + "epoch": 1.79, + "learning_rate": 7.421521885539325e-07, + "loss": 0.54, + "step": 69705 + }, + { + "epoch": 1.79, + "learning_rate": 7.421254538600864e-07, + "loss": 0.7275, + "step": 69706 + }, + { + "epoch": 1.79, + "learning_rate": 7.420987193636828e-07, + "loss": 0.6592, + "step": 69707 + }, + { + "epoch": 1.79, + "learning_rate": 7.420719850647425e-07, + "loss": 0.7002, + "step": 69708 + }, + { + "epoch": 1.79, + "learning_rate": 7.420452509632857e-07, + "loss": 0.4304, + "step": 69709 + }, + { + "epoch": 1.79, + "learning_rate": 7.420185170593332e-07, + "loss": 0.7007, + "step": 69710 + }, + { + "epoch": 1.79, + "learning_rate": 7.419917833529049e-07, + "loss": 0.7266, + "step": 69711 + }, + { + "epoch": 1.79, + "learning_rate": 7.41965049844022e-07, + "loss": 0.5181, + "step": 69712 + }, + { + "epoch": 1.79, + "learning_rate": 7.419383165327042e-07, + "loss": 0.5452, + "step": 69713 + }, + { + "epoch": 1.79, + "learning_rate": 7.41911583418973e-07, + "loss": 0.4404, + "step": 69714 + }, + { + "epoch": 1.79, + "learning_rate": 7.418848505028479e-07, + "loss": 0.5908, + "step": 69715 + }, + { + "epoch": 1.79, + "learning_rate": 7.418581177843495e-07, + "loss": 0.6367, + "step": 69716 + }, + { + "epoch": 1.79, + "learning_rate": 7.418313852634988e-07, + "loss": 0.6533, + "step": 69717 + }, + { + "epoch": 1.79, + "learning_rate": 7.418046529403157e-07, + "loss": 0.8564, + "step": 69718 + }, + { + "epoch": 1.79, + "learning_rate": 7.417779208148209e-07, + "loss": 0.6802, + "step": 69719 + }, + { + "epoch": 1.79, + "learning_rate": 7.41751188887035e-07, + "loss": 0.6504, + "step": 69720 + }, + { + "epoch": 1.79, + "learning_rate": 7.417244571569781e-07, + "loss": 0.6553, + "step": 69721 + }, + { + "epoch": 1.79, + "learning_rate": 7.416977256246713e-07, + "loss": 0.6978, + "step": 69722 + }, + { + "epoch": 1.79, + "learning_rate": 7.416709942901343e-07, + "loss": 0.5967, + "step": 69723 + }, + { + "epoch": 1.79, + "learning_rate": 7.416442631533883e-07, + "loss": 0.6729, + "step": 69724 + }, + { + "epoch": 1.79, + "learning_rate": 7.416175322144534e-07, + "loss": 0.5386, + "step": 69725 + }, + { + "epoch": 1.79, + "learning_rate": 7.415908014733497e-07, + "loss": 0.6494, + "step": 69726 + }, + { + "epoch": 1.79, + "learning_rate": 7.415640709300983e-07, + "loss": 0.6289, + "step": 69727 + }, + { + "epoch": 1.79, + "learning_rate": 7.415373405847192e-07, + "loss": 0.5381, + "step": 69728 + }, + { + "epoch": 1.79, + "learning_rate": 7.415106104372333e-07, + "loss": 0.689, + "step": 69729 + }, + { + "epoch": 1.79, + "learning_rate": 7.414838804876607e-07, + "loss": 0.6255, + "step": 69730 + }, + { + "epoch": 1.79, + "learning_rate": 7.41457150736022e-07, + "loss": 0.7168, + "step": 69731 + }, + { + "epoch": 1.79, + "learning_rate": 7.414304211823376e-07, + "loss": 0.6895, + "step": 69732 + }, + { + "epoch": 1.79, + "learning_rate": 7.414036918266282e-07, + "loss": 0.6426, + "step": 69733 + }, + { + "epoch": 1.79, + "learning_rate": 7.413769626689144e-07, + "loss": 0.7695, + "step": 69734 + }, + { + "epoch": 1.79, + "learning_rate": 7.413502337092161e-07, + "loss": 0.6396, + "step": 69735 + }, + { + "epoch": 1.79, + "learning_rate": 7.413235049475539e-07, + "loss": 0.7314, + "step": 69736 + }, + { + "epoch": 1.79, + "learning_rate": 7.412967763839484e-07, + "loss": 0.5522, + "step": 69737 + }, + { + "epoch": 1.79, + "learning_rate": 7.412700480184201e-07, + "loss": 0.6172, + "step": 69738 + }, + { + "epoch": 1.79, + "learning_rate": 7.412433198509896e-07, + "loss": 0.7891, + "step": 69739 + }, + { + "epoch": 1.79, + "learning_rate": 7.412165918816768e-07, + "loss": 0.7207, + "step": 69740 + }, + { + "epoch": 1.79, + "learning_rate": 7.41189864110503e-07, + "loss": 0.5327, + "step": 69741 + }, + { + "epoch": 1.79, + "learning_rate": 7.411631365374877e-07, + "loss": 0.552, + "step": 69742 + }, + { + "epoch": 1.79, + "learning_rate": 7.411364091626526e-07, + "loss": 0.8086, + "step": 69743 + }, + { + "epoch": 1.79, + "learning_rate": 7.411096819860172e-07, + "loss": 0.493, + "step": 69744 + }, + { + "epoch": 1.79, + "learning_rate": 7.410829550076019e-07, + "loss": 0.5551, + "step": 69745 + }, + { + "epoch": 1.79, + "learning_rate": 7.410562282274277e-07, + "loss": 0.7891, + "step": 69746 + }, + { + "epoch": 1.79, + "learning_rate": 7.410295016455145e-07, + "loss": 0.561, + "step": 69747 + }, + { + "epoch": 1.79, + "learning_rate": 7.410027752618837e-07, + "loss": 0.5801, + "step": 69748 + }, + { + "epoch": 1.79, + "learning_rate": 7.409760490765546e-07, + "loss": 0.6592, + "step": 69749 + }, + { + "epoch": 1.79, + "learning_rate": 7.409493230895486e-07, + "loss": 0.5654, + "step": 69750 + }, + { + "epoch": 1.79, + "learning_rate": 7.409225973008855e-07, + "loss": 0.7432, + "step": 69751 + }, + { + "epoch": 1.79, + "learning_rate": 7.408958717105864e-07, + "loss": 0.4244, + "step": 69752 + }, + { + "epoch": 1.79, + "learning_rate": 7.408691463186714e-07, + "loss": 0.6069, + "step": 69753 + }, + { + "epoch": 1.79, + "learning_rate": 7.40842421125161e-07, + "loss": 0.4849, + "step": 69754 + }, + { + "epoch": 1.79, + "learning_rate": 7.408156961300753e-07, + "loss": 0.4719, + "step": 69755 + }, + { + "epoch": 1.79, + "learning_rate": 7.407889713334355e-07, + "loss": 0.5176, + "step": 69756 + }, + { + "epoch": 1.79, + "learning_rate": 7.407622467352613e-07, + "loss": 0.4352, + "step": 69757 + }, + { + "epoch": 1.79, + "learning_rate": 7.407355223355736e-07, + "loss": 0.7598, + "step": 69758 + }, + { + "epoch": 1.79, + "learning_rate": 7.407087981343927e-07, + "loss": 0.6421, + "step": 69759 + }, + { + "epoch": 1.79, + "learning_rate": 7.406820741317394e-07, + "loss": 0.7598, + "step": 69760 + }, + { + "epoch": 1.79, + "learning_rate": 7.406553503276337e-07, + "loss": 0.75, + "step": 69761 + }, + { + "epoch": 1.79, + "learning_rate": 7.406286267220965e-07, + "loss": 0.6899, + "step": 69762 + }, + { + "epoch": 1.79, + "learning_rate": 7.406019033151483e-07, + "loss": 0.6191, + "step": 69763 + }, + { + "epoch": 1.79, + "learning_rate": 7.405751801068088e-07, + "loss": 0.4777, + "step": 69764 + }, + { + "epoch": 1.79, + "learning_rate": 7.40548457097099e-07, + "loss": 0.5122, + "step": 69765 + }, + { + "epoch": 1.79, + "learning_rate": 7.405217342860392e-07, + "loss": 0.6494, + "step": 69766 + }, + { + "epoch": 1.79, + "learning_rate": 7.404950116736503e-07, + "loss": 0.5342, + "step": 69767 + }, + { + "epoch": 1.79, + "learning_rate": 7.404682892599523e-07, + "loss": 0.644, + "step": 69768 + }, + { + "epoch": 1.79, + "learning_rate": 7.404415670449657e-07, + "loss": 0.5957, + "step": 69769 + }, + { + "epoch": 1.79, + "learning_rate": 7.404148450287111e-07, + "loss": 0.6006, + "step": 69770 + }, + { + "epoch": 1.79, + "learning_rate": 7.40388123211209e-07, + "loss": 0.7017, + "step": 69771 + }, + { + "epoch": 1.79, + "learning_rate": 7.403614015924797e-07, + "loss": 0.3773, + "step": 69772 + }, + { + "epoch": 1.79, + "learning_rate": 7.403346801725443e-07, + "loss": 0.8125, + "step": 69773 + }, + { + "epoch": 1.79, + "learning_rate": 7.40307958951422e-07, + "loss": 0.4778, + "step": 69774 + }, + { + "epoch": 1.79, + "learning_rate": 7.402812379291343e-07, + "loss": 0.6162, + "step": 69775 + }, + { + "epoch": 1.79, + "learning_rate": 7.40254517105701e-07, + "loss": 0.4275, + "step": 69776 + }, + { + "epoch": 1.79, + "learning_rate": 7.40227796481143e-07, + "loss": 0.6631, + "step": 69777 + }, + { + "epoch": 1.79, + "learning_rate": 7.402010760554807e-07, + "loss": 0.708, + "step": 69778 + }, + { + "epoch": 1.79, + "learning_rate": 7.401743558287345e-07, + "loss": 0.4824, + "step": 69779 + }, + { + "epoch": 1.79, + "learning_rate": 7.401476358009246e-07, + "loss": 0.5769, + "step": 69780 + }, + { + "epoch": 1.79, + "learning_rate": 7.40120915972072e-07, + "loss": 0.561, + "step": 69781 + }, + { + "epoch": 1.79, + "learning_rate": 7.400941963421967e-07, + "loss": 0.5656, + "step": 69782 + }, + { + "epoch": 1.79, + "learning_rate": 7.400674769113197e-07, + "loss": 0.4346, + "step": 69783 + }, + { + "epoch": 1.79, + "learning_rate": 7.400407576794608e-07, + "loss": 0.4524, + "step": 69784 + }, + { + "epoch": 1.79, + "learning_rate": 7.400140386466406e-07, + "loss": 0.7256, + "step": 69785 + }, + { + "epoch": 1.79, + "learning_rate": 7.399873198128799e-07, + "loss": 0.6191, + "step": 69786 + }, + { + "epoch": 1.79, + "learning_rate": 7.399606011781987e-07, + "loss": 0.5381, + "step": 69787 + }, + { + "epoch": 1.79, + "learning_rate": 7.399338827426179e-07, + "loss": 0.7261, + "step": 69788 + }, + { + "epoch": 1.79, + "learning_rate": 7.399071645061576e-07, + "loss": 0.8467, + "step": 69789 + }, + { + "epoch": 1.79, + "learning_rate": 7.398804464688387e-07, + "loss": 0.3276, + "step": 69790 + }, + { + "epoch": 1.79, + "learning_rate": 7.398537286306814e-07, + "loss": 0.7275, + "step": 69791 + }, + { + "epoch": 1.79, + "learning_rate": 7.398270109917058e-07, + "loss": 0.6235, + "step": 69792 + }, + { + "epoch": 1.79, + "learning_rate": 7.398002935519332e-07, + "loss": 0.6582, + "step": 69793 + }, + { + "epoch": 1.79, + "learning_rate": 7.397735763113832e-07, + "loss": 0.6602, + "step": 69794 + }, + { + "epoch": 1.79, + "learning_rate": 7.397468592700766e-07, + "loss": 0.6973, + "step": 69795 + }, + { + "epoch": 1.79, + "learning_rate": 7.397201424280339e-07, + "loss": 0.7295, + "step": 69796 + }, + { + "epoch": 1.79, + "learning_rate": 7.396934257852754e-07, + "loss": 0.6426, + "step": 69797 + }, + { + "epoch": 1.79, + "learning_rate": 7.396667093418219e-07, + "loss": 0.6855, + "step": 69798 + }, + { + "epoch": 1.79, + "learning_rate": 7.396399930976934e-07, + "loss": 0.7256, + "step": 69799 + }, + { + "epoch": 1.79, + "learning_rate": 7.396132770529107e-07, + "loss": 0.6265, + "step": 69800 + }, + { + "epoch": 1.79, + "learning_rate": 7.395865612074941e-07, + "loss": 0.6938, + "step": 69801 + }, + { + "epoch": 1.79, + "learning_rate": 7.395598455614643e-07, + "loss": 0.7441, + "step": 69802 + }, + { + "epoch": 1.79, + "learning_rate": 7.395331301148417e-07, + "loss": 0.8184, + "step": 69803 + }, + { + "epoch": 1.79, + "learning_rate": 7.395064148676461e-07, + "loss": 0.6021, + "step": 69804 + }, + { + "epoch": 1.79, + "learning_rate": 7.394796998198988e-07, + "loss": 0.6758, + "step": 69805 + }, + { + "epoch": 1.79, + "learning_rate": 7.394529849716195e-07, + "loss": 0.8242, + "step": 69806 + }, + { + "epoch": 1.79, + "learning_rate": 7.394262703228295e-07, + "loss": 0.4727, + "step": 69807 + }, + { + "epoch": 1.79, + "learning_rate": 7.393995558735488e-07, + "loss": 0.4482, + "step": 69808 + }, + { + "epoch": 1.79, + "learning_rate": 7.393728416237976e-07, + "loss": 0.6069, + "step": 69809 + }, + { + "epoch": 1.79, + "learning_rate": 7.393461275735968e-07, + "loss": 0.7393, + "step": 69810 + }, + { + "epoch": 1.79, + "learning_rate": 7.393194137229666e-07, + "loss": 0.6709, + "step": 69811 + }, + { + "epoch": 1.79, + "learning_rate": 7.392927000719277e-07, + "loss": 0.5752, + "step": 69812 + }, + { + "epoch": 1.79, + "learning_rate": 7.392659866205006e-07, + "loss": 0.7627, + "step": 69813 + }, + { + "epoch": 1.79, + "learning_rate": 7.392392733687051e-07, + "loss": 0.5415, + "step": 69814 + }, + { + "epoch": 1.79, + "learning_rate": 7.392125603165622e-07, + "loss": 0.6152, + "step": 69815 + }, + { + "epoch": 1.79, + "learning_rate": 7.391858474640922e-07, + "loss": 0.6484, + "step": 69816 + }, + { + "epoch": 1.79, + "learning_rate": 7.391591348113157e-07, + "loss": 0.4443, + "step": 69817 + }, + { + "epoch": 1.79, + "learning_rate": 7.39132422358253e-07, + "loss": 0.667, + "step": 69818 + }, + { + "epoch": 1.79, + "learning_rate": 7.391057101049247e-07, + "loss": 0.561, + "step": 69819 + }, + { + "epoch": 1.79, + "learning_rate": 7.390789980513509e-07, + "loss": 0.7451, + "step": 69820 + }, + { + "epoch": 1.79, + "learning_rate": 7.390522861975527e-07, + "loss": 0.6553, + "step": 69821 + }, + { + "epoch": 1.79, + "learning_rate": 7.390255745435499e-07, + "loss": 0.562, + "step": 69822 + }, + { + "epoch": 1.79, + "learning_rate": 7.389988630893636e-07, + "loss": 0.6484, + "step": 69823 + }, + { + "epoch": 1.79, + "learning_rate": 7.389721518350137e-07, + "loss": 0.5525, + "step": 69824 + }, + { + "epoch": 1.79, + "learning_rate": 7.389454407805208e-07, + "loss": 0.8984, + "step": 69825 + }, + { + "epoch": 1.79, + "learning_rate": 7.389187299259052e-07, + "loss": 0.6094, + "step": 69826 + }, + { + "epoch": 1.79, + "learning_rate": 7.388920192711876e-07, + "loss": 0.6592, + "step": 69827 + }, + { + "epoch": 1.79, + "learning_rate": 7.388653088163883e-07, + "loss": 0.6924, + "step": 69828 + }, + { + "epoch": 1.79, + "learning_rate": 7.38838598561528e-07, + "loss": 0.667, + "step": 69829 + }, + { + "epoch": 1.79, + "learning_rate": 7.388118885066268e-07, + "loss": 0.5031, + "step": 69830 + }, + { + "epoch": 1.79, + "learning_rate": 7.387851786517054e-07, + "loss": 0.6353, + "step": 69831 + }, + { + "epoch": 1.79, + "learning_rate": 7.387584689967841e-07, + "loss": 0.6191, + "step": 69832 + }, + { + "epoch": 1.79, + "learning_rate": 7.387317595418838e-07, + "loss": 0.7021, + "step": 69833 + }, + { + "epoch": 1.79, + "learning_rate": 7.387050502870243e-07, + "loss": 0.5724, + "step": 69834 + }, + { + "epoch": 1.79, + "learning_rate": 7.386783412322262e-07, + "loss": 0.6133, + "step": 69835 + }, + { + "epoch": 1.79, + "learning_rate": 7.386516323775103e-07, + "loss": 0.7822, + "step": 69836 + }, + { + "epoch": 1.79, + "learning_rate": 7.386249237228967e-07, + "loss": 0.7373, + "step": 69837 + }, + { + "epoch": 1.79, + "learning_rate": 7.38598215268406e-07, + "loss": 0.8203, + "step": 69838 + }, + { + "epoch": 1.79, + "learning_rate": 7.385715070140586e-07, + "loss": 0.7129, + "step": 69839 + }, + { + "epoch": 1.79, + "learning_rate": 7.38544798959875e-07, + "loss": 0.6855, + "step": 69840 + }, + { + "epoch": 1.79, + "learning_rate": 7.385180911058755e-07, + "loss": 0.4854, + "step": 69841 + }, + { + "epoch": 1.79, + "learning_rate": 7.384913834520809e-07, + "loss": 0.4663, + "step": 69842 + }, + { + "epoch": 1.79, + "learning_rate": 7.384646759985116e-07, + "loss": 0.6328, + "step": 69843 + }, + { + "epoch": 1.79, + "learning_rate": 7.384379687451877e-07, + "loss": 0.7485, + "step": 69844 + }, + { + "epoch": 1.79, + "learning_rate": 7.384112616921297e-07, + "loss": 0.7041, + "step": 69845 + }, + { + "epoch": 1.79, + "learning_rate": 7.383845548393582e-07, + "loss": 0.7734, + "step": 69846 + }, + { + "epoch": 1.79, + "learning_rate": 7.383578481868935e-07, + "loss": 0.7148, + "step": 69847 + }, + { + "epoch": 1.79, + "learning_rate": 7.383311417347563e-07, + "loss": 0.6543, + "step": 69848 + }, + { + "epoch": 1.79, + "learning_rate": 7.383044354829667e-07, + "loss": 0.7334, + "step": 69849 + }, + { + "epoch": 1.79, + "learning_rate": 7.382777294315457e-07, + "loss": 0.6494, + "step": 69850 + }, + { + "epoch": 1.79, + "learning_rate": 7.382510235805131e-07, + "loss": 0.5938, + "step": 69851 + }, + { + "epoch": 1.79, + "learning_rate": 7.382243179298899e-07, + "loss": 0.6533, + "step": 69852 + }, + { + "epoch": 1.79, + "learning_rate": 7.381976124796965e-07, + "loss": 0.6104, + "step": 69853 + }, + { + "epoch": 1.79, + "learning_rate": 7.381709072299527e-07, + "loss": 0.748, + "step": 69854 + }, + { + "epoch": 1.79, + "learning_rate": 7.381442021806797e-07, + "loss": 0.5662, + "step": 69855 + }, + { + "epoch": 1.79, + "learning_rate": 7.381174973318973e-07, + "loss": 0.5635, + "step": 69856 + }, + { + "epoch": 1.79, + "learning_rate": 7.380907926836267e-07, + "loss": 0.7158, + "step": 69857 + }, + { + "epoch": 1.79, + "learning_rate": 7.380640882358875e-07, + "loss": 0.5088, + "step": 69858 + }, + { + "epoch": 1.79, + "learning_rate": 7.380373839887008e-07, + "loss": 0.5605, + "step": 69859 + }, + { + "epoch": 1.79, + "learning_rate": 7.380106799420868e-07, + "loss": 0.6606, + "step": 69860 + }, + { + "epoch": 1.79, + "learning_rate": 7.379839760960662e-07, + "loss": 0.7949, + "step": 69861 + }, + { + "epoch": 1.79, + "learning_rate": 7.379572724506589e-07, + "loss": 0.6631, + "step": 69862 + }, + { + "epoch": 1.79, + "learning_rate": 7.379305690058863e-07, + "loss": 0.5972, + "step": 69863 + }, + { + "epoch": 1.79, + "learning_rate": 7.379038657617675e-07, + "loss": 0.6392, + "step": 69864 + }, + { + "epoch": 1.79, + "learning_rate": 7.37877162718324e-07, + "loss": 0.9053, + "step": 69865 + }, + { + "epoch": 1.79, + "learning_rate": 7.378504598755757e-07, + "loss": 0.6089, + "step": 69866 + }, + { + "epoch": 1.79, + "learning_rate": 7.378237572335434e-07, + "loss": 0.55, + "step": 69867 + }, + { + "epoch": 1.79, + "learning_rate": 7.377970547922472e-07, + "loss": 0.6279, + "step": 69868 + }, + { + "epoch": 1.79, + "learning_rate": 7.377703525517079e-07, + "loss": 0.6587, + "step": 69869 + }, + { + "epoch": 1.79, + "learning_rate": 7.377436505119456e-07, + "loss": 0.4351, + "step": 69870 + }, + { + "epoch": 1.79, + "learning_rate": 7.377169486729812e-07, + "loss": 0.6973, + "step": 69871 + }, + { + "epoch": 1.79, + "learning_rate": 7.376902470348346e-07, + "loss": 0.5112, + "step": 69872 + }, + { + "epoch": 1.79, + "learning_rate": 7.376635455975271e-07, + "loss": 0.6836, + "step": 69873 + }, + { + "epoch": 1.79, + "learning_rate": 7.37636844361078e-07, + "loss": 0.769, + "step": 69874 + }, + { + "epoch": 1.79, + "learning_rate": 7.376101433255084e-07, + "loss": 0.5957, + "step": 69875 + }, + { + "epoch": 1.79, + "learning_rate": 7.375834424908388e-07, + "loss": 0.7334, + "step": 69876 + }, + { + "epoch": 1.79, + "learning_rate": 7.375567418570892e-07, + "loss": 0.6528, + "step": 69877 + }, + { + "epoch": 1.79, + "learning_rate": 7.375300414242807e-07, + "loss": 0.6592, + "step": 69878 + }, + { + "epoch": 1.79, + "learning_rate": 7.375033411924329e-07, + "loss": 0.667, + "step": 69879 + }, + { + "epoch": 1.79, + "learning_rate": 7.374766411615672e-07, + "loss": 0.7363, + "step": 69880 + }, + { + "epoch": 1.79, + "learning_rate": 7.374499413317034e-07, + "loss": 0.6812, + "step": 69881 + }, + { + "epoch": 1.79, + "learning_rate": 7.37423241702862e-07, + "loss": 0.708, + "step": 69882 + }, + { + "epoch": 1.79, + "learning_rate": 7.373965422750639e-07, + "loss": 0.5437, + "step": 69883 + }, + { + "epoch": 1.79, + "learning_rate": 7.373698430483291e-07, + "loss": 0.7402, + "step": 69884 + }, + { + "epoch": 1.79, + "learning_rate": 7.373431440226778e-07, + "loss": 0.7256, + "step": 69885 + }, + { + "epoch": 1.79, + "learning_rate": 7.373164451981309e-07, + "loss": 0.7617, + "step": 69886 + }, + { + "epoch": 1.79, + "learning_rate": 7.372897465747087e-07, + "loss": 0.5239, + "step": 69887 + }, + { + "epoch": 1.79, + "learning_rate": 7.372630481524317e-07, + "loss": 0.6284, + "step": 69888 + }, + { + "epoch": 1.79, + "learning_rate": 7.372363499313203e-07, + "loss": 0.5547, + "step": 69889 + }, + { + "epoch": 1.79, + "learning_rate": 7.37209651911395e-07, + "loss": 0.6821, + "step": 69890 + }, + { + "epoch": 1.79, + "learning_rate": 7.371829540926759e-07, + "loss": 0.7959, + "step": 69891 + }, + { + "epoch": 1.79, + "learning_rate": 7.371562564751841e-07, + "loss": 0.6626, + "step": 69892 + }, + { + "epoch": 1.79, + "learning_rate": 7.371295590589399e-07, + "loss": 0.5125, + "step": 69893 + }, + { + "epoch": 1.79, + "learning_rate": 7.37102861843963e-07, + "loss": 0.6602, + "step": 69894 + }, + { + "epoch": 1.79, + "learning_rate": 7.370761648302745e-07, + "loss": 0.6816, + "step": 69895 + }, + { + "epoch": 1.79, + "learning_rate": 7.370494680178947e-07, + "loss": 0.7295, + "step": 69896 + }, + { + "epoch": 1.79, + "learning_rate": 7.370227714068441e-07, + "loss": 0.627, + "step": 69897 + }, + { + "epoch": 1.79, + "learning_rate": 7.369960749971431e-07, + "loss": 0.6011, + "step": 69898 + }, + { + "epoch": 1.79, + "learning_rate": 7.369693787888118e-07, + "loss": 0.626, + "step": 69899 + }, + { + "epoch": 1.79, + "learning_rate": 7.369426827818714e-07, + "loss": 0.6611, + "step": 69900 + }, + { + "epoch": 1.79, + "learning_rate": 7.369159869763415e-07, + "loss": 0.6802, + "step": 69901 + }, + { + "epoch": 1.79, + "learning_rate": 7.368892913722431e-07, + "loss": 0.4232, + "step": 69902 + }, + { + "epoch": 1.79, + "learning_rate": 7.368625959695967e-07, + "loss": 0.543, + "step": 69903 + }, + { + "epoch": 1.79, + "learning_rate": 7.368359007684221e-07, + "loss": 0.4802, + "step": 69904 + }, + { + "epoch": 1.79, + "learning_rate": 7.368092057687405e-07, + "loss": 0.5532, + "step": 69905 + }, + { + "epoch": 1.79, + "learning_rate": 7.367825109705716e-07, + "loss": 0.6274, + "step": 69906 + }, + { + "epoch": 1.79, + "learning_rate": 7.367558163739367e-07, + "loss": 0.752, + "step": 69907 + }, + { + "epoch": 1.79, + "learning_rate": 7.367291219788552e-07, + "loss": 0.6064, + "step": 69908 + }, + { + "epoch": 1.79, + "learning_rate": 7.367024277853486e-07, + "loss": 0.5906, + "step": 69909 + }, + { + "epoch": 1.79, + "learning_rate": 7.366757337934365e-07, + "loss": 0.4452, + "step": 69910 + }, + { + "epoch": 1.79, + "learning_rate": 7.3664904000314e-07, + "loss": 0.5547, + "step": 69911 + }, + { + "epoch": 1.79, + "learning_rate": 7.36622346414479e-07, + "loss": 0.707, + "step": 69912 + }, + { + "epoch": 1.79, + "learning_rate": 7.365956530274744e-07, + "loss": 0.6582, + "step": 69913 + }, + { + "epoch": 1.79, + "learning_rate": 7.365689598421463e-07, + "loss": 0.6963, + "step": 69914 + }, + { + "epoch": 1.79, + "learning_rate": 7.365422668585153e-07, + "loss": 0.6094, + "step": 69915 + }, + { + "epoch": 1.79, + "learning_rate": 7.365155740766013e-07, + "loss": 0.6387, + "step": 69916 + }, + { + "epoch": 1.79, + "learning_rate": 7.364888814964258e-07, + "loss": 0.6719, + "step": 69917 + }, + { + "epoch": 1.79, + "learning_rate": 7.364621891180081e-07, + "loss": 0.7627, + "step": 69918 + }, + { + "epoch": 1.79, + "learning_rate": 7.364354969413696e-07, + "loss": 0.6172, + "step": 69919 + }, + { + "epoch": 1.79, + "learning_rate": 7.3640880496653e-07, + "loss": 0.6426, + "step": 69920 + }, + { + "epoch": 1.79, + "learning_rate": 7.363821131935104e-07, + "loss": 0.6123, + "step": 69921 + }, + { + "epoch": 1.79, + "learning_rate": 7.363554216223307e-07, + "loss": 0.5762, + "step": 69922 + }, + { + "epoch": 1.79, + "learning_rate": 7.363287302530118e-07, + "loss": 0.5249, + "step": 69923 + }, + { + "epoch": 1.79, + "learning_rate": 7.363020390855737e-07, + "loss": 0.5908, + "step": 69924 + }, + { + "epoch": 1.79, + "learning_rate": 7.362753481200367e-07, + "loss": 0.6592, + "step": 69925 + }, + { + "epoch": 1.79, + "learning_rate": 7.36248657356422e-07, + "loss": 0.6094, + "step": 69926 + }, + { + "epoch": 1.79, + "learning_rate": 7.362219667947491e-07, + "loss": 0.7314, + "step": 69927 + }, + { + "epoch": 1.79, + "learning_rate": 7.361952764350394e-07, + "loss": 0.5293, + "step": 69928 + }, + { + "epoch": 1.79, + "learning_rate": 7.361685862773124e-07, + "loss": 0.4436, + "step": 69929 + }, + { + "epoch": 1.79, + "learning_rate": 7.361418963215893e-07, + "loss": 0.6777, + "step": 69930 + }, + { + "epoch": 1.79, + "learning_rate": 7.3611520656789e-07, + "loss": 0.4849, + "step": 69931 + }, + { + "epoch": 1.79, + "learning_rate": 7.360885170162353e-07, + "loss": 0.5398, + "step": 69932 + }, + { + "epoch": 1.79, + "learning_rate": 7.360618276666457e-07, + "loss": 0.7544, + "step": 69933 + }, + { + "epoch": 1.79, + "learning_rate": 7.360351385191412e-07, + "loss": 0.5942, + "step": 69934 + }, + { + "epoch": 1.79, + "learning_rate": 7.360084495737424e-07, + "loss": 0.4827, + "step": 69935 + }, + { + "epoch": 1.79, + "learning_rate": 7.359817608304699e-07, + "loss": 0.5898, + "step": 69936 + }, + { + "epoch": 1.79, + "learning_rate": 7.359550722893438e-07, + "loss": 0.5254, + "step": 69937 + }, + { + "epoch": 1.79, + "learning_rate": 7.35928383950385e-07, + "loss": 0.604, + "step": 69938 + }, + { + "epoch": 1.79, + "learning_rate": 7.359016958136135e-07, + "loss": 0.584, + "step": 69939 + }, + { + "epoch": 1.79, + "learning_rate": 7.358750078790501e-07, + "loss": 0.5845, + "step": 69940 + }, + { + "epoch": 1.79, + "learning_rate": 7.35848320146715e-07, + "loss": 0.6846, + "step": 69941 + }, + { + "epoch": 1.79, + "learning_rate": 7.358216326166287e-07, + "loss": 0.6392, + "step": 69942 + }, + { + "epoch": 1.79, + "learning_rate": 7.35794945288812e-07, + "loss": 0.6641, + "step": 69943 + }, + { + "epoch": 1.79, + "learning_rate": 7.357682581632843e-07, + "loss": 0.667, + "step": 69944 + }, + { + "epoch": 1.79, + "learning_rate": 7.35741571240067e-07, + "loss": 0.6162, + "step": 69945 + }, + { + "epoch": 1.79, + "learning_rate": 7.357148845191801e-07, + "loss": 0.7163, + "step": 69946 + }, + { + "epoch": 1.79, + "learning_rate": 7.356881980006445e-07, + "loss": 0.6777, + "step": 69947 + }, + { + "epoch": 1.79, + "learning_rate": 7.356615116844797e-07, + "loss": 0.7197, + "step": 69948 + }, + { + "epoch": 1.79, + "learning_rate": 7.356348255707072e-07, + "loss": 0.4685, + "step": 69949 + }, + { + "epoch": 1.79, + "learning_rate": 7.356081396593467e-07, + "loss": 0.6147, + "step": 69950 + }, + { + "epoch": 1.79, + "learning_rate": 7.355814539504192e-07, + "loss": 0.6284, + "step": 69951 + }, + { + "epoch": 1.79, + "learning_rate": 7.355547684439445e-07, + "loss": 0.5752, + "step": 69952 + }, + { + "epoch": 1.79, + "learning_rate": 7.355280831399439e-07, + "loss": 0.5601, + "step": 69953 + }, + { + "epoch": 1.79, + "learning_rate": 7.355013980384369e-07, + "loss": 0.686, + "step": 69954 + }, + { + "epoch": 1.79, + "learning_rate": 7.354747131394443e-07, + "loss": 0.7734, + "step": 69955 + }, + { + "epoch": 1.79, + "learning_rate": 7.354480284429865e-07, + "loss": 0.4375, + "step": 69956 + }, + { + "epoch": 1.79, + "learning_rate": 7.354213439490842e-07, + "loss": 0.75, + "step": 69957 + }, + { + "epoch": 1.79, + "learning_rate": 7.353946596577572e-07, + "loss": 0.731, + "step": 69958 + }, + { + "epoch": 1.79, + "learning_rate": 7.353679755690267e-07, + "loss": 0.7246, + "step": 69959 + }, + { + "epoch": 1.79, + "learning_rate": 7.353412916829125e-07, + "loss": 0.6719, + "step": 69960 + }, + { + "epoch": 1.79, + "learning_rate": 7.353146079994356e-07, + "loss": 0.6816, + "step": 69961 + }, + { + "epoch": 1.79, + "learning_rate": 7.352879245186158e-07, + "loss": 0.6934, + "step": 69962 + }, + { + "epoch": 1.79, + "learning_rate": 7.352612412404744e-07, + "loss": 0.751, + "step": 69963 + }, + { + "epoch": 1.79, + "learning_rate": 7.35234558165031e-07, + "loss": 0.5215, + "step": 69964 + }, + { + "epoch": 1.79, + "learning_rate": 7.352078752923063e-07, + "loss": 0.6748, + "step": 69965 + }, + { + "epoch": 1.79, + "learning_rate": 7.351811926223209e-07, + "loss": 0.751, + "step": 69966 + }, + { + "epoch": 1.79, + "learning_rate": 7.351545101550947e-07, + "loss": 0.5537, + "step": 69967 + }, + { + "epoch": 1.79, + "learning_rate": 7.351278278906488e-07, + "loss": 0.3777, + "step": 69968 + }, + { + "epoch": 1.79, + "learning_rate": 7.351011458290031e-07, + "loss": 0.6592, + "step": 69969 + }, + { + "epoch": 1.79, + "learning_rate": 7.350744639701785e-07, + "loss": 0.4027, + "step": 69970 + }, + { + "epoch": 1.79, + "learning_rate": 7.350477823141953e-07, + "loss": 0.7666, + "step": 69971 + }, + { + "epoch": 1.79, + "learning_rate": 7.350211008610735e-07, + "loss": 0.6973, + "step": 69972 + }, + { + "epoch": 1.79, + "learning_rate": 7.349944196108345e-07, + "loss": 0.4917, + "step": 69973 + }, + { + "epoch": 1.79, + "learning_rate": 7.349677385634976e-07, + "loss": 0.4526, + "step": 69974 + }, + { + "epoch": 1.79, + "learning_rate": 7.349410577190835e-07, + "loss": 0.6162, + "step": 69975 + }, + { + "epoch": 1.79, + "learning_rate": 7.349143770776133e-07, + "loss": 0.5894, + "step": 69976 + }, + { + "epoch": 1.79, + "learning_rate": 7.348876966391067e-07, + "loss": 0.6846, + "step": 69977 + }, + { + "epoch": 1.79, + "learning_rate": 7.348610164035844e-07, + "loss": 0.7676, + "step": 69978 + }, + { + "epoch": 1.79, + "learning_rate": 7.348343363710667e-07, + "loss": 0.5903, + "step": 69979 + }, + { + "epoch": 1.79, + "learning_rate": 7.348076565415746e-07, + "loss": 0.6362, + "step": 69980 + }, + { + "epoch": 1.79, + "learning_rate": 7.347809769151277e-07, + "loss": 0.4045, + "step": 69981 + }, + { + "epoch": 1.79, + "learning_rate": 7.34754297491747e-07, + "loss": 0.5771, + "step": 69982 + }, + { + "epoch": 1.79, + "learning_rate": 7.34727618271453e-07, + "loss": 0.5889, + "step": 69983 + }, + { + "epoch": 1.79, + "learning_rate": 7.347009392542654e-07, + "loss": 0.6045, + "step": 69984 + }, + { + "epoch": 1.79, + "learning_rate": 7.346742604402053e-07, + "loss": 0.7139, + "step": 69985 + }, + { + "epoch": 1.79, + "learning_rate": 7.346475818292927e-07, + "loss": 0.5654, + "step": 69986 + }, + { + "epoch": 1.79, + "learning_rate": 7.346209034215484e-07, + "loss": 0.5762, + "step": 69987 + }, + { + "epoch": 1.79, + "learning_rate": 7.345942252169928e-07, + "loss": 0.5522, + "step": 69988 + }, + { + "epoch": 1.79, + "learning_rate": 7.345675472156461e-07, + "loss": 0.6738, + "step": 69989 + }, + { + "epoch": 1.79, + "learning_rate": 7.345408694175288e-07, + "loss": 0.6204, + "step": 69990 + }, + { + "epoch": 1.79, + "learning_rate": 7.345141918226612e-07, + "loss": 0.5371, + "step": 69991 + }, + { + "epoch": 1.79, + "learning_rate": 7.34487514431064e-07, + "loss": 0.5898, + "step": 69992 + }, + { + "epoch": 1.79, + "learning_rate": 7.344608372427579e-07, + "loss": 0.6377, + "step": 69993 + }, + { + "epoch": 1.79, + "learning_rate": 7.344341602577624e-07, + "loss": 0.5933, + "step": 69994 + }, + { + "epoch": 1.79, + "learning_rate": 7.344074834760987e-07, + "loss": 0.6528, + "step": 69995 + }, + { + "epoch": 1.79, + "learning_rate": 7.343808068977868e-07, + "loss": 0.4229, + "step": 69996 + }, + { + "epoch": 1.79, + "learning_rate": 7.343541305228475e-07, + "loss": 0.5498, + "step": 69997 + }, + { + "epoch": 1.79, + "learning_rate": 7.343274543513007e-07, + "loss": 0.6475, + "step": 69998 + }, + { + "epoch": 1.79, + "learning_rate": 7.343007783831675e-07, + "loss": 0.635, + "step": 69999 + }, + { + "epoch": 1.79, + "learning_rate": 7.342741026184676e-07, + "loss": 0.6748, + "step": 70000 + }, + { + "epoch": 1.79, + "learning_rate": 7.342474270572222e-07, + "loss": 0.4531, + "step": 70001 + }, + { + "epoch": 1.79, + "learning_rate": 7.342207516994511e-07, + "loss": 0.6675, + "step": 70002 + }, + { + "epoch": 1.79, + "learning_rate": 7.341940765451753e-07, + "loss": 0.541, + "step": 70003 + }, + { + "epoch": 1.79, + "learning_rate": 7.341674015944146e-07, + "loss": 0.71, + "step": 70004 + }, + { + "epoch": 1.79, + "learning_rate": 7.341407268471898e-07, + "loss": 0.6279, + "step": 70005 + }, + { + "epoch": 1.79, + "learning_rate": 7.34114052303521e-07, + "loss": 0.542, + "step": 70006 + }, + { + "epoch": 1.79, + "learning_rate": 7.34087377963429e-07, + "loss": 0.6123, + "step": 70007 + }, + { + "epoch": 1.79, + "learning_rate": 7.34060703826934e-07, + "loss": 0.6152, + "step": 70008 + }, + { + "epoch": 1.79, + "learning_rate": 7.340340298940565e-07, + "loss": 0.6611, + "step": 70009 + }, + { + "epoch": 1.79, + "learning_rate": 7.340073561648168e-07, + "loss": 0.7607, + "step": 70010 + }, + { + "epoch": 1.79, + "learning_rate": 7.339806826392356e-07, + "loss": 0.583, + "step": 70011 + }, + { + "epoch": 1.79, + "learning_rate": 7.339540093173331e-07, + "loss": 0.436, + "step": 70012 + }, + { + "epoch": 1.79, + "learning_rate": 7.339273361991301e-07, + "loss": 0.4478, + "step": 70013 + }, + { + "epoch": 1.79, + "learning_rate": 7.339006632846465e-07, + "loss": 0.6743, + "step": 70014 + }, + { + "epoch": 1.79, + "learning_rate": 7.338739905739027e-07, + "loss": 0.5164, + "step": 70015 + }, + { + "epoch": 1.79, + "learning_rate": 7.338473180669196e-07, + "loss": 0.5039, + "step": 70016 + }, + { + "epoch": 1.79, + "learning_rate": 7.338206457637171e-07, + "loss": 0.5361, + "step": 70017 + }, + { + "epoch": 1.79, + "learning_rate": 7.337939736643161e-07, + "loss": 0.6411, + "step": 70018 + }, + { + "epoch": 1.79, + "learning_rate": 7.337673017687365e-07, + "loss": 0.6079, + "step": 70019 + }, + { + "epoch": 1.79, + "learning_rate": 7.337406300769995e-07, + "loss": 0.6465, + "step": 70020 + }, + { + "epoch": 1.79, + "learning_rate": 7.337139585891247e-07, + "loss": 0.6445, + "step": 70021 + }, + { + "epoch": 1.79, + "learning_rate": 7.336872873051331e-07, + "loss": 0.6377, + "step": 70022 + }, + { + "epoch": 1.79, + "learning_rate": 7.336606162250451e-07, + "loss": 0.6406, + "step": 70023 + }, + { + "epoch": 1.79, + "learning_rate": 7.336339453488808e-07, + "loss": 0.7344, + "step": 70024 + }, + { + "epoch": 1.79, + "learning_rate": 7.336072746766604e-07, + "loss": 0.5073, + "step": 70025 + }, + { + "epoch": 1.79, + "learning_rate": 7.335806042084049e-07, + "loss": 0.688, + "step": 70026 + }, + { + "epoch": 1.79, + "learning_rate": 7.335539339441343e-07, + "loss": 0.7432, + "step": 70027 + }, + { + "epoch": 1.79, + "learning_rate": 7.335272638838694e-07, + "loss": 0.4583, + "step": 70028 + }, + { + "epoch": 1.79, + "learning_rate": 7.335005940276303e-07, + "loss": 0.6543, + "step": 70029 + }, + { + "epoch": 1.79, + "learning_rate": 7.334739243754376e-07, + "loss": 0.7793, + "step": 70030 + }, + { + "epoch": 1.79, + "learning_rate": 7.334472549273116e-07, + "loss": 0.4722, + "step": 70031 + }, + { + "epoch": 1.79, + "learning_rate": 7.33420585683273e-07, + "loss": 0.7451, + "step": 70032 + }, + { + "epoch": 1.79, + "learning_rate": 7.333939166433421e-07, + "loss": 0.5708, + "step": 70033 + }, + { + "epoch": 1.8, + "learning_rate": 7.333672478075388e-07, + "loss": 0.6597, + "step": 70034 + }, + { + "epoch": 1.8, + "learning_rate": 7.333405791758842e-07, + "loss": 0.6445, + "step": 70035 + }, + { + "epoch": 1.8, + "learning_rate": 7.333139107483981e-07, + "loss": 0.7129, + "step": 70036 + }, + { + "epoch": 1.8, + "learning_rate": 7.332872425251017e-07, + "loss": 0.6885, + "step": 70037 + }, + { + "epoch": 1.8, + "learning_rate": 7.332605745060147e-07, + "loss": 0.3818, + "step": 70038 + }, + { + "epoch": 1.8, + "learning_rate": 7.332339066911579e-07, + "loss": 0.5791, + "step": 70039 + }, + { + "epoch": 1.8, + "learning_rate": 7.332072390805516e-07, + "loss": 0.5337, + "step": 70040 + }, + { + "epoch": 1.8, + "learning_rate": 7.331805716742165e-07, + "loss": 0.6875, + "step": 70041 + }, + { + "epoch": 1.8, + "learning_rate": 7.331539044721728e-07, + "loss": 0.6577, + "step": 70042 + }, + { + "epoch": 1.8, + "learning_rate": 7.331272374744408e-07, + "loss": 0.5935, + "step": 70043 + }, + { + "epoch": 1.8, + "learning_rate": 7.331005706810407e-07, + "loss": 0.7007, + "step": 70044 + }, + { + "epoch": 1.8, + "learning_rate": 7.330739040919934e-07, + "loss": 0.7422, + "step": 70045 + }, + { + "epoch": 1.8, + "learning_rate": 7.330472377073191e-07, + "loss": 0.5459, + "step": 70046 + }, + { + "epoch": 1.8, + "learning_rate": 7.330205715270383e-07, + "loss": 0.4849, + "step": 70047 + }, + { + "epoch": 1.8, + "learning_rate": 7.329939055511713e-07, + "loss": 0.6523, + "step": 70048 + }, + { + "epoch": 1.8, + "learning_rate": 7.329672397797386e-07, + "loss": 0.5918, + "step": 70049 + }, + { + "epoch": 1.8, + "learning_rate": 7.329405742127606e-07, + "loss": 0.6934, + "step": 70050 + }, + { + "epoch": 1.8, + "learning_rate": 7.329139088502579e-07, + "loss": 0.6406, + "step": 70051 + }, + { + "epoch": 1.8, + "learning_rate": 7.328872436922508e-07, + "loss": 0.623, + "step": 70052 + }, + { + "epoch": 1.8, + "learning_rate": 7.328605787387594e-07, + "loss": 0.6045, + "step": 70053 + }, + { + "epoch": 1.8, + "learning_rate": 7.328339139898046e-07, + "loss": 0.709, + "step": 70054 + }, + { + "epoch": 1.8, + "learning_rate": 7.328072494454063e-07, + "loss": 0.5098, + "step": 70055 + }, + { + "epoch": 1.8, + "learning_rate": 7.327805851055853e-07, + "loss": 0.6123, + "step": 70056 + }, + { + "epoch": 1.8, + "learning_rate": 7.327539209703619e-07, + "loss": 0.6519, + "step": 70057 + }, + { + "epoch": 1.8, + "learning_rate": 7.327272570397567e-07, + "loss": 0.6616, + "step": 70058 + }, + { + "epoch": 1.8, + "learning_rate": 7.327005933137896e-07, + "loss": 0.4763, + "step": 70059 + }, + { + "epoch": 1.8, + "learning_rate": 7.326739297924818e-07, + "loss": 0.7236, + "step": 70060 + }, + { + "epoch": 1.8, + "learning_rate": 7.326472664758531e-07, + "loss": 0.707, + "step": 70061 + }, + { + "epoch": 1.8, + "learning_rate": 7.326206033639244e-07, + "loss": 0.5859, + "step": 70062 + }, + { + "epoch": 1.8, + "learning_rate": 7.325939404567153e-07, + "loss": 0.708, + "step": 70063 + }, + { + "epoch": 1.8, + "learning_rate": 7.32567277754247e-07, + "loss": 0.6196, + "step": 70064 + }, + { + "epoch": 1.8, + "learning_rate": 7.325406152565394e-07, + "loss": 0.7051, + "step": 70065 + }, + { + "epoch": 1.8, + "learning_rate": 7.325139529636133e-07, + "loss": 0.6069, + "step": 70066 + }, + { + "epoch": 1.8, + "learning_rate": 7.324872908754888e-07, + "loss": 0.6455, + "step": 70067 + }, + { + "epoch": 1.8, + "learning_rate": 7.324606289921868e-07, + "loss": 0.5229, + "step": 70068 + }, + { + "epoch": 1.8, + "learning_rate": 7.324339673137272e-07, + "loss": 0.709, + "step": 70069 + }, + { + "epoch": 1.8, + "learning_rate": 7.324073058401308e-07, + "loss": 0.6465, + "step": 70070 + }, + { + "epoch": 1.8, + "learning_rate": 7.323806445714175e-07, + "loss": 0.6216, + "step": 70071 + }, + { + "epoch": 1.8, + "learning_rate": 7.323539835076084e-07, + "loss": 0.6953, + "step": 70072 + }, + { + "epoch": 1.8, + "learning_rate": 7.323273226487234e-07, + "loss": 0.752, + "step": 70073 + }, + { + "epoch": 1.8, + "learning_rate": 7.323006619947829e-07, + "loss": 0.7725, + "step": 70074 + }, + { + "epoch": 1.8, + "learning_rate": 7.322740015458078e-07, + "loss": 0.571, + "step": 70075 + }, + { + "epoch": 1.8, + "learning_rate": 7.322473413018178e-07, + "loss": 0.6758, + "step": 70076 + }, + { + "epoch": 1.8, + "learning_rate": 7.32220681262834e-07, + "loss": 0.6331, + "step": 70077 + }, + { + "epoch": 1.8, + "learning_rate": 7.321940214288765e-07, + "loss": 0.6987, + "step": 70078 + }, + { + "epoch": 1.8, + "learning_rate": 7.321673617999654e-07, + "loss": 0.6191, + "step": 70079 + }, + { + "epoch": 1.8, + "learning_rate": 7.321407023761217e-07, + "loss": 0.6099, + "step": 70080 + }, + { + "epoch": 1.8, + "learning_rate": 7.321140431573653e-07, + "loss": 0.5723, + "step": 70081 + }, + { + "epoch": 1.8, + "learning_rate": 7.320873841437174e-07, + "loss": 0.5615, + "step": 70082 + }, + { + "epoch": 1.8, + "learning_rate": 7.320607253351976e-07, + "loss": 0.6973, + "step": 70083 + }, + { + "epoch": 1.8, + "learning_rate": 7.320340667318265e-07, + "loss": 0.5393, + "step": 70084 + }, + { + "epoch": 1.8, + "learning_rate": 7.320074083336246e-07, + "loss": 0.666, + "step": 70085 + }, + { + "epoch": 1.8, + "learning_rate": 7.319807501406122e-07, + "loss": 0.6758, + "step": 70086 + }, + { + "epoch": 1.8, + "learning_rate": 7.3195409215281e-07, + "loss": 0.4636, + "step": 70087 + }, + { + "epoch": 1.8, + "learning_rate": 7.319274343702379e-07, + "loss": 0.4233, + "step": 70088 + }, + { + "epoch": 1.8, + "learning_rate": 7.319007767929171e-07, + "loss": 0.4948, + "step": 70089 + }, + { + "epoch": 1.8, + "learning_rate": 7.318741194208672e-07, + "loss": 0.6157, + "step": 70090 + }, + { + "epoch": 1.8, + "learning_rate": 7.318474622541091e-07, + "loss": 0.564, + "step": 70091 + }, + { + "epoch": 1.8, + "learning_rate": 7.318208052926634e-07, + "loss": 0.668, + "step": 70092 + }, + { + "epoch": 1.8, + "learning_rate": 7.317941485365497e-07, + "loss": 0.5815, + "step": 70093 + }, + { + "epoch": 1.8, + "learning_rate": 7.317674919857892e-07, + "loss": 0.4631, + "step": 70094 + }, + { + "epoch": 1.8, + "learning_rate": 7.317408356404016e-07, + "loss": 0.7568, + "step": 70095 + }, + { + "epoch": 1.8, + "learning_rate": 7.31714179500408e-07, + "loss": 0.7891, + "step": 70096 + }, + { + "epoch": 1.8, + "learning_rate": 7.316875235658287e-07, + "loss": 0.6538, + "step": 70097 + }, + { + "epoch": 1.8, + "learning_rate": 7.316608678366833e-07, + "loss": 0.7285, + "step": 70098 + }, + { + "epoch": 1.8, + "learning_rate": 7.316342123129935e-07, + "loss": 0.6025, + "step": 70099 + }, + { + "epoch": 1.8, + "learning_rate": 7.316075569947786e-07, + "loss": 0.6172, + "step": 70100 + }, + { + "epoch": 1.8, + "learning_rate": 7.315809018820595e-07, + "loss": 0.6816, + "step": 70101 + }, + { + "epoch": 1.8, + "learning_rate": 7.315542469748571e-07, + "loss": 0.5107, + "step": 70102 + }, + { + "epoch": 1.8, + "learning_rate": 7.315275922731907e-07, + "loss": 0.6191, + "step": 70103 + }, + { + "epoch": 1.8, + "learning_rate": 7.315009377770816e-07, + "loss": 0.5371, + "step": 70104 + }, + { + "epoch": 1.8, + "learning_rate": 7.314742834865495e-07, + "loss": 0.5374, + "step": 70105 + }, + { + "epoch": 1.8, + "learning_rate": 7.314476294016155e-07, + "loss": 0.5898, + "step": 70106 + }, + { + "epoch": 1.8, + "learning_rate": 7.314209755222993e-07, + "loss": 0.4438, + "step": 70107 + }, + { + "epoch": 1.8, + "learning_rate": 7.313943218486221e-07, + "loss": 0.5928, + "step": 70108 + }, + { + "epoch": 1.8, + "learning_rate": 7.313676683806038e-07, + "loss": 0.5581, + "step": 70109 + }, + { + "epoch": 1.8, + "learning_rate": 7.313410151182651e-07, + "loss": 0.5879, + "step": 70110 + }, + { + "epoch": 1.8, + "learning_rate": 7.313143620616258e-07, + "loss": 0.5122, + "step": 70111 + }, + { + "epoch": 1.8, + "learning_rate": 7.312877092107074e-07, + "loss": 0.6567, + "step": 70112 + }, + { + "epoch": 1.8, + "learning_rate": 7.312610565655292e-07, + "loss": 0.7842, + "step": 70113 + }, + { + "epoch": 1.8, + "learning_rate": 7.312344041261123e-07, + "loss": 0.5498, + "step": 70114 + }, + { + "epoch": 1.8, + "learning_rate": 7.312077518924765e-07, + "loss": 0.5986, + "step": 70115 + }, + { + "epoch": 1.8, + "learning_rate": 7.311810998646428e-07, + "loss": 0.4902, + "step": 70116 + }, + { + "epoch": 1.8, + "learning_rate": 7.311544480426313e-07, + "loss": 0.6377, + "step": 70117 + }, + { + "epoch": 1.8, + "learning_rate": 7.311277964264625e-07, + "loss": 0.52, + "step": 70118 + }, + { + "epoch": 1.8, + "learning_rate": 7.311011450161566e-07, + "loss": 0.6006, + "step": 70119 + }, + { + "epoch": 1.8, + "learning_rate": 7.310744938117344e-07, + "loss": 0.6357, + "step": 70120 + }, + { + "epoch": 1.8, + "learning_rate": 7.310478428132161e-07, + "loss": 0.7207, + "step": 70121 + }, + { + "epoch": 1.8, + "learning_rate": 7.310211920206222e-07, + "loss": 0.6675, + "step": 70122 + }, + { + "epoch": 1.8, + "learning_rate": 7.30994541433973e-07, + "loss": 0.7026, + "step": 70123 + }, + { + "epoch": 1.8, + "learning_rate": 7.309678910532886e-07, + "loss": 0.6353, + "step": 70124 + }, + { + "epoch": 1.8, + "learning_rate": 7.3094124087859e-07, + "loss": 0.4524, + "step": 70125 + }, + { + "epoch": 1.8, + "learning_rate": 7.30914590909897e-07, + "loss": 0.4702, + "step": 70126 + }, + { + "epoch": 1.8, + "learning_rate": 7.308879411472306e-07, + "loss": 0.5322, + "step": 70127 + }, + { + "epoch": 1.8, + "learning_rate": 7.308612915906108e-07, + "loss": 0.6562, + "step": 70128 + }, + { + "epoch": 1.8, + "learning_rate": 7.308346422400583e-07, + "loss": 0.6167, + "step": 70129 + }, + { + "epoch": 1.8, + "learning_rate": 7.30807993095593e-07, + "loss": 0.6836, + "step": 70130 + }, + { + "epoch": 1.8, + "learning_rate": 7.30781344157236e-07, + "loss": 0.6016, + "step": 70131 + }, + { + "epoch": 1.8, + "learning_rate": 7.307546954250076e-07, + "loss": 0.6963, + "step": 70132 + }, + { + "epoch": 1.8, + "learning_rate": 7.307280468989276e-07, + "loss": 0.6343, + "step": 70133 + }, + { + "epoch": 1.8, + "learning_rate": 7.307013985790166e-07, + "loss": 0.5552, + "step": 70134 + }, + { + "epoch": 1.8, + "learning_rate": 7.306747504652954e-07, + "loss": 0.6499, + "step": 70135 + }, + { + "epoch": 1.8, + "learning_rate": 7.306481025577838e-07, + "loss": 0.5735, + "step": 70136 + }, + { + "epoch": 1.8, + "learning_rate": 7.306214548565029e-07, + "loss": 0.627, + "step": 70137 + }, + { + "epoch": 1.8, + "learning_rate": 7.305948073614725e-07, + "loss": 0.5781, + "step": 70138 + }, + { + "epoch": 1.8, + "learning_rate": 7.305681600727136e-07, + "loss": 0.6196, + "step": 70139 + }, + { + "epoch": 1.8, + "learning_rate": 7.30541512990246e-07, + "loss": 0.6167, + "step": 70140 + }, + { + "epoch": 1.8, + "learning_rate": 7.305148661140905e-07, + "loss": 0.6914, + "step": 70141 + }, + { + "epoch": 1.8, + "learning_rate": 7.304882194442677e-07, + "loss": 0.5254, + "step": 70142 + }, + { + "epoch": 1.8, + "learning_rate": 7.304615729807971e-07, + "loss": 0.626, + "step": 70143 + }, + { + "epoch": 1.8, + "learning_rate": 7.304349267237e-07, + "loss": 0.6792, + "step": 70144 + }, + { + "epoch": 1.8, + "learning_rate": 7.304082806729964e-07, + "loss": 0.6865, + "step": 70145 + }, + { + "epoch": 1.8, + "learning_rate": 7.303816348287069e-07, + "loss": 0.6855, + "step": 70146 + }, + { + "epoch": 1.8, + "learning_rate": 7.303549891908514e-07, + "loss": 0.748, + "step": 70147 + }, + { + "epoch": 1.8, + "learning_rate": 7.303283437594509e-07, + "loss": 0.5391, + "step": 70148 + }, + { + "epoch": 1.8, + "learning_rate": 7.303016985345256e-07, + "loss": 0.7549, + "step": 70149 + }, + { + "epoch": 1.8, + "learning_rate": 7.30275053516096e-07, + "loss": 0.5991, + "step": 70150 + }, + { + "epoch": 1.8, + "learning_rate": 7.302484087041825e-07, + "loss": 0.7549, + "step": 70151 + }, + { + "epoch": 1.8, + "learning_rate": 7.302217640988054e-07, + "loss": 0.6514, + "step": 70152 + }, + { + "epoch": 1.8, + "learning_rate": 7.301951196999848e-07, + "loss": 0.59, + "step": 70153 + }, + { + "epoch": 1.8, + "learning_rate": 7.301684755077415e-07, + "loss": 0.6099, + "step": 70154 + }, + { + "epoch": 1.8, + "learning_rate": 7.301418315220958e-07, + "loss": 0.5889, + "step": 70155 + }, + { + "epoch": 1.8, + "learning_rate": 7.301151877430681e-07, + "loss": 0.6113, + "step": 70156 + }, + { + "epoch": 1.8, + "learning_rate": 7.300885441706786e-07, + "loss": 0.6514, + "step": 70157 + }, + { + "epoch": 1.8, + "learning_rate": 7.300619008049481e-07, + "loss": 0.6758, + "step": 70158 + }, + { + "epoch": 1.8, + "learning_rate": 7.300352576458966e-07, + "loss": 0.6841, + "step": 70159 + }, + { + "epoch": 1.8, + "learning_rate": 7.300086146935449e-07, + "loss": 0.6143, + "step": 70160 + }, + { + "epoch": 1.8, + "learning_rate": 7.29981971947913e-07, + "loss": 0.6387, + "step": 70161 + }, + { + "epoch": 1.8, + "learning_rate": 7.299553294090219e-07, + "loss": 0.791, + "step": 70162 + }, + { + "epoch": 1.8, + "learning_rate": 7.299286870768914e-07, + "loss": 0.6538, + "step": 70163 + }, + { + "epoch": 1.8, + "learning_rate": 7.299020449515419e-07, + "loss": 0.6523, + "step": 70164 + }, + { + "epoch": 1.8, + "learning_rate": 7.298754030329941e-07, + "loss": 0.6045, + "step": 70165 + }, + { + "epoch": 1.8, + "learning_rate": 7.29848761321268e-07, + "loss": 0.7822, + "step": 70166 + }, + { + "epoch": 1.8, + "learning_rate": 7.298221198163847e-07, + "loss": 0.7207, + "step": 70167 + }, + { + "epoch": 1.8, + "learning_rate": 7.297954785183641e-07, + "loss": 0.7002, + "step": 70168 + }, + { + "epoch": 1.8, + "learning_rate": 7.297688374272264e-07, + "loss": 0.6963, + "step": 70169 + }, + { + "epoch": 1.8, + "learning_rate": 7.297421965429926e-07, + "loss": 0.5259, + "step": 70170 + }, + { + "epoch": 1.8, + "learning_rate": 7.297155558656825e-07, + "loss": 0.5396, + "step": 70171 + }, + { + "epoch": 1.8, + "learning_rate": 7.296889153953172e-07, + "loss": 0.4915, + "step": 70172 + }, + { + "epoch": 1.8, + "learning_rate": 7.296622751319165e-07, + "loss": 0.7324, + "step": 70173 + }, + { + "epoch": 1.8, + "learning_rate": 7.296356350755007e-07, + "loss": 0.7402, + "step": 70174 + }, + { + "epoch": 1.8, + "learning_rate": 7.296089952260907e-07, + "loss": 0.5757, + "step": 70175 + }, + { + "epoch": 1.8, + "learning_rate": 7.295823555837064e-07, + "loss": 0.8008, + "step": 70176 + }, + { + "epoch": 1.8, + "learning_rate": 7.295557161483688e-07, + "loss": 0.7578, + "step": 70177 + }, + { + "epoch": 1.8, + "learning_rate": 7.295290769200975e-07, + "loss": 0.4276, + "step": 70178 + }, + { + "epoch": 1.8, + "learning_rate": 7.295024378989137e-07, + "loss": 0.6318, + "step": 70179 + }, + { + "epoch": 1.8, + "learning_rate": 7.294757990848373e-07, + "loss": 0.7021, + "step": 70180 + }, + { + "epoch": 1.8, + "learning_rate": 7.29449160477889e-07, + "loss": 0.6729, + "step": 70181 + }, + { + "epoch": 1.8, + "learning_rate": 7.294225220780892e-07, + "loss": 0.6865, + "step": 70182 + }, + { + "epoch": 1.8, + "learning_rate": 7.293958838854577e-07, + "loss": 0.5201, + "step": 70183 + }, + { + "epoch": 1.8, + "learning_rate": 7.293692459000156e-07, + "loss": 0.4905, + "step": 70184 + }, + { + "epoch": 1.8, + "learning_rate": 7.293426081217828e-07, + "loss": 0.5747, + "step": 70185 + }, + { + "epoch": 1.8, + "learning_rate": 7.293159705507801e-07, + "loss": 0.6484, + "step": 70186 + }, + { + "epoch": 1.8, + "learning_rate": 7.292893331870277e-07, + "loss": 0.6294, + "step": 70187 + }, + { + "epoch": 1.8, + "learning_rate": 7.29262696030546e-07, + "loss": 0.6499, + "step": 70188 + }, + { + "epoch": 1.8, + "learning_rate": 7.292360590813555e-07, + "loss": 0.7168, + "step": 70189 + }, + { + "epoch": 1.8, + "learning_rate": 7.292094223394762e-07, + "loss": 0.6816, + "step": 70190 + }, + { + "epoch": 1.8, + "learning_rate": 7.291827858049291e-07, + "loss": 0.6104, + "step": 70191 + }, + { + "epoch": 1.8, + "learning_rate": 7.291561494777343e-07, + "loss": 0.5103, + "step": 70192 + }, + { + "epoch": 1.8, + "learning_rate": 7.29129513357912e-07, + "loss": 0.6895, + "step": 70193 + }, + { + "epoch": 1.8, + "learning_rate": 7.291028774454828e-07, + "loss": 0.7119, + "step": 70194 + }, + { + "epoch": 1.8, + "learning_rate": 7.29076241740467e-07, + "loss": 0.7666, + "step": 70195 + }, + { + "epoch": 1.8, + "learning_rate": 7.290496062428853e-07, + "loss": 0.5776, + "step": 70196 + }, + { + "epoch": 1.8, + "learning_rate": 7.290229709527575e-07, + "loss": 0.6172, + "step": 70197 + }, + { + "epoch": 1.8, + "learning_rate": 7.289963358701048e-07, + "loss": 0.6426, + "step": 70198 + }, + { + "epoch": 1.8, + "learning_rate": 7.289697009949467e-07, + "loss": 0.7344, + "step": 70199 + }, + { + "epoch": 1.8, + "learning_rate": 7.289430663273044e-07, + "loss": 0.7959, + "step": 70200 + }, + { + "epoch": 1.8, + "learning_rate": 7.289164318671976e-07, + "loss": 0.6289, + "step": 70201 + }, + { + "epoch": 1.8, + "learning_rate": 7.288897976146475e-07, + "loss": 0.6836, + "step": 70202 + }, + { + "epoch": 1.8, + "learning_rate": 7.288631635696738e-07, + "loss": 0.6665, + "step": 70203 + }, + { + "epoch": 1.8, + "learning_rate": 7.288365297322971e-07, + "loss": 0.6279, + "step": 70204 + }, + { + "epoch": 1.8, + "learning_rate": 7.288098961025375e-07, + "loss": 0.7188, + "step": 70205 + }, + { + "epoch": 1.8, + "learning_rate": 7.28783262680416e-07, + "loss": 0.6235, + "step": 70206 + }, + { + "epoch": 1.8, + "learning_rate": 7.287566294659526e-07, + "loss": 0.5723, + "step": 70207 + }, + { + "epoch": 1.8, + "learning_rate": 7.287299964591677e-07, + "loss": 0.5908, + "step": 70208 + }, + { + "epoch": 1.8, + "learning_rate": 7.287033636600819e-07, + "loss": 0.6636, + "step": 70209 + }, + { + "epoch": 1.8, + "learning_rate": 7.286767310687154e-07, + "loss": 0.603, + "step": 70210 + }, + { + "epoch": 1.8, + "learning_rate": 7.286500986850885e-07, + "loss": 0.6865, + "step": 70211 + }, + { + "epoch": 1.8, + "learning_rate": 7.286234665092223e-07, + "loss": 0.5771, + "step": 70212 + }, + { + "epoch": 1.8, + "learning_rate": 7.285968345411363e-07, + "loss": 0.543, + "step": 70213 + }, + { + "epoch": 1.8, + "learning_rate": 7.28570202780851e-07, + "loss": 0.4961, + "step": 70214 + }, + { + "epoch": 1.8, + "learning_rate": 7.285435712283873e-07, + "loss": 0.7549, + "step": 70215 + }, + { + "epoch": 1.8, + "learning_rate": 7.285169398837651e-07, + "loss": 0.4469, + "step": 70216 + }, + { + "epoch": 1.8, + "learning_rate": 7.284903087470051e-07, + "loss": 0.5469, + "step": 70217 + }, + { + "epoch": 1.8, + "learning_rate": 7.284636778181275e-07, + "loss": 0.5281, + "step": 70218 + }, + { + "epoch": 1.8, + "learning_rate": 7.284370470971528e-07, + "loss": 0.7139, + "step": 70219 + }, + { + "epoch": 1.8, + "learning_rate": 7.284104165841014e-07, + "loss": 0.5718, + "step": 70220 + }, + { + "epoch": 1.8, + "learning_rate": 7.283837862789936e-07, + "loss": 0.6592, + "step": 70221 + }, + { + "epoch": 1.8, + "learning_rate": 7.283571561818502e-07, + "loss": 0.6045, + "step": 70222 + }, + { + "epoch": 1.8, + "learning_rate": 7.283305262926911e-07, + "loss": 0.5923, + "step": 70223 + }, + { + "epoch": 1.8, + "learning_rate": 7.283038966115364e-07, + "loss": 0.6909, + "step": 70224 + }, + { + "epoch": 1.8, + "learning_rate": 7.282772671384074e-07, + "loss": 0.6992, + "step": 70225 + }, + { + "epoch": 1.8, + "learning_rate": 7.282506378733236e-07, + "loss": 0.6367, + "step": 70226 + }, + { + "epoch": 1.8, + "learning_rate": 7.282240088163061e-07, + "loss": 0.6008, + "step": 70227 + }, + { + "epoch": 1.8, + "learning_rate": 7.281973799673747e-07, + "loss": 0.7676, + "step": 70228 + }, + { + "epoch": 1.8, + "learning_rate": 7.281707513265503e-07, + "loss": 0.606, + "step": 70229 + }, + { + "epoch": 1.8, + "learning_rate": 7.281441228938529e-07, + "loss": 0.8135, + "step": 70230 + }, + { + "epoch": 1.8, + "learning_rate": 7.281174946693032e-07, + "loss": 0.7036, + "step": 70231 + }, + { + "epoch": 1.8, + "learning_rate": 7.280908666529217e-07, + "loss": 0.6211, + "step": 70232 + }, + { + "epoch": 1.8, + "learning_rate": 7.28064238844728e-07, + "loss": 0.7749, + "step": 70233 + }, + { + "epoch": 1.8, + "learning_rate": 7.280376112447433e-07, + "loss": 0.595, + "step": 70234 + }, + { + "epoch": 1.8, + "learning_rate": 7.280109838529875e-07, + "loss": 0.4766, + "step": 70235 + }, + { + "epoch": 1.8, + "learning_rate": 7.279843566694812e-07, + "loss": 0.6162, + "step": 70236 + }, + { + "epoch": 1.8, + "learning_rate": 7.279577296942448e-07, + "loss": 0.5864, + "step": 70237 + }, + { + "epoch": 1.8, + "learning_rate": 7.279311029272988e-07, + "loss": 0.5989, + "step": 70238 + }, + { + "epoch": 1.8, + "learning_rate": 7.279044763686631e-07, + "loss": 0.7075, + "step": 70239 + }, + { + "epoch": 1.8, + "learning_rate": 7.278778500183589e-07, + "loss": 0.5679, + "step": 70240 + }, + { + "epoch": 1.8, + "learning_rate": 7.278512238764059e-07, + "loss": 0.6963, + "step": 70241 + }, + { + "epoch": 1.8, + "learning_rate": 7.27824597942825e-07, + "loss": 0.6748, + "step": 70242 + }, + { + "epoch": 1.8, + "learning_rate": 7.277979722176358e-07, + "loss": 0.5254, + "step": 70243 + }, + { + "epoch": 1.8, + "learning_rate": 7.277713467008595e-07, + "loss": 0.6211, + "step": 70244 + }, + { + "epoch": 1.8, + "learning_rate": 7.277447213925159e-07, + "loss": 0.6699, + "step": 70245 + }, + { + "epoch": 1.8, + "learning_rate": 7.277180962926258e-07, + "loss": 0.6846, + "step": 70246 + }, + { + "epoch": 1.8, + "learning_rate": 7.276914714012092e-07, + "loss": 0.71, + "step": 70247 + }, + { + "epoch": 1.8, + "learning_rate": 7.276648467182871e-07, + "loss": 0.6641, + "step": 70248 + }, + { + "epoch": 1.8, + "learning_rate": 7.276382222438792e-07, + "loss": 0.5249, + "step": 70249 + }, + { + "epoch": 1.8, + "learning_rate": 7.276115979780064e-07, + "loss": 0.5112, + "step": 70250 + }, + { + "epoch": 1.8, + "learning_rate": 7.275849739206887e-07, + "loss": 0.3789, + "step": 70251 + }, + { + "epoch": 1.8, + "learning_rate": 7.27558350071947e-07, + "loss": 0.5059, + "step": 70252 + }, + { + "epoch": 1.8, + "learning_rate": 7.275317264318012e-07, + "loss": 0.5933, + "step": 70253 + }, + { + "epoch": 1.8, + "learning_rate": 7.275051030002716e-07, + "loss": 0.6338, + "step": 70254 + }, + { + "epoch": 1.8, + "learning_rate": 7.27478479777379e-07, + "loss": 0.585, + "step": 70255 + }, + { + "epoch": 1.8, + "learning_rate": 7.274518567631433e-07, + "loss": 0.5864, + "step": 70256 + }, + { + "epoch": 1.8, + "learning_rate": 7.274252339575856e-07, + "loss": 0.5962, + "step": 70257 + }, + { + "epoch": 1.8, + "learning_rate": 7.273986113607256e-07, + "loss": 0.7073, + "step": 70258 + }, + { + "epoch": 1.8, + "learning_rate": 7.27371988972584e-07, + "loss": 0.4501, + "step": 70259 + }, + { + "epoch": 1.8, + "learning_rate": 7.273453667931813e-07, + "loss": 0.6743, + "step": 70260 + }, + { + "epoch": 1.8, + "learning_rate": 7.273187448225374e-07, + "loss": 0.5342, + "step": 70261 + }, + { + "epoch": 1.8, + "learning_rate": 7.272921230606734e-07, + "loss": 0.6689, + "step": 70262 + }, + { + "epoch": 1.8, + "learning_rate": 7.272655015076093e-07, + "loss": 0.4846, + "step": 70263 + }, + { + "epoch": 1.8, + "learning_rate": 7.272388801633651e-07, + "loss": 0.5918, + "step": 70264 + }, + { + "epoch": 1.8, + "learning_rate": 7.272122590279617e-07, + "loss": 0.4517, + "step": 70265 + }, + { + "epoch": 1.8, + "learning_rate": 7.271856381014192e-07, + "loss": 0.667, + "step": 70266 + }, + { + "epoch": 1.8, + "learning_rate": 7.271590173837583e-07, + "loss": 0.6421, + "step": 70267 + }, + { + "epoch": 1.8, + "learning_rate": 7.27132396874999e-07, + "loss": 0.7549, + "step": 70268 + }, + { + "epoch": 1.8, + "learning_rate": 7.27105776575162e-07, + "loss": 0.4805, + "step": 70269 + }, + { + "epoch": 1.8, + "learning_rate": 7.270791564842673e-07, + "loss": 0.5781, + "step": 70270 + }, + { + "epoch": 1.8, + "learning_rate": 7.270525366023359e-07, + "loss": 0.6289, + "step": 70271 + }, + { + "epoch": 1.8, + "learning_rate": 7.270259169293879e-07, + "loss": 0.8623, + "step": 70272 + }, + { + "epoch": 1.8, + "learning_rate": 7.269992974654434e-07, + "loss": 0.4548, + "step": 70273 + }, + { + "epoch": 1.8, + "learning_rate": 7.269726782105231e-07, + "loss": 0.6641, + "step": 70274 + }, + { + "epoch": 1.8, + "learning_rate": 7.26946059164647e-07, + "loss": 0.5771, + "step": 70275 + }, + { + "epoch": 1.8, + "learning_rate": 7.26919440327836e-07, + "loss": 0.6367, + "step": 70276 + }, + { + "epoch": 1.8, + "learning_rate": 7.268928217001102e-07, + "loss": 0.6089, + "step": 70277 + }, + { + "epoch": 1.8, + "learning_rate": 7.268662032814899e-07, + "loss": 0.667, + "step": 70278 + }, + { + "epoch": 1.8, + "learning_rate": 7.268395850719957e-07, + "loss": 0.6602, + "step": 70279 + }, + { + "epoch": 1.8, + "learning_rate": 7.268129670716477e-07, + "loss": 0.5547, + "step": 70280 + }, + { + "epoch": 1.8, + "learning_rate": 7.267863492804666e-07, + "loss": 0.543, + "step": 70281 + }, + { + "epoch": 1.8, + "learning_rate": 7.267597316984728e-07, + "loss": 0.5923, + "step": 70282 + }, + { + "epoch": 1.8, + "learning_rate": 7.267331143256863e-07, + "loss": 0.6094, + "step": 70283 + }, + { + "epoch": 1.8, + "learning_rate": 7.267064971621277e-07, + "loss": 0.7383, + "step": 70284 + }, + { + "epoch": 1.8, + "learning_rate": 7.266798802078172e-07, + "loss": 0.7783, + "step": 70285 + }, + { + "epoch": 1.8, + "learning_rate": 7.266532634627755e-07, + "loss": 0.6787, + "step": 70286 + }, + { + "epoch": 1.8, + "learning_rate": 7.266266469270228e-07, + "loss": 0.6448, + "step": 70287 + }, + { + "epoch": 1.8, + "learning_rate": 7.266000306005796e-07, + "loss": 0.4209, + "step": 70288 + }, + { + "epoch": 1.8, + "learning_rate": 7.265734144834659e-07, + "loss": 0.7607, + "step": 70289 + }, + { + "epoch": 1.8, + "learning_rate": 7.265467985757028e-07, + "loss": 0.6533, + "step": 70290 + }, + { + "epoch": 1.8, + "learning_rate": 7.265201828773097e-07, + "loss": 0.5762, + "step": 70291 + }, + { + "epoch": 1.8, + "learning_rate": 7.264935673883084e-07, + "loss": 0.6152, + "step": 70292 + }, + { + "epoch": 1.8, + "learning_rate": 7.264669521087178e-07, + "loss": 0.7725, + "step": 70293 + }, + { + "epoch": 1.8, + "learning_rate": 7.26440337038559e-07, + "loss": 0.4767, + "step": 70294 + }, + { + "epoch": 1.8, + "learning_rate": 7.264137221778521e-07, + "loss": 0.875, + "step": 70295 + }, + { + "epoch": 1.8, + "learning_rate": 7.263871075266177e-07, + "loss": 0.5073, + "step": 70296 + }, + { + "epoch": 1.8, + "learning_rate": 7.26360493084876e-07, + "loss": 0.6982, + "step": 70297 + }, + { + "epoch": 1.8, + "learning_rate": 7.263338788526477e-07, + "loss": 0.6212, + "step": 70298 + }, + { + "epoch": 1.8, + "learning_rate": 7.263072648299528e-07, + "loss": 0.3146, + "step": 70299 + }, + { + "epoch": 1.8, + "learning_rate": 7.262806510168121e-07, + "loss": 0.559, + "step": 70300 + }, + { + "epoch": 1.8, + "learning_rate": 7.262540374132453e-07, + "loss": 0.5425, + "step": 70301 + }, + { + "epoch": 1.8, + "learning_rate": 7.262274240192737e-07, + "loss": 0.6084, + "step": 70302 + }, + { + "epoch": 1.8, + "learning_rate": 7.26200810834917e-07, + "loss": 0.6602, + "step": 70303 + }, + { + "epoch": 1.8, + "learning_rate": 7.261741978601955e-07, + "loss": 0.5552, + "step": 70304 + }, + { + "epoch": 1.8, + "learning_rate": 7.261475850951301e-07, + "loss": 0.6367, + "step": 70305 + }, + { + "epoch": 1.8, + "learning_rate": 7.261209725397406e-07, + "loss": 0.5327, + "step": 70306 + }, + { + "epoch": 1.8, + "learning_rate": 7.260943601940479e-07, + "loss": 0.4844, + "step": 70307 + }, + { + "epoch": 1.8, + "learning_rate": 7.260677480580722e-07, + "loss": 0.4421, + "step": 70308 + }, + { + "epoch": 1.8, + "learning_rate": 7.260411361318337e-07, + "loss": 0.6816, + "step": 70309 + }, + { + "epoch": 1.8, + "learning_rate": 7.260145244153528e-07, + "loss": 0.6064, + "step": 70310 + }, + { + "epoch": 1.8, + "learning_rate": 7.259879129086503e-07, + "loss": 0.6353, + "step": 70311 + }, + { + "epoch": 1.8, + "learning_rate": 7.259613016117463e-07, + "loss": 0.6538, + "step": 70312 + }, + { + "epoch": 1.8, + "learning_rate": 7.259346905246611e-07, + "loss": 0.6807, + "step": 70313 + }, + { + "epoch": 1.8, + "learning_rate": 7.259080796474146e-07, + "loss": 0.8154, + "step": 70314 + }, + { + "epoch": 1.8, + "learning_rate": 7.258814689800281e-07, + "loss": 0.6421, + "step": 70315 + }, + { + "epoch": 1.8, + "learning_rate": 7.258548585225214e-07, + "loss": 0.5225, + "step": 70316 + }, + { + "epoch": 1.8, + "learning_rate": 7.258282482749152e-07, + "loss": 0.4937, + "step": 70317 + }, + { + "epoch": 1.8, + "learning_rate": 7.258016382372294e-07, + "loss": 0.5334, + "step": 70318 + }, + { + "epoch": 1.8, + "learning_rate": 7.25775028409485e-07, + "loss": 0.5312, + "step": 70319 + }, + { + "epoch": 1.8, + "learning_rate": 7.257484187917018e-07, + "loss": 0.6597, + "step": 70320 + }, + { + "epoch": 1.8, + "learning_rate": 7.257218093839005e-07, + "loss": 0.7148, + "step": 70321 + }, + { + "epoch": 1.8, + "learning_rate": 7.256952001861019e-07, + "loss": 0.6748, + "step": 70322 + }, + { + "epoch": 1.8, + "learning_rate": 7.256685911983252e-07, + "loss": 0.8379, + "step": 70323 + }, + { + "epoch": 1.8, + "learning_rate": 7.256419824205917e-07, + "loss": 0.5608, + "step": 70324 + }, + { + "epoch": 1.8, + "learning_rate": 7.256153738529214e-07, + "loss": 0.6357, + "step": 70325 + }, + { + "epoch": 1.8, + "learning_rate": 7.25588765495335e-07, + "loss": 0.4661, + "step": 70326 + }, + { + "epoch": 1.8, + "learning_rate": 7.255621573478523e-07, + "loss": 0.4341, + "step": 70327 + }, + { + "epoch": 1.8, + "learning_rate": 7.255355494104945e-07, + "loss": 0.4458, + "step": 70328 + }, + { + "epoch": 1.8, + "learning_rate": 7.255089416832812e-07, + "loss": 0.7734, + "step": 70329 + }, + { + "epoch": 1.8, + "learning_rate": 7.25482334166233e-07, + "loss": 0.4089, + "step": 70330 + }, + { + "epoch": 1.8, + "learning_rate": 7.254557268593707e-07, + "loss": 0.6294, + "step": 70331 + }, + { + "epoch": 1.8, + "learning_rate": 7.254291197627145e-07, + "loss": 0.463, + "step": 70332 + }, + { + "epoch": 1.8, + "learning_rate": 7.25402512876284e-07, + "loss": 0.6572, + "step": 70333 + }, + { + "epoch": 1.8, + "learning_rate": 7.253759062001005e-07, + "loss": 0.6943, + "step": 70334 + }, + { + "epoch": 1.8, + "learning_rate": 7.253492997341839e-07, + "loss": 0.7803, + "step": 70335 + }, + { + "epoch": 1.8, + "learning_rate": 7.253226934785548e-07, + "loss": 0.5537, + "step": 70336 + }, + { + "epoch": 1.8, + "learning_rate": 7.252960874332335e-07, + "loss": 0.5028, + "step": 70337 + }, + { + "epoch": 1.8, + "learning_rate": 7.252694815982403e-07, + "loss": 0.4043, + "step": 70338 + }, + { + "epoch": 1.8, + "learning_rate": 7.252428759735955e-07, + "loss": 0.6758, + "step": 70339 + }, + { + "epoch": 1.8, + "learning_rate": 7.252162705593198e-07, + "loss": 0.553, + "step": 70340 + }, + { + "epoch": 1.8, + "learning_rate": 7.251896653554336e-07, + "loss": 0.6562, + "step": 70341 + }, + { + "epoch": 1.8, + "learning_rate": 7.251630603619566e-07, + "loss": 0.5542, + "step": 70342 + }, + { + "epoch": 1.8, + "learning_rate": 7.251364555789098e-07, + "loss": 0.5442, + "step": 70343 + }, + { + "epoch": 1.8, + "learning_rate": 7.251098510063131e-07, + "loss": 0.7505, + "step": 70344 + }, + { + "epoch": 1.8, + "learning_rate": 7.250832466441876e-07, + "loss": 0.5962, + "step": 70345 + }, + { + "epoch": 1.8, + "learning_rate": 7.250566424925528e-07, + "loss": 0.5608, + "step": 70346 + }, + { + "epoch": 1.8, + "learning_rate": 7.250300385514296e-07, + "loss": 0.5674, + "step": 70347 + }, + { + "epoch": 1.8, + "learning_rate": 7.250034348208383e-07, + "loss": 0.5693, + "step": 70348 + }, + { + "epoch": 1.8, + "learning_rate": 7.249768313007994e-07, + "loss": 0.7178, + "step": 70349 + }, + { + "epoch": 1.8, + "learning_rate": 7.249502279913329e-07, + "loss": 0.5615, + "step": 70350 + }, + { + "epoch": 1.8, + "learning_rate": 7.249236248924597e-07, + "loss": 0.6091, + "step": 70351 + }, + { + "epoch": 1.8, + "learning_rate": 7.248970220041994e-07, + "loss": 0.6646, + "step": 70352 + }, + { + "epoch": 1.8, + "learning_rate": 7.248704193265731e-07, + "loss": 0.666, + "step": 70353 + }, + { + "epoch": 1.8, + "learning_rate": 7.248438168596005e-07, + "loss": 0.6147, + "step": 70354 + }, + { + "epoch": 1.8, + "learning_rate": 7.248172146033027e-07, + "loss": 0.6807, + "step": 70355 + }, + { + "epoch": 1.8, + "learning_rate": 7.247906125576995e-07, + "loss": 0.7109, + "step": 70356 + }, + { + "epoch": 1.8, + "learning_rate": 7.247640107228115e-07, + "loss": 0.751, + "step": 70357 + }, + { + "epoch": 1.8, + "learning_rate": 7.247374090986589e-07, + "loss": 0.6543, + "step": 70358 + }, + { + "epoch": 1.8, + "learning_rate": 7.247108076852625e-07, + "loss": 0.6782, + "step": 70359 + }, + { + "epoch": 1.8, + "learning_rate": 7.246842064826421e-07, + "loss": 0.7378, + "step": 70360 + }, + { + "epoch": 1.8, + "learning_rate": 7.246576054908188e-07, + "loss": 0.5308, + "step": 70361 + }, + { + "epoch": 1.8, + "learning_rate": 7.246310047098123e-07, + "loss": 0.4829, + "step": 70362 + }, + { + "epoch": 1.8, + "learning_rate": 7.246044041396429e-07, + "loss": 0.4998, + "step": 70363 + }, + { + "epoch": 1.8, + "learning_rate": 7.245778037803316e-07, + "loss": 0.5698, + "step": 70364 + }, + { + "epoch": 1.8, + "learning_rate": 7.245512036318982e-07, + "loss": 0.6128, + "step": 70365 + }, + { + "epoch": 1.8, + "learning_rate": 7.245246036943633e-07, + "loss": 0.8086, + "step": 70366 + }, + { + "epoch": 1.8, + "learning_rate": 7.244980039677473e-07, + "loss": 0.6162, + "step": 70367 + }, + { + "epoch": 1.8, + "learning_rate": 7.244714044520703e-07, + "loss": 0.752, + "step": 70368 + }, + { + "epoch": 1.8, + "learning_rate": 7.244448051473531e-07, + "loss": 0.6997, + "step": 70369 + }, + { + "epoch": 1.8, + "learning_rate": 7.244182060536157e-07, + "loss": 0.7466, + "step": 70370 + }, + { + "epoch": 1.8, + "learning_rate": 7.243916071708791e-07, + "loss": 0.5898, + "step": 70371 + }, + { + "epoch": 1.8, + "learning_rate": 7.243650084991628e-07, + "loss": 0.5559, + "step": 70372 + }, + { + "epoch": 1.8, + "learning_rate": 7.243384100384873e-07, + "loss": 0.8076, + "step": 70373 + }, + { + "epoch": 1.8, + "learning_rate": 7.243118117888736e-07, + "loss": 0.5127, + "step": 70374 + }, + { + "epoch": 1.8, + "learning_rate": 7.242852137503412e-07, + "loss": 0.6934, + "step": 70375 + }, + { + "epoch": 1.8, + "learning_rate": 7.242586159229113e-07, + "loss": 0.6992, + "step": 70376 + }, + { + "epoch": 1.8, + "learning_rate": 7.242320183066038e-07, + "loss": 0.6455, + "step": 70377 + }, + { + "epoch": 1.8, + "learning_rate": 7.242054209014392e-07, + "loss": 0.7036, + "step": 70378 + }, + { + "epoch": 1.8, + "learning_rate": 7.241788237074377e-07, + "loss": 0.7773, + "step": 70379 + }, + { + "epoch": 1.8, + "learning_rate": 7.241522267246201e-07, + "loss": 0.572, + "step": 70380 + }, + { + "epoch": 1.8, + "learning_rate": 7.241256299530065e-07, + "loss": 0.3828, + "step": 70381 + }, + { + "epoch": 1.8, + "learning_rate": 7.240990333926168e-07, + "loss": 0.7095, + "step": 70382 + }, + { + "epoch": 1.8, + "learning_rate": 7.240724370434721e-07, + "loss": 0.4741, + "step": 70383 + }, + { + "epoch": 1.8, + "learning_rate": 7.240458409055923e-07, + "loss": 0.8047, + "step": 70384 + }, + { + "epoch": 1.8, + "learning_rate": 7.240192449789979e-07, + "loss": 0.7432, + "step": 70385 + }, + { + "epoch": 1.8, + "learning_rate": 7.239926492637094e-07, + "loss": 0.6934, + "step": 70386 + }, + { + "epoch": 1.8, + "learning_rate": 7.239660537597467e-07, + "loss": 0.8896, + "step": 70387 + }, + { + "epoch": 1.8, + "learning_rate": 7.239394584671308e-07, + "loss": 0.4351, + "step": 70388 + }, + { + "epoch": 1.8, + "learning_rate": 7.239128633858816e-07, + "loss": 0.3593, + "step": 70389 + }, + { + "epoch": 1.8, + "learning_rate": 7.238862685160199e-07, + "loss": 0.6172, + "step": 70390 + }, + { + "epoch": 1.8, + "learning_rate": 7.238596738575657e-07, + "loss": 0.7861, + "step": 70391 + }, + { + "epoch": 1.8, + "learning_rate": 7.238330794105394e-07, + "loss": 0.6689, + "step": 70392 + }, + { + "epoch": 1.8, + "learning_rate": 7.238064851749614e-07, + "loss": 0.7305, + "step": 70393 + }, + { + "epoch": 1.8, + "learning_rate": 7.237798911508519e-07, + "loss": 0.4209, + "step": 70394 + }, + { + "epoch": 1.8, + "learning_rate": 7.237532973382316e-07, + "loss": 0.4961, + "step": 70395 + }, + { + "epoch": 1.8, + "learning_rate": 7.237267037371206e-07, + "loss": 0.7505, + "step": 70396 + }, + { + "epoch": 1.8, + "learning_rate": 7.237001103475396e-07, + "loss": 0.6904, + "step": 70397 + }, + { + "epoch": 1.8, + "learning_rate": 7.236735171695084e-07, + "loss": 0.4932, + "step": 70398 + }, + { + "epoch": 1.8, + "learning_rate": 7.236469242030479e-07, + "loss": 0.6211, + "step": 70399 + }, + { + "epoch": 1.8, + "learning_rate": 7.23620331448178e-07, + "loss": 0.6465, + "step": 70400 + }, + { + "epoch": 1.8, + "learning_rate": 7.2359373890492e-07, + "loss": 0.7695, + "step": 70401 + }, + { + "epoch": 1.8, + "learning_rate": 7.23567146573293e-07, + "loss": 0.6396, + "step": 70402 + }, + { + "epoch": 1.8, + "learning_rate": 7.235405544533179e-07, + "loss": 0.6211, + "step": 70403 + }, + { + "epoch": 1.8, + "learning_rate": 7.235139625450152e-07, + "loss": 0.6514, + "step": 70404 + }, + { + "epoch": 1.8, + "learning_rate": 7.234873708484052e-07, + "loss": 0.708, + "step": 70405 + }, + { + "epoch": 1.8, + "learning_rate": 7.23460779363508e-07, + "loss": 0.6523, + "step": 70406 + }, + { + "epoch": 1.8, + "learning_rate": 7.234341880903443e-07, + "loss": 0.5488, + "step": 70407 + }, + { + "epoch": 1.8, + "learning_rate": 7.234075970289342e-07, + "loss": 0.5967, + "step": 70408 + }, + { + "epoch": 1.8, + "learning_rate": 7.233810061792984e-07, + "loss": 0.5234, + "step": 70409 + }, + { + "epoch": 1.8, + "learning_rate": 7.233544155414569e-07, + "loss": 0.45, + "step": 70410 + }, + { + "epoch": 1.8, + "learning_rate": 7.233278251154304e-07, + "loss": 0.6699, + "step": 70411 + }, + { + "epoch": 1.8, + "learning_rate": 7.23301234901239e-07, + "loss": 0.54, + "step": 70412 + }, + { + "epoch": 1.8, + "learning_rate": 7.232746448989029e-07, + "loss": 0.6787, + "step": 70413 + }, + { + "epoch": 1.8, + "learning_rate": 7.232480551084428e-07, + "loss": 0.6768, + "step": 70414 + }, + { + "epoch": 1.8, + "learning_rate": 7.232214655298789e-07, + "loss": 0.7402, + "step": 70415 + }, + { + "epoch": 1.8, + "learning_rate": 7.231948761632317e-07, + "loss": 0.533, + "step": 70416 + }, + { + "epoch": 1.8, + "learning_rate": 7.231682870085212e-07, + "loss": 0.604, + "step": 70417 + }, + { + "epoch": 1.8, + "learning_rate": 7.231416980657683e-07, + "loss": 0.5747, + "step": 70418 + }, + { + "epoch": 1.8, + "learning_rate": 7.231151093349928e-07, + "loss": 0.6001, + "step": 70419 + }, + { + "epoch": 1.8, + "learning_rate": 7.230885208162156e-07, + "loss": 0.6592, + "step": 70420 + }, + { + "epoch": 1.8, + "learning_rate": 7.230619325094572e-07, + "loss": 0.5146, + "step": 70421 + }, + { + "epoch": 1.8, + "learning_rate": 7.23035344414737e-07, + "loss": 0.5527, + "step": 70422 + }, + { + "epoch": 1.8, + "learning_rate": 7.230087565320758e-07, + "loss": 0.3786, + "step": 70423 + }, + { + "epoch": 1.81, + "learning_rate": 7.229821688614943e-07, + "loss": 0.5723, + "step": 70424 + }, + { + "epoch": 1.81, + "learning_rate": 7.229555814030124e-07, + "loss": 0.5703, + "step": 70425 + }, + { + "epoch": 1.81, + "learning_rate": 7.229289941566508e-07, + "loss": 0.623, + "step": 70426 + }, + { + "epoch": 1.81, + "learning_rate": 7.229024071224297e-07, + "loss": 0.3494, + "step": 70427 + }, + { + "epoch": 1.81, + "learning_rate": 7.228758203003695e-07, + "loss": 0.709, + "step": 70428 + }, + { + "epoch": 1.81, + "learning_rate": 7.228492336904904e-07, + "loss": 0.8096, + "step": 70429 + }, + { + "epoch": 1.81, + "learning_rate": 7.228226472928131e-07, + "loss": 0.5181, + "step": 70430 + }, + { + "epoch": 1.81, + "learning_rate": 7.22796061107358e-07, + "loss": 0.6621, + "step": 70431 + }, + { + "epoch": 1.81, + "learning_rate": 7.227694751341448e-07, + "loss": 0.7588, + "step": 70432 + }, + { + "epoch": 1.81, + "learning_rate": 7.227428893731945e-07, + "loss": 0.5168, + "step": 70433 + }, + { + "epoch": 1.81, + "learning_rate": 7.22716303824527e-07, + "loss": 0.665, + "step": 70434 + }, + { + "epoch": 1.81, + "learning_rate": 7.22689718488163e-07, + "loss": 0.5645, + "step": 70435 + }, + { + "epoch": 1.81, + "learning_rate": 7.226631333641227e-07, + "loss": 0.582, + "step": 70436 + }, + { + "epoch": 1.81, + "learning_rate": 7.226365484524264e-07, + "loss": 0.6562, + "step": 70437 + }, + { + "epoch": 1.81, + "learning_rate": 7.226099637530946e-07, + "loss": 0.645, + "step": 70438 + }, + { + "epoch": 1.81, + "learning_rate": 7.225833792661476e-07, + "loss": 0.7383, + "step": 70439 + }, + { + "epoch": 1.81, + "learning_rate": 7.22556794991606e-07, + "loss": 0.6606, + "step": 70440 + }, + { + "epoch": 1.81, + "learning_rate": 7.2253021092949e-07, + "loss": 0.6611, + "step": 70441 + }, + { + "epoch": 1.81, + "learning_rate": 7.225036270798193e-07, + "loss": 0.5408, + "step": 70442 + }, + { + "epoch": 1.81, + "learning_rate": 7.224770434426152e-07, + "loss": 0.6846, + "step": 70443 + }, + { + "epoch": 1.81, + "learning_rate": 7.224504600178973e-07, + "loss": 0.5349, + "step": 70444 + }, + { + "epoch": 1.81, + "learning_rate": 7.224238768056867e-07, + "loss": 0.7139, + "step": 70445 + }, + { + "epoch": 1.81, + "learning_rate": 7.22397293806003e-07, + "loss": 0.6641, + "step": 70446 + }, + { + "epoch": 1.81, + "learning_rate": 7.223707110188672e-07, + "loss": 0.5217, + "step": 70447 + }, + { + "epoch": 1.81, + "learning_rate": 7.223441284442992e-07, + "loss": 0.5918, + "step": 70448 + }, + { + "epoch": 1.81, + "learning_rate": 7.223175460823199e-07, + "loss": 0.54, + "step": 70449 + }, + { + "epoch": 1.81, + "learning_rate": 7.222909639329489e-07, + "loss": 0.5923, + "step": 70450 + }, + { + "epoch": 1.81, + "learning_rate": 7.222643819962073e-07, + "loss": 0.6367, + "step": 70451 + }, + { + "epoch": 1.81, + "learning_rate": 7.22237800272115e-07, + "loss": 0.6089, + "step": 70452 + }, + { + "epoch": 1.81, + "learning_rate": 7.222112187606921e-07, + "loss": 0.6787, + "step": 70453 + }, + { + "epoch": 1.81, + "learning_rate": 7.221846374619597e-07, + "loss": 0.6494, + "step": 70454 + }, + { + "epoch": 1.81, + "learning_rate": 7.221580563759374e-07, + "loss": 0.5967, + "step": 70455 + }, + { + "epoch": 1.81, + "learning_rate": 7.221314755026462e-07, + "loss": 0.5151, + "step": 70456 + }, + { + "epoch": 1.81, + "learning_rate": 7.22104894842106e-07, + "loss": 0.5628, + "step": 70457 + }, + { + "epoch": 1.81, + "learning_rate": 7.220783143943372e-07, + "loss": 0.6602, + "step": 70458 + }, + { + "epoch": 1.81, + "learning_rate": 7.220517341593605e-07, + "loss": 0.6621, + "step": 70459 + }, + { + "epoch": 1.81, + "learning_rate": 7.220251541371957e-07, + "loss": 0.6675, + "step": 70460 + }, + { + "epoch": 1.81, + "learning_rate": 7.219985743278641e-07, + "loss": 0.7412, + "step": 70461 + }, + { + "epoch": 1.81, + "learning_rate": 7.21971994731385e-07, + "loss": 0.5845, + "step": 70462 + }, + { + "epoch": 1.81, + "learning_rate": 7.219454153477788e-07, + "loss": 0.6296, + "step": 70463 + }, + { + "epoch": 1.81, + "learning_rate": 7.219188361770667e-07, + "loss": 0.6436, + "step": 70464 + }, + { + "epoch": 1.81, + "learning_rate": 7.218922572192682e-07, + "loss": 0.6118, + "step": 70465 + }, + { + "epoch": 1.81, + "learning_rate": 7.218656784744043e-07, + "loss": 0.7305, + "step": 70466 + }, + { + "epoch": 1.81, + "learning_rate": 7.218390999424948e-07, + "loss": 0.6426, + "step": 70467 + }, + { + "epoch": 1.81, + "learning_rate": 7.218125216235607e-07, + "loss": 0.5225, + "step": 70468 + }, + { + "epoch": 1.81, + "learning_rate": 7.217859435176215e-07, + "loss": 0.8086, + "step": 70469 + }, + { + "epoch": 1.81, + "learning_rate": 7.217593656246983e-07, + "loss": 0.5449, + "step": 70470 + }, + { + "epoch": 1.81, + "learning_rate": 7.217327879448114e-07, + "loss": 0.6104, + "step": 70471 + }, + { + "epoch": 1.81, + "learning_rate": 7.217062104779806e-07, + "loss": 0.5986, + "step": 70472 + }, + { + "epoch": 1.81, + "learning_rate": 7.216796332242265e-07, + "loss": 0.79, + "step": 70473 + }, + { + "epoch": 1.81, + "learning_rate": 7.216530561835696e-07, + "loss": 0.6865, + "step": 70474 + }, + { + "epoch": 1.81, + "learning_rate": 7.216264793560301e-07, + "loss": 0.6431, + "step": 70475 + }, + { + "epoch": 1.81, + "learning_rate": 7.215999027416286e-07, + "loss": 0.5957, + "step": 70476 + }, + { + "epoch": 1.81, + "learning_rate": 7.21573326340385e-07, + "loss": 0.623, + "step": 70477 + }, + { + "epoch": 1.81, + "learning_rate": 7.2154675015232e-07, + "loss": 0.5835, + "step": 70478 + }, + { + "epoch": 1.81, + "learning_rate": 7.215201741774537e-07, + "loss": 0.5369, + "step": 70479 + }, + { + "epoch": 1.81, + "learning_rate": 7.214935984158068e-07, + "loss": 0.7373, + "step": 70480 + }, + { + "epoch": 1.81, + "learning_rate": 7.214670228673995e-07, + "loss": 0.8545, + "step": 70481 + }, + { + "epoch": 1.81, + "learning_rate": 7.21440447532252e-07, + "loss": 0.6079, + "step": 70482 + }, + { + "epoch": 1.81, + "learning_rate": 7.214138724103848e-07, + "loss": 0.5986, + "step": 70483 + }, + { + "epoch": 1.81, + "learning_rate": 7.213872975018181e-07, + "loss": 0.6094, + "step": 70484 + }, + { + "epoch": 1.81, + "learning_rate": 7.213607228065723e-07, + "loss": 0.6655, + "step": 70485 + }, + { + "epoch": 1.81, + "learning_rate": 7.213341483246677e-07, + "loss": 0.6572, + "step": 70486 + }, + { + "epoch": 1.81, + "learning_rate": 7.21307574056125e-07, + "loss": 0.5273, + "step": 70487 + }, + { + "epoch": 1.81, + "learning_rate": 7.212810000009639e-07, + "loss": 0.6572, + "step": 70488 + }, + { + "epoch": 1.81, + "learning_rate": 7.212544261592055e-07, + "loss": 0.6543, + "step": 70489 + }, + { + "epoch": 1.81, + "learning_rate": 7.212278525308695e-07, + "loss": 0.5771, + "step": 70490 + }, + { + "epoch": 1.81, + "learning_rate": 7.212012791159771e-07, + "loss": 0.7344, + "step": 70491 + }, + { + "epoch": 1.81, + "learning_rate": 7.211747059145474e-07, + "loss": 0.6709, + "step": 70492 + }, + { + "epoch": 1.81, + "learning_rate": 7.211481329266017e-07, + "loss": 0.6099, + "step": 70493 + }, + { + "epoch": 1.81, + "learning_rate": 7.211215601521599e-07, + "loss": 0.7002, + "step": 70494 + }, + { + "epoch": 1.81, + "learning_rate": 7.210949875912426e-07, + "loss": 0.793, + "step": 70495 + }, + { + "epoch": 1.81, + "learning_rate": 7.210684152438698e-07, + "loss": 0.5693, + "step": 70496 + }, + { + "epoch": 1.81, + "learning_rate": 7.210418431100624e-07, + "loss": 0.5571, + "step": 70497 + }, + { + "epoch": 1.81, + "learning_rate": 7.210152711898402e-07, + "loss": 0.6016, + "step": 70498 + }, + { + "epoch": 1.81, + "learning_rate": 7.20988699483224e-07, + "loss": 0.4774, + "step": 70499 + }, + { + "epoch": 1.81, + "learning_rate": 7.209621279902336e-07, + "loss": 0.5492, + "step": 70500 + }, + { + "epoch": 1.81, + "learning_rate": 7.209355567108903e-07, + "loss": 0.5952, + "step": 70501 + }, + { + "epoch": 1.81, + "learning_rate": 7.209089856452134e-07, + "loss": 0.5596, + "step": 70502 + }, + { + "epoch": 1.81, + "learning_rate": 7.208824147932235e-07, + "loss": 0.5254, + "step": 70503 + }, + { + "epoch": 1.81, + "learning_rate": 7.208558441549414e-07, + "loss": 0.7637, + "step": 70504 + }, + { + "epoch": 1.81, + "learning_rate": 7.208292737303869e-07, + "loss": 0.7012, + "step": 70505 + }, + { + "epoch": 1.81, + "learning_rate": 7.208027035195807e-07, + "loss": 0.7646, + "step": 70506 + }, + { + "epoch": 1.81, + "learning_rate": 7.20776133522543e-07, + "loss": 0.3984, + "step": 70507 + }, + { + "epoch": 1.81, + "learning_rate": 7.207495637392942e-07, + "loss": 0.3967, + "step": 70508 + }, + { + "epoch": 1.81, + "learning_rate": 7.207229941698545e-07, + "loss": 0.3989, + "step": 70509 + }, + { + "epoch": 1.81, + "learning_rate": 7.206964248142446e-07, + "loss": 0.7075, + "step": 70510 + }, + { + "epoch": 1.81, + "learning_rate": 7.206698556724847e-07, + "loss": 0.6719, + "step": 70511 + }, + { + "epoch": 1.81, + "learning_rate": 7.206432867445949e-07, + "loss": 0.5649, + "step": 70512 + }, + { + "epoch": 1.81, + "learning_rate": 7.206167180305956e-07, + "loss": 0.4865, + "step": 70513 + }, + { + "epoch": 1.81, + "learning_rate": 7.205901495305073e-07, + "loss": 0.6094, + "step": 70514 + }, + { + "epoch": 1.81, + "learning_rate": 7.2056358124435e-07, + "loss": 0.2463, + "step": 70515 + }, + { + "epoch": 1.81, + "learning_rate": 7.205370131721447e-07, + "loss": 0.7607, + "step": 70516 + }, + { + "epoch": 1.81, + "learning_rate": 7.205104453139111e-07, + "loss": 0.562, + "step": 70517 + }, + { + "epoch": 1.81, + "learning_rate": 7.2048387766967e-07, + "loss": 0.7314, + "step": 70518 + }, + { + "epoch": 1.81, + "learning_rate": 7.204573102394414e-07, + "loss": 0.6956, + "step": 70519 + }, + { + "epoch": 1.81, + "learning_rate": 7.204307430232458e-07, + "loss": 0.4785, + "step": 70520 + }, + { + "epoch": 1.81, + "learning_rate": 7.20404176021104e-07, + "loss": 0.5996, + "step": 70521 + }, + { + "epoch": 1.81, + "learning_rate": 7.203776092330352e-07, + "loss": 0.5874, + "step": 70522 + }, + { + "epoch": 1.81, + "learning_rate": 7.203510426590606e-07, + "loss": 0.6206, + "step": 70523 + }, + { + "epoch": 1.81, + "learning_rate": 7.203244762992004e-07, + "loss": 0.5649, + "step": 70524 + }, + { + "epoch": 1.81, + "learning_rate": 7.20297910153475e-07, + "loss": 0.5977, + "step": 70525 + }, + { + "epoch": 1.81, + "learning_rate": 7.202713442219042e-07, + "loss": 0.6475, + "step": 70526 + }, + { + "epoch": 1.81, + "learning_rate": 7.202447785045091e-07, + "loss": 0.6572, + "step": 70527 + }, + { + "epoch": 1.81, + "learning_rate": 7.202182130013097e-07, + "loss": 0.5679, + "step": 70528 + }, + { + "epoch": 1.81, + "learning_rate": 7.201916477123264e-07, + "loss": 0.4874, + "step": 70529 + }, + { + "epoch": 1.81, + "learning_rate": 7.201650826375795e-07, + "loss": 0.7183, + "step": 70530 + }, + { + "epoch": 1.81, + "learning_rate": 7.201385177770896e-07, + "loss": 0.707, + "step": 70531 + }, + { + "epoch": 1.81, + "learning_rate": 7.201119531308762e-07, + "loss": 0.4204, + "step": 70532 + }, + { + "epoch": 1.81, + "learning_rate": 7.200853886989604e-07, + "loss": 0.5405, + "step": 70533 + }, + { + "epoch": 1.81, + "learning_rate": 7.200588244813624e-07, + "loss": 0.6436, + "step": 70534 + }, + { + "epoch": 1.81, + "learning_rate": 7.200322604781024e-07, + "loss": 0.6831, + "step": 70535 + }, + { + "epoch": 1.81, + "learning_rate": 7.200056966892007e-07, + "loss": 0.4932, + "step": 70536 + }, + { + "epoch": 1.81, + "learning_rate": 7.199791331146781e-07, + "loss": 0.6406, + "step": 70537 + }, + { + "epoch": 1.81, + "learning_rate": 7.199525697545543e-07, + "loss": 0.7803, + "step": 70538 + }, + { + "epoch": 1.81, + "learning_rate": 7.199260066088501e-07, + "loss": 0.7109, + "step": 70539 + }, + { + "epoch": 1.81, + "learning_rate": 7.198994436775856e-07, + "loss": 0.5991, + "step": 70540 + }, + { + "epoch": 1.81, + "learning_rate": 7.198728809607817e-07, + "loss": 0.5745, + "step": 70541 + }, + { + "epoch": 1.81, + "learning_rate": 7.198463184584578e-07, + "loss": 0.7451, + "step": 70542 + }, + { + "epoch": 1.81, + "learning_rate": 7.198197561706346e-07, + "loss": 0.5581, + "step": 70543 + }, + { + "epoch": 1.81, + "learning_rate": 7.197931940973327e-07, + "loss": 0.5562, + "step": 70544 + }, + { + "epoch": 1.81, + "learning_rate": 7.197666322385722e-07, + "loss": 0.4834, + "step": 70545 + }, + { + "epoch": 1.81, + "learning_rate": 7.197400705943736e-07, + "loss": 0.5317, + "step": 70546 + }, + { + "epoch": 1.81, + "learning_rate": 7.197135091647572e-07, + "loss": 0.8203, + "step": 70547 + }, + { + "epoch": 1.81, + "learning_rate": 7.196869479497429e-07, + "loss": 0.5415, + "step": 70548 + }, + { + "epoch": 1.81, + "learning_rate": 7.196603869493518e-07, + "loss": 0.5586, + "step": 70549 + }, + { + "epoch": 1.81, + "learning_rate": 7.196338261636036e-07, + "loss": 0.5227, + "step": 70550 + }, + { + "epoch": 1.81, + "learning_rate": 7.196072655925193e-07, + "loss": 0.6348, + "step": 70551 + }, + { + "epoch": 1.81, + "learning_rate": 7.195807052361185e-07, + "loss": 0.6677, + "step": 70552 + }, + { + "epoch": 1.81, + "learning_rate": 7.195541450944218e-07, + "loss": 0.6875, + "step": 70553 + }, + { + "epoch": 1.81, + "learning_rate": 7.195275851674498e-07, + "loss": 0.5217, + "step": 70554 + }, + { + "epoch": 1.81, + "learning_rate": 7.195010254552224e-07, + "loss": 0.6172, + "step": 70555 + }, + { + "epoch": 1.81, + "learning_rate": 7.194744659577602e-07, + "loss": 0.7598, + "step": 70556 + }, + { + "epoch": 1.81, + "learning_rate": 7.194479066750836e-07, + "loss": 0.4719, + "step": 70557 + }, + { + "epoch": 1.81, + "learning_rate": 7.194213476072128e-07, + "loss": 0.5989, + "step": 70558 + }, + { + "epoch": 1.81, + "learning_rate": 7.193947887541682e-07, + "loss": 0.5718, + "step": 70559 + }, + { + "epoch": 1.81, + "learning_rate": 7.193682301159701e-07, + "loss": 0.749, + "step": 70560 + }, + { + "epoch": 1.81, + "learning_rate": 7.193416716926392e-07, + "loss": 0.644, + "step": 70561 + }, + { + "epoch": 1.81, + "learning_rate": 7.193151134841951e-07, + "loss": 0.6567, + "step": 70562 + }, + { + "epoch": 1.81, + "learning_rate": 7.192885554906585e-07, + "loss": 0.6367, + "step": 70563 + }, + { + "epoch": 1.81, + "learning_rate": 7.192619977120497e-07, + "loss": 0.6543, + "step": 70564 + }, + { + "epoch": 1.81, + "learning_rate": 7.192354401483891e-07, + "loss": 0.6729, + "step": 70565 + }, + { + "epoch": 1.81, + "learning_rate": 7.192088827996971e-07, + "loss": 0.7451, + "step": 70566 + }, + { + "epoch": 1.81, + "learning_rate": 7.191823256659939e-07, + "loss": 0.665, + "step": 70567 + }, + { + "epoch": 1.81, + "learning_rate": 7.191557687473e-07, + "loss": 0.5188, + "step": 70568 + }, + { + "epoch": 1.81, + "learning_rate": 7.191292120436354e-07, + "loss": 0.6421, + "step": 70569 + }, + { + "epoch": 1.81, + "learning_rate": 7.191026555550208e-07, + "loss": 0.5767, + "step": 70570 + }, + { + "epoch": 1.81, + "learning_rate": 7.190760992814766e-07, + "loss": 0.6885, + "step": 70571 + }, + { + "epoch": 1.81, + "learning_rate": 7.190495432230226e-07, + "loss": 0.8438, + "step": 70572 + }, + { + "epoch": 1.81, + "learning_rate": 7.190229873796796e-07, + "loss": 0.5117, + "step": 70573 + }, + { + "epoch": 1.81, + "learning_rate": 7.189964317514675e-07, + "loss": 0.8115, + "step": 70574 + }, + { + "epoch": 1.81, + "learning_rate": 7.189698763384071e-07, + "loss": 0.6777, + "step": 70575 + }, + { + "epoch": 1.81, + "learning_rate": 7.189433211405185e-07, + "loss": 0.5713, + "step": 70576 + }, + { + "epoch": 1.81, + "learning_rate": 7.189167661578222e-07, + "loss": 0.624, + "step": 70577 + }, + { + "epoch": 1.81, + "learning_rate": 7.188902113903382e-07, + "loss": 0.6719, + "step": 70578 + }, + { + "epoch": 1.81, + "learning_rate": 7.188636568380872e-07, + "loss": 0.6738, + "step": 70579 + }, + { + "epoch": 1.81, + "learning_rate": 7.188371025010891e-07, + "loss": 0.7695, + "step": 70580 + }, + { + "epoch": 1.81, + "learning_rate": 7.188105483793653e-07, + "loss": 0.8086, + "step": 70581 + }, + { + "epoch": 1.81, + "learning_rate": 7.187839944729347e-07, + "loss": 0.7324, + "step": 70582 + }, + { + "epoch": 1.81, + "learning_rate": 7.187574407818184e-07, + "loss": 0.7412, + "step": 70583 + }, + { + "epoch": 1.81, + "learning_rate": 7.187308873060364e-07, + "loss": 0.5605, + "step": 70584 + }, + { + "epoch": 1.81, + "learning_rate": 7.187043340456094e-07, + "loss": 0.6533, + "step": 70585 + }, + { + "epoch": 1.81, + "learning_rate": 7.186777810005573e-07, + "loss": 0.5824, + "step": 70586 + }, + { + "epoch": 1.81, + "learning_rate": 7.186512281709011e-07, + "loss": 0.5659, + "step": 70587 + }, + { + "epoch": 1.81, + "learning_rate": 7.186246755566602e-07, + "loss": 0.6924, + "step": 70588 + }, + { + "epoch": 1.81, + "learning_rate": 7.18598123157856e-07, + "loss": 0.8564, + "step": 70589 + }, + { + "epoch": 1.81, + "learning_rate": 7.185715709745079e-07, + "loss": 0.7275, + "step": 70590 + }, + { + "epoch": 1.81, + "learning_rate": 7.185450190066372e-07, + "loss": 0.5757, + "step": 70591 + }, + { + "epoch": 1.81, + "learning_rate": 7.185184672542631e-07, + "loss": 0.5713, + "step": 70592 + }, + { + "epoch": 1.81, + "learning_rate": 7.184919157174064e-07, + "loss": 0.6313, + "step": 70593 + }, + { + "epoch": 1.81, + "learning_rate": 7.184653643960878e-07, + "loss": 0.4771, + "step": 70594 + }, + { + "epoch": 1.81, + "learning_rate": 7.18438813290327e-07, + "loss": 0.5166, + "step": 70595 + }, + { + "epoch": 1.81, + "learning_rate": 7.184122624001449e-07, + "loss": 0.618, + "step": 70596 + }, + { + "epoch": 1.81, + "learning_rate": 7.183857117255614e-07, + "loss": 0.6738, + "step": 70597 + }, + { + "epoch": 1.81, + "learning_rate": 7.183591612665971e-07, + "loss": 0.7383, + "step": 70598 + }, + { + "epoch": 1.81, + "learning_rate": 7.183326110232722e-07, + "loss": 0.793, + "step": 70599 + }, + { + "epoch": 1.81, + "learning_rate": 7.183060609956073e-07, + "loss": 0.657, + "step": 70600 + }, + { + "epoch": 1.81, + "learning_rate": 7.182795111836226e-07, + "loss": 0.7158, + "step": 70601 + }, + { + "epoch": 1.81, + "learning_rate": 7.182529615873381e-07, + "loss": 0.4766, + "step": 70602 + }, + { + "epoch": 1.81, + "learning_rate": 7.182264122067741e-07, + "loss": 0.4106, + "step": 70603 + }, + { + "epoch": 1.81, + "learning_rate": 7.181998630419514e-07, + "loss": 0.7598, + "step": 70604 + }, + { + "epoch": 1.81, + "learning_rate": 7.1817331409289e-07, + "loss": 0.6401, + "step": 70605 + }, + { + "epoch": 1.81, + "learning_rate": 7.181467653596106e-07, + "loss": 0.4761, + "step": 70606 + }, + { + "epoch": 1.81, + "learning_rate": 7.18120216842133e-07, + "loss": 0.6328, + "step": 70607 + }, + { + "epoch": 1.81, + "learning_rate": 7.180936685404779e-07, + "loss": 0.6641, + "step": 70608 + }, + { + "epoch": 1.81, + "learning_rate": 7.180671204546654e-07, + "loss": 0.7612, + "step": 70609 + }, + { + "epoch": 1.81, + "learning_rate": 7.180405725847161e-07, + "loss": 0.6108, + "step": 70610 + }, + { + "epoch": 1.81, + "learning_rate": 7.180140249306503e-07, + "loss": 0.7271, + "step": 70611 + }, + { + "epoch": 1.81, + "learning_rate": 7.179874774924879e-07, + "loss": 0.6807, + "step": 70612 + }, + { + "epoch": 1.81, + "learning_rate": 7.179609302702498e-07, + "loss": 0.6846, + "step": 70613 + }, + { + "epoch": 1.81, + "learning_rate": 7.179343832639557e-07, + "loss": 0.6914, + "step": 70614 + }, + { + "epoch": 1.81, + "learning_rate": 7.179078364736265e-07, + "loss": 0.5314, + "step": 70615 + }, + { + "epoch": 1.81, + "learning_rate": 7.178812898992821e-07, + "loss": 0.6055, + "step": 70616 + }, + { + "epoch": 1.81, + "learning_rate": 7.178547435409432e-07, + "loss": 0.6309, + "step": 70617 + }, + { + "epoch": 1.81, + "learning_rate": 7.178281973986297e-07, + "loss": 0.7041, + "step": 70618 + }, + { + "epoch": 1.81, + "learning_rate": 7.178016514723626e-07, + "loss": 0.8301, + "step": 70619 + }, + { + "epoch": 1.81, + "learning_rate": 7.177751057621617e-07, + "loss": 0.7988, + "step": 70620 + }, + { + "epoch": 1.81, + "learning_rate": 7.177485602680475e-07, + "loss": 0.6367, + "step": 70621 + }, + { + "epoch": 1.81, + "learning_rate": 7.1772201499004e-07, + "loss": 0.7466, + "step": 70622 + }, + { + "epoch": 1.81, + "learning_rate": 7.176954699281599e-07, + "loss": 0.4572, + "step": 70623 + }, + { + "epoch": 1.81, + "learning_rate": 7.176689250824273e-07, + "loss": 0.5693, + "step": 70624 + }, + { + "epoch": 1.81, + "learning_rate": 7.176423804528626e-07, + "loss": 0.5482, + "step": 70625 + }, + { + "epoch": 1.81, + "learning_rate": 7.176158360394862e-07, + "loss": 0.4497, + "step": 70626 + }, + { + "epoch": 1.81, + "learning_rate": 7.175892918423183e-07, + "loss": 0.5579, + "step": 70627 + }, + { + "epoch": 1.81, + "learning_rate": 7.175627478613792e-07, + "loss": 0.6685, + "step": 70628 + }, + { + "epoch": 1.81, + "learning_rate": 7.175362040966897e-07, + "loss": 0.5928, + "step": 70629 + }, + { + "epoch": 1.81, + "learning_rate": 7.175096605482698e-07, + "loss": 0.6992, + "step": 70630 + }, + { + "epoch": 1.81, + "learning_rate": 7.174831172161393e-07, + "loss": 0.6104, + "step": 70631 + }, + { + "epoch": 1.81, + "learning_rate": 7.174565741003193e-07, + "loss": 0.6553, + "step": 70632 + }, + { + "epoch": 1.81, + "learning_rate": 7.174300312008295e-07, + "loss": 0.499, + "step": 70633 + }, + { + "epoch": 1.81, + "learning_rate": 7.174034885176908e-07, + "loss": 0.5078, + "step": 70634 + }, + { + "epoch": 1.81, + "learning_rate": 7.173769460509231e-07, + "loss": 0.5366, + "step": 70635 + }, + { + "epoch": 1.81, + "learning_rate": 7.17350403800547e-07, + "loss": 0.6265, + "step": 70636 + }, + { + "epoch": 1.81, + "learning_rate": 7.173238617665827e-07, + "loss": 0.5913, + "step": 70637 + }, + { + "epoch": 1.81, + "learning_rate": 7.172973199490505e-07, + "loss": 0.5591, + "step": 70638 + }, + { + "epoch": 1.81, + "learning_rate": 7.172707783479705e-07, + "loss": 0.5303, + "step": 70639 + }, + { + "epoch": 1.81, + "learning_rate": 7.172442369633639e-07, + "loss": 0.6128, + "step": 70640 + }, + { + "epoch": 1.81, + "learning_rate": 7.172176957952498e-07, + "loss": 0.8516, + "step": 70641 + }, + { + "epoch": 1.81, + "learning_rate": 7.171911548436494e-07, + "loss": 0.5216, + "step": 70642 + }, + { + "epoch": 1.81, + "learning_rate": 7.171646141085824e-07, + "loss": 0.7432, + "step": 70643 + }, + { + "epoch": 1.81, + "learning_rate": 7.171380735900699e-07, + "loss": 0.7373, + "step": 70644 + }, + { + "epoch": 1.81, + "learning_rate": 7.171115332881313e-07, + "loss": 0.5112, + "step": 70645 + }, + { + "epoch": 1.81, + "learning_rate": 7.170849932027876e-07, + "loss": 0.6221, + "step": 70646 + }, + { + "epoch": 1.81, + "learning_rate": 7.170584533340589e-07, + "loss": 0.5972, + "step": 70647 + }, + { + "epoch": 1.81, + "learning_rate": 7.170319136819656e-07, + "loss": 0.437, + "step": 70648 + }, + { + "epoch": 1.81, + "learning_rate": 7.170053742465278e-07, + "loss": 0.6465, + "step": 70649 + }, + { + "epoch": 1.81, + "learning_rate": 7.169788350277663e-07, + "loss": 0.6616, + "step": 70650 + }, + { + "epoch": 1.81, + "learning_rate": 7.169522960257009e-07, + "loss": 0.606, + "step": 70651 + }, + { + "epoch": 1.81, + "learning_rate": 7.16925757240352e-07, + "loss": 0.6338, + "step": 70652 + }, + { + "epoch": 1.81, + "learning_rate": 7.168992186717402e-07, + "loss": 0.4312, + "step": 70653 + }, + { + "epoch": 1.81, + "learning_rate": 7.168726803198857e-07, + "loss": 0.4712, + "step": 70654 + }, + { + "epoch": 1.81, + "learning_rate": 7.168461421848085e-07, + "loss": 0.8076, + "step": 70655 + }, + { + "epoch": 1.81, + "learning_rate": 7.168196042665293e-07, + "loss": 0.6987, + "step": 70656 + }, + { + "epoch": 1.81, + "learning_rate": 7.167930665650683e-07, + "loss": 0.7366, + "step": 70657 + }, + { + "epoch": 1.81, + "learning_rate": 7.167665290804459e-07, + "loss": 0.6875, + "step": 70658 + }, + { + "epoch": 1.81, + "learning_rate": 7.167399918126822e-07, + "loss": 0.512, + "step": 70659 + }, + { + "epoch": 1.81, + "learning_rate": 7.16713454761798e-07, + "loss": 0.5155, + "step": 70660 + }, + { + "epoch": 1.81, + "learning_rate": 7.166869179278132e-07, + "loss": 0.6035, + "step": 70661 + }, + { + "epoch": 1.81, + "learning_rate": 7.166603813107479e-07, + "loss": 0.6382, + "step": 70662 + }, + { + "epoch": 1.81, + "learning_rate": 7.16633844910623e-07, + "loss": 0.6064, + "step": 70663 + }, + { + "epoch": 1.81, + "learning_rate": 7.166073087274582e-07, + "loss": 0.6274, + "step": 70664 + }, + { + "epoch": 1.81, + "learning_rate": 7.165807727612745e-07, + "loss": 0.5503, + "step": 70665 + }, + { + "epoch": 1.81, + "learning_rate": 7.165542370120915e-07, + "loss": 0.5629, + "step": 70666 + }, + { + "epoch": 1.81, + "learning_rate": 7.165277014799303e-07, + "loss": 0.485, + "step": 70667 + }, + { + "epoch": 1.81, + "learning_rate": 7.165011661648104e-07, + "loss": 0.71, + "step": 70668 + }, + { + "epoch": 1.81, + "learning_rate": 7.164746310667529e-07, + "loss": 0.5366, + "step": 70669 + }, + { + "epoch": 1.81, + "learning_rate": 7.164480961857777e-07, + "loss": 0.6562, + "step": 70670 + }, + { + "epoch": 1.81, + "learning_rate": 7.164215615219052e-07, + "loss": 0.5649, + "step": 70671 + }, + { + "epoch": 1.81, + "learning_rate": 7.163950270751553e-07, + "loss": 0.5957, + "step": 70672 + }, + { + "epoch": 1.81, + "learning_rate": 7.163684928455491e-07, + "loss": 0.7271, + "step": 70673 + }, + { + "epoch": 1.81, + "learning_rate": 7.163419588331061e-07, + "loss": 0.5615, + "step": 70674 + }, + { + "epoch": 1.81, + "learning_rate": 7.163154250378474e-07, + "loss": 0.5247, + "step": 70675 + }, + { + "epoch": 1.81, + "learning_rate": 7.162888914597925e-07, + "loss": 0.5479, + "step": 70676 + }, + { + "epoch": 1.81, + "learning_rate": 7.162623580989625e-07, + "loss": 0.6807, + "step": 70677 + }, + { + "epoch": 1.81, + "learning_rate": 7.162358249553772e-07, + "loss": 0.7432, + "step": 70678 + }, + { + "epoch": 1.81, + "learning_rate": 7.162092920290572e-07, + "loss": 0.6113, + "step": 70679 + }, + { + "epoch": 1.81, + "learning_rate": 7.16182759320023e-07, + "loss": 0.5703, + "step": 70680 + }, + { + "epoch": 1.81, + "learning_rate": 7.16156226828294e-07, + "loss": 0.7041, + "step": 70681 + }, + { + "epoch": 1.81, + "learning_rate": 7.161296945538915e-07, + "loss": 0.5625, + "step": 70682 + }, + { + "epoch": 1.81, + "learning_rate": 7.161031624968353e-07, + "loss": 0.5852, + "step": 70683 + }, + { + "epoch": 1.81, + "learning_rate": 7.160766306571458e-07, + "loss": 0.6187, + "step": 70684 + }, + { + "epoch": 1.81, + "learning_rate": 7.160500990348433e-07, + "loss": 0.6123, + "step": 70685 + }, + { + "epoch": 1.81, + "learning_rate": 7.160235676299484e-07, + "loss": 0.6729, + "step": 70686 + }, + { + "epoch": 1.81, + "learning_rate": 7.15997036442481e-07, + "loss": 0.5742, + "step": 70687 + }, + { + "epoch": 1.81, + "learning_rate": 7.159705054724618e-07, + "loss": 0.7432, + "step": 70688 + }, + { + "epoch": 1.81, + "learning_rate": 7.159439747199107e-07, + "loss": 0.7515, + "step": 70689 + }, + { + "epoch": 1.81, + "learning_rate": 7.15917444184849e-07, + "loss": 0.752, + "step": 70690 + }, + { + "epoch": 1.81, + "learning_rate": 7.158909138672955e-07, + "loss": 0.6226, + "step": 70691 + }, + { + "epoch": 1.81, + "learning_rate": 7.158643837672714e-07, + "loss": 0.5681, + "step": 70692 + }, + { + "epoch": 1.81, + "learning_rate": 7.158378538847968e-07, + "loss": 0.5896, + "step": 70693 + }, + { + "epoch": 1.81, + "learning_rate": 7.158113242198922e-07, + "loss": 0.665, + "step": 70694 + }, + { + "epoch": 1.81, + "learning_rate": 7.157847947725777e-07, + "loss": 0.7793, + "step": 70695 + }, + { + "epoch": 1.81, + "learning_rate": 7.157582655428739e-07, + "loss": 0.5145, + "step": 70696 + }, + { + "epoch": 1.81, + "learning_rate": 7.157317365308006e-07, + "loss": 0.7061, + "step": 70697 + }, + { + "epoch": 1.81, + "learning_rate": 7.157052077363788e-07, + "loss": 0.5823, + "step": 70698 + }, + { + "epoch": 1.81, + "learning_rate": 7.156786791596281e-07, + "loss": 0.7344, + "step": 70699 + }, + { + "epoch": 1.81, + "learning_rate": 7.156521508005697e-07, + "loss": 0.6543, + "step": 70700 + }, + { + "epoch": 1.81, + "learning_rate": 7.156256226592231e-07, + "loss": 0.6162, + "step": 70701 + }, + { + "epoch": 1.81, + "learning_rate": 7.155990947356088e-07, + "loss": 0.52, + "step": 70702 + }, + { + "epoch": 1.81, + "learning_rate": 7.155725670297473e-07, + "loss": 0.5972, + "step": 70703 + }, + { + "epoch": 1.81, + "learning_rate": 7.155460395416585e-07, + "loss": 0.4755, + "step": 70704 + }, + { + "epoch": 1.81, + "learning_rate": 7.155195122713633e-07, + "loss": 0.6172, + "step": 70705 + }, + { + "epoch": 1.81, + "learning_rate": 7.154929852188816e-07, + "loss": 0.6797, + "step": 70706 + }, + { + "epoch": 1.81, + "learning_rate": 7.15466458384234e-07, + "loss": 0.7285, + "step": 70707 + }, + { + "epoch": 1.81, + "learning_rate": 7.154399317674404e-07, + "loss": 0.4541, + "step": 70708 + }, + { + "epoch": 1.81, + "learning_rate": 7.154134053685216e-07, + "loss": 0.8516, + "step": 70709 + }, + { + "epoch": 1.81, + "learning_rate": 7.15386879187498e-07, + "loss": 0.5508, + "step": 70710 + }, + { + "epoch": 1.81, + "learning_rate": 7.153603532243891e-07, + "loss": 0.5864, + "step": 70711 + }, + { + "epoch": 1.81, + "learning_rate": 7.153338274792157e-07, + "loss": 0.6196, + "step": 70712 + }, + { + "epoch": 1.81, + "learning_rate": 7.153073019519982e-07, + "loss": 0.7402, + "step": 70713 + }, + { + "epoch": 1.81, + "learning_rate": 7.152807766427567e-07, + "loss": 0.5526, + "step": 70714 + }, + { + "epoch": 1.81, + "learning_rate": 7.152542515515116e-07, + "loss": 0.5986, + "step": 70715 + }, + { + "epoch": 1.81, + "learning_rate": 7.152277266782834e-07, + "loss": 0.5894, + "step": 70716 + }, + { + "epoch": 1.81, + "learning_rate": 7.152012020230921e-07, + "loss": 0.584, + "step": 70717 + }, + { + "epoch": 1.81, + "learning_rate": 7.151746775859581e-07, + "loss": 0.5752, + "step": 70718 + }, + { + "epoch": 1.81, + "learning_rate": 7.15148153366902e-07, + "loss": 0.6257, + "step": 70719 + }, + { + "epoch": 1.81, + "learning_rate": 7.151216293659439e-07, + "loss": 0.7622, + "step": 70720 + }, + { + "epoch": 1.81, + "learning_rate": 7.150951055831038e-07, + "loss": 0.6367, + "step": 70721 + }, + { + "epoch": 1.81, + "learning_rate": 7.150685820184023e-07, + "loss": 0.8203, + "step": 70722 + }, + { + "epoch": 1.81, + "learning_rate": 7.150420586718598e-07, + "loss": 0.6846, + "step": 70723 + }, + { + "epoch": 1.81, + "learning_rate": 7.150155355434963e-07, + "loss": 0.5625, + "step": 70724 + }, + { + "epoch": 1.81, + "learning_rate": 7.149890126333325e-07, + "loss": 0.4924, + "step": 70725 + }, + { + "epoch": 1.81, + "learning_rate": 7.149624899413884e-07, + "loss": 0.6411, + "step": 70726 + }, + { + "epoch": 1.81, + "learning_rate": 7.149359674676844e-07, + "loss": 0.5146, + "step": 70727 + }, + { + "epoch": 1.81, + "learning_rate": 7.149094452122408e-07, + "loss": 0.7349, + "step": 70728 + }, + { + "epoch": 1.81, + "learning_rate": 7.148829231750781e-07, + "loss": 0.7109, + "step": 70729 + }, + { + "epoch": 1.81, + "learning_rate": 7.148564013562167e-07, + "loss": 0.6719, + "step": 70730 + }, + { + "epoch": 1.81, + "learning_rate": 7.148298797556762e-07, + "loss": 0.4082, + "step": 70731 + }, + { + "epoch": 1.81, + "learning_rate": 7.148033583734775e-07, + "loss": 0.623, + "step": 70732 + }, + { + "epoch": 1.81, + "learning_rate": 7.147768372096405e-07, + "loss": 0.792, + "step": 70733 + }, + { + "epoch": 1.81, + "learning_rate": 7.14750316264186e-07, + "loss": 0.7607, + "step": 70734 + }, + { + "epoch": 1.81, + "learning_rate": 7.147237955371339e-07, + "loss": 0.5776, + "step": 70735 + }, + { + "epoch": 1.81, + "learning_rate": 7.14697275028505e-07, + "loss": 0.6108, + "step": 70736 + }, + { + "epoch": 1.81, + "learning_rate": 7.146707547383188e-07, + "loss": 0.8252, + "step": 70737 + }, + { + "epoch": 1.81, + "learning_rate": 7.146442346665964e-07, + "loss": 0.4653, + "step": 70738 + }, + { + "epoch": 1.81, + "learning_rate": 7.146177148133577e-07, + "loss": 0.6914, + "step": 70739 + }, + { + "epoch": 1.81, + "learning_rate": 7.145911951786234e-07, + "loss": 0.626, + "step": 70740 + }, + { + "epoch": 1.81, + "learning_rate": 7.145646757624133e-07, + "loss": 0.5996, + "step": 70741 + }, + { + "epoch": 1.81, + "learning_rate": 7.145381565647477e-07, + "loss": 0.5571, + "step": 70742 + }, + { + "epoch": 1.81, + "learning_rate": 7.145116375856472e-07, + "loss": 0.7783, + "step": 70743 + }, + { + "epoch": 1.81, + "learning_rate": 7.144851188251322e-07, + "loss": 0.563, + "step": 70744 + }, + { + "epoch": 1.81, + "learning_rate": 7.144586002832226e-07, + "loss": 0.8096, + "step": 70745 + }, + { + "epoch": 1.81, + "learning_rate": 7.14432081959939e-07, + "loss": 0.6074, + "step": 70746 + }, + { + "epoch": 1.81, + "learning_rate": 7.144055638553015e-07, + "loss": 0.5811, + "step": 70747 + }, + { + "epoch": 1.81, + "learning_rate": 7.143790459693307e-07, + "loss": 0.7061, + "step": 70748 + }, + { + "epoch": 1.81, + "learning_rate": 7.143525283020466e-07, + "loss": 0.6309, + "step": 70749 + }, + { + "epoch": 1.81, + "learning_rate": 7.1432601085347e-07, + "loss": 0.6831, + "step": 70750 + }, + { + "epoch": 1.81, + "learning_rate": 7.142994936236206e-07, + "loss": 0.7637, + "step": 70751 + }, + { + "epoch": 1.81, + "learning_rate": 7.142729766125189e-07, + "loss": 0.6587, + "step": 70752 + }, + { + "epoch": 1.81, + "learning_rate": 7.142464598201851e-07, + "loss": 0.6343, + "step": 70753 + }, + { + "epoch": 1.81, + "learning_rate": 7.142199432466397e-07, + "loss": 0.4646, + "step": 70754 + }, + { + "epoch": 1.81, + "learning_rate": 7.141934268919031e-07, + "loss": 0.4778, + "step": 70755 + }, + { + "epoch": 1.81, + "learning_rate": 7.141669107559953e-07, + "loss": 0.6172, + "step": 70756 + }, + { + "epoch": 1.81, + "learning_rate": 7.141403948389369e-07, + "loss": 0.459, + "step": 70757 + }, + { + "epoch": 1.81, + "learning_rate": 7.141138791407478e-07, + "loss": 0.6152, + "step": 70758 + }, + { + "epoch": 1.81, + "learning_rate": 7.140873636614488e-07, + "loss": 0.4519, + "step": 70759 + }, + { + "epoch": 1.81, + "learning_rate": 7.140608484010602e-07, + "loss": 0.4971, + "step": 70760 + }, + { + "epoch": 1.81, + "learning_rate": 7.140343333596017e-07, + "loss": 0.7871, + "step": 70761 + }, + { + "epoch": 1.81, + "learning_rate": 7.140078185370941e-07, + "loss": 0.6279, + "step": 70762 + }, + { + "epoch": 1.81, + "learning_rate": 7.139813039335576e-07, + "loss": 0.709, + "step": 70763 + }, + { + "epoch": 1.81, + "learning_rate": 7.139547895490121e-07, + "loss": 0.7207, + "step": 70764 + }, + { + "epoch": 1.81, + "learning_rate": 7.139282753834786e-07, + "loss": 0.6475, + "step": 70765 + }, + { + "epoch": 1.81, + "learning_rate": 7.139017614369769e-07, + "loss": 0.6445, + "step": 70766 + }, + { + "epoch": 1.81, + "learning_rate": 7.138752477095276e-07, + "loss": 0.5112, + "step": 70767 + }, + { + "epoch": 1.81, + "learning_rate": 7.138487342011508e-07, + "loss": 0.5991, + "step": 70768 + }, + { + "epoch": 1.81, + "learning_rate": 7.138222209118668e-07, + "loss": 0.3817, + "step": 70769 + }, + { + "epoch": 1.81, + "learning_rate": 7.137957078416964e-07, + "loss": 0.7305, + "step": 70770 + }, + { + "epoch": 1.81, + "learning_rate": 7.13769194990659e-07, + "loss": 0.6655, + "step": 70771 + }, + { + "epoch": 1.81, + "learning_rate": 7.137426823587756e-07, + "loss": 0.6924, + "step": 70772 + }, + { + "epoch": 1.81, + "learning_rate": 7.137161699460659e-07, + "loss": 0.6504, + "step": 70773 + }, + { + "epoch": 1.81, + "learning_rate": 7.13689657752551e-07, + "loss": 0.4985, + "step": 70774 + }, + { + "epoch": 1.81, + "learning_rate": 7.136631457782504e-07, + "loss": 0.6846, + "step": 70775 + }, + { + "epoch": 1.81, + "learning_rate": 7.136366340231849e-07, + "loss": 0.5376, + "step": 70776 + }, + { + "epoch": 1.81, + "learning_rate": 7.136101224873747e-07, + "loss": 0.6211, + "step": 70777 + }, + { + "epoch": 1.81, + "learning_rate": 7.135836111708401e-07, + "loss": 0.8584, + "step": 70778 + }, + { + "epoch": 1.81, + "learning_rate": 7.135571000736012e-07, + "loss": 0.6553, + "step": 70779 + }, + { + "epoch": 1.81, + "learning_rate": 7.135305891956791e-07, + "loss": 0.5039, + "step": 70780 + }, + { + "epoch": 1.81, + "learning_rate": 7.135040785370927e-07, + "loss": 0.5532, + "step": 70781 + }, + { + "epoch": 1.81, + "learning_rate": 7.134775680978634e-07, + "loss": 0.5005, + "step": 70782 + }, + { + "epoch": 1.81, + "learning_rate": 7.13451057878011e-07, + "loss": 0.7588, + "step": 70783 + }, + { + "epoch": 1.81, + "learning_rate": 7.13424547877556e-07, + "loss": 0.5093, + "step": 70784 + }, + { + "epoch": 1.81, + "learning_rate": 7.133980380965186e-07, + "loss": 0.6367, + "step": 70785 + }, + { + "epoch": 1.81, + "learning_rate": 7.133715285349191e-07, + "loss": 0.6865, + "step": 70786 + }, + { + "epoch": 1.81, + "learning_rate": 7.133450191927779e-07, + "loss": 0.5664, + "step": 70787 + }, + { + "epoch": 1.81, + "learning_rate": 7.133185100701153e-07, + "loss": 0.7275, + "step": 70788 + }, + { + "epoch": 1.81, + "learning_rate": 7.132920011669514e-07, + "loss": 0.6479, + "step": 70789 + }, + { + "epoch": 1.81, + "learning_rate": 7.13265492483307e-07, + "loss": 0.5806, + "step": 70790 + }, + { + "epoch": 1.81, + "learning_rate": 7.132389840192018e-07, + "loss": 0.7842, + "step": 70791 + }, + { + "epoch": 1.81, + "learning_rate": 7.132124757746561e-07, + "loss": 0.6221, + "step": 70792 + }, + { + "epoch": 1.81, + "learning_rate": 7.131859677496908e-07, + "loss": 0.8545, + "step": 70793 + }, + { + "epoch": 1.81, + "learning_rate": 7.131594599443254e-07, + "loss": 0.6768, + "step": 70794 + }, + { + "epoch": 1.81, + "learning_rate": 7.131329523585809e-07, + "loss": 0.6348, + "step": 70795 + }, + { + "epoch": 1.81, + "learning_rate": 7.131064449924771e-07, + "loss": 0.6958, + "step": 70796 + }, + { + "epoch": 1.81, + "learning_rate": 7.130799378460347e-07, + "loss": 0.5645, + "step": 70797 + }, + { + "epoch": 1.81, + "learning_rate": 7.130534309192736e-07, + "loss": 0.7705, + "step": 70798 + }, + { + "epoch": 1.81, + "learning_rate": 7.130269242122144e-07, + "loss": 0.5776, + "step": 70799 + }, + { + "epoch": 1.81, + "learning_rate": 7.130004177248777e-07, + "loss": 0.6855, + "step": 70800 + }, + { + "epoch": 1.81, + "learning_rate": 7.12973911457283e-07, + "loss": 0.708, + "step": 70801 + }, + { + "epoch": 1.81, + "learning_rate": 7.129474054094509e-07, + "loss": 0.5439, + "step": 70802 + }, + { + "epoch": 1.81, + "learning_rate": 7.12920899581402e-07, + "loss": 0.7412, + "step": 70803 + }, + { + "epoch": 1.81, + "learning_rate": 7.12894393973156e-07, + "loss": 0.6216, + "step": 70804 + }, + { + "epoch": 1.81, + "learning_rate": 7.128678885847339e-07, + "loss": 0.5615, + "step": 70805 + }, + { + "epoch": 1.81, + "learning_rate": 7.128413834161554e-07, + "loss": 0.5615, + "step": 70806 + }, + { + "epoch": 1.81, + "learning_rate": 7.128148784674412e-07, + "loss": 0.6562, + "step": 70807 + }, + { + "epoch": 1.81, + "learning_rate": 7.127883737386113e-07, + "loss": 0.6367, + "step": 70808 + }, + { + "epoch": 1.81, + "learning_rate": 7.127618692296864e-07, + "loss": 0.5718, + "step": 70809 + }, + { + "epoch": 1.81, + "learning_rate": 7.127353649406867e-07, + "loss": 0.6272, + "step": 70810 + }, + { + "epoch": 1.81, + "learning_rate": 7.127088608716319e-07, + "loss": 0.5342, + "step": 70811 + }, + { + "epoch": 1.81, + "learning_rate": 7.126823570225429e-07, + "loss": 0.6709, + "step": 70812 + }, + { + "epoch": 1.81, + "learning_rate": 7.126558533934396e-07, + "loss": 0.7363, + "step": 70813 + }, + { + "epoch": 1.81, + "learning_rate": 7.126293499843427e-07, + "loss": 0.5837, + "step": 70814 + }, + { + "epoch": 1.82, + "learning_rate": 7.12602846795272e-07, + "loss": 0.5674, + "step": 70815 + }, + { + "epoch": 1.82, + "learning_rate": 7.125763438262485e-07, + "loss": 0.6128, + "step": 70816 + }, + { + "epoch": 1.82, + "learning_rate": 7.12549841077292e-07, + "loss": 0.5645, + "step": 70817 + }, + { + "epoch": 1.82, + "learning_rate": 7.125233385484226e-07, + "loss": 0.6973, + "step": 70818 + }, + { + "epoch": 1.82, + "learning_rate": 7.124968362396611e-07, + "loss": 0.5332, + "step": 70819 + }, + { + "epoch": 1.82, + "learning_rate": 7.124703341510278e-07, + "loss": 0.4814, + "step": 70820 + }, + { + "epoch": 1.82, + "learning_rate": 7.124438322825423e-07, + "loss": 0.7275, + "step": 70821 + }, + { + "epoch": 1.82, + "learning_rate": 7.124173306342255e-07, + "loss": 0.6099, + "step": 70822 + }, + { + "epoch": 1.82, + "learning_rate": 7.123908292060973e-07, + "loss": 0.6846, + "step": 70823 + }, + { + "epoch": 1.82, + "learning_rate": 7.123643279981786e-07, + "loss": 0.5781, + "step": 70824 + }, + { + "epoch": 1.82, + "learning_rate": 7.12337827010489e-07, + "loss": 0.5066, + "step": 70825 + }, + { + "epoch": 1.82, + "learning_rate": 7.123113262430492e-07, + "loss": 0.394, + "step": 70826 + }, + { + "epoch": 1.82, + "learning_rate": 7.122848256958792e-07, + "loss": 0.6299, + "step": 70827 + }, + { + "epoch": 1.82, + "learning_rate": 7.122583253689998e-07, + "loss": 0.7314, + "step": 70828 + }, + { + "epoch": 1.82, + "learning_rate": 7.122318252624307e-07, + "loss": 0.5608, + "step": 70829 + }, + { + "epoch": 1.82, + "learning_rate": 7.122053253761928e-07, + "loss": 0.6807, + "step": 70830 + }, + { + "epoch": 1.82, + "learning_rate": 7.12178825710306e-07, + "loss": 0.6611, + "step": 70831 + }, + { + "epoch": 1.82, + "learning_rate": 7.121523262647903e-07, + "loss": 0.6147, + "step": 70832 + }, + { + "epoch": 1.82, + "learning_rate": 7.121258270396666e-07, + "loss": 0.8848, + "step": 70833 + }, + { + "epoch": 1.82, + "learning_rate": 7.12099328034955e-07, + "loss": 0.4941, + "step": 70834 + }, + { + "epoch": 1.82, + "learning_rate": 7.120728292506754e-07, + "loss": 0.7656, + "step": 70835 + }, + { + "epoch": 1.82, + "learning_rate": 7.120463306868487e-07, + "loss": 0.7188, + "step": 70836 + }, + { + "epoch": 1.82, + "learning_rate": 7.120198323434945e-07, + "loss": 0.4399, + "step": 70837 + }, + { + "epoch": 1.82, + "learning_rate": 7.119933342206337e-07, + "loss": 0.7988, + "step": 70838 + }, + { + "epoch": 1.82, + "learning_rate": 7.119668363182864e-07, + "loss": 0.6455, + "step": 70839 + }, + { + "epoch": 1.82, + "learning_rate": 7.119403386364731e-07, + "loss": 0.5947, + "step": 70840 + }, + { + "epoch": 1.82, + "learning_rate": 7.119138411752136e-07, + "loss": 0.5371, + "step": 70841 + }, + { + "epoch": 1.82, + "learning_rate": 7.118873439345282e-07, + "loss": 0.5659, + "step": 70842 + }, + { + "epoch": 1.82, + "learning_rate": 7.118608469144376e-07, + "loss": 0.5664, + "step": 70843 + }, + { + "epoch": 1.82, + "learning_rate": 7.118343501149617e-07, + "loss": 0.6011, + "step": 70844 + }, + { + "epoch": 1.82, + "learning_rate": 7.118078535361214e-07, + "loss": 0.6211, + "step": 70845 + }, + { + "epoch": 1.82, + "learning_rate": 7.117813571779361e-07, + "loss": 0.5654, + "step": 70846 + }, + { + "epoch": 1.82, + "learning_rate": 7.117548610404269e-07, + "loss": 0.5596, + "step": 70847 + }, + { + "epoch": 1.82, + "learning_rate": 7.117283651236135e-07, + "loss": 0.7764, + "step": 70848 + }, + { + "epoch": 1.82, + "learning_rate": 7.117018694275168e-07, + "loss": 0.5928, + "step": 70849 + }, + { + "epoch": 1.82, + "learning_rate": 7.116753739521569e-07, + "loss": 0.6509, + "step": 70850 + }, + { + "epoch": 1.82, + "learning_rate": 7.116488786975532e-07, + "loss": 0.7217, + "step": 70851 + }, + { + "epoch": 1.82, + "learning_rate": 7.116223836637272e-07, + "loss": 0.707, + "step": 70852 + }, + { + "epoch": 1.82, + "learning_rate": 7.115958888506986e-07, + "loss": 0.4626, + "step": 70853 + }, + { + "epoch": 1.82, + "learning_rate": 7.115693942584875e-07, + "loss": 0.5261, + "step": 70854 + }, + { + "epoch": 1.82, + "learning_rate": 7.115428998871147e-07, + "loss": 0.6343, + "step": 70855 + }, + { + "epoch": 1.82, + "learning_rate": 7.115164057366e-07, + "loss": 0.5747, + "step": 70856 + }, + { + "epoch": 1.82, + "learning_rate": 7.114899118069642e-07, + "loss": 0.6406, + "step": 70857 + }, + { + "epoch": 1.82, + "learning_rate": 7.114634180982271e-07, + "loss": 0.5913, + "step": 70858 + }, + { + "epoch": 1.82, + "learning_rate": 7.114369246104093e-07, + "loss": 0.6963, + "step": 70859 + }, + { + "epoch": 1.82, + "learning_rate": 7.114104313435312e-07, + "loss": 0.3267, + "step": 70860 + }, + { + "epoch": 1.82, + "learning_rate": 7.113839382976126e-07, + "loss": 0.6514, + "step": 70861 + }, + { + "epoch": 1.82, + "learning_rate": 7.113574454726741e-07, + "loss": 0.7871, + "step": 70862 + }, + { + "epoch": 1.82, + "learning_rate": 7.113309528687356e-07, + "loss": 0.6846, + "step": 70863 + }, + { + "epoch": 1.82, + "learning_rate": 7.113044604858182e-07, + "loss": 0.6479, + "step": 70864 + }, + { + "epoch": 1.82, + "learning_rate": 7.112779683239414e-07, + "loss": 0.7148, + "step": 70865 + }, + { + "epoch": 1.82, + "learning_rate": 7.112514763831259e-07, + "loss": 0.7627, + "step": 70866 + }, + { + "epoch": 1.82, + "learning_rate": 7.112249846633917e-07, + "loss": 0.6934, + "step": 70867 + }, + { + "epoch": 1.82, + "learning_rate": 7.111984931647597e-07, + "loss": 0.751, + "step": 70868 + }, + { + "epoch": 1.82, + "learning_rate": 7.111720018872493e-07, + "loss": 0.7432, + "step": 70869 + }, + { + "epoch": 1.82, + "learning_rate": 7.111455108308818e-07, + "loss": 0.603, + "step": 70870 + }, + { + "epoch": 1.82, + "learning_rate": 7.111190199956763e-07, + "loss": 0.6953, + "step": 70871 + }, + { + "epoch": 1.82, + "learning_rate": 7.11092529381654e-07, + "loss": 0.5986, + "step": 70872 + }, + { + "epoch": 1.82, + "learning_rate": 7.110660389888345e-07, + "loss": 0.7129, + "step": 70873 + }, + { + "epoch": 1.82, + "learning_rate": 7.110395488172388e-07, + "loss": 0.6304, + "step": 70874 + }, + { + "epoch": 1.82, + "learning_rate": 7.110130588668865e-07, + "loss": 0.5239, + "step": 70875 + }, + { + "epoch": 1.82, + "learning_rate": 7.109865691377985e-07, + "loss": 0.502, + "step": 70876 + }, + { + "epoch": 1.82, + "learning_rate": 7.109600796299946e-07, + "loss": 0.584, + "step": 70877 + }, + { + "epoch": 1.82, + "learning_rate": 7.109335903434955e-07, + "loss": 0.6667, + "step": 70878 + }, + { + "epoch": 1.82, + "learning_rate": 7.10907101278321e-07, + "loss": 0.7725, + "step": 70879 + }, + { + "epoch": 1.82, + "learning_rate": 7.108806124344921e-07, + "loss": 0.624, + "step": 70880 + }, + { + "epoch": 1.82, + "learning_rate": 7.108541238120284e-07, + "loss": 0.5322, + "step": 70881 + }, + { + "epoch": 1.82, + "learning_rate": 7.108276354109501e-07, + "loss": 0.6968, + "step": 70882 + }, + { + "epoch": 1.82, + "learning_rate": 7.108011472312782e-07, + "loss": 0.5303, + "step": 70883 + }, + { + "epoch": 1.82, + "learning_rate": 7.107746592730322e-07, + "loss": 0.6567, + "step": 70884 + }, + { + "epoch": 1.82, + "learning_rate": 7.107481715362329e-07, + "loss": 0.4507, + "step": 70885 + }, + { + "epoch": 1.82, + "learning_rate": 7.107216840209003e-07, + "loss": 0.5701, + "step": 70886 + }, + { + "epoch": 1.82, + "learning_rate": 7.106951967270551e-07, + "loss": 0.7744, + "step": 70887 + }, + { + "epoch": 1.82, + "learning_rate": 7.106687096547169e-07, + "loss": 0.8223, + "step": 70888 + }, + { + "epoch": 1.82, + "learning_rate": 7.106422228039068e-07, + "loss": 0.6826, + "step": 70889 + }, + { + "epoch": 1.82, + "learning_rate": 7.106157361746446e-07, + "loss": 0.46, + "step": 70890 + }, + { + "epoch": 1.82, + "learning_rate": 7.105892497669505e-07, + "loss": 0.6992, + "step": 70891 + }, + { + "epoch": 1.82, + "learning_rate": 7.105627635808447e-07, + "loss": 0.4951, + "step": 70892 + }, + { + "epoch": 1.82, + "learning_rate": 7.10536277616348e-07, + "loss": 0.5474, + "step": 70893 + }, + { + "epoch": 1.82, + "learning_rate": 7.1050979187348e-07, + "loss": 0.6167, + "step": 70894 + }, + { + "epoch": 1.82, + "learning_rate": 7.104833063522618e-07, + "loss": 0.6411, + "step": 70895 + }, + { + "epoch": 1.82, + "learning_rate": 7.104568210527126e-07, + "loss": 0.625, + "step": 70896 + }, + { + "epoch": 1.82, + "learning_rate": 7.104303359748538e-07, + "loss": 0.7783, + "step": 70897 + }, + { + "epoch": 1.82, + "learning_rate": 7.104038511187049e-07, + "loss": 0.6287, + "step": 70898 + }, + { + "epoch": 1.82, + "learning_rate": 7.103773664842867e-07, + "loss": 0.7227, + "step": 70899 + }, + { + "epoch": 1.82, + "learning_rate": 7.103508820716194e-07, + "loss": 0.4171, + "step": 70900 + }, + { + "epoch": 1.82, + "learning_rate": 7.103243978807227e-07, + "loss": 0.5425, + "step": 70901 + }, + { + "epoch": 1.82, + "learning_rate": 7.102979139116176e-07, + "loss": 0.6458, + "step": 70902 + }, + { + "epoch": 1.82, + "learning_rate": 7.102714301643237e-07, + "loss": 0.5986, + "step": 70903 + }, + { + "epoch": 1.82, + "learning_rate": 7.102449466388619e-07, + "loss": 0.6064, + "step": 70904 + }, + { + "epoch": 1.82, + "learning_rate": 7.10218463335252e-07, + "loss": 0.5923, + "step": 70905 + }, + { + "epoch": 1.82, + "learning_rate": 7.101919802535148e-07, + "loss": 0.6934, + "step": 70906 + }, + { + "epoch": 1.82, + "learning_rate": 7.101654973936702e-07, + "loss": 0.6714, + "step": 70907 + }, + { + "epoch": 1.82, + "learning_rate": 7.101390147557382e-07, + "loss": 0.6807, + "step": 70908 + }, + { + "epoch": 1.82, + "learning_rate": 7.101125323397399e-07, + "loss": 0.6699, + "step": 70909 + }, + { + "epoch": 1.82, + "learning_rate": 7.100860501456953e-07, + "loss": 0.7881, + "step": 70910 + }, + { + "epoch": 1.82, + "learning_rate": 7.100595681736239e-07, + "loss": 0.644, + "step": 70911 + }, + { + "epoch": 1.82, + "learning_rate": 7.100330864235469e-07, + "loss": 0.627, + "step": 70912 + }, + { + "epoch": 1.82, + "learning_rate": 7.100066048954838e-07, + "loss": 0.6401, + "step": 70913 + }, + { + "epoch": 1.82, + "learning_rate": 7.099801235894557e-07, + "loss": 0.71, + "step": 70914 + }, + { + "epoch": 1.82, + "learning_rate": 7.099536425054822e-07, + "loss": 0.6152, + "step": 70915 + }, + { + "epoch": 1.82, + "learning_rate": 7.099271616435842e-07, + "loss": 0.5488, + "step": 70916 + }, + { + "epoch": 1.82, + "learning_rate": 7.099006810037813e-07, + "loss": 0.6611, + "step": 70917 + }, + { + "epoch": 1.82, + "learning_rate": 7.098742005860944e-07, + "loss": 0.6846, + "step": 70918 + }, + { + "epoch": 1.82, + "learning_rate": 7.098477203905432e-07, + "loss": 0.7617, + "step": 70919 + }, + { + "epoch": 1.82, + "learning_rate": 7.098212404171486e-07, + "loss": 0.5098, + "step": 70920 + }, + { + "epoch": 1.82, + "learning_rate": 7.097947606659304e-07, + "loss": 0.6226, + "step": 70921 + }, + { + "epoch": 1.82, + "learning_rate": 7.09768281136909e-07, + "loss": 0.7178, + "step": 70922 + }, + { + "epoch": 1.82, + "learning_rate": 7.097418018301046e-07, + "loss": 0.6772, + "step": 70923 + }, + { + "epoch": 1.82, + "learning_rate": 7.097153227455378e-07, + "loss": 0.5513, + "step": 70924 + }, + { + "epoch": 1.82, + "learning_rate": 7.096888438832283e-07, + "loss": 0.3379, + "step": 70925 + }, + { + "epoch": 1.82, + "learning_rate": 7.096623652431969e-07, + "loss": 0.5793, + "step": 70926 + }, + { + "epoch": 1.82, + "learning_rate": 7.096358868254635e-07, + "loss": 0.6094, + "step": 70927 + }, + { + "epoch": 1.82, + "learning_rate": 7.096094086300487e-07, + "loss": 0.6934, + "step": 70928 + }, + { + "epoch": 1.82, + "learning_rate": 7.095829306569729e-07, + "loss": 0.5127, + "step": 70929 + }, + { + "epoch": 1.82, + "learning_rate": 7.095564529062556e-07, + "loss": 0.5933, + "step": 70930 + }, + { + "epoch": 1.82, + "learning_rate": 7.095299753779178e-07, + "loss": 0.8057, + "step": 70931 + }, + { + "epoch": 1.82, + "learning_rate": 7.095034980719794e-07, + "loss": 0.7075, + "step": 70932 + }, + { + "epoch": 1.82, + "learning_rate": 7.094770209884611e-07, + "loss": 0.4583, + "step": 70933 + }, + { + "epoch": 1.82, + "learning_rate": 7.094505441273824e-07, + "loss": 0.7422, + "step": 70934 + }, + { + "epoch": 1.82, + "learning_rate": 7.094240674887645e-07, + "loss": 0.6484, + "step": 70935 + }, + { + "epoch": 1.82, + "learning_rate": 7.093975910726269e-07, + "loss": 0.7568, + "step": 70936 + }, + { + "epoch": 1.82, + "learning_rate": 7.093711148789905e-07, + "loss": 0.519, + "step": 70937 + }, + { + "epoch": 1.82, + "learning_rate": 7.09344638907875e-07, + "loss": 0.76, + "step": 70938 + }, + { + "epoch": 1.82, + "learning_rate": 7.093181631593014e-07, + "loss": 0.6406, + "step": 70939 + }, + { + "epoch": 1.82, + "learning_rate": 7.092916876332893e-07, + "loss": 0.6016, + "step": 70940 + }, + { + "epoch": 1.82, + "learning_rate": 7.09265212329859e-07, + "loss": 0.5776, + "step": 70941 + }, + { + "epoch": 1.82, + "learning_rate": 7.092387372490311e-07, + "loss": 0.5269, + "step": 70942 + }, + { + "epoch": 1.82, + "learning_rate": 7.092122623908259e-07, + "loss": 0.7168, + "step": 70943 + }, + { + "epoch": 1.82, + "learning_rate": 7.091857877552631e-07, + "loss": 0.6289, + "step": 70944 + }, + { + "epoch": 1.82, + "learning_rate": 7.091593133423637e-07, + "loss": 0.7012, + "step": 70945 + }, + { + "epoch": 1.82, + "learning_rate": 7.091328391521473e-07, + "loss": 0.5293, + "step": 70946 + }, + { + "epoch": 1.82, + "learning_rate": 7.091063651846348e-07, + "loss": 0.665, + "step": 70947 + }, + { + "epoch": 1.82, + "learning_rate": 7.090798914398459e-07, + "loss": 0.6611, + "step": 70948 + }, + { + "epoch": 1.82, + "learning_rate": 7.090534179178017e-07, + "loss": 0.6865, + "step": 70949 + }, + { + "epoch": 1.82, + "learning_rate": 7.090269446185217e-07, + "loss": 0.7217, + "step": 70950 + }, + { + "epoch": 1.82, + "learning_rate": 7.090004715420261e-07, + "loss": 0.6299, + "step": 70951 + }, + { + "epoch": 1.82, + "learning_rate": 7.089739986883356e-07, + "loss": 0.5767, + "step": 70952 + }, + { + "epoch": 1.82, + "learning_rate": 7.089475260574703e-07, + "loss": 0.5454, + "step": 70953 + }, + { + "epoch": 1.82, + "learning_rate": 7.089210536494506e-07, + "loss": 0.5552, + "step": 70954 + }, + { + "epoch": 1.82, + "learning_rate": 7.088945814642964e-07, + "loss": 0.5594, + "step": 70955 + }, + { + "epoch": 1.82, + "learning_rate": 7.088681095020285e-07, + "loss": 0.7158, + "step": 70956 + }, + { + "epoch": 1.82, + "learning_rate": 7.088416377626667e-07, + "loss": 0.749, + "step": 70957 + }, + { + "epoch": 1.82, + "learning_rate": 7.088151662462318e-07, + "loss": 0.6584, + "step": 70958 + }, + { + "epoch": 1.82, + "learning_rate": 7.087886949527438e-07, + "loss": 0.5508, + "step": 70959 + }, + { + "epoch": 1.82, + "learning_rate": 7.087622238822227e-07, + "loss": 0.5625, + "step": 70960 + }, + { + "epoch": 1.82, + "learning_rate": 7.087357530346888e-07, + "loss": 0.4946, + "step": 70961 + }, + { + "epoch": 1.82, + "learning_rate": 7.087092824101628e-07, + "loss": 0.5615, + "step": 70962 + }, + { + "epoch": 1.82, + "learning_rate": 7.086828120086644e-07, + "loss": 0.627, + "step": 70963 + }, + { + "epoch": 1.82, + "learning_rate": 7.086563418302145e-07, + "loss": 0.6475, + "step": 70964 + }, + { + "epoch": 1.82, + "learning_rate": 7.086298718748327e-07, + "loss": 0.364, + "step": 70965 + }, + { + "epoch": 1.82, + "learning_rate": 7.086034021425399e-07, + "loss": 0.7109, + "step": 70966 + }, + { + "epoch": 1.82, + "learning_rate": 7.085769326333558e-07, + "loss": 0.7559, + "step": 70967 + }, + { + "epoch": 1.82, + "learning_rate": 7.085504633473012e-07, + "loss": 0.7979, + "step": 70968 + }, + { + "epoch": 1.82, + "learning_rate": 7.085239942843964e-07, + "loss": 0.5225, + "step": 70969 + }, + { + "epoch": 1.82, + "learning_rate": 7.084975254446608e-07, + "loss": 0.6562, + "step": 70970 + }, + { + "epoch": 1.82, + "learning_rate": 7.084710568281155e-07, + "loss": 0.6602, + "step": 70971 + }, + { + "epoch": 1.82, + "learning_rate": 7.084445884347803e-07, + "loss": 0.5144, + "step": 70972 + }, + { + "epoch": 1.82, + "learning_rate": 7.084181202646759e-07, + "loss": 0.7314, + "step": 70973 + }, + { + "epoch": 1.82, + "learning_rate": 7.083916523178222e-07, + "loss": 0.8613, + "step": 70974 + }, + { + "epoch": 1.82, + "learning_rate": 7.083651845942398e-07, + "loss": 0.5098, + "step": 70975 + }, + { + "epoch": 1.82, + "learning_rate": 7.083387170939486e-07, + "loss": 0.3721, + "step": 70976 + }, + { + "epoch": 1.82, + "learning_rate": 7.08312249816969e-07, + "loss": 0.5786, + "step": 70977 + }, + { + "epoch": 1.82, + "learning_rate": 7.082857827633213e-07, + "loss": 0.6841, + "step": 70978 + }, + { + "epoch": 1.82, + "learning_rate": 7.082593159330263e-07, + "loss": 0.5962, + "step": 70979 + }, + { + "epoch": 1.82, + "learning_rate": 7.082328493261031e-07, + "loss": 0.6206, + "step": 70980 + }, + { + "epoch": 1.82, + "learning_rate": 7.082063829425729e-07, + "loss": 0.5293, + "step": 70981 + }, + { + "epoch": 1.82, + "learning_rate": 7.081799167824554e-07, + "loss": 0.5693, + "step": 70982 + }, + { + "epoch": 1.82, + "learning_rate": 7.081534508457713e-07, + "loss": 0.7314, + "step": 70983 + }, + { + "epoch": 1.82, + "learning_rate": 7.081269851325404e-07, + "loss": 0.6436, + "step": 70984 + }, + { + "epoch": 1.82, + "learning_rate": 7.081005196427836e-07, + "loss": 0.7598, + "step": 70985 + }, + { + "epoch": 1.82, + "learning_rate": 7.080740543765205e-07, + "loss": 0.5874, + "step": 70986 + }, + { + "epoch": 1.82, + "learning_rate": 7.080475893337718e-07, + "loss": 0.7979, + "step": 70987 + }, + { + "epoch": 1.82, + "learning_rate": 7.080211245145576e-07, + "loss": 0.6577, + "step": 70988 + }, + { + "epoch": 1.82, + "learning_rate": 7.079946599188987e-07, + "loss": 0.5664, + "step": 70989 + }, + { + "epoch": 1.82, + "learning_rate": 7.079681955468144e-07, + "loss": 0.5437, + "step": 70990 + }, + { + "epoch": 1.82, + "learning_rate": 7.079417313983254e-07, + "loss": 0.6738, + "step": 70991 + }, + { + "epoch": 1.82, + "learning_rate": 7.079152674734521e-07, + "loss": 0.54, + "step": 70992 + }, + { + "epoch": 1.82, + "learning_rate": 7.078888037722144e-07, + "loss": 0.6196, + "step": 70993 + }, + { + "epoch": 1.82, + "learning_rate": 7.078623402946331e-07, + "loss": 0.7324, + "step": 70994 + }, + { + "epoch": 1.82, + "learning_rate": 7.07835877040728e-07, + "loss": 0.6143, + "step": 70995 + }, + { + "epoch": 1.82, + "learning_rate": 7.078094140105197e-07, + "loss": 0.7314, + "step": 70996 + }, + { + "epoch": 1.82, + "learning_rate": 7.077829512040283e-07, + "loss": 0.7852, + "step": 70997 + }, + { + "epoch": 1.82, + "learning_rate": 7.077564886212739e-07, + "loss": 0.6748, + "step": 70998 + }, + { + "epoch": 1.82, + "learning_rate": 7.077300262622772e-07, + "loss": 0.7285, + "step": 70999 + }, + { + "epoch": 1.82, + "learning_rate": 7.077035641270581e-07, + "loss": 0.6963, + "step": 71000 + }, + { + "epoch": 1.82, + "learning_rate": 7.076771022156367e-07, + "loss": 0.5269, + "step": 71001 + }, + { + "epoch": 1.82, + "learning_rate": 7.076506405280336e-07, + "loss": 0.6504, + "step": 71002 + }, + { + "epoch": 1.82, + "learning_rate": 7.076241790642689e-07, + "loss": 0.7471, + "step": 71003 + }, + { + "epoch": 1.82, + "learning_rate": 7.07597717824363e-07, + "loss": 0.6431, + "step": 71004 + }, + { + "epoch": 1.82, + "learning_rate": 7.075712568083361e-07, + "loss": 0.5513, + "step": 71005 + }, + { + "epoch": 1.82, + "learning_rate": 7.075447960162084e-07, + "loss": 0.4443, + "step": 71006 + }, + { + "epoch": 1.82, + "learning_rate": 7.075183354480001e-07, + "loss": 0.5825, + "step": 71007 + }, + { + "epoch": 1.82, + "learning_rate": 7.074918751037317e-07, + "loss": 0.6621, + "step": 71008 + }, + { + "epoch": 1.82, + "learning_rate": 7.074654149834236e-07, + "loss": 0.6587, + "step": 71009 + }, + { + "epoch": 1.82, + "learning_rate": 7.074389550870954e-07, + "loss": 0.6797, + "step": 71010 + }, + { + "epoch": 1.82, + "learning_rate": 7.07412495414768e-07, + "loss": 0.7002, + "step": 71011 + }, + { + "epoch": 1.82, + "learning_rate": 7.073860359664609e-07, + "loss": 0.7383, + "step": 71012 + }, + { + "epoch": 1.82, + "learning_rate": 7.073595767421954e-07, + "loss": 0.748, + "step": 71013 + }, + { + "epoch": 1.82, + "learning_rate": 7.073331177419907e-07, + "loss": 0.5693, + "step": 71014 + }, + { + "epoch": 1.82, + "learning_rate": 7.073066589658681e-07, + "loss": 0.5459, + "step": 71015 + }, + { + "epoch": 1.82, + "learning_rate": 7.072802004138472e-07, + "loss": 0.7676, + "step": 71016 + }, + { + "epoch": 1.82, + "learning_rate": 7.072537420859481e-07, + "loss": 0.4183, + "step": 71017 + }, + { + "epoch": 1.82, + "learning_rate": 7.072272839821916e-07, + "loss": 0.5259, + "step": 71018 + }, + { + "epoch": 1.82, + "learning_rate": 7.072008261025981e-07, + "loss": 0.6558, + "step": 71019 + }, + { + "epoch": 1.82, + "learning_rate": 7.071743684471868e-07, + "loss": 0.6689, + "step": 71020 + }, + { + "epoch": 1.82, + "learning_rate": 7.071479110159789e-07, + "loss": 0.793, + "step": 71021 + }, + { + "epoch": 1.82, + "learning_rate": 7.071214538089943e-07, + "loss": 0.7275, + "step": 71022 + }, + { + "epoch": 1.82, + "learning_rate": 7.070949968262534e-07, + "loss": 0.7363, + "step": 71023 + }, + { + "epoch": 1.82, + "learning_rate": 7.070685400677762e-07, + "loss": 0.7334, + "step": 71024 + }, + { + "epoch": 1.82, + "learning_rate": 7.070420835335833e-07, + "loss": 0.3972, + "step": 71025 + }, + { + "epoch": 1.82, + "learning_rate": 7.070156272236946e-07, + "loss": 0.6777, + "step": 71026 + }, + { + "epoch": 1.82, + "learning_rate": 7.06989171138131e-07, + "loss": 0.5884, + "step": 71027 + }, + { + "epoch": 1.82, + "learning_rate": 7.069627152769119e-07, + "loss": 0.6211, + "step": 71028 + }, + { + "epoch": 1.82, + "learning_rate": 7.069362596400585e-07, + "loss": 0.7085, + "step": 71029 + }, + { + "epoch": 1.82, + "learning_rate": 7.069098042275903e-07, + "loss": 0.5977, + "step": 71030 + }, + { + "epoch": 1.82, + "learning_rate": 7.068833490395275e-07, + "loss": 0.6279, + "step": 71031 + }, + { + "epoch": 1.82, + "learning_rate": 7.068568940758908e-07, + "loss": 0.427, + "step": 71032 + }, + { + "epoch": 1.82, + "learning_rate": 7.068304393367005e-07, + "loss": 0.4592, + "step": 71033 + }, + { + "epoch": 1.82, + "learning_rate": 7.068039848219763e-07, + "loss": 0.519, + "step": 71034 + }, + { + "epoch": 1.82, + "learning_rate": 7.067775305317391e-07, + "loss": 0.4492, + "step": 71035 + }, + { + "epoch": 1.82, + "learning_rate": 7.067510764660086e-07, + "loss": 0.8262, + "step": 71036 + }, + { + "epoch": 1.82, + "learning_rate": 7.067246226248056e-07, + "loss": 0.5742, + "step": 71037 + }, + { + "epoch": 1.82, + "learning_rate": 7.066981690081497e-07, + "loss": 0.5483, + "step": 71038 + }, + { + "epoch": 1.82, + "learning_rate": 7.06671715616062e-07, + "loss": 0.6812, + "step": 71039 + }, + { + "epoch": 1.82, + "learning_rate": 7.066452624485622e-07, + "loss": 0.6104, + "step": 71040 + }, + { + "epoch": 1.82, + "learning_rate": 7.066188095056702e-07, + "loss": 0.4399, + "step": 71041 + }, + { + "epoch": 1.82, + "learning_rate": 7.065923567874072e-07, + "loss": 0.7383, + "step": 71042 + }, + { + "epoch": 1.82, + "learning_rate": 7.065659042937924e-07, + "loss": 0.5161, + "step": 71043 + }, + { + "epoch": 1.82, + "learning_rate": 7.065394520248471e-07, + "loss": 0.6177, + "step": 71044 + }, + { + "epoch": 1.82, + "learning_rate": 7.065129999805906e-07, + "loss": 0.5647, + "step": 71045 + }, + { + "epoch": 1.82, + "learning_rate": 7.06486548161044e-07, + "loss": 0.5659, + "step": 71046 + }, + { + "epoch": 1.82, + "learning_rate": 7.064600965662268e-07, + "loss": 0.562, + "step": 71047 + }, + { + "epoch": 1.82, + "learning_rate": 7.064336451961599e-07, + "loss": 0.7627, + "step": 71048 + }, + { + "epoch": 1.82, + "learning_rate": 7.064071940508635e-07, + "loss": 0.6211, + "step": 71049 + }, + { + "epoch": 1.82, + "learning_rate": 7.063807431303573e-07, + "loss": 0.7744, + "step": 71050 + }, + { + "epoch": 1.82, + "learning_rate": 7.063542924346618e-07, + "loss": 0.5652, + "step": 71051 + }, + { + "epoch": 1.82, + "learning_rate": 7.063278419637973e-07, + "loss": 0.7773, + "step": 71052 + }, + { + "epoch": 1.82, + "learning_rate": 7.063013917177841e-07, + "loss": 0.8066, + "step": 71053 + }, + { + "epoch": 1.82, + "learning_rate": 7.062749416966425e-07, + "loss": 0.7256, + "step": 71054 + }, + { + "epoch": 1.82, + "learning_rate": 7.062484919003924e-07, + "loss": 0.5879, + "step": 71055 + }, + { + "epoch": 1.82, + "learning_rate": 7.062220423290545e-07, + "loss": 0.9297, + "step": 71056 + }, + { + "epoch": 1.82, + "learning_rate": 7.061955929826489e-07, + "loss": 0.5815, + "step": 71057 + }, + { + "epoch": 1.82, + "learning_rate": 7.061691438611959e-07, + "loss": 0.5452, + "step": 71058 + }, + { + "epoch": 1.82, + "learning_rate": 7.061426949647159e-07, + "loss": 0.6836, + "step": 71059 + }, + { + "epoch": 1.82, + "learning_rate": 7.061162462932284e-07, + "loss": 0.7568, + "step": 71060 + }, + { + "epoch": 1.82, + "learning_rate": 7.060897978467546e-07, + "loss": 0.7285, + "step": 71061 + }, + { + "epoch": 1.82, + "learning_rate": 7.06063349625314e-07, + "loss": 0.5532, + "step": 71062 + }, + { + "epoch": 1.82, + "learning_rate": 7.060369016289274e-07, + "loss": 0.8428, + "step": 71063 + }, + { + "epoch": 1.82, + "learning_rate": 7.060104538576146e-07, + "loss": 0.6924, + "step": 71064 + }, + { + "epoch": 1.82, + "learning_rate": 7.059840063113962e-07, + "loss": 0.6538, + "step": 71065 + }, + { + "epoch": 1.82, + "learning_rate": 7.059575589902923e-07, + "loss": 0.5947, + "step": 71066 + }, + { + "epoch": 1.82, + "learning_rate": 7.059311118943233e-07, + "loss": 0.6592, + "step": 71067 + }, + { + "epoch": 1.82, + "learning_rate": 7.05904665023509e-07, + "loss": 0.4854, + "step": 71068 + }, + { + "epoch": 1.82, + "learning_rate": 7.058782183778709e-07, + "loss": 0.5002, + "step": 71069 + }, + { + "epoch": 1.82, + "learning_rate": 7.058517719574275e-07, + "loss": 0.7178, + "step": 71070 + }, + { + "epoch": 1.82, + "learning_rate": 7.058253257622e-07, + "loss": 0.6514, + "step": 71071 + }, + { + "epoch": 1.82, + "learning_rate": 7.057988797922086e-07, + "loss": 0.5767, + "step": 71072 + }, + { + "epoch": 1.82, + "learning_rate": 7.057724340474734e-07, + "loss": 0.6982, + "step": 71073 + }, + { + "epoch": 1.82, + "learning_rate": 7.057459885280145e-07, + "loss": 0.6846, + "step": 71074 + }, + { + "epoch": 1.82, + "learning_rate": 7.057195432338527e-07, + "loss": 0.6992, + "step": 71075 + }, + { + "epoch": 1.82, + "learning_rate": 7.056930981650078e-07, + "loss": 0.6372, + "step": 71076 + }, + { + "epoch": 1.82, + "learning_rate": 7.056666533215001e-07, + "loss": 0.5558, + "step": 71077 + }, + { + "epoch": 1.82, + "learning_rate": 7.056402087033499e-07, + "loss": 0.7529, + "step": 71078 + }, + { + "epoch": 1.82, + "learning_rate": 7.056137643105779e-07, + "loss": 0.5688, + "step": 71079 + }, + { + "epoch": 1.82, + "learning_rate": 7.055873201432035e-07, + "loss": 0.6514, + "step": 71080 + }, + { + "epoch": 1.82, + "learning_rate": 7.055608762012472e-07, + "loss": 0.5566, + "step": 71081 + }, + { + "epoch": 1.82, + "learning_rate": 7.055344324847299e-07, + "loss": 0.5811, + "step": 71082 + }, + { + "epoch": 1.82, + "learning_rate": 7.055079889936708e-07, + "loss": 0.603, + "step": 71083 + }, + { + "epoch": 1.82, + "learning_rate": 7.05481545728091e-07, + "loss": 0.7275, + "step": 71084 + }, + { + "epoch": 1.82, + "learning_rate": 7.054551026880103e-07, + "loss": 0.5603, + "step": 71085 + }, + { + "epoch": 1.82, + "learning_rate": 7.054286598734491e-07, + "loss": 0.6987, + "step": 71086 + }, + { + "epoch": 1.82, + "learning_rate": 7.054022172844278e-07, + "loss": 0.771, + "step": 71087 + }, + { + "epoch": 1.82, + "learning_rate": 7.053757749209664e-07, + "loss": 0.6416, + "step": 71088 + }, + { + "epoch": 1.82, + "learning_rate": 7.053493327830853e-07, + "loss": 0.5653, + "step": 71089 + }, + { + "epoch": 1.82, + "learning_rate": 7.053228908708047e-07, + "loss": 0.666, + "step": 71090 + }, + { + "epoch": 1.82, + "learning_rate": 7.052964491841445e-07, + "loss": 0.5934, + "step": 71091 + }, + { + "epoch": 1.82, + "learning_rate": 7.052700077231255e-07, + "loss": 0.646, + "step": 71092 + }, + { + "epoch": 1.82, + "learning_rate": 7.052435664877675e-07, + "loss": 0.6304, + "step": 71093 + }, + { + "epoch": 1.82, + "learning_rate": 7.052171254780912e-07, + "loss": 0.6313, + "step": 71094 + }, + { + "epoch": 1.82, + "learning_rate": 7.051906846941162e-07, + "loss": 0.7402, + "step": 71095 + }, + { + "epoch": 1.82, + "learning_rate": 7.051642441358636e-07, + "loss": 0.6162, + "step": 71096 + }, + { + "epoch": 1.82, + "learning_rate": 7.051378038033529e-07, + "loss": 0.7891, + "step": 71097 + }, + { + "epoch": 1.82, + "learning_rate": 7.051113636966047e-07, + "loss": 0.7422, + "step": 71098 + }, + { + "epoch": 1.82, + "learning_rate": 7.050849238156396e-07, + "loss": 0.5635, + "step": 71099 + }, + { + "epoch": 1.82, + "learning_rate": 7.050584841604767e-07, + "loss": 0.6445, + "step": 71100 + }, + { + "epoch": 1.82, + "learning_rate": 7.050320447311374e-07, + "loss": 0.6738, + "step": 71101 + }, + { + "epoch": 1.82, + "learning_rate": 7.050056055276412e-07, + "loss": 0.5249, + "step": 71102 + }, + { + "epoch": 1.82, + "learning_rate": 7.049791665500089e-07, + "loss": 0.5193, + "step": 71103 + }, + { + "epoch": 1.82, + "learning_rate": 7.049527277982602e-07, + "loss": 0.7119, + "step": 71104 + }, + { + "epoch": 1.82, + "learning_rate": 7.049262892724159e-07, + "loss": 0.6855, + "step": 71105 + }, + { + "epoch": 1.82, + "learning_rate": 7.048998509724959e-07, + "loss": 0.6113, + "step": 71106 + }, + { + "epoch": 1.82, + "learning_rate": 7.048734128985204e-07, + "loss": 0.6543, + "step": 71107 + }, + { + "epoch": 1.82, + "learning_rate": 7.048469750505099e-07, + "loss": 0.6455, + "step": 71108 + }, + { + "epoch": 1.82, + "learning_rate": 7.048205374284848e-07, + "loss": 0.6235, + "step": 71109 + }, + { + "epoch": 1.82, + "learning_rate": 7.047941000324645e-07, + "loss": 0.4824, + "step": 71110 + }, + { + "epoch": 1.82, + "learning_rate": 7.047676628624701e-07, + "loss": 0.6865, + "step": 71111 + }, + { + "epoch": 1.82, + "learning_rate": 7.047412259185213e-07, + "loss": 0.7637, + "step": 71112 + }, + { + "epoch": 1.82, + "learning_rate": 7.047147892006388e-07, + "loss": 0.7041, + "step": 71113 + }, + { + "epoch": 1.82, + "learning_rate": 7.046883527088423e-07, + "loss": 0.7246, + "step": 71114 + }, + { + "epoch": 1.82, + "learning_rate": 7.046619164431526e-07, + "loss": 0.5676, + "step": 71115 + }, + { + "epoch": 1.82, + "learning_rate": 7.046354804035894e-07, + "loss": 0.6221, + "step": 71116 + }, + { + "epoch": 1.82, + "learning_rate": 7.046090445901736e-07, + "loss": 0.6602, + "step": 71117 + }, + { + "epoch": 1.82, + "learning_rate": 7.045826090029247e-07, + "loss": 0.5415, + "step": 71118 + }, + { + "epoch": 1.82, + "learning_rate": 7.045561736418639e-07, + "loss": 0.7061, + "step": 71119 + }, + { + "epoch": 1.82, + "learning_rate": 7.045297385070106e-07, + "loss": 0.6602, + "step": 71120 + }, + { + "epoch": 1.82, + "learning_rate": 7.045033035983851e-07, + "loss": 0.5928, + "step": 71121 + }, + { + "epoch": 1.82, + "learning_rate": 7.044768689160078e-07, + "loss": 0.6958, + "step": 71122 + }, + { + "epoch": 1.82, + "learning_rate": 7.044504344598994e-07, + "loss": 0.6128, + "step": 71123 + }, + { + "epoch": 1.82, + "learning_rate": 7.044240002300791e-07, + "loss": 0.5767, + "step": 71124 + }, + { + "epoch": 1.82, + "learning_rate": 7.043975662265682e-07, + "loss": 0.7065, + "step": 71125 + }, + { + "epoch": 1.82, + "learning_rate": 7.043711324493862e-07, + "loss": 0.6787, + "step": 71126 + }, + { + "epoch": 1.82, + "learning_rate": 7.043446988985538e-07, + "loss": 0.5342, + "step": 71127 + }, + { + "epoch": 1.82, + "learning_rate": 7.043182655740909e-07, + "loss": 0.5244, + "step": 71128 + }, + { + "epoch": 1.82, + "learning_rate": 7.042918324760184e-07, + "loss": 0.5557, + "step": 71129 + }, + { + "epoch": 1.82, + "learning_rate": 7.042653996043558e-07, + "loss": 0.8008, + "step": 71130 + }, + { + "epoch": 1.82, + "learning_rate": 7.042389669591233e-07, + "loss": 0.6162, + "step": 71131 + }, + { + "epoch": 1.82, + "learning_rate": 7.042125345403418e-07, + "loss": 0.4187, + "step": 71132 + }, + { + "epoch": 1.82, + "learning_rate": 7.041861023480308e-07, + "loss": 0.5366, + "step": 71133 + }, + { + "epoch": 1.82, + "learning_rate": 7.041596703822111e-07, + "loss": 0.8281, + "step": 71134 + }, + { + "epoch": 1.82, + "learning_rate": 7.041332386429026e-07, + "loss": 0.6267, + "step": 71135 + }, + { + "epoch": 1.82, + "learning_rate": 7.04106807130126e-07, + "loss": 0.7578, + "step": 71136 + }, + { + "epoch": 1.82, + "learning_rate": 7.040803758439006e-07, + "loss": 0.6167, + "step": 71137 + }, + { + "epoch": 1.82, + "learning_rate": 7.040539447842479e-07, + "loss": 0.6235, + "step": 71138 + }, + { + "epoch": 1.82, + "learning_rate": 7.040275139511875e-07, + "loss": 0.6035, + "step": 71139 + }, + { + "epoch": 1.82, + "learning_rate": 7.040010833447394e-07, + "loss": 0.5181, + "step": 71140 + }, + { + "epoch": 1.82, + "learning_rate": 7.039746529649239e-07, + "loss": 0.6064, + "step": 71141 + }, + { + "epoch": 1.82, + "learning_rate": 7.039482228117616e-07, + "loss": 0.7578, + "step": 71142 + }, + { + "epoch": 1.82, + "learning_rate": 7.039217928852724e-07, + "loss": 0.6523, + "step": 71143 + }, + { + "epoch": 1.82, + "learning_rate": 7.038953631854767e-07, + "loss": 0.615, + "step": 71144 + }, + { + "epoch": 1.82, + "learning_rate": 7.038689337123946e-07, + "loss": 0.6079, + "step": 71145 + }, + { + "epoch": 1.82, + "learning_rate": 7.038425044660465e-07, + "loss": 0.615, + "step": 71146 + }, + { + "epoch": 1.82, + "learning_rate": 7.038160754464527e-07, + "loss": 0.6133, + "step": 71147 + }, + { + "epoch": 1.82, + "learning_rate": 7.037896466536333e-07, + "loss": 0.5625, + "step": 71148 + }, + { + "epoch": 1.82, + "learning_rate": 7.037632180876087e-07, + "loss": 0.5095, + "step": 71149 + }, + { + "epoch": 1.82, + "learning_rate": 7.037367897483987e-07, + "loss": 0.6079, + "step": 71150 + }, + { + "epoch": 1.82, + "learning_rate": 7.037103616360239e-07, + "loss": 0.7539, + "step": 71151 + }, + { + "epoch": 1.82, + "learning_rate": 7.036839337505043e-07, + "loss": 0.6875, + "step": 71152 + }, + { + "epoch": 1.82, + "learning_rate": 7.036575060918606e-07, + "loss": 0.7871, + "step": 71153 + }, + { + "epoch": 1.82, + "learning_rate": 7.036310786601124e-07, + "loss": 0.6895, + "step": 71154 + }, + { + "epoch": 1.82, + "learning_rate": 7.036046514552805e-07, + "loss": 0.7031, + "step": 71155 + }, + { + "epoch": 1.82, + "learning_rate": 7.035782244773847e-07, + "loss": 0.6406, + "step": 71156 + }, + { + "epoch": 1.82, + "learning_rate": 7.035517977264456e-07, + "loss": 0.5669, + "step": 71157 + }, + { + "epoch": 1.82, + "learning_rate": 7.035253712024831e-07, + "loss": 0.4261, + "step": 71158 + }, + { + "epoch": 1.82, + "learning_rate": 7.034989449055181e-07, + "loss": 0.5454, + "step": 71159 + }, + { + "epoch": 1.82, + "learning_rate": 7.034725188355697e-07, + "loss": 0.7539, + "step": 71160 + }, + { + "epoch": 1.82, + "learning_rate": 7.034460929926591e-07, + "loss": 0.5728, + "step": 71161 + }, + { + "epoch": 1.82, + "learning_rate": 7.034196673768058e-07, + "loss": 0.6318, + "step": 71162 + }, + { + "epoch": 1.82, + "learning_rate": 7.033932419880309e-07, + "loss": 0.7021, + "step": 71163 + }, + { + "epoch": 1.82, + "learning_rate": 7.033668168263538e-07, + "loss": 0.8242, + "step": 71164 + }, + { + "epoch": 1.82, + "learning_rate": 7.033403918917952e-07, + "loss": 0.6323, + "step": 71165 + }, + { + "epoch": 1.82, + "learning_rate": 7.033139671843751e-07, + "loss": 0.6445, + "step": 71166 + }, + { + "epoch": 1.82, + "learning_rate": 7.032875427041141e-07, + "loss": 0.5654, + "step": 71167 + }, + { + "epoch": 1.82, + "learning_rate": 7.03261118451032e-07, + "loss": 0.6582, + "step": 71168 + }, + { + "epoch": 1.82, + "learning_rate": 7.032346944251495e-07, + "loss": 0.5601, + "step": 71169 + }, + { + "epoch": 1.82, + "learning_rate": 7.032082706264864e-07, + "loss": 0.7246, + "step": 71170 + }, + { + "epoch": 1.82, + "learning_rate": 7.031818470550629e-07, + "loss": 0.6426, + "step": 71171 + }, + { + "epoch": 1.82, + "learning_rate": 7.031554237108997e-07, + "loss": 0.6077, + "step": 71172 + }, + { + "epoch": 1.82, + "learning_rate": 7.031290005940163e-07, + "loss": 0.5864, + "step": 71173 + }, + { + "epoch": 1.82, + "learning_rate": 7.031025777044338e-07, + "loss": 0.6113, + "step": 71174 + }, + { + "epoch": 1.82, + "learning_rate": 7.030761550421718e-07, + "loss": 0.7988, + "step": 71175 + }, + { + "epoch": 1.82, + "learning_rate": 7.030497326072509e-07, + "loss": 0.6655, + "step": 71176 + }, + { + "epoch": 1.82, + "learning_rate": 7.030233103996908e-07, + "loss": 0.6755, + "step": 71177 + }, + { + "epoch": 1.82, + "learning_rate": 7.029968884195125e-07, + "loss": 0.645, + "step": 71178 + }, + { + "epoch": 1.82, + "learning_rate": 7.029704666667359e-07, + "loss": 0.6143, + "step": 71179 + }, + { + "epoch": 1.82, + "learning_rate": 7.029440451413811e-07, + "loss": 0.6416, + "step": 71180 + }, + { + "epoch": 1.82, + "learning_rate": 7.02917623843468e-07, + "loss": 0.6367, + "step": 71181 + }, + { + "epoch": 1.82, + "learning_rate": 7.028912027730175e-07, + "loss": 0.7593, + "step": 71182 + }, + { + "epoch": 1.82, + "learning_rate": 7.028647819300493e-07, + "loss": 0.6943, + "step": 71183 + }, + { + "epoch": 1.82, + "learning_rate": 7.028383613145842e-07, + "loss": 0.6084, + "step": 71184 + }, + { + "epoch": 1.82, + "learning_rate": 7.028119409266417e-07, + "loss": 0.7842, + "step": 71185 + }, + { + "epoch": 1.82, + "learning_rate": 7.027855207662429e-07, + "loss": 0.5693, + "step": 71186 + }, + { + "epoch": 1.82, + "learning_rate": 7.027591008334072e-07, + "loss": 0.6641, + "step": 71187 + }, + { + "epoch": 1.82, + "learning_rate": 7.027326811281554e-07, + "loss": 0.6719, + "step": 71188 + }, + { + "epoch": 1.82, + "learning_rate": 7.027062616505078e-07, + "loss": 0.6245, + "step": 71189 + }, + { + "epoch": 1.82, + "learning_rate": 7.026798424004838e-07, + "loss": 0.8369, + "step": 71190 + }, + { + "epoch": 1.82, + "learning_rate": 7.026534233781045e-07, + "loss": 0.7568, + "step": 71191 + }, + { + "epoch": 1.82, + "learning_rate": 7.026270045833896e-07, + "loss": 0.4941, + "step": 71192 + }, + { + "epoch": 1.82, + "learning_rate": 7.026005860163596e-07, + "loss": 0.5601, + "step": 71193 + }, + { + "epoch": 1.82, + "learning_rate": 7.025741676770344e-07, + "loss": 0.5894, + "step": 71194 + }, + { + "epoch": 1.82, + "learning_rate": 7.02547749565435e-07, + "loss": 0.6636, + "step": 71195 + }, + { + "epoch": 1.82, + "learning_rate": 7.025213316815808e-07, + "loss": 0.8184, + "step": 71196 + }, + { + "epoch": 1.82, + "learning_rate": 7.024949140254923e-07, + "loss": 0.5801, + "step": 71197 + }, + { + "epoch": 1.82, + "learning_rate": 7.024684965971899e-07, + "loss": 0.752, + "step": 71198 + }, + { + "epoch": 1.82, + "learning_rate": 7.02442079396694e-07, + "loss": 0.6963, + "step": 71199 + }, + { + "epoch": 1.82, + "learning_rate": 7.024156624240241e-07, + "loss": 0.6963, + "step": 71200 + }, + { + "epoch": 1.82, + "learning_rate": 7.023892456792009e-07, + "loss": 0.5708, + "step": 71201 + }, + { + "epoch": 1.82, + "learning_rate": 7.023628291622445e-07, + "loss": 0.6816, + "step": 71202 + }, + { + "epoch": 1.82, + "learning_rate": 7.023364128731752e-07, + "loss": 0.667, + "step": 71203 + }, + { + "epoch": 1.82, + "learning_rate": 7.023099968120133e-07, + "loss": 0.5264, + "step": 71204 + }, + { + "epoch": 1.83, + "learning_rate": 7.02283580978779e-07, + "loss": 0.6436, + "step": 71205 + }, + { + "epoch": 1.83, + "learning_rate": 7.022571653734924e-07, + "loss": 0.595, + "step": 71206 + }, + { + "epoch": 1.83, + "learning_rate": 7.022307499961737e-07, + "loss": 0.5079, + "step": 71207 + }, + { + "epoch": 1.83, + "learning_rate": 7.022043348468433e-07, + "loss": 0.584, + "step": 71208 + }, + { + "epoch": 1.83, + "learning_rate": 7.021779199255216e-07, + "loss": 0.5234, + "step": 71209 + }, + { + "epoch": 1.83, + "learning_rate": 7.021515052322285e-07, + "loss": 0.6904, + "step": 71210 + }, + { + "epoch": 1.83, + "learning_rate": 7.02125090766984e-07, + "loss": 0.6484, + "step": 71211 + }, + { + "epoch": 1.83, + "learning_rate": 7.020986765298089e-07, + "loss": 0.5308, + "step": 71212 + }, + { + "epoch": 1.83, + "learning_rate": 7.020722625207231e-07, + "loss": 0.707, + "step": 71213 + }, + { + "epoch": 1.83, + "learning_rate": 7.020458487397467e-07, + "loss": 0.6035, + "step": 71214 + }, + { + "epoch": 1.83, + "learning_rate": 7.020194351869003e-07, + "loss": 0.6562, + "step": 71215 + }, + { + "epoch": 1.83, + "learning_rate": 7.019930218622035e-07, + "loss": 0.4878, + "step": 71216 + }, + { + "epoch": 1.83, + "learning_rate": 7.019666087656773e-07, + "loss": 0.6597, + "step": 71217 + }, + { + "epoch": 1.83, + "learning_rate": 7.019401958973414e-07, + "loss": 0.604, + "step": 71218 + }, + { + "epoch": 1.83, + "learning_rate": 7.019137832572166e-07, + "loss": 0.7021, + "step": 71219 + }, + { + "epoch": 1.83, + "learning_rate": 7.018873708453226e-07, + "loss": 0.6201, + "step": 71220 + }, + { + "epoch": 1.83, + "learning_rate": 7.018609586616793e-07, + "loss": 0.6802, + "step": 71221 + }, + { + "epoch": 1.83, + "learning_rate": 7.018345467063077e-07, + "loss": 0.5801, + "step": 71222 + }, + { + "epoch": 1.83, + "learning_rate": 7.018081349792274e-07, + "loss": 0.5596, + "step": 71223 + }, + { + "epoch": 1.83, + "learning_rate": 7.017817234804592e-07, + "loss": 0.5957, + "step": 71224 + }, + { + "epoch": 1.83, + "learning_rate": 7.017553122100227e-07, + "loss": 0.4199, + "step": 71225 + }, + { + "epoch": 1.83, + "learning_rate": 7.017289011679388e-07, + "loss": 0.54, + "step": 71226 + }, + { + "epoch": 1.83, + "learning_rate": 7.01702490354227e-07, + "loss": 0.678, + "step": 71227 + }, + { + "epoch": 1.83, + "learning_rate": 7.016760797689084e-07, + "loss": 0.6709, + "step": 71228 + }, + { + "epoch": 1.83, + "learning_rate": 7.016496694120024e-07, + "loss": 0.835, + "step": 71229 + }, + { + "epoch": 1.83, + "learning_rate": 7.016232592835296e-07, + "loss": 0.7686, + "step": 71230 + }, + { + "epoch": 1.83, + "learning_rate": 7.0159684938351e-07, + "loss": 0.5913, + "step": 71231 + }, + { + "epoch": 1.83, + "learning_rate": 7.015704397119641e-07, + "loss": 0.5073, + "step": 71232 + }, + { + "epoch": 1.83, + "learning_rate": 7.015440302689118e-07, + "loss": 0.7109, + "step": 71233 + }, + { + "epoch": 1.83, + "learning_rate": 7.015176210543738e-07, + "loss": 0.5098, + "step": 71234 + }, + { + "epoch": 1.83, + "learning_rate": 7.014912120683697e-07, + "loss": 0.6318, + "step": 71235 + }, + { + "epoch": 1.83, + "learning_rate": 7.014648033109203e-07, + "loss": 0.6445, + "step": 71236 + }, + { + "epoch": 1.83, + "learning_rate": 7.014383947820455e-07, + "loss": 0.6875, + "step": 71237 + }, + { + "epoch": 1.83, + "learning_rate": 7.014119864817658e-07, + "loss": 0.6113, + "step": 71238 + }, + { + "epoch": 1.83, + "learning_rate": 7.01385578410101e-07, + "loss": 0.7627, + "step": 71239 + }, + { + "epoch": 1.83, + "learning_rate": 7.013591705670715e-07, + "loss": 0.6509, + "step": 71240 + }, + { + "epoch": 1.83, + "learning_rate": 7.013327629526977e-07, + "loss": 0.4802, + "step": 71241 + }, + { + "epoch": 1.83, + "learning_rate": 7.013063555669993e-07, + "loss": 0.6729, + "step": 71242 + }, + { + "epoch": 1.83, + "learning_rate": 7.012799484099974e-07, + "loss": 0.7773, + "step": 71243 + }, + { + "epoch": 1.83, + "learning_rate": 7.012535414817113e-07, + "loss": 0.5537, + "step": 71244 + }, + { + "epoch": 1.83, + "learning_rate": 7.012271347821619e-07, + "loss": 0.5781, + "step": 71245 + }, + { + "epoch": 1.83, + "learning_rate": 7.012007283113689e-07, + "loss": 0.6357, + "step": 71246 + }, + { + "epoch": 1.83, + "learning_rate": 7.011743220693529e-07, + "loss": 0.4514, + "step": 71247 + }, + { + "epoch": 1.83, + "learning_rate": 7.011479160561344e-07, + "loss": 0.5918, + "step": 71248 + }, + { + "epoch": 1.83, + "learning_rate": 7.011215102717328e-07, + "loss": 0.6157, + "step": 71249 + }, + { + "epoch": 1.83, + "learning_rate": 7.010951047161687e-07, + "loss": 0.5571, + "step": 71250 + }, + { + "epoch": 1.83, + "learning_rate": 7.010686993894624e-07, + "loss": 0.4269, + "step": 71251 + }, + { + "epoch": 1.83, + "learning_rate": 7.010422942916336e-07, + "loss": 0.6584, + "step": 71252 + }, + { + "epoch": 1.83, + "learning_rate": 7.010158894227036e-07, + "loss": 0.6445, + "step": 71253 + }, + { + "epoch": 1.83, + "learning_rate": 7.009894847826916e-07, + "loss": 0.6445, + "step": 71254 + }, + { + "epoch": 1.83, + "learning_rate": 7.009630803716184e-07, + "loss": 0.4875, + "step": 71255 + }, + { + "epoch": 1.83, + "learning_rate": 7.009366761895038e-07, + "loss": 0.7017, + "step": 71256 + }, + { + "epoch": 1.83, + "learning_rate": 7.009102722363685e-07, + "loss": 0.834, + "step": 71257 + }, + { + "epoch": 1.83, + "learning_rate": 7.008838685122327e-07, + "loss": 0.8193, + "step": 71258 + }, + { + "epoch": 1.83, + "learning_rate": 7.008574650171157e-07, + "loss": 0.6616, + "step": 71259 + }, + { + "epoch": 1.83, + "learning_rate": 7.008310617510389e-07, + "loss": 0.7002, + "step": 71260 + }, + { + "epoch": 1.83, + "learning_rate": 7.008046587140218e-07, + "loss": 0.6553, + "step": 71261 + }, + { + "epoch": 1.83, + "learning_rate": 7.007782559060847e-07, + "loss": 0.6807, + "step": 71262 + }, + { + "epoch": 1.83, + "learning_rate": 7.00751853327248e-07, + "loss": 0.7285, + "step": 71263 + }, + { + "epoch": 1.83, + "learning_rate": 7.00725450977532e-07, + "loss": 0.7959, + "step": 71264 + }, + { + "epoch": 1.83, + "learning_rate": 7.006990488569564e-07, + "loss": 0.6416, + "step": 71265 + }, + { + "epoch": 1.83, + "learning_rate": 7.006726469655422e-07, + "loss": 0.6182, + "step": 71266 + }, + { + "epoch": 1.83, + "learning_rate": 7.006462453033089e-07, + "loss": 0.6475, + "step": 71267 + }, + { + "epoch": 1.83, + "learning_rate": 7.006198438702775e-07, + "loss": 0.5654, + "step": 71268 + }, + { + "epoch": 1.83, + "learning_rate": 7.005934426664673e-07, + "loss": 0.6953, + "step": 71269 + }, + { + "epoch": 1.83, + "learning_rate": 7.005670416918991e-07, + "loss": 0.5669, + "step": 71270 + }, + { + "epoch": 1.83, + "learning_rate": 7.005406409465926e-07, + "loss": 0.8037, + "step": 71271 + }, + { + "epoch": 1.83, + "learning_rate": 7.005142404305688e-07, + "loss": 0.4171, + "step": 71272 + }, + { + "epoch": 1.83, + "learning_rate": 7.00487840143847e-07, + "loss": 0.6104, + "step": 71273 + }, + { + "epoch": 1.83, + "learning_rate": 7.004614400864483e-07, + "loss": 0.6309, + "step": 71274 + }, + { + "epoch": 1.83, + "learning_rate": 7.004350402583922e-07, + "loss": 0.5942, + "step": 71275 + }, + { + "epoch": 1.83, + "learning_rate": 7.004086406596994e-07, + "loss": 0.5837, + "step": 71276 + }, + { + "epoch": 1.83, + "learning_rate": 7.003822412903898e-07, + "loss": 0.6572, + "step": 71277 + }, + { + "epoch": 1.83, + "learning_rate": 7.003558421504842e-07, + "loss": 0.5996, + "step": 71278 + }, + { + "epoch": 1.83, + "learning_rate": 7.00329443240002e-07, + "loss": 0.6602, + "step": 71279 + }, + { + "epoch": 1.83, + "learning_rate": 7.003030445589637e-07, + "loss": 0.6133, + "step": 71280 + }, + { + "epoch": 1.83, + "learning_rate": 7.002766461073897e-07, + "loss": 0.6924, + "step": 71281 + }, + { + "epoch": 1.83, + "learning_rate": 7.002502478852998e-07, + "loss": 0.7236, + "step": 71282 + }, + { + "epoch": 1.83, + "learning_rate": 7.002238498927149e-07, + "loss": 0.4683, + "step": 71283 + }, + { + "epoch": 1.83, + "learning_rate": 7.001974521296545e-07, + "loss": 0.5046, + "step": 71284 + }, + { + "epoch": 1.83, + "learning_rate": 7.001710545961394e-07, + "loss": 0.4714, + "step": 71285 + }, + { + "epoch": 1.83, + "learning_rate": 7.001446572921894e-07, + "loss": 0.5669, + "step": 71286 + }, + { + "epoch": 1.83, + "learning_rate": 7.001182602178247e-07, + "loss": 0.7656, + "step": 71287 + }, + { + "epoch": 1.83, + "learning_rate": 7.000918633730661e-07, + "loss": 0.6416, + "step": 71288 + }, + { + "epoch": 1.83, + "learning_rate": 7.000654667579332e-07, + "loss": 0.6064, + "step": 71289 + }, + { + "epoch": 1.83, + "learning_rate": 7.000390703724461e-07, + "loss": 0.582, + "step": 71290 + }, + { + "epoch": 1.83, + "learning_rate": 7.000126742166256e-07, + "loss": 0.6621, + "step": 71291 + }, + { + "epoch": 1.83, + "learning_rate": 6.999862782904913e-07, + "loss": 0.7568, + "step": 71292 + }, + { + "epoch": 1.83, + "learning_rate": 6.99959882594064e-07, + "loss": 0.627, + "step": 71293 + }, + { + "epoch": 1.83, + "learning_rate": 6.999334871273634e-07, + "loss": 0.7607, + "step": 71294 + }, + { + "epoch": 1.83, + "learning_rate": 6.9990709189041e-07, + "loss": 0.5265, + "step": 71295 + }, + { + "epoch": 1.83, + "learning_rate": 6.998806968832238e-07, + "loss": 0.7207, + "step": 71296 + }, + { + "epoch": 1.83, + "learning_rate": 6.998543021058254e-07, + "loss": 0.6299, + "step": 71297 + }, + { + "epoch": 1.83, + "learning_rate": 6.998279075582349e-07, + "loss": 0.6455, + "step": 71298 + }, + { + "epoch": 1.83, + "learning_rate": 6.998015132404721e-07, + "loss": 0.6445, + "step": 71299 + }, + { + "epoch": 1.83, + "learning_rate": 6.997751191525576e-07, + "loss": 0.416, + "step": 71300 + }, + { + "epoch": 1.83, + "learning_rate": 6.997487252945113e-07, + "loss": 0.6816, + "step": 71301 + }, + { + "epoch": 1.83, + "learning_rate": 6.997223316663539e-07, + "loss": 0.6963, + "step": 71302 + }, + { + "epoch": 1.83, + "learning_rate": 6.996959382681051e-07, + "loss": 0.5554, + "step": 71303 + }, + { + "epoch": 1.83, + "learning_rate": 6.996695450997851e-07, + "loss": 0.5681, + "step": 71304 + }, + { + "epoch": 1.83, + "learning_rate": 6.996431521614147e-07, + "loss": 0.604, + "step": 71305 + }, + { + "epoch": 1.83, + "learning_rate": 6.996167594530134e-07, + "loss": 0.6201, + "step": 71306 + }, + { + "epoch": 1.83, + "learning_rate": 6.99590366974602e-07, + "loss": 0.7451, + "step": 71307 + }, + { + "epoch": 1.83, + "learning_rate": 6.995639747262005e-07, + "loss": 0.708, + "step": 71308 + }, + { + "epoch": 1.83, + "learning_rate": 6.995375827078289e-07, + "loss": 0.7134, + "step": 71309 + }, + { + "epoch": 1.83, + "learning_rate": 6.995111909195076e-07, + "loss": 0.5872, + "step": 71310 + }, + { + "epoch": 1.83, + "learning_rate": 6.994847993612566e-07, + "loss": 0.5498, + "step": 71311 + }, + { + "epoch": 1.83, + "learning_rate": 6.994584080330965e-07, + "loss": 0.7568, + "step": 71312 + }, + { + "epoch": 1.83, + "learning_rate": 6.99432016935047e-07, + "loss": 0.6177, + "step": 71313 + }, + { + "epoch": 1.83, + "learning_rate": 6.994056260671288e-07, + "loss": 0.6758, + "step": 71314 + }, + { + "epoch": 1.83, + "learning_rate": 6.993792354293617e-07, + "loss": 0.5571, + "step": 71315 + }, + { + "epoch": 1.83, + "learning_rate": 6.993528450217663e-07, + "loss": 0.7422, + "step": 71316 + }, + { + "epoch": 1.83, + "learning_rate": 6.993264548443625e-07, + "loss": 0.6172, + "step": 71317 + }, + { + "epoch": 1.83, + "learning_rate": 6.99300064897171e-07, + "loss": 0.5469, + "step": 71318 + }, + { + "epoch": 1.83, + "learning_rate": 6.992736751802113e-07, + "loss": 0.5737, + "step": 71319 + }, + { + "epoch": 1.83, + "learning_rate": 6.992472856935039e-07, + "loss": 0.5448, + "step": 71320 + }, + { + "epoch": 1.83, + "learning_rate": 6.992208964370689e-07, + "loss": 0.6592, + "step": 71321 + }, + { + "epoch": 1.83, + "learning_rate": 6.991945074109268e-07, + "loss": 0.6187, + "step": 71322 + }, + { + "epoch": 1.83, + "learning_rate": 6.991681186150974e-07, + "loss": 0.5752, + "step": 71323 + }, + { + "epoch": 1.83, + "learning_rate": 6.991417300496014e-07, + "loss": 0.6841, + "step": 71324 + }, + { + "epoch": 1.83, + "learning_rate": 6.991153417144585e-07, + "loss": 0.5391, + "step": 71325 + }, + { + "epoch": 1.83, + "learning_rate": 6.990889536096893e-07, + "loss": 0.6753, + "step": 71326 + }, + { + "epoch": 1.83, + "learning_rate": 6.990625657353137e-07, + "loss": 0.6924, + "step": 71327 + }, + { + "epoch": 1.83, + "learning_rate": 6.990361780913527e-07, + "loss": 0.5813, + "step": 71328 + }, + { + "epoch": 1.83, + "learning_rate": 6.990097906778253e-07, + "loss": 0.6006, + "step": 71329 + }, + { + "epoch": 1.83, + "learning_rate": 6.989834034947523e-07, + "loss": 0.4529, + "step": 71330 + }, + { + "epoch": 1.83, + "learning_rate": 6.989570165421538e-07, + "loss": 0.7461, + "step": 71331 + }, + { + "epoch": 1.83, + "learning_rate": 6.989306298200501e-07, + "loss": 0.6885, + "step": 71332 + }, + { + "epoch": 1.83, + "learning_rate": 6.989042433284615e-07, + "loss": 0.7422, + "step": 71333 + }, + { + "epoch": 1.83, + "learning_rate": 6.988778570674079e-07, + "loss": 0.5369, + "step": 71334 + }, + { + "epoch": 1.83, + "learning_rate": 6.9885147103691e-07, + "loss": 0.7139, + "step": 71335 + }, + { + "epoch": 1.83, + "learning_rate": 6.988250852369872e-07, + "loss": 0.7725, + "step": 71336 + }, + { + "epoch": 1.83, + "learning_rate": 6.987986996676606e-07, + "loss": 0.5674, + "step": 71337 + }, + { + "epoch": 1.83, + "learning_rate": 6.987723143289501e-07, + "loss": 0.5283, + "step": 71338 + }, + { + "epoch": 1.83, + "learning_rate": 6.987459292208757e-07, + "loss": 0.7275, + "step": 71339 + }, + { + "epoch": 1.83, + "learning_rate": 6.987195443434574e-07, + "loss": 0.6641, + "step": 71340 + }, + { + "epoch": 1.83, + "learning_rate": 6.986931596967159e-07, + "loss": 0.5332, + "step": 71341 + }, + { + "epoch": 1.83, + "learning_rate": 6.98666775280671e-07, + "loss": 0.6548, + "step": 71342 + }, + { + "epoch": 1.83, + "learning_rate": 6.986403910953431e-07, + "loss": 0.6982, + "step": 71343 + }, + { + "epoch": 1.83, + "learning_rate": 6.986140071407525e-07, + "loss": 0.6797, + "step": 71344 + }, + { + "epoch": 1.83, + "learning_rate": 6.985876234169193e-07, + "loss": 0.6777, + "step": 71345 + }, + { + "epoch": 1.83, + "learning_rate": 6.985612399238636e-07, + "loss": 0.5759, + "step": 71346 + }, + { + "epoch": 1.83, + "learning_rate": 6.985348566616059e-07, + "loss": 0.4485, + "step": 71347 + }, + { + "epoch": 1.83, + "learning_rate": 6.985084736301662e-07, + "loss": 0.6455, + "step": 71348 + }, + { + "epoch": 1.83, + "learning_rate": 6.984820908295646e-07, + "loss": 0.5151, + "step": 71349 + }, + { + "epoch": 1.83, + "learning_rate": 6.984557082598214e-07, + "loss": 0.7109, + "step": 71350 + }, + { + "epoch": 1.83, + "learning_rate": 6.984293259209567e-07, + "loss": 0.5723, + "step": 71351 + }, + { + "epoch": 1.83, + "learning_rate": 6.98402943812991e-07, + "loss": 0.5381, + "step": 71352 + }, + { + "epoch": 1.83, + "learning_rate": 6.98376561935944e-07, + "loss": 0.6064, + "step": 71353 + }, + { + "epoch": 1.83, + "learning_rate": 6.983501802898365e-07, + "loss": 0.6016, + "step": 71354 + }, + { + "epoch": 1.83, + "learning_rate": 6.983237988746881e-07, + "loss": 0.6953, + "step": 71355 + }, + { + "epoch": 1.83, + "learning_rate": 6.982974176905197e-07, + "loss": 0.7036, + "step": 71356 + }, + { + "epoch": 1.83, + "learning_rate": 6.982710367373506e-07, + "loss": 0.4917, + "step": 71357 + }, + { + "epoch": 1.83, + "learning_rate": 6.982446560152022e-07, + "loss": 0.6615, + "step": 71358 + }, + { + "epoch": 1.83, + "learning_rate": 6.982182755240935e-07, + "loss": 0.6558, + "step": 71359 + }, + { + "epoch": 1.83, + "learning_rate": 6.981918952640453e-07, + "loss": 0.5249, + "step": 71360 + }, + { + "epoch": 1.83, + "learning_rate": 6.981655152350776e-07, + "loss": 0.6631, + "step": 71361 + }, + { + "epoch": 1.83, + "learning_rate": 6.981391354372107e-07, + "loss": 0.8154, + "step": 71362 + }, + { + "epoch": 1.83, + "learning_rate": 6.981127558704647e-07, + "loss": 0.7227, + "step": 71363 + }, + { + "epoch": 1.83, + "learning_rate": 6.980863765348602e-07, + "loss": 0.5018, + "step": 71364 + }, + { + "epoch": 1.83, + "learning_rate": 6.980599974304167e-07, + "loss": 0.6514, + "step": 71365 + }, + { + "epoch": 1.83, + "learning_rate": 6.980336185571549e-07, + "loss": 0.6519, + "step": 71366 + }, + { + "epoch": 1.83, + "learning_rate": 6.980072399150948e-07, + "loss": 0.6514, + "step": 71367 + }, + { + "epoch": 1.83, + "learning_rate": 6.979808615042571e-07, + "loss": 0.7549, + "step": 71368 + }, + { + "epoch": 1.83, + "learning_rate": 6.979544833246614e-07, + "loss": 0.8271, + "step": 71369 + }, + { + "epoch": 1.83, + "learning_rate": 6.979281053763278e-07, + "loss": 0.6226, + "step": 71370 + }, + { + "epoch": 1.83, + "learning_rate": 6.979017276592768e-07, + "loss": 0.5044, + "step": 71371 + }, + { + "epoch": 1.83, + "learning_rate": 6.978753501735285e-07, + "loss": 0.5356, + "step": 71372 + }, + { + "epoch": 1.83, + "learning_rate": 6.978489729191034e-07, + "loss": 0.6592, + "step": 71373 + }, + { + "epoch": 1.83, + "learning_rate": 6.978225958960211e-07, + "loss": 0.7285, + "step": 71374 + }, + { + "epoch": 1.83, + "learning_rate": 6.977962191043025e-07, + "loss": 0.6094, + "step": 71375 + }, + { + "epoch": 1.83, + "learning_rate": 6.977698425439674e-07, + "loss": 0.6201, + "step": 71376 + }, + { + "epoch": 1.83, + "learning_rate": 6.977434662150359e-07, + "loss": 0.7158, + "step": 71377 + }, + { + "epoch": 1.83, + "learning_rate": 6.977170901175286e-07, + "loss": 0.5798, + "step": 71378 + }, + { + "epoch": 1.83, + "learning_rate": 6.976907142514652e-07, + "loss": 0.7598, + "step": 71379 + }, + { + "epoch": 1.83, + "learning_rate": 6.976643386168662e-07, + "loss": 0.5527, + "step": 71380 + }, + { + "epoch": 1.83, + "learning_rate": 6.976379632137516e-07, + "loss": 0.7705, + "step": 71381 + }, + { + "epoch": 1.83, + "learning_rate": 6.976115880421416e-07, + "loss": 0.5798, + "step": 71382 + }, + { + "epoch": 1.83, + "learning_rate": 6.975852131020567e-07, + "loss": 0.6597, + "step": 71383 + }, + { + "epoch": 1.83, + "learning_rate": 6.975588383935167e-07, + "loss": 0.7412, + "step": 71384 + }, + { + "epoch": 1.83, + "learning_rate": 6.975324639165423e-07, + "loss": 0.6724, + "step": 71385 + }, + { + "epoch": 1.83, + "learning_rate": 6.975060896711531e-07, + "loss": 0.6416, + "step": 71386 + }, + { + "epoch": 1.83, + "learning_rate": 6.974797156573698e-07, + "loss": 0.5464, + "step": 71387 + }, + { + "epoch": 1.83, + "learning_rate": 6.974533418752124e-07, + "loss": 0.6602, + "step": 71388 + }, + { + "epoch": 1.83, + "learning_rate": 6.97426968324701e-07, + "loss": 0.4913, + "step": 71389 + }, + { + "epoch": 1.83, + "learning_rate": 6.974005950058557e-07, + "loss": 0.8086, + "step": 71390 + }, + { + "epoch": 1.83, + "learning_rate": 6.973742219186969e-07, + "loss": 0.8945, + "step": 71391 + }, + { + "epoch": 1.83, + "learning_rate": 6.973478490632447e-07, + "loss": 0.5349, + "step": 71392 + }, + { + "epoch": 1.83, + "learning_rate": 6.973214764395196e-07, + "loss": 0.4771, + "step": 71393 + }, + { + "epoch": 1.83, + "learning_rate": 6.972951040475412e-07, + "loss": 0.5471, + "step": 71394 + }, + { + "epoch": 1.83, + "learning_rate": 6.972687318873303e-07, + "loss": 0.6045, + "step": 71395 + }, + { + "epoch": 1.83, + "learning_rate": 6.972423599589066e-07, + "loss": 0.6426, + "step": 71396 + }, + { + "epoch": 1.83, + "learning_rate": 6.972159882622906e-07, + "loss": 0.4121, + "step": 71397 + }, + { + "epoch": 1.83, + "learning_rate": 6.971896167975027e-07, + "loss": 0.5854, + "step": 71398 + }, + { + "epoch": 1.83, + "learning_rate": 6.971632455645623e-07, + "loss": 0.7295, + "step": 71399 + }, + { + "epoch": 1.83, + "learning_rate": 6.971368745634903e-07, + "loss": 0.4087, + "step": 71400 + }, + { + "epoch": 1.83, + "learning_rate": 6.971105037943065e-07, + "loss": 0.7363, + "step": 71401 + }, + { + "epoch": 1.83, + "learning_rate": 6.970841332570314e-07, + "loss": 0.7383, + "step": 71402 + }, + { + "epoch": 1.83, + "learning_rate": 6.97057762951685e-07, + "loss": 0.6533, + "step": 71403 + }, + { + "epoch": 1.83, + "learning_rate": 6.970313928782876e-07, + "loss": 0.5723, + "step": 71404 + }, + { + "epoch": 1.83, + "learning_rate": 6.970050230368591e-07, + "loss": 0.6885, + "step": 71405 + }, + { + "epoch": 1.83, + "learning_rate": 6.969786534274203e-07, + "loss": 0.7246, + "step": 71406 + }, + { + "epoch": 1.83, + "learning_rate": 6.969522840499906e-07, + "loss": 0.7588, + "step": 71407 + }, + { + "epoch": 1.83, + "learning_rate": 6.969259149045912e-07, + "loss": 0.7896, + "step": 71408 + }, + { + "epoch": 1.83, + "learning_rate": 6.968995459912415e-07, + "loss": 0.707, + "step": 71409 + }, + { + "epoch": 1.83, + "learning_rate": 6.968731773099616e-07, + "loss": 0.5547, + "step": 71410 + }, + { + "epoch": 1.83, + "learning_rate": 6.968468088607719e-07, + "loss": 0.5688, + "step": 71411 + }, + { + "epoch": 1.83, + "learning_rate": 6.96820440643693e-07, + "loss": 0.6531, + "step": 71412 + }, + { + "epoch": 1.83, + "learning_rate": 6.967940726587444e-07, + "loss": 0.5796, + "step": 71413 + }, + { + "epoch": 1.83, + "learning_rate": 6.967677049059469e-07, + "loss": 0.6699, + "step": 71414 + }, + { + "epoch": 1.83, + "learning_rate": 6.967413373853202e-07, + "loss": 0.5527, + "step": 71415 + }, + { + "epoch": 1.83, + "learning_rate": 6.96714970096885e-07, + "loss": 0.6243, + "step": 71416 + }, + { + "epoch": 1.83, + "learning_rate": 6.966886030406609e-07, + "loss": 0.5439, + "step": 71417 + }, + { + "epoch": 1.83, + "learning_rate": 6.966622362166689e-07, + "loss": 0.6553, + "step": 71418 + }, + { + "epoch": 1.83, + "learning_rate": 6.966358696249283e-07, + "loss": 0.8652, + "step": 71419 + }, + { + "epoch": 1.83, + "learning_rate": 6.966095032654597e-07, + "loss": 0.5864, + "step": 71420 + }, + { + "epoch": 1.83, + "learning_rate": 6.965831371382833e-07, + "loss": 0.7119, + "step": 71421 + }, + { + "epoch": 1.83, + "learning_rate": 6.965567712434191e-07, + "loss": 0.707, + "step": 71422 + }, + { + "epoch": 1.83, + "learning_rate": 6.965304055808876e-07, + "loss": 0.6807, + "step": 71423 + }, + { + "epoch": 1.83, + "learning_rate": 6.965040401507085e-07, + "loss": 0.541, + "step": 71424 + }, + { + "epoch": 1.83, + "learning_rate": 6.964776749529027e-07, + "loss": 0.7363, + "step": 71425 + }, + { + "epoch": 1.83, + "learning_rate": 6.964513099874895e-07, + "loss": 0.509, + "step": 71426 + }, + { + "epoch": 1.83, + "learning_rate": 6.964249452544902e-07, + "loss": 0.7207, + "step": 71427 + }, + { + "epoch": 1.83, + "learning_rate": 6.963985807539242e-07, + "loss": 0.6855, + "step": 71428 + }, + { + "epoch": 1.83, + "learning_rate": 6.963722164858117e-07, + "loss": 0.5127, + "step": 71429 + }, + { + "epoch": 1.83, + "learning_rate": 6.963458524501731e-07, + "loss": 0.525, + "step": 71430 + }, + { + "epoch": 1.83, + "learning_rate": 6.963194886470285e-07, + "loss": 0.5015, + "step": 71431 + }, + { + "epoch": 1.83, + "learning_rate": 6.962931250763979e-07, + "loss": 0.3411, + "step": 71432 + }, + { + "epoch": 1.83, + "learning_rate": 6.962667617383019e-07, + "loss": 0.7471, + "step": 71433 + }, + { + "epoch": 1.83, + "learning_rate": 6.962403986327603e-07, + "loss": 0.6895, + "step": 71434 + }, + { + "epoch": 1.83, + "learning_rate": 6.962140357597936e-07, + "loss": 0.6211, + "step": 71435 + }, + { + "epoch": 1.83, + "learning_rate": 6.961876731194218e-07, + "loss": 0.5928, + "step": 71436 + }, + { + "epoch": 1.83, + "learning_rate": 6.961613107116652e-07, + "loss": 0.5063, + "step": 71437 + }, + { + "epoch": 1.83, + "learning_rate": 6.96134948536544e-07, + "loss": 0.5654, + "step": 71438 + }, + { + "epoch": 1.83, + "learning_rate": 6.961085865940781e-07, + "loss": 0.7637, + "step": 71439 + }, + { + "epoch": 1.83, + "learning_rate": 6.960822248842881e-07, + "loss": 0.6328, + "step": 71440 + }, + { + "epoch": 1.83, + "learning_rate": 6.960558634071936e-07, + "loss": 0.6074, + "step": 71441 + }, + { + "epoch": 1.83, + "learning_rate": 6.960295021628156e-07, + "loss": 0.4888, + "step": 71442 + }, + { + "epoch": 1.83, + "learning_rate": 6.960031411511733e-07, + "loss": 0.6089, + "step": 71443 + }, + { + "epoch": 1.83, + "learning_rate": 6.959767803722878e-07, + "loss": 0.5073, + "step": 71444 + }, + { + "epoch": 1.83, + "learning_rate": 6.959504198261787e-07, + "loss": 0.6553, + "step": 71445 + }, + { + "epoch": 1.83, + "learning_rate": 6.959240595128666e-07, + "loss": 0.6067, + "step": 71446 + }, + { + "epoch": 1.83, + "learning_rate": 6.958976994323712e-07, + "loss": 0.7148, + "step": 71447 + }, + { + "epoch": 1.83, + "learning_rate": 6.958713395847136e-07, + "loss": 0.5781, + "step": 71448 + }, + { + "epoch": 1.83, + "learning_rate": 6.958449799699126e-07, + "loss": 0.5049, + "step": 71449 + }, + { + "epoch": 1.83, + "learning_rate": 6.958186205879896e-07, + "loss": 0.5991, + "step": 71450 + }, + { + "epoch": 1.83, + "learning_rate": 6.957922614389639e-07, + "loss": 0.7754, + "step": 71451 + }, + { + "epoch": 1.83, + "learning_rate": 6.957659025228562e-07, + "loss": 0.5334, + "step": 71452 + }, + { + "epoch": 1.83, + "learning_rate": 6.957395438396865e-07, + "loss": 0.6377, + "step": 71453 + }, + { + "epoch": 1.83, + "learning_rate": 6.957131853894752e-07, + "loss": 0.8252, + "step": 71454 + }, + { + "epoch": 1.83, + "learning_rate": 6.956868271722422e-07, + "loss": 0.5801, + "step": 71455 + }, + { + "epoch": 1.83, + "learning_rate": 6.956604691880079e-07, + "loss": 0.623, + "step": 71456 + }, + { + "epoch": 1.83, + "learning_rate": 6.956341114367922e-07, + "loss": 0.5877, + "step": 71457 + }, + { + "epoch": 1.83, + "learning_rate": 6.956077539186158e-07, + "loss": 0.6865, + "step": 71458 + }, + { + "epoch": 1.83, + "learning_rate": 6.955813966334985e-07, + "loss": 0.4045, + "step": 71459 + }, + { + "epoch": 1.83, + "learning_rate": 6.955550395814602e-07, + "loss": 0.624, + "step": 71460 + }, + { + "epoch": 1.83, + "learning_rate": 6.955286827625217e-07, + "loss": 0.7861, + "step": 71461 + }, + { + "epoch": 1.83, + "learning_rate": 6.955023261767026e-07, + "loss": 0.668, + "step": 71462 + }, + { + "epoch": 1.83, + "learning_rate": 6.954759698240236e-07, + "loss": 0.7422, + "step": 71463 + }, + { + "epoch": 1.83, + "learning_rate": 6.954496137045045e-07, + "loss": 0.5449, + "step": 71464 + }, + { + "epoch": 1.83, + "learning_rate": 6.954232578181658e-07, + "loss": 0.7314, + "step": 71465 + }, + { + "epoch": 1.83, + "learning_rate": 6.953969021650275e-07, + "loss": 0.8271, + "step": 71466 + }, + { + "epoch": 1.83, + "learning_rate": 6.953705467451096e-07, + "loss": 0.5117, + "step": 71467 + }, + { + "epoch": 1.83, + "learning_rate": 6.953441915584329e-07, + "loss": 0.6099, + "step": 71468 + }, + { + "epoch": 1.83, + "learning_rate": 6.953178366050168e-07, + "loss": 0.6216, + "step": 71469 + }, + { + "epoch": 1.83, + "learning_rate": 6.952914818848817e-07, + "loss": 0.6182, + "step": 71470 + }, + { + "epoch": 1.83, + "learning_rate": 6.952651273980481e-07, + "loss": 0.5728, + "step": 71471 + }, + { + "epoch": 1.83, + "learning_rate": 6.95238773144536e-07, + "loss": 0.7021, + "step": 71472 + }, + { + "epoch": 1.83, + "learning_rate": 6.952124191243654e-07, + "loss": 0.7832, + "step": 71473 + }, + { + "epoch": 1.83, + "learning_rate": 6.951860653375565e-07, + "loss": 0.6099, + "step": 71474 + }, + { + "epoch": 1.83, + "learning_rate": 6.951597117841301e-07, + "loss": 0.4258, + "step": 71475 + }, + { + "epoch": 1.83, + "learning_rate": 6.951333584641055e-07, + "loss": 0.6538, + "step": 71476 + }, + { + "epoch": 1.83, + "learning_rate": 6.951070053775034e-07, + "loss": 0.5435, + "step": 71477 + }, + { + "epoch": 1.83, + "learning_rate": 6.950806525243441e-07, + "loss": 0.5645, + "step": 71478 + }, + { + "epoch": 1.83, + "learning_rate": 6.950542999046471e-07, + "loss": 0.4731, + "step": 71479 + }, + { + "epoch": 1.83, + "learning_rate": 6.950279475184333e-07, + "loss": 0.5698, + "step": 71480 + }, + { + "epoch": 1.83, + "learning_rate": 6.950015953657222e-07, + "loss": 0.6455, + "step": 71481 + }, + { + "epoch": 1.83, + "learning_rate": 6.949752434465348e-07, + "loss": 0.6357, + "step": 71482 + }, + { + "epoch": 1.83, + "learning_rate": 6.949488917608907e-07, + "loss": 0.5786, + "step": 71483 + }, + { + "epoch": 1.83, + "learning_rate": 6.949225403088099e-07, + "loss": 0.5737, + "step": 71484 + }, + { + "epoch": 1.83, + "learning_rate": 6.948961890903132e-07, + "loss": 0.6738, + "step": 71485 + }, + { + "epoch": 1.83, + "learning_rate": 6.948698381054203e-07, + "loss": 0.5625, + "step": 71486 + }, + { + "epoch": 1.83, + "learning_rate": 6.948434873541517e-07, + "loss": 0.5449, + "step": 71487 + }, + { + "epoch": 1.83, + "learning_rate": 6.948171368365275e-07, + "loss": 0.6494, + "step": 71488 + }, + { + "epoch": 1.83, + "learning_rate": 6.947907865525675e-07, + "loss": 0.6328, + "step": 71489 + }, + { + "epoch": 1.83, + "learning_rate": 6.947644365022924e-07, + "loss": 0.5889, + "step": 71490 + }, + { + "epoch": 1.83, + "learning_rate": 6.947380866857219e-07, + "loss": 0.4119, + "step": 71491 + }, + { + "epoch": 1.83, + "learning_rate": 6.947117371028766e-07, + "loss": 0.7432, + "step": 71492 + }, + { + "epoch": 1.83, + "learning_rate": 6.946853877537761e-07, + "loss": 0.6553, + "step": 71493 + }, + { + "epoch": 1.83, + "learning_rate": 6.946590386384414e-07, + "loss": 0.5332, + "step": 71494 + }, + { + "epoch": 1.83, + "learning_rate": 6.946326897568919e-07, + "loss": 0.7832, + "step": 71495 + }, + { + "epoch": 1.83, + "learning_rate": 6.946063411091485e-07, + "loss": 0.6274, + "step": 71496 + }, + { + "epoch": 1.83, + "learning_rate": 6.945799926952306e-07, + "loss": 0.5757, + "step": 71497 + }, + { + "epoch": 1.83, + "learning_rate": 6.945536445151592e-07, + "loss": 0.5859, + "step": 71498 + }, + { + "epoch": 1.83, + "learning_rate": 6.945272965689539e-07, + "loss": 0.5925, + "step": 71499 + }, + { + "epoch": 1.83, + "learning_rate": 6.945009488566349e-07, + "loss": 0.6316, + "step": 71500 + }, + { + "epoch": 1.83, + "learning_rate": 6.944746013782223e-07, + "loss": 0.7383, + "step": 71501 + }, + { + "epoch": 1.83, + "learning_rate": 6.944482541337366e-07, + "loss": 0.5508, + "step": 71502 + }, + { + "epoch": 1.83, + "learning_rate": 6.944219071231978e-07, + "loss": 0.7725, + "step": 71503 + }, + { + "epoch": 1.83, + "learning_rate": 6.943955603466263e-07, + "loss": 0.6885, + "step": 71504 + }, + { + "epoch": 1.83, + "learning_rate": 6.943692138040416e-07, + "loss": 0.6519, + "step": 71505 + }, + { + "epoch": 1.83, + "learning_rate": 6.943428674954648e-07, + "loss": 0.5635, + "step": 71506 + }, + { + "epoch": 1.83, + "learning_rate": 6.943165214209152e-07, + "loss": 0.4011, + "step": 71507 + }, + { + "epoch": 1.83, + "learning_rate": 6.942901755804139e-07, + "loss": 0.7314, + "step": 71508 + }, + { + "epoch": 1.83, + "learning_rate": 6.942638299739804e-07, + "loss": 0.5334, + "step": 71509 + }, + { + "epoch": 1.83, + "learning_rate": 6.942374846016348e-07, + "loss": 0.79, + "step": 71510 + }, + { + "epoch": 1.83, + "learning_rate": 6.942111394633976e-07, + "loss": 0.7222, + "step": 71511 + }, + { + "epoch": 1.83, + "learning_rate": 6.941847945592887e-07, + "loss": 0.7295, + "step": 71512 + }, + { + "epoch": 1.83, + "learning_rate": 6.941584498893287e-07, + "loss": 0.5952, + "step": 71513 + }, + { + "epoch": 1.83, + "learning_rate": 6.941321054535374e-07, + "loss": 0.4471, + "step": 71514 + }, + { + "epoch": 1.83, + "learning_rate": 6.941057612519351e-07, + "loss": 0.7178, + "step": 71515 + }, + { + "epoch": 1.83, + "learning_rate": 6.940794172845419e-07, + "loss": 0.5361, + "step": 71516 + }, + { + "epoch": 1.83, + "learning_rate": 6.940530735513783e-07, + "loss": 0.7383, + "step": 71517 + }, + { + "epoch": 1.83, + "learning_rate": 6.940267300524641e-07, + "loss": 0.606, + "step": 71518 + }, + { + "epoch": 1.83, + "learning_rate": 6.940003867878195e-07, + "loss": 0.55, + "step": 71519 + }, + { + "epoch": 1.83, + "learning_rate": 6.939740437574645e-07, + "loss": 0.6479, + "step": 71520 + }, + { + "epoch": 1.83, + "learning_rate": 6.939477009614197e-07, + "loss": 0.707, + "step": 71521 + }, + { + "epoch": 1.83, + "learning_rate": 6.93921358399705e-07, + "loss": 0.7188, + "step": 71522 + }, + { + "epoch": 1.83, + "learning_rate": 6.938950160723407e-07, + "loss": 0.5732, + "step": 71523 + }, + { + "epoch": 1.83, + "learning_rate": 6.938686739793468e-07, + "loss": 0.522, + "step": 71524 + }, + { + "epoch": 1.83, + "learning_rate": 6.938423321207439e-07, + "loss": 0.5759, + "step": 71525 + }, + { + "epoch": 1.83, + "learning_rate": 6.938159904965514e-07, + "loss": 0.709, + "step": 71526 + }, + { + "epoch": 1.83, + "learning_rate": 6.937896491067904e-07, + "loss": 0.6816, + "step": 71527 + }, + { + "epoch": 1.83, + "learning_rate": 6.937633079514804e-07, + "loss": 0.5195, + "step": 71528 + }, + { + "epoch": 1.83, + "learning_rate": 6.937369670306416e-07, + "loss": 0.6499, + "step": 71529 + }, + { + "epoch": 1.83, + "learning_rate": 6.937106263442945e-07, + "loss": 0.7803, + "step": 71530 + }, + { + "epoch": 1.83, + "learning_rate": 6.936842858924588e-07, + "loss": 0.5146, + "step": 71531 + }, + { + "epoch": 1.83, + "learning_rate": 6.936579456751552e-07, + "loss": 0.6982, + "step": 71532 + }, + { + "epoch": 1.83, + "learning_rate": 6.936316056924034e-07, + "loss": 0.6245, + "step": 71533 + }, + { + "epoch": 1.83, + "learning_rate": 6.936052659442242e-07, + "loss": 0.5984, + "step": 71534 + }, + { + "epoch": 1.83, + "learning_rate": 6.935789264306369e-07, + "loss": 0.6416, + "step": 71535 + }, + { + "epoch": 1.83, + "learning_rate": 6.935525871516625e-07, + "loss": 0.5127, + "step": 71536 + }, + { + "epoch": 1.83, + "learning_rate": 6.93526248107321e-07, + "loss": 0.5322, + "step": 71537 + }, + { + "epoch": 1.83, + "learning_rate": 6.934999092976319e-07, + "loss": 0.6709, + "step": 71538 + }, + { + "epoch": 1.83, + "learning_rate": 6.934735707226159e-07, + "loss": 0.5894, + "step": 71539 + }, + { + "epoch": 1.83, + "learning_rate": 6.934472323822932e-07, + "loss": 0.582, + "step": 71540 + }, + { + "epoch": 1.83, + "learning_rate": 6.934208942766837e-07, + "loss": 0.6797, + "step": 71541 + }, + { + "epoch": 1.83, + "learning_rate": 6.933945564058079e-07, + "loss": 0.6289, + "step": 71542 + }, + { + "epoch": 1.83, + "learning_rate": 6.933682187696855e-07, + "loss": 0.6289, + "step": 71543 + }, + { + "epoch": 1.83, + "learning_rate": 6.933418813683372e-07, + "loss": 0.8223, + "step": 71544 + }, + { + "epoch": 1.83, + "learning_rate": 6.933155442017829e-07, + "loss": 0.6191, + "step": 71545 + }, + { + "epoch": 1.83, + "learning_rate": 6.932892072700427e-07, + "loss": 0.5466, + "step": 71546 + }, + { + "epoch": 1.83, + "learning_rate": 6.932628705731373e-07, + "loss": 0.5249, + "step": 71547 + }, + { + "epoch": 1.83, + "learning_rate": 6.932365341110859e-07, + "loss": 0.7681, + "step": 71548 + }, + { + "epoch": 1.83, + "learning_rate": 6.932101978839093e-07, + "loss": 0.7891, + "step": 71549 + }, + { + "epoch": 1.83, + "learning_rate": 6.931838618916274e-07, + "loss": 0.5884, + "step": 71550 + }, + { + "epoch": 1.83, + "learning_rate": 6.931575261342608e-07, + "loss": 0.7783, + "step": 71551 + }, + { + "epoch": 1.83, + "learning_rate": 6.931311906118291e-07, + "loss": 0.3604, + "step": 71552 + }, + { + "epoch": 1.83, + "learning_rate": 6.931048553243531e-07, + "loss": 0.8389, + "step": 71553 + }, + { + "epoch": 1.83, + "learning_rate": 6.930785202718521e-07, + "loss": 0.6025, + "step": 71554 + }, + { + "epoch": 1.83, + "learning_rate": 6.930521854543472e-07, + "loss": 0.5591, + "step": 71555 + }, + { + "epoch": 1.83, + "learning_rate": 6.93025850871858e-07, + "loss": 0.6968, + "step": 71556 + }, + { + "epoch": 1.83, + "learning_rate": 6.92999516524405e-07, + "loss": 0.6133, + "step": 71557 + }, + { + "epoch": 1.83, + "learning_rate": 6.929731824120077e-07, + "loss": 0.5728, + "step": 71558 + }, + { + "epoch": 1.83, + "learning_rate": 6.929468485346871e-07, + "loss": 0.4868, + "step": 71559 + }, + { + "epoch": 1.83, + "learning_rate": 6.929205148924628e-07, + "loss": 0.5635, + "step": 71560 + }, + { + "epoch": 1.83, + "learning_rate": 6.928941814853551e-07, + "loss": 0.5298, + "step": 71561 + }, + { + "epoch": 1.83, + "learning_rate": 6.928678483133842e-07, + "loss": 0.6196, + "step": 71562 + }, + { + "epoch": 1.83, + "learning_rate": 6.928415153765703e-07, + "loss": 0.4097, + "step": 71563 + }, + { + "epoch": 1.83, + "learning_rate": 6.928151826749335e-07, + "loss": 0.6797, + "step": 71564 + }, + { + "epoch": 1.83, + "learning_rate": 6.92788850208494e-07, + "loss": 0.5328, + "step": 71565 + }, + { + "epoch": 1.83, + "learning_rate": 6.92762517977272e-07, + "loss": 0.6055, + "step": 71566 + }, + { + "epoch": 1.83, + "learning_rate": 6.927361859812879e-07, + "loss": 0.6177, + "step": 71567 + }, + { + "epoch": 1.83, + "learning_rate": 6.927098542205614e-07, + "loss": 0.7095, + "step": 71568 + }, + { + "epoch": 1.83, + "learning_rate": 6.926835226951124e-07, + "loss": 0.6533, + "step": 71569 + }, + { + "epoch": 1.83, + "learning_rate": 6.926571914049619e-07, + "loss": 0.7354, + "step": 71570 + }, + { + "epoch": 1.83, + "learning_rate": 6.926308603501295e-07, + "loss": 0.6309, + "step": 71571 + }, + { + "epoch": 1.83, + "learning_rate": 6.926045295306357e-07, + "loss": 0.4572, + "step": 71572 + }, + { + "epoch": 1.83, + "learning_rate": 6.925781989465005e-07, + "loss": 0.7354, + "step": 71573 + }, + { + "epoch": 1.83, + "learning_rate": 6.925518685977436e-07, + "loss": 0.624, + "step": 71574 + }, + { + "epoch": 1.83, + "learning_rate": 6.92525538484386e-07, + "loss": 0.5889, + "step": 71575 + }, + { + "epoch": 1.83, + "learning_rate": 6.924992086064472e-07, + "loss": 0.6377, + "step": 71576 + }, + { + "epoch": 1.83, + "learning_rate": 6.924728789639481e-07, + "loss": 0.6904, + "step": 71577 + }, + { + "epoch": 1.83, + "learning_rate": 6.924465495569082e-07, + "loss": 0.6396, + "step": 71578 + }, + { + "epoch": 1.83, + "learning_rate": 6.924202203853475e-07, + "loss": 0.6216, + "step": 71579 + }, + { + "epoch": 1.83, + "learning_rate": 6.923938914492868e-07, + "loss": 0.4771, + "step": 71580 + }, + { + "epoch": 1.83, + "learning_rate": 6.923675627487457e-07, + "loss": 0.7432, + "step": 71581 + }, + { + "epoch": 1.83, + "learning_rate": 6.923412342837448e-07, + "loss": 0.7227, + "step": 71582 + }, + { + "epoch": 1.83, + "learning_rate": 6.923149060543039e-07, + "loss": 0.6963, + "step": 71583 + }, + { + "epoch": 1.83, + "learning_rate": 6.922885780604435e-07, + "loss": 0.5908, + "step": 71584 + }, + { + "epoch": 1.83, + "learning_rate": 6.922622503021833e-07, + "loss": 0.4656, + "step": 71585 + }, + { + "epoch": 1.83, + "learning_rate": 6.922359227795441e-07, + "loss": 0.6636, + "step": 71586 + }, + { + "epoch": 1.83, + "learning_rate": 6.922095954925458e-07, + "loss": 0.4858, + "step": 71587 + }, + { + "epoch": 1.83, + "learning_rate": 6.921832684412081e-07, + "loss": 0.5476, + "step": 71588 + }, + { + "epoch": 1.83, + "learning_rate": 6.921569416255518e-07, + "loss": 0.4795, + "step": 71589 + }, + { + "epoch": 1.83, + "learning_rate": 6.921306150455967e-07, + "loss": 0.5212, + "step": 71590 + }, + { + "epoch": 1.83, + "learning_rate": 6.921042887013629e-07, + "loss": 0.6777, + "step": 71591 + }, + { + "epoch": 1.83, + "learning_rate": 6.920779625928708e-07, + "loss": 0.5881, + "step": 71592 + }, + { + "epoch": 1.83, + "learning_rate": 6.920516367201402e-07, + "loss": 0.5957, + "step": 71593 + }, + { + "epoch": 1.83, + "learning_rate": 6.920253110831917e-07, + "loss": 0.6675, + "step": 71594 + }, + { + "epoch": 1.84, + "learning_rate": 6.919989856820451e-07, + "loss": 0.6709, + "step": 71595 + }, + { + "epoch": 1.84, + "learning_rate": 6.91972660516721e-07, + "loss": 0.6777, + "step": 71596 + }, + { + "epoch": 1.84, + "learning_rate": 6.919463355872395e-07, + "loss": 0.6738, + "step": 71597 + }, + { + "epoch": 1.84, + "learning_rate": 6.9192001089362e-07, + "loss": 0.7354, + "step": 71598 + }, + { + "epoch": 1.84, + "learning_rate": 6.918936864358835e-07, + "loss": 0.4158, + "step": 71599 + }, + { + "epoch": 1.84, + "learning_rate": 6.918673622140495e-07, + "loss": 0.6177, + "step": 71600 + }, + { + "epoch": 1.84, + "learning_rate": 6.918410382281388e-07, + "loss": 0.5645, + "step": 71601 + }, + { + "epoch": 1.84, + "learning_rate": 6.91814714478171e-07, + "loss": 0.7275, + "step": 71602 + }, + { + "epoch": 1.84, + "learning_rate": 6.917883909641666e-07, + "loss": 0.6572, + "step": 71603 + }, + { + "epoch": 1.84, + "learning_rate": 6.917620676861455e-07, + "loss": 0.3787, + "step": 71604 + }, + { + "epoch": 1.84, + "learning_rate": 6.917357446441284e-07, + "loss": 0.6123, + "step": 71605 + }, + { + "epoch": 1.84, + "learning_rate": 6.917094218381347e-07, + "loss": 0.543, + "step": 71606 + }, + { + "epoch": 1.84, + "learning_rate": 6.916830992681853e-07, + "loss": 0.4561, + "step": 71607 + }, + { + "epoch": 1.84, + "learning_rate": 6.916567769342999e-07, + "loss": 0.6709, + "step": 71608 + }, + { + "epoch": 1.84, + "learning_rate": 6.916304548364986e-07, + "loss": 0.5474, + "step": 71609 + }, + { + "epoch": 1.84, + "learning_rate": 6.916041329748015e-07, + "loss": 0.5332, + "step": 71610 + }, + { + "epoch": 1.84, + "learning_rate": 6.915778113492292e-07, + "loss": 0.5737, + "step": 71611 + }, + { + "epoch": 1.84, + "learning_rate": 6.915514899598014e-07, + "loss": 0.6963, + "step": 71612 + }, + { + "epoch": 1.84, + "learning_rate": 6.915251688065386e-07, + "loss": 0.4854, + "step": 71613 + }, + { + "epoch": 1.84, + "learning_rate": 6.914988478894605e-07, + "loss": 0.5706, + "step": 71614 + }, + { + "epoch": 1.84, + "learning_rate": 6.914725272085879e-07, + "loss": 0.5176, + "step": 71615 + }, + { + "epoch": 1.84, + "learning_rate": 6.914462067639404e-07, + "loss": 0.6943, + "step": 71616 + }, + { + "epoch": 1.84, + "learning_rate": 6.914198865555387e-07, + "loss": 0.6045, + "step": 71617 + }, + { + "epoch": 1.84, + "learning_rate": 6.913935665834024e-07, + "loss": 0.605, + "step": 71618 + }, + { + "epoch": 1.84, + "learning_rate": 6.913672468475517e-07, + "loss": 0.7373, + "step": 71619 + }, + { + "epoch": 1.84, + "learning_rate": 6.913409273480071e-07, + "loss": 0.6484, + "step": 71620 + }, + { + "epoch": 1.84, + "learning_rate": 6.913146080847882e-07, + "loss": 0.667, + "step": 71621 + }, + { + "epoch": 1.84, + "learning_rate": 6.912882890579159e-07, + "loss": 0.5913, + "step": 71622 + }, + { + "epoch": 1.84, + "learning_rate": 6.912619702674096e-07, + "loss": 0.834, + "step": 71623 + }, + { + "epoch": 1.84, + "learning_rate": 6.912356517132902e-07, + "loss": 0.5532, + "step": 71624 + }, + { + "epoch": 1.84, + "learning_rate": 6.912093333955771e-07, + "loss": 0.6729, + "step": 71625 + }, + { + "epoch": 1.84, + "learning_rate": 6.911830153142911e-07, + "loss": 0.6821, + "step": 71626 + }, + { + "epoch": 1.84, + "learning_rate": 6.911566974694522e-07, + "loss": 0.5322, + "step": 71627 + }, + { + "epoch": 1.84, + "learning_rate": 6.911303798610804e-07, + "loss": 0.6489, + "step": 71628 + }, + { + "epoch": 1.84, + "learning_rate": 6.911040624891955e-07, + "loss": 0.6426, + "step": 71629 + }, + { + "epoch": 1.84, + "learning_rate": 6.910777453538183e-07, + "loss": 0.6514, + "step": 71630 + }, + { + "epoch": 1.84, + "learning_rate": 6.910514284549683e-07, + "loss": 0.728, + "step": 71631 + }, + { + "epoch": 1.84, + "learning_rate": 6.910251117926664e-07, + "loss": 0.4597, + "step": 71632 + }, + { + "epoch": 1.84, + "learning_rate": 6.90998795366932e-07, + "loss": 0.6606, + "step": 71633 + }, + { + "epoch": 1.84, + "learning_rate": 6.90972479177786e-07, + "loss": 0.4585, + "step": 71634 + }, + { + "epoch": 1.84, + "learning_rate": 6.909461632252477e-07, + "loss": 0.7402, + "step": 71635 + }, + { + "epoch": 1.84, + "learning_rate": 6.909198475093383e-07, + "loss": 0.6851, + "step": 71636 + }, + { + "epoch": 1.84, + "learning_rate": 6.908935320300773e-07, + "loss": 0.5247, + "step": 71637 + }, + { + "epoch": 1.84, + "learning_rate": 6.908672167874845e-07, + "loss": 0.6333, + "step": 71638 + }, + { + "epoch": 1.84, + "learning_rate": 6.908409017815809e-07, + "loss": 0.339, + "step": 71639 + }, + { + "epoch": 1.84, + "learning_rate": 6.908145870123857e-07, + "loss": 0.6499, + "step": 71640 + }, + { + "epoch": 1.84, + "learning_rate": 6.907882724799199e-07, + "loss": 0.4492, + "step": 71641 + }, + { + "epoch": 1.84, + "learning_rate": 6.907619581842031e-07, + "loss": 0.5601, + "step": 71642 + }, + { + "epoch": 1.84, + "learning_rate": 6.907356441252558e-07, + "loss": 0.6611, + "step": 71643 + }, + { + "epoch": 1.84, + "learning_rate": 6.907093303030978e-07, + "loss": 0.79, + "step": 71644 + }, + { + "epoch": 1.84, + "learning_rate": 6.906830167177497e-07, + "loss": 0.7456, + "step": 71645 + }, + { + "epoch": 1.84, + "learning_rate": 6.906567033692313e-07, + "loss": 0.5903, + "step": 71646 + }, + { + "epoch": 1.84, + "learning_rate": 6.90630390257563e-07, + "loss": 0.625, + "step": 71647 + }, + { + "epoch": 1.84, + "learning_rate": 6.906040773827646e-07, + "loss": 0.7148, + "step": 71648 + }, + { + "epoch": 1.84, + "learning_rate": 6.905777647448565e-07, + "loss": 0.6328, + "step": 71649 + }, + { + "epoch": 1.84, + "learning_rate": 6.905514523438586e-07, + "loss": 0.8652, + "step": 71650 + }, + { + "epoch": 1.84, + "learning_rate": 6.905251401797913e-07, + "loss": 0.8994, + "step": 71651 + }, + { + "epoch": 1.84, + "learning_rate": 6.904988282526747e-07, + "loss": 0.4536, + "step": 71652 + }, + { + "epoch": 1.84, + "learning_rate": 6.904725165625289e-07, + "loss": 0.5425, + "step": 71653 + }, + { + "epoch": 1.84, + "learning_rate": 6.90446205109374e-07, + "loss": 0.4907, + "step": 71654 + }, + { + "epoch": 1.84, + "learning_rate": 6.904198938932304e-07, + "loss": 0.6255, + "step": 71655 + }, + { + "epoch": 1.84, + "learning_rate": 6.903935829141179e-07, + "loss": 0.5182, + "step": 71656 + }, + { + "epoch": 1.84, + "learning_rate": 6.90367272172057e-07, + "loss": 0.5249, + "step": 71657 + }, + { + "epoch": 1.84, + "learning_rate": 6.903409616670677e-07, + "loss": 0.7881, + "step": 71658 + }, + { + "epoch": 1.84, + "learning_rate": 6.903146513991697e-07, + "loss": 0.6792, + "step": 71659 + }, + { + "epoch": 1.84, + "learning_rate": 6.902883413683838e-07, + "loss": 0.7617, + "step": 71660 + }, + { + "epoch": 1.84, + "learning_rate": 6.902620315747296e-07, + "loss": 0.7598, + "step": 71661 + }, + { + "epoch": 1.84, + "learning_rate": 6.902357220182278e-07, + "loss": 0.6108, + "step": 71662 + }, + { + "epoch": 1.84, + "learning_rate": 6.902094126988982e-07, + "loss": 0.6924, + "step": 71663 + }, + { + "epoch": 1.84, + "learning_rate": 6.901831036167609e-07, + "loss": 0.6133, + "step": 71664 + }, + { + "epoch": 1.84, + "learning_rate": 6.901567947718363e-07, + "loss": 0.5557, + "step": 71665 + }, + { + "epoch": 1.84, + "learning_rate": 6.901304861641442e-07, + "loss": 0.6592, + "step": 71666 + }, + { + "epoch": 1.84, + "learning_rate": 6.901041777937053e-07, + "loss": 0.5552, + "step": 71667 + }, + { + "epoch": 1.84, + "learning_rate": 6.900778696605392e-07, + "loss": 0.6465, + "step": 71668 + }, + { + "epoch": 1.84, + "learning_rate": 6.900515617646661e-07, + "loss": 0.6431, + "step": 71669 + }, + { + "epoch": 1.84, + "learning_rate": 6.900252541061064e-07, + "loss": 0.603, + "step": 71670 + }, + { + "epoch": 1.84, + "learning_rate": 6.899989466848799e-07, + "loss": 0.8018, + "step": 71671 + }, + { + "epoch": 1.84, + "learning_rate": 6.899726395010072e-07, + "loss": 0.6455, + "step": 71672 + }, + { + "epoch": 1.84, + "learning_rate": 6.899463325545079e-07, + "loss": 0.5479, + "step": 71673 + }, + { + "epoch": 1.84, + "learning_rate": 6.899200258454028e-07, + "loss": 0.6621, + "step": 71674 + }, + { + "epoch": 1.84, + "learning_rate": 6.898937193737113e-07, + "loss": 0.7568, + "step": 71675 + }, + { + "epoch": 1.84, + "learning_rate": 6.898674131394541e-07, + "loss": 0.6797, + "step": 71676 + }, + { + "epoch": 1.84, + "learning_rate": 6.898411071426516e-07, + "loss": 0.6426, + "step": 71677 + }, + { + "epoch": 1.84, + "learning_rate": 6.898148013833229e-07, + "loss": 0.5869, + "step": 71678 + }, + { + "epoch": 1.84, + "learning_rate": 6.89788495861489e-07, + "loss": 0.6621, + "step": 71679 + }, + { + "epoch": 1.84, + "learning_rate": 6.897621905771695e-07, + "loss": 0.7373, + "step": 71680 + }, + { + "epoch": 1.84, + "learning_rate": 6.897358855303852e-07, + "loss": 0.5784, + "step": 71681 + }, + { + "epoch": 1.84, + "learning_rate": 6.89709580721156e-07, + "loss": 0.4042, + "step": 71682 + }, + { + "epoch": 1.84, + "learning_rate": 6.896832761495013e-07, + "loss": 0.7178, + "step": 71683 + }, + { + "epoch": 1.84, + "learning_rate": 6.896569718154422e-07, + "loss": 0.7607, + "step": 71684 + }, + { + "epoch": 1.84, + "learning_rate": 6.896306677189985e-07, + "loss": 0.6738, + "step": 71685 + }, + { + "epoch": 1.84, + "learning_rate": 6.896043638601903e-07, + "loss": 0.4578, + "step": 71686 + }, + { + "epoch": 1.84, + "learning_rate": 6.89578060239038e-07, + "loss": 0.7749, + "step": 71687 + }, + { + "epoch": 1.84, + "learning_rate": 6.895517568555611e-07, + "loss": 0.6855, + "step": 71688 + }, + { + "epoch": 1.84, + "learning_rate": 6.895254537097803e-07, + "loss": 0.6504, + "step": 71689 + }, + { + "epoch": 1.84, + "learning_rate": 6.894991508017155e-07, + "loss": 0.6797, + "step": 71690 + }, + { + "epoch": 1.84, + "learning_rate": 6.894728481313871e-07, + "loss": 0.4255, + "step": 71691 + }, + { + "epoch": 1.84, + "learning_rate": 6.894465456988148e-07, + "loss": 0.3347, + "step": 71692 + }, + { + "epoch": 1.84, + "learning_rate": 6.894202435040193e-07, + "loss": 0.6973, + "step": 71693 + }, + { + "epoch": 1.84, + "learning_rate": 6.893939415470201e-07, + "loss": 0.5918, + "step": 71694 + }, + { + "epoch": 1.84, + "learning_rate": 6.89367639827838e-07, + "loss": 0.6426, + "step": 71695 + }, + { + "epoch": 1.84, + "learning_rate": 6.893413383464925e-07, + "loss": 0.6631, + "step": 71696 + }, + { + "epoch": 1.84, + "learning_rate": 6.893150371030045e-07, + "loss": 0.709, + "step": 71697 + }, + { + "epoch": 1.84, + "learning_rate": 6.892887360973936e-07, + "loss": 0.5439, + "step": 71698 + }, + { + "epoch": 1.84, + "learning_rate": 6.892624353296798e-07, + "loss": 0.7061, + "step": 71699 + }, + { + "epoch": 1.84, + "learning_rate": 6.892361347998835e-07, + "loss": 0.7051, + "step": 71700 + }, + { + "epoch": 1.84, + "learning_rate": 6.892098345080249e-07, + "loss": 0.6356, + "step": 71701 + }, + { + "epoch": 1.84, + "learning_rate": 6.891835344541239e-07, + "loss": 0.5403, + "step": 71702 + }, + { + "epoch": 1.84, + "learning_rate": 6.891572346382009e-07, + "loss": 0.6104, + "step": 71703 + }, + { + "epoch": 1.84, + "learning_rate": 6.891309350602758e-07, + "loss": 0.6172, + "step": 71704 + }, + { + "epoch": 1.84, + "learning_rate": 6.891046357203689e-07, + "loss": 0.7451, + "step": 71705 + }, + { + "epoch": 1.84, + "learning_rate": 6.890783366185003e-07, + "loss": 0.624, + "step": 71706 + }, + { + "epoch": 1.84, + "learning_rate": 6.890520377546902e-07, + "loss": 0.7051, + "step": 71707 + }, + { + "epoch": 1.84, + "learning_rate": 6.890257391289586e-07, + "loss": 0.5664, + "step": 71708 + }, + { + "epoch": 1.84, + "learning_rate": 6.889994407413256e-07, + "loss": 0.6689, + "step": 71709 + }, + { + "epoch": 1.84, + "learning_rate": 6.889731425918117e-07, + "loss": 0.5796, + "step": 71710 + }, + { + "epoch": 1.84, + "learning_rate": 6.889468446804363e-07, + "loss": 0.6914, + "step": 71711 + }, + { + "epoch": 1.84, + "learning_rate": 6.889205470072204e-07, + "loss": 0.8262, + "step": 71712 + }, + { + "epoch": 1.84, + "learning_rate": 6.888942495721834e-07, + "loss": 0.5723, + "step": 71713 + }, + { + "epoch": 1.84, + "learning_rate": 6.88867952375346e-07, + "loss": 0.5183, + "step": 71714 + }, + { + "epoch": 1.84, + "learning_rate": 6.88841655416728e-07, + "loss": 0.604, + "step": 71715 + }, + { + "epoch": 1.84, + "learning_rate": 6.888153586963498e-07, + "loss": 0.7666, + "step": 71716 + }, + { + "epoch": 1.84, + "learning_rate": 6.887890622142316e-07, + "loss": 0.7568, + "step": 71717 + }, + { + "epoch": 1.84, + "learning_rate": 6.887627659703929e-07, + "loss": 0.6924, + "step": 71718 + }, + { + "epoch": 1.84, + "learning_rate": 6.887364699648542e-07, + "loss": 0.7236, + "step": 71719 + }, + { + "epoch": 1.84, + "learning_rate": 6.88710174197636e-07, + "loss": 0.7207, + "step": 71720 + }, + { + "epoch": 1.84, + "learning_rate": 6.886838786687576e-07, + "loss": 0.6719, + "step": 71721 + }, + { + "epoch": 1.84, + "learning_rate": 6.886575833782401e-07, + "loss": 0.666, + "step": 71722 + }, + { + "epoch": 1.84, + "learning_rate": 6.886312883261029e-07, + "loss": 0.6343, + "step": 71723 + }, + { + "epoch": 1.84, + "learning_rate": 6.886049935123666e-07, + "loss": 0.7246, + "step": 71724 + }, + { + "epoch": 1.84, + "learning_rate": 6.885786989370508e-07, + "loss": 0.542, + "step": 71725 + }, + { + "epoch": 1.84, + "learning_rate": 6.885524046001763e-07, + "loss": 0.5798, + "step": 71726 + }, + { + "epoch": 1.84, + "learning_rate": 6.885261105017633e-07, + "loss": 0.5125, + "step": 71727 + }, + { + "epoch": 1.84, + "learning_rate": 6.884998166418308e-07, + "loss": 0.5576, + "step": 71728 + }, + { + "epoch": 1.84, + "learning_rate": 6.884735230204e-07, + "loss": 0.6162, + "step": 71729 + }, + { + "epoch": 1.84, + "learning_rate": 6.884472296374905e-07, + "loss": 0.5359, + "step": 71730 + }, + { + "epoch": 1.84, + "learning_rate": 6.884209364931229e-07, + "loss": 0.5879, + "step": 71731 + }, + { + "epoch": 1.84, + "learning_rate": 6.883946435873167e-07, + "loss": 0.7051, + "step": 71732 + }, + { + "epoch": 1.84, + "learning_rate": 6.883683509200926e-07, + "loss": 0.7031, + "step": 71733 + }, + { + "epoch": 1.84, + "learning_rate": 6.883420584914706e-07, + "loss": 0.6992, + "step": 71734 + }, + { + "epoch": 1.84, + "learning_rate": 6.883157663014707e-07, + "loss": 0.6592, + "step": 71735 + }, + { + "epoch": 1.84, + "learning_rate": 6.882894743501131e-07, + "loss": 0.665, + "step": 71736 + }, + { + "epoch": 1.84, + "learning_rate": 6.882631826374181e-07, + "loss": 0.6309, + "step": 71737 + }, + { + "epoch": 1.84, + "learning_rate": 6.882368911634053e-07, + "loss": 0.5439, + "step": 71738 + }, + { + "epoch": 1.84, + "learning_rate": 6.882105999280954e-07, + "loss": 0.7998, + "step": 71739 + }, + { + "epoch": 1.84, + "learning_rate": 6.881843089315081e-07, + "loss": 0.605, + "step": 71740 + }, + { + "epoch": 1.84, + "learning_rate": 6.881580181736639e-07, + "loss": 0.5684, + "step": 71741 + }, + { + "epoch": 1.84, + "learning_rate": 6.881317276545826e-07, + "loss": 0.5967, + "step": 71742 + }, + { + "epoch": 1.84, + "learning_rate": 6.881054373742848e-07, + "loss": 0.5195, + "step": 71743 + }, + { + "epoch": 1.84, + "learning_rate": 6.8807914733279e-07, + "loss": 0.6963, + "step": 71744 + }, + { + "epoch": 1.84, + "learning_rate": 6.880528575301188e-07, + "loss": 0.7266, + "step": 71745 + }, + { + "epoch": 1.84, + "learning_rate": 6.880265679662911e-07, + "loss": 0.7031, + "step": 71746 + }, + { + "epoch": 1.84, + "learning_rate": 6.880002786413275e-07, + "loss": 0.6426, + "step": 71747 + }, + { + "epoch": 1.84, + "learning_rate": 6.879739895552475e-07, + "loss": 0.6758, + "step": 71748 + }, + { + "epoch": 1.84, + "learning_rate": 6.879477007080713e-07, + "loss": 0.5811, + "step": 71749 + }, + { + "epoch": 1.84, + "learning_rate": 6.879214120998193e-07, + "loss": 0.7842, + "step": 71750 + }, + { + "epoch": 1.84, + "learning_rate": 6.878951237305115e-07, + "loss": 0.5957, + "step": 71751 + }, + { + "epoch": 1.84, + "learning_rate": 6.878688356001681e-07, + "loss": 0.4551, + "step": 71752 + }, + { + "epoch": 1.84, + "learning_rate": 6.878425477088092e-07, + "loss": 0.5715, + "step": 71753 + }, + { + "epoch": 1.84, + "learning_rate": 6.878162600564548e-07, + "loss": 0.7168, + "step": 71754 + }, + { + "epoch": 1.84, + "learning_rate": 6.877899726431253e-07, + "loss": 0.6431, + "step": 71755 + }, + { + "epoch": 1.84, + "learning_rate": 6.877636854688405e-07, + "loss": 0.7354, + "step": 71756 + }, + { + "epoch": 1.84, + "learning_rate": 6.87737398533621e-07, + "loss": 0.668, + "step": 71757 + }, + { + "epoch": 1.84, + "learning_rate": 6.877111118374863e-07, + "loss": 0.6309, + "step": 71758 + }, + { + "epoch": 1.84, + "learning_rate": 6.876848253804568e-07, + "loss": 0.6963, + "step": 71759 + }, + { + "epoch": 1.84, + "learning_rate": 6.876585391625529e-07, + "loss": 0.5991, + "step": 71760 + }, + { + "epoch": 1.84, + "learning_rate": 6.876322531837943e-07, + "loss": 0.5459, + "step": 71761 + }, + { + "epoch": 1.84, + "learning_rate": 6.876059674442014e-07, + "loss": 0.6279, + "step": 71762 + }, + { + "epoch": 1.84, + "learning_rate": 6.875796819437942e-07, + "loss": 0.6992, + "step": 71763 + }, + { + "epoch": 1.84, + "learning_rate": 6.87553396682593e-07, + "loss": 0.6851, + "step": 71764 + }, + { + "epoch": 1.84, + "learning_rate": 6.875271116606175e-07, + "loss": 0.6328, + "step": 71765 + }, + { + "epoch": 1.84, + "learning_rate": 6.875008268778884e-07, + "loss": 0.835, + "step": 71766 + }, + { + "epoch": 1.84, + "learning_rate": 6.874745423344258e-07, + "loss": 0.7256, + "step": 71767 + }, + { + "epoch": 1.84, + "learning_rate": 6.874482580302491e-07, + "loss": 0.6729, + "step": 71768 + }, + { + "epoch": 1.84, + "learning_rate": 6.874219739653792e-07, + "loss": 0.6211, + "step": 71769 + }, + { + "epoch": 1.84, + "learning_rate": 6.873956901398356e-07, + "loss": 0.667, + "step": 71770 + }, + { + "epoch": 1.84, + "learning_rate": 6.873694065536391e-07, + "loss": 0.6479, + "step": 71771 + }, + { + "epoch": 1.84, + "learning_rate": 6.873431232068092e-07, + "loss": 0.6641, + "step": 71772 + }, + { + "epoch": 1.84, + "learning_rate": 6.873168400993663e-07, + "loss": 0.5938, + "step": 71773 + }, + { + "epoch": 1.84, + "learning_rate": 6.872905572313306e-07, + "loss": 0.4219, + "step": 71774 + }, + { + "epoch": 1.84, + "learning_rate": 6.872642746027221e-07, + "loss": 0.6416, + "step": 71775 + }, + { + "epoch": 1.84, + "learning_rate": 6.872379922135612e-07, + "loss": 0.561, + "step": 71776 + }, + { + "epoch": 1.84, + "learning_rate": 6.872117100638679e-07, + "loss": 0.5591, + "step": 71777 + }, + { + "epoch": 1.84, + "learning_rate": 6.871854281536617e-07, + "loss": 0.5962, + "step": 71778 + }, + { + "epoch": 1.84, + "learning_rate": 6.871591464829635e-07, + "loss": 0.5605, + "step": 71779 + }, + { + "epoch": 1.84, + "learning_rate": 6.871328650517929e-07, + "loss": 0.5327, + "step": 71780 + }, + { + "epoch": 1.84, + "learning_rate": 6.871065838601706e-07, + "loss": 0.5542, + "step": 71781 + }, + { + "epoch": 1.84, + "learning_rate": 6.870803029081162e-07, + "loss": 0.7129, + "step": 71782 + }, + { + "epoch": 1.84, + "learning_rate": 6.870540221956501e-07, + "loss": 0.6646, + "step": 71783 + }, + { + "epoch": 1.84, + "learning_rate": 6.870277417227924e-07, + "loss": 0.6392, + "step": 71784 + }, + { + "epoch": 1.84, + "learning_rate": 6.870014614895631e-07, + "loss": 0.5381, + "step": 71785 + }, + { + "epoch": 1.84, + "learning_rate": 6.869751814959822e-07, + "loss": 0.8242, + "step": 71786 + }, + { + "epoch": 1.84, + "learning_rate": 6.869489017420704e-07, + "loss": 0.4761, + "step": 71787 + }, + { + "epoch": 1.84, + "learning_rate": 6.869226222278475e-07, + "loss": 0.5552, + "step": 71788 + }, + { + "epoch": 1.84, + "learning_rate": 6.868963429533334e-07, + "loss": 0.5254, + "step": 71789 + }, + { + "epoch": 1.84, + "learning_rate": 6.86870063918548e-07, + "loss": 0.8135, + "step": 71790 + }, + { + "epoch": 1.84, + "learning_rate": 6.868437851235123e-07, + "loss": 0.7017, + "step": 71791 + }, + { + "epoch": 1.84, + "learning_rate": 6.868175065682454e-07, + "loss": 0.707, + "step": 71792 + }, + { + "epoch": 1.84, + "learning_rate": 6.867912282527684e-07, + "loss": 0.5645, + "step": 71793 + }, + { + "epoch": 1.84, + "learning_rate": 6.867649501771006e-07, + "loss": 0.6216, + "step": 71794 + }, + { + "epoch": 1.84, + "learning_rate": 6.867386723412627e-07, + "loss": 0.4746, + "step": 71795 + }, + { + "epoch": 1.84, + "learning_rate": 6.867123947452744e-07, + "loss": 0.9297, + "step": 71796 + }, + { + "epoch": 1.84, + "learning_rate": 6.866861173891565e-07, + "loss": 0.5928, + "step": 71797 + }, + { + "epoch": 1.84, + "learning_rate": 6.866598402729283e-07, + "loss": 0.4189, + "step": 71798 + }, + { + "epoch": 1.84, + "learning_rate": 6.866335633966101e-07, + "loss": 0.5659, + "step": 71799 + }, + { + "epoch": 1.84, + "learning_rate": 6.866072867602224e-07, + "loss": 0.6392, + "step": 71800 + }, + { + "epoch": 1.84, + "learning_rate": 6.865810103637849e-07, + "loss": 0.6245, + "step": 71801 + }, + { + "epoch": 1.84, + "learning_rate": 6.865547342073181e-07, + "loss": 0.4849, + "step": 71802 + }, + { + "epoch": 1.84, + "learning_rate": 6.865284582908417e-07, + "loss": 0.7383, + "step": 71803 + }, + { + "epoch": 1.84, + "learning_rate": 6.865021826143762e-07, + "loss": 0.4551, + "step": 71804 + }, + { + "epoch": 1.84, + "learning_rate": 6.864759071779415e-07, + "loss": 0.6392, + "step": 71805 + }, + { + "epoch": 1.84, + "learning_rate": 6.864496319815578e-07, + "loss": 0.5684, + "step": 71806 + }, + { + "epoch": 1.84, + "learning_rate": 6.864233570252455e-07, + "loss": 0.8037, + "step": 71807 + }, + { + "epoch": 1.84, + "learning_rate": 6.863970823090244e-07, + "loss": 0.6836, + "step": 71808 + }, + { + "epoch": 1.84, + "learning_rate": 6.863708078329143e-07, + "loss": 0.6992, + "step": 71809 + }, + { + "epoch": 1.84, + "learning_rate": 6.863445335969356e-07, + "loss": 0.3436, + "step": 71810 + }, + { + "epoch": 1.84, + "learning_rate": 6.863182596011085e-07, + "loss": 0.5715, + "step": 71811 + }, + { + "epoch": 1.84, + "learning_rate": 6.862919858454533e-07, + "loss": 0.4187, + "step": 71812 + }, + { + "epoch": 1.84, + "learning_rate": 6.862657123299897e-07, + "loss": 0.6157, + "step": 71813 + }, + { + "epoch": 1.84, + "learning_rate": 6.862394390547381e-07, + "loss": 0.6318, + "step": 71814 + }, + { + "epoch": 1.84, + "learning_rate": 6.862131660197185e-07, + "loss": 0.6514, + "step": 71815 + }, + { + "epoch": 1.84, + "learning_rate": 6.861868932249513e-07, + "loss": 0.8379, + "step": 71816 + }, + { + "epoch": 1.84, + "learning_rate": 6.861606206704562e-07, + "loss": 0.6348, + "step": 71817 + }, + { + "epoch": 1.84, + "learning_rate": 6.861343483562534e-07, + "loss": 0.7617, + "step": 71818 + }, + { + "epoch": 1.84, + "learning_rate": 6.861080762823633e-07, + "loss": 0.8174, + "step": 71819 + }, + { + "epoch": 1.84, + "learning_rate": 6.860818044488053e-07, + "loss": 0.6582, + "step": 71820 + }, + { + "epoch": 1.84, + "learning_rate": 6.860555328556006e-07, + "loss": 0.542, + "step": 71821 + }, + { + "epoch": 1.84, + "learning_rate": 6.860292615027683e-07, + "loss": 0.4926, + "step": 71822 + }, + { + "epoch": 1.84, + "learning_rate": 6.860029903903293e-07, + "loss": 0.6709, + "step": 71823 + }, + { + "epoch": 1.84, + "learning_rate": 6.859767195183031e-07, + "loss": 0.5469, + "step": 71824 + }, + { + "epoch": 1.84, + "learning_rate": 6.859504488867103e-07, + "loss": 0.5522, + "step": 71825 + }, + { + "epoch": 1.84, + "learning_rate": 6.85924178495571e-07, + "loss": 0.4966, + "step": 71826 + }, + { + "epoch": 1.84, + "learning_rate": 6.85897908344905e-07, + "loss": 0.7861, + "step": 71827 + }, + { + "epoch": 1.84, + "learning_rate": 6.858716384347322e-07, + "loss": 0.6689, + "step": 71828 + }, + { + "epoch": 1.84, + "learning_rate": 6.858453687650734e-07, + "loss": 0.6641, + "step": 71829 + }, + { + "epoch": 1.84, + "learning_rate": 6.85819099335948e-07, + "loss": 0.6377, + "step": 71830 + }, + { + "epoch": 1.84, + "learning_rate": 6.857928301473767e-07, + "loss": 0.3616, + "step": 71831 + }, + { + "epoch": 1.84, + "learning_rate": 6.857665611993793e-07, + "loss": 0.584, + "step": 71832 + }, + { + "epoch": 1.84, + "learning_rate": 6.85740292491976e-07, + "loss": 0.7939, + "step": 71833 + }, + { + "epoch": 1.84, + "learning_rate": 6.857140240251868e-07, + "loss": 0.7236, + "step": 71834 + }, + { + "epoch": 1.84, + "learning_rate": 6.856877557990321e-07, + "loss": 0.6367, + "step": 71835 + }, + { + "epoch": 1.84, + "learning_rate": 6.856614878135321e-07, + "loss": 0.5615, + "step": 71836 + }, + { + "epoch": 1.84, + "learning_rate": 6.856352200687062e-07, + "loss": 0.6855, + "step": 71837 + }, + { + "epoch": 1.84, + "learning_rate": 6.856089525645752e-07, + "loss": 0.6094, + "step": 71838 + }, + { + "epoch": 1.84, + "learning_rate": 6.855826853011587e-07, + "loss": 0.563, + "step": 71839 + }, + { + "epoch": 1.84, + "learning_rate": 6.855564182784774e-07, + "loss": 0.6943, + "step": 71840 + }, + { + "epoch": 1.84, + "learning_rate": 6.855301514965508e-07, + "loss": 0.6416, + "step": 71841 + }, + { + "epoch": 1.84, + "learning_rate": 6.855038849553994e-07, + "loss": 0.5991, + "step": 71842 + }, + { + "epoch": 1.84, + "learning_rate": 6.854776186550431e-07, + "loss": 0.6465, + "step": 71843 + }, + { + "epoch": 1.84, + "learning_rate": 6.854513525955024e-07, + "loss": 0.6274, + "step": 71844 + }, + { + "epoch": 1.84, + "learning_rate": 6.854250867767971e-07, + "loss": 0.6528, + "step": 71845 + }, + { + "epoch": 1.84, + "learning_rate": 6.853988211989475e-07, + "loss": 0.5483, + "step": 71846 + }, + { + "epoch": 1.84, + "learning_rate": 6.853725558619731e-07, + "loss": 0.6943, + "step": 71847 + }, + { + "epoch": 1.84, + "learning_rate": 6.853462907658949e-07, + "loss": 0.6348, + "step": 71848 + }, + { + "epoch": 1.84, + "learning_rate": 6.853200259107321e-07, + "loss": 0.7007, + "step": 71849 + }, + { + "epoch": 1.84, + "learning_rate": 6.852937612965057e-07, + "loss": 0.6895, + "step": 71850 + }, + { + "epoch": 1.84, + "learning_rate": 6.852674969232352e-07, + "loss": 0.5518, + "step": 71851 + }, + { + "epoch": 1.84, + "learning_rate": 6.852412327909409e-07, + "loss": 0.5562, + "step": 71852 + }, + { + "epoch": 1.84, + "learning_rate": 6.852149688996429e-07, + "loss": 0.5789, + "step": 71853 + }, + { + "epoch": 1.84, + "learning_rate": 6.851887052493614e-07, + "loss": 0.667, + "step": 71854 + }, + { + "epoch": 1.84, + "learning_rate": 6.851624418401163e-07, + "loss": 0.7812, + "step": 71855 + }, + { + "epoch": 1.84, + "learning_rate": 6.851361786719283e-07, + "loss": 0.6826, + "step": 71856 + }, + { + "epoch": 1.84, + "learning_rate": 6.851099157448168e-07, + "loss": 0.4934, + "step": 71857 + }, + { + "epoch": 1.84, + "learning_rate": 6.850836530588019e-07, + "loss": 0.6172, + "step": 71858 + }, + { + "epoch": 1.84, + "learning_rate": 6.850573906139042e-07, + "loss": 0.397, + "step": 71859 + }, + { + "epoch": 1.84, + "learning_rate": 6.850311284101434e-07, + "loss": 0.7549, + "step": 71860 + }, + { + "epoch": 1.84, + "learning_rate": 6.8500486644754e-07, + "loss": 0.6099, + "step": 71861 + }, + { + "epoch": 1.84, + "learning_rate": 6.849786047261139e-07, + "loss": 0.5889, + "step": 71862 + }, + { + "epoch": 1.84, + "learning_rate": 6.849523432458848e-07, + "loss": 0.5996, + "step": 71863 + }, + { + "epoch": 1.84, + "learning_rate": 6.849260820068736e-07, + "loss": 0.4919, + "step": 71864 + }, + { + "epoch": 1.84, + "learning_rate": 6.848998210090999e-07, + "loss": 0.7305, + "step": 71865 + }, + { + "epoch": 1.84, + "learning_rate": 6.848735602525842e-07, + "loss": 0.6108, + "step": 71866 + }, + { + "epoch": 1.84, + "learning_rate": 6.84847299737346e-07, + "loss": 0.7129, + "step": 71867 + }, + { + "epoch": 1.84, + "learning_rate": 6.848210394634057e-07, + "loss": 0.7119, + "step": 71868 + }, + { + "epoch": 1.84, + "learning_rate": 6.847947794307836e-07, + "loss": 0.7422, + "step": 71869 + }, + { + "epoch": 1.84, + "learning_rate": 6.847685196394994e-07, + "loss": 0.6191, + "step": 71870 + }, + { + "epoch": 1.84, + "learning_rate": 6.847422600895736e-07, + "loss": 0.4531, + "step": 71871 + }, + { + "epoch": 1.84, + "learning_rate": 6.847160007810261e-07, + "loss": 0.5967, + "step": 71872 + }, + { + "epoch": 1.84, + "learning_rate": 6.846897417138772e-07, + "loss": 0.5004, + "step": 71873 + }, + { + "epoch": 1.84, + "learning_rate": 6.846634828881465e-07, + "loss": 0.5166, + "step": 71874 + }, + { + "epoch": 1.84, + "learning_rate": 6.84637224303855e-07, + "loss": 0.5312, + "step": 71875 + }, + { + "epoch": 1.84, + "learning_rate": 6.846109659610223e-07, + "loss": 0.6895, + "step": 71876 + }, + { + "epoch": 1.84, + "learning_rate": 6.84584707859668e-07, + "loss": 0.6572, + "step": 71877 + }, + { + "epoch": 1.84, + "learning_rate": 6.84558449999813e-07, + "loss": 0.624, + "step": 71878 + }, + { + "epoch": 1.84, + "learning_rate": 6.845321923814771e-07, + "loss": 0.7363, + "step": 71879 + }, + { + "epoch": 1.84, + "learning_rate": 6.845059350046803e-07, + "loss": 0.4333, + "step": 71880 + }, + { + "epoch": 1.84, + "learning_rate": 6.844796778694427e-07, + "loss": 0.584, + "step": 71881 + }, + { + "epoch": 1.84, + "learning_rate": 6.844534209757844e-07, + "loss": 0.4863, + "step": 71882 + }, + { + "epoch": 1.84, + "learning_rate": 6.84427164323726e-07, + "loss": 0.8262, + "step": 71883 + }, + { + "epoch": 1.84, + "learning_rate": 6.844009079132869e-07, + "loss": 0.5225, + "step": 71884 + }, + { + "epoch": 1.84, + "learning_rate": 6.843746517444876e-07, + "loss": 0.7969, + "step": 71885 + }, + { + "epoch": 1.84, + "learning_rate": 6.843483958173484e-07, + "loss": 0.6367, + "step": 71886 + }, + { + "epoch": 1.84, + "learning_rate": 6.843221401318889e-07, + "loss": 0.7344, + "step": 71887 + }, + { + "epoch": 1.84, + "learning_rate": 6.842958846881293e-07, + "loss": 0.6118, + "step": 71888 + }, + { + "epoch": 1.84, + "learning_rate": 6.842696294860898e-07, + "loss": 0.8428, + "step": 71889 + }, + { + "epoch": 1.84, + "learning_rate": 6.842433745257908e-07, + "loss": 0.5112, + "step": 71890 + }, + { + "epoch": 1.84, + "learning_rate": 6.842171198072517e-07, + "loss": 0.5815, + "step": 71891 + }, + { + "epoch": 1.84, + "learning_rate": 6.841908653304933e-07, + "loss": 0.6211, + "step": 71892 + }, + { + "epoch": 1.84, + "learning_rate": 6.841646110955354e-07, + "loss": 0.75, + "step": 71893 + }, + { + "epoch": 1.84, + "learning_rate": 6.841383571023982e-07, + "loss": 0.6797, + "step": 71894 + }, + { + "epoch": 1.84, + "learning_rate": 6.841121033511015e-07, + "loss": 0.6025, + "step": 71895 + }, + { + "epoch": 1.84, + "learning_rate": 6.840858498416664e-07, + "loss": 0.5977, + "step": 71896 + }, + { + "epoch": 1.84, + "learning_rate": 6.840595965741115e-07, + "loss": 0.4937, + "step": 71897 + }, + { + "epoch": 1.84, + "learning_rate": 6.840333435484578e-07, + "loss": 0.46, + "step": 71898 + }, + { + "epoch": 1.84, + "learning_rate": 6.840070907647253e-07, + "loss": 0.8057, + "step": 71899 + }, + { + "epoch": 1.84, + "learning_rate": 6.83980838222934e-07, + "loss": 0.624, + "step": 71900 + }, + { + "epoch": 1.84, + "learning_rate": 6.83954585923104e-07, + "loss": 0.7393, + "step": 71901 + }, + { + "epoch": 1.84, + "learning_rate": 6.839283338652555e-07, + "loss": 0.7061, + "step": 71902 + }, + { + "epoch": 1.84, + "learning_rate": 6.839020820494083e-07, + "loss": 0.574, + "step": 71903 + }, + { + "epoch": 1.84, + "learning_rate": 6.838758304755831e-07, + "loss": 0.7075, + "step": 71904 + }, + { + "epoch": 1.84, + "learning_rate": 6.838495791437993e-07, + "loss": 0.5332, + "step": 71905 + }, + { + "epoch": 1.84, + "learning_rate": 6.838233280540778e-07, + "loss": 0.7002, + "step": 71906 + }, + { + "epoch": 1.84, + "learning_rate": 6.837970772064381e-07, + "loss": 0.4966, + "step": 71907 + }, + { + "epoch": 1.84, + "learning_rate": 6.837708266009002e-07, + "loss": 0.6743, + "step": 71908 + }, + { + "epoch": 1.84, + "learning_rate": 6.837445762374845e-07, + "loss": 0.749, + "step": 71909 + }, + { + "epoch": 1.84, + "learning_rate": 6.83718326116211e-07, + "loss": 0.6543, + "step": 71910 + }, + { + "epoch": 1.84, + "learning_rate": 6.836920762371e-07, + "loss": 0.6865, + "step": 71911 + }, + { + "epoch": 1.84, + "learning_rate": 6.836658266001713e-07, + "loss": 0.5815, + "step": 71912 + }, + { + "epoch": 1.84, + "learning_rate": 6.836395772054452e-07, + "loss": 0.6675, + "step": 71913 + }, + { + "epoch": 1.84, + "learning_rate": 6.836133280529415e-07, + "loss": 0.6729, + "step": 71914 + }, + { + "epoch": 1.84, + "learning_rate": 6.835870791426809e-07, + "loss": 0.5566, + "step": 71915 + }, + { + "epoch": 1.84, + "learning_rate": 6.835608304746833e-07, + "loss": 0.5083, + "step": 71916 + }, + { + "epoch": 1.84, + "learning_rate": 6.835345820489684e-07, + "loss": 0.6865, + "step": 71917 + }, + { + "epoch": 1.84, + "learning_rate": 6.835083338655562e-07, + "loss": 0.8174, + "step": 71918 + }, + { + "epoch": 1.84, + "learning_rate": 6.834820859244675e-07, + "loss": 0.4978, + "step": 71919 + }, + { + "epoch": 1.84, + "learning_rate": 6.834558382257216e-07, + "loss": 0.6104, + "step": 71920 + }, + { + "epoch": 1.84, + "learning_rate": 6.834295907693392e-07, + "loss": 0.7432, + "step": 71921 + }, + { + "epoch": 1.84, + "learning_rate": 6.834033435553403e-07, + "loss": 0.6758, + "step": 71922 + }, + { + "epoch": 1.84, + "learning_rate": 6.833770965837448e-07, + "loss": 0.6675, + "step": 71923 + }, + { + "epoch": 1.84, + "learning_rate": 6.833508498545729e-07, + "loss": 0.481, + "step": 71924 + }, + { + "epoch": 1.84, + "learning_rate": 6.833246033678448e-07, + "loss": 0.5518, + "step": 71925 + }, + { + "epoch": 1.84, + "learning_rate": 6.832983571235808e-07, + "loss": 0.7959, + "step": 71926 + }, + { + "epoch": 1.84, + "learning_rate": 6.832721111218001e-07, + "loss": 0.6743, + "step": 71927 + }, + { + "epoch": 1.84, + "learning_rate": 6.832458653625237e-07, + "loss": 0.6377, + "step": 71928 + }, + { + "epoch": 1.84, + "learning_rate": 6.832196198457712e-07, + "loss": 0.6484, + "step": 71929 + }, + { + "epoch": 1.84, + "learning_rate": 6.83193374571563e-07, + "loss": 0.6953, + "step": 71930 + }, + { + "epoch": 1.84, + "learning_rate": 6.831671295399189e-07, + "loss": 0.6572, + "step": 71931 + }, + { + "epoch": 1.84, + "learning_rate": 6.831408847508593e-07, + "loss": 0.6128, + "step": 71932 + }, + { + "epoch": 1.84, + "learning_rate": 6.83114640204404e-07, + "loss": 0.625, + "step": 71933 + }, + { + "epoch": 1.84, + "learning_rate": 6.830883959005736e-07, + "loss": 0.5781, + "step": 71934 + }, + { + "epoch": 1.84, + "learning_rate": 6.830621518393875e-07, + "loss": 0.7441, + "step": 71935 + }, + { + "epoch": 1.84, + "learning_rate": 6.830359080208666e-07, + "loss": 0.7012, + "step": 71936 + }, + { + "epoch": 1.84, + "learning_rate": 6.8300966444503e-07, + "loss": 0.4656, + "step": 71937 + }, + { + "epoch": 1.84, + "learning_rate": 6.829834211118986e-07, + "loss": 0.9277, + "step": 71938 + }, + { + "epoch": 1.84, + "learning_rate": 6.829571780214921e-07, + "loss": 0.5957, + "step": 71939 + }, + { + "epoch": 1.84, + "learning_rate": 6.829309351738308e-07, + "loss": 0.7393, + "step": 71940 + }, + { + "epoch": 1.84, + "learning_rate": 6.829046925689346e-07, + "loss": 0.5449, + "step": 71941 + }, + { + "epoch": 1.84, + "learning_rate": 6.828784502068238e-07, + "loss": 0.6914, + "step": 71942 + }, + { + "epoch": 1.84, + "learning_rate": 6.828522080875181e-07, + "loss": 0.627, + "step": 71943 + }, + { + "epoch": 1.84, + "learning_rate": 6.828259662110383e-07, + "loss": 0.4475, + "step": 71944 + }, + { + "epoch": 1.84, + "learning_rate": 6.827997245774037e-07, + "loss": 0.6816, + "step": 71945 + }, + { + "epoch": 1.84, + "learning_rate": 6.827734831866352e-07, + "loss": 0.7812, + "step": 71946 + }, + { + "epoch": 1.84, + "learning_rate": 6.827472420387523e-07, + "loss": 0.6045, + "step": 71947 + }, + { + "epoch": 1.84, + "learning_rate": 6.827210011337751e-07, + "loss": 0.5146, + "step": 71948 + }, + { + "epoch": 1.84, + "learning_rate": 6.82694760471724e-07, + "loss": 0.6953, + "step": 71949 + }, + { + "epoch": 1.84, + "learning_rate": 6.826685200526186e-07, + "loss": 0.7793, + "step": 71950 + }, + { + "epoch": 1.84, + "learning_rate": 6.826422798764797e-07, + "loss": 0.6992, + "step": 71951 + }, + { + "epoch": 1.84, + "learning_rate": 6.826160399433269e-07, + "loss": 0.623, + "step": 71952 + }, + { + "epoch": 1.84, + "learning_rate": 6.825898002531803e-07, + "loss": 0.6719, + "step": 71953 + }, + { + "epoch": 1.84, + "learning_rate": 6.825635608060603e-07, + "loss": 0.6309, + "step": 71954 + }, + { + "epoch": 1.84, + "learning_rate": 6.825373216019865e-07, + "loss": 0.5884, + "step": 71955 + }, + { + "epoch": 1.84, + "learning_rate": 6.825110826409797e-07, + "loss": 0.7344, + "step": 71956 + }, + { + "epoch": 1.84, + "learning_rate": 6.824848439230592e-07, + "loss": 0.5674, + "step": 71957 + }, + { + "epoch": 1.84, + "learning_rate": 6.824586054482455e-07, + "loss": 0.7544, + "step": 71958 + }, + { + "epoch": 1.84, + "learning_rate": 6.824323672165588e-07, + "loss": 0.4609, + "step": 71959 + }, + { + "epoch": 1.84, + "learning_rate": 6.824061292280187e-07, + "loss": 0.6768, + "step": 71960 + }, + { + "epoch": 1.84, + "learning_rate": 6.823798914826461e-07, + "loss": 0.5635, + "step": 71961 + }, + { + "epoch": 1.84, + "learning_rate": 6.823536539804602e-07, + "loss": 0.6738, + "step": 71962 + }, + { + "epoch": 1.84, + "learning_rate": 6.823274167214817e-07, + "loss": 0.6548, + "step": 71963 + }, + { + "epoch": 1.84, + "learning_rate": 6.823011797057303e-07, + "loss": 0.584, + "step": 71964 + }, + { + "epoch": 1.84, + "learning_rate": 6.822749429332267e-07, + "loss": 0.5879, + "step": 71965 + }, + { + "epoch": 1.84, + "learning_rate": 6.822487064039904e-07, + "loss": 0.6084, + "step": 71966 + }, + { + "epoch": 1.84, + "learning_rate": 6.822224701180414e-07, + "loss": 0.7021, + "step": 71967 + }, + { + "epoch": 1.84, + "learning_rate": 6.821962340754004e-07, + "loss": 0.584, + "step": 71968 + }, + { + "epoch": 1.84, + "learning_rate": 6.821699982760869e-07, + "loss": 0.6006, + "step": 71969 + }, + { + "epoch": 1.84, + "learning_rate": 6.821437627201212e-07, + "loss": 0.582, + "step": 71970 + }, + { + "epoch": 1.84, + "learning_rate": 6.821175274075235e-07, + "loss": 0.5576, + "step": 71971 + }, + { + "epoch": 1.84, + "learning_rate": 6.820912923383136e-07, + "loss": 0.6348, + "step": 71972 + }, + { + "epoch": 1.84, + "learning_rate": 6.82065057512512e-07, + "loss": 0.7881, + "step": 71973 + }, + { + "epoch": 1.84, + "learning_rate": 6.820388229301384e-07, + "loss": 0.7041, + "step": 71974 + }, + { + "epoch": 1.84, + "learning_rate": 6.820125885912132e-07, + "loss": 0.666, + "step": 71975 + }, + { + "epoch": 1.84, + "learning_rate": 6.819863544957566e-07, + "loss": 0.4943, + "step": 71976 + }, + { + "epoch": 1.84, + "learning_rate": 6.81960120643788e-07, + "loss": 0.626, + "step": 71977 + }, + { + "epoch": 1.84, + "learning_rate": 6.819338870353281e-07, + "loss": 0.5532, + "step": 71978 + }, + { + "epoch": 1.84, + "learning_rate": 6.819076536703966e-07, + "loss": 0.5605, + "step": 71979 + }, + { + "epoch": 1.84, + "learning_rate": 6.81881420549014e-07, + "loss": 0.6033, + "step": 71980 + }, + { + "epoch": 1.84, + "learning_rate": 6.818551876712e-07, + "loss": 0.8535, + "step": 71981 + }, + { + "epoch": 1.84, + "learning_rate": 6.818289550369749e-07, + "loss": 0.6143, + "step": 71982 + }, + { + "epoch": 1.84, + "learning_rate": 6.818027226463587e-07, + "loss": 0.5767, + "step": 71983 + }, + { + "epoch": 1.84, + "learning_rate": 6.817764904993717e-07, + "loss": 0.5742, + "step": 71984 + }, + { + "epoch": 1.85, + "learning_rate": 6.817502585960335e-07, + "loss": 0.6631, + "step": 71985 + }, + { + "epoch": 1.85, + "learning_rate": 6.817240269363652e-07, + "loss": 0.3938, + "step": 71986 + }, + { + "epoch": 1.85, + "learning_rate": 6.816977955203855e-07, + "loss": 0.4531, + "step": 71987 + }, + { + "epoch": 1.85, + "learning_rate": 6.816715643481155e-07, + "loss": 0.707, + "step": 71988 + }, + { + "epoch": 1.85, + "learning_rate": 6.816453334195747e-07, + "loss": 0.6211, + "step": 71989 + }, + { + "epoch": 1.85, + "learning_rate": 6.816191027347835e-07, + "loss": 0.5486, + "step": 71990 + }, + { + "epoch": 1.85, + "learning_rate": 6.815928722937619e-07, + "loss": 0.5894, + "step": 71991 + }, + { + "epoch": 1.85, + "learning_rate": 6.815666420965301e-07, + "loss": 0.666, + "step": 71992 + }, + { + "epoch": 1.85, + "learning_rate": 6.815404121431076e-07, + "loss": 0.7461, + "step": 71993 + }, + { + "epoch": 1.85, + "learning_rate": 6.815141824335155e-07, + "loss": 0.5216, + "step": 71994 + }, + { + "epoch": 1.85, + "learning_rate": 6.81487952967773e-07, + "loss": 0.6152, + "step": 71995 + }, + { + "epoch": 1.85, + "learning_rate": 6.814617237459011e-07, + "loss": 0.7944, + "step": 71996 + }, + { + "epoch": 1.85, + "learning_rate": 6.814354947679191e-07, + "loss": 0.7275, + "step": 71997 + }, + { + "epoch": 1.85, + "learning_rate": 6.814092660338471e-07, + "loss": 0.4966, + "step": 71998 + }, + { + "epoch": 1.85, + "learning_rate": 6.813830375437054e-07, + "loss": 0.5352, + "step": 71999 + }, + { + "epoch": 1.85, + "learning_rate": 6.813568092975139e-07, + "loss": 0.6914, + "step": 72000 + }, + { + "epoch": 1.85, + "learning_rate": 6.813305812952932e-07, + "loss": 0.5698, + "step": 72001 + }, + { + "epoch": 1.85, + "learning_rate": 6.813043535370626e-07, + "loss": 0.6689, + "step": 72002 + }, + { + "epoch": 1.85, + "learning_rate": 6.81278126022843e-07, + "loss": 0.6182, + "step": 72003 + }, + { + "epoch": 1.85, + "learning_rate": 6.812518987526537e-07, + "loss": 0.5825, + "step": 72004 + }, + { + "epoch": 1.85, + "learning_rate": 6.812256717265155e-07, + "loss": 0.7329, + "step": 72005 + }, + { + "epoch": 1.85, + "learning_rate": 6.811994449444483e-07, + "loss": 0.403, + "step": 72006 + }, + { + "epoch": 1.85, + "learning_rate": 6.811732184064718e-07, + "loss": 0.6594, + "step": 72007 + }, + { + "epoch": 1.85, + "learning_rate": 6.811469921126063e-07, + "loss": 0.5713, + "step": 72008 + }, + { + "epoch": 1.85, + "learning_rate": 6.811207660628718e-07, + "loss": 0.6953, + "step": 72009 + }, + { + "epoch": 1.85, + "learning_rate": 6.810945402572884e-07, + "loss": 0.5952, + "step": 72010 + }, + { + "epoch": 1.85, + "learning_rate": 6.810683146958764e-07, + "loss": 0.4596, + "step": 72011 + }, + { + "epoch": 1.85, + "learning_rate": 6.810420893786557e-07, + "loss": 0.6787, + "step": 72012 + }, + { + "epoch": 1.85, + "learning_rate": 6.810158643056464e-07, + "loss": 0.5884, + "step": 72013 + }, + { + "epoch": 1.85, + "learning_rate": 6.809896394768685e-07, + "loss": 0.6992, + "step": 72014 + }, + { + "epoch": 1.85, + "learning_rate": 6.809634148923423e-07, + "loss": 0.5386, + "step": 72015 + }, + { + "epoch": 1.85, + "learning_rate": 6.80937190552088e-07, + "loss": 0.7705, + "step": 72016 + }, + { + "epoch": 1.85, + "learning_rate": 6.80910966456125e-07, + "loss": 0.5146, + "step": 72017 + }, + { + "epoch": 1.85, + "learning_rate": 6.808847426044739e-07, + "loss": 0.4995, + "step": 72018 + }, + { + "epoch": 1.85, + "learning_rate": 6.808585189971546e-07, + "loss": 0.6206, + "step": 72019 + }, + { + "epoch": 1.85, + "learning_rate": 6.808322956341874e-07, + "loss": 0.635, + "step": 72020 + }, + { + "epoch": 1.85, + "learning_rate": 6.808060725155921e-07, + "loss": 0.718, + "step": 72021 + }, + { + "epoch": 1.85, + "learning_rate": 6.80779849641389e-07, + "loss": 0.5549, + "step": 72022 + }, + { + "epoch": 1.85, + "learning_rate": 6.807536270115981e-07, + "loss": 0.5674, + "step": 72023 + }, + { + "epoch": 1.85, + "learning_rate": 6.807274046262395e-07, + "loss": 0.3816, + "step": 72024 + }, + { + "epoch": 1.85, + "learning_rate": 6.807011824853333e-07, + "loss": 0.7437, + "step": 72025 + }, + { + "epoch": 1.85, + "learning_rate": 6.806749605888998e-07, + "loss": 0.4771, + "step": 72026 + }, + { + "epoch": 1.85, + "learning_rate": 6.806487389369582e-07, + "loss": 0.6289, + "step": 72027 + }, + { + "epoch": 1.85, + "learning_rate": 6.806225175295295e-07, + "loss": 0.9443, + "step": 72028 + }, + { + "epoch": 1.85, + "learning_rate": 6.805962963666331e-07, + "loss": 0.6846, + "step": 72029 + }, + { + "epoch": 1.85, + "learning_rate": 6.805700754482899e-07, + "loss": 0.5627, + "step": 72030 + }, + { + "epoch": 1.85, + "learning_rate": 6.805438547745191e-07, + "loss": 0.6914, + "step": 72031 + }, + { + "epoch": 1.85, + "learning_rate": 6.805176343453415e-07, + "loss": 0.6631, + "step": 72032 + }, + { + "epoch": 1.85, + "learning_rate": 6.804914141607766e-07, + "loss": 0.4561, + "step": 72033 + }, + { + "epoch": 1.85, + "learning_rate": 6.804651942208449e-07, + "loss": 0.7021, + "step": 72034 + }, + { + "epoch": 1.85, + "learning_rate": 6.804389745255661e-07, + "loss": 0.6973, + "step": 72035 + }, + { + "epoch": 1.85, + "learning_rate": 6.80412755074961e-07, + "loss": 0.4999, + "step": 72036 + }, + { + "epoch": 1.85, + "learning_rate": 6.80386535869049e-07, + "loss": 0.6582, + "step": 72037 + }, + { + "epoch": 1.85, + "learning_rate": 6.8036031690785e-07, + "loss": 0.5742, + "step": 72038 + }, + { + "epoch": 1.85, + "learning_rate": 6.803340981913845e-07, + "loss": 0.7861, + "step": 72039 + }, + { + "epoch": 1.85, + "learning_rate": 6.803078797196724e-07, + "loss": 0.6074, + "step": 72040 + }, + { + "epoch": 1.85, + "learning_rate": 6.802816614927341e-07, + "loss": 0.6807, + "step": 72041 + }, + { + "epoch": 1.85, + "learning_rate": 6.802554435105894e-07, + "loss": 0.4827, + "step": 72042 + }, + { + "epoch": 1.85, + "learning_rate": 6.802292257732583e-07, + "loss": 0.5864, + "step": 72043 + }, + { + "epoch": 1.85, + "learning_rate": 6.80203008280761e-07, + "loss": 0.6426, + "step": 72044 + }, + { + "epoch": 1.85, + "learning_rate": 6.801767910331176e-07, + "loss": 0.7129, + "step": 72045 + }, + { + "epoch": 1.85, + "learning_rate": 6.801505740303483e-07, + "loss": 0.7314, + "step": 72046 + }, + { + "epoch": 1.85, + "learning_rate": 6.801243572724728e-07, + "loss": 0.5811, + "step": 72047 + }, + { + "epoch": 1.85, + "learning_rate": 6.800981407595112e-07, + "loss": 0.6271, + "step": 72048 + }, + { + "epoch": 1.85, + "learning_rate": 6.80071924491484e-07, + "loss": 0.4873, + "step": 72049 + }, + { + "epoch": 1.85, + "learning_rate": 6.800457084684108e-07, + "loss": 0.6445, + "step": 72050 + }, + { + "epoch": 1.85, + "learning_rate": 6.80019492690312e-07, + "loss": 0.6206, + "step": 72051 + }, + { + "epoch": 1.85, + "learning_rate": 6.799932771572074e-07, + "loss": 0.7197, + "step": 72052 + }, + { + "epoch": 1.85, + "learning_rate": 6.799670618691175e-07, + "loss": 0.6152, + "step": 72053 + }, + { + "epoch": 1.85, + "learning_rate": 6.799408468260619e-07, + "loss": 0.6343, + "step": 72054 + }, + { + "epoch": 1.85, + "learning_rate": 6.799146320280611e-07, + "loss": 0.6465, + "step": 72055 + }, + { + "epoch": 1.85, + "learning_rate": 6.798884174751351e-07, + "loss": 0.6406, + "step": 72056 + }, + { + "epoch": 1.85, + "learning_rate": 6.798622031673035e-07, + "loss": 0.5859, + "step": 72057 + }, + { + "epoch": 1.85, + "learning_rate": 6.798359891045868e-07, + "loss": 0.9307, + "step": 72058 + }, + { + "epoch": 1.85, + "learning_rate": 6.798097752870049e-07, + "loss": 0.5825, + "step": 72059 + }, + { + "epoch": 1.85, + "learning_rate": 6.797835617145779e-07, + "loss": 0.1942, + "step": 72060 + }, + { + "epoch": 1.85, + "learning_rate": 6.79757348387326e-07, + "loss": 0.6782, + "step": 72061 + }, + { + "epoch": 1.85, + "learning_rate": 6.797311353052691e-07, + "loss": 0.5708, + "step": 72062 + }, + { + "epoch": 1.85, + "learning_rate": 6.797049224684272e-07, + "loss": 0.474, + "step": 72063 + }, + { + "epoch": 1.85, + "learning_rate": 6.796787098768206e-07, + "loss": 0.4849, + "step": 72064 + }, + { + "epoch": 1.85, + "learning_rate": 6.796524975304695e-07, + "loss": 0.6631, + "step": 72065 + }, + { + "epoch": 1.85, + "learning_rate": 6.796262854293939e-07, + "loss": 0.7188, + "step": 72066 + }, + { + "epoch": 1.85, + "learning_rate": 6.796000735736132e-07, + "loss": 0.6621, + "step": 72067 + }, + { + "epoch": 1.85, + "learning_rate": 6.795738619631483e-07, + "loss": 0.584, + "step": 72068 + }, + { + "epoch": 1.85, + "learning_rate": 6.795476505980188e-07, + "loss": 0.7383, + "step": 72069 + }, + { + "epoch": 1.85, + "learning_rate": 6.795214394782451e-07, + "loss": 0.48, + "step": 72070 + }, + { + "epoch": 1.85, + "learning_rate": 6.794952286038469e-07, + "loss": 0.6978, + "step": 72071 + }, + { + "epoch": 1.85, + "learning_rate": 6.794690179748446e-07, + "loss": 0.4983, + "step": 72072 + }, + { + "epoch": 1.85, + "learning_rate": 6.79442807591258e-07, + "loss": 0.6396, + "step": 72073 + }, + { + "epoch": 1.85, + "learning_rate": 6.794165974531074e-07, + "loss": 0.7197, + "step": 72074 + }, + { + "epoch": 1.85, + "learning_rate": 6.793903875604127e-07, + "loss": 0.6221, + "step": 72075 + }, + { + "epoch": 1.85, + "learning_rate": 6.793641779131947e-07, + "loss": 0.7065, + "step": 72076 + }, + { + "epoch": 1.85, + "learning_rate": 6.793379685114719e-07, + "loss": 0.5474, + "step": 72077 + }, + { + "epoch": 1.85, + "learning_rate": 6.793117593552657e-07, + "loss": 0.6147, + "step": 72078 + }, + { + "epoch": 1.85, + "learning_rate": 6.792855504445955e-07, + "loss": 0.668, + "step": 72079 + }, + { + "epoch": 1.85, + "learning_rate": 6.792593417794819e-07, + "loss": 0.7031, + "step": 72080 + }, + { + "epoch": 1.85, + "learning_rate": 6.792331333599443e-07, + "loss": 0.6182, + "step": 72081 + }, + { + "epoch": 1.85, + "learning_rate": 6.792069251860035e-07, + "loss": 0.6621, + "step": 72082 + }, + { + "epoch": 1.85, + "learning_rate": 6.791807172576789e-07, + "loss": 0.4097, + "step": 72083 + }, + { + "epoch": 1.85, + "learning_rate": 6.791545095749912e-07, + "loss": 0.5762, + "step": 72084 + }, + { + "epoch": 1.85, + "learning_rate": 6.791283021379599e-07, + "loss": 0.6875, + "step": 72085 + }, + { + "epoch": 1.85, + "learning_rate": 6.791020949466055e-07, + "loss": 0.4912, + "step": 72086 + }, + { + "epoch": 1.85, + "learning_rate": 6.790758880009479e-07, + "loss": 0.5928, + "step": 72087 + }, + { + "epoch": 1.85, + "learning_rate": 6.790496813010069e-07, + "loss": 0.5127, + "step": 72088 + }, + { + "epoch": 1.85, + "learning_rate": 6.790234748468029e-07, + "loss": 0.5928, + "step": 72089 + }, + { + "epoch": 1.85, + "learning_rate": 6.789972686383558e-07, + "loss": 0.5767, + "step": 72090 + }, + { + "epoch": 1.85, + "learning_rate": 6.78971062675686e-07, + "loss": 0.6436, + "step": 72091 + }, + { + "epoch": 1.85, + "learning_rate": 6.789448569588128e-07, + "loss": 0.6445, + "step": 72092 + }, + { + "epoch": 1.85, + "learning_rate": 6.789186514877572e-07, + "loss": 0.5986, + "step": 72093 + }, + { + "epoch": 1.85, + "learning_rate": 6.788924462625385e-07, + "loss": 0.5586, + "step": 72094 + }, + { + "epoch": 1.85, + "learning_rate": 6.788662412831774e-07, + "loss": 0.6533, + "step": 72095 + }, + { + "epoch": 1.85, + "learning_rate": 6.788400365496937e-07, + "loss": 0.6152, + "step": 72096 + }, + { + "epoch": 1.85, + "learning_rate": 6.788138320621073e-07, + "loss": 0.6213, + "step": 72097 + }, + { + "epoch": 1.85, + "learning_rate": 6.787876278204382e-07, + "loss": 0.5542, + "step": 72098 + }, + { + "epoch": 1.85, + "learning_rate": 6.787614238247069e-07, + "loss": 0.5347, + "step": 72099 + }, + { + "epoch": 1.85, + "learning_rate": 6.787352200749328e-07, + "loss": 0.48, + "step": 72100 + }, + { + "epoch": 1.85, + "learning_rate": 6.787090165711368e-07, + "loss": 0.5083, + "step": 72101 + }, + { + "epoch": 1.85, + "learning_rate": 6.786828133133382e-07, + "loss": 0.5618, + "step": 72102 + }, + { + "epoch": 1.85, + "learning_rate": 6.786566103015576e-07, + "loss": 0.6455, + "step": 72103 + }, + { + "epoch": 1.85, + "learning_rate": 6.786304075358146e-07, + "loss": 0.4907, + "step": 72104 + }, + { + "epoch": 1.85, + "learning_rate": 6.786042050161299e-07, + "loss": 0.4834, + "step": 72105 + }, + { + "epoch": 1.85, + "learning_rate": 6.785780027425233e-07, + "loss": 0.6133, + "step": 72106 + }, + { + "epoch": 1.85, + "learning_rate": 6.785518007150144e-07, + "loss": 0.7734, + "step": 72107 + }, + { + "epoch": 1.85, + "learning_rate": 6.785255989336236e-07, + "loss": 0.538, + "step": 72108 + }, + { + "epoch": 1.85, + "learning_rate": 6.78499397398371e-07, + "loss": 0.5981, + "step": 72109 + }, + { + "epoch": 1.85, + "learning_rate": 6.784731961092767e-07, + "loss": 0.7373, + "step": 72110 + }, + { + "epoch": 1.85, + "learning_rate": 6.784469950663605e-07, + "loss": 0.7007, + "step": 72111 + }, + { + "epoch": 1.85, + "learning_rate": 6.78420794269643e-07, + "loss": 0.7119, + "step": 72112 + }, + { + "epoch": 1.85, + "learning_rate": 6.783945937191436e-07, + "loss": 0.6279, + "step": 72113 + }, + { + "epoch": 1.85, + "learning_rate": 6.783683934148827e-07, + "loss": 0.5635, + "step": 72114 + }, + { + "epoch": 1.85, + "learning_rate": 6.783421933568807e-07, + "loss": 0.4153, + "step": 72115 + }, + { + "epoch": 1.85, + "learning_rate": 6.783159935451572e-07, + "loss": 0.431, + "step": 72116 + }, + { + "epoch": 1.85, + "learning_rate": 6.782897939797319e-07, + "loss": 0.627, + "step": 72117 + }, + { + "epoch": 1.85, + "learning_rate": 6.782635946606257e-07, + "loss": 0.6426, + "step": 72118 + }, + { + "epoch": 1.85, + "learning_rate": 6.78237395587858e-07, + "loss": 0.7334, + "step": 72119 + }, + { + "epoch": 1.85, + "learning_rate": 6.782111967614495e-07, + "loss": 0.6953, + "step": 72120 + }, + { + "epoch": 1.85, + "learning_rate": 6.781849981814193e-07, + "loss": 0.4045, + "step": 72121 + }, + { + "epoch": 1.85, + "learning_rate": 6.781587998477887e-07, + "loss": 0.5488, + "step": 72122 + }, + { + "epoch": 1.85, + "learning_rate": 6.781326017605766e-07, + "loss": 0.5894, + "step": 72123 + }, + { + "epoch": 1.85, + "learning_rate": 6.781064039198039e-07, + "loss": 0.6777, + "step": 72124 + }, + { + "epoch": 1.85, + "learning_rate": 6.780802063254904e-07, + "loss": 0.5144, + "step": 72125 + }, + { + "epoch": 1.85, + "learning_rate": 6.780540089776559e-07, + "loss": 0.5483, + "step": 72126 + }, + { + "epoch": 1.85, + "learning_rate": 6.780278118763207e-07, + "loss": 0.6387, + "step": 72127 + }, + { + "epoch": 1.85, + "learning_rate": 6.780016150215046e-07, + "loss": 0.5122, + "step": 72128 + }, + { + "epoch": 1.85, + "learning_rate": 6.77975418413228e-07, + "loss": 0.7075, + "step": 72129 + }, + { + "epoch": 1.85, + "learning_rate": 6.779492220515109e-07, + "loss": 0.6558, + "step": 72130 + }, + { + "epoch": 1.85, + "learning_rate": 6.779230259363731e-07, + "loss": 0.6934, + "step": 72131 + }, + { + "epoch": 1.85, + "learning_rate": 6.778968300678349e-07, + "loss": 0.8057, + "step": 72132 + }, + { + "epoch": 1.85, + "learning_rate": 6.778706344459163e-07, + "loss": 0.6133, + "step": 72133 + }, + { + "epoch": 1.85, + "learning_rate": 6.778444390706375e-07, + "loss": 0.71, + "step": 72134 + }, + { + "epoch": 1.85, + "learning_rate": 6.778182439420184e-07, + "loss": 0.5015, + "step": 72135 + }, + { + "epoch": 1.85, + "learning_rate": 6.777920490600788e-07, + "loss": 0.5278, + "step": 72136 + }, + { + "epoch": 1.85, + "learning_rate": 6.777658544248392e-07, + "loss": 0.665, + "step": 72137 + }, + { + "epoch": 1.85, + "learning_rate": 6.777396600363193e-07, + "loss": 0.6289, + "step": 72138 + }, + { + "epoch": 1.85, + "learning_rate": 6.777134658945393e-07, + "loss": 0.7441, + "step": 72139 + }, + { + "epoch": 1.85, + "learning_rate": 6.776872719995195e-07, + "loss": 0.4614, + "step": 72140 + }, + { + "epoch": 1.85, + "learning_rate": 6.776610783512796e-07, + "loss": 0.4663, + "step": 72141 + }, + { + "epoch": 1.85, + "learning_rate": 6.776348849498397e-07, + "loss": 0.7773, + "step": 72142 + }, + { + "epoch": 1.85, + "learning_rate": 6.776086917952202e-07, + "loss": 0.5244, + "step": 72143 + }, + { + "epoch": 1.85, + "learning_rate": 6.775824988874406e-07, + "loss": 0.7305, + "step": 72144 + }, + { + "epoch": 1.85, + "learning_rate": 6.775563062265217e-07, + "loss": 0.6875, + "step": 72145 + }, + { + "epoch": 1.85, + "learning_rate": 6.775301138124829e-07, + "loss": 0.624, + "step": 72146 + }, + { + "epoch": 1.85, + "learning_rate": 6.775039216453442e-07, + "loss": 0.3892, + "step": 72147 + }, + { + "epoch": 1.85, + "learning_rate": 6.774777297251261e-07, + "loss": 0.5801, + "step": 72148 + }, + { + "epoch": 1.85, + "learning_rate": 6.774515380518486e-07, + "loss": 0.5425, + "step": 72149 + }, + { + "epoch": 1.85, + "learning_rate": 6.774253466255315e-07, + "loss": 0.6113, + "step": 72150 + }, + { + "epoch": 1.85, + "learning_rate": 6.773991554461951e-07, + "loss": 0.6602, + "step": 72151 + }, + { + "epoch": 1.85, + "learning_rate": 6.77372964513859e-07, + "loss": 0.6309, + "step": 72152 + }, + { + "epoch": 1.85, + "learning_rate": 6.773467738285439e-07, + "loss": 0.6758, + "step": 72153 + }, + { + "epoch": 1.85, + "learning_rate": 6.773205833902693e-07, + "loss": 0.6592, + "step": 72154 + }, + { + "epoch": 1.85, + "learning_rate": 6.772943931990559e-07, + "loss": 0.5018, + "step": 72155 + }, + { + "epoch": 1.85, + "learning_rate": 6.772682032549232e-07, + "loss": 0.6357, + "step": 72156 + }, + { + "epoch": 1.85, + "learning_rate": 6.772420135578911e-07, + "loss": 0.5083, + "step": 72157 + }, + { + "epoch": 1.85, + "learning_rate": 6.772158241079801e-07, + "loss": 0.6201, + "step": 72158 + }, + { + "epoch": 1.85, + "learning_rate": 6.771896349052102e-07, + "loss": 0.6738, + "step": 72159 + }, + { + "epoch": 1.85, + "learning_rate": 6.771634459496012e-07, + "loss": 0.6309, + "step": 72160 + }, + { + "epoch": 1.85, + "learning_rate": 6.771372572411734e-07, + "loss": 0.7139, + "step": 72161 + }, + { + "epoch": 1.85, + "learning_rate": 6.771110687799468e-07, + "loss": 0.6807, + "step": 72162 + }, + { + "epoch": 1.85, + "learning_rate": 6.770848805659413e-07, + "loss": 0.499, + "step": 72163 + }, + { + "epoch": 1.85, + "learning_rate": 6.77058692599177e-07, + "loss": 0.7451, + "step": 72164 + }, + { + "epoch": 1.85, + "learning_rate": 6.770325048796745e-07, + "loss": 0.7559, + "step": 72165 + }, + { + "epoch": 1.85, + "learning_rate": 6.770063174074531e-07, + "loss": 0.6592, + "step": 72166 + }, + { + "epoch": 1.85, + "learning_rate": 6.769801301825329e-07, + "loss": 0.7578, + "step": 72167 + }, + { + "epoch": 1.85, + "learning_rate": 6.769539432049343e-07, + "loss": 0.5806, + "step": 72168 + }, + { + "epoch": 1.85, + "learning_rate": 6.76927756474677e-07, + "loss": 0.6621, + "step": 72169 + }, + { + "epoch": 1.85, + "learning_rate": 6.769015699917815e-07, + "loss": 0.5825, + "step": 72170 + }, + { + "epoch": 1.85, + "learning_rate": 6.768753837562674e-07, + "loss": 0.5085, + "step": 72171 + }, + { + "epoch": 1.85, + "learning_rate": 6.768491977681552e-07, + "loss": 0.5522, + "step": 72172 + }, + { + "epoch": 1.85, + "learning_rate": 6.768230120274645e-07, + "loss": 0.5962, + "step": 72173 + }, + { + "epoch": 1.85, + "learning_rate": 6.767968265342157e-07, + "loss": 0.8477, + "step": 72174 + }, + { + "epoch": 1.85, + "learning_rate": 6.767706412884289e-07, + "loss": 0.6377, + "step": 72175 + }, + { + "epoch": 1.85, + "learning_rate": 6.767444562901236e-07, + "loss": 0.4, + "step": 72176 + }, + { + "epoch": 1.85, + "learning_rate": 6.767182715393205e-07, + "loss": 0.5615, + "step": 72177 + }, + { + "epoch": 1.85, + "learning_rate": 6.76692087036039e-07, + "loss": 0.5874, + "step": 72178 + }, + { + "epoch": 1.85, + "learning_rate": 6.766659027802999e-07, + "loss": 0.6304, + "step": 72179 + }, + { + "epoch": 1.85, + "learning_rate": 6.766397187721224e-07, + "loss": 0.6343, + "step": 72180 + }, + { + "epoch": 1.85, + "learning_rate": 6.766135350115274e-07, + "loss": 0.5796, + "step": 72181 + }, + { + "epoch": 1.85, + "learning_rate": 6.765873514985343e-07, + "loss": 0.52, + "step": 72182 + }, + { + "epoch": 1.85, + "learning_rate": 6.765611682331636e-07, + "loss": 0.5525, + "step": 72183 + }, + { + "epoch": 1.85, + "learning_rate": 6.765349852154349e-07, + "loss": 0.5918, + "step": 72184 + }, + { + "epoch": 1.85, + "learning_rate": 6.765088024453691e-07, + "loss": 0.6362, + "step": 72185 + }, + { + "epoch": 1.85, + "learning_rate": 6.76482619922985e-07, + "loss": 0.6221, + "step": 72186 + }, + { + "epoch": 1.85, + "learning_rate": 6.764564376483035e-07, + "loss": 0.6455, + "step": 72187 + }, + { + "epoch": 1.85, + "learning_rate": 6.764302556213442e-07, + "loss": 0.5659, + "step": 72188 + }, + { + "epoch": 1.85, + "learning_rate": 6.764040738421277e-07, + "loss": 0.7861, + "step": 72189 + }, + { + "epoch": 1.85, + "learning_rate": 6.763778923106733e-07, + "loss": 0.5981, + "step": 72190 + }, + { + "epoch": 1.85, + "learning_rate": 6.763517110270019e-07, + "loss": 0.4326, + "step": 72191 + }, + { + "epoch": 1.85, + "learning_rate": 6.763255299911328e-07, + "loss": 0.5728, + "step": 72192 + }, + { + "epoch": 1.85, + "learning_rate": 6.762993492030866e-07, + "loss": 0.4995, + "step": 72193 + }, + { + "epoch": 1.85, + "learning_rate": 6.762731686628829e-07, + "loss": 0.5723, + "step": 72194 + }, + { + "epoch": 1.85, + "learning_rate": 6.762469883705424e-07, + "loss": 0.6006, + "step": 72195 + }, + { + "epoch": 1.85, + "learning_rate": 6.762208083260843e-07, + "loss": 0.6216, + "step": 72196 + }, + { + "epoch": 1.85, + "learning_rate": 6.76194628529529e-07, + "loss": 0.7324, + "step": 72197 + }, + { + "epoch": 1.85, + "learning_rate": 6.761684489808967e-07, + "loss": 0.6167, + "step": 72198 + }, + { + "epoch": 1.85, + "learning_rate": 6.761422696802073e-07, + "loss": 0.6074, + "step": 72199 + }, + { + "epoch": 1.85, + "learning_rate": 6.761160906274808e-07, + "loss": 0.6445, + "step": 72200 + }, + { + "epoch": 1.85, + "learning_rate": 6.760899118227373e-07, + "loss": 0.582, + "step": 72201 + }, + { + "epoch": 1.85, + "learning_rate": 6.760637332659971e-07, + "loss": 0.5103, + "step": 72202 + }, + { + "epoch": 1.85, + "learning_rate": 6.760375549572796e-07, + "loss": 0.479, + "step": 72203 + }, + { + "epoch": 1.85, + "learning_rate": 6.760113768966057e-07, + "loss": 0.6885, + "step": 72204 + }, + { + "epoch": 1.85, + "learning_rate": 6.759851990839951e-07, + "loss": 0.5352, + "step": 72205 + }, + { + "epoch": 1.85, + "learning_rate": 6.759590215194675e-07, + "loss": 0.6318, + "step": 72206 + }, + { + "epoch": 1.85, + "learning_rate": 6.75932844203043e-07, + "loss": 0.498, + "step": 72207 + }, + { + "epoch": 1.85, + "learning_rate": 6.75906667134742e-07, + "loss": 0.6299, + "step": 72208 + }, + { + "epoch": 1.85, + "learning_rate": 6.758804903145841e-07, + "loss": 0.6436, + "step": 72209 + }, + { + "epoch": 1.85, + "learning_rate": 6.758543137425898e-07, + "loss": 0.5034, + "step": 72210 + }, + { + "epoch": 1.85, + "learning_rate": 6.758281374187789e-07, + "loss": 0.627, + "step": 72211 + }, + { + "epoch": 1.85, + "learning_rate": 6.758019613431716e-07, + "loss": 0.5159, + "step": 72212 + }, + { + "epoch": 1.85, + "learning_rate": 6.757757855157877e-07, + "loss": 0.6265, + "step": 72213 + }, + { + "epoch": 1.85, + "learning_rate": 6.757496099366476e-07, + "loss": 0.667, + "step": 72214 + }, + { + "epoch": 1.85, + "learning_rate": 6.757234346057712e-07, + "loss": 0.7324, + "step": 72215 + }, + { + "epoch": 1.85, + "learning_rate": 6.75697259523178e-07, + "loss": 0.6045, + "step": 72216 + }, + { + "epoch": 1.85, + "learning_rate": 6.756710846888888e-07, + "loss": 0.6689, + "step": 72217 + }, + { + "epoch": 1.85, + "learning_rate": 6.756449101029231e-07, + "loss": 0.6475, + "step": 72218 + }, + { + "epoch": 1.85, + "learning_rate": 6.756187357653014e-07, + "loss": 0.8057, + "step": 72219 + }, + { + "epoch": 1.85, + "learning_rate": 6.755925616760433e-07, + "loss": 0.5098, + "step": 72220 + }, + { + "epoch": 1.85, + "learning_rate": 6.755663878351693e-07, + "loss": 0.6641, + "step": 72221 + }, + { + "epoch": 1.85, + "learning_rate": 6.755402142426991e-07, + "loss": 0.4058, + "step": 72222 + }, + { + "epoch": 1.85, + "learning_rate": 6.755140408986529e-07, + "loss": 0.6992, + "step": 72223 + }, + { + "epoch": 1.85, + "learning_rate": 6.754878678030505e-07, + "loss": 0.7188, + "step": 72224 + }, + { + "epoch": 1.85, + "learning_rate": 6.754616949559126e-07, + "loss": 0.4904, + "step": 72225 + }, + { + "epoch": 1.85, + "learning_rate": 6.754355223572582e-07, + "loss": 0.6665, + "step": 72226 + }, + { + "epoch": 1.85, + "learning_rate": 6.754093500071082e-07, + "loss": 0.7207, + "step": 72227 + }, + { + "epoch": 1.85, + "learning_rate": 6.75383177905482e-07, + "loss": 0.7021, + "step": 72228 + }, + { + "epoch": 1.85, + "learning_rate": 6.753570060524003e-07, + "loss": 0.5737, + "step": 72229 + }, + { + "epoch": 1.85, + "learning_rate": 6.753308344478826e-07, + "loss": 0.637, + "step": 72230 + }, + { + "epoch": 1.85, + "learning_rate": 6.753046630919493e-07, + "loss": 0.4878, + "step": 72231 + }, + { + "epoch": 1.85, + "learning_rate": 6.752784919846201e-07, + "loss": 0.5542, + "step": 72232 + }, + { + "epoch": 1.85, + "learning_rate": 6.752523211259155e-07, + "loss": 0.5391, + "step": 72233 + }, + { + "epoch": 1.85, + "learning_rate": 6.752261505158549e-07, + "loss": 0.5688, + "step": 72234 + }, + { + "epoch": 1.85, + "learning_rate": 6.751999801544595e-07, + "loss": 0.5654, + "step": 72235 + }, + { + "epoch": 1.85, + "learning_rate": 6.751738100417479e-07, + "loss": 0.5557, + "step": 72236 + }, + { + "epoch": 1.85, + "learning_rate": 6.751476401777408e-07, + "loss": 0.7617, + "step": 72237 + }, + { + "epoch": 1.85, + "learning_rate": 6.751214705624584e-07, + "loss": 0.7559, + "step": 72238 + }, + { + "epoch": 1.85, + "learning_rate": 6.750953011959204e-07, + "loss": 0.623, + "step": 72239 + }, + { + "epoch": 1.85, + "learning_rate": 6.75069132078147e-07, + "loss": 0.6777, + "step": 72240 + }, + { + "epoch": 1.85, + "learning_rate": 6.750429632091584e-07, + "loss": 0.6953, + "step": 72241 + }, + { + "epoch": 1.85, + "learning_rate": 6.75016794588974e-07, + "loss": 0.6587, + "step": 72242 + }, + { + "epoch": 1.85, + "learning_rate": 6.749906262176147e-07, + "loss": 0.7109, + "step": 72243 + }, + { + "epoch": 1.85, + "learning_rate": 6.749644580950999e-07, + "loss": 0.5513, + "step": 72244 + }, + { + "epoch": 1.85, + "learning_rate": 6.749382902214503e-07, + "loss": 0.632, + "step": 72245 + }, + { + "epoch": 1.85, + "learning_rate": 6.749121225966853e-07, + "loss": 0.5181, + "step": 72246 + }, + { + "epoch": 1.85, + "learning_rate": 6.74885955220825e-07, + "loss": 0.6934, + "step": 72247 + }, + { + "epoch": 1.85, + "learning_rate": 6.748597880938896e-07, + "loss": 0.5186, + "step": 72248 + }, + { + "epoch": 1.85, + "learning_rate": 6.748336212158989e-07, + "loss": 0.6279, + "step": 72249 + }, + { + "epoch": 1.85, + "learning_rate": 6.748074545868736e-07, + "loss": 0.7354, + "step": 72250 + }, + { + "epoch": 1.85, + "learning_rate": 6.747812882068329e-07, + "loss": 0.6377, + "step": 72251 + }, + { + "epoch": 1.85, + "learning_rate": 6.747551220757974e-07, + "loss": 0.6885, + "step": 72252 + }, + { + "epoch": 1.85, + "learning_rate": 6.747289561937868e-07, + "loss": 0.8076, + "step": 72253 + }, + { + "epoch": 1.85, + "learning_rate": 6.747027905608216e-07, + "loss": 0.5942, + "step": 72254 + }, + { + "epoch": 1.85, + "learning_rate": 6.746766251769216e-07, + "loss": 0.6641, + "step": 72255 + }, + { + "epoch": 1.85, + "learning_rate": 6.746504600421065e-07, + "loss": 0.6099, + "step": 72256 + }, + { + "epoch": 1.85, + "learning_rate": 6.746242951563963e-07, + "loss": 0.6641, + "step": 72257 + }, + { + "epoch": 1.85, + "learning_rate": 6.745981305198117e-07, + "loss": 0.6162, + "step": 72258 + }, + { + "epoch": 1.85, + "learning_rate": 6.745719661323721e-07, + "loss": 0.6213, + "step": 72259 + }, + { + "epoch": 1.85, + "learning_rate": 6.74545801994098e-07, + "loss": 0.6953, + "step": 72260 + }, + { + "epoch": 1.85, + "learning_rate": 6.745196381050089e-07, + "loss": 0.7695, + "step": 72261 + }, + { + "epoch": 1.85, + "learning_rate": 6.744934744651255e-07, + "loss": 0.7451, + "step": 72262 + }, + { + "epoch": 1.85, + "learning_rate": 6.744673110744672e-07, + "loss": 0.8271, + "step": 72263 + }, + { + "epoch": 1.85, + "learning_rate": 6.744411479330545e-07, + "loss": 0.6123, + "step": 72264 + }, + { + "epoch": 1.85, + "learning_rate": 6.744149850409076e-07, + "loss": 0.5061, + "step": 72265 + }, + { + "epoch": 1.85, + "learning_rate": 6.743888223980455e-07, + "loss": 0.7695, + "step": 72266 + }, + { + "epoch": 1.85, + "learning_rate": 6.743626600044893e-07, + "loss": 0.6079, + "step": 72267 + }, + { + "epoch": 1.85, + "learning_rate": 6.743364978602584e-07, + "loss": 0.3853, + "step": 72268 + }, + { + "epoch": 1.85, + "learning_rate": 6.743103359653732e-07, + "loss": 0.5908, + "step": 72269 + }, + { + "epoch": 1.85, + "learning_rate": 6.742841743198535e-07, + "loss": 0.6846, + "step": 72270 + }, + { + "epoch": 1.85, + "learning_rate": 6.742580129237196e-07, + "loss": 0.4497, + "step": 72271 + }, + { + "epoch": 1.85, + "learning_rate": 6.742318517769911e-07, + "loss": 0.5127, + "step": 72272 + }, + { + "epoch": 1.85, + "learning_rate": 6.742056908796884e-07, + "loss": 0.6992, + "step": 72273 + }, + { + "epoch": 1.85, + "learning_rate": 6.741795302318314e-07, + "loss": 0.5464, + "step": 72274 + }, + { + "epoch": 1.85, + "learning_rate": 6.741533698334408e-07, + "loss": 0.5869, + "step": 72275 + }, + { + "epoch": 1.85, + "learning_rate": 6.741272096845354e-07, + "loss": 0.6094, + "step": 72276 + }, + { + "epoch": 1.85, + "learning_rate": 6.741010497851358e-07, + "loss": 0.6562, + "step": 72277 + }, + { + "epoch": 1.85, + "learning_rate": 6.74074890135262e-07, + "loss": 0.6079, + "step": 72278 + }, + { + "epoch": 1.85, + "learning_rate": 6.740487307349343e-07, + "loss": 0.5122, + "step": 72279 + }, + { + "epoch": 1.85, + "learning_rate": 6.740225715841721e-07, + "loss": 0.3499, + "step": 72280 + }, + { + "epoch": 1.85, + "learning_rate": 6.739964126829963e-07, + "loss": 0.7139, + "step": 72281 + }, + { + "epoch": 1.85, + "learning_rate": 6.73970254031426e-07, + "loss": 0.5991, + "step": 72282 + }, + { + "epoch": 1.85, + "learning_rate": 6.73944095629482e-07, + "loss": 0.5159, + "step": 72283 + }, + { + "epoch": 1.85, + "learning_rate": 6.739179374771837e-07, + "loss": 0.6914, + "step": 72284 + }, + { + "epoch": 1.85, + "learning_rate": 6.73891779574552e-07, + "loss": 0.749, + "step": 72285 + }, + { + "epoch": 1.85, + "learning_rate": 6.738656219216061e-07, + "loss": 0.7656, + "step": 72286 + }, + { + "epoch": 1.85, + "learning_rate": 6.738394645183662e-07, + "loss": 0.3787, + "step": 72287 + }, + { + "epoch": 1.85, + "learning_rate": 6.738133073648525e-07, + "loss": 0.7334, + "step": 72288 + }, + { + "epoch": 1.85, + "learning_rate": 6.737871504610848e-07, + "loss": 0.7256, + "step": 72289 + }, + { + "epoch": 1.85, + "learning_rate": 6.737609938070833e-07, + "loss": 0.667, + "step": 72290 + }, + { + "epoch": 1.85, + "learning_rate": 6.737348374028681e-07, + "loss": 0.5234, + "step": 72291 + }, + { + "epoch": 1.85, + "learning_rate": 6.737086812484592e-07, + "loss": 0.5002, + "step": 72292 + }, + { + "epoch": 1.85, + "learning_rate": 6.736825253438764e-07, + "loss": 0.75, + "step": 72293 + }, + { + "epoch": 1.85, + "learning_rate": 6.7365636968914e-07, + "loss": 0.4915, + "step": 72294 + }, + { + "epoch": 1.85, + "learning_rate": 6.736302142842702e-07, + "loss": 0.6436, + "step": 72295 + }, + { + "epoch": 1.85, + "learning_rate": 6.736040591292865e-07, + "loss": 0.437, + "step": 72296 + }, + { + "epoch": 1.85, + "learning_rate": 6.735779042242089e-07, + "loss": 0.6523, + "step": 72297 + }, + { + "epoch": 1.85, + "learning_rate": 6.73551749569058e-07, + "loss": 0.6182, + "step": 72298 + }, + { + "epoch": 1.85, + "learning_rate": 6.735255951638532e-07, + "loss": 0.6284, + "step": 72299 + }, + { + "epoch": 1.85, + "learning_rate": 6.734994410086153e-07, + "loss": 0.6265, + "step": 72300 + }, + { + "epoch": 1.85, + "learning_rate": 6.734732871033634e-07, + "loss": 0.668, + "step": 72301 + }, + { + "epoch": 1.85, + "learning_rate": 6.734471334481182e-07, + "loss": 0.5464, + "step": 72302 + }, + { + "epoch": 1.85, + "learning_rate": 6.734209800428994e-07, + "loss": 0.7344, + "step": 72303 + }, + { + "epoch": 1.85, + "learning_rate": 6.733948268877273e-07, + "loss": 0.7803, + "step": 72304 + }, + { + "epoch": 1.85, + "learning_rate": 6.73368673982622e-07, + "loss": 0.5859, + "step": 72305 + }, + { + "epoch": 1.85, + "learning_rate": 6.73342521327603e-07, + "loss": 0.5728, + "step": 72306 + }, + { + "epoch": 1.85, + "learning_rate": 6.733163689226906e-07, + "loss": 0.6133, + "step": 72307 + }, + { + "epoch": 1.85, + "learning_rate": 6.732902167679047e-07, + "loss": 0.6284, + "step": 72308 + }, + { + "epoch": 1.85, + "learning_rate": 6.732640648632657e-07, + "loss": 0.6953, + "step": 72309 + }, + { + "epoch": 1.85, + "learning_rate": 6.73237913208793e-07, + "loss": 0.6768, + "step": 72310 + }, + { + "epoch": 1.85, + "learning_rate": 6.732117618045074e-07, + "loss": 0.6226, + "step": 72311 + }, + { + "epoch": 1.85, + "learning_rate": 6.731856106504285e-07, + "loss": 0.5443, + "step": 72312 + }, + { + "epoch": 1.85, + "learning_rate": 6.731594597465762e-07, + "loss": 0.6289, + "step": 72313 + }, + { + "epoch": 1.85, + "learning_rate": 6.731333090929707e-07, + "loss": 0.4641, + "step": 72314 + }, + { + "epoch": 1.85, + "learning_rate": 6.731071586896324e-07, + "loss": 0.5935, + "step": 72315 + }, + { + "epoch": 1.85, + "learning_rate": 6.730810085365804e-07, + "loss": 0.6738, + "step": 72316 + }, + { + "epoch": 1.85, + "learning_rate": 6.730548586338355e-07, + "loss": 0.6377, + "step": 72317 + }, + { + "epoch": 1.85, + "learning_rate": 6.730287089814173e-07, + "loss": 0.5405, + "step": 72318 + }, + { + "epoch": 1.85, + "learning_rate": 6.73002559579346e-07, + "loss": 0.6577, + "step": 72319 + }, + { + "epoch": 1.85, + "learning_rate": 6.729764104276416e-07, + "loss": 0.5342, + "step": 72320 + }, + { + "epoch": 1.85, + "learning_rate": 6.729502615263242e-07, + "loss": 0.5596, + "step": 72321 + }, + { + "epoch": 1.85, + "learning_rate": 6.729241128754135e-07, + "loss": 0.7031, + "step": 72322 + }, + { + "epoch": 1.85, + "learning_rate": 6.728979644749302e-07, + "loss": 0.6182, + "step": 72323 + }, + { + "epoch": 1.85, + "learning_rate": 6.728718163248934e-07, + "loss": 0.5918, + "step": 72324 + }, + { + "epoch": 1.85, + "learning_rate": 6.728456684253241e-07, + "loss": 0.6201, + "step": 72325 + }, + { + "epoch": 1.85, + "learning_rate": 6.728195207762418e-07, + "loss": 0.5015, + "step": 72326 + }, + { + "epoch": 1.85, + "learning_rate": 6.727933733776663e-07, + "loss": 0.7217, + "step": 72327 + }, + { + "epoch": 1.85, + "learning_rate": 6.727672262296179e-07, + "loss": 0.6084, + "step": 72328 + }, + { + "epoch": 1.85, + "learning_rate": 6.727410793321166e-07, + "loss": 0.7148, + "step": 72329 + }, + { + "epoch": 1.85, + "learning_rate": 6.727149326851824e-07, + "loss": 0.686, + "step": 72330 + }, + { + "epoch": 1.85, + "learning_rate": 6.726887862888354e-07, + "loss": 0.709, + "step": 72331 + }, + { + "epoch": 1.85, + "learning_rate": 6.726626401430953e-07, + "loss": 0.4263, + "step": 72332 + }, + { + "epoch": 1.85, + "learning_rate": 6.726364942479827e-07, + "loss": 0.7207, + "step": 72333 + }, + { + "epoch": 1.85, + "learning_rate": 6.726103486035171e-07, + "loss": 0.6934, + "step": 72334 + }, + { + "epoch": 1.85, + "learning_rate": 6.725842032097189e-07, + "loss": 0.624, + "step": 72335 + }, + { + "epoch": 1.85, + "learning_rate": 6.72558058066608e-07, + "loss": 0.6553, + "step": 72336 + }, + { + "epoch": 1.85, + "learning_rate": 6.725319131742038e-07, + "loss": 0.7046, + "step": 72337 + }, + { + "epoch": 1.85, + "learning_rate": 6.725057685325273e-07, + "loss": 0.5062, + "step": 72338 + }, + { + "epoch": 1.85, + "learning_rate": 6.724796241415978e-07, + "loss": 0.6431, + "step": 72339 + }, + { + "epoch": 1.85, + "learning_rate": 6.724534800014358e-07, + "loss": 0.5957, + "step": 72340 + }, + { + "epoch": 1.85, + "learning_rate": 6.724273361120609e-07, + "loss": 0.5601, + "step": 72341 + }, + { + "epoch": 1.85, + "learning_rate": 6.724011924734936e-07, + "loss": 0.5449, + "step": 72342 + }, + { + "epoch": 1.85, + "learning_rate": 6.723750490857533e-07, + "loss": 0.5278, + "step": 72343 + }, + { + "epoch": 1.85, + "learning_rate": 6.723489059488607e-07, + "loss": 0.4077, + "step": 72344 + }, + { + "epoch": 1.85, + "learning_rate": 6.723227630628356e-07, + "loss": 0.3584, + "step": 72345 + }, + { + "epoch": 1.85, + "learning_rate": 6.722966204276977e-07, + "loss": 0.6973, + "step": 72346 + }, + { + "epoch": 1.85, + "learning_rate": 6.722704780434669e-07, + "loss": 0.5469, + "step": 72347 + }, + { + "epoch": 1.85, + "learning_rate": 6.722443359101639e-07, + "loss": 0.6729, + "step": 72348 + }, + { + "epoch": 1.85, + "learning_rate": 6.722181940278081e-07, + "loss": 0.7686, + "step": 72349 + }, + { + "epoch": 1.85, + "learning_rate": 6.7219205239642e-07, + "loss": 0.75, + "step": 72350 + }, + { + "epoch": 1.85, + "learning_rate": 6.721659110160191e-07, + "loss": 0.7803, + "step": 72351 + }, + { + "epoch": 1.85, + "learning_rate": 6.721397698866257e-07, + "loss": 0.6201, + "step": 72352 + }, + { + "epoch": 1.85, + "learning_rate": 6.721136290082599e-07, + "loss": 0.6152, + "step": 72353 + }, + { + "epoch": 1.85, + "learning_rate": 6.720874883809418e-07, + "loss": 0.4314, + "step": 72354 + }, + { + "epoch": 1.85, + "learning_rate": 6.720613480046914e-07, + "loss": 0.6147, + "step": 72355 + }, + { + "epoch": 1.85, + "learning_rate": 6.720352078795281e-07, + "loss": 0.6904, + "step": 72356 + }, + { + "epoch": 1.85, + "learning_rate": 6.720090680054725e-07, + "loss": 0.793, + "step": 72357 + }, + { + "epoch": 1.85, + "learning_rate": 6.719829283825444e-07, + "loss": 0.7021, + "step": 72358 + }, + { + "epoch": 1.85, + "learning_rate": 6.71956789010764e-07, + "loss": 0.6357, + "step": 72359 + }, + { + "epoch": 1.85, + "learning_rate": 6.71930649890151e-07, + "loss": 0.4707, + "step": 72360 + }, + { + "epoch": 1.85, + "learning_rate": 6.719045110207259e-07, + "loss": 0.7822, + "step": 72361 + }, + { + "epoch": 1.85, + "learning_rate": 6.718783724025081e-07, + "loss": 0.5244, + "step": 72362 + }, + { + "epoch": 1.85, + "learning_rate": 6.718522340355182e-07, + "loss": 0.5996, + "step": 72363 + }, + { + "epoch": 1.85, + "learning_rate": 6.718260959197759e-07, + "loss": 0.71, + "step": 72364 + }, + { + "epoch": 1.85, + "learning_rate": 6.717999580553017e-07, + "loss": 0.5701, + "step": 72365 + }, + { + "epoch": 1.85, + "learning_rate": 6.717738204421146e-07, + "loss": 0.5991, + "step": 72366 + }, + { + "epoch": 1.85, + "learning_rate": 6.717476830802354e-07, + "loss": 0.5459, + "step": 72367 + }, + { + "epoch": 1.85, + "learning_rate": 6.717215459696838e-07, + "loss": 0.6543, + "step": 72368 + }, + { + "epoch": 1.85, + "learning_rate": 6.7169540911048e-07, + "loss": 0.5728, + "step": 72369 + }, + { + "epoch": 1.85, + "learning_rate": 6.716692725026438e-07, + "loss": 0.4938, + "step": 72370 + }, + { + "epoch": 1.85, + "learning_rate": 6.716431361461955e-07, + "loss": 0.5396, + "step": 72371 + }, + { + "epoch": 1.85, + "learning_rate": 6.716170000411548e-07, + "loss": 0.4902, + "step": 72372 + }, + { + "epoch": 1.85, + "learning_rate": 6.715908641875419e-07, + "loss": 0.6523, + "step": 72373 + }, + { + "epoch": 1.85, + "learning_rate": 6.715647285853768e-07, + "loss": 0.6875, + "step": 72374 + }, + { + "epoch": 1.86, + "learning_rate": 6.715385932346798e-07, + "loss": 0.5908, + "step": 72375 + }, + { + "epoch": 1.86, + "learning_rate": 6.715124581354704e-07, + "loss": 0.6602, + "step": 72376 + }, + { + "epoch": 1.86, + "learning_rate": 6.714863232877685e-07, + "loss": 0.6196, + "step": 72377 + }, + { + "epoch": 1.86, + "learning_rate": 6.714601886915947e-07, + "loss": 0.5996, + "step": 72378 + }, + { + "epoch": 1.86, + "learning_rate": 6.714340543469685e-07, + "loss": 0.4058, + "step": 72379 + }, + { + "epoch": 1.86, + "learning_rate": 6.714079202539105e-07, + "loss": 0.5723, + "step": 72380 + }, + { + "epoch": 1.86, + "learning_rate": 6.713817864124401e-07, + "loss": 0.5405, + "step": 72381 + }, + { + "epoch": 1.86, + "learning_rate": 6.713556528225775e-07, + "loss": 0.6543, + "step": 72382 + }, + { + "epoch": 1.86, + "learning_rate": 6.713295194843428e-07, + "loss": 0.5952, + "step": 72383 + }, + { + "epoch": 1.86, + "learning_rate": 6.713033863977561e-07, + "loss": 0.6909, + "step": 72384 + }, + { + "epoch": 1.86, + "learning_rate": 6.712772535628375e-07, + "loss": 0.6787, + "step": 72385 + }, + { + "epoch": 1.86, + "learning_rate": 6.712511209796066e-07, + "loss": 0.6855, + "step": 72386 + }, + { + "epoch": 1.86, + "learning_rate": 6.712249886480834e-07, + "loss": 0.6436, + "step": 72387 + }, + { + "epoch": 1.86, + "learning_rate": 6.711988565682883e-07, + "loss": 0.6362, + "step": 72388 + }, + { + "epoch": 1.86, + "learning_rate": 6.711727247402409e-07, + "loss": 0.603, + "step": 72389 + }, + { + "epoch": 1.86, + "learning_rate": 6.711465931639616e-07, + "loss": 0.6704, + "step": 72390 + }, + { + "epoch": 1.86, + "learning_rate": 6.711204618394701e-07, + "loss": 0.5063, + "step": 72391 + }, + { + "epoch": 1.86, + "learning_rate": 6.710943307667866e-07, + "loss": 0.6797, + "step": 72392 + }, + { + "epoch": 1.86, + "learning_rate": 6.710681999459311e-07, + "loss": 0.5791, + "step": 72393 + }, + { + "epoch": 1.86, + "learning_rate": 6.710420693769237e-07, + "loss": 0.6597, + "step": 72394 + }, + { + "epoch": 1.86, + "learning_rate": 6.710159390597842e-07, + "loss": 0.5111, + "step": 72395 + }, + { + "epoch": 1.86, + "learning_rate": 6.709898089945325e-07, + "loss": 0.6338, + "step": 72396 + }, + { + "epoch": 1.86, + "learning_rate": 6.709636791811889e-07, + "loss": 0.6328, + "step": 72397 + }, + { + "epoch": 1.86, + "learning_rate": 6.709375496197731e-07, + "loss": 0.6675, + "step": 72398 + }, + { + "epoch": 1.86, + "learning_rate": 6.709114203103055e-07, + "loss": 0.7456, + "step": 72399 + }, + { + "epoch": 1.86, + "learning_rate": 6.708852912528057e-07, + "loss": 0.6592, + "step": 72400 + }, + { + "epoch": 1.86, + "learning_rate": 6.708591624472942e-07, + "loss": 0.5566, + "step": 72401 + }, + { + "epoch": 1.86, + "learning_rate": 6.708330338937904e-07, + "loss": 0.7295, + "step": 72402 + }, + { + "epoch": 1.86, + "learning_rate": 6.708069055923146e-07, + "loss": 0.6279, + "step": 72403 + }, + { + "epoch": 1.86, + "learning_rate": 6.707807775428873e-07, + "loss": 0.6777, + "step": 72404 + }, + { + "epoch": 1.86, + "learning_rate": 6.707546497455276e-07, + "loss": 0.6353, + "step": 72405 + }, + { + "epoch": 1.86, + "learning_rate": 6.707285222002559e-07, + "loss": 0.564, + "step": 72406 + }, + { + "epoch": 1.86, + "learning_rate": 6.707023949070924e-07, + "loss": 0.5684, + "step": 72407 + }, + { + "epoch": 1.86, + "learning_rate": 6.706762678660567e-07, + "loss": 0.7627, + "step": 72408 + }, + { + "epoch": 1.86, + "learning_rate": 6.706501410771693e-07, + "loss": 0.583, + "step": 72409 + }, + { + "epoch": 1.86, + "learning_rate": 6.706240145404498e-07, + "loss": 0.7568, + "step": 72410 + }, + { + "epoch": 1.86, + "learning_rate": 6.705978882559184e-07, + "loss": 0.5776, + "step": 72411 + }, + { + "epoch": 1.86, + "learning_rate": 6.705717622235949e-07, + "loss": 0.6479, + "step": 72412 + }, + { + "epoch": 1.86, + "learning_rate": 6.705456364434996e-07, + "loss": 0.5845, + "step": 72413 + }, + { + "epoch": 1.86, + "learning_rate": 6.705195109156527e-07, + "loss": 0.4561, + "step": 72414 + }, + { + "epoch": 1.86, + "learning_rate": 6.704933856400733e-07, + "loss": 0.5708, + "step": 72415 + }, + { + "epoch": 1.86, + "learning_rate": 6.704672606167823e-07, + "loss": 0.6973, + "step": 72416 + }, + { + "epoch": 1.86, + "learning_rate": 6.704411358457991e-07, + "loss": 0.4966, + "step": 72417 + }, + { + "epoch": 1.86, + "learning_rate": 6.70415011327144e-07, + "loss": 0.6426, + "step": 72418 + }, + { + "epoch": 1.86, + "learning_rate": 6.703888870608373e-07, + "loss": 0.6187, + "step": 72419 + }, + { + "epoch": 1.86, + "learning_rate": 6.703627630468983e-07, + "loss": 0.7188, + "step": 72420 + }, + { + "epoch": 1.86, + "learning_rate": 6.703366392853476e-07, + "loss": 0.5962, + "step": 72421 + }, + { + "epoch": 1.86, + "learning_rate": 6.703105157762048e-07, + "loss": 0.7676, + "step": 72422 + }, + { + "epoch": 1.86, + "learning_rate": 6.702843925194902e-07, + "loss": 0.7852, + "step": 72423 + }, + { + "epoch": 1.86, + "learning_rate": 6.702582695152239e-07, + "loss": 0.4451, + "step": 72424 + }, + { + "epoch": 1.86, + "learning_rate": 6.702321467634253e-07, + "loss": 0.7073, + "step": 72425 + }, + { + "epoch": 1.86, + "learning_rate": 6.70206024264115e-07, + "loss": 0.4739, + "step": 72426 + }, + { + "epoch": 1.86, + "learning_rate": 6.701799020173127e-07, + "loss": 0.6758, + "step": 72427 + }, + { + "epoch": 1.86, + "learning_rate": 6.701537800230385e-07, + "loss": 0.6089, + "step": 72428 + }, + { + "epoch": 1.86, + "learning_rate": 6.701276582813122e-07, + "loss": 0.7363, + "step": 72429 + }, + { + "epoch": 1.86, + "learning_rate": 6.701015367921543e-07, + "loss": 0.5386, + "step": 72430 + }, + { + "epoch": 1.86, + "learning_rate": 6.700754155555841e-07, + "loss": 0.6787, + "step": 72431 + }, + { + "epoch": 1.86, + "learning_rate": 6.700492945716223e-07, + "loss": 0.3884, + "step": 72432 + }, + { + "epoch": 1.86, + "learning_rate": 6.700231738402884e-07, + "loss": 0.6348, + "step": 72433 + }, + { + "epoch": 1.86, + "learning_rate": 6.699970533616031e-07, + "loss": 0.7393, + "step": 72434 + }, + { + "epoch": 1.86, + "learning_rate": 6.699709331355854e-07, + "loss": 0.71, + "step": 72435 + }, + { + "epoch": 1.86, + "learning_rate": 6.699448131622558e-07, + "loss": 0.6465, + "step": 72436 + }, + { + "epoch": 1.86, + "learning_rate": 6.699186934416343e-07, + "loss": 0.7158, + "step": 72437 + }, + { + "epoch": 1.86, + "learning_rate": 6.698925739737411e-07, + "loss": 0.5649, + "step": 72438 + }, + { + "epoch": 1.86, + "learning_rate": 6.698664547585956e-07, + "loss": 0.5659, + "step": 72439 + }, + { + "epoch": 1.86, + "learning_rate": 6.698403357962183e-07, + "loss": 0.5698, + "step": 72440 + }, + { + "epoch": 1.86, + "learning_rate": 6.698142170866291e-07, + "loss": 0.7227, + "step": 72441 + }, + { + "epoch": 1.86, + "learning_rate": 6.69788098629848e-07, + "loss": 0.7314, + "step": 72442 + }, + { + "epoch": 1.86, + "learning_rate": 6.697619804258949e-07, + "loss": 0.7188, + "step": 72443 + }, + { + "epoch": 1.86, + "learning_rate": 6.697358624747903e-07, + "loss": 0.5253, + "step": 72444 + }, + { + "epoch": 1.86, + "learning_rate": 6.697097447765534e-07, + "loss": 0.7075, + "step": 72445 + }, + { + "epoch": 1.86, + "learning_rate": 6.696836273312045e-07, + "loss": 0.6099, + "step": 72446 + }, + { + "epoch": 1.86, + "learning_rate": 6.696575101387638e-07, + "loss": 0.5579, + "step": 72447 + }, + { + "epoch": 1.86, + "learning_rate": 6.69631393199251e-07, + "loss": 0.7739, + "step": 72448 + }, + { + "epoch": 1.86, + "learning_rate": 6.696052765126864e-07, + "loss": 0.5381, + "step": 72449 + }, + { + "epoch": 1.86, + "learning_rate": 6.695791600790897e-07, + "loss": 0.6416, + "step": 72450 + }, + { + "epoch": 1.86, + "learning_rate": 6.695530438984811e-07, + "loss": 0.748, + "step": 72451 + }, + { + "epoch": 1.86, + "learning_rate": 6.695269279708803e-07, + "loss": 0.6309, + "step": 72452 + }, + { + "epoch": 1.86, + "learning_rate": 6.695008122963081e-07, + "loss": 0.4941, + "step": 72453 + }, + { + "epoch": 1.86, + "learning_rate": 6.694746968747839e-07, + "loss": 0.6055, + "step": 72454 + }, + { + "epoch": 1.86, + "learning_rate": 6.694485817063276e-07, + "loss": 0.6514, + "step": 72455 + }, + { + "epoch": 1.86, + "learning_rate": 6.694224667909589e-07, + "loss": 0.7666, + "step": 72456 + }, + { + "epoch": 1.86, + "learning_rate": 6.693963521286986e-07, + "loss": 0.422, + "step": 72457 + }, + { + "epoch": 1.86, + "learning_rate": 6.693702377195661e-07, + "loss": 0.4949, + "step": 72458 + }, + { + "epoch": 1.86, + "learning_rate": 6.693441235635817e-07, + "loss": 0.6865, + "step": 72459 + }, + { + "epoch": 1.86, + "learning_rate": 6.693180096607653e-07, + "loss": 0.6396, + "step": 72460 + }, + { + "epoch": 1.86, + "learning_rate": 6.692918960111369e-07, + "loss": 0.6328, + "step": 72461 + }, + { + "epoch": 1.86, + "learning_rate": 6.692657826147164e-07, + "loss": 0.5317, + "step": 72462 + }, + { + "epoch": 1.86, + "learning_rate": 6.692396694715241e-07, + "loss": 0.5537, + "step": 72463 + }, + { + "epoch": 1.86, + "learning_rate": 6.692135565815799e-07, + "loss": 0.6787, + "step": 72464 + }, + { + "epoch": 1.86, + "learning_rate": 6.691874439449033e-07, + "loss": 0.4907, + "step": 72465 + }, + { + "epoch": 1.86, + "learning_rate": 6.691613315615149e-07, + "loss": 0.6299, + "step": 72466 + }, + { + "epoch": 1.86, + "learning_rate": 6.691352194314342e-07, + "loss": 0.8018, + "step": 72467 + }, + { + "epoch": 1.86, + "learning_rate": 6.691091075546817e-07, + "loss": 0.8047, + "step": 72468 + }, + { + "epoch": 1.86, + "learning_rate": 6.69082995931277e-07, + "loss": 0.4463, + "step": 72469 + }, + { + "epoch": 1.86, + "learning_rate": 6.690568845612403e-07, + "loss": 0.4878, + "step": 72470 + }, + { + "epoch": 1.86, + "learning_rate": 6.690307734445913e-07, + "loss": 0.6914, + "step": 72471 + }, + { + "epoch": 1.86, + "learning_rate": 6.690046625813506e-07, + "loss": 0.4956, + "step": 72472 + }, + { + "epoch": 1.86, + "learning_rate": 6.689785519715375e-07, + "loss": 0.6323, + "step": 72473 + }, + { + "epoch": 1.86, + "learning_rate": 6.689524416151729e-07, + "loss": 0.6562, + "step": 72474 + }, + { + "epoch": 1.86, + "learning_rate": 6.689263315122755e-07, + "loss": 0.5186, + "step": 72475 + }, + { + "epoch": 1.86, + "learning_rate": 6.689002216628663e-07, + "loss": 0.5969, + "step": 72476 + }, + { + "epoch": 1.86, + "learning_rate": 6.688741120669648e-07, + "loss": 0.7329, + "step": 72477 + }, + { + "epoch": 1.86, + "learning_rate": 6.688480027245913e-07, + "loss": 0.7031, + "step": 72478 + }, + { + "epoch": 1.86, + "learning_rate": 6.688218936357654e-07, + "loss": 0.6084, + "step": 72479 + }, + { + "epoch": 1.86, + "learning_rate": 6.687957848005077e-07, + "loss": 0.7109, + "step": 72480 + }, + { + "epoch": 1.86, + "learning_rate": 6.687696762188375e-07, + "loss": 0.7363, + "step": 72481 + }, + { + "epoch": 1.86, + "learning_rate": 6.687435678907754e-07, + "loss": 0.5862, + "step": 72482 + }, + { + "epoch": 1.86, + "learning_rate": 6.68717459816341e-07, + "loss": 0.6797, + "step": 72483 + }, + { + "epoch": 1.86, + "learning_rate": 6.686913519955547e-07, + "loss": 0.7061, + "step": 72484 + }, + { + "epoch": 1.86, + "learning_rate": 6.68665244428436e-07, + "loss": 0.666, + "step": 72485 + }, + { + "epoch": 1.86, + "learning_rate": 6.686391371150049e-07, + "loss": 0.5879, + "step": 72486 + }, + { + "epoch": 1.86, + "learning_rate": 6.686130300552818e-07, + "loss": 0.5918, + "step": 72487 + }, + { + "epoch": 1.86, + "learning_rate": 6.685869232492862e-07, + "loss": 0.5889, + "step": 72488 + }, + { + "epoch": 1.86, + "learning_rate": 6.685608166970387e-07, + "loss": 0.6562, + "step": 72489 + }, + { + "epoch": 1.86, + "learning_rate": 6.685347103985586e-07, + "loss": 0.6816, + "step": 72490 + }, + { + "epoch": 1.86, + "learning_rate": 6.685086043538665e-07, + "loss": 0.6855, + "step": 72491 + }, + { + "epoch": 1.86, + "learning_rate": 6.684824985629821e-07, + "loss": 0.6787, + "step": 72492 + }, + { + "epoch": 1.86, + "learning_rate": 6.684563930259253e-07, + "loss": 0.5024, + "step": 72493 + }, + { + "epoch": 1.86, + "learning_rate": 6.684302877427164e-07, + "loss": 0.5303, + "step": 72494 + }, + { + "epoch": 1.86, + "learning_rate": 6.68404182713375e-07, + "loss": 0.5913, + "step": 72495 + }, + { + "epoch": 1.86, + "learning_rate": 6.683780779379212e-07, + "loss": 0.478, + "step": 72496 + }, + { + "epoch": 1.86, + "learning_rate": 6.683519734163751e-07, + "loss": 0.8115, + "step": 72497 + }, + { + "epoch": 1.86, + "learning_rate": 6.683258691487567e-07, + "loss": 0.8516, + "step": 72498 + }, + { + "epoch": 1.86, + "learning_rate": 6.68299765135086e-07, + "loss": 0.4941, + "step": 72499 + }, + { + "epoch": 1.86, + "learning_rate": 6.682736613753826e-07, + "loss": 0.7891, + "step": 72500 + }, + { + "epoch": 1.86, + "learning_rate": 6.682475578696671e-07, + "loss": 0.6958, + "step": 72501 + }, + { + "epoch": 1.86, + "learning_rate": 6.68221454617959e-07, + "loss": 0.5457, + "step": 72502 + }, + { + "epoch": 1.86, + "learning_rate": 6.681953516202787e-07, + "loss": 0.5081, + "step": 72503 + }, + { + "epoch": 1.86, + "learning_rate": 6.681692488766461e-07, + "loss": 0.6455, + "step": 72504 + }, + { + "epoch": 1.86, + "learning_rate": 6.681431463870809e-07, + "loss": 0.6489, + "step": 72505 + }, + { + "epoch": 1.86, + "learning_rate": 6.681170441516031e-07, + "loss": 0.5795, + "step": 72506 + }, + { + "epoch": 1.86, + "learning_rate": 6.680909421702327e-07, + "loss": 0.708, + "step": 72507 + }, + { + "epoch": 1.86, + "learning_rate": 6.6806484044299e-07, + "loss": 0.5077, + "step": 72508 + }, + { + "epoch": 1.86, + "learning_rate": 6.680387389698949e-07, + "loss": 0.3953, + "step": 72509 + }, + { + "epoch": 1.86, + "learning_rate": 6.680126377509669e-07, + "loss": 0.6665, + "step": 72510 + }, + { + "epoch": 1.86, + "learning_rate": 6.679865367862268e-07, + "loss": 0.7363, + "step": 72511 + }, + { + "epoch": 1.86, + "learning_rate": 6.679604360756939e-07, + "loss": 0.6523, + "step": 72512 + }, + { + "epoch": 1.86, + "learning_rate": 6.679343356193885e-07, + "loss": 0.7402, + "step": 72513 + }, + { + "epoch": 1.86, + "learning_rate": 6.679082354173307e-07, + "loss": 0.6006, + "step": 72514 + }, + { + "epoch": 1.86, + "learning_rate": 6.678821354695399e-07, + "loss": 0.7002, + "step": 72515 + }, + { + "epoch": 1.86, + "learning_rate": 6.678560357760367e-07, + "loss": 0.708, + "step": 72516 + }, + { + "epoch": 1.86, + "learning_rate": 6.678299363368407e-07, + "loss": 0.7109, + "step": 72517 + }, + { + "epoch": 1.86, + "learning_rate": 6.678038371519721e-07, + "loss": 0.5308, + "step": 72518 + }, + { + "epoch": 1.86, + "learning_rate": 6.677777382214508e-07, + "loss": 0.6621, + "step": 72519 + }, + { + "epoch": 1.86, + "learning_rate": 6.67751639545297e-07, + "loss": 0.6455, + "step": 72520 + }, + { + "epoch": 1.86, + "learning_rate": 6.677255411235303e-07, + "loss": 0.6104, + "step": 72521 + }, + { + "epoch": 1.86, + "learning_rate": 6.67699442956171e-07, + "loss": 0.7207, + "step": 72522 + }, + { + "epoch": 1.86, + "learning_rate": 6.676733450432388e-07, + "loss": 0.5693, + "step": 72523 + }, + { + "epoch": 1.86, + "learning_rate": 6.676472473847542e-07, + "loss": 0.5435, + "step": 72524 + }, + { + "epoch": 1.86, + "learning_rate": 6.676211499807367e-07, + "loss": 0.627, + "step": 72525 + }, + { + "epoch": 1.86, + "learning_rate": 6.67595052831206e-07, + "loss": 0.6165, + "step": 72526 + }, + { + "epoch": 1.86, + "learning_rate": 6.675689559361829e-07, + "loss": 0.7026, + "step": 72527 + }, + { + "epoch": 1.86, + "learning_rate": 6.675428592956869e-07, + "loss": 0.4971, + "step": 72528 + }, + { + "epoch": 1.86, + "learning_rate": 6.675167629097378e-07, + "loss": 0.6174, + "step": 72529 + }, + { + "epoch": 1.86, + "learning_rate": 6.67490666778356e-07, + "loss": 0.6904, + "step": 72530 + }, + { + "epoch": 1.86, + "learning_rate": 6.674645709015613e-07, + "loss": 0.6914, + "step": 72531 + }, + { + "epoch": 1.86, + "learning_rate": 6.674384752793737e-07, + "loss": 0.5244, + "step": 72532 + }, + { + "epoch": 1.86, + "learning_rate": 6.674123799118129e-07, + "loss": 0.5688, + "step": 72533 + }, + { + "epoch": 1.86, + "learning_rate": 6.673862847988998e-07, + "loss": 0.499, + "step": 72534 + }, + { + "epoch": 1.86, + "learning_rate": 6.673601899406533e-07, + "loss": 0.6362, + "step": 72535 + }, + { + "epoch": 1.86, + "learning_rate": 6.673340953370939e-07, + "loss": 0.5764, + "step": 72536 + }, + { + "epoch": 1.86, + "learning_rate": 6.673080009882414e-07, + "loss": 0.5898, + "step": 72537 + }, + { + "epoch": 1.86, + "learning_rate": 6.672819068941158e-07, + "loss": 0.7119, + "step": 72538 + }, + { + "epoch": 1.86, + "learning_rate": 6.672558130547372e-07, + "loss": 0.5725, + "step": 72539 + }, + { + "epoch": 1.86, + "learning_rate": 6.672297194701255e-07, + "loss": 0.5645, + "step": 72540 + }, + { + "epoch": 1.86, + "learning_rate": 6.672036261403009e-07, + "loss": 0.5492, + "step": 72541 + }, + { + "epoch": 1.86, + "learning_rate": 6.671775330652829e-07, + "loss": 0.5366, + "step": 72542 + }, + { + "epoch": 1.86, + "learning_rate": 6.671514402450919e-07, + "loss": 0.793, + "step": 72543 + }, + { + "epoch": 1.86, + "learning_rate": 6.67125347679748e-07, + "loss": 0.4509, + "step": 72544 + }, + { + "epoch": 1.86, + "learning_rate": 6.670992553692708e-07, + "loss": 0.6104, + "step": 72545 + }, + { + "epoch": 1.86, + "learning_rate": 6.670731633136801e-07, + "loss": 0.5771, + "step": 72546 + }, + { + "epoch": 1.86, + "learning_rate": 6.670470715129963e-07, + "loss": 0.626, + "step": 72547 + }, + { + "epoch": 1.86, + "learning_rate": 6.670209799672393e-07, + "loss": 0.6348, + "step": 72548 + }, + { + "epoch": 1.86, + "learning_rate": 6.66994888676429e-07, + "loss": 0.6279, + "step": 72549 + }, + { + "epoch": 1.86, + "learning_rate": 6.669687976405853e-07, + "loss": 0.4951, + "step": 72550 + }, + { + "epoch": 1.86, + "learning_rate": 6.669427068597284e-07, + "loss": 0.8623, + "step": 72551 + }, + { + "epoch": 1.86, + "learning_rate": 6.66916616333878e-07, + "loss": 0.6885, + "step": 72552 + }, + { + "epoch": 1.86, + "learning_rate": 6.668905260630544e-07, + "loss": 0.5444, + "step": 72553 + }, + { + "epoch": 1.86, + "learning_rate": 6.668644360472778e-07, + "loss": 0.6519, + "step": 72554 + }, + { + "epoch": 1.86, + "learning_rate": 6.668383462865671e-07, + "loss": 0.6846, + "step": 72555 + }, + { + "epoch": 1.86, + "learning_rate": 6.668122567809433e-07, + "loss": 0.7666, + "step": 72556 + }, + { + "epoch": 1.86, + "learning_rate": 6.667861675304258e-07, + "loss": 0.7012, + "step": 72557 + }, + { + "epoch": 1.86, + "learning_rate": 6.667600785350351e-07, + "loss": 0.4573, + "step": 72558 + }, + { + "epoch": 1.86, + "learning_rate": 6.667339897947906e-07, + "loss": 0.5539, + "step": 72559 + }, + { + "epoch": 1.86, + "learning_rate": 6.667079013097127e-07, + "loss": 0.5806, + "step": 72560 + }, + { + "epoch": 1.86, + "learning_rate": 6.666818130798211e-07, + "loss": 0.5981, + "step": 72561 + }, + { + "epoch": 1.86, + "learning_rate": 6.666557251051361e-07, + "loss": 0.7324, + "step": 72562 + }, + { + "epoch": 1.86, + "learning_rate": 6.666296373856772e-07, + "loss": 0.4966, + "step": 72563 + }, + { + "epoch": 1.86, + "learning_rate": 6.666035499214655e-07, + "loss": 0.5232, + "step": 72564 + }, + { + "epoch": 1.86, + "learning_rate": 6.665774627125193e-07, + "loss": 0.6934, + "step": 72565 + }, + { + "epoch": 1.86, + "learning_rate": 6.665513757588597e-07, + "loss": 0.623, + "step": 72566 + }, + { + "epoch": 1.86, + "learning_rate": 6.665252890605062e-07, + "loss": 0.5616, + "step": 72567 + }, + { + "epoch": 1.86, + "learning_rate": 6.664992026174791e-07, + "loss": 0.5869, + "step": 72568 + }, + { + "epoch": 1.86, + "learning_rate": 6.664731164297981e-07, + "loss": 0.4741, + "step": 72569 + }, + { + "epoch": 1.86, + "learning_rate": 6.664470304974834e-07, + "loss": 0.4473, + "step": 72570 + }, + { + "epoch": 1.86, + "learning_rate": 6.664209448205546e-07, + "loss": 0.5197, + "step": 72571 + }, + { + "epoch": 1.86, + "learning_rate": 6.663948593990324e-07, + "loss": 0.623, + "step": 72572 + }, + { + "epoch": 1.86, + "learning_rate": 6.663687742329361e-07, + "loss": 0.606, + "step": 72573 + }, + { + "epoch": 1.86, + "learning_rate": 6.663426893222861e-07, + "loss": 0.6084, + "step": 72574 + }, + { + "epoch": 1.86, + "learning_rate": 6.66316604667102e-07, + "loss": 0.6406, + "step": 72575 + }, + { + "epoch": 1.86, + "learning_rate": 6.662905202674037e-07, + "loss": 0.5752, + "step": 72576 + }, + { + "epoch": 1.86, + "learning_rate": 6.662644361232117e-07, + "loss": 0.5947, + "step": 72577 + }, + { + "epoch": 1.86, + "learning_rate": 6.662383522345454e-07, + "loss": 0.7363, + "step": 72578 + }, + { + "epoch": 1.86, + "learning_rate": 6.662122686014254e-07, + "loss": 0.6104, + "step": 72579 + }, + { + "epoch": 1.86, + "learning_rate": 6.66186185223871e-07, + "loss": 0.6323, + "step": 72580 + }, + { + "epoch": 1.86, + "learning_rate": 6.661601021019027e-07, + "loss": 0.7075, + "step": 72581 + }, + { + "epoch": 1.86, + "learning_rate": 6.661340192355403e-07, + "loss": 0.5674, + "step": 72582 + }, + { + "epoch": 1.86, + "learning_rate": 6.661079366248034e-07, + "loss": 0.7529, + "step": 72583 + }, + { + "epoch": 1.86, + "learning_rate": 6.660818542697129e-07, + "loss": 0.6377, + "step": 72584 + }, + { + "epoch": 1.86, + "learning_rate": 6.660557721702878e-07, + "loss": 0.6372, + "step": 72585 + }, + { + "epoch": 1.86, + "learning_rate": 6.660296903265483e-07, + "loss": 0.623, + "step": 72586 + }, + { + "epoch": 1.86, + "learning_rate": 6.660036087385146e-07, + "loss": 0.7812, + "step": 72587 + }, + { + "epoch": 1.86, + "learning_rate": 6.659775274062065e-07, + "loss": 0.5723, + "step": 72588 + }, + { + "epoch": 1.86, + "learning_rate": 6.659514463296443e-07, + "loss": 0.5391, + "step": 72589 + }, + { + "epoch": 1.86, + "learning_rate": 6.659253655088475e-07, + "loss": 0.4863, + "step": 72590 + }, + { + "epoch": 1.86, + "learning_rate": 6.658992849438363e-07, + "loss": 0.668, + "step": 72591 + }, + { + "epoch": 1.86, + "learning_rate": 6.658732046346307e-07, + "loss": 0.8318, + "step": 72592 + }, + { + "epoch": 1.86, + "learning_rate": 6.658471245812507e-07, + "loss": 0.7617, + "step": 72593 + }, + { + "epoch": 1.86, + "learning_rate": 6.658210447837163e-07, + "loss": 0.6313, + "step": 72594 + }, + { + "epoch": 1.86, + "learning_rate": 6.657949652420472e-07, + "loss": 0.6611, + "step": 72595 + }, + { + "epoch": 1.86, + "learning_rate": 6.657688859562636e-07, + "loss": 0.5864, + "step": 72596 + }, + { + "epoch": 1.86, + "learning_rate": 6.657428069263851e-07, + "loss": 0.6074, + "step": 72597 + }, + { + "epoch": 1.86, + "learning_rate": 6.657167281524323e-07, + "loss": 0.6885, + "step": 72598 + }, + { + "epoch": 1.86, + "learning_rate": 6.656906496344246e-07, + "loss": 0.6772, + "step": 72599 + }, + { + "epoch": 1.86, + "learning_rate": 6.656645713723823e-07, + "loss": 0.7227, + "step": 72600 + }, + { + "epoch": 1.86, + "learning_rate": 6.656384933663255e-07, + "loss": 0.7222, + "step": 72601 + }, + { + "epoch": 1.86, + "learning_rate": 6.656124156162735e-07, + "loss": 0.667, + "step": 72602 + }, + { + "epoch": 1.86, + "learning_rate": 6.65586338122247e-07, + "loss": 0.6816, + "step": 72603 + }, + { + "epoch": 1.86, + "learning_rate": 6.655602608842658e-07, + "loss": 0.7705, + "step": 72604 + }, + { + "epoch": 1.86, + "learning_rate": 6.655341839023494e-07, + "loss": 0.6299, + "step": 72605 + }, + { + "epoch": 1.86, + "learning_rate": 6.655081071765183e-07, + "loss": 0.667, + "step": 72606 + }, + { + "epoch": 1.86, + "learning_rate": 6.65482030706792e-07, + "loss": 0.6523, + "step": 72607 + }, + { + "epoch": 1.86, + "learning_rate": 6.654559544931909e-07, + "loss": 0.6479, + "step": 72608 + }, + { + "epoch": 1.86, + "learning_rate": 6.654298785357347e-07, + "loss": 0.7168, + "step": 72609 + }, + { + "epoch": 1.86, + "learning_rate": 6.654038028344435e-07, + "loss": 0.6367, + "step": 72610 + }, + { + "epoch": 1.86, + "learning_rate": 6.653777273893373e-07, + "loss": 0.5669, + "step": 72611 + }, + { + "epoch": 1.86, + "learning_rate": 6.653516522004359e-07, + "loss": 0.5569, + "step": 72612 + }, + { + "epoch": 1.86, + "learning_rate": 6.653255772677593e-07, + "loss": 0.5625, + "step": 72613 + }, + { + "epoch": 1.86, + "learning_rate": 6.65299502591328e-07, + "loss": 0.6973, + "step": 72614 + }, + { + "epoch": 1.86, + "learning_rate": 6.652734281711612e-07, + "loss": 0.5093, + "step": 72615 + }, + { + "epoch": 1.86, + "learning_rate": 6.652473540072787e-07, + "loss": 0.7051, + "step": 72616 + }, + { + "epoch": 1.86, + "learning_rate": 6.652212800997015e-07, + "loss": 0.5913, + "step": 72617 + }, + { + "epoch": 1.86, + "learning_rate": 6.651952064484488e-07, + "loss": 0.5488, + "step": 72618 + }, + { + "epoch": 1.86, + "learning_rate": 6.651691330535405e-07, + "loss": 0.7241, + "step": 72619 + }, + { + "epoch": 1.86, + "learning_rate": 6.65143059914997e-07, + "loss": 0.4707, + "step": 72620 + }, + { + "epoch": 1.86, + "learning_rate": 6.651169870328379e-07, + "loss": 0.5001, + "step": 72621 + }, + { + "epoch": 1.86, + "learning_rate": 6.650909144070836e-07, + "loss": 0.5977, + "step": 72622 + }, + { + "epoch": 1.86, + "learning_rate": 6.650648420377534e-07, + "loss": 0.6553, + "step": 72623 + }, + { + "epoch": 1.86, + "learning_rate": 6.650387699248681e-07, + "loss": 0.6367, + "step": 72624 + }, + { + "epoch": 1.86, + "learning_rate": 6.650126980684471e-07, + "loss": 0.3621, + "step": 72625 + }, + { + "epoch": 1.86, + "learning_rate": 6.649866264685102e-07, + "loss": 0.6436, + "step": 72626 + }, + { + "epoch": 1.86, + "learning_rate": 6.649605551250779e-07, + "loss": 0.5352, + "step": 72627 + }, + { + "epoch": 1.86, + "learning_rate": 6.649344840381697e-07, + "loss": 0.4587, + "step": 72628 + }, + { + "epoch": 1.86, + "learning_rate": 6.64908413207806e-07, + "loss": 0.7383, + "step": 72629 + }, + { + "epoch": 1.86, + "learning_rate": 6.648823426340063e-07, + "loss": 0.6553, + "step": 72630 + }, + { + "epoch": 1.86, + "learning_rate": 6.648562723167907e-07, + "loss": 0.7207, + "step": 72631 + }, + { + "epoch": 1.86, + "learning_rate": 6.648302022561793e-07, + "loss": 0.6816, + "step": 72632 + }, + { + "epoch": 1.86, + "learning_rate": 6.648041324521923e-07, + "loss": 0.4636, + "step": 72633 + }, + { + "epoch": 1.86, + "learning_rate": 6.647780629048494e-07, + "loss": 0.6035, + "step": 72634 + }, + { + "epoch": 1.86, + "learning_rate": 6.647519936141704e-07, + "loss": 0.73, + "step": 72635 + }, + { + "epoch": 1.86, + "learning_rate": 6.647259245801751e-07, + "loss": 0.6123, + "step": 72636 + }, + { + "epoch": 1.86, + "learning_rate": 6.64699855802884e-07, + "loss": 0.7598, + "step": 72637 + }, + { + "epoch": 1.86, + "learning_rate": 6.646737872823166e-07, + "loss": 0.6348, + "step": 72638 + }, + { + "epoch": 1.86, + "learning_rate": 6.646477190184932e-07, + "loss": 0.5322, + "step": 72639 + }, + { + "epoch": 1.86, + "learning_rate": 6.646216510114335e-07, + "loss": 0.6738, + "step": 72640 + }, + { + "epoch": 1.86, + "learning_rate": 6.645955832611579e-07, + "loss": 0.5957, + "step": 72641 + }, + { + "epoch": 1.86, + "learning_rate": 6.645695157676856e-07, + "loss": 0.7646, + "step": 72642 + }, + { + "epoch": 1.86, + "learning_rate": 6.645434485310373e-07, + "loss": 0.6631, + "step": 72643 + }, + { + "epoch": 1.86, + "learning_rate": 6.645173815512328e-07, + "loss": 0.7188, + "step": 72644 + }, + { + "epoch": 1.86, + "learning_rate": 6.644913148282916e-07, + "loss": 0.5757, + "step": 72645 + }, + { + "epoch": 1.86, + "learning_rate": 6.644652483622342e-07, + "loss": 0.2648, + "step": 72646 + }, + { + "epoch": 1.86, + "learning_rate": 6.6443918215308e-07, + "loss": 0.49, + "step": 72647 + }, + { + "epoch": 1.86, + "learning_rate": 6.644131162008496e-07, + "loss": 0.6021, + "step": 72648 + }, + { + "epoch": 1.86, + "learning_rate": 6.643870505055624e-07, + "loss": 0.8311, + "step": 72649 + }, + { + "epoch": 1.86, + "learning_rate": 6.643609850672388e-07, + "loss": 0.6562, + "step": 72650 + }, + { + "epoch": 1.86, + "learning_rate": 6.643349198858983e-07, + "loss": 0.6479, + "step": 72651 + }, + { + "epoch": 1.86, + "learning_rate": 6.643088549615614e-07, + "loss": 0.6621, + "step": 72652 + }, + { + "epoch": 1.86, + "learning_rate": 6.642827902942476e-07, + "loss": 0.6587, + "step": 72653 + }, + { + "epoch": 1.86, + "learning_rate": 6.642567258839776e-07, + "loss": 0.6494, + "step": 72654 + }, + { + "epoch": 1.86, + "learning_rate": 6.642306617307702e-07, + "loss": 0.5764, + "step": 72655 + }, + { + "epoch": 1.86, + "learning_rate": 6.642045978346461e-07, + "loss": 0.7375, + "step": 72656 + }, + { + "epoch": 1.86, + "learning_rate": 6.64178534195625e-07, + "loss": 0.6953, + "step": 72657 + }, + { + "epoch": 1.86, + "learning_rate": 6.641524708137271e-07, + "loss": 0.5991, + "step": 72658 + }, + { + "epoch": 1.86, + "learning_rate": 6.641264076889718e-07, + "loss": 0.6328, + "step": 72659 + }, + { + "epoch": 1.86, + "learning_rate": 6.6410034482138e-07, + "loss": 0.6348, + "step": 72660 + }, + { + "epoch": 1.86, + "learning_rate": 6.640742822109707e-07, + "loss": 0.5576, + "step": 72661 + }, + { + "epoch": 1.86, + "learning_rate": 6.640482198577646e-07, + "loss": 0.2839, + "step": 72662 + }, + { + "epoch": 1.86, + "learning_rate": 6.64022157761781e-07, + "loss": 0.5571, + "step": 72663 + }, + { + "epoch": 1.86, + "learning_rate": 6.639960959230407e-07, + "loss": 0.6758, + "step": 72664 + }, + { + "epoch": 1.86, + "learning_rate": 6.639700343415629e-07, + "loss": 0.5918, + "step": 72665 + }, + { + "epoch": 1.86, + "learning_rate": 6.639439730173677e-07, + "loss": 0.7705, + "step": 72666 + }, + { + "epoch": 1.86, + "learning_rate": 6.639179119504752e-07, + "loss": 0.7188, + "step": 72667 + }, + { + "epoch": 1.86, + "learning_rate": 6.638918511409051e-07, + "loss": 0.6465, + "step": 72668 + }, + { + "epoch": 1.86, + "learning_rate": 6.638657905886778e-07, + "loss": 0.583, + "step": 72669 + }, + { + "epoch": 1.86, + "learning_rate": 6.638397302938128e-07, + "loss": 0.7061, + "step": 72670 + }, + { + "epoch": 1.86, + "learning_rate": 6.638136702563306e-07, + "loss": 0.7637, + "step": 72671 + }, + { + "epoch": 1.86, + "learning_rate": 6.637876104762507e-07, + "loss": 0.5796, + "step": 72672 + }, + { + "epoch": 1.86, + "learning_rate": 6.637615509535928e-07, + "loss": 0.6377, + "step": 72673 + }, + { + "epoch": 1.86, + "learning_rate": 6.637354916883778e-07, + "loss": 0.583, + "step": 72674 + }, + { + "epoch": 1.86, + "learning_rate": 6.63709432680625e-07, + "loss": 0.3926, + "step": 72675 + }, + { + "epoch": 1.86, + "learning_rate": 6.63683373930354e-07, + "loss": 0.5391, + "step": 72676 + }, + { + "epoch": 1.86, + "learning_rate": 6.636573154375854e-07, + "loss": 0.6299, + "step": 72677 + }, + { + "epoch": 1.86, + "learning_rate": 6.636312572023388e-07, + "loss": 0.4751, + "step": 72678 + }, + { + "epoch": 1.86, + "learning_rate": 6.636051992246345e-07, + "loss": 0.7344, + "step": 72679 + }, + { + "epoch": 1.86, + "learning_rate": 6.63579141504492e-07, + "loss": 0.5386, + "step": 72680 + }, + { + "epoch": 1.86, + "learning_rate": 6.635530840419317e-07, + "loss": 0.6992, + "step": 72681 + }, + { + "epoch": 1.86, + "learning_rate": 6.63527026836973e-07, + "loss": 0.5151, + "step": 72682 + }, + { + "epoch": 1.86, + "learning_rate": 6.635009698896366e-07, + "loss": 0.6387, + "step": 72683 + }, + { + "epoch": 1.86, + "learning_rate": 6.63474913199942e-07, + "loss": 0.5312, + "step": 72684 + }, + { + "epoch": 1.86, + "learning_rate": 6.634488567679088e-07, + "loss": 0.6289, + "step": 72685 + }, + { + "epoch": 1.86, + "learning_rate": 6.634228005935578e-07, + "loss": 0.5479, + "step": 72686 + }, + { + "epoch": 1.86, + "learning_rate": 6.633967446769081e-07, + "loss": 0.7637, + "step": 72687 + }, + { + "epoch": 1.86, + "learning_rate": 6.633706890179802e-07, + "loss": 0.5801, + "step": 72688 + }, + { + "epoch": 1.86, + "learning_rate": 6.633446336167938e-07, + "loss": 0.7793, + "step": 72689 + }, + { + "epoch": 1.86, + "learning_rate": 6.63318578473369e-07, + "loss": 0.502, + "step": 72690 + }, + { + "epoch": 1.86, + "learning_rate": 6.632925235877258e-07, + "loss": 0.5989, + "step": 72691 + }, + { + "epoch": 1.86, + "learning_rate": 6.632664689598839e-07, + "loss": 0.5151, + "step": 72692 + }, + { + "epoch": 1.86, + "learning_rate": 6.632404145898634e-07, + "loss": 0.5405, + "step": 72693 + }, + { + "epoch": 1.86, + "learning_rate": 6.632143604776845e-07, + "loss": 0.7969, + "step": 72694 + }, + { + "epoch": 1.86, + "learning_rate": 6.631883066233666e-07, + "loss": 0.5181, + "step": 72695 + }, + { + "epoch": 1.86, + "learning_rate": 6.6316225302693e-07, + "loss": 0.5952, + "step": 72696 + }, + { + "epoch": 1.86, + "learning_rate": 6.631361996883944e-07, + "loss": 0.668, + "step": 72697 + }, + { + "epoch": 1.86, + "learning_rate": 6.631101466077799e-07, + "loss": 0.5503, + "step": 72698 + }, + { + "epoch": 1.86, + "learning_rate": 6.630840937851065e-07, + "loss": 0.6738, + "step": 72699 + }, + { + "epoch": 1.86, + "learning_rate": 6.630580412203945e-07, + "loss": 0.6299, + "step": 72700 + }, + { + "epoch": 1.86, + "learning_rate": 6.630319889136629e-07, + "loss": 0.5896, + "step": 72701 + }, + { + "epoch": 1.86, + "learning_rate": 6.630059368649326e-07, + "loss": 0.6553, + "step": 72702 + }, + { + "epoch": 1.86, + "learning_rate": 6.629798850742234e-07, + "loss": 0.4983, + "step": 72703 + }, + { + "epoch": 1.86, + "learning_rate": 6.629538335415545e-07, + "loss": 0.6934, + "step": 72704 + }, + { + "epoch": 1.86, + "learning_rate": 6.629277822669466e-07, + "loss": 0.6016, + "step": 72705 + }, + { + "epoch": 1.86, + "learning_rate": 6.629017312504192e-07, + "loss": 0.6914, + "step": 72706 + }, + { + "epoch": 1.86, + "learning_rate": 6.628756804919926e-07, + "loss": 0.5796, + "step": 72707 + }, + { + "epoch": 1.86, + "learning_rate": 6.628496299916867e-07, + "loss": 0.6221, + "step": 72708 + }, + { + "epoch": 1.86, + "learning_rate": 6.628235797495209e-07, + "loss": 0.5127, + "step": 72709 + }, + { + "epoch": 1.86, + "learning_rate": 6.62797529765516e-07, + "loss": 0.7009, + "step": 72710 + }, + { + "epoch": 1.86, + "learning_rate": 6.627714800396913e-07, + "loss": 0.7715, + "step": 72711 + }, + { + "epoch": 1.86, + "learning_rate": 6.627454305720672e-07, + "loss": 0.5884, + "step": 72712 + }, + { + "epoch": 1.86, + "learning_rate": 6.627193813626634e-07, + "loss": 0.6738, + "step": 72713 + }, + { + "epoch": 1.86, + "learning_rate": 6.626933324114998e-07, + "loss": 0.3793, + "step": 72714 + }, + { + "epoch": 1.86, + "learning_rate": 6.626672837185964e-07, + "loss": 0.7051, + "step": 72715 + }, + { + "epoch": 1.86, + "learning_rate": 6.62641235283973e-07, + "loss": 0.53, + "step": 72716 + }, + { + "epoch": 1.86, + "learning_rate": 6.626151871076498e-07, + "loss": 0.6099, + "step": 72717 + }, + { + "epoch": 1.86, + "learning_rate": 6.625891391896466e-07, + "loss": 0.5244, + "step": 72718 + }, + { + "epoch": 1.86, + "learning_rate": 6.625630915299834e-07, + "loss": 0.5703, + "step": 72719 + }, + { + "epoch": 1.86, + "learning_rate": 6.625370441286799e-07, + "loss": 0.6113, + "step": 72720 + }, + { + "epoch": 1.86, + "learning_rate": 6.625109969857567e-07, + "loss": 0.7314, + "step": 72721 + }, + { + "epoch": 1.86, + "learning_rate": 6.62484950101233e-07, + "loss": 0.6914, + "step": 72722 + }, + { + "epoch": 1.86, + "learning_rate": 6.624589034751294e-07, + "loss": 0.6479, + "step": 72723 + }, + { + "epoch": 1.86, + "learning_rate": 6.624328571074654e-07, + "loss": 0.5288, + "step": 72724 + }, + { + "epoch": 1.86, + "learning_rate": 6.62406810998261e-07, + "loss": 0.7266, + "step": 72725 + }, + { + "epoch": 1.86, + "learning_rate": 6.62380765147536e-07, + "loss": 0.6777, + "step": 72726 + }, + { + "epoch": 1.86, + "learning_rate": 6.623547195553105e-07, + "loss": 0.7334, + "step": 72727 + }, + { + "epoch": 1.86, + "learning_rate": 6.623286742216045e-07, + "loss": 0.6436, + "step": 72728 + }, + { + "epoch": 1.86, + "learning_rate": 6.623026291464381e-07, + "loss": 0.6138, + "step": 72729 + }, + { + "epoch": 1.86, + "learning_rate": 6.622765843298308e-07, + "loss": 0.5007, + "step": 72730 + }, + { + "epoch": 1.86, + "learning_rate": 6.62250539771803e-07, + "loss": 0.5212, + "step": 72731 + }, + { + "epoch": 1.86, + "learning_rate": 6.622244954723743e-07, + "loss": 0.5923, + "step": 72732 + }, + { + "epoch": 1.86, + "learning_rate": 6.621984514315651e-07, + "loss": 0.6094, + "step": 72733 + }, + { + "epoch": 1.86, + "learning_rate": 6.621724076493947e-07, + "loss": 0.7383, + "step": 72734 + }, + { + "epoch": 1.86, + "learning_rate": 6.621463641258833e-07, + "loss": 0.52, + "step": 72735 + }, + { + "epoch": 1.86, + "learning_rate": 6.62120320861051e-07, + "loss": 0.7446, + "step": 72736 + }, + { + "epoch": 1.86, + "learning_rate": 6.620942778549176e-07, + "loss": 0.6765, + "step": 72737 + }, + { + "epoch": 1.86, + "learning_rate": 6.62068235107503e-07, + "loss": 0.6147, + "step": 72738 + }, + { + "epoch": 1.86, + "learning_rate": 6.620421926188274e-07, + "loss": 0.6689, + "step": 72739 + }, + { + "epoch": 1.86, + "learning_rate": 6.620161503889105e-07, + "loss": 0.6562, + "step": 72740 + }, + { + "epoch": 1.86, + "learning_rate": 6.619901084177721e-07, + "loss": 0.666, + "step": 72741 + }, + { + "epoch": 1.86, + "learning_rate": 6.619640667054326e-07, + "loss": 0.8018, + "step": 72742 + }, + { + "epoch": 1.86, + "learning_rate": 6.619380252519118e-07, + "loss": 0.5845, + "step": 72743 + }, + { + "epoch": 1.86, + "learning_rate": 6.619119840572294e-07, + "loss": 0.5898, + "step": 72744 + }, + { + "epoch": 1.86, + "learning_rate": 6.618859431214052e-07, + "loss": 0.4019, + "step": 72745 + }, + { + "epoch": 1.86, + "learning_rate": 6.618599024444596e-07, + "loss": 0.6738, + "step": 72746 + }, + { + "epoch": 1.86, + "learning_rate": 6.618338620264122e-07, + "loss": 0.5337, + "step": 72747 + }, + { + "epoch": 1.86, + "learning_rate": 6.61807821867283e-07, + "loss": 0.6138, + "step": 72748 + }, + { + "epoch": 1.86, + "learning_rate": 6.61781781967092e-07, + "loss": 0.6211, + "step": 72749 + }, + { + "epoch": 1.86, + "learning_rate": 6.617557423258593e-07, + "loss": 0.6919, + "step": 72750 + }, + { + "epoch": 1.86, + "learning_rate": 6.617297029436045e-07, + "loss": 0.6118, + "step": 72751 + }, + { + "epoch": 1.86, + "learning_rate": 6.617036638203479e-07, + "loss": 0.6494, + "step": 72752 + }, + { + "epoch": 1.86, + "learning_rate": 6.616776249561094e-07, + "loss": 0.6504, + "step": 72753 + }, + { + "epoch": 1.86, + "learning_rate": 6.616515863509085e-07, + "loss": 0.6572, + "step": 72754 + }, + { + "epoch": 1.86, + "learning_rate": 6.616255480047655e-07, + "loss": 0.7231, + "step": 72755 + }, + { + "epoch": 1.86, + "learning_rate": 6.615995099177001e-07, + "loss": 0.7354, + "step": 72756 + }, + { + "epoch": 1.86, + "learning_rate": 6.615734720897326e-07, + "loss": 0.5935, + "step": 72757 + }, + { + "epoch": 1.86, + "learning_rate": 6.615474345208824e-07, + "loss": 0.6182, + "step": 72758 + }, + { + "epoch": 1.86, + "learning_rate": 6.615213972111701e-07, + "loss": 0.6343, + "step": 72759 + }, + { + "epoch": 1.86, + "learning_rate": 6.614953601606153e-07, + "loss": 0.5747, + "step": 72760 + }, + { + "epoch": 1.86, + "learning_rate": 6.614693233692379e-07, + "loss": 0.6011, + "step": 72761 + }, + { + "epoch": 1.86, + "learning_rate": 6.614432868370577e-07, + "loss": 0.8232, + "step": 72762 + }, + { + "epoch": 1.86, + "learning_rate": 6.614172505640954e-07, + "loss": 0.5654, + "step": 72763 + }, + { + "epoch": 1.86, + "learning_rate": 6.613912145503697e-07, + "loss": 0.4834, + "step": 72764 + }, + { + "epoch": 1.87, + "learning_rate": 6.613651787959016e-07, + "loss": 0.5537, + "step": 72765 + }, + { + "epoch": 1.87, + "learning_rate": 6.613391433007103e-07, + "loss": 0.5396, + "step": 72766 + }, + { + "epoch": 1.87, + "learning_rate": 6.613131080648161e-07, + "loss": 0.6924, + "step": 72767 + }, + { + "epoch": 1.87, + "learning_rate": 6.612870730882387e-07, + "loss": 0.6265, + "step": 72768 + }, + { + "epoch": 1.87, + "learning_rate": 6.612610383709987e-07, + "loss": 0.5967, + "step": 72769 + }, + { + "epoch": 1.87, + "learning_rate": 6.61235003913115e-07, + "loss": 0.5635, + "step": 72770 + }, + { + "epoch": 1.87, + "learning_rate": 6.612089697146084e-07, + "loss": 0.6448, + "step": 72771 + }, + { + "epoch": 1.87, + "learning_rate": 6.611829357754983e-07, + "loss": 0.8379, + "step": 72772 + }, + { + "epoch": 1.87, + "learning_rate": 6.611569020958054e-07, + "loss": 0.5952, + "step": 72773 + }, + { + "epoch": 1.87, + "learning_rate": 6.611308686755488e-07, + "loss": 0.7109, + "step": 72774 + }, + { + "epoch": 1.87, + "learning_rate": 6.611048355147484e-07, + "loss": 0.7061, + "step": 72775 + }, + { + "epoch": 1.87, + "learning_rate": 6.610788026134247e-07, + "loss": 0.5256, + "step": 72776 + }, + { + "epoch": 1.87, + "learning_rate": 6.610527699715973e-07, + "loss": 0.4905, + "step": 72777 + }, + { + "epoch": 1.87, + "learning_rate": 6.610267375892862e-07, + "loss": 0.6729, + "step": 72778 + }, + { + "epoch": 1.87, + "learning_rate": 6.610007054665112e-07, + "loss": 0.5112, + "step": 72779 + }, + { + "epoch": 1.87, + "learning_rate": 6.609746736032927e-07, + "loss": 0.5962, + "step": 72780 + }, + { + "epoch": 1.87, + "learning_rate": 6.609486419996501e-07, + "loss": 0.5493, + "step": 72781 + }, + { + "epoch": 1.87, + "learning_rate": 6.609226106556037e-07, + "loss": 0.6641, + "step": 72782 + }, + { + "epoch": 1.87, + "learning_rate": 6.608965795711733e-07, + "loss": 0.5388, + "step": 72783 + }, + { + "epoch": 1.87, + "learning_rate": 6.608705487463788e-07, + "loss": 0.8301, + "step": 72784 + }, + { + "epoch": 1.87, + "learning_rate": 6.608445181812399e-07, + "loss": 0.7266, + "step": 72785 + }, + { + "epoch": 1.87, + "learning_rate": 6.608184878757767e-07, + "loss": 0.5632, + "step": 72786 + }, + { + "epoch": 1.87, + "learning_rate": 6.607924578300092e-07, + "loss": 0.7432, + "step": 72787 + }, + { + "epoch": 1.87, + "learning_rate": 6.607664280439576e-07, + "loss": 0.6426, + "step": 72788 + }, + { + "epoch": 1.87, + "learning_rate": 6.607403985176412e-07, + "loss": 0.6196, + "step": 72789 + }, + { + "epoch": 1.87, + "learning_rate": 6.607143692510806e-07, + "loss": 0.5183, + "step": 72790 + }, + { + "epoch": 1.87, + "learning_rate": 6.606883402442951e-07, + "loss": 0.7227, + "step": 72791 + }, + { + "epoch": 1.87, + "learning_rate": 6.606623114973052e-07, + "loss": 0.5376, + "step": 72792 + }, + { + "epoch": 1.87, + "learning_rate": 6.606362830101307e-07, + "loss": 0.6777, + "step": 72793 + }, + { + "epoch": 1.87, + "learning_rate": 6.606102547827911e-07, + "loss": 0.6411, + "step": 72794 + }, + { + "epoch": 1.87, + "learning_rate": 6.605842268153068e-07, + "loss": 0.5161, + "step": 72795 + }, + { + "epoch": 1.87, + "learning_rate": 6.605581991076972e-07, + "loss": 0.6943, + "step": 72796 + }, + { + "epoch": 1.87, + "learning_rate": 6.60532171659983e-07, + "loss": 0.5386, + "step": 72797 + }, + { + "epoch": 1.87, + "learning_rate": 6.605061444721835e-07, + "loss": 0.3782, + "step": 72798 + }, + { + "epoch": 1.87, + "learning_rate": 6.604801175443188e-07, + "loss": 0.5801, + "step": 72799 + }, + { + "epoch": 1.87, + "learning_rate": 6.604540908764089e-07, + "loss": 0.7295, + "step": 72800 + }, + { + "epoch": 1.87, + "learning_rate": 6.604280644684736e-07, + "loss": 0.6445, + "step": 72801 + }, + { + "epoch": 1.87, + "learning_rate": 6.604020383205331e-07, + "loss": 0.7437, + "step": 72802 + }, + { + "epoch": 1.87, + "learning_rate": 6.603760124326074e-07, + "loss": 0.6641, + "step": 72803 + }, + { + "epoch": 1.87, + "learning_rate": 6.603499868047157e-07, + "loss": 0.71, + "step": 72804 + }, + { + "epoch": 1.87, + "learning_rate": 6.603239614368787e-07, + "loss": 0.615, + "step": 72805 + }, + { + "epoch": 1.87, + "learning_rate": 6.602979363291157e-07, + "loss": 0.623, + "step": 72806 + }, + { + "epoch": 1.87, + "learning_rate": 6.602719114814472e-07, + "loss": 0.535, + "step": 72807 + }, + { + "epoch": 1.87, + "learning_rate": 6.602458868938927e-07, + "loss": 0.7168, + "step": 72808 + }, + { + "epoch": 1.87, + "learning_rate": 6.602198625664723e-07, + "loss": 0.6885, + "step": 72809 + }, + { + "epoch": 1.87, + "learning_rate": 6.601938384992061e-07, + "loss": 0.6353, + "step": 72810 + }, + { + "epoch": 1.87, + "learning_rate": 6.601678146921137e-07, + "loss": 0.4685, + "step": 72811 + }, + { + "epoch": 1.87, + "learning_rate": 6.601417911452151e-07, + "loss": 0.5566, + "step": 72812 + }, + { + "epoch": 1.87, + "learning_rate": 6.601157678585307e-07, + "loss": 0.7188, + "step": 72813 + }, + { + "epoch": 1.87, + "learning_rate": 6.6008974483208e-07, + "loss": 0.6572, + "step": 72814 + }, + { + "epoch": 1.87, + "learning_rate": 6.600637220658828e-07, + "loss": 0.7656, + "step": 72815 + }, + { + "epoch": 1.87, + "learning_rate": 6.600376995599591e-07, + "loss": 0.5088, + "step": 72816 + }, + { + "epoch": 1.87, + "learning_rate": 6.600116773143288e-07, + "loss": 0.7451, + "step": 72817 + }, + { + "epoch": 1.87, + "learning_rate": 6.599856553290119e-07, + "loss": 0.6089, + "step": 72818 + }, + { + "epoch": 1.87, + "learning_rate": 6.599596336040287e-07, + "loss": 0.4497, + "step": 72819 + }, + { + "epoch": 1.87, + "learning_rate": 6.599336121393983e-07, + "loss": 0.479, + "step": 72820 + }, + { + "epoch": 1.87, + "learning_rate": 6.599075909351415e-07, + "loss": 0.4338, + "step": 72821 + }, + { + "epoch": 1.87, + "learning_rate": 6.598815699912776e-07, + "loss": 0.7764, + "step": 72822 + }, + { + "epoch": 1.87, + "learning_rate": 6.598555493078271e-07, + "loss": 0.5742, + "step": 72823 + }, + { + "epoch": 1.87, + "learning_rate": 6.598295288848092e-07, + "loss": 0.7334, + "step": 72824 + }, + { + "epoch": 1.87, + "learning_rate": 6.598035087222442e-07, + "loss": 0.5493, + "step": 72825 + }, + { + "epoch": 1.87, + "learning_rate": 6.597774888201521e-07, + "loss": 0.6787, + "step": 72826 + }, + { + "epoch": 1.87, + "learning_rate": 6.597514691785527e-07, + "loss": 0.585, + "step": 72827 + }, + { + "epoch": 1.87, + "learning_rate": 6.597254497974661e-07, + "loss": 0.5352, + "step": 72828 + }, + { + "epoch": 1.87, + "learning_rate": 6.596994306769118e-07, + "loss": 0.6943, + "step": 72829 + }, + { + "epoch": 1.87, + "learning_rate": 6.596734118169102e-07, + "loss": 0.6255, + "step": 72830 + }, + { + "epoch": 1.87, + "learning_rate": 6.596473932174809e-07, + "loss": 0.6113, + "step": 72831 + }, + { + "epoch": 1.87, + "learning_rate": 6.596213748786441e-07, + "loss": 0.5369, + "step": 72832 + }, + { + "epoch": 1.87, + "learning_rate": 6.595953568004198e-07, + "loss": 0.6982, + "step": 72833 + }, + { + "epoch": 1.87, + "learning_rate": 6.595693389828274e-07, + "loss": 0.6055, + "step": 72834 + }, + { + "epoch": 1.87, + "learning_rate": 6.595433214258869e-07, + "loss": 0.5996, + "step": 72835 + }, + { + "epoch": 1.87, + "learning_rate": 6.595173041296187e-07, + "loss": 0.5496, + "step": 72836 + }, + { + "epoch": 1.87, + "learning_rate": 6.594912870940421e-07, + "loss": 0.623, + "step": 72837 + }, + { + "epoch": 1.87, + "learning_rate": 6.594652703191777e-07, + "loss": 0.666, + "step": 72838 + }, + { + "epoch": 1.87, + "learning_rate": 6.594392538050449e-07, + "loss": 0.5923, + "step": 72839 + }, + { + "epoch": 1.87, + "learning_rate": 6.594132375516639e-07, + "loss": 0.749, + "step": 72840 + }, + { + "epoch": 1.87, + "learning_rate": 6.593872215590544e-07, + "loss": 0.5527, + "step": 72841 + }, + { + "epoch": 1.87, + "learning_rate": 6.593612058272366e-07, + "loss": 0.6196, + "step": 72842 + }, + { + "epoch": 1.87, + "learning_rate": 6.593351903562306e-07, + "loss": 0.7197, + "step": 72843 + }, + { + "epoch": 1.87, + "learning_rate": 6.593091751460553e-07, + "loss": 0.6938, + "step": 72844 + }, + { + "epoch": 1.87, + "learning_rate": 6.592831601967316e-07, + "loss": 0.5894, + "step": 72845 + }, + { + "epoch": 1.87, + "learning_rate": 6.592571455082791e-07, + "loss": 0.6616, + "step": 72846 + }, + { + "epoch": 1.87, + "learning_rate": 6.592311310807178e-07, + "loss": 0.6553, + "step": 72847 + }, + { + "epoch": 1.87, + "learning_rate": 6.592051169140673e-07, + "loss": 0.5273, + "step": 72848 + }, + { + "epoch": 1.87, + "learning_rate": 6.591791030083481e-07, + "loss": 0.9189, + "step": 72849 + }, + { + "epoch": 1.87, + "learning_rate": 6.591530893635795e-07, + "loss": 0.6792, + "step": 72850 + }, + { + "epoch": 1.87, + "learning_rate": 6.59127075979782e-07, + "loss": 0.5725, + "step": 72851 + }, + { + "epoch": 1.87, + "learning_rate": 6.591010628569749e-07, + "loss": 0.5498, + "step": 72852 + }, + { + "epoch": 1.87, + "learning_rate": 6.590750499951792e-07, + "loss": 0.7207, + "step": 72853 + }, + { + "epoch": 1.87, + "learning_rate": 6.590490373944133e-07, + "loss": 0.4761, + "step": 72854 + }, + { + "epoch": 1.87, + "learning_rate": 6.590230250546982e-07, + "loss": 0.5864, + "step": 72855 + }, + { + "epoch": 1.87, + "learning_rate": 6.589970129760531e-07, + "loss": 0.6797, + "step": 72856 + }, + { + "epoch": 1.87, + "learning_rate": 6.589710011584988e-07, + "loss": 0.4883, + "step": 72857 + }, + { + "epoch": 1.87, + "learning_rate": 6.589449896020543e-07, + "loss": 0.6943, + "step": 72858 + }, + { + "epoch": 1.87, + "learning_rate": 6.589189783067401e-07, + "loss": 0.6504, + "step": 72859 + }, + { + "epoch": 1.87, + "learning_rate": 6.588929672725759e-07, + "loss": 0.7764, + "step": 72860 + }, + { + "epoch": 1.87, + "learning_rate": 6.588669564995819e-07, + "loss": 0.5869, + "step": 72861 + }, + { + "epoch": 1.87, + "learning_rate": 6.588409459877776e-07, + "loss": 0.666, + "step": 72862 + }, + { + "epoch": 1.87, + "learning_rate": 6.588149357371833e-07, + "loss": 0.5303, + "step": 72863 + }, + { + "epoch": 1.87, + "learning_rate": 6.587889257478186e-07, + "loss": 0.6328, + "step": 72864 + }, + { + "epoch": 1.87, + "learning_rate": 6.587629160197034e-07, + "loss": 0.6641, + "step": 72865 + }, + { + "epoch": 1.87, + "learning_rate": 6.587369065528579e-07, + "loss": 0.6387, + "step": 72866 + }, + { + "epoch": 1.87, + "learning_rate": 6.587108973473017e-07, + "loss": 0.5205, + "step": 72867 + }, + { + "epoch": 1.87, + "learning_rate": 6.586848884030549e-07, + "loss": 0.6689, + "step": 72868 + }, + { + "epoch": 1.87, + "learning_rate": 6.586588797201373e-07, + "loss": 0.7471, + "step": 72869 + }, + { + "epoch": 1.87, + "learning_rate": 6.586328712985691e-07, + "loss": 0.5962, + "step": 72870 + }, + { + "epoch": 1.87, + "learning_rate": 6.586068631383701e-07, + "loss": 0.4563, + "step": 72871 + }, + { + "epoch": 1.87, + "learning_rate": 6.5858085523956e-07, + "loss": 0.4651, + "step": 72872 + }, + { + "epoch": 1.87, + "learning_rate": 6.585548476021589e-07, + "loss": 0.5105, + "step": 72873 + }, + { + "epoch": 1.87, + "learning_rate": 6.585288402261868e-07, + "loss": 0.7266, + "step": 72874 + }, + { + "epoch": 1.87, + "learning_rate": 6.585028331116631e-07, + "loss": 0.6533, + "step": 72875 + }, + { + "epoch": 1.87, + "learning_rate": 6.584768262586082e-07, + "loss": 0.464, + "step": 72876 + }, + { + "epoch": 1.87, + "learning_rate": 6.584508196670419e-07, + "loss": 0.6216, + "step": 72877 + }, + { + "epoch": 1.87, + "learning_rate": 6.584248133369841e-07, + "loss": 0.7295, + "step": 72878 + }, + { + "epoch": 1.87, + "learning_rate": 6.583988072684546e-07, + "loss": 0.605, + "step": 72879 + }, + { + "epoch": 1.87, + "learning_rate": 6.583728014614737e-07, + "loss": 0.7026, + "step": 72880 + }, + { + "epoch": 1.87, + "learning_rate": 6.583467959160607e-07, + "loss": 0.7773, + "step": 72881 + }, + { + "epoch": 1.87, + "learning_rate": 6.583207906322361e-07, + "loss": 0.6455, + "step": 72882 + }, + { + "epoch": 1.87, + "learning_rate": 6.582947856100198e-07, + "loss": 0.5537, + "step": 72883 + }, + { + "epoch": 1.87, + "learning_rate": 6.582687808494312e-07, + "loss": 0.665, + "step": 72884 + }, + { + "epoch": 1.87, + "learning_rate": 6.582427763504905e-07, + "loss": 0.6191, + "step": 72885 + }, + { + "epoch": 1.87, + "learning_rate": 6.582167721132174e-07, + "loss": 0.4097, + "step": 72886 + }, + { + "epoch": 1.87, + "learning_rate": 6.581907681376322e-07, + "loss": 0.7061, + "step": 72887 + }, + { + "epoch": 1.87, + "learning_rate": 6.581647644237547e-07, + "loss": 0.6113, + "step": 72888 + }, + { + "epoch": 1.87, + "learning_rate": 6.581387609716044e-07, + "loss": 0.6709, + "step": 72889 + }, + { + "epoch": 1.87, + "learning_rate": 6.581127577812018e-07, + "loss": 0.7578, + "step": 72890 + }, + { + "epoch": 1.87, + "learning_rate": 6.580867548525664e-07, + "loss": 0.5547, + "step": 72891 + }, + { + "epoch": 1.87, + "learning_rate": 6.580607521857183e-07, + "loss": 0.4016, + "step": 72892 + }, + { + "epoch": 1.87, + "learning_rate": 6.580347497806776e-07, + "loss": 0.5879, + "step": 72893 + }, + { + "epoch": 1.87, + "learning_rate": 6.580087476374636e-07, + "loss": 0.5601, + "step": 72894 + }, + { + "epoch": 1.87, + "learning_rate": 6.579827457560969e-07, + "loss": 0.7266, + "step": 72895 + }, + { + "epoch": 1.87, + "learning_rate": 6.579567441365968e-07, + "loss": 0.6934, + "step": 72896 + }, + { + "epoch": 1.87, + "learning_rate": 6.579307427789835e-07, + "loss": 0.625, + "step": 72897 + }, + { + "epoch": 1.87, + "learning_rate": 6.579047416832769e-07, + "loss": 0.7012, + "step": 72898 + }, + { + "epoch": 1.87, + "learning_rate": 6.578787408494971e-07, + "loss": 0.4702, + "step": 72899 + }, + { + "epoch": 1.87, + "learning_rate": 6.578527402776636e-07, + "loss": 0.8262, + "step": 72900 + }, + { + "epoch": 1.87, + "learning_rate": 6.578267399677967e-07, + "loss": 0.7305, + "step": 72901 + }, + { + "epoch": 1.87, + "learning_rate": 6.578007399199159e-07, + "loss": 0.6382, + "step": 72902 + }, + { + "epoch": 1.87, + "learning_rate": 6.577747401340418e-07, + "loss": 0.7529, + "step": 72903 + }, + { + "epoch": 1.87, + "learning_rate": 6.577487406101937e-07, + "loss": 0.8042, + "step": 72904 + }, + { + "epoch": 1.87, + "learning_rate": 6.577227413483915e-07, + "loss": 0.4878, + "step": 72905 + }, + { + "epoch": 1.87, + "learning_rate": 6.576967423486553e-07, + "loss": 0.4431, + "step": 72906 + }, + { + "epoch": 1.87, + "learning_rate": 6.576707436110049e-07, + "loss": 0.7524, + "step": 72907 + }, + { + "epoch": 1.87, + "learning_rate": 6.576447451354602e-07, + "loss": 0.6484, + "step": 72908 + }, + { + "epoch": 1.87, + "learning_rate": 6.576187469220413e-07, + "loss": 0.4956, + "step": 72909 + }, + { + "epoch": 1.87, + "learning_rate": 6.575927489707679e-07, + "loss": 0.584, + "step": 72910 + }, + { + "epoch": 1.87, + "learning_rate": 6.575667512816601e-07, + "loss": 0.6094, + "step": 72911 + }, + { + "epoch": 1.87, + "learning_rate": 6.575407538547375e-07, + "loss": 0.8506, + "step": 72912 + }, + { + "epoch": 1.87, + "learning_rate": 6.575147566900207e-07, + "loss": 0.4673, + "step": 72913 + }, + { + "epoch": 1.87, + "learning_rate": 6.574887597875287e-07, + "loss": 0.749, + "step": 72914 + }, + { + "epoch": 1.87, + "learning_rate": 6.574627631472817e-07, + "loss": 0.5801, + "step": 72915 + }, + { + "epoch": 1.87, + "learning_rate": 6.574367667693e-07, + "loss": 0.668, + "step": 72916 + }, + { + "epoch": 1.87, + "learning_rate": 6.57410770653603e-07, + "loss": 0.6904, + "step": 72917 + }, + { + "epoch": 1.87, + "learning_rate": 6.573847748002111e-07, + "loss": 0.7422, + "step": 72918 + }, + { + "epoch": 1.87, + "learning_rate": 6.573587792091435e-07, + "loss": 0.6431, + "step": 72919 + }, + { + "epoch": 1.87, + "learning_rate": 6.573327838804208e-07, + "loss": 0.5645, + "step": 72920 + }, + { + "epoch": 1.87, + "learning_rate": 6.573067888140624e-07, + "loss": 0.7412, + "step": 72921 + }, + { + "epoch": 1.87, + "learning_rate": 6.572807940100887e-07, + "loss": 0.8018, + "step": 72922 + }, + { + "epoch": 1.87, + "learning_rate": 6.572547994685196e-07, + "loss": 0.6895, + "step": 72923 + }, + { + "epoch": 1.87, + "learning_rate": 6.572288051893744e-07, + "loss": 0.6777, + "step": 72924 + }, + { + "epoch": 1.87, + "learning_rate": 6.572028111726732e-07, + "loss": 0.7754, + "step": 72925 + }, + { + "epoch": 1.87, + "learning_rate": 6.571768174184363e-07, + "loss": 0.6416, + "step": 72926 + }, + { + "epoch": 1.87, + "learning_rate": 6.571508239266832e-07, + "loss": 0.7134, + "step": 72927 + }, + { + "epoch": 1.87, + "learning_rate": 6.57124830697434e-07, + "loss": 0.4634, + "step": 72928 + }, + { + "epoch": 1.87, + "learning_rate": 6.570988377307084e-07, + "loss": 0.7559, + "step": 72929 + }, + { + "epoch": 1.87, + "learning_rate": 6.570728450265266e-07, + "loss": 0.5898, + "step": 72930 + }, + { + "epoch": 1.87, + "learning_rate": 6.570468525849083e-07, + "loss": 0.6377, + "step": 72931 + }, + { + "epoch": 1.87, + "learning_rate": 6.570208604058736e-07, + "loss": 0.668, + "step": 72932 + }, + { + "epoch": 1.87, + "learning_rate": 6.569948684894425e-07, + "loss": 0.6865, + "step": 72933 + }, + { + "epoch": 1.87, + "learning_rate": 6.569688768356341e-07, + "loss": 0.5981, + "step": 72934 + }, + { + "epoch": 1.87, + "learning_rate": 6.56942885444469e-07, + "loss": 0.6304, + "step": 72935 + }, + { + "epoch": 1.87, + "learning_rate": 6.56916894315967e-07, + "loss": 0.7656, + "step": 72936 + }, + { + "epoch": 1.87, + "learning_rate": 6.56890903450148e-07, + "loss": 0.5898, + "step": 72937 + }, + { + "epoch": 1.87, + "learning_rate": 6.568649128470318e-07, + "loss": 0.5591, + "step": 72938 + }, + { + "epoch": 1.87, + "learning_rate": 6.568389225066384e-07, + "loss": 0.7515, + "step": 72939 + }, + { + "epoch": 1.87, + "learning_rate": 6.568129324289875e-07, + "loss": 0.6265, + "step": 72940 + }, + { + "epoch": 1.87, + "learning_rate": 6.567869426140995e-07, + "loss": 0.7388, + "step": 72941 + }, + { + "epoch": 1.87, + "learning_rate": 6.567609530619935e-07, + "loss": 0.5747, + "step": 72942 + }, + { + "epoch": 1.87, + "learning_rate": 6.567349637726906e-07, + "loss": 0.541, + "step": 72943 + }, + { + "epoch": 1.87, + "learning_rate": 6.567089747462095e-07, + "loss": 0.6079, + "step": 72944 + }, + { + "epoch": 1.87, + "learning_rate": 6.566829859825706e-07, + "loss": 0.6709, + "step": 72945 + }, + { + "epoch": 1.87, + "learning_rate": 6.566569974817935e-07, + "loss": 0.7188, + "step": 72946 + }, + { + "epoch": 1.87, + "learning_rate": 6.566310092438987e-07, + "loss": 0.6714, + "step": 72947 + }, + { + "epoch": 1.87, + "learning_rate": 6.566050212689054e-07, + "loss": 0.6641, + "step": 72948 + }, + { + "epoch": 1.87, + "learning_rate": 6.565790335568342e-07, + "loss": 0.6079, + "step": 72949 + }, + { + "epoch": 1.87, + "learning_rate": 6.565530461077042e-07, + "loss": 0.7339, + "step": 72950 + }, + { + "epoch": 1.87, + "learning_rate": 6.565270589215362e-07, + "loss": 0.6943, + "step": 72951 + }, + { + "epoch": 1.87, + "learning_rate": 6.565010719983493e-07, + "loss": 0.5405, + "step": 72952 + }, + { + "epoch": 1.87, + "learning_rate": 6.564750853381642e-07, + "loss": 0.6851, + "step": 72953 + }, + { + "epoch": 1.87, + "learning_rate": 6.564490989410001e-07, + "loss": 0.5151, + "step": 72954 + }, + { + "epoch": 1.87, + "learning_rate": 6.564231128068769e-07, + "loss": 0.6797, + "step": 72955 + }, + { + "epoch": 1.87, + "learning_rate": 6.563971269358148e-07, + "loss": 0.7119, + "step": 72956 + }, + { + "epoch": 1.87, + "learning_rate": 6.563711413278336e-07, + "loss": 0.8271, + "step": 72957 + }, + { + "epoch": 1.87, + "learning_rate": 6.563451559829534e-07, + "loss": 0.4683, + "step": 72958 + }, + { + "epoch": 1.87, + "learning_rate": 6.563191709011937e-07, + "loss": 0.6396, + "step": 72959 + }, + { + "epoch": 1.87, + "learning_rate": 6.562931860825749e-07, + "loss": 0.6416, + "step": 72960 + }, + { + "epoch": 1.87, + "learning_rate": 6.562672015271164e-07, + "loss": 0.8184, + "step": 72961 + }, + { + "epoch": 1.87, + "learning_rate": 6.562412172348383e-07, + "loss": 0.731, + "step": 72962 + }, + { + "epoch": 1.87, + "learning_rate": 6.562152332057608e-07, + "loss": 0.5073, + "step": 72963 + }, + { + "epoch": 1.87, + "learning_rate": 6.561892494399033e-07, + "loss": 0.6816, + "step": 72964 + }, + { + "epoch": 1.87, + "learning_rate": 6.561632659372856e-07, + "loss": 0.7158, + "step": 72965 + }, + { + "epoch": 1.87, + "learning_rate": 6.561372826979281e-07, + "loss": 0.6519, + "step": 72966 + }, + { + "epoch": 1.87, + "learning_rate": 6.561112997218503e-07, + "loss": 0.6904, + "step": 72967 + }, + { + "epoch": 1.87, + "learning_rate": 6.560853170090725e-07, + "loss": 0.7197, + "step": 72968 + }, + { + "epoch": 1.87, + "learning_rate": 6.560593345596142e-07, + "loss": 0.7227, + "step": 72969 + }, + { + "epoch": 1.87, + "learning_rate": 6.560333523734956e-07, + "loss": 0.519, + "step": 72970 + }, + { + "epoch": 1.87, + "learning_rate": 6.560073704507363e-07, + "loss": 0.4561, + "step": 72971 + }, + { + "epoch": 1.87, + "learning_rate": 6.559813887913565e-07, + "loss": 0.6147, + "step": 72972 + }, + { + "epoch": 1.87, + "learning_rate": 6.559554073953761e-07, + "loss": 0.5532, + "step": 72973 + }, + { + "epoch": 1.87, + "learning_rate": 6.559294262628144e-07, + "loss": 0.5171, + "step": 72974 + }, + { + "epoch": 1.87, + "learning_rate": 6.559034453936921e-07, + "loss": 0.3677, + "step": 72975 + }, + { + "epoch": 1.87, + "learning_rate": 6.558774647880282e-07, + "loss": 0.7568, + "step": 72976 + }, + { + "epoch": 1.87, + "learning_rate": 6.558514844458434e-07, + "loss": 0.6709, + "step": 72977 + }, + { + "epoch": 1.87, + "learning_rate": 6.558255043671575e-07, + "loss": 0.4902, + "step": 72978 + }, + { + "epoch": 1.87, + "learning_rate": 6.557995245519899e-07, + "loss": 0.6021, + "step": 72979 + }, + { + "epoch": 1.87, + "learning_rate": 6.557735450003607e-07, + "loss": 0.667, + "step": 72980 + }, + { + "epoch": 1.87, + "learning_rate": 6.5574756571229e-07, + "loss": 0.6284, + "step": 72981 + }, + { + "epoch": 1.87, + "learning_rate": 6.557215866877976e-07, + "loss": 0.751, + "step": 72982 + }, + { + "epoch": 1.87, + "learning_rate": 6.556956079269036e-07, + "loss": 0.6172, + "step": 72983 + }, + { + "epoch": 1.87, + "learning_rate": 6.556696294296274e-07, + "loss": 0.7051, + "step": 72984 + }, + { + "epoch": 1.87, + "learning_rate": 6.556436511959891e-07, + "loss": 0.6484, + "step": 72985 + }, + { + "epoch": 1.87, + "learning_rate": 6.556176732260085e-07, + "loss": 0.5757, + "step": 72986 + }, + { + "epoch": 1.87, + "learning_rate": 6.555916955197058e-07, + "loss": 0.6543, + "step": 72987 + }, + { + "epoch": 1.87, + "learning_rate": 6.555657180771006e-07, + "loss": 0.4897, + "step": 72988 + }, + { + "epoch": 1.87, + "learning_rate": 6.555397408982129e-07, + "loss": 0.7109, + "step": 72989 + }, + { + "epoch": 1.87, + "learning_rate": 6.555137639830626e-07, + "loss": 0.7246, + "step": 72990 + }, + { + "epoch": 1.87, + "learning_rate": 6.554877873316696e-07, + "loss": 0.606, + "step": 72991 + }, + { + "epoch": 1.87, + "learning_rate": 6.554618109440536e-07, + "loss": 0.5371, + "step": 72992 + }, + { + "epoch": 1.87, + "learning_rate": 6.554358348202351e-07, + "loss": 0.6246, + "step": 72993 + }, + { + "epoch": 1.87, + "learning_rate": 6.554098589602333e-07, + "loss": 0.6797, + "step": 72994 + }, + { + "epoch": 1.87, + "learning_rate": 6.553838833640684e-07, + "loss": 0.7607, + "step": 72995 + }, + { + "epoch": 1.87, + "learning_rate": 6.553579080317598e-07, + "loss": 0.583, + "step": 72996 + }, + { + "epoch": 1.87, + "learning_rate": 6.553319329633282e-07, + "loss": 0.7764, + "step": 72997 + }, + { + "epoch": 1.87, + "learning_rate": 6.553059581587929e-07, + "loss": 0.5552, + "step": 72998 + }, + { + "epoch": 1.87, + "learning_rate": 6.552799836181741e-07, + "loss": 0.6162, + "step": 72999 + }, + { + "epoch": 1.87, + "learning_rate": 6.552540093414913e-07, + "loss": 0.5366, + "step": 73000 + }, + { + "epoch": 1.87, + "learning_rate": 6.552280353287649e-07, + "loss": 0.6738, + "step": 73001 + }, + { + "epoch": 1.87, + "learning_rate": 6.552020615800149e-07, + "loss": 0.6426, + "step": 73002 + }, + { + "epoch": 1.87, + "learning_rate": 6.551760880952603e-07, + "loss": 0.7192, + "step": 73003 + }, + { + "epoch": 1.87, + "learning_rate": 6.551501148745218e-07, + "loss": 0.5874, + "step": 73004 + }, + { + "epoch": 1.87, + "learning_rate": 6.551241419178186e-07, + "loss": 0.6826, + "step": 73005 + }, + { + "epoch": 1.87, + "learning_rate": 6.550981692251713e-07, + "loss": 0.4592, + "step": 73006 + }, + { + "epoch": 1.87, + "learning_rate": 6.550721967965993e-07, + "loss": 0.4948, + "step": 73007 + }, + { + "epoch": 1.87, + "learning_rate": 6.550462246321228e-07, + "loss": 0.6904, + "step": 73008 + }, + { + "epoch": 1.87, + "learning_rate": 6.550202527317615e-07, + "loss": 0.6895, + "step": 73009 + }, + { + "epoch": 1.87, + "learning_rate": 6.549942810955353e-07, + "loss": 0.5996, + "step": 73010 + }, + { + "epoch": 1.87, + "learning_rate": 6.549683097234641e-07, + "loss": 0.6294, + "step": 73011 + }, + { + "epoch": 1.87, + "learning_rate": 6.549423386155684e-07, + "loss": 0.7188, + "step": 73012 + }, + { + "epoch": 1.87, + "learning_rate": 6.549163677718668e-07, + "loss": 0.7217, + "step": 73013 + }, + { + "epoch": 1.87, + "learning_rate": 6.5489039719238e-07, + "loss": 0.6626, + "step": 73014 + }, + { + "epoch": 1.87, + "learning_rate": 6.548644268771276e-07, + "loss": 0.5952, + "step": 73015 + }, + { + "epoch": 1.87, + "learning_rate": 6.548384568261299e-07, + "loss": 0.7178, + "step": 73016 + }, + { + "epoch": 1.87, + "learning_rate": 6.548124870394062e-07, + "loss": 0.7344, + "step": 73017 + }, + { + "epoch": 1.87, + "learning_rate": 6.547865175169771e-07, + "loss": 0.6978, + "step": 73018 + }, + { + "epoch": 1.87, + "learning_rate": 6.547605482588618e-07, + "loss": 0.5879, + "step": 73019 + }, + { + "epoch": 1.87, + "learning_rate": 6.547345792650807e-07, + "loss": 0.6357, + "step": 73020 + }, + { + "epoch": 1.87, + "learning_rate": 6.547086105356532e-07, + "loss": 0.6182, + "step": 73021 + }, + { + "epoch": 1.87, + "learning_rate": 6.546826420705999e-07, + "loss": 0.5808, + "step": 73022 + }, + { + "epoch": 1.87, + "learning_rate": 6.546566738699399e-07, + "loss": 0.6343, + "step": 73023 + }, + { + "epoch": 1.87, + "learning_rate": 6.546307059336933e-07, + "loss": 0.6279, + "step": 73024 + }, + { + "epoch": 1.87, + "learning_rate": 6.546047382618803e-07, + "loss": 0.7939, + "step": 73025 + }, + { + "epoch": 1.87, + "learning_rate": 6.545787708545204e-07, + "loss": 0.6982, + "step": 73026 + }, + { + "epoch": 1.87, + "learning_rate": 6.545528037116338e-07, + "loss": 0.5859, + "step": 73027 + }, + { + "epoch": 1.87, + "learning_rate": 6.5452683683324e-07, + "loss": 0.6133, + "step": 73028 + }, + { + "epoch": 1.87, + "learning_rate": 6.545008702193594e-07, + "loss": 0.7031, + "step": 73029 + }, + { + "epoch": 1.87, + "learning_rate": 6.544749038700112e-07, + "loss": 0.5161, + "step": 73030 + }, + { + "epoch": 1.87, + "learning_rate": 6.544489377852162e-07, + "loss": 0.6147, + "step": 73031 + }, + { + "epoch": 1.87, + "learning_rate": 6.544229719649938e-07, + "loss": 0.6506, + "step": 73032 + }, + { + "epoch": 1.87, + "learning_rate": 6.543970064093636e-07, + "loss": 0.7227, + "step": 73033 + }, + { + "epoch": 1.87, + "learning_rate": 6.543710411183457e-07, + "loss": 0.6455, + "step": 73034 + }, + { + "epoch": 1.87, + "learning_rate": 6.543450760919599e-07, + "loss": 0.5193, + "step": 73035 + }, + { + "epoch": 1.87, + "learning_rate": 6.543191113302261e-07, + "loss": 0.5071, + "step": 73036 + }, + { + "epoch": 1.87, + "learning_rate": 6.542931468331645e-07, + "loss": 0.6646, + "step": 73037 + }, + { + "epoch": 1.87, + "learning_rate": 6.542671826007946e-07, + "loss": 0.5537, + "step": 73038 + }, + { + "epoch": 1.87, + "learning_rate": 6.542412186331365e-07, + "loss": 0.6699, + "step": 73039 + }, + { + "epoch": 1.87, + "learning_rate": 6.542152549302098e-07, + "loss": 0.7705, + "step": 73040 + }, + { + "epoch": 1.87, + "learning_rate": 6.541892914920348e-07, + "loss": 0.6011, + "step": 73041 + }, + { + "epoch": 1.87, + "learning_rate": 6.541633283186315e-07, + "loss": 0.5327, + "step": 73042 + }, + { + "epoch": 1.87, + "learning_rate": 6.541373654100189e-07, + "loss": 0.7324, + "step": 73043 + }, + { + "epoch": 1.87, + "learning_rate": 6.541114027662178e-07, + "loss": 0.7402, + "step": 73044 + }, + { + "epoch": 1.87, + "learning_rate": 6.540854403872472e-07, + "loss": 0.7305, + "step": 73045 + }, + { + "epoch": 1.87, + "learning_rate": 6.540594782731279e-07, + "loss": 0.6787, + "step": 73046 + }, + { + "epoch": 1.87, + "learning_rate": 6.54033516423879e-07, + "loss": 0.6987, + "step": 73047 + }, + { + "epoch": 1.87, + "learning_rate": 6.54007554839521e-07, + "loss": 0.5684, + "step": 73048 + }, + { + "epoch": 1.87, + "learning_rate": 6.539815935200733e-07, + "loss": 0.6572, + "step": 73049 + }, + { + "epoch": 1.87, + "learning_rate": 6.539556324655562e-07, + "loss": 0.6123, + "step": 73050 + }, + { + "epoch": 1.87, + "learning_rate": 6.539296716759894e-07, + "loss": 0.7256, + "step": 73051 + }, + { + "epoch": 1.87, + "learning_rate": 6.539037111513929e-07, + "loss": 0.7754, + "step": 73052 + }, + { + "epoch": 1.87, + "learning_rate": 6.53877750891786e-07, + "loss": 0.5615, + "step": 73053 + }, + { + "epoch": 1.87, + "learning_rate": 6.538517908971892e-07, + "loss": 0.6025, + "step": 73054 + }, + { + "epoch": 1.87, + "learning_rate": 6.538258311676219e-07, + "loss": 0.7383, + "step": 73055 + }, + { + "epoch": 1.87, + "learning_rate": 6.537998717031045e-07, + "loss": 0.6543, + "step": 73056 + }, + { + "epoch": 1.87, + "learning_rate": 6.537739125036564e-07, + "loss": 0.5923, + "step": 73057 + }, + { + "epoch": 1.87, + "learning_rate": 6.53747953569298e-07, + "loss": 0.5806, + "step": 73058 + }, + { + "epoch": 1.87, + "learning_rate": 6.537219949000486e-07, + "loss": 0.6777, + "step": 73059 + }, + { + "epoch": 1.87, + "learning_rate": 6.536960364959285e-07, + "loss": 0.7686, + "step": 73060 + }, + { + "epoch": 1.87, + "learning_rate": 6.536700783569572e-07, + "loss": 0.6387, + "step": 73061 + }, + { + "epoch": 1.87, + "learning_rate": 6.536441204831554e-07, + "loss": 0.6543, + "step": 73062 + }, + { + "epoch": 1.87, + "learning_rate": 6.536181628745418e-07, + "loss": 0.5049, + "step": 73063 + }, + { + "epoch": 1.87, + "learning_rate": 6.53592205531137e-07, + "loss": 0.7529, + "step": 73064 + }, + { + "epoch": 1.87, + "learning_rate": 6.535662484529608e-07, + "loss": 0.751, + "step": 73065 + }, + { + "epoch": 1.87, + "learning_rate": 6.535402916400328e-07, + "loss": 0.4752, + "step": 73066 + }, + { + "epoch": 1.87, + "learning_rate": 6.535143350923732e-07, + "loss": 0.6128, + "step": 73067 + }, + { + "epoch": 1.87, + "learning_rate": 6.534883788100019e-07, + "loss": 0.7524, + "step": 73068 + }, + { + "epoch": 1.87, + "learning_rate": 6.534624227929382e-07, + "loss": 0.6553, + "step": 73069 + }, + { + "epoch": 1.87, + "learning_rate": 6.534364670412026e-07, + "loss": 0.6748, + "step": 73070 + }, + { + "epoch": 1.87, + "learning_rate": 6.534105115548147e-07, + "loss": 0.4878, + "step": 73071 + }, + { + "epoch": 1.87, + "learning_rate": 6.533845563337949e-07, + "loss": 0.6279, + "step": 73072 + }, + { + "epoch": 1.87, + "learning_rate": 6.533586013781622e-07, + "loss": 0.5688, + "step": 73073 + }, + { + "epoch": 1.87, + "learning_rate": 6.533326466879368e-07, + "loss": 0.6416, + "step": 73074 + }, + { + "epoch": 1.87, + "learning_rate": 6.533066922631388e-07, + "loss": 0.4858, + "step": 73075 + }, + { + "epoch": 1.87, + "learning_rate": 6.532807381037879e-07, + "loss": 0.8701, + "step": 73076 + }, + { + "epoch": 1.87, + "learning_rate": 6.53254784209904e-07, + "loss": 0.6226, + "step": 73077 + }, + { + "epoch": 1.87, + "learning_rate": 6.532288305815068e-07, + "loss": 0.6055, + "step": 73078 + }, + { + "epoch": 1.87, + "learning_rate": 6.532028772186166e-07, + "loss": 0.5859, + "step": 73079 + }, + { + "epoch": 1.87, + "learning_rate": 6.531769241212526e-07, + "loss": 0.5715, + "step": 73080 + }, + { + "epoch": 1.87, + "learning_rate": 6.531509712894357e-07, + "loss": 0.6802, + "step": 73081 + }, + { + "epoch": 1.87, + "learning_rate": 6.531250187231849e-07, + "loss": 0.3105, + "step": 73082 + }, + { + "epoch": 1.87, + "learning_rate": 6.530990664225202e-07, + "loss": 0.5066, + "step": 73083 + }, + { + "epoch": 1.87, + "learning_rate": 6.530731143874617e-07, + "loss": 0.5715, + "step": 73084 + }, + { + "epoch": 1.87, + "learning_rate": 6.530471626180291e-07, + "loss": 0.793, + "step": 73085 + }, + { + "epoch": 1.87, + "learning_rate": 6.530212111142423e-07, + "loss": 0.5571, + "step": 73086 + }, + { + "epoch": 1.87, + "learning_rate": 6.529952598761213e-07, + "loss": 0.5376, + "step": 73087 + }, + { + "epoch": 1.87, + "learning_rate": 6.529693089036858e-07, + "loss": 0.8291, + "step": 73088 + }, + { + "epoch": 1.87, + "learning_rate": 6.529433581969558e-07, + "loss": 0.5723, + "step": 73089 + }, + { + "epoch": 1.87, + "learning_rate": 6.529174077559509e-07, + "loss": 0.521, + "step": 73090 + }, + { + "epoch": 1.87, + "learning_rate": 6.528914575806914e-07, + "loss": 0.5474, + "step": 73091 + }, + { + "epoch": 1.87, + "learning_rate": 6.528655076711973e-07, + "loss": 0.6826, + "step": 73092 + }, + { + "epoch": 1.87, + "learning_rate": 6.528395580274875e-07, + "loss": 0.7871, + "step": 73093 + }, + { + "epoch": 1.87, + "learning_rate": 6.528136086495829e-07, + "loss": 0.7646, + "step": 73094 + }, + { + "epoch": 1.87, + "learning_rate": 6.527876595375026e-07, + "loss": 0.5576, + "step": 73095 + }, + { + "epoch": 1.87, + "learning_rate": 6.52761710691267e-07, + "loss": 0.6621, + "step": 73096 + }, + { + "epoch": 1.87, + "learning_rate": 6.527357621108957e-07, + "loss": 0.8037, + "step": 73097 + }, + { + "epoch": 1.87, + "learning_rate": 6.527098137964089e-07, + "loss": 0.5957, + "step": 73098 + }, + { + "epoch": 1.87, + "learning_rate": 6.526838657478259e-07, + "loss": 0.5596, + "step": 73099 + }, + { + "epoch": 1.87, + "learning_rate": 6.526579179651672e-07, + "loss": 0.6128, + "step": 73100 + }, + { + "epoch": 1.87, + "learning_rate": 6.526319704484521e-07, + "loss": 0.5469, + "step": 73101 + }, + { + "epoch": 1.87, + "learning_rate": 6.526060231977011e-07, + "loss": 0.5586, + "step": 73102 + }, + { + "epoch": 1.87, + "learning_rate": 6.525800762129336e-07, + "loss": 0.5684, + "step": 73103 + }, + { + "epoch": 1.87, + "learning_rate": 6.525541294941694e-07, + "loss": 0.4819, + "step": 73104 + }, + { + "epoch": 1.87, + "learning_rate": 6.525281830414284e-07, + "loss": 0.4351, + "step": 73105 + }, + { + "epoch": 1.87, + "learning_rate": 6.525022368547308e-07, + "loss": 0.7217, + "step": 73106 + }, + { + "epoch": 1.87, + "learning_rate": 6.524762909340961e-07, + "loss": 0.6112, + "step": 73107 + }, + { + "epoch": 1.87, + "learning_rate": 6.524503452795446e-07, + "loss": 0.5796, + "step": 73108 + }, + { + "epoch": 1.87, + "learning_rate": 6.524243998910956e-07, + "loss": 0.6128, + "step": 73109 + }, + { + "epoch": 1.87, + "learning_rate": 6.523984547687693e-07, + "loss": 0.6289, + "step": 73110 + }, + { + "epoch": 1.87, + "learning_rate": 6.523725099125856e-07, + "loss": 0.7803, + "step": 73111 + }, + { + "epoch": 1.87, + "learning_rate": 6.523465653225645e-07, + "loss": 0.4839, + "step": 73112 + }, + { + "epoch": 1.87, + "learning_rate": 6.523206209987256e-07, + "loss": 0.6006, + "step": 73113 + }, + { + "epoch": 1.87, + "learning_rate": 6.522946769410884e-07, + "loss": 0.5435, + "step": 73114 + }, + { + "epoch": 1.87, + "learning_rate": 6.522687331496734e-07, + "loss": 0.5122, + "step": 73115 + }, + { + "epoch": 1.87, + "learning_rate": 6.522427896245002e-07, + "loss": 0.7002, + "step": 73116 + }, + { + "epoch": 1.87, + "learning_rate": 6.522168463655888e-07, + "loss": 0.7188, + "step": 73117 + }, + { + "epoch": 1.87, + "learning_rate": 6.521909033729588e-07, + "loss": 0.6611, + "step": 73118 + }, + { + "epoch": 1.87, + "learning_rate": 6.521649606466304e-07, + "loss": 0.7119, + "step": 73119 + }, + { + "epoch": 1.87, + "learning_rate": 6.521390181866231e-07, + "loss": 0.833, + "step": 73120 + }, + { + "epoch": 1.87, + "learning_rate": 6.521130759929572e-07, + "loss": 0.7559, + "step": 73121 + }, + { + "epoch": 1.87, + "learning_rate": 6.520871340656527e-07, + "loss": 0.6509, + "step": 73122 + }, + { + "epoch": 1.87, + "learning_rate": 6.520611924047286e-07, + "loss": 0.6484, + "step": 73123 + }, + { + "epoch": 1.87, + "learning_rate": 6.520352510102052e-07, + "loss": 0.7373, + "step": 73124 + }, + { + "epoch": 1.87, + "learning_rate": 6.520093098821025e-07, + "loss": 0.7256, + "step": 73125 + }, + { + "epoch": 1.87, + "learning_rate": 6.519833690204401e-07, + "loss": 0.3957, + "step": 73126 + }, + { + "epoch": 1.87, + "learning_rate": 6.519574284252383e-07, + "loss": 0.7061, + "step": 73127 + }, + { + "epoch": 1.87, + "learning_rate": 6.519314880965164e-07, + "loss": 0.605, + "step": 73128 + }, + { + "epoch": 1.87, + "learning_rate": 6.519055480342947e-07, + "loss": 0.623, + "step": 73129 + }, + { + "epoch": 1.87, + "learning_rate": 6.518796082385929e-07, + "loss": 0.5977, + "step": 73130 + }, + { + "epoch": 1.87, + "learning_rate": 6.518536687094309e-07, + "loss": 0.584, + "step": 73131 + }, + { + "epoch": 1.87, + "learning_rate": 6.518277294468289e-07, + "loss": 0.7637, + "step": 73132 + }, + { + "epoch": 1.87, + "learning_rate": 6.51801790450806e-07, + "loss": 0.5757, + "step": 73133 + }, + { + "epoch": 1.87, + "learning_rate": 6.517758517213825e-07, + "loss": 0.7402, + "step": 73134 + }, + { + "epoch": 1.87, + "learning_rate": 6.517499132585782e-07, + "loss": 0.7046, + "step": 73135 + }, + { + "epoch": 1.87, + "learning_rate": 6.517239750624131e-07, + "loss": 0.7637, + "step": 73136 + }, + { + "epoch": 1.87, + "learning_rate": 6.516980371329066e-07, + "loss": 0.7031, + "step": 73137 + }, + { + "epoch": 1.87, + "learning_rate": 6.516720994700793e-07, + "loss": 0.4678, + "step": 73138 + }, + { + "epoch": 1.87, + "learning_rate": 6.516461620739503e-07, + "loss": 0.562, + "step": 73139 + }, + { + "epoch": 1.87, + "learning_rate": 6.516202249445401e-07, + "loss": 0.5093, + "step": 73140 + }, + { + "epoch": 1.87, + "learning_rate": 6.515942880818683e-07, + "loss": 0.7251, + "step": 73141 + }, + { + "epoch": 1.87, + "learning_rate": 6.515683514859549e-07, + "loss": 0.6582, + "step": 73142 + }, + { + "epoch": 1.87, + "learning_rate": 6.515424151568192e-07, + "loss": 0.7144, + "step": 73143 + }, + { + "epoch": 1.87, + "learning_rate": 6.515164790944816e-07, + "loss": 0.5574, + "step": 73144 + }, + { + "epoch": 1.87, + "learning_rate": 6.514905432989617e-07, + "loss": 0.564, + "step": 73145 + }, + { + "epoch": 1.87, + "learning_rate": 6.514646077702796e-07, + "loss": 0.7446, + "step": 73146 + }, + { + "epoch": 1.87, + "learning_rate": 6.514386725084548e-07, + "loss": 0.6826, + "step": 73147 + }, + { + "epoch": 1.87, + "learning_rate": 6.514127375135076e-07, + "loss": 0.6436, + "step": 73148 + }, + { + "epoch": 1.87, + "learning_rate": 6.513868027854575e-07, + "loss": 0.4497, + "step": 73149 + }, + { + "epoch": 1.87, + "learning_rate": 6.513608683243247e-07, + "loss": 0.6279, + "step": 73150 + }, + { + "epoch": 1.87, + "learning_rate": 6.513349341301286e-07, + "loss": 0.6284, + "step": 73151 + }, + { + "epoch": 1.87, + "learning_rate": 6.513090002028897e-07, + "loss": 0.7383, + "step": 73152 + }, + { + "epoch": 1.87, + "learning_rate": 6.512830665426272e-07, + "loss": 0.7051, + "step": 73153 + }, + { + "epoch": 1.87, + "learning_rate": 6.512571331493612e-07, + "loss": 0.6191, + "step": 73154 + }, + { + "epoch": 1.88, + "learning_rate": 6.512312000231117e-07, + "loss": 0.751, + "step": 73155 + }, + { + "epoch": 1.88, + "learning_rate": 6.512052671638981e-07, + "loss": 0.6748, + "step": 73156 + }, + { + "epoch": 1.88, + "learning_rate": 6.511793345717409e-07, + "loss": 0.6436, + "step": 73157 + }, + { + "epoch": 1.88, + "learning_rate": 6.511534022466598e-07, + "loss": 0.5356, + "step": 73158 + }, + { + "epoch": 1.88, + "learning_rate": 6.511274701886741e-07, + "loss": 0.7119, + "step": 73159 + }, + { + "epoch": 1.88, + "learning_rate": 6.511015383978042e-07, + "loss": 0.6387, + "step": 73160 + }, + { + "epoch": 1.88, + "learning_rate": 6.510756068740697e-07, + "loss": 0.6465, + "step": 73161 + }, + { + "epoch": 1.88, + "learning_rate": 6.51049675617491e-07, + "loss": 0.6484, + "step": 73162 + }, + { + "epoch": 1.88, + "learning_rate": 6.510237446280873e-07, + "loss": 0.6328, + "step": 73163 + }, + { + "epoch": 1.88, + "learning_rate": 6.509978139058784e-07, + "loss": 0.5557, + "step": 73164 + }, + { + "epoch": 1.88, + "learning_rate": 6.509718834508848e-07, + "loss": 0.6973, + "step": 73165 + }, + { + "epoch": 1.88, + "learning_rate": 6.509459532631256e-07, + "loss": 0.6465, + "step": 73166 + }, + { + "epoch": 1.88, + "learning_rate": 6.509200233426214e-07, + "loss": 0.5635, + "step": 73167 + }, + { + "epoch": 1.88, + "learning_rate": 6.508940936893914e-07, + "loss": 0.6187, + "step": 73168 + }, + { + "epoch": 1.88, + "learning_rate": 6.508681643034559e-07, + "loss": 0.5918, + "step": 73169 + }, + { + "epoch": 1.88, + "learning_rate": 6.508422351848344e-07, + "loss": 0.4517, + "step": 73170 + }, + { + "epoch": 1.88, + "learning_rate": 6.508163063335472e-07, + "loss": 0.6914, + "step": 73171 + }, + { + "epoch": 1.88, + "learning_rate": 6.507903777496141e-07, + "loss": 0.75, + "step": 73172 + }, + { + "epoch": 1.88, + "learning_rate": 6.507644494330544e-07, + "loss": 0.5488, + "step": 73173 + }, + { + "epoch": 1.88, + "learning_rate": 6.507385213838883e-07, + "loss": 0.7783, + "step": 73174 + }, + { + "epoch": 1.88, + "learning_rate": 6.507125936021358e-07, + "loss": 0.6465, + "step": 73175 + }, + { + "epoch": 1.88, + "learning_rate": 6.506866660878164e-07, + "loss": 0.6216, + "step": 73176 + }, + { + "epoch": 1.88, + "learning_rate": 6.506607388409504e-07, + "loss": 0.6172, + "step": 73177 + }, + { + "epoch": 1.88, + "learning_rate": 6.506348118615572e-07, + "loss": 0.5483, + "step": 73178 + }, + { + "epoch": 1.88, + "learning_rate": 6.50608885149657e-07, + "loss": 0.7832, + "step": 73179 + }, + { + "epoch": 1.88, + "learning_rate": 6.505829587052693e-07, + "loss": 0.5718, + "step": 73180 + }, + { + "epoch": 1.88, + "learning_rate": 6.505570325284144e-07, + "loss": 0.5344, + "step": 73181 + }, + { + "epoch": 1.88, + "learning_rate": 6.505311066191121e-07, + "loss": 0.48, + "step": 73182 + }, + { + "epoch": 1.88, + "learning_rate": 6.505051809773816e-07, + "loss": 0.5918, + "step": 73183 + }, + { + "epoch": 1.88, + "learning_rate": 6.504792556032435e-07, + "loss": 0.7178, + "step": 73184 + }, + { + "epoch": 1.88, + "learning_rate": 6.50453330496717e-07, + "loss": 0.5757, + "step": 73185 + }, + { + "epoch": 1.88, + "learning_rate": 6.504274056578228e-07, + "loss": 0.4709, + "step": 73186 + }, + { + "epoch": 1.88, + "learning_rate": 6.504014810865799e-07, + "loss": 0.5366, + "step": 73187 + }, + { + "epoch": 1.88, + "learning_rate": 6.503755567830087e-07, + "loss": 0.7412, + "step": 73188 + }, + { + "epoch": 1.88, + "learning_rate": 6.503496327471286e-07, + "loss": 0.5759, + "step": 73189 + }, + { + "epoch": 1.88, + "learning_rate": 6.503237089789601e-07, + "loss": 0.5486, + "step": 73190 + }, + { + "epoch": 1.88, + "learning_rate": 6.502977854785223e-07, + "loss": 0.6333, + "step": 73191 + }, + { + "epoch": 1.88, + "learning_rate": 6.502718622458359e-07, + "loss": 0.8115, + "step": 73192 + }, + { + "epoch": 1.88, + "learning_rate": 6.502459392809199e-07, + "loss": 0.5938, + "step": 73193 + }, + { + "epoch": 1.88, + "learning_rate": 6.502200165837947e-07, + "loss": 0.4142, + "step": 73194 + }, + { + "epoch": 1.88, + "learning_rate": 6.501940941544796e-07, + "loss": 0.6655, + "step": 73195 + }, + { + "epoch": 1.88, + "learning_rate": 6.50168171992995e-07, + "loss": 0.7041, + "step": 73196 + }, + { + "epoch": 1.88, + "learning_rate": 6.501422500993605e-07, + "loss": 0.834, + "step": 73197 + }, + { + "epoch": 1.88, + "learning_rate": 6.50116328473596e-07, + "loss": 0.5856, + "step": 73198 + }, + { + "epoch": 1.88, + "learning_rate": 6.500904071157213e-07, + "loss": 0.5259, + "step": 73199 + }, + { + "epoch": 1.88, + "learning_rate": 6.500644860257564e-07, + "loss": 0.6313, + "step": 73200 + }, + { + "epoch": 1.88, + "learning_rate": 6.500385652037208e-07, + "loss": 0.5471, + "step": 73201 + }, + { + "epoch": 1.88, + "learning_rate": 6.500126446496351e-07, + "loss": 0.7539, + "step": 73202 + }, + { + "epoch": 1.88, + "learning_rate": 6.499867243635184e-07, + "loss": 0.7236, + "step": 73203 + }, + { + "epoch": 1.88, + "learning_rate": 6.499608043453904e-07, + "loss": 0.6235, + "step": 73204 + }, + { + "epoch": 1.88, + "learning_rate": 6.499348845952717e-07, + "loss": 0.8154, + "step": 73205 + }, + { + "epoch": 1.88, + "learning_rate": 6.499089651131815e-07, + "loss": 0.7012, + "step": 73206 + }, + { + "epoch": 1.88, + "learning_rate": 6.498830458991402e-07, + "loss": 0.4778, + "step": 73207 + }, + { + "epoch": 1.88, + "learning_rate": 6.498571269531669e-07, + "loss": 0.7734, + "step": 73208 + }, + { + "epoch": 1.88, + "learning_rate": 6.498312082752824e-07, + "loss": 0.6279, + "step": 73209 + }, + { + "epoch": 1.88, + "learning_rate": 6.498052898655057e-07, + "loss": 0.7607, + "step": 73210 + }, + { + "epoch": 1.88, + "learning_rate": 6.497793717238571e-07, + "loss": 0.533, + "step": 73211 + }, + { + "epoch": 1.88, + "learning_rate": 6.497534538503567e-07, + "loss": 0.7598, + "step": 73212 + }, + { + "epoch": 1.88, + "learning_rate": 6.497275362450237e-07, + "loss": 0.5806, + "step": 73213 + }, + { + "epoch": 1.88, + "learning_rate": 6.497016189078781e-07, + "loss": 0.7627, + "step": 73214 + }, + { + "epoch": 1.88, + "learning_rate": 6.496757018389399e-07, + "loss": 0.6387, + "step": 73215 + }, + { + "epoch": 1.88, + "learning_rate": 6.496497850382288e-07, + "loss": 0.5977, + "step": 73216 + }, + { + "epoch": 1.88, + "learning_rate": 6.496238685057649e-07, + "loss": 0.5737, + "step": 73217 + }, + { + "epoch": 1.88, + "learning_rate": 6.495979522415677e-07, + "loss": 0.7314, + "step": 73218 + }, + { + "epoch": 1.88, + "learning_rate": 6.495720362456576e-07, + "loss": 0.7734, + "step": 73219 + }, + { + "epoch": 1.88, + "learning_rate": 6.495461205180537e-07, + "loss": 0.584, + "step": 73220 + }, + { + "epoch": 1.88, + "learning_rate": 6.495202050587765e-07, + "loss": 0.6045, + "step": 73221 + }, + { + "epoch": 1.88, + "learning_rate": 6.494942898678457e-07, + "loss": 0.6396, + "step": 73222 + }, + { + "epoch": 1.88, + "learning_rate": 6.494683749452808e-07, + "loss": 0.6885, + "step": 73223 + }, + { + "epoch": 1.88, + "learning_rate": 6.494424602911018e-07, + "loss": 0.6201, + "step": 73224 + }, + { + "epoch": 1.88, + "learning_rate": 6.494165459053285e-07, + "loss": 0.5488, + "step": 73225 + }, + { + "epoch": 1.88, + "learning_rate": 6.49390631787981e-07, + "loss": 0.6504, + "step": 73226 + }, + { + "epoch": 1.88, + "learning_rate": 6.493647179390786e-07, + "loss": 0.5718, + "step": 73227 + }, + { + "epoch": 1.88, + "learning_rate": 6.49338804358642e-07, + "loss": 0.6016, + "step": 73228 + }, + { + "epoch": 1.88, + "learning_rate": 6.493128910466903e-07, + "loss": 0.4812, + "step": 73229 + }, + { + "epoch": 1.88, + "learning_rate": 6.492869780032438e-07, + "loss": 0.5796, + "step": 73230 + }, + { + "epoch": 1.88, + "learning_rate": 6.492610652283219e-07, + "loss": 0.6973, + "step": 73231 + }, + { + "epoch": 1.88, + "learning_rate": 6.49235152721945e-07, + "loss": 0.5562, + "step": 73232 + }, + { + "epoch": 1.88, + "learning_rate": 6.492092404841324e-07, + "loss": 0.4819, + "step": 73233 + }, + { + "epoch": 1.88, + "learning_rate": 6.491833285149042e-07, + "loss": 0.5122, + "step": 73234 + }, + { + "epoch": 1.88, + "learning_rate": 6.4915741681428e-07, + "loss": 0.6416, + "step": 73235 + }, + { + "epoch": 1.88, + "learning_rate": 6.491315053822802e-07, + "loss": 0.5776, + "step": 73236 + }, + { + "epoch": 1.88, + "learning_rate": 6.491055942189237e-07, + "loss": 0.6011, + "step": 73237 + }, + { + "epoch": 1.88, + "learning_rate": 6.490796833242313e-07, + "loss": 0.5376, + "step": 73238 + }, + { + "epoch": 1.88, + "learning_rate": 6.490537726982224e-07, + "loss": 0.7461, + "step": 73239 + }, + { + "epoch": 1.88, + "learning_rate": 6.490278623409169e-07, + "loss": 0.793, + "step": 73240 + }, + { + "epoch": 1.88, + "learning_rate": 6.490019522523345e-07, + "loss": 0.4685, + "step": 73241 + }, + { + "epoch": 1.88, + "learning_rate": 6.489760424324957e-07, + "loss": 0.5508, + "step": 73242 + }, + { + "epoch": 1.88, + "learning_rate": 6.489501328814194e-07, + "loss": 0.6714, + "step": 73243 + }, + { + "epoch": 1.88, + "learning_rate": 6.489242235991257e-07, + "loss": 0.6973, + "step": 73244 + }, + { + "epoch": 1.88, + "learning_rate": 6.488983145856348e-07, + "loss": 0.582, + "step": 73245 + }, + { + "epoch": 1.88, + "learning_rate": 6.488724058409661e-07, + "loss": 0.7178, + "step": 73246 + }, + { + "epoch": 1.88, + "learning_rate": 6.488464973651399e-07, + "loss": 0.5361, + "step": 73247 + }, + { + "epoch": 1.88, + "learning_rate": 6.488205891581758e-07, + "loss": 0.4722, + "step": 73248 + }, + { + "epoch": 1.88, + "learning_rate": 6.487946812200933e-07, + "loss": 0.5649, + "step": 73249 + }, + { + "epoch": 1.88, + "learning_rate": 6.487687735509128e-07, + "loss": 0.6816, + "step": 73250 + }, + { + "epoch": 1.88, + "learning_rate": 6.487428661506538e-07, + "loss": 0.6289, + "step": 73251 + }, + { + "epoch": 1.88, + "learning_rate": 6.487169590193365e-07, + "loss": 0.7295, + "step": 73252 + }, + { + "epoch": 1.88, + "learning_rate": 6.486910521569804e-07, + "loss": 0.6953, + "step": 73253 + }, + { + "epoch": 1.88, + "learning_rate": 6.486651455636052e-07, + "loss": 0.667, + "step": 73254 + }, + { + "epoch": 1.88, + "learning_rate": 6.486392392392311e-07, + "loss": 0.7129, + "step": 73255 + }, + { + "epoch": 1.88, + "learning_rate": 6.486133331838775e-07, + "loss": 0.3975, + "step": 73256 + }, + { + "epoch": 1.88, + "learning_rate": 6.485874273975649e-07, + "loss": 0.5171, + "step": 73257 + }, + { + "epoch": 1.88, + "learning_rate": 6.485615218803124e-07, + "loss": 0.4629, + "step": 73258 + }, + { + "epoch": 1.88, + "learning_rate": 6.485356166321404e-07, + "loss": 0.585, + "step": 73259 + }, + { + "epoch": 1.88, + "learning_rate": 6.485097116530683e-07, + "loss": 0.7207, + "step": 73260 + }, + { + "epoch": 1.88, + "learning_rate": 6.484838069431165e-07, + "loss": 0.7588, + "step": 73261 + }, + { + "epoch": 1.88, + "learning_rate": 6.484579025023045e-07, + "loss": 0.6426, + "step": 73262 + }, + { + "epoch": 1.88, + "learning_rate": 6.484319983306518e-07, + "loss": 0.3848, + "step": 73263 + }, + { + "epoch": 1.88, + "learning_rate": 6.484060944281788e-07, + "loss": 0.6738, + "step": 73264 + }, + { + "epoch": 1.88, + "learning_rate": 6.483801907949048e-07, + "loss": 0.7295, + "step": 73265 + }, + { + "epoch": 1.88, + "learning_rate": 6.483542874308502e-07, + "loss": 0.668, + "step": 73266 + }, + { + "epoch": 1.88, + "learning_rate": 6.483283843360345e-07, + "loss": 0.645, + "step": 73267 + }, + { + "epoch": 1.88, + "learning_rate": 6.483024815104774e-07, + "loss": 0.833, + "step": 73268 + }, + { + "epoch": 1.88, + "learning_rate": 6.482765789541991e-07, + "loss": 0.6973, + "step": 73269 + }, + { + "epoch": 1.88, + "learning_rate": 6.482506766672191e-07, + "loss": 0.6602, + "step": 73270 + }, + { + "epoch": 1.88, + "learning_rate": 6.482247746495575e-07, + "loss": 0.8447, + "step": 73271 + }, + { + "epoch": 1.88, + "learning_rate": 6.481988729012343e-07, + "loss": 0.5337, + "step": 73272 + }, + { + "epoch": 1.88, + "learning_rate": 6.481729714222686e-07, + "loss": 0.6816, + "step": 73273 + }, + { + "epoch": 1.88, + "learning_rate": 6.481470702126809e-07, + "loss": 0.6152, + "step": 73274 + }, + { + "epoch": 1.88, + "learning_rate": 6.481211692724906e-07, + "loss": 0.7656, + "step": 73275 + }, + { + "epoch": 1.88, + "learning_rate": 6.480952686017179e-07, + "loss": 0.6406, + "step": 73276 + }, + { + "epoch": 1.88, + "learning_rate": 6.480693682003824e-07, + "loss": 0.4062, + "step": 73277 + }, + { + "epoch": 1.88, + "learning_rate": 6.480434680685041e-07, + "loss": 0.5596, + "step": 73278 + }, + { + "epoch": 1.88, + "learning_rate": 6.480175682061026e-07, + "loss": 0.4443, + "step": 73279 + }, + { + "epoch": 1.88, + "learning_rate": 6.479916686131979e-07, + "loss": 0.6494, + "step": 73280 + }, + { + "epoch": 1.88, + "learning_rate": 6.479657692898097e-07, + "loss": 0.4412, + "step": 73281 + }, + { + "epoch": 1.88, + "learning_rate": 6.479398702359585e-07, + "loss": 0.6528, + "step": 73282 + }, + { + "epoch": 1.88, + "learning_rate": 6.47913971451663e-07, + "loss": 0.5409, + "step": 73283 + }, + { + "epoch": 1.88, + "learning_rate": 6.478880729369438e-07, + "loss": 0.6367, + "step": 73284 + }, + { + "epoch": 1.88, + "learning_rate": 6.478621746918203e-07, + "loss": 0.5505, + "step": 73285 + }, + { + "epoch": 1.88, + "learning_rate": 6.478362767163128e-07, + "loss": 0.6436, + "step": 73286 + }, + { + "epoch": 1.88, + "learning_rate": 6.478103790104406e-07, + "loss": 0.457, + "step": 73287 + }, + { + "epoch": 1.88, + "learning_rate": 6.47784481574224e-07, + "loss": 0.5942, + "step": 73288 + }, + { + "epoch": 1.88, + "learning_rate": 6.477585844076822e-07, + "loss": 0.5674, + "step": 73289 + }, + { + "epoch": 1.88, + "learning_rate": 6.47732687510836e-07, + "loss": 0.6582, + "step": 73290 + }, + { + "epoch": 1.88, + "learning_rate": 6.477067908837047e-07, + "loss": 0.5112, + "step": 73291 + }, + { + "epoch": 1.88, + "learning_rate": 6.476808945263078e-07, + "loss": 0.6392, + "step": 73292 + }, + { + "epoch": 1.88, + "learning_rate": 6.476549984386656e-07, + "loss": 0.7021, + "step": 73293 + }, + { + "epoch": 1.88, + "learning_rate": 6.476291026207976e-07, + "loss": 0.7002, + "step": 73294 + }, + { + "epoch": 1.88, + "learning_rate": 6.47603207072724e-07, + "loss": 0.585, + "step": 73295 + }, + { + "epoch": 1.88, + "learning_rate": 6.475773117944641e-07, + "loss": 0.54, + "step": 73296 + }, + { + "epoch": 1.88, + "learning_rate": 6.475514167860383e-07, + "loss": 0.5522, + "step": 73297 + }, + { + "epoch": 1.88, + "learning_rate": 6.47525522047466e-07, + "loss": 0.6375, + "step": 73298 + }, + { + "epoch": 1.88, + "learning_rate": 6.474996275787674e-07, + "loss": 0.5422, + "step": 73299 + }, + { + "epoch": 1.88, + "learning_rate": 6.47473733379962e-07, + "loss": 0.8408, + "step": 73300 + }, + { + "epoch": 1.88, + "learning_rate": 6.474478394510703e-07, + "loss": 0.4768, + "step": 73301 + }, + { + "epoch": 1.88, + "learning_rate": 6.474219457921109e-07, + "loss": 0.7104, + "step": 73302 + }, + { + "epoch": 1.88, + "learning_rate": 6.473960524031046e-07, + "loss": 0.5327, + "step": 73303 + }, + { + "epoch": 1.88, + "learning_rate": 6.473701592840708e-07, + "loss": 0.6064, + "step": 73304 + }, + { + "epoch": 1.88, + "learning_rate": 6.473442664350294e-07, + "loss": 0.752, + "step": 73305 + }, + { + "epoch": 1.88, + "learning_rate": 6.473183738560002e-07, + "loss": 0.502, + "step": 73306 + }, + { + "epoch": 1.88, + "learning_rate": 6.472924815470035e-07, + "loss": 0.6143, + "step": 73307 + }, + { + "epoch": 1.88, + "learning_rate": 6.472665895080583e-07, + "loss": 0.5874, + "step": 73308 + }, + { + "epoch": 1.88, + "learning_rate": 6.472406977391851e-07, + "loss": 0.6846, + "step": 73309 + }, + { + "epoch": 1.88, + "learning_rate": 6.472148062404032e-07, + "loss": 0.8076, + "step": 73310 + }, + { + "epoch": 1.88, + "learning_rate": 6.471889150117334e-07, + "loss": 0.6074, + "step": 73311 + }, + { + "epoch": 1.88, + "learning_rate": 6.471630240531943e-07, + "loss": 0.4858, + "step": 73312 + }, + { + "epoch": 1.88, + "learning_rate": 6.471371333648062e-07, + "loss": 0.7266, + "step": 73313 + }, + { + "epoch": 1.88, + "learning_rate": 6.471112429465892e-07, + "loss": 0.5276, + "step": 73314 + }, + { + "epoch": 1.88, + "learning_rate": 6.470853527985627e-07, + "loss": 0.6489, + "step": 73315 + }, + { + "epoch": 1.88, + "learning_rate": 6.470594629207468e-07, + "loss": 0.8096, + "step": 73316 + }, + { + "epoch": 1.88, + "learning_rate": 6.470335733131611e-07, + "loss": 0.6377, + "step": 73317 + }, + { + "epoch": 1.88, + "learning_rate": 6.470076839758257e-07, + "loss": 0.5698, + "step": 73318 + }, + { + "epoch": 1.88, + "learning_rate": 6.469817949087602e-07, + "loss": 0.4629, + "step": 73319 + }, + { + "epoch": 1.88, + "learning_rate": 6.469559061119847e-07, + "loss": 0.6899, + "step": 73320 + }, + { + "epoch": 1.88, + "learning_rate": 6.469300175855189e-07, + "loss": 0.6665, + "step": 73321 + }, + { + "epoch": 1.88, + "learning_rate": 6.469041293293825e-07, + "loss": 0.6978, + "step": 73322 + }, + { + "epoch": 1.88, + "learning_rate": 6.468782413435951e-07, + "loss": 0.6108, + "step": 73323 + }, + { + "epoch": 1.88, + "learning_rate": 6.46852353628177e-07, + "loss": 0.6963, + "step": 73324 + }, + { + "epoch": 1.88, + "learning_rate": 6.468264661831475e-07, + "loss": 0.4211, + "step": 73325 + }, + { + "epoch": 1.88, + "learning_rate": 6.468005790085272e-07, + "loss": 0.834, + "step": 73326 + }, + { + "epoch": 1.88, + "learning_rate": 6.46774692104335e-07, + "loss": 0.4854, + "step": 73327 + }, + { + "epoch": 1.88, + "learning_rate": 6.467488054705915e-07, + "loss": 0.5557, + "step": 73328 + }, + { + "epoch": 1.88, + "learning_rate": 6.46722919107316e-07, + "loss": 0.5728, + "step": 73329 + }, + { + "epoch": 1.88, + "learning_rate": 6.466970330145288e-07, + "loss": 0.6025, + "step": 73330 + }, + { + "epoch": 1.88, + "learning_rate": 6.466711471922495e-07, + "loss": 0.6855, + "step": 73331 + }, + { + "epoch": 1.88, + "learning_rate": 6.466452616404974e-07, + "loss": 0.8311, + "step": 73332 + }, + { + "epoch": 1.88, + "learning_rate": 6.466193763592931e-07, + "loss": 0.7441, + "step": 73333 + }, + { + "epoch": 1.88, + "learning_rate": 6.465934913486558e-07, + "loss": 0.6318, + "step": 73334 + }, + { + "epoch": 1.88, + "learning_rate": 6.465676066086059e-07, + "loss": 0.364, + "step": 73335 + }, + { + "epoch": 1.88, + "learning_rate": 6.465417221391627e-07, + "loss": 0.7065, + "step": 73336 + }, + { + "epoch": 1.88, + "learning_rate": 6.465158379403465e-07, + "loss": 0.5386, + "step": 73337 + }, + { + "epoch": 1.88, + "learning_rate": 6.464899540121768e-07, + "loss": 0.6699, + "step": 73338 + }, + { + "epoch": 1.88, + "learning_rate": 6.464640703546733e-07, + "loss": 0.7754, + "step": 73339 + }, + { + "epoch": 1.88, + "learning_rate": 6.464381869678563e-07, + "loss": 0.5996, + "step": 73340 + }, + { + "epoch": 1.88, + "learning_rate": 6.464123038517454e-07, + "loss": 0.5503, + "step": 73341 + }, + { + "epoch": 1.88, + "learning_rate": 6.463864210063599e-07, + "loss": 0.7109, + "step": 73342 + }, + { + "epoch": 1.88, + "learning_rate": 6.463605384317204e-07, + "loss": 0.7764, + "step": 73343 + }, + { + "epoch": 1.88, + "learning_rate": 6.463346561278461e-07, + "loss": 0.8223, + "step": 73344 + }, + { + "epoch": 1.88, + "learning_rate": 6.463087740947573e-07, + "loss": 0.6826, + "step": 73345 + }, + { + "epoch": 1.88, + "learning_rate": 6.462828923324735e-07, + "loss": 0.6694, + "step": 73346 + }, + { + "epoch": 1.88, + "learning_rate": 6.462570108410145e-07, + "loss": 0.6396, + "step": 73347 + }, + { + "epoch": 1.88, + "learning_rate": 6.462311296204004e-07, + "loss": 0.7148, + "step": 73348 + }, + { + "epoch": 1.88, + "learning_rate": 6.46205248670651e-07, + "loss": 0.8818, + "step": 73349 + }, + { + "epoch": 1.88, + "learning_rate": 6.461793679917858e-07, + "loss": 0.6533, + "step": 73350 + }, + { + "epoch": 1.88, + "learning_rate": 6.461534875838251e-07, + "loss": 0.5173, + "step": 73351 + }, + { + "epoch": 1.88, + "learning_rate": 6.461276074467881e-07, + "loss": 0.668, + "step": 73352 + }, + { + "epoch": 1.88, + "learning_rate": 6.461017275806948e-07, + "loss": 0.7041, + "step": 73353 + }, + { + "epoch": 1.88, + "learning_rate": 6.460758479855654e-07, + "loss": 0.5286, + "step": 73354 + }, + { + "epoch": 1.88, + "learning_rate": 6.460499686614192e-07, + "loss": 0.6592, + "step": 73355 + }, + { + "epoch": 1.88, + "learning_rate": 6.460240896082765e-07, + "loss": 0.6641, + "step": 73356 + }, + { + "epoch": 1.88, + "learning_rate": 6.459982108261568e-07, + "loss": 0.4723, + "step": 73357 + }, + { + "epoch": 1.88, + "learning_rate": 6.459723323150799e-07, + "loss": 0.6621, + "step": 73358 + }, + { + "epoch": 1.88, + "learning_rate": 6.459464540750658e-07, + "loss": 0.6104, + "step": 73359 + }, + { + "epoch": 1.88, + "learning_rate": 6.45920576106134e-07, + "loss": 0.7998, + "step": 73360 + }, + { + "epoch": 1.88, + "learning_rate": 6.458946984083051e-07, + "loss": 0.7842, + "step": 73361 + }, + { + "epoch": 1.88, + "learning_rate": 6.45868820981598e-07, + "loss": 0.5771, + "step": 73362 + }, + { + "epoch": 1.88, + "learning_rate": 6.458429438260326e-07, + "loss": 0.5238, + "step": 73363 + }, + { + "epoch": 1.88, + "learning_rate": 6.458170669416294e-07, + "loss": 0.5542, + "step": 73364 + }, + { + "epoch": 1.88, + "learning_rate": 6.457911903284074e-07, + "loss": 0.6201, + "step": 73365 + }, + { + "epoch": 1.88, + "learning_rate": 6.457653139863872e-07, + "loss": 0.5225, + "step": 73366 + }, + { + "epoch": 1.88, + "learning_rate": 6.457394379155878e-07, + "loss": 0.6191, + "step": 73367 + }, + { + "epoch": 1.88, + "learning_rate": 6.457135621160296e-07, + "loss": 0.8135, + "step": 73368 + }, + { + "epoch": 1.88, + "learning_rate": 6.456876865877323e-07, + "loss": 0.5073, + "step": 73369 + }, + { + "epoch": 1.88, + "learning_rate": 6.456618113307157e-07, + "loss": 0.4872, + "step": 73370 + }, + { + "epoch": 1.88, + "learning_rate": 6.456359363449997e-07, + "loss": 0.6152, + "step": 73371 + }, + { + "epoch": 1.88, + "learning_rate": 6.456100616306036e-07, + "loss": 0.7056, + "step": 73372 + }, + { + "epoch": 1.88, + "learning_rate": 6.455841871875478e-07, + "loss": 0.7168, + "step": 73373 + }, + { + "epoch": 1.88, + "learning_rate": 6.45558313015852e-07, + "loss": 0.7227, + "step": 73374 + }, + { + "epoch": 1.88, + "learning_rate": 6.455324391155354e-07, + "loss": 0.5786, + "step": 73375 + }, + { + "epoch": 1.88, + "learning_rate": 6.455065654866187e-07, + "loss": 0.7065, + "step": 73376 + }, + { + "epoch": 1.88, + "learning_rate": 6.454806921291211e-07, + "loss": 0.6377, + "step": 73377 + }, + { + "epoch": 1.88, + "learning_rate": 6.45454819043063e-07, + "loss": 0.709, + "step": 73378 + }, + { + "epoch": 1.88, + "learning_rate": 6.454289462284635e-07, + "loss": 0.6729, + "step": 73379 + }, + { + "epoch": 1.88, + "learning_rate": 6.454030736853429e-07, + "loss": 0.4507, + "step": 73380 + }, + { + "epoch": 1.88, + "learning_rate": 6.45377201413721e-07, + "loss": 0.6875, + "step": 73381 + }, + { + "epoch": 1.88, + "learning_rate": 6.453513294136172e-07, + "loss": 0.7637, + "step": 73382 + }, + { + "epoch": 1.88, + "learning_rate": 6.453254576850519e-07, + "loss": 0.5747, + "step": 73383 + }, + { + "epoch": 1.88, + "learning_rate": 6.452995862280441e-07, + "loss": 0.4875, + "step": 73384 + }, + { + "epoch": 1.88, + "learning_rate": 6.452737150426146e-07, + "loss": 0.6523, + "step": 73385 + }, + { + "epoch": 1.88, + "learning_rate": 6.452478441287823e-07, + "loss": 0.5962, + "step": 73386 + }, + { + "epoch": 1.88, + "learning_rate": 6.452219734865677e-07, + "loss": 0.5903, + "step": 73387 + }, + { + "epoch": 1.88, + "learning_rate": 6.451961031159901e-07, + "loss": 0.6387, + "step": 73388 + }, + { + "epoch": 1.88, + "learning_rate": 6.451702330170696e-07, + "loss": 0.5649, + "step": 73389 + }, + { + "epoch": 1.88, + "learning_rate": 6.451443631898259e-07, + "loss": 0.5244, + "step": 73390 + }, + { + "epoch": 1.88, + "learning_rate": 6.451184936342795e-07, + "loss": 0.5691, + "step": 73391 + }, + { + "epoch": 1.88, + "learning_rate": 6.450926243504489e-07, + "loss": 0.6113, + "step": 73392 + }, + { + "epoch": 1.88, + "learning_rate": 6.450667553383546e-07, + "loss": 0.7012, + "step": 73393 + }, + { + "epoch": 1.88, + "learning_rate": 6.450408865980163e-07, + "loss": 0.6084, + "step": 73394 + }, + { + "epoch": 1.88, + "learning_rate": 6.45015018129454e-07, + "loss": 0.4329, + "step": 73395 + }, + { + "epoch": 1.88, + "learning_rate": 6.449891499326872e-07, + "loss": 0.6289, + "step": 73396 + }, + { + "epoch": 1.88, + "learning_rate": 6.449632820077362e-07, + "loss": 0.5203, + "step": 73397 + }, + { + "epoch": 1.88, + "learning_rate": 6.449374143546202e-07, + "loss": 0.6499, + "step": 73398 + }, + { + "epoch": 1.88, + "learning_rate": 6.449115469733595e-07, + "loss": 0.5742, + "step": 73399 + }, + { + "epoch": 1.88, + "learning_rate": 6.448856798639735e-07, + "loss": 0.6182, + "step": 73400 + }, + { + "epoch": 1.88, + "learning_rate": 6.448598130264827e-07, + "loss": 0.5918, + "step": 73401 + }, + { + "epoch": 1.88, + "learning_rate": 6.44833946460906e-07, + "loss": 0.5503, + "step": 73402 + }, + { + "epoch": 1.88, + "learning_rate": 6.448080801672635e-07, + "loss": 0.5938, + "step": 73403 + }, + { + "epoch": 1.88, + "learning_rate": 6.447822141455754e-07, + "loss": 0.6074, + "step": 73404 + }, + { + "epoch": 1.88, + "learning_rate": 6.44756348395861e-07, + "loss": 0.5542, + "step": 73405 + }, + { + "epoch": 1.88, + "learning_rate": 6.447304829181404e-07, + "loss": 0.4692, + "step": 73406 + }, + { + "epoch": 1.88, + "learning_rate": 6.447046177124333e-07, + "loss": 0.7607, + "step": 73407 + }, + { + "epoch": 1.88, + "learning_rate": 6.446787527787596e-07, + "loss": 0.3619, + "step": 73408 + }, + { + "epoch": 1.88, + "learning_rate": 6.446528881171389e-07, + "loss": 0.5212, + "step": 73409 + }, + { + "epoch": 1.88, + "learning_rate": 6.446270237275915e-07, + "loss": 0.6719, + "step": 73410 + }, + { + "epoch": 1.88, + "learning_rate": 6.446011596101368e-07, + "loss": 0.6382, + "step": 73411 + }, + { + "epoch": 1.88, + "learning_rate": 6.445752957647945e-07, + "loss": 0.5791, + "step": 73412 + }, + { + "epoch": 1.88, + "learning_rate": 6.445494321915845e-07, + "loss": 0.5762, + "step": 73413 + }, + { + "epoch": 1.88, + "learning_rate": 6.445235688905268e-07, + "loss": 0.7178, + "step": 73414 + }, + { + "epoch": 1.88, + "learning_rate": 6.444977058616407e-07, + "loss": 0.7588, + "step": 73415 + }, + { + "epoch": 1.88, + "learning_rate": 6.444718431049467e-07, + "loss": 0.6797, + "step": 73416 + }, + { + "epoch": 1.88, + "learning_rate": 6.444459806204641e-07, + "loss": 0.627, + "step": 73417 + }, + { + "epoch": 1.88, + "learning_rate": 6.44420118408213e-07, + "loss": 0.6143, + "step": 73418 + }, + { + "epoch": 1.88, + "learning_rate": 6.44394256468213e-07, + "loss": 0.6221, + "step": 73419 + }, + { + "epoch": 1.88, + "learning_rate": 6.443683948004839e-07, + "loss": 0.5376, + "step": 73420 + }, + { + "epoch": 1.88, + "learning_rate": 6.44342533405046e-07, + "loss": 0.7305, + "step": 73421 + }, + { + "epoch": 1.88, + "learning_rate": 6.443166722819182e-07, + "loss": 0.4888, + "step": 73422 + }, + { + "epoch": 1.88, + "learning_rate": 6.44290811431121e-07, + "loss": 0.6548, + "step": 73423 + }, + { + "epoch": 1.88, + "learning_rate": 6.442649508526736e-07, + "loss": 0.4561, + "step": 73424 + }, + { + "epoch": 1.88, + "learning_rate": 6.442390905465965e-07, + "loss": 0.5139, + "step": 73425 + }, + { + "epoch": 1.88, + "learning_rate": 6.44213230512909e-07, + "loss": 0.6577, + "step": 73426 + }, + { + "epoch": 1.88, + "learning_rate": 6.441873707516312e-07, + "loss": 0.668, + "step": 73427 + }, + { + "epoch": 1.88, + "learning_rate": 6.441615112627826e-07, + "loss": 0.627, + "step": 73428 + }, + { + "epoch": 1.88, + "learning_rate": 6.441356520463835e-07, + "loss": 0.2308, + "step": 73429 + }, + { + "epoch": 1.88, + "learning_rate": 6.44109793102453e-07, + "loss": 0.708, + "step": 73430 + }, + { + "epoch": 1.88, + "learning_rate": 6.440839344310118e-07, + "loss": 0.6354, + "step": 73431 + }, + { + "epoch": 1.88, + "learning_rate": 6.440580760320786e-07, + "loss": 0.7871, + "step": 73432 + }, + { + "epoch": 1.88, + "learning_rate": 6.440322179056741e-07, + "loss": 0.5664, + "step": 73433 + }, + { + "epoch": 1.88, + "learning_rate": 6.440063600518175e-07, + "loss": 0.6357, + "step": 73434 + }, + { + "epoch": 1.88, + "learning_rate": 6.439805024705291e-07, + "loss": 0.769, + "step": 73435 + }, + { + "epoch": 1.88, + "learning_rate": 6.439546451618282e-07, + "loss": 0.6484, + "step": 73436 + }, + { + "epoch": 1.88, + "learning_rate": 6.439287881257352e-07, + "loss": 0.6816, + "step": 73437 + }, + { + "epoch": 1.88, + "learning_rate": 6.43902931362269e-07, + "loss": 0.6729, + "step": 73438 + }, + { + "epoch": 1.88, + "learning_rate": 6.438770748714505e-07, + "loss": 0.6699, + "step": 73439 + }, + { + "epoch": 1.88, + "learning_rate": 6.438512186532986e-07, + "loss": 0.6626, + "step": 73440 + }, + { + "epoch": 1.88, + "learning_rate": 6.438253627078339e-07, + "loss": 0.5413, + "step": 73441 + }, + { + "epoch": 1.88, + "learning_rate": 6.437995070350754e-07, + "loss": 0.5659, + "step": 73442 + }, + { + "epoch": 1.88, + "learning_rate": 6.437736516350433e-07, + "loss": 0.7568, + "step": 73443 + }, + { + "epoch": 1.88, + "learning_rate": 6.437477965077573e-07, + "loss": 0.5513, + "step": 73444 + }, + { + "epoch": 1.88, + "learning_rate": 6.437219416532372e-07, + "loss": 0.4735, + "step": 73445 + }, + { + "epoch": 1.88, + "learning_rate": 6.436960870715029e-07, + "loss": 0.5645, + "step": 73446 + }, + { + "epoch": 1.88, + "learning_rate": 6.436702327625742e-07, + "loss": 0.6909, + "step": 73447 + }, + { + "epoch": 1.88, + "learning_rate": 6.436443787264706e-07, + "loss": 0.5566, + "step": 73448 + }, + { + "epoch": 1.88, + "learning_rate": 6.436185249632122e-07, + "loss": 0.6221, + "step": 73449 + }, + { + "epoch": 1.88, + "learning_rate": 6.435926714728187e-07, + "loss": 0.6855, + "step": 73450 + }, + { + "epoch": 1.88, + "learning_rate": 6.435668182553102e-07, + "loss": 0.7393, + "step": 73451 + }, + { + "epoch": 1.88, + "learning_rate": 6.43540965310706e-07, + "loss": 0.502, + "step": 73452 + }, + { + "epoch": 1.88, + "learning_rate": 6.435151126390259e-07, + "loss": 0.6826, + "step": 73453 + }, + { + "epoch": 1.88, + "learning_rate": 6.434892602402902e-07, + "loss": 0.6655, + "step": 73454 + }, + { + "epoch": 1.88, + "learning_rate": 6.43463408114518e-07, + "loss": 0.6284, + "step": 73455 + }, + { + "epoch": 1.88, + "learning_rate": 6.434375562617298e-07, + "loss": 0.7607, + "step": 73456 + }, + { + "epoch": 1.88, + "learning_rate": 6.434117046819447e-07, + "loss": 0.4937, + "step": 73457 + }, + { + "epoch": 1.88, + "learning_rate": 6.433858533751833e-07, + "loss": 0.6182, + "step": 73458 + }, + { + "epoch": 1.88, + "learning_rate": 6.433600023414645e-07, + "loss": 0.6748, + "step": 73459 + }, + { + "epoch": 1.88, + "learning_rate": 6.43334151580809e-07, + "loss": 0.6807, + "step": 73460 + }, + { + "epoch": 1.88, + "learning_rate": 6.433083010932362e-07, + "loss": 0.7354, + "step": 73461 + }, + { + "epoch": 1.88, + "learning_rate": 6.432824508787655e-07, + "loss": 0.5703, + "step": 73462 + }, + { + "epoch": 1.88, + "learning_rate": 6.432566009374171e-07, + "loss": 0.4487, + "step": 73463 + }, + { + "epoch": 1.88, + "learning_rate": 6.432307512692108e-07, + "loss": 0.5107, + "step": 73464 + }, + { + "epoch": 1.88, + "learning_rate": 6.432049018741661e-07, + "loss": 0.5125, + "step": 73465 + }, + { + "epoch": 1.88, + "learning_rate": 6.431790527523032e-07, + "loss": 0.6963, + "step": 73466 + }, + { + "epoch": 1.88, + "learning_rate": 6.431532039036414e-07, + "loss": 0.6177, + "step": 73467 + }, + { + "epoch": 1.88, + "learning_rate": 6.431273553282012e-07, + "loss": 0.6641, + "step": 73468 + }, + { + "epoch": 1.88, + "learning_rate": 6.431015070260017e-07, + "loss": 0.8887, + "step": 73469 + }, + { + "epoch": 1.88, + "learning_rate": 6.430756589970631e-07, + "loss": 0.7354, + "step": 73470 + }, + { + "epoch": 1.88, + "learning_rate": 6.430498112414052e-07, + "loss": 0.8076, + "step": 73471 + }, + { + "epoch": 1.88, + "learning_rate": 6.430239637590473e-07, + "loss": 0.5566, + "step": 73472 + }, + { + "epoch": 1.88, + "learning_rate": 6.429981165500098e-07, + "loss": 0.582, + "step": 73473 + }, + { + "epoch": 1.88, + "learning_rate": 6.42972269614312e-07, + "loss": 0.6465, + "step": 73474 + }, + { + "epoch": 1.88, + "learning_rate": 6.429464229519741e-07, + "loss": 0.6157, + "step": 73475 + }, + { + "epoch": 1.88, + "learning_rate": 6.429205765630155e-07, + "loss": 0.7593, + "step": 73476 + }, + { + "epoch": 1.88, + "learning_rate": 6.428947304474563e-07, + "loss": 0.5635, + "step": 73477 + }, + { + "epoch": 1.88, + "learning_rate": 6.428688846053162e-07, + "loss": 0.624, + "step": 73478 + }, + { + "epoch": 1.88, + "learning_rate": 6.428430390366151e-07, + "loss": 0.6924, + "step": 73479 + }, + { + "epoch": 1.88, + "learning_rate": 6.428171937413725e-07, + "loss": 0.8018, + "step": 73480 + }, + { + "epoch": 1.88, + "learning_rate": 6.427913487196089e-07, + "loss": 0.6597, + "step": 73481 + }, + { + "epoch": 1.88, + "learning_rate": 6.427655039713428e-07, + "loss": 0.6436, + "step": 73482 + }, + { + "epoch": 1.88, + "learning_rate": 6.427396594965951e-07, + "loss": 0.6777, + "step": 73483 + }, + { + "epoch": 1.88, + "learning_rate": 6.427138152953848e-07, + "loss": 0.4271, + "step": 73484 + }, + { + "epoch": 1.88, + "learning_rate": 6.426879713677326e-07, + "loss": 0.585, + "step": 73485 + }, + { + "epoch": 1.88, + "learning_rate": 6.426621277136575e-07, + "loss": 0.563, + "step": 73486 + }, + { + "epoch": 1.88, + "learning_rate": 6.426362843331796e-07, + "loss": 0.7617, + "step": 73487 + }, + { + "epoch": 1.88, + "learning_rate": 6.426104412263187e-07, + "loss": 0.4236, + "step": 73488 + }, + { + "epoch": 1.88, + "learning_rate": 6.425845983930947e-07, + "loss": 0.6875, + "step": 73489 + }, + { + "epoch": 1.88, + "learning_rate": 6.425587558335268e-07, + "loss": 0.5864, + "step": 73490 + }, + { + "epoch": 1.88, + "learning_rate": 6.425329135476359e-07, + "loss": 0.6514, + "step": 73491 + }, + { + "epoch": 1.88, + "learning_rate": 6.425070715354408e-07, + "loss": 0.5698, + "step": 73492 + }, + { + "epoch": 1.88, + "learning_rate": 6.424812297969615e-07, + "loss": 0.7559, + "step": 73493 + }, + { + "epoch": 1.88, + "learning_rate": 6.424553883322179e-07, + "loss": 0.3063, + "step": 73494 + }, + { + "epoch": 1.88, + "learning_rate": 6.424295471412297e-07, + "loss": 0.5562, + "step": 73495 + }, + { + "epoch": 1.88, + "learning_rate": 6.424037062240169e-07, + "loss": 0.6965, + "step": 73496 + }, + { + "epoch": 1.88, + "learning_rate": 6.423778655805989e-07, + "loss": 0.8184, + "step": 73497 + }, + { + "epoch": 1.88, + "learning_rate": 6.42352025210996e-07, + "loss": 0.5745, + "step": 73498 + }, + { + "epoch": 1.88, + "learning_rate": 6.423261851152275e-07, + "loss": 0.7383, + "step": 73499 + }, + { + "epoch": 1.88, + "learning_rate": 6.423003452933137e-07, + "loss": 0.6406, + "step": 73500 + }, + { + "epoch": 1.88, + "learning_rate": 6.42274505745274e-07, + "loss": 0.7422, + "step": 73501 + }, + { + "epoch": 1.88, + "learning_rate": 6.422486664711284e-07, + "loss": 0.4399, + "step": 73502 + }, + { + "epoch": 1.88, + "learning_rate": 6.422228274708962e-07, + "loss": 0.6084, + "step": 73503 + }, + { + "epoch": 1.88, + "learning_rate": 6.421969887445977e-07, + "loss": 0.668, + "step": 73504 + }, + { + "epoch": 1.88, + "learning_rate": 6.421711502922523e-07, + "loss": 0.5659, + "step": 73505 + }, + { + "epoch": 1.88, + "learning_rate": 6.421453121138802e-07, + "loss": 0.6807, + "step": 73506 + }, + { + "epoch": 1.88, + "learning_rate": 6.421194742095009e-07, + "loss": 0.5923, + "step": 73507 + }, + { + "epoch": 1.88, + "learning_rate": 6.420936365791343e-07, + "loss": 0.6846, + "step": 73508 + }, + { + "epoch": 1.88, + "learning_rate": 6.420677992228e-07, + "loss": 0.6831, + "step": 73509 + }, + { + "epoch": 1.88, + "learning_rate": 6.420419621405182e-07, + "loss": 0.5408, + "step": 73510 + }, + { + "epoch": 1.88, + "learning_rate": 6.420161253323084e-07, + "loss": 0.5663, + "step": 73511 + }, + { + "epoch": 1.88, + "learning_rate": 6.419902887981903e-07, + "loss": 0.6553, + "step": 73512 + }, + { + "epoch": 1.88, + "learning_rate": 6.419644525381837e-07, + "loss": 0.71, + "step": 73513 + }, + { + "epoch": 1.88, + "learning_rate": 6.419386165523084e-07, + "loss": 0.5161, + "step": 73514 + }, + { + "epoch": 1.88, + "learning_rate": 6.419127808405844e-07, + "loss": 0.6621, + "step": 73515 + }, + { + "epoch": 1.88, + "learning_rate": 6.418869454030311e-07, + "loss": 0.709, + "step": 73516 + }, + { + "epoch": 1.88, + "learning_rate": 6.418611102396687e-07, + "loss": 0.6416, + "step": 73517 + }, + { + "epoch": 1.88, + "learning_rate": 6.418352753505167e-07, + "loss": 0.7061, + "step": 73518 + }, + { + "epoch": 1.88, + "learning_rate": 6.418094407355949e-07, + "loss": 0.665, + "step": 73519 + }, + { + "epoch": 1.88, + "learning_rate": 6.417836063949235e-07, + "loss": 0.6445, + "step": 73520 + }, + { + "epoch": 1.88, + "learning_rate": 6.417577723285219e-07, + "loss": 0.6924, + "step": 73521 + }, + { + "epoch": 1.88, + "learning_rate": 6.417319385364095e-07, + "loss": 0.6455, + "step": 73522 + }, + { + "epoch": 1.88, + "learning_rate": 6.417061050186068e-07, + "loss": 0.4741, + "step": 73523 + }, + { + "epoch": 1.88, + "learning_rate": 6.416802717751328e-07, + "loss": 0.7803, + "step": 73524 + }, + { + "epoch": 1.88, + "learning_rate": 6.416544388060081e-07, + "loss": 0.6255, + "step": 73525 + }, + { + "epoch": 1.88, + "learning_rate": 6.41628606111252e-07, + "loss": 0.5625, + "step": 73526 + }, + { + "epoch": 1.88, + "learning_rate": 6.416027736908846e-07, + "loss": 0.6523, + "step": 73527 + }, + { + "epoch": 1.88, + "learning_rate": 6.415769415449251e-07, + "loss": 0.6938, + "step": 73528 + }, + { + "epoch": 1.88, + "learning_rate": 6.41551109673394e-07, + "loss": 0.7314, + "step": 73529 + }, + { + "epoch": 1.88, + "learning_rate": 6.415252780763105e-07, + "loss": 0.3878, + "step": 73530 + }, + { + "epoch": 1.88, + "learning_rate": 6.414994467536949e-07, + "loss": 0.5786, + "step": 73531 + }, + { + "epoch": 1.88, + "learning_rate": 6.414736157055667e-07, + "loss": 0.832, + "step": 73532 + }, + { + "epoch": 1.88, + "learning_rate": 6.414477849319453e-07, + "loss": 0.5424, + "step": 73533 + }, + { + "epoch": 1.88, + "learning_rate": 6.414219544328512e-07, + "loss": 0.4399, + "step": 73534 + }, + { + "epoch": 1.88, + "learning_rate": 6.413961242083034e-07, + "loss": 0.5684, + "step": 73535 + }, + { + "epoch": 1.88, + "learning_rate": 6.413702942583225e-07, + "loss": 0.709, + "step": 73536 + }, + { + "epoch": 1.88, + "learning_rate": 6.413444645829278e-07, + "loss": 0.4976, + "step": 73537 + }, + { + "epoch": 1.88, + "learning_rate": 6.413186351821389e-07, + "loss": 0.6963, + "step": 73538 + }, + { + "epoch": 1.88, + "learning_rate": 6.412928060559761e-07, + "loss": 0.4893, + "step": 73539 + }, + { + "epoch": 1.88, + "learning_rate": 6.412669772044588e-07, + "loss": 0.5869, + "step": 73540 + }, + { + "epoch": 1.88, + "learning_rate": 6.41241148627607e-07, + "loss": 0.5237, + "step": 73541 + }, + { + "epoch": 1.88, + "learning_rate": 6.412153203254404e-07, + "loss": 0.6982, + "step": 73542 + }, + { + "epoch": 1.88, + "learning_rate": 6.411894922979785e-07, + "loss": 0.7114, + "step": 73543 + }, + { + "epoch": 1.88, + "learning_rate": 6.411636645452414e-07, + "loss": 0.429, + "step": 73544 + }, + { + "epoch": 1.88, + "learning_rate": 6.411378370672486e-07, + "loss": 0.7998, + "step": 73545 + }, + { + "epoch": 1.89, + "learning_rate": 6.411120098640203e-07, + "loss": 0.5688, + "step": 73546 + }, + { + "epoch": 1.89, + "learning_rate": 6.410861829355759e-07, + "loss": 0.438, + "step": 73547 + }, + { + "epoch": 1.89, + "learning_rate": 6.410603562819354e-07, + "loss": 0.6123, + "step": 73548 + }, + { + "epoch": 1.89, + "learning_rate": 6.410345299031184e-07, + "loss": 0.6782, + "step": 73549 + }, + { + "epoch": 1.89, + "learning_rate": 6.410087037991449e-07, + "loss": 0.7197, + "step": 73550 + }, + { + "epoch": 1.89, + "learning_rate": 6.409828779700346e-07, + "loss": 0.6934, + "step": 73551 + }, + { + "epoch": 1.89, + "learning_rate": 6.40957052415807e-07, + "loss": 0.5889, + "step": 73552 + }, + { + "epoch": 1.89, + "learning_rate": 6.409312271364822e-07, + "loss": 0.5107, + "step": 73553 + }, + { + "epoch": 1.89, + "learning_rate": 6.409054021320797e-07, + "loss": 0.5576, + "step": 73554 + }, + { + "epoch": 1.89, + "learning_rate": 6.408795774026194e-07, + "loss": 0.749, + "step": 73555 + }, + { + "epoch": 1.89, + "learning_rate": 6.408537529481213e-07, + "loss": 0.6968, + "step": 73556 + }, + { + "epoch": 1.89, + "learning_rate": 6.408279287686047e-07, + "loss": 0.5166, + "step": 73557 + }, + { + "epoch": 1.89, + "learning_rate": 6.408021048640899e-07, + "loss": 0.5532, + "step": 73558 + }, + { + "epoch": 1.89, + "learning_rate": 6.407762812345962e-07, + "loss": 0.5825, + "step": 73559 + }, + { + "epoch": 1.89, + "learning_rate": 6.407504578801437e-07, + "loss": 0.6768, + "step": 73560 + }, + { + "epoch": 1.89, + "learning_rate": 6.407246348007522e-07, + "loss": 0.7158, + "step": 73561 + }, + { + "epoch": 1.89, + "learning_rate": 6.406988119964412e-07, + "loss": 0.4843, + "step": 73562 + }, + { + "epoch": 1.89, + "learning_rate": 6.406729894672306e-07, + "loss": 0.6748, + "step": 73563 + }, + { + "epoch": 1.89, + "learning_rate": 6.406471672131399e-07, + "loss": 0.6816, + "step": 73564 + }, + { + "epoch": 1.89, + "learning_rate": 6.406213452341896e-07, + "loss": 0.6421, + "step": 73565 + }, + { + "epoch": 1.89, + "learning_rate": 6.405955235303986e-07, + "loss": 0.6963, + "step": 73566 + }, + { + "epoch": 1.89, + "learning_rate": 6.405697021017873e-07, + "loss": 0.6035, + "step": 73567 + }, + { + "epoch": 1.89, + "learning_rate": 6.405438809483751e-07, + "loss": 0.7598, + "step": 73568 + }, + { + "epoch": 1.89, + "learning_rate": 6.405180600701821e-07, + "loss": 0.6665, + "step": 73569 + }, + { + "epoch": 1.89, + "learning_rate": 6.404922394672277e-07, + "loss": 0.6787, + "step": 73570 + }, + { + "epoch": 1.89, + "learning_rate": 6.404664191395325e-07, + "loss": 0.6865, + "step": 73571 + }, + { + "epoch": 1.89, + "learning_rate": 6.404405990871149e-07, + "loss": 0.4917, + "step": 73572 + }, + { + "epoch": 1.89, + "learning_rate": 6.404147793099957e-07, + "loss": 0.5801, + "step": 73573 + }, + { + "epoch": 1.89, + "learning_rate": 6.403889598081942e-07, + "loss": 0.418, + "step": 73574 + }, + { + "epoch": 1.89, + "learning_rate": 6.403631405817304e-07, + "loss": 0.6836, + "step": 73575 + }, + { + "epoch": 1.89, + "learning_rate": 6.403373216306241e-07, + "loss": 0.4673, + "step": 73576 + }, + { + "epoch": 1.89, + "learning_rate": 6.403115029548949e-07, + "loss": 0.6963, + "step": 73577 + }, + { + "epoch": 1.89, + "learning_rate": 6.402856845545625e-07, + "loss": 0.6611, + "step": 73578 + }, + { + "epoch": 1.89, + "learning_rate": 6.40259866429647e-07, + "loss": 0.5957, + "step": 73579 + }, + { + "epoch": 1.89, + "learning_rate": 6.402340485801678e-07, + "loss": 0.5151, + "step": 73580 + }, + { + "epoch": 1.89, + "learning_rate": 6.402082310061454e-07, + "loss": 0.6758, + "step": 73581 + }, + { + "epoch": 1.89, + "learning_rate": 6.401824137075986e-07, + "loss": 0.6929, + "step": 73582 + }, + { + "epoch": 1.89, + "learning_rate": 6.401565966845475e-07, + "loss": 0.6035, + "step": 73583 + }, + { + "epoch": 1.89, + "learning_rate": 6.401307799370122e-07, + "loss": 0.6016, + "step": 73584 + }, + { + "epoch": 1.89, + "learning_rate": 6.401049634650118e-07, + "loss": 0.6055, + "step": 73585 + }, + { + "epoch": 1.89, + "learning_rate": 6.400791472685668e-07, + "loss": 0.6387, + "step": 73586 + }, + { + "epoch": 1.89, + "learning_rate": 6.400533313476965e-07, + "loss": 0.6392, + "step": 73587 + }, + { + "epoch": 1.89, + "learning_rate": 6.400275157024209e-07, + "loss": 0.8164, + "step": 73588 + }, + { + "epoch": 1.89, + "learning_rate": 6.400017003327596e-07, + "loss": 0.5835, + "step": 73589 + }, + { + "epoch": 1.89, + "learning_rate": 6.399758852387329e-07, + "loss": 0.7314, + "step": 73590 + }, + { + "epoch": 1.89, + "learning_rate": 6.399500704203596e-07, + "loss": 0.7412, + "step": 73591 + }, + { + "epoch": 1.89, + "learning_rate": 6.399242558776603e-07, + "loss": 0.6475, + "step": 73592 + }, + { + "epoch": 1.89, + "learning_rate": 6.398984416106541e-07, + "loss": 0.6318, + "step": 73593 + }, + { + "epoch": 1.89, + "learning_rate": 6.398726276193613e-07, + "loss": 0.6387, + "step": 73594 + }, + { + "epoch": 1.89, + "learning_rate": 6.398468139038013e-07, + "loss": 0.6218, + "step": 73595 + }, + { + "epoch": 1.89, + "learning_rate": 6.398210004639941e-07, + "loss": 0.7305, + "step": 73596 + }, + { + "epoch": 1.89, + "learning_rate": 6.397951872999594e-07, + "loss": 0.667, + "step": 73597 + }, + { + "epoch": 1.89, + "learning_rate": 6.397693744117171e-07, + "loss": 0.6235, + "step": 73598 + }, + { + "epoch": 1.89, + "learning_rate": 6.397435617992866e-07, + "loss": 0.7114, + "step": 73599 + }, + { + "epoch": 1.89, + "learning_rate": 6.397177494626883e-07, + "loss": 0.4692, + "step": 73600 + }, + { + "epoch": 1.89, + "learning_rate": 6.396919374019413e-07, + "loss": 0.5654, + "step": 73601 + }, + { + "epoch": 1.89, + "learning_rate": 6.396661256170654e-07, + "loss": 0.5991, + "step": 73602 + }, + { + "epoch": 1.89, + "learning_rate": 6.39640314108081e-07, + "loss": 0.5547, + "step": 73603 + }, + { + "epoch": 1.89, + "learning_rate": 6.39614502875007e-07, + "loss": 0.5728, + "step": 73604 + }, + { + "epoch": 1.89, + "learning_rate": 6.395886919178639e-07, + "loss": 0.7979, + "step": 73605 + }, + { + "epoch": 1.89, + "learning_rate": 6.39562881236671e-07, + "loss": 0.7959, + "step": 73606 + }, + { + "epoch": 1.89, + "learning_rate": 6.395370708314485e-07, + "loss": 0.6562, + "step": 73607 + }, + { + "epoch": 1.89, + "learning_rate": 6.395112607022155e-07, + "loss": 0.6562, + "step": 73608 + }, + { + "epoch": 1.89, + "learning_rate": 6.394854508489924e-07, + "loss": 0.5635, + "step": 73609 + }, + { + "epoch": 1.89, + "learning_rate": 6.39459641271799e-07, + "loss": 0.6382, + "step": 73610 + }, + { + "epoch": 1.89, + "learning_rate": 6.394338319706545e-07, + "loss": 0.5308, + "step": 73611 + }, + { + "epoch": 1.89, + "learning_rate": 6.394080229455787e-07, + "loss": 0.5305, + "step": 73612 + }, + { + "epoch": 1.89, + "learning_rate": 6.393822141965919e-07, + "loss": 0.7319, + "step": 73613 + }, + { + "epoch": 1.89, + "learning_rate": 6.393564057237133e-07, + "loss": 0.709, + "step": 73614 + }, + { + "epoch": 1.89, + "learning_rate": 6.393305975269631e-07, + "loss": 0.7148, + "step": 73615 + }, + { + "epoch": 1.89, + "learning_rate": 6.393047896063608e-07, + "loss": 0.6416, + "step": 73616 + }, + { + "epoch": 1.89, + "learning_rate": 6.392789819619262e-07, + "loss": 0.5806, + "step": 73617 + }, + { + "epoch": 1.89, + "learning_rate": 6.392531745936791e-07, + "loss": 0.6069, + "step": 73618 + }, + { + "epoch": 1.89, + "learning_rate": 6.392273675016394e-07, + "loss": 0.6143, + "step": 73619 + }, + { + "epoch": 1.89, + "learning_rate": 6.39201560685827e-07, + "loss": 0.4692, + "step": 73620 + }, + { + "epoch": 1.89, + "learning_rate": 6.391757541462608e-07, + "loss": 0.7344, + "step": 73621 + }, + { + "epoch": 1.89, + "learning_rate": 6.391499478829614e-07, + "loss": 0.6226, + "step": 73622 + }, + { + "epoch": 1.89, + "learning_rate": 6.391241418959481e-07, + "loss": 0.4333, + "step": 73623 + }, + { + "epoch": 1.89, + "learning_rate": 6.390983361852411e-07, + "loss": 0.5469, + "step": 73624 + }, + { + "epoch": 1.89, + "learning_rate": 6.390725307508597e-07, + "loss": 0.5669, + "step": 73625 + }, + { + "epoch": 1.89, + "learning_rate": 6.39046725592824e-07, + "loss": 0.6758, + "step": 73626 + }, + { + "epoch": 1.89, + "learning_rate": 6.390209207111536e-07, + "loss": 0.5576, + "step": 73627 + }, + { + "epoch": 1.89, + "learning_rate": 6.389951161058682e-07, + "loss": 0.7686, + "step": 73628 + }, + { + "epoch": 1.89, + "learning_rate": 6.389693117769879e-07, + "loss": 0.6006, + "step": 73629 + }, + { + "epoch": 1.89, + "learning_rate": 6.389435077245322e-07, + "loss": 0.5332, + "step": 73630 + }, + { + "epoch": 1.89, + "learning_rate": 6.389177039485205e-07, + "loss": 0.3975, + "step": 73631 + }, + { + "epoch": 1.89, + "learning_rate": 6.388919004489732e-07, + "loss": 0.6646, + "step": 73632 + }, + { + "epoch": 1.89, + "learning_rate": 6.388660972259095e-07, + "loss": 0.7729, + "step": 73633 + }, + { + "epoch": 1.89, + "learning_rate": 6.388402942793496e-07, + "loss": 0.6475, + "step": 73634 + }, + { + "epoch": 1.89, + "learning_rate": 6.38814491609313e-07, + "loss": 0.6562, + "step": 73635 + }, + { + "epoch": 1.89, + "learning_rate": 6.387886892158196e-07, + "loss": 0.5815, + "step": 73636 + }, + { + "epoch": 1.89, + "learning_rate": 6.387628870988891e-07, + "loss": 0.3828, + "step": 73637 + }, + { + "epoch": 1.89, + "learning_rate": 6.387370852585412e-07, + "loss": 0.6841, + "step": 73638 + }, + { + "epoch": 1.89, + "learning_rate": 6.387112836947956e-07, + "loss": 0.665, + "step": 73639 + }, + { + "epoch": 1.89, + "learning_rate": 6.386854824076725e-07, + "loss": 0.6338, + "step": 73640 + }, + { + "epoch": 1.89, + "learning_rate": 6.386596813971912e-07, + "loss": 0.6089, + "step": 73641 + }, + { + "epoch": 1.89, + "learning_rate": 6.386338806633713e-07, + "loss": 0.5962, + "step": 73642 + }, + { + "epoch": 1.89, + "learning_rate": 6.38608080206233e-07, + "loss": 0.7041, + "step": 73643 + }, + { + "epoch": 1.89, + "learning_rate": 6.385822800257961e-07, + "loss": 0.603, + "step": 73644 + }, + { + "epoch": 1.89, + "learning_rate": 6.385564801220797e-07, + "loss": 0.5464, + "step": 73645 + }, + { + "epoch": 1.89, + "learning_rate": 6.385306804951043e-07, + "loss": 0.6279, + "step": 73646 + }, + { + "epoch": 1.89, + "learning_rate": 6.385048811448889e-07, + "loss": 0.5083, + "step": 73647 + }, + { + "epoch": 1.89, + "learning_rate": 6.384790820714542e-07, + "loss": 0.7676, + "step": 73648 + }, + { + "epoch": 1.89, + "learning_rate": 6.38453283274819e-07, + "loss": 0.6484, + "step": 73649 + }, + { + "epoch": 1.89, + "learning_rate": 6.384274847550042e-07, + "loss": 0.7627, + "step": 73650 + }, + { + "epoch": 1.89, + "learning_rate": 6.384016865120284e-07, + "loss": 0.6177, + "step": 73651 + }, + { + "epoch": 1.89, + "learning_rate": 6.383758885459117e-07, + "loss": 0.6479, + "step": 73652 + }, + { + "epoch": 1.89, + "learning_rate": 6.383500908566741e-07, + "loss": 0.793, + "step": 73653 + }, + { + "epoch": 1.89, + "learning_rate": 6.38324293444335e-07, + "loss": 0.5723, + "step": 73654 + }, + { + "epoch": 1.89, + "learning_rate": 6.382984963089147e-07, + "loss": 0.625, + "step": 73655 + }, + { + "epoch": 1.89, + "learning_rate": 6.382726994504322e-07, + "loss": 0.6299, + "step": 73656 + }, + { + "epoch": 1.89, + "learning_rate": 6.38246902868908e-07, + "loss": 0.6797, + "step": 73657 + }, + { + "epoch": 1.89, + "learning_rate": 6.382211065643612e-07, + "loss": 0.6484, + "step": 73658 + }, + { + "epoch": 1.89, + "learning_rate": 6.381953105368121e-07, + "loss": 0.5947, + "step": 73659 + }, + { + "epoch": 1.89, + "learning_rate": 6.381695147862805e-07, + "loss": 0.6582, + "step": 73660 + }, + { + "epoch": 1.89, + "learning_rate": 6.381437193127856e-07, + "loss": 0.7734, + "step": 73661 + }, + { + "epoch": 1.89, + "learning_rate": 6.381179241163473e-07, + "loss": 0.5789, + "step": 73662 + }, + { + "epoch": 1.89, + "learning_rate": 6.380921291969856e-07, + "loss": 0.624, + "step": 73663 + }, + { + "epoch": 1.89, + "learning_rate": 6.380663345547199e-07, + "loss": 0.7578, + "step": 73664 + }, + { + "epoch": 1.89, + "learning_rate": 6.380405401895703e-07, + "loss": 0.6855, + "step": 73665 + }, + { + "epoch": 1.89, + "learning_rate": 6.380147461015564e-07, + "loss": 0.7061, + "step": 73666 + }, + { + "epoch": 1.89, + "learning_rate": 6.379889522906979e-07, + "loss": 0.451, + "step": 73667 + }, + { + "epoch": 1.89, + "learning_rate": 6.379631587570147e-07, + "loss": 0.7793, + "step": 73668 + }, + { + "epoch": 1.89, + "learning_rate": 6.379373655005265e-07, + "loss": 0.7222, + "step": 73669 + }, + { + "epoch": 1.89, + "learning_rate": 6.379115725212532e-07, + "loss": 0.5112, + "step": 73670 + }, + { + "epoch": 1.89, + "learning_rate": 6.37885779819214e-07, + "loss": 0.6201, + "step": 73671 + }, + { + "epoch": 1.89, + "learning_rate": 6.378599873944292e-07, + "loss": 0.8799, + "step": 73672 + }, + { + "epoch": 1.89, + "learning_rate": 6.378341952469182e-07, + "loss": 0.749, + "step": 73673 + }, + { + "epoch": 1.89, + "learning_rate": 6.37808403376701e-07, + "loss": 0.7236, + "step": 73674 + }, + { + "epoch": 1.89, + "learning_rate": 6.377826117837973e-07, + "loss": 0.6538, + "step": 73675 + }, + { + "epoch": 1.89, + "learning_rate": 6.377568204682267e-07, + "loss": 0.5908, + "step": 73676 + }, + { + "epoch": 1.89, + "learning_rate": 6.377310294300089e-07, + "loss": 0.6914, + "step": 73677 + }, + { + "epoch": 1.89, + "learning_rate": 6.377052386691642e-07, + "loss": 0.6489, + "step": 73678 + }, + { + "epoch": 1.89, + "learning_rate": 6.376794481857115e-07, + "loss": 0.5718, + "step": 73679 + }, + { + "epoch": 1.89, + "learning_rate": 6.376536579796716e-07, + "loss": 0.6001, + "step": 73680 + }, + { + "epoch": 1.89, + "learning_rate": 6.376278680510632e-07, + "loss": 0.5786, + "step": 73681 + }, + { + "epoch": 1.89, + "learning_rate": 6.376020783999066e-07, + "loss": 0.5923, + "step": 73682 + }, + { + "epoch": 1.89, + "learning_rate": 6.375762890262213e-07, + "loss": 0.7354, + "step": 73683 + }, + { + "epoch": 1.89, + "learning_rate": 6.375504999300272e-07, + "loss": 0.5649, + "step": 73684 + }, + { + "epoch": 1.89, + "learning_rate": 6.37524711111344e-07, + "loss": 0.6343, + "step": 73685 + }, + { + "epoch": 1.89, + "learning_rate": 6.374989225701915e-07, + "loss": 0.7256, + "step": 73686 + }, + { + "epoch": 1.89, + "learning_rate": 6.374731343065893e-07, + "loss": 0.5898, + "step": 73687 + }, + { + "epoch": 1.89, + "learning_rate": 6.374473463205574e-07, + "loss": 0.5588, + "step": 73688 + }, + { + "epoch": 1.89, + "learning_rate": 6.374215586121152e-07, + "loss": 0.8115, + "step": 73689 + }, + { + "epoch": 1.89, + "learning_rate": 6.373957711812832e-07, + "loss": 0.6416, + "step": 73690 + }, + { + "epoch": 1.89, + "learning_rate": 6.373699840280802e-07, + "loss": 0.6992, + "step": 73691 + }, + { + "epoch": 1.89, + "learning_rate": 6.373441971525262e-07, + "loss": 0.6855, + "step": 73692 + }, + { + "epoch": 1.89, + "learning_rate": 6.373184105546412e-07, + "loss": 0.6284, + "step": 73693 + }, + { + "epoch": 1.89, + "learning_rate": 6.372926242344447e-07, + "loss": 0.7148, + "step": 73694 + }, + { + "epoch": 1.89, + "learning_rate": 6.372668381919567e-07, + "loss": 0.5645, + "step": 73695 + }, + { + "epoch": 1.89, + "learning_rate": 6.372410524271966e-07, + "loss": 0.5354, + "step": 73696 + }, + { + "epoch": 1.89, + "learning_rate": 6.372152669401847e-07, + "loss": 0.6685, + "step": 73697 + }, + { + "epoch": 1.89, + "learning_rate": 6.3718948173094e-07, + "loss": 0.6553, + "step": 73698 + }, + { + "epoch": 1.89, + "learning_rate": 6.371636967994829e-07, + "loss": 0.6611, + "step": 73699 + }, + { + "epoch": 1.89, + "learning_rate": 6.371379121458331e-07, + "loss": 0.437, + "step": 73700 + }, + { + "epoch": 1.89, + "learning_rate": 6.371121277700098e-07, + "loss": 0.4724, + "step": 73701 + }, + { + "epoch": 1.89, + "learning_rate": 6.370863436720331e-07, + "loss": 0.4368, + "step": 73702 + }, + { + "epoch": 1.89, + "learning_rate": 6.370605598519226e-07, + "loss": 0.6772, + "step": 73703 + }, + { + "epoch": 1.89, + "learning_rate": 6.370347763096982e-07, + "loss": 0.6504, + "step": 73704 + }, + { + "epoch": 1.89, + "learning_rate": 6.370089930453796e-07, + "loss": 0.4858, + "step": 73705 + }, + { + "epoch": 1.89, + "learning_rate": 6.369832100589864e-07, + "loss": 0.666, + "step": 73706 + }, + { + "epoch": 1.89, + "learning_rate": 6.369574273505387e-07, + "loss": 0.5869, + "step": 73707 + }, + { + "epoch": 1.89, + "learning_rate": 6.369316449200557e-07, + "loss": 0.7129, + "step": 73708 + }, + { + "epoch": 1.89, + "learning_rate": 6.369058627675576e-07, + "loss": 0.7207, + "step": 73709 + }, + { + "epoch": 1.89, + "learning_rate": 6.368800808930644e-07, + "loss": 0.6011, + "step": 73710 + }, + { + "epoch": 1.89, + "learning_rate": 6.368542992965949e-07, + "loss": 0.6763, + "step": 73711 + }, + { + "epoch": 1.89, + "learning_rate": 6.368285179781696e-07, + "loss": 0.7129, + "step": 73712 + }, + { + "epoch": 1.89, + "learning_rate": 6.368027369378077e-07, + "loss": 0.5898, + "step": 73713 + }, + { + "epoch": 1.89, + "learning_rate": 6.367769561755296e-07, + "loss": 0.7764, + "step": 73714 + }, + { + "epoch": 1.89, + "learning_rate": 6.367511756913544e-07, + "loss": 0.5825, + "step": 73715 + }, + { + "epoch": 1.89, + "learning_rate": 6.367253954853023e-07, + "loss": 0.6387, + "step": 73716 + }, + { + "epoch": 1.89, + "learning_rate": 6.36699615557393e-07, + "loss": 0.5029, + "step": 73717 + }, + { + "epoch": 1.89, + "learning_rate": 6.366738359076458e-07, + "loss": 0.5437, + "step": 73718 + }, + { + "epoch": 1.89, + "learning_rate": 6.366480565360809e-07, + "loss": 0.5083, + "step": 73719 + }, + { + "epoch": 1.89, + "learning_rate": 6.366222774427182e-07, + "loss": 0.479, + "step": 73720 + }, + { + "epoch": 1.89, + "learning_rate": 6.365964986275764e-07, + "loss": 0.6963, + "step": 73721 + }, + { + "epoch": 1.89, + "learning_rate": 6.365707200906765e-07, + "loss": 0.4619, + "step": 73722 + }, + { + "epoch": 1.89, + "learning_rate": 6.365449418320374e-07, + "loss": 0.7773, + "step": 73723 + }, + { + "epoch": 1.89, + "learning_rate": 6.365191638516793e-07, + "loss": 0.585, + "step": 73724 + }, + { + "epoch": 1.89, + "learning_rate": 6.364933861496216e-07, + "loss": 0.6475, + "step": 73725 + }, + { + "epoch": 1.89, + "learning_rate": 6.364676087258842e-07, + "loss": 0.7168, + "step": 73726 + }, + { + "epoch": 1.89, + "learning_rate": 6.364418315804869e-07, + "loss": 0.7222, + "step": 73727 + }, + { + "epoch": 1.89, + "learning_rate": 6.364160547134493e-07, + "loss": 0.5361, + "step": 73728 + }, + { + "epoch": 1.89, + "learning_rate": 6.363902781247913e-07, + "loss": 0.6572, + "step": 73729 + }, + { + "epoch": 1.89, + "learning_rate": 6.363645018145329e-07, + "loss": 0.6982, + "step": 73730 + }, + { + "epoch": 1.89, + "learning_rate": 6.363387257826931e-07, + "loss": 0.5811, + "step": 73731 + }, + { + "epoch": 1.89, + "learning_rate": 6.363129500292919e-07, + "loss": 0.4814, + "step": 73732 + }, + { + "epoch": 1.89, + "learning_rate": 6.362871745543494e-07, + "loss": 0.5576, + "step": 73733 + }, + { + "epoch": 1.89, + "learning_rate": 6.362613993578851e-07, + "loss": 0.7012, + "step": 73734 + }, + { + "epoch": 1.89, + "learning_rate": 6.362356244399184e-07, + "loss": 0.6475, + "step": 73735 + }, + { + "epoch": 1.89, + "learning_rate": 6.362098498004696e-07, + "loss": 0.6504, + "step": 73736 + }, + { + "epoch": 1.89, + "learning_rate": 6.36184075439558e-07, + "loss": 0.4807, + "step": 73737 + }, + { + "epoch": 1.89, + "learning_rate": 6.361583013572038e-07, + "loss": 0.6396, + "step": 73738 + }, + { + "epoch": 1.89, + "learning_rate": 6.361325275534262e-07, + "loss": 0.6011, + "step": 73739 + }, + { + "epoch": 1.89, + "learning_rate": 6.361067540282457e-07, + "loss": 0.752, + "step": 73740 + }, + { + "epoch": 1.89, + "learning_rate": 6.360809807816811e-07, + "loss": 0.665, + "step": 73741 + }, + { + "epoch": 1.89, + "learning_rate": 6.360552078137525e-07, + "loss": 0.7324, + "step": 73742 + }, + { + "epoch": 1.89, + "learning_rate": 6.360294351244799e-07, + "loss": 0.6089, + "step": 73743 + }, + { + "epoch": 1.89, + "learning_rate": 6.360036627138825e-07, + "loss": 0.6196, + "step": 73744 + }, + { + "epoch": 1.89, + "learning_rate": 6.359778905819808e-07, + "loss": 0.5337, + "step": 73745 + }, + { + "epoch": 1.89, + "learning_rate": 6.359521187287937e-07, + "loss": 0.6885, + "step": 73746 + }, + { + "epoch": 1.89, + "learning_rate": 6.359263471543415e-07, + "loss": 0.7007, + "step": 73747 + }, + { + "epoch": 1.89, + "learning_rate": 6.359005758586436e-07, + "loss": 0.709, + "step": 73748 + }, + { + "epoch": 1.89, + "learning_rate": 6.358748048417201e-07, + "loss": 0.6211, + "step": 73749 + }, + { + "epoch": 1.89, + "learning_rate": 6.358490341035908e-07, + "loss": 0.7773, + "step": 73750 + }, + { + "epoch": 1.89, + "learning_rate": 6.358232636442749e-07, + "loss": 0.5967, + "step": 73751 + }, + { + "epoch": 1.89, + "learning_rate": 6.357974934637922e-07, + "loss": 0.541, + "step": 73752 + }, + { + "epoch": 1.89, + "learning_rate": 6.357717235621627e-07, + "loss": 0.6172, + "step": 73753 + }, + { + "epoch": 1.89, + "learning_rate": 6.357459539394059e-07, + "loss": 0.6846, + "step": 73754 + }, + { + "epoch": 1.89, + "learning_rate": 6.35720184595542e-07, + "loss": 0.2909, + "step": 73755 + }, + { + "epoch": 1.89, + "learning_rate": 6.356944155305901e-07, + "loss": 0.5, + "step": 73756 + }, + { + "epoch": 1.89, + "learning_rate": 6.356686467445704e-07, + "loss": 0.6875, + "step": 73757 + }, + { + "epoch": 1.89, + "learning_rate": 6.356428782375023e-07, + "loss": 0.6914, + "step": 73758 + }, + { + "epoch": 1.89, + "learning_rate": 6.356171100094059e-07, + "loss": 0.7373, + "step": 73759 + }, + { + "epoch": 1.89, + "learning_rate": 6.35591342060301e-07, + "loss": 0.3826, + "step": 73760 + }, + { + "epoch": 1.89, + "learning_rate": 6.355655743902064e-07, + "loss": 0.791, + "step": 73761 + }, + { + "epoch": 1.89, + "learning_rate": 6.355398069991429e-07, + "loss": 0.5856, + "step": 73762 + }, + { + "epoch": 1.89, + "learning_rate": 6.355140398871296e-07, + "loss": 0.5254, + "step": 73763 + }, + { + "epoch": 1.89, + "learning_rate": 6.354882730541866e-07, + "loss": 0.5813, + "step": 73764 + }, + { + "epoch": 1.89, + "learning_rate": 6.354625065003333e-07, + "loss": 0.6392, + "step": 73765 + }, + { + "epoch": 1.89, + "learning_rate": 6.354367402255898e-07, + "loss": 0.7705, + "step": 73766 + }, + { + "epoch": 1.89, + "learning_rate": 6.354109742299754e-07, + "loss": 0.6445, + "step": 73767 + }, + { + "epoch": 1.89, + "learning_rate": 6.353852085135101e-07, + "loss": 0.665, + "step": 73768 + }, + { + "epoch": 1.89, + "learning_rate": 6.353594430762137e-07, + "loss": 0.6436, + "step": 73769 + }, + { + "epoch": 1.89, + "learning_rate": 6.353336779181062e-07, + "loss": 0.7339, + "step": 73770 + }, + { + "epoch": 1.89, + "learning_rate": 6.353079130392063e-07, + "loss": 0.7598, + "step": 73771 + }, + { + "epoch": 1.89, + "learning_rate": 6.352821484395346e-07, + "loss": 0.5432, + "step": 73772 + }, + { + "epoch": 1.89, + "learning_rate": 6.352563841191106e-07, + "loss": 0.666, + "step": 73773 + }, + { + "epoch": 1.89, + "learning_rate": 6.352306200779539e-07, + "loss": 0.5923, + "step": 73774 + }, + { + "epoch": 1.89, + "learning_rate": 6.352048563160843e-07, + "loss": 0.593, + "step": 73775 + }, + { + "epoch": 1.89, + "learning_rate": 6.351790928335218e-07, + "loss": 0.4641, + "step": 73776 + }, + { + "epoch": 1.89, + "learning_rate": 6.351533296302856e-07, + "loss": 0.4824, + "step": 73777 + }, + { + "epoch": 1.89, + "learning_rate": 6.35127566706396e-07, + "loss": 0.5762, + "step": 73778 + }, + { + "epoch": 1.89, + "learning_rate": 6.351018040618721e-07, + "loss": 0.7275, + "step": 73779 + }, + { + "epoch": 1.89, + "learning_rate": 6.350760416967346e-07, + "loss": 0.6494, + "step": 73780 + }, + { + "epoch": 1.89, + "learning_rate": 6.350502796110023e-07, + "loss": 0.8096, + "step": 73781 + }, + { + "epoch": 1.89, + "learning_rate": 6.350245178046949e-07, + "loss": 0.7246, + "step": 73782 + }, + { + "epoch": 1.89, + "learning_rate": 6.349987562778327e-07, + "loss": 0.5757, + "step": 73783 + }, + { + "epoch": 1.89, + "learning_rate": 6.34972995030435e-07, + "loss": 0.5244, + "step": 73784 + }, + { + "epoch": 1.89, + "learning_rate": 6.349472340625219e-07, + "loss": 0.6611, + "step": 73785 + }, + { + "epoch": 1.89, + "learning_rate": 6.349214733741129e-07, + "loss": 0.5732, + "step": 73786 + }, + { + "epoch": 1.89, + "learning_rate": 6.348957129652277e-07, + "loss": 0.644, + "step": 73787 + }, + { + "epoch": 1.89, + "learning_rate": 6.348699528358859e-07, + "loss": 0.6353, + "step": 73788 + }, + { + "epoch": 1.89, + "learning_rate": 6.348441929861074e-07, + "loss": 0.6543, + "step": 73789 + }, + { + "epoch": 1.89, + "learning_rate": 6.348184334159124e-07, + "loss": 0.4268, + "step": 73790 + }, + { + "epoch": 1.89, + "learning_rate": 6.347926741253201e-07, + "loss": 0.6484, + "step": 73791 + }, + { + "epoch": 1.89, + "learning_rate": 6.347669151143497e-07, + "loss": 0.7002, + "step": 73792 + }, + { + "epoch": 1.89, + "learning_rate": 6.347411563830218e-07, + "loss": 0.7627, + "step": 73793 + }, + { + "epoch": 1.89, + "learning_rate": 6.347153979313555e-07, + "loss": 0.6025, + "step": 73794 + }, + { + "epoch": 1.89, + "learning_rate": 6.346896397593711e-07, + "loss": 0.4805, + "step": 73795 + }, + { + "epoch": 1.89, + "learning_rate": 6.346638818670879e-07, + "loss": 0.6992, + "step": 73796 + }, + { + "epoch": 1.89, + "learning_rate": 6.34638124254526e-07, + "loss": 0.7334, + "step": 73797 + }, + { + "epoch": 1.89, + "learning_rate": 6.346123669217045e-07, + "loss": 0.5938, + "step": 73798 + }, + { + "epoch": 1.89, + "learning_rate": 6.345866098686439e-07, + "loss": 0.6787, + "step": 73799 + }, + { + "epoch": 1.89, + "learning_rate": 6.345608530953636e-07, + "loss": 0.5994, + "step": 73800 + }, + { + "epoch": 1.89, + "learning_rate": 6.345350966018829e-07, + "loss": 0.6694, + "step": 73801 + }, + { + "epoch": 1.89, + "learning_rate": 6.345093403882221e-07, + "loss": 0.5767, + "step": 73802 + }, + { + "epoch": 1.89, + "learning_rate": 6.344835844544005e-07, + "loss": 0.624, + "step": 73803 + }, + { + "epoch": 1.89, + "learning_rate": 6.344578288004382e-07, + "loss": 0.5693, + "step": 73804 + }, + { + "epoch": 1.89, + "learning_rate": 6.344320734263546e-07, + "loss": 0.6042, + "step": 73805 + }, + { + "epoch": 1.89, + "learning_rate": 6.344063183321695e-07, + "loss": 0.5977, + "step": 73806 + }, + { + "epoch": 1.89, + "learning_rate": 6.34380563517903e-07, + "loss": 0.4648, + "step": 73807 + }, + { + "epoch": 1.89, + "learning_rate": 6.34354808983574e-07, + "loss": 0.6016, + "step": 73808 + }, + { + "epoch": 1.89, + "learning_rate": 6.343290547292031e-07, + "loss": 0.5186, + "step": 73809 + }, + { + "epoch": 1.89, + "learning_rate": 6.343033007548097e-07, + "loss": 0.6592, + "step": 73810 + }, + { + "epoch": 1.89, + "learning_rate": 6.342775470604131e-07, + "loss": 0.7148, + "step": 73811 + }, + { + "epoch": 1.89, + "learning_rate": 6.342517936460337e-07, + "loss": 0.5376, + "step": 73812 + }, + { + "epoch": 1.89, + "learning_rate": 6.342260405116906e-07, + "loss": 0.6753, + "step": 73813 + }, + { + "epoch": 1.89, + "learning_rate": 6.34200287657404e-07, + "loss": 0.667, + "step": 73814 + }, + { + "epoch": 1.89, + "learning_rate": 6.341745350831931e-07, + "loss": 0.7607, + "step": 73815 + }, + { + "epoch": 1.89, + "learning_rate": 6.341487827890782e-07, + "loss": 0.6743, + "step": 73816 + }, + { + "epoch": 1.89, + "learning_rate": 6.341230307750787e-07, + "loss": 0.563, + "step": 73817 + }, + { + "epoch": 1.89, + "learning_rate": 6.340972790412144e-07, + "loss": 0.6533, + "step": 73818 + }, + { + "epoch": 1.89, + "learning_rate": 6.340715275875049e-07, + "loss": 0.5505, + "step": 73819 + }, + { + "epoch": 1.89, + "learning_rate": 6.340457764139703e-07, + "loss": 0.5728, + "step": 73820 + }, + { + "epoch": 1.89, + "learning_rate": 6.340200255206299e-07, + "loss": 0.5889, + "step": 73821 + }, + { + "epoch": 1.89, + "learning_rate": 6.339942749075032e-07, + "loss": 0.6104, + "step": 73822 + }, + { + "epoch": 1.89, + "learning_rate": 6.339685245746106e-07, + "loss": 0.5894, + "step": 73823 + }, + { + "epoch": 1.89, + "learning_rate": 6.339427745219714e-07, + "loss": 0.5869, + "step": 73824 + }, + { + "epoch": 1.89, + "learning_rate": 6.339170247496053e-07, + "loss": 0.6099, + "step": 73825 + }, + { + "epoch": 1.89, + "learning_rate": 6.338912752575322e-07, + "loss": 0.6069, + "step": 73826 + }, + { + "epoch": 1.89, + "learning_rate": 6.338655260457715e-07, + "loss": 0.7168, + "step": 73827 + }, + { + "epoch": 1.89, + "learning_rate": 6.338397771143434e-07, + "loss": 0.6492, + "step": 73828 + }, + { + "epoch": 1.89, + "learning_rate": 6.338140284632671e-07, + "loss": 0.5469, + "step": 73829 + }, + { + "epoch": 1.89, + "learning_rate": 6.337882800925629e-07, + "loss": 0.7627, + "step": 73830 + }, + { + "epoch": 1.89, + "learning_rate": 6.337625320022501e-07, + "loss": 0.5396, + "step": 73831 + }, + { + "epoch": 1.89, + "learning_rate": 6.337367841923483e-07, + "loss": 0.7041, + "step": 73832 + }, + { + "epoch": 1.89, + "learning_rate": 6.337110366628775e-07, + "loss": 0.7188, + "step": 73833 + }, + { + "epoch": 1.89, + "learning_rate": 6.336852894138571e-07, + "loss": 0.5469, + "step": 73834 + }, + { + "epoch": 1.89, + "learning_rate": 6.336595424453073e-07, + "loss": 0.5039, + "step": 73835 + }, + { + "epoch": 1.89, + "learning_rate": 6.336337957572474e-07, + "loss": 0.6992, + "step": 73836 + }, + { + "epoch": 1.89, + "learning_rate": 6.336080493496974e-07, + "loss": 0.5503, + "step": 73837 + }, + { + "epoch": 1.89, + "learning_rate": 6.335823032226766e-07, + "loss": 0.5317, + "step": 73838 + }, + { + "epoch": 1.89, + "learning_rate": 6.335565573762053e-07, + "loss": 0.7383, + "step": 73839 + }, + { + "epoch": 1.89, + "learning_rate": 6.335308118103031e-07, + "loss": 0.6582, + "step": 73840 + }, + { + "epoch": 1.89, + "learning_rate": 6.335050665249892e-07, + "loss": 0.6514, + "step": 73841 + }, + { + "epoch": 1.89, + "learning_rate": 6.334793215202834e-07, + "loss": 0.6421, + "step": 73842 + }, + { + "epoch": 1.89, + "learning_rate": 6.334535767962059e-07, + "loss": 0.748, + "step": 73843 + }, + { + "epoch": 1.89, + "learning_rate": 6.33427832352776e-07, + "loss": 0.5938, + "step": 73844 + }, + { + "epoch": 1.89, + "learning_rate": 6.334020881900136e-07, + "loss": 0.8506, + "step": 73845 + }, + { + "epoch": 1.89, + "learning_rate": 6.333763443079383e-07, + "loss": 0.709, + "step": 73846 + }, + { + "epoch": 1.89, + "learning_rate": 6.333506007065701e-07, + "loss": 0.666, + "step": 73847 + }, + { + "epoch": 1.89, + "learning_rate": 6.333248573859281e-07, + "loss": 0.6924, + "step": 73848 + }, + { + "epoch": 1.89, + "learning_rate": 6.332991143460327e-07, + "loss": 0.4695, + "step": 73849 + }, + { + "epoch": 1.89, + "learning_rate": 6.332733715869036e-07, + "loss": 0.5908, + "step": 73850 + }, + { + "epoch": 1.89, + "learning_rate": 6.332476291085597e-07, + "loss": 0.6514, + "step": 73851 + }, + { + "epoch": 1.89, + "learning_rate": 6.332218869110215e-07, + "loss": 0.5918, + "step": 73852 + }, + { + "epoch": 1.89, + "learning_rate": 6.331961449943082e-07, + "loss": 0.5569, + "step": 73853 + }, + { + "epoch": 1.89, + "learning_rate": 6.331704033584399e-07, + "loss": 0.6475, + "step": 73854 + }, + { + "epoch": 1.89, + "learning_rate": 6.331446620034359e-07, + "loss": 0.6851, + "step": 73855 + }, + { + "epoch": 1.89, + "learning_rate": 6.331189209293166e-07, + "loss": 0.5962, + "step": 73856 + }, + { + "epoch": 1.89, + "learning_rate": 6.330931801361008e-07, + "loss": 0.6699, + "step": 73857 + }, + { + "epoch": 1.89, + "learning_rate": 6.330674396238091e-07, + "loss": 0.6826, + "step": 73858 + }, + { + "epoch": 1.89, + "learning_rate": 6.330416993924605e-07, + "loss": 0.4995, + "step": 73859 + }, + { + "epoch": 1.89, + "learning_rate": 6.330159594420756e-07, + "loss": 0.6396, + "step": 73860 + }, + { + "epoch": 1.89, + "learning_rate": 6.329902197726729e-07, + "loss": 0.5591, + "step": 73861 + }, + { + "epoch": 1.89, + "learning_rate": 6.329644803842728e-07, + "loss": 0.4783, + "step": 73862 + }, + { + "epoch": 1.89, + "learning_rate": 6.329387412768949e-07, + "loss": 0.5806, + "step": 73863 + }, + { + "epoch": 1.89, + "learning_rate": 6.329130024505591e-07, + "loss": 0.5791, + "step": 73864 + }, + { + "epoch": 1.89, + "learning_rate": 6.328872639052846e-07, + "loss": 0.6543, + "step": 73865 + }, + { + "epoch": 1.89, + "learning_rate": 6.328615256410918e-07, + "loss": 0.5742, + "step": 73866 + }, + { + "epoch": 1.89, + "learning_rate": 6.32835787658e-07, + "loss": 0.667, + "step": 73867 + }, + { + "epoch": 1.89, + "learning_rate": 6.328100499560289e-07, + "loss": 0.4858, + "step": 73868 + }, + { + "epoch": 1.89, + "learning_rate": 6.32784312535198e-07, + "loss": 0.8369, + "step": 73869 + }, + { + "epoch": 1.89, + "learning_rate": 6.327585753955278e-07, + "loss": 0.5728, + "step": 73870 + }, + { + "epoch": 1.89, + "learning_rate": 6.327328385370373e-07, + "loss": 0.5142, + "step": 73871 + }, + { + "epoch": 1.89, + "learning_rate": 6.327071019597461e-07, + "loss": 0.6689, + "step": 73872 + }, + { + "epoch": 1.89, + "learning_rate": 6.326813656636745e-07, + "loss": 0.6221, + "step": 73873 + }, + { + "epoch": 1.89, + "learning_rate": 6.326556296488414e-07, + "loss": 0.5281, + "step": 73874 + }, + { + "epoch": 1.89, + "learning_rate": 6.326298939152675e-07, + "loss": 0.5552, + "step": 73875 + }, + { + "epoch": 1.89, + "learning_rate": 6.326041584629716e-07, + "loss": 0.4291, + "step": 73876 + }, + { + "epoch": 1.89, + "learning_rate": 6.325784232919742e-07, + "loss": 0.4771, + "step": 73877 + }, + { + "epoch": 1.89, + "learning_rate": 6.325526884022943e-07, + "loss": 0.7119, + "step": 73878 + }, + { + "epoch": 1.89, + "learning_rate": 6.325269537939522e-07, + "loss": 0.7188, + "step": 73879 + }, + { + "epoch": 1.89, + "learning_rate": 6.325012194669673e-07, + "loss": 0.6382, + "step": 73880 + }, + { + "epoch": 1.89, + "learning_rate": 6.324754854213592e-07, + "loss": 0.5249, + "step": 73881 + }, + { + "epoch": 1.89, + "learning_rate": 6.324497516571477e-07, + "loss": 0.5852, + "step": 73882 + }, + { + "epoch": 1.89, + "learning_rate": 6.324240181743526e-07, + "loss": 0.6132, + "step": 73883 + }, + { + "epoch": 1.89, + "learning_rate": 6.323982849729932e-07, + "loss": 0.709, + "step": 73884 + }, + { + "epoch": 1.89, + "learning_rate": 6.323725520530898e-07, + "loss": 0.6021, + "step": 73885 + }, + { + "epoch": 1.89, + "learning_rate": 6.323468194146618e-07, + "loss": 0.7979, + "step": 73886 + }, + { + "epoch": 1.89, + "learning_rate": 6.323210870577289e-07, + "loss": 0.4873, + "step": 73887 + }, + { + "epoch": 1.89, + "learning_rate": 6.322953549823109e-07, + "loss": 0.603, + "step": 73888 + }, + { + "epoch": 1.89, + "learning_rate": 6.322696231884277e-07, + "loss": 0.71, + "step": 73889 + }, + { + "epoch": 1.89, + "learning_rate": 6.322438916760985e-07, + "loss": 0.4685, + "step": 73890 + }, + { + "epoch": 1.89, + "learning_rate": 6.32218160445343e-07, + "loss": 0.7881, + "step": 73891 + }, + { + "epoch": 1.89, + "learning_rate": 6.321924294961814e-07, + "loss": 0.4695, + "step": 73892 + }, + { + "epoch": 1.89, + "learning_rate": 6.321666988286329e-07, + "loss": 0.689, + "step": 73893 + }, + { + "epoch": 1.89, + "learning_rate": 6.321409684427178e-07, + "loss": 0.4839, + "step": 73894 + }, + { + "epoch": 1.89, + "learning_rate": 6.321152383384552e-07, + "loss": 0.6729, + "step": 73895 + }, + { + "epoch": 1.89, + "learning_rate": 6.320895085158652e-07, + "loss": 0.6938, + "step": 73896 + }, + { + "epoch": 1.89, + "learning_rate": 6.320637789749673e-07, + "loss": 0.6133, + "step": 73897 + }, + { + "epoch": 1.89, + "learning_rate": 6.320380497157811e-07, + "loss": 0.5525, + "step": 73898 + }, + { + "epoch": 1.89, + "learning_rate": 6.320123207383269e-07, + "loss": 0.647, + "step": 73899 + }, + { + "epoch": 1.89, + "learning_rate": 6.319865920426238e-07, + "loss": 0.7539, + "step": 73900 + }, + { + "epoch": 1.89, + "learning_rate": 6.319608636286912e-07, + "loss": 0.5629, + "step": 73901 + }, + { + "epoch": 1.89, + "learning_rate": 6.319351354965496e-07, + "loss": 0.6201, + "step": 73902 + }, + { + "epoch": 1.89, + "learning_rate": 6.319094076462181e-07, + "loss": 0.564, + "step": 73903 + }, + { + "epoch": 1.89, + "learning_rate": 6.318836800777168e-07, + "loss": 0.6768, + "step": 73904 + }, + { + "epoch": 1.89, + "learning_rate": 6.318579527910651e-07, + "loss": 0.7549, + "step": 73905 + }, + { + "epoch": 1.89, + "learning_rate": 6.318322257862831e-07, + "loss": 0.5645, + "step": 73906 + }, + { + "epoch": 1.89, + "learning_rate": 6.3180649906339e-07, + "loss": 0.5251, + "step": 73907 + }, + { + "epoch": 1.89, + "learning_rate": 6.317807726224058e-07, + "loss": 0.4036, + "step": 73908 + }, + { + "epoch": 1.89, + "learning_rate": 6.317550464633505e-07, + "loss": 0.6396, + "step": 73909 + }, + { + "epoch": 1.89, + "learning_rate": 6.317293205862429e-07, + "loss": 0.5815, + "step": 73910 + }, + { + "epoch": 1.89, + "learning_rate": 6.317035949911035e-07, + "loss": 0.6953, + "step": 73911 + }, + { + "epoch": 1.89, + "learning_rate": 6.316778696779515e-07, + "loss": 0.7832, + "step": 73912 + }, + { + "epoch": 1.89, + "learning_rate": 6.31652144646807e-07, + "loss": 0.7197, + "step": 73913 + }, + { + "epoch": 1.89, + "learning_rate": 6.316264198976896e-07, + "loss": 0.5244, + "step": 73914 + }, + { + "epoch": 1.89, + "learning_rate": 6.316006954306186e-07, + "loss": 0.7764, + "step": 73915 + }, + { + "epoch": 1.89, + "learning_rate": 6.315749712456144e-07, + "loss": 0.7549, + "step": 73916 + }, + { + "epoch": 1.89, + "learning_rate": 6.31549247342696e-07, + "loss": 0.5256, + "step": 73917 + }, + { + "epoch": 1.89, + "learning_rate": 6.315235237218834e-07, + "loss": 0.7539, + "step": 73918 + }, + { + "epoch": 1.89, + "learning_rate": 6.314978003831968e-07, + "loss": 0.7441, + "step": 73919 + }, + { + "epoch": 1.89, + "learning_rate": 6.314720773266549e-07, + "loss": 0.751, + "step": 73920 + }, + { + "epoch": 1.89, + "learning_rate": 6.314463545522779e-07, + "loss": 0.7568, + "step": 73921 + }, + { + "epoch": 1.89, + "learning_rate": 6.314206320600854e-07, + "loss": 0.6816, + "step": 73922 + }, + { + "epoch": 1.89, + "learning_rate": 6.313949098500975e-07, + "loss": 0.4771, + "step": 73923 + }, + { + "epoch": 1.89, + "learning_rate": 6.313691879223333e-07, + "loss": 0.8701, + "step": 73924 + }, + { + "epoch": 1.89, + "learning_rate": 6.313434662768129e-07, + "loss": 0.6631, + "step": 73925 + }, + { + "epoch": 1.89, + "learning_rate": 6.313177449135556e-07, + "loss": 0.5918, + "step": 73926 + }, + { + "epoch": 1.89, + "learning_rate": 6.312920238325816e-07, + "loss": 0.7319, + "step": 73927 + }, + { + "epoch": 1.89, + "learning_rate": 6.312663030339103e-07, + "loss": 0.5889, + "step": 73928 + }, + { + "epoch": 1.89, + "learning_rate": 6.312405825175617e-07, + "loss": 0.5659, + "step": 73929 + }, + { + "epoch": 1.89, + "learning_rate": 6.31214862283555e-07, + "loss": 0.6885, + "step": 73930 + }, + { + "epoch": 1.89, + "learning_rate": 6.311891423319103e-07, + "loss": 0.6348, + "step": 73931 + }, + { + "epoch": 1.89, + "learning_rate": 6.311634226626467e-07, + "loss": 0.5688, + "step": 73932 + }, + { + "epoch": 1.89, + "learning_rate": 6.311377032757846e-07, + "loss": 0.661, + "step": 73933 + }, + { + "epoch": 1.89, + "learning_rate": 6.311119841713432e-07, + "loss": 0.4653, + "step": 73934 + }, + { + "epoch": 1.89, + "learning_rate": 6.310862653493425e-07, + "loss": 0.7236, + "step": 73935 + }, + { + "epoch": 1.9, + "learning_rate": 6.31060546809802e-07, + "loss": 0.6333, + "step": 73936 + }, + { + "epoch": 1.9, + "learning_rate": 6.310348285527416e-07, + "loss": 0.604, + "step": 73937 + }, + { + "epoch": 1.9, + "learning_rate": 6.310091105781808e-07, + "loss": 0.6226, + "step": 73938 + }, + { + "epoch": 1.9, + "learning_rate": 6.309833928861397e-07, + "loss": 0.7412, + "step": 73939 + }, + { + "epoch": 1.9, + "learning_rate": 6.309576754766374e-07, + "loss": 0.667, + "step": 73940 + }, + { + "epoch": 1.9, + "learning_rate": 6.309319583496936e-07, + "loss": 0.5391, + "step": 73941 + }, + { + "epoch": 1.9, + "learning_rate": 6.309062415053285e-07, + "loss": 0.6621, + "step": 73942 + }, + { + "epoch": 1.9, + "learning_rate": 6.308805249435613e-07, + "loss": 0.7354, + "step": 73943 + }, + { + "epoch": 1.9, + "learning_rate": 6.30854808664412e-07, + "loss": 0.9414, + "step": 73944 + }, + { + "epoch": 1.9, + "learning_rate": 6.308290926679002e-07, + "loss": 0.5786, + "step": 73945 + }, + { + "epoch": 1.9, + "learning_rate": 6.308033769540457e-07, + "loss": 0.4644, + "step": 73946 + }, + { + "epoch": 1.9, + "learning_rate": 6.30777661522868e-07, + "loss": 0.6475, + "step": 73947 + }, + { + "epoch": 1.9, + "learning_rate": 6.307519463743868e-07, + "loss": 0.5498, + "step": 73948 + }, + { + "epoch": 1.9, + "learning_rate": 6.307262315086221e-07, + "loss": 0.6567, + "step": 73949 + }, + { + "epoch": 1.9, + "learning_rate": 6.307005169255934e-07, + "loss": 0.7412, + "step": 73950 + }, + { + "epoch": 1.9, + "learning_rate": 6.306748026253199e-07, + "loss": 0.4592, + "step": 73951 + }, + { + "epoch": 1.9, + "learning_rate": 6.30649088607822e-07, + "loss": 0.6885, + "step": 73952 + }, + { + "epoch": 1.9, + "learning_rate": 6.306233748731189e-07, + "loss": 0.6074, + "step": 73953 + }, + { + "epoch": 1.9, + "learning_rate": 6.305976614212307e-07, + "loss": 0.5571, + "step": 73954 + }, + { + "epoch": 1.9, + "learning_rate": 6.305719482521768e-07, + "loss": 0.6191, + "step": 73955 + }, + { + "epoch": 1.9, + "learning_rate": 6.305462353659769e-07, + "loss": 0.5278, + "step": 73956 + }, + { + "epoch": 1.9, + "learning_rate": 6.305205227626508e-07, + "loss": 0.6333, + "step": 73957 + }, + { + "epoch": 1.9, + "learning_rate": 6.304948104422183e-07, + "loss": 0.793, + "step": 73958 + }, + { + "epoch": 1.9, + "learning_rate": 6.304690984046991e-07, + "loss": 0.7686, + "step": 73959 + }, + { + "epoch": 1.9, + "learning_rate": 6.304433866501123e-07, + "loss": 0.6934, + "step": 73960 + }, + { + "epoch": 1.9, + "learning_rate": 6.304176751784782e-07, + "loss": 0.645, + "step": 73961 + }, + { + "epoch": 1.9, + "learning_rate": 6.303919639898162e-07, + "loss": 0.7393, + "step": 73962 + }, + { + "epoch": 1.9, + "learning_rate": 6.303662530841463e-07, + "loss": 0.533, + "step": 73963 + }, + { + "epoch": 1.9, + "learning_rate": 6.303405424614876e-07, + "loss": 0.6221, + "step": 73964 + }, + { + "epoch": 1.9, + "learning_rate": 6.303148321218603e-07, + "loss": 0.6553, + "step": 73965 + }, + { + "epoch": 1.9, + "learning_rate": 6.30289122065284e-07, + "loss": 0.6045, + "step": 73966 + }, + { + "epoch": 1.9, + "learning_rate": 6.302634122917783e-07, + "loss": 0.6768, + "step": 73967 + }, + { + "epoch": 1.9, + "learning_rate": 6.302377028013628e-07, + "loss": 0.7734, + "step": 73968 + }, + { + "epoch": 1.9, + "learning_rate": 6.302119935940578e-07, + "loss": 0.6562, + "step": 73969 + }, + { + "epoch": 1.9, + "learning_rate": 6.30186284669882e-07, + "loss": 0.5918, + "step": 73970 + }, + { + "epoch": 1.9, + "learning_rate": 6.301605760288556e-07, + "loss": 0.6572, + "step": 73971 + }, + { + "epoch": 1.9, + "learning_rate": 6.301348676709981e-07, + "loss": 0.7227, + "step": 73972 + }, + { + "epoch": 1.9, + "learning_rate": 6.301091595963296e-07, + "loss": 0.7852, + "step": 73973 + }, + { + "epoch": 1.9, + "learning_rate": 6.300834518048692e-07, + "loss": 0.5635, + "step": 73974 + }, + { + "epoch": 1.9, + "learning_rate": 6.300577442966372e-07, + "loss": 0.5903, + "step": 73975 + }, + { + "epoch": 1.9, + "learning_rate": 6.300320370716528e-07, + "loss": 0.708, + "step": 73976 + }, + { + "epoch": 1.9, + "learning_rate": 6.30006330129936e-07, + "loss": 0.7471, + "step": 73977 + }, + { + "epoch": 1.9, + "learning_rate": 6.299806234715062e-07, + "loss": 0.6086, + "step": 73978 + }, + { + "epoch": 1.9, + "learning_rate": 6.299549170963834e-07, + "loss": 0.5286, + "step": 73979 + }, + { + "epoch": 1.9, + "learning_rate": 6.299292110045871e-07, + "loss": 0.5879, + "step": 73980 + }, + { + "epoch": 1.9, + "learning_rate": 6.299035051961367e-07, + "loss": 0.625, + "step": 73981 + }, + { + "epoch": 1.9, + "learning_rate": 6.298777996710525e-07, + "loss": 0.6191, + "step": 73982 + }, + { + "epoch": 1.9, + "learning_rate": 6.298520944293534e-07, + "loss": 0.3274, + "step": 73983 + }, + { + "epoch": 1.9, + "learning_rate": 6.2982638947106e-07, + "loss": 0.3811, + "step": 73984 + }, + { + "epoch": 1.9, + "learning_rate": 6.298006847961912e-07, + "loss": 0.6133, + "step": 73985 + }, + { + "epoch": 1.9, + "learning_rate": 6.297749804047672e-07, + "loss": 0.5225, + "step": 73986 + }, + { + "epoch": 1.9, + "learning_rate": 6.297492762968075e-07, + "loss": 0.6143, + "step": 73987 + }, + { + "epoch": 1.9, + "learning_rate": 6.297235724723316e-07, + "loss": 0.6167, + "step": 73988 + }, + { + "epoch": 1.9, + "learning_rate": 6.296978689313597e-07, + "loss": 0.6562, + "step": 73989 + }, + { + "epoch": 1.9, + "learning_rate": 6.296721656739108e-07, + "loss": 0.6953, + "step": 73990 + }, + { + "epoch": 1.9, + "learning_rate": 6.296464627000048e-07, + "loss": 0.7412, + "step": 73991 + }, + { + "epoch": 1.9, + "learning_rate": 6.296207600096616e-07, + "loss": 0.5254, + "step": 73992 + }, + { + "epoch": 1.9, + "learning_rate": 6.295950576029005e-07, + "loss": 0.583, + "step": 73993 + }, + { + "epoch": 1.9, + "learning_rate": 6.295693554797419e-07, + "loss": 0.6111, + "step": 73994 + }, + { + "epoch": 1.9, + "learning_rate": 6.295436536402046e-07, + "loss": 0.5415, + "step": 73995 + }, + { + "epoch": 1.9, + "learning_rate": 6.295179520843089e-07, + "loss": 0.6118, + "step": 73996 + }, + { + "epoch": 1.9, + "learning_rate": 6.294922508120741e-07, + "loss": 0.4399, + "step": 73997 + }, + { + "epoch": 1.9, + "learning_rate": 6.294665498235203e-07, + "loss": 0.6234, + "step": 73998 + }, + { + "epoch": 1.9, + "learning_rate": 6.294408491186671e-07, + "loss": 0.7148, + "step": 73999 + }, + { + "epoch": 1.9, + "learning_rate": 6.294151486975335e-07, + "loss": 0.7412, + "step": 74000 + }, + { + "epoch": 1.9, + "learning_rate": 6.293894485601399e-07, + "loss": 0.5084, + "step": 74001 + }, + { + "epoch": 1.9, + "learning_rate": 6.293637487065058e-07, + "loss": 0.6875, + "step": 74002 + }, + { + "epoch": 1.9, + "learning_rate": 6.293380491366508e-07, + "loss": 0.6172, + "step": 74003 + }, + { + "epoch": 1.9, + "learning_rate": 6.293123498505946e-07, + "loss": 0.6089, + "step": 74004 + }, + { + "epoch": 1.9, + "learning_rate": 6.292866508483568e-07, + "loss": 0.6631, + "step": 74005 + }, + { + "epoch": 1.9, + "learning_rate": 6.292609521299573e-07, + "loss": 0.7158, + "step": 74006 + }, + { + "epoch": 1.9, + "learning_rate": 6.292352536954156e-07, + "loss": 0.6177, + "step": 74007 + }, + { + "epoch": 1.9, + "learning_rate": 6.292095555447514e-07, + "loss": 0.4089, + "step": 74008 + }, + { + "epoch": 1.9, + "learning_rate": 6.291838576779847e-07, + "loss": 0.8145, + "step": 74009 + }, + { + "epoch": 1.9, + "learning_rate": 6.291581600951343e-07, + "loss": 0.6069, + "step": 74010 + }, + { + "epoch": 1.9, + "learning_rate": 6.291324627962209e-07, + "loss": 0.5601, + "step": 74011 + }, + { + "epoch": 1.9, + "learning_rate": 6.291067657812634e-07, + "loss": 0.7305, + "step": 74012 + }, + { + "epoch": 1.9, + "learning_rate": 6.290810690502819e-07, + "loss": 0.6006, + "step": 74013 + }, + { + "epoch": 1.9, + "learning_rate": 6.290553726032959e-07, + "loss": 0.4431, + "step": 74014 + }, + { + "epoch": 1.9, + "learning_rate": 6.290296764403253e-07, + "loss": 0.6157, + "step": 74015 + }, + { + "epoch": 1.9, + "learning_rate": 6.290039805613895e-07, + "loss": 0.6602, + "step": 74016 + }, + { + "epoch": 1.9, + "learning_rate": 6.289782849665084e-07, + "loss": 0.5349, + "step": 74017 + }, + { + "epoch": 1.9, + "learning_rate": 6.289525896557014e-07, + "loss": 0.644, + "step": 74018 + }, + { + "epoch": 1.9, + "learning_rate": 6.289268946289887e-07, + "loss": 0.481, + "step": 74019 + }, + { + "epoch": 1.9, + "learning_rate": 6.289011998863895e-07, + "loss": 0.6099, + "step": 74020 + }, + { + "epoch": 1.9, + "learning_rate": 6.288755054279234e-07, + "loss": 0.6113, + "step": 74021 + }, + { + "epoch": 1.9, + "learning_rate": 6.288498112536103e-07, + "loss": 0.6948, + "step": 74022 + }, + { + "epoch": 1.9, + "learning_rate": 6.2882411736347e-07, + "loss": 0.6318, + "step": 74023 + }, + { + "epoch": 1.9, + "learning_rate": 6.287984237575218e-07, + "loss": 0.7329, + "step": 74024 + }, + { + "epoch": 1.9, + "learning_rate": 6.287727304357857e-07, + "loss": 0.7109, + "step": 74025 + }, + { + "epoch": 1.9, + "learning_rate": 6.287470373982811e-07, + "loss": 0.9287, + "step": 74026 + }, + { + "epoch": 1.9, + "learning_rate": 6.287213446450279e-07, + "loss": 0.6689, + "step": 74027 + }, + { + "epoch": 1.9, + "learning_rate": 6.286956521760455e-07, + "loss": 0.7285, + "step": 74028 + }, + { + "epoch": 1.9, + "learning_rate": 6.286699599913544e-07, + "loss": 0.6982, + "step": 74029 + }, + { + "epoch": 1.9, + "learning_rate": 6.286442680909734e-07, + "loss": 0.7734, + "step": 74030 + }, + { + "epoch": 1.9, + "learning_rate": 6.28618576474922e-07, + "loss": 0.707, + "step": 74031 + }, + { + "epoch": 1.9, + "learning_rate": 6.285928851432205e-07, + "loss": 0.6387, + "step": 74032 + }, + { + "epoch": 1.9, + "learning_rate": 6.285671940958883e-07, + "loss": 0.7207, + "step": 74033 + }, + { + "epoch": 1.9, + "learning_rate": 6.285415033329453e-07, + "loss": 0.6802, + "step": 74034 + }, + { + "epoch": 1.9, + "learning_rate": 6.285158128544107e-07, + "loss": 0.7363, + "step": 74035 + }, + { + "epoch": 1.9, + "learning_rate": 6.284901226603048e-07, + "loss": 0.5801, + "step": 74036 + }, + { + "epoch": 1.9, + "learning_rate": 6.284644327506466e-07, + "loss": 0.7812, + "step": 74037 + }, + { + "epoch": 1.9, + "learning_rate": 6.284387431254563e-07, + "loss": 0.6709, + "step": 74038 + }, + { + "epoch": 1.9, + "learning_rate": 6.284130537847536e-07, + "loss": 0.5488, + "step": 74039 + }, + { + "epoch": 1.9, + "learning_rate": 6.283873647285578e-07, + "loss": 0.6606, + "step": 74040 + }, + { + "epoch": 1.9, + "learning_rate": 6.283616759568883e-07, + "loss": 0.6748, + "step": 74041 + }, + { + "epoch": 1.9, + "learning_rate": 6.283359874697656e-07, + "loss": 0.6895, + "step": 74042 + }, + { + "epoch": 1.9, + "learning_rate": 6.283102992672087e-07, + "loss": 0.5371, + "step": 74043 + }, + { + "epoch": 1.9, + "learning_rate": 6.282846113492377e-07, + "loss": 0.6709, + "step": 74044 + }, + { + "epoch": 1.9, + "learning_rate": 6.282589237158717e-07, + "loss": 0.7236, + "step": 74045 + }, + { + "epoch": 1.9, + "learning_rate": 6.282332363671312e-07, + "loss": 0.6973, + "step": 74046 + }, + { + "epoch": 1.9, + "learning_rate": 6.282075493030352e-07, + "loss": 0.5442, + "step": 74047 + }, + { + "epoch": 1.9, + "learning_rate": 6.281818625236037e-07, + "loss": 0.5601, + "step": 74048 + }, + { + "epoch": 1.9, + "learning_rate": 6.281561760288565e-07, + "loss": 0.5066, + "step": 74049 + }, + { + "epoch": 1.9, + "learning_rate": 6.281304898188126e-07, + "loss": 0.7119, + "step": 74050 + }, + { + "epoch": 1.9, + "learning_rate": 6.281048038934922e-07, + "loss": 0.6621, + "step": 74051 + }, + { + "epoch": 1.9, + "learning_rate": 6.280791182529147e-07, + "loss": 0.5664, + "step": 74052 + }, + { + "epoch": 1.9, + "learning_rate": 6.280534328971001e-07, + "loss": 0.5586, + "step": 74053 + }, + { + "epoch": 1.9, + "learning_rate": 6.280277478260678e-07, + "loss": 0.6465, + "step": 74054 + }, + { + "epoch": 1.9, + "learning_rate": 6.280020630398377e-07, + "loss": 0.7407, + "step": 74055 + }, + { + "epoch": 1.9, + "learning_rate": 6.279763785384291e-07, + "loss": 0.5752, + "step": 74056 + }, + { + "epoch": 1.9, + "learning_rate": 6.27950694321862e-07, + "loss": 0.521, + "step": 74057 + }, + { + "epoch": 1.9, + "learning_rate": 6.279250103901559e-07, + "loss": 0.5503, + "step": 74058 + }, + { + "epoch": 1.9, + "learning_rate": 6.27899326743331e-07, + "loss": 0.4269, + "step": 74059 + }, + { + "epoch": 1.9, + "learning_rate": 6.278736433814058e-07, + "loss": 0.5073, + "step": 74060 + }, + { + "epoch": 1.9, + "learning_rate": 6.27847960304401e-07, + "loss": 0.6992, + "step": 74061 + }, + { + "epoch": 1.9, + "learning_rate": 6.278222775123357e-07, + "loss": 0.7188, + "step": 74062 + }, + { + "epoch": 1.9, + "learning_rate": 6.277965950052299e-07, + "loss": 0.6924, + "step": 74063 + }, + { + "epoch": 1.9, + "learning_rate": 6.277709127831029e-07, + "loss": 0.498, + "step": 74064 + }, + { + "epoch": 1.9, + "learning_rate": 6.277452308459749e-07, + "loss": 0.6841, + "step": 74065 + }, + { + "epoch": 1.9, + "learning_rate": 6.277195491938649e-07, + "loss": 0.7002, + "step": 74066 + }, + { + "epoch": 1.9, + "learning_rate": 6.276938678267933e-07, + "loss": 0.646, + "step": 74067 + }, + { + "epoch": 1.9, + "learning_rate": 6.276681867447791e-07, + "loss": 0.6875, + "step": 74068 + }, + { + "epoch": 1.9, + "learning_rate": 6.276425059478427e-07, + "loss": 0.4581, + "step": 74069 + }, + { + "epoch": 1.9, + "learning_rate": 6.27616825436003e-07, + "loss": 0.5806, + "step": 74070 + }, + { + "epoch": 1.9, + "learning_rate": 6.275911452092799e-07, + "loss": 0.7383, + "step": 74071 + }, + { + "epoch": 1.9, + "learning_rate": 6.275654652676933e-07, + "loss": 0.7227, + "step": 74072 + }, + { + "epoch": 1.9, + "learning_rate": 6.275397856112625e-07, + "loss": 0.4426, + "step": 74073 + }, + { + "epoch": 1.9, + "learning_rate": 6.275141062400076e-07, + "loss": 0.6699, + "step": 74074 + }, + { + "epoch": 1.9, + "learning_rate": 6.274884271539477e-07, + "loss": 0.6855, + "step": 74075 + }, + { + "epoch": 1.9, + "learning_rate": 6.274627483531029e-07, + "loss": 0.7568, + "step": 74076 + }, + { + "epoch": 1.9, + "learning_rate": 6.274370698374932e-07, + "loss": 0.6943, + "step": 74077 + }, + { + "epoch": 1.9, + "learning_rate": 6.274113916071371e-07, + "loss": 0.6348, + "step": 74078 + }, + { + "epoch": 1.9, + "learning_rate": 6.273857136620556e-07, + "loss": 0.7012, + "step": 74079 + }, + { + "epoch": 1.9, + "learning_rate": 6.273600360022675e-07, + "loss": 0.5874, + "step": 74080 + }, + { + "epoch": 1.9, + "learning_rate": 6.273343586277925e-07, + "loss": 0.5723, + "step": 74081 + }, + { + "epoch": 1.9, + "learning_rate": 6.273086815386505e-07, + "loss": 0.6299, + "step": 74082 + }, + { + "epoch": 1.9, + "learning_rate": 6.272830047348612e-07, + "loss": 0.6343, + "step": 74083 + }, + { + "epoch": 1.9, + "learning_rate": 6.272573282164441e-07, + "loss": 0.6084, + "step": 74084 + }, + { + "epoch": 1.9, + "learning_rate": 6.272316519834188e-07, + "loss": 0.5039, + "step": 74085 + }, + { + "epoch": 1.9, + "learning_rate": 6.272059760358052e-07, + "loss": 0.5259, + "step": 74086 + }, + { + "epoch": 1.9, + "learning_rate": 6.271803003736229e-07, + "loss": 0.6357, + "step": 74087 + }, + { + "epoch": 1.9, + "learning_rate": 6.271546249968915e-07, + "loss": 0.614, + "step": 74088 + }, + { + "epoch": 1.9, + "learning_rate": 6.271289499056309e-07, + "loss": 0.6934, + "step": 74089 + }, + { + "epoch": 1.9, + "learning_rate": 6.271032750998601e-07, + "loss": 0.7451, + "step": 74090 + }, + { + "epoch": 1.9, + "learning_rate": 6.270776005795995e-07, + "loss": 0.5732, + "step": 74091 + }, + { + "epoch": 1.9, + "learning_rate": 6.270519263448682e-07, + "loss": 0.6123, + "step": 74092 + }, + { + "epoch": 1.9, + "learning_rate": 6.270262523956861e-07, + "loss": 0.5808, + "step": 74093 + }, + { + "epoch": 1.9, + "learning_rate": 6.270005787320729e-07, + "loss": 0.6777, + "step": 74094 + }, + { + "epoch": 1.9, + "learning_rate": 6.26974905354048e-07, + "loss": 0.6509, + "step": 74095 + }, + { + "epoch": 1.9, + "learning_rate": 6.269492322616317e-07, + "loss": 0.5889, + "step": 74096 + }, + { + "epoch": 1.9, + "learning_rate": 6.269235594548427e-07, + "loss": 0.5903, + "step": 74097 + }, + { + "epoch": 1.9, + "learning_rate": 6.268978869337016e-07, + "loss": 0.4268, + "step": 74098 + }, + { + "epoch": 1.9, + "learning_rate": 6.268722146982279e-07, + "loss": 0.4805, + "step": 74099 + }, + { + "epoch": 1.9, + "learning_rate": 6.268465427484404e-07, + "loss": 0.707, + "step": 74100 + }, + { + "epoch": 1.9, + "learning_rate": 6.268208710843597e-07, + "loss": 0.5645, + "step": 74101 + }, + { + "epoch": 1.9, + "learning_rate": 6.267951997060047e-07, + "loss": 0.7051, + "step": 74102 + }, + { + "epoch": 1.9, + "learning_rate": 6.267695286133958e-07, + "loss": 0.5996, + "step": 74103 + }, + { + "epoch": 1.9, + "learning_rate": 6.26743857806552e-07, + "loss": 0.5676, + "step": 74104 + }, + { + "epoch": 1.9, + "learning_rate": 6.267181872854936e-07, + "loss": 0.686, + "step": 74105 + }, + { + "epoch": 1.9, + "learning_rate": 6.266925170502396e-07, + "loss": 0.5254, + "step": 74106 + }, + { + "epoch": 1.9, + "learning_rate": 6.266668471008104e-07, + "loss": 0.5034, + "step": 74107 + }, + { + "epoch": 1.9, + "learning_rate": 6.266411774372247e-07, + "loss": 0.7578, + "step": 74108 + }, + { + "epoch": 1.9, + "learning_rate": 6.266155080595032e-07, + "loss": 0.5913, + "step": 74109 + }, + { + "epoch": 1.9, + "learning_rate": 6.265898389676649e-07, + "loss": 0.6287, + "step": 74110 + }, + { + "epoch": 1.9, + "learning_rate": 6.265641701617294e-07, + "loss": 0.6826, + "step": 74111 + }, + { + "epoch": 1.9, + "learning_rate": 6.265385016417167e-07, + "loss": 0.6768, + "step": 74112 + }, + { + "epoch": 1.9, + "learning_rate": 6.265128334076463e-07, + "loss": 0.5752, + "step": 74113 + }, + { + "epoch": 1.9, + "learning_rate": 6.264871654595376e-07, + "loss": 0.5835, + "step": 74114 + }, + { + "epoch": 1.9, + "learning_rate": 6.264614977974107e-07, + "loss": 0.7549, + "step": 74115 + }, + { + "epoch": 1.9, + "learning_rate": 6.26435830421285e-07, + "loss": 0.5127, + "step": 74116 + }, + { + "epoch": 1.9, + "learning_rate": 6.264101633311803e-07, + "loss": 0.5747, + "step": 74117 + }, + { + "epoch": 1.9, + "learning_rate": 6.26384496527116e-07, + "loss": 0.4912, + "step": 74118 + }, + { + "epoch": 1.9, + "learning_rate": 6.263588300091123e-07, + "loss": 0.5503, + "step": 74119 + }, + { + "epoch": 1.9, + "learning_rate": 6.263331637771883e-07, + "loss": 0.6152, + "step": 74120 + }, + { + "epoch": 1.9, + "learning_rate": 6.263074978313636e-07, + "loss": 0.5688, + "step": 74121 + }, + { + "epoch": 1.9, + "learning_rate": 6.262818321716582e-07, + "loss": 0.4856, + "step": 74122 + }, + { + "epoch": 1.9, + "learning_rate": 6.262561667980914e-07, + "loss": 0.6025, + "step": 74123 + }, + { + "epoch": 1.9, + "learning_rate": 6.262305017106833e-07, + "loss": 0.7041, + "step": 74124 + }, + { + "epoch": 1.9, + "learning_rate": 6.262048369094532e-07, + "loss": 0.3745, + "step": 74125 + }, + { + "epoch": 1.9, + "learning_rate": 6.26179172394421e-07, + "loss": 0.6519, + "step": 74126 + }, + { + "epoch": 1.9, + "learning_rate": 6.26153508165606e-07, + "loss": 0.7549, + "step": 74127 + }, + { + "epoch": 1.9, + "learning_rate": 6.261278442230284e-07, + "loss": 0.6406, + "step": 74128 + }, + { + "epoch": 1.9, + "learning_rate": 6.261021805667075e-07, + "loss": 0.6436, + "step": 74129 + }, + { + "epoch": 1.9, + "learning_rate": 6.260765171966629e-07, + "loss": 0.6323, + "step": 74130 + }, + { + "epoch": 1.9, + "learning_rate": 6.260508541129141e-07, + "loss": 0.5737, + "step": 74131 + }, + { + "epoch": 1.9, + "learning_rate": 6.260251913154813e-07, + "loss": 0.5908, + "step": 74132 + }, + { + "epoch": 1.9, + "learning_rate": 6.259995288043834e-07, + "loss": 0.4248, + "step": 74133 + }, + { + "epoch": 1.9, + "learning_rate": 6.259738665796408e-07, + "loss": 0.5842, + "step": 74134 + }, + { + "epoch": 1.9, + "learning_rate": 6.259482046412725e-07, + "loss": 0.6709, + "step": 74135 + }, + { + "epoch": 1.9, + "learning_rate": 6.259225429892987e-07, + "loss": 0.5818, + "step": 74136 + }, + { + "epoch": 1.9, + "learning_rate": 6.258968816237387e-07, + "loss": 0.5054, + "step": 74137 + }, + { + "epoch": 1.9, + "learning_rate": 6.258712205446123e-07, + "loss": 0.6797, + "step": 74138 + }, + { + "epoch": 1.9, + "learning_rate": 6.258455597519394e-07, + "loss": 0.5325, + "step": 74139 + }, + { + "epoch": 1.9, + "learning_rate": 6.25819899245739e-07, + "loss": 0.6797, + "step": 74140 + }, + { + "epoch": 1.9, + "learning_rate": 6.257942390260312e-07, + "loss": 0.6338, + "step": 74141 + }, + { + "epoch": 1.9, + "learning_rate": 6.257685790928353e-07, + "loss": 0.7344, + "step": 74142 + }, + { + "epoch": 1.9, + "learning_rate": 6.257429194461717e-07, + "loss": 0.5757, + "step": 74143 + }, + { + "epoch": 1.9, + "learning_rate": 6.25717260086059e-07, + "loss": 0.6943, + "step": 74144 + }, + { + "epoch": 1.9, + "learning_rate": 6.256916010125177e-07, + "loss": 0.6572, + "step": 74145 + }, + { + "epoch": 1.9, + "learning_rate": 6.256659422255669e-07, + "loss": 0.7275, + "step": 74146 + }, + { + "epoch": 1.9, + "learning_rate": 6.256402837252268e-07, + "loss": 0.6128, + "step": 74147 + }, + { + "epoch": 1.9, + "learning_rate": 6.256146255115162e-07, + "loss": 0.708, + "step": 74148 + }, + { + "epoch": 1.9, + "learning_rate": 6.255889675844562e-07, + "loss": 0.593, + "step": 74149 + }, + { + "epoch": 1.9, + "learning_rate": 6.255633099440648e-07, + "loss": 0.748, + "step": 74150 + }, + { + "epoch": 1.9, + "learning_rate": 6.255376525903626e-07, + "loss": 0.6348, + "step": 74151 + }, + { + "epoch": 1.9, + "learning_rate": 6.255119955233687e-07, + "loss": 0.4338, + "step": 74152 + }, + { + "epoch": 1.9, + "learning_rate": 6.254863387431033e-07, + "loss": 0.521, + "step": 74153 + }, + { + "epoch": 1.9, + "learning_rate": 6.254606822495855e-07, + "loss": 0.7163, + "step": 74154 + }, + { + "epoch": 1.9, + "learning_rate": 6.254350260428356e-07, + "loss": 0.6514, + "step": 74155 + }, + { + "epoch": 1.9, + "learning_rate": 6.254093701228727e-07, + "loss": 0.6182, + "step": 74156 + }, + { + "epoch": 1.9, + "learning_rate": 6.253837144897167e-07, + "loss": 0.575, + "step": 74157 + }, + { + "epoch": 1.9, + "learning_rate": 6.253580591433869e-07, + "loss": 0.6021, + "step": 74158 + }, + { + "epoch": 1.9, + "learning_rate": 6.253324040839038e-07, + "loss": 0.6523, + "step": 74159 + }, + { + "epoch": 1.9, + "learning_rate": 6.253067493112861e-07, + "loss": 0.4763, + "step": 74160 + }, + { + "epoch": 1.9, + "learning_rate": 6.252810948255536e-07, + "loss": 0.3882, + "step": 74161 + }, + { + "epoch": 1.9, + "learning_rate": 6.252554406267265e-07, + "loss": 0.8906, + "step": 74162 + }, + { + "epoch": 1.9, + "learning_rate": 6.252297867148237e-07, + "loss": 0.5908, + "step": 74163 + }, + { + "epoch": 1.9, + "learning_rate": 6.252041330898655e-07, + "loss": 0.6191, + "step": 74164 + }, + { + "epoch": 1.9, + "learning_rate": 6.251784797518709e-07, + "loss": 0.5605, + "step": 74165 + }, + { + "epoch": 1.9, + "learning_rate": 6.251528267008603e-07, + "loss": 0.6611, + "step": 74166 + }, + { + "epoch": 1.9, + "learning_rate": 6.251271739368529e-07, + "loss": 0.5957, + "step": 74167 + }, + { + "epoch": 1.9, + "learning_rate": 6.251015214598681e-07, + "loss": 0.7109, + "step": 74168 + }, + { + "epoch": 1.9, + "learning_rate": 6.250758692699264e-07, + "loss": 0.3484, + "step": 74169 + }, + { + "epoch": 1.9, + "learning_rate": 6.250502173670466e-07, + "loss": 0.6206, + "step": 74170 + }, + { + "epoch": 1.9, + "learning_rate": 6.250245657512482e-07, + "loss": 0.6719, + "step": 74171 + }, + { + "epoch": 1.9, + "learning_rate": 6.249989144225518e-07, + "loss": 0.5601, + "step": 74172 + }, + { + "epoch": 1.9, + "learning_rate": 6.249732633809761e-07, + "loss": 0.5903, + "step": 74173 + }, + { + "epoch": 1.9, + "learning_rate": 6.249476126265412e-07, + "loss": 0.4106, + "step": 74174 + }, + { + "epoch": 1.9, + "learning_rate": 6.249219621592667e-07, + "loss": 0.7207, + "step": 74175 + }, + { + "epoch": 1.9, + "learning_rate": 6.248963119791723e-07, + "loss": 0.5107, + "step": 74176 + }, + { + "epoch": 1.9, + "learning_rate": 6.248706620862773e-07, + "loss": 0.6328, + "step": 74177 + }, + { + "epoch": 1.9, + "learning_rate": 6.248450124806022e-07, + "loss": 0.6738, + "step": 74178 + }, + { + "epoch": 1.9, + "learning_rate": 6.248193631621656e-07, + "loss": 0.6465, + "step": 74179 + }, + { + "epoch": 1.9, + "learning_rate": 6.247937141309874e-07, + "loss": 0.6875, + "step": 74180 + }, + { + "epoch": 1.9, + "learning_rate": 6.247680653870877e-07, + "loss": 0.7197, + "step": 74181 + }, + { + "epoch": 1.9, + "learning_rate": 6.247424169304855e-07, + "loss": 0.5845, + "step": 74182 + }, + { + "epoch": 1.9, + "learning_rate": 6.247167687612011e-07, + "loss": 0.6622, + "step": 74183 + }, + { + "epoch": 1.9, + "learning_rate": 6.246911208792536e-07, + "loss": 0.5066, + "step": 74184 + }, + { + "epoch": 1.9, + "learning_rate": 6.246654732846629e-07, + "loss": 0.5454, + "step": 74185 + }, + { + "epoch": 1.9, + "learning_rate": 6.246398259774487e-07, + "loss": 0.5671, + "step": 74186 + }, + { + "epoch": 1.9, + "learning_rate": 6.246141789576304e-07, + "loss": 0.5615, + "step": 74187 + }, + { + "epoch": 1.9, + "learning_rate": 6.24588532225228e-07, + "loss": 0.6572, + "step": 74188 + }, + { + "epoch": 1.9, + "learning_rate": 6.245628857802609e-07, + "loss": 0.6211, + "step": 74189 + }, + { + "epoch": 1.9, + "learning_rate": 6.245372396227484e-07, + "loss": 0.4089, + "step": 74190 + }, + { + "epoch": 1.9, + "learning_rate": 6.245115937527106e-07, + "loss": 0.8613, + "step": 74191 + }, + { + "epoch": 1.9, + "learning_rate": 6.24485948170167e-07, + "loss": 0.5811, + "step": 74192 + }, + { + "epoch": 1.9, + "learning_rate": 6.244603028751373e-07, + "loss": 0.5542, + "step": 74193 + }, + { + "epoch": 1.9, + "learning_rate": 6.24434657867641e-07, + "loss": 0.6348, + "step": 74194 + }, + { + "epoch": 1.9, + "learning_rate": 6.244090131476978e-07, + "loss": 0.5801, + "step": 74195 + }, + { + "epoch": 1.9, + "learning_rate": 6.243833687153273e-07, + "loss": 0.7021, + "step": 74196 + }, + { + "epoch": 1.9, + "learning_rate": 6.243577245705494e-07, + "loss": 0.4941, + "step": 74197 + }, + { + "epoch": 1.9, + "learning_rate": 6.243320807133836e-07, + "loss": 0.6597, + "step": 74198 + }, + { + "epoch": 1.9, + "learning_rate": 6.243064371438492e-07, + "loss": 0.7432, + "step": 74199 + }, + { + "epoch": 1.9, + "learning_rate": 6.242807938619663e-07, + "loss": 0.6206, + "step": 74200 + }, + { + "epoch": 1.9, + "learning_rate": 6.242551508677541e-07, + "loss": 0.6768, + "step": 74201 + }, + { + "epoch": 1.9, + "learning_rate": 6.242295081612325e-07, + "loss": 0.5874, + "step": 74202 + }, + { + "epoch": 1.9, + "learning_rate": 6.242038657424211e-07, + "loss": 0.5493, + "step": 74203 + }, + { + "epoch": 1.9, + "learning_rate": 6.241782236113396e-07, + "loss": 0.3569, + "step": 74204 + }, + { + "epoch": 1.9, + "learning_rate": 6.241525817680073e-07, + "loss": 0.6304, + "step": 74205 + }, + { + "epoch": 1.9, + "learning_rate": 6.241269402124443e-07, + "loss": 0.6396, + "step": 74206 + }, + { + "epoch": 1.9, + "learning_rate": 6.2410129894467e-07, + "loss": 0.6963, + "step": 74207 + }, + { + "epoch": 1.9, + "learning_rate": 6.240756579647044e-07, + "loss": 0.6338, + "step": 74208 + }, + { + "epoch": 1.9, + "learning_rate": 6.240500172725662e-07, + "loss": 0.6494, + "step": 74209 + }, + { + "epoch": 1.9, + "learning_rate": 6.24024376868276e-07, + "loss": 0.6924, + "step": 74210 + }, + { + "epoch": 1.9, + "learning_rate": 6.239987367518526e-07, + "loss": 0.6338, + "step": 74211 + }, + { + "epoch": 1.9, + "learning_rate": 6.239730969233165e-07, + "loss": 0.7358, + "step": 74212 + }, + { + "epoch": 1.9, + "learning_rate": 6.239474573826866e-07, + "loss": 0.5327, + "step": 74213 + }, + { + "epoch": 1.9, + "learning_rate": 6.239218181299833e-07, + "loss": 0.6699, + "step": 74214 + }, + { + "epoch": 1.9, + "learning_rate": 6.238961791652253e-07, + "loss": 0.6836, + "step": 74215 + }, + { + "epoch": 1.9, + "learning_rate": 6.238705404884329e-07, + "loss": 0.7568, + "step": 74216 + }, + { + "epoch": 1.9, + "learning_rate": 6.238449020996254e-07, + "loss": 0.5845, + "step": 74217 + }, + { + "epoch": 1.9, + "learning_rate": 6.238192639988229e-07, + "loss": 0.425, + "step": 74218 + }, + { + "epoch": 1.9, + "learning_rate": 6.237936261860446e-07, + "loss": 0.5696, + "step": 74219 + }, + { + "epoch": 1.9, + "learning_rate": 6.237679886613102e-07, + "loss": 0.5928, + "step": 74220 + }, + { + "epoch": 1.9, + "learning_rate": 6.237423514246392e-07, + "loss": 0.7803, + "step": 74221 + }, + { + "epoch": 1.9, + "learning_rate": 6.237167144760514e-07, + "loss": 0.6328, + "step": 74222 + }, + { + "epoch": 1.9, + "learning_rate": 6.236910778155663e-07, + "loss": 0.8232, + "step": 74223 + }, + { + "epoch": 1.9, + "learning_rate": 6.236654414432039e-07, + "loss": 0.6387, + "step": 74224 + }, + { + "epoch": 1.9, + "learning_rate": 6.236398053589833e-07, + "loss": 0.6318, + "step": 74225 + }, + { + "epoch": 1.9, + "learning_rate": 6.236141695629246e-07, + "loss": 0.7441, + "step": 74226 + }, + { + "epoch": 1.9, + "learning_rate": 6.23588534055047e-07, + "loss": 0.6514, + "step": 74227 + }, + { + "epoch": 1.9, + "learning_rate": 6.235628988353708e-07, + "loss": 0.6055, + "step": 74228 + }, + { + "epoch": 1.9, + "learning_rate": 6.235372639039149e-07, + "loss": 0.5664, + "step": 74229 + }, + { + "epoch": 1.9, + "learning_rate": 6.235116292606993e-07, + "loss": 0.6099, + "step": 74230 + }, + { + "epoch": 1.9, + "learning_rate": 6.234859949057434e-07, + "loss": 0.6052, + "step": 74231 + }, + { + "epoch": 1.9, + "learning_rate": 6.234603608390668e-07, + "loss": 0.5991, + "step": 74232 + }, + { + "epoch": 1.9, + "learning_rate": 6.234347270606897e-07, + "loss": 0.6099, + "step": 74233 + }, + { + "epoch": 1.9, + "learning_rate": 6.234090935706308e-07, + "loss": 0.6387, + "step": 74234 + }, + { + "epoch": 1.9, + "learning_rate": 6.233834603689108e-07, + "loss": 0.553, + "step": 74235 + }, + { + "epoch": 1.9, + "learning_rate": 6.233578274555482e-07, + "loss": 0.6758, + "step": 74236 + }, + { + "epoch": 1.9, + "learning_rate": 6.233321948305637e-07, + "loss": 0.6641, + "step": 74237 + }, + { + "epoch": 1.9, + "learning_rate": 6.233065624939764e-07, + "loss": 0.6343, + "step": 74238 + }, + { + "epoch": 1.9, + "learning_rate": 6.232809304458059e-07, + "loss": 0.6367, + "step": 74239 + }, + { + "epoch": 1.9, + "learning_rate": 6.232552986860716e-07, + "loss": 0.4219, + "step": 74240 + }, + { + "epoch": 1.9, + "learning_rate": 6.232296672147936e-07, + "loss": 0.7012, + "step": 74241 + }, + { + "epoch": 1.9, + "learning_rate": 6.232040360319911e-07, + "loss": 0.5051, + "step": 74242 + }, + { + "epoch": 1.9, + "learning_rate": 6.231784051376842e-07, + "loss": 0.6538, + "step": 74243 + }, + { + "epoch": 1.9, + "learning_rate": 6.231527745318919e-07, + "loss": 0.564, + "step": 74244 + }, + { + "epoch": 1.9, + "learning_rate": 6.231271442146347e-07, + "loss": 0.668, + "step": 74245 + }, + { + "epoch": 1.9, + "learning_rate": 6.231015141859312e-07, + "loss": 0.667, + "step": 74246 + }, + { + "epoch": 1.9, + "learning_rate": 6.230758844458019e-07, + "loss": 0.5747, + "step": 74247 + }, + { + "epoch": 1.9, + "learning_rate": 6.230502549942662e-07, + "loss": 0.4698, + "step": 74248 + }, + { + "epoch": 1.9, + "learning_rate": 6.230246258313434e-07, + "loss": 0.7676, + "step": 74249 + }, + { + "epoch": 1.9, + "learning_rate": 6.229989969570533e-07, + "loss": 0.5454, + "step": 74250 + }, + { + "epoch": 1.9, + "learning_rate": 6.229733683714153e-07, + "loss": 0.6553, + "step": 74251 + }, + { + "epoch": 1.9, + "learning_rate": 6.229477400744496e-07, + "loss": 0.7046, + "step": 74252 + }, + { + "epoch": 1.9, + "learning_rate": 6.229221120661751e-07, + "loss": 0.6802, + "step": 74253 + }, + { + "epoch": 1.9, + "learning_rate": 6.228964843466123e-07, + "loss": 0.54, + "step": 74254 + }, + { + "epoch": 1.9, + "learning_rate": 6.228708569157799e-07, + "loss": 0.8535, + "step": 74255 + }, + { + "epoch": 1.9, + "learning_rate": 6.228452297736982e-07, + "loss": 0.7031, + "step": 74256 + }, + { + "epoch": 1.9, + "learning_rate": 6.228196029203865e-07, + "loss": 0.6777, + "step": 74257 + }, + { + "epoch": 1.9, + "learning_rate": 6.227939763558647e-07, + "loss": 0.6421, + "step": 74258 + }, + { + "epoch": 1.9, + "learning_rate": 6.227683500801518e-07, + "loss": 0.5811, + "step": 74259 + }, + { + "epoch": 1.9, + "learning_rate": 6.227427240932681e-07, + "loss": 0.6143, + "step": 74260 + }, + { + "epoch": 1.9, + "learning_rate": 6.227170983952327e-07, + "loss": 0.6553, + "step": 74261 + }, + { + "epoch": 1.9, + "learning_rate": 6.226914729860657e-07, + "loss": 0.5781, + "step": 74262 + }, + { + "epoch": 1.9, + "learning_rate": 6.226658478657862e-07, + "loss": 0.6042, + "step": 74263 + }, + { + "epoch": 1.9, + "learning_rate": 6.226402230344144e-07, + "loss": 0.6763, + "step": 74264 + }, + { + "epoch": 1.9, + "learning_rate": 6.226145984919695e-07, + "loss": 0.6445, + "step": 74265 + }, + { + "epoch": 1.9, + "learning_rate": 6.225889742384713e-07, + "loss": 0.3785, + "step": 74266 + }, + { + "epoch": 1.9, + "learning_rate": 6.225633502739393e-07, + "loss": 0.7451, + "step": 74267 + }, + { + "epoch": 1.9, + "learning_rate": 6.225377265983935e-07, + "loss": 0.5654, + "step": 74268 + }, + { + "epoch": 1.9, + "learning_rate": 6.22512103211853e-07, + "loss": 0.6592, + "step": 74269 + }, + { + "epoch": 1.9, + "learning_rate": 6.224864801143374e-07, + "loss": 0.5684, + "step": 74270 + }, + { + "epoch": 1.9, + "learning_rate": 6.224608573058668e-07, + "loss": 0.6797, + "step": 74271 + }, + { + "epoch": 1.9, + "learning_rate": 6.224352347864604e-07, + "loss": 0.6777, + "step": 74272 + }, + { + "epoch": 1.9, + "learning_rate": 6.224096125561382e-07, + "loss": 0.5317, + "step": 74273 + }, + { + "epoch": 1.9, + "learning_rate": 6.223839906149194e-07, + "loss": 0.6611, + "step": 74274 + }, + { + "epoch": 1.9, + "learning_rate": 6.223583689628238e-07, + "loss": 0.6904, + "step": 74275 + }, + { + "epoch": 1.9, + "learning_rate": 6.223327475998712e-07, + "loss": 0.6611, + "step": 74276 + }, + { + "epoch": 1.9, + "learning_rate": 6.223071265260809e-07, + "loss": 0.7314, + "step": 74277 + }, + { + "epoch": 1.9, + "learning_rate": 6.222815057414729e-07, + "loss": 0.6392, + "step": 74278 + }, + { + "epoch": 1.9, + "learning_rate": 6.222558852460666e-07, + "loss": 0.5962, + "step": 74279 + }, + { + "epoch": 1.9, + "learning_rate": 6.222302650398812e-07, + "loss": 0.7422, + "step": 74280 + }, + { + "epoch": 1.9, + "learning_rate": 6.222046451229371e-07, + "loss": 0.6694, + "step": 74281 + }, + { + "epoch": 1.9, + "learning_rate": 6.221790254952532e-07, + "loss": 0.6431, + "step": 74282 + }, + { + "epoch": 1.9, + "learning_rate": 6.221534061568497e-07, + "loss": 0.7188, + "step": 74283 + }, + { + "epoch": 1.9, + "learning_rate": 6.221277871077457e-07, + "loss": 0.6807, + "step": 74284 + }, + { + "epoch": 1.9, + "learning_rate": 6.221021683479612e-07, + "loss": 0.6514, + "step": 74285 + }, + { + "epoch": 1.9, + "learning_rate": 6.220765498775156e-07, + "loss": 0.6602, + "step": 74286 + }, + { + "epoch": 1.9, + "learning_rate": 6.220509316964288e-07, + "loss": 0.5645, + "step": 74287 + }, + { + "epoch": 1.9, + "learning_rate": 6.220253138047205e-07, + "loss": 0.6914, + "step": 74288 + }, + { + "epoch": 1.9, + "learning_rate": 6.219996962024096e-07, + "loss": 0.6577, + "step": 74289 + }, + { + "epoch": 1.9, + "learning_rate": 6.219740788895163e-07, + "loss": 0.6895, + "step": 74290 + }, + { + "epoch": 1.9, + "learning_rate": 6.2194846186606e-07, + "loss": 0.6304, + "step": 74291 + }, + { + "epoch": 1.9, + "learning_rate": 6.219228451320604e-07, + "loss": 0.6494, + "step": 74292 + }, + { + "epoch": 1.9, + "learning_rate": 6.218972286875372e-07, + "loss": 0.5435, + "step": 74293 + }, + { + "epoch": 1.9, + "learning_rate": 6.218716125325097e-07, + "loss": 0.5566, + "step": 74294 + }, + { + "epoch": 1.9, + "learning_rate": 6.218459966669979e-07, + "loss": 0.4165, + "step": 74295 + }, + { + "epoch": 1.9, + "learning_rate": 6.218203810910209e-07, + "loss": 0.6646, + "step": 74296 + }, + { + "epoch": 1.9, + "learning_rate": 6.217947658045991e-07, + "loss": 0.6816, + "step": 74297 + }, + { + "epoch": 1.9, + "learning_rate": 6.217691508077517e-07, + "loss": 0.7007, + "step": 74298 + }, + { + "epoch": 1.9, + "learning_rate": 6.217435361004979e-07, + "loss": 0.5537, + "step": 74299 + }, + { + "epoch": 1.9, + "learning_rate": 6.217179216828579e-07, + "loss": 0.6953, + "step": 74300 + }, + { + "epoch": 1.9, + "learning_rate": 6.216923075548509e-07, + "loss": 0.3933, + "step": 74301 + }, + { + "epoch": 1.9, + "learning_rate": 6.216666937164969e-07, + "loss": 0.7686, + "step": 74302 + }, + { + "epoch": 1.9, + "learning_rate": 6.216410801678152e-07, + "loss": 0.7988, + "step": 74303 + }, + { + "epoch": 1.9, + "learning_rate": 6.216154669088255e-07, + "loss": 0.6484, + "step": 74304 + }, + { + "epoch": 1.9, + "learning_rate": 6.215898539395474e-07, + "loss": 0.543, + "step": 74305 + }, + { + "epoch": 1.9, + "learning_rate": 6.215642412600006e-07, + "loss": 0.4124, + "step": 74306 + }, + { + "epoch": 1.9, + "learning_rate": 6.215386288702047e-07, + "loss": 0.6016, + "step": 74307 + }, + { + "epoch": 1.9, + "learning_rate": 6.215130167701794e-07, + "loss": 0.6318, + "step": 74308 + }, + { + "epoch": 1.9, + "learning_rate": 6.214874049599442e-07, + "loss": 0.6855, + "step": 74309 + }, + { + "epoch": 1.9, + "learning_rate": 6.214617934395186e-07, + "loss": 0.6523, + "step": 74310 + }, + { + "epoch": 1.9, + "learning_rate": 6.214361822089221e-07, + "loss": 0.5923, + "step": 74311 + }, + { + "epoch": 1.9, + "learning_rate": 6.214105712681748e-07, + "loss": 0.498, + "step": 74312 + }, + { + "epoch": 1.9, + "learning_rate": 6.213849606172957e-07, + "loss": 0.71, + "step": 74313 + }, + { + "epoch": 1.9, + "learning_rate": 6.21359350256305e-07, + "loss": 0.6602, + "step": 74314 + }, + { + "epoch": 1.9, + "learning_rate": 6.213337401852217e-07, + "loss": 0.6367, + "step": 74315 + }, + { + "epoch": 1.9, + "learning_rate": 6.213081304040662e-07, + "loss": 0.7158, + "step": 74316 + }, + { + "epoch": 1.9, + "learning_rate": 6.212825209128571e-07, + "loss": 0.6062, + "step": 74317 + }, + { + "epoch": 1.9, + "learning_rate": 6.212569117116153e-07, + "loss": 0.604, + "step": 74318 + }, + { + "epoch": 1.9, + "learning_rate": 6.212313028003593e-07, + "loss": 0.6396, + "step": 74319 + }, + { + "epoch": 1.9, + "learning_rate": 6.212056941791088e-07, + "loss": 0.666, + "step": 74320 + }, + { + "epoch": 1.9, + "learning_rate": 6.211800858478841e-07, + "loss": 0.6377, + "step": 74321 + }, + { + "epoch": 1.9, + "learning_rate": 6.211544778067039e-07, + "loss": 0.4697, + "step": 74322 + }, + { + "epoch": 1.9, + "learning_rate": 6.211288700555887e-07, + "loss": 0.6719, + "step": 74323 + }, + { + "epoch": 1.9, + "learning_rate": 6.211032625945576e-07, + "loss": 0.6528, + "step": 74324 + }, + { + "epoch": 1.9, + "learning_rate": 6.210776554236303e-07, + "loss": 0.5574, + "step": 74325 + }, + { + "epoch": 1.91, + "learning_rate": 6.210520485428263e-07, + "loss": 0.4536, + "step": 74326 + }, + { + "epoch": 1.91, + "learning_rate": 6.210264419521656e-07, + "loss": 0.7236, + "step": 74327 + }, + { + "epoch": 1.91, + "learning_rate": 6.210008356516676e-07, + "loss": 0.6084, + "step": 74328 + }, + { + "epoch": 1.91, + "learning_rate": 6.209752296413517e-07, + "loss": 0.7861, + "step": 74329 + }, + { + "epoch": 1.91, + "learning_rate": 6.209496239212372e-07, + "loss": 0.6689, + "step": 74330 + }, + { + "epoch": 1.91, + "learning_rate": 6.209240184913447e-07, + "loss": 0.6377, + "step": 74331 + }, + { + "epoch": 1.91, + "learning_rate": 6.208984133516929e-07, + "loss": 0.4048, + "step": 74332 + }, + { + "epoch": 1.91, + "learning_rate": 6.208728085023021e-07, + "loss": 0.5945, + "step": 74333 + }, + { + "epoch": 1.91, + "learning_rate": 6.208472039431912e-07, + "loss": 0.6582, + "step": 74334 + }, + { + "epoch": 1.91, + "learning_rate": 6.208215996743803e-07, + "loss": 0.7754, + "step": 74335 + }, + { + "epoch": 1.91, + "learning_rate": 6.207959956958888e-07, + "loss": 0.6333, + "step": 74336 + }, + { + "epoch": 1.91, + "learning_rate": 6.207703920077365e-07, + "loss": 0.6758, + "step": 74337 + }, + { + "epoch": 1.91, + "learning_rate": 6.20744788609943e-07, + "loss": 0.7051, + "step": 74338 + }, + { + "epoch": 1.91, + "learning_rate": 6.207191855025276e-07, + "loss": 0.6021, + "step": 74339 + }, + { + "epoch": 1.91, + "learning_rate": 6.206935826855101e-07, + "loss": 0.8379, + "step": 74340 + }, + { + "epoch": 1.91, + "learning_rate": 6.206679801589099e-07, + "loss": 0.4919, + "step": 74341 + }, + { + "epoch": 1.91, + "learning_rate": 6.20642377922747e-07, + "loss": 0.3822, + "step": 74342 + }, + { + "epoch": 1.91, + "learning_rate": 6.206167759770407e-07, + "loss": 0.6084, + "step": 74343 + }, + { + "epoch": 1.91, + "learning_rate": 6.205911743218106e-07, + "loss": 0.6274, + "step": 74344 + }, + { + "epoch": 1.91, + "learning_rate": 6.205655729570765e-07, + "loss": 0.6523, + "step": 74345 + }, + { + "epoch": 1.91, + "learning_rate": 6.205399718828579e-07, + "loss": 0.647, + "step": 74346 + }, + { + "epoch": 1.91, + "learning_rate": 6.205143710991743e-07, + "loss": 0.6509, + "step": 74347 + }, + { + "epoch": 1.91, + "learning_rate": 6.20488770606046e-07, + "loss": 0.4719, + "step": 74348 + }, + { + "epoch": 1.91, + "learning_rate": 6.204631704034914e-07, + "loss": 0.6475, + "step": 74349 + }, + { + "epoch": 1.91, + "learning_rate": 6.204375704915308e-07, + "loss": 0.5366, + "step": 74350 + }, + { + "epoch": 1.91, + "learning_rate": 6.204119708701836e-07, + "loss": 0.4897, + "step": 74351 + }, + { + "epoch": 1.91, + "learning_rate": 6.203863715394697e-07, + "loss": 0.6729, + "step": 74352 + }, + { + "epoch": 1.91, + "learning_rate": 6.203607724994082e-07, + "loss": 0.5967, + "step": 74353 + }, + { + "epoch": 1.91, + "learning_rate": 6.203351737500193e-07, + "loss": 0.635, + "step": 74354 + }, + { + "epoch": 1.91, + "learning_rate": 6.203095752913221e-07, + "loss": 0.5386, + "step": 74355 + }, + { + "epoch": 1.91, + "learning_rate": 6.202839771233366e-07, + "loss": 0.6211, + "step": 74356 + }, + { + "epoch": 1.91, + "learning_rate": 6.202583792460819e-07, + "loss": 0.8125, + "step": 74357 + }, + { + "epoch": 1.91, + "learning_rate": 6.202327816595784e-07, + "loss": 0.5254, + "step": 74358 + }, + { + "epoch": 1.91, + "learning_rate": 6.20207184363845e-07, + "loss": 0.6494, + "step": 74359 + }, + { + "epoch": 1.91, + "learning_rate": 6.201815873589012e-07, + "loss": 0.6646, + "step": 74360 + }, + { + "epoch": 1.91, + "learning_rate": 6.201559906447672e-07, + "loss": 0.5796, + "step": 74361 + }, + { + "epoch": 1.91, + "learning_rate": 6.20130394221462e-07, + "loss": 0.6714, + "step": 74362 + }, + { + "epoch": 1.91, + "learning_rate": 6.201047980890057e-07, + "loss": 0.5796, + "step": 74363 + }, + { + "epoch": 1.91, + "learning_rate": 6.200792022474175e-07, + "loss": 0.6836, + "step": 74364 + }, + { + "epoch": 1.91, + "learning_rate": 6.200536066967175e-07, + "loss": 0.5085, + "step": 74365 + }, + { + "epoch": 1.91, + "learning_rate": 6.200280114369249e-07, + "loss": 0.6943, + "step": 74366 + }, + { + "epoch": 1.91, + "learning_rate": 6.20002416468059e-07, + "loss": 0.6128, + "step": 74367 + }, + { + "epoch": 1.91, + "learning_rate": 6.199768217901405e-07, + "loss": 0.5532, + "step": 74368 + }, + { + "epoch": 1.91, + "learning_rate": 6.19951227403188e-07, + "loss": 0.6436, + "step": 74369 + }, + { + "epoch": 1.91, + "learning_rate": 6.199256333072211e-07, + "loss": 0.5715, + "step": 74370 + }, + { + "epoch": 1.91, + "learning_rate": 6.199000395022597e-07, + "loss": 0.5654, + "step": 74371 + }, + { + "epoch": 1.91, + "learning_rate": 6.198744459883234e-07, + "loss": 0.5979, + "step": 74372 + }, + { + "epoch": 1.91, + "learning_rate": 6.198488527654319e-07, + "loss": 0.7109, + "step": 74373 + }, + { + "epoch": 1.91, + "learning_rate": 6.198232598336044e-07, + "loss": 0.5547, + "step": 74374 + }, + { + "epoch": 1.91, + "learning_rate": 6.19797667192861e-07, + "loss": 0.6987, + "step": 74375 + }, + { + "epoch": 1.91, + "learning_rate": 6.197720748432208e-07, + "loss": 0.7305, + "step": 74376 + }, + { + "epoch": 1.91, + "learning_rate": 6.197464827847038e-07, + "loss": 0.5723, + "step": 74377 + }, + { + "epoch": 1.91, + "learning_rate": 6.197208910173297e-07, + "loss": 0.5903, + "step": 74378 + }, + { + "epoch": 1.91, + "learning_rate": 6.196952995411175e-07, + "loss": 0.668, + "step": 74379 + }, + { + "epoch": 1.91, + "learning_rate": 6.196697083560872e-07, + "loss": 0.5571, + "step": 74380 + }, + { + "epoch": 1.91, + "learning_rate": 6.196441174622582e-07, + "loss": 0.6426, + "step": 74381 + }, + { + "epoch": 1.91, + "learning_rate": 6.196185268596503e-07, + "loss": 0.8018, + "step": 74382 + }, + { + "epoch": 1.91, + "learning_rate": 6.195929365482831e-07, + "loss": 0.6484, + "step": 74383 + }, + { + "epoch": 1.91, + "learning_rate": 6.195673465281759e-07, + "loss": 0.4929, + "step": 74384 + }, + { + "epoch": 1.91, + "learning_rate": 6.195417567993486e-07, + "loss": 0.5996, + "step": 74385 + }, + { + "epoch": 1.91, + "learning_rate": 6.195161673618207e-07, + "loss": 0.7705, + "step": 74386 + }, + { + "epoch": 1.91, + "learning_rate": 6.194905782156117e-07, + "loss": 0.4285, + "step": 74387 + }, + { + "epoch": 1.91, + "learning_rate": 6.194649893607416e-07, + "loss": 0.5938, + "step": 74388 + }, + { + "epoch": 1.91, + "learning_rate": 6.194394007972293e-07, + "loss": 0.6875, + "step": 74389 + }, + { + "epoch": 1.91, + "learning_rate": 6.19413812525095e-07, + "loss": 0.7725, + "step": 74390 + }, + { + "epoch": 1.91, + "learning_rate": 6.193882245443577e-07, + "loss": 0.4868, + "step": 74391 + }, + { + "epoch": 1.91, + "learning_rate": 6.193626368550376e-07, + "loss": 0.5806, + "step": 74392 + }, + { + "epoch": 1.91, + "learning_rate": 6.193370494571537e-07, + "loss": 0.4178, + "step": 74393 + }, + { + "epoch": 1.91, + "learning_rate": 6.193114623507263e-07, + "loss": 0.71, + "step": 74394 + }, + { + "epoch": 1.91, + "learning_rate": 6.192858755357743e-07, + "loss": 0.6548, + "step": 74395 + }, + { + "epoch": 1.91, + "learning_rate": 6.192602890123179e-07, + "loss": 0.7031, + "step": 74396 + }, + { + "epoch": 1.91, + "learning_rate": 6.192347027803761e-07, + "loss": 0.5068, + "step": 74397 + }, + { + "epoch": 1.91, + "learning_rate": 6.192091168399691e-07, + "loss": 0.3925, + "step": 74398 + }, + { + "epoch": 1.91, + "learning_rate": 6.191835311911162e-07, + "loss": 0.6973, + "step": 74399 + }, + { + "epoch": 1.91, + "learning_rate": 6.191579458338368e-07, + "loss": 0.6562, + "step": 74400 + }, + { + "epoch": 1.91, + "learning_rate": 6.191323607681505e-07, + "loss": 0.7354, + "step": 74401 + }, + { + "epoch": 1.91, + "learning_rate": 6.191067759940772e-07, + "loss": 0.6387, + "step": 74402 + }, + { + "epoch": 1.91, + "learning_rate": 6.19081191511636e-07, + "loss": 0.4043, + "step": 74403 + }, + { + "epoch": 1.91, + "learning_rate": 6.190556073208472e-07, + "loss": 0.7236, + "step": 74404 + }, + { + "epoch": 1.91, + "learning_rate": 6.190300234217299e-07, + "loss": 0.5225, + "step": 74405 + }, + { + "epoch": 1.91, + "learning_rate": 6.190044398143038e-07, + "loss": 0.5444, + "step": 74406 + }, + { + "epoch": 1.91, + "learning_rate": 6.189788564985883e-07, + "loss": 0.7773, + "step": 74407 + }, + { + "epoch": 1.91, + "learning_rate": 6.189532734746037e-07, + "loss": 0.6338, + "step": 74408 + }, + { + "epoch": 1.91, + "learning_rate": 6.189276907423689e-07, + "loss": 0.6289, + "step": 74409 + }, + { + "epoch": 1.91, + "learning_rate": 6.189021083019032e-07, + "loss": 0.7744, + "step": 74410 + }, + { + "epoch": 1.91, + "learning_rate": 6.18876526153227e-07, + "loss": 0.5669, + "step": 74411 + }, + { + "epoch": 1.91, + "learning_rate": 6.188509442963592e-07, + "loss": 0.6836, + "step": 74412 + }, + { + "epoch": 1.91, + "learning_rate": 6.1882536273132e-07, + "loss": 0.5347, + "step": 74413 + }, + { + "epoch": 1.91, + "learning_rate": 6.187997814581285e-07, + "loss": 0.7373, + "step": 74414 + }, + { + "epoch": 1.91, + "learning_rate": 6.187742004768046e-07, + "loss": 0.6191, + "step": 74415 + }, + { + "epoch": 1.91, + "learning_rate": 6.187486197873677e-07, + "loss": 0.5537, + "step": 74416 + }, + { + "epoch": 1.91, + "learning_rate": 6.187230393898375e-07, + "loss": 0.5791, + "step": 74417 + }, + { + "epoch": 1.91, + "learning_rate": 6.186974592842338e-07, + "loss": 0.6602, + "step": 74418 + }, + { + "epoch": 1.91, + "learning_rate": 6.186718794705758e-07, + "loss": 0.6182, + "step": 74419 + }, + { + "epoch": 1.91, + "learning_rate": 6.186462999488829e-07, + "loss": 0.6387, + "step": 74420 + }, + { + "epoch": 1.91, + "learning_rate": 6.186207207191751e-07, + "loss": 0.7378, + "step": 74421 + }, + { + "epoch": 1.91, + "learning_rate": 6.185951417814719e-07, + "loss": 0.5996, + "step": 74422 + }, + { + "epoch": 1.91, + "learning_rate": 6.185695631357931e-07, + "loss": 0.668, + "step": 74423 + }, + { + "epoch": 1.91, + "learning_rate": 6.185439847821576e-07, + "loss": 0.6196, + "step": 74424 + }, + { + "epoch": 1.91, + "learning_rate": 6.185184067205858e-07, + "loss": 0.6685, + "step": 74425 + }, + { + "epoch": 1.91, + "learning_rate": 6.184928289510967e-07, + "loss": 0.6084, + "step": 74426 + }, + { + "epoch": 1.91, + "learning_rate": 6.184672514737101e-07, + "loss": 0.5522, + "step": 74427 + }, + { + "epoch": 1.91, + "learning_rate": 6.184416742884459e-07, + "loss": 0.6577, + "step": 74428 + }, + { + "epoch": 1.91, + "learning_rate": 6.184160973953232e-07, + "loss": 0.7158, + "step": 74429 + }, + { + "epoch": 1.91, + "learning_rate": 6.183905207943617e-07, + "loss": 0.8486, + "step": 74430 + }, + { + "epoch": 1.91, + "learning_rate": 6.183649444855809e-07, + "loss": 0.6914, + "step": 74431 + }, + { + "epoch": 1.91, + "learning_rate": 6.183393684690007e-07, + "loss": 0.6353, + "step": 74432 + }, + { + "epoch": 1.91, + "learning_rate": 6.183137927446402e-07, + "loss": 0.5532, + "step": 74433 + }, + { + "epoch": 1.91, + "learning_rate": 6.182882173125197e-07, + "loss": 0.5273, + "step": 74434 + }, + { + "epoch": 1.91, + "learning_rate": 6.18262642172658e-07, + "loss": 0.5459, + "step": 74435 + }, + { + "epoch": 1.91, + "learning_rate": 6.182370673250752e-07, + "loss": 0.7002, + "step": 74436 + }, + { + "epoch": 1.91, + "learning_rate": 6.182114927697907e-07, + "loss": 0.5439, + "step": 74437 + }, + { + "epoch": 1.91, + "learning_rate": 6.181859185068245e-07, + "loss": 0.5566, + "step": 74438 + }, + { + "epoch": 1.91, + "learning_rate": 6.181603445361954e-07, + "loss": 0.6753, + "step": 74439 + }, + { + "epoch": 1.91, + "learning_rate": 6.181347708579234e-07, + "loss": 0.6685, + "step": 74440 + }, + { + "epoch": 1.91, + "learning_rate": 6.181091974720279e-07, + "loss": 0.5903, + "step": 74441 + }, + { + "epoch": 1.91, + "learning_rate": 6.180836243785289e-07, + "loss": 0.8291, + "step": 74442 + }, + { + "epoch": 1.91, + "learning_rate": 6.180580515774454e-07, + "loss": 0.5889, + "step": 74443 + }, + { + "epoch": 1.91, + "learning_rate": 6.180324790687976e-07, + "loss": 0.4854, + "step": 74444 + }, + { + "epoch": 1.91, + "learning_rate": 6.180069068526043e-07, + "loss": 0.5571, + "step": 74445 + }, + { + "epoch": 1.91, + "learning_rate": 6.179813349288861e-07, + "loss": 0.8027, + "step": 74446 + }, + { + "epoch": 1.91, + "learning_rate": 6.179557632976618e-07, + "loss": 0.6729, + "step": 74447 + }, + { + "epoch": 1.91, + "learning_rate": 6.179301919589514e-07, + "loss": 0.6416, + "step": 74448 + }, + { + "epoch": 1.91, + "learning_rate": 6.179046209127741e-07, + "loss": 0.6016, + "step": 74449 + }, + { + "epoch": 1.91, + "learning_rate": 6.178790501591495e-07, + "loss": 0.8164, + "step": 74450 + }, + { + "epoch": 1.91, + "learning_rate": 6.178534796980976e-07, + "loss": 0.7305, + "step": 74451 + }, + { + "epoch": 1.91, + "learning_rate": 6.178279095296375e-07, + "loss": 0.5913, + "step": 74452 + }, + { + "epoch": 1.91, + "learning_rate": 6.178023396537891e-07, + "loss": 0.5342, + "step": 74453 + }, + { + "epoch": 1.91, + "learning_rate": 6.177767700705719e-07, + "loss": 0.6089, + "step": 74454 + }, + { + "epoch": 1.91, + "learning_rate": 6.177512007800054e-07, + "loss": 0.6421, + "step": 74455 + }, + { + "epoch": 1.91, + "learning_rate": 6.177256317821093e-07, + "loss": 0.4812, + "step": 74456 + }, + { + "epoch": 1.91, + "learning_rate": 6.177000630769029e-07, + "loss": 0.5354, + "step": 74457 + }, + { + "epoch": 1.91, + "learning_rate": 6.176744946644066e-07, + "loss": 0.5541, + "step": 74458 + }, + { + "epoch": 1.91, + "learning_rate": 6.17648926544639e-07, + "loss": 0.6396, + "step": 74459 + }, + { + "epoch": 1.91, + "learning_rate": 6.176233587176197e-07, + "loss": 0.6729, + "step": 74460 + }, + { + "epoch": 1.91, + "learning_rate": 6.175977911833689e-07, + "loss": 0.7036, + "step": 74461 + }, + { + "epoch": 1.91, + "learning_rate": 6.175722239419058e-07, + "loss": 0.7041, + "step": 74462 + }, + { + "epoch": 1.91, + "learning_rate": 6.175466569932502e-07, + "loss": 0.5552, + "step": 74463 + }, + { + "epoch": 1.91, + "learning_rate": 6.175210903374213e-07, + "loss": 0.6167, + "step": 74464 + }, + { + "epoch": 1.91, + "learning_rate": 6.174955239744392e-07, + "loss": 0.7705, + "step": 74465 + }, + { + "epoch": 1.91, + "learning_rate": 6.174699579043229e-07, + "loss": 0.5063, + "step": 74466 + }, + { + "epoch": 1.91, + "learning_rate": 6.174443921270924e-07, + "loss": 0.7842, + "step": 74467 + }, + { + "epoch": 1.91, + "learning_rate": 6.174188266427676e-07, + "loss": 0.7412, + "step": 74468 + }, + { + "epoch": 1.91, + "learning_rate": 6.173932614513669e-07, + "loss": 0.5776, + "step": 74469 + }, + { + "epoch": 1.91, + "learning_rate": 6.173676965529109e-07, + "loss": 0.6494, + "step": 74470 + }, + { + "epoch": 1.91, + "learning_rate": 6.173421319474188e-07, + "loss": 0.7236, + "step": 74471 + }, + { + "epoch": 1.91, + "learning_rate": 6.173165676349102e-07, + "loss": 0.5864, + "step": 74472 + }, + { + "epoch": 1.91, + "learning_rate": 6.172910036154049e-07, + "loss": 0.7305, + "step": 74473 + }, + { + "epoch": 1.91, + "learning_rate": 6.17265439888922e-07, + "loss": 0.7617, + "step": 74474 + }, + { + "epoch": 1.91, + "learning_rate": 6.172398764554816e-07, + "loss": 0.5854, + "step": 74475 + }, + { + "epoch": 1.91, + "learning_rate": 6.172143133151027e-07, + "loss": 0.7285, + "step": 74476 + }, + { + "epoch": 1.91, + "learning_rate": 6.171887504678058e-07, + "loss": 0.498, + "step": 74477 + }, + { + "epoch": 1.91, + "learning_rate": 6.171631879136096e-07, + "loss": 0.543, + "step": 74478 + }, + { + "epoch": 1.91, + "learning_rate": 6.171376256525335e-07, + "loss": 0.689, + "step": 74479 + }, + { + "epoch": 1.91, + "learning_rate": 6.171120636845981e-07, + "loss": 0.7139, + "step": 74480 + }, + { + "epoch": 1.91, + "learning_rate": 6.170865020098219e-07, + "loss": 0.6187, + "step": 74481 + }, + { + "epoch": 1.91, + "learning_rate": 6.170609406282255e-07, + "loss": 0.6172, + "step": 74482 + }, + { + "epoch": 1.91, + "learning_rate": 6.170353795398273e-07, + "loss": 0.4465, + "step": 74483 + }, + { + "epoch": 1.91, + "learning_rate": 6.17009818744648e-07, + "loss": 0.7178, + "step": 74484 + }, + { + "epoch": 1.91, + "learning_rate": 6.169842582427063e-07, + "loss": 0.5269, + "step": 74485 + }, + { + "epoch": 1.91, + "learning_rate": 6.169586980340224e-07, + "loss": 0.7256, + "step": 74486 + }, + { + "epoch": 1.91, + "learning_rate": 6.169331381186159e-07, + "loss": 0.5493, + "step": 74487 + }, + { + "epoch": 1.91, + "learning_rate": 6.169075784965057e-07, + "loss": 0.5801, + "step": 74488 + }, + { + "epoch": 1.91, + "learning_rate": 6.168820191677117e-07, + "loss": 0.6899, + "step": 74489 + }, + { + "epoch": 1.91, + "learning_rate": 6.168564601322537e-07, + "loss": 0.6484, + "step": 74490 + }, + { + "epoch": 1.91, + "learning_rate": 6.168309013901509e-07, + "loss": 0.6172, + "step": 74491 + }, + { + "epoch": 1.91, + "learning_rate": 6.168053429414233e-07, + "loss": 0.6963, + "step": 74492 + }, + { + "epoch": 1.91, + "learning_rate": 6.167797847860898e-07, + "loss": 0.6035, + "step": 74493 + }, + { + "epoch": 1.91, + "learning_rate": 6.167542269241709e-07, + "loss": 0.7109, + "step": 74494 + }, + { + "epoch": 1.91, + "learning_rate": 6.167286693556852e-07, + "loss": 0.6577, + "step": 74495 + }, + { + "epoch": 1.91, + "learning_rate": 6.167031120806531e-07, + "loss": 0.479, + "step": 74496 + }, + { + "epoch": 1.91, + "learning_rate": 6.16677555099094e-07, + "loss": 0.6733, + "step": 74497 + }, + { + "epoch": 1.91, + "learning_rate": 6.166519984110269e-07, + "loss": 0.709, + "step": 74498 + }, + { + "epoch": 1.91, + "learning_rate": 6.166264420164719e-07, + "loss": 0.5669, + "step": 74499 + }, + { + "epoch": 1.91, + "learning_rate": 6.166008859154481e-07, + "loss": 0.5723, + "step": 74500 + }, + { + "epoch": 1.91, + "learning_rate": 6.165753301079757e-07, + "loss": 0.5898, + "step": 74501 + }, + { + "epoch": 1.91, + "learning_rate": 6.165497745940736e-07, + "loss": 0.6504, + "step": 74502 + }, + { + "epoch": 1.91, + "learning_rate": 6.165242193737621e-07, + "loss": 0.5854, + "step": 74503 + }, + { + "epoch": 1.91, + "learning_rate": 6.1649866444706e-07, + "loss": 0.6553, + "step": 74504 + }, + { + "epoch": 1.91, + "learning_rate": 6.164731098139875e-07, + "loss": 0.7402, + "step": 74505 + }, + { + "epoch": 1.91, + "learning_rate": 6.164475554745637e-07, + "loss": 0.6077, + "step": 74506 + }, + { + "epoch": 1.91, + "learning_rate": 6.164220014288091e-07, + "loss": 0.6436, + "step": 74507 + }, + { + "epoch": 1.91, + "learning_rate": 6.163964476767418e-07, + "loss": 0.6914, + "step": 74508 + }, + { + "epoch": 1.91, + "learning_rate": 6.163708942183823e-07, + "loss": 0.6421, + "step": 74509 + }, + { + "epoch": 1.91, + "learning_rate": 6.163453410537498e-07, + "loss": 0.6973, + "step": 74510 + }, + { + "epoch": 1.91, + "learning_rate": 6.163197881828642e-07, + "loss": 0.519, + "step": 74511 + }, + { + "epoch": 1.91, + "learning_rate": 6.162942356057447e-07, + "loss": 0.4932, + "step": 74512 + }, + { + "epoch": 1.91, + "learning_rate": 6.162686833224114e-07, + "loss": 0.7236, + "step": 74513 + }, + { + "epoch": 1.91, + "learning_rate": 6.162431313328831e-07, + "loss": 0.8545, + "step": 74514 + }, + { + "epoch": 1.91, + "learning_rate": 6.162175796371801e-07, + "loss": 0.6641, + "step": 74515 + }, + { + "epoch": 1.91, + "learning_rate": 6.161920282353214e-07, + "loss": 0.5244, + "step": 74516 + }, + { + "epoch": 1.91, + "learning_rate": 6.161664771273272e-07, + "loss": 0.8438, + "step": 74517 + }, + { + "epoch": 1.91, + "learning_rate": 6.161409263132167e-07, + "loss": 0.5356, + "step": 74518 + }, + { + "epoch": 1.91, + "learning_rate": 6.16115375793009e-07, + "loss": 0.7188, + "step": 74519 + }, + { + "epoch": 1.91, + "learning_rate": 6.160898255667244e-07, + "loss": 0.5474, + "step": 74520 + }, + { + "epoch": 1.91, + "learning_rate": 6.160642756343819e-07, + "loss": 0.7139, + "step": 74521 + }, + { + "epoch": 1.91, + "learning_rate": 6.160387259960016e-07, + "loss": 0.6416, + "step": 74522 + }, + { + "epoch": 1.91, + "learning_rate": 6.160131766516026e-07, + "loss": 0.5002, + "step": 74523 + }, + { + "epoch": 1.91, + "learning_rate": 6.159876276012048e-07, + "loss": 0.3545, + "step": 74524 + }, + { + "epoch": 1.91, + "learning_rate": 6.159620788448275e-07, + "loss": 0.5947, + "step": 74525 + }, + { + "epoch": 1.91, + "learning_rate": 6.159365303824905e-07, + "loss": 0.5635, + "step": 74526 + }, + { + "epoch": 1.91, + "learning_rate": 6.159109822142135e-07, + "loss": 0.6934, + "step": 74527 + }, + { + "epoch": 1.91, + "learning_rate": 6.158854343400155e-07, + "loss": 0.6235, + "step": 74528 + }, + { + "epoch": 1.91, + "learning_rate": 6.158598867599163e-07, + "loss": 0.583, + "step": 74529 + }, + { + "epoch": 1.91, + "learning_rate": 6.158343394739356e-07, + "loss": 0.5117, + "step": 74530 + }, + { + "epoch": 1.91, + "learning_rate": 6.158087924820927e-07, + "loss": 0.6562, + "step": 74531 + }, + { + "epoch": 1.91, + "learning_rate": 6.157832457844076e-07, + "loss": 0.4722, + "step": 74532 + }, + { + "epoch": 1.91, + "learning_rate": 6.157576993808992e-07, + "loss": 0.7168, + "step": 74533 + }, + { + "epoch": 1.91, + "learning_rate": 6.15732153271588e-07, + "loss": 0.6357, + "step": 74534 + }, + { + "epoch": 1.91, + "learning_rate": 6.157066074564927e-07, + "loss": 0.6602, + "step": 74535 + }, + { + "epoch": 1.91, + "learning_rate": 6.156810619356332e-07, + "loss": 0.4004, + "step": 74536 + }, + { + "epoch": 1.91, + "learning_rate": 6.156555167090293e-07, + "loss": 0.6108, + "step": 74537 + }, + { + "epoch": 1.91, + "learning_rate": 6.156299717767002e-07, + "loss": 0.5522, + "step": 74538 + }, + { + "epoch": 1.91, + "learning_rate": 6.156044271386655e-07, + "loss": 0.6855, + "step": 74539 + }, + { + "epoch": 1.91, + "learning_rate": 6.155788827949446e-07, + "loss": 0.5327, + "step": 74540 + }, + { + "epoch": 1.91, + "learning_rate": 6.155533387455575e-07, + "loss": 0.749, + "step": 74541 + }, + { + "epoch": 1.91, + "learning_rate": 6.155277949905233e-07, + "loss": 0.6299, + "step": 74542 + }, + { + "epoch": 1.91, + "learning_rate": 6.15502251529862e-07, + "loss": 0.6528, + "step": 74543 + }, + { + "epoch": 1.91, + "learning_rate": 6.154767083635929e-07, + "loss": 0.4307, + "step": 74544 + }, + { + "epoch": 1.91, + "learning_rate": 6.154511654917356e-07, + "loss": 0.4058, + "step": 74545 + }, + { + "epoch": 1.91, + "learning_rate": 6.154256229143098e-07, + "loss": 0.5269, + "step": 74546 + }, + { + "epoch": 1.91, + "learning_rate": 6.154000806313351e-07, + "loss": 0.7178, + "step": 74547 + }, + { + "epoch": 1.91, + "learning_rate": 6.153745386428304e-07, + "loss": 0.4888, + "step": 74548 + }, + { + "epoch": 1.91, + "learning_rate": 6.153489969488159e-07, + "loss": 0.5731, + "step": 74549 + }, + { + "epoch": 1.91, + "learning_rate": 6.153234555493109e-07, + "loss": 0.8184, + "step": 74550 + }, + { + "epoch": 1.91, + "learning_rate": 6.152979144443352e-07, + "loss": 0.707, + "step": 74551 + }, + { + "epoch": 1.91, + "learning_rate": 6.15272373633908e-07, + "loss": 0.709, + "step": 74552 + }, + { + "epoch": 1.91, + "learning_rate": 6.152468331180493e-07, + "loss": 0.5698, + "step": 74553 + }, + { + "epoch": 1.91, + "learning_rate": 6.152212928967781e-07, + "loss": 0.6719, + "step": 74554 + }, + { + "epoch": 1.91, + "learning_rate": 6.151957529701146e-07, + "loss": 0.6201, + "step": 74555 + }, + { + "epoch": 1.91, + "learning_rate": 6.151702133380776e-07, + "loss": 0.7236, + "step": 74556 + }, + { + "epoch": 1.91, + "learning_rate": 6.151446740006877e-07, + "loss": 0.6116, + "step": 74557 + }, + { + "epoch": 1.91, + "learning_rate": 6.151191349579636e-07, + "loss": 0.623, + "step": 74558 + }, + { + "epoch": 1.91, + "learning_rate": 6.150935962099247e-07, + "loss": 0.7568, + "step": 74559 + }, + { + "epoch": 1.91, + "learning_rate": 6.150680577565913e-07, + "loss": 0.6826, + "step": 74560 + }, + { + "epoch": 1.91, + "learning_rate": 6.150425195979824e-07, + "loss": 0.6016, + "step": 74561 + }, + { + "epoch": 1.91, + "learning_rate": 6.150169817341179e-07, + "loss": 0.6719, + "step": 74562 + }, + { + "epoch": 1.91, + "learning_rate": 6.149914441650172e-07, + "loss": 0.6079, + "step": 74563 + }, + { + "epoch": 1.91, + "learning_rate": 6.149659068906996e-07, + "loss": 0.4456, + "step": 74564 + }, + { + "epoch": 1.91, + "learning_rate": 6.14940369911185e-07, + "loss": 0.8311, + "step": 74565 + }, + { + "epoch": 1.91, + "learning_rate": 6.149148332264929e-07, + "loss": 0.7607, + "step": 74566 + }, + { + "epoch": 1.91, + "learning_rate": 6.14889296836643e-07, + "loss": 0.5437, + "step": 74567 + }, + { + "epoch": 1.91, + "learning_rate": 6.148637607416546e-07, + "loss": 0.6111, + "step": 74568 + }, + { + "epoch": 1.91, + "learning_rate": 6.148382249415471e-07, + "loss": 0.5928, + "step": 74569 + }, + { + "epoch": 1.91, + "learning_rate": 6.148126894363403e-07, + "loss": 0.6182, + "step": 74570 + }, + { + "epoch": 1.91, + "learning_rate": 6.147871542260536e-07, + "loss": 0.5952, + "step": 74571 + }, + { + "epoch": 1.91, + "learning_rate": 6.147616193107071e-07, + "loss": 0.6543, + "step": 74572 + }, + { + "epoch": 1.91, + "learning_rate": 6.147360846903193e-07, + "loss": 0.5562, + "step": 74573 + }, + { + "epoch": 1.91, + "learning_rate": 6.147105503649109e-07, + "loss": 0.5129, + "step": 74574 + }, + { + "epoch": 1.91, + "learning_rate": 6.146850163345005e-07, + "loss": 0.6699, + "step": 74575 + }, + { + "epoch": 1.91, + "learning_rate": 6.146594825991084e-07, + "loss": 0.6045, + "step": 74576 + }, + { + "epoch": 1.91, + "learning_rate": 6.14633949158754e-07, + "loss": 0.6338, + "step": 74577 + }, + { + "epoch": 1.91, + "learning_rate": 6.146084160134561e-07, + "loss": 0.7754, + "step": 74578 + }, + { + "epoch": 1.91, + "learning_rate": 6.145828831632353e-07, + "loss": 0.6855, + "step": 74579 + }, + { + "epoch": 1.91, + "learning_rate": 6.145573506081106e-07, + "loss": 0.6143, + "step": 74580 + }, + { + "epoch": 1.91, + "learning_rate": 6.145318183481012e-07, + "loss": 0.75, + "step": 74581 + }, + { + "epoch": 1.91, + "learning_rate": 6.145062863832273e-07, + "loss": 0.4277, + "step": 74582 + }, + { + "epoch": 1.91, + "learning_rate": 6.144807547135082e-07, + "loss": 0.4888, + "step": 74583 + }, + { + "epoch": 1.91, + "learning_rate": 6.144552233389635e-07, + "loss": 0.6411, + "step": 74584 + }, + { + "epoch": 1.91, + "learning_rate": 6.144296922596127e-07, + "loss": 0.6216, + "step": 74585 + }, + { + "epoch": 1.91, + "learning_rate": 6.144041614754753e-07, + "loss": 0.7012, + "step": 74586 + }, + { + "epoch": 1.91, + "learning_rate": 6.143786309865712e-07, + "loss": 0.4536, + "step": 74587 + }, + { + "epoch": 1.91, + "learning_rate": 6.143531007929193e-07, + "loss": 0.6313, + "step": 74588 + }, + { + "epoch": 1.91, + "learning_rate": 6.143275708945397e-07, + "loss": 0.6538, + "step": 74589 + }, + { + "epoch": 1.91, + "learning_rate": 6.143020412914514e-07, + "loss": 0.6367, + "step": 74590 + }, + { + "epoch": 1.91, + "learning_rate": 6.142765119836748e-07, + "loss": 0.5945, + "step": 74591 + }, + { + "epoch": 1.91, + "learning_rate": 6.142509829712286e-07, + "loss": 0.6621, + "step": 74592 + }, + { + "epoch": 1.91, + "learning_rate": 6.142254542541327e-07, + "loss": 0.7207, + "step": 74593 + }, + { + "epoch": 1.91, + "learning_rate": 6.141999258324066e-07, + "loss": 0.5818, + "step": 74594 + }, + { + "epoch": 1.91, + "learning_rate": 6.1417439770607e-07, + "loss": 0.6499, + "step": 74595 + }, + { + "epoch": 1.91, + "learning_rate": 6.141488698751423e-07, + "loss": 0.6284, + "step": 74596 + }, + { + "epoch": 1.91, + "learning_rate": 6.141233423396434e-07, + "loss": 0.666, + "step": 74597 + }, + { + "epoch": 1.91, + "learning_rate": 6.140978150995921e-07, + "loss": 0.7207, + "step": 74598 + }, + { + "epoch": 1.91, + "learning_rate": 6.140722881550084e-07, + "loss": 0.6499, + "step": 74599 + }, + { + "epoch": 1.91, + "learning_rate": 6.140467615059118e-07, + "loss": 0.2649, + "step": 74600 + }, + { + "epoch": 1.91, + "learning_rate": 6.14021235152322e-07, + "loss": 0.6055, + "step": 74601 + }, + { + "epoch": 1.91, + "learning_rate": 6.139957090942581e-07, + "loss": 0.4177, + "step": 74602 + }, + { + "epoch": 1.91, + "learning_rate": 6.139701833317403e-07, + "loss": 0.6289, + "step": 74603 + }, + { + "epoch": 1.91, + "learning_rate": 6.139446578647873e-07, + "loss": 0.4768, + "step": 74604 + }, + { + "epoch": 1.91, + "learning_rate": 6.139191326934196e-07, + "loss": 0.5198, + "step": 74605 + }, + { + "epoch": 1.91, + "learning_rate": 6.13893607817656e-07, + "loss": 0.5645, + "step": 74606 + }, + { + "epoch": 1.91, + "learning_rate": 6.138680832375167e-07, + "loss": 0.7021, + "step": 74607 + }, + { + "epoch": 1.91, + "learning_rate": 6.138425589530205e-07, + "loss": 0.3096, + "step": 74608 + }, + { + "epoch": 1.91, + "learning_rate": 6.138170349641874e-07, + "loss": 0.8047, + "step": 74609 + }, + { + "epoch": 1.91, + "learning_rate": 6.137915112710367e-07, + "loss": 0.6899, + "step": 74610 + }, + { + "epoch": 1.91, + "learning_rate": 6.137659878735881e-07, + "loss": 0.5107, + "step": 74611 + }, + { + "epoch": 1.91, + "learning_rate": 6.137404647718613e-07, + "loss": 0.6782, + "step": 74612 + }, + { + "epoch": 1.91, + "learning_rate": 6.137149419658754e-07, + "loss": 0.6537, + "step": 74613 + }, + { + "epoch": 1.91, + "learning_rate": 6.136894194556505e-07, + "loss": 0.6895, + "step": 74614 + }, + { + "epoch": 1.91, + "learning_rate": 6.136638972412055e-07, + "loss": 0.8135, + "step": 74615 + }, + { + "epoch": 1.91, + "learning_rate": 6.136383753225605e-07, + "loss": 0.6689, + "step": 74616 + }, + { + "epoch": 1.91, + "learning_rate": 6.136128536997352e-07, + "loss": 0.5679, + "step": 74617 + }, + { + "epoch": 1.91, + "learning_rate": 6.135873323727485e-07, + "loss": 0.5752, + "step": 74618 + }, + { + "epoch": 1.91, + "learning_rate": 6.1356181134162e-07, + "loss": 0.6133, + "step": 74619 + }, + { + "epoch": 1.91, + "learning_rate": 6.135362906063697e-07, + "loss": 0.7686, + "step": 74620 + }, + { + "epoch": 1.91, + "learning_rate": 6.135107701670166e-07, + "loss": 0.6121, + "step": 74621 + }, + { + "epoch": 1.91, + "learning_rate": 6.134852500235808e-07, + "loss": 0.6855, + "step": 74622 + }, + { + "epoch": 1.91, + "learning_rate": 6.134597301760813e-07, + "loss": 0.7646, + "step": 74623 + }, + { + "epoch": 1.91, + "learning_rate": 6.134342106245381e-07, + "loss": 0.4302, + "step": 74624 + }, + { + "epoch": 1.91, + "learning_rate": 6.134086913689704e-07, + "loss": 0.6631, + "step": 74625 + }, + { + "epoch": 1.91, + "learning_rate": 6.133831724093981e-07, + "loss": 0.6382, + "step": 74626 + }, + { + "epoch": 1.91, + "learning_rate": 6.133576537458407e-07, + "loss": 0.6128, + "step": 74627 + }, + { + "epoch": 1.91, + "learning_rate": 6.133321353783172e-07, + "loss": 0.6069, + "step": 74628 + }, + { + "epoch": 1.91, + "learning_rate": 6.133066173068477e-07, + "loss": 0.6768, + "step": 74629 + }, + { + "epoch": 1.91, + "learning_rate": 6.132810995314513e-07, + "loss": 0.79, + "step": 74630 + }, + { + "epoch": 1.91, + "learning_rate": 6.132555820521482e-07, + "loss": 0.6904, + "step": 74631 + }, + { + "epoch": 1.91, + "learning_rate": 6.13230064868957e-07, + "loss": 0.7275, + "step": 74632 + }, + { + "epoch": 1.91, + "learning_rate": 6.132045479818982e-07, + "loss": 0.5776, + "step": 74633 + }, + { + "epoch": 1.91, + "learning_rate": 6.131790313909904e-07, + "loss": 0.5234, + "step": 74634 + }, + { + "epoch": 1.91, + "learning_rate": 6.13153515096254e-07, + "loss": 0.6108, + "step": 74635 + }, + { + "epoch": 1.91, + "learning_rate": 6.131279990977081e-07, + "loss": 0.501, + "step": 74636 + }, + { + "epoch": 1.91, + "learning_rate": 6.131024833953727e-07, + "loss": 0.6274, + "step": 74637 + }, + { + "epoch": 1.91, + "learning_rate": 6.130769679892665e-07, + "loss": 0.5684, + "step": 74638 + }, + { + "epoch": 1.91, + "learning_rate": 6.130514528794095e-07, + "loss": 0.6016, + "step": 74639 + }, + { + "epoch": 1.91, + "learning_rate": 6.130259380658212e-07, + "loss": 0.6221, + "step": 74640 + }, + { + "epoch": 1.91, + "learning_rate": 6.130004235485211e-07, + "loss": 0.5249, + "step": 74641 + }, + { + "epoch": 1.91, + "learning_rate": 6.129749093275287e-07, + "loss": 0.5747, + "step": 74642 + }, + { + "epoch": 1.91, + "learning_rate": 6.129493954028639e-07, + "loss": 0.5337, + "step": 74643 + }, + { + "epoch": 1.91, + "learning_rate": 6.129238817745457e-07, + "loss": 0.6367, + "step": 74644 + }, + { + "epoch": 1.91, + "learning_rate": 6.128983684425941e-07, + "loss": 0.6533, + "step": 74645 + }, + { + "epoch": 1.91, + "learning_rate": 6.128728554070281e-07, + "loss": 0.6069, + "step": 74646 + }, + { + "epoch": 1.91, + "learning_rate": 6.128473426678681e-07, + "loss": 0.5811, + "step": 74647 + }, + { + "epoch": 1.91, + "learning_rate": 6.128218302251329e-07, + "loss": 0.4968, + "step": 74648 + }, + { + "epoch": 1.91, + "learning_rate": 6.127963180788419e-07, + "loss": 0.7324, + "step": 74649 + }, + { + "epoch": 1.91, + "learning_rate": 6.127708062290152e-07, + "loss": 0.6758, + "step": 74650 + }, + { + "epoch": 1.91, + "learning_rate": 6.127452946756719e-07, + "loss": 0.7373, + "step": 74651 + }, + { + "epoch": 1.91, + "learning_rate": 6.12719783418832e-07, + "loss": 0.7666, + "step": 74652 + }, + { + "epoch": 1.91, + "learning_rate": 6.126942724585147e-07, + "loss": 0.5933, + "step": 74653 + }, + { + "epoch": 1.91, + "learning_rate": 6.126687617947393e-07, + "loss": 0.6484, + "step": 74654 + }, + { + "epoch": 1.91, + "learning_rate": 6.12643251427526e-07, + "loss": 0.5874, + "step": 74655 + }, + { + "epoch": 1.91, + "learning_rate": 6.126177413568935e-07, + "loss": 0.7764, + "step": 74656 + }, + { + "epoch": 1.91, + "learning_rate": 6.125922315828624e-07, + "loss": 0.5664, + "step": 74657 + }, + { + "epoch": 1.91, + "learning_rate": 6.125667221054513e-07, + "loss": 0.6245, + "step": 74658 + }, + { + "epoch": 1.91, + "learning_rate": 6.125412129246799e-07, + "loss": 0.6455, + "step": 74659 + }, + { + "epoch": 1.91, + "learning_rate": 6.12515704040568e-07, + "loss": 0.4595, + "step": 74660 + }, + { + "epoch": 1.91, + "learning_rate": 6.124901954531349e-07, + "loss": 0.6265, + "step": 74661 + }, + { + "epoch": 1.91, + "learning_rate": 6.124646871624004e-07, + "loss": 0.5776, + "step": 74662 + }, + { + "epoch": 1.91, + "learning_rate": 6.124391791683836e-07, + "loss": 0.5884, + "step": 74663 + }, + { + "epoch": 1.91, + "learning_rate": 6.124136714711046e-07, + "loss": 0.5215, + "step": 74664 + }, + { + "epoch": 1.91, + "learning_rate": 6.123881640705823e-07, + "loss": 0.6055, + "step": 74665 + }, + { + "epoch": 1.91, + "learning_rate": 6.12362656966837e-07, + "loss": 0.6523, + "step": 74666 + }, + { + "epoch": 1.91, + "learning_rate": 6.123371501598879e-07, + "loss": 0.7173, + "step": 74667 + }, + { + "epoch": 1.91, + "learning_rate": 6.123116436497539e-07, + "loss": 0.4802, + "step": 74668 + }, + { + "epoch": 1.91, + "learning_rate": 6.122861374364554e-07, + "loss": 0.7822, + "step": 74669 + }, + { + "epoch": 1.91, + "learning_rate": 6.122606315200114e-07, + "loss": 0.6826, + "step": 74670 + }, + { + "epoch": 1.91, + "learning_rate": 6.122351259004415e-07, + "loss": 0.6279, + "step": 74671 + }, + { + "epoch": 1.91, + "learning_rate": 6.122096205777656e-07, + "loss": 0.5889, + "step": 74672 + }, + { + "epoch": 1.91, + "learning_rate": 6.121841155520027e-07, + "loss": 0.5635, + "step": 74673 + }, + { + "epoch": 1.91, + "learning_rate": 6.121586108231728e-07, + "loss": 0.7285, + "step": 74674 + }, + { + "epoch": 1.91, + "learning_rate": 6.12133106391295e-07, + "loss": 0.6914, + "step": 74675 + }, + { + "epoch": 1.91, + "learning_rate": 6.121076022563892e-07, + "loss": 0.7104, + "step": 74676 + }, + { + "epoch": 1.91, + "learning_rate": 6.120820984184751e-07, + "loss": 0.5122, + "step": 74677 + }, + { + "epoch": 1.91, + "learning_rate": 6.120565948775714e-07, + "loss": 0.5684, + "step": 74678 + }, + { + "epoch": 1.91, + "learning_rate": 6.120310916336983e-07, + "loss": 0.7051, + "step": 74679 + }, + { + "epoch": 1.91, + "learning_rate": 6.120055886868751e-07, + "loss": 0.6777, + "step": 74680 + }, + { + "epoch": 1.91, + "learning_rate": 6.119800860371214e-07, + "loss": 0.6372, + "step": 74681 + }, + { + "epoch": 1.91, + "learning_rate": 6.119545836844566e-07, + "loss": 0.5859, + "step": 74682 + }, + { + "epoch": 1.91, + "learning_rate": 6.119290816289006e-07, + "loss": 0.5942, + "step": 74683 + }, + { + "epoch": 1.91, + "learning_rate": 6.119035798704723e-07, + "loss": 0.6182, + "step": 74684 + }, + { + "epoch": 1.91, + "learning_rate": 6.118780784091919e-07, + "loss": 0.6304, + "step": 74685 + }, + { + "epoch": 1.91, + "learning_rate": 6.118525772450784e-07, + "loss": 0.5405, + "step": 74686 + }, + { + "epoch": 1.91, + "learning_rate": 6.118270763781519e-07, + "loss": 0.542, + "step": 74687 + }, + { + "epoch": 1.91, + "learning_rate": 6.118015758084314e-07, + "loss": 0.7812, + "step": 74688 + }, + { + "epoch": 1.91, + "learning_rate": 6.117760755359365e-07, + "loss": 0.6504, + "step": 74689 + }, + { + "epoch": 1.91, + "learning_rate": 6.117505755606867e-07, + "loss": 0.5674, + "step": 74690 + }, + { + "epoch": 1.91, + "learning_rate": 6.117250758827018e-07, + "loss": 0.6523, + "step": 74691 + }, + { + "epoch": 1.91, + "learning_rate": 6.11699576502001e-07, + "loss": 0.6289, + "step": 74692 + }, + { + "epoch": 1.91, + "learning_rate": 6.116740774186041e-07, + "loss": 0.6709, + "step": 74693 + }, + { + "epoch": 1.91, + "learning_rate": 6.116485786325302e-07, + "loss": 0.7002, + "step": 74694 + }, + { + "epoch": 1.91, + "learning_rate": 6.116230801437996e-07, + "loss": 0.6631, + "step": 74695 + }, + { + "epoch": 1.91, + "learning_rate": 6.115975819524311e-07, + "loss": 0.6621, + "step": 74696 + }, + { + "epoch": 1.91, + "learning_rate": 6.115720840584447e-07, + "loss": 0.7197, + "step": 74697 + }, + { + "epoch": 1.91, + "learning_rate": 6.115465864618596e-07, + "loss": 0.5146, + "step": 74698 + }, + { + "epoch": 1.91, + "learning_rate": 6.115210891626952e-07, + "loss": 0.4893, + "step": 74699 + }, + { + "epoch": 1.91, + "learning_rate": 6.114955921609715e-07, + "loss": 0.749, + "step": 74700 + }, + { + "epoch": 1.91, + "learning_rate": 6.114700954567074e-07, + "loss": 0.6108, + "step": 74701 + }, + { + "epoch": 1.91, + "learning_rate": 6.11444599049923e-07, + "loss": 0.6074, + "step": 74702 + }, + { + "epoch": 1.91, + "learning_rate": 6.114191029406376e-07, + "loss": 0.5183, + "step": 74703 + }, + { + "epoch": 1.91, + "learning_rate": 6.113936071288707e-07, + "loss": 0.5884, + "step": 74704 + }, + { + "epoch": 1.91, + "learning_rate": 6.113681116146419e-07, + "loss": 0.6689, + "step": 74705 + }, + { + "epoch": 1.91, + "learning_rate": 6.113426163979707e-07, + "loss": 0.7432, + "step": 74706 + }, + { + "epoch": 1.91, + "learning_rate": 6.113171214788768e-07, + "loss": 0.6934, + "step": 74707 + }, + { + "epoch": 1.91, + "learning_rate": 6.112916268573793e-07, + "loss": 0.5444, + "step": 74708 + }, + { + "epoch": 1.91, + "learning_rate": 6.112661325334978e-07, + "loss": 0.5913, + "step": 74709 + }, + { + "epoch": 1.91, + "learning_rate": 6.11240638507252e-07, + "loss": 0.7285, + "step": 74710 + }, + { + "epoch": 1.91, + "learning_rate": 6.112151447786614e-07, + "loss": 0.688, + "step": 74711 + }, + { + "epoch": 1.91, + "learning_rate": 6.111896513477455e-07, + "loss": 0.6709, + "step": 74712 + }, + { + "epoch": 1.91, + "learning_rate": 6.111641582145236e-07, + "loss": 0.7441, + "step": 74713 + }, + { + "epoch": 1.91, + "learning_rate": 6.111386653790157e-07, + "loss": 0.5571, + "step": 74714 + }, + { + "epoch": 1.91, + "learning_rate": 6.111131728412408e-07, + "loss": 0.7227, + "step": 74715 + }, + { + "epoch": 1.92, + "learning_rate": 6.110876806012189e-07, + "loss": 0.6592, + "step": 74716 + }, + { + "epoch": 1.92, + "learning_rate": 6.110621886589695e-07, + "loss": 0.6343, + "step": 74717 + }, + { + "epoch": 1.92, + "learning_rate": 6.110366970145115e-07, + "loss": 0.5179, + "step": 74718 + }, + { + "epoch": 1.92, + "learning_rate": 6.110112056678649e-07, + "loss": 0.5132, + "step": 74719 + }, + { + "epoch": 1.92, + "learning_rate": 6.109857146190491e-07, + "loss": 0.5815, + "step": 74720 + }, + { + "epoch": 1.92, + "learning_rate": 6.109602238680838e-07, + "loss": 0.6196, + "step": 74721 + }, + { + "epoch": 1.92, + "learning_rate": 6.109347334149881e-07, + "loss": 0.4355, + "step": 74722 + }, + { + "epoch": 1.92, + "learning_rate": 6.10909243259782e-07, + "loss": 0.6089, + "step": 74723 + }, + { + "epoch": 1.92, + "learning_rate": 6.108837534024845e-07, + "loss": 0.6904, + "step": 74724 + }, + { + "epoch": 1.92, + "learning_rate": 6.108582638431158e-07, + "loss": 0.8193, + "step": 74725 + }, + { + "epoch": 1.92, + "learning_rate": 6.10832774581695e-07, + "loss": 0.6748, + "step": 74726 + }, + { + "epoch": 1.92, + "learning_rate": 6.108072856182418e-07, + "loss": 0.689, + "step": 74727 + }, + { + "epoch": 1.92, + "learning_rate": 6.107817969527752e-07, + "loss": 0.5322, + "step": 74728 + }, + { + "epoch": 1.92, + "learning_rate": 6.107563085853153e-07, + "loss": 0.6455, + "step": 74729 + }, + { + "epoch": 1.92, + "learning_rate": 6.107308205158811e-07, + "loss": 0.6826, + "step": 74730 + }, + { + "epoch": 1.92, + "learning_rate": 6.107053327444926e-07, + "loss": 0.6104, + "step": 74731 + }, + { + "epoch": 1.92, + "learning_rate": 6.106798452711691e-07, + "loss": 0.7192, + "step": 74732 + }, + { + "epoch": 1.92, + "learning_rate": 6.106543580959303e-07, + "loss": 0.5354, + "step": 74733 + }, + { + "epoch": 1.92, + "learning_rate": 6.106288712187952e-07, + "loss": 0.6592, + "step": 74734 + }, + { + "epoch": 1.92, + "learning_rate": 6.10603384639784e-07, + "loss": 0.7383, + "step": 74735 + }, + { + "epoch": 1.92, + "learning_rate": 6.105778983589156e-07, + "loss": 0.6768, + "step": 74736 + }, + { + "epoch": 1.92, + "learning_rate": 6.105524123762102e-07, + "loss": 0.7744, + "step": 74737 + }, + { + "epoch": 1.92, + "learning_rate": 6.105269266916869e-07, + "loss": 0.5527, + "step": 74738 + }, + { + "epoch": 1.92, + "learning_rate": 6.105014413053649e-07, + "loss": 0.6226, + "step": 74739 + }, + { + "epoch": 1.92, + "learning_rate": 6.104759562172641e-07, + "loss": 0.6846, + "step": 74740 + }, + { + "epoch": 1.92, + "learning_rate": 6.10450471427404e-07, + "loss": 0.6479, + "step": 74741 + }, + { + "epoch": 1.92, + "learning_rate": 6.10424986935804e-07, + "loss": 0.467, + "step": 74742 + }, + { + "epoch": 1.92, + "learning_rate": 6.10399502742484e-07, + "loss": 0.5811, + "step": 74743 + }, + { + "epoch": 1.92, + "learning_rate": 6.103740188474626e-07, + "loss": 0.9297, + "step": 74744 + }, + { + "epoch": 1.92, + "learning_rate": 6.103485352507604e-07, + "loss": 0.6401, + "step": 74745 + }, + { + "epoch": 1.92, + "learning_rate": 6.103230519523961e-07, + "loss": 0.5288, + "step": 74746 + }, + { + "epoch": 1.92, + "learning_rate": 6.1029756895239e-07, + "loss": 0.5596, + "step": 74747 + }, + { + "epoch": 1.92, + "learning_rate": 6.102720862507608e-07, + "loss": 0.8369, + "step": 74748 + }, + { + "epoch": 1.92, + "learning_rate": 6.102466038475282e-07, + "loss": 0.7158, + "step": 74749 + }, + { + "epoch": 1.92, + "learning_rate": 6.10221121742712e-07, + "loss": 0.6309, + "step": 74750 + }, + { + "epoch": 1.92, + "learning_rate": 6.101956399363315e-07, + "loss": 0.7676, + "step": 74751 + }, + { + "epoch": 1.92, + "learning_rate": 6.101701584284062e-07, + "loss": 0.6992, + "step": 74752 + }, + { + "epoch": 1.92, + "learning_rate": 6.101446772189557e-07, + "loss": 0.749, + "step": 74753 + }, + { + "epoch": 1.92, + "learning_rate": 6.101191963079998e-07, + "loss": 0.6973, + "step": 74754 + }, + { + "epoch": 1.92, + "learning_rate": 6.100937156955574e-07, + "loss": 0.5386, + "step": 74755 + }, + { + "epoch": 1.92, + "learning_rate": 6.100682353816484e-07, + "loss": 0.7705, + "step": 74756 + }, + { + "epoch": 1.92, + "learning_rate": 6.100427553662926e-07, + "loss": 0.4871, + "step": 74757 + }, + { + "epoch": 1.92, + "learning_rate": 6.100172756495085e-07, + "loss": 0.7148, + "step": 74758 + }, + { + "epoch": 1.92, + "learning_rate": 6.099917962313167e-07, + "loss": 0.7725, + "step": 74759 + }, + { + "epoch": 1.92, + "learning_rate": 6.099663171117362e-07, + "loss": 0.5889, + "step": 74760 + }, + { + "epoch": 1.92, + "learning_rate": 6.099408382907862e-07, + "loss": 0.5815, + "step": 74761 + }, + { + "epoch": 1.92, + "learning_rate": 6.099153597684868e-07, + "loss": 0.6504, + "step": 74762 + }, + { + "epoch": 1.92, + "learning_rate": 6.098898815448572e-07, + "loss": 0.5337, + "step": 74763 + }, + { + "epoch": 1.92, + "learning_rate": 6.098644036199171e-07, + "loss": 0.6743, + "step": 74764 + }, + { + "epoch": 1.92, + "learning_rate": 6.098389259936857e-07, + "loss": 0.7256, + "step": 74765 + }, + { + "epoch": 1.92, + "learning_rate": 6.098134486661829e-07, + "loss": 0.7725, + "step": 74766 + }, + { + "epoch": 1.92, + "learning_rate": 6.097879716374281e-07, + "loss": 0.7188, + "step": 74767 + }, + { + "epoch": 1.92, + "learning_rate": 6.097624949074404e-07, + "loss": 0.4939, + "step": 74768 + }, + { + "epoch": 1.92, + "learning_rate": 6.097370184762398e-07, + "loss": 0.4236, + "step": 74769 + }, + { + "epoch": 1.92, + "learning_rate": 6.097115423438455e-07, + "loss": 0.5908, + "step": 74770 + }, + { + "epoch": 1.92, + "learning_rate": 6.096860665102772e-07, + "loss": 0.603, + "step": 74771 + }, + { + "epoch": 1.92, + "learning_rate": 6.096605909755543e-07, + "loss": 0.8271, + "step": 74772 + }, + { + "epoch": 1.92, + "learning_rate": 6.096351157396964e-07, + "loss": 0.6318, + "step": 74773 + }, + { + "epoch": 1.92, + "learning_rate": 6.096096408027227e-07, + "loss": 0.7021, + "step": 74774 + }, + { + "epoch": 1.92, + "learning_rate": 6.095841661646533e-07, + "loss": 0.667, + "step": 74775 + }, + { + "epoch": 1.92, + "learning_rate": 6.095586918255074e-07, + "loss": 0.4966, + "step": 74776 + }, + { + "epoch": 1.92, + "learning_rate": 6.095332177853041e-07, + "loss": 0.6504, + "step": 74777 + }, + { + "epoch": 1.92, + "learning_rate": 6.095077440440635e-07, + "loss": 0.5674, + "step": 74778 + }, + { + "epoch": 1.92, + "learning_rate": 6.09482270601805e-07, + "loss": 0.47, + "step": 74779 + }, + { + "epoch": 1.92, + "learning_rate": 6.094567974585475e-07, + "loss": 0.6553, + "step": 74780 + }, + { + "epoch": 1.92, + "learning_rate": 6.094313246143112e-07, + "loss": 0.6885, + "step": 74781 + }, + { + "epoch": 1.92, + "learning_rate": 6.094058520691154e-07, + "loss": 0.7305, + "step": 74782 + }, + { + "epoch": 1.92, + "learning_rate": 6.093803798229797e-07, + "loss": 0.6343, + "step": 74783 + }, + { + "epoch": 1.92, + "learning_rate": 6.093549078759232e-07, + "loss": 0.5203, + "step": 74784 + }, + { + "epoch": 1.92, + "learning_rate": 6.093294362279659e-07, + "loss": 0.4421, + "step": 74785 + }, + { + "epoch": 1.92, + "learning_rate": 6.093039648791273e-07, + "loss": 0.6562, + "step": 74786 + }, + { + "epoch": 1.92, + "learning_rate": 6.092784938294261e-07, + "loss": 0.5613, + "step": 74787 + }, + { + "epoch": 1.92, + "learning_rate": 6.092530230788829e-07, + "loss": 0.5244, + "step": 74788 + }, + { + "epoch": 1.92, + "learning_rate": 6.092275526275163e-07, + "loss": 0.5005, + "step": 74789 + }, + { + "epoch": 1.92, + "learning_rate": 6.092020824753466e-07, + "loss": 0.5327, + "step": 74790 + }, + { + "epoch": 1.92, + "learning_rate": 6.091766126223925e-07, + "loss": 0.4995, + "step": 74791 + }, + { + "epoch": 1.92, + "learning_rate": 6.091511430686742e-07, + "loss": 0.7637, + "step": 74792 + }, + { + "epoch": 1.92, + "learning_rate": 6.091256738142106e-07, + "loss": 0.7295, + "step": 74793 + }, + { + "epoch": 1.92, + "learning_rate": 6.091002048590219e-07, + "loss": 0.7051, + "step": 74794 + }, + { + "epoch": 1.92, + "learning_rate": 6.090747362031267e-07, + "loss": 0.5503, + "step": 74795 + }, + { + "epoch": 1.92, + "learning_rate": 6.090492678465459e-07, + "loss": 0.7666, + "step": 74796 + }, + { + "epoch": 1.92, + "learning_rate": 6.090237997892973e-07, + "loss": 0.7302, + "step": 74797 + }, + { + "epoch": 1.92, + "learning_rate": 6.089983320314015e-07, + "loss": 0.8047, + "step": 74798 + }, + { + "epoch": 1.92, + "learning_rate": 6.089728645728774e-07, + "loss": 0.6143, + "step": 74799 + }, + { + "epoch": 1.92, + "learning_rate": 6.089473974137451e-07, + "loss": 0.5439, + "step": 74800 + }, + { + "epoch": 1.92, + "learning_rate": 6.089219305540235e-07, + "loss": 0.7725, + "step": 74801 + }, + { + "epoch": 1.92, + "learning_rate": 6.088964639937326e-07, + "loss": 0.6865, + "step": 74802 + }, + { + "epoch": 1.92, + "learning_rate": 6.088709977328916e-07, + "loss": 0.6494, + "step": 74803 + }, + { + "epoch": 1.92, + "learning_rate": 6.088455317715202e-07, + "loss": 0.5928, + "step": 74804 + }, + { + "epoch": 1.92, + "learning_rate": 6.088200661096377e-07, + "loss": 0.4731, + "step": 74805 + }, + { + "epoch": 1.92, + "learning_rate": 6.08794600747264e-07, + "loss": 0.6538, + "step": 74806 + }, + { + "epoch": 1.92, + "learning_rate": 6.08769135684418e-07, + "loss": 0.6094, + "step": 74807 + }, + { + "epoch": 1.92, + "learning_rate": 6.087436709211194e-07, + "loss": 0.8145, + "step": 74808 + }, + { + "epoch": 1.92, + "learning_rate": 6.08718206457388e-07, + "loss": 0.668, + "step": 74809 + }, + { + "epoch": 1.92, + "learning_rate": 6.086927422932428e-07, + "loss": 0.6313, + "step": 74810 + }, + { + "epoch": 1.92, + "learning_rate": 6.086672784287039e-07, + "loss": 0.6504, + "step": 74811 + }, + { + "epoch": 1.92, + "learning_rate": 6.086418148637902e-07, + "loss": 0.6904, + "step": 74812 + }, + { + "epoch": 1.92, + "learning_rate": 6.086163515985216e-07, + "loss": 0.6323, + "step": 74813 + }, + { + "epoch": 1.92, + "learning_rate": 6.085908886329173e-07, + "loss": 0.5898, + "step": 74814 + }, + { + "epoch": 1.92, + "learning_rate": 6.085654259669972e-07, + "loss": 0.4922, + "step": 74815 + }, + { + "epoch": 1.92, + "learning_rate": 6.085399636007808e-07, + "loss": 0.5244, + "step": 74816 + }, + { + "epoch": 1.92, + "learning_rate": 6.08514501534287e-07, + "loss": 0.6914, + "step": 74817 + }, + { + "epoch": 1.92, + "learning_rate": 6.084890397675355e-07, + "loss": 0.4858, + "step": 74818 + }, + { + "epoch": 1.92, + "learning_rate": 6.084635783005461e-07, + "loss": 0.6372, + "step": 74819 + }, + { + "epoch": 1.92, + "learning_rate": 6.084381171333382e-07, + "loss": 0.498, + "step": 74820 + }, + { + "epoch": 1.92, + "learning_rate": 6.084126562659311e-07, + "loss": 0.749, + "step": 74821 + }, + { + "epoch": 1.92, + "learning_rate": 6.083871956983444e-07, + "loss": 0.6196, + "step": 74822 + }, + { + "epoch": 1.92, + "learning_rate": 6.083617354305976e-07, + "loss": 0.6382, + "step": 74823 + }, + { + "epoch": 1.92, + "learning_rate": 6.083362754627104e-07, + "loss": 0.6543, + "step": 74824 + }, + { + "epoch": 1.92, + "learning_rate": 6.08310815794702e-07, + "loss": 0.489, + "step": 74825 + }, + { + "epoch": 1.92, + "learning_rate": 6.082853564265923e-07, + "loss": 0.5244, + "step": 74826 + }, + { + "epoch": 1.92, + "learning_rate": 6.082598973584001e-07, + "loss": 0.7119, + "step": 74827 + }, + { + "epoch": 1.92, + "learning_rate": 6.082344385901455e-07, + "loss": 0.5591, + "step": 74828 + }, + { + "epoch": 1.92, + "learning_rate": 6.082089801218475e-07, + "loss": 0.5029, + "step": 74829 + }, + { + "epoch": 1.92, + "learning_rate": 6.081835219535261e-07, + "loss": 0.542, + "step": 74830 + }, + { + "epoch": 1.92, + "learning_rate": 6.081580640852003e-07, + "loss": 0.6099, + "step": 74831 + }, + { + "epoch": 1.92, + "learning_rate": 6.081326065168902e-07, + "loss": 0.4808, + "step": 74832 + }, + { + "epoch": 1.92, + "learning_rate": 6.081071492486147e-07, + "loss": 0.7852, + "step": 74833 + }, + { + "epoch": 1.92, + "learning_rate": 6.080816922803936e-07, + "loss": 0.7891, + "step": 74834 + }, + { + "epoch": 1.92, + "learning_rate": 6.080562356122465e-07, + "loss": 0.5098, + "step": 74835 + }, + { + "epoch": 1.92, + "learning_rate": 6.080307792441928e-07, + "loss": 0.5112, + "step": 74836 + }, + { + "epoch": 1.92, + "learning_rate": 6.080053231762515e-07, + "loss": 0.5918, + "step": 74837 + }, + { + "epoch": 1.92, + "learning_rate": 6.079798674084427e-07, + "loss": 0.3398, + "step": 74838 + }, + { + "epoch": 1.92, + "learning_rate": 6.079544119407856e-07, + "loss": 0.6626, + "step": 74839 + }, + { + "epoch": 1.92, + "learning_rate": 6.079289567732999e-07, + "loss": 0.4956, + "step": 74840 + }, + { + "epoch": 1.92, + "learning_rate": 6.079035019060048e-07, + "loss": 0.6445, + "step": 74841 + }, + { + "epoch": 1.92, + "learning_rate": 6.078780473389202e-07, + "loss": 0.6738, + "step": 74842 + }, + { + "epoch": 1.92, + "learning_rate": 6.07852593072065e-07, + "loss": 0.6924, + "step": 74843 + }, + { + "epoch": 1.92, + "learning_rate": 6.078271391054594e-07, + "loss": 0.7725, + "step": 74844 + }, + { + "epoch": 1.92, + "learning_rate": 6.078016854391223e-07, + "loss": 0.5972, + "step": 74845 + }, + { + "epoch": 1.92, + "learning_rate": 6.077762320730737e-07, + "loss": 0.5024, + "step": 74846 + }, + { + "epoch": 1.92, + "learning_rate": 6.077507790073328e-07, + "loss": 0.6113, + "step": 74847 + }, + { + "epoch": 1.92, + "learning_rate": 6.077253262419187e-07, + "loss": 0.562, + "step": 74848 + }, + { + "epoch": 1.92, + "learning_rate": 6.076998737768516e-07, + "loss": 0.5908, + "step": 74849 + }, + { + "epoch": 1.92, + "learning_rate": 6.076744216121505e-07, + "loss": 0.5923, + "step": 74850 + }, + { + "epoch": 1.92, + "learning_rate": 6.076489697478351e-07, + "loss": 0.6289, + "step": 74851 + }, + { + "epoch": 1.92, + "learning_rate": 6.076235181839248e-07, + "loss": 0.6777, + "step": 74852 + }, + { + "epoch": 1.92, + "learning_rate": 6.075980669204392e-07, + "loss": 0.6235, + "step": 74853 + }, + { + "epoch": 1.92, + "learning_rate": 6.075726159573977e-07, + "loss": 0.7109, + "step": 74854 + }, + { + "epoch": 1.92, + "learning_rate": 6.075471652948198e-07, + "loss": 0.6484, + "step": 74855 + }, + { + "epoch": 1.92, + "learning_rate": 6.075217149327252e-07, + "loss": 0.6104, + "step": 74856 + }, + { + "epoch": 1.92, + "learning_rate": 6.074962648711331e-07, + "loss": 0.6611, + "step": 74857 + }, + { + "epoch": 1.92, + "learning_rate": 6.074708151100627e-07, + "loss": 0.4219, + "step": 74858 + }, + { + "epoch": 1.92, + "learning_rate": 6.074453656495342e-07, + "loss": 0.4839, + "step": 74859 + }, + { + "epoch": 1.92, + "learning_rate": 6.074199164895664e-07, + "loss": 0.3911, + "step": 74860 + }, + { + "epoch": 1.92, + "learning_rate": 6.073944676301794e-07, + "loss": 0.6934, + "step": 74861 + }, + { + "epoch": 1.92, + "learning_rate": 6.073690190713922e-07, + "loss": 0.6963, + "step": 74862 + }, + { + "epoch": 1.92, + "learning_rate": 6.073435708132249e-07, + "loss": 0.5229, + "step": 74863 + }, + { + "epoch": 1.92, + "learning_rate": 6.073181228556961e-07, + "loss": 0.6494, + "step": 74864 + }, + { + "epoch": 1.92, + "learning_rate": 6.072926751988259e-07, + "loss": 0.5771, + "step": 74865 + }, + { + "epoch": 1.92, + "learning_rate": 6.072672278426341e-07, + "loss": 0.833, + "step": 74866 + }, + { + "epoch": 1.92, + "learning_rate": 6.072417807871392e-07, + "loss": 0.749, + "step": 74867 + }, + { + "epoch": 1.92, + "learning_rate": 6.072163340323613e-07, + "loss": 0.7236, + "step": 74868 + }, + { + "epoch": 1.92, + "learning_rate": 6.0719088757832e-07, + "loss": 0.7002, + "step": 74869 + }, + { + "epoch": 1.92, + "learning_rate": 6.071654414250342e-07, + "loss": 0.4536, + "step": 74870 + }, + { + "epoch": 1.92, + "learning_rate": 6.071399955725241e-07, + "loss": 0.7178, + "step": 74871 + }, + { + "epoch": 1.92, + "learning_rate": 6.071145500208086e-07, + "loss": 0.79, + "step": 74872 + }, + { + "epoch": 1.92, + "learning_rate": 6.070891047699075e-07, + "loss": 0.6416, + "step": 74873 + }, + { + "epoch": 1.92, + "learning_rate": 6.070636598198401e-07, + "loss": 0.6147, + "step": 74874 + }, + { + "epoch": 1.92, + "learning_rate": 6.070382151706261e-07, + "loss": 0.6406, + "step": 74875 + }, + { + "epoch": 1.92, + "learning_rate": 6.070127708222852e-07, + "loss": 0.5264, + "step": 74876 + }, + { + "epoch": 1.92, + "learning_rate": 6.069873267748363e-07, + "loss": 0.6465, + "step": 74877 + }, + { + "epoch": 1.92, + "learning_rate": 6.06961883028299e-07, + "loss": 0.4355, + "step": 74878 + }, + { + "epoch": 1.92, + "learning_rate": 6.069364395826928e-07, + "loss": 0.5044, + "step": 74879 + }, + { + "epoch": 1.92, + "learning_rate": 6.069109964380376e-07, + "loss": 0.4756, + "step": 74880 + }, + { + "epoch": 1.92, + "learning_rate": 6.068855535943523e-07, + "loss": 0.3749, + "step": 74881 + }, + { + "epoch": 1.92, + "learning_rate": 6.068601110516569e-07, + "loss": 0.7651, + "step": 74882 + }, + { + "epoch": 1.92, + "learning_rate": 6.068346688099703e-07, + "loss": 0.6748, + "step": 74883 + }, + { + "epoch": 1.92, + "learning_rate": 6.068092268693128e-07, + "loss": 0.5942, + "step": 74884 + }, + { + "epoch": 1.92, + "learning_rate": 6.067837852297031e-07, + "loss": 0.6543, + "step": 74885 + }, + { + "epoch": 1.92, + "learning_rate": 6.067583438911614e-07, + "loss": 0.5308, + "step": 74886 + }, + { + "epoch": 1.92, + "learning_rate": 6.067329028537063e-07, + "loss": 0.5869, + "step": 74887 + }, + { + "epoch": 1.92, + "learning_rate": 6.067074621173578e-07, + "loss": 0.5957, + "step": 74888 + }, + { + "epoch": 1.92, + "learning_rate": 6.066820216821354e-07, + "loss": 0.6973, + "step": 74889 + }, + { + "epoch": 1.92, + "learning_rate": 6.066565815480585e-07, + "loss": 0.6768, + "step": 74890 + }, + { + "epoch": 1.92, + "learning_rate": 6.066311417151461e-07, + "loss": 0.5103, + "step": 74891 + }, + { + "epoch": 1.92, + "learning_rate": 6.066057021834188e-07, + "loss": 0.3967, + "step": 74892 + }, + { + "epoch": 1.92, + "learning_rate": 6.06580262952895e-07, + "loss": 0.6475, + "step": 74893 + }, + { + "epoch": 1.92, + "learning_rate": 6.065548240235948e-07, + "loss": 0.6504, + "step": 74894 + }, + { + "epoch": 1.92, + "learning_rate": 6.065293853955373e-07, + "loss": 0.6416, + "step": 74895 + }, + { + "epoch": 1.92, + "learning_rate": 6.065039470687426e-07, + "loss": 0.5503, + "step": 74896 + }, + { + "epoch": 1.92, + "learning_rate": 6.064785090432295e-07, + "loss": 0.6523, + "step": 74897 + }, + { + "epoch": 1.92, + "learning_rate": 6.064530713190174e-07, + "loss": 0.6899, + "step": 74898 + }, + { + "epoch": 1.92, + "learning_rate": 6.064276338961264e-07, + "loss": 0.479, + "step": 74899 + }, + { + "epoch": 1.92, + "learning_rate": 6.064021967745756e-07, + "loss": 0.7646, + "step": 74900 + }, + { + "epoch": 1.92, + "learning_rate": 6.063767599543846e-07, + "loss": 0.7188, + "step": 74901 + }, + { + "epoch": 1.92, + "learning_rate": 6.063513234355726e-07, + "loss": 0.5977, + "step": 74902 + }, + { + "epoch": 1.92, + "learning_rate": 6.063258872181596e-07, + "loss": 0.6396, + "step": 74903 + }, + { + "epoch": 1.92, + "learning_rate": 6.063004513021645e-07, + "loss": 0.667, + "step": 74904 + }, + { + "epoch": 1.92, + "learning_rate": 6.062750156876072e-07, + "loss": 0.6553, + "step": 74905 + }, + { + "epoch": 1.92, + "learning_rate": 6.062495803745072e-07, + "loss": 0.6646, + "step": 74906 + }, + { + "epoch": 1.92, + "learning_rate": 6.062241453628837e-07, + "loss": 0.4686, + "step": 74907 + }, + { + "epoch": 1.92, + "learning_rate": 6.06198710652756e-07, + "loss": 0.4355, + "step": 74908 + }, + { + "epoch": 1.92, + "learning_rate": 6.061732762441441e-07, + "loss": 0.707, + "step": 74909 + }, + { + "epoch": 1.92, + "learning_rate": 6.061478421370669e-07, + "loss": 0.4397, + "step": 74910 + }, + { + "epoch": 1.92, + "learning_rate": 6.061224083315443e-07, + "loss": 0.8457, + "step": 74911 + }, + { + "epoch": 1.92, + "learning_rate": 6.060969748275957e-07, + "loss": 0.6455, + "step": 74912 + }, + { + "epoch": 1.92, + "learning_rate": 6.060715416252407e-07, + "loss": 0.7529, + "step": 74913 + }, + { + "epoch": 1.92, + "learning_rate": 6.060461087244984e-07, + "loss": 0.6895, + "step": 74914 + }, + { + "epoch": 1.92, + "learning_rate": 6.060206761253886e-07, + "loss": 0.5718, + "step": 74915 + }, + { + "epoch": 1.92, + "learning_rate": 6.059952438279308e-07, + "loss": 0.7051, + "step": 74916 + }, + { + "epoch": 1.92, + "learning_rate": 6.05969811832144e-07, + "loss": 0.7302, + "step": 74917 + }, + { + "epoch": 1.92, + "learning_rate": 6.059443801380482e-07, + "loss": 0.6851, + "step": 74918 + }, + { + "epoch": 1.92, + "learning_rate": 6.059189487456624e-07, + "loss": 0.5479, + "step": 74919 + }, + { + "epoch": 1.92, + "learning_rate": 6.058935176550066e-07, + "loss": 0.6147, + "step": 74920 + }, + { + "epoch": 1.92, + "learning_rate": 6.058680868660999e-07, + "loss": 0.5042, + "step": 74921 + }, + { + "epoch": 1.92, + "learning_rate": 6.05842656378962e-07, + "loss": 0.6616, + "step": 74922 + }, + { + "epoch": 1.92, + "learning_rate": 6.058172261936124e-07, + "loss": 0.5093, + "step": 74923 + }, + { + "epoch": 1.92, + "learning_rate": 6.057917963100699e-07, + "loss": 0.7314, + "step": 74924 + }, + { + "epoch": 1.92, + "learning_rate": 6.05766366728355e-07, + "loss": 0.8672, + "step": 74925 + }, + { + "epoch": 1.92, + "learning_rate": 6.057409374484867e-07, + "loss": 0.6865, + "step": 74926 + }, + { + "epoch": 1.92, + "learning_rate": 6.057155084704841e-07, + "loss": 0.4279, + "step": 74927 + }, + { + "epoch": 1.92, + "learning_rate": 6.056900797943672e-07, + "loss": 0.6226, + "step": 74928 + }, + { + "epoch": 1.92, + "learning_rate": 6.05664651420155e-07, + "loss": 0.5361, + "step": 74929 + }, + { + "epoch": 1.92, + "learning_rate": 6.056392233478676e-07, + "loss": 0.6846, + "step": 74930 + }, + { + "epoch": 1.92, + "learning_rate": 6.056137955775238e-07, + "loss": 0.7803, + "step": 74931 + }, + { + "epoch": 1.92, + "learning_rate": 6.055883681091436e-07, + "loss": 0.6406, + "step": 74932 + }, + { + "epoch": 1.92, + "learning_rate": 6.05562940942746e-07, + "loss": 0.6758, + "step": 74933 + }, + { + "epoch": 1.92, + "learning_rate": 6.05537514078351e-07, + "loss": 0.6465, + "step": 74934 + }, + { + "epoch": 1.92, + "learning_rate": 6.055120875159775e-07, + "loss": 0.553, + "step": 74935 + }, + { + "epoch": 1.92, + "learning_rate": 6.054866612556457e-07, + "loss": 0.457, + "step": 74936 + }, + { + "epoch": 1.92, + "learning_rate": 6.054612352973745e-07, + "loss": 0.4512, + "step": 74937 + }, + { + "epoch": 1.92, + "learning_rate": 6.054358096411831e-07, + "loss": 0.6172, + "step": 74938 + }, + { + "epoch": 1.92, + "learning_rate": 6.054103842870918e-07, + "loss": 0.5543, + "step": 74939 + }, + { + "epoch": 1.92, + "learning_rate": 6.053849592351192e-07, + "loss": 0.4702, + "step": 74940 + }, + { + "epoch": 1.92, + "learning_rate": 6.053595344852855e-07, + "loss": 0.6865, + "step": 74941 + }, + { + "epoch": 1.92, + "learning_rate": 6.0533411003761e-07, + "loss": 0.6846, + "step": 74942 + }, + { + "epoch": 1.92, + "learning_rate": 6.053086858921117e-07, + "loss": 0.709, + "step": 74943 + }, + { + "epoch": 1.92, + "learning_rate": 6.052832620488105e-07, + "loss": 0.6582, + "step": 74944 + }, + { + "epoch": 1.92, + "learning_rate": 6.052578385077256e-07, + "loss": 0.5762, + "step": 74945 + }, + { + "epoch": 1.92, + "learning_rate": 6.052324152688772e-07, + "loss": 0.5239, + "step": 74946 + }, + { + "epoch": 1.92, + "learning_rate": 6.052069923322838e-07, + "loss": 0.791, + "step": 74947 + }, + { + "epoch": 1.92, + "learning_rate": 6.051815696979651e-07, + "loss": 0.4484, + "step": 74948 + }, + { + "epoch": 1.92, + "learning_rate": 6.051561473659409e-07, + "loss": 0.6899, + "step": 74949 + }, + { + "epoch": 1.92, + "learning_rate": 6.051307253362304e-07, + "loss": 0.5254, + "step": 74950 + }, + { + "epoch": 1.92, + "learning_rate": 6.051053036088531e-07, + "loss": 0.6147, + "step": 74951 + }, + { + "epoch": 1.92, + "learning_rate": 6.050798821838285e-07, + "loss": 0.6633, + "step": 74952 + }, + { + "epoch": 1.92, + "learning_rate": 6.050544610611762e-07, + "loss": 0.5864, + "step": 74953 + }, + { + "epoch": 1.92, + "learning_rate": 6.050290402409154e-07, + "loss": 0.6348, + "step": 74954 + }, + { + "epoch": 1.92, + "learning_rate": 6.050036197230659e-07, + "loss": 0.6533, + "step": 74955 + }, + { + "epoch": 1.92, + "learning_rate": 6.049781995076471e-07, + "loss": 0.7471, + "step": 74956 + }, + { + "epoch": 1.92, + "learning_rate": 6.04952779594678e-07, + "loss": 0.7158, + "step": 74957 + }, + { + "epoch": 1.92, + "learning_rate": 6.049273599841785e-07, + "loss": 0.6616, + "step": 74958 + }, + { + "epoch": 1.92, + "learning_rate": 6.049019406761679e-07, + "loss": 0.6826, + "step": 74959 + }, + { + "epoch": 1.92, + "learning_rate": 6.048765216706657e-07, + "loss": 0.6187, + "step": 74960 + }, + { + "epoch": 1.92, + "learning_rate": 6.048511029676916e-07, + "loss": 0.5806, + "step": 74961 + }, + { + "epoch": 1.92, + "learning_rate": 6.048256845672645e-07, + "loss": 0.6567, + "step": 74962 + }, + { + "epoch": 1.92, + "learning_rate": 6.048002664694045e-07, + "loss": 0.6377, + "step": 74963 + }, + { + "epoch": 1.92, + "learning_rate": 6.047748486741304e-07, + "loss": 0.5706, + "step": 74964 + }, + { + "epoch": 1.92, + "learning_rate": 6.047494311814625e-07, + "loss": 0.6338, + "step": 74965 + }, + { + "epoch": 1.92, + "learning_rate": 6.047240139914199e-07, + "loss": 0.4956, + "step": 74966 + }, + { + "epoch": 1.92, + "learning_rate": 6.046985971040213e-07, + "loss": 0.5913, + "step": 74967 + }, + { + "epoch": 1.92, + "learning_rate": 6.046731805192873e-07, + "loss": 0.6475, + "step": 74968 + }, + { + "epoch": 1.92, + "learning_rate": 6.046477642372365e-07, + "loss": 0.6274, + "step": 74969 + }, + { + "epoch": 1.92, + "learning_rate": 6.046223482578889e-07, + "loss": 0.5254, + "step": 74970 + }, + { + "epoch": 1.92, + "learning_rate": 6.045969325812637e-07, + "loss": 0.4977, + "step": 74971 + }, + { + "epoch": 1.92, + "learning_rate": 6.045715172073807e-07, + "loss": 0.7461, + "step": 74972 + }, + { + "epoch": 1.92, + "learning_rate": 6.045461021362587e-07, + "loss": 0.5718, + "step": 74973 + }, + { + "epoch": 1.92, + "learning_rate": 6.045206873679179e-07, + "loss": 0.6367, + "step": 74974 + }, + { + "epoch": 1.92, + "learning_rate": 6.044952729023773e-07, + "loss": 0.667, + "step": 74975 + }, + { + "epoch": 1.92, + "learning_rate": 6.04469858739657e-07, + "loss": 0.6562, + "step": 74976 + }, + { + "epoch": 1.92, + "learning_rate": 6.044444448797753e-07, + "loss": 0.543, + "step": 74977 + }, + { + "epoch": 1.92, + "learning_rate": 6.044190313227526e-07, + "loss": 0.6221, + "step": 74978 + }, + { + "epoch": 1.92, + "learning_rate": 6.043936180686078e-07, + "loss": 0.6245, + "step": 74979 + }, + { + "epoch": 1.92, + "learning_rate": 6.043682051173608e-07, + "loss": 0.5005, + "step": 74980 + }, + { + "epoch": 1.92, + "learning_rate": 6.043427924690307e-07, + "loss": 0.5708, + "step": 74981 + }, + { + "epoch": 1.92, + "learning_rate": 6.043173801236373e-07, + "loss": 0.5669, + "step": 74982 + }, + { + "epoch": 1.92, + "learning_rate": 6.042919680811997e-07, + "loss": 0.4675, + "step": 74983 + }, + { + "epoch": 1.92, + "learning_rate": 6.042665563417378e-07, + "loss": 0.5815, + "step": 74984 + }, + { + "epoch": 1.92, + "learning_rate": 6.042411449052704e-07, + "loss": 0.6455, + "step": 74985 + }, + { + "epoch": 1.92, + "learning_rate": 6.04215733771818e-07, + "loss": 0.5149, + "step": 74986 + }, + { + "epoch": 1.92, + "learning_rate": 6.041903229413991e-07, + "loss": 0.5654, + "step": 74987 + }, + { + "epoch": 1.92, + "learning_rate": 6.041649124140334e-07, + "loss": 0.6128, + "step": 74988 + }, + { + "epoch": 1.92, + "learning_rate": 6.041395021897405e-07, + "loss": 0.5552, + "step": 74989 + }, + { + "epoch": 1.92, + "learning_rate": 6.041140922685396e-07, + "loss": 0.4468, + "step": 74990 + }, + { + "epoch": 1.92, + "learning_rate": 6.040886826504506e-07, + "loss": 0.6377, + "step": 74991 + }, + { + "epoch": 1.92, + "learning_rate": 6.040632733354923e-07, + "loss": 0.5591, + "step": 74992 + }, + { + "epoch": 1.92, + "learning_rate": 6.040378643236849e-07, + "loss": 0.6953, + "step": 74993 + }, + { + "epoch": 1.92, + "learning_rate": 6.040124556150473e-07, + "loss": 0.582, + "step": 74994 + }, + { + "epoch": 1.92, + "learning_rate": 6.039870472095993e-07, + "loss": 0.6987, + "step": 74995 + }, + { + "epoch": 1.92, + "learning_rate": 6.039616391073605e-07, + "loss": 0.667, + "step": 74996 + }, + { + "epoch": 1.92, + "learning_rate": 6.039362313083498e-07, + "loss": 0.7256, + "step": 74997 + }, + { + "epoch": 1.92, + "learning_rate": 6.039108238125867e-07, + "loss": 0.494, + "step": 74998 + }, + { + "epoch": 1.92, + "learning_rate": 6.038854166200911e-07, + "loss": 0.7432, + "step": 74999 + }, + { + "epoch": 1.92, + "learning_rate": 6.03860009730882e-07, + "loss": 0.7031, + "step": 75000 + }, + { + "epoch": 1.92, + "learning_rate": 6.038346031449792e-07, + "loss": 0.6494, + "step": 75001 + }, + { + "epoch": 1.92, + "learning_rate": 6.03809196862402e-07, + "loss": 0.6001, + "step": 75002 + }, + { + "epoch": 1.92, + "learning_rate": 6.0378379088317e-07, + "loss": 0.7686, + "step": 75003 + }, + { + "epoch": 1.92, + "learning_rate": 6.037583852073023e-07, + "loss": 0.6719, + "step": 75004 + }, + { + "epoch": 1.92, + "learning_rate": 6.037329798348189e-07, + "loss": 0.5889, + "step": 75005 + }, + { + "epoch": 1.92, + "learning_rate": 6.037075747657389e-07, + "loss": 0.6562, + "step": 75006 + }, + { + "epoch": 1.92, + "learning_rate": 6.036821700000816e-07, + "loss": 0.6436, + "step": 75007 + }, + { + "epoch": 1.92, + "learning_rate": 6.036567655378668e-07, + "loss": 0.7549, + "step": 75008 + }, + { + "epoch": 1.92, + "learning_rate": 6.036313613791135e-07, + "loss": 0.6313, + "step": 75009 + }, + { + "epoch": 1.92, + "learning_rate": 6.036059575238418e-07, + "loss": 0.6841, + "step": 75010 + }, + { + "epoch": 1.92, + "learning_rate": 6.035805539720704e-07, + "loss": 0.48, + "step": 75011 + }, + { + "epoch": 1.92, + "learning_rate": 6.035551507238195e-07, + "loss": 0.5811, + "step": 75012 + }, + { + "epoch": 1.92, + "learning_rate": 6.035297477791079e-07, + "loss": 0.6523, + "step": 75013 + }, + { + "epoch": 1.92, + "learning_rate": 6.035043451379556e-07, + "loss": 0.6074, + "step": 75014 + }, + { + "epoch": 1.92, + "learning_rate": 6.034789428003818e-07, + "loss": 0.7329, + "step": 75015 + }, + { + "epoch": 1.92, + "learning_rate": 6.03453540766406e-07, + "loss": 0.7471, + "step": 75016 + }, + { + "epoch": 1.92, + "learning_rate": 6.034281390360474e-07, + "loss": 0.4795, + "step": 75017 + }, + { + "epoch": 1.92, + "learning_rate": 6.034027376093258e-07, + "loss": 0.6523, + "step": 75018 + }, + { + "epoch": 1.92, + "learning_rate": 6.033773364862602e-07, + "loss": 0.6748, + "step": 75019 + }, + { + "epoch": 1.92, + "learning_rate": 6.033519356668706e-07, + "loss": 0.6968, + "step": 75020 + }, + { + "epoch": 1.92, + "learning_rate": 6.033265351511759e-07, + "loss": 0.5688, + "step": 75021 + }, + { + "epoch": 1.92, + "learning_rate": 6.033011349391961e-07, + "loss": 0.4169, + "step": 75022 + }, + { + "epoch": 1.92, + "learning_rate": 6.032757350309501e-07, + "loss": 0.4905, + "step": 75023 + }, + { + "epoch": 1.92, + "learning_rate": 6.03250335426458e-07, + "loss": 0.5542, + "step": 75024 + }, + { + "epoch": 1.92, + "learning_rate": 6.032249361257385e-07, + "loss": 0.458, + "step": 75025 + }, + { + "epoch": 1.92, + "learning_rate": 6.031995371288119e-07, + "loss": 0.5439, + "step": 75026 + }, + { + "epoch": 1.92, + "learning_rate": 6.03174138435697e-07, + "loss": 0.6406, + "step": 75027 + }, + { + "epoch": 1.92, + "learning_rate": 6.031487400464132e-07, + "loss": 0.5522, + "step": 75028 + }, + { + "epoch": 1.92, + "learning_rate": 6.031233419609802e-07, + "loss": 0.5781, + "step": 75029 + }, + { + "epoch": 1.92, + "learning_rate": 6.030979441794174e-07, + "loss": 0.6323, + "step": 75030 + }, + { + "epoch": 1.92, + "learning_rate": 6.030725467017444e-07, + "loss": 0.5591, + "step": 75031 + }, + { + "epoch": 1.92, + "learning_rate": 6.030471495279805e-07, + "loss": 0.5576, + "step": 75032 + }, + { + "epoch": 1.92, + "learning_rate": 6.030217526581449e-07, + "loss": 0.749, + "step": 75033 + }, + { + "epoch": 1.92, + "learning_rate": 6.029963560922576e-07, + "loss": 0.3771, + "step": 75034 + }, + { + "epoch": 1.92, + "learning_rate": 6.029709598303374e-07, + "loss": 0.6709, + "step": 75035 + }, + { + "epoch": 1.92, + "learning_rate": 6.029455638724046e-07, + "loss": 0.7144, + "step": 75036 + }, + { + "epoch": 1.92, + "learning_rate": 6.029201682184779e-07, + "loss": 0.8125, + "step": 75037 + }, + { + "epoch": 1.92, + "learning_rate": 6.028947728685767e-07, + "loss": 0.3254, + "step": 75038 + }, + { + "epoch": 1.92, + "learning_rate": 6.028693778227209e-07, + "loss": 0.6133, + "step": 75039 + }, + { + "epoch": 1.92, + "learning_rate": 6.028439830809296e-07, + "loss": 0.5962, + "step": 75040 + }, + { + "epoch": 1.92, + "learning_rate": 6.028185886432227e-07, + "loss": 0.6831, + "step": 75041 + }, + { + "epoch": 1.92, + "learning_rate": 6.027931945096189e-07, + "loss": 0.6885, + "step": 75042 + }, + { + "epoch": 1.92, + "learning_rate": 6.027678006801385e-07, + "loss": 0.6826, + "step": 75043 + }, + { + "epoch": 1.92, + "learning_rate": 6.027424071548003e-07, + "loss": 0.8037, + "step": 75044 + }, + { + "epoch": 1.92, + "learning_rate": 6.027170139336241e-07, + "loss": 0.6523, + "step": 75045 + }, + { + "epoch": 1.92, + "learning_rate": 6.026916210166295e-07, + "loss": 0.7598, + "step": 75046 + }, + { + "epoch": 1.92, + "learning_rate": 6.026662284038353e-07, + "loss": 0.667, + "step": 75047 + }, + { + "epoch": 1.92, + "learning_rate": 6.026408360952613e-07, + "loss": 0.7275, + "step": 75048 + }, + { + "epoch": 1.92, + "learning_rate": 6.02615444090927e-07, + "loss": 0.6235, + "step": 75049 + }, + { + "epoch": 1.92, + "learning_rate": 6.025900523908517e-07, + "loss": 0.6274, + "step": 75050 + }, + { + "epoch": 1.92, + "learning_rate": 6.025646609950551e-07, + "loss": 0.6416, + "step": 75051 + }, + { + "epoch": 1.92, + "learning_rate": 6.025392699035562e-07, + "loss": 0.3041, + "step": 75052 + }, + { + "epoch": 1.92, + "learning_rate": 6.025138791163748e-07, + "loss": 0.5859, + "step": 75053 + }, + { + "epoch": 1.92, + "learning_rate": 6.024884886335303e-07, + "loss": 0.5693, + "step": 75054 + }, + { + "epoch": 1.92, + "learning_rate": 6.024630984550422e-07, + "loss": 0.6377, + "step": 75055 + }, + { + "epoch": 1.92, + "learning_rate": 6.024377085809301e-07, + "loss": 0.6338, + "step": 75056 + }, + { + "epoch": 1.92, + "learning_rate": 6.024123190112124e-07, + "loss": 0.7168, + "step": 75057 + }, + { + "epoch": 1.92, + "learning_rate": 6.023869297459099e-07, + "loss": 0.634, + "step": 75058 + }, + { + "epoch": 1.92, + "learning_rate": 6.023615407850411e-07, + "loss": 0.6128, + "step": 75059 + }, + { + "epoch": 1.92, + "learning_rate": 6.02336152128626e-07, + "loss": 0.6523, + "step": 75060 + }, + { + "epoch": 1.92, + "learning_rate": 6.023107637766836e-07, + "loss": 0.5693, + "step": 75061 + }, + { + "epoch": 1.92, + "learning_rate": 6.022853757292338e-07, + "loss": 0.7061, + "step": 75062 + }, + { + "epoch": 1.92, + "learning_rate": 6.022599879862955e-07, + "loss": 0.4993, + "step": 75063 + }, + { + "epoch": 1.92, + "learning_rate": 6.022346005478887e-07, + "loss": 0.7373, + "step": 75064 + }, + { + "epoch": 1.92, + "learning_rate": 6.022092134140329e-07, + "loss": 0.7012, + "step": 75065 + }, + { + "epoch": 1.92, + "learning_rate": 6.021838265847469e-07, + "loss": 0.3555, + "step": 75066 + }, + { + "epoch": 1.92, + "learning_rate": 6.021584400600501e-07, + "loss": 0.6592, + "step": 75067 + }, + { + "epoch": 1.92, + "learning_rate": 6.021330538399627e-07, + "loss": 0.5811, + "step": 75068 + }, + { + "epoch": 1.92, + "learning_rate": 6.021076679245035e-07, + "loss": 0.6416, + "step": 75069 + }, + { + "epoch": 1.92, + "learning_rate": 6.020822823136924e-07, + "loss": 0.6138, + "step": 75070 + }, + { + "epoch": 1.92, + "learning_rate": 6.020568970075484e-07, + "loss": 0.6147, + "step": 75071 + }, + { + "epoch": 1.92, + "learning_rate": 6.020315120060911e-07, + "loss": 0.7686, + "step": 75072 + }, + { + "epoch": 1.92, + "learning_rate": 6.020061273093399e-07, + "loss": 0.6245, + "step": 75073 + }, + { + "epoch": 1.92, + "learning_rate": 6.019807429173147e-07, + "loss": 0.5947, + "step": 75074 + }, + { + "epoch": 1.92, + "learning_rate": 6.019553588300346e-07, + "loss": 0.5327, + "step": 75075 + }, + { + "epoch": 1.92, + "learning_rate": 6.019299750475186e-07, + "loss": 0.5817, + "step": 75076 + }, + { + "epoch": 1.92, + "learning_rate": 6.019045915697867e-07, + "loss": 0.7061, + "step": 75077 + }, + { + "epoch": 1.92, + "learning_rate": 6.018792083968578e-07, + "loss": 0.623, + "step": 75078 + }, + { + "epoch": 1.92, + "learning_rate": 6.018538255287521e-07, + "loss": 0.4399, + "step": 75079 + }, + { + "epoch": 1.92, + "learning_rate": 6.018284429654883e-07, + "loss": 0.6606, + "step": 75080 + }, + { + "epoch": 1.92, + "learning_rate": 6.018030607070865e-07, + "loss": 0.6465, + "step": 75081 + }, + { + "epoch": 1.92, + "learning_rate": 6.017776787535653e-07, + "loss": 0.5815, + "step": 75082 + }, + { + "epoch": 1.92, + "learning_rate": 6.017522971049451e-07, + "loss": 0.4644, + "step": 75083 + }, + { + "epoch": 1.92, + "learning_rate": 6.017269157612446e-07, + "loss": 0.4678, + "step": 75084 + }, + { + "epoch": 1.92, + "learning_rate": 6.01701534722484e-07, + "loss": 0.7158, + "step": 75085 + }, + { + "epoch": 1.92, + "learning_rate": 6.016761539886816e-07, + "loss": 0.6367, + "step": 75086 + }, + { + "epoch": 1.92, + "learning_rate": 6.016507735598577e-07, + "loss": 0.542, + "step": 75087 + }, + { + "epoch": 1.92, + "learning_rate": 6.016253934360314e-07, + "loss": 0.6631, + "step": 75088 + }, + { + "epoch": 1.92, + "learning_rate": 6.016000136172224e-07, + "loss": 0.6912, + "step": 75089 + }, + { + "epoch": 1.92, + "learning_rate": 6.015746341034496e-07, + "loss": 0.6528, + "step": 75090 + }, + { + "epoch": 1.92, + "learning_rate": 6.01549254894733e-07, + "loss": 0.5054, + "step": 75091 + }, + { + "epoch": 1.92, + "learning_rate": 6.015238759910916e-07, + "loss": 0.5266, + "step": 75092 + }, + { + "epoch": 1.92, + "learning_rate": 6.014984973925454e-07, + "loss": 0.5928, + "step": 75093 + }, + { + "epoch": 1.92, + "learning_rate": 6.014731190991131e-07, + "loss": 0.6191, + "step": 75094 + }, + { + "epoch": 1.92, + "learning_rate": 6.014477411108151e-07, + "loss": 0.5447, + "step": 75095 + }, + { + "epoch": 1.92, + "learning_rate": 6.0142236342767e-07, + "loss": 0.5544, + "step": 75096 + }, + { + "epoch": 1.92, + "learning_rate": 6.013969860496972e-07, + "loss": 0.2887, + "step": 75097 + }, + { + "epoch": 1.92, + "learning_rate": 6.013716089769166e-07, + "loss": 0.6631, + "step": 75098 + }, + { + "epoch": 1.92, + "learning_rate": 6.013462322093472e-07, + "loss": 0.7002, + "step": 75099 + }, + { + "epoch": 1.92, + "learning_rate": 6.013208557470089e-07, + "loss": 0.5479, + "step": 75100 + }, + { + "epoch": 1.92, + "learning_rate": 6.012954795899206e-07, + "loss": 0.7334, + "step": 75101 + }, + { + "epoch": 1.92, + "learning_rate": 6.012701037381024e-07, + "loss": 0.6982, + "step": 75102 + }, + { + "epoch": 1.92, + "learning_rate": 6.01244728191573e-07, + "loss": 0.6885, + "step": 75103 + }, + { + "epoch": 1.92, + "learning_rate": 6.012193529503524e-07, + "loss": 0.6611, + "step": 75104 + }, + { + "epoch": 1.92, + "learning_rate": 6.011939780144602e-07, + "loss": 0.7378, + "step": 75105 + }, + { + "epoch": 1.93, + "learning_rate": 6.011686033839149e-07, + "loss": 0.5933, + "step": 75106 + }, + { + "epoch": 1.93, + "learning_rate": 6.011432290587365e-07, + "loss": 0.7217, + "step": 75107 + }, + { + "epoch": 1.93, + "learning_rate": 6.011178550389444e-07, + "loss": 0.5208, + "step": 75108 + }, + { + "epoch": 1.93, + "learning_rate": 6.01092481324558e-07, + "loss": 0.4487, + "step": 75109 + }, + { + "epoch": 1.93, + "learning_rate": 6.010671079155969e-07, + "loss": 0.6211, + "step": 75110 + }, + { + "epoch": 1.93, + "learning_rate": 6.010417348120802e-07, + "loss": 0.6348, + "step": 75111 + }, + { + "epoch": 1.93, + "learning_rate": 6.010163620140276e-07, + "loss": 0.6543, + "step": 75112 + }, + { + "epoch": 1.93, + "learning_rate": 6.009909895214582e-07, + "loss": 0.5645, + "step": 75113 + }, + { + "epoch": 1.93, + "learning_rate": 6.00965617334392e-07, + "loss": 0.7139, + "step": 75114 + }, + { + "epoch": 1.93, + "learning_rate": 6.009402454528483e-07, + "loss": 0.6074, + "step": 75115 + }, + { + "epoch": 1.93, + "learning_rate": 6.009148738768457e-07, + "loss": 0.5991, + "step": 75116 + }, + { + "epoch": 1.93, + "learning_rate": 6.008895026064046e-07, + "loss": 0.666, + "step": 75117 + }, + { + "epoch": 1.93, + "learning_rate": 6.008641316415437e-07, + "loss": 0.4978, + "step": 75118 + }, + { + "epoch": 1.93, + "learning_rate": 6.008387609822832e-07, + "loss": 0.7107, + "step": 75119 + }, + { + "epoch": 1.93, + "learning_rate": 6.008133906286417e-07, + "loss": 0.5796, + "step": 75120 + }, + { + "epoch": 1.93, + "learning_rate": 6.007880205806394e-07, + "loss": 0.5942, + "step": 75121 + }, + { + "epoch": 1.93, + "learning_rate": 6.007626508382952e-07, + "loss": 0.6113, + "step": 75122 + }, + { + "epoch": 1.93, + "learning_rate": 6.007372814016286e-07, + "loss": 0.5347, + "step": 75123 + }, + { + "epoch": 1.93, + "learning_rate": 6.007119122706593e-07, + "loss": 0.6855, + "step": 75124 + }, + { + "epoch": 1.93, + "learning_rate": 6.006865434454067e-07, + "loss": 0.6616, + "step": 75125 + }, + { + "epoch": 1.93, + "learning_rate": 6.006611749258896e-07, + "loss": 0.6475, + "step": 75126 + }, + { + "epoch": 1.93, + "learning_rate": 6.006358067121281e-07, + "loss": 0.9131, + "step": 75127 + }, + { + "epoch": 1.93, + "learning_rate": 6.006104388041412e-07, + "loss": 0.6504, + "step": 75128 + }, + { + "epoch": 1.93, + "learning_rate": 6.005850712019487e-07, + "loss": 0.5981, + "step": 75129 + }, + { + "epoch": 1.93, + "learning_rate": 6.005597039055698e-07, + "loss": 0.6338, + "step": 75130 + }, + { + "epoch": 1.93, + "learning_rate": 6.00534336915024e-07, + "loss": 0.5298, + "step": 75131 + }, + { + "epoch": 1.93, + "learning_rate": 6.005089702303305e-07, + "loss": 0.6992, + "step": 75132 + }, + { + "epoch": 1.93, + "learning_rate": 6.004836038515092e-07, + "loss": 0.4644, + "step": 75133 + }, + { + "epoch": 1.93, + "learning_rate": 6.00458237778579e-07, + "loss": 0.4264, + "step": 75134 + }, + { + "epoch": 1.93, + "learning_rate": 6.004328720115599e-07, + "loss": 0.748, + "step": 75135 + }, + { + "epoch": 1.93, + "learning_rate": 6.004075065504707e-07, + "loss": 0.4724, + "step": 75136 + }, + { + "epoch": 1.93, + "learning_rate": 6.003821413953312e-07, + "loss": 0.6943, + "step": 75137 + }, + { + "epoch": 1.93, + "learning_rate": 6.003567765461608e-07, + "loss": 0.7266, + "step": 75138 + }, + { + "epoch": 1.93, + "learning_rate": 6.003314120029787e-07, + "loss": 0.6592, + "step": 75139 + }, + { + "epoch": 1.93, + "learning_rate": 6.003060477658044e-07, + "loss": 0.7471, + "step": 75140 + }, + { + "epoch": 1.93, + "learning_rate": 6.002806838346575e-07, + "loss": 0.6152, + "step": 75141 + }, + { + "epoch": 1.93, + "learning_rate": 6.00255320209557e-07, + "loss": 0.6182, + "step": 75142 + }, + { + "epoch": 1.93, + "learning_rate": 6.002299568905231e-07, + "loss": 0.4609, + "step": 75143 + }, + { + "epoch": 1.93, + "learning_rate": 6.002045938775743e-07, + "loss": 0.5679, + "step": 75144 + }, + { + "epoch": 1.93, + "learning_rate": 6.00179231170731e-07, + "loss": 0.7773, + "step": 75145 + }, + { + "epoch": 1.93, + "learning_rate": 6.001538687700119e-07, + "loss": 0.5854, + "step": 75146 + }, + { + "epoch": 1.93, + "learning_rate": 6.001285066754362e-07, + "loss": 0.6028, + "step": 75147 + }, + { + "epoch": 1.93, + "learning_rate": 6.001031448870241e-07, + "loss": 0.6201, + "step": 75148 + }, + { + "epoch": 1.93, + "learning_rate": 6.000777834047944e-07, + "loss": 0.493, + "step": 75149 + }, + { + "epoch": 1.93, + "learning_rate": 6.000524222287668e-07, + "loss": 0.6968, + "step": 75150 + }, + { + "epoch": 1.93, + "learning_rate": 6.000270613589607e-07, + "loss": 0.6943, + "step": 75151 + }, + { + "epoch": 1.93, + "learning_rate": 6.000017007953955e-07, + "loss": 0.6016, + "step": 75152 + }, + { + "epoch": 1.93, + "learning_rate": 5.999763405380905e-07, + "loss": 0.7656, + "step": 75153 + }, + { + "epoch": 1.93, + "learning_rate": 5.999509805870655e-07, + "loss": 0.5542, + "step": 75154 + }, + { + "epoch": 1.93, + "learning_rate": 5.999256209423397e-07, + "loss": 0.585, + "step": 75155 + }, + { + "epoch": 1.93, + "learning_rate": 5.999002616039323e-07, + "loss": 0.6069, + "step": 75156 + }, + { + "epoch": 1.93, + "learning_rate": 5.998749025718627e-07, + "loss": 0.6953, + "step": 75157 + }, + { + "epoch": 1.93, + "learning_rate": 5.998495438461507e-07, + "loss": 0.5493, + "step": 75158 + }, + { + "epoch": 1.93, + "learning_rate": 5.998241854268153e-07, + "loss": 0.665, + "step": 75159 + }, + { + "epoch": 1.93, + "learning_rate": 5.997988273138763e-07, + "loss": 0.6777, + "step": 75160 + }, + { + "epoch": 1.93, + "learning_rate": 5.997734695073527e-07, + "loss": 0.6448, + "step": 75161 + }, + { + "epoch": 1.93, + "learning_rate": 5.997481120072642e-07, + "loss": 0.6875, + "step": 75162 + }, + { + "epoch": 1.93, + "learning_rate": 5.997227548136303e-07, + "loss": 0.709, + "step": 75163 + }, + { + "epoch": 1.93, + "learning_rate": 5.996973979264704e-07, + "loss": 0.5142, + "step": 75164 + }, + { + "epoch": 1.93, + "learning_rate": 5.996720413458038e-07, + "loss": 0.5239, + "step": 75165 + }, + { + "epoch": 1.93, + "learning_rate": 5.996466850716497e-07, + "loss": 0.7959, + "step": 75166 + }, + { + "epoch": 1.93, + "learning_rate": 5.996213291040277e-07, + "loss": 0.6357, + "step": 75167 + }, + { + "epoch": 1.93, + "learning_rate": 5.995959734429573e-07, + "loss": 0.6055, + "step": 75168 + }, + { + "epoch": 1.93, + "learning_rate": 5.995706180884579e-07, + "loss": 0.6162, + "step": 75169 + }, + { + "epoch": 1.93, + "learning_rate": 5.995452630405488e-07, + "loss": 0.6113, + "step": 75170 + }, + { + "epoch": 1.93, + "learning_rate": 5.995199082992495e-07, + "loss": 0.6934, + "step": 75171 + }, + { + "epoch": 1.93, + "learning_rate": 5.994945538645792e-07, + "loss": 0.5815, + "step": 75172 + }, + { + "epoch": 1.93, + "learning_rate": 5.99469199736558e-07, + "loss": 0.7129, + "step": 75173 + }, + { + "epoch": 1.93, + "learning_rate": 5.994438459152042e-07, + "loss": 0.4111, + "step": 75174 + }, + { + "epoch": 1.93, + "learning_rate": 5.994184924005388e-07, + "loss": 0.6562, + "step": 75175 + }, + { + "epoch": 1.93, + "learning_rate": 5.993931391925795e-07, + "loss": 0.3896, + "step": 75176 + }, + { + "epoch": 1.93, + "learning_rate": 5.993677862913466e-07, + "loss": 0.5938, + "step": 75177 + }, + { + "epoch": 1.93, + "learning_rate": 5.993424336968591e-07, + "loss": 0.6719, + "step": 75178 + }, + { + "epoch": 1.93, + "learning_rate": 5.993170814091371e-07, + "loss": 0.7373, + "step": 75179 + }, + { + "epoch": 1.93, + "learning_rate": 5.992917294281992e-07, + "loss": 0.6377, + "step": 75180 + }, + { + "epoch": 1.93, + "learning_rate": 5.992663777540654e-07, + "loss": 0.5986, + "step": 75181 + }, + { + "epoch": 1.93, + "learning_rate": 5.992410263867548e-07, + "loss": 0.6709, + "step": 75182 + }, + { + "epoch": 1.93, + "learning_rate": 5.992156753262872e-07, + "loss": 0.5977, + "step": 75183 + }, + { + "epoch": 1.93, + "learning_rate": 5.991903245726813e-07, + "loss": 0.6343, + "step": 75184 + }, + { + "epoch": 1.93, + "learning_rate": 5.991649741259574e-07, + "loss": 0.5405, + "step": 75185 + }, + { + "epoch": 1.93, + "learning_rate": 5.991396239861344e-07, + "loss": 0.6162, + "step": 75186 + }, + { + "epoch": 1.93, + "learning_rate": 5.991142741532313e-07, + "loss": 0.6221, + "step": 75187 + }, + { + "epoch": 1.93, + "learning_rate": 5.990889246272683e-07, + "loss": 0.6372, + "step": 75188 + }, + { + "epoch": 1.93, + "learning_rate": 5.990635754082645e-07, + "loss": 0.668, + "step": 75189 + }, + { + "epoch": 1.93, + "learning_rate": 5.990382264962393e-07, + "loss": 0.5007, + "step": 75190 + }, + { + "epoch": 1.93, + "learning_rate": 5.990128778912118e-07, + "loss": 0.7031, + "step": 75191 + }, + { + "epoch": 1.93, + "learning_rate": 5.98987529593202e-07, + "loss": 0.6689, + "step": 75192 + }, + { + "epoch": 1.93, + "learning_rate": 5.989621816022288e-07, + "loss": 0.7007, + "step": 75193 + }, + { + "epoch": 1.93, + "learning_rate": 5.989368339183119e-07, + "loss": 0.7324, + "step": 75194 + }, + { + "epoch": 1.93, + "learning_rate": 5.98911486541471e-07, + "loss": 0.5513, + "step": 75195 + }, + { + "epoch": 1.93, + "learning_rate": 5.988861394717248e-07, + "loss": 0.4648, + "step": 75196 + }, + { + "epoch": 1.93, + "learning_rate": 5.98860792709093e-07, + "loss": 0.5737, + "step": 75197 + }, + { + "epoch": 1.93, + "learning_rate": 5.988354462535951e-07, + "loss": 0.7031, + "step": 75198 + }, + { + "epoch": 1.93, + "learning_rate": 5.988101001052504e-07, + "loss": 0.7334, + "step": 75199 + }, + { + "epoch": 1.93, + "learning_rate": 5.987847542640784e-07, + "loss": 0.6738, + "step": 75200 + }, + { + "epoch": 1.93, + "learning_rate": 5.987594087300983e-07, + "loss": 0.4111, + "step": 75201 + }, + { + "epoch": 1.93, + "learning_rate": 5.987340635033299e-07, + "loss": 0.8379, + "step": 75202 + }, + { + "epoch": 1.93, + "learning_rate": 5.987087185837921e-07, + "loss": 0.6152, + "step": 75203 + }, + { + "epoch": 1.93, + "learning_rate": 5.986833739715049e-07, + "loss": 0.6523, + "step": 75204 + }, + { + "epoch": 1.93, + "learning_rate": 5.986580296664876e-07, + "loss": 0.5566, + "step": 75205 + }, + { + "epoch": 1.93, + "learning_rate": 5.986326856687589e-07, + "loss": 0.6768, + "step": 75206 + }, + { + "epoch": 1.93, + "learning_rate": 5.986073419783389e-07, + "loss": 0.623, + "step": 75207 + }, + { + "epoch": 1.93, + "learning_rate": 5.985819985952467e-07, + "loss": 0.7109, + "step": 75208 + }, + { + "epoch": 1.93, + "learning_rate": 5.985566555195019e-07, + "loss": 0.5991, + "step": 75209 + }, + { + "epoch": 1.93, + "learning_rate": 5.985313127511236e-07, + "loss": 0.5192, + "step": 75210 + }, + { + "epoch": 1.93, + "learning_rate": 5.985059702901316e-07, + "loss": 0.563, + "step": 75211 + }, + { + "epoch": 1.93, + "learning_rate": 5.984806281365453e-07, + "loss": 0.6772, + "step": 75212 + }, + { + "epoch": 1.93, + "learning_rate": 5.984552862903835e-07, + "loss": 0.7441, + "step": 75213 + }, + { + "epoch": 1.93, + "learning_rate": 5.984299447516664e-07, + "loss": 0.5781, + "step": 75214 + }, + { + "epoch": 1.93, + "learning_rate": 5.984046035204132e-07, + "loss": 0.6514, + "step": 75215 + }, + { + "epoch": 1.93, + "learning_rate": 5.983792625966426e-07, + "loss": 0.7676, + "step": 75216 + }, + { + "epoch": 1.93, + "learning_rate": 5.983539219803748e-07, + "loss": 0.6553, + "step": 75217 + }, + { + "epoch": 1.93, + "learning_rate": 5.983285816716288e-07, + "loss": 0.4656, + "step": 75218 + }, + { + "epoch": 1.93, + "learning_rate": 5.983032416704243e-07, + "loss": 0.5752, + "step": 75219 + }, + { + "epoch": 1.93, + "learning_rate": 5.982779019767803e-07, + "loss": 0.7422, + "step": 75220 + }, + { + "epoch": 1.93, + "learning_rate": 5.982525625907167e-07, + "loss": 0.426, + "step": 75221 + }, + { + "epoch": 1.93, + "learning_rate": 5.982272235122523e-07, + "loss": 0.562, + "step": 75222 + }, + { + "epoch": 1.93, + "learning_rate": 5.982018847414072e-07, + "loss": 0.75, + "step": 75223 + }, + { + "epoch": 1.93, + "learning_rate": 5.981765462782002e-07, + "loss": 0.5684, + "step": 75224 + }, + { + "epoch": 1.93, + "learning_rate": 5.981512081226513e-07, + "loss": 0.6041, + "step": 75225 + }, + { + "epoch": 1.93, + "learning_rate": 5.981258702747794e-07, + "loss": 0.6875, + "step": 75226 + }, + { + "epoch": 1.93, + "learning_rate": 5.981005327346038e-07, + "loss": 0.5034, + "step": 75227 + }, + { + "epoch": 1.93, + "learning_rate": 5.980751955021444e-07, + "loss": 0.623, + "step": 75228 + }, + { + "epoch": 1.93, + "learning_rate": 5.980498585774203e-07, + "loss": 0.646, + "step": 75229 + }, + { + "epoch": 1.93, + "learning_rate": 5.980245219604507e-07, + "loss": 0.5801, + "step": 75230 + }, + { + "epoch": 1.93, + "learning_rate": 5.979991856512554e-07, + "loss": 0.6909, + "step": 75231 + }, + { + "epoch": 1.93, + "learning_rate": 5.979738496498536e-07, + "loss": 0.7334, + "step": 75232 + }, + { + "epoch": 1.93, + "learning_rate": 5.979485139562648e-07, + "loss": 0.6973, + "step": 75233 + }, + { + "epoch": 1.93, + "learning_rate": 5.979231785705081e-07, + "loss": 0.5957, + "step": 75234 + }, + { + "epoch": 1.93, + "learning_rate": 5.978978434926036e-07, + "loss": 0.7637, + "step": 75235 + }, + { + "epoch": 1.93, + "learning_rate": 5.978725087225702e-07, + "loss": 0.4849, + "step": 75236 + }, + { + "epoch": 1.93, + "learning_rate": 5.97847174260427e-07, + "loss": 0.5693, + "step": 75237 + }, + { + "epoch": 1.93, + "learning_rate": 5.978218401061938e-07, + "loss": 0.5482, + "step": 75238 + }, + { + "epoch": 1.93, + "learning_rate": 5.977965062598899e-07, + "loss": 0.7344, + "step": 75239 + }, + { + "epoch": 1.93, + "learning_rate": 5.977711727215349e-07, + "loss": 0.5107, + "step": 75240 + }, + { + "epoch": 1.93, + "learning_rate": 5.977458394911477e-07, + "loss": 0.3691, + "step": 75241 + }, + { + "epoch": 1.93, + "learning_rate": 5.977205065687483e-07, + "loss": 0.5996, + "step": 75242 + }, + { + "epoch": 1.93, + "learning_rate": 5.976951739543557e-07, + "loss": 0.6035, + "step": 75243 + }, + { + "epoch": 1.93, + "learning_rate": 5.976698416479894e-07, + "loss": 0.7476, + "step": 75244 + }, + { + "epoch": 1.93, + "learning_rate": 5.976445096496692e-07, + "loss": 0.7192, + "step": 75245 + }, + { + "epoch": 1.93, + "learning_rate": 5.976191779594138e-07, + "loss": 0.5801, + "step": 75246 + }, + { + "epoch": 1.93, + "learning_rate": 5.975938465772425e-07, + "loss": 0.6375, + "step": 75247 + }, + { + "epoch": 1.93, + "learning_rate": 5.975685155031755e-07, + "loss": 0.5776, + "step": 75248 + }, + { + "epoch": 1.93, + "learning_rate": 5.975431847372317e-07, + "loss": 0.4504, + "step": 75249 + }, + { + "epoch": 1.93, + "learning_rate": 5.975178542794306e-07, + "loss": 0.6489, + "step": 75250 + }, + { + "epoch": 1.93, + "learning_rate": 5.974925241297915e-07, + "loss": 0.6787, + "step": 75251 + }, + { + "epoch": 1.93, + "learning_rate": 5.974671942883339e-07, + "loss": 0.6177, + "step": 75252 + }, + { + "epoch": 1.93, + "learning_rate": 5.974418647550771e-07, + "loss": 0.5317, + "step": 75253 + }, + { + "epoch": 1.93, + "learning_rate": 5.974165355300406e-07, + "loss": 0.7568, + "step": 75254 + }, + { + "epoch": 1.93, + "learning_rate": 5.973912066132442e-07, + "loss": 0.6797, + "step": 75255 + }, + { + "epoch": 1.93, + "learning_rate": 5.973658780047062e-07, + "loss": 0.408, + "step": 75256 + }, + { + "epoch": 1.93, + "learning_rate": 5.97340549704447e-07, + "loss": 0.5439, + "step": 75257 + }, + { + "epoch": 1.93, + "learning_rate": 5.973152217124853e-07, + "loss": 0.5801, + "step": 75258 + }, + { + "epoch": 1.93, + "learning_rate": 5.972898940288411e-07, + "loss": 0.5684, + "step": 75259 + }, + { + "epoch": 1.93, + "learning_rate": 5.972645666535332e-07, + "loss": 0.6826, + "step": 75260 + }, + { + "epoch": 1.93, + "learning_rate": 5.972392395865817e-07, + "loss": 0.5674, + "step": 75261 + }, + { + "epoch": 1.93, + "learning_rate": 5.972139128280051e-07, + "loss": 0.5767, + "step": 75262 + }, + { + "epoch": 1.93, + "learning_rate": 5.971885863778238e-07, + "loss": 0.6494, + "step": 75263 + }, + { + "epoch": 1.93, + "learning_rate": 5.971632602360563e-07, + "loss": 0.5752, + "step": 75264 + }, + { + "epoch": 1.93, + "learning_rate": 5.97137934402723e-07, + "loss": 0.6533, + "step": 75265 + }, + { + "epoch": 1.93, + "learning_rate": 5.971126088778421e-07, + "loss": 0.7812, + "step": 75266 + }, + { + "epoch": 1.93, + "learning_rate": 5.970872836614338e-07, + "loss": 0.4956, + "step": 75267 + }, + { + "epoch": 1.93, + "learning_rate": 5.970619587535168e-07, + "loss": 0.5654, + "step": 75268 + }, + { + "epoch": 1.93, + "learning_rate": 5.970366341541114e-07, + "loss": 0.6143, + "step": 75269 + }, + { + "epoch": 1.93, + "learning_rate": 5.970113098632363e-07, + "loss": 0.7896, + "step": 75270 + }, + { + "epoch": 1.93, + "learning_rate": 5.969859858809112e-07, + "loss": 0.6528, + "step": 75271 + }, + { + "epoch": 1.93, + "learning_rate": 5.969606622071551e-07, + "loss": 0.6284, + "step": 75272 + }, + { + "epoch": 1.93, + "learning_rate": 5.969353388419879e-07, + "loss": 0.5626, + "step": 75273 + }, + { + "epoch": 1.93, + "learning_rate": 5.969100157854287e-07, + "loss": 0.687, + "step": 75274 + }, + { + "epoch": 1.93, + "learning_rate": 5.968846930374975e-07, + "loss": 0.6523, + "step": 75275 + }, + { + "epoch": 1.93, + "learning_rate": 5.968593705982127e-07, + "loss": 0.5796, + "step": 75276 + }, + { + "epoch": 1.93, + "learning_rate": 5.968340484675943e-07, + "loss": 0.6079, + "step": 75277 + }, + { + "epoch": 1.93, + "learning_rate": 5.968087266456614e-07, + "loss": 0.5793, + "step": 75278 + }, + { + "epoch": 1.93, + "learning_rate": 5.967834051324334e-07, + "loss": 0.5107, + "step": 75279 + }, + { + "epoch": 1.93, + "learning_rate": 5.9675808392793e-07, + "loss": 0.5295, + "step": 75280 + }, + { + "epoch": 1.93, + "learning_rate": 5.967327630321701e-07, + "loss": 0.5933, + "step": 75281 + }, + { + "epoch": 1.93, + "learning_rate": 5.967074424451737e-07, + "loss": 0.7617, + "step": 75282 + }, + { + "epoch": 1.93, + "learning_rate": 5.966821221669597e-07, + "loss": 0.7617, + "step": 75283 + }, + { + "epoch": 1.93, + "learning_rate": 5.966568021975478e-07, + "loss": 0.5581, + "step": 75284 + }, + { + "epoch": 1.93, + "learning_rate": 5.966314825369574e-07, + "loss": 0.5601, + "step": 75285 + }, + { + "epoch": 1.93, + "learning_rate": 5.966061631852076e-07, + "loss": 0.4663, + "step": 75286 + }, + { + "epoch": 1.93, + "learning_rate": 5.965808441423177e-07, + "loss": 0.7695, + "step": 75287 + }, + { + "epoch": 1.93, + "learning_rate": 5.965555254083074e-07, + "loss": 0.6646, + "step": 75288 + }, + { + "epoch": 1.93, + "learning_rate": 5.965302069831959e-07, + "loss": 0.6392, + "step": 75289 + }, + { + "epoch": 1.93, + "learning_rate": 5.965048888670029e-07, + "loss": 0.5054, + "step": 75290 + }, + { + "epoch": 1.93, + "learning_rate": 5.964795710597472e-07, + "loss": 0.4314, + "step": 75291 + }, + { + "epoch": 1.93, + "learning_rate": 5.96454253561449e-07, + "loss": 0.5581, + "step": 75292 + }, + { + "epoch": 1.93, + "learning_rate": 5.964289363721267e-07, + "loss": 0.5674, + "step": 75293 + }, + { + "epoch": 1.93, + "learning_rate": 5.964036194918006e-07, + "loss": 0.4548, + "step": 75294 + }, + { + "epoch": 1.93, + "learning_rate": 5.963783029204898e-07, + "loss": 0.7207, + "step": 75295 + }, + { + "epoch": 1.93, + "learning_rate": 5.963529866582134e-07, + "loss": 0.6943, + "step": 75296 + }, + { + "epoch": 1.93, + "learning_rate": 5.963276707049909e-07, + "loss": 0.5239, + "step": 75297 + }, + { + "epoch": 1.93, + "learning_rate": 5.963023550608416e-07, + "loss": 0.6045, + "step": 75298 + }, + { + "epoch": 1.93, + "learning_rate": 5.962770397257852e-07, + "loss": 0.6113, + "step": 75299 + }, + { + "epoch": 1.93, + "learning_rate": 5.962517246998408e-07, + "loss": 0.6299, + "step": 75300 + }, + { + "epoch": 1.93, + "learning_rate": 5.96226409983028e-07, + "loss": 0.624, + "step": 75301 + }, + { + "epoch": 1.93, + "learning_rate": 5.962010955753661e-07, + "loss": 0.7178, + "step": 75302 + }, + { + "epoch": 1.93, + "learning_rate": 5.961757814768742e-07, + "loss": 0.5933, + "step": 75303 + }, + { + "epoch": 1.93, + "learning_rate": 5.961504676875722e-07, + "loss": 0.7061, + "step": 75304 + }, + { + "epoch": 1.93, + "learning_rate": 5.961251542074794e-07, + "loss": 0.5078, + "step": 75305 + }, + { + "epoch": 1.93, + "learning_rate": 5.960998410366147e-07, + "loss": 0.5062, + "step": 75306 + }, + { + "epoch": 1.93, + "learning_rate": 5.960745281749979e-07, + "loss": 0.5933, + "step": 75307 + }, + { + "epoch": 1.93, + "learning_rate": 5.960492156226481e-07, + "loss": 0.5771, + "step": 75308 + }, + { + "epoch": 1.93, + "learning_rate": 5.96023903379585e-07, + "loss": 0.5308, + "step": 75309 + }, + { + "epoch": 1.93, + "learning_rate": 5.959985914458276e-07, + "loss": 0.6689, + "step": 75310 + }, + { + "epoch": 1.93, + "learning_rate": 5.959732798213956e-07, + "loss": 0.5825, + "step": 75311 + }, + { + "epoch": 1.93, + "learning_rate": 5.959479685063083e-07, + "loss": 0.6348, + "step": 75312 + }, + { + "epoch": 1.93, + "learning_rate": 5.959226575005852e-07, + "loss": 0.6201, + "step": 75313 + }, + { + "epoch": 1.93, + "learning_rate": 5.958973468042453e-07, + "loss": 0.7197, + "step": 75314 + }, + { + "epoch": 1.93, + "learning_rate": 5.958720364173087e-07, + "loss": 0.6865, + "step": 75315 + }, + { + "epoch": 1.93, + "learning_rate": 5.958467263397939e-07, + "loss": 0.5652, + "step": 75316 + }, + { + "epoch": 1.93, + "learning_rate": 5.958214165717206e-07, + "loss": 0.8242, + "step": 75317 + }, + { + "epoch": 1.93, + "learning_rate": 5.957961071131086e-07, + "loss": 0.6304, + "step": 75318 + }, + { + "epoch": 1.93, + "learning_rate": 5.957707979639768e-07, + "loss": 0.4639, + "step": 75319 + }, + { + "epoch": 1.93, + "learning_rate": 5.957454891243445e-07, + "loss": 0.5972, + "step": 75320 + }, + { + "epoch": 1.93, + "learning_rate": 5.957201805942314e-07, + "loss": 0.6479, + "step": 75321 + }, + { + "epoch": 1.93, + "learning_rate": 5.956948723736567e-07, + "loss": 0.6777, + "step": 75322 + }, + { + "epoch": 1.93, + "learning_rate": 5.9566956446264e-07, + "loss": 0.5662, + "step": 75323 + }, + { + "epoch": 1.93, + "learning_rate": 5.956442568612003e-07, + "loss": 0.6494, + "step": 75324 + }, + { + "epoch": 1.93, + "learning_rate": 5.956189495693577e-07, + "loss": 0.6676, + "step": 75325 + }, + { + "epoch": 1.93, + "learning_rate": 5.955936425871308e-07, + "loss": 0.6919, + "step": 75326 + }, + { + "epoch": 1.93, + "learning_rate": 5.955683359145391e-07, + "loss": 0.5415, + "step": 75327 + }, + { + "epoch": 1.93, + "learning_rate": 5.955430295516023e-07, + "loss": 0.4222, + "step": 75328 + }, + { + "epoch": 1.93, + "learning_rate": 5.955177234983394e-07, + "loss": 0.574, + "step": 75329 + }, + { + "epoch": 1.93, + "learning_rate": 5.954924177547702e-07, + "loss": 0.7266, + "step": 75330 + }, + { + "epoch": 1.93, + "learning_rate": 5.954671123209137e-07, + "loss": 0.5674, + "step": 75331 + }, + { + "epoch": 1.93, + "learning_rate": 5.954418071967895e-07, + "loss": 0.6086, + "step": 75332 + }, + { + "epoch": 1.93, + "learning_rate": 5.954165023824167e-07, + "loss": 0.6821, + "step": 75333 + }, + { + "epoch": 1.93, + "learning_rate": 5.953911978778152e-07, + "loss": 0.6387, + "step": 75334 + }, + { + "epoch": 1.93, + "learning_rate": 5.953658936830042e-07, + "loss": 0.6401, + "step": 75335 + }, + { + "epoch": 1.93, + "learning_rate": 5.953405897980029e-07, + "loss": 0.7129, + "step": 75336 + }, + { + "epoch": 1.93, + "learning_rate": 5.953152862228302e-07, + "loss": 0.6211, + "step": 75337 + }, + { + "epoch": 1.93, + "learning_rate": 5.952899829575063e-07, + "loss": 0.4875, + "step": 75338 + }, + { + "epoch": 1.93, + "learning_rate": 5.952646800020501e-07, + "loss": 0.6313, + "step": 75339 + }, + { + "epoch": 1.93, + "learning_rate": 5.952393773564813e-07, + "loss": 0.6387, + "step": 75340 + }, + { + "epoch": 1.93, + "learning_rate": 5.952140750208189e-07, + "loss": 0.6423, + "step": 75341 + }, + { + "epoch": 1.93, + "learning_rate": 5.951887729950826e-07, + "loss": 0.6816, + "step": 75342 + }, + { + "epoch": 1.93, + "learning_rate": 5.951634712792915e-07, + "loss": 0.7422, + "step": 75343 + }, + { + "epoch": 1.93, + "learning_rate": 5.951381698734655e-07, + "loss": 0.5142, + "step": 75344 + }, + { + "epoch": 1.93, + "learning_rate": 5.951128687776235e-07, + "loss": 0.4788, + "step": 75345 + }, + { + "epoch": 1.93, + "learning_rate": 5.950875679917847e-07, + "loss": 0.7549, + "step": 75346 + }, + { + "epoch": 1.93, + "learning_rate": 5.950622675159689e-07, + "loss": 0.6367, + "step": 75347 + }, + { + "epoch": 1.93, + "learning_rate": 5.950369673501952e-07, + "loss": 0.7021, + "step": 75348 + }, + { + "epoch": 1.93, + "learning_rate": 5.950116674944831e-07, + "loss": 0.6528, + "step": 75349 + }, + { + "epoch": 1.93, + "learning_rate": 5.949863679488518e-07, + "loss": 0.7188, + "step": 75350 + }, + { + "epoch": 1.93, + "learning_rate": 5.949610687133211e-07, + "loss": 0.5046, + "step": 75351 + }, + { + "epoch": 1.93, + "learning_rate": 5.949357697879097e-07, + "loss": 0.519, + "step": 75352 + }, + { + "epoch": 1.93, + "learning_rate": 5.949104711726377e-07, + "loss": 0.7197, + "step": 75353 + }, + { + "epoch": 1.93, + "learning_rate": 5.94885172867524e-07, + "loss": 0.6006, + "step": 75354 + }, + { + "epoch": 1.93, + "learning_rate": 5.948598748725886e-07, + "loss": 0.4858, + "step": 75355 + }, + { + "epoch": 1.93, + "learning_rate": 5.948345771878496e-07, + "loss": 0.7812, + "step": 75356 + }, + { + "epoch": 1.93, + "learning_rate": 5.948092798133275e-07, + "loss": 0.7454, + "step": 75357 + }, + { + "epoch": 1.93, + "learning_rate": 5.947839827490412e-07, + "loss": 0.6089, + "step": 75358 + }, + { + "epoch": 1.93, + "learning_rate": 5.947586859950102e-07, + "loss": 0.3855, + "step": 75359 + }, + { + "epoch": 1.93, + "learning_rate": 5.947333895512537e-07, + "loss": 0.6523, + "step": 75360 + }, + { + "epoch": 1.93, + "learning_rate": 5.947080934177915e-07, + "loss": 0.4526, + "step": 75361 + }, + { + "epoch": 1.93, + "learning_rate": 5.946827975946425e-07, + "loss": 0.4893, + "step": 75362 + }, + { + "epoch": 1.93, + "learning_rate": 5.946575020818263e-07, + "loss": 0.6333, + "step": 75363 + }, + { + "epoch": 1.93, + "learning_rate": 5.946322068793623e-07, + "loss": 0.4192, + "step": 75364 + }, + { + "epoch": 1.93, + "learning_rate": 5.946069119872696e-07, + "loss": 0.6611, + "step": 75365 + }, + { + "epoch": 1.93, + "learning_rate": 5.945816174055679e-07, + "loss": 0.6577, + "step": 75366 + }, + { + "epoch": 1.93, + "learning_rate": 5.945563231342763e-07, + "loss": 0.6714, + "step": 75367 + }, + { + "epoch": 1.93, + "learning_rate": 5.945310291734142e-07, + "loss": 0.6553, + "step": 75368 + }, + { + "epoch": 1.93, + "learning_rate": 5.945057355230011e-07, + "loss": 0.5605, + "step": 75369 + }, + { + "epoch": 1.93, + "learning_rate": 5.944804421830565e-07, + "loss": 0.7246, + "step": 75370 + }, + { + "epoch": 1.93, + "learning_rate": 5.944551491535993e-07, + "loss": 0.6509, + "step": 75371 + }, + { + "epoch": 1.93, + "learning_rate": 5.944298564346493e-07, + "loss": 0.54, + "step": 75372 + }, + { + "epoch": 1.93, + "learning_rate": 5.944045640262256e-07, + "loss": 0.4839, + "step": 75373 + }, + { + "epoch": 1.93, + "learning_rate": 5.943792719283483e-07, + "loss": 0.5264, + "step": 75374 + }, + { + "epoch": 1.93, + "learning_rate": 5.943539801410354e-07, + "loss": 0.791, + "step": 75375 + }, + { + "epoch": 1.93, + "learning_rate": 5.943286886643072e-07, + "loss": 0.6343, + "step": 75376 + }, + { + "epoch": 1.93, + "learning_rate": 5.94303397498183e-07, + "loss": 0.4971, + "step": 75377 + }, + { + "epoch": 1.93, + "learning_rate": 5.942781066426819e-07, + "loss": 0.6309, + "step": 75378 + }, + { + "epoch": 1.93, + "learning_rate": 5.942528160978233e-07, + "loss": 0.7192, + "step": 75379 + }, + { + "epoch": 1.93, + "learning_rate": 5.942275258636269e-07, + "loss": 0.5439, + "step": 75380 + }, + { + "epoch": 1.93, + "learning_rate": 5.942022359401115e-07, + "loss": 0.5352, + "step": 75381 + }, + { + "epoch": 1.93, + "learning_rate": 5.941769463272971e-07, + "loss": 0.6445, + "step": 75382 + }, + { + "epoch": 1.93, + "learning_rate": 5.941516570252026e-07, + "loss": 0.5332, + "step": 75383 + }, + { + "epoch": 1.93, + "learning_rate": 5.941263680338477e-07, + "loss": 0.5938, + "step": 75384 + }, + { + "epoch": 1.93, + "learning_rate": 5.941010793532517e-07, + "loss": 0.4448, + "step": 75385 + }, + { + "epoch": 1.93, + "learning_rate": 5.940757909834333e-07, + "loss": 0.6201, + "step": 75386 + }, + { + "epoch": 1.93, + "learning_rate": 5.940505029244129e-07, + "loss": 0.6582, + "step": 75387 + }, + { + "epoch": 1.93, + "learning_rate": 5.940252151762088e-07, + "loss": 0.6377, + "step": 75388 + }, + { + "epoch": 1.93, + "learning_rate": 5.939999277388414e-07, + "loss": 0.6531, + "step": 75389 + }, + { + "epoch": 1.93, + "learning_rate": 5.939746406123294e-07, + "loss": 0.7334, + "step": 75390 + }, + { + "epoch": 1.93, + "learning_rate": 5.939493537966924e-07, + "loss": 0.4561, + "step": 75391 + }, + { + "epoch": 1.93, + "learning_rate": 5.939240672919499e-07, + "loss": 0.6855, + "step": 75392 + }, + { + "epoch": 1.93, + "learning_rate": 5.938987810981208e-07, + "loss": 0.6836, + "step": 75393 + }, + { + "epoch": 1.93, + "learning_rate": 5.938734952152251e-07, + "loss": 0.6616, + "step": 75394 + }, + { + "epoch": 1.93, + "learning_rate": 5.938482096432815e-07, + "loss": 0.6719, + "step": 75395 + }, + { + "epoch": 1.93, + "learning_rate": 5.938229243823097e-07, + "loss": 0.8438, + "step": 75396 + }, + { + "epoch": 1.93, + "learning_rate": 5.937976394323289e-07, + "loss": 0.709, + "step": 75397 + }, + { + "epoch": 1.93, + "learning_rate": 5.937723547933585e-07, + "loss": 0.7695, + "step": 75398 + }, + { + "epoch": 1.93, + "learning_rate": 5.937470704654181e-07, + "loss": 0.6152, + "step": 75399 + }, + { + "epoch": 1.93, + "learning_rate": 5.937217864485268e-07, + "loss": 0.6177, + "step": 75400 + }, + { + "epoch": 1.93, + "learning_rate": 5.936965027427042e-07, + "loss": 0.71, + "step": 75401 + }, + { + "epoch": 1.93, + "learning_rate": 5.936712193479693e-07, + "loss": 0.6699, + "step": 75402 + }, + { + "epoch": 1.93, + "learning_rate": 5.936459362643418e-07, + "loss": 0.585, + "step": 75403 + }, + { + "epoch": 1.93, + "learning_rate": 5.936206534918411e-07, + "loss": 0.8301, + "step": 75404 + }, + { + "epoch": 1.93, + "learning_rate": 5.935953710304862e-07, + "loss": 0.6719, + "step": 75405 + }, + { + "epoch": 1.93, + "learning_rate": 5.935700888802966e-07, + "loss": 0.6753, + "step": 75406 + }, + { + "epoch": 1.93, + "learning_rate": 5.935448070412916e-07, + "loss": 0.6099, + "step": 75407 + }, + { + "epoch": 1.93, + "learning_rate": 5.935195255134909e-07, + "loss": 0.7256, + "step": 75408 + }, + { + "epoch": 1.93, + "learning_rate": 5.934942442969135e-07, + "loss": 0.7119, + "step": 75409 + }, + { + "epoch": 1.93, + "learning_rate": 5.934689633915785e-07, + "loss": 0.4937, + "step": 75410 + }, + { + "epoch": 1.93, + "learning_rate": 5.934436827975063e-07, + "loss": 0.5542, + "step": 75411 + }, + { + "epoch": 1.93, + "learning_rate": 5.934184025147151e-07, + "loss": 0.6313, + "step": 75412 + }, + { + "epoch": 1.93, + "learning_rate": 5.933931225432248e-07, + "loss": 0.751, + "step": 75413 + }, + { + "epoch": 1.93, + "learning_rate": 5.933678428830551e-07, + "loss": 0.5435, + "step": 75414 + }, + { + "epoch": 1.93, + "learning_rate": 5.933425635342244e-07, + "loss": 0.5469, + "step": 75415 + }, + { + "epoch": 1.93, + "learning_rate": 5.933172844967529e-07, + "loss": 0.7607, + "step": 75416 + }, + { + "epoch": 1.93, + "learning_rate": 5.932920057706594e-07, + "loss": 0.5547, + "step": 75417 + }, + { + "epoch": 1.93, + "learning_rate": 5.932667273559638e-07, + "loss": 0.6562, + "step": 75418 + }, + { + "epoch": 1.93, + "learning_rate": 5.93241449252685e-07, + "loss": 0.7129, + "step": 75419 + }, + { + "epoch": 1.93, + "learning_rate": 5.932161714608426e-07, + "loss": 0.5537, + "step": 75420 + }, + { + "epoch": 1.93, + "learning_rate": 5.931908939804557e-07, + "loss": 0.6484, + "step": 75421 + }, + { + "epoch": 1.93, + "learning_rate": 5.93165616811544e-07, + "loss": 0.6182, + "step": 75422 + }, + { + "epoch": 1.93, + "learning_rate": 5.931403399541265e-07, + "loss": 0.7803, + "step": 75423 + }, + { + "epoch": 1.93, + "learning_rate": 5.931150634082232e-07, + "loss": 0.623, + "step": 75424 + }, + { + "epoch": 1.93, + "learning_rate": 5.930897871738528e-07, + "loss": 0.7676, + "step": 75425 + }, + { + "epoch": 1.93, + "learning_rate": 5.930645112510346e-07, + "loss": 0.432, + "step": 75426 + }, + { + "epoch": 1.93, + "learning_rate": 5.930392356397882e-07, + "loss": 0.5073, + "step": 75427 + }, + { + "epoch": 1.93, + "learning_rate": 5.930139603401331e-07, + "loss": 0.6304, + "step": 75428 + }, + { + "epoch": 1.93, + "learning_rate": 5.929886853520882e-07, + "loss": 0.6072, + "step": 75429 + }, + { + "epoch": 1.93, + "learning_rate": 5.929634106756735e-07, + "loss": 0.6274, + "step": 75430 + }, + { + "epoch": 1.93, + "learning_rate": 5.929381363109078e-07, + "loss": 0.8145, + "step": 75431 + }, + { + "epoch": 1.93, + "learning_rate": 5.929128622578108e-07, + "loss": 0.7041, + "step": 75432 + }, + { + "epoch": 1.93, + "learning_rate": 5.928875885164015e-07, + "loss": 0.5996, + "step": 75433 + }, + { + "epoch": 1.93, + "learning_rate": 5.928623150866998e-07, + "loss": 0.6348, + "step": 75434 + }, + { + "epoch": 1.93, + "learning_rate": 5.928370419687247e-07, + "loss": 0.6211, + "step": 75435 + }, + { + "epoch": 1.93, + "learning_rate": 5.928117691624952e-07, + "loss": 0.7129, + "step": 75436 + }, + { + "epoch": 1.93, + "learning_rate": 5.927864966680312e-07, + "loss": 0.6895, + "step": 75437 + }, + { + "epoch": 1.93, + "learning_rate": 5.927612244853517e-07, + "loss": 0.522, + "step": 75438 + }, + { + "epoch": 1.93, + "learning_rate": 5.927359526144764e-07, + "loss": 0.5024, + "step": 75439 + }, + { + "epoch": 1.93, + "learning_rate": 5.927106810554241e-07, + "loss": 0.7041, + "step": 75440 + }, + { + "epoch": 1.93, + "learning_rate": 5.926854098082149e-07, + "loss": 0.6187, + "step": 75441 + }, + { + "epoch": 1.93, + "learning_rate": 5.926601388728675e-07, + "loss": 0.6719, + "step": 75442 + }, + { + "epoch": 1.93, + "learning_rate": 5.926348682494018e-07, + "loss": 0.6436, + "step": 75443 + }, + { + "epoch": 1.93, + "learning_rate": 5.926095979378369e-07, + "loss": 0.6074, + "step": 75444 + }, + { + "epoch": 1.93, + "learning_rate": 5.92584327938192e-07, + "loss": 0.5903, + "step": 75445 + }, + { + "epoch": 1.93, + "learning_rate": 5.925590582504863e-07, + "loss": 0.5894, + "step": 75446 + }, + { + "epoch": 1.93, + "learning_rate": 5.925337888747395e-07, + "loss": 0.6343, + "step": 75447 + }, + { + "epoch": 1.93, + "learning_rate": 5.925085198109708e-07, + "loss": 0.5386, + "step": 75448 + }, + { + "epoch": 1.93, + "learning_rate": 5.924832510591996e-07, + "loss": 0.6875, + "step": 75449 + }, + { + "epoch": 1.93, + "learning_rate": 5.924579826194451e-07, + "loss": 0.7295, + "step": 75450 + }, + { + "epoch": 1.93, + "learning_rate": 5.924327144917272e-07, + "loss": 0.5205, + "step": 75451 + }, + { + "epoch": 1.93, + "learning_rate": 5.924074466760645e-07, + "loss": 0.6812, + "step": 75452 + }, + { + "epoch": 1.93, + "learning_rate": 5.923821791724767e-07, + "loss": 0.626, + "step": 75453 + }, + { + "epoch": 1.93, + "learning_rate": 5.923569119809835e-07, + "loss": 0.668, + "step": 75454 + }, + { + "epoch": 1.93, + "learning_rate": 5.923316451016033e-07, + "loss": 0.537, + "step": 75455 + }, + { + "epoch": 1.93, + "learning_rate": 5.923063785343565e-07, + "loss": 0.592, + "step": 75456 + }, + { + "epoch": 1.93, + "learning_rate": 5.922811122792617e-07, + "loss": 0.6973, + "step": 75457 + }, + { + "epoch": 1.93, + "learning_rate": 5.922558463363385e-07, + "loss": 0.498, + "step": 75458 + }, + { + "epoch": 1.93, + "learning_rate": 5.922305807056063e-07, + "loss": 0.7021, + "step": 75459 + }, + { + "epoch": 1.93, + "learning_rate": 5.922053153870842e-07, + "loss": 0.4595, + "step": 75460 + }, + { + "epoch": 1.93, + "learning_rate": 5.921800503807919e-07, + "loss": 0.6152, + "step": 75461 + }, + { + "epoch": 1.93, + "learning_rate": 5.921547856867488e-07, + "loss": 0.6025, + "step": 75462 + }, + { + "epoch": 1.93, + "learning_rate": 5.921295213049736e-07, + "loss": 0.6279, + "step": 75463 + }, + { + "epoch": 1.93, + "learning_rate": 5.921042572354868e-07, + "loss": 0.4834, + "step": 75464 + }, + { + "epoch": 1.93, + "learning_rate": 5.920789934783063e-07, + "loss": 0.6338, + "step": 75465 + }, + { + "epoch": 1.93, + "learning_rate": 5.920537300334526e-07, + "loss": 0.5503, + "step": 75466 + }, + { + "epoch": 1.93, + "learning_rate": 5.920284669009442e-07, + "loss": 0.6436, + "step": 75467 + }, + { + "epoch": 1.93, + "learning_rate": 5.920032040808012e-07, + "loss": 0.6201, + "step": 75468 + }, + { + "epoch": 1.93, + "learning_rate": 5.919779415730422e-07, + "loss": 0.666, + "step": 75469 + }, + { + "epoch": 1.93, + "learning_rate": 5.919526793776872e-07, + "loss": 0.7881, + "step": 75470 + }, + { + "epoch": 1.93, + "learning_rate": 5.91927417494755e-07, + "loss": 0.6562, + "step": 75471 + }, + { + "epoch": 1.93, + "learning_rate": 5.919021559242656e-07, + "loss": 0.6904, + "step": 75472 + }, + { + "epoch": 1.93, + "learning_rate": 5.918768946662377e-07, + "loss": 0.585, + "step": 75473 + }, + { + "epoch": 1.93, + "learning_rate": 5.918516337206912e-07, + "loss": 0.6187, + "step": 75474 + }, + { + "epoch": 1.93, + "learning_rate": 5.91826373087645e-07, + "loss": 0.5488, + "step": 75475 + }, + { + "epoch": 1.93, + "learning_rate": 5.918011127671184e-07, + "loss": 0.5615, + "step": 75476 + }, + { + "epoch": 1.93, + "learning_rate": 5.91775852759131e-07, + "loss": 0.5269, + "step": 75477 + }, + { + "epoch": 1.93, + "learning_rate": 5.91750593063702e-07, + "loss": 0.6807, + "step": 75478 + }, + { + "epoch": 1.93, + "learning_rate": 5.91725333680851e-07, + "loss": 0.585, + "step": 75479 + }, + { + "epoch": 1.93, + "learning_rate": 5.917000746105968e-07, + "loss": 0.7412, + "step": 75480 + }, + { + "epoch": 1.93, + "learning_rate": 5.916748158529594e-07, + "loss": 0.5046, + "step": 75481 + }, + { + "epoch": 1.93, + "learning_rate": 5.916495574079577e-07, + "loss": 0.6528, + "step": 75482 + }, + { + "epoch": 1.93, + "learning_rate": 5.916242992756111e-07, + "loss": 0.6934, + "step": 75483 + }, + { + "epoch": 1.93, + "learning_rate": 5.915990414559393e-07, + "loss": 0.457, + "step": 75484 + }, + { + "epoch": 1.93, + "learning_rate": 5.915737839489611e-07, + "loss": 0.7168, + "step": 75485 + }, + { + "epoch": 1.93, + "learning_rate": 5.91548526754696e-07, + "loss": 0.6631, + "step": 75486 + }, + { + "epoch": 1.93, + "learning_rate": 5.915232698731636e-07, + "loss": 0.5635, + "step": 75487 + }, + { + "epoch": 1.93, + "learning_rate": 5.914980133043827e-07, + "loss": 0.8467, + "step": 75488 + }, + { + "epoch": 1.93, + "learning_rate": 5.914727570483732e-07, + "loss": 0.5143, + "step": 75489 + }, + { + "epoch": 1.93, + "learning_rate": 5.914475011051543e-07, + "loss": 0.6628, + "step": 75490 + }, + { + "epoch": 1.93, + "learning_rate": 5.914222454747453e-07, + "loss": 0.5273, + "step": 75491 + }, + { + "epoch": 1.93, + "learning_rate": 5.913969901571651e-07, + "loss": 0.6484, + "step": 75492 + }, + { + "epoch": 1.93, + "learning_rate": 5.913717351524339e-07, + "loss": 0.5977, + "step": 75493 + }, + { + "epoch": 1.93, + "learning_rate": 5.913464804605708e-07, + "loss": 0.6045, + "step": 75494 + }, + { + "epoch": 1.93, + "learning_rate": 5.913212260815943e-07, + "loss": 0.4956, + "step": 75495 + }, + { + "epoch": 1.94, + "learning_rate": 5.912959720155246e-07, + "loss": 0.624, + "step": 75496 + }, + { + "epoch": 1.94, + "learning_rate": 5.912707182623807e-07, + "loss": 0.7451, + "step": 75497 + }, + { + "epoch": 1.94, + "learning_rate": 5.912454648221821e-07, + "loss": 0.603, + "step": 75498 + }, + { + "epoch": 1.94, + "learning_rate": 5.912202116949481e-07, + "loss": 0.7007, + "step": 75499 + }, + { + "epoch": 1.94, + "learning_rate": 5.911949588806977e-07, + "loss": 0.5571, + "step": 75500 + }, + { + "epoch": 1.94, + "learning_rate": 5.911697063794509e-07, + "loss": 0.6597, + "step": 75501 + }, + { + "epoch": 1.94, + "learning_rate": 5.911444541912263e-07, + "loss": 0.5649, + "step": 75502 + }, + { + "epoch": 1.94, + "learning_rate": 5.911192023160438e-07, + "loss": 0.6353, + "step": 75503 + }, + { + "epoch": 1.94, + "learning_rate": 5.910939507539229e-07, + "loss": 0.5498, + "step": 75504 + }, + { + "epoch": 1.94, + "learning_rate": 5.91068699504882e-07, + "loss": 0.6504, + "step": 75505 + }, + { + "epoch": 1.94, + "learning_rate": 5.910434485689413e-07, + "loss": 0.6533, + "step": 75506 + }, + { + "epoch": 1.94, + "learning_rate": 5.910181979461195e-07, + "loss": 0.6982, + "step": 75507 + }, + { + "epoch": 1.94, + "learning_rate": 5.909929476364366e-07, + "loss": 0.7148, + "step": 75508 + }, + { + "epoch": 1.94, + "learning_rate": 5.909676976399111e-07, + "loss": 0.6094, + "step": 75509 + }, + { + "epoch": 1.94, + "learning_rate": 5.909424479565635e-07, + "loss": 0.7197, + "step": 75510 + }, + { + "epoch": 1.94, + "learning_rate": 5.909171985864119e-07, + "loss": 0.5942, + "step": 75511 + }, + { + "epoch": 1.94, + "learning_rate": 5.908919495294764e-07, + "loss": 0.5708, + "step": 75512 + }, + { + "epoch": 1.94, + "learning_rate": 5.908667007857761e-07, + "loss": 0.6123, + "step": 75513 + }, + { + "epoch": 1.94, + "learning_rate": 5.908414523553307e-07, + "loss": 0.6201, + "step": 75514 + }, + { + "epoch": 1.94, + "learning_rate": 5.908162042381588e-07, + "loss": 0.6597, + "step": 75515 + }, + { + "epoch": 1.94, + "learning_rate": 5.907909564342803e-07, + "loss": 0.5527, + "step": 75516 + }, + { + "epoch": 1.94, + "learning_rate": 5.907657089437142e-07, + "loss": 0.7188, + "step": 75517 + }, + { + "epoch": 1.94, + "learning_rate": 5.9074046176648e-07, + "loss": 0.6191, + "step": 75518 + }, + { + "epoch": 1.94, + "learning_rate": 5.907152149025969e-07, + "loss": 0.7627, + "step": 75519 + }, + { + "epoch": 1.94, + "learning_rate": 5.906899683520846e-07, + "loss": 0.4459, + "step": 75520 + }, + { + "epoch": 1.94, + "learning_rate": 5.906647221149619e-07, + "loss": 0.5859, + "step": 75521 + }, + { + "epoch": 1.94, + "learning_rate": 5.906394761912487e-07, + "loss": 0.6416, + "step": 75522 + }, + { + "epoch": 1.94, + "learning_rate": 5.906142305809638e-07, + "loss": 0.5591, + "step": 75523 + }, + { + "epoch": 1.94, + "learning_rate": 5.90588985284127e-07, + "loss": 0.5087, + "step": 75524 + }, + { + "epoch": 1.94, + "learning_rate": 5.905637403007572e-07, + "loss": 0.5693, + "step": 75525 + }, + { + "epoch": 1.94, + "learning_rate": 5.905384956308738e-07, + "loss": 0.6543, + "step": 75526 + }, + { + "epoch": 1.94, + "learning_rate": 5.905132512744966e-07, + "loss": 0.5, + "step": 75527 + }, + { + "epoch": 1.94, + "learning_rate": 5.904880072316443e-07, + "loss": 0.5913, + "step": 75528 + }, + { + "epoch": 1.94, + "learning_rate": 5.904627635023366e-07, + "loss": 0.543, + "step": 75529 + }, + { + "epoch": 1.94, + "learning_rate": 5.904375200865925e-07, + "loss": 0.5874, + "step": 75530 + }, + { + "epoch": 1.94, + "learning_rate": 5.904122769844318e-07, + "loss": 0.6514, + "step": 75531 + }, + { + "epoch": 1.94, + "learning_rate": 5.903870341958735e-07, + "loss": 0.708, + "step": 75532 + }, + { + "epoch": 1.94, + "learning_rate": 5.903617917209371e-07, + "loss": 0.5967, + "step": 75533 + }, + { + "epoch": 1.94, + "learning_rate": 5.903365495596421e-07, + "loss": 0.3521, + "step": 75534 + }, + { + "epoch": 1.94, + "learning_rate": 5.903113077120073e-07, + "loss": 0.5946, + "step": 75535 + }, + { + "epoch": 1.94, + "learning_rate": 5.902860661780522e-07, + "loss": 0.6641, + "step": 75536 + }, + { + "epoch": 1.94, + "learning_rate": 5.902608249577962e-07, + "loss": 0.7148, + "step": 75537 + }, + { + "epoch": 1.94, + "learning_rate": 5.902355840512587e-07, + "loss": 0.6973, + "step": 75538 + }, + { + "epoch": 1.94, + "learning_rate": 5.902103434584591e-07, + "loss": 0.7881, + "step": 75539 + }, + { + "epoch": 1.94, + "learning_rate": 5.901851031794162e-07, + "loss": 0.9854, + "step": 75540 + }, + { + "epoch": 1.94, + "learning_rate": 5.901598632141502e-07, + "loss": 0.481, + "step": 75541 + }, + { + "epoch": 1.94, + "learning_rate": 5.901346235626796e-07, + "loss": 0.4386, + "step": 75542 + }, + { + "epoch": 1.94, + "learning_rate": 5.901093842250244e-07, + "loss": 0.8652, + "step": 75543 + }, + { + "epoch": 1.94, + "learning_rate": 5.900841452012037e-07, + "loss": 0.6348, + "step": 75544 + }, + { + "epoch": 1.94, + "learning_rate": 5.900589064912362e-07, + "loss": 0.6099, + "step": 75545 + }, + { + "epoch": 1.94, + "learning_rate": 5.900336680951421e-07, + "loss": 0.6265, + "step": 75546 + }, + { + "epoch": 1.94, + "learning_rate": 5.900084300129402e-07, + "loss": 0.7178, + "step": 75547 + }, + { + "epoch": 1.94, + "learning_rate": 5.899831922446501e-07, + "loss": 0.7217, + "step": 75548 + }, + { + "epoch": 1.94, + "learning_rate": 5.899579547902909e-07, + "loss": 0.585, + "step": 75549 + }, + { + "epoch": 1.94, + "learning_rate": 5.899327176498822e-07, + "loss": 0.6309, + "step": 75550 + }, + { + "epoch": 1.94, + "learning_rate": 5.89907480823443e-07, + "loss": 0.5347, + "step": 75551 + }, + { + "epoch": 1.94, + "learning_rate": 5.898822443109928e-07, + "loss": 0.4399, + "step": 75552 + }, + { + "epoch": 1.94, + "learning_rate": 5.89857008112551e-07, + "loss": 0.5317, + "step": 75553 + }, + { + "epoch": 1.94, + "learning_rate": 5.898317722281372e-07, + "loss": 0.6201, + "step": 75554 + }, + { + "epoch": 1.94, + "learning_rate": 5.898065366577698e-07, + "loss": 0.6797, + "step": 75555 + }, + { + "epoch": 1.94, + "learning_rate": 5.897813014014689e-07, + "loss": 0.7339, + "step": 75556 + }, + { + "epoch": 1.94, + "learning_rate": 5.897560664592535e-07, + "loss": 0.6602, + "step": 75557 + }, + { + "epoch": 1.94, + "learning_rate": 5.897308318311431e-07, + "loss": 0.5291, + "step": 75558 + }, + { + "epoch": 1.94, + "learning_rate": 5.897055975171567e-07, + "loss": 0.4624, + "step": 75559 + }, + { + "epoch": 1.94, + "learning_rate": 5.896803635173142e-07, + "loss": 0.6367, + "step": 75560 + }, + { + "epoch": 1.94, + "learning_rate": 5.896551298316342e-07, + "loss": 0.4941, + "step": 75561 + }, + { + "epoch": 1.94, + "learning_rate": 5.896298964601367e-07, + "loss": 0.6074, + "step": 75562 + }, + { + "epoch": 1.94, + "learning_rate": 5.896046634028404e-07, + "loss": 0.6328, + "step": 75563 + }, + { + "epoch": 1.94, + "learning_rate": 5.895794306597656e-07, + "loss": 0.605, + "step": 75564 + }, + { + "epoch": 1.94, + "learning_rate": 5.895541982309305e-07, + "loss": 0.6157, + "step": 75565 + }, + { + "epoch": 1.94, + "learning_rate": 5.895289661163549e-07, + "loss": 0.751, + "step": 75566 + }, + { + "epoch": 1.94, + "learning_rate": 5.895037343160582e-07, + "loss": 0.5903, + "step": 75567 + }, + { + "epoch": 1.94, + "learning_rate": 5.894785028300593e-07, + "loss": 0.326, + "step": 75568 + }, + { + "epoch": 1.94, + "learning_rate": 5.894532716583782e-07, + "loss": 0.7617, + "step": 75569 + }, + { + "epoch": 1.94, + "learning_rate": 5.894280408010334e-07, + "loss": 0.6313, + "step": 75570 + }, + { + "epoch": 1.94, + "learning_rate": 5.894028102580451e-07, + "loss": 0.666, + "step": 75571 + }, + { + "epoch": 1.94, + "learning_rate": 5.893775800294323e-07, + "loss": 0.5742, + "step": 75572 + }, + { + "epoch": 1.94, + "learning_rate": 5.893523501152138e-07, + "loss": 0.4209, + "step": 75573 + }, + { + "epoch": 1.94, + "learning_rate": 5.893271205154097e-07, + "loss": 0.4971, + "step": 75574 + }, + { + "epoch": 1.94, + "learning_rate": 5.893018912300389e-07, + "loss": 0.5464, + "step": 75575 + }, + { + "epoch": 1.94, + "learning_rate": 5.892766622591205e-07, + "loss": 0.626, + "step": 75576 + }, + { + "epoch": 1.94, + "learning_rate": 5.892514336026741e-07, + "loss": 0.6094, + "step": 75577 + }, + { + "epoch": 1.94, + "learning_rate": 5.89226205260719e-07, + "loss": 0.6895, + "step": 75578 + }, + { + "epoch": 1.94, + "learning_rate": 5.892009772332746e-07, + "loss": 0.6377, + "step": 75579 + }, + { + "epoch": 1.94, + "learning_rate": 5.8917574952036e-07, + "loss": 0.5315, + "step": 75580 + }, + { + "epoch": 1.94, + "learning_rate": 5.891505221219948e-07, + "loss": 0.6182, + "step": 75581 + }, + { + "epoch": 1.94, + "learning_rate": 5.89125295038198e-07, + "loss": 0.5601, + "step": 75582 + }, + { + "epoch": 1.94, + "learning_rate": 5.891000682689892e-07, + "loss": 0.606, + "step": 75583 + }, + { + "epoch": 1.94, + "learning_rate": 5.890748418143878e-07, + "loss": 0.6733, + "step": 75584 + }, + { + "epoch": 1.94, + "learning_rate": 5.890496156744125e-07, + "loss": 0.6377, + "step": 75585 + }, + { + "epoch": 1.94, + "learning_rate": 5.890243898490832e-07, + "loss": 0.5393, + "step": 75586 + }, + { + "epoch": 1.94, + "learning_rate": 5.889991643384189e-07, + "loss": 0.6924, + "step": 75587 + }, + { + "epoch": 1.94, + "learning_rate": 5.889739391424391e-07, + "loss": 0.7476, + "step": 75588 + }, + { + "epoch": 1.94, + "learning_rate": 5.889487142611631e-07, + "loss": 0.5605, + "step": 75589 + }, + { + "epoch": 1.94, + "learning_rate": 5.889234896946101e-07, + "loss": 0.5081, + "step": 75590 + }, + { + "epoch": 1.94, + "learning_rate": 5.888982654427996e-07, + "loss": 0.667, + "step": 75591 + }, + { + "epoch": 1.94, + "learning_rate": 5.888730415057506e-07, + "loss": 0.6191, + "step": 75592 + }, + { + "epoch": 1.94, + "learning_rate": 5.888478178834828e-07, + "loss": 0.7207, + "step": 75593 + }, + { + "epoch": 1.94, + "learning_rate": 5.888225945760154e-07, + "loss": 0.4307, + "step": 75594 + }, + { + "epoch": 1.94, + "learning_rate": 5.887973715833674e-07, + "loss": 0.4771, + "step": 75595 + }, + { + "epoch": 1.94, + "learning_rate": 5.887721489055586e-07, + "loss": 0.666, + "step": 75596 + }, + { + "epoch": 1.94, + "learning_rate": 5.887469265426078e-07, + "loss": 0.5132, + "step": 75597 + }, + { + "epoch": 1.94, + "learning_rate": 5.887217044945346e-07, + "loss": 0.6064, + "step": 75598 + }, + { + "epoch": 1.94, + "learning_rate": 5.886964827613582e-07, + "loss": 0.6221, + "step": 75599 + }, + { + "epoch": 1.94, + "learning_rate": 5.886712613430982e-07, + "loss": 0.832, + "step": 75600 + }, + { + "epoch": 1.94, + "learning_rate": 5.886460402397735e-07, + "loss": 0.6021, + "step": 75601 + }, + { + "epoch": 1.94, + "learning_rate": 5.886208194514038e-07, + "loss": 0.647, + "step": 75602 + }, + { + "epoch": 1.94, + "learning_rate": 5.88595598978008e-07, + "loss": 0.592, + "step": 75603 + }, + { + "epoch": 1.94, + "learning_rate": 5.885703788196061e-07, + "loss": 0.6802, + "step": 75604 + }, + { + "epoch": 1.94, + "learning_rate": 5.885451589762167e-07, + "loss": 0.6216, + "step": 75605 + }, + { + "epoch": 1.94, + "learning_rate": 5.885199394478591e-07, + "loss": 0.6528, + "step": 75606 + }, + { + "epoch": 1.94, + "learning_rate": 5.884947202345531e-07, + "loss": 0.7393, + "step": 75607 + }, + { + "epoch": 1.94, + "learning_rate": 5.884695013363179e-07, + "loss": 0.7471, + "step": 75608 + }, + { + "epoch": 1.94, + "learning_rate": 5.884442827531723e-07, + "loss": 0.5532, + "step": 75609 + }, + { + "epoch": 1.94, + "learning_rate": 5.884190644851364e-07, + "loss": 0.6636, + "step": 75610 + }, + { + "epoch": 1.94, + "learning_rate": 5.883938465322287e-07, + "loss": 0.5857, + "step": 75611 + }, + { + "epoch": 1.94, + "learning_rate": 5.883686288944692e-07, + "loss": 0.6045, + "step": 75612 + }, + { + "epoch": 1.94, + "learning_rate": 5.883434115718766e-07, + "loss": 0.5723, + "step": 75613 + }, + { + "epoch": 1.94, + "learning_rate": 5.883181945644711e-07, + "loss": 0.6313, + "step": 75614 + }, + { + "epoch": 1.94, + "learning_rate": 5.88292977872271e-07, + "loss": 0.7305, + "step": 75615 + }, + { + "epoch": 1.94, + "learning_rate": 5.88267761495296e-07, + "loss": 0.7715, + "step": 75616 + }, + { + "epoch": 1.94, + "learning_rate": 5.882425454335656e-07, + "loss": 0.5786, + "step": 75617 + }, + { + "epoch": 1.94, + "learning_rate": 5.882173296870987e-07, + "loss": 0.6338, + "step": 75618 + }, + { + "epoch": 1.94, + "learning_rate": 5.881921142559151e-07, + "loss": 0.5806, + "step": 75619 + }, + { + "epoch": 1.94, + "learning_rate": 5.881668991400337e-07, + "loss": 0.6201, + "step": 75620 + }, + { + "epoch": 1.94, + "learning_rate": 5.881416843394742e-07, + "loss": 0.6992, + "step": 75621 + }, + { + "epoch": 1.94, + "learning_rate": 5.881164698542553e-07, + "loss": 0.7959, + "step": 75622 + }, + { + "epoch": 1.94, + "learning_rate": 5.880912556843971e-07, + "loss": 0.5188, + "step": 75623 + }, + { + "epoch": 1.94, + "learning_rate": 5.880660418299186e-07, + "loss": 0.54, + "step": 75624 + }, + { + "epoch": 1.94, + "learning_rate": 5.880408282908388e-07, + "loss": 0.4346, + "step": 75625 + }, + { + "epoch": 1.94, + "learning_rate": 5.880156150671769e-07, + "loss": 0.6416, + "step": 75626 + }, + { + "epoch": 1.94, + "learning_rate": 5.879904021589528e-07, + "loss": 0.5562, + "step": 75627 + }, + { + "epoch": 1.94, + "learning_rate": 5.879651895661853e-07, + "loss": 0.7139, + "step": 75628 + }, + { + "epoch": 1.94, + "learning_rate": 5.87939977288894e-07, + "loss": 0.707, + "step": 75629 + }, + { + "epoch": 1.94, + "learning_rate": 5.879147653270981e-07, + "loss": 0.5605, + "step": 75630 + }, + { + "epoch": 1.94, + "learning_rate": 5.878895536808169e-07, + "loss": 0.7021, + "step": 75631 + }, + { + "epoch": 1.94, + "learning_rate": 5.878643423500698e-07, + "loss": 0.6943, + "step": 75632 + }, + { + "epoch": 1.94, + "learning_rate": 5.878391313348759e-07, + "loss": 0.7656, + "step": 75633 + }, + { + "epoch": 1.94, + "learning_rate": 5.87813920635255e-07, + "loss": 0.6367, + "step": 75634 + }, + { + "epoch": 1.94, + "learning_rate": 5.877887102512256e-07, + "loss": 0.5537, + "step": 75635 + }, + { + "epoch": 1.94, + "learning_rate": 5.877635001828077e-07, + "loss": 0.6504, + "step": 75636 + }, + { + "epoch": 1.94, + "learning_rate": 5.877382904300201e-07, + "loss": 0.5293, + "step": 75637 + }, + { + "epoch": 1.94, + "learning_rate": 5.877130809928824e-07, + "loss": 0.6362, + "step": 75638 + }, + { + "epoch": 1.94, + "learning_rate": 5.876878718714138e-07, + "loss": 0.6606, + "step": 75639 + }, + { + "epoch": 1.94, + "learning_rate": 5.876626630656338e-07, + "loss": 0.5034, + "step": 75640 + }, + { + "epoch": 1.94, + "learning_rate": 5.876374545755613e-07, + "loss": 0.5845, + "step": 75641 + }, + { + "epoch": 1.94, + "learning_rate": 5.876122464012161e-07, + "loss": 0.7178, + "step": 75642 + }, + { + "epoch": 1.94, + "learning_rate": 5.875870385426169e-07, + "loss": 0.582, + "step": 75643 + }, + { + "epoch": 1.94, + "learning_rate": 5.87561830999784e-07, + "loss": 0.7007, + "step": 75644 + }, + { + "epoch": 1.94, + "learning_rate": 5.875366237727355e-07, + "loss": 0.6543, + "step": 75645 + }, + { + "epoch": 1.94, + "learning_rate": 5.875114168614914e-07, + "loss": 0.5098, + "step": 75646 + }, + { + "epoch": 1.94, + "learning_rate": 5.874862102660707e-07, + "loss": 0.5845, + "step": 75647 + }, + { + "epoch": 1.94, + "learning_rate": 5.874610039864931e-07, + "loss": 0.6787, + "step": 75648 + }, + { + "epoch": 1.94, + "learning_rate": 5.874357980227773e-07, + "loss": 0.6631, + "step": 75649 + }, + { + "epoch": 1.94, + "learning_rate": 5.874105923749431e-07, + "loss": 0.5332, + "step": 75650 + }, + { + "epoch": 1.94, + "learning_rate": 5.873853870430097e-07, + "loss": 0.7334, + "step": 75651 + }, + { + "epoch": 1.94, + "learning_rate": 5.873601820269962e-07, + "loss": 0.5723, + "step": 75652 + }, + { + "epoch": 1.94, + "learning_rate": 5.87334977326922e-07, + "loss": 0.7153, + "step": 75653 + }, + { + "epoch": 1.94, + "learning_rate": 5.873097729428069e-07, + "loss": 0.5767, + "step": 75654 + }, + { + "epoch": 1.94, + "learning_rate": 5.872845688746695e-07, + "loss": 0.5884, + "step": 75655 + }, + { + "epoch": 1.94, + "learning_rate": 5.872593651225291e-07, + "loss": 0.5542, + "step": 75656 + }, + { + "epoch": 1.94, + "learning_rate": 5.872341616864054e-07, + "loss": 0.6138, + "step": 75657 + }, + { + "epoch": 1.94, + "learning_rate": 5.872089585663174e-07, + "loss": 0.5942, + "step": 75658 + }, + { + "epoch": 1.94, + "learning_rate": 5.871837557622846e-07, + "loss": 0.6279, + "step": 75659 + }, + { + "epoch": 1.94, + "learning_rate": 5.87158553274326e-07, + "loss": 0.7607, + "step": 75660 + }, + { + "epoch": 1.94, + "learning_rate": 5.871333511024615e-07, + "loss": 0.3912, + "step": 75661 + }, + { + "epoch": 1.94, + "learning_rate": 5.871081492467099e-07, + "loss": 0.4185, + "step": 75662 + }, + { + "epoch": 1.94, + "learning_rate": 5.870829477070906e-07, + "loss": 0.5806, + "step": 75663 + }, + { + "epoch": 1.94, + "learning_rate": 5.870577464836229e-07, + "loss": 0.5659, + "step": 75664 + }, + { + "epoch": 1.94, + "learning_rate": 5.870325455763259e-07, + "loss": 0.563, + "step": 75665 + }, + { + "epoch": 1.94, + "learning_rate": 5.870073449852191e-07, + "loss": 0.6382, + "step": 75666 + }, + { + "epoch": 1.94, + "learning_rate": 5.86982144710322e-07, + "loss": 0.4446, + "step": 75667 + }, + { + "epoch": 1.94, + "learning_rate": 5.869569447516535e-07, + "loss": 0.5708, + "step": 75668 + }, + { + "epoch": 1.94, + "learning_rate": 5.869317451092333e-07, + "loss": 0.5391, + "step": 75669 + }, + { + "epoch": 1.94, + "learning_rate": 5.869065457830802e-07, + "loss": 0.7993, + "step": 75670 + }, + { + "epoch": 1.94, + "learning_rate": 5.868813467732139e-07, + "loss": 0.6484, + "step": 75671 + }, + { + "epoch": 1.94, + "learning_rate": 5.868561480796534e-07, + "loss": 0.6406, + "step": 75672 + }, + { + "epoch": 1.94, + "learning_rate": 5.868309497024187e-07, + "loss": 0.6172, + "step": 75673 + }, + { + "epoch": 1.94, + "learning_rate": 5.868057516415281e-07, + "loss": 0.7686, + "step": 75674 + }, + { + "epoch": 1.94, + "learning_rate": 5.867805538970012e-07, + "loss": 0.6924, + "step": 75675 + }, + { + "epoch": 1.94, + "learning_rate": 5.867553564688576e-07, + "loss": 0.627, + "step": 75676 + }, + { + "epoch": 1.94, + "learning_rate": 5.867301593571164e-07, + "loss": 0.666, + "step": 75677 + }, + { + "epoch": 1.94, + "learning_rate": 5.867049625617971e-07, + "loss": 0.6016, + "step": 75678 + }, + { + "epoch": 1.94, + "learning_rate": 5.866797660829186e-07, + "loss": 0.5679, + "step": 75679 + }, + { + "epoch": 1.94, + "learning_rate": 5.866545699205003e-07, + "loss": 0.3542, + "step": 75680 + }, + { + "epoch": 1.94, + "learning_rate": 5.866293740745618e-07, + "loss": 0.563, + "step": 75681 + }, + { + "epoch": 1.94, + "learning_rate": 5.866041785451221e-07, + "loss": 0.6895, + "step": 75682 + }, + { + "epoch": 1.94, + "learning_rate": 5.865789833322008e-07, + "loss": 0.708, + "step": 75683 + }, + { + "epoch": 1.94, + "learning_rate": 5.86553788435817e-07, + "loss": 0.6382, + "step": 75684 + }, + { + "epoch": 1.94, + "learning_rate": 5.865285938559895e-07, + "loss": 0.4395, + "step": 75685 + }, + { + "epoch": 1.94, + "learning_rate": 5.865033995927382e-07, + "loss": 0.7373, + "step": 75686 + }, + { + "epoch": 1.94, + "learning_rate": 5.864782056460822e-07, + "loss": 0.6689, + "step": 75687 + }, + { + "epoch": 1.94, + "learning_rate": 5.864530120160409e-07, + "loss": 0.7725, + "step": 75688 + }, + { + "epoch": 1.94, + "learning_rate": 5.864278187026334e-07, + "loss": 0.7002, + "step": 75689 + }, + { + "epoch": 1.94, + "learning_rate": 5.864026257058794e-07, + "loss": 0.645, + "step": 75690 + }, + { + "epoch": 1.94, + "learning_rate": 5.863774330257975e-07, + "loss": 0.6025, + "step": 75691 + }, + { + "epoch": 1.94, + "learning_rate": 5.863522406624077e-07, + "loss": 0.4135, + "step": 75692 + }, + { + "epoch": 1.94, + "learning_rate": 5.863270486157293e-07, + "loss": 0.6118, + "step": 75693 + }, + { + "epoch": 1.94, + "learning_rate": 5.863018568857805e-07, + "loss": 0.6382, + "step": 75694 + }, + { + "epoch": 1.94, + "learning_rate": 5.862766654725818e-07, + "loss": 0.4839, + "step": 75695 + }, + { + "epoch": 1.94, + "learning_rate": 5.862514743761517e-07, + "loss": 0.6729, + "step": 75696 + }, + { + "epoch": 1.94, + "learning_rate": 5.862262835965102e-07, + "loss": 0.7148, + "step": 75697 + }, + { + "epoch": 1.94, + "learning_rate": 5.86201093133676e-07, + "loss": 0.6523, + "step": 75698 + }, + { + "epoch": 1.94, + "learning_rate": 5.861759029876685e-07, + "loss": 0.5464, + "step": 75699 + }, + { + "epoch": 1.94, + "learning_rate": 5.861507131585074e-07, + "loss": 0.8037, + "step": 75700 + }, + { + "epoch": 1.94, + "learning_rate": 5.861255236462112e-07, + "loss": 0.5498, + "step": 75701 + }, + { + "epoch": 1.94, + "learning_rate": 5.861003344508002e-07, + "loss": 0.6689, + "step": 75702 + }, + { + "epoch": 1.94, + "learning_rate": 5.860751455722931e-07, + "loss": 0.6992, + "step": 75703 + }, + { + "epoch": 1.94, + "learning_rate": 5.860499570107089e-07, + "loss": 0.6992, + "step": 75704 + }, + { + "epoch": 1.94, + "learning_rate": 5.860247687660673e-07, + "loss": 0.7627, + "step": 75705 + }, + { + "epoch": 1.94, + "learning_rate": 5.859995808383875e-07, + "loss": 0.6689, + "step": 75706 + }, + { + "epoch": 1.94, + "learning_rate": 5.859743932276889e-07, + "loss": 0.5613, + "step": 75707 + }, + { + "epoch": 1.94, + "learning_rate": 5.859492059339904e-07, + "loss": 0.6357, + "step": 75708 + }, + { + "epoch": 1.94, + "learning_rate": 5.859240189573118e-07, + "loss": 0.646, + "step": 75709 + }, + { + "epoch": 1.94, + "learning_rate": 5.858988322976719e-07, + "loss": 0.4102, + "step": 75710 + }, + { + "epoch": 1.94, + "learning_rate": 5.858736459550905e-07, + "loss": 0.6729, + "step": 75711 + }, + { + "epoch": 1.94, + "learning_rate": 5.858484599295864e-07, + "loss": 0.6543, + "step": 75712 + }, + { + "epoch": 1.94, + "learning_rate": 5.858232742211795e-07, + "loss": 0.4817, + "step": 75713 + }, + { + "epoch": 1.94, + "learning_rate": 5.857980888298884e-07, + "loss": 0.7676, + "step": 75714 + }, + { + "epoch": 1.94, + "learning_rate": 5.857729037557327e-07, + "loss": 0.7344, + "step": 75715 + }, + { + "epoch": 1.94, + "learning_rate": 5.857477189987314e-07, + "loss": 0.7666, + "step": 75716 + }, + { + "epoch": 1.94, + "learning_rate": 5.857225345589043e-07, + "loss": 0.7793, + "step": 75717 + }, + { + "epoch": 1.94, + "learning_rate": 5.856973504362701e-07, + "loss": 0.4387, + "step": 75718 + }, + { + "epoch": 1.94, + "learning_rate": 5.856721666308486e-07, + "loss": 0.6836, + "step": 75719 + }, + { + "epoch": 1.94, + "learning_rate": 5.856469831426588e-07, + "loss": 0.4746, + "step": 75720 + }, + { + "epoch": 1.94, + "learning_rate": 5.856217999717202e-07, + "loss": 0.6313, + "step": 75721 + }, + { + "epoch": 1.94, + "learning_rate": 5.855966171180518e-07, + "loss": 0.5518, + "step": 75722 + }, + { + "epoch": 1.94, + "learning_rate": 5.855714345816733e-07, + "loss": 0.6284, + "step": 75723 + }, + { + "epoch": 1.94, + "learning_rate": 5.855462523626035e-07, + "loss": 0.3071, + "step": 75724 + }, + { + "epoch": 1.94, + "learning_rate": 5.855210704608617e-07, + "loss": 0.5205, + "step": 75725 + }, + { + "epoch": 1.94, + "learning_rate": 5.854958888764675e-07, + "loss": 0.7852, + "step": 75726 + }, + { + "epoch": 1.94, + "learning_rate": 5.854707076094399e-07, + "loss": 0.7861, + "step": 75727 + }, + { + "epoch": 1.94, + "learning_rate": 5.854455266597986e-07, + "loss": 0.6553, + "step": 75728 + }, + { + "epoch": 1.94, + "learning_rate": 5.854203460275622e-07, + "loss": 0.7451, + "step": 75729 + }, + { + "epoch": 1.94, + "learning_rate": 5.853951657127507e-07, + "loss": 0.627, + "step": 75730 + }, + { + "epoch": 1.94, + "learning_rate": 5.853699857153829e-07, + "loss": 0.5942, + "step": 75731 + }, + { + "epoch": 1.94, + "learning_rate": 5.853448060354784e-07, + "loss": 0.3667, + "step": 75732 + }, + { + "epoch": 1.94, + "learning_rate": 5.853196266730565e-07, + "loss": 0.4402, + "step": 75733 + }, + { + "epoch": 1.94, + "learning_rate": 5.85294447628136e-07, + "loss": 0.7031, + "step": 75734 + }, + { + "epoch": 1.94, + "learning_rate": 5.852692689007365e-07, + "loss": 0.8857, + "step": 75735 + }, + { + "epoch": 1.94, + "learning_rate": 5.852440904908773e-07, + "loss": 0.626, + "step": 75736 + }, + { + "epoch": 1.94, + "learning_rate": 5.852189123985773e-07, + "loss": 0.7432, + "step": 75737 + }, + { + "epoch": 1.94, + "learning_rate": 5.851937346238566e-07, + "loss": 0.6821, + "step": 75738 + }, + { + "epoch": 1.94, + "learning_rate": 5.851685571667337e-07, + "loss": 0.7021, + "step": 75739 + }, + { + "epoch": 1.94, + "learning_rate": 5.851433800272283e-07, + "loss": 0.6562, + "step": 75740 + }, + { + "epoch": 1.94, + "learning_rate": 5.851182032053592e-07, + "loss": 0.6582, + "step": 75741 + }, + { + "epoch": 1.94, + "learning_rate": 5.850930267011465e-07, + "loss": 0.4833, + "step": 75742 + }, + { + "epoch": 1.94, + "learning_rate": 5.850678505146089e-07, + "loss": 0.5981, + "step": 75743 + }, + { + "epoch": 1.94, + "learning_rate": 5.850426746457657e-07, + "loss": 0.6504, + "step": 75744 + }, + { + "epoch": 1.94, + "learning_rate": 5.850174990946362e-07, + "loss": 0.5425, + "step": 75745 + }, + { + "epoch": 1.94, + "learning_rate": 5.849923238612395e-07, + "loss": 0.6948, + "step": 75746 + }, + { + "epoch": 1.94, + "learning_rate": 5.849671489455953e-07, + "loss": 0.8047, + "step": 75747 + }, + { + "epoch": 1.94, + "learning_rate": 5.849419743477226e-07, + "loss": 0.519, + "step": 75748 + }, + { + "epoch": 1.94, + "learning_rate": 5.849168000676409e-07, + "loss": 0.6162, + "step": 75749 + }, + { + "epoch": 1.94, + "learning_rate": 5.848916261053691e-07, + "loss": 0.6025, + "step": 75750 + }, + { + "epoch": 1.94, + "learning_rate": 5.84866452460927e-07, + "loss": 0.623, + "step": 75751 + }, + { + "epoch": 1.94, + "learning_rate": 5.848412791343334e-07, + "loss": 0.5443, + "step": 75752 + }, + { + "epoch": 1.94, + "learning_rate": 5.848161061256081e-07, + "loss": 0.7197, + "step": 75753 + }, + { + "epoch": 1.94, + "learning_rate": 5.847909334347694e-07, + "loss": 0.6396, + "step": 75754 + }, + { + "epoch": 1.94, + "learning_rate": 5.847657610618376e-07, + "loss": 0.5159, + "step": 75755 + }, + { + "epoch": 1.94, + "learning_rate": 5.847405890068313e-07, + "loss": 0.4595, + "step": 75756 + }, + { + "epoch": 1.94, + "learning_rate": 5.847154172697702e-07, + "loss": 0.6101, + "step": 75757 + }, + { + "epoch": 1.94, + "learning_rate": 5.846902458506732e-07, + "loss": 0.7188, + "step": 75758 + }, + { + "epoch": 1.94, + "learning_rate": 5.8466507474956e-07, + "loss": 0.3779, + "step": 75759 + }, + { + "epoch": 1.94, + "learning_rate": 5.846399039664495e-07, + "loss": 0.5786, + "step": 75760 + }, + { + "epoch": 1.94, + "learning_rate": 5.846147335013614e-07, + "loss": 0.6572, + "step": 75761 + }, + { + "epoch": 1.94, + "learning_rate": 5.845895633543143e-07, + "loss": 0.7119, + "step": 75762 + }, + { + "epoch": 1.94, + "learning_rate": 5.845643935253283e-07, + "loss": 0.6738, + "step": 75763 + }, + { + "epoch": 1.94, + "learning_rate": 5.845392240144223e-07, + "loss": 0.5415, + "step": 75764 + }, + { + "epoch": 1.94, + "learning_rate": 5.84514054821615e-07, + "loss": 0.5227, + "step": 75765 + }, + { + "epoch": 1.94, + "learning_rate": 5.844888859469266e-07, + "loss": 0.6553, + "step": 75766 + }, + { + "epoch": 1.94, + "learning_rate": 5.844637173903756e-07, + "loss": 0.6191, + "step": 75767 + }, + { + "epoch": 1.94, + "learning_rate": 5.844385491519819e-07, + "loss": 0.6543, + "step": 75768 + }, + { + "epoch": 1.94, + "learning_rate": 5.844133812317642e-07, + "loss": 0.4963, + "step": 75769 + }, + { + "epoch": 1.94, + "learning_rate": 5.843882136297424e-07, + "loss": 0.8564, + "step": 75770 + }, + { + "epoch": 1.94, + "learning_rate": 5.843630463459355e-07, + "loss": 0.6709, + "step": 75771 + }, + { + "epoch": 1.94, + "learning_rate": 5.843378793803623e-07, + "loss": 0.7461, + "step": 75772 + }, + { + "epoch": 1.94, + "learning_rate": 5.84312712733043e-07, + "loss": 0.6118, + "step": 75773 + }, + { + "epoch": 1.94, + "learning_rate": 5.842875464039961e-07, + "loss": 0.7041, + "step": 75774 + }, + { + "epoch": 1.94, + "learning_rate": 5.842623803932408e-07, + "loss": 0.5239, + "step": 75775 + }, + { + "epoch": 1.94, + "learning_rate": 5.84237214700797e-07, + "loss": 0.4886, + "step": 75776 + }, + { + "epoch": 1.94, + "learning_rate": 5.842120493266835e-07, + "loss": 0.6396, + "step": 75777 + }, + { + "epoch": 1.94, + "learning_rate": 5.841868842709199e-07, + "loss": 0.7666, + "step": 75778 + }, + { + "epoch": 1.94, + "learning_rate": 5.841617195335249e-07, + "loss": 0.7559, + "step": 75779 + }, + { + "epoch": 1.94, + "learning_rate": 5.841365551145185e-07, + "loss": 0.4878, + "step": 75780 + }, + { + "epoch": 1.94, + "learning_rate": 5.841113910139195e-07, + "loss": 0.6157, + "step": 75781 + }, + { + "epoch": 1.94, + "learning_rate": 5.840862272317473e-07, + "loss": 0.6958, + "step": 75782 + }, + { + "epoch": 1.94, + "learning_rate": 5.840610637680214e-07, + "loss": 0.6611, + "step": 75783 + }, + { + "epoch": 1.94, + "learning_rate": 5.840359006227606e-07, + "loss": 0.5142, + "step": 75784 + }, + { + "epoch": 1.94, + "learning_rate": 5.840107377959844e-07, + "loss": 0.7373, + "step": 75785 + }, + { + "epoch": 1.94, + "learning_rate": 5.839855752877119e-07, + "loss": 0.6836, + "step": 75786 + }, + { + "epoch": 1.94, + "learning_rate": 5.839604130979628e-07, + "loss": 0.6509, + "step": 75787 + }, + { + "epoch": 1.94, + "learning_rate": 5.839352512267559e-07, + "loss": 0.5396, + "step": 75788 + }, + { + "epoch": 1.94, + "learning_rate": 5.839100896741105e-07, + "loss": 0.6548, + "step": 75789 + }, + { + "epoch": 1.94, + "learning_rate": 5.838849284400462e-07, + "loss": 0.6709, + "step": 75790 + }, + { + "epoch": 1.94, + "learning_rate": 5.83859767524582e-07, + "loss": 0.5801, + "step": 75791 + }, + { + "epoch": 1.94, + "learning_rate": 5.838346069277371e-07, + "loss": 0.5728, + "step": 75792 + }, + { + "epoch": 1.94, + "learning_rate": 5.838094466495313e-07, + "loss": 0.6729, + "step": 75793 + }, + { + "epoch": 1.94, + "learning_rate": 5.837842866899836e-07, + "loss": 0.4056, + "step": 75794 + }, + { + "epoch": 1.94, + "learning_rate": 5.837591270491127e-07, + "loss": 0.6572, + "step": 75795 + }, + { + "epoch": 1.94, + "learning_rate": 5.837339677269383e-07, + "loss": 0.709, + "step": 75796 + }, + { + "epoch": 1.94, + "learning_rate": 5.837088087234796e-07, + "loss": 0.5156, + "step": 75797 + }, + { + "epoch": 1.94, + "learning_rate": 5.836836500387563e-07, + "loss": 0.6191, + "step": 75798 + }, + { + "epoch": 1.94, + "learning_rate": 5.83658491672787e-07, + "loss": 0.4673, + "step": 75799 + }, + { + "epoch": 1.94, + "learning_rate": 5.836333336255912e-07, + "loss": 0.5693, + "step": 75800 + }, + { + "epoch": 1.94, + "learning_rate": 5.836081758971882e-07, + "loss": 0.5142, + "step": 75801 + }, + { + "epoch": 1.94, + "learning_rate": 5.835830184875976e-07, + "loss": 0.562, + "step": 75802 + }, + { + "epoch": 1.94, + "learning_rate": 5.835578613968385e-07, + "loss": 0.575, + "step": 75803 + }, + { + "epoch": 1.94, + "learning_rate": 5.835327046249295e-07, + "loss": 0.7236, + "step": 75804 + }, + { + "epoch": 1.94, + "learning_rate": 5.835075481718903e-07, + "loss": 0.8018, + "step": 75805 + }, + { + "epoch": 1.94, + "learning_rate": 5.834823920377407e-07, + "loss": 0.6802, + "step": 75806 + }, + { + "epoch": 1.94, + "learning_rate": 5.834572362224992e-07, + "loss": 0.4214, + "step": 75807 + }, + { + "epoch": 1.94, + "learning_rate": 5.834320807261852e-07, + "loss": 0.71, + "step": 75808 + }, + { + "epoch": 1.94, + "learning_rate": 5.834069255488181e-07, + "loss": 0.4207, + "step": 75809 + }, + { + "epoch": 1.94, + "learning_rate": 5.833817706904177e-07, + "loss": 0.6616, + "step": 75810 + }, + { + "epoch": 1.94, + "learning_rate": 5.83356616151002e-07, + "loss": 0.5337, + "step": 75811 + }, + { + "epoch": 1.94, + "learning_rate": 5.833314619305911e-07, + "loss": 0.624, + "step": 75812 + }, + { + "epoch": 1.94, + "learning_rate": 5.833063080292046e-07, + "loss": 0.5747, + "step": 75813 + }, + { + "epoch": 1.94, + "learning_rate": 5.83281154446861e-07, + "loss": 0.6172, + "step": 75814 + }, + { + "epoch": 1.94, + "learning_rate": 5.832560011835803e-07, + "loss": 0.5051, + "step": 75815 + }, + { + "epoch": 1.94, + "learning_rate": 5.832308482393806e-07, + "loss": 0.522, + "step": 75816 + }, + { + "epoch": 1.94, + "learning_rate": 5.832056956142822e-07, + "loss": 0.5664, + "step": 75817 + }, + { + "epoch": 1.94, + "learning_rate": 5.831805433083039e-07, + "loss": 0.5695, + "step": 75818 + }, + { + "epoch": 1.94, + "learning_rate": 5.831553913214655e-07, + "loss": 0.8105, + "step": 75819 + }, + { + "epoch": 1.94, + "learning_rate": 5.831302396537854e-07, + "loss": 0.5596, + "step": 75820 + }, + { + "epoch": 1.94, + "learning_rate": 5.831050883052834e-07, + "loss": 0.707, + "step": 75821 + }, + { + "epoch": 1.94, + "learning_rate": 5.830799372759785e-07, + "loss": 0.6221, + "step": 75822 + }, + { + "epoch": 1.94, + "learning_rate": 5.830547865658911e-07, + "loss": 0.4919, + "step": 75823 + }, + { + "epoch": 1.94, + "learning_rate": 5.830296361750386e-07, + "loss": 0.509, + "step": 75824 + }, + { + "epoch": 1.94, + "learning_rate": 5.830044861034411e-07, + "loss": 0.4536, + "step": 75825 + }, + { + "epoch": 1.94, + "learning_rate": 5.82979336351118e-07, + "loss": 0.791, + "step": 75826 + }, + { + "epoch": 1.94, + "learning_rate": 5.829541869180887e-07, + "loss": 0.5352, + "step": 75827 + }, + { + "epoch": 1.94, + "learning_rate": 5.82929037804372e-07, + "loss": 0.6406, + "step": 75828 + }, + { + "epoch": 1.94, + "learning_rate": 5.829038890099872e-07, + "loss": 0.6162, + "step": 75829 + }, + { + "epoch": 1.94, + "learning_rate": 5.828787405349537e-07, + "loss": 0.666, + "step": 75830 + }, + { + "epoch": 1.94, + "learning_rate": 5.828535923792914e-07, + "loss": 0.7559, + "step": 75831 + }, + { + "epoch": 1.94, + "learning_rate": 5.828284445430183e-07, + "loss": 0.6274, + "step": 75832 + }, + { + "epoch": 1.94, + "learning_rate": 5.828032970261547e-07, + "loss": 0.9492, + "step": 75833 + }, + { + "epoch": 1.94, + "learning_rate": 5.827781498287191e-07, + "loss": 0.5581, + "step": 75834 + }, + { + "epoch": 1.94, + "learning_rate": 5.82753002950731e-07, + "loss": 0.5591, + "step": 75835 + }, + { + "epoch": 1.94, + "learning_rate": 5.827278563922102e-07, + "loss": 0.6304, + "step": 75836 + }, + { + "epoch": 1.94, + "learning_rate": 5.827027101531751e-07, + "loss": 0.6523, + "step": 75837 + }, + { + "epoch": 1.94, + "learning_rate": 5.826775642336453e-07, + "loss": 0.564, + "step": 75838 + }, + { + "epoch": 1.94, + "learning_rate": 5.826524186336401e-07, + "loss": 0.6865, + "step": 75839 + }, + { + "epoch": 1.94, + "learning_rate": 5.826272733531793e-07, + "loss": 0.4863, + "step": 75840 + }, + { + "epoch": 1.94, + "learning_rate": 5.826021283922811e-07, + "loss": 0.6453, + "step": 75841 + }, + { + "epoch": 1.94, + "learning_rate": 5.825769837509652e-07, + "loss": 0.7354, + "step": 75842 + }, + { + "epoch": 1.94, + "learning_rate": 5.825518394292513e-07, + "loss": 0.4583, + "step": 75843 + }, + { + "epoch": 1.94, + "learning_rate": 5.825266954271584e-07, + "loss": 0.5693, + "step": 75844 + }, + { + "epoch": 1.94, + "learning_rate": 5.825015517447052e-07, + "loss": 0.5054, + "step": 75845 + }, + { + "epoch": 1.94, + "learning_rate": 5.824764083819112e-07, + "loss": 0.6885, + "step": 75846 + }, + { + "epoch": 1.94, + "learning_rate": 5.82451265338796e-07, + "loss": 0.8838, + "step": 75847 + }, + { + "epoch": 1.94, + "learning_rate": 5.824261226153789e-07, + "loss": 0.5469, + "step": 75848 + }, + { + "epoch": 1.94, + "learning_rate": 5.824009802116786e-07, + "loss": 0.8281, + "step": 75849 + }, + { + "epoch": 1.94, + "learning_rate": 5.823758381277146e-07, + "loss": 0.5581, + "step": 75850 + }, + { + "epoch": 1.94, + "learning_rate": 5.823506963635063e-07, + "loss": 0.4688, + "step": 75851 + }, + { + "epoch": 1.94, + "learning_rate": 5.823255549190733e-07, + "loss": 0.6147, + "step": 75852 + }, + { + "epoch": 1.94, + "learning_rate": 5.823004137944344e-07, + "loss": 0.7129, + "step": 75853 + }, + { + "epoch": 1.94, + "learning_rate": 5.822752729896084e-07, + "loss": 0.4068, + "step": 75854 + }, + { + "epoch": 1.94, + "learning_rate": 5.822501325046151e-07, + "loss": 0.4951, + "step": 75855 + }, + { + "epoch": 1.94, + "learning_rate": 5.822249923394735e-07, + "loss": 0.5449, + "step": 75856 + }, + { + "epoch": 1.94, + "learning_rate": 5.821998524942036e-07, + "loss": 0.7197, + "step": 75857 + }, + { + "epoch": 1.94, + "learning_rate": 5.821747129688237e-07, + "loss": 0.7422, + "step": 75858 + }, + { + "epoch": 1.94, + "learning_rate": 5.821495737633532e-07, + "loss": 0.3264, + "step": 75859 + }, + { + "epoch": 1.94, + "learning_rate": 5.82124434877812e-07, + "loss": 0.3811, + "step": 75860 + }, + { + "epoch": 1.94, + "learning_rate": 5.820992963122187e-07, + "loss": 0.6392, + "step": 75861 + }, + { + "epoch": 1.94, + "learning_rate": 5.820741580665925e-07, + "loss": 0.5271, + "step": 75862 + }, + { + "epoch": 1.94, + "learning_rate": 5.820490201409534e-07, + "loss": 0.5732, + "step": 75863 + }, + { + "epoch": 1.94, + "learning_rate": 5.820238825353199e-07, + "loss": 0.502, + "step": 75864 + }, + { + "epoch": 1.94, + "learning_rate": 5.819987452497117e-07, + "loss": 0.5811, + "step": 75865 + }, + { + "epoch": 1.94, + "learning_rate": 5.819736082841476e-07, + "loss": 0.5991, + "step": 75866 + }, + { + "epoch": 1.94, + "learning_rate": 5.819484716386469e-07, + "loss": 0.5308, + "step": 75867 + }, + { + "epoch": 1.94, + "learning_rate": 5.819233353132291e-07, + "loss": 0.5, + "step": 75868 + }, + { + "epoch": 1.94, + "learning_rate": 5.818981993079139e-07, + "loss": 0.5591, + "step": 75869 + }, + { + "epoch": 1.94, + "learning_rate": 5.818730636227195e-07, + "loss": 0.4521, + "step": 75870 + }, + { + "epoch": 1.94, + "learning_rate": 5.818479282576656e-07, + "loss": 0.5942, + "step": 75871 + }, + { + "epoch": 1.94, + "learning_rate": 5.818227932127717e-07, + "loss": 0.5747, + "step": 75872 + }, + { + "epoch": 1.94, + "learning_rate": 5.817976584880571e-07, + "loss": 0.8018, + "step": 75873 + }, + { + "epoch": 1.94, + "learning_rate": 5.817725240835409e-07, + "loss": 0.6104, + "step": 75874 + }, + { + "epoch": 1.94, + "learning_rate": 5.817473899992417e-07, + "loss": 0.5762, + "step": 75875 + }, + { + "epoch": 1.94, + "learning_rate": 5.817222562351796e-07, + "loss": 0.5913, + "step": 75876 + }, + { + "epoch": 1.94, + "learning_rate": 5.816971227913736e-07, + "loss": 0.5308, + "step": 75877 + }, + { + "epoch": 1.94, + "learning_rate": 5.816719896678427e-07, + "loss": 0.5464, + "step": 75878 + }, + { + "epoch": 1.94, + "learning_rate": 5.816468568646062e-07, + "loss": 0.6539, + "step": 75879 + }, + { + "epoch": 1.94, + "learning_rate": 5.816217243816835e-07, + "loss": 0.5557, + "step": 75880 + }, + { + "epoch": 1.94, + "learning_rate": 5.815965922190943e-07, + "loss": 0.6367, + "step": 75881 + }, + { + "epoch": 1.94, + "learning_rate": 5.815714603768569e-07, + "loss": 0.7451, + "step": 75882 + }, + { + "epoch": 1.94, + "learning_rate": 5.815463288549913e-07, + "loss": 0.5367, + "step": 75883 + }, + { + "epoch": 1.94, + "learning_rate": 5.815211976535162e-07, + "loss": 0.582, + "step": 75884 + }, + { + "epoch": 1.94, + "learning_rate": 5.814960667724509e-07, + "loss": 0.6138, + "step": 75885 + }, + { + "epoch": 1.94, + "learning_rate": 5.814709362118153e-07, + "loss": 0.6055, + "step": 75886 + }, + { + "epoch": 1.95, + "learning_rate": 5.814458059716278e-07, + "loss": 0.5305, + "step": 75887 + }, + { + "epoch": 1.95, + "learning_rate": 5.814206760519078e-07, + "loss": 0.4893, + "step": 75888 + }, + { + "epoch": 1.95, + "learning_rate": 5.813955464526749e-07, + "loss": 0.7039, + "step": 75889 + }, + { + "epoch": 1.95, + "learning_rate": 5.813704171739486e-07, + "loss": 0.6211, + "step": 75890 + }, + { + "epoch": 1.95, + "learning_rate": 5.813452882157473e-07, + "loss": 0.6523, + "step": 75891 + }, + { + "epoch": 1.95, + "learning_rate": 5.813201595780908e-07, + "loss": 0.4622, + "step": 75892 + }, + { + "epoch": 1.95, + "learning_rate": 5.812950312609983e-07, + "loss": 0.6797, + "step": 75893 + }, + { + "epoch": 1.95, + "learning_rate": 5.812699032644892e-07, + "loss": 0.6367, + "step": 75894 + }, + { + "epoch": 1.95, + "learning_rate": 5.81244775588582e-07, + "loss": 0.501, + "step": 75895 + }, + { + "epoch": 1.95, + "learning_rate": 5.812196482332964e-07, + "loss": 0.6221, + "step": 75896 + }, + { + "epoch": 1.95, + "learning_rate": 5.811945211986516e-07, + "loss": 0.6514, + "step": 75897 + }, + { + "epoch": 1.95, + "learning_rate": 5.811693944846674e-07, + "loss": 0.4612, + "step": 75898 + }, + { + "epoch": 1.95, + "learning_rate": 5.81144268091362e-07, + "loss": 0.7793, + "step": 75899 + }, + { + "epoch": 1.95, + "learning_rate": 5.811191420187553e-07, + "loss": 0.4712, + "step": 75900 + }, + { + "epoch": 1.95, + "learning_rate": 5.810940162668664e-07, + "loss": 0.791, + "step": 75901 + }, + { + "epoch": 1.95, + "learning_rate": 5.81068890835715e-07, + "loss": 0.6943, + "step": 75902 + }, + { + "epoch": 1.95, + "learning_rate": 5.810437657253199e-07, + "loss": 0.5625, + "step": 75903 + }, + { + "epoch": 1.95, + "learning_rate": 5.810186409356998e-07, + "loss": 0.6777, + "step": 75904 + }, + { + "epoch": 1.95, + "learning_rate": 5.809935164668744e-07, + "loss": 0.6748, + "step": 75905 + }, + { + "epoch": 1.95, + "learning_rate": 5.809683923188633e-07, + "loss": 0.6162, + "step": 75906 + }, + { + "epoch": 1.95, + "learning_rate": 5.809432684916855e-07, + "loss": 0.4971, + "step": 75907 + }, + { + "epoch": 1.95, + "learning_rate": 5.8091814498536e-07, + "loss": 0.667, + "step": 75908 + }, + { + "epoch": 1.95, + "learning_rate": 5.808930217999062e-07, + "loss": 0.5571, + "step": 75909 + }, + { + "epoch": 1.95, + "learning_rate": 5.808678989353432e-07, + "loss": 0.8145, + "step": 75910 + }, + { + "epoch": 1.95, + "learning_rate": 5.808427763916908e-07, + "loss": 0.4998, + "step": 75911 + }, + { + "epoch": 1.95, + "learning_rate": 5.808176541689675e-07, + "loss": 0.6182, + "step": 75912 + }, + { + "epoch": 1.95, + "learning_rate": 5.807925322671932e-07, + "loss": 0.707, + "step": 75913 + }, + { + "epoch": 1.95, + "learning_rate": 5.807674106863863e-07, + "loss": 0.833, + "step": 75914 + }, + { + "epoch": 1.95, + "learning_rate": 5.80742289426567e-07, + "loss": 0.6699, + "step": 75915 + }, + { + "epoch": 1.95, + "learning_rate": 5.807171684877537e-07, + "loss": 0.3777, + "step": 75916 + }, + { + "epoch": 1.95, + "learning_rate": 5.80692047869966e-07, + "loss": 0.4114, + "step": 75917 + }, + { + "epoch": 1.95, + "learning_rate": 5.80666927573223e-07, + "loss": 0.7588, + "step": 75918 + }, + { + "epoch": 1.95, + "learning_rate": 5.806418075975445e-07, + "loss": 0.6255, + "step": 75919 + }, + { + "epoch": 1.95, + "learning_rate": 5.806166879429488e-07, + "loss": 0.6655, + "step": 75920 + }, + { + "epoch": 1.95, + "learning_rate": 5.805915686094558e-07, + "loss": 0.5771, + "step": 75921 + }, + { + "epoch": 1.95, + "learning_rate": 5.805664495970845e-07, + "loss": 0.606, + "step": 75922 + }, + { + "epoch": 1.95, + "learning_rate": 5.805413309058544e-07, + "loss": 0.6387, + "step": 75923 + }, + { + "epoch": 1.95, + "learning_rate": 5.805162125357848e-07, + "loss": 0.6807, + "step": 75924 + }, + { + "epoch": 1.95, + "learning_rate": 5.804910944868941e-07, + "loss": 0.793, + "step": 75925 + }, + { + "epoch": 1.95, + "learning_rate": 5.80465976759202e-07, + "loss": 0.7451, + "step": 75926 + }, + { + "epoch": 1.95, + "learning_rate": 5.804408593527279e-07, + "loss": 0.5879, + "step": 75927 + }, + { + "epoch": 1.95, + "learning_rate": 5.804157422674913e-07, + "loss": 0.626, + "step": 75928 + }, + { + "epoch": 1.95, + "learning_rate": 5.80390625503511e-07, + "loss": 0.667, + "step": 75929 + }, + { + "epoch": 1.95, + "learning_rate": 5.803655090608059e-07, + "loss": 0.5713, + "step": 75930 + }, + { + "epoch": 1.95, + "learning_rate": 5.803403929393957e-07, + "loss": 0.7119, + "step": 75931 + }, + { + "epoch": 1.95, + "learning_rate": 5.803152771393001e-07, + "loss": 0.6328, + "step": 75932 + }, + { + "epoch": 1.95, + "learning_rate": 5.802901616605375e-07, + "loss": 0.6572, + "step": 75933 + }, + { + "epoch": 1.95, + "learning_rate": 5.802650465031273e-07, + "loss": 0.4995, + "step": 75934 + }, + { + "epoch": 1.95, + "learning_rate": 5.802399316670889e-07, + "loss": 0.4304, + "step": 75935 + }, + { + "epoch": 1.95, + "learning_rate": 5.802148171524417e-07, + "loss": 0.6201, + "step": 75936 + }, + { + "epoch": 1.95, + "learning_rate": 5.801897029592044e-07, + "loss": 0.5262, + "step": 75937 + }, + { + "epoch": 1.95, + "learning_rate": 5.801645890873965e-07, + "loss": 0.7842, + "step": 75938 + }, + { + "epoch": 1.95, + "learning_rate": 5.801394755370373e-07, + "loss": 0.5615, + "step": 75939 + }, + { + "epoch": 1.95, + "learning_rate": 5.801143623081465e-07, + "loss": 0.7305, + "step": 75940 + }, + { + "epoch": 1.95, + "learning_rate": 5.800892494007423e-07, + "loss": 0.7339, + "step": 75941 + }, + { + "epoch": 1.95, + "learning_rate": 5.800641368148444e-07, + "loss": 0.6729, + "step": 75942 + }, + { + "epoch": 1.95, + "learning_rate": 5.800390245504726e-07, + "loss": 0.5503, + "step": 75943 + }, + { + "epoch": 1.95, + "learning_rate": 5.80013912607645e-07, + "loss": 0.7568, + "step": 75944 + }, + { + "epoch": 1.95, + "learning_rate": 5.799888009863822e-07, + "loss": 0.6953, + "step": 75945 + }, + { + "epoch": 1.95, + "learning_rate": 5.79963689686702e-07, + "loss": 0.4664, + "step": 75946 + }, + { + "epoch": 1.95, + "learning_rate": 5.799385787086244e-07, + "loss": 0.7607, + "step": 75947 + }, + { + "epoch": 1.95, + "learning_rate": 5.799134680521684e-07, + "loss": 0.563, + "step": 75948 + }, + { + "epoch": 1.95, + "learning_rate": 5.798883577173539e-07, + "loss": 0.833, + "step": 75949 + }, + { + "epoch": 1.95, + "learning_rate": 5.798632477041991e-07, + "loss": 0.6641, + "step": 75950 + }, + { + "epoch": 1.95, + "learning_rate": 5.798381380127236e-07, + "loss": 0.7031, + "step": 75951 + }, + { + "epoch": 1.95, + "learning_rate": 5.798130286429472e-07, + "loss": 0.6118, + "step": 75952 + }, + { + "epoch": 1.95, + "learning_rate": 5.797879195948887e-07, + "loss": 0.751, + "step": 75953 + }, + { + "epoch": 1.95, + "learning_rate": 5.797628108685667e-07, + "loss": 0.6228, + "step": 75954 + }, + { + "epoch": 1.95, + "learning_rate": 5.797377024640012e-07, + "loss": 0.7969, + "step": 75955 + }, + { + "epoch": 1.95, + "learning_rate": 5.79712594381211e-07, + "loss": 0.6636, + "step": 75956 + }, + { + "epoch": 1.95, + "learning_rate": 5.79687486620216e-07, + "loss": 0.6689, + "step": 75957 + }, + { + "epoch": 1.95, + "learning_rate": 5.796623791810347e-07, + "loss": 0.6631, + "step": 75958 + }, + { + "epoch": 1.95, + "learning_rate": 5.796372720636865e-07, + "loss": 0.707, + "step": 75959 + }, + { + "epoch": 1.95, + "learning_rate": 5.796121652681906e-07, + "loss": 0.708, + "step": 75960 + }, + { + "epoch": 1.95, + "learning_rate": 5.79587058794567e-07, + "loss": 0.4731, + "step": 75961 + }, + { + "epoch": 1.95, + "learning_rate": 5.795619526428341e-07, + "loss": 0.6143, + "step": 75962 + }, + { + "epoch": 1.95, + "learning_rate": 5.795368468130109e-07, + "loss": 0.5244, + "step": 75963 + }, + { + "epoch": 1.95, + "learning_rate": 5.795117413051169e-07, + "loss": 0.5212, + "step": 75964 + }, + { + "epoch": 1.95, + "learning_rate": 5.794866361191714e-07, + "loss": 0.5513, + "step": 75965 + }, + { + "epoch": 1.95, + "learning_rate": 5.794615312551942e-07, + "loss": 0.71, + "step": 75966 + }, + { + "epoch": 1.95, + "learning_rate": 5.794364267132037e-07, + "loss": 0.6104, + "step": 75967 + }, + { + "epoch": 1.95, + "learning_rate": 5.794113224932191e-07, + "loss": 0.5854, + "step": 75968 + }, + { + "epoch": 1.95, + "learning_rate": 5.793862185952604e-07, + "loss": 0.6387, + "step": 75969 + }, + { + "epoch": 1.95, + "learning_rate": 5.79361115019346e-07, + "loss": 0.6235, + "step": 75970 + }, + { + "epoch": 1.95, + "learning_rate": 5.793360117654955e-07, + "loss": 0.5283, + "step": 75971 + }, + { + "epoch": 1.95, + "learning_rate": 5.793109088337285e-07, + "loss": 0.791, + "step": 75972 + }, + { + "epoch": 1.95, + "learning_rate": 5.792858062240631e-07, + "loss": 0.7412, + "step": 75973 + }, + { + "epoch": 1.95, + "learning_rate": 5.792607039365198e-07, + "loss": 0.7002, + "step": 75974 + }, + { + "epoch": 1.95, + "learning_rate": 5.792356019711169e-07, + "loss": 0.5908, + "step": 75975 + }, + { + "epoch": 1.95, + "learning_rate": 5.792105003278739e-07, + "loss": 0.5647, + "step": 75976 + }, + { + "epoch": 1.95, + "learning_rate": 5.791853990068101e-07, + "loss": 0.6191, + "step": 75977 + }, + { + "epoch": 1.95, + "learning_rate": 5.791602980079449e-07, + "loss": 0.7305, + "step": 75978 + }, + { + "epoch": 1.95, + "learning_rate": 5.791351973312971e-07, + "loss": 0.6621, + "step": 75979 + }, + { + "epoch": 1.95, + "learning_rate": 5.79110096976886e-07, + "loss": 0.4565, + "step": 75980 + }, + { + "epoch": 1.95, + "learning_rate": 5.790849969447311e-07, + "loss": 0.583, + "step": 75981 + }, + { + "epoch": 1.95, + "learning_rate": 5.790598972348518e-07, + "loss": 0.6809, + "step": 75982 + }, + { + "epoch": 1.95, + "learning_rate": 5.790347978472669e-07, + "loss": 0.6455, + "step": 75983 + }, + { + "epoch": 1.95, + "learning_rate": 5.790096987819954e-07, + "loss": 0.5952, + "step": 75984 + }, + { + "epoch": 1.95, + "learning_rate": 5.789846000390568e-07, + "loss": 0.6387, + "step": 75985 + }, + { + "epoch": 1.95, + "learning_rate": 5.789595016184708e-07, + "loss": 0.8271, + "step": 75986 + }, + { + "epoch": 1.95, + "learning_rate": 5.789344035202557e-07, + "loss": 0.5781, + "step": 75987 + }, + { + "epoch": 1.95, + "learning_rate": 5.789093057444311e-07, + "loss": 0.7031, + "step": 75988 + }, + { + "epoch": 1.95, + "learning_rate": 5.788842082910164e-07, + "loss": 0.5017, + "step": 75989 + }, + { + "epoch": 1.95, + "learning_rate": 5.78859111160031e-07, + "loss": 0.6836, + "step": 75990 + }, + { + "epoch": 1.95, + "learning_rate": 5.788340143514934e-07, + "loss": 0.709, + "step": 75991 + }, + { + "epoch": 1.95, + "learning_rate": 5.788089178654236e-07, + "loss": 0.6465, + "step": 75992 + }, + { + "epoch": 1.95, + "learning_rate": 5.787838217018401e-07, + "loss": 0.6753, + "step": 75993 + }, + { + "epoch": 1.95, + "learning_rate": 5.787587258607625e-07, + "loss": 0.6162, + "step": 75994 + }, + { + "epoch": 1.95, + "learning_rate": 5.787336303422103e-07, + "loss": 0.71, + "step": 75995 + }, + { + "epoch": 1.95, + "learning_rate": 5.78708535146202e-07, + "loss": 0.666, + "step": 75996 + }, + { + "epoch": 1.95, + "learning_rate": 5.786834402727572e-07, + "loss": 0.6282, + "step": 75997 + }, + { + "epoch": 1.95, + "learning_rate": 5.786583457218952e-07, + "loss": 0.6074, + "step": 75998 + }, + { + "epoch": 1.95, + "learning_rate": 5.786332514936355e-07, + "loss": 0.5522, + "step": 75999 + }, + { + "epoch": 1.95, + "learning_rate": 5.786081575879965e-07, + "loss": 0.6432, + "step": 76000 + }, + { + "epoch": 1.95, + "learning_rate": 5.78583064004998e-07, + "loss": 0.5576, + "step": 76001 + }, + { + "epoch": 1.95, + "learning_rate": 5.785579707446593e-07, + "loss": 0.7744, + "step": 76002 + }, + { + "epoch": 1.95, + "learning_rate": 5.785328778069993e-07, + "loss": 0.3103, + "step": 76003 + }, + { + "epoch": 1.95, + "learning_rate": 5.785077851920371e-07, + "loss": 0.6162, + "step": 76004 + }, + { + "epoch": 1.95, + "learning_rate": 5.784826928997921e-07, + "loss": 0.6401, + "step": 76005 + }, + { + "epoch": 1.95, + "learning_rate": 5.784576009302835e-07, + "loss": 0.6416, + "step": 76006 + }, + { + "epoch": 1.95, + "learning_rate": 5.784325092835309e-07, + "loss": 0.5818, + "step": 76007 + }, + { + "epoch": 1.95, + "learning_rate": 5.784074179595526e-07, + "loss": 0.7422, + "step": 76008 + }, + { + "epoch": 1.95, + "learning_rate": 5.783823269583685e-07, + "loss": 0.8398, + "step": 76009 + }, + { + "epoch": 1.95, + "learning_rate": 5.783572362799978e-07, + "loss": 0.7012, + "step": 76010 + }, + { + "epoch": 1.95, + "learning_rate": 5.783321459244597e-07, + "loss": 0.833, + "step": 76011 + }, + { + "epoch": 1.95, + "learning_rate": 5.783070558917736e-07, + "loss": 0.5537, + "step": 76012 + }, + { + "epoch": 1.95, + "learning_rate": 5.782819661819577e-07, + "loss": 0.5835, + "step": 76013 + }, + { + "epoch": 1.95, + "learning_rate": 5.78256876795032e-07, + "loss": 0.7754, + "step": 76014 + }, + { + "epoch": 1.95, + "learning_rate": 5.782317877310156e-07, + "loss": 0.6382, + "step": 76015 + }, + { + "epoch": 1.95, + "learning_rate": 5.782066989899281e-07, + "loss": 0.7256, + "step": 76016 + }, + { + "epoch": 1.95, + "learning_rate": 5.78181610571788e-07, + "loss": 0.4604, + "step": 76017 + }, + { + "epoch": 1.95, + "learning_rate": 5.781565224766149e-07, + "loss": 0.5903, + "step": 76018 + }, + { + "epoch": 1.95, + "learning_rate": 5.78131434704428e-07, + "loss": 0.562, + "step": 76019 + }, + { + "epoch": 1.95, + "learning_rate": 5.781063472552468e-07, + "loss": 0.4475, + "step": 76020 + }, + { + "epoch": 1.95, + "learning_rate": 5.780812601290896e-07, + "loss": 0.5044, + "step": 76021 + }, + { + "epoch": 1.95, + "learning_rate": 5.780561733259768e-07, + "loss": 0.6292, + "step": 76022 + }, + { + "epoch": 1.95, + "learning_rate": 5.780310868459265e-07, + "loss": 0.6616, + "step": 76023 + }, + { + "epoch": 1.95, + "learning_rate": 5.780060006889588e-07, + "loss": 0.5771, + "step": 76024 + }, + { + "epoch": 1.95, + "learning_rate": 5.779809148550921e-07, + "loss": 0.4622, + "step": 76025 + }, + { + "epoch": 1.95, + "learning_rate": 5.77955829344346e-07, + "loss": 0.54, + "step": 76026 + }, + { + "epoch": 1.95, + "learning_rate": 5.779307441567397e-07, + "loss": 0.4917, + "step": 76027 + }, + { + "epoch": 1.95, + "learning_rate": 5.779056592922929e-07, + "loss": 0.5771, + "step": 76028 + }, + { + "epoch": 1.95, + "learning_rate": 5.778805747510238e-07, + "loss": 0.5732, + "step": 76029 + }, + { + "epoch": 1.95, + "learning_rate": 5.778554905329522e-07, + "loss": 0.4766, + "step": 76030 + }, + { + "epoch": 1.95, + "learning_rate": 5.778304066380972e-07, + "loss": 0.708, + "step": 76031 + }, + { + "epoch": 1.95, + "learning_rate": 5.778053230664786e-07, + "loss": 0.5493, + "step": 76032 + }, + { + "epoch": 1.95, + "learning_rate": 5.777802398181148e-07, + "loss": 0.7202, + "step": 76033 + }, + { + "epoch": 1.95, + "learning_rate": 5.77755156893025e-07, + "loss": 0.4607, + "step": 76034 + }, + { + "epoch": 1.95, + "learning_rate": 5.777300742912288e-07, + "loss": 0.5284, + "step": 76035 + }, + { + "epoch": 1.95, + "learning_rate": 5.77704992012745e-07, + "loss": 0.5508, + "step": 76036 + }, + { + "epoch": 1.95, + "learning_rate": 5.776799100575936e-07, + "loss": 0.7363, + "step": 76037 + }, + { + "epoch": 1.95, + "learning_rate": 5.776548284257929e-07, + "loss": 0.5913, + "step": 76038 + }, + { + "epoch": 1.95, + "learning_rate": 5.776297471173626e-07, + "loss": 0.6455, + "step": 76039 + }, + { + "epoch": 1.95, + "learning_rate": 5.77604666132322e-07, + "loss": 0.5142, + "step": 76040 + }, + { + "epoch": 1.95, + "learning_rate": 5.775795854706896e-07, + "loss": 0.7041, + "step": 76041 + }, + { + "epoch": 1.95, + "learning_rate": 5.775545051324856e-07, + "loss": 0.875, + "step": 76042 + }, + { + "epoch": 1.95, + "learning_rate": 5.775294251177283e-07, + "loss": 0.6465, + "step": 76043 + }, + { + "epoch": 1.95, + "learning_rate": 5.775043454264373e-07, + "loss": 0.603, + "step": 76044 + }, + { + "epoch": 1.95, + "learning_rate": 5.774792660586322e-07, + "loss": 0.5283, + "step": 76045 + }, + { + "epoch": 1.95, + "learning_rate": 5.774541870143314e-07, + "loss": 0.6392, + "step": 76046 + }, + { + "epoch": 1.95, + "learning_rate": 5.774291082935545e-07, + "loss": 0.5762, + "step": 76047 + }, + { + "epoch": 1.95, + "learning_rate": 5.774040298963206e-07, + "loss": 0.687, + "step": 76048 + }, + { + "epoch": 1.95, + "learning_rate": 5.773789518226495e-07, + "loss": 0.5469, + "step": 76049 + }, + { + "epoch": 1.95, + "learning_rate": 5.773538740725594e-07, + "loss": 0.6611, + "step": 76050 + }, + { + "epoch": 1.95, + "learning_rate": 5.773287966460703e-07, + "loss": 0.8037, + "step": 76051 + }, + { + "epoch": 1.95, + "learning_rate": 5.773037195432011e-07, + "loss": 0.606, + "step": 76052 + }, + { + "epoch": 1.95, + "learning_rate": 5.772786427639709e-07, + "loss": 0.4766, + "step": 76053 + }, + { + "epoch": 1.95, + "learning_rate": 5.772535663083993e-07, + "loss": 0.7549, + "step": 76054 + }, + { + "epoch": 1.95, + "learning_rate": 5.772284901765048e-07, + "loss": 0.5293, + "step": 76055 + }, + { + "epoch": 1.95, + "learning_rate": 5.772034143683071e-07, + "loss": 0.5493, + "step": 76056 + }, + { + "epoch": 1.95, + "learning_rate": 5.771783388838256e-07, + "loss": 0.5288, + "step": 76057 + }, + { + "epoch": 1.95, + "learning_rate": 5.771532637230788e-07, + "loss": 0.6143, + "step": 76058 + }, + { + "epoch": 1.95, + "learning_rate": 5.771281888860864e-07, + "loss": 0.4795, + "step": 76059 + }, + { + "epoch": 1.95, + "learning_rate": 5.771031143728673e-07, + "loss": 0.5146, + "step": 76060 + }, + { + "epoch": 1.95, + "learning_rate": 5.770780401834414e-07, + "loss": 0.6221, + "step": 76061 + }, + { + "epoch": 1.95, + "learning_rate": 5.770529663178275e-07, + "loss": 0.6641, + "step": 76062 + }, + { + "epoch": 1.95, + "learning_rate": 5.770278927760443e-07, + "loss": 0.7578, + "step": 76063 + }, + { + "epoch": 1.95, + "learning_rate": 5.770028195581114e-07, + "loss": 0.5522, + "step": 76064 + }, + { + "epoch": 1.95, + "learning_rate": 5.769777466640478e-07, + "loss": 0.5527, + "step": 76065 + }, + { + "epoch": 1.95, + "learning_rate": 5.769526740938734e-07, + "loss": 0.6655, + "step": 76066 + }, + { + "epoch": 1.95, + "learning_rate": 5.769276018476065e-07, + "loss": 0.6279, + "step": 76067 + }, + { + "epoch": 1.95, + "learning_rate": 5.769025299252667e-07, + "loss": 0.4587, + "step": 76068 + }, + { + "epoch": 1.95, + "learning_rate": 5.768774583268732e-07, + "loss": 0.708, + "step": 76069 + }, + { + "epoch": 1.95, + "learning_rate": 5.768523870524454e-07, + "loss": 0.6289, + "step": 76070 + }, + { + "epoch": 1.95, + "learning_rate": 5.76827316102002e-07, + "loss": 0.4746, + "step": 76071 + }, + { + "epoch": 1.95, + "learning_rate": 5.768022454755629e-07, + "loss": 0.5112, + "step": 76072 + }, + { + "epoch": 1.95, + "learning_rate": 5.767771751731464e-07, + "loss": 0.5986, + "step": 76073 + }, + { + "epoch": 1.95, + "learning_rate": 5.767521051947721e-07, + "loss": 0.7373, + "step": 76074 + }, + { + "epoch": 1.95, + "learning_rate": 5.767270355404599e-07, + "loss": 0.5391, + "step": 76075 + }, + { + "epoch": 1.95, + "learning_rate": 5.767019662102277e-07, + "loss": 0.5317, + "step": 76076 + }, + { + "epoch": 1.95, + "learning_rate": 5.766768972040954e-07, + "loss": 0.6067, + "step": 76077 + }, + { + "epoch": 1.95, + "learning_rate": 5.766518285220825e-07, + "loss": 0.6807, + "step": 76078 + }, + { + "epoch": 1.95, + "learning_rate": 5.766267601642075e-07, + "loss": 0.7178, + "step": 76079 + }, + { + "epoch": 1.95, + "learning_rate": 5.766016921304899e-07, + "loss": 0.4617, + "step": 76080 + }, + { + "epoch": 1.95, + "learning_rate": 5.765766244209489e-07, + "loss": 0.5818, + "step": 76081 + }, + { + "epoch": 1.95, + "learning_rate": 5.765515570356041e-07, + "loss": 0.5383, + "step": 76082 + }, + { + "epoch": 1.95, + "learning_rate": 5.765264899744744e-07, + "loss": 0.7178, + "step": 76083 + }, + { + "epoch": 1.95, + "learning_rate": 5.765014232375784e-07, + "loss": 0.6587, + "step": 76084 + }, + { + "epoch": 1.95, + "learning_rate": 5.764763568249358e-07, + "loss": 0.6743, + "step": 76085 + }, + { + "epoch": 1.95, + "learning_rate": 5.764512907365658e-07, + "loss": 0.7744, + "step": 76086 + }, + { + "epoch": 1.95, + "learning_rate": 5.764262249724881e-07, + "loss": 0.5315, + "step": 76087 + }, + { + "epoch": 1.95, + "learning_rate": 5.764011595327207e-07, + "loss": 0.5547, + "step": 76088 + }, + { + "epoch": 1.95, + "learning_rate": 5.763760944172835e-07, + "loss": 0.873, + "step": 76089 + }, + { + "epoch": 1.95, + "learning_rate": 5.763510296261957e-07, + "loss": 0.5581, + "step": 76090 + }, + { + "epoch": 1.95, + "learning_rate": 5.76325965159477e-07, + "loss": 0.5757, + "step": 76091 + }, + { + "epoch": 1.95, + "learning_rate": 5.763009010171458e-07, + "loss": 0.7861, + "step": 76092 + }, + { + "epoch": 1.95, + "learning_rate": 5.762758371992213e-07, + "loss": 0.6978, + "step": 76093 + }, + { + "epoch": 1.95, + "learning_rate": 5.762507737057227e-07, + "loss": 0.52, + "step": 76094 + }, + { + "epoch": 1.95, + "learning_rate": 5.7622571053667e-07, + "loss": 0.5903, + "step": 76095 + }, + { + "epoch": 1.95, + "learning_rate": 5.762006476920813e-07, + "loss": 0.5857, + "step": 76096 + }, + { + "epoch": 1.95, + "learning_rate": 5.761755851719763e-07, + "loss": 0.4719, + "step": 76097 + }, + { + "epoch": 1.95, + "learning_rate": 5.761505229763741e-07, + "loss": 0.7715, + "step": 76098 + }, + { + "epoch": 1.95, + "learning_rate": 5.761254611052944e-07, + "loss": 0.6475, + "step": 76099 + }, + { + "epoch": 1.95, + "learning_rate": 5.761003995587556e-07, + "loss": 0.5776, + "step": 76100 + }, + { + "epoch": 1.95, + "learning_rate": 5.760753383367771e-07, + "loss": 0.6997, + "step": 76101 + }, + { + "epoch": 1.95, + "learning_rate": 5.760502774393788e-07, + "loss": 0.6641, + "step": 76102 + }, + { + "epoch": 1.95, + "learning_rate": 5.760252168665787e-07, + "loss": 0.5449, + "step": 76103 + }, + { + "epoch": 1.95, + "learning_rate": 5.760001566183972e-07, + "loss": 0.5278, + "step": 76104 + }, + { + "epoch": 1.95, + "learning_rate": 5.759750966948523e-07, + "loss": 0.5149, + "step": 76105 + }, + { + "epoch": 1.95, + "learning_rate": 5.759500370959639e-07, + "loss": 0.6753, + "step": 76106 + }, + { + "epoch": 1.95, + "learning_rate": 5.75924977821751e-07, + "loss": 0.5439, + "step": 76107 + }, + { + "epoch": 1.95, + "learning_rate": 5.758999188722333e-07, + "loss": 0.6709, + "step": 76108 + }, + { + "epoch": 1.95, + "learning_rate": 5.75874860247429e-07, + "loss": 0.6543, + "step": 76109 + }, + { + "epoch": 1.95, + "learning_rate": 5.758498019473579e-07, + "loss": 0.5518, + "step": 76110 + }, + { + "epoch": 1.95, + "learning_rate": 5.758247439720392e-07, + "loss": 0.6919, + "step": 76111 + }, + { + "epoch": 1.95, + "learning_rate": 5.757996863214927e-07, + "loss": 0.7402, + "step": 76112 + }, + { + "epoch": 1.95, + "learning_rate": 5.757746289957362e-07, + "loss": 0.583, + "step": 76113 + }, + { + "epoch": 1.95, + "learning_rate": 5.757495719947894e-07, + "loss": 0.6953, + "step": 76114 + }, + { + "epoch": 1.95, + "learning_rate": 5.757245153186716e-07, + "loss": 0.5818, + "step": 76115 + }, + { + "epoch": 1.95, + "learning_rate": 5.756994589674025e-07, + "loss": 0.6973, + "step": 76116 + }, + { + "epoch": 1.95, + "learning_rate": 5.756744029410004e-07, + "loss": 0.6514, + "step": 76117 + }, + { + "epoch": 1.95, + "learning_rate": 5.75649347239485e-07, + "loss": 0.5527, + "step": 76118 + }, + { + "epoch": 1.95, + "learning_rate": 5.756242918628753e-07, + "loss": 0.6611, + "step": 76119 + }, + { + "epoch": 1.95, + "learning_rate": 5.755992368111911e-07, + "loss": 0.5676, + "step": 76120 + }, + { + "epoch": 1.95, + "learning_rate": 5.755741820844504e-07, + "loss": 0.6475, + "step": 76121 + }, + { + "epoch": 1.95, + "learning_rate": 5.755491276826736e-07, + "loss": 0.6355, + "step": 76122 + }, + { + "epoch": 1.95, + "learning_rate": 5.755240736058789e-07, + "loss": 0.7959, + "step": 76123 + }, + { + "epoch": 1.95, + "learning_rate": 5.754990198540857e-07, + "loss": 0.5996, + "step": 76124 + }, + { + "epoch": 1.95, + "learning_rate": 5.754739664273141e-07, + "loss": 0.5728, + "step": 76125 + }, + { + "epoch": 1.95, + "learning_rate": 5.75448913325582e-07, + "loss": 0.6309, + "step": 76126 + }, + { + "epoch": 1.95, + "learning_rate": 5.754238605489091e-07, + "loss": 0.6226, + "step": 76127 + }, + { + "epoch": 1.95, + "learning_rate": 5.753988080973147e-07, + "loss": 0.6792, + "step": 76128 + }, + { + "epoch": 1.95, + "learning_rate": 5.753737559708182e-07, + "loss": 0.5693, + "step": 76129 + }, + { + "epoch": 1.95, + "learning_rate": 5.753487041694382e-07, + "loss": 0.7744, + "step": 76130 + }, + { + "epoch": 1.95, + "learning_rate": 5.753236526931942e-07, + "loss": 0.4854, + "step": 76131 + }, + { + "epoch": 1.95, + "learning_rate": 5.752986015421058e-07, + "loss": 0.6787, + "step": 76132 + }, + { + "epoch": 1.95, + "learning_rate": 5.752735507161917e-07, + "loss": 0.7236, + "step": 76133 + }, + { + "epoch": 1.95, + "learning_rate": 5.752485002154705e-07, + "loss": 0.4492, + "step": 76134 + }, + { + "epoch": 1.95, + "learning_rate": 5.752234500399622e-07, + "loss": 0.6025, + "step": 76135 + }, + { + "epoch": 1.95, + "learning_rate": 5.751984001896858e-07, + "loss": 0.7598, + "step": 76136 + }, + { + "epoch": 1.95, + "learning_rate": 5.751733506646607e-07, + "loss": 0.562, + "step": 76137 + }, + { + "epoch": 1.95, + "learning_rate": 5.751483014649056e-07, + "loss": 0.6963, + "step": 76138 + }, + { + "epoch": 1.95, + "learning_rate": 5.751232525904398e-07, + "loss": 0.6719, + "step": 76139 + }, + { + "epoch": 1.95, + "learning_rate": 5.750982040412826e-07, + "loss": 0.5342, + "step": 76140 + }, + { + "epoch": 1.95, + "learning_rate": 5.750731558174535e-07, + "loss": 0.6758, + "step": 76141 + }, + { + "epoch": 1.95, + "learning_rate": 5.750481079189715e-07, + "loss": 0.6455, + "step": 76142 + }, + { + "epoch": 1.95, + "learning_rate": 5.750230603458552e-07, + "loss": 0.4878, + "step": 76143 + }, + { + "epoch": 1.95, + "learning_rate": 5.749980130981241e-07, + "loss": 0.6313, + "step": 76144 + }, + { + "epoch": 1.95, + "learning_rate": 5.749729661757976e-07, + "loss": 0.5903, + "step": 76145 + }, + { + "epoch": 1.95, + "learning_rate": 5.749479195788951e-07, + "loss": 0.584, + "step": 76146 + }, + { + "epoch": 1.95, + "learning_rate": 5.749228733074349e-07, + "loss": 0.6641, + "step": 76147 + }, + { + "epoch": 1.95, + "learning_rate": 5.748978273614368e-07, + "loss": 0.6484, + "step": 76148 + }, + { + "epoch": 1.95, + "learning_rate": 5.748727817409205e-07, + "loss": 0.7598, + "step": 76149 + }, + { + "epoch": 1.95, + "learning_rate": 5.748477364459039e-07, + "loss": 0.4956, + "step": 76150 + }, + { + "epoch": 1.95, + "learning_rate": 5.748226914764069e-07, + "loss": 0.7065, + "step": 76151 + }, + { + "epoch": 1.95, + "learning_rate": 5.747976468324491e-07, + "loss": 0.6758, + "step": 76152 + }, + { + "epoch": 1.95, + "learning_rate": 5.747726025140486e-07, + "loss": 0.6758, + "step": 76153 + }, + { + "epoch": 1.95, + "learning_rate": 5.747475585212258e-07, + "loss": 0.6416, + "step": 76154 + }, + { + "epoch": 1.95, + "learning_rate": 5.747225148539987e-07, + "loss": 0.7793, + "step": 76155 + }, + { + "epoch": 1.95, + "learning_rate": 5.74697471512387e-07, + "loss": 0.5332, + "step": 76156 + }, + { + "epoch": 1.95, + "learning_rate": 5.746724284964099e-07, + "loss": 0.5193, + "step": 76157 + }, + { + "epoch": 1.95, + "learning_rate": 5.74647385806087e-07, + "loss": 0.6753, + "step": 76158 + }, + { + "epoch": 1.95, + "learning_rate": 5.746223434414366e-07, + "loss": 0.4722, + "step": 76159 + }, + { + "epoch": 1.95, + "learning_rate": 5.745973014024784e-07, + "loss": 0.7178, + "step": 76160 + }, + { + "epoch": 1.95, + "learning_rate": 5.745722596892315e-07, + "loss": 0.6372, + "step": 76161 + }, + { + "epoch": 1.95, + "learning_rate": 5.745472183017154e-07, + "loss": 0.7192, + "step": 76162 + }, + { + "epoch": 1.95, + "learning_rate": 5.745221772399489e-07, + "loss": 0.6602, + "step": 76163 + }, + { + "epoch": 1.95, + "learning_rate": 5.744971365039508e-07, + "loss": 0.7637, + "step": 76164 + }, + { + "epoch": 1.95, + "learning_rate": 5.744720960937407e-07, + "loss": 0.2976, + "step": 76165 + }, + { + "epoch": 1.95, + "learning_rate": 5.744470560093382e-07, + "loss": 0.5718, + "step": 76166 + }, + { + "epoch": 1.95, + "learning_rate": 5.744220162507615e-07, + "loss": 0.7695, + "step": 76167 + }, + { + "epoch": 1.95, + "learning_rate": 5.743969768180304e-07, + "loss": 0.5923, + "step": 76168 + }, + { + "epoch": 1.95, + "learning_rate": 5.74371937711164e-07, + "loss": 0.623, + "step": 76169 + }, + { + "epoch": 1.95, + "learning_rate": 5.743468989301818e-07, + "loss": 0.6133, + "step": 76170 + }, + { + "epoch": 1.95, + "learning_rate": 5.743218604751021e-07, + "loss": 0.5854, + "step": 76171 + }, + { + "epoch": 1.95, + "learning_rate": 5.742968223459452e-07, + "loss": 0.5396, + "step": 76172 + }, + { + "epoch": 1.95, + "learning_rate": 5.742717845427289e-07, + "loss": 0.6348, + "step": 76173 + }, + { + "epoch": 1.95, + "learning_rate": 5.742467470654735e-07, + "loss": 0.7871, + "step": 76174 + }, + { + "epoch": 1.95, + "learning_rate": 5.742217099141979e-07, + "loss": 0.6943, + "step": 76175 + }, + { + "epoch": 1.95, + "learning_rate": 5.741966730889209e-07, + "loss": 0.5601, + "step": 76176 + }, + { + "epoch": 1.95, + "learning_rate": 5.74171636589662e-07, + "loss": 0.6426, + "step": 76177 + }, + { + "epoch": 1.95, + "learning_rate": 5.741466004164401e-07, + "loss": 0.7188, + "step": 76178 + }, + { + "epoch": 1.95, + "learning_rate": 5.741215645692752e-07, + "loss": 0.771, + "step": 76179 + }, + { + "epoch": 1.95, + "learning_rate": 5.740965290481852e-07, + "loss": 0.6396, + "step": 76180 + }, + { + "epoch": 1.95, + "learning_rate": 5.740714938531901e-07, + "loss": 0.564, + "step": 76181 + }, + { + "epoch": 1.95, + "learning_rate": 5.740464589843091e-07, + "loss": 0.6851, + "step": 76182 + }, + { + "epoch": 1.95, + "learning_rate": 5.740214244415613e-07, + "loss": 0.7461, + "step": 76183 + }, + { + "epoch": 1.95, + "learning_rate": 5.739963902249651e-07, + "loss": 0.7002, + "step": 76184 + }, + { + "epoch": 1.95, + "learning_rate": 5.739713563345405e-07, + "loss": 0.6328, + "step": 76185 + }, + { + "epoch": 1.95, + "learning_rate": 5.739463227703063e-07, + "loss": 0.6841, + "step": 76186 + }, + { + "epoch": 1.95, + "learning_rate": 5.739212895322822e-07, + "loss": 0.8096, + "step": 76187 + }, + { + "epoch": 1.95, + "learning_rate": 5.738962566204868e-07, + "loss": 0.7271, + "step": 76188 + }, + { + "epoch": 1.95, + "learning_rate": 5.738712240349393e-07, + "loss": 0.7236, + "step": 76189 + }, + { + "epoch": 1.95, + "learning_rate": 5.73846191775659e-07, + "loss": 0.5615, + "step": 76190 + }, + { + "epoch": 1.95, + "learning_rate": 5.738211598426654e-07, + "loss": 0.6885, + "step": 76191 + }, + { + "epoch": 1.95, + "learning_rate": 5.737961282359773e-07, + "loss": 0.5752, + "step": 76192 + }, + { + "epoch": 1.95, + "learning_rate": 5.737710969556138e-07, + "loss": 0.5923, + "step": 76193 + }, + { + "epoch": 1.95, + "learning_rate": 5.737460660015938e-07, + "loss": 0.6621, + "step": 76194 + }, + { + "epoch": 1.95, + "learning_rate": 5.737210353739372e-07, + "loss": 0.6602, + "step": 76195 + }, + { + "epoch": 1.95, + "learning_rate": 5.73696005072663e-07, + "loss": 0.6836, + "step": 76196 + }, + { + "epoch": 1.95, + "learning_rate": 5.736709750977897e-07, + "loss": 0.7295, + "step": 76197 + }, + { + "epoch": 1.95, + "learning_rate": 5.736459454493371e-07, + "loss": 0.6128, + "step": 76198 + }, + { + "epoch": 1.95, + "learning_rate": 5.736209161273242e-07, + "loss": 0.7056, + "step": 76199 + }, + { + "epoch": 1.95, + "learning_rate": 5.735958871317703e-07, + "loss": 0.6729, + "step": 76200 + }, + { + "epoch": 1.95, + "learning_rate": 5.735708584626942e-07, + "loss": 0.5762, + "step": 76201 + }, + { + "epoch": 1.95, + "learning_rate": 5.735458301201157e-07, + "loss": 0.6216, + "step": 76202 + }, + { + "epoch": 1.95, + "learning_rate": 5.735208021040532e-07, + "loss": 0.593, + "step": 76203 + }, + { + "epoch": 1.95, + "learning_rate": 5.734957744145266e-07, + "loss": 0.5786, + "step": 76204 + }, + { + "epoch": 1.95, + "learning_rate": 5.734707470515542e-07, + "loss": 0.6484, + "step": 76205 + }, + { + "epoch": 1.95, + "learning_rate": 5.734457200151557e-07, + "loss": 0.6963, + "step": 76206 + }, + { + "epoch": 1.95, + "learning_rate": 5.734206933053501e-07, + "loss": 0.7461, + "step": 76207 + }, + { + "epoch": 1.95, + "learning_rate": 5.733956669221571e-07, + "loss": 0.6299, + "step": 76208 + }, + { + "epoch": 1.95, + "learning_rate": 5.73370640865595e-07, + "loss": 0.5834, + "step": 76209 + }, + { + "epoch": 1.95, + "learning_rate": 5.733456151356835e-07, + "loss": 0.6162, + "step": 76210 + }, + { + "epoch": 1.95, + "learning_rate": 5.733205897324416e-07, + "loss": 0.6436, + "step": 76211 + }, + { + "epoch": 1.95, + "learning_rate": 5.732955646558888e-07, + "loss": 0.709, + "step": 76212 + }, + { + "epoch": 1.95, + "learning_rate": 5.73270539906044e-07, + "loss": 0.5908, + "step": 76213 + }, + { + "epoch": 1.95, + "learning_rate": 5.732455154829261e-07, + "loss": 0.6548, + "step": 76214 + }, + { + "epoch": 1.95, + "learning_rate": 5.732204913865544e-07, + "loss": 0.7578, + "step": 76215 + }, + { + "epoch": 1.95, + "learning_rate": 5.731954676169479e-07, + "loss": 0.6338, + "step": 76216 + }, + { + "epoch": 1.95, + "learning_rate": 5.731704441741267e-07, + "loss": 0.6572, + "step": 76217 + }, + { + "epoch": 1.95, + "learning_rate": 5.731454210581088e-07, + "loss": 0.585, + "step": 76218 + }, + { + "epoch": 1.95, + "learning_rate": 5.731203982689137e-07, + "loss": 0.5369, + "step": 76219 + }, + { + "epoch": 1.95, + "learning_rate": 5.730953758065613e-07, + "loss": 0.5271, + "step": 76220 + }, + { + "epoch": 1.95, + "learning_rate": 5.730703536710695e-07, + "loss": 0.7178, + "step": 76221 + }, + { + "epoch": 1.95, + "learning_rate": 5.730453318624587e-07, + "loss": 0.6836, + "step": 76222 + }, + { + "epoch": 1.95, + "learning_rate": 5.73020310380747e-07, + "loss": 0.624, + "step": 76223 + }, + { + "epoch": 1.95, + "learning_rate": 5.72995289225954e-07, + "loss": 0.6267, + "step": 76224 + }, + { + "epoch": 1.95, + "learning_rate": 5.729702683980992e-07, + "loss": 0.4958, + "step": 76225 + }, + { + "epoch": 1.95, + "learning_rate": 5.729452478972011e-07, + "loss": 0.5366, + "step": 76226 + }, + { + "epoch": 1.95, + "learning_rate": 5.729202277232792e-07, + "loss": 0.6787, + "step": 76227 + }, + { + "epoch": 1.95, + "learning_rate": 5.728952078763526e-07, + "loss": 0.6895, + "step": 76228 + }, + { + "epoch": 1.95, + "learning_rate": 5.728701883564409e-07, + "loss": 0.46, + "step": 76229 + }, + { + "epoch": 1.95, + "learning_rate": 5.728451691635625e-07, + "loss": 0.791, + "step": 76230 + }, + { + "epoch": 1.95, + "learning_rate": 5.728201502977369e-07, + "loss": 0.6538, + "step": 76231 + }, + { + "epoch": 1.95, + "learning_rate": 5.727951317589836e-07, + "loss": 0.5542, + "step": 76232 + }, + { + "epoch": 1.95, + "learning_rate": 5.727701135473211e-07, + "loss": 0.6592, + "step": 76233 + }, + { + "epoch": 1.95, + "learning_rate": 5.727450956627693e-07, + "loss": 0.5845, + "step": 76234 + }, + { + "epoch": 1.95, + "learning_rate": 5.727200781053465e-07, + "loss": 0.6851, + "step": 76235 + }, + { + "epoch": 1.95, + "learning_rate": 5.726950608750723e-07, + "loss": 0.6353, + "step": 76236 + }, + { + "epoch": 1.95, + "learning_rate": 5.726700439719659e-07, + "loss": 0.4795, + "step": 76237 + }, + { + "epoch": 1.95, + "learning_rate": 5.726450273960467e-07, + "loss": 0.6553, + "step": 76238 + }, + { + "epoch": 1.95, + "learning_rate": 5.726200111473331e-07, + "loss": 0.7129, + "step": 76239 + }, + { + "epoch": 1.95, + "learning_rate": 5.725949952258449e-07, + "loss": 0.9033, + "step": 76240 + }, + { + "epoch": 1.95, + "learning_rate": 5.725699796316012e-07, + "loss": 0.5867, + "step": 76241 + }, + { + "epoch": 1.95, + "learning_rate": 5.725449643646212e-07, + "loss": 0.4976, + "step": 76242 + }, + { + "epoch": 1.95, + "learning_rate": 5.725199494249236e-07, + "loss": 0.5566, + "step": 76243 + }, + { + "epoch": 1.95, + "learning_rate": 5.724949348125275e-07, + "loss": 0.5703, + "step": 76244 + }, + { + "epoch": 1.95, + "learning_rate": 5.724699205274526e-07, + "loss": 0.7119, + "step": 76245 + }, + { + "epoch": 1.95, + "learning_rate": 5.724449065697181e-07, + "loss": 0.4985, + "step": 76246 + }, + { + "epoch": 1.95, + "learning_rate": 5.724198929393425e-07, + "loss": 0.4556, + "step": 76247 + }, + { + "epoch": 1.95, + "learning_rate": 5.723948796363453e-07, + "loss": 0.7021, + "step": 76248 + }, + { + "epoch": 1.95, + "learning_rate": 5.723698666607457e-07, + "loss": 0.6787, + "step": 76249 + }, + { + "epoch": 1.95, + "learning_rate": 5.723448540125633e-07, + "loss": 0.7012, + "step": 76250 + }, + { + "epoch": 1.95, + "learning_rate": 5.723198416918168e-07, + "loss": 0.4834, + "step": 76251 + }, + { + "epoch": 1.95, + "learning_rate": 5.722948296985249e-07, + "loss": 0.7607, + "step": 76252 + }, + { + "epoch": 1.95, + "learning_rate": 5.72269818032707e-07, + "loss": 0.7354, + "step": 76253 + }, + { + "epoch": 1.95, + "learning_rate": 5.722448066943827e-07, + "loss": 0.707, + "step": 76254 + }, + { + "epoch": 1.95, + "learning_rate": 5.722197956835712e-07, + "loss": 0.624, + "step": 76255 + }, + { + "epoch": 1.95, + "learning_rate": 5.721947850002909e-07, + "loss": 0.3051, + "step": 76256 + }, + { + "epoch": 1.95, + "learning_rate": 5.721697746445613e-07, + "loss": 0.5493, + "step": 76257 + }, + { + "epoch": 1.95, + "learning_rate": 5.721447646164021e-07, + "loss": 0.4824, + "step": 76258 + }, + { + "epoch": 1.95, + "learning_rate": 5.721197549158317e-07, + "loss": 0.708, + "step": 76259 + }, + { + "epoch": 1.95, + "learning_rate": 5.720947455428693e-07, + "loss": 0.7627, + "step": 76260 + }, + { + "epoch": 1.95, + "learning_rate": 5.720697364975349e-07, + "loss": 0.6396, + "step": 76261 + }, + { + "epoch": 1.95, + "learning_rate": 5.720447277798464e-07, + "loss": 0.6328, + "step": 76262 + }, + { + "epoch": 1.95, + "learning_rate": 5.720197193898242e-07, + "loss": 0.4656, + "step": 76263 + }, + { + "epoch": 1.95, + "learning_rate": 5.719947113274863e-07, + "loss": 0.6162, + "step": 76264 + }, + { + "epoch": 1.95, + "learning_rate": 5.719697035928523e-07, + "loss": 0.5586, + "step": 76265 + }, + { + "epoch": 1.95, + "learning_rate": 5.719446961859415e-07, + "loss": 0.541, + "step": 76266 + }, + { + "epoch": 1.95, + "learning_rate": 5.719196891067734e-07, + "loss": 0.514, + "step": 76267 + }, + { + "epoch": 1.95, + "learning_rate": 5.718946823553663e-07, + "loss": 0.6982, + "step": 76268 + }, + { + "epoch": 1.95, + "learning_rate": 5.718696759317398e-07, + "loss": 0.4802, + "step": 76269 + }, + { + "epoch": 1.95, + "learning_rate": 5.718446698359129e-07, + "loss": 0.6543, + "step": 76270 + }, + { + "epoch": 1.95, + "learning_rate": 5.718196640679054e-07, + "loss": 0.5066, + "step": 76271 + }, + { + "epoch": 1.95, + "learning_rate": 5.717946586277357e-07, + "loss": 0.6855, + "step": 76272 + }, + { + "epoch": 1.95, + "learning_rate": 5.717696535154228e-07, + "loss": 0.519, + "step": 76273 + }, + { + "epoch": 1.95, + "learning_rate": 5.717446487309863e-07, + "loss": 0.5811, + "step": 76274 + }, + { + "epoch": 1.95, + "learning_rate": 5.717196442744454e-07, + "loss": 0.5303, + "step": 76275 + }, + { + "epoch": 1.95, + "learning_rate": 5.71694640145819e-07, + "loss": 0.8125, + "step": 76276 + }, + { + "epoch": 1.96, + "learning_rate": 5.716696363451262e-07, + "loss": 0.4849, + "step": 76277 + }, + { + "epoch": 1.96, + "learning_rate": 5.716446328723861e-07, + "loss": 0.4553, + "step": 76278 + }, + { + "epoch": 1.96, + "learning_rate": 5.716196297276185e-07, + "loss": 0.6943, + "step": 76279 + }, + { + "epoch": 1.96, + "learning_rate": 5.715946269108416e-07, + "loss": 0.6885, + "step": 76280 + }, + { + "epoch": 1.96, + "learning_rate": 5.715696244220754e-07, + "loss": 0.5811, + "step": 76281 + }, + { + "epoch": 1.96, + "learning_rate": 5.715446222613384e-07, + "loss": 0.4639, + "step": 76282 + }, + { + "epoch": 1.96, + "learning_rate": 5.715196204286499e-07, + "loss": 0.627, + "step": 76283 + }, + { + "epoch": 1.96, + "learning_rate": 5.714946189240295e-07, + "loss": 0.6504, + "step": 76284 + }, + { + "epoch": 1.96, + "learning_rate": 5.714696177474956e-07, + "loss": 0.5247, + "step": 76285 + }, + { + "epoch": 1.96, + "learning_rate": 5.714446168990677e-07, + "loss": 0.665, + "step": 76286 + }, + { + "epoch": 1.96, + "learning_rate": 5.714196163787648e-07, + "loss": 0.5455, + "step": 76287 + }, + { + "epoch": 1.96, + "learning_rate": 5.713946161866068e-07, + "loss": 0.7598, + "step": 76288 + }, + { + "epoch": 1.96, + "learning_rate": 5.713696163226117e-07, + "loss": 0.45, + "step": 76289 + }, + { + "epoch": 1.96, + "learning_rate": 5.713446167867993e-07, + "loss": 0.5854, + "step": 76290 + }, + { + "epoch": 1.96, + "learning_rate": 5.713196175791889e-07, + "loss": 0.7061, + "step": 76291 + }, + { + "epoch": 1.96, + "learning_rate": 5.712946186997993e-07, + "loss": 0.5183, + "step": 76292 + }, + { + "epoch": 1.96, + "learning_rate": 5.712696201486496e-07, + "loss": 0.6543, + "step": 76293 + }, + { + "epoch": 1.96, + "learning_rate": 5.712446219257587e-07, + "loss": 0.5669, + "step": 76294 + }, + { + "epoch": 1.96, + "learning_rate": 5.712196240311462e-07, + "loss": 0.75, + "step": 76295 + }, + { + "epoch": 1.96, + "learning_rate": 5.711946264648316e-07, + "loss": 0.6064, + "step": 76296 + }, + { + "epoch": 1.96, + "learning_rate": 5.711696292268331e-07, + "loss": 0.6953, + "step": 76297 + }, + { + "epoch": 1.96, + "learning_rate": 5.711446323171703e-07, + "loss": 0.6816, + "step": 76298 + }, + { + "epoch": 1.96, + "learning_rate": 5.711196357358623e-07, + "loss": 0.575, + "step": 76299 + }, + { + "epoch": 1.96, + "learning_rate": 5.710946394829288e-07, + "loss": 0.6519, + "step": 76300 + }, + { + "epoch": 1.96, + "learning_rate": 5.710696435583883e-07, + "loss": 0.7383, + "step": 76301 + }, + { + "epoch": 1.96, + "learning_rate": 5.710446479622597e-07, + "loss": 0.6345, + "step": 76302 + }, + { + "epoch": 1.96, + "learning_rate": 5.710196526945623e-07, + "loss": 0.3068, + "step": 76303 + }, + { + "epoch": 1.96, + "learning_rate": 5.709946577553157e-07, + "loss": 0.536, + "step": 76304 + }, + { + "epoch": 1.96, + "learning_rate": 5.709696631445391e-07, + "loss": 0.6631, + "step": 76305 + }, + { + "epoch": 1.96, + "learning_rate": 5.709446688622508e-07, + "loss": 0.6782, + "step": 76306 + }, + { + "epoch": 1.96, + "learning_rate": 5.709196749084705e-07, + "loss": 0.5273, + "step": 76307 + }, + { + "epoch": 1.96, + "learning_rate": 5.708946812832172e-07, + "loss": 0.6582, + "step": 76308 + }, + { + "epoch": 1.96, + "learning_rate": 5.708696879865107e-07, + "loss": 0.7144, + "step": 76309 + }, + { + "epoch": 1.96, + "learning_rate": 5.70844695018369e-07, + "loss": 0.5322, + "step": 76310 + }, + { + "epoch": 1.96, + "learning_rate": 5.708197023788122e-07, + "loss": 0.7061, + "step": 76311 + }, + { + "epoch": 1.96, + "learning_rate": 5.707947100678585e-07, + "loss": 0.6738, + "step": 76312 + }, + { + "epoch": 1.96, + "learning_rate": 5.707697180855283e-07, + "loss": 0.6582, + "step": 76313 + }, + { + "epoch": 1.96, + "learning_rate": 5.707447264318392e-07, + "loss": 0.5322, + "step": 76314 + }, + { + "epoch": 1.96, + "learning_rate": 5.707197351068114e-07, + "loss": 0.4272, + "step": 76315 + }, + { + "epoch": 1.96, + "learning_rate": 5.706947441104636e-07, + "loss": 0.6274, + "step": 76316 + }, + { + "epoch": 1.96, + "learning_rate": 5.706697534428156e-07, + "loss": 0.6123, + "step": 76317 + }, + { + "epoch": 1.96, + "learning_rate": 5.706447631038856e-07, + "loss": 0.6289, + "step": 76318 + }, + { + "epoch": 1.96, + "learning_rate": 5.70619773093693e-07, + "loss": 0.6743, + "step": 76319 + }, + { + "epoch": 1.96, + "learning_rate": 5.705947834122573e-07, + "loss": 0.707, + "step": 76320 + }, + { + "epoch": 1.96, + "learning_rate": 5.705697940595978e-07, + "loss": 0.6172, + "step": 76321 + }, + { + "epoch": 1.96, + "learning_rate": 5.705448050357333e-07, + "loss": 0.4956, + "step": 76322 + }, + { + "epoch": 1.96, + "learning_rate": 5.705198163406823e-07, + "loss": 0.5723, + "step": 76323 + }, + { + "epoch": 1.96, + "learning_rate": 5.704948279744648e-07, + "loss": 0.5889, + "step": 76324 + }, + { + "epoch": 1.96, + "learning_rate": 5.704698399370995e-07, + "loss": 0.7798, + "step": 76325 + }, + { + "epoch": 1.96, + "learning_rate": 5.704448522286061e-07, + "loss": 0.4175, + "step": 76326 + }, + { + "epoch": 1.96, + "learning_rate": 5.704198648490029e-07, + "loss": 0.7588, + "step": 76327 + }, + { + "epoch": 1.96, + "learning_rate": 5.703948777983095e-07, + "loss": 0.6611, + "step": 76328 + }, + { + "epoch": 1.96, + "learning_rate": 5.703698910765453e-07, + "loss": 0.4756, + "step": 76329 + }, + { + "epoch": 1.96, + "learning_rate": 5.703449046837288e-07, + "loss": 0.7891, + "step": 76330 + }, + { + "epoch": 1.96, + "learning_rate": 5.703199186198799e-07, + "loss": 0.6123, + "step": 76331 + }, + { + "epoch": 1.96, + "learning_rate": 5.702949328850169e-07, + "loss": 0.5437, + "step": 76332 + }, + { + "epoch": 1.96, + "learning_rate": 5.702699474791592e-07, + "loss": 0.5449, + "step": 76333 + }, + { + "epoch": 1.96, + "learning_rate": 5.702449624023265e-07, + "loss": 0.7393, + "step": 76334 + }, + { + "epoch": 1.96, + "learning_rate": 5.702199776545371e-07, + "loss": 0.5288, + "step": 76335 + }, + { + "epoch": 1.96, + "learning_rate": 5.701949932358105e-07, + "loss": 0.4708, + "step": 76336 + }, + { + "epoch": 1.96, + "learning_rate": 5.701700091461657e-07, + "loss": 0.6641, + "step": 76337 + }, + { + "epoch": 1.96, + "learning_rate": 5.701450253856225e-07, + "loss": 0.6562, + "step": 76338 + }, + { + "epoch": 1.96, + "learning_rate": 5.701200419541989e-07, + "loss": 0.5479, + "step": 76339 + }, + { + "epoch": 1.96, + "learning_rate": 5.700950588519148e-07, + "loss": 0.7354, + "step": 76340 + }, + { + "epoch": 1.96, + "learning_rate": 5.700700760787896e-07, + "loss": 0.6621, + "step": 76341 + }, + { + "epoch": 1.96, + "learning_rate": 5.700450936348414e-07, + "loss": 0.5952, + "step": 76342 + }, + { + "epoch": 1.96, + "learning_rate": 5.700201115200905e-07, + "loss": 0.4946, + "step": 76343 + }, + { + "epoch": 1.96, + "learning_rate": 5.699951297345549e-07, + "loss": 0.7422, + "step": 76344 + }, + { + "epoch": 1.96, + "learning_rate": 5.699701482782542e-07, + "loss": 0.665, + "step": 76345 + }, + { + "epoch": 1.96, + "learning_rate": 5.699451671512081e-07, + "loss": 0.7842, + "step": 76346 + }, + { + "epoch": 1.96, + "learning_rate": 5.699201863534348e-07, + "loss": 0.6045, + "step": 76347 + }, + { + "epoch": 1.96, + "learning_rate": 5.698952058849538e-07, + "loss": 0.6475, + "step": 76348 + }, + { + "epoch": 1.96, + "learning_rate": 5.698702257457842e-07, + "loss": 0.6714, + "step": 76349 + }, + { + "epoch": 1.96, + "learning_rate": 5.698452459359456e-07, + "loss": 0.5635, + "step": 76350 + }, + { + "epoch": 1.96, + "learning_rate": 5.698202664554568e-07, + "loss": 0.751, + "step": 76351 + }, + { + "epoch": 1.96, + "learning_rate": 5.697952873043365e-07, + "loss": 0.605, + "step": 76352 + }, + { + "epoch": 1.96, + "learning_rate": 5.69770308482604e-07, + "loss": 0.3298, + "step": 76353 + }, + { + "epoch": 1.96, + "learning_rate": 5.697453299902787e-07, + "loss": 0.6543, + "step": 76354 + }, + { + "epoch": 1.96, + "learning_rate": 5.6972035182738e-07, + "loss": 0.8066, + "step": 76355 + }, + { + "epoch": 1.96, + "learning_rate": 5.696953739939262e-07, + "loss": 0.7539, + "step": 76356 + }, + { + "epoch": 1.96, + "learning_rate": 5.69670396489937e-07, + "loss": 0.606, + "step": 76357 + }, + { + "epoch": 1.96, + "learning_rate": 5.696454193154312e-07, + "loss": 0.6724, + "step": 76358 + }, + { + "epoch": 1.96, + "learning_rate": 5.696204424704285e-07, + "loss": 0.5645, + "step": 76359 + }, + { + "epoch": 1.96, + "learning_rate": 5.695954659549475e-07, + "loss": 0.6235, + "step": 76360 + }, + { + "epoch": 1.96, + "learning_rate": 5.695704897690077e-07, + "loss": 0.7031, + "step": 76361 + }, + { + "epoch": 1.96, + "learning_rate": 5.695455139126275e-07, + "loss": 0.6289, + "step": 76362 + }, + { + "epoch": 1.96, + "learning_rate": 5.695205383858271e-07, + "loss": 0.7539, + "step": 76363 + }, + { + "epoch": 1.96, + "learning_rate": 5.694955631886245e-07, + "loss": 0.6777, + "step": 76364 + }, + { + "epoch": 1.96, + "learning_rate": 5.694705883210393e-07, + "loss": 0.7803, + "step": 76365 + }, + { + "epoch": 1.96, + "learning_rate": 5.694456137830907e-07, + "loss": 0.4316, + "step": 76366 + }, + { + "epoch": 1.96, + "learning_rate": 5.694206395747983e-07, + "loss": 0.7349, + "step": 76367 + }, + { + "epoch": 1.96, + "learning_rate": 5.693956656961802e-07, + "loss": 0.7939, + "step": 76368 + }, + { + "epoch": 1.96, + "learning_rate": 5.69370692147256e-07, + "loss": 0.6855, + "step": 76369 + }, + { + "epoch": 1.96, + "learning_rate": 5.69345718928045e-07, + "loss": 0.6499, + "step": 76370 + }, + { + "epoch": 1.96, + "learning_rate": 5.693207460385668e-07, + "loss": 0.6904, + "step": 76371 + }, + { + "epoch": 1.96, + "learning_rate": 5.692957734788395e-07, + "loss": 0.7461, + "step": 76372 + }, + { + "epoch": 1.96, + "learning_rate": 5.692708012488824e-07, + "loss": 0.4565, + "step": 76373 + }, + { + "epoch": 1.96, + "learning_rate": 5.692458293487148e-07, + "loss": 0.5996, + "step": 76374 + }, + { + "epoch": 1.96, + "learning_rate": 5.692208577783558e-07, + "loss": 0.5718, + "step": 76375 + }, + { + "epoch": 1.96, + "learning_rate": 5.69195886537825e-07, + "loss": 0.6035, + "step": 76376 + }, + { + "epoch": 1.96, + "learning_rate": 5.691709156271409e-07, + "loss": 0.6167, + "step": 76377 + }, + { + "epoch": 1.96, + "learning_rate": 5.691459450463226e-07, + "loss": 0.6143, + "step": 76378 + }, + { + "epoch": 1.96, + "learning_rate": 5.691209747953896e-07, + "loss": 0.6313, + "step": 76379 + }, + { + "epoch": 1.96, + "learning_rate": 5.690960048743612e-07, + "loss": 0.55, + "step": 76380 + }, + { + "epoch": 1.96, + "learning_rate": 5.69071035283256e-07, + "loss": 0.6758, + "step": 76381 + }, + { + "epoch": 1.96, + "learning_rate": 5.690460660220931e-07, + "loss": 0.5581, + "step": 76382 + }, + { + "epoch": 1.96, + "learning_rate": 5.690210970908918e-07, + "loss": 0.4736, + "step": 76383 + }, + { + "epoch": 1.96, + "learning_rate": 5.689961284896715e-07, + "loss": 0.7383, + "step": 76384 + }, + { + "epoch": 1.96, + "learning_rate": 5.689711602184507e-07, + "loss": 0.666, + "step": 76385 + }, + { + "epoch": 1.96, + "learning_rate": 5.689461922772489e-07, + "loss": 0.4299, + "step": 76386 + }, + { + "epoch": 1.96, + "learning_rate": 5.689212246660852e-07, + "loss": 0.6533, + "step": 76387 + }, + { + "epoch": 1.96, + "learning_rate": 5.688962573849791e-07, + "loss": 0.6572, + "step": 76388 + }, + { + "epoch": 1.96, + "learning_rate": 5.688712904339487e-07, + "loss": 0.5532, + "step": 76389 + }, + { + "epoch": 1.96, + "learning_rate": 5.688463238130141e-07, + "loss": 0.6167, + "step": 76390 + }, + { + "epoch": 1.96, + "learning_rate": 5.688213575221942e-07, + "loss": 0.5942, + "step": 76391 + }, + { + "epoch": 1.96, + "learning_rate": 5.687963915615076e-07, + "loss": 0.5898, + "step": 76392 + }, + { + "epoch": 1.96, + "learning_rate": 5.687714259309742e-07, + "loss": 0.5879, + "step": 76393 + }, + { + "epoch": 1.96, + "learning_rate": 5.687464606306122e-07, + "loss": 0.5557, + "step": 76394 + }, + { + "epoch": 1.96, + "learning_rate": 5.687214956604413e-07, + "loss": 0.6787, + "step": 76395 + }, + { + "epoch": 1.96, + "learning_rate": 5.686965310204806e-07, + "loss": 0.6855, + "step": 76396 + }, + { + "epoch": 1.96, + "learning_rate": 5.686715667107493e-07, + "loss": 0.5105, + "step": 76397 + }, + { + "epoch": 1.96, + "learning_rate": 5.686466027312662e-07, + "loss": 0.6812, + "step": 76398 + }, + { + "epoch": 1.96, + "learning_rate": 5.686216390820504e-07, + "loss": 0.5654, + "step": 76399 + }, + { + "epoch": 1.96, + "learning_rate": 5.685966757631213e-07, + "loss": 0.6138, + "step": 76400 + }, + { + "epoch": 1.96, + "learning_rate": 5.685717127744986e-07, + "loss": 0.5986, + "step": 76401 + }, + { + "epoch": 1.96, + "learning_rate": 5.685467501161998e-07, + "loss": 0.5947, + "step": 76402 + }, + { + "epoch": 1.96, + "learning_rate": 5.685217877882451e-07, + "loss": 0.6592, + "step": 76403 + }, + { + "epoch": 1.96, + "learning_rate": 5.684968257906532e-07, + "loss": 0.6992, + "step": 76404 + }, + { + "epoch": 1.96, + "learning_rate": 5.684718641234442e-07, + "loss": 0.8682, + "step": 76405 + }, + { + "epoch": 1.96, + "learning_rate": 5.684469027866359e-07, + "loss": 0.5171, + "step": 76406 + }, + { + "epoch": 1.96, + "learning_rate": 5.684219417802478e-07, + "loss": 0.7822, + "step": 76407 + }, + { + "epoch": 1.96, + "learning_rate": 5.683969811042993e-07, + "loss": 0.5869, + "step": 76408 + }, + { + "epoch": 1.96, + "learning_rate": 5.683720207588098e-07, + "loss": 0.4561, + "step": 76409 + }, + { + "epoch": 1.96, + "learning_rate": 5.683470607437975e-07, + "loss": 0.5913, + "step": 76410 + }, + { + "epoch": 1.96, + "learning_rate": 5.683221010592825e-07, + "loss": 0.5288, + "step": 76411 + }, + { + "epoch": 1.96, + "learning_rate": 5.68297141705283e-07, + "loss": 0.5007, + "step": 76412 + }, + { + "epoch": 1.96, + "learning_rate": 5.682721826818186e-07, + "loss": 0.6074, + "step": 76413 + }, + { + "epoch": 1.96, + "learning_rate": 5.682472239889085e-07, + "loss": 0.6748, + "step": 76414 + }, + { + "epoch": 1.96, + "learning_rate": 5.682222656265714e-07, + "loss": 0.5879, + "step": 76415 + }, + { + "epoch": 1.96, + "learning_rate": 5.681973075948268e-07, + "loss": 0.5435, + "step": 76416 + }, + { + "epoch": 1.96, + "learning_rate": 5.681723498936934e-07, + "loss": 0.7432, + "step": 76417 + }, + { + "epoch": 1.96, + "learning_rate": 5.681473925231913e-07, + "loss": 0.5645, + "step": 76418 + }, + { + "epoch": 1.96, + "learning_rate": 5.681224354833383e-07, + "loss": 0.6392, + "step": 76419 + }, + { + "epoch": 1.96, + "learning_rate": 5.680974787741539e-07, + "loss": 0.6611, + "step": 76420 + }, + { + "epoch": 1.96, + "learning_rate": 5.680725223956581e-07, + "loss": 0.6963, + "step": 76421 + }, + { + "epoch": 1.96, + "learning_rate": 5.680475663478692e-07, + "loss": 0.645, + "step": 76422 + }, + { + "epoch": 1.96, + "learning_rate": 5.680226106308059e-07, + "loss": 0.7812, + "step": 76423 + }, + { + "epoch": 1.96, + "learning_rate": 5.679976552444881e-07, + "loss": 0.6348, + "step": 76424 + }, + { + "epoch": 1.96, + "learning_rate": 5.679727001889344e-07, + "loss": 0.4902, + "step": 76425 + }, + { + "epoch": 1.96, + "learning_rate": 5.679477454641646e-07, + "loss": 0.4763, + "step": 76426 + }, + { + "epoch": 1.96, + "learning_rate": 5.679227910701969e-07, + "loss": 0.7529, + "step": 76427 + }, + { + "epoch": 1.96, + "learning_rate": 5.67897837007051e-07, + "loss": 0.5468, + "step": 76428 + }, + { + "epoch": 1.96, + "learning_rate": 5.678728832747457e-07, + "loss": 0.7949, + "step": 76429 + }, + { + "epoch": 1.96, + "learning_rate": 5.678479298733008e-07, + "loss": 0.7231, + "step": 76430 + }, + { + "epoch": 1.96, + "learning_rate": 5.678229768027347e-07, + "loss": 0.7256, + "step": 76431 + }, + { + "epoch": 1.96, + "learning_rate": 5.677980240630664e-07, + "loss": 0.502, + "step": 76432 + }, + { + "epoch": 1.96, + "learning_rate": 5.677730716543152e-07, + "loss": 0.501, + "step": 76433 + }, + { + "epoch": 1.96, + "learning_rate": 5.677481195765004e-07, + "loss": 0.7207, + "step": 76434 + }, + { + "epoch": 1.96, + "learning_rate": 5.677231678296412e-07, + "loss": 0.5815, + "step": 76435 + }, + { + "epoch": 1.96, + "learning_rate": 5.676982164137563e-07, + "loss": 0.5083, + "step": 76436 + }, + { + "epoch": 1.96, + "learning_rate": 5.67673265328865e-07, + "loss": 0.6133, + "step": 76437 + }, + { + "epoch": 1.96, + "learning_rate": 5.676483145749866e-07, + "loss": 0.5962, + "step": 76438 + }, + { + "epoch": 1.96, + "learning_rate": 5.676233641521397e-07, + "loss": 0.2526, + "step": 76439 + }, + { + "epoch": 1.96, + "learning_rate": 5.675984140603438e-07, + "loss": 0.6582, + "step": 76440 + }, + { + "epoch": 1.96, + "learning_rate": 5.675734642996183e-07, + "loss": 0.5905, + "step": 76441 + }, + { + "epoch": 1.96, + "learning_rate": 5.675485148699815e-07, + "loss": 0.7065, + "step": 76442 + }, + { + "epoch": 1.96, + "learning_rate": 5.675235657714533e-07, + "loss": 0.666, + "step": 76443 + }, + { + "epoch": 1.96, + "learning_rate": 5.674986170040519e-07, + "loss": 0.6875, + "step": 76444 + }, + { + "epoch": 1.96, + "learning_rate": 5.674736685677969e-07, + "loss": 0.5938, + "step": 76445 + }, + { + "epoch": 1.96, + "learning_rate": 5.674487204627076e-07, + "loss": 0.4949, + "step": 76446 + }, + { + "epoch": 1.96, + "learning_rate": 5.674237726888034e-07, + "loss": 0.5356, + "step": 76447 + }, + { + "epoch": 1.96, + "learning_rate": 5.673988252461023e-07, + "loss": 0.5752, + "step": 76448 + }, + { + "epoch": 1.96, + "learning_rate": 5.673738781346241e-07, + "loss": 0.7578, + "step": 76449 + }, + { + "epoch": 1.96, + "learning_rate": 5.673489313543879e-07, + "loss": 0.6738, + "step": 76450 + }, + { + "epoch": 1.96, + "learning_rate": 5.67323984905413e-07, + "loss": 0.4731, + "step": 76451 + }, + { + "epoch": 1.96, + "learning_rate": 5.672990387877184e-07, + "loss": 0.5957, + "step": 76452 + }, + { + "epoch": 1.96, + "learning_rate": 5.672740930013224e-07, + "loss": 0.8057, + "step": 76453 + }, + { + "epoch": 1.96, + "learning_rate": 5.67249147546245e-07, + "loss": 0.5112, + "step": 76454 + }, + { + "epoch": 1.96, + "learning_rate": 5.672242024225053e-07, + "loss": 0.6577, + "step": 76455 + }, + { + "epoch": 1.96, + "learning_rate": 5.671992576301217e-07, + "loss": 0.7451, + "step": 76456 + }, + { + "epoch": 1.96, + "learning_rate": 5.671743131691138e-07, + "loss": 0.7373, + "step": 76457 + }, + { + "epoch": 1.96, + "learning_rate": 5.671493690395005e-07, + "loss": 0.5938, + "step": 76458 + }, + { + "epoch": 1.96, + "learning_rate": 5.671244252413016e-07, + "loss": 0.8135, + "step": 76459 + }, + { + "epoch": 1.96, + "learning_rate": 5.67099481774535e-07, + "loss": 0.4883, + "step": 76460 + }, + { + "epoch": 1.96, + "learning_rate": 5.67074538639221e-07, + "loss": 0.7031, + "step": 76461 + }, + { + "epoch": 1.96, + "learning_rate": 5.670495958353777e-07, + "loss": 0.625, + "step": 76462 + }, + { + "epoch": 1.96, + "learning_rate": 5.670246533630246e-07, + "loss": 0.5034, + "step": 76463 + }, + { + "epoch": 1.96, + "learning_rate": 5.669997112221811e-07, + "loss": 0.6104, + "step": 76464 + }, + { + "epoch": 1.96, + "learning_rate": 5.669747694128657e-07, + "loss": 0.6392, + "step": 76465 + }, + { + "epoch": 1.96, + "learning_rate": 5.669498279350979e-07, + "loss": 0.5122, + "step": 76466 + }, + { + "epoch": 1.96, + "learning_rate": 5.669248867888966e-07, + "loss": 0.7529, + "step": 76467 + }, + { + "epoch": 1.96, + "learning_rate": 5.668999459742815e-07, + "loss": 0.6592, + "step": 76468 + }, + { + "epoch": 1.96, + "learning_rate": 5.668750054912706e-07, + "loss": 0.4417, + "step": 76469 + }, + { + "epoch": 1.96, + "learning_rate": 5.668500653398838e-07, + "loss": 0.6294, + "step": 76470 + }, + { + "epoch": 1.96, + "learning_rate": 5.668251255201403e-07, + "loss": 0.5957, + "step": 76471 + }, + { + "epoch": 1.96, + "learning_rate": 5.668001860320588e-07, + "loss": 0.7012, + "step": 76472 + }, + { + "epoch": 1.96, + "learning_rate": 5.667752468756582e-07, + "loss": 0.7676, + "step": 76473 + }, + { + "epoch": 1.96, + "learning_rate": 5.667503080509579e-07, + "loss": 0.4302, + "step": 76474 + }, + { + "epoch": 1.96, + "learning_rate": 5.66725369557977e-07, + "loss": 0.6079, + "step": 76475 + }, + { + "epoch": 1.96, + "learning_rate": 5.667004313967348e-07, + "loss": 0.6416, + "step": 76476 + }, + { + "epoch": 1.96, + "learning_rate": 5.666754935672498e-07, + "loss": 0.7295, + "step": 76477 + }, + { + "epoch": 1.96, + "learning_rate": 5.666505560695415e-07, + "loss": 0.5419, + "step": 76478 + }, + { + "epoch": 1.96, + "learning_rate": 5.666256189036289e-07, + "loss": 0.6572, + "step": 76479 + }, + { + "epoch": 1.96, + "learning_rate": 5.666006820695315e-07, + "loss": 0.5571, + "step": 76480 + }, + { + "epoch": 1.96, + "learning_rate": 5.665757455672681e-07, + "loss": 0.6787, + "step": 76481 + }, + { + "epoch": 1.96, + "learning_rate": 5.665508093968574e-07, + "loss": 0.5806, + "step": 76482 + }, + { + "epoch": 1.96, + "learning_rate": 5.665258735583187e-07, + "loss": 0.6743, + "step": 76483 + }, + { + "epoch": 1.96, + "learning_rate": 5.665009380516712e-07, + "loss": 0.7588, + "step": 76484 + }, + { + "epoch": 1.96, + "learning_rate": 5.664760028769345e-07, + "loss": 0.6094, + "step": 76485 + }, + { + "epoch": 1.96, + "learning_rate": 5.664510680341266e-07, + "loss": 0.563, + "step": 76486 + }, + { + "epoch": 1.96, + "learning_rate": 5.664261335232674e-07, + "loss": 0.6143, + "step": 76487 + }, + { + "epoch": 1.96, + "learning_rate": 5.664011993443755e-07, + "loss": 0.5957, + "step": 76488 + }, + { + "epoch": 1.96, + "learning_rate": 5.663762654974709e-07, + "loss": 0.7031, + "step": 76489 + }, + { + "epoch": 1.96, + "learning_rate": 5.663513319825717e-07, + "loss": 0.6787, + "step": 76490 + }, + { + "epoch": 1.96, + "learning_rate": 5.663263987996976e-07, + "loss": 0.5237, + "step": 76491 + }, + { + "epoch": 1.96, + "learning_rate": 5.66301465948867e-07, + "loss": 0.6162, + "step": 76492 + }, + { + "epoch": 1.96, + "learning_rate": 5.662765334300999e-07, + "loss": 0.5503, + "step": 76493 + }, + { + "epoch": 1.96, + "learning_rate": 5.662516012434146e-07, + "loss": 0.4863, + "step": 76494 + }, + { + "epoch": 1.96, + "learning_rate": 5.662266693888303e-07, + "loss": 0.6958, + "step": 76495 + }, + { + "epoch": 1.96, + "learning_rate": 5.662017378663665e-07, + "loss": 0.5942, + "step": 76496 + }, + { + "epoch": 1.96, + "learning_rate": 5.661768066760424e-07, + "loss": 0.5059, + "step": 76497 + }, + { + "epoch": 1.96, + "learning_rate": 5.661518758178763e-07, + "loss": 0.5947, + "step": 76498 + }, + { + "epoch": 1.96, + "learning_rate": 5.661269452918879e-07, + "loss": 0.79, + "step": 76499 + }, + { + "epoch": 1.96, + "learning_rate": 5.661020150980961e-07, + "loss": 0.6445, + "step": 76500 + }, + { + "epoch": 1.96, + "learning_rate": 5.660770852365205e-07, + "loss": 0.5664, + "step": 76501 + }, + { + "epoch": 1.96, + "learning_rate": 5.660521557071796e-07, + "loss": 0.4646, + "step": 76502 + }, + { + "epoch": 1.96, + "learning_rate": 5.660272265100922e-07, + "loss": 0.5557, + "step": 76503 + }, + { + "epoch": 1.96, + "learning_rate": 5.660022976452779e-07, + "loss": 0.3943, + "step": 76504 + }, + { + "epoch": 1.96, + "learning_rate": 5.659773691127555e-07, + "loss": 0.707, + "step": 76505 + }, + { + "epoch": 1.96, + "learning_rate": 5.659524409125448e-07, + "loss": 0.5864, + "step": 76506 + }, + { + "epoch": 1.96, + "learning_rate": 5.65927513044664e-07, + "loss": 0.5276, + "step": 76507 + }, + { + "epoch": 1.96, + "learning_rate": 5.659025855091324e-07, + "loss": 0.6211, + "step": 76508 + }, + { + "epoch": 1.96, + "learning_rate": 5.658776583059698e-07, + "loss": 0.7666, + "step": 76509 + }, + { + "epoch": 1.96, + "learning_rate": 5.658527314351942e-07, + "loss": 0.5854, + "step": 76510 + }, + { + "epoch": 1.96, + "learning_rate": 5.658278048968257e-07, + "loss": 0.5098, + "step": 76511 + }, + { + "epoch": 1.96, + "learning_rate": 5.658028786908824e-07, + "loss": 0.6499, + "step": 76512 + }, + { + "epoch": 1.96, + "learning_rate": 5.657779528173839e-07, + "loss": 0.6636, + "step": 76513 + }, + { + "epoch": 1.96, + "learning_rate": 5.657530272763498e-07, + "loss": 0.6113, + "step": 76514 + }, + { + "epoch": 1.96, + "learning_rate": 5.65728102067798e-07, + "loss": 0.5908, + "step": 76515 + }, + { + "epoch": 1.96, + "learning_rate": 5.657031771917483e-07, + "loss": 0.5328, + "step": 76516 + }, + { + "epoch": 1.96, + "learning_rate": 5.656782526482197e-07, + "loss": 0.5796, + "step": 76517 + }, + { + "epoch": 1.96, + "learning_rate": 5.656533284372318e-07, + "loss": 0.7617, + "step": 76518 + }, + { + "epoch": 1.96, + "learning_rate": 5.656284045588027e-07, + "loss": 0.5605, + "step": 76519 + }, + { + "epoch": 1.96, + "learning_rate": 5.656034810129519e-07, + "loss": 0.5586, + "step": 76520 + }, + { + "epoch": 1.96, + "learning_rate": 5.65578557799699e-07, + "loss": 0.7354, + "step": 76521 + }, + { + "epoch": 1.96, + "learning_rate": 5.655536349190622e-07, + "loss": 0.5752, + "step": 76522 + }, + { + "epoch": 1.96, + "learning_rate": 5.655287123710615e-07, + "loss": 0.8037, + "step": 76523 + }, + { + "epoch": 1.96, + "learning_rate": 5.65503790155715e-07, + "loss": 0.6885, + "step": 76524 + }, + { + "epoch": 1.96, + "learning_rate": 5.654788682730423e-07, + "loss": 0.6875, + "step": 76525 + }, + { + "epoch": 1.96, + "learning_rate": 5.654539467230628e-07, + "loss": 0.5112, + "step": 76526 + }, + { + "epoch": 1.96, + "learning_rate": 5.654290255057949e-07, + "loss": 0.5498, + "step": 76527 + }, + { + "epoch": 1.96, + "learning_rate": 5.654041046212579e-07, + "loss": 0.6299, + "step": 76528 + }, + { + "epoch": 1.96, + "learning_rate": 5.65379184069471e-07, + "loss": 0.709, + "step": 76529 + }, + { + "epoch": 1.96, + "learning_rate": 5.653542638504538e-07, + "loss": 0.5508, + "step": 76530 + }, + { + "epoch": 1.96, + "learning_rate": 5.653293439642249e-07, + "loss": 0.6221, + "step": 76531 + }, + { + "epoch": 1.96, + "learning_rate": 5.653044244108027e-07, + "loss": 0.5698, + "step": 76532 + }, + { + "epoch": 1.96, + "learning_rate": 5.652795051902071e-07, + "loss": 0.6621, + "step": 76533 + }, + { + "epoch": 1.96, + "learning_rate": 5.65254586302457e-07, + "loss": 0.708, + "step": 76534 + }, + { + "epoch": 1.96, + "learning_rate": 5.652296677475718e-07, + "loss": 0.5479, + "step": 76535 + }, + { + "epoch": 1.96, + "learning_rate": 5.652047495255698e-07, + "loss": 0.6948, + "step": 76536 + }, + { + "epoch": 1.96, + "learning_rate": 5.651798316364706e-07, + "loss": 0.6885, + "step": 76537 + }, + { + "epoch": 1.96, + "learning_rate": 5.651549140802933e-07, + "loss": 0.7969, + "step": 76538 + }, + { + "epoch": 1.96, + "learning_rate": 5.651299968570571e-07, + "loss": 0.8223, + "step": 76539 + }, + { + "epoch": 1.96, + "learning_rate": 5.651050799667807e-07, + "loss": 0.4761, + "step": 76540 + }, + { + "epoch": 1.96, + "learning_rate": 5.650801634094835e-07, + "loss": 0.6484, + "step": 76541 + }, + { + "epoch": 1.96, + "learning_rate": 5.650552471851841e-07, + "loss": 0.5181, + "step": 76542 + }, + { + "epoch": 1.96, + "learning_rate": 5.650303312939024e-07, + "loss": 0.4188, + "step": 76543 + }, + { + "epoch": 1.96, + "learning_rate": 5.650054157356565e-07, + "loss": 0.6353, + "step": 76544 + }, + { + "epoch": 1.96, + "learning_rate": 5.64980500510466e-07, + "loss": 0.5269, + "step": 76545 + }, + { + "epoch": 1.96, + "learning_rate": 5.649555856183499e-07, + "loss": 0.6221, + "step": 76546 + }, + { + "epoch": 1.96, + "learning_rate": 5.649306710593275e-07, + "loss": 0.7119, + "step": 76547 + }, + { + "epoch": 1.96, + "learning_rate": 5.649057568334175e-07, + "loss": 0.624, + "step": 76548 + }, + { + "epoch": 1.96, + "learning_rate": 5.648808429406391e-07, + "loss": 0.5654, + "step": 76549 + }, + { + "epoch": 1.96, + "learning_rate": 5.648559293810119e-07, + "loss": 0.4025, + "step": 76550 + }, + { + "epoch": 1.96, + "learning_rate": 5.648310161545541e-07, + "loss": 0.7305, + "step": 76551 + }, + { + "epoch": 1.96, + "learning_rate": 5.648061032612855e-07, + "loss": 0.67, + "step": 76552 + }, + { + "epoch": 1.96, + "learning_rate": 5.647811907012245e-07, + "loss": 0.5811, + "step": 76553 + }, + { + "epoch": 1.96, + "learning_rate": 5.647562784743904e-07, + "loss": 0.7998, + "step": 76554 + }, + { + "epoch": 1.96, + "learning_rate": 5.647313665808027e-07, + "loss": 0.6841, + "step": 76555 + }, + { + "epoch": 1.96, + "learning_rate": 5.647064550204803e-07, + "loss": 0.5918, + "step": 76556 + }, + { + "epoch": 1.96, + "learning_rate": 5.64681543793442e-07, + "loss": 0.6709, + "step": 76557 + }, + { + "epoch": 1.96, + "learning_rate": 5.646566328997067e-07, + "loss": 0.8232, + "step": 76558 + }, + { + "epoch": 1.96, + "learning_rate": 5.64631722339294e-07, + "loss": 0.6533, + "step": 76559 + }, + { + "epoch": 1.96, + "learning_rate": 5.646068121122236e-07, + "loss": 0.813, + "step": 76560 + }, + { + "epoch": 1.96, + "learning_rate": 5.64581902218513e-07, + "loss": 0.5967, + "step": 76561 + }, + { + "epoch": 1.96, + "learning_rate": 5.645569926581819e-07, + "loss": 0.6929, + "step": 76562 + }, + { + "epoch": 1.96, + "learning_rate": 5.645320834312494e-07, + "loss": 0.6631, + "step": 76563 + }, + { + "epoch": 1.96, + "learning_rate": 5.645071745377352e-07, + "loss": 0.6025, + "step": 76564 + }, + { + "epoch": 1.96, + "learning_rate": 5.644822659776574e-07, + "loss": 0.5103, + "step": 76565 + }, + { + "epoch": 1.96, + "learning_rate": 5.644573577510355e-07, + "loss": 0.4298, + "step": 76566 + }, + { + "epoch": 1.96, + "learning_rate": 5.644324498578885e-07, + "loss": 0.5413, + "step": 76567 + }, + { + "epoch": 1.96, + "learning_rate": 5.644075422982362e-07, + "loss": 0.4941, + "step": 76568 + }, + { + "epoch": 1.96, + "learning_rate": 5.643826350720964e-07, + "loss": 0.2236, + "step": 76569 + }, + { + "epoch": 1.96, + "learning_rate": 5.643577281794892e-07, + "loss": 0.6299, + "step": 76570 + }, + { + "epoch": 1.96, + "learning_rate": 5.643328216204329e-07, + "loss": 0.6099, + "step": 76571 + }, + { + "epoch": 1.96, + "learning_rate": 5.643079153949469e-07, + "loss": 0.6074, + "step": 76572 + }, + { + "epoch": 1.96, + "learning_rate": 5.642830095030507e-07, + "loss": 0.6479, + "step": 76573 + }, + { + "epoch": 1.96, + "learning_rate": 5.642581039447624e-07, + "loss": 0.5516, + "step": 76574 + }, + { + "epoch": 1.96, + "learning_rate": 5.642331987201019e-07, + "loss": 0.5977, + "step": 76575 + }, + { + "epoch": 1.96, + "learning_rate": 5.64208293829088e-07, + "loss": 0.5703, + "step": 76576 + }, + { + "epoch": 1.96, + "learning_rate": 5.641833892717401e-07, + "loss": 0.5103, + "step": 76577 + }, + { + "epoch": 1.96, + "learning_rate": 5.641584850480764e-07, + "loss": 0.688, + "step": 76578 + }, + { + "epoch": 1.96, + "learning_rate": 5.641335811581166e-07, + "loss": 0.6426, + "step": 76579 + }, + { + "epoch": 1.96, + "learning_rate": 5.641086776018801e-07, + "loss": 0.5234, + "step": 76580 + }, + { + "epoch": 1.96, + "learning_rate": 5.640837743793856e-07, + "loss": 0.7178, + "step": 76581 + }, + { + "epoch": 1.96, + "learning_rate": 5.640588714906516e-07, + "loss": 0.7363, + "step": 76582 + }, + { + "epoch": 1.96, + "learning_rate": 5.640339689356977e-07, + "loss": 0.5449, + "step": 76583 + }, + { + "epoch": 1.96, + "learning_rate": 5.64009066714543e-07, + "loss": 0.5854, + "step": 76584 + }, + { + "epoch": 1.96, + "learning_rate": 5.639841648272068e-07, + "loss": 0.4961, + "step": 76585 + }, + { + "epoch": 1.96, + "learning_rate": 5.639592632737075e-07, + "loss": 0.7061, + "step": 76586 + }, + { + "epoch": 1.96, + "learning_rate": 5.639343620540647e-07, + "loss": 0.5356, + "step": 76587 + }, + { + "epoch": 1.96, + "learning_rate": 5.639094611682972e-07, + "loss": 0.5967, + "step": 76588 + }, + { + "epoch": 1.96, + "learning_rate": 5.638845606164245e-07, + "loss": 0.5293, + "step": 76589 + }, + { + "epoch": 1.96, + "learning_rate": 5.638596603984656e-07, + "loss": 0.5781, + "step": 76590 + }, + { + "epoch": 1.96, + "learning_rate": 5.638347605144386e-07, + "loss": 0.5591, + "step": 76591 + }, + { + "epoch": 1.96, + "learning_rate": 5.638098609643633e-07, + "loss": 0.6406, + "step": 76592 + }, + { + "epoch": 1.96, + "learning_rate": 5.637849617482588e-07, + "loss": 0.4321, + "step": 76593 + }, + { + "epoch": 1.96, + "learning_rate": 5.637600628661446e-07, + "loss": 0.5894, + "step": 76594 + }, + { + "epoch": 1.96, + "learning_rate": 5.637351643180388e-07, + "loss": 0.4649, + "step": 76595 + }, + { + "epoch": 1.96, + "learning_rate": 5.637102661039609e-07, + "loss": 0.4824, + "step": 76596 + }, + { + "epoch": 1.96, + "learning_rate": 5.6368536822393e-07, + "loss": 0.584, + "step": 76597 + }, + { + "epoch": 1.96, + "learning_rate": 5.636604706779656e-07, + "loss": 0.605, + "step": 76598 + }, + { + "epoch": 1.96, + "learning_rate": 5.636355734660858e-07, + "loss": 0.6377, + "step": 76599 + }, + { + "epoch": 1.96, + "learning_rate": 5.636106765883106e-07, + "loss": 0.4424, + "step": 76600 + }, + { + "epoch": 1.96, + "learning_rate": 5.635857800446583e-07, + "loss": 0.7197, + "step": 76601 + }, + { + "epoch": 1.96, + "learning_rate": 5.635608838351486e-07, + "loss": 0.75, + "step": 76602 + }, + { + "epoch": 1.96, + "learning_rate": 5.635359879598001e-07, + "loss": 0.4219, + "step": 76603 + }, + { + "epoch": 1.96, + "learning_rate": 5.635110924186317e-07, + "loss": 0.7891, + "step": 76604 + }, + { + "epoch": 1.96, + "learning_rate": 5.63486197211663e-07, + "loss": 0.7788, + "step": 76605 + }, + { + "epoch": 1.96, + "learning_rate": 5.634613023389132e-07, + "loss": 0.5713, + "step": 76606 + }, + { + "epoch": 1.96, + "learning_rate": 5.634364078004006e-07, + "loss": 0.6897, + "step": 76607 + }, + { + "epoch": 1.96, + "learning_rate": 5.634115135961447e-07, + "loss": 0.4546, + "step": 76608 + }, + { + "epoch": 1.96, + "learning_rate": 5.633866197261646e-07, + "loss": 0.5361, + "step": 76609 + }, + { + "epoch": 1.96, + "learning_rate": 5.633617261904795e-07, + "loss": 0.6631, + "step": 76610 + }, + { + "epoch": 1.96, + "learning_rate": 5.633368329891084e-07, + "loss": 0.605, + "step": 76611 + }, + { + "epoch": 1.96, + "learning_rate": 5.633119401220696e-07, + "loss": 0.6982, + "step": 76612 + }, + { + "epoch": 1.96, + "learning_rate": 5.63287047589383e-07, + "loss": 0.6958, + "step": 76613 + }, + { + "epoch": 1.96, + "learning_rate": 5.632621553910674e-07, + "loss": 0.6035, + "step": 76614 + }, + { + "epoch": 1.96, + "learning_rate": 5.632372635271422e-07, + "loss": 0.6738, + "step": 76615 + }, + { + "epoch": 1.96, + "learning_rate": 5.632123719976258e-07, + "loss": 0.521, + "step": 76616 + }, + { + "epoch": 1.96, + "learning_rate": 5.631874808025375e-07, + "loss": 0.7583, + "step": 76617 + }, + { + "epoch": 1.96, + "learning_rate": 5.63162589941897e-07, + "loss": 0.6729, + "step": 76618 + }, + { + "epoch": 1.96, + "learning_rate": 5.631376994157223e-07, + "loss": 0.7402, + "step": 76619 + }, + { + "epoch": 1.96, + "learning_rate": 5.631128092240335e-07, + "loss": 0.509, + "step": 76620 + }, + { + "epoch": 1.96, + "learning_rate": 5.630879193668487e-07, + "loss": 0.7329, + "step": 76621 + }, + { + "epoch": 1.96, + "learning_rate": 5.630630298441873e-07, + "loss": 0.5579, + "step": 76622 + }, + { + "epoch": 1.96, + "learning_rate": 5.63038140656069e-07, + "loss": 0.5864, + "step": 76623 + }, + { + "epoch": 1.96, + "learning_rate": 5.630132518025117e-07, + "loss": 0.5452, + "step": 76624 + }, + { + "epoch": 1.96, + "learning_rate": 5.629883632835352e-07, + "loss": 0.5737, + "step": 76625 + }, + { + "epoch": 1.96, + "learning_rate": 5.629634750991583e-07, + "loss": 0.6685, + "step": 76626 + }, + { + "epoch": 1.96, + "learning_rate": 5.629385872494006e-07, + "loss": 0.5991, + "step": 76627 + }, + { + "epoch": 1.96, + "learning_rate": 5.629136997342804e-07, + "loss": 0.5991, + "step": 76628 + }, + { + "epoch": 1.96, + "learning_rate": 5.628888125538172e-07, + "loss": 0.7627, + "step": 76629 + }, + { + "epoch": 1.96, + "learning_rate": 5.628639257080301e-07, + "loss": 0.6768, + "step": 76630 + }, + { + "epoch": 1.96, + "learning_rate": 5.628390391969378e-07, + "loss": 0.5522, + "step": 76631 + }, + { + "epoch": 1.96, + "learning_rate": 5.628141530205597e-07, + "loss": 0.875, + "step": 76632 + }, + { + "epoch": 1.96, + "learning_rate": 5.627892671789145e-07, + "loss": 0.4773, + "step": 76633 + }, + { + "epoch": 1.96, + "learning_rate": 5.627643816720214e-07, + "loss": 0.6504, + "step": 76634 + }, + { + "epoch": 1.96, + "learning_rate": 5.627394964998999e-07, + "loss": 0.7256, + "step": 76635 + }, + { + "epoch": 1.96, + "learning_rate": 5.627146116625683e-07, + "loss": 0.7041, + "step": 76636 + }, + { + "epoch": 1.96, + "learning_rate": 5.62689727160046e-07, + "loss": 0.6089, + "step": 76637 + }, + { + "epoch": 1.96, + "learning_rate": 5.626648429923519e-07, + "loss": 0.75, + "step": 76638 + }, + { + "epoch": 1.96, + "learning_rate": 5.626399591595059e-07, + "loss": 0.6621, + "step": 76639 + }, + { + "epoch": 1.96, + "learning_rate": 5.626150756615262e-07, + "loss": 0.5215, + "step": 76640 + }, + { + "epoch": 1.96, + "learning_rate": 5.625901924984318e-07, + "loss": 0.5061, + "step": 76641 + }, + { + "epoch": 1.96, + "learning_rate": 5.625653096702418e-07, + "loss": 0.5487, + "step": 76642 + }, + { + "epoch": 1.96, + "learning_rate": 5.625404271769754e-07, + "loss": 0.625, + "step": 76643 + }, + { + "epoch": 1.96, + "learning_rate": 5.625155450186522e-07, + "loss": 0.501, + "step": 76644 + }, + { + "epoch": 1.96, + "learning_rate": 5.624906631952902e-07, + "loss": 0.5605, + "step": 76645 + }, + { + "epoch": 1.96, + "learning_rate": 5.624657817069092e-07, + "loss": 0.6611, + "step": 76646 + }, + { + "epoch": 1.96, + "learning_rate": 5.624409005535278e-07, + "loss": 0.6475, + "step": 76647 + }, + { + "epoch": 1.96, + "learning_rate": 5.624160197351657e-07, + "loss": 0.5947, + "step": 76648 + }, + { + "epoch": 1.96, + "learning_rate": 5.623911392518414e-07, + "loss": 0.7588, + "step": 76649 + }, + { + "epoch": 1.96, + "learning_rate": 5.623662591035742e-07, + "loss": 0.6357, + "step": 76650 + }, + { + "epoch": 1.96, + "learning_rate": 5.623413792903828e-07, + "loss": 0.7339, + "step": 76651 + }, + { + "epoch": 1.96, + "learning_rate": 5.623164998122867e-07, + "loss": 0.7046, + "step": 76652 + }, + { + "epoch": 1.96, + "learning_rate": 5.622916206693045e-07, + "loss": 0.5225, + "step": 76653 + }, + { + "epoch": 1.96, + "learning_rate": 5.622667418614554e-07, + "loss": 0.7402, + "step": 76654 + }, + { + "epoch": 1.96, + "learning_rate": 5.622418633887586e-07, + "loss": 0.5791, + "step": 76655 + }, + { + "epoch": 1.96, + "learning_rate": 5.622169852512334e-07, + "loss": 0.7783, + "step": 76656 + }, + { + "epoch": 1.96, + "learning_rate": 5.621921074488982e-07, + "loss": 0.7183, + "step": 76657 + }, + { + "epoch": 1.96, + "learning_rate": 5.621672299817724e-07, + "loss": 0.7188, + "step": 76658 + }, + { + "epoch": 1.96, + "learning_rate": 5.621423528498747e-07, + "loss": 0.5728, + "step": 76659 + }, + { + "epoch": 1.96, + "learning_rate": 5.621174760532253e-07, + "loss": 0.7227, + "step": 76660 + }, + { + "epoch": 1.96, + "learning_rate": 5.620925995918422e-07, + "loss": 0.8545, + "step": 76661 + }, + { + "epoch": 1.96, + "learning_rate": 5.620677234657442e-07, + "loss": 0.5615, + "step": 76662 + }, + { + "epoch": 1.96, + "learning_rate": 5.620428476749509e-07, + "loss": 0.665, + "step": 76663 + }, + { + "epoch": 1.96, + "learning_rate": 5.620179722194813e-07, + "loss": 0.7441, + "step": 76664 + }, + { + "epoch": 1.96, + "learning_rate": 5.619930970993548e-07, + "loss": 0.5923, + "step": 76665 + }, + { + "epoch": 1.96, + "learning_rate": 5.619682223145895e-07, + "loss": 0.7979, + "step": 76666 + }, + { + "epoch": 1.97, + "learning_rate": 5.619433478652052e-07, + "loss": 0.4624, + "step": 76667 + }, + { + "epoch": 1.97, + "learning_rate": 5.619184737512206e-07, + "loss": 0.4714, + "step": 76668 + }, + { + "epoch": 1.97, + "learning_rate": 5.618935999726553e-07, + "loss": 0.3795, + "step": 76669 + }, + { + "epoch": 1.97, + "learning_rate": 5.618687265295279e-07, + "loss": 0.7041, + "step": 76670 + }, + { + "epoch": 1.97, + "learning_rate": 5.61843853421857e-07, + "loss": 0.6152, + "step": 76671 + }, + { + "epoch": 1.97, + "learning_rate": 5.618189806496623e-07, + "loss": 0.5244, + "step": 76672 + }, + { + "epoch": 1.97, + "learning_rate": 5.617941082129629e-07, + "loss": 0.543, + "step": 76673 + }, + { + "epoch": 1.97, + "learning_rate": 5.617692361117773e-07, + "loss": 0.6973, + "step": 76674 + }, + { + "epoch": 1.97, + "learning_rate": 5.617443643461248e-07, + "loss": 0.4561, + "step": 76675 + }, + { + "epoch": 1.97, + "learning_rate": 5.617194929160245e-07, + "loss": 0.563, + "step": 76676 + }, + { + "epoch": 1.97, + "learning_rate": 5.616946218214959e-07, + "loss": 0.686, + "step": 76677 + }, + { + "epoch": 1.97, + "learning_rate": 5.616697510625571e-07, + "loss": 0.6768, + "step": 76678 + }, + { + "epoch": 1.97, + "learning_rate": 5.616448806392275e-07, + "loss": 0.5337, + "step": 76679 + }, + { + "epoch": 1.97, + "learning_rate": 5.61620010551527e-07, + "loss": 0.344, + "step": 76680 + }, + { + "epoch": 1.97, + "learning_rate": 5.615951407994732e-07, + "loss": 0.6826, + "step": 76681 + }, + { + "epoch": 1.97, + "learning_rate": 5.615702713830863e-07, + "loss": 0.5981, + "step": 76682 + }, + { + "epoch": 1.97, + "learning_rate": 5.615454023023844e-07, + "loss": 0.8037, + "step": 76683 + }, + { + "epoch": 1.97, + "learning_rate": 5.615205335573873e-07, + "loss": 0.71, + "step": 76684 + }, + { + "epoch": 1.97, + "learning_rate": 5.614956651481135e-07, + "loss": 0.5957, + "step": 76685 + }, + { + "epoch": 1.97, + "learning_rate": 5.614707970745829e-07, + "loss": 0.5659, + "step": 76686 + }, + { + "epoch": 1.97, + "learning_rate": 5.614459293368134e-07, + "loss": 0.7852, + "step": 76687 + }, + { + "epoch": 1.97, + "learning_rate": 5.614210619348247e-07, + "loss": 0.6641, + "step": 76688 + }, + { + "epoch": 1.97, + "learning_rate": 5.613961948686361e-07, + "loss": 0.709, + "step": 76689 + }, + { + "epoch": 1.97, + "learning_rate": 5.613713281382662e-07, + "loss": 0.5874, + "step": 76690 + }, + { + "epoch": 1.97, + "learning_rate": 5.613464617437338e-07, + "loss": 0.7002, + "step": 76691 + }, + { + "epoch": 1.97, + "learning_rate": 5.613215956850581e-07, + "loss": 0.4722, + "step": 76692 + }, + { + "epoch": 1.97, + "learning_rate": 5.612967299622584e-07, + "loss": 0.5635, + "step": 76693 + }, + { + "epoch": 1.97, + "learning_rate": 5.61271864575354e-07, + "loss": 0.6499, + "step": 76694 + }, + { + "epoch": 1.97, + "learning_rate": 5.612469995243632e-07, + "loss": 0.5859, + "step": 76695 + }, + { + "epoch": 1.97, + "learning_rate": 5.612221348093053e-07, + "loss": 0.647, + "step": 76696 + }, + { + "epoch": 1.97, + "learning_rate": 5.611972704301995e-07, + "loss": 0.707, + "step": 76697 + }, + { + "epoch": 1.97, + "learning_rate": 5.611724063870651e-07, + "loss": 0.7197, + "step": 76698 + }, + { + "epoch": 1.97, + "learning_rate": 5.611475426799204e-07, + "loss": 0.3895, + "step": 76699 + }, + { + "epoch": 1.97, + "learning_rate": 5.611226793087855e-07, + "loss": 0.5698, + "step": 76700 + }, + { + "epoch": 1.97, + "learning_rate": 5.610978162736782e-07, + "loss": 0.6816, + "step": 76701 + }, + { + "epoch": 1.97, + "learning_rate": 5.61072953574618e-07, + "loss": 0.5552, + "step": 76702 + }, + { + "epoch": 1.97, + "learning_rate": 5.610480912116247e-07, + "loss": 0.477, + "step": 76703 + }, + { + "epoch": 1.97, + "learning_rate": 5.610232291847161e-07, + "loss": 0.8164, + "step": 76704 + }, + { + "epoch": 1.97, + "learning_rate": 5.609983674939118e-07, + "loss": 0.5835, + "step": 76705 + }, + { + "epoch": 1.97, + "learning_rate": 5.609735061392314e-07, + "loss": 0.5503, + "step": 76706 + }, + { + "epoch": 1.97, + "learning_rate": 5.60948645120693e-07, + "loss": 0.4946, + "step": 76707 + }, + { + "epoch": 1.97, + "learning_rate": 5.60923784438316e-07, + "loss": 0.8047, + "step": 76708 + }, + { + "epoch": 1.97, + "learning_rate": 5.608989240921195e-07, + "loss": 0.521, + "step": 76709 + }, + { + "epoch": 1.97, + "learning_rate": 5.608740640821227e-07, + "loss": 0.4736, + "step": 76710 + }, + { + "epoch": 1.97, + "learning_rate": 5.608492044083448e-07, + "loss": 0.7822, + "step": 76711 + }, + { + "epoch": 1.97, + "learning_rate": 5.608243450708039e-07, + "loss": 0.6592, + "step": 76712 + }, + { + "epoch": 1.97, + "learning_rate": 5.607994860695195e-07, + "loss": 0.5359, + "step": 76713 + }, + { + "epoch": 1.97, + "learning_rate": 5.607746274045109e-07, + "loss": 0.6865, + "step": 76714 + }, + { + "epoch": 1.97, + "learning_rate": 5.607497690757972e-07, + "loss": 0.7305, + "step": 76715 + }, + { + "epoch": 1.97, + "learning_rate": 5.607249110833969e-07, + "loss": 0.6162, + "step": 76716 + }, + { + "epoch": 1.97, + "learning_rate": 5.607000534273294e-07, + "loss": 0.5898, + "step": 76717 + }, + { + "epoch": 1.97, + "learning_rate": 5.606751961076136e-07, + "loss": 0.5806, + "step": 76718 + }, + { + "epoch": 1.97, + "learning_rate": 5.60650339124269e-07, + "loss": 0.6179, + "step": 76719 + }, + { + "epoch": 1.97, + "learning_rate": 5.606254824773143e-07, + "loss": 0.6719, + "step": 76720 + }, + { + "epoch": 1.97, + "learning_rate": 5.60600626166768e-07, + "loss": 0.4124, + "step": 76721 + }, + { + "epoch": 1.97, + "learning_rate": 5.605757701926496e-07, + "loss": 0.8906, + "step": 76722 + }, + { + "epoch": 1.97, + "learning_rate": 5.605509145549785e-07, + "loss": 0.7207, + "step": 76723 + }, + { + "epoch": 1.97, + "learning_rate": 5.60526059253773e-07, + "loss": 0.751, + "step": 76724 + }, + { + "epoch": 1.97, + "learning_rate": 5.605012042890524e-07, + "loss": 0.3896, + "step": 76725 + }, + { + "epoch": 1.97, + "learning_rate": 5.60476349660836e-07, + "loss": 0.6376, + "step": 76726 + }, + { + "epoch": 1.97, + "learning_rate": 5.60451495369143e-07, + "loss": 0.5952, + "step": 76727 + }, + { + "epoch": 1.97, + "learning_rate": 5.604266414139915e-07, + "loss": 0.6865, + "step": 76728 + }, + { + "epoch": 1.97, + "learning_rate": 5.604017877954013e-07, + "loss": 0.6733, + "step": 76729 + }, + { + "epoch": 1.97, + "learning_rate": 5.603769345133915e-07, + "loss": 0.6528, + "step": 76730 + }, + { + "epoch": 1.97, + "learning_rate": 5.603520815679806e-07, + "loss": 0.5574, + "step": 76731 + }, + { + "epoch": 1.97, + "learning_rate": 5.603272289591883e-07, + "loss": 0.7988, + "step": 76732 + }, + { + "epoch": 1.97, + "learning_rate": 5.603023766870328e-07, + "loss": 0.5762, + "step": 76733 + }, + { + "epoch": 1.97, + "learning_rate": 5.602775247515334e-07, + "loss": 0.3634, + "step": 76734 + }, + { + "epoch": 1.97, + "learning_rate": 5.602526731527094e-07, + "loss": 0.6553, + "step": 76735 + }, + { + "epoch": 1.97, + "learning_rate": 5.6022782189058e-07, + "loss": 0.6582, + "step": 76736 + }, + { + "epoch": 1.97, + "learning_rate": 5.602029709651637e-07, + "loss": 0.6816, + "step": 76737 + }, + { + "epoch": 1.97, + "learning_rate": 5.601781203764797e-07, + "loss": 0.603, + "step": 76738 + }, + { + "epoch": 1.97, + "learning_rate": 5.60153270124547e-07, + "loss": 0.6328, + "step": 76739 + }, + { + "epoch": 1.97, + "learning_rate": 5.601284202093853e-07, + "loss": 0.6524, + "step": 76740 + }, + { + "epoch": 1.97, + "learning_rate": 5.601035706310128e-07, + "loss": 0.667, + "step": 76741 + }, + { + "epoch": 1.97, + "learning_rate": 5.600787213894486e-07, + "loss": 0.7998, + "step": 76742 + }, + { + "epoch": 1.97, + "learning_rate": 5.60053872484712e-07, + "loss": 0.7075, + "step": 76743 + }, + { + "epoch": 1.97, + "learning_rate": 5.60029023916822e-07, + "loss": 0.6377, + "step": 76744 + }, + { + "epoch": 1.97, + "learning_rate": 5.600041756857973e-07, + "loss": 0.4976, + "step": 76745 + }, + { + "epoch": 1.97, + "learning_rate": 5.599793277916571e-07, + "loss": 0.5234, + "step": 76746 + }, + { + "epoch": 1.97, + "learning_rate": 5.599544802344206e-07, + "loss": 0.6309, + "step": 76747 + }, + { + "epoch": 1.97, + "learning_rate": 5.59929633014107e-07, + "loss": 0.7002, + "step": 76748 + }, + { + "epoch": 1.97, + "learning_rate": 5.599047861307348e-07, + "loss": 0.5815, + "step": 76749 + }, + { + "epoch": 1.97, + "learning_rate": 5.598799395843236e-07, + "loss": 0.5269, + "step": 76750 + }, + { + "epoch": 1.97, + "learning_rate": 5.598550933748916e-07, + "loss": 0.5752, + "step": 76751 + }, + { + "epoch": 1.97, + "learning_rate": 5.598302475024583e-07, + "loss": 0.5115, + "step": 76752 + }, + { + "epoch": 1.97, + "learning_rate": 5.598054019670432e-07, + "loss": 0.5417, + "step": 76753 + }, + { + "epoch": 1.97, + "learning_rate": 5.597805567686646e-07, + "loss": 0.4683, + "step": 76754 + }, + { + "epoch": 1.97, + "learning_rate": 5.597557119073417e-07, + "loss": 0.8467, + "step": 76755 + }, + { + "epoch": 1.97, + "learning_rate": 5.597308673830936e-07, + "loss": 0.625, + "step": 76756 + }, + { + "epoch": 1.97, + "learning_rate": 5.597060231959396e-07, + "loss": 0.5374, + "step": 76757 + }, + { + "epoch": 1.97, + "learning_rate": 5.596811793458982e-07, + "loss": 0.6685, + "step": 76758 + }, + { + "epoch": 1.97, + "learning_rate": 5.596563358329886e-07, + "loss": 0.6016, + "step": 76759 + }, + { + "epoch": 1.97, + "learning_rate": 5.596314926572305e-07, + "loss": 0.5479, + "step": 76760 + }, + { + "epoch": 1.97, + "learning_rate": 5.596066498186422e-07, + "loss": 0.5674, + "step": 76761 + }, + { + "epoch": 1.97, + "learning_rate": 5.595818073172423e-07, + "loss": 0.748, + "step": 76762 + }, + { + "epoch": 1.97, + "learning_rate": 5.595569651530506e-07, + "loss": 0.6011, + "step": 76763 + }, + { + "epoch": 1.97, + "learning_rate": 5.595321233260857e-07, + "loss": 0.6104, + "step": 76764 + }, + { + "epoch": 1.97, + "learning_rate": 5.59507281836367e-07, + "loss": 0.4882, + "step": 76765 + }, + { + "epoch": 1.97, + "learning_rate": 5.594824406839134e-07, + "loss": 0.3604, + "step": 76766 + }, + { + "epoch": 1.97, + "learning_rate": 5.594575998687434e-07, + "loss": 0.5764, + "step": 76767 + }, + { + "epoch": 1.97, + "learning_rate": 5.594327593908767e-07, + "loss": 0.5132, + "step": 76768 + }, + { + "epoch": 1.97, + "learning_rate": 5.594079192503325e-07, + "loss": 0.5718, + "step": 76769 + }, + { + "epoch": 1.97, + "learning_rate": 5.593830794471292e-07, + "loss": 0.6318, + "step": 76770 + }, + { + "epoch": 1.97, + "learning_rate": 5.593582399812859e-07, + "loss": 0.5781, + "step": 76771 + }, + { + "epoch": 1.97, + "learning_rate": 5.593334008528216e-07, + "loss": 0.6748, + "step": 76772 + }, + { + "epoch": 1.97, + "learning_rate": 5.593085620617554e-07, + "loss": 0.7197, + "step": 76773 + }, + { + "epoch": 1.97, + "learning_rate": 5.592837236081067e-07, + "loss": 0.5208, + "step": 76774 + }, + { + "epoch": 1.97, + "learning_rate": 5.59258885491894e-07, + "loss": 0.6963, + "step": 76775 + }, + { + "epoch": 1.97, + "learning_rate": 5.592340477131363e-07, + "loss": 0.646, + "step": 76776 + }, + { + "epoch": 1.97, + "learning_rate": 5.592092102718529e-07, + "loss": 0.3879, + "step": 76777 + }, + { + "epoch": 1.97, + "learning_rate": 5.591843731680632e-07, + "loss": 0.6787, + "step": 76778 + }, + { + "epoch": 1.97, + "learning_rate": 5.591595364017854e-07, + "loss": 0.5625, + "step": 76779 + }, + { + "epoch": 1.97, + "learning_rate": 5.591346999730391e-07, + "loss": 0.5215, + "step": 76780 + }, + { + "epoch": 1.97, + "learning_rate": 5.591098638818428e-07, + "loss": 0.7754, + "step": 76781 + }, + { + "epoch": 1.97, + "learning_rate": 5.590850281282162e-07, + "loss": 0.5737, + "step": 76782 + }, + { + "epoch": 1.97, + "learning_rate": 5.590601927121775e-07, + "loss": 0.6777, + "step": 76783 + }, + { + "epoch": 1.97, + "learning_rate": 5.590353576337461e-07, + "loss": 0.5144, + "step": 76784 + }, + { + "epoch": 1.97, + "learning_rate": 5.590105228929412e-07, + "loss": 0.4541, + "step": 76785 + }, + { + "epoch": 1.97, + "learning_rate": 5.589856884897819e-07, + "loss": 0.7812, + "step": 76786 + }, + { + "epoch": 1.97, + "learning_rate": 5.589608544242866e-07, + "loss": 0.6387, + "step": 76787 + }, + { + "epoch": 1.97, + "learning_rate": 5.589360206964747e-07, + "loss": 0.5979, + "step": 76788 + }, + { + "epoch": 1.97, + "learning_rate": 5.589111873063652e-07, + "loss": 0.6914, + "step": 76789 + }, + { + "epoch": 1.97, + "learning_rate": 5.588863542539776e-07, + "loss": 0.4382, + "step": 76790 + }, + { + "epoch": 1.97, + "learning_rate": 5.588615215393304e-07, + "loss": 0.6338, + "step": 76791 + }, + { + "epoch": 1.97, + "learning_rate": 5.588366891624423e-07, + "loss": 0.5732, + "step": 76792 + }, + { + "epoch": 1.97, + "learning_rate": 5.588118571233325e-07, + "loss": 0.584, + "step": 76793 + }, + { + "epoch": 1.97, + "learning_rate": 5.587870254220204e-07, + "loss": 0.6553, + "step": 76794 + }, + { + "epoch": 1.97, + "learning_rate": 5.58762194058525e-07, + "loss": 0.5918, + "step": 76795 + }, + { + "epoch": 1.97, + "learning_rate": 5.587373630328648e-07, + "loss": 0.6211, + "step": 76796 + }, + { + "epoch": 1.97, + "learning_rate": 5.58712532345059e-07, + "loss": 0.7188, + "step": 76797 + }, + { + "epoch": 1.97, + "learning_rate": 5.586877019951272e-07, + "loss": 0.3022, + "step": 76798 + }, + { + "epoch": 1.97, + "learning_rate": 5.586628719830875e-07, + "loss": 0.5942, + "step": 76799 + }, + { + "epoch": 1.97, + "learning_rate": 5.586380423089598e-07, + "loss": 0.5674, + "step": 76800 + }, + { + "epoch": 1.97, + "learning_rate": 5.586132129727623e-07, + "loss": 0.7549, + "step": 76801 + }, + { + "epoch": 1.97, + "learning_rate": 5.585883839745142e-07, + "loss": 0.6162, + "step": 76802 + }, + { + "epoch": 1.97, + "learning_rate": 5.585635553142352e-07, + "loss": 0.6421, + "step": 76803 + }, + { + "epoch": 1.97, + "learning_rate": 5.585387269919435e-07, + "loss": 0.5317, + "step": 76804 + }, + { + "epoch": 1.97, + "learning_rate": 5.585138990076582e-07, + "loss": 0.6748, + "step": 76805 + }, + { + "epoch": 1.97, + "learning_rate": 5.584890713613986e-07, + "loss": 0.3796, + "step": 76806 + }, + { + "epoch": 1.97, + "learning_rate": 5.58464244053184e-07, + "loss": 0.7471, + "step": 76807 + }, + { + "epoch": 1.97, + "learning_rate": 5.584394170830327e-07, + "loss": 0.6777, + "step": 76808 + }, + { + "epoch": 1.97, + "learning_rate": 5.584145904509638e-07, + "loss": 0.71, + "step": 76809 + }, + { + "epoch": 1.97, + "learning_rate": 5.583897641569971e-07, + "loss": 0.4844, + "step": 76810 + }, + { + "epoch": 1.97, + "learning_rate": 5.583649382011506e-07, + "loss": 0.6594, + "step": 76811 + }, + { + "epoch": 1.97, + "learning_rate": 5.583401125834443e-07, + "loss": 0.4932, + "step": 76812 + }, + { + "epoch": 1.97, + "learning_rate": 5.583152873038961e-07, + "loss": 0.7104, + "step": 76813 + }, + { + "epoch": 1.97, + "learning_rate": 5.582904623625258e-07, + "loss": 0.6846, + "step": 76814 + }, + { + "epoch": 1.97, + "learning_rate": 5.582656377593523e-07, + "loss": 0.6968, + "step": 76815 + }, + { + "epoch": 1.97, + "learning_rate": 5.582408134943943e-07, + "loss": 0.6328, + "step": 76816 + }, + { + "epoch": 1.97, + "learning_rate": 5.582159895676708e-07, + "loss": 0.6406, + "step": 76817 + }, + { + "epoch": 1.97, + "learning_rate": 5.581911659792012e-07, + "loss": 0.541, + "step": 76818 + }, + { + "epoch": 1.97, + "learning_rate": 5.581663427290046e-07, + "loss": 0.5962, + "step": 76819 + }, + { + "epoch": 1.97, + "learning_rate": 5.581415198170998e-07, + "loss": 0.5996, + "step": 76820 + }, + { + "epoch": 1.97, + "learning_rate": 5.581166972435051e-07, + "loss": 0.7344, + "step": 76821 + }, + { + "epoch": 1.97, + "learning_rate": 5.580918750082404e-07, + "loss": 0.562, + "step": 76822 + }, + { + "epoch": 1.97, + "learning_rate": 5.580670531113243e-07, + "loss": 0.5996, + "step": 76823 + }, + { + "epoch": 1.97, + "learning_rate": 5.580422315527764e-07, + "loss": 0.6685, + "step": 76824 + }, + { + "epoch": 1.97, + "learning_rate": 5.580174103326148e-07, + "loss": 0.6318, + "step": 76825 + }, + { + "epoch": 1.97, + "learning_rate": 5.57992589450859e-07, + "loss": 0.7832, + "step": 76826 + }, + { + "epoch": 1.97, + "learning_rate": 5.579677689075279e-07, + "loss": 0.709, + "step": 76827 + }, + { + "epoch": 1.97, + "learning_rate": 5.57942948702641e-07, + "loss": 0.5801, + "step": 76828 + }, + { + "epoch": 1.97, + "learning_rate": 5.579181288362163e-07, + "loss": 0.6807, + "step": 76829 + }, + { + "epoch": 1.97, + "learning_rate": 5.578933093082739e-07, + "loss": 0.5198, + "step": 76830 + }, + { + "epoch": 1.97, + "learning_rate": 5.578684901188319e-07, + "loss": 0.665, + "step": 76831 + }, + { + "epoch": 1.97, + "learning_rate": 5.5784367126791e-07, + "loss": 0.5557, + "step": 76832 + }, + { + "epoch": 1.97, + "learning_rate": 5.578188527555265e-07, + "loss": 0.8174, + "step": 76833 + }, + { + "epoch": 1.97, + "learning_rate": 5.577940345817007e-07, + "loss": 0.4609, + "step": 76834 + }, + { + "epoch": 1.97, + "learning_rate": 5.577692167464517e-07, + "loss": 0.5557, + "step": 76835 + }, + { + "epoch": 1.97, + "learning_rate": 5.57744399249799e-07, + "loss": 0.752, + "step": 76836 + }, + { + "epoch": 1.97, + "learning_rate": 5.577195820917605e-07, + "loss": 0.6479, + "step": 76837 + }, + { + "epoch": 1.97, + "learning_rate": 5.576947652723559e-07, + "loss": 0.8135, + "step": 76838 + }, + { + "epoch": 1.97, + "learning_rate": 5.576699487916043e-07, + "loss": 0.6953, + "step": 76839 + }, + { + "epoch": 1.97, + "learning_rate": 5.576451326495243e-07, + "loss": 0.6729, + "step": 76840 + }, + { + "epoch": 1.97, + "learning_rate": 5.576203168461354e-07, + "loss": 0.6929, + "step": 76841 + }, + { + "epoch": 1.97, + "learning_rate": 5.575955013814559e-07, + "loss": 0.7471, + "step": 76842 + }, + { + "epoch": 1.97, + "learning_rate": 5.575706862555052e-07, + "loss": 0.7129, + "step": 76843 + }, + { + "epoch": 1.97, + "learning_rate": 5.575458714683021e-07, + "loss": 0.7314, + "step": 76844 + }, + { + "epoch": 1.97, + "learning_rate": 5.575210570198664e-07, + "loss": 0.6104, + "step": 76845 + }, + { + "epoch": 1.97, + "learning_rate": 5.57496242910216e-07, + "loss": 0.5918, + "step": 76846 + }, + { + "epoch": 1.97, + "learning_rate": 5.574714291393706e-07, + "loss": 0.748, + "step": 76847 + }, + { + "epoch": 1.97, + "learning_rate": 5.574466157073485e-07, + "loss": 0.458, + "step": 76848 + }, + { + "epoch": 1.97, + "learning_rate": 5.574218026141704e-07, + "loss": 0.5032, + "step": 76849 + }, + { + "epoch": 1.97, + "learning_rate": 5.57396989859853e-07, + "loss": 0.5989, + "step": 76850 + }, + { + "epoch": 1.97, + "learning_rate": 5.573721774444165e-07, + "loss": 0.7583, + "step": 76851 + }, + { + "epoch": 1.97, + "learning_rate": 5.573473653678798e-07, + "loss": 0.6641, + "step": 76852 + }, + { + "epoch": 1.97, + "learning_rate": 5.573225536302623e-07, + "loss": 0.7002, + "step": 76853 + }, + { + "epoch": 1.97, + "learning_rate": 5.572977422315821e-07, + "loss": 0.6533, + "step": 76854 + }, + { + "epoch": 1.97, + "learning_rate": 5.572729311718586e-07, + "loss": 0.5601, + "step": 76855 + }, + { + "epoch": 1.97, + "learning_rate": 5.572481204511109e-07, + "loss": 0.6562, + "step": 76856 + }, + { + "epoch": 1.97, + "learning_rate": 5.572233100693584e-07, + "loss": 0.6387, + "step": 76857 + }, + { + "epoch": 1.97, + "learning_rate": 5.571985000266193e-07, + "loss": 0.5981, + "step": 76858 + }, + { + "epoch": 1.97, + "learning_rate": 5.571736903229132e-07, + "loss": 0.7109, + "step": 76859 + }, + { + "epoch": 1.97, + "learning_rate": 5.571488809582585e-07, + "loss": 0.5977, + "step": 76860 + }, + { + "epoch": 1.97, + "learning_rate": 5.571240719326746e-07, + "loss": 0.5898, + "step": 76861 + }, + { + "epoch": 1.97, + "learning_rate": 5.570992632461808e-07, + "loss": 0.6597, + "step": 76862 + }, + { + "epoch": 1.97, + "learning_rate": 5.570744548987954e-07, + "loss": 0.5042, + "step": 76863 + }, + { + "epoch": 1.97, + "learning_rate": 5.570496468905375e-07, + "loss": 0.7598, + "step": 76864 + }, + { + "epoch": 1.97, + "learning_rate": 5.570248392214265e-07, + "loss": 0.7085, + "step": 76865 + }, + { + "epoch": 1.97, + "learning_rate": 5.570000318914816e-07, + "loss": 0.5933, + "step": 76866 + }, + { + "epoch": 1.97, + "learning_rate": 5.56975224900721e-07, + "loss": 0.4553, + "step": 76867 + }, + { + "epoch": 1.97, + "learning_rate": 5.569504182491641e-07, + "loss": 0.45, + "step": 76868 + }, + { + "epoch": 1.97, + "learning_rate": 5.569256119368302e-07, + "loss": 0.7461, + "step": 76869 + }, + { + "epoch": 1.97, + "learning_rate": 5.569008059637381e-07, + "loss": 0.583, + "step": 76870 + }, + { + "epoch": 1.97, + "learning_rate": 5.568760003299062e-07, + "loss": 0.7104, + "step": 76871 + }, + { + "epoch": 1.97, + "learning_rate": 5.56851195035354e-07, + "loss": 0.7607, + "step": 76872 + }, + { + "epoch": 1.97, + "learning_rate": 5.568263900801005e-07, + "loss": 0.5176, + "step": 76873 + }, + { + "epoch": 1.97, + "learning_rate": 5.56801585464165e-07, + "loss": 0.6875, + "step": 76874 + }, + { + "epoch": 1.97, + "learning_rate": 5.567767811875659e-07, + "loss": 0.5811, + "step": 76875 + }, + { + "epoch": 1.97, + "learning_rate": 5.567519772503221e-07, + "loss": 0.5874, + "step": 76876 + }, + { + "epoch": 1.97, + "learning_rate": 5.567271736524533e-07, + "loss": 0.5436, + "step": 76877 + }, + { + "epoch": 1.97, + "learning_rate": 5.567023703939783e-07, + "loss": 0.5388, + "step": 76878 + }, + { + "epoch": 1.97, + "learning_rate": 5.56677567474916e-07, + "loss": 0.5718, + "step": 76879 + }, + { + "epoch": 1.97, + "learning_rate": 5.56652764895285e-07, + "loss": 0.4988, + "step": 76880 + }, + { + "epoch": 1.97, + "learning_rate": 5.566279626551045e-07, + "loss": 0.5779, + "step": 76881 + }, + { + "epoch": 1.97, + "learning_rate": 5.566031607543935e-07, + "loss": 0.5996, + "step": 76882 + }, + { + "epoch": 1.97, + "learning_rate": 5.565783591931714e-07, + "loss": 0.7939, + "step": 76883 + }, + { + "epoch": 1.97, + "learning_rate": 5.565535579714567e-07, + "loss": 0.5198, + "step": 76884 + }, + { + "epoch": 1.97, + "learning_rate": 5.565287570892685e-07, + "loss": 0.7812, + "step": 76885 + }, + { + "epoch": 1.97, + "learning_rate": 5.565039565466261e-07, + "loss": 0.6963, + "step": 76886 + }, + { + "epoch": 1.97, + "learning_rate": 5.56479156343548e-07, + "loss": 0.3719, + "step": 76887 + }, + { + "epoch": 1.97, + "learning_rate": 5.564543564800533e-07, + "loss": 0.6489, + "step": 76888 + }, + { + "epoch": 1.97, + "learning_rate": 5.564295569561614e-07, + "loss": 0.793, + "step": 76889 + }, + { + "epoch": 1.97, + "learning_rate": 5.564047577718907e-07, + "loss": 0.6084, + "step": 76890 + }, + { + "epoch": 1.97, + "learning_rate": 5.56379958927261e-07, + "loss": 0.6494, + "step": 76891 + }, + { + "epoch": 1.97, + "learning_rate": 5.563551604222902e-07, + "loss": 0.5435, + "step": 76892 + }, + { + "epoch": 1.97, + "learning_rate": 5.563303622569979e-07, + "loss": 0.6479, + "step": 76893 + }, + { + "epoch": 1.97, + "learning_rate": 5.563055644314032e-07, + "loss": 0.6465, + "step": 76894 + }, + { + "epoch": 1.97, + "learning_rate": 5.562807669455252e-07, + "loss": 0.6084, + "step": 76895 + }, + { + "epoch": 1.97, + "learning_rate": 5.562559697993821e-07, + "loss": 0.6111, + "step": 76896 + }, + { + "epoch": 1.97, + "learning_rate": 5.562311729929936e-07, + "loss": 0.5789, + "step": 76897 + }, + { + "epoch": 1.97, + "learning_rate": 5.562063765263783e-07, + "loss": 0.6484, + "step": 76898 + }, + { + "epoch": 1.97, + "learning_rate": 5.561815803995559e-07, + "loss": 0.7725, + "step": 76899 + }, + { + "epoch": 1.97, + "learning_rate": 5.561567846125448e-07, + "loss": 0.5596, + "step": 76900 + }, + { + "epoch": 1.97, + "learning_rate": 5.561319891653637e-07, + "loss": 0.6284, + "step": 76901 + }, + { + "epoch": 1.97, + "learning_rate": 5.561071940580318e-07, + "loss": 0.5615, + "step": 76902 + }, + { + "epoch": 1.97, + "learning_rate": 5.560823992905684e-07, + "loss": 0.5085, + "step": 76903 + }, + { + "epoch": 1.97, + "learning_rate": 5.560576048629925e-07, + "loss": 0.5342, + "step": 76904 + }, + { + "epoch": 1.97, + "learning_rate": 5.560328107753226e-07, + "loss": 0.6514, + "step": 76905 + }, + { + "epoch": 1.97, + "learning_rate": 5.560080170275779e-07, + "loss": 0.6904, + "step": 76906 + }, + { + "epoch": 1.97, + "learning_rate": 5.559832236197779e-07, + "loss": 0.6313, + "step": 76907 + }, + { + "epoch": 1.97, + "learning_rate": 5.559584305519407e-07, + "loss": 0.5269, + "step": 76908 + }, + { + "epoch": 1.97, + "learning_rate": 5.559336378240862e-07, + "loss": 0.5242, + "step": 76909 + }, + { + "epoch": 1.97, + "learning_rate": 5.559088454362324e-07, + "loss": 0.54, + "step": 76910 + }, + { + "epoch": 1.97, + "learning_rate": 5.558840533883987e-07, + "loss": 0.6299, + "step": 76911 + }, + { + "epoch": 1.97, + "learning_rate": 5.558592616806047e-07, + "loss": 0.5718, + "step": 76912 + }, + { + "epoch": 1.97, + "learning_rate": 5.558344703128684e-07, + "loss": 0.6665, + "step": 76913 + }, + { + "epoch": 1.97, + "learning_rate": 5.558096792852091e-07, + "loss": 0.7461, + "step": 76914 + }, + { + "epoch": 1.97, + "learning_rate": 5.557848885976462e-07, + "loss": 0.5552, + "step": 76915 + }, + { + "epoch": 1.97, + "learning_rate": 5.557600982501985e-07, + "loss": 0.6387, + "step": 76916 + }, + { + "epoch": 1.97, + "learning_rate": 5.557353082428846e-07, + "loss": 0.5342, + "step": 76917 + }, + { + "epoch": 1.97, + "learning_rate": 5.557105185757237e-07, + "loss": 0.6426, + "step": 76918 + }, + { + "epoch": 1.97, + "learning_rate": 5.556857292487353e-07, + "loss": 0.5, + "step": 76919 + }, + { + "epoch": 1.97, + "learning_rate": 5.556609402619374e-07, + "loss": 0.6453, + "step": 76920 + }, + { + "epoch": 1.97, + "learning_rate": 5.556361516153499e-07, + "loss": 0.4128, + "step": 76921 + }, + { + "epoch": 1.97, + "learning_rate": 5.55611363308991e-07, + "loss": 0.5352, + "step": 76922 + }, + { + "epoch": 1.97, + "learning_rate": 5.555865753428801e-07, + "loss": 0.7764, + "step": 76923 + }, + { + "epoch": 1.97, + "learning_rate": 5.555617877170365e-07, + "loss": 0.4731, + "step": 76924 + }, + { + "epoch": 1.97, + "learning_rate": 5.555370004314784e-07, + "loss": 0.6191, + "step": 76925 + }, + { + "epoch": 1.97, + "learning_rate": 5.555122134862251e-07, + "loss": 0.71, + "step": 76926 + }, + { + "epoch": 1.97, + "learning_rate": 5.554874268812957e-07, + "loss": 0.6392, + "step": 76927 + }, + { + "epoch": 1.97, + "learning_rate": 5.554626406167096e-07, + "loss": 0.668, + "step": 76928 + }, + { + "epoch": 1.97, + "learning_rate": 5.554378546924853e-07, + "loss": 0.7988, + "step": 76929 + }, + { + "epoch": 1.97, + "learning_rate": 5.554130691086414e-07, + "loss": 0.6465, + "step": 76930 + }, + { + "epoch": 1.97, + "learning_rate": 5.553882838651972e-07, + "loss": 0.3818, + "step": 76931 + }, + { + "epoch": 1.97, + "learning_rate": 5.553634989621718e-07, + "loss": 0.6958, + "step": 76932 + }, + { + "epoch": 1.97, + "learning_rate": 5.553387143995844e-07, + "loss": 0.6421, + "step": 76933 + }, + { + "epoch": 1.97, + "learning_rate": 5.553139301774534e-07, + "loss": 0.6943, + "step": 76934 + }, + { + "epoch": 1.97, + "learning_rate": 5.552891462957981e-07, + "loss": 0.481, + "step": 76935 + }, + { + "epoch": 1.97, + "learning_rate": 5.552643627546375e-07, + "loss": 0.7432, + "step": 76936 + }, + { + "epoch": 1.97, + "learning_rate": 5.552395795539908e-07, + "loss": 0.4428, + "step": 76937 + }, + { + "epoch": 1.97, + "learning_rate": 5.552147966938765e-07, + "loss": 0.5747, + "step": 76938 + }, + { + "epoch": 1.97, + "learning_rate": 5.55190014174314e-07, + "loss": 0.6572, + "step": 76939 + }, + { + "epoch": 1.97, + "learning_rate": 5.551652319953217e-07, + "loss": 0.7666, + "step": 76940 + }, + { + "epoch": 1.97, + "learning_rate": 5.551404501569193e-07, + "loss": 0.6147, + "step": 76941 + }, + { + "epoch": 1.97, + "learning_rate": 5.551156686591251e-07, + "loss": 0.6094, + "step": 76942 + }, + { + "epoch": 1.97, + "learning_rate": 5.550908875019583e-07, + "loss": 0.6436, + "step": 76943 + }, + { + "epoch": 1.97, + "learning_rate": 5.550661066854379e-07, + "loss": 0.5479, + "step": 76944 + }, + { + "epoch": 1.97, + "learning_rate": 5.550413262095834e-07, + "loss": 0.6426, + "step": 76945 + }, + { + "epoch": 1.97, + "learning_rate": 5.55016546074413e-07, + "loss": 0.665, + "step": 76946 + }, + { + "epoch": 1.97, + "learning_rate": 5.549917662799457e-07, + "loss": 0.7109, + "step": 76947 + }, + { + "epoch": 1.97, + "learning_rate": 5.549669868262009e-07, + "loss": 0.4946, + "step": 76948 + }, + { + "epoch": 1.97, + "learning_rate": 5.549422077131978e-07, + "loss": 0.5474, + "step": 76949 + }, + { + "epoch": 1.97, + "learning_rate": 5.54917428940955e-07, + "loss": 0.5811, + "step": 76950 + }, + { + "epoch": 1.97, + "learning_rate": 5.54892650509491e-07, + "loss": 0.6504, + "step": 76951 + }, + { + "epoch": 1.97, + "learning_rate": 5.548678724188254e-07, + "loss": 0.6709, + "step": 76952 + }, + { + "epoch": 1.97, + "learning_rate": 5.548430946689768e-07, + "loss": 0.3877, + "step": 76953 + }, + { + "epoch": 1.97, + "learning_rate": 5.548183172599648e-07, + "loss": 0.6953, + "step": 76954 + }, + { + "epoch": 1.97, + "learning_rate": 5.547935401918077e-07, + "loss": 0.4966, + "step": 76955 + }, + { + "epoch": 1.97, + "learning_rate": 5.547687634645246e-07, + "loss": 0.6504, + "step": 76956 + }, + { + "epoch": 1.97, + "learning_rate": 5.547439870781345e-07, + "loss": 0.6982, + "step": 76957 + }, + { + "epoch": 1.97, + "learning_rate": 5.54719211032657e-07, + "loss": 0.5251, + "step": 76958 + }, + { + "epoch": 1.97, + "learning_rate": 5.546944353281106e-07, + "loss": 0.6113, + "step": 76959 + }, + { + "epoch": 1.97, + "learning_rate": 5.546696599645137e-07, + "loss": 0.6357, + "step": 76960 + }, + { + "epoch": 1.97, + "learning_rate": 5.546448849418856e-07, + "loss": 0.7627, + "step": 76961 + }, + { + "epoch": 1.97, + "learning_rate": 5.546201102602461e-07, + "loss": 0.6572, + "step": 76962 + }, + { + "epoch": 1.97, + "learning_rate": 5.545953359196129e-07, + "loss": 0.7422, + "step": 76963 + }, + { + "epoch": 1.97, + "learning_rate": 5.545705619200056e-07, + "loss": 0.4785, + "step": 76964 + }, + { + "epoch": 1.97, + "learning_rate": 5.545457882614433e-07, + "loss": 0.521, + "step": 76965 + }, + { + "epoch": 1.97, + "learning_rate": 5.54521014943945e-07, + "loss": 0.7373, + "step": 76966 + }, + { + "epoch": 1.97, + "learning_rate": 5.544962419675292e-07, + "loss": 0.5654, + "step": 76967 + }, + { + "epoch": 1.97, + "learning_rate": 5.544714693322152e-07, + "loss": 0.5615, + "step": 76968 + }, + { + "epoch": 1.97, + "learning_rate": 5.544466970380222e-07, + "loss": 0.6035, + "step": 76969 + }, + { + "epoch": 1.97, + "learning_rate": 5.544219250849685e-07, + "loss": 0.6191, + "step": 76970 + }, + { + "epoch": 1.97, + "learning_rate": 5.543971534730738e-07, + "loss": 0.7051, + "step": 76971 + }, + { + "epoch": 1.97, + "learning_rate": 5.543723822023564e-07, + "loss": 0.7295, + "step": 76972 + }, + { + "epoch": 1.97, + "learning_rate": 5.543476112728356e-07, + "loss": 0.8623, + "step": 76973 + }, + { + "epoch": 1.97, + "learning_rate": 5.543228406845302e-07, + "loss": 0.6689, + "step": 76974 + }, + { + "epoch": 1.97, + "learning_rate": 5.542980704374598e-07, + "loss": 0.623, + "step": 76975 + }, + { + "epoch": 1.97, + "learning_rate": 5.542733005316424e-07, + "loss": 0.6758, + "step": 76976 + }, + { + "epoch": 1.97, + "learning_rate": 5.542485309670974e-07, + "loss": 0.7666, + "step": 76977 + }, + { + "epoch": 1.97, + "learning_rate": 5.542237617438445e-07, + "loss": 0.5957, + "step": 76978 + }, + { + "epoch": 1.97, + "learning_rate": 5.541989928619017e-07, + "loss": 0.5566, + "step": 76979 + }, + { + "epoch": 1.97, + "learning_rate": 5.541742243212879e-07, + "loss": 0.6924, + "step": 76980 + }, + { + "epoch": 1.97, + "learning_rate": 5.541494561220224e-07, + "loss": 0.5718, + "step": 76981 + }, + { + "epoch": 1.97, + "learning_rate": 5.541246882641241e-07, + "loss": 0.5312, + "step": 76982 + }, + { + "epoch": 1.97, + "learning_rate": 5.540999207476125e-07, + "loss": 0.3888, + "step": 76983 + }, + { + "epoch": 1.97, + "learning_rate": 5.540751535725056e-07, + "loss": 0.4756, + "step": 76984 + }, + { + "epoch": 1.97, + "learning_rate": 5.54050386738823e-07, + "loss": 0.6978, + "step": 76985 + }, + { + "epoch": 1.97, + "learning_rate": 5.540256202465833e-07, + "loss": 0.2551, + "step": 76986 + }, + { + "epoch": 1.97, + "learning_rate": 5.540008540958063e-07, + "loss": 0.6392, + "step": 76987 + }, + { + "epoch": 1.97, + "learning_rate": 5.539760882865098e-07, + "loss": 0.6753, + "step": 76988 + }, + { + "epoch": 1.97, + "learning_rate": 5.539513228187138e-07, + "loss": 0.5372, + "step": 76989 + }, + { + "epoch": 1.97, + "learning_rate": 5.539265576924363e-07, + "loss": 0.6387, + "step": 76990 + }, + { + "epoch": 1.97, + "learning_rate": 5.539017929076968e-07, + "loss": 0.525, + "step": 76991 + }, + { + "epoch": 1.97, + "learning_rate": 5.538770284645145e-07, + "loss": 0.667, + "step": 76992 + }, + { + "epoch": 1.97, + "learning_rate": 5.538522643629077e-07, + "loss": 0.6787, + "step": 76993 + }, + { + "epoch": 1.97, + "learning_rate": 5.538275006028956e-07, + "loss": 0.5654, + "step": 76994 + }, + { + "epoch": 1.97, + "learning_rate": 5.538027371844977e-07, + "loss": 0.6377, + "step": 76995 + }, + { + "epoch": 1.97, + "learning_rate": 5.537779741077324e-07, + "loss": 0.5723, + "step": 76996 + }, + { + "epoch": 1.97, + "learning_rate": 5.537532113726185e-07, + "loss": 0.5981, + "step": 76997 + }, + { + "epoch": 1.97, + "learning_rate": 5.537284489791752e-07, + "loss": 0.6074, + "step": 76998 + }, + { + "epoch": 1.97, + "learning_rate": 5.537036869274221e-07, + "loss": 0.6521, + "step": 76999 + }, + { + "epoch": 1.97, + "learning_rate": 5.536789252173774e-07, + "loss": 0.4858, + "step": 77000 + }, + { + "epoch": 1.97, + "learning_rate": 5.5365416384906e-07, + "loss": 0.4443, + "step": 77001 + }, + { + "epoch": 1.97, + "learning_rate": 5.536294028224889e-07, + "loss": 0.6035, + "step": 77002 + }, + { + "epoch": 1.97, + "learning_rate": 5.536046421376833e-07, + "loss": 0.7705, + "step": 77003 + }, + { + "epoch": 1.97, + "learning_rate": 5.535798817946625e-07, + "loss": 0.6133, + "step": 77004 + }, + { + "epoch": 1.97, + "learning_rate": 5.535551217934447e-07, + "loss": 0.7012, + "step": 77005 + }, + { + "epoch": 1.97, + "learning_rate": 5.535303621340492e-07, + "loss": 0.6309, + "step": 77006 + }, + { + "epoch": 1.97, + "learning_rate": 5.53505602816495e-07, + "loss": 0.7944, + "step": 77007 + }, + { + "epoch": 1.97, + "learning_rate": 5.534808438408014e-07, + "loss": 0.7002, + "step": 77008 + }, + { + "epoch": 1.97, + "learning_rate": 5.534560852069869e-07, + "loss": 0.6943, + "step": 77009 + }, + { + "epoch": 1.97, + "learning_rate": 5.534313269150703e-07, + "loss": 0.6509, + "step": 77010 + }, + { + "epoch": 1.97, + "learning_rate": 5.534065689650708e-07, + "loss": 0.7949, + "step": 77011 + }, + { + "epoch": 1.97, + "learning_rate": 5.533818113570077e-07, + "loss": 0.5728, + "step": 77012 + }, + { + "epoch": 1.97, + "learning_rate": 5.533570540908992e-07, + "loss": 0.7207, + "step": 77013 + }, + { + "epoch": 1.97, + "learning_rate": 5.533322971667646e-07, + "loss": 0.7764, + "step": 77014 + }, + { + "epoch": 1.97, + "learning_rate": 5.533075405846231e-07, + "loss": 0.6572, + "step": 77015 + }, + { + "epoch": 1.97, + "learning_rate": 5.532827843444936e-07, + "loss": 0.6846, + "step": 77016 + }, + { + "epoch": 1.97, + "learning_rate": 5.532580284463947e-07, + "loss": 0.6182, + "step": 77017 + }, + { + "epoch": 1.97, + "learning_rate": 5.532332728903456e-07, + "loss": 0.6431, + "step": 77018 + }, + { + "epoch": 1.97, + "learning_rate": 5.532085176763657e-07, + "loss": 0.5869, + "step": 77019 + }, + { + "epoch": 1.97, + "learning_rate": 5.531837628044728e-07, + "loss": 0.4917, + "step": 77020 + }, + { + "epoch": 1.97, + "learning_rate": 5.531590082746873e-07, + "loss": 0.5366, + "step": 77021 + }, + { + "epoch": 1.97, + "learning_rate": 5.531342540870267e-07, + "loss": 0.5227, + "step": 77022 + }, + { + "epoch": 1.97, + "learning_rate": 5.531095002415109e-07, + "loss": 0.6436, + "step": 77023 + }, + { + "epoch": 1.97, + "learning_rate": 5.530847467381585e-07, + "loss": 0.5994, + "step": 77024 + }, + { + "epoch": 1.97, + "learning_rate": 5.530599935769891e-07, + "loss": 0.4883, + "step": 77025 + }, + { + "epoch": 1.97, + "learning_rate": 5.530352407580206e-07, + "loss": 0.6738, + "step": 77026 + }, + { + "epoch": 1.97, + "learning_rate": 5.530104882812724e-07, + "loss": 0.5015, + "step": 77027 + }, + { + "epoch": 1.97, + "learning_rate": 5.529857361467636e-07, + "loss": 0.6228, + "step": 77028 + }, + { + "epoch": 1.97, + "learning_rate": 5.529609843545137e-07, + "loss": 0.6943, + "step": 77029 + }, + { + "epoch": 1.97, + "learning_rate": 5.529362329045404e-07, + "loss": 0.6206, + "step": 77030 + }, + { + "epoch": 1.97, + "learning_rate": 5.529114817968632e-07, + "loss": 0.7109, + "step": 77031 + }, + { + "epoch": 1.97, + "learning_rate": 5.528867310315013e-07, + "loss": 0.6035, + "step": 77032 + }, + { + "epoch": 1.97, + "learning_rate": 5.528619806084737e-07, + "loss": 0.6953, + "step": 77033 + }, + { + "epoch": 1.97, + "learning_rate": 5.528372305277986e-07, + "loss": 0.7007, + "step": 77034 + }, + { + "epoch": 1.97, + "learning_rate": 5.528124807894957e-07, + "loss": 0.6621, + "step": 77035 + }, + { + "epoch": 1.97, + "learning_rate": 5.527877313935836e-07, + "loss": 0.3552, + "step": 77036 + }, + { + "epoch": 1.97, + "learning_rate": 5.527629823400819e-07, + "loss": 0.6396, + "step": 77037 + }, + { + "epoch": 1.97, + "learning_rate": 5.527382336290085e-07, + "loss": 0.5215, + "step": 77038 + }, + { + "epoch": 1.97, + "learning_rate": 5.527134852603832e-07, + "loss": 0.5703, + "step": 77039 + }, + { + "epoch": 1.97, + "learning_rate": 5.526887372342243e-07, + "loss": 0.5386, + "step": 77040 + }, + { + "epoch": 1.97, + "learning_rate": 5.526639895505511e-07, + "loss": 0.5911, + "step": 77041 + }, + { + "epoch": 1.97, + "learning_rate": 5.52639242209383e-07, + "loss": 0.7334, + "step": 77042 + }, + { + "epoch": 1.97, + "learning_rate": 5.526144952107378e-07, + "loss": 0.519, + "step": 77043 + }, + { + "epoch": 1.97, + "learning_rate": 5.525897485546354e-07, + "loss": 0.5273, + "step": 77044 + }, + { + "epoch": 1.97, + "learning_rate": 5.525650022410943e-07, + "loss": 0.9131, + "step": 77045 + }, + { + "epoch": 1.97, + "learning_rate": 5.52540256270134e-07, + "loss": 0.6465, + "step": 77046 + }, + { + "epoch": 1.97, + "learning_rate": 5.525155106417727e-07, + "loss": 0.4917, + "step": 77047 + }, + { + "epoch": 1.97, + "learning_rate": 5.524907653560297e-07, + "loss": 0.6777, + "step": 77048 + }, + { + "epoch": 1.97, + "learning_rate": 5.524660204129243e-07, + "loss": 0.5942, + "step": 77049 + }, + { + "epoch": 1.97, + "learning_rate": 5.52441275812475e-07, + "loss": 0.7041, + "step": 77050 + }, + { + "epoch": 1.97, + "learning_rate": 5.524165315547007e-07, + "loss": 0.6748, + "step": 77051 + }, + { + "epoch": 1.97, + "learning_rate": 5.523917876396203e-07, + "loss": 0.6562, + "step": 77052 + }, + { + "epoch": 1.97, + "learning_rate": 5.523670440672529e-07, + "loss": 0.8428, + "step": 77053 + }, + { + "epoch": 1.97, + "learning_rate": 5.523423008376179e-07, + "loss": 0.7158, + "step": 77054 + }, + { + "epoch": 1.97, + "learning_rate": 5.523175579507334e-07, + "loss": 0.6919, + "step": 77055 + }, + { + "epoch": 1.97, + "learning_rate": 5.522928154066189e-07, + "loss": 0.5325, + "step": 77056 + }, + { + "epoch": 1.98, + "learning_rate": 5.522680732052932e-07, + "loss": 0.6387, + "step": 77057 + }, + { + "epoch": 1.98, + "learning_rate": 5.522433313467753e-07, + "loss": 0.5669, + "step": 77058 + }, + { + "epoch": 1.98, + "learning_rate": 5.522185898310844e-07, + "loss": 0.668, + "step": 77059 + }, + { + "epoch": 1.98, + "learning_rate": 5.521938486582387e-07, + "loss": 0.6387, + "step": 77060 + }, + { + "epoch": 1.98, + "learning_rate": 5.521691078282576e-07, + "loss": 0.5737, + "step": 77061 + }, + { + "epoch": 1.98, + "learning_rate": 5.5214436734116e-07, + "loss": 0.5684, + "step": 77062 + }, + { + "epoch": 1.98, + "learning_rate": 5.521196271969653e-07, + "loss": 0.834, + "step": 77063 + }, + { + "epoch": 1.98, + "learning_rate": 5.520948873956914e-07, + "loss": 0.5713, + "step": 77064 + }, + { + "epoch": 1.98, + "learning_rate": 5.520701479373582e-07, + "loss": 0.6938, + "step": 77065 + }, + { + "epoch": 1.98, + "learning_rate": 5.52045408821984e-07, + "loss": 0.5295, + "step": 77066 + }, + { + "epoch": 1.98, + "learning_rate": 5.520206700495885e-07, + "loss": 0.5789, + "step": 77067 + }, + { + "epoch": 1.98, + "learning_rate": 5.519959316201898e-07, + "loss": 0.6035, + "step": 77068 + }, + { + "epoch": 1.98, + "learning_rate": 5.519711935338077e-07, + "loss": 0.625, + "step": 77069 + }, + { + "epoch": 1.98, + "learning_rate": 5.519464557904601e-07, + "loss": 0.615, + "step": 77070 + }, + { + "epoch": 1.98, + "learning_rate": 5.51921718390167e-07, + "loss": 0.5249, + "step": 77071 + }, + { + "epoch": 1.98, + "learning_rate": 5.518969813329463e-07, + "loss": 0.6865, + "step": 77072 + }, + { + "epoch": 1.98, + "learning_rate": 5.518722446188178e-07, + "loss": 0.7578, + "step": 77073 + }, + { + "epoch": 1.98, + "learning_rate": 5.518475082477998e-07, + "loss": 0.3537, + "step": 77074 + }, + { + "epoch": 1.98, + "learning_rate": 5.518227722199121e-07, + "loss": 0.5996, + "step": 77075 + }, + { + "epoch": 1.98, + "learning_rate": 5.517980365351727e-07, + "loss": 0.6533, + "step": 77076 + }, + { + "epoch": 1.98, + "learning_rate": 5.517733011936008e-07, + "loss": 0.5376, + "step": 77077 + }, + { + "epoch": 1.98, + "learning_rate": 5.517485661952156e-07, + "loss": 0.5142, + "step": 77078 + }, + { + "epoch": 1.98, + "learning_rate": 5.517238315400363e-07, + "loss": 0.5737, + "step": 77079 + }, + { + "epoch": 1.98, + "learning_rate": 5.516990972280814e-07, + "loss": 0.2742, + "step": 77080 + }, + { + "epoch": 1.98, + "learning_rate": 5.516743632593694e-07, + "loss": 0.6924, + "step": 77081 + }, + { + "epoch": 1.98, + "learning_rate": 5.5164962963392e-07, + "loss": 0.6641, + "step": 77082 + }, + { + "epoch": 1.98, + "learning_rate": 5.516248963517515e-07, + "loss": 0.7725, + "step": 77083 + }, + { + "epoch": 1.98, + "learning_rate": 5.51600163412884e-07, + "loss": 0.6636, + "step": 77084 + }, + { + "epoch": 1.98, + "learning_rate": 5.515754308173351e-07, + "loss": 0.6338, + "step": 77085 + }, + { + "epoch": 1.98, + "learning_rate": 5.515506985651241e-07, + "loss": 0.6235, + "step": 77086 + }, + { + "epoch": 1.98, + "learning_rate": 5.515259666562706e-07, + "loss": 0.5854, + "step": 77087 + }, + { + "epoch": 1.98, + "learning_rate": 5.515012350907926e-07, + "loss": 0.5981, + "step": 77088 + }, + { + "epoch": 1.98, + "learning_rate": 5.5147650386871e-07, + "loss": 0.6416, + "step": 77089 + }, + { + "epoch": 1.98, + "learning_rate": 5.514517729900408e-07, + "loss": 0.5267, + "step": 77090 + }, + { + "epoch": 1.98, + "learning_rate": 5.514270424548044e-07, + "loss": 0.6255, + "step": 77091 + }, + { + "epoch": 1.98, + "learning_rate": 5.514023122630199e-07, + "loss": 0.6206, + "step": 77092 + }, + { + "epoch": 1.98, + "learning_rate": 5.513775824147058e-07, + "loss": 0.6245, + "step": 77093 + }, + { + "epoch": 1.98, + "learning_rate": 5.513528529098812e-07, + "loss": 0.6465, + "step": 77094 + }, + { + "epoch": 1.98, + "learning_rate": 5.51328123748565e-07, + "loss": 0.6904, + "step": 77095 + }, + { + "epoch": 1.98, + "learning_rate": 5.513033949307767e-07, + "loss": 0.6357, + "step": 77096 + }, + { + "epoch": 1.98, + "learning_rate": 5.512786664565343e-07, + "loss": 0.665, + "step": 77097 + }, + { + "epoch": 1.98, + "learning_rate": 5.512539383258574e-07, + "loss": 0.5625, + "step": 77098 + }, + { + "epoch": 1.98, + "learning_rate": 5.512292105387649e-07, + "loss": 0.5713, + "step": 77099 + }, + { + "epoch": 1.98, + "learning_rate": 5.512044830952753e-07, + "loss": 0.6641, + "step": 77100 + }, + { + "epoch": 1.98, + "learning_rate": 5.511797559954081e-07, + "loss": 0.4601, + "step": 77101 + }, + { + "epoch": 1.98, + "learning_rate": 5.511550292391816e-07, + "loss": 0.6196, + "step": 77102 + }, + { + "epoch": 1.98, + "learning_rate": 5.51130302826615e-07, + "loss": 0.5566, + "step": 77103 + }, + { + "epoch": 1.98, + "learning_rate": 5.511055767577277e-07, + "loss": 0.6934, + "step": 77104 + }, + { + "epoch": 1.98, + "learning_rate": 5.510808510325378e-07, + "loss": 0.6201, + "step": 77105 + }, + { + "epoch": 1.98, + "learning_rate": 5.510561256510647e-07, + "loss": 0.7305, + "step": 77106 + }, + { + "epoch": 1.98, + "learning_rate": 5.510314006133272e-07, + "loss": 0.5735, + "step": 77107 + }, + { + "epoch": 1.98, + "learning_rate": 5.510066759193447e-07, + "loss": 0.4673, + "step": 77108 + }, + { + "epoch": 1.98, + "learning_rate": 5.509819515691359e-07, + "loss": 0.6543, + "step": 77109 + }, + { + "epoch": 1.98, + "learning_rate": 5.50957227562719e-07, + "loss": 0.6289, + "step": 77110 + }, + { + "epoch": 1.98, + "learning_rate": 5.509325039001136e-07, + "loss": 0.5212, + "step": 77111 + }, + { + "epoch": 1.98, + "learning_rate": 5.509077805813385e-07, + "loss": 0.5913, + "step": 77112 + }, + { + "epoch": 1.98, + "learning_rate": 5.508830576064131e-07, + "loss": 0.6709, + "step": 77113 + }, + { + "epoch": 1.98, + "learning_rate": 5.508583349753555e-07, + "loss": 0.7549, + "step": 77114 + }, + { + "epoch": 1.98, + "learning_rate": 5.50833612688185e-07, + "loss": 0.582, + "step": 77115 + }, + { + "epoch": 1.98, + "learning_rate": 5.508088907449204e-07, + "loss": 0.6758, + "step": 77116 + }, + { + "epoch": 1.98, + "learning_rate": 5.507841691455815e-07, + "loss": 0.7539, + "step": 77117 + }, + { + "epoch": 1.98, + "learning_rate": 5.507594478901858e-07, + "loss": 0.3563, + "step": 77118 + }, + { + "epoch": 1.98, + "learning_rate": 5.507347269787534e-07, + "loss": 0.7012, + "step": 77119 + }, + { + "epoch": 1.98, + "learning_rate": 5.507100064113025e-07, + "loss": 0.4678, + "step": 77120 + }, + { + "epoch": 1.98, + "learning_rate": 5.506852861878526e-07, + "loss": 0.397, + "step": 77121 + }, + { + "epoch": 1.98, + "learning_rate": 5.506605663084219e-07, + "loss": 0.7407, + "step": 77122 + }, + { + "epoch": 1.98, + "learning_rate": 5.506358467730299e-07, + "loss": 0.6953, + "step": 77123 + }, + { + "epoch": 1.98, + "learning_rate": 5.506111275816951e-07, + "loss": 0.7568, + "step": 77124 + }, + { + "epoch": 1.98, + "learning_rate": 5.505864087344373e-07, + "loss": 0.5464, + "step": 77125 + }, + { + "epoch": 1.98, + "learning_rate": 5.505616902312743e-07, + "loss": 0.6758, + "step": 77126 + }, + { + "epoch": 1.98, + "learning_rate": 5.505369720722257e-07, + "loss": 0.6108, + "step": 77127 + }, + { + "epoch": 1.98, + "learning_rate": 5.505122542573102e-07, + "loss": 0.7305, + "step": 77128 + }, + { + "epoch": 1.98, + "learning_rate": 5.504875367865471e-07, + "loss": 0.7432, + "step": 77129 + }, + { + "epoch": 1.98, + "learning_rate": 5.50462819659955e-07, + "loss": 0.6895, + "step": 77130 + }, + { + "epoch": 1.98, + "learning_rate": 5.504381028775527e-07, + "loss": 0.6514, + "step": 77131 + }, + { + "epoch": 1.98, + "learning_rate": 5.50413386439359e-07, + "loss": 0.6279, + "step": 77132 + }, + { + "epoch": 1.98, + "learning_rate": 5.503886703453933e-07, + "loss": 0.5259, + "step": 77133 + }, + { + "epoch": 1.98, + "learning_rate": 5.503639545956746e-07, + "loss": 0.4927, + "step": 77134 + }, + { + "epoch": 1.98, + "learning_rate": 5.503392391902211e-07, + "loss": 0.6104, + "step": 77135 + }, + { + "epoch": 1.98, + "learning_rate": 5.503145241290524e-07, + "loss": 0.7383, + "step": 77136 + }, + { + "epoch": 1.98, + "learning_rate": 5.50289809412187e-07, + "loss": 0.6978, + "step": 77137 + }, + { + "epoch": 1.98, + "learning_rate": 5.502650950396448e-07, + "loss": 0.6514, + "step": 77138 + }, + { + "epoch": 1.98, + "learning_rate": 5.502403810114433e-07, + "loss": 0.7422, + "step": 77139 + }, + { + "epoch": 1.98, + "learning_rate": 5.50215667327602e-07, + "loss": 0.6777, + "step": 77140 + }, + { + "epoch": 1.98, + "learning_rate": 5.501909539881398e-07, + "loss": 0.6333, + "step": 77141 + }, + { + "epoch": 1.98, + "learning_rate": 5.501662409930761e-07, + "loss": 0.584, + "step": 77142 + }, + { + "epoch": 1.98, + "learning_rate": 5.501415283424291e-07, + "loss": 0.5605, + "step": 77143 + }, + { + "epoch": 1.98, + "learning_rate": 5.501168160362179e-07, + "loss": 0.5718, + "step": 77144 + }, + { + "epoch": 1.98, + "learning_rate": 5.500921040744617e-07, + "loss": 0.8623, + "step": 77145 + }, + { + "epoch": 1.98, + "learning_rate": 5.500673924571797e-07, + "loss": 0.7217, + "step": 77146 + }, + { + "epoch": 1.98, + "learning_rate": 5.5004268118439e-07, + "loss": 0.5684, + "step": 77147 + }, + { + "epoch": 1.98, + "learning_rate": 5.500179702561123e-07, + "loss": 0.709, + "step": 77148 + }, + { + "epoch": 1.98, + "learning_rate": 5.499932596723647e-07, + "loss": 0.7695, + "step": 77149 + }, + { + "epoch": 1.98, + "learning_rate": 5.499685494331667e-07, + "loss": 0.7148, + "step": 77150 + }, + { + "epoch": 1.98, + "learning_rate": 5.499438395385374e-07, + "loss": 0.7236, + "step": 77151 + }, + { + "epoch": 1.98, + "learning_rate": 5.499191299884951e-07, + "loss": 0.7656, + "step": 77152 + }, + { + "epoch": 1.98, + "learning_rate": 5.498944207830589e-07, + "loss": 0.7217, + "step": 77153 + }, + { + "epoch": 1.98, + "learning_rate": 5.498697119222479e-07, + "loss": 0.6143, + "step": 77154 + }, + { + "epoch": 1.98, + "learning_rate": 5.498450034060814e-07, + "loss": 0.5962, + "step": 77155 + }, + { + "epoch": 1.98, + "learning_rate": 5.498202952345774e-07, + "loss": 0.7393, + "step": 77156 + }, + { + "epoch": 1.98, + "learning_rate": 5.497955874077553e-07, + "loss": 0.6816, + "step": 77157 + }, + { + "epoch": 1.98, + "learning_rate": 5.497708799256346e-07, + "loss": 0.5503, + "step": 77158 + }, + { + "epoch": 1.98, + "learning_rate": 5.497461727882334e-07, + "loss": 0.6887, + "step": 77159 + }, + { + "epoch": 1.98, + "learning_rate": 5.497214659955706e-07, + "loss": 0.6182, + "step": 77160 + }, + { + "epoch": 1.98, + "learning_rate": 5.496967595476654e-07, + "loss": 0.5029, + "step": 77161 + }, + { + "epoch": 1.98, + "learning_rate": 5.496720534445365e-07, + "loss": 0.603, + "step": 77162 + }, + { + "epoch": 1.98, + "learning_rate": 5.496473476862035e-07, + "loss": 0.6279, + "step": 77163 + }, + { + "epoch": 1.98, + "learning_rate": 5.496226422726844e-07, + "loss": 0.7422, + "step": 77164 + }, + { + "epoch": 1.98, + "learning_rate": 5.495979372039986e-07, + "loss": 0.6611, + "step": 77165 + }, + { + "epoch": 1.98, + "learning_rate": 5.49573232480165e-07, + "loss": 0.4907, + "step": 77166 + }, + { + "epoch": 1.98, + "learning_rate": 5.495485281012027e-07, + "loss": 0.6152, + "step": 77167 + }, + { + "epoch": 1.98, + "learning_rate": 5.495238240671304e-07, + "loss": 0.5903, + "step": 77168 + }, + { + "epoch": 1.98, + "learning_rate": 5.494991203779666e-07, + "loss": 0.5129, + "step": 77169 + }, + { + "epoch": 1.98, + "learning_rate": 5.494744170337307e-07, + "loss": 0.4463, + "step": 77170 + }, + { + "epoch": 1.98, + "learning_rate": 5.494497140344415e-07, + "loss": 0.3987, + "step": 77171 + }, + { + "epoch": 1.98, + "learning_rate": 5.494250113801183e-07, + "loss": 0.6484, + "step": 77172 + }, + { + "epoch": 1.98, + "learning_rate": 5.494003090707793e-07, + "loss": 0.7236, + "step": 77173 + }, + { + "epoch": 1.98, + "learning_rate": 5.493756071064437e-07, + "loss": 0.5713, + "step": 77174 + }, + { + "epoch": 1.98, + "learning_rate": 5.49350905487131e-07, + "loss": 0.5098, + "step": 77175 + }, + { + "epoch": 1.98, + "learning_rate": 5.49326204212859e-07, + "loss": 0.5698, + "step": 77176 + }, + { + "epoch": 1.98, + "learning_rate": 5.493015032836473e-07, + "loss": 0.6064, + "step": 77177 + }, + { + "epoch": 1.98, + "learning_rate": 5.492768026995152e-07, + "loss": 0.7168, + "step": 77178 + }, + { + "epoch": 1.98, + "learning_rate": 5.492521024604805e-07, + "loss": 0.6475, + "step": 77179 + }, + { + "epoch": 1.98, + "learning_rate": 5.492274025665633e-07, + "loss": 0.6196, + "step": 77180 + }, + { + "epoch": 1.98, + "learning_rate": 5.492027030177816e-07, + "loss": 0.6973, + "step": 77181 + }, + { + "epoch": 1.98, + "learning_rate": 5.491780038141547e-07, + "loss": 0.5511, + "step": 77182 + }, + { + "epoch": 1.98, + "learning_rate": 5.491533049557013e-07, + "loss": 0.6699, + "step": 77183 + }, + { + "epoch": 1.98, + "learning_rate": 5.49128606442441e-07, + "loss": 0.6045, + "step": 77184 + }, + { + "epoch": 1.98, + "learning_rate": 5.491039082743917e-07, + "loss": 0.5703, + "step": 77185 + }, + { + "epoch": 1.98, + "learning_rate": 5.490792104515729e-07, + "loss": 0.5801, + "step": 77186 + }, + { + "epoch": 1.98, + "learning_rate": 5.490545129740033e-07, + "loss": 0.5298, + "step": 77187 + }, + { + "epoch": 1.98, + "learning_rate": 5.490298158417024e-07, + "loss": 0.5967, + "step": 77188 + }, + { + "epoch": 1.98, + "learning_rate": 5.490051190546886e-07, + "loss": 0.5859, + "step": 77189 + }, + { + "epoch": 1.98, + "learning_rate": 5.489804226129805e-07, + "loss": 0.6299, + "step": 77190 + }, + { + "epoch": 1.98, + "learning_rate": 5.489557265165974e-07, + "loss": 0.7109, + "step": 77191 + }, + { + "epoch": 1.98, + "learning_rate": 5.489310307655584e-07, + "loss": 0.4836, + "step": 77192 + }, + { + "epoch": 1.98, + "learning_rate": 5.489063353598818e-07, + "loss": 0.6836, + "step": 77193 + }, + { + "epoch": 1.98, + "learning_rate": 5.48881640299587e-07, + "loss": 0.6348, + "step": 77194 + }, + { + "epoch": 1.98, + "learning_rate": 5.488569455846928e-07, + "loss": 0.7905, + "step": 77195 + }, + { + "epoch": 1.98, + "learning_rate": 5.488322512152184e-07, + "loss": 0.437, + "step": 77196 + }, + { + "epoch": 1.98, + "learning_rate": 5.488075571911818e-07, + "loss": 0.5488, + "step": 77197 + }, + { + "epoch": 1.98, + "learning_rate": 5.487828635126033e-07, + "loss": 0.626, + "step": 77198 + }, + { + "epoch": 1.98, + "learning_rate": 5.487581701795003e-07, + "loss": 0.575, + "step": 77199 + }, + { + "epoch": 1.98, + "learning_rate": 5.487334771918926e-07, + "loss": 0.6533, + "step": 77200 + }, + { + "epoch": 1.98, + "learning_rate": 5.487087845497993e-07, + "loss": 0.4927, + "step": 77201 + }, + { + "epoch": 1.98, + "learning_rate": 5.486840922532385e-07, + "loss": 0.6058, + "step": 77202 + }, + { + "epoch": 1.98, + "learning_rate": 5.486594003022295e-07, + "loss": 0.667, + "step": 77203 + }, + { + "epoch": 1.98, + "learning_rate": 5.486347086967913e-07, + "loss": 0.5737, + "step": 77204 + }, + { + "epoch": 1.98, + "learning_rate": 5.486100174369432e-07, + "loss": 0.573, + "step": 77205 + }, + { + "epoch": 1.98, + "learning_rate": 5.485853265227031e-07, + "loss": 0.7114, + "step": 77206 + }, + { + "epoch": 1.98, + "learning_rate": 5.485606359540907e-07, + "loss": 0.6396, + "step": 77207 + }, + { + "epoch": 1.98, + "learning_rate": 5.485359457311247e-07, + "loss": 0.6475, + "step": 77208 + }, + { + "epoch": 1.98, + "learning_rate": 5.485112558538243e-07, + "loss": 0.6958, + "step": 77209 + }, + { + "epoch": 1.98, + "learning_rate": 5.484865663222076e-07, + "loss": 0.5474, + "step": 77210 + }, + { + "epoch": 1.98, + "learning_rate": 5.484618771362939e-07, + "loss": 0.873, + "step": 77211 + }, + { + "epoch": 1.98, + "learning_rate": 5.484371882961022e-07, + "loss": 0.4346, + "step": 77212 + }, + { + "epoch": 1.98, + "learning_rate": 5.484124998016517e-07, + "loss": 0.7227, + "step": 77213 + }, + { + "epoch": 1.98, + "learning_rate": 5.483878116529608e-07, + "loss": 0.5977, + "step": 77214 + }, + { + "epoch": 1.98, + "learning_rate": 5.483631238500484e-07, + "loss": 0.5269, + "step": 77215 + }, + { + "epoch": 1.98, + "learning_rate": 5.483384363929336e-07, + "loss": 0.5432, + "step": 77216 + }, + { + "epoch": 1.98, + "learning_rate": 5.483137492816357e-07, + "loss": 0.5942, + "step": 77217 + }, + { + "epoch": 1.98, + "learning_rate": 5.482890625161733e-07, + "loss": 0.7549, + "step": 77218 + }, + { + "epoch": 1.98, + "learning_rate": 5.482643760965648e-07, + "loss": 0.4741, + "step": 77219 + }, + { + "epoch": 1.98, + "learning_rate": 5.482396900228294e-07, + "loss": 0.6309, + "step": 77220 + }, + { + "epoch": 1.98, + "learning_rate": 5.48215004294986e-07, + "loss": 0.6533, + "step": 77221 + }, + { + "epoch": 1.98, + "learning_rate": 5.481903189130542e-07, + "loss": 0.7275, + "step": 77222 + }, + { + "epoch": 1.98, + "learning_rate": 5.481656338770519e-07, + "loss": 0.5219, + "step": 77223 + }, + { + "epoch": 1.98, + "learning_rate": 5.481409491869982e-07, + "loss": 0.667, + "step": 77224 + }, + { + "epoch": 1.98, + "learning_rate": 5.481162648429123e-07, + "loss": 0.5431, + "step": 77225 + }, + { + "epoch": 1.98, + "learning_rate": 5.480915808448135e-07, + "loss": 0.5464, + "step": 77226 + }, + { + "epoch": 1.98, + "learning_rate": 5.480668971927196e-07, + "loss": 0.519, + "step": 77227 + }, + { + "epoch": 1.98, + "learning_rate": 5.480422138866507e-07, + "loss": 0.7197, + "step": 77228 + }, + { + "epoch": 1.98, + "learning_rate": 5.480175309266247e-07, + "loss": 0.4556, + "step": 77229 + }, + { + "epoch": 1.98, + "learning_rate": 5.47992848312661e-07, + "loss": 0.6416, + "step": 77230 + }, + { + "epoch": 1.98, + "learning_rate": 5.479681660447782e-07, + "loss": 0.7002, + "step": 77231 + }, + { + "epoch": 1.98, + "learning_rate": 5.479434841229954e-07, + "loss": 0.5225, + "step": 77232 + }, + { + "epoch": 1.98, + "learning_rate": 5.479188025473315e-07, + "loss": 0.7949, + "step": 77233 + }, + { + "epoch": 1.98, + "learning_rate": 5.478941213178057e-07, + "loss": 0.7051, + "step": 77234 + }, + { + "epoch": 1.98, + "learning_rate": 5.478694404344363e-07, + "loss": 0.5889, + "step": 77235 + }, + { + "epoch": 1.98, + "learning_rate": 5.478447598972424e-07, + "loss": 0.5239, + "step": 77236 + }, + { + "epoch": 1.98, + "learning_rate": 5.47820079706243e-07, + "loss": 0.4941, + "step": 77237 + }, + { + "epoch": 1.98, + "learning_rate": 5.477953998614573e-07, + "loss": 0.4749, + "step": 77238 + }, + { + "epoch": 1.98, + "learning_rate": 5.477707203629039e-07, + "loss": 0.6484, + "step": 77239 + }, + { + "epoch": 1.98, + "learning_rate": 5.477460412106014e-07, + "loss": 0.615, + "step": 77240 + }, + { + "epoch": 1.98, + "learning_rate": 5.477213624045689e-07, + "loss": 0.6523, + "step": 77241 + }, + { + "epoch": 1.98, + "learning_rate": 5.476966839448252e-07, + "loss": 0.6406, + "step": 77242 + }, + { + "epoch": 1.98, + "learning_rate": 5.4767200583139e-07, + "loss": 0.666, + "step": 77243 + }, + { + "epoch": 1.98, + "learning_rate": 5.476473280642809e-07, + "loss": 0.3945, + "step": 77244 + }, + { + "epoch": 1.98, + "learning_rate": 5.476226506435176e-07, + "loss": 0.522, + "step": 77245 + }, + { + "epoch": 1.98, + "learning_rate": 5.475979735691187e-07, + "loss": 0.9072, + "step": 77246 + }, + { + "epoch": 1.98, + "learning_rate": 5.475732968411038e-07, + "loss": 0.6826, + "step": 77247 + }, + { + "epoch": 1.98, + "learning_rate": 5.475486204594912e-07, + "loss": 0.6602, + "step": 77248 + }, + { + "epoch": 1.98, + "learning_rate": 5.475239444242993e-07, + "loss": 0.4819, + "step": 77249 + }, + { + "epoch": 1.98, + "learning_rate": 5.474992687355476e-07, + "loss": 0.7246, + "step": 77250 + }, + { + "epoch": 1.98, + "learning_rate": 5.474745933932552e-07, + "loss": 0.511, + "step": 77251 + }, + { + "epoch": 1.98, + "learning_rate": 5.474499183974404e-07, + "loss": 0.751, + "step": 77252 + }, + { + "epoch": 1.98, + "learning_rate": 5.474252437481224e-07, + "loss": 0.6587, + "step": 77253 + }, + { + "epoch": 1.98, + "learning_rate": 5.474005694453199e-07, + "loss": 0.7104, + "step": 77254 + }, + { + "epoch": 1.98, + "learning_rate": 5.473758954890526e-07, + "loss": 0.6289, + "step": 77255 + }, + { + "epoch": 1.98, + "learning_rate": 5.473512218793384e-07, + "loss": 0.5615, + "step": 77256 + }, + { + "epoch": 1.98, + "learning_rate": 5.473265486161963e-07, + "loss": 0.6611, + "step": 77257 + }, + { + "epoch": 1.98, + "learning_rate": 5.473018756996459e-07, + "loss": 0.8057, + "step": 77258 + }, + { + "epoch": 1.98, + "learning_rate": 5.472772031297054e-07, + "loss": 0.6147, + "step": 77259 + }, + { + "epoch": 1.98, + "learning_rate": 5.472525309063942e-07, + "loss": 0.7168, + "step": 77260 + }, + { + "epoch": 1.98, + "learning_rate": 5.472278590297306e-07, + "loss": 0.3347, + "step": 77261 + }, + { + "epoch": 1.98, + "learning_rate": 5.472031874997338e-07, + "loss": 0.6719, + "step": 77262 + }, + { + "epoch": 1.98, + "learning_rate": 5.471785163164226e-07, + "loss": 0.4277, + "step": 77263 + }, + { + "epoch": 1.98, + "learning_rate": 5.471538454798165e-07, + "loss": 0.5652, + "step": 77264 + }, + { + "epoch": 1.98, + "learning_rate": 5.471291749899335e-07, + "loss": 0.5962, + "step": 77265 + }, + { + "epoch": 1.98, + "learning_rate": 5.471045048467929e-07, + "loss": 0.6362, + "step": 77266 + }, + { + "epoch": 1.98, + "learning_rate": 5.470798350504137e-07, + "loss": 0.4558, + "step": 77267 + }, + { + "epoch": 1.98, + "learning_rate": 5.470551656008149e-07, + "loss": 0.5801, + "step": 77268 + }, + { + "epoch": 1.98, + "learning_rate": 5.470304964980146e-07, + "loss": 0.5273, + "step": 77269 + }, + { + "epoch": 1.98, + "learning_rate": 5.470058277420323e-07, + "loss": 0.5122, + "step": 77270 + }, + { + "epoch": 1.98, + "learning_rate": 5.469811593328868e-07, + "loss": 0.6997, + "step": 77271 + }, + { + "epoch": 1.98, + "learning_rate": 5.469564912705973e-07, + "loss": 0.6836, + "step": 77272 + }, + { + "epoch": 1.98, + "learning_rate": 5.469318235551821e-07, + "loss": 0.6272, + "step": 77273 + }, + { + "epoch": 1.98, + "learning_rate": 5.469071561866603e-07, + "loss": 0.6699, + "step": 77274 + }, + { + "epoch": 1.98, + "learning_rate": 5.468824891650508e-07, + "loss": 0.6797, + "step": 77275 + }, + { + "epoch": 1.98, + "learning_rate": 5.46857822490373e-07, + "loss": 0.7012, + "step": 77276 + }, + { + "epoch": 1.98, + "learning_rate": 5.46833156162645e-07, + "loss": 0.7646, + "step": 77277 + }, + { + "epoch": 1.98, + "learning_rate": 5.468084901818863e-07, + "loss": 0.834, + "step": 77278 + }, + { + "epoch": 1.98, + "learning_rate": 5.467838245481153e-07, + "loss": 0.7871, + "step": 77279 + }, + { + "epoch": 1.98, + "learning_rate": 5.467591592613509e-07, + "loss": 0.5361, + "step": 77280 + }, + { + "epoch": 1.98, + "learning_rate": 5.467344943216127e-07, + "loss": 0.8242, + "step": 77281 + }, + { + "epoch": 1.98, + "learning_rate": 5.467098297289185e-07, + "loss": 0.6738, + "step": 77282 + }, + { + "epoch": 1.98, + "learning_rate": 5.466851654832878e-07, + "loss": 0.6277, + "step": 77283 + }, + { + "epoch": 1.98, + "learning_rate": 5.466605015847398e-07, + "loss": 0.5669, + "step": 77284 + }, + { + "epoch": 1.98, + "learning_rate": 5.466358380332927e-07, + "loss": 0.6284, + "step": 77285 + }, + { + "epoch": 1.98, + "learning_rate": 5.466111748289657e-07, + "loss": 0.5552, + "step": 77286 + }, + { + "epoch": 1.98, + "learning_rate": 5.465865119717777e-07, + "loss": 0.6328, + "step": 77287 + }, + { + "epoch": 1.98, + "learning_rate": 5.465618494617478e-07, + "loss": 0.5496, + "step": 77288 + }, + { + "epoch": 1.98, + "learning_rate": 5.465371872988946e-07, + "loss": 0.7148, + "step": 77289 + }, + { + "epoch": 1.98, + "learning_rate": 5.465125254832368e-07, + "loss": 0.6289, + "step": 77290 + }, + { + "epoch": 1.98, + "learning_rate": 5.464878640147935e-07, + "loss": 0.5825, + "step": 77291 + }, + { + "epoch": 1.98, + "learning_rate": 5.464632028935837e-07, + "loss": 0.5264, + "step": 77292 + }, + { + "epoch": 1.98, + "learning_rate": 5.464385421196263e-07, + "loss": 0.5437, + "step": 77293 + }, + { + "epoch": 1.98, + "learning_rate": 5.464138816929398e-07, + "loss": 0.5386, + "step": 77294 + }, + { + "epoch": 1.98, + "learning_rate": 5.463892216135433e-07, + "loss": 0.5276, + "step": 77295 + }, + { + "epoch": 1.98, + "learning_rate": 5.463645618814557e-07, + "loss": 0.4785, + "step": 77296 + }, + { + "epoch": 1.98, + "learning_rate": 5.463399024966964e-07, + "loss": 0.7207, + "step": 77297 + }, + { + "epoch": 1.98, + "learning_rate": 5.463152434592836e-07, + "loss": 0.4358, + "step": 77298 + }, + { + "epoch": 1.98, + "learning_rate": 5.46290584769236e-07, + "loss": 0.6938, + "step": 77299 + }, + { + "epoch": 1.98, + "learning_rate": 5.46265926426573e-07, + "loss": 0.4707, + "step": 77300 + }, + { + "epoch": 1.98, + "learning_rate": 5.462412684313136e-07, + "loss": 0.5117, + "step": 77301 + }, + { + "epoch": 1.98, + "learning_rate": 5.462166107834759e-07, + "loss": 0.6953, + "step": 77302 + }, + { + "epoch": 1.98, + "learning_rate": 5.461919534830795e-07, + "loss": 0.6235, + "step": 77303 + }, + { + "epoch": 1.98, + "learning_rate": 5.461672965301428e-07, + "loss": 0.7969, + "step": 77304 + }, + { + "epoch": 1.98, + "learning_rate": 5.461426399246856e-07, + "loss": 0.4142, + "step": 77305 + }, + { + "epoch": 1.98, + "learning_rate": 5.461179836667254e-07, + "loss": 0.7871, + "step": 77306 + }, + { + "epoch": 1.98, + "learning_rate": 5.46093327756282e-07, + "loss": 0.6235, + "step": 77307 + }, + { + "epoch": 1.98, + "learning_rate": 5.460686721933745e-07, + "loss": 0.6377, + "step": 77308 + }, + { + "epoch": 1.98, + "learning_rate": 5.460440169780208e-07, + "loss": 0.5347, + "step": 77309 + }, + { + "epoch": 1.98, + "learning_rate": 5.460193621102409e-07, + "loss": 0.5886, + "step": 77310 + }, + { + "epoch": 1.98, + "learning_rate": 5.459947075900526e-07, + "loss": 0.5557, + "step": 77311 + }, + { + "epoch": 1.98, + "learning_rate": 5.459700534174752e-07, + "loss": 0.562, + "step": 77312 + }, + { + "epoch": 1.98, + "learning_rate": 5.459453995925278e-07, + "loss": 0.6133, + "step": 77313 + }, + { + "epoch": 1.98, + "learning_rate": 5.459207461152294e-07, + "loss": 0.6499, + "step": 77314 + }, + { + "epoch": 1.98, + "learning_rate": 5.458960929855983e-07, + "loss": 0.7529, + "step": 77315 + }, + { + "epoch": 1.98, + "learning_rate": 5.458714402036536e-07, + "loss": 0.4699, + "step": 77316 + }, + { + "epoch": 1.98, + "learning_rate": 5.458467877694144e-07, + "loss": 0.6885, + "step": 77317 + }, + { + "epoch": 1.98, + "learning_rate": 5.458221356829001e-07, + "loss": 0.5562, + "step": 77318 + }, + { + "epoch": 1.98, + "learning_rate": 5.457974839441281e-07, + "loss": 0.52, + "step": 77319 + }, + { + "epoch": 1.98, + "learning_rate": 5.457728325531181e-07, + "loss": 0.353, + "step": 77320 + }, + { + "epoch": 1.98, + "learning_rate": 5.457481815098889e-07, + "loss": 0.7314, + "step": 77321 + }, + { + "epoch": 1.98, + "learning_rate": 5.457235308144601e-07, + "loss": 0.5615, + "step": 77322 + }, + { + "epoch": 1.98, + "learning_rate": 5.456988804668492e-07, + "loss": 0.7217, + "step": 77323 + }, + { + "epoch": 1.98, + "learning_rate": 5.456742304670759e-07, + "loss": 0.6582, + "step": 77324 + }, + { + "epoch": 1.98, + "learning_rate": 5.45649580815159e-07, + "loss": 0.5679, + "step": 77325 + }, + { + "epoch": 1.98, + "learning_rate": 5.456249315111177e-07, + "loss": 0.8516, + "step": 77326 + }, + { + "epoch": 1.98, + "learning_rate": 5.4560028255497e-07, + "loss": 0.6992, + "step": 77327 + }, + { + "epoch": 1.98, + "learning_rate": 5.455756339467356e-07, + "loss": 0.48, + "step": 77328 + }, + { + "epoch": 1.98, + "learning_rate": 5.455509856864328e-07, + "loss": 0.7217, + "step": 77329 + }, + { + "epoch": 1.98, + "learning_rate": 5.455263377740809e-07, + "loss": 0.707, + "step": 77330 + }, + { + "epoch": 1.98, + "learning_rate": 5.455016902096987e-07, + "loss": 0.4633, + "step": 77331 + }, + { + "epoch": 1.98, + "learning_rate": 5.454770429933047e-07, + "loss": 0.519, + "step": 77332 + }, + { + "epoch": 1.98, + "learning_rate": 5.454523961249179e-07, + "loss": 0.5396, + "step": 77333 + }, + { + "epoch": 1.98, + "learning_rate": 5.454277496045573e-07, + "loss": 0.5693, + "step": 77334 + }, + { + "epoch": 1.98, + "learning_rate": 5.454031034322424e-07, + "loss": 0.5283, + "step": 77335 + }, + { + "epoch": 1.98, + "learning_rate": 5.453784576079907e-07, + "loss": 0.3632, + "step": 77336 + }, + { + "epoch": 1.98, + "learning_rate": 5.453538121318221e-07, + "loss": 0.7744, + "step": 77337 + }, + { + "epoch": 1.98, + "learning_rate": 5.453291670037554e-07, + "loss": 0.6377, + "step": 77338 + }, + { + "epoch": 1.98, + "learning_rate": 5.453045222238093e-07, + "loss": 0.5151, + "step": 77339 + }, + { + "epoch": 1.98, + "learning_rate": 5.452798777920022e-07, + "loss": 0.7715, + "step": 77340 + }, + { + "epoch": 1.98, + "learning_rate": 5.452552337083536e-07, + "loss": 0.563, + "step": 77341 + }, + { + "epoch": 1.98, + "learning_rate": 5.452305899728819e-07, + "loss": 0.4612, + "step": 77342 + }, + { + "epoch": 1.98, + "learning_rate": 5.452059465856067e-07, + "loss": 0.7334, + "step": 77343 + }, + { + "epoch": 1.98, + "learning_rate": 5.45181303546546e-07, + "loss": 0.6616, + "step": 77344 + }, + { + "epoch": 1.98, + "learning_rate": 5.451566608557191e-07, + "loss": 0.6699, + "step": 77345 + }, + { + "epoch": 1.98, + "learning_rate": 5.451320185131447e-07, + "loss": 0.5947, + "step": 77346 + }, + { + "epoch": 1.98, + "learning_rate": 5.451073765188424e-07, + "loss": 0.5708, + "step": 77347 + }, + { + "epoch": 1.98, + "learning_rate": 5.450827348728304e-07, + "loss": 0.4886, + "step": 77348 + }, + { + "epoch": 1.98, + "learning_rate": 5.450580935751271e-07, + "loss": 0.7783, + "step": 77349 + }, + { + "epoch": 1.98, + "learning_rate": 5.45033452625752e-07, + "loss": 0.6143, + "step": 77350 + }, + { + "epoch": 1.98, + "learning_rate": 5.450088120247238e-07, + "loss": 0.5083, + "step": 77351 + }, + { + "epoch": 1.98, + "learning_rate": 5.44984171772062e-07, + "loss": 0.8047, + "step": 77352 + }, + { + "epoch": 1.98, + "learning_rate": 5.449595318677844e-07, + "loss": 0.627, + "step": 77353 + }, + { + "epoch": 1.98, + "learning_rate": 5.449348923119104e-07, + "loss": 0.7021, + "step": 77354 + }, + { + "epoch": 1.98, + "learning_rate": 5.449102531044592e-07, + "loss": 0.5977, + "step": 77355 + }, + { + "epoch": 1.98, + "learning_rate": 5.448856142454487e-07, + "loss": 0.6084, + "step": 77356 + }, + { + "epoch": 1.98, + "learning_rate": 5.448609757348986e-07, + "loss": 0.6699, + "step": 77357 + }, + { + "epoch": 1.98, + "learning_rate": 5.448363375728279e-07, + "loss": 0.6675, + "step": 77358 + }, + { + "epoch": 1.98, + "learning_rate": 5.448116997592546e-07, + "loss": 0.6724, + "step": 77359 + }, + { + "epoch": 1.98, + "learning_rate": 5.447870622941985e-07, + "loss": 0.4236, + "step": 77360 + }, + { + "epoch": 1.98, + "learning_rate": 5.447624251776777e-07, + "loss": 0.8408, + "step": 77361 + }, + { + "epoch": 1.98, + "learning_rate": 5.447377884097112e-07, + "loss": 0.5161, + "step": 77362 + }, + { + "epoch": 1.98, + "learning_rate": 5.447131519903181e-07, + "loss": 0.543, + "step": 77363 + }, + { + "epoch": 1.98, + "learning_rate": 5.446885159195176e-07, + "loss": 0.7373, + "step": 77364 + }, + { + "epoch": 1.98, + "learning_rate": 5.446638801973278e-07, + "loss": 0.6094, + "step": 77365 + }, + { + "epoch": 1.98, + "learning_rate": 5.44639244823768e-07, + "loss": 0.6306, + "step": 77366 + }, + { + "epoch": 1.98, + "learning_rate": 5.446146097988569e-07, + "loss": 0.4473, + "step": 77367 + }, + { + "epoch": 1.98, + "learning_rate": 5.445899751226139e-07, + "loss": 0.6313, + "step": 77368 + }, + { + "epoch": 1.98, + "learning_rate": 5.445653407950574e-07, + "loss": 0.585, + "step": 77369 + }, + { + "epoch": 1.98, + "learning_rate": 5.445407068162058e-07, + "loss": 0.4501, + "step": 77370 + }, + { + "epoch": 1.98, + "learning_rate": 5.445160731860785e-07, + "loss": 0.6494, + "step": 77371 + }, + { + "epoch": 1.98, + "learning_rate": 5.444914399046947e-07, + "loss": 0.7041, + "step": 77372 + }, + { + "epoch": 1.98, + "learning_rate": 5.444668069720726e-07, + "loss": 0.5259, + "step": 77373 + }, + { + "epoch": 1.98, + "learning_rate": 5.444421743882311e-07, + "loss": 0.6577, + "step": 77374 + }, + { + "epoch": 1.98, + "learning_rate": 5.444175421531893e-07, + "loss": 0.6504, + "step": 77375 + }, + { + "epoch": 1.98, + "learning_rate": 5.443929102669666e-07, + "loss": 0.5508, + "step": 77376 + }, + { + "epoch": 1.98, + "learning_rate": 5.443682787295808e-07, + "loss": 0.8145, + "step": 77377 + }, + { + "epoch": 1.98, + "learning_rate": 5.443436475410517e-07, + "loss": 0.707, + "step": 77378 + }, + { + "epoch": 1.98, + "learning_rate": 5.443190167013972e-07, + "loss": 0.6587, + "step": 77379 + }, + { + "epoch": 1.98, + "learning_rate": 5.442943862106369e-07, + "loss": 0.5723, + "step": 77380 + }, + { + "epoch": 1.98, + "learning_rate": 5.442697560687897e-07, + "loss": 0.4524, + "step": 77381 + }, + { + "epoch": 1.98, + "learning_rate": 5.442451262758737e-07, + "loss": 0.542, + "step": 77382 + }, + { + "epoch": 1.98, + "learning_rate": 5.442204968319084e-07, + "loss": 0.6111, + "step": 77383 + }, + { + "epoch": 1.98, + "learning_rate": 5.441958677369124e-07, + "loss": 0.6377, + "step": 77384 + }, + { + "epoch": 1.98, + "learning_rate": 5.44171238990905e-07, + "loss": 0.6572, + "step": 77385 + }, + { + "epoch": 1.98, + "learning_rate": 5.441466105939046e-07, + "loss": 0.7783, + "step": 77386 + }, + { + "epoch": 1.98, + "learning_rate": 5.4412198254593e-07, + "loss": 0.6172, + "step": 77387 + }, + { + "epoch": 1.98, + "learning_rate": 5.440973548470006e-07, + "loss": 0.5981, + "step": 77388 + }, + { + "epoch": 1.98, + "learning_rate": 5.440727274971348e-07, + "loss": 0.5089, + "step": 77389 + }, + { + "epoch": 1.98, + "learning_rate": 5.440481004963515e-07, + "loss": 0.4863, + "step": 77390 + }, + { + "epoch": 1.98, + "learning_rate": 5.440234738446693e-07, + "loss": 0.5737, + "step": 77391 + }, + { + "epoch": 1.98, + "learning_rate": 5.439988475421075e-07, + "loss": 0.7559, + "step": 77392 + }, + { + "epoch": 1.98, + "learning_rate": 5.439742215886851e-07, + "loss": 0.6089, + "step": 77393 + }, + { + "epoch": 1.98, + "learning_rate": 5.439495959844203e-07, + "loss": 0.5903, + "step": 77394 + }, + { + "epoch": 1.98, + "learning_rate": 5.439249707293324e-07, + "loss": 0.5654, + "step": 77395 + }, + { + "epoch": 1.98, + "learning_rate": 5.439003458234401e-07, + "loss": 0.5693, + "step": 77396 + }, + { + "epoch": 1.98, + "learning_rate": 5.438757212667629e-07, + "loss": 0.6123, + "step": 77397 + }, + { + "epoch": 1.98, + "learning_rate": 5.438510970593188e-07, + "loss": 0.5398, + "step": 77398 + }, + { + "epoch": 1.98, + "learning_rate": 5.438264732011268e-07, + "loss": 0.6758, + "step": 77399 + }, + { + "epoch": 1.98, + "learning_rate": 5.438018496922059e-07, + "loss": 0.6611, + "step": 77400 + }, + { + "epoch": 1.98, + "learning_rate": 5.437772265325748e-07, + "loss": 0.6641, + "step": 77401 + }, + { + "epoch": 1.98, + "learning_rate": 5.437526037222528e-07, + "loss": 0.5757, + "step": 77402 + }, + { + "epoch": 1.98, + "learning_rate": 5.437279812612583e-07, + "loss": 0.7539, + "step": 77403 + }, + { + "epoch": 1.98, + "learning_rate": 5.437033591496101e-07, + "loss": 0.667, + "step": 77404 + }, + { + "epoch": 1.98, + "learning_rate": 5.436787373873276e-07, + "loss": 0.6953, + "step": 77405 + }, + { + "epoch": 1.98, + "learning_rate": 5.436541159744293e-07, + "loss": 0.4512, + "step": 77406 + }, + { + "epoch": 1.98, + "learning_rate": 5.436294949109339e-07, + "loss": 0.6777, + "step": 77407 + }, + { + "epoch": 1.98, + "learning_rate": 5.436048741968606e-07, + "loss": 0.5339, + "step": 77408 + }, + { + "epoch": 1.98, + "learning_rate": 5.435802538322278e-07, + "loss": 0.5557, + "step": 77409 + }, + { + "epoch": 1.98, + "learning_rate": 5.43555633817055e-07, + "loss": 0.8867, + "step": 77410 + }, + { + "epoch": 1.98, + "learning_rate": 5.435310141513604e-07, + "loss": 0.6113, + "step": 77411 + }, + { + "epoch": 1.98, + "learning_rate": 5.43506394835163e-07, + "loss": 0.8477, + "step": 77412 + }, + { + "epoch": 1.98, + "learning_rate": 5.434817758684818e-07, + "loss": 0.6431, + "step": 77413 + }, + { + "epoch": 1.98, + "learning_rate": 5.434571572513359e-07, + "loss": 0.8354, + "step": 77414 + }, + { + "epoch": 1.98, + "learning_rate": 5.434325389837436e-07, + "loss": 0.6123, + "step": 77415 + }, + { + "epoch": 1.98, + "learning_rate": 5.434079210657238e-07, + "loss": 0.7852, + "step": 77416 + }, + { + "epoch": 1.98, + "learning_rate": 5.433833034972957e-07, + "loss": 0.6328, + "step": 77417 + }, + { + "epoch": 1.98, + "learning_rate": 5.433586862784785e-07, + "loss": 0.6323, + "step": 77418 + }, + { + "epoch": 1.98, + "learning_rate": 5.433340694092905e-07, + "loss": 0.5576, + "step": 77419 + }, + { + "epoch": 1.98, + "learning_rate": 5.433094528897501e-07, + "loss": 0.363, + "step": 77420 + }, + { + "epoch": 1.98, + "learning_rate": 5.432848367198768e-07, + "loss": 0.3209, + "step": 77421 + }, + { + "epoch": 1.98, + "learning_rate": 5.432602208996891e-07, + "loss": 0.7588, + "step": 77422 + }, + { + "epoch": 1.98, + "learning_rate": 5.432356054292067e-07, + "loss": 0.6719, + "step": 77423 + }, + { + "epoch": 1.98, + "learning_rate": 5.432109903084471e-07, + "loss": 0.7026, + "step": 77424 + }, + { + "epoch": 1.98, + "learning_rate": 5.431863755374302e-07, + "loss": 0.6621, + "step": 77425 + }, + { + "epoch": 1.98, + "learning_rate": 5.431617611161742e-07, + "loss": 0.5767, + "step": 77426 + }, + { + "epoch": 1.98, + "learning_rate": 5.431371470446987e-07, + "loss": 0.6724, + "step": 77427 + }, + { + "epoch": 1.98, + "learning_rate": 5.431125333230222e-07, + "loss": 0.4878, + "step": 77428 + }, + { + "epoch": 1.98, + "learning_rate": 5.430879199511629e-07, + "loss": 0.4692, + "step": 77429 + }, + { + "epoch": 1.98, + "learning_rate": 5.430633069291401e-07, + "loss": 0.582, + "step": 77430 + }, + { + "epoch": 1.98, + "learning_rate": 5.430386942569734e-07, + "loss": 0.6279, + "step": 77431 + }, + { + "epoch": 1.98, + "learning_rate": 5.430140819346803e-07, + "loss": 0.6597, + "step": 77432 + }, + { + "epoch": 1.98, + "learning_rate": 5.429894699622803e-07, + "loss": 0.5659, + "step": 77433 + }, + { + "epoch": 1.98, + "learning_rate": 5.429648583397924e-07, + "loss": 0.5488, + "step": 77434 + }, + { + "epoch": 1.98, + "learning_rate": 5.429402470672356e-07, + "loss": 0.6748, + "step": 77435 + }, + { + "epoch": 1.98, + "learning_rate": 5.429156361446281e-07, + "loss": 0.5913, + "step": 77436 + }, + { + "epoch": 1.98, + "learning_rate": 5.428910255719894e-07, + "loss": 0.7842, + "step": 77437 + }, + { + "epoch": 1.98, + "learning_rate": 5.428664153493376e-07, + "loss": 0.6484, + "step": 77438 + }, + { + "epoch": 1.98, + "learning_rate": 5.428418054766921e-07, + "loss": 0.573, + "step": 77439 + }, + { + "epoch": 1.98, + "learning_rate": 5.428171959540719e-07, + "loss": 0.5605, + "step": 77440 + }, + { + "epoch": 1.98, + "learning_rate": 5.427925867814953e-07, + "loss": 0.5916, + "step": 77441 + }, + { + "epoch": 1.98, + "learning_rate": 5.427679779589812e-07, + "loss": 0.6133, + "step": 77442 + }, + { + "epoch": 1.98, + "learning_rate": 5.427433694865487e-07, + "loss": 0.6982, + "step": 77443 + }, + { + "epoch": 1.98, + "learning_rate": 5.427187613642171e-07, + "loss": 0.7188, + "step": 77444 + }, + { + "epoch": 1.98, + "learning_rate": 5.426941535920042e-07, + "loss": 0.71, + "step": 77445 + }, + { + "epoch": 1.98, + "learning_rate": 5.426695461699293e-07, + "loss": 0.3694, + "step": 77446 + }, + { + "epoch": 1.99, + "learning_rate": 5.426449390980118e-07, + "loss": 0.6313, + "step": 77447 + }, + { + "epoch": 1.99, + "learning_rate": 5.4262033237627e-07, + "loss": 0.4385, + "step": 77448 + }, + { + "epoch": 1.99, + "learning_rate": 5.425957260047225e-07, + "loss": 0.6245, + "step": 77449 + }, + { + "epoch": 1.99, + "learning_rate": 5.425711199833883e-07, + "loss": 0.7266, + "step": 77450 + }, + { + "epoch": 1.99, + "learning_rate": 5.425465143122863e-07, + "loss": 0.4424, + "step": 77451 + }, + { + "epoch": 1.99, + "learning_rate": 5.425219089914359e-07, + "loss": 0.6465, + "step": 77452 + }, + { + "epoch": 1.99, + "learning_rate": 5.42497304020855e-07, + "loss": 0.5132, + "step": 77453 + }, + { + "epoch": 1.99, + "learning_rate": 5.424726994005628e-07, + "loss": 0.646, + "step": 77454 + }, + { + "epoch": 1.99, + "learning_rate": 5.424480951305783e-07, + "loss": 0.6699, + "step": 77455 + }, + { + "epoch": 1.99, + "learning_rate": 5.424234912109207e-07, + "loss": 0.6196, + "step": 77456 + }, + { + "epoch": 1.99, + "learning_rate": 5.423988876416084e-07, + "loss": 0.6768, + "step": 77457 + }, + { + "epoch": 1.99, + "learning_rate": 5.423742844226598e-07, + "loss": 0.2644, + "step": 77458 + }, + { + "epoch": 1.99, + "learning_rate": 5.423496815540942e-07, + "loss": 0.6118, + "step": 77459 + }, + { + "epoch": 1.99, + "learning_rate": 5.423250790359304e-07, + "loss": 0.406, + "step": 77460 + }, + { + "epoch": 1.99, + "learning_rate": 5.423004768681876e-07, + "loss": 0.6328, + "step": 77461 + }, + { + "epoch": 1.99, + "learning_rate": 5.422758750508838e-07, + "loss": 0.7812, + "step": 77462 + }, + { + "epoch": 1.99, + "learning_rate": 5.422512735840384e-07, + "loss": 0.5962, + "step": 77463 + }, + { + "epoch": 1.99, + "learning_rate": 5.422266724676706e-07, + "loss": 0.3366, + "step": 77464 + }, + { + "epoch": 1.99, + "learning_rate": 5.422020717017983e-07, + "loss": 0.7158, + "step": 77465 + }, + { + "epoch": 1.99, + "learning_rate": 5.421774712864409e-07, + "loss": 0.5972, + "step": 77466 + }, + { + "epoch": 1.99, + "learning_rate": 5.421528712216175e-07, + "loss": 0.5586, + "step": 77467 + }, + { + "epoch": 1.99, + "learning_rate": 5.421282715073462e-07, + "loss": 0.6738, + "step": 77468 + }, + { + "epoch": 1.99, + "learning_rate": 5.421036721436466e-07, + "loss": 0.6587, + "step": 77469 + }, + { + "epoch": 1.99, + "learning_rate": 5.420790731305368e-07, + "loss": 0.7188, + "step": 77470 + }, + { + "epoch": 1.99, + "learning_rate": 5.42054474468036e-07, + "loss": 0.5344, + "step": 77471 + }, + { + "epoch": 1.99, + "learning_rate": 5.42029876156163e-07, + "loss": 0.5662, + "step": 77472 + }, + { + "epoch": 1.99, + "learning_rate": 5.420052781949372e-07, + "loss": 0.5908, + "step": 77473 + }, + { + "epoch": 1.99, + "learning_rate": 5.419806805843763e-07, + "loss": 0.4761, + "step": 77474 + }, + { + "epoch": 1.99, + "learning_rate": 5.419560833244999e-07, + "loss": 0.6782, + "step": 77475 + }, + { + "epoch": 1.99, + "learning_rate": 5.419314864153266e-07, + "loss": 0.708, + "step": 77476 + }, + { + "epoch": 1.99, + "learning_rate": 5.419068898568757e-07, + "loss": 0.5996, + "step": 77477 + }, + { + "epoch": 1.99, + "learning_rate": 5.418822936491656e-07, + "loss": 0.5894, + "step": 77478 + }, + { + "epoch": 1.99, + "learning_rate": 5.418576977922149e-07, + "loss": 0.6924, + "step": 77479 + }, + { + "epoch": 1.99, + "learning_rate": 5.418331022860426e-07, + "loss": 0.7471, + "step": 77480 + }, + { + "epoch": 1.99, + "learning_rate": 5.41808507130668e-07, + "loss": 0.5391, + "step": 77481 + }, + { + "epoch": 1.99, + "learning_rate": 5.417839123261091e-07, + "loss": 0.7324, + "step": 77482 + }, + { + "epoch": 1.99, + "learning_rate": 5.417593178723852e-07, + "loss": 0.5864, + "step": 77483 + }, + { + "epoch": 1.99, + "learning_rate": 5.417347237695152e-07, + "loss": 0.4648, + "step": 77484 + }, + { + "epoch": 1.99, + "learning_rate": 5.417101300175182e-07, + "loss": 0.7354, + "step": 77485 + }, + { + "epoch": 1.99, + "learning_rate": 5.416855366164123e-07, + "loss": 0.6997, + "step": 77486 + }, + { + "epoch": 1.99, + "learning_rate": 5.416609435662172e-07, + "loss": 0.6777, + "step": 77487 + }, + { + "epoch": 1.99, + "learning_rate": 5.416363508669508e-07, + "loss": 0.6382, + "step": 77488 + }, + { + "epoch": 1.99, + "learning_rate": 5.416117585186324e-07, + "loss": 0.6357, + "step": 77489 + }, + { + "epoch": 1.99, + "learning_rate": 5.41587166521281e-07, + "loss": 0.5415, + "step": 77490 + }, + { + "epoch": 1.99, + "learning_rate": 5.415625748749151e-07, + "loss": 0.6348, + "step": 77491 + }, + { + "epoch": 1.99, + "learning_rate": 5.415379835795534e-07, + "loss": 0.5791, + "step": 77492 + }, + { + "epoch": 1.99, + "learning_rate": 5.415133926352151e-07, + "loss": 0.457, + "step": 77493 + }, + { + "epoch": 1.99, + "learning_rate": 5.414888020419193e-07, + "loss": 0.5962, + "step": 77494 + }, + { + "epoch": 1.99, + "learning_rate": 5.414642117996841e-07, + "loss": 0.7637, + "step": 77495 + }, + { + "epoch": 1.99, + "learning_rate": 5.414396219085287e-07, + "loss": 0.7871, + "step": 77496 + }, + { + "epoch": 1.99, + "learning_rate": 5.414150323684721e-07, + "loss": 0.5674, + "step": 77497 + }, + { + "epoch": 1.99, + "learning_rate": 5.41390443179533e-07, + "loss": 0.4844, + "step": 77498 + }, + { + "epoch": 1.99, + "learning_rate": 5.413658543417299e-07, + "loss": 0.572, + "step": 77499 + }, + { + "epoch": 1.99, + "learning_rate": 5.413412658550818e-07, + "loss": 0.5977, + "step": 77500 + }, + { + "epoch": 1.99, + "learning_rate": 5.413166777196076e-07, + "loss": 0.6475, + "step": 77501 + }, + { + "epoch": 1.99, + "learning_rate": 5.412920899353264e-07, + "loss": 0.6367, + "step": 77502 + }, + { + "epoch": 1.99, + "learning_rate": 5.412675025022565e-07, + "loss": 0.6494, + "step": 77503 + }, + { + "epoch": 1.99, + "learning_rate": 5.41242915420417e-07, + "loss": 0.5537, + "step": 77504 + }, + { + "epoch": 1.99, + "learning_rate": 5.412183286898266e-07, + "loss": 0.7959, + "step": 77505 + }, + { + "epoch": 1.99, + "learning_rate": 5.411937423105047e-07, + "loss": 0.5447, + "step": 77506 + }, + { + "epoch": 1.99, + "learning_rate": 5.411691562824696e-07, + "loss": 0.5601, + "step": 77507 + }, + { + "epoch": 1.99, + "learning_rate": 5.411445706057398e-07, + "loss": 0.5403, + "step": 77508 + }, + { + "epoch": 1.99, + "learning_rate": 5.411199852803345e-07, + "loss": 0.5043, + "step": 77509 + }, + { + "epoch": 1.99, + "learning_rate": 5.410954003062725e-07, + "loss": 0.4541, + "step": 77510 + }, + { + "epoch": 1.99, + "learning_rate": 5.410708156835732e-07, + "loss": 0.4397, + "step": 77511 + }, + { + "epoch": 1.99, + "learning_rate": 5.410462314122544e-07, + "loss": 0.562, + "step": 77512 + }, + { + "epoch": 1.99, + "learning_rate": 5.410216474923352e-07, + "loss": 0.6943, + "step": 77513 + }, + { + "epoch": 1.99, + "learning_rate": 5.409970639238348e-07, + "loss": 0.6177, + "step": 77514 + }, + { + "epoch": 1.99, + "learning_rate": 5.409724807067723e-07, + "loss": 0.6377, + "step": 77515 + }, + { + "epoch": 1.99, + "learning_rate": 5.409478978411655e-07, + "loss": 0.7017, + "step": 77516 + }, + { + "epoch": 1.99, + "learning_rate": 5.409233153270344e-07, + "loss": 0.6709, + "step": 77517 + }, + { + "epoch": 1.99, + "learning_rate": 5.408987331643966e-07, + "loss": 0.5337, + "step": 77518 + }, + { + "epoch": 1.99, + "learning_rate": 5.40874151353272e-07, + "loss": 0.4304, + "step": 77519 + }, + { + "epoch": 1.99, + "learning_rate": 5.408495698936786e-07, + "loss": 0.509, + "step": 77520 + }, + { + "epoch": 1.99, + "learning_rate": 5.408249887856355e-07, + "loss": 0.6294, + "step": 77521 + }, + { + "epoch": 1.99, + "learning_rate": 5.408004080291617e-07, + "loss": 0.647, + "step": 77522 + }, + { + "epoch": 1.99, + "learning_rate": 5.407758276242762e-07, + "loss": 0.6543, + "step": 77523 + }, + { + "epoch": 1.99, + "learning_rate": 5.407512475709972e-07, + "loss": 0.3071, + "step": 77524 + }, + { + "epoch": 1.99, + "learning_rate": 5.407266678693438e-07, + "loss": 0.6348, + "step": 77525 + }, + { + "epoch": 1.99, + "learning_rate": 5.40702088519335e-07, + "loss": 0.6172, + "step": 77526 + }, + { + "epoch": 1.99, + "learning_rate": 5.406775095209898e-07, + "loss": 0.554, + "step": 77527 + }, + { + "epoch": 1.99, + "learning_rate": 5.406529308743266e-07, + "loss": 0.5251, + "step": 77528 + }, + { + "epoch": 1.99, + "learning_rate": 5.406283525793641e-07, + "loss": 0.6006, + "step": 77529 + }, + { + "epoch": 1.99, + "learning_rate": 5.406037746361214e-07, + "loss": 0.5483, + "step": 77530 + }, + { + "epoch": 1.99, + "learning_rate": 5.40579197044617e-07, + "loss": 0.6953, + "step": 77531 + }, + { + "epoch": 1.99, + "learning_rate": 5.405546198048706e-07, + "loss": 0.6719, + "step": 77532 + }, + { + "epoch": 1.99, + "learning_rate": 5.405300429169e-07, + "loss": 0.6323, + "step": 77533 + }, + { + "epoch": 1.99, + "learning_rate": 5.405054663807242e-07, + "loss": 0.6514, + "step": 77534 + }, + { + "epoch": 1.99, + "learning_rate": 5.404808901963629e-07, + "loss": 0.6118, + "step": 77535 + }, + { + "epoch": 1.99, + "learning_rate": 5.404563143638337e-07, + "loss": 0.5005, + "step": 77536 + }, + { + "epoch": 1.99, + "learning_rate": 5.404317388831566e-07, + "loss": 0.5264, + "step": 77537 + }, + { + "epoch": 1.99, + "learning_rate": 5.40407163754349e-07, + "loss": 0.5947, + "step": 77538 + }, + { + "epoch": 1.99, + "learning_rate": 5.403825889774307e-07, + "loss": 0.6934, + "step": 77539 + }, + { + "epoch": 1.99, + "learning_rate": 5.403580145524207e-07, + "loss": 0.8203, + "step": 77540 + }, + { + "epoch": 1.99, + "learning_rate": 5.403334404793371e-07, + "loss": 0.5659, + "step": 77541 + }, + { + "epoch": 1.99, + "learning_rate": 5.40308866758199e-07, + "loss": 0.4422, + "step": 77542 + }, + { + "epoch": 1.99, + "learning_rate": 5.402842933890252e-07, + "loss": 0.6235, + "step": 77543 + }, + { + "epoch": 1.99, + "learning_rate": 5.402597203718351e-07, + "loss": 0.707, + "step": 77544 + }, + { + "epoch": 1.99, + "learning_rate": 5.402351477066466e-07, + "loss": 0.5084, + "step": 77545 + }, + { + "epoch": 1.99, + "learning_rate": 5.402105753934788e-07, + "loss": 0.7314, + "step": 77546 + }, + { + "epoch": 1.99, + "learning_rate": 5.401860034323511e-07, + "loss": 0.4905, + "step": 77547 + }, + { + "epoch": 1.99, + "learning_rate": 5.401614318232814e-07, + "loss": 0.6904, + "step": 77548 + }, + { + "epoch": 1.99, + "learning_rate": 5.401368605662893e-07, + "loss": 0.7383, + "step": 77549 + }, + { + "epoch": 1.99, + "learning_rate": 5.40112289661393e-07, + "loss": 0.7559, + "step": 77550 + }, + { + "epoch": 1.99, + "learning_rate": 5.400877191086115e-07, + "loss": 0.583, + "step": 77551 + }, + { + "epoch": 1.99, + "learning_rate": 5.40063148907964e-07, + "loss": 0.7002, + "step": 77552 + }, + { + "epoch": 1.99, + "learning_rate": 5.400385790594686e-07, + "loss": 0.7432, + "step": 77553 + }, + { + "epoch": 1.99, + "learning_rate": 5.400140095631447e-07, + "loss": 0.6348, + "step": 77554 + }, + { + "epoch": 1.99, + "learning_rate": 5.399894404190107e-07, + "loss": 0.5957, + "step": 77555 + }, + { + "epoch": 1.99, + "learning_rate": 5.399648716270862e-07, + "loss": 0.5229, + "step": 77556 + }, + { + "epoch": 1.99, + "learning_rate": 5.399403031873893e-07, + "loss": 0.522, + "step": 77557 + }, + { + "epoch": 1.99, + "learning_rate": 5.399157350999386e-07, + "loss": 0.6953, + "step": 77558 + }, + { + "epoch": 1.99, + "learning_rate": 5.398911673647534e-07, + "loss": 0.5742, + "step": 77559 + }, + { + "epoch": 1.99, + "learning_rate": 5.398665999818523e-07, + "loss": 0.7056, + "step": 77560 + }, + { + "epoch": 1.99, + "learning_rate": 5.398420329512545e-07, + "loss": 0.6172, + "step": 77561 + }, + { + "epoch": 1.99, + "learning_rate": 5.398174662729782e-07, + "loss": 0.8154, + "step": 77562 + }, + { + "epoch": 1.99, + "learning_rate": 5.397928999470424e-07, + "loss": 0.6025, + "step": 77563 + }, + { + "epoch": 1.99, + "learning_rate": 5.397683339734661e-07, + "loss": 0.668, + "step": 77564 + }, + { + "epoch": 1.99, + "learning_rate": 5.397437683522685e-07, + "loss": 0.5317, + "step": 77565 + }, + { + "epoch": 1.99, + "learning_rate": 5.397192030834675e-07, + "loss": 0.4374, + "step": 77566 + }, + { + "epoch": 1.99, + "learning_rate": 5.396946381670826e-07, + "loss": 0.5771, + "step": 77567 + }, + { + "epoch": 1.99, + "learning_rate": 5.39670073603132e-07, + "loss": 0.6602, + "step": 77568 + }, + { + "epoch": 1.99, + "learning_rate": 5.396455093916349e-07, + "loss": 0.625, + "step": 77569 + }, + { + "epoch": 1.99, + "learning_rate": 5.396209455326103e-07, + "loss": 0.4783, + "step": 77570 + }, + { + "epoch": 1.99, + "learning_rate": 5.395963820260767e-07, + "loss": 0.5957, + "step": 77571 + }, + { + "epoch": 1.99, + "learning_rate": 5.395718188720529e-07, + "loss": 0.6411, + "step": 77572 + }, + { + "epoch": 1.99, + "learning_rate": 5.395472560705579e-07, + "loss": 0.6475, + "step": 77573 + }, + { + "epoch": 1.99, + "learning_rate": 5.395226936216102e-07, + "loss": 0.6377, + "step": 77574 + }, + { + "epoch": 1.99, + "learning_rate": 5.394981315252288e-07, + "loss": 0.4078, + "step": 77575 + }, + { + "epoch": 1.99, + "learning_rate": 5.394735697814325e-07, + "loss": 0.5981, + "step": 77576 + }, + { + "epoch": 1.99, + "learning_rate": 5.394490083902406e-07, + "loss": 0.6641, + "step": 77577 + }, + { + "epoch": 1.99, + "learning_rate": 5.394244473516713e-07, + "loss": 0.624, + "step": 77578 + }, + { + "epoch": 1.99, + "learning_rate": 5.393998866657432e-07, + "loss": 0.6099, + "step": 77579 + }, + { + "epoch": 1.99, + "learning_rate": 5.393753263324753e-07, + "loss": 0.6787, + "step": 77580 + }, + { + "epoch": 1.99, + "learning_rate": 5.393507663518866e-07, + "loss": 0.5869, + "step": 77581 + }, + { + "epoch": 1.99, + "learning_rate": 5.393262067239963e-07, + "loss": 0.6104, + "step": 77582 + }, + { + "epoch": 1.99, + "learning_rate": 5.393016474488222e-07, + "loss": 0.5713, + "step": 77583 + }, + { + "epoch": 1.99, + "learning_rate": 5.392770885263837e-07, + "loss": 0.6318, + "step": 77584 + }, + { + "epoch": 1.99, + "learning_rate": 5.392525299566997e-07, + "loss": 0.5752, + "step": 77585 + }, + { + "epoch": 1.99, + "learning_rate": 5.392279717397891e-07, + "loss": 0.6777, + "step": 77586 + }, + { + "epoch": 1.99, + "learning_rate": 5.392034138756704e-07, + "loss": 0.7695, + "step": 77587 + }, + { + "epoch": 1.99, + "learning_rate": 5.391788563643623e-07, + "loss": 0.7275, + "step": 77588 + }, + { + "epoch": 1.99, + "learning_rate": 5.391542992058835e-07, + "loss": 0.6626, + "step": 77589 + }, + { + "epoch": 1.99, + "learning_rate": 5.391297424002536e-07, + "loss": 0.6157, + "step": 77590 + }, + { + "epoch": 1.99, + "learning_rate": 5.391051859474904e-07, + "loss": 0.5293, + "step": 77591 + }, + { + "epoch": 1.99, + "learning_rate": 5.390806298476133e-07, + "loss": 0.6689, + "step": 77592 + }, + { + "epoch": 1.99, + "learning_rate": 5.390560741006408e-07, + "loss": 0.563, + "step": 77593 + }, + { + "epoch": 1.99, + "learning_rate": 5.390315187065924e-07, + "loss": 0.52, + "step": 77594 + }, + { + "epoch": 1.99, + "learning_rate": 5.390069636654859e-07, + "loss": 0.6836, + "step": 77595 + }, + { + "epoch": 1.99, + "learning_rate": 5.389824089773405e-07, + "loss": 0.584, + "step": 77596 + }, + { + "epoch": 1.99, + "learning_rate": 5.389578546421755e-07, + "loss": 0.6167, + "step": 77597 + }, + { + "epoch": 1.99, + "learning_rate": 5.38933300660009e-07, + "loss": 0.6494, + "step": 77598 + }, + { + "epoch": 1.99, + "learning_rate": 5.389087470308604e-07, + "loss": 0.6812, + "step": 77599 + }, + { + "epoch": 1.99, + "learning_rate": 5.388841937547478e-07, + "loss": 0.5444, + "step": 77600 + }, + { + "epoch": 1.99, + "learning_rate": 5.388596408316903e-07, + "loss": 0.791, + "step": 77601 + }, + { + "epoch": 1.99, + "learning_rate": 5.388350882617068e-07, + "loss": 0.6553, + "step": 77602 + }, + { + "epoch": 1.99, + "learning_rate": 5.388105360448165e-07, + "loss": 0.5908, + "step": 77603 + }, + { + "epoch": 1.99, + "learning_rate": 5.387859841810374e-07, + "loss": 0.626, + "step": 77604 + }, + { + "epoch": 1.99, + "learning_rate": 5.387614326703886e-07, + "loss": 0.7793, + "step": 77605 + }, + { + "epoch": 1.99, + "learning_rate": 5.38736881512889e-07, + "loss": 0.4219, + "step": 77606 + }, + { + "epoch": 1.99, + "learning_rate": 5.387123307085581e-07, + "loss": 0.549, + "step": 77607 + }, + { + "epoch": 1.99, + "learning_rate": 5.386877802574132e-07, + "loss": 0.5474, + "step": 77608 + }, + { + "epoch": 1.99, + "learning_rate": 5.386632301594738e-07, + "loss": 0.6875, + "step": 77609 + }, + { + "epoch": 1.99, + "learning_rate": 5.386386804147587e-07, + "loss": 0.6396, + "step": 77610 + }, + { + "epoch": 1.99, + "learning_rate": 5.386141310232872e-07, + "loss": 0.6865, + "step": 77611 + }, + { + "epoch": 1.99, + "learning_rate": 5.385895819850774e-07, + "loss": 0.8105, + "step": 77612 + }, + { + "epoch": 1.99, + "learning_rate": 5.385650333001483e-07, + "loss": 0.543, + "step": 77613 + }, + { + "epoch": 1.99, + "learning_rate": 5.385404849685186e-07, + "loss": 0.6567, + "step": 77614 + }, + { + "epoch": 1.99, + "learning_rate": 5.385159369902077e-07, + "loss": 0.6426, + "step": 77615 + }, + { + "epoch": 1.99, + "learning_rate": 5.384913893652334e-07, + "loss": 0.4976, + "step": 77616 + }, + { + "epoch": 1.99, + "learning_rate": 5.384668420936156e-07, + "loss": 0.7783, + "step": 77617 + }, + { + "epoch": 1.99, + "learning_rate": 5.384422951753721e-07, + "loss": 0.6113, + "step": 77618 + }, + { + "epoch": 1.99, + "learning_rate": 5.384177486105221e-07, + "loss": 0.7949, + "step": 77619 + }, + { + "epoch": 1.99, + "learning_rate": 5.383932023990847e-07, + "loss": 0.6143, + "step": 77620 + }, + { + "epoch": 1.99, + "learning_rate": 5.383686565410781e-07, + "loss": 0.4849, + "step": 77621 + }, + { + "epoch": 1.99, + "learning_rate": 5.383441110365214e-07, + "loss": 0.6514, + "step": 77622 + }, + { + "epoch": 1.99, + "learning_rate": 5.383195658854333e-07, + "loss": 0.6641, + "step": 77623 + }, + { + "epoch": 1.99, + "learning_rate": 5.382950210878332e-07, + "loss": 0.5542, + "step": 77624 + }, + { + "epoch": 1.99, + "learning_rate": 5.382704766437389e-07, + "loss": 0.6284, + "step": 77625 + }, + { + "epoch": 1.99, + "learning_rate": 5.382459325531696e-07, + "loss": 0.6299, + "step": 77626 + }, + { + "epoch": 1.99, + "learning_rate": 5.382213888161447e-07, + "loss": 0.5728, + "step": 77627 + }, + { + "epoch": 1.99, + "learning_rate": 5.381968454326824e-07, + "loss": 0.5239, + "step": 77628 + }, + { + "epoch": 1.99, + "learning_rate": 5.381723024028011e-07, + "loss": 0.592, + "step": 77629 + }, + { + "epoch": 1.99, + "learning_rate": 5.381477597265201e-07, + "loss": 0.7051, + "step": 77630 + }, + { + "epoch": 1.99, + "learning_rate": 5.381232174038581e-07, + "loss": 0.5601, + "step": 77631 + }, + { + "epoch": 1.99, + "learning_rate": 5.380986754348343e-07, + "loss": 0.5276, + "step": 77632 + }, + { + "epoch": 1.99, + "learning_rate": 5.380741338194666e-07, + "loss": 0.8984, + "step": 77633 + }, + { + "epoch": 1.99, + "learning_rate": 5.380495925577745e-07, + "loss": 0.7607, + "step": 77634 + }, + { + "epoch": 1.99, + "learning_rate": 5.380250516497764e-07, + "loss": 0.5259, + "step": 77635 + }, + { + "epoch": 1.99, + "learning_rate": 5.380005110954919e-07, + "loss": 0.5864, + "step": 77636 + }, + { + "epoch": 1.99, + "learning_rate": 5.37975970894939e-07, + "loss": 0.6431, + "step": 77637 + }, + { + "epoch": 1.99, + "learning_rate": 5.379514310481362e-07, + "loss": 0.6943, + "step": 77638 + }, + { + "epoch": 1.99, + "learning_rate": 5.379268915551028e-07, + "loss": 0.6719, + "step": 77639 + }, + { + "epoch": 1.99, + "learning_rate": 5.379023524158575e-07, + "loss": 0.5046, + "step": 77640 + }, + { + "epoch": 1.99, + "learning_rate": 5.378778136304196e-07, + "loss": 0.4834, + "step": 77641 + }, + { + "epoch": 1.99, + "learning_rate": 5.37853275198807e-07, + "loss": 0.8223, + "step": 77642 + }, + { + "epoch": 1.99, + "learning_rate": 5.378287371210389e-07, + "loss": 0.606, + "step": 77643 + }, + { + "epoch": 1.99, + "learning_rate": 5.378041993971345e-07, + "loss": 0.624, + "step": 77644 + }, + { + "epoch": 1.99, + "learning_rate": 5.377796620271118e-07, + "loss": 0.5122, + "step": 77645 + }, + { + "epoch": 1.99, + "learning_rate": 5.377551250109898e-07, + "loss": 0.6201, + "step": 77646 + }, + { + "epoch": 1.99, + "learning_rate": 5.377305883487879e-07, + "loss": 0.5781, + "step": 77647 + }, + { + "epoch": 1.99, + "learning_rate": 5.377060520405241e-07, + "loss": 0.7705, + "step": 77648 + }, + { + "epoch": 1.99, + "learning_rate": 5.376815160862179e-07, + "loss": 0.6143, + "step": 77649 + }, + { + "epoch": 1.99, + "learning_rate": 5.376569804858874e-07, + "loss": 0.438, + "step": 77650 + }, + { + "epoch": 1.99, + "learning_rate": 5.376324452395515e-07, + "loss": 0.624, + "step": 77651 + }, + { + "epoch": 1.99, + "learning_rate": 5.376079103472293e-07, + "loss": 0.6738, + "step": 77652 + }, + { + "epoch": 1.99, + "learning_rate": 5.375833758089399e-07, + "loss": 0.5078, + "step": 77653 + }, + { + "epoch": 1.99, + "learning_rate": 5.375588416247011e-07, + "loss": 0.7031, + "step": 77654 + }, + { + "epoch": 1.99, + "learning_rate": 5.375343077945323e-07, + "loss": 0.6396, + "step": 77655 + }, + { + "epoch": 1.99, + "learning_rate": 5.375097743184522e-07, + "loss": 0.6387, + "step": 77656 + }, + { + "epoch": 1.99, + "learning_rate": 5.374852411964801e-07, + "loss": 0.7529, + "step": 77657 + }, + { + "epoch": 1.99, + "learning_rate": 5.374607084286343e-07, + "loss": 0.707, + "step": 77658 + }, + { + "epoch": 1.99, + "learning_rate": 5.37436176014933e-07, + "loss": 0.7393, + "step": 77659 + }, + { + "epoch": 1.99, + "learning_rate": 5.374116439553956e-07, + "loss": 0.6846, + "step": 77660 + }, + { + "epoch": 1.99, + "learning_rate": 5.373871122500413e-07, + "loss": 0.7246, + "step": 77661 + }, + { + "epoch": 1.99, + "learning_rate": 5.37362580898888e-07, + "loss": 0.7109, + "step": 77662 + }, + { + "epoch": 1.99, + "learning_rate": 5.373380499019549e-07, + "loss": 0.6597, + "step": 77663 + }, + { + "epoch": 1.99, + "learning_rate": 5.373135192592606e-07, + "loss": 0.6025, + "step": 77664 + }, + { + "epoch": 1.99, + "learning_rate": 5.372889889708248e-07, + "loss": 0.5171, + "step": 77665 + }, + { + "epoch": 1.99, + "learning_rate": 5.372644590366648e-07, + "loss": 0.7004, + "step": 77666 + }, + { + "epoch": 1.99, + "learning_rate": 5.372399294568008e-07, + "loss": 0.449, + "step": 77667 + }, + { + "epoch": 1.99, + "learning_rate": 5.372154002312503e-07, + "loss": 0.6245, + "step": 77668 + }, + { + "epoch": 1.99, + "learning_rate": 5.371908713600328e-07, + "loss": 0.4824, + "step": 77669 + }, + { + "epoch": 1.99, + "learning_rate": 5.371663428431674e-07, + "loss": 0.4662, + "step": 77670 + }, + { + "epoch": 1.99, + "learning_rate": 5.371418146806719e-07, + "loss": 0.6396, + "step": 77671 + }, + { + "epoch": 1.99, + "learning_rate": 5.371172868725658e-07, + "loss": 0.6299, + "step": 77672 + }, + { + "epoch": 1.99, + "learning_rate": 5.370927594188676e-07, + "loss": 0.5469, + "step": 77673 + }, + { + "epoch": 1.99, + "learning_rate": 5.370682323195967e-07, + "loss": 0.6699, + "step": 77674 + }, + { + "epoch": 1.99, + "learning_rate": 5.37043705574771e-07, + "loss": 0.7949, + "step": 77675 + }, + { + "epoch": 1.99, + "learning_rate": 5.370191791844095e-07, + "loss": 0.5325, + "step": 77676 + }, + { + "epoch": 1.99, + "learning_rate": 5.369946531485316e-07, + "loss": 0.7412, + "step": 77677 + }, + { + "epoch": 1.99, + "learning_rate": 5.369701274671556e-07, + "loss": 0.6543, + "step": 77678 + }, + { + "epoch": 1.99, + "learning_rate": 5.369456021402998e-07, + "loss": 0.533, + "step": 77679 + }, + { + "epoch": 1.99, + "learning_rate": 5.369210771679835e-07, + "loss": 0.5176, + "step": 77680 + }, + { + "epoch": 1.99, + "learning_rate": 5.368965525502255e-07, + "loss": 0.4816, + "step": 77681 + }, + { + "epoch": 1.99, + "learning_rate": 5.368720282870449e-07, + "loss": 0.8022, + "step": 77682 + }, + { + "epoch": 1.99, + "learning_rate": 5.368475043784598e-07, + "loss": 0.7085, + "step": 77683 + }, + { + "epoch": 1.99, + "learning_rate": 5.368229808244891e-07, + "loss": 0.647, + "step": 77684 + }, + { + "epoch": 1.99, + "learning_rate": 5.367984576251516e-07, + "loss": 0.4319, + "step": 77685 + }, + { + "epoch": 1.99, + "learning_rate": 5.367739347804669e-07, + "loss": 0.6074, + "step": 77686 + }, + { + "epoch": 1.99, + "learning_rate": 5.36749412290453e-07, + "loss": 0.5918, + "step": 77687 + }, + { + "epoch": 1.99, + "learning_rate": 5.367248901551284e-07, + "loss": 0.7114, + "step": 77688 + }, + { + "epoch": 1.99, + "learning_rate": 5.367003683745122e-07, + "loss": 0.6924, + "step": 77689 + }, + { + "epoch": 1.99, + "learning_rate": 5.366758469486233e-07, + "loss": 0.7559, + "step": 77690 + }, + { + "epoch": 1.99, + "learning_rate": 5.366513258774807e-07, + "loss": 0.8516, + "step": 77691 + }, + { + "epoch": 1.99, + "learning_rate": 5.366268051611026e-07, + "loss": 0.6475, + "step": 77692 + }, + { + "epoch": 1.99, + "learning_rate": 5.366022847995079e-07, + "loss": 0.582, + "step": 77693 + }, + { + "epoch": 1.99, + "learning_rate": 5.365777647927157e-07, + "loss": 0.707, + "step": 77694 + }, + { + "epoch": 1.99, + "learning_rate": 5.365532451407449e-07, + "loss": 0.6616, + "step": 77695 + }, + { + "epoch": 1.99, + "learning_rate": 5.365287258436136e-07, + "loss": 0.7437, + "step": 77696 + }, + { + "epoch": 1.99, + "learning_rate": 5.365042069013413e-07, + "loss": 0.5894, + "step": 77697 + }, + { + "epoch": 1.99, + "learning_rate": 5.36479688313946e-07, + "loss": 0.6455, + "step": 77698 + }, + { + "epoch": 1.99, + "learning_rate": 5.364551700814473e-07, + "loss": 0.6426, + "step": 77699 + }, + { + "epoch": 1.99, + "learning_rate": 5.364306522038632e-07, + "loss": 0.6035, + "step": 77700 + }, + { + "epoch": 1.99, + "learning_rate": 5.364061346812128e-07, + "loss": 0.5637, + "step": 77701 + }, + { + "epoch": 1.99, + "learning_rate": 5.36381617513515e-07, + "loss": 0.5757, + "step": 77702 + }, + { + "epoch": 1.99, + "learning_rate": 5.363571007007888e-07, + "loss": 0.5801, + "step": 77703 + }, + { + "epoch": 1.99, + "learning_rate": 5.363325842430522e-07, + "loss": 0.6826, + "step": 77704 + }, + { + "epoch": 1.99, + "learning_rate": 5.363080681403245e-07, + "loss": 0.4089, + "step": 77705 + }, + { + "epoch": 1.99, + "learning_rate": 5.362835523926243e-07, + "loss": 0.5908, + "step": 77706 + }, + { + "epoch": 1.99, + "learning_rate": 5.362590369999709e-07, + "loss": 0.7139, + "step": 77707 + }, + { + "epoch": 1.99, + "learning_rate": 5.362345219623828e-07, + "loss": 0.5435, + "step": 77708 + }, + { + "epoch": 1.99, + "learning_rate": 5.362100072798778e-07, + "loss": 0.5439, + "step": 77709 + }, + { + "epoch": 1.99, + "learning_rate": 5.361854929524759e-07, + "loss": 0.479, + "step": 77710 + }, + { + "epoch": 1.99, + "learning_rate": 5.361609789801953e-07, + "loss": 0.6973, + "step": 77711 + }, + { + "epoch": 1.99, + "learning_rate": 5.361364653630552e-07, + "loss": 0.7241, + "step": 77712 + }, + { + "epoch": 1.99, + "learning_rate": 5.361119521010738e-07, + "loss": 0.6157, + "step": 77713 + }, + { + "epoch": 1.99, + "learning_rate": 5.3608743919427e-07, + "loss": 0.4366, + "step": 77714 + }, + { + "epoch": 1.99, + "learning_rate": 5.360629266426633e-07, + "loss": 0.6479, + "step": 77715 + }, + { + "epoch": 1.99, + "learning_rate": 5.360384144462714e-07, + "loss": 0.5645, + "step": 77716 + }, + { + "epoch": 1.99, + "learning_rate": 5.36013902605114e-07, + "loss": 0.5439, + "step": 77717 + }, + { + "epoch": 1.99, + "learning_rate": 5.359893911192091e-07, + "loss": 0.6641, + "step": 77718 + }, + { + "epoch": 1.99, + "learning_rate": 5.359648799885755e-07, + "loss": 0.688, + "step": 77719 + }, + { + "epoch": 1.99, + "learning_rate": 5.35940369213233e-07, + "loss": 0.6914, + "step": 77720 + }, + { + "epoch": 1.99, + "learning_rate": 5.359158587931989e-07, + "loss": 0.6855, + "step": 77721 + }, + { + "epoch": 1.99, + "learning_rate": 5.358913487284929e-07, + "loss": 0.7686, + "step": 77722 + }, + { + "epoch": 1.99, + "learning_rate": 5.358668390191334e-07, + "loss": 0.5527, + "step": 77723 + }, + { + "epoch": 1.99, + "learning_rate": 5.358423296651398e-07, + "loss": 0.5925, + "step": 77724 + }, + { + "epoch": 1.99, + "learning_rate": 5.3581782066653e-07, + "loss": 0.6768, + "step": 77725 + }, + { + "epoch": 1.99, + "learning_rate": 5.357933120233236e-07, + "loss": 0.6211, + "step": 77726 + }, + { + "epoch": 1.99, + "learning_rate": 5.357688037355385e-07, + "loss": 0.564, + "step": 77727 + }, + { + "epoch": 1.99, + "learning_rate": 5.357442958031938e-07, + "loss": 0.562, + "step": 77728 + }, + { + "epoch": 1.99, + "learning_rate": 5.357197882263087e-07, + "loss": 0.6665, + "step": 77729 + }, + { + "epoch": 1.99, + "learning_rate": 5.356952810049014e-07, + "loss": 0.7324, + "step": 77730 + }, + { + "epoch": 1.99, + "learning_rate": 5.356707741389908e-07, + "loss": 0.6885, + "step": 77731 + }, + { + "epoch": 1.99, + "learning_rate": 5.356462676285957e-07, + "loss": 0.5381, + "step": 77732 + }, + { + "epoch": 1.99, + "learning_rate": 5.356217614737353e-07, + "loss": 0.5681, + "step": 77733 + }, + { + "epoch": 1.99, + "learning_rate": 5.355972556744274e-07, + "loss": 0.5967, + "step": 77734 + }, + { + "epoch": 1.99, + "learning_rate": 5.355727502306917e-07, + "loss": 0.6846, + "step": 77735 + }, + { + "epoch": 1.99, + "learning_rate": 5.355482451425467e-07, + "loss": 0.7793, + "step": 77736 + }, + { + "epoch": 1.99, + "learning_rate": 5.355237404100111e-07, + "loss": 0.5879, + "step": 77737 + }, + { + "epoch": 1.99, + "learning_rate": 5.354992360331033e-07, + "loss": 0.4175, + "step": 77738 + }, + { + "epoch": 1.99, + "learning_rate": 5.354747320118424e-07, + "loss": 0.5781, + "step": 77739 + }, + { + "epoch": 1.99, + "learning_rate": 5.35450228346247e-07, + "loss": 0.6157, + "step": 77740 + }, + { + "epoch": 1.99, + "learning_rate": 5.354257250363366e-07, + "loss": 0.6841, + "step": 77741 + }, + { + "epoch": 1.99, + "learning_rate": 5.354012220821287e-07, + "loss": 0.7021, + "step": 77742 + }, + { + "epoch": 1.99, + "learning_rate": 5.353767194836429e-07, + "loss": 0.6846, + "step": 77743 + }, + { + "epoch": 1.99, + "learning_rate": 5.353522172408977e-07, + "loss": 0.6621, + "step": 77744 + }, + { + "epoch": 1.99, + "learning_rate": 5.353277153539124e-07, + "loss": 0.6533, + "step": 77745 + }, + { + "epoch": 1.99, + "learning_rate": 5.353032138227054e-07, + "loss": 0.3726, + "step": 77746 + }, + { + "epoch": 1.99, + "learning_rate": 5.352787126472947e-07, + "loss": 0.4663, + "step": 77747 + }, + { + "epoch": 1.99, + "learning_rate": 5.352542118277e-07, + "loss": 0.6626, + "step": 77748 + }, + { + "epoch": 1.99, + "learning_rate": 5.352297113639395e-07, + "loss": 0.4814, + "step": 77749 + }, + { + "epoch": 1.99, + "learning_rate": 5.352052112560328e-07, + "loss": 0.5896, + "step": 77750 + }, + { + "epoch": 1.99, + "learning_rate": 5.351807115039977e-07, + "loss": 0.4675, + "step": 77751 + }, + { + "epoch": 1.99, + "learning_rate": 5.351562121078534e-07, + "loss": 0.562, + "step": 77752 + }, + { + "epoch": 1.99, + "learning_rate": 5.35131713067619e-07, + "loss": 0.6699, + "step": 77753 + }, + { + "epoch": 1.99, + "learning_rate": 5.351072143833125e-07, + "loss": 0.6631, + "step": 77754 + }, + { + "epoch": 1.99, + "learning_rate": 5.350827160549528e-07, + "loss": 0.6797, + "step": 77755 + }, + { + "epoch": 1.99, + "learning_rate": 5.350582180825595e-07, + "loss": 0.6069, + "step": 77756 + }, + { + "epoch": 1.99, + "learning_rate": 5.350337204661503e-07, + "loss": 0.4756, + "step": 77757 + }, + { + "epoch": 1.99, + "learning_rate": 5.350092232057447e-07, + "loss": 0.6929, + "step": 77758 + }, + { + "epoch": 1.99, + "learning_rate": 5.349847263013609e-07, + "loss": 0.6223, + "step": 77759 + }, + { + "epoch": 1.99, + "learning_rate": 5.349602297530178e-07, + "loss": 0.5869, + "step": 77760 + }, + { + "epoch": 1.99, + "learning_rate": 5.349357335607343e-07, + "loss": 0.7295, + "step": 77761 + }, + { + "epoch": 1.99, + "learning_rate": 5.349112377245296e-07, + "loss": 0.6826, + "step": 77762 + }, + { + "epoch": 1.99, + "learning_rate": 5.348867422444216e-07, + "loss": 0.6094, + "step": 77763 + }, + { + "epoch": 1.99, + "learning_rate": 5.348622471204294e-07, + "loss": 0.5029, + "step": 77764 + }, + { + "epoch": 1.99, + "learning_rate": 5.348377523525716e-07, + "loss": 0.5737, + "step": 77765 + }, + { + "epoch": 1.99, + "learning_rate": 5.348132579408678e-07, + "loss": 0.792, + "step": 77766 + }, + { + "epoch": 1.99, + "learning_rate": 5.347887638853359e-07, + "loss": 0.7168, + "step": 77767 + }, + { + "epoch": 1.99, + "learning_rate": 5.347642701859946e-07, + "loss": 0.6973, + "step": 77768 + }, + { + "epoch": 1.99, + "learning_rate": 5.347397768428629e-07, + "loss": 0.7832, + "step": 77769 + }, + { + "epoch": 1.99, + "learning_rate": 5.347152838559598e-07, + "loss": 0.6333, + "step": 77770 + }, + { + "epoch": 1.99, + "learning_rate": 5.346907912253036e-07, + "loss": 0.6396, + "step": 77771 + }, + { + "epoch": 1.99, + "learning_rate": 5.346662989509131e-07, + "loss": 0.7285, + "step": 77772 + }, + { + "epoch": 1.99, + "learning_rate": 5.346418070328074e-07, + "loss": 0.5414, + "step": 77773 + }, + { + "epoch": 1.99, + "learning_rate": 5.346173154710054e-07, + "loss": 0.7764, + "step": 77774 + }, + { + "epoch": 1.99, + "learning_rate": 5.345928242655251e-07, + "loss": 0.8076, + "step": 77775 + }, + { + "epoch": 1.99, + "learning_rate": 5.345683334163861e-07, + "loss": 0.5205, + "step": 77776 + }, + { + "epoch": 1.99, + "learning_rate": 5.345438429236062e-07, + "loss": 0.5845, + "step": 77777 + }, + { + "epoch": 1.99, + "learning_rate": 5.345193527872049e-07, + "loss": 0.5256, + "step": 77778 + }, + { + "epoch": 1.99, + "learning_rate": 5.344948630072011e-07, + "loss": 0.6208, + "step": 77779 + }, + { + "epoch": 1.99, + "learning_rate": 5.344703735836126e-07, + "loss": 0.5669, + "step": 77780 + }, + { + "epoch": 1.99, + "learning_rate": 5.344458845164588e-07, + "loss": 0.7134, + "step": 77781 + }, + { + "epoch": 1.99, + "learning_rate": 5.344213958057584e-07, + "loss": 0.6543, + "step": 77782 + }, + { + "epoch": 1.99, + "learning_rate": 5.343969074515305e-07, + "loss": 0.6895, + "step": 77783 + }, + { + "epoch": 1.99, + "learning_rate": 5.343724194537931e-07, + "loss": 0.9097, + "step": 77784 + }, + { + "epoch": 1.99, + "learning_rate": 5.343479318125654e-07, + "loss": 0.5679, + "step": 77785 + }, + { + "epoch": 1.99, + "learning_rate": 5.343234445278664e-07, + "loss": 0.5845, + "step": 77786 + }, + { + "epoch": 1.99, + "learning_rate": 5.342989575997145e-07, + "loss": 0.5967, + "step": 77787 + }, + { + "epoch": 1.99, + "learning_rate": 5.342744710281282e-07, + "loss": 0.7021, + "step": 77788 + }, + { + "epoch": 1.99, + "learning_rate": 5.342499848131264e-07, + "loss": 0.6479, + "step": 77789 + }, + { + "epoch": 1.99, + "learning_rate": 5.342254989547281e-07, + "loss": 0.4297, + "step": 77790 + }, + { + "epoch": 1.99, + "learning_rate": 5.342010134529521e-07, + "loss": 0.4536, + "step": 77791 + }, + { + "epoch": 1.99, + "learning_rate": 5.341765283078167e-07, + "loss": 0.6719, + "step": 77792 + }, + { + "epoch": 1.99, + "learning_rate": 5.34152043519341e-07, + "loss": 0.5107, + "step": 77793 + }, + { + "epoch": 1.99, + "learning_rate": 5.341275590875435e-07, + "loss": 0.6548, + "step": 77794 + }, + { + "epoch": 1.99, + "learning_rate": 5.341030750124436e-07, + "loss": 0.6826, + "step": 77795 + }, + { + "epoch": 1.99, + "learning_rate": 5.340785912940595e-07, + "loss": 0.4045, + "step": 77796 + }, + { + "epoch": 1.99, + "learning_rate": 5.340541079324097e-07, + "loss": 0.6836, + "step": 77797 + }, + { + "epoch": 1.99, + "learning_rate": 5.340296249275131e-07, + "loss": 0.5835, + "step": 77798 + }, + { + "epoch": 1.99, + "learning_rate": 5.340051422793886e-07, + "loss": 0.668, + "step": 77799 + }, + { + "epoch": 1.99, + "learning_rate": 5.339806599880554e-07, + "loss": 0.7578, + "step": 77800 + }, + { + "epoch": 1.99, + "learning_rate": 5.339561780535314e-07, + "loss": 0.4971, + "step": 77801 + }, + { + "epoch": 1.99, + "learning_rate": 5.339316964758357e-07, + "loss": 0.3479, + "step": 77802 + }, + { + "epoch": 1.99, + "learning_rate": 5.339072152549871e-07, + "loss": 0.5264, + "step": 77803 + }, + { + "epoch": 1.99, + "learning_rate": 5.338827343910046e-07, + "loss": 0.7139, + "step": 77804 + }, + { + "epoch": 1.99, + "learning_rate": 5.338582538839065e-07, + "loss": 0.666, + "step": 77805 + }, + { + "epoch": 1.99, + "learning_rate": 5.338337737337119e-07, + "loss": 0.6143, + "step": 77806 + }, + { + "epoch": 1.99, + "learning_rate": 5.33809293940439e-07, + "loss": 0.6807, + "step": 77807 + }, + { + "epoch": 1.99, + "learning_rate": 5.337848145041073e-07, + "loss": 0.6523, + "step": 77808 + }, + { + "epoch": 1.99, + "learning_rate": 5.337603354247346e-07, + "loss": 0.6963, + "step": 77809 + }, + { + "epoch": 1.99, + "learning_rate": 5.337358567023403e-07, + "loss": 0.8076, + "step": 77810 + }, + { + "epoch": 1.99, + "learning_rate": 5.33711378336943e-07, + "loss": 0.5547, + "step": 77811 + }, + { + "epoch": 1.99, + "learning_rate": 5.336869003285617e-07, + "loss": 0.668, + "step": 77812 + }, + { + "epoch": 1.99, + "learning_rate": 5.336624226772148e-07, + "loss": 0.5579, + "step": 77813 + }, + { + "epoch": 1.99, + "learning_rate": 5.336379453829209e-07, + "loss": 0.6924, + "step": 77814 + }, + { + "epoch": 1.99, + "learning_rate": 5.336134684456992e-07, + "loss": 0.584, + "step": 77815 + }, + { + "epoch": 1.99, + "learning_rate": 5.335889918655685e-07, + "loss": 0.7041, + "step": 77816 + }, + { + "epoch": 1.99, + "learning_rate": 5.335645156425472e-07, + "loss": 0.6279, + "step": 77817 + }, + { + "epoch": 1.99, + "learning_rate": 5.335400397766539e-07, + "loss": 0.6885, + "step": 77818 + }, + { + "epoch": 1.99, + "learning_rate": 5.335155642679072e-07, + "loss": 0.6387, + "step": 77819 + }, + { + "epoch": 1.99, + "learning_rate": 5.334910891163265e-07, + "loss": 0.5029, + "step": 77820 + }, + { + "epoch": 1.99, + "learning_rate": 5.334666143219304e-07, + "loss": 0.6943, + "step": 77821 + }, + { + "epoch": 1.99, + "learning_rate": 5.334421398847373e-07, + "loss": 0.6357, + "step": 77822 + }, + { + "epoch": 1.99, + "learning_rate": 5.33417665804766e-07, + "loss": 0.5591, + "step": 77823 + }, + { + "epoch": 1.99, + "learning_rate": 5.333931920820356e-07, + "loss": 0.5303, + "step": 77824 + }, + { + "epoch": 1.99, + "learning_rate": 5.333687187165643e-07, + "loss": 0.5498, + "step": 77825 + }, + { + "epoch": 1.99, + "learning_rate": 5.333442457083715e-07, + "loss": 0.6753, + "step": 77826 + }, + { + "epoch": 1.99, + "learning_rate": 5.333197730574752e-07, + "loss": 0.5693, + "step": 77827 + }, + { + "epoch": 1.99, + "learning_rate": 5.332953007638944e-07, + "loss": 0.6855, + "step": 77828 + }, + { + "epoch": 1.99, + "learning_rate": 5.332708288276484e-07, + "loss": 0.4822, + "step": 77829 + }, + { + "epoch": 1.99, + "learning_rate": 5.332463572487551e-07, + "loss": 0.4009, + "step": 77830 + }, + { + "epoch": 1.99, + "learning_rate": 5.332218860272335e-07, + "loss": 0.6382, + "step": 77831 + }, + { + "epoch": 1.99, + "learning_rate": 5.331974151631024e-07, + "loss": 0.6963, + "step": 77832 + }, + { + "epoch": 1.99, + "learning_rate": 5.331729446563811e-07, + "loss": 0.6895, + "step": 77833 + }, + { + "epoch": 1.99, + "learning_rate": 5.331484745070873e-07, + "loss": 0.6616, + "step": 77834 + }, + { + "epoch": 1.99, + "learning_rate": 5.331240047152404e-07, + "loss": 0.666, + "step": 77835 + }, + { + "epoch": 1.99, + "learning_rate": 5.330995352808594e-07, + "loss": 0.5493, + "step": 77836 + }, + { + "epoch": 2.0, + "learning_rate": 5.33075066203962e-07, + "loss": 0.5923, + "step": 77837 + }, + { + "epoch": 2.0, + "learning_rate": 5.33050597484568e-07, + "loss": 0.6025, + "step": 77838 + }, + { + "epoch": 2.0, + "learning_rate": 5.330261291226954e-07, + "loss": 0.626, + "step": 77839 + }, + { + "epoch": 2.0, + "learning_rate": 5.330016611183632e-07, + "loss": 0.5688, + "step": 77840 + }, + { + "epoch": 2.0, + "learning_rate": 5.329771934715906e-07, + "loss": 0.7881, + "step": 77841 + }, + { + "epoch": 2.0, + "learning_rate": 5.329527261823954e-07, + "loss": 0.6357, + "step": 77842 + }, + { + "epoch": 2.0, + "learning_rate": 5.329282592507969e-07, + "loss": 0.7026, + "step": 77843 + }, + { + "epoch": 2.0, + "learning_rate": 5.329037926768136e-07, + "loss": 0.4946, + "step": 77844 + }, + { + "epoch": 2.0, + "learning_rate": 5.32879326460465e-07, + "loss": 0.5747, + "step": 77845 + }, + { + "epoch": 2.0, + "learning_rate": 5.32854860601769e-07, + "loss": 0.5571, + "step": 77846 + }, + { + "epoch": 2.0, + "learning_rate": 5.328303951007442e-07, + "loss": 0.7549, + "step": 77847 + }, + { + "epoch": 2.0, + "learning_rate": 5.328059299574098e-07, + "loss": 0.5144, + "step": 77848 + }, + { + "epoch": 2.0, + "learning_rate": 5.327814651717843e-07, + "loss": 0.792, + "step": 77849 + }, + { + "epoch": 2.0, + "learning_rate": 5.327570007438871e-07, + "loss": 0.6138, + "step": 77850 + }, + { + "epoch": 2.0, + "learning_rate": 5.327325366737359e-07, + "loss": 0.5035, + "step": 77851 + }, + { + "epoch": 2.0, + "learning_rate": 5.327080729613497e-07, + "loss": 0.8301, + "step": 77852 + }, + { + "epoch": 2.0, + "learning_rate": 5.326836096067477e-07, + "loss": 0.7725, + "step": 77853 + }, + { + "epoch": 2.0, + "learning_rate": 5.326591466099488e-07, + "loss": 0.6504, + "step": 77854 + }, + { + "epoch": 2.0, + "learning_rate": 5.326346839709708e-07, + "loss": 0.5898, + "step": 77855 + }, + { + "epoch": 2.0, + "learning_rate": 5.326102216898334e-07, + "loss": 0.7393, + "step": 77856 + }, + { + "epoch": 2.0, + "learning_rate": 5.325857597665544e-07, + "loss": 0.5576, + "step": 77857 + }, + { + "epoch": 2.0, + "learning_rate": 5.325612982011534e-07, + "loss": 0.6865, + "step": 77858 + }, + { + "epoch": 2.0, + "learning_rate": 5.325368369936483e-07, + "loss": 0.6208, + "step": 77859 + }, + { + "epoch": 2.0, + "learning_rate": 5.325123761440583e-07, + "loss": 0.6553, + "step": 77860 + }, + { + "epoch": 2.0, + "learning_rate": 5.32487915652402e-07, + "loss": 0.563, + "step": 77861 + }, + { + "epoch": 2.0, + "learning_rate": 5.324634555186986e-07, + "loss": 0.668, + "step": 77862 + }, + { + "epoch": 2.0, + "learning_rate": 5.324389957429662e-07, + "loss": 0.7969, + "step": 77863 + }, + { + "epoch": 2.0, + "learning_rate": 5.324145363252237e-07, + "loss": 0.501, + "step": 77864 + }, + { + "epoch": 2.0, + "learning_rate": 5.323900772654899e-07, + "loss": 0.6748, + "step": 77865 + }, + { + "epoch": 2.0, + "learning_rate": 5.323656185637837e-07, + "loss": 0.582, + "step": 77866 + }, + { + "epoch": 2.0, + "learning_rate": 5.323411602201238e-07, + "loss": 0.7529, + "step": 77867 + }, + { + "epoch": 2.0, + "learning_rate": 5.323167022345285e-07, + "loss": 0.6553, + "step": 77868 + }, + { + "epoch": 2.0, + "learning_rate": 5.322922446070166e-07, + "loss": 0.5688, + "step": 77869 + }, + { + "epoch": 2.0, + "learning_rate": 5.322677873376071e-07, + "loss": 0.5898, + "step": 77870 + }, + { + "epoch": 2.0, + "learning_rate": 5.322433304263191e-07, + "loss": 0.6797, + "step": 77871 + }, + { + "epoch": 2.0, + "learning_rate": 5.322188738731703e-07, + "loss": 0.5088, + "step": 77872 + }, + { + "epoch": 2.0, + "learning_rate": 5.321944176781801e-07, + "loss": 0.6104, + "step": 77873 + }, + { + "epoch": 2.0, + "learning_rate": 5.321699618413673e-07, + "loss": 0.5356, + "step": 77874 + }, + { + "epoch": 2.0, + "learning_rate": 5.321455063627507e-07, + "loss": 0.4834, + "step": 77875 + }, + { + "epoch": 2.0, + "learning_rate": 5.321210512423486e-07, + "loss": 0.5139, + "step": 77876 + }, + { + "epoch": 2.0, + "learning_rate": 5.320965964801798e-07, + "loss": 0.5737, + "step": 77877 + }, + { + "epoch": 2.0, + "learning_rate": 5.320721420762629e-07, + "loss": 0.5469, + "step": 77878 + }, + { + "epoch": 2.0, + "learning_rate": 5.320476880306173e-07, + "loss": 0.5881, + "step": 77879 + }, + { + "epoch": 2.0, + "learning_rate": 5.320232343432609e-07, + "loss": 0.7422, + "step": 77880 + }, + { + "epoch": 2.0, + "learning_rate": 5.319987810142128e-07, + "loss": 0.6777, + "step": 77881 + }, + { + "epoch": 2.0, + "learning_rate": 5.319743280434917e-07, + "loss": 0.5546, + "step": 77882 + }, + { + "epoch": 2.0, + "learning_rate": 5.319498754311167e-07, + "loss": 0.624, + "step": 77883 + }, + { + "epoch": 2.0, + "learning_rate": 5.319254231771058e-07, + "loss": 0.623, + "step": 77884 + }, + { + "epoch": 2.0, + "learning_rate": 5.319009712814781e-07, + "loss": 0.6318, + "step": 77885 + }, + { + "epoch": 2.0, + "learning_rate": 5.318765197442527e-07, + "loss": 0.5859, + "step": 77886 + }, + { + "epoch": 2.0, + "learning_rate": 5.318520685654475e-07, + "loss": 0.5762, + "step": 77887 + }, + { + "epoch": 2.0, + "learning_rate": 5.31827617745082e-07, + "loss": 0.5381, + "step": 77888 + }, + { + "epoch": 2.0, + "learning_rate": 5.318031672831742e-07, + "loss": 0.5127, + "step": 77889 + }, + { + "epoch": 2.0, + "learning_rate": 5.317787171797432e-07, + "loss": 0.5723, + "step": 77890 + }, + { + "epoch": 2.0, + "learning_rate": 5.317542674348078e-07, + "loss": 0.749, + "step": 77891 + }, + { + "epoch": 2.0, + "learning_rate": 5.31729818048387e-07, + "loss": 0.6245, + "step": 77892 + }, + { + "epoch": 2.0, + "learning_rate": 5.317053690204985e-07, + "loss": 0.6758, + "step": 77893 + }, + { + "epoch": 2.0, + "learning_rate": 5.316809203511618e-07, + "loss": 0.5664, + "step": 77894 + }, + { + "epoch": 2.0, + "learning_rate": 5.316564720403956e-07, + "loss": 0.5298, + "step": 77895 + }, + { + "epoch": 2.0, + "learning_rate": 5.316320240882193e-07, + "loss": 0.6416, + "step": 77896 + }, + { + "epoch": 2.0, + "learning_rate": 5.3160757649465e-07, + "loss": 0.437, + "step": 77897 + }, + { + "epoch": 2.0, + "learning_rate": 5.315831292597072e-07, + "loss": 0.707, + "step": 77898 + }, + { + "epoch": 2.0, + "learning_rate": 5.315586823834096e-07, + "loss": 0.5288, + "step": 77899 + }, + { + "epoch": 2.0, + "learning_rate": 5.315342358657764e-07, + "loss": 0.5352, + "step": 77900 + }, + { + "epoch": 2.0, + "learning_rate": 5.315097897068255e-07, + "loss": 0.4922, + "step": 77901 + }, + { + "epoch": 2.0, + "learning_rate": 5.314853439065761e-07, + "loss": 0.6973, + "step": 77902 + }, + { + "epoch": 2.0, + "learning_rate": 5.314608984650469e-07, + "loss": 0.3765, + "step": 77903 + }, + { + "epoch": 2.0, + "learning_rate": 5.314364533822566e-07, + "loss": 0.6943, + "step": 77904 + }, + { + "epoch": 2.0, + "learning_rate": 5.314120086582237e-07, + "loss": 0.5933, + "step": 77905 + }, + { + "epoch": 2.0, + "learning_rate": 5.313875642929675e-07, + "loss": 0.3682, + "step": 77906 + }, + { + "epoch": 2.0, + "learning_rate": 5.313631202865059e-07, + "loss": 0.6025, + "step": 77907 + }, + { + "epoch": 2.0, + "learning_rate": 5.313386766388579e-07, + "loss": 0.6226, + "step": 77908 + }, + { + "epoch": 2.0, + "learning_rate": 5.313142333500429e-07, + "loss": 0.5596, + "step": 77909 + }, + { + "epoch": 2.0, + "learning_rate": 5.312897904200785e-07, + "loss": 0.5249, + "step": 77910 + }, + { + "epoch": 2.0, + "learning_rate": 5.31265347848984e-07, + "loss": 0.4507, + "step": 77911 + }, + { + "epoch": 2.0, + "learning_rate": 5.31240905636778e-07, + "loss": 0.6758, + "step": 77912 + }, + { + "epoch": 2.0, + "learning_rate": 5.312164637834797e-07, + "loss": 0.5771, + "step": 77913 + }, + { + "epoch": 2.0, + "learning_rate": 5.311920222891071e-07, + "loss": 0.6177, + "step": 77914 + }, + { + "epoch": 2.0, + "learning_rate": 5.311675811536791e-07, + "loss": 0.667, + "step": 77915 + }, + { + "epoch": 2.0, + "learning_rate": 5.311431403772151e-07, + "loss": 0.5938, + "step": 77916 + }, + { + "epoch": 2.0, + "learning_rate": 5.311186999597331e-07, + "loss": 0.7441, + "step": 77917 + }, + { + "epoch": 2.0, + "learning_rate": 5.310942599012515e-07, + "loss": 0.5164, + "step": 77918 + }, + { + "epoch": 2.0, + "learning_rate": 5.310698202017896e-07, + "loss": 0.6855, + "step": 77919 + }, + { + "epoch": 2.0, + "learning_rate": 5.310453808613659e-07, + "loss": 0.4844, + "step": 77920 + }, + { + "epoch": 2.0, + "learning_rate": 5.310209418799996e-07, + "loss": 0.7261, + "step": 77921 + }, + { + "epoch": 2.0, + "learning_rate": 5.309965032577086e-07, + "loss": 0.5583, + "step": 77922 + }, + { + "epoch": 2.0, + "learning_rate": 5.309720649945119e-07, + "loss": 0.5669, + "step": 77923 + }, + { + "epoch": 2.0, + "learning_rate": 5.309476270904285e-07, + "loss": 0.4583, + "step": 77924 + }, + { + "epoch": 2.0, + "learning_rate": 5.309231895454773e-07, + "loss": 0.5864, + "step": 77925 + }, + { + "epoch": 2.0, + "learning_rate": 5.308987523596767e-07, + "loss": 0.5811, + "step": 77926 + }, + { + "epoch": 2.0, + "learning_rate": 5.308743155330449e-07, + "loss": 0.7334, + "step": 77927 + }, + { + "epoch": 2.0, + "learning_rate": 5.308498790656009e-07, + "loss": 0.5996, + "step": 77928 + }, + { + "epoch": 2.0, + "learning_rate": 5.308254429573638e-07, + "loss": 0.7246, + "step": 77929 + }, + { + "epoch": 2.0, + "learning_rate": 5.308010072083523e-07, + "loss": 0.3831, + "step": 77930 + }, + { + "epoch": 2.0, + "learning_rate": 5.307765718185846e-07, + "loss": 0.6221, + "step": 77931 + }, + { + "epoch": 2.0, + "learning_rate": 5.307521367880796e-07, + "loss": 0.5891, + "step": 77932 + }, + { + "epoch": 2.0, + "learning_rate": 5.307277021168567e-07, + "loss": 0.6377, + "step": 77933 + }, + { + "epoch": 2.0, + "learning_rate": 5.307032678049335e-07, + "loss": 0.52, + "step": 77934 + }, + { + "epoch": 2.0, + "learning_rate": 5.306788338523294e-07, + "loss": 0.5801, + "step": 77935 + }, + { + "epoch": 2.0, + "learning_rate": 5.30654400259063e-07, + "loss": 0.7056, + "step": 77936 + }, + { + "epoch": 2.0, + "learning_rate": 5.306299670251529e-07, + "loss": 0.5796, + "step": 77937 + }, + { + "epoch": 2.0, + "learning_rate": 5.306055341506179e-07, + "loss": 0.6011, + "step": 77938 + }, + { + "epoch": 2.0, + "learning_rate": 5.305811016354765e-07, + "loss": 0.5596, + "step": 77939 + }, + { + "epoch": 2.0, + "learning_rate": 5.305566694797476e-07, + "loss": 0.644, + "step": 77940 + }, + { + "epoch": 2.0, + "learning_rate": 5.305322376834498e-07, + "loss": 0.7285, + "step": 77941 + }, + { + "epoch": 2.0, + "learning_rate": 5.305078062466022e-07, + "loss": 0.6133, + "step": 77942 + }, + { + "epoch": 2.0, + "learning_rate": 5.304833751692228e-07, + "loss": 0.6147, + "step": 77943 + }, + { + "epoch": 2.0, + "learning_rate": 5.304589444513308e-07, + "loss": 0.5122, + "step": 77944 + }, + { + "epoch": 2.0, + "learning_rate": 5.304345140929447e-07, + "loss": 0.5391, + "step": 77945 + }, + { + "epoch": 2.0, + "learning_rate": 5.304100840940837e-07, + "loss": 0.7666, + "step": 77946 + }, + { + "epoch": 2.0, + "learning_rate": 5.303856544547663e-07, + "loss": 0.7588, + "step": 77947 + }, + { + "epoch": 2.0, + "learning_rate": 5.303612251750103e-07, + "loss": 0.5664, + "step": 77948 + }, + { + "epoch": 2.0, + "learning_rate": 5.303367962548353e-07, + "loss": 0.5894, + "step": 77949 + }, + { + "epoch": 2.0, + "learning_rate": 5.303123676942603e-07, + "loss": 0.502, + "step": 77950 + }, + { + "epoch": 2.0, + "learning_rate": 5.30287939493303e-07, + "loss": 0.7266, + "step": 77951 + }, + { + "epoch": 2.0, + "learning_rate": 5.302635116519827e-07, + "loss": 0.7148, + "step": 77952 + }, + { + "epoch": 2.0, + "learning_rate": 5.302390841703179e-07, + "loss": 0.5723, + "step": 77953 + }, + { + "epoch": 2.0, + "learning_rate": 5.302146570483279e-07, + "loss": 0.6362, + "step": 77954 + }, + { + "epoch": 2.0, + "learning_rate": 5.301902302860306e-07, + "loss": 0.5718, + "step": 77955 + }, + { + "epoch": 2.0, + "learning_rate": 5.301658038834454e-07, + "loss": 0.7017, + "step": 77956 + }, + { + "epoch": 2.0, + "learning_rate": 5.301413778405901e-07, + "loss": 0.7026, + "step": 77957 + }, + { + "epoch": 2.0, + "learning_rate": 5.301169521574841e-07, + "loss": 0.5894, + "step": 77958 + }, + { + "epoch": 2.0, + "learning_rate": 5.300925268341463e-07, + "loss": 0.8467, + "step": 77959 + }, + { + "epoch": 2.0, + "learning_rate": 5.300681018705946e-07, + "loss": 0.7046, + "step": 77960 + }, + { + "epoch": 2.0, + "learning_rate": 5.300436772668481e-07, + "loss": 0.5105, + "step": 77961 + }, + { + "epoch": 2.0, + "learning_rate": 5.300192530229258e-07, + "loss": 0.624, + "step": 77962 + }, + { + "epoch": 2.0, + "learning_rate": 5.299948291388463e-07, + "loss": 0.6455, + "step": 77963 + }, + { + "epoch": 2.0, + "learning_rate": 5.299704056146279e-07, + "loss": 0.7393, + "step": 77964 + }, + { + "epoch": 2.0, + "learning_rate": 5.299459824502894e-07, + "loss": 0.7393, + "step": 77965 + }, + { + "epoch": 2.0, + "learning_rate": 5.299215596458502e-07, + "loss": 0.4507, + "step": 77966 + }, + { + "epoch": 2.0, + "learning_rate": 5.298971372013283e-07, + "loss": 0.582, + "step": 77967 + }, + { + "epoch": 2.0, + "learning_rate": 5.298727151167423e-07, + "loss": 0.5176, + "step": 77968 + }, + { + "epoch": 2.0, + "learning_rate": 5.298482933921111e-07, + "loss": 0.7246, + "step": 77969 + }, + { + "epoch": 2.0, + "learning_rate": 5.298238720274535e-07, + "loss": 0.707, + "step": 77970 + }, + { + "epoch": 2.0, + "learning_rate": 5.297994510227884e-07, + "loss": 0.6196, + "step": 77971 + }, + { + "epoch": 2.0, + "learning_rate": 5.297750303781339e-07, + "loss": 0.4736, + "step": 77972 + }, + { + "epoch": 2.0, + "learning_rate": 5.297506100935089e-07, + "loss": 0.5908, + "step": 77973 + }, + { + "epoch": 2.0, + "learning_rate": 5.297261901689325e-07, + "loss": 0.7344, + "step": 77974 + }, + { + "epoch": 2.0, + "learning_rate": 5.297017706044234e-07, + "loss": 0.5977, + "step": 77975 + }, + { + "epoch": 2.0, + "learning_rate": 5.296773514000001e-07, + "loss": 0.5825, + "step": 77976 + }, + { + "epoch": 2.0, + "learning_rate": 5.296529325556806e-07, + "loss": 0.5464, + "step": 77977 + }, + { + "epoch": 2.0, + "learning_rate": 5.296285140714845e-07, + "loss": 0.6992, + "step": 77978 + }, + { + "epoch": 2.0, + "learning_rate": 5.296040959474302e-07, + "loss": 0.6616, + "step": 77979 + }, + { + "epoch": 2.0, + "learning_rate": 5.295796781835366e-07, + "loss": 0.6694, + "step": 77980 + }, + { + "epoch": 2.0, + "learning_rate": 5.295552607798219e-07, + "loss": 0.6875, + "step": 77981 + }, + { + "epoch": 2.0, + "learning_rate": 5.29530843736305e-07, + "loss": 0.5757, + "step": 77982 + }, + { + "epoch": 2.0, + "learning_rate": 5.29506427053005e-07, + "loss": 0.6685, + "step": 77983 + }, + { + "epoch": 2.0, + "learning_rate": 5.294820107299405e-07, + "loss": 0.604, + "step": 77984 + }, + { + "epoch": 2.0, + "learning_rate": 5.294575947671296e-07, + "loss": 0.6211, + "step": 77985 + }, + { + "epoch": 2.0, + "learning_rate": 5.294331791645919e-07, + "loss": 0.5271, + "step": 77986 + }, + { + "epoch": 2.0, + "learning_rate": 5.29408763922345e-07, + "loss": 0.583, + "step": 77987 + }, + { + "epoch": 2.0, + "learning_rate": 5.293843490404086e-07, + "loss": 0.7217, + "step": 77988 + }, + { + "epoch": 2.0, + "learning_rate": 5.293599345188007e-07, + "loss": 0.5024, + "step": 77989 + }, + { + "epoch": 2.0, + "learning_rate": 5.293355203575402e-07, + "loss": 0.645, + "step": 77990 + }, + { + "epoch": 2.0, + "learning_rate": 5.293111065566458e-07, + "loss": 0.7148, + "step": 77991 + }, + { + "epoch": 2.0, + "learning_rate": 5.292866931161367e-07, + "loss": 0.835, + "step": 77992 + }, + { + "epoch": 2.0, + "learning_rate": 5.292622800360306e-07, + "loss": 0.6465, + "step": 77993 + }, + { + "epoch": 2.0, + "learning_rate": 5.292378673163469e-07, + "loss": 0.709, + "step": 77994 + }, + { + "epoch": 2.0, + "learning_rate": 5.292134549571039e-07, + "loss": 0.7129, + "step": 77995 + }, + { + "epoch": 2.0, + "learning_rate": 5.291890429583211e-07, + "loss": 0.8311, + "step": 77996 + }, + { + "epoch": 2.0, + "learning_rate": 5.291646313200165e-07, + "loss": 0.3918, + "step": 77997 + }, + { + "epoch": 2.0, + "learning_rate": 5.291402200422086e-07, + "loss": 0.6187, + "step": 77998 + }, + { + "epoch": 2.0, + "learning_rate": 5.291158091249164e-07, + "loss": 0.6047, + "step": 77999 + }, + { + "epoch": 2.0, + "learning_rate": 5.290913985681584e-07, + "loss": 0.4841, + "step": 78000 + }, + { + "epoch": 2.0, + "learning_rate": 5.29066988371954e-07, + "loss": 0.6318, + "step": 78001 + }, + { + "epoch": 2.0, + "learning_rate": 5.290425785363209e-07, + "loss": 0.6235, + "step": 78002 + }, + { + "epoch": 2.0, + "learning_rate": 5.290181690612783e-07, + "loss": 0.7383, + "step": 78003 + }, + { + "epoch": 2.0, + "learning_rate": 5.289937599468452e-07, + "loss": 0.6357, + "step": 78004 + }, + { + "epoch": 2.0, + "learning_rate": 5.289693511930396e-07, + "loss": 0.6973, + "step": 78005 + }, + { + "epoch": 2.0, + "learning_rate": 5.289449427998806e-07, + "loss": 0.7168, + "step": 78006 + }, + { + "epoch": 2.0, + "learning_rate": 5.289205347673867e-07, + "loss": 0.5439, + "step": 78007 + }, + { + "epoch": 2.0, + "learning_rate": 5.288961270955766e-07, + "loss": 0.6318, + "step": 78008 + }, + { + "epoch": 2.0, + "learning_rate": 5.288717197844695e-07, + "loss": 0.6797, + "step": 78009 + }, + { + "epoch": 2.0, + "learning_rate": 5.288473128340833e-07, + "loss": 0.7441, + "step": 78010 + }, + { + "epoch": 2.0, + "learning_rate": 5.28822906244437e-07, + "loss": 0.4835, + "step": 78011 + }, + { + "epoch": 2.0, + "learning_rate": 5.287985000155493e-07, + "loss": 0.6924, + "step": 78012 + }, + { + "epoch": 2.0, + "learning_rate": 5.287740941474394e-07, + "loss": 0.6274, + "step": 78013 + }, + { + "epoch": 2.0, + "learning_rate": 5.287496886401251e-07, + "loss": 0.6543, + "step": 78014 + }, + { + "epoch": 2.0, + "learning_rate": 5.287252834936253e-07, + "loss": 0.688, + "step": 78015 + }, + { + "epoch": 2.0, + "learning_rate": 5.287008787079595e-07, + "loss": 0.6445, + "step": 78016 + }, + { + "epoch": 2.0, + "learning_rate": 5.286764742831453e-07, + "loss": 0.3557, + "step": 78017 + }, + { + "epoch": 2.0, + "learning_rate": 5.286520702192022e-07, + "loss": 0.5977, + "step": 78018 + }, + { + "epoch": 2.0, + "learning_rate": 5.286276665161482e-07, + "loss": 0.5996, + "step": 78019 + }, + { + "epoch": 2.0, + "learning_rate": 5.286032631740023e-07, + "loss": 0.5674, + "step": 78020 + }, + { + "epoch": 2.0, + "learning_rate": 5.285788601927836e-07, + "loss": 0.6108, + "step": 78021 + }, + { + "epoch": 2.0, + "learning_rate": 5.285544575725101e-07, + "loss": 0.6543, + "step": 78022 + }, + { + "epoch": 2.0, + "learning_rate": 5.285300553132006e-07, + "loss": 0.5542, + "step": 78023 + }, + { + "epoch": 2.0, + "learning_rate": 5.28505653414874e-07, + "loss": 0.7598, + "step": 78024 + }, + { + "epoch": 2.0, + "learning_rate": 5.284812518775494e-07, + "loss": 0.8291, + "step": 78025 + }, + { + "epoch": 2.0, + "learning_rate": 5.28456850701245e-07, + "loss": 0.707, + "step": 78026 + }, + { + "epoch": 2.0, + "learning_rate": 5.284324498859792e-07, + "loss": 0.7422, + "step": 78027 + }, + { + "epoch": 2.0, + "learning_rate": 5.284080494317709e-07, + "loss": 0.7637, + "step": 78028 + }, + { + "epoch": 2.0, + "learning_rate": 5.283836493386388e-07, + "loss": 0.7324, + "step": 78029 + }, + { + "epoch": 2.0, + "learning_rate": 5.283592496066021e-07, + "loss": 0.6748, + "step": 78030 + }, + { + "epoch": 2.0, + "learning_rate": 5.283348502356785e-07, + "loss": 0.6123, + "step": 78031 + }, + { + "epoch": 2.0, + "learning_rate": 5.283104512258876e-07, + "loss": 0.6738, + "step": 78032 + }, + { + "epoch": 2.0, + "learning_rate": 5.282860525772474e-07, + "loss": 0.4316, + "step": 78033 + }, + { + "epoch": 2.0, + "learning_rate": 5.282616542897773e-07, + "loss": 0.5317, + "step": 78034 + }, + { + "epoch": 2.0, + "learning_rate": 5.282372563634957e-07, + "loss": 0.2528, + "step": 78035 + }, + { + "epoch": 2.0, + "learning_rate": 5.282128587984207e-07, + "loss": 0.4692, + "step": 78036 + }, + { + "epoch": 2.0, + "learning_rate": 5.281884615945713e-07, + "loss": 0.4561, + "step": 78037 + }, + { + "epoch": 2.0, + "learning_rate": 5.281640647519667e-07, + "loss": 0.3325, + "step": 78038 + }, + { + "epoch": 2.0, + "learning_rate": 5.28139668270625e-07, + "loss": 0.4868, + "step": 78039 + }, + { + "epoch": 2.0, + "learning_rate": 5.281152721505649e-07, + "loss": 0.491, + "step": 78040 + }, + { + "epoch": 2.0, + "learning_rate": 5.280908763918053e-07, + "loss": 0.3757, + "step": 78041 + }, + { + "epoch": 2.0, + "learning_rate": 5.280664809943651e-07, + "loss": 0.4419, + "step": 78042 + }, + { + "epoch": 2.0, + "learning_rate": 5.280420859582624e-07, + "loss": 0.298, + "step": 78043 + }, + { + "epoch": 2.0, + "learning_rate": 5.280176912835161e-07, + "loss": 0.603, + "step": 78044 + }, + { + "epoch": 2.0, + "learning_rate": 5.279932969701454e-07, + "loss": 0.4521, + "step": 78045 + }, + { + "epoch": 2.0, + "learning_rate": 5.279689030181681e-07, + "loss": 0.4775, + "step": 78046 + }, + { + "epoch": 2.0, + "learning_rate": 5.279445094276038e-07, + "loss": 0.3804, + "step": 78047 + }, + { + "epoch": 2.0, + "learning_rate": 5.279201161984701e-07, + "loss": 0.5171, + "step": 78048 + }, + { + "epoch": 2.0, + "learning_rate": 5.278957233307864e-07, + "loss": 0.4331, + "step": 78049 + }, + { + "epoch": 2.0, + "learning_rate": 5.278713308245713e-07, + "loss": 0.519, + "step": 78050 + }, + { + "epoch": 2.0, + "learning_rate": 5.278469386798436e-07, + "loss": 0.4927, + "step": 78051 + }, + { + "epoch": 2.0, + "learning_rate": 5.278225468966215e-07, + "loss": 0.5303, + "step": 78052 + }, + { + "epoch": 2.0, + "learning_rate": 5.27798155474924e-07, + "loss": 0.5957, + "step": 78053 + }, + { + "epoch": 2.0, + "learning_rate": 5.277737644147698e-07, + "loss": 0.448, + "step": 78054 + }, + { + "epoch": 2.0, + "learning_rate": 5.277493737161782e-07, + "loss": 0.4421, + "step": 78055 + }, + { + "epoch": 2.0, + "learning_rate": 5.277249833791664e-07, + "loss": 0.4062, + "step": 78056 + }, + { + "epoch": 2.0, + "learning_rate": 5.277005934037539e-07, + "loss": 0.4736, + "step": 78057 + }, + { + "epoch": 2.0, + "learning_rate": 5.276762037899594e-07, + "loss": 0.5078, + "step": 78058 + }, + { + "epoch": 2.0, + "learning_rate": 5.276518145378017e-07, + "loss": 0.5005, + "step": 78059 + }, + { + "epoch": 2.0, + "learning_rate": 5.27627425647299e-07, + "loss": 0.4453, + "step": 78060 + }, + { + "epoch": 2.0, + "learning_rate": 5.276030371184703e-07, + "loss": 0.5425, + "step": 78061 + }, + { + "epoch": 2.0, + "learning_rate": 5.275786489513343e-07, + "loss": 0.5029, + "step": 78062 + }, + { + "epoch": 2.0, + "learning_rate": 5.275542611459098e-07, + "loss": 0.4268, + "step": 78063 + }, + { + "epoch": 2.0, + "learning_rate": 5.275298737022152e-07, + "loss": 0.4824, + "step": 78064 + }, + { + "epoch": 2.0, + "learning_rate": 5.275054866202692e-07, + "loss": 0.4678, + "step": 78065 + }, + { + "epoch": 2.0, + "learning_rate": 5.274810999000905e-07, + "loss": 0.4834, + "step": 78066 + }, + { + "epoch": 2.0, + "learning_rate": 5.274567135416976e-07, + "loss": 0.4829, + "step": 78067 + }, + { + "epoch": 2.0, + "learning_rate": 5.274323275451099e-07, + "loss": 0.4746, + "step": 78068 + }, + { + "epoch": 2.0, + "learning_rate": 5.274079419103451e-07, + "loss": 0.3428, + "step": 78069 + }, + { + "epoch": 2.0, + "learning_rate": 5.273835566374222e-07, + "loss": 0.4971, + "step": 78070 + }, + { + "epoch": 2.0, + "learning_rate": 5.273591717263601e-07, + "loss": 0.4116, + "step": 78071 + }, + { + "epoch": 2.0, + "learning_rate": 5.273347871771777e-07, + "loss": 0.4033, + "step": 78072 + }, + { + "epoch": 2.0, + "learning_rate": 5.273104029898929e-07, + "loss": 0.4004, + "step": 78073 + }, + { + "epoch": 2.0, + "learning_rate": 5.272860191645249e-07, + "loss": 0.3368, + "step": 78074 + }, + { + "epoch": 2.0, + "learning_rate": 5.272616357010926e-07, + "loss": 0.4941, + "step": 78075 + }, + { + "epoch": 2.0, + "learning_rate": 5.272372525996142e-07, + "loss": 0.4116, + "step": 78076 + }, + { + "epoch": 2.0, + "learning_rate": 5.272128698601083e-07, + "loss": 0.3885, + "step": 78077 + }, + { + "epoch": 2.0, + "learning_rate": 5.271884874825936e-07, + "loss": 0.4219, + "step": 78078 + }, + { + "epoch": 2.0, + "learning_rate": 5.27164105467089e-07, + "loss": 0.3994, + "step": 78079 + }, + { + "epoch": 2.0, + "learning_rate": 5.271397238136135e-07, + "loss": 0.4431, + "step": 78080 + }, + { + "epoch": 2.0, + "learning_rate": 5.271153425221851e-07, + "loss": 0.3655, + "step": 78081 + }, + { + "epoch": 2.0, + "learning_rate": 5.270909615928225e-07, + "loss": 0.4717, + "step": 78082 + }, + { + "epoch": 2.0, + "learning_rate": 5.270665810255448e-07, + "loss": 0.4053, + "step": 78083 + }, + { + "epoch": 2.0, + "learning_rate": 5.270422008203708e-07, + "loss": 0.2834, + "step": 78084 + }, + { + "epoch": 2.0, + "learning_rate": 5.270178209773188e-07, + "loss": 0.3918, + "step": 78085 + }, + { + "epoch": 2.0, + "learning_rate": 5.269934414964073e-07, + "loss": 0.4204, + "step": 78086 + }, + { + "epoch": 2.0, + "learning_rate": 5.269690623776548e-07, + "loss": 0.4399, + "step": 78087 + }, + { + "epoch": 2.0, + "learning_rate": 5.269446836210807e-07, + "loss": 0.397, + "step": 78088 + }, + { + "epoch": 2.0, + "learning_rate": 5.269203052267034e-07, + "loss": 0.3647, + "step": 78089 + }, + { + "epoch": 2.0, + "learning_rate": 5.268959271945413e-07, + "loss": 0.5059, + "step": 78090 + }, + { + "epoch": 2.0, + "learning_rate": 5.268715495246133e-07, + "loss": 0.481, + "step": 78091 + }, + { + "epoch": 2.0, + "learning_rate": 5.268471722169377e-07, + "loss": 0.3955, + "step": 78092 + }, + { + "epoch": 2.0, + "learning_rate": 5.268227952715341e-07, + "loss": 0.3887, + "step": 78093 + }, + { + "epoch": 2.0, + "learning_rate": 5.267984186884201e-07, + "loss": 0.4668, + "step": 78094 + }, + { + "epoch": 2.0, + "learning_rate": 5.267740424676151e-07, + "loss": 0.4087, + "step": 78095 + }, + { + "epoch": 2.0, + "learning_rate": 5.267496666091371e-07, + "loss": 0.4761, + "step": 78096 + }, + { + "epoch": 2.0, + "learning_rate": 5.267252911130054e-07, + "loss": 0.3792, + "step": 78097 + }, + { + "epoch": 2.0, + "learning_rate": 5.267009159792382e-07, + "loss": 0.4546, + "step": 78098 + }, + { + "epoch": 2.0, + "learning_rate": 5.266765412078542e-07, + "loss": 0.2788, + "step": 78099 + }, + { + "epoch": 2.0, + "learning_rate": 5.266521667988723e-07, + "loss": 0.501, + "step": 78100 + }, + { + "epoch": 2.0, + "learning_rate": 5.266277927523114e-07, + "loss": 0.4751, + "step": 78101 + }, + { + "epoch": 2.0, + "learning_rate": 5.266034190681894e-07, + "loss": 0.355, + "step": 78102 + }, + { + "epoch": 2.0, + "learning_rate": 5.265790457465256e-07, + "loss": 0.3735, + "step": 78103 + }, + { + "epoch": 2.0, + "learning_rate": 5.265546727873383e-07, + "loss": 0.2698, + "step": 78104 + }, + { + "epoch": 2.0, + "learning_rate": 5.265303001906468e-07, + "loss": 0.3696, + "step": 78105 + }, + { + "epoch": 2.0, + "learning_rate": 5.26505927956469e-07, + "loss": 0.3317, + "step": 78106 + }, + { + "epoch": 2.0, + "learning_rate": 5.264815560848236e-07, + "loss": 0.3982, + "step": 78107 + }, + { + "epoch": 2.0, + "learning_rate": 5.264571845757297e-07, + "loss": 0.4165, + "step": 78108 + }, + { + "epoch": 2.0, + "learning_rate": 5.264328134292055e-07, + "loss": 0.4966, + "step": 78109 + }, + { + "epoch": 2.0, + "learning_rate": 5.264084426452705e-07, + "loss": 0.4023, + "step": 78110 + }, + { + "epoch": 2.0, + "learning_rate": 5.263840722239424e-07, + "loss": 0.439, + "step": 78111 + }, + { + "epoch": 2.0, + "learning_rate": 5.2635970216524e-07, + "loss": 0.4658, + "step": 78112 + }, + { + "epoch": 2.0, + "learning_rate": 5.263353324691829e-07, + "loss": 0.4307, + "step": 78113 + }, + { + "epoch": 2.0, + "learning_rate": 5.263109631357884e-07, + "loss": 0.4531, + "step": 78114 + }, + { + "epoch": 2.0, + "learning_rate": 5.262865941650763e-07, + "loss": 0.3076, + "step": 78115 + }, + { + "epoch": 2.0, + "learning_rate": 5.262622255570644e-07, + "loss": 0.3187, + "step": 78116 + }, + { + "epoch": 2.0, + "learning_rate": 5.262378573117717e-07, + "loss": 0.5376, + "step": 78117 + }, + { + "epoch": 2.0, + "learning_rate": 5.262134894292174e-07, + "loss": 0.302, + "step": 78118 + }, + { + "epoch": 2.0, + "learning_rate": 5.26189121909419e-07, + "loss": 0.4541, + "step": 78119 + }, + { + "epoch": 2.0, + "learning_rate": 5.26164754752396e-07, + "loss": 0.3804, + "step": 78120 + }, + { + "epoch": 2.0, + "learning_rate": 5.261403879581668e-07, + "loss": 0.4678, + "step": 78121 + }, + { + "epoch": 2.0, + "learning_rate": 5.261160215267506e-07, + "loss": 0.2551, + "step": 78122 + }, + { + "epoch": 2.0, + "learning_rate": 5.260916554581651e-07, + "loss": 0.4377, + "step": 78123 + }, + { + "epoch": 2.0, + "learning_rate": 5.260672897524294e-07, + "loss": 0.4534, + "step": 78124 + }, + { + "epoch": 2.0, + "learning_rate": 5.260429244095625e-07, + "loss": 0.5771, + "step": 78125 + }, + { + "epoch": 2.0, + "learning_rate": 5.260185594295825e-07, + "loss": 0.4453, + "step": 78126 + }, + { + "epoch": 2.0, + "learning_rate": 5.259941948125088e-07, + "loss": 0.4919, + "step": 78127 + }, + { + "epoch": 2.0, + "learning_rate": 5.259698305583589e-07, + "loss": 0.3728, + "step": 78128 + }, + { + "epoch": 2.0, + "learning_rate": 5.259454666671523e-07, + "loss": 0.5352, + "step": 78129 + }, + { + "epoch": 2.0, + "learning_rate": 5.259211031389077e-07, + "loss": 0.3974, + "step": 78130 + }, + { + "epoch": 2.0, + "learning_rate": 5.258967399736431e-07, + "loss": 0.4629, + "step": 78131 + }, + { + "epoch": 2.0, + "learning_rate": 5.258723771713778e-07, + "loss": 0.3584, + "step": 78132 + }, + { + "epoch": 2.0, + "learning_rate": 5.258480147321301e-07, + "loss": 0.4458, + "step": 78133 + }, + { + "epoch": 2.0, + "learning_rate": 5.25823652655919e-07, + "loss": 0.3635, + "step": 78134 + }, + { + "epoch": 2.0, + "learning_rate": 5.257992909427631e-07, + "loss": 0.4307, + "step": 78135 + }, + { + "epoch": 2.0, + "learning_rate": 5.257749295926803e-07, + "loss": 0.4602, + "step": 78136 + }, + { + "epoch": 2.0, + "learning_rate": 5.2575056860569e-07, + "loss": 0.3545, + "step": 78137 + }, + { + "epoch": 2.0, + "learning_rate": 5.257262079818108e-07, + "loss": 0.4172, + "step": 78138 + }, + { + "epoch": 2.0, + "learning_rate": 5.257018477210614e-07, + "loss": 0.4292, + "step": 78139 + }, + { + "epoch": 2.0, + "learning_rate": 5.2567748782346e-07, + "loss": 0.4927, + "step": 78140 + }, + { + "epoch": 2.0, + "learning_rate": 5.256531282890256e-07, + "loss": 0.3938, + "step": 78141 + }, + { + "epoch": 2.0, + "learning_rate": 5.256287691177765e-07, + "loss": 0.4976, + "step": 78142 + }, + { + "epoch": 2.0, + "learning_rate": 5.256044103097323e-07, + "loss": 0.3514, + "step": 78143 + }, + { + "epoch": 2.0, + "learning_rate": 5.255800518649105e-07, + "loss": 0.3755, + "step": 78144 + }, + { + "epoch": 2.0, + "learning_rate": 5.255556937833308e-07, + "loss": 0.3921, + "step": 78145 + }, + { + "epoch": 2.0, + "learning_rate": 5.255313360650107e-07, + "loss": 0.3545, + "step": 78146 + }, + { + "epoch": 2.0, + "learning_rate": 5.255069787099699e-07, + "loss": 0.4082, + "step": 78147 + }, + { + "epoch": 2.0, + "learning_rate": 5.254826217182262e-07, + "loss": 0.3723, + "step": 78148 + }, + { + "epoch": 2.0, + "learning_rate": 5.254582650897985e-07, + "loss": 0.4307, + "step": 78149 + }, + { + "epoch": 2.0, + "learning_rate": 5.254339088247057e-07, + "loss": 0.5298, + "step": 78150 + }, + { + "epoch": 2.0, + "learning_rate": 5.254095529229668e-07, + "loss": 0.2917, + "step": 78151 + }, + { + "epoch": 2.0, + "learning_rate": 5.253851973845995e-07, + "loss": 0.5732, + "step": 78152 + }, + { + "epoch": 2.0, + "learning_rate": 5.25360842209623e-07, + "loss": 0.4048, + "step": 78153 + }, + { + "epoch": 2.0, + "learning_rate": 5.253364873980559e-07, + "loss": 0.4658, + "step": 78154 + }, + { + "epoch": 2.0, + "learning_rate": 5.253121329499171e-07, + "loss": 0.5146, + "step": 78155 + }, + { + "epoch": 2.0, + "learning_rate": 5.25287778865225e-07, + "loss": 0.5723, + "step": 78156 + }, + { + "epoch": 2.0, + "learning_rate": 5.252634251439979e-07, + "loss": 0.4355, + "step": 78157 + }, + { + "epoch": 2.0, + "learning_rate": 5.252390717862547e-07, + "loss": 0.3872, + "step": 78158 + }, + { + "epoch": 2.0, + "learning_rate": 5.252147187920141e-07, + "loss": 0.5107, + "step": 78159 + }, + { + "epoch": 2.0, + "learning_rate": 5.251903661612953e-07, + "loss": 0.2463, + "step": 78160 + }, + { + "epoch": 2.0, + "learning_rate": 5.251660138941158e-07, + "loss": 0.5508, + "step": 78161 + }, + { + "epoch": 2.0, + "learning_rate": 5.25141661990495e-07, + "loss": 0.4663, + "step": 78162 + }, + { + "epoch": 2.0, + "learning_rate": 5.251173104504513e-07, + "loss": 0.4751, + "step": 78163 + }, + { + "epoch": 2.0, + "learning_rate": 5.250929592740039e-07, + "loss": 0.3884, + "step": 78164 + }, + { + "epoch": 2.0, + "learning_rate": 5.250686084611711e-07, + "loss": 0.3831, + "step": 78165 + }, + { + "epoch": 2.0, + "learning_rate": 5.250442580119708e-07, + "loss": 0.4253, + "step": 78166 + }, + { + "epoch": 2.0, + "learning_rate": 5.250199079264223e-07, + "loss": 0.4326, + "step": 78167 + }, + { + "epoch": 2.0, + "learning_rate": 5.249955582045447e-07, + "loss": 0.2772, + "step": 78168 + }, + { + "epoch": 2.0, + "learning_rate": 5.249712088463559e-07, + "loss": 0.4365, + "step": 78169 + }, + { + "epoch": 2.0, + "learning_rate": 5.249468598518746e-07, + "loss": 0.4316, + "step": 78170 + }, + { + "epoch": 2.0, + "learning_rate": 5.249225112211197e-07, + "loss": 0.4365, + "step": 78171 + }, + { + "epoch": 2.0, + "learning_rate": 5.248981629541101e-07, + "loss": 0.377, + "step": 78172 + }, + { + "epoch": 2.0, + "learning_rate": 5.248738150508638e-07, + "loss": 0.4399, + "step": 78173 + }, + { + "epoch": 2.0, + "learning_rate": 5.248494675113999e-07, + "loss": 0.3857, + "step": 78174 + }, + { + "epoch": 2.0, + "learning_rate": 5.248251203357372e-07, + "loss": 0.3704, + "step": 78175 + }, + { + "epoch": 2.0, + "learning_rate": 5.248007735238937e-07, + "loss": 0.2454, + "step": 78176 + }, + { + "epoch": 2.0, + "learning_rate": 5.247764270758886e-07, + "loss": 0.4395, + "step": 78177 + }, + { + "epoch": 2.0, + "learning_rate": 5.247520809917402e-07, + "loss": 0.5127, + "step": 78178 + }, + { + "epoch": 2.0, + "learning_rate": 5.247277352714672e-07, + "loss": 0.4127, + "step": 78179 + }, + { + "epoch": 2.0, + "learning_rate": 5.247033899150882e-07, + "loss": 0.395, + "step": 78180 + }, + { + "epoch": 2.0, + "learning_rate": 5.246790449226225e-07, + "loss": 0.2844, + "step": 78181 + }, + { + "epoch": 2.0, + "learning_rate": 5.246547002940878e-07, + "loss": 0.5435, + "step": 78182 + }, + { + "epoch": 2.0, + "learning_rate": 5.24630356029503e-07, + "loss": 0.1517, + "step": 78183 + }, + { + "epoch": 2.0, + "learning_rate": 5.246060121288873e-07, + "loss": 0.4287, + "step": 78184 + }, + { + "epoch": 2.0, + "learning_rate": 5.24581668592259e-07, + "loss": 0.3926, + "step": 78185 + }, + { + "epoch": 2.0, + "learning_rate": 5.245573254196362e-07, + "loss": 0.4087, + "step": 78186 + }, + { + "epoch": 2.0, + "learning_rate": 5.24532982611038e-07, + "loss": 0.3584, + "step": 78187 + }, + { + "epoch": 2.0, + "learning_rate": 5.245086401664832e-07, + "loss": 0.4497, + "step": 78188 + }, + { + "epoch": 2.0, + "learning_rate": 5.244842980859905e-07, + "loss": 0.4495, + "step": 78189 + }, + { + "epoch": 2.0, + "learning_rate": 5.24459956369578e-07, + "loss": 0.4722, + "step": 78190 + }, + { + "epoch": 2.0, + "learning_rate": 5.244356150172647e-07, + "loss": 0.394, + "step": 78191 + }, + { + "epoch": 2.0, + "learning_rate": 5.244112740290689e-07, + "loss": 0.3804, + "step": 78192 + }, + { + "epoch": 2.0, + "learning_rate": 5.243869334050101e-07, + "loss": 0.4238, + "step": 78193 + }, + { + "epoch": 2.0, + "learning_rate": 5.24362593145106e-07, + "loss": 0.3882, + "step": 78194 + }, + { + "epoch": 2.0, + "learning_rate": 5.24338253249376e-07, + "loss": 0.4092, + "step": 78195 + }, + { + "epoch": 2.0, + "learning_rate": 5.243139137178378e-07, + "loss": 0.5234, + "step": 78196 + }, + { + "epoch": 2.0, + "learning_rate": 5.242895745505107e-07, + "loss": 0.4238, + "step": 78197 + }, + { + "epoch": 2.0, + "learning_rate": 5.242652357474135e-07, + "loss": 0.4067, + "step": 78198 + }, + { + "epoch": 2.0, + "learning_rate": 5.242408973085642e-07, + "loss": 0.3896, + "step": 78199 + }, + { + "epoch": 2.0, + "learning_rate": 5.242165592339817e-07, + "loss": 0.4438, + "step": 78200 + }, + { + "epoch": 2.0, + "learning_rate": 5.241922215236852e-07, + "loss": 0.3044, + "step": 78201 + }, + { + "epoch": 2.0, + "learning_rate": 5.241678841776923e-07, + "loss": 0.3755, + "step": 78202 + }, + { + "epoch": 2.0, + "learning_rate": 5.241435471960223e-07, + "loss": 0.4459, + "step": 78203 + }, + { + "epoch": 2.0, + "learning_rate": 5.241192105786935e-07, + "loss": 0.3599, + "step": 78204 + }, + { + "epoch": 2.0, + "learning_rate": 5.240948743257254e-07, + "loss": 0.48, + "step": 78205 + }, + { + "epoch": 2.0, + "learning_rate": 5.240705384371359e-07, + "loss": 0.3394, + "step": 78206 + }, + { + "epoch": 2.0, + "learning_rate": 5.240462029129433e-07, + "loss": 0.4226, + "step": 78207 + }, + { + "epoch": 2.0, + "learning_rate": 5.240218677531664e-07, + "loss": 0.2361, + "step": 78208 + }, + { + "epoch": 2.0, + "learning_rate": 5.239975329578245e-07, + "loss": 0.4756, + "step": 78209 + }, + { + "epoch": 2.0, + "learning_rate": 5.239731985269359e-07, + "loss": 0.4443, + "step": 78210 + }, + { + "epoch": 2.0, + "learning_rate": 5.239488644605188e-07, + "loss": 0.3853, + "step": 78211 + }, + { + "epoch": 2.0, + "learning_rate": 5.239245307585922e-07, + "loss": 0.3284, + "step": 78212 + }, + { + "epoch": 2.0, + "learning_rate": 5.239001974211748e-07, + "loss": 0.4146, + "step": 78213 + }, + { + "epoch": 2.0, + "learning_rate": 5.238758644482853e-07, + "loss": 0.302, + "step": 78214 + }, + { + "epoch": 2.0, + "learning_rate": 5.238515318399422e-07, + "loss": 0.4492, + "step": 78215 + }, + { + "epoch": 2.0, + "learning_rate": 5.238271995961639e-07, + "loss": 0.3931, + "step": 78216 + }, + { + "epoch": 2.0, + "learning_rate": 5.23802867716969e-07, + "loss": 0.3782, + "step": 78217 + }, + { + "epoch": 2.0, + "learning_rate": 5.237785362023767e-07, + "loss": 0.3159, + "step": 78218 + }, + { + "epoch": 2.0, + "learning_rate": 5.23754205052405e-07, + "loss": 0.4565, + "step": 78219 + }, + { + "epoch": 2.0, + "learning_rate": 5.237298742670728e-07, + "loss": 0.3599, + "step": 78220 + }, + { + "epoch": 2.0, + "learning_rate": 5.237055438463989e-07, + "loss": 0.4351, + "step": 78221 + }, + { + "epoch": 2.0, + "learning_rate": 5.236812137904019e-07, + "loss": 0.4226, + "step": 78222 + }, + { + "epoch": 2.0, + "learning_rate": 5.236568840991e-07, + "loss": 0.415, + "step": 78223 + }, + { + "epoch": 2.0, + "learning_rate": 5.236325547725121e-07, + "loss": 0.3713, + "step": 78224 + }, + { + "epoch": 2.0, + "learning_rate": 5.236082258106574e-07, + "loss": 0.3457, + "step": 78225 + }, + { + "epoch": 2.0, + "learning_rate": 5.235838972135533e-07, + "loss": 0.4497, + "step": 78226 + }, + { + "epoch": 2.0, + "learning_rate": 5.235595689812195e-07, + "loss": 0.3303, + "step": 78227 + }, + { + "epoch": 2.01, + "learning_rate": 5.235352411136741e-07, + "loss": 0.5103, + "step": 78228 + }, + { + "epoch": 2.01, + "learning_rate": 5.235109136109357e-07, + "loss": 0.3788, + "step": 78229 + }, + { + "epoch": 2.01, + "learning_rate": 5.234865864730231e-07, + "loss": 0.3574, + "step": 78230 + }, + { + "epoch": 2.01, + "learning_rate": 5.234622596999554e-07, + "loss": 0.438, + "step": 78231 + }, + { + "epoch": 2.01, + "learning_rate": 5.234379332917502e-07, + "loss": 0.3907, + "step": 78232 + }, + { + "epoch": 2.01, + "learning_rate": 5.234136072484268e-07, + "loss": 0.4336, + "step": 78233 + }, + { + "epoch": 2.01, + "learning_rate": 5.233892815700036e-07, + "loss": 0.4243, + "step": 78234 + }, + { + "epoch": 2.01, + "learning_rate": 5.233649562564997e-07, + "loss": 0.625, + "step": 78235 + }, + { + "epoch": 2.01, + "learning_rate": 5.233406313079334e-07, + "loss": 0.3159, + "step": 78236 + }, + { + "epoch": 2.01, + "learning_rate": 5.233163067243226e-07, + "loss": 0.4414, + "step": 78237 + }, + { + "epoch": 2.01, + "learning_rate": 5.23291982505687e-07, + "loss": 0.3918, + "step": 78238 + }, + { + "epoch": 2.01, + "learning_rate": 5.23267658652045e-07, + "loss": 0.4395, + "step": 78239 + }, + { + "epoch": 2.01, + "learning_rate": 5.232433351634147e-07, + "loss": 0.4565, + "step": 78240 + }, + { + "epoch": 2.01, + "learning_rate": 5.23219012039815e-07, + "loss": 0.3557, + "step": 78241 + }, + { + "epoch": 2.01, + "learning_rate": 5.231946892812645e-07, + "loss": 0.3911, + "step": 78242 + }, + { + "epoch": 2.01, + "learning_rate": 5.231703668877824e-07, + "loss": 0.3875, + "step": 78243 + }, + { + "epoch": 2.01, + "learning_rate": 5.231460448593864e-07, + "loss": 0.3394, + "step": 78244 + }, + { + "epoch": 2.01, + "learning_rate": 5.23121723196096e-07, + "loss": 0.361, + "step": 78245 + }, + { + "epoch": 2.01, + "learning_rate": 5.230974018979288e-07, + "loss": 0.4106, + "step": 78246 + }, + { + "epoch": 2.01, + "learning_rate": 5.230730809649042e-07, + "loss": 0.3354, + "step": 78247 + }, + { + "epoch": 2.01, + "learning_rate": 5.230487603970409e-07, + "loss": 0.4111, + "step": 78248 + }, + { + "epoch": 2.01, + "learning_rate": 5.230244401943568e-07, + "loss": 0.5405, + "step": 78249 + }, + { + "epoch": 2.01, + "learning_rate": 5.230001203568711e-07, + "loss": 0.4121, + "step": 78250 + }, + { + "epoch": 2.01, + "learning_rate": 5.229758008846021e-07, + "loss": 0.4883, + "step": 78251 + }, + { + "epoch": 2.01, + "learning_rate": 5.229514817775692e-07, + "loss": 0.406, + "step": 78252 + }, + { + "epoch": 2.01, + "learning_rate": 5.229271630357899e-07, + "loss": 0.4976, + "step": 78253 + }, + { + "epoch": 2.01, + "learning_rate": 5.229028446592834e-07, + "loss": 0.4482, + "step": 78254 + }, + { + "epoch": 2.01, + "learning_rate": 5.228785266480685e-07, + "loss": 0.5229, + "step": 78255 + }, + { + "epoch": 2.01, + "learning_rate": 5.228542090021637e-07, + "loss": 0.4502, + "step": 78256 + }, + { + "epoch": 2.01, + "learning_rate": 5.22829891721587e-07, + "loss": 0.3556, + "step": 78257 + }, + { + "epoch": 2.01, + "learning_rate": 5.228055748063576e-07, + "loss": 0.5015, + "step": 78258 + }, + { + "epoch": 2.01, + "learning_rate": 5.22781258256494e-07, + "loss": 0.3311, + "step": 78259 + }, + { + "epoch": 2.01, + "learning_rate": 5.227569420720152e-07, + "loss": 0.4963, + "step": 78260 + }, + { + "epoch": 2.01, + "learning_rate": 5.227326262529393e-07, + "loss": 0.4893, + "step": 78261 + }, + { + "epoch": 2.01, + "learning_rate": 5.227083107992847e-07, + "loss": 0.4653, + "step": 78262 + }, + { + "epoch": 2.01, + "learning_rate": 5.226839957110707e-07, + "loss": 0.4688, + "step": 78263 + }, + { + "epoch": 2.01, + "learning_rate": 5.226596809883159e-07, + "loss": 0.439, + "step": 78264 + }, + { + "epoch": 2.01, + "learning_rate": 5.226353666310385e-07, + "loss": 0.3685, + "step": 78265 + }, + { + "epoch": 2.01, + "learning_rate": 5.226110526392571e-07, + "loss": 0.3721, + "step": 78266 + }, + { + "epoch": 2.01, + "learning_rate": 5.225867390129904e-07, + "loss": 0.5068, + "step": 78267 + }, + { + "epoch": 2.01, + "learning_rate": 5.22562425752257e-07, + "loss": 0.3914, + "step": 78268 + }, + { + "epoch": 2.01, + "learning_rate": 5.225381128570761e-07, + "loss": 0.3552, + "step": 78269 + }, + { + "epoch": 2.01, + "learning_rate": 5.225138003274653e-07, + "loss": 0.4023, + "step": 78270 + }, + { + "epoch": 2.01, + "learning_rate": 5.224894881634438e-07, + "loss": 0.3076, + "step": 78271 + }, + { + "epoch": 2.01, + "learning_rate": 5.224651763650301e-07, + "loss": 0.4596, + "step": 78272 + }, + { + "epoch": 2.01, + "learning_rate": 5.224408649322433e-07, + "loss": 0.4731, + "step": 78273 + }, + { + "epoch": 2.01, + "learning_rate": 5.224165538651011e-07, + "loss": 0.52, + "step": 78274 + }, + { + "epoch": 2.01, + "learning_rate": 5.223922431636229e-07, + "loss": 0.5659, + "step": 78275 + }, + { + "epoch": 2.01, + "learning_rate": 5.223679328278269e-07, + "loss": 0.4146, + "step": 78276 + }, + { + "epoch": 2.01, + "learning_rate": 5.22343622857732e-07, + "loss": 0.3315, + "step": 78277 + }, + { + "epoch": 2.01, + "learning_rate": 5.223193132533563e-07, + "loss": 0.5737, + "step": 78278 + }, + { + "epoch": 2.01, + "learning_rate": 5.222950040147187e-07, + "loss": 0.3867, + "step": 78279 + }, + { + "epoch": 2.01, + "learning_rate": 5.222706951418378e-07, + "loss": 0.4194, + "step": 78280 + }, + { + "epoch": 2.01, + "learning_rate": 5.222463866347328e-07, + "loss": 0.5786, + "step": 78281 + }, + { + "epoch": 2.01, + "learning_rate": 5.222220784934213e-07, + "loss": 0.5259, + "step": 78282 + }, + { + "epoch": 2.01, + "learning_rate": 5.221977707179224e-07, + "loss": 0.355, + "step": 78283 + }, + { + "epoch": 2.01, + "learning_rate": 5.221734633082546e-07, + "loss": 0.3086, + "step": 78284 + }, + { + "epoch": 2.01, + "learning_rate": 5.221491562644371e-07, + "loss": 0.3877, + "step": 78285 + }, + { + "epoch": 2.01, + "learning_rate": 5.22124849586488e-07, + "loss": 0.4259, + "step": 78286 + }, + { + "epoch": 2.01, + "learning_rate": 5.221005432744256e-07, + "loss": 0.3643, + "step": 78287 + }, + { + "epoch": 2.01, + "learning_rate": 5.220762373282688e-07, + "loss": 0.3862, + "step": 78288 + }, + { + "epoch": 2.01, + "learning_rate": 5.22051931748036e-07, + "loss": 0.4277, + "step": 78289 + }, + { + "epoch": 2.01, + "learning_rate": 5.220276265337469e-07, + "loss": 0.4707, + "step": 78290 + }, + { + "epoch": 2.01, + "learning_rate": 5.220033216854184e-07, + "loss": 0.3848, + "step": 78291 + }, + { + "epoch": 2.01, + "learning_rate": 5.219790172030704e-07, + "loss": 0.4722, + "step": 78292 + }, + { + "epoch": 2.01, + "learning_rate": 5.219547130867212e-07, + "loss": 0.4409, + "step": 78293 + }, + { + "epoch": 2.01, + "learning_rate": 5.219304093363891e-07, + "loss": 0.5356, + "step": 78294 + }, + { + "epoch": 2.01, + "learning_rate": 5.219061059520932e-07, + "loss": 0.3457, + "step": 78295 + }, + { + "epoch": 2.01, + "learning_rate": 5.218818029338514e-07, + "loss": 0.4697, + "step": 78296 + }, + { + "epoch": 2.01, + "learning_rate": 5.218575002816827e-07, + "loss": 0.3975, + "step": 78297 + }, + { + "epoch": 2.01, + "learning_rate": 5.218331979956062e-07, + "loss": 0.4248, + "step": 78298 + }, + { + "epoch": 2.01, + "learning_rate": 5.218088960756397e-07, + "loss": 0.3457, + "step": 78299 + }, + { + "epoch": 2.01, + "learning_rate": 5.21784594521802e-07, + "loss": 0.5015, + "step": 78300 + }, + { + "epoch": 2.01, + "learning_rate": 5.217602933341119e-07, + "loss": 0.5278, + "step": 78301 + }, + { + "epoch": 2.01, + "learning_rate": 5.217359925125884e-07, + "loss": 0.4556, + "step": 78302 + }, + { + "epoch": 2.01, + "learning_rate": 5.21711692057249e-07, + "loss": 0.4375, + "step": 78303 + }, + { + "epoch": 2.01, + "learning_rate": 5.216873919681133e-07, + "loss": 0.5195, + "step": 78304 + }, + { + "epoch": 2.01, + "learning_rate": 5.216630922451999e-07, + "loss": 0.4531, + "step": 78305 + }, + { + "epoch": 2.01, + "learning_rate": 5.216387928885266e-07, + "loss": 0.4712, + "step": 78306 + }, + { + "epoch": 2.01, + "learning_rate": 5.216144938981128e-07, + "loss": 0.459, + "step": 78307 + }, + { + "epoch": 2.01, + "learning_rate": 5.215901952739765e-07, + "loss": 0.2781, + "step": 78308 + }, + { + "epoch": 2.01, + "learning_rate": 5.215658970161365e-07, + "loss": 0.4282, + "step": 78309 + }, + { + "epoch": 2.01, + "learning_rate": 5.21541599124612e-07, + "loss": 0.375, + "step": 78310 + }, + { + "epoch": 2.01, + "learning_rate": 5.215173015994207e-07, + "loss": 0.4541, + "step": 78311 + }, + { + "epoch": 2.01, + "learning_rate": 5.214930044405817e-07, + "loss": 0.4385, + "step": 78312 + }, + { + "epoch": 2.01, + "learning_rate": 5.214687076481133e-07, + "loss": 0.3127, + "step": 78313 + }, + { + "epoch": 2.01, + "learning_rate": 5.214444112220346e-07, + "loss": 0.4001, + "step": 78314 + }, + { + "epoch": 2.01, + "learning_rate": 5.214201151623642e-07, + "loss": 0.5186, + "step": 78315 + }, + { + "epoch": 2.01, + "learning_rate": 5.2139581946912e-07, + "loss": 0.3094, + "step": 78316 + }, + { + "epoch": 2.01, + "learning_rate": 5.213715241423207e-07, + "loss": 0.3958, + "step": 78317 + }, + { + "epoch": 2.01, + "learning_rate": 5.213472291819855e-07, + "loss": 0.417, + "step": 78318 + }, + { + "epoch": 2.01, + "learning_rate": 5.213229345881331e-07, + "loss": 0.4495, + "step": 78319 + }, + { + "epoch": 2.01, + "learning_rate": 5.212986403607812e-07, + "loss": 0.259, + "step": 78320 + }, + { + "epoch": 2.01, + "learning_rate": 5.212743464999489e-07, + "loss": 0.406, + "step": 78321 + }, + { + "epoch": 2.01, + "learning_rate": 5.21250053005655e-07, + "loss": 0.4111, + "step": 78322 + }, + { + "epoch": 2.01, + "learning_rate": 5.212257598779181e-07, + "loss": 0.5415, + "step": 78323 + }, + { + "epoch": 2.01, + "learning_rate": 5.212014671167568e-07, + "loss": 0.3224, + "step": 78324 + }, + { + "epoch": 2.01, + "learning_rate": 5.211771747221892e-07, + "loss": 0.2822, + "step": 78325 + }, + { + "epoch": 2.01, + "learning_rate": 5.21152882694234e-07, + "loss": 0.376, + "step": 78326 + }, + { + "epoch": 2.01, + "learning_rate": 5.211285910329105e-07, + "loss": 0.3643, + "step": 78327 + }, + { + "epoch": 2.01, + "learning_rate": 5.211042997382364e-07, + "loss": 0.3276, + "step": 78328 + }, + { + "epoch": 2.01, + "learning_rate": 5.210800088102307e-07, + "loss": 0.5005, + "step": 78329 + }, + { + "epoch": 2.01, + "learning_rate": 5.210557182489121e-07, + "loss": 0.5151, + "step": 78330 + }, + { + "epoch": 2.01, + "learning_rate": 5.210314280542995e-07, + "loss": 0.3347, + "step": 78331 + }, + { + "epoch": 2.01, + "learning_rate": 5.210071382264108e-07, + "loss": 0.4585, + "step": 78332 + }, + { + "epoch": 2.01, + "learning_rate": 5.209828487652646e-07, + "loss": 0.4683, + "step": 78333 + }, + { + "epoch": 2.01, + "learning_rate": 5.209585596708806e-07, + "loss": 0.4521, + "step": 78334 + }, + { + "epoch": 2.01, + "learning_rate": 5.209342709432758e-07, + "loss": 0.3255, + "step": 78335 + }, + { + "epoch": 2.01, + "learning_rate": 5.209099825824703e-07, + "loss": 0.5591, + "step": 78336 + }, + { + "epoch": 2.01, + "learning_rate": 5.208856945884814e-07, + "loss": 0.478, + "step": 78337 + }, + { + "epoch": 2.01, + "learning_rate": 5.208614069613284e-07, + "loss": 0.3513, + "step": 78338 + }, + { + "epoch": 2.01, + "learning_rate": 5.208371197010298e-07, + "loss": 0.48, + "step": 78339 + }, + { + "epoch": 2.01, + "learning_rate": 5.208128328076046e-07, + "loss": 0.4009, + "step": 78340 + }, + { + "epoch": 2.01, + "learning_rate": 5.207885462810706e-07, + "loss": 0.4883, + "step": 78341 + }, + { + "epoch": 2.01, + "learning_rate": 5.207642601214467e-07, + "loss": 0.5176, + "step": 78342 + }, + { + "epoch": 2.01, + "learning_rate": 5.207399743287516e-07, + "loss": 0.3972, + "step": 78343 + }, + { + "epoch": 2.01, + "learning_rate": 5.207156889030047e-07, + "loss": 0.5098, + "step": 78344 + }, + { + "epoch": 2.01, + "learning_rate": 5.206914038442229e-07, + "loss": 0.4985, + "step": 78345 + }, + { + "epoch": 2.01, + "learning_rate": 5.206671191524257e-07, + "loss": 0.3117, + "step": 78346 + }, + { + "epoch": 2.01, + "learning_rate": 5.206428348276315e-07, + "loss": 0.3259, + "step": 78347 + }, + { + "epoch": 2.01, + "learning_rate": 5.206185508698596e-07, + "loss": 0.479, + "step": 78348 + }, + { + "epoch": 2.01, + "learning_rate": 5.205942672791276e-07, + "loss": 0.3542, + "step": 78349 + }, + { + "epoch": 2.01, + "learning_rate": 5.205699840554545e-07, + "loss": 0.3572, + "step": 78350 + }, + { + "epoch": 2.01, + "learning_rate": 5.20545701198859e-07, + "loss": 0.3229, + "step": 78351 + }, + { + "epoch": 2.01, + "learning_rate": 5.205214187093598e-07, + "loss": 0.4795, + "step": 78352 + }, + { + "epoch": 2.01, + "learning_rate": 5.204971365869751e-07, + "loss": 0.4055, + "step": 78353 + }, + { + "epoch": 2.01, + "learning_rate": 5.204728548317241e-07, + "loss": 0.4194, + "step": 78354 + }, + { + "epoch": 2.01, + "learning_rate": 5.204485734436245e-07, + "loss": 0.3347, + "step": 78355 + }, + { + "epoch": 2.01, + "learning_rate": 5.204242924226953e-07, + "loss": 0.4824, + "step": 78356 + }, + { + "epoch": 2.01, + "learning_rate": 5.204000117689557e-07, + "loss": 0.4829, + "step": 78357 + }, + { + "epoch": 2.01, + "learning_rate": 5.203757314824235e-07, + "loss": 0.4302, + "step": 78358 + }, + { + "epoch": 2.01, + "learning_rate": 5.203514515631173e-07, + "loss": 0.386, + "step": 78359 + }, + { + "epoch": 2.01, + "learning_rate": 5.20327172011056e-07, + "loss": 0.3938, + "step": 78360 + }, + { + "epoch": 2.01, + "learning_rate": 5.203028928262585e-07, + "loss": 0.3851, + "step": 78361 + }, + { + "epoch": 2.01, + "learning_rate": 5.202786140087427e-07, + "loss": 0.4199, + "step": 78362 + }, + { + "epoch": 2.01, + "learning_rate": 5.202543355585276e-07, + "loss": 0.3608, + "step": 78363 + }, + { + "epoch": 2.01, + "learning_rate": 5.202300574756319e-07, + "loss": 0.437, + "step": 78364 + }, + { + "epoch": 2.01, + "learning_rate": 5.202057797600741e-07, + "loss": 0.3745, + "step": 78365 + }, + { + "epoch": 2.01, + "learning_rate": 5.201815024118721e-07, + "loss": 0.3384, + "step": 78366 + }, + { + "epoch": 2.01, + "learning_rate": 5.201572254310452e-07, + "loss": 0.4189, + "step": 78367 + }, + { + "epoch": 2.01, + "learning_rate": 5.201329488176119e-07, + "loss": 0.4014, + "step": 78368 + }, + { + "epoch": 2.01, + "learning_rate": 5.201086725715911e-07, + "loss": 0.4712, + "step": 78369 + }, + { + "epoch": 2.01, + "learning_rate": 5.200843966930005e-07, + "loss": 0.5366, + "step": 78370 + }, + { + "epoch": 2.01, + "learning_rate": 5.200601211818594e-07, + "loss": 0.395, + "step": 78371 + }, + { + "epoch": 2.01, + "learning_rate": 5.200358460381861e-07, + "loss": 0.3218, + "step": 78372 + }, + { + "epoch": 2.01, + "learning_rate": 5.200115712619997e-07, + "loss": 0.2944, + "step": 78373 + }, + { + "epoch": 2.01, + "learning_rate": 5.199872968533183e-07, + "loss": 0.3787, + "step": 78374 + }, + { + "epoch": 2.01, + "learning_rate": 5.199630228121602e-07, + "loss": 0.3656, + "step": 78375 + }, + { + "epoch": 2.01, + "learning_rate": 5.199387491385443e-07, + "loss": 0.4077, + "step": 78376 + }, + { + "epoch": 2.01, + "learning_rate": 5.199144758324894e-07, + "loss": 0.3892, + "step": 78377 + }, + { + "epoch": 2.01, + "learning_rate": 5.198902028940142e-07, + "loss": 0.4746, + "step": 78378 + }, + { + "epoch": 2.01, + "learning_rate": 5.198659303231366e-07, + "loss": 0.3911, + "step": 78379 + }, + { + "epoch": 2.01, + "learning_rate": 5.198416581198755e-07, + "loss": 0.4805, + "step": 78380 + }, + { + "epoch": 2.01, + "learning_rate": 5.1981738628425e-07, + "loss": 0.3213, + "step": 78381 + }, + { + "epoch": 2.01, + "learning_rate": 5.197931148162778e-07, + "loss": 0.4565, + "step": 78382 + }, + { + "epoch": 2.01, + "learning_rate": 5.19768843715978e-07, + "loss": 0.2996, + "step": 78383 + }, + { + "epoch": 2.01, + "learning_rate": 5.197445729833696e-07, + "loss": 0.5024, + "step": 78384 + }, + { + "epoch": 2.01, + "learning_rate": 5.197203026184702e-07, + "loss": 0.4717, + "step": 78385 + }, + { + "epoch": 2.01, + "learning_rate": 5.196960326212994e-07, + "loss": 0.4277, + "step": 78386 + }, + { + "epoch": 2.01, + "learning_rate": 5.196717629918748e-07, + "loss": 0.4177, + "step": 78387 + }, + { + "epoch": 2.01, + "learning_rate": 5.196474937302153e-07, + "loss": 0.4248, + "step": 78388 + }, + { + "epoch": 2.01, + "learning_rate": 5.196232248363397e-07, + "loss": 0.2826, + "step": 78389 + }, + { + "epoch": 2.01, + "learning_rate": 5.19598956310267e-07, + "loss": 0.5049, + "step": 78390 + }, + { + "epoch": 2.01, + "learning_rate": 5.195746881520148e-07, + "loss": 0.3979, + "step": 78391 + }, + { + "epoch": 2.01, + "learning_rate": 5.195504203616023e-07, + "loss": 0.3676, + "step": 78392 + }, + { + "epoch": 2.01, + "learning_rate": 5.195261529390478e-07, + "loss": 0.4375, + "step": 78393 + }, + { + "epoch": 2.01, + "learning_rate": 5.195018858843705e-07, + "loss": 0.4736, + "step": 78394 + }, + { + "epoch": 2.01, + "learning_rate": 5.194776191975885e-07, + "loss": 0.4224, + "step": 78395 + }, + { + "epoch": 2.01, + "learning_rate": 5.1945335287872e-07, + "loss": 0.4182, + "step": 78396 + }, + { + "epoch": 2.01, + "learning_rate": 5.19429086927784e-07, + "loss": 0.4028, + "step": 78397 + }, + { + "epoch": 2.01, + "learning_rate": 5.19404821344799e-07, + "loss": 0.4697, + "step": 78398 + }, + { + "epoch": 2.01, + "learning_rate": 5.193805561297839e-07, + "loss": 0.4094, + "step": 78399 + }, + { + "epoch": 2.01, + "learning_rate": 5.193562912827569e-07, + "loss": 0.4258, + "step": 78400 + }, + { + "epoch": 2.01, + "learning_rate": 5.193320268037364e-07, + "loss": 0.3555, + "step": 78401 + }, + { + "epoch": 2.01, + "learning_rate": 5.193077626927418e-07, + "loss": 0.5117, + "step": 78402 + }, + { + "epoch": 2.01, + "learning_rate": 5.192834989497909e-07, + "loss": 0.5576, + "step": 78403 + }, + { + "epoch": 2.01, + "learning_rate": 5.192592355749027e-07, + "loss": 0.5127, + "step": 78404 + }, + { + "epoch": 2.01, + "learning_rate": 5.192349725680952e-07, + "loss": 0.4497, + "step": 78405 + }, + { + "epoch": 2.01, + "learning_rate": 5.192107099293875e-07, + "loss": 0.46, + "step": 78406 + }, + { + "epoch": 2.01, + "learning_rate": 5.191864476587984e-07, + "loss": 0.5381, + "step": 78407 + }, + { + "epoch": 2.01, + "learning_rate": 5.191621857563458e-07, + "loss": 0.4966, + "step": 78408 + }, + { + "epoch": 2.01, + "learning_rate": 5.191379242220484e-07, + "loss": 0.5332, + "step": 78409 + }, + { + "epoch": 2.01, + "learning_rate": 5.191136630559252e-07, + "loss": 0.3877, + "step": 78410 + }, + { + "epoch": 2.01, + "learning_rate": 5.190894022579948e-07, + "loss": 0.498, + "step": 78411 + }, + { + "epoch": 2.01, + "learning_rate": 5.190651418282752e-07, + "loss": 0.4072, + "step": 78412 + }, + { + "epoch": 2.01, + "learning_rate": 5.190408817667852e-07, + "loss": 0.3403, + "step": 78413 + }, + { + "epoch": 2.01, + "learning_rate": 5.190166220735441e-07, + "loss": 0.4663, + "step": 78414 + }, + { + "epoch": 2.01, + "learning_rate": 5.189923627485692e-07, + "loss": 0.4429, + "step": 78415 + }, + { + "epoch": 2.01, + "learning_rate": 5.189681037918805e-07, + "loss": 0.4507, + "step": 78416 + }, + { + "epoch": 2.01, + "learning_rate": 5.189438452034952e-07, + "loss": 0.5024, + "step": 78417 + }, + { + "epoch": 2.01, + "learning_rate": 5.189195869834324e-07, + "loss": 0.4883, + "step": 78418 + }, + { + "epoch": 2.01, + "learning_rate": 5.188953291317112e-07, + "loss": 0.4878, + "step": 78419 + }, + { + "epoch": 2.01, + "learning_rate": 5.188710716483493e-07, + "loss": 0.4824, + "step": 78420 + }, + { + "epoch": 2.01, + "learning_rate": 5.188468145333657e-07, + "loss": 0.5835, + "step": 78421 + }, + { + "epoch": 2.01, + "learning_rate": 5.18822557786779e-07, + "loss": 0.397, + "step": 78422 + }, + { + "epoch": 2.01, + "learning_rate": 5.187983014086082e-07, + "loss": 0.459, + "step": 78423 + }, + { + "epoch": 2.01, + "learning_rate": 5.187740453988714e-07, + "loss": 0.4468, + "step": 78424 + }, + { + "epoch": 2.01, + "learning_rate": 5.187497897575867e-07, + "loss": 0.4861, + "step": 78425 + }, + { + "epoch": 2.01, + "learning_rate": 5.187255344847731e-07, + "loss": 0.4756, + "step": 78426 + }, + { + "epoch": 2.01, + "learning_rate": 5.187012795804494e-07, + "loss": 0.4951, + "step": 78427 + }, + { + "epoch": 2.01, + "learning_rate": 5.186770250446344e-07, + "loss": 0.4849, + "step": 78428 + }, + { + "epoch": 2.01, + "learning_rate": 5.186527708773457e-07, + "loss": 0.4194, + "step": 78429 + }, + { + "epoch": 2.01, + "learning_rate": 5.186285170786025e-07, + "loss": 0.3706, + "step": 78430 + }, + { + "epoch": 2.01, + "learning_rate": 5.186042636484233e-07, + "loss": 0.4546, + "step": 78431 + }, + { + "epoch": 2.01, + "learning_rate": 5.185800105868272e-07, + "loss": 0.4922, + "step": 78432 + }, + { + "epoch": 2.01, + "learning_rate": 5.185557578938317e-07, + "loss": 0.3339, + "step": 78433 + }, + { + "epoch": 2.01, + "learning_rate": 5.185315055694566e-07, + "loss": 0.3643, + "step": 78434 + }, + { + "epoch": 2.01, + "learning_rate": 5.185072536137191e-07, + "loss": 0.4599, + "step": 78435 + }, + { + "epoch": 2.01, + "learning_rate": 5.184830020266389e-07, + "loss": 0.3054, + "step": 78436 + }, + { + "epoch": 2.01, + "learning_rate": 5.184587508082338e-07, + "loss": 0.4219, + "step": 78437 + }, + { + "epoch": 2.01, + "learning_rate": 5.184344999585226e-07, + "loss": 0.2299, + "step": 78438 + }, + { + "epoch": 2.01, + "learning_rate": 5.184102494775241e-07, + "loss": 0.5078, + "step": 78439 + }, + { + "epoch": 2.01, + "learning_rate": 5.18385999365257e-07, + "loss": 0.4985, + "step": 78440 + }, + { + "epoch": 2.01, + "learning_rate": 5.183617496217393e-07, + "loss": 0.4319, + "step": 78441 + }, + { + "epoch": 2.01, + "learning_rate": 5.183375002469899e-07, + "loss": 0.4062, + "step": 78442 + }, + { + "epoch": 2.01, + "learning_rate": 5.183132512410271e-07, + "loss": 0.373, + "step": 78443 + }, + { + "epoch": 2.01, + "learning_rate": 5.182890026038702e-07, + "loss": 0.4717, + "step": 78444 + }, + { + "epoch": 2.01, + "learning_rate": 5.182647543355374e-07, + "loss": 0.2192, + "step": 78445 + }, + { + "epoch": 2.01, + "learning_rate": 5.182405064360466e-07, + "loss": 0.4229, + "step": 78446 + }, + { + "epoch": 2.01, + "learning_rate": 5.182162589054169e-07, + "loss": 0.4038, + "step": 78447 + }, + { + "epoch": 2.01, + "learning_rate": 5.181920117436669e-07, + "loss": 0.4434, + "step": 78448 + }, + { + "epoch": 2.01, + "learning_rate": 5.181677649508154e-07, + "loss": 0.4939, + "step": 78449 + }, + { + "epoch": 2.01, + "learning_rate": 5.181435185268803e-07, + "loss": 0.458, + "step": 78450 + }, + { + "epoch": 2.01, + "learning_rate": 5.181192724718808e-07, + "loss": 0.4546, + "step": 78451 + }, + { + "epoch": 2.01, + "learning_rate": 5.18095026785835e-07, + "loss": 0.4817, + "step": 78452 + }, + { + "epoch": 2.01, + "learning_rate": 5.180707814687622e-07, + "loss": 0.3473, + "step": 78453 + }, + { + "epoch": 2.01, + "learning_rate": 5.180465365206804e-07, + "loss": 0.4985, + "step": 78454 + }, + { + "epoch": 2.01, + "learning_rate": 5.180222919416076e-07, + "loss": 0.322, + "step": 78455 + }, + { + "epoch": 2.01, + "learning_rate": 5.179980477315632e-07, + "loss": 0.4124, + "step": 78456 + }, + { + "epoch": 2.01, + "learning_rate": 5.179738038905659e-07, + "loss": 0.5259, + "step": 78457 + }, + { + "epoch": 2.01, + "learning_rate": 5.179495604186335e-07, + "loss": 0.3767, + "step": 78458 + }, + { + "epoch": 2.01, + "learning_rate": 5.179253173157848e-07, + "loss": 0.3936, + "step": 78459 + }, + { + "epoch": 2.01, + "learning_rate": 5.179010745820387e-07, + "loss": 0.4751, + "step": 78460 + }, + { + "epoch": 2.01, + "learning_rate": 5.178768322174138e-07, + "loss": 0.4165, + "step": 78461 + }, + { + "epoch": 2.01, + "learning_rate": 5.178525902219282e-07, + "loss": 0.3887, + "step": 78462 + }, + { + "epoch": 2.01, + "learning_rate": 5.178283485956008e-07, + "loss": 0.4287, + "step": 78463 + }, + { + "epoch": 2.01, + "learning_rate": 5.178041073384502e-07, + "loss": 0.3582, + "step": 78464 + }, + { + "epoch": 2.01, + "learning_rate": 5.177798664504946e-07, + "loss": 0.2697, + "step": 78465 + }, + { + "epoch": 2.01, + "learning_rate": 5.177556259317531e-07, + "loss": 0.3721, + "step": 78466 + }, + { + "epoch": 2.01, + "learning_rate": 5.177313857822437e-07, + "loss": 0.3696, + "step": 78467 + }, + { + "epoch": 2.01, + "learning_rate": 5.17707146001985e-07, + "loss": 0.4487, + "step": 78468 + }, + { + "epoch": 2.01, + "learning_rate": 5.176829065909958e-07, + "loss": 0.4062, + "step": 78469 + }, + { + "epoch": 2.01, + "learning_rate": 5.176586675492951e-07, + "loss": 0.2988, + "step": 78470 + }, + { + "epoch": 2.01, + "learning_rate": 5.176344288769006e-07, + "loss": 0.2781, + "step": 78471 + }, + { + "epoch": 2.01, + "learning_rate": 5.176101905738311e-07, + "loss": 0.4165, + "step": 78472 + }, + { + "epoch": 2.01, + "learning_rate": 5.175859526401059e-07, + "loss": 0.4756, + "step": 78473 + }, + { + "epoch": 2.01, + "learning_rate": 5.175617150757427e-07, + "loss": 0.4834, + "step": 78474 + }, + { + "epoch": 2.01, + "learning_rate": 5.175374778807599e-07, + "loss": 0.3411, + "step": 78475 + }, + { + "epoch": 2.01, + "learning_rate": 5.175132410551768e-07, + "loss": 0.4424, + "step": 78476 + }, + { + "epoch": 2.01, + "learning_rate": 5.174890045990115e-07, + "loss": 0.4062, + "step": 78477 + }, + { + "epoch": 2.01, + "learning_rate": 5.174647685122828e-07, + "loss": 0.4121, + "step": 78478 + }, + { + "epoch": 2.01, + "learning_rate": 5.174405327950091e-07, + "loss": 0.4736, + "step": 78479 + }, + { + "epoch": 2.01, + "learning_rate": 5.174162974472088e-07, + "loss": 0.3989, + "step": 78480 + }, + { + "epoch": 2.01, + "learning_rate": 5.173920624689007e-07, + "loss": 0.3669, + "step": 78481 + }, + { + "epoch": 2.01, + "learning_rate": 5.173678278601037e-07, + "loss": 0.3014, + "step": 78482 + }, + { + "epoch": 2.01, + "learning_rate": 5.173435936208357e-07, + "loss": 0.4014, + "step": 78483 + }, + { + "epoch": 2.01, + "learning_rate": 5.173193597511156e-07, + "loss": 0.4167, + "step": 78484 + }, + { + "epoch": 2.01, + "learning_rate": 5.172951262509617e-07, + "loss": 0.5088, + "step": 78485 + }, + { + "epoch": 2.01, + "learning_rate": 5.172708931203927e-07, + "loss": 0.5156, + "step": 78486 + }, + { + "epoch": 2.01, + "learning_rate": 5.172466603594277e-07, + "loss": 0.4492, + "step": 78487 + }, + { + "epoch": 2.01, + "learning_rate": 5.172224279680842e-07, + "loss": 0.4069, + "step": 78488 + }, + { + "epoch": 2.01, + "learning_rate": 5.171981959463811e-07, + "loss": 0.3989, + "step": 78489 + }, + { + "epoch": 2.01, + "learning_rate": 5.171739642943378e-07, + "loss": 0.415, + "step": 78490 + }, + { + "epoch": 2.01, + "learning_rate": 5.171497330119718e-07, + "loss": 0.3573, + "step": 78491 + }, + { + "epoch": 2.01, + "learning_rate": 5.17125502099302e-07, + "loss": 0.3462, + "step": 78492 + }, + { + "epoch": 2.01, + "learning_rate": 5.17101271556347e-07, + "loss": 0.3118, + "step": 78493 + }, + { + "epoch": 2.01, + "learning_rate": 5.170770413831255e-07, + "loss": 0.3899, + "step": 78494 + }, + { + "epoch": 2.01, + "learning_rate": 5.170528115796563e-07, + "loss": 0.3794, + "step": 78495 + }, + { + "epoch": 2.01, + "learning_rate": 5.17028582145957e-07, + "loss": 0.4736, + "step": 78496 + }, + { + "epoch": 2.01, + "learning_rate": 5.170043530820467e-07, + "loss": 0.4072, + "step": 78497 + }, + { + "epoch": 2.01, + "learning_rate": 5.169801243879439e-07, + "loss": 0.3979, + "step": 78498 + }, + { + "epoch": 2.01, + "learning_rate": 5.169558960636677e-07, + "loss": 0.4138, + "step": 78499 + }, + { + "epoch": 2.01, + "learning_rate": 5.169316681092357e-07, + "loss": 0.3862, + "step": 78500 + }, + { + "epoch": 2.01, + "learning_rate": 5.16907440524667e-07, + "loss": 0.4111, + "step": 78501 + }, + { + "epoch": 2.01, + "learning_rate": 5.168832133099798e-07, + "loss": 0.4458, + "step": 78502 + }, + { + "epoch": 2.01, + "learning_rate": 5.168589864651935e-07, + "loss": 0.5, + "step": 78503 + }, + { + "epoch": 2.01, + "learning_rate": 5.168347599903262e-07, + "loss": 0.4204, + "step": 78504 + }, + { + "epoch": 2.01, + "learning_rate": 5.168105338853958e-07, + "loss": 0.4819, + "step": 78505 + }, + { + "epoch": 2.01, + "learning_rate": 5.167863081504214e-07, + "loss": 0.2122, + "step": 78506 + }, + { + "epoch": 2.01, + "learning_rate": 5.167620827854217e-07, + "loss": 0.4575, + "step": 78507 + }, + { + "epoch": 2.01, + "learning_rate": 5.167378577904148e-07, + "loss": 0.4292, + "step": 78508 + }, + { + "epoch": 2.01, + "learning_rate": 5.167136331654194e-07, + "loss": 0.394, + "step": 78509 + }, + { + "epoch": 2.01, + "learning_rate": 5.166894089104543e-07, + "loss": 0.3682, + "step": 78510 + }, + { + "epoch": 2.01, + "learning_rate": 5.166651850255382e-07, + "loss": 0.4988, + "step": 78511 + }, + { + "epoch": 2.01, + "learning_rate": 5.166409615106891e-07, + "loss": 0.3689, + "step": 78512 + }, + { + "epoch": 2.01, + "learning_rate": 5.166167383659255e-07, + "loss": 0.4268, + "step": 78513 + }, + { + "epoch": 2.01, + "learning_rate": 5.165925155912669e-07, + "loss": 0.5088, + "step": 78514 + }, + { + "epoch": 2.01, + "learning_rate": 5.165682931867306e-07, + "loss": 0.2888, + "step": 78515 + }, + { + "epoch": 2.01, + "learning_rate": 5.165440711523363e-07, + "loss": 0.5664, + "step": 78516 + }, + { + "epoch": 2.01, + "learning_rate": 5.165198494881013e-07, + "loss": 0.4888, + "step": 78517 + }, + { + "epoch": 2.01, + "learning_rate": 5.164956281940452e-07, + "loss": 0.2608, + "step": 78518 + }, + { + "epoch": 2.01, + "learning_rate": 5.164714072701859e-07, + "loss": 0.4946, + "step": 78519 + }, + { + "epoch": 2.01, + "learning_rate": 5.164471867165428e-07, + "loss": 0.5596, + "step": 78520 + }, + { + "epoch": 2.01, + "learning_rate": 5.164229665331333e-07, + "loss": 0.4773, + "step": 78521 + }, + { + "epoch": 2.01, + "learning_rate": 5.163987467199764e-07, + "loss": 0.332, + "step": 78522 + }, + { + "epoch": 2.01, + "learning_rate": 5.163745272770909e-07, + "loss": 0.4453, + "step": 78523 + }, + { + "epoch": 2.01, + "learning_rate": 5.16350308204496e-07, + "loss": 0.3879, + "step": 78524 + }, + { + "epoch": 2.01, + "learning_rate": 5.163260895022086e-07, + "loss": 0.283, + "step": 78525 + }, + { + "epoch": 2.01, + "learning_rate": 5.163018711702481e-07, + "loss": 0.3926, + "step": 78526 + }, + { + "epoch": 2.01, + "learning_rate": 5.162776532086331e-07, + "loss": 0.394, + "step": 78527 + }, + { + "epoch": 2.01, + "learning_rate": 5.162534356173822e-07, + "loss": 0.363, + "step": 78528 + }, + { + "epoch": 2.01, + "learning_rate": 5.162292183965135e-07, + "loss": 0.4561, + "step": 78529 + }, + { + "epoch": 2.01, + "learning_rate": 5.16205001546046e-07, + "loss": 0.4351, + "step": 78530 + }, + { + "epoch": 2.01, + "learning_rate": 5.161807850659978e-07, + "loss": 0.2691, + "step": 78531 + }, + { + "epoch": 2.01, + "learning_rate": 5.161565689563884e-07, + "loss": 0.3257, + "step": 78532 + }, + { + "epoch": 2.01, + "learning_rate": 5.161323532172352e-07, + "loss": 0.3409, + "step": 78533 + }, + { + "epoch": 2.01, + "learning_rate": 5.161081378485576e-07, + "loss": 0.4316, + "step": 78534 + }, + { + "epoch": 2.01, + "learning_rate": 5.160839228503733e-07, + "loss": 0.4209, + "step": 78535 + }, + { + "epoch": 2.01, + "learning_rate": 5.160597082227012e-07, + "loss": 0.2959, + "step": 78536 + }, + { + "epoch": 2.01, + "learning_rate": 5.160354939655604e-07, + "loss": 0.3508, + "step": 78537 + }, + { + "epoch": 2.01, + "learning_rate": 5.160112800789686e-07, + "loss": 0.3276, + "step": 78538 + }, + { + "epoch": 2.01, + "learning_rate": 5.159870665629449e-07, + "loss": 0.4136, + "step": 78539 + }, + { + "epoch": 2.01, + "learning_rate": 5.159628534175075e-07, + "loss": 0.4636, + "step": 78540 + }, + { + "epoch": 2.01, + "learning_rate": 5.159386406426753e-07, + "loss": 0.4517, + "step": 78541 + }, + { + "epoch": 2.01, + "learning_rate": 5.159144282384664e-07, + "loss": 0.3843, + "step": 78542 + }, + { + "epoch": 2.01, + "learning_rate": 5.158902162048996e-07, + "loss": 0.2074, + "step": 78543 + }, + { + "epoch": 2.01, + "learning_rate": 5.158660045419938e-07, + "loss": 0.5093, + "step": 78544 + }, + { + "epoch": 2.01, + "learning_rate": 5.158417932497669e-07, + "loss": 0.428, + "step": 78545 + }, + { + "epoch": 2.01, + "learning_rate": 5.158175823282376e-07, + "loss": 0.4746, + "step": 78546 + }, + { + "epoch": 2.01, + "learning_rate": 5.157933717774243e-07, + "loss": 0.3682, + "step": 78547 + }, + { + "epoch": 2.01, + "learning_rate": 5.157691615973459e-07, + "loss": 0.4893, + "step": 78548 + }, + { + "epoch": 2.01, + "learning_rate": 5.15744951788021e-07, + "loss": 0.2278, + "step": 78549 + }, + { + "epoch": 2.01, + "learning_rate": 5.157207423494677e-07, + "loss": 0.4609, + "step": 78550 + }, + { + "epoch": 2.01, + "learning_rate": 5.156965332817048e-07, + "loss": 0.4099, + "step": 78551 + }, + { + "epoch": 2.01, + "learning_rate": 5.156723245847506e-07, + "loss": 0.4043, + "step": 78552 + }, + { + "epoch": 2.01, + "learning_rate": 5.156481162586244e-07, + "loss": 0.3447, + "step": 78553 + }, + { + "epoch": 2.01, + "learning_rate": 5.15623908303344e-07, + "loss": 0.3508, + "step": 78554 + }, + { + "epoch": 2.01, + "learning_rate": 5.155997007189279e-07, + "loss": 0.5229, + "step": 78555 + }, + { + "epoch": 2.01, + "learning_rate": 5.155754935053946e-07, + "loss": 0.3821, + "step": 78556 + }, + { + "epoch": 2.01, + "learning_rate": 5.15551286662763e-07, + "loss": 0.4043, + "step": 78557 + }, + { + "epoch": 2.01, + "learning_rate": 5.155270801910519e-07, + "loss": 0.3872, + "step": 78558 + }, + { + "epoch": 2.01, + "learning_rate": 5.155028740902791e-07, + "loss": 0.4561, + "step": 78559 + }, + { + "epoch": 2.01, + "learning_rate": 5.154786683604633e-07, + "loss": 0.3933, + "step": 78560 + }, + { + "epoch": 2.01, + "learning_rate": 5.154544630016234e-07, + "loss": 0.3643, + "step": 78561 + }, + { + "epoch": 2.01, + "learning_rate": 5.154302580137781e-07, + "loss": 0.4387, + "step": 78562 + }, + { + "epoch": 2.01, + "learning_rate": 5.154060533969451e-07, + "loss": 0.254, + "step": 78563 + }, + { + "epoch": 2.01, + "learning_rate": 5.153818491511438e-07, + "loss": 0.4277, + "step": 78564 + }, + { + "epoch": 2.01, + "learning_rate": 5.153576452763919e-07, + "loss": 0.4375, + "step": 78565 + }, + { + "epoch": 2.01, + "learning_rate": 5.153334417727089e-07, + "loss": 0.386, + "step": 78566 + }, + { + "epoch": 2.01, + "learning_rate": 5.153092386401123e-07, + "loss": 0.3025, + "step": 78567 + }, + { + "epoch": 2.01, + "learning_rate": 5.152850358786211e-07, + "loss": 0.4204, + "step": 78568 + }, + { + "epoch": 2.01, + "learning_rate": 5.15260833488254e-07, + "loss": 0.4614, + "step": 78569 + }, + { + "epoch": 2.01, + "learning_rate": 5.152366314690297e-07, + "loss": 0.5425, + "step": 78570 + }, + { + "epoch": 2.01, + "learning_rate": 5.15212429820966e-07, + "loss": 0.603, + "step": 78571 + }, + { + "epoch": 2.01, + "learning_rate": 5.151882285440818e-07, + "loss": 0.304, + "step": 78572 + }, + { + "epoch": 2.01, + "learning_rate": 5.151640276383958e-07, + "loss": 0.4917, + "step": 78573 + }, + { + "epoch": 2.01, + "learning_rate": 5.151398271039269e-07, + "loss": 0.4482, + "step": 78574 + }, + { + "epoch": 2.01, + "learning_rate": 5.151156269406929e-07, + "loss": 0.3727, + "step": 78575 + }, + { + "epoch": 2.01, + "learning_rate": 5.150914271487124e-07, + "loss": 0.4717, + "step": 78576 + }, + { + "epoch": 2.01, + "learning_rate": 5.150672277280039e-07, + "loss": 0.345, + "step": 78577 + }, + { + "epoch": 2.01, + "learning_rate": 5.150430286785862e-07, + "loss": 0.4756, + "step": 78578 + }, + { + "epoch": 2.01, + "learning_rate": 5.150188300004781e-07, + "loss": 0.3235, + "step": 78579 + }, + { + "epoch": 2.01, + "learning_rate": 5.149946316936975e-07, + "loss": 0.4438, + "step": 78580 + }, + { + "epoch": 2.01, + "learning_rate": 5.149704337582631e-07, + "loss": 0.5303, + "step": 78581 + }, + { + "epoch": 2.01, + "learning_rate": 5.149462361941941e-07, + "loss": 0.4941, + "step": 78582 + }, + { + "epoch": 2.01, + "learning_rate": 5.149220390015079e-07, + "loss": 0.4819, + "step": 78583 + }, + { + "epoch": 2.01, + "learning_rate": 5.148978421802239e-07, + "loss": 0.4653, + "step": 78584 + }, + { + "epoch": 2.01, + "learning_rate": 5.148736457303601e-07, + "loss": 0.6069, + "step": 78585 + }, + { + "epoch": 2.01, + "learning_rate": 5.148494496519353e-07, + "loss": 0.3257, + "step": 78586 + }, + { + "epoch": 2.01, + "learning_rate": 5.148252539449682e-07, + "loss": 0.3374, + "step": 78587 + }, + { + "epoch": 2.01, + "learning_rate": 5.148010586094768e-07, + "loss": 0.2526, + "step": 78588 + }, + { + "epoch": 2.01, + "learning_rate": 5.147768636454799e-07, + "loss": 0.3347, + "step": 78589 + }, + { + "epoch": 2.01, + "learning_rate": 5.14752669052996e-07, + "loss": 0.3048, + "step": 78590 + }, + { + "epoch": 2.01, + "learning_rate": 5.14728474832044e-07, + "loss": 0.438, + "step": 78591 + }, + { + "epoch": 2.01, + "learning_rate": 5.147042809826418e-07, + "loss": 0.4099, + "step": 78592 + }, + { + "epoch": 2.01, + "learning_rate": 5.146800875048083e-07, + "loss": 0.4702, + "step": 78593 + }, + { + "epoch": 2.01, + "learning_rate": 5.146558943985622e-07, + "loss": 0.415, + "step": 78594 + }, + { + "epoch": 2.01, + "learning_rate": 5.146317016639215e-07, + "loss": 0.3595, + "step": 78595 + }, + { + "epoch": 2.01, + "learning_rate": 5.146075093009052e-07, + "loss": 0.4878, + "step": 78596 + }, + { + "epoch": 2.01, + "learning_rate": 5.145833173095313e-07, + "loss": 0.3767, + "step": 78597 + }, + { + "epoch": 2.01, + "learning_rate": 5.145591256898187e-07, + "loss": 0.2612, + "step": 78598 + }, + { + "epoch": 2.01, + "learning_rate": 5.145349344417862e-07, + "loss": 0.4951, + "step": 78599 + }, + { + "epoch": 2.01, + "learning_rate": 5.145107435654516e-07, + "loss": 0.4282, + "step": 78600 + }, + { + "epoch": 2.01, + "learning_rate": 5.144865530608337e-07, + "loss": 0.4956, + "step": 78601 + }, + { + "epoch": 2.01, + "learning_rate": 5.144623629279512e-07, + "loss": 0.4697, + "step": 78602 + }, + { + "epoch": 2.01, + "learning_rate": 5.14438173166823e-07, + "loss": 0.417, + "step": 78603 + }, + { + "epoch": 2.01, + "learning_rate": 5.14413983777467e-07, + "loss": 0.4692, + "step": 78604 + }, + { + "epoch": 2.01, + "learning_rate": 5.143897947599017e-07, + "loss": 0.3602, + "step": 78605 + }, + { + "epoch": 2.01, + "learning_rate": 5.143656061141457e-07, + "loss": 0.5024, + "step": 78606 + }, + { + "epoch": 2.01, + "learning_rate": 5.143414178402176e-07, + "loss": 0.3263, + "step": 78607 + }, + { + "epoch": 2.01, + "learning_rate": 5.143172299381364e-07, + "loss": 0.3843, + "step": 78608 + }, + { + "epoch": 2.01, + "learning_rate": 5.142930424079197e-07, + "loss": 0.2759, + "step": 78609 + }, + { + "epoch": 2.01, + "learning_rate": 5.142688552495865e-07, + "loss": 0.4199, + "step": 78610 + }, + { + "epoch": 2.01, + "learning_rate": 5.142446684631554e-07, + "loss": 0.3435, + "step": 78611 + }, + { + "epoch": 2.01, + "learning_rate": 5.142204820486451e-07, + "loss": 0.3486, + "step": 78612 + }, + { + "epoch": 2.01, + "learning_rate": 5.141962960060739e-07, + "loss": 0.3682, + "step": 78613 + }, + { + "epoch": 2.01, + "learning_rate": 5.141721103354597e-07, + "loss": 0.4309, + "step": 78614 + }, + { + "epoch": 2.01, + "learning_rate": 5.141479250368218e-07, + "loss": 0.4854, + "step": 78615 + }, + { + "epoch": 2.01, + "learning_rate": 5.141237401101788e-07, + "loss": 0.4478, + "step": 78616 + }, + { + "epoch": 2.01, + "learning_rate": 5.140995555555485e-07, + "loss": 0.4619, + "step": 78617 + }, + { + "epoch": 2.02, + "learning_rate": 5.140753713729499e-07, + "loss": 0.4614, + "step": 78618 + }, + { + "epoch": 2.02, + "learning_rate": 5.140511875624014e-07, + "loss": 0.4287, + "step": 78619 + }, + { + "epoch": 2.02, + "learning_rate": 5.140270041239219e-07, + "loss": 0.3721, + "step": 78620 + }, + { + "epoch": 2.02, + "learning_rate": 5.140028210575292e-07, + "loss": 0.5088, + "step": 78621 + }, + { + "epoch": 2.02, + "learning_rate": 5.139786383632423e-07, + "loss": 0.3442, + "step": 78622 + }, + { + "epoch": 2.02, + "learning_rate": 5.139544560410799e-07, + "loss": 0.4316, + "step": 78623 + }, + { + "epoch": 2.02, + "learning_rate": 5.139302740910598e-07, + "loss": 0.52, + "step": 78624 + }, + { + "epoch": 2.02, + "learning_rate": 5.139060925132015e-07, + "loss": 0.2688, + "step": 78625 + }, + { + "epoch": 2.02, + "learning_rate": 5.138819113075223e-07, + "loss": 0.3862, + "step": 78626 + }, + { + "epoch": 2.02, + "learning_rate": 5.138577304740417e-07, + "loss": 0.4937, + "step": 78627 + }, + { + "epoch": 2.02, + "learning_rate": 5.138335500127776e-07, + "loss": 0.3457, + "step": 78628 + }, + { + "epoch": 2.02, + "learning_rate": 5.138093699237493e-07, + "loss": 0.3499, + "step": 78629 + }, + { + "epoch": 2.02, + "learning_rate": 5.137851902069744e-07, + "loss": 0.459, + "step": 78630 + }, + { + "epoch": 2.02, + "learning_rate": 5.137610108624719e-07, + "loss": 0.3333, + "step": 78631 + }, + { + "epoch": 2.02, + "learning_rate": 5.137368318902601e-07, + "loss": 0.5024, + "step": 78632 + }, + { + "epoch": 2.02, + "learning_rate": 5.137126532903587e-07, + "loss": 0.4531, + "step": 78633 + }, + { + "epoch": 2.02, + "learning_rate": 5.136884750627841e-07, + "loss": 0.439, + "step": 78634 + }, + { + "epoch": 2.02, + "learning_rate": 5.136642972075559e-07, + "loss": 0.4985, + "step": 78635 + }, + { + "epoch": 2.02, + "learning_rate": 5.136401197246927e-07, + "loss": 0.397, + "step": 78636 + }, + { + "epoch": 2.02, + "learning_rate": 5.136159426142132e-07, + "loss": 0.3462, + "step": 78637 + }, + { + "epoch": 2.02, + "learning_rate": 5.135917658761351e-07, + "loss": 0.3052, + "step": 78638 + }, + { + "epoch": 2.02, + "learning_rate": 5.135675895104776e-07, + "loss": 0.4736, + "step": 78639 + }, + { + "epoch": 2.02, + "learning_rate": 5.135434135172591e-07, + "loss": 0.4385, + "step": 78640 + }, + { + "epoch": 2.02, + "learning_rate": 5.135192378964983e-07, + "loss": 0.4419, + "step": 78641 + }, + { + "epoch": 2.02, + "learning_rate": 5.13495062648213e-07, + "loss": 0.4199, + "step": 78642 + }, + { + "epoch": 2.02, + "learning_rate": 5.134708877724228e-07, + "loss": 0.4482, + "step": 78643 + }, + { + "epoch": 2.02, + "learning_rate": 5.134467132691449e-07, + "loss": 0.4917, + "step": 78644 + }, + { + "epoch": 2.02, + "learning_rate": 5.134225391383986e-07, + "loss": 0.3989, + "step": 78645 + }, + { + "epoch": 2.02, + "learning_rate": 5.133983653802026e-07, + "loss": 0.3423, + "step": 78646 + }, + { + "epoch": 2.02, + "learning_rate": 5.133741919945749e-07, + "loss": 0.5015, + "step": 78647 + }, + { + "epoch": 2.02, + "learning_rate": 5.13350018981534e-07, + "loss": 0.4385, + "step": 78648 + }, + { + "epoch": 2.02, + "learning_rate": 5.133258463410988e-07, + "loss": 0.4165, + "step": 78649 + }, + { + "epoch": 2.02, + "learning_rate": 5.133016740732878e-07, + "loss": 0.4834, + "step": 78650 + }, + { + "epoch": 2.02, + "learning_rate": 5.13277502178119e-07, + "loss": 0.4053, + "step": 78651 + }, + { + "epoch": 2.02, + "learning_rate": 5.132533306556114e-07, + "loss": 0.5059, + "step": 78652 + }, + { + "epoch": 2.02, + "learning_rate": 5.132291595057836e-07, + "loss": 0.3955, + "step": 78653 + }, + { + "epoch": 2.02, + "learning_rate": 5.132049887286539e-07, + "loss": 0.4282, + "step": 78654 + }, + { + "epoch": 2.02, + "learning_rate": 5.131808183242403e-07, + "loss": 0.2925, + "step": 78655 + }, + { + "epoch": 2.02, + "learning_rate": 5.131566482925618e-07, + "loss": 0.342, + "step": 78656 + }, + { + "epoch": 2.02, + "learning_rate": 5.131324786336368e-07, + "loss": 0.3667, + "step": 78657 + }, + { + "epoch": 2.02, + "learning_rate": 5.131083093474844e-07, + "loss": 0.4287, + "step": 78658 + }, + { + "epoch": 2.02, + "learning_rate": 5.130841404341221e-07, + "loss": 0.3589, + "step": 78659 + }, + { + "epoch": 2.02, + "learning_rate": 5.130599718935689e-07, + "loss": 0.4141, + "step": 78660 + }, + { + "epoch": 2.02, + "learning_rate": 5.130358037258434e-07, + "loss": 0.3657, + "step": 78661 + }, + { + "epoch": 2.02, + "learning_rate": 5.130116359309642e-07, + "loss": 0.4629, + "step": 78662 + }, + { + "epoch": 2.02, + "learning_rate": 5.129874685089497e-07, + "loss": 0.3833, + "step": 78663 + }, + { + "epoch": 2.02, + "learning_rate": 5.129633014598178e-07, + "loss": 0.3691, + "step": 78664 + }, + { + "epoch": 2.02, + "learning_rate": 5.129391347835876e-07, + "loss": 0.3706, + "step": 78665 + }, + { + "epoch": 2.02, + "learning_rate": 5.129149684802776e-07, + "loss": 0.4521, + "step": 78666 + }, + { + "epoch": 2.02, + "learning_rate": 5.128908025499065e-07, + "loss": 0.3497, + "step": 78667 + }, + { + "epoch": 2.02, + "learning_rate": 5.128666369924921e-07, + "loss": 0.3372, + "step": 78668 + }, + { + "epoch": 2.02, + "learning_rate": 5.128424718080533e-07, + "loss": 0.5107, + "step": 78669 + }, + { + "epoch": 2.02, + "learning_rate": 5.128183069966091e-07, + "loss": 0.4536, + "step": 78670 + }, + { + "epoch": 2.02, + "learning_rate": 5.12794142558177e-07, + "loss": 0.4155, + "step": 78671 + }, + { + "epoch": 2.02, + "learning_rate": 5.127699784927762e-07, + "loss": 0.5718, + "step": 78672 + }, + { + "epoch": 2.02, + "learning_rate": 5.127458148004253e-07, + "loss": 0.4248, + "step": 78673 + }, + { + "epoch": 2.02, + "learning_rate": 5.127216514811422e-07, + "loss": 0.406, + "step": 78674 + }, + { + "epoch": 2.02, + "learning_rate": 5.126974885349461e-07, + "loss": 0.3746, + "step": 78675 + }, + { + "epoch": 2.02, + "learning_rate": 5.126733259618547e-07, + "loss": 0.4204, + "step": 78676 + }, + { + "epoch": 2.02, + "learning_rate": 5.12649163761887e-07, + "loss": 0.3596, + "step": 78677 + }, + { + "epoch": 2.02, + "learning_rate": 5.126250019350613e-07, + "loss": 0.4507, + "step": 78678 + }, + { + "epoch": 2.02, + "learning_rate": 5.126008404813966e-07, + "loss": 0.2878, + "step": 78679 + }, + { + "epoch": 2.02, + "learning_rate": 5.125766794009107e-07, + "loss": 0.5249, + "step": 78680 + }, + { + "epoch": 2.02, + "learning_rate": 5.125525186936226e-07, + "loss": 0.3894, + "step": 78681 + }, + { + "epoch": 2.02, + "learning_rate": 5.125283583595504e-07, + "loss": 0.3418, + "step": 78682 + }, + { + "epoch": 2.02, + "learning_rate": 5.125041983987133e-07, + "loss": 0.3989, + "step": 78683 + }, + { + "epoch": 2.02, + "learning_rate": 5.124800388111292e-07, + "loss": 0.3623, + "step": 78684 + }, + { + "epoch": 2.02, + "learning_rate": 5.124558795968165e-07, + "loss": 0.4015, + "step": 78685 + }, + { + "epoch": 2.02, + "learning_rate": 5.124317207557938e-07, + "loss": 0.312, + "step": 78686 + }, + { + "epoch": 2.02, + "learning_rate": 5.124075622880801e-07, + "loss": 0.3103, + "step": 78687 + }, + { + "epoch": 2.02, + "learning_rate": 5.123834041936931e-07, + "loss": 0.4565, + "step": 78688 + }, + { + "epoch": 2.02, + "learning_rate": 5.123592464726518e-07, + "loss": 0.3923, + "step": 78689 + }, + { + "epoch": 2.02, + "learning_rate": 5.123350891249747e-07, + "loss": 0.4399, + "step": 78690 + }, + { + "epoch": 2.02, + "learning_rate": 5.123109321506804e-07, + "loss": 0.502, + "step": 78691 + }, + { + "epoch": 2.02, + "learning_rate": 5.122867755497868e-07, + "loss": 0.3677, + "step": 78692 + }, + { + "epoch": 2.02, + "learning_rate": 5.122626193223133e-07, + "loss": 0.5039, + "step": 78693 + }, + { + "epoch": 2.02, + "learning_rate": 5.122384634682775e-07, + "loss": 0.4092, + "step": 78694 + }, + { + "epoch": 2.02, + "learning_rate": 5.122143079876982e-07, + "loss": 0.4092, + "step": 78695 + }, + { + "epoch": 2.02, + "learning_rate": 5.121901528805943e-07, + "loss": 0.4028, + "step": 78696 + }, + { + "epoch": 2.02, + "learning_rate": 5.121659981469837e-07, + "loss": 0.3535, + "step": 78697 + }, + { + "epoch": 2.02, + "learning_rate": 5.121418437868852e-07, + "loss": 0.3965, + "step": 78698 + }, + { + "epoch": 2.02, + "learning_rate": 5.121176898003171e-07, + "loss": 0.3828, + "step": 78699 + }, + { + "epoch": 2.02, + "learning_rate": 5.120935361872986e-07, + "loss": 0.519, + "step": 78700 + }, + { + "epoch": 2.02, + "learning_rate": 5.120693829478471e-07, + "loss": 0.4272, + "step": 78701 + }, + { + "epoch": 2.02, + "learning_rate": 5.120452300819818e-07, + "loss": 0.3315, + "step": 78702 + }, + { + "epoch": 2.02, + "learning_rate": 5.120210775897213e-07, + "loss": 0.4663, + "step": 78703 + }, + { + "epoch": 2.02, + "learning_rate": 5.119969254710838e-07, + "loss": 0.3298, + "step": 78704 + }, + { + "epoch": 2.02, + "learning_rate": 5.119727737260875e-07, + "loss": 0.2684, + "step": 78705 + }, + { + "epoch": 2.02, + "learning_rate": 5.119486223547513e-07, + "loss": 0.4644, + "step": 78706 + }, + { + "epoch": 2.02, + "learning_rate": 5.119244713570934e-07, + "loss": 0.4224, + "step": 78707 + }, + { + "epoch": 2.02, + "learning_rate": 5.11900320733133e-07, + "loss": 0.3899, + "step": 78708 + }, + { + "epoch": 2.02, + "learning_rate": 5.118761704828876e-07, + "loss": 0.3794, + "step": 78709 + }, + { + "epoch": 2.02, + "learning_rate": 5.118520206063763e-07, + "loss": 0.4673, + "step": 78710 + }, + { + "epoch": 2.02, + "learning_rate": 5.118278711036174e-07, + "loss": 0.2765, + "step": 78711 + }, + { + "epoch": 2.02, + "learning_rate": 5.118037219746298e-07, + "loss": 0.3813, + "step": 78712 + }, + { + "epoch": 2.02, + "learning_rate": 5.117795732194316e-07, + "loss": 0.3481, + "step": 78713 + }, + { + "epoch": 2.02, + "learning_rate": 5.117554248380412e-07, + "loss": 0.4282, + "step": 78714 + }, + { + "epoch": 2.02, + "learning_rate": 5.11731276830477e-07, + "loss": 0.3789, + "step": 78715 + }, + { + "epoch": 2.02, + "learning_rate": 5.117071291967578e-07, + "loss": 0.3623, + "step": 78716 + }, + { + "epoch": 2.02, + "learning_rate": 5.116829819369023e-07, + "loss": 0.3073, + "step": 78717 + }, + { + "epoch": 2.02, + "learning_rate": 5.116588350509284e-07, + "loss": 0.4214, + "step": 78718 + }, + { + "epoch": 2.02, + "learning_rate": 5.116346885388547e-07, + "loss": 0.26, + "step": 78719 + }, + { + "epoch": 2.02, + "learning_rate": 5.116105424007e-07, + "loss": 0.3879, + "step": 78720 + }, + { + "epoch": 2.02, + "learning_rate": 5.115863966364831e-07, + "loss": 0.4089, + "step": 78721 + }, + { + "epoch": 2.02, + "learning_rate": 5.115622512462215e-07, + "loss": 0.3378, + "step": 78722 + }, + { + "epoch": 2.02, + "learning_rate": 5.115381062299347e-07, + "loss": 0.5015, + "step": 78723 + }, + { + "epoch": 2.02, + "learning_rate": 5.115139615876403e-07, + "loss": 0.4062, + "step": 78724 + }, + { + "epoch": 2.02, + "learning_rate": 5.114898173193576e-07, + "loss": 0.478, + "step": 78725 + }, + { + "epoch": 2.02, + "learning_rate": 5.114656734251043e-07, + "loss": 0.3691, + "step": 78726 + }, + { + "epoch": 2.02, + "learning_rate": 5.114415299048993e-07, + "loss": 0.4316, + "step": 78727 + }, + { + "epoch": 2.02, + "learning_rate": 5.114173867587611e-07, + "loss": 0.376, + "step": 78728 + }, + { + "epoch": 2.02, + "learning_rate": 5.113932439867084e-07, + "loss": 0.4007, + "step": 78729 + }, + { + "epoch": 2.02, + "learning_rate": 5.113691015887591e-07, + "loss": 0.3838, + "step": 78730 + }, + { + "epoch": 2.02, + "learning_rate": 5.113449595649319e-07, + "loss": 0.4146, + "step": 78731 + }, + { + "epoch": 2.02, + "learning_rate": 5.113208179152455e-07, + "loss": 0.4302, + "step": 78732 + }, + { + "epoch": 2.02, + "learning_rate": 5.112966766397187e-07, + "loss": 0.4807, + "step": 78733 + }, + { + "epoch": 2.02, + "learning_rate": 5.112725357383696e-07, + "loss": 0.3211, + "step": 78734 + }, + { + "epoch": 2.02, + "learning_rate": 5.112483952112161e-07, + "loss": 0.4053, + "step": 78735 + }, + { + "epoch": 2.02, + "learning_rate": 5.112242550582772e-07, + "loss": 0.2922, + "step": 78736 + }, + { + "epoch": 2.02, + "learning_rate": 5.112001152795717e-07, + "loss": 0.4075, + "step": 78737 + }, + { + "epoch": 2.02, + "learning_rate": 5.11175975875118e-07, + "loss": 0.4077, + "step": 78738 + }, + { + "epoch": 2.02, + "learning_rate": 5.111518368449339e-07, + "loss": 0.3853, + "step": 78739 + }, + { + "epoch": 2.02, + "learning_rate": 5.111276981890384e-07, + "loss": 0.3555, + "step": 78740 + }, + { + "epoch": 2.02, + "learning_rate": 5.111035599074502e-07, + "loss": 0.3379, + "step": 78741 + }, + { + "epoch": 2.02, + "learning_rate": 5.110794220001876e-07, + "loss": 0.4625, + "step": 78742 + }, + { + "epoch": 2.02, + "learning_rate": 5.110552844672691e-07, + "loss": 0.479, + "step": 78743 + }, + { + "epoch": 2.02, + "learning_rate": 5.110311473087128e-07, + "loss": 0.4463, + "step": 78744 + }, + { + "epoch": 2.02, + "learning_rate": 5.110070105245374e-07, + "loss": 0.385, + "step": 78745 + }, + { + "epoch": 2.02, + "learning_rate": 5.109828741147617e-07, + "loss": 0.3652, + "step": 78746 + }, + { + "epoch": 2.02, + "learning_rate": 5.109587380794038e-07, + "loss": 0.4946, + "step": 78747 + }, + { + "epoch": 2.02, + "learning_rate": 5.109346024184821e-07, + "loss": 0.5786, + "step": 78748 + }, + { + "epoch": 2.02, + "learning_rate": 5.109104671320154e-07, + "loss": 0.4741, + "step": 78749 + }, + { + "epoch": 2.02, + "learning_rate": 5.108863322200223e-07, + "loss": 0.4746, + "step": 78750 + }, + { + "epoch": 2.02, + "learning_rate": 5.10862197682521e-07, + "loss": 0.2917, + "step": 78751 + }, + { + "epoch": 2.02, + "learning_rate": 5.108380635195296e-07, + "loss": 0.3755, + "step": 78752 + }, + { + "epoch": 2.02, + "learning_rate": 5.108139297310676e-07, + "loss": 0.3733, + "step": 78753 + }, + { + "epoch": 2.02, + "learning_rate": 5.107897963171526e-07, + "loss": 0.4685, + "step": 78754 + }, + { + "epoch": 2.02, + "learning_rate": 5.107656632778034e-07, + "loss": 0.406, + "step": 78755 + }, + { + "epoch": 2.02, + "learning_rate": 5.107415306130385e-07, + "loss": 0.46, + "step": 78756 + }, + { + "epoch": 2.02, + "learning_rate": 5.10717398322876e-07, + "loss": 0.4124, + "step": 78757 + }, + { + "epoch": 2.02, + "learning_rate": 5.106932664073348e-07, + "loss": 0.3623, + "step": 78758 + }, + { + "epoch": 2.02, + "learning_rate": 5.106691348664336e-07, + "loss": 0.5234, + "step": 78759 + }, + { + "epoch": 2.02, + "learning_rate": 5.106450037001902e-07, + "loss": 0.3569, + "step": 78760 + }, + { + "epoch": 2.02, + "learning_rate": 5.106208729086234e-07, + "loss": 0.3523, + "step": 78761 + }, + { + "epoch": 2.02, + "learning_rate": 5.105967424917521e-07, + "loss": 0.3298, + "step": 78762 + }, + { + "epoch": 2.02, + "learning_rate": 5.105726124495944e-07, + "loss": 0.5, + "step": 78763 + }, + { + "epoch": 2.02, + "learning_rate": 5.105484827821683e-07, + "loss": 0.4214, + "step": 78764 + }, + { + "epoch": 2.02, + "learning_rate": 5.105243534894928e-07, + "loss": 0.3815, + "step": 78765 + }, + { + "epoch": 2.02, + "learning_rate": 5.105002245715862e-07, + "loss": 0.3162, + "step": 78766 + }, + { + "epoch": 2.02, + "learning_rate": 5.104760960284674e-07, + "loss": 0.3333, + "step": 78767 + }, + { + "epoch": 2.02, + "learning_rate": 5.104519678601542e-07, + "loss": 0.3551, + "step": 78768 + }, + { + "epoch": 2.02, + "learning_rate": 5.104278400666655e-07, + "loss": 0.5093, + "step": 78769 + }, + { + "epoch": 2.02, + "learning_rate": 5.104037126480196e-07, + "loss": 0.481, + "step": 78770 + }, + { + "epoch": 2.02, + "learning_rate": 5.103795856042357e-07, + "loss": 0.4443, + "step": 78771 + }, + { + "epoch": 2.02, + "learning_rate": 5.10355458935331e-07, + "loss": 0.5005, + "step": 78772 + }, + { + "epoch": 2.02, + "learning_rate": 5.10331332641325e-07, + "loss": 0.4473, + "step": 78773 + }, + { + "epoch": 2.02, + "learning_rate": 5.103072067222355e-07, + "loss": 0.3251, + "step": 78774 + }, + { + "epoch": 2.02, + "learning_rate": 5.102830811780812e-07, + "loss": 0.3721, + "step": 78775 + }, + { + "epoch": 2.02, + "learning_rate": 5.10258956008881e-07, + "loss": 0.5043, + "step": 78776 + }, + { + "epoch": 2.02, + "learning_rate": 5.102348312146527e-07, + "loss": 0.263, + "step": 78777 + }, + { + "epoch": 2.02, + "learning_rate": 5.102107067954148e-07, + "loss": 0.4771, + "step": 78778 + }, + { + "epoch": 2.02, + "learning_rate": 5.101865827511869e-07, + "loss": 0.4316, + "step": 78779 + }, + { + "epoch": 2.02, + "learning_rate": 5.101624590819859e-07, + "loss": 0.4211, + "step": 78780 + }, + { + "epoch": 2.02, + "learning_rate": 5.101383357878311e-07, + "loss": 0.3596, + "step": 78781 + }, + { + "epoch": 2.02, + "learning_rate": 5.101142128687407e-07, + "loss": 0.3513, + "step": 78782 + }, + { + "epoch": 2.02, + "learning_rate": 5.100900903247338e-07, + "loss": 0.4006, + "step": 78783 + }, + { + "epoch": 2.02, + "learning_rate": 5.100659681558283e-07, + "loss": 0.3853, + "step": 78784 + }, + { + "epoch": 2.02, + "learning_rate": 5.100418463620426e-07, + "loss": 0.3898, + "step": 78785 + }, + { + "epoch": 2.02, + "learning_rate": 5.100177249433951e-07, + "loss": 0.4868, + "step": 78786 + }, + { + "epoch": 2.02, + "learning_rate": 5.099936038999046e-07, + "loss": 0.4736, + "step": 78787 + }, + { + "epoch": 2.02, + "learning_rate": 5.0996948323159e-07, + "loss": 0.4281, + "step": 78788 + }, + { + "epoch": 2.02, + "learning_rate": 5.099453629384686e-07, + "loss": 0.3356, + "step": 78789 + }, + { + "epoch": 2.02, + "learning_rate": 5.099212430205595e-07, + "loss": 0.4233, + "step": 78790 + }, + { + "epoch": 2.02, + "learning_rate": 5.098971234778813e-07, + "loss": 0.3494, + "step": 78791 + }, + { + "epoch": 2.02, + "learning_rate": 5.098730043104527e-07, + "loss": 0.3166, + "step": 78792 + }, + { + "epoch": 2.02, + "learning_rate": 5.098488855182919e-07, + "loss": 0.4042, + "step": 78793 + }, + { + "epoch": 2.02, + "learning_rate": 5.098247671014167e-07, + "loss": 0.3809, + "step": 78794 + }, + { + "epoch": 2.02, + "learning_rate": 5.098006490598463e-07, + "loss": 0.3633, + "step": 78795 + }, + { + "epoch": 2.02, + "learning_rate": 5.097765313935992e-07, + "loss": 0.3703, + "step": 78796 + }, + { + "epoch": 2.02, + "learning_rate": 5.097524141026935e-07, + "loss": 0.4229, + "step": 78797 + }, + { + "epoch": 2.02, + "learning_rate": 5.097282971871476e-07, + "loss": 0.4224, + "step": 78798 + }, + { + "epoch": 2.02, + "learning_rate": 5.097041806469804e-07, + "loss": 0.3037, + "step": 78799 + }, + { + "epoch": 2.02, + "learning_rate": 5.096800644822103e-07, + "loss": 0.4795, + "step": 78800 + }, + { + "epoch": 2.02, + "learning_rate": 5.096559486928555e-07, + "loss": 0.2552, + "step": 78801 + }, + { + "epoch": 2.02, + "learning_rate": 5.096318332789344e-07, + "loss": 0.3965, + "step": 78802 + }, + { + "epoch": 2.02, + "learning_rate": 5.096077182404663e-07, + "loss": 0.3772, + "step": 78803 + }, + { + "epoch": 2.02, + "learning_rate": 5.095836035774684e-07, + "loss": 0.4697, + "step": 78804 + }, + { + "epoch": 2.02, + "learning_rate": 5.095594892899603e-07, + "loss": 0.3673, + "step": 78805 + }, + { + "epoch": 2.02, + "learning_rate": 5.095353753779595e-07, + "loss": 0.4263, + "step": 78806 + }, + { + "epoch": 2.02, + "learning_rate": 5.095112618414849e-07, + "loss": 0.375, + "step": 78807 + }, + { + "epoch": 2.02, + "learning_rate": 5.09487148680555e-07, + "loss": 0.4065, + "step": 78808 + }, + { + "epoch": 2.02, + "learning_rate": 5.094630358951887e-07, + "loss": 0.3752, + "step": 78809 + }, + { + "epoch": 2.02, + "learning_rate": 5.094389234854036e-07, + "loss": 0.5034, + "step": 78810 + }, + { + "epoch": 2.02, + "learning_rate": 5.094148114512185e-07, + "loss": 0.5215, + "step": 78811 + }, + { + "epoch": 2.02, + "learning_rate": 5.093906997926518e-07, + "loss": 0.4961, + "step": 78812 + }, + { + "epoch": 2.02, + "learning_rate": 5.09366588509723e-07, + "loss": 0.4077, + "step": 78813 + }, + { + "epoch": 2.02, + "learning_rate": 5.093424776024489e-07, + "loss": 0.4185, + "step": 78814 + }, + { + "epoch": 2.02, + "learning_rate": 5.093183670708486e-07, + "loss": 0.3772, + "step": 78815 + }, + { + "epoch": 2.02, + "learning_rate": 5.092942569149408e-07, + "loss": 0.5166, + "step": 78816 + }, + { + "epoch": 2.02, + "learning_rate": 5.092701471347441e-07, + "loss": 0.3999, + "step": 78817 + }, + { + "epoch": 2.02, + "learning_rate": 5.092460377302763e-07, + "loss": 0.4414, + "step": 78818 + }, + { + "epoch": 2.02, + "learning_rate": 5.092219287015563e-07, + "loss": 0.4526, + "step": 78819 + }, + { + "epoch": 2.02, + "learning_rate": 5.091978200486025e-07, + "loss": 0.4556, + "step": 78820 + }, + { + "epoch": 2.02, + "learning_rate": 5.091737117714336e-07, + "loss": 0.519, + "step": 78821 + }, + { + "epoch": 2.02, + "learning_rate": 5.091496038700676e-07, + "loss": 0.3682, + "step": 78822 + }, + { + "epoch": 2.02, + "learning_rate": 5.091254963445235e-07, + "loss": 0.4673, + "step": 78823 + }, + { + "epoch": 2.02, + "learning_rate": 5.09101389194819e-07, + "loss": 0.4507, + "step": 78824 + }, + { + "epoch": 2.02, + "learning_rate": 5.09077282420973e-07, + "loss": 0.2232, + "step": 78825 + }, + { + "epoch": 2.02, + "learning_rate": 5.090531760230045e-07, + "loss": 0.3772, + "step": 78826 + }, + { + "epoch": 2.02, + "learning_rate": 5.090290700009309e-07, + "loss": 0.2639, + "step": 78827 + }, + { + "epoch": 2.02, + "learning_rate": 5.090049643547711e-07, + "loss": 0.417, + "step": 78828 + }, + { + "epoch": 2.02, + "learning_rate": 5.089808590845438e-07, + "loss": 0.5361, + "step": 78829 + }, + { + "epoch": 2.02, + "learning_rate": 5.089567541902675e-07, + "loss": 0.522, + "step": 78830 + }, + { + "epoch": 2.02, + "learning_rate": 5.089326496719601e-07, + "loss": 0.3091, + "step": 78831 + }, + { + "epoch": 2.02, + "learning_rate": 5.089085455296405e-07, + "loss": 0.4448, + "step": 78832 + }, + { + "epoch": 2.02, + "learning_rate": 5.088844417633274e-07, + "loss": 0.4893, + "step": 78833 + }, + { + "epoch": 2.02, + "learning_rate": 5.088603383730387e-07, + "loss": 0.5332, + "step": 78834 + }, + { + "epoch": 2.02, + "learning_rate": 5.088362353587929e-07, + "loss": 0.5054, + "step": 78835 + }, + { + "epoch": 2.02, + "learning_rate": 5.088121327206085e-07, + "loss": 0.3767, + "step": 78836 + }, + { + "epoch": 2.02, + "learning_rate": 5.08788030458504e-07, + "loss": 0.3184, + "step": 78837 + }, + { + "epoch": 2.02, + "learning_rate": 5.087639285724985e-07, + "loss": 0.3984, + "step": 78838 + }, + { + "epoch": 2.02, + "learning_rate": 5.087398270626093e-07, + "loss": 0.3645, + "step": 78839 + }, + { + "epoch": 2.02, + "learning_rate": 5.087157259288555e-07, + "loss": 0.3809, + "step": 78840 + }, + { + "epoch": 2.02, + "learning_rate": 5.086916251712556e-07, + "loss": 0.2244, + "step": 78841 + }, + { + "epoch": 2.02, + "learning_rate": 5.086675247898281e-07, + "loss": 0.2891, + "step": 78842 + }, + { + "epoch": 2.02, + "learning_rate": 5.086434247845914e-07, + "loss": 0.3711, + "step": 78843 + }, + { + "epoch": 2.02, + "learning_rate": 5.086193251555635e-07, + "loss": 0.3826, + "step": 78844 + }, + { + "epoch": 2.02, + "learning_rate": 5.085952259027631e-07, + "loss": 0.4565, + "step": 78845 + }, + { + "epoch": 2.02, + "learning_rate": 5.085711270262088e-07, + "loss": 0.3176, + "step": 78846 + }, + { + "epoch": 2.02, + "learning_rate": 5.085470285259193e-07, + "loss": 0.3423, + "step": 78847 + }, + { + "epoch": 2.02, + "learning_rate": 5.085229304019123e-07, + "loss": 0.3625, + "step": 78848 + }, + { + "epoch": 2.02, + "learning_rate": 5.084988326542068e-07, + "loss": 0.4575, + "step": 78849 + }, + { + "epoch": 2.02, + "learning_rate": 5.084747352828216e-07, + "loss": 0.3513, + "step": 78850 + }, + { + "epoch": 2.02, + "learning_rate": 5.084506382877742e-07, + "loss": 0.4244, + "step": 78851 + }, + { + "epoch": 2.02, + "learning_rate": 5.084265416690836e-07, + "loss": 0.3672, + "step": 78852 + }, + { + "epoch": 2.02, + "learning_rate": 5.084024454267686e-07, + "loss": 0.1902, + "step": 78853 + }, + { + "epoch": 2.02, + "learning_rate": 5.083783495608467e-07, + "loss": 0.4092, + "step": 78854 + }, + { + "epoch": 2.02, + "learning_rate": 5.083542540713375e-07, + "loss": 0.4624, + "step": 78855 + }, + { + "epoch": 2.02, + "learning_rate": 5.083301589582582e-07, + "loss": 0.3463, + "step": 78856 + }, + { + "epoch": 2.02, + "learning_rate": 5.083060642216281e-07, + "loss": 0.4365, + "step": 78857 + }, + { + "epoch": 2.02, + "learning_rate": 5.082819698614653e-07, + "loss": 0.5063, + "step": 78858 + }, + { + "epoch": 2.02, + "learning_rate": 5.082578758777889e-07, + "loss": 0.4492, + "step": 78859 + }, + { + "epoch": 2.02, + "learning_rate": 5.082337822706164e-07, + "loss": 0.3477, + "step": 78860 + }, + { + "epoch": 2.02, + "learning_rate": 5.082096890399667e-07, + "loss": 0.4194, + "step": 78861 + }, + { + "epoch": 2.02, + "learning_rate": 5.081855961858581e-07, + "loss": 0.3235, + "step": 78862 + }, + { + "epoch": 2.02, + "learning_rate": 5.081615037083098e-07, + "loss": 0.3772, + "step": 78863 + }, + { + "epoch": 2.02, + "learning_rate": 5.081374116073394e-07, + "loss": 0.623, + "step": 78864 + }, + { + "epoch": 2.02, + "learning_rate": 5.081133198829652e-07, + "loss": 0.335, + "step": 78865 + }, + { + "epoch": 2.02, + "learning_rate": 5.080892285352061e-07, + "loss": 0.4785, + "step": 78866 + }, + { + "epoch": 2.02, + "learning_rate": 5.080651375640809e-07, + "loss": 0.4395, + "step": 78867 + }, + { + "epoch": 2.02, + "learning_rate": 5.080410469696071e-07, + "loss": 0.3821, + "step": 78868 + }, + { + "epoch": 2.02, + "learning_rate": 5.080169567518037e-07, + "loss": 0.2823, + "step": 78869 + }, + { + "epoch": 2.02, + "learning_rate": 5.07992866910689e-07, + "loss": 0.3213, + "step": 78870 + }, + { + "epoch": 2.02, + "learning_rate": 5.07968777446282e-07, + "loss": 0.2996, + "step": 78871 + }, + { + "epoch": 2.02, + "learning_rate": 5.079446883586003e-07, + "loss": 0.3726, + "step": 78872 + }, + { + "epoch": 2.02, + "learning_rate": 5.079205996476632e-07, + "loss": 0.2815, + "step": 78873 + }, + { + "epoch": 2.02, + "learning_rate": 5.078965113134883e-07, + "loss": 0.4175, + "step": 78874 + }, + { + "epoch": 2.02, + "learning_rate": 5.078724233560943e-07, + "loss": 0.2892, + "step": 78875 + }, + { + "epoch": 2.02, + "learning_rate": 5.078483357755001e-07, + "loss": 0.3577, + "step": 78876 + }, + { + "epoch": 2.02, + "learning_rate": 5.078242485717234e-07, + "loss": 0.2507, + "step": 78877 + }, + { + "epoch": 2.02, + "learning_rate": 5.078001617447831e-07, + "loss": 0.3133, + "step": 78878 + }, + { + "epoch": 2.02, + "learning_rate": 5.077760752946975e-07, + "loss": 0.3179, + "step": 78879 + }, + { + "epoch": 2.02, + "learning_rate": 5.077519892214857e-07, + "loss": 0.4702, + "step": 78880 + }, + { + "epoch": 2.02, + "learning_rate": 5.077279035251651e-07, + "loss": 0.4155, + "step": 78881 + }, + { + "epoch": 2.02, + "learning_rate": 5.077038182057547e-07, + "loss": 0.3638, + "step": 78882 + }, + { + "epoch": 2.02, + "learning_rate": 5.076797332632731e-07, + "loss": 0.5107, + "step": 78883 + }, + { + "epoch": 2.02, + "learning_rate": 5.076556486977386e-07, + "loss": 0.363, + "step": 78884 + }, + { + "epoch": 2.02, + "learning_rate": 5.07631564509169e-07, + "loss": 0.4351, + "step": 78885 + }, + { + "epoch": 2.02, + "learning_rate": 5.076074806975833e-07, + "loss": 0.3932, + "step": 78886 + }, + { + "epoch": 2.02, + "learning_rate": 5.07583397263e-07, + "loss": 0.437, + "step": 78887 + }, + { + "epoch": 2.02, + "learning_rate": 5.075593142054377e-07, + "loss": 0.4458, + "step": 78888 + }, + { + "epoch": 2.02, + "learning_rate": 5.075352315249144e-07, + "loss": 0.3481, + "step": 78889 + }, + { + "epoch": 2.02, + "learning_rate": 5.075111492214485e-07, + "loss": 0.46, + "step": 78890 + }, + { + "epoch": 2.02, + "learning_rate": 5.074870672950588e-07, + "loss": 0.3882, + "step": 78891 + }, + { + "epoch": 2.02, + "learning_rate": 5.074629857457641e-07, + "loss": 0.3379, + "step": 78892 + }, + { + "epoch": 2.02, + "learning_rate": 5.074389045735822e-07, + "loss": 0.4453, + "step": 78893 + }, + { + "epoch": 2.02, + "learning_rate": 5.074148237785314e-07, + "loss": 0.3887, + "step": 78894 + }, + { + "epoch": 2.02, + "learning_rate": 5.073907433606303e-07, + "loss": 0.3813, + "step": 78895 + }, + { + "epoch": 2.02, + "learning_rate": 5.073666633198974e-07, + "loss": 0.4287, + "step": 78896 + }, + { + "epoch": 2.02, + "learning_rate": 5.073425836563517e-07, + "loss": 0.3322, + "step": 78897 + }, + { + "epoch": 2.02, + "learning_rate": 5.073185043700108e-07, + "loss": 0.5239, + "step": 78898 + }, + { + "epoch": 2.02, + "learning_rate": 5.072944254608934e-07, + "loss": 0.5508, + "step": 78899 + }, + { + "epoch": 2.02, + "learning_rate": 5.07270346929018e-07, + "loss": 0.4409, + "step": 78900 + }, + { + "epoch": 2.02, + "learning_rate": 5.072462687744035e-07, + "loss": 0.4365, + "step": 78901 + }, + { + "epoch": 2.02, + "learning_rate": 5.072221909970673e-07, + "loss": 0.5244, + "step": 78902 + }, + { + "epoch": 2.02, + "learning_rate": 5.071981135970289e-07, + "loss": 0.2012, + "step": 78903 + }, + { + "epoch": 2.02, + "learning_rate": 5.07174036574306e-07, + "loss": 0.3721, + "step": 78904 + }, + { + "epoch": 2.02, + "learning_rate": 5.071499599289174e-07, + "loss": 0.3168, + "step": 78905 + }, + { + "epoch": 2.02, + "learning_rate": 5.071258836608811e-07, + "loss": 0.3306, + "step": 78906 + }, + { + "epoch": 2.02, + "learning_rate": 5.07101807770216e-07, + "loss": 0.5698, + "step": 78907 + }, + { + "epoch": 2.02, + "learning_rate": 5.070777322569402e-07, + "loss": 0.3492, + "step": 78908 + }, + { + "epoch": 2.02, + "learning_rate": 5.070536571210729e-07, + "loss": 0.3898, + "step": 78909 + }, + { + "epoch": 2.02, + "learning_rate": 5.070295823626313e-07, + "loss": 0.2341, + "step": 78910 + }, + { + "epoch": 2.02, + "learning_rate": 5.070055079816348e-07, + "loss": 0.4355, + "step": 78911 + }, + { + "epoch": 2.02, + "learning_rate": 5.069814339781016e-07, + "loss": 0.376, + "step": 78912 + }, + { + "epoch": 2.02, + "learning_rate": 5.069573603520499e-07, + "loss": 0.4229, + "step": 78913 + }, + { + "epoch": 2.02, + "learning_rate": 5.069332871034985e-07, + "loss": 0.3999, + "step": 78914 + }, + { + "epoch": 2.02, + "learning_rate": 5.069092142324654e-07, + "loss": 0.4849, + "step": 78915 + }, + { + "epoch": 2.02, + "learning_rate": 5.06885141738969e-07, + "loss": 0.3456, + "step": 78916 + }, + { + "epoch": 2.02, + "learning_rate": 5.068610696230282e-07, + "loss": 0.4375, + "step": 78917 + }, + { + "epoch": 2.02, + "learning_rate": 5.068369978846613e-07, + "loss": 0.3689, + "step": 78918 + }, + { + "epoch": 2.02, + "learning_rate": 5.068129265238865e-07, + "loss": 0.4668, + "step": 78919 + }, + { + "epoch": 2.02, + "learning_rate": 5.067888555407224e-07, + "loss": 0.3696, + "step": 78920 + }, + { + "epoch": 2.02, + "learning_rate": 5.067647849351873e-07, + "loss": 0.3425, + "step": 78921 + }, + { + "epoch": 2.02, + "learning_rate": 5.067407147073004e-07, + "loss": 0.1973, + "step": 78922 + }, + { + "epoch": 2.02, + "learning_rate": 5.067166448570787e-07, + "loss": 0.4653, + "step": 78923 + }, + { + "epoch": 2.02, + "learning_rate": 5.066925753845415e-07, + "loss": 0.3696, + "step": 78924 + }, + { + "epoch": 2.02, + "learning_rate": 5.066685062897071e-07, + "loss": 0.4639, + "step": 78925 + }, + { + "epoch": 2.02, + "learning_rate": 5.066444375725944e-07, + "loss": 0.4512, + "step": 78926 + }, + { + "epoch": 2.02, + "learning_rate": 5.066203692332208e-07, + "loss": 0.2832, + "step": 78927 + }, + { + "epoch": 2.02, + "learning_rate": 5.065963012716054e-07, + "loss": 0.4443, + "step": 78928 + }, + { + "epoch": 2.02, + "learning_rate": 5.065722336877665e-07, + "loss": 0.457, + "step": 78929 + }, + { + "epoch": 2.02, + "learning_rate": 5.06548166481723e-07, + "loss": 0.4673, + "step": 78930 + }, + { + "epoch": 2.02, + "learning_rate": 5.065240996534924e-07, + "loss": 0.4404, + "step": 78931 + }, + { + "epoch": 2.02, + "learning_rate": 5.06500033203094e-07, + "loss": 0.4766, + "step": 78932 + }, + { + "epoch": 2.02, + "learning_rate": 5.064759671305455e-07, + "loss": 0.4717, + "step": 78933 + }, + { + "epoch": 2.02, + "learning_rate": 5.064519014358657e-07, + "loss": 0.5659, + "step": 78934 + }, + { + "epoch": 2.02, + "learning_rate": 5.064278361190732e-07, + "loss": 0.4055, + "step": 78935 + }, + { + "epoch": 2.02, + "learning_rate": 5.06403771180186e-07, + "loss": 0.3042, + "step": 78936 + }, + { + "epoch": 2.02, + "learning_rate": 5.063797066192226e-07, + "loss": 0.4663, + "step": 78937 + }, + { + "epoch": 2.02, + "learning_rate": 5.063556424362017e-07, + "loss": 0.6147, + "step": 78938 + }, + { + "epoch": 2.02, + "learning_rate": 5.063315786311418e-07, + "loss": 0.3376, + "step": 78939 + }, + { + "epoch": 2.02, + "learning_rate": 5.063075152040608e-07, + "loss": 0.4375, + "step": 78940 + }, + { + "epoch": 2.02, + "learning_rate": 5.062834521549775e-07, + "loss": 0.4058, + "step": 78941 + }, + { + "epoch": 2.02, + "learning_rate": 5.062593894839107e-07, + "loss": 0.3818, + "step": 78942 + }, + { + "epoch": 2.02, + "learning_rate": 5.062353271908782e-07, + "loss": 0.582, + "step": 78943 + }, + { + "epoch": 2.02, + "learning_rate": 5.062112652758983e-07, + "loss": 0.4609, + "step": 78944 + }, + { + "epoch": 2.02, + "learning_rate": 5.061872037389898e-07, + "loss": 0.2859, + "step": 78945 + }, + { + "epoch": 2.02, + "learning_rate": 5.061631425801709e-07, + "loss": 0.4873, + "step": 78946 + }, + { + "epoch": 2.02, + "learning_rate": 5.061390817994606e-07, + "loss": 0.4277, + "step": 78947 + }, + { + "epoch": 2.02, + "learning_rate": 5.061150213968765e-07, + "loss": 0.304, + "step": 78948 + }, + { + "epoch": 2.02, + "learning_rate": 5.060909613724376e-07, + "loss": 0.4697, + "step": 78949 + }, + { + "epoch": 2.02, + "learning_rate": 5.060669017261621e-07, + "loss": 0.4414, + "step": 78950 + }, + { + "epoch": 2.02, + "learning_rate": 5.060428424580687e-07, + "loss": 0.4941, + "step": 78951 + }, + { + "epoch": 2.02, + "learning_rate": 5.060187835681756e-07, + "loss": 0.3302, + "step": 78952 + }, + { + "epoch": 2.02, + "learning_rate": 5.059947250565008e-07, + "loss": 0.3652, + "step": 78953 + }, + { + "epoch": 2.02, + "learning_rate": 5.059706669230633e-07, + "loss": 0.415, + "step": 78954 + }, + { + "epoch": 2.02, + "learning_rate": 5.059466091678813e-07, + "loss": 0.458, + "step": 78955 + }, + { + "epoch": 2.02, + "learning_rate": 5.059225517909735e-07, + "loss": 0.4507, + "step": 78956 + }, + { + "epoch": 2.02, + "learning_rate": 5.058984947923578e-07, + "loss": 0.4438, + "step": 78957 + }, + { + "epoch": 2.02, + "learning_rate": 5.058744381720528e-07, + "loss": 0.3712, + "step": 78958 + }, + { + "epoch": 2.02, + "learning_rate": 5.058503819300775e-07, + "loss": 0.5024, + "step": 78959 + }, + { + "epoch": 2.02, + "learning_rate": 5.058263260664495e-07, + "loss": 0.4299, + "step": 78960 + }, + { + "epoch": 2.02, + "learning_rate": 5.058022705811875e-07, + "loss": 0.5039, + "step": 78961 + }, + { + "epoch": 2.02, + "learning_rate": 5.057782154743104e-07, + "loss": 0.3682, + "step": 78962 + }, + { + "epoch": 2.02, + "learning_rate": 5.057541607458357e-07, + "loss": 0.4558, + "step": 78963 + }, + { + "epoch": 2.02, + "learning_rate": 5.057301063957828e-07, + "loss": 0.3867, + "step": 78964 + }, + { + "epoch": 2.02, + "learning_rate": 5.057060524241693e-07, + "loss": 0.343, + "step": 78965 + }, + { + "epoch": 2.02, + "learning_rate": 5.05681998831014e-07, + "loss": 0.3582, + "step": 78966 + }, + { + "epoch": 2.02, + "learning_rate": 5.056579456163351e-07, + "loss": 0.332, + "step": 78967 + }, + { + "epoch": 2.02, + "learning_rate": 5.056338927801515e-07, + "loss": 0.3464, + "step": 78968 + }, + { + "epoch": 2.02, + "learning_rate": 5.05609840322481e-07, + "loss": 0.478, + "step": 78969 + }, + { + "epoch": 2.02, + "learning_rate": 5.055857882433423e-07, + "loss": 0.457, + "step": 78970 + }, + { + "epoch": 2.02, + "learning_rate": 5.055617365427538e-07, + "loss": 0.271, + "step": 78971 + }, + { + "epoch": 2.02, + "learning_rate": 5.055376852207344e-07, + "loss": 0.3596, + "step": 78972 + }, + { + "epoch": 2.02, + "learning_rate": 5.05513634277302e-07, + "loss": 0.4907, + "step": 78973 + }, + { + "epoch": 2.02, + "learning_rate": 5.054895837124749e-07, + "loss": 0.498, + "step": 78974 + }, + { + "epoch": 2.02, + "learning_rate": 5.054655335262714e-07, + "loss": 0.3304, + "step": 78975 + }, + { + "epoch": 2.02, + "learning_rate": 5.054414837187107e-07, + "loss": 0.3896, + "step": 78976 + }, + { + "epoch": 2.02, + "learning_rate": 5.054174342898103e-07, + "loss": 0.3298, + "step": 78977 + }, + { + "epoch": 2.02, + "learning_rate": 5.053933852395891e-07, + "loss": 0.4609, + "step": 78978 + }, + { + "epoch": 2.02, + "learning_rate": 5.053693365680655e-07, + "loss": 0.4536, + "step": 78979 + }, + { + "epoch": 2.02, + "learning_rate": 5.05345288275258e-07, + "loss": 0.4386, + "step": 78980 + }, + { + "epoch": 2.02, + "learning_rate": 5.053212403611847e-07, + "loss": 0.4707, + "step": 78981 + }, + { + "epoch": 2.02, + "learning_rate": 5.052971928258645e-07, + "loss": 0.3291, + "step": 78982 + }, + { + "epoch": 2.02, + "learning_rate": 5.052731456693151e-07, + "loss": 0.4375, + "step": 78983 + }, + { + "epoch": 2.02, + "learning_rate": 5.052490988915553e-07, + "loss": 0.4438, + "step": 78984 + }, + { + "epoch": 2.02, + "learning_rate": 5.05225052492604e-07, + "loss": 0.3818, + "step": 78985 + }, + { + "epoch": 2.02, + "learning_rate": 5.052010064724786e-07, + "loss": 0.3734, + "step": 78986 + }, + { + "epoch": 2.02, + "learning_rate": 5.05176960831198e-07, + "loss": 0.4712, + "step": 78987 + }, + { + "epoch": 2.02, + "learning_rate": 5.051529155687809e-07, + "loss": 0.4756, + "step": 78988 + }, + { + "epoch": 2.02, + "learning_rate": 5.051288706852456e-07, + "loss": 0.4849, + "step": 78989 + }, + { + "epoch": 2.02, + "learning_rate": 5.051048261806101e-07, + "loss": 0.4468, + "step": 78990 + }, + { + "epoch": 2.02, + "learning_rate": 5.05080782054893e-07, + "loss": 0.3303, + "step": 78991 + }, + { + "epoch": 2.02, + "learning_rate": 5.050567383081132e-07, + "loss": 0.3616, + "step": 78992 + }, + { + "epoch": 2.02, + "learning_rate": 5.050326949402888e-07, + "loss": 0.3477, + "step": 78993 + }, + { + "epoch": 2.02, + "learning_rate": 5.050086519514376e-07, + "loss": 0.374, + "step": 78994 + }, + { + "epoch": 2.02, + "learning_rate": 5.049846093415785e-07, + "loss": 0.2576, + "step": 78995 + }, + { + "epoch": 2.02, + "learning_rate": 5.0496056711073e-07, + "loss": 0.3284, + "step": 78996 + }, + { + "epoch": 2.02, + "learning_rate": 5.049365252589107e-07, + "loss": 0.3496, + "step": 78997 + }, + { + "epoch": 2.02, + "learning_rate": 5.049124837861385e-07, + "loss": 0.4077, + "step": 78998 + }, + { + "epoch": 2.02, + "learning_rate": 5.04888442692432e-07, + "loss": 0.5166, + "step": 78999 + }, + { + "epoch": 2.02, + "learning_rate": 5.048644019778097e-07, + "loss": 0.3438, + "step": 79000 + }, + { + "epoch": 2.02, + "learning_rate": 5.048403616422903e-07, + "loss": 0.3669, + "step": 79001 + }, + { + "epoch": 2.02, + "learning_rate": 5.048163216858917e-07, + "loss": 0.3625, + "step": 79002 + }, + { + "epoch": 2.02, + "learning_rate": 5.047922821086324e-07, + "loss": 0.2671, + "step": 79003 + }, + { + "epoch": 2.02, + "learning_rate": 5.047682429105307e-07, + "loss": 0.4878, + "step": 79004 + }, + { + "epoch": 2.02, + "learning_rate": 5.047442040916051e-07, + "loss": 0.4346, + "step": 79005 + }, + { + "epoch": 2.02, + "learning_rate": 5.047201656518745e-07, + "loss": 0.4517, + "step": 79006 + }, + { + "epoch": 2.02, + "learning_rate": 5.046961275913566e-07, + "loss": 0.4282, + "step": 79007 + }, + { + "epoch": 2.03, + "learning_rate": 5.046720899100702e-07, + "loss": 0.4263, + "step": 79008 + }, + { + "epoch": 2.03, + "learning_rate": 5.046480526080334e-07, + "loss": 0.4771, + "step": 79009 + }, + { + "epoch": 2.03, + "learning_rate": 5.046240156852654e-07, + "loss": 0.4856, + "step": 79010 + }, + { + "epoch": 2.03, + "learning_rate": 5.045999791417834e-07, + "loss": 0.4297, + "step": 79011 + }, + { + "epoch": 2.03, + "learning_rate": 5.045759429776071e-07, + "loss": 0.418, + "step": 79012 + }, + { + "epoch": 2.03, + "learning_rate": 5.045519071927535e-07, + "loss": 0.3604, + "step": 79013 + }, + { + "epoch": 2.03, + "learning_rate": 5.045278717872424e-07, + "loss": 0.2759, + "step": 79014 + }, + { + "epoch": 2.03, + "learning_rate": 5.04503836761091e-07, + "loss": 0.4966, + "step": 79015 + }, + { + "epoch": 2.03, + "learning_rate": 5.044798021143182e-07, + "loss": 0.4038, + "step": 79016 + }, + { + "epoch": 2.03, + "learning_rate": 5.044557678469425e-07, + "loss": 0.4248, + "step": 79017 + }, + { + "epoch": 2.03, + "learning_rate": 5.044317339589825e-07, + "loss": 0.4478, + "step": 79018 + }, + { + "epoch": 2.03, + "learning_rate": 5.044077004504561e-07, + "loss": 0.3789, + "step": 79019 + }, + { + "epoch": 2.03, + "learning_rate": 5.043836673213818e-07, + "loss": 0.3716, + "step": 79020 + }, + { + "epoch": 2.03, + "learning_rate": 5.043596345717783e-07, + "loss": 0.2028, + "step": 79021 + }, + { + "epoch": 2.03, + "learning_rate": 5.04335602201664e-07, + "loss": 0.3611, + "step": 79022 + }, + { + "epoch": 2.03, + "learning_rate": 5.043115702110573e-07, + "loss": 0.4893, + "step": 79023 + }, + { + "epoch": 2.03, + "learning_rate": 5.042875385999761e-07, + "loss": 0.5254, + "step": 79024 + }, + { + "epoch": 2.03, + "learning_rate": 5.04263507368439e-07, + "loss": 0.2472, + "step": 79025 + }, + { + "epoch": 2.03, + "learning_rate": 5.042394765164646e-07, + "loss": 0.4561, + "step": 79026 + }, + { + "epoch": 2.03, + "learning_rate": 5.042154460440716e-07, + "loss": 0.3608, + "step": 79027 + }, + { + "epoch": 2.03, + "learning_rate": 5.041914159512777e-07, + "loss": 0.436, + "step": 79028 + }, + { + "epoch": 2.03, + "learning_rate": 5.041673862381015e-07, + "loss": 0.4047, + "step": 79029 + }, + { + "epoch": 2.03, + "learning_rate": 5.041433569045621e-07, + "loss": 0.4951, + "step": 79030 + }, + { + "epoch": 2.03, + "learning_rate": 5.041193279506769e-07, + "loss": 0.3745, + "step": 79031 + }, + { + "epoch": 2.03, + "learning_rate": 5.040952993764651e-07, + "loss": 0.3303, + "step": 79032 + }, + { + "epoch": 2.03, + "learning_rate": 5.040712711819444e-07, + "loss": 0.4448, + "step": 79033 + }, + { + "epoch": 2.03, + "learning_rate": 5.040472433671333e-07, + "loss": 0.3965, + "step": 79034 + }, + { + "epoch": 2.03, + "learning_rate": 5.04023215932051e-07, + "loss": 0.3069, + "step": 79035 + }, + { + "epoch": 2.03, + "learning_rate": 5.039991888767149e-07, + "loss": 0.457, + "step": 79036 + }, + { + "epoch": 2.03, + "learning_rate": 5.039751622011438e-07, + "loss": 0.498, + "step": 79037 + }, + { + "epoch": 2.03, + "learning_rate": 5.039511359053561e-07, + "loss": 0.4135, + "step": 79038 + }, + { + "epoch": 2.03, + "learning_rate": 5.039271099893706e-07, + "loss": 0.2627, + "step": 79039 + }, + { + "epoch": 2.03, + "learning_rate": 5.03903084453205e-07, + "loss": 0.4775, + "step": 79040 + }, + { + "epoch": 2.03, + "learning_rate": 5.038790592968778e-07, + "loss": 0.3792, + "step": 79041 + }, + { + "epoch": 2.03, + "learning_rate": 5.038550345204083e-07, + "loss": 0.3804, + "step": 79042 + }, + { + "epoch": 2.03, + "learning_rate": 5.038310101238134e-07, + "loss": 0.3402, + "step": 79043 + }, + { + "epoch": 2.03, + "learning_rate": 5.038069861071129e-07, + "loss": 0.3284, + "step": 79044 + }, + { + "epoch": 2.03, + "learning_rate": 5.037829624703241e-07, + "loss": 0.4028, + "step": 79045 + }, + { + "epoch": 2.03, + "learning_rate": 5.03758939213466e-07, + "loss": 0.3549, + "step": 79046 + }, + { + "epoch": 2.03, + "learning_rate": 5.037349163365572e-07, + "loss": 0.5415, + "step": 79047 + }, + { + "epoch": 2.03, + "learning_rate": 5.037108938396153e-07, + "loss": 0.4185, + "step": 79048 + }, + { + "epoch": 2.03, + "learning_rate": 5.036868717226592e-07, + "loss": 0.321, + "step": 79049 + }, + { + "epoch": 2.03, + "learning_rate": 5.036628499857072e-07, + "loss": 0.2151, + "step": 79050 + }, + { + "epoch": 2.03, + "learning_rate": 5.036388286287781e-07, + "loss": 0.2374, + "step": 79051 + }, + { + "epoch": 2.03, + "learning_rate": 5.0361480765189e-07, + "loss": 0.4141, + "step": 79052 + }, + { + "epoch": 2.03, + "learning_rate": 5.035907870550608e-07, + "loss": 0.3271, + "step": 79053 + }, + { + "epoch": 2.03, + "learning_rate": 5.035667668383094e-07, + "loss": 0.5183, + "step": 79054 + }, + { + "epoch": 2.03, + "learning_rate": 5.03542747001654e-07, + "loss": 0.4272, + "step": 79055 + }, + { + "epoch": 2.03, + "learning_rate": 5.035187275451134e-07, + "loss": 0.2955, + "step": 79056 + }, + { + "epoch": 2.03, + "learning_rate": 5.034947084687055e-07, + "loss": 0.4487, + "step": 79057 + }, + { + "epoch": 2.03, + "learning_rate": 5.034706897724487e-07, + "loss": 0.3737, + "step": 79058 + }, + { + "epoch": 2.03, + "learning_rate": 5.034466714563617e-07, + "loss": 0.3623, + "step": 79059 + }, + { + "epoch": 2.03, + "learning_rate": 5.034226535204631e-07, + "loss": 0.5151, + "step": 79060 + }, + { + "epoch": 2.03, + "learning_rate": 5.033986359647704e-07, + "loss": 0.4712, + "step": 79061 + }, + { + "epoch": 2.03, + "learning_rate": 5.033746187893031e-07, + "loss": 0.4595, + "step": 79062 + }, + { + "epoch": 2.03, + "learning_rate": 5.033506019940785e-07, + "loss": 0.374, + "step": 79063 + }, + { + "epoch": 2.03, + "learning_rate": 5.03326585579116e-07, + "loss": 0.5049, + "step": 79064 + }, + { + "epoch": 2.03, + "learning_rate": 5.033025695444331e-07, + "loss": 0.402, + "step": 79065 + }, + { + "epoch": 2.03, + "learning_rate": 5.032785538900486e-07, + "loss": 0.3306, + "step": 79066 + }, + { + "epoch": 2.03, + "learning_rate": 5.032545386159807e-07, + "loss": 0.3538, + "step": 79067 + }, + { + "epoch": 2.03, + "learning_rate": 5.032305237222485e-07, + "loss": 0.4128, + "step": 79068 + }, + { + "epoch": 2.03, + "learning_rate": 5.032065092088694e-07, + "loss": 0.3789, + "step": 79069 + }, + { + "epoch": 2.03, + "learning_rate": 5.031824950758623e-07, + "loss": 0.3569, + "step": 79070 + }, + { + "epoch": 2.03, + "learning_rate": 5.031584813232454e-07, + "loss": 0.4541, + "step": 79071 + }, + { + "epoch": 2.03, + "learning_rate": 5.031344679510378e-07, + "loss": 0.5137, + "step": 79072 + }, + { + "epoch": 2.03, + "learning_rate": 5.031104549592571e-07, + "loss": 0.3862, + "step": 79073 + }, + { + "epoch": 2.03, + "learning_rate": 5.030864423479215e-07, + "loss": 0.4658, + "step": 79074 + }, + { + "epoch": 2.03, + "learning_rate": 5.030624301170499e-07, + "loss": 0.2529, + "step": 79075 + }, + { + "epoch": 2.03, + "learning_rate": 5.030384182666605e-07, + "loss": 0.4187, + "step": 79076 + }, + { + "epoch": 2.03, + "learning_rate": 5.03014406796772e-07, + "loss": 0.3853, + "step": 79077 + }, + { + "epoch": 2.03, + "learning_rate": 5.029903957074022e-07, + "loss": 0.3457, + "step": 79078 + }, + { + "epoch": 2.03, + "learning_rate": 5.029663849985699e-07, + "loss": 0.3654, + "step": 79079 + }, + { + "epoch": 2.03, + "learning_rate": 5.029423746702932e-07, + "loss": 0.4136, + "step": 79080 + }, + { + "epoch": 2.03, + "learning_rate": 5.029183647225912e-07, + "loss": 0.4873, + "step": 79081 + }, + { + "epoch": 2.03, + "learning_rate": 5.028943551554816e-07, + "loss": 0.4551, + "step": 79082 + }, + { + "epoch": 2.03, + "learning_rate": 5.028703459689827e-07, + "loss": 0.3755, + "step": 79083 + }, + { + "epoch": 2.03, + "learning_rate": 5.028463371631131e-07, + "loss": 0.5171, + "step": 79084 + }, + { + "epoch": 2.03, + "learning_rate": 5.028223287378916e-07, + "loss": 0.5884, + "step": 79085 + }, + { + "epoch": 2.03, + "learning_rate": 5.027983206933358e-07, + "loss": 0.4453, + "step": 79086 + }, + { + "epoch": 2.03, + "learning_rate": 5.027743130294643e-07, + "loss": 0.4946, + "step": 79087 + }, + { + "epoch": 2.03, + "learning_rate": 5.027503057462959e-07, + "loss": 0.5732, + "step": 79088 + }, + { + "epoch": 2.03, + "learning_rate": 5.027262988438489e-07, + "loss": 0.4272, + "step": 79089 + }, + { + "epoch": 2.03, + "learning_rate": 5.027022923221412e-07, + "loss": 0.3983, + "step": 79090 + }, + { + "epoch": 2.03, + "learning_rate": 5.026782861811914e-07, + "loss": 0.3595, + "step": 79091 + }, + { + "epoch": 2.03, + "learning_rate": 5.026542804210185e-07, + "loss": 0.4224, + "step": 79092 + }, + { + "epoch": 2.03, + "learning_rate": 5.026302750416399e-07, + "loss": 0.5059, + "step": 79093 + }, + { + "epoch": 2.03, + "learning_rate": 5.026062700430748e-07, + "loss": 0.4849, + "step": 79094 + }, + { + "epoch": 2.03, + "learning_rate": 5.025822654253409e-07, + "loss": 0.3867, + "step": 79095 + }, + { + "epoch": 2.03, + "learning_rate": 5.025582611884567e-07, + "loss": 0.4064, + "step": 79096 + }, + { + "epoch": 2.03, + "learning_rate": 5.02534257332441e-07, + "loss": 0.355, + "step": 79097 + }, + { + "epoch": 2.03, + "learning_rate": 5.025102538573123e-07, + "loss": 0.4854, + "step": 79098 + }, + { + "epoch": 2.03, + "learning_rate": 5.02486250763088e-07, + "loss": 0.4692, + "step": 79099 + }, + { + "epoch": 2.03, + "learning_rate": 5.024622480497873e-07, + "loss": 0.438, + "step": 79100 + }, + { + "epoch": 2.03, + "learning_rate": 5.024382457174283e-07, + "loss": 0.4653, + "step": 79101 + }, + { + "epoch": 2.03, + "learning_rate": 5.024142437660304e-07, + "loss": 0.4001, + "step": 79102 + }, + { + "epoch": 2.03, + "learning_rate": 5.023902421956101e-07, + "loss": 0.4214, + "step": 79103 + }, + { + "epoch": 2.03, + "learning_rate": 5.023662410061866e-07, + "loss": 0.4143, + "step": 79104 + }, + { + "epoch": 2.03, + "learning_rate": 5.023422401977785e-07, + "loss": 0.3359, + "step": 79105 + }, + { + "epoch": 2.03, + "learning_rate": 5.023182397704047e-07, + "loss": 0.5044, + "step": 79106 + }, + { + "epoch": 2.03, + "learning_rate": 5.022942397240822e-07, + "loss": 0.3821, + "step": 79107 + }, + { + "epoch": 2.03, + "learning_rate": 5.022702400588303e-07, + "loss": 0.3687, + "step": 79108 + }, + { + "epoch": 2.03, + "learning_rate": 5.022462407746672e-07, + "loss": 0.4868, + "step": 79109 + }, + { + "epoch": 2.03, + "learning_rate": 5.022222418716116e-07, + "loss": 0.4521, + "step": 79110 + }, + { + "epoch": 2.03, + "learning_rate": 5.02198243349681e-07, + "loss": 0.6328, + "step": 79111 + }, + { + "epoch": 2.03, + "learning_rate": 5.021742452088949e-07, + "loss": 0.3298, + "step": 79112 + }, + { + "epoch": 2.03, + "learning_rate": 5.021502474492707e-07, + "loss": 0.4658, + "step": 79113 + }, + { + "epoch": 2.03, + "learning_rate": 5.021262500708271e-07, + "loss": 0.3872, + "step": 79114 + }, + { + "epoch": 2.03, + "learning_rate": 5.02102253073583e-07, + "loss": 0.455, + "step": 79115 + }, + { + "epoch": 2.03, + "learning_rate": 5.020782564575559e-07, + "loss": 0.4697, + "step": 79116 + }, + { + "epoch": 2.03, + "learning_rate": 5.020542602227644e-07, + "loss": 0.3115, + "step": 79117 + }, + { + "epoch": 2.03, + "learning_rate": 5.020302643692274e-07, + "loss": 0.4878, + "step": 79118 + }, + { + "epoch": 2.03, + "learning_rate": 5.020062688969631e-07, + "loss": 0.4458, + "step": 79119 + }, + { + "epoch": 2.03, + "learning_rate": 5.019822738059892e-07, + "loss": 0.4146, + "step": 79120 + }, + { + "epoch": 2.03, + "learning_rate": 5.019582790963248e-07, + "loss": 0.4521, + "step": 79121 + }, + { + "epoch": 2.03, + "learning_rate": 5.019342847679882e-07, + "loss": 0.4663, + "step": 79122 + }, + { + "epoch": 2.03, + "learning_rate": 5.019102908209978e-07, + "loss": 0.2958, + "step": 79123 + }, + { + "epoch": 2.03, + "learning_rate": 5.018862972553715e-07, + "loss": 0.4561, + "step": 79124 + }, + { + "epoch": 2.03, + "learning_rate": 5.018623040711278e-07, + "loss": 0.4473, + "step": 79125 + }, + { + "epoch": 2.03, + "learning_rate": 5.018383112682852e-07, + "loss": 0.4326, + "step": 79126 + }, + { + "epoch": 2.03, + "learning_rate": 5.018143188468625e-07, + "loss": 0.6157, + "step": 79127 + }, + { + "epoch": 2.03, + "learning_rate": 5.017903268068773e-07, + "loss": 0.2894, + "step": 79128 + }, + { + "epoch": 2.03, + "learning_rate": 5.017663351483484e-07, + "loss": 0.4036, + "step": 79129 + }, + { + "epoch": 2.03, + "learning_rate": 5.01742343871294e-07, + "loss": 0.3962, + "step": 79130 + }, + { + "epoch": 2.03, + "learning_rate": 5.01718352975733e-07, + "loss": 0.3538, + "step": 79131 + }, + { + "epoch": 2.03, + "learning_rate": 5.016943624616834e-07, + "loss": 0.4863, + "step": 79132 + }, + { + "epoch": 2.03, + "learning_rate": 5.016703723291631e-07, + "loss": 0.4468, + "step": 79133 + }, + { + "epoch": 2.03, + "learning_rate": 5.016463825781909e-07, + "loss": 0.4478, + "step": 79134 + }, + { + "epoch": 2.03, + "learning_rate": 5.016223932087851e-07, + "loss": 0.4287, + "step": 79135 + }, + { + "epoch": 2.03, + "learning_rate": 5.015984042209646e-07, + "loss": 0.3638, + "step": 79136 + }, + { + "epoch": 2.03, + "learning_rate": 5.015744156147468e-07, + "loss": 0.3286, + "step": 79137 + }, + { + "epoch": 2.03, + "learning_rate": 5.015504273901505e-07, + "loss": 0.5166, + "step": 79138 + }, + { + "epoch": 2.03, + "learning_rate": 5.015264395471948e-07, + "loss": 0.3276, + "step": 79139 + }, + { + "epoch": 2.03, + "learning_rate": 5.015024520858967e-07, + "loss": 0.3345, + "step": 79140 + }, + { + "epoch": 2.03, + "learning_rate": 5.014784650062754e-07, + "loss": 0.522, + "step": 79141 + }, + { + "epoch": 2.03, + "learning_rate": 5.014544783083495e-07, + "loss": 0.4268, + "step": 79142 + }, + { + "epoch": 2.03, + "learning_rate": 5.014304919921364e-07, + "loss": 0.5234, + "step": 79143 + }, + { + "epoch": 2.03, + "learning_rate": 5.014065060576556e-07, + "loss": 0.4434, + "step": 79144 + }, + { + "epoch": 2.03, + "learning_rate": 5.013825205049245e-07, + "loss": 0.5146, + "step": 79145 + }, + { + "epoch": 2.03, + "learning_rate": 5.013585353339618e-07, + "loss": 0.4668, + "step": 79146 + }, + { + "epoch": 2.03, + "learning_rate": 5.013345505447861e-07, + "loss": 0.4653, + "step": 79147 + }, + { + "epoch": 2.03, + "learning_rate": 5.013105661374158e-07, + "loss": 0.3975, + "step": 79148 + }, + { + "epoch": 2.03, + "learning_rate": 5.012865821118688e-07, + "loss": 0.4414, + "step": 79149 + }, + { + "epoch": 2.03, + "learning_rate": 5.012625984681637e-07, + "loss": 0.3687, + "step": 79150 + }, + { + "epoch": 2.03, + "learning_rate": 5.012386152063191e-07, + "loss": 0.4148, + "step": 79151 + }, + { + "epoch": 2.03, + "learning_rate": 5.012146323263533e-07, + "loss": 0.4526, + "step": 79152 + }, + { + "epoch": 2.03, + "learning_rate": 5.011906498282845e-07, + "loss": 0.3459, + "step": 79153 + }, + { + "epoch": 2.03, + "learning_rate": 5.011666677121309e-07, + "loss": 0.4026, + "step": 79154 + }, + { + "epoch": 2.03, + "learning_rate": 5.011426859779109e-07, + "loss": 0.4116, + "step": 79155 + }, + { + "epoch": 2.03, + "learning_rate": 5.011187046256434e-07, + "loss": 0.302, + "step": 79156 + }, + { + "epoch": 2.03, + "learning_rate": 5.01094723655346e-07, + "loss": 0.3964, + "step": 79157 + }, + { + "epoch": 2.03, + "learning_rate": 5.010707430670374e-07, + "loss": 0.5586, + "step": 79158 + }, + { + "epoch": 2.03, + "learning_rate": 5.01046762860736e-07, + "loss": 0.4214, + "step": 79159 + }, + { + "epoch": 2.03, + "learning_rate": 5.010227830364606e-07, + "loss": 0.3301, + "step": 79160 + }, + { + "epoch": 2.03, + "learning_rate": 5.009988035942287e-07, + "loss": 0.4521, + "step": 79161 + }, + { + "epoch": 2.03, + "learning_rate": 5.009748245340595e-07, + "loss": 0.4506, + "step": 79162 + }, + { + "epoch": 2.03, + "learning_rate": 5.009508458559704e-07, + "loss": 0.418, + "step": 79163 + }, + { + "epoch": 2.03, + "learning_rate": 5.009268675599804e-07, + "loss": 0.3616, + "step": 79164 + }, + { + "epoch": 2.03, + "learning_rate": 5.009028896461081e-07, + "loss": 0.4138, + "step": 79165 + }, + { + "epoch": 2.03, + "learning_rate": 5.00878912114371e-07, + "loss": 0.4424, + "step": 79166 + }, + { + "epoch": 2.03, + "learning_rate": 5.008549349647883e-07, + "loss": 0.498, + "step": 79167 + }, + { + "epoch": 2.03, + "learning_rate": 5.008309581973777e-07, + "loss": 0.4473, + "step": 79168 + }, + { + "epoch": 2.03, + "learning_rate": 5.008069818121585e-07, + "loss": 0.4922, + "step": 79169 + }, + { + "epoch": 2.03, + "learning_rate": 5.007830058091479e-07, + "loss": 0.4976, + "step": 79170 + }, + { + "epoch": 2.03, + "learning_rate": 5.007590301883648e-07, + "loss": 0.5117, + "step": 79171 + }, + { + "epoch": 2.03, + "learning_rate": 5.00735054949828e-07, + "loss": 0.415, + "step": 79172 + }, + { + "epoch": 2.03, + "learning_rate": 5.007110800935554e-07, + "loss": 0.5625, + "step": 79173 + }, + { + "epoch": 2.03, + "learning_rate": 5.006871056195651e-07, + "loss": 0.4272, + "step": 79174 + }, + { + "epoch": 2.03, + "learning_rate": 5.006631315278755e-07, + "loss": 0.2542, + "step": 79175 + }, + { + "epoch": 2.03, + "learning_rate": 5.006391578185054e-07, + "loss": 0.4712, + "step": 79176 + }, + { + "epoch": 2.03, + "learning_rate": 5.006151844914732e-07, + "loss": 0.3774, + "step": 79177 + }, + { + "epoch": 2.03, + "learning_rate": 5.005912115467965e-07, + "loss": 0.4165, + "step": 79178 + }, + { + "epoch": 2.03, + "learning_rate": 5.005672389844944e-07, + "loss": 0.3528, + "step": 79179 + }, + { + "epoch": 2.03, + "learning_rate": 5.005432668045848e-07, + "loss": 0.3735, + "step": 79180 + }, + { + "epoch": 2.03, + "learning_rate": 5.005192950070867e-07, + "loss": 0.5107, + "step": 79181 + }, + { + "epoch": 2.03, + "learning_rate": 5.00495323592018e-07, + "loss": 0.2869, + "step": 79182 + }, + { + "epoch": 2.03, + "learning_rate": 5.004713525593966e-07, + "loss": 0.4355, + "step": 79183 + }, + { + "epoch": 2.03, + "learning_rate": 5.004473819092415e-07, + "loss": 0.3921, + "step": 79184 + }, + { + "epoch": 2.03, + "learning_rate": 5.004234116415708e-07, + "loss": 0.3604, + "step": 79185 + }, + { + "epoch": 2.03, + "learning_rate": 5.003994417564033e-07, + "loss": 0.4033, + "step": 79186 + }, + { + "epoch": 2.03, + "learning_rate": 5.003754722537565e-07, + "loss": 0.3154, + "step": 79187 + }, + { + "epoch": 2.03, + "learning_rate": 5.003515031336494e-07, + "loss": 0.3562, + "step": 79188 + }, + { + "epoch": 2.03, + "learning_rate": 5.003275343961e-07, + "loss": 0.3195, + "step": 79189 + }, + { + "epoch": 2.03, + "learning_rate": 5.003035660411274e-07, + "loss": 0.2976, + "step": 79190 + }, + { + "epoch": 2.03, + "learning_rate": 5.002795980687489e-07, + "loss": 0.395, + "step": 79191 + }, + { + "epoch": 2.03, + "learning_rate": 5.002556304789836e-07, + "loss": 0.5532, + "step": 79192 + }, + { + "epoch": 2.03, + "learning_rate": 5.002316632718493e-07, + "loss": 0.4424, + "step": 79193 + }, + { + "epoch": 2.03, + "learning_rate": 5.002076964473652e-07, + "loss": 0.3875, + "step": 79194 + }, + { + "epoch": 2.03, + "learning_rate": 5.001837300055484e-07, + "loss": 0.314, + "step": 79195 + }, + { + "epoch": 2.03, + "learning_rate": 5.001597639464181e-07, + "loss": 0.5049, + "step": 79196 + }, + { + "epoch": 2.03, + "learning_rate": 5.001357982699925e-07, + "loss": 0.4302, + "step": 79197 + }, + { + "epoch": 2.03, + "learning_rate": 5.001118329762902e-07, + "loss": 0.4258, + "step": 79198 + }, + { + "epoch": 2.03, + "learning_rate": 5.00087868065329e-07, + "loss": 0.4404, + "step": 79199 + }, + { + "epoch": 2.03, + "learning_rate": 5.000639035371274e-07, + "loss": 0.4424, + "step": 79200 + }, + { + "epoch": 2.03, + "learning_rate": 5.00039939391704e-07, + "loss": 0.3699, + "step": 79201 + }, + { + "epoch": 2.03, + "learning_rate": 5.000159756290775e-07, + "loss": 0.4722, + "step": 79202 + }, + { + "epoch": 2.03, + "learning_rate": 4.999920122492657e-07, + "loss": 0.478, + "step": 79203 + }, + { + "epoch": 2.03, + "learning_rate": 4.999680492522867e-07, + "loss": 0.2145, + "step": 79204 + }, + { + "epoch": 2.03, + "learning_rate": 4.99944086638159e-07, + "loss": 0.5137, + "step": 79205 + }, + { + "epoch": 2.03, + "learning_rate": 4.999201244069012e-07, + "loss": 0.4175, + "step": 79206 + }, + { + "epoch": 2.03, + "learning_rate": 4.99896162558532e-07, + "loss": 0.2743, + "step": 79207 + }, + { + "epoch": 2.03, + "learning_rate": 4.998722010930688e-07, + "loss": 0.3722, + "step": 79208 + }, + { + "epoch": 2.03, + "learning_rate": 4.998482400105306e-07, + "loss": 0.3262, + "step": 79209 + }, + { + "epoch": 2.03, + "learning_rate": 4.99824279310936e-07, + "loss": 0.4075, + "step": 79210 + }, + { + "epoch": 2.03, + "learning_rate": 4.998003189943028e-07, + "loss": 0.3931, + "step": 79211 + }, + { + "epoch": 2.03, + "learning_rate": 4.997763590606493e-07, + "loss": 0.4312, + "step": 79212 + }, + { + "epoch": 2.03, + "learning_rate": 4.99752399509994e-07, + "loss": 0.2446, + "step": 79213 + }, + { + "epoch": 2.03, + "learning_rate": 4.997284403423551e-07, + "loss": 0.4111, + "step": 79214 + }, + { + "epoch": 2.03, + "learning_rate": 4.997044815577517e-07, + "loss": 0.4424, + "step": 79215 + }, + { + "epoch": 2.03, + "learning_rate": 4.996805231562012e-07, + "loss": 0.4238, + "step": 79216 + }, + { + "epoch": 2.03, + "learning_rate": 4.996565651377221e-07, + "loss": 0.3296, + "step": 79217 + }, + { + "epoch": 2.03, + "learning_rate": 4.996326075023332e-07, + "loss": 0.4199, + "step": 79218 + }, + { + "epoch": 2.03, + "learning_rate": 4.996086502500529e-07, + "loss": 0.3354, + "step": 79219 + }, + { + "epoch": 2.03, + "learning_rate": 4.995846933808989e-07, + "loss": 0.3339, + "step": 79220 + }, + { + "epoch": 2.03, + "learning_rate": 4.995607368948902e-07, + "loss": 0.279, + "step": 79221 + }, + { + "epoch": 2.03, + "learning_rate": 4.995367807920446e-07, + "loss": 0.4673, + "step": 79222 + }, + { + "epoch": 2.03, + "learning_rate": 4.995128250723804e-07, + "loss": 0.4097, + "step": 79223 + }, + { + "epoch": 2.03, + "learning_rate": 4.994888697359168e-07, + "loss": 0.4795, + "step": 79224 + }, + { + "epoch": 2.03, + "learning_rate": 4.994649147826712e-07, + "loss": 0.4893, + "step": 79225 + }, + { + "epoch": 2.03, + "learning_rate": 4.994409602126622e-07, + "loss": 0.4434, + "step": 79226 + }, + { + "epoch": 2.03, + "learning_rate": 4.994170060259086e-07, + "loss": 0.3901, + "step": 79227 + }, + { + "epoch": 2.03, + "learning_rate": 4.993930522224281e-07, + "loss": 0.5073, + "step": 79228 + }, + { + "epoch": 2.03, + "learning_rate": 4.993690988022394e-07, + "loss": 0.3535, + "step": 79229 + }, + { + "epoch": 2.03, + "learning_rate": 4.993451457653605e-07, + "loss": 0.2915, + "step": 79230 + }, + { + "epoch": 2.03, + "learning_rate": 4.993211931118106e-07, + "loss": 0.4878, + "step": 79231 + }, + { + "epoch": 2.03, + "learning_rate": 4.992972408416074e-07, + "loss": 0.4561, + "step": 79232 + }, + { + "epoch": 2.03, + "learning_rate": 4.992732889547689e-07, + "loss": 0.5068, + "step": 79233 + }, + { + "epoch": 2.03, + "learning_rate": 4.992493374513137e-07, + "loss": 0.4883, + "step": 79234 + }, + { + "epoch": 2.03, + "learning_rate": 4.992253863312604e-07, + "loss": 0.4814, + "step": 79235 + }, + { + "epoch": 2.03, + "learning_rate": 4.992014355946274e-07, + "loss": 0.4819, + "step": 79236 + }, + { + "epoch": 2.03, + "learning_rate": 4.991774852414326e-07, + "loss": 0.4122, + "step": 79237 + }, + { + "epoch": 2.03, + "learning_rate": 4.991535352716945e-07, + "loss": 0.3584, + "step": 79238 + }, + { + "epoch": 2.03, + "learning_rate": 4.991295856854316e-07, + "loss": 0.4766, + "step": 79239 + }, + { + "epoch": 2.03, + "learning_rate": 4.991056364826626e-07, + "loss": 0.564, + "step": 79240 + }, + { + "epoch": 2.03, + "learning_rate": 4.990816876634052e-07, + "loss": 0.4985, + "step": 79241 + }, + { + "epoch": 2.03, + "learning_rate": 4.990577392276776e-07, + "loss": 0.3413, + "step": 79242 + }, + { + "epoch": 2.03, + "learning_rate": 4.990337911754985e-07, + "loss": 0.4194, + "step": 79243 + }, + { + "epoch": 2.03, + "learning_rate": 4.990098435068861e-07, + "loss": 0.3704, + "step": 79244 + }, + { + "epoch": 2.03, + "learning_rate": 4.989858962218593e-07, + "loss": 0.5371, + "step": 79245 + }, + { + "epoch": 2.03, + "learning_rate": 4.989619493204355e-07, + "loss": 0.395, + "step": 79246 + }, + { + "epoch": 2.03, + "learning_rate": 4.989380028026335e-07, + "loss": 0.3823, + "step": 79247 + }, + { + "epoch": 2.03, + "learning_rate": 4.989140566684721e-07, + "loss": 0.2991, + "step": 79248 + }, + { + "epoch": 2.03, + "learning_rate": 4.988901109179687e-07, + "loss": 0.4409, + "step": 79249 + }, + { + "epoch": 2.03, + "learning_rate": 4.988661655511422e-07, + "loss": 0.3828, + "step": 79250 + }, + { + "epoch": 2.03, + "learning_rate": 4.98842220568011e-07, + "loss": 0.4902, + "step": 79251 + }, + { + "epoch": 2.03, + "learning_rate": 4.988182759685932e-07, + "loss": 0.3936, + "step": 79252 + }, + { + "epoch": 2.03, + "learning_rate": 4.987943317529073e-07, + "loss": 0.3853, + "step": 79253 + }, + { + "epoch": 2.03, + "learning_rate": 4.987703879209712e-07, + "loss": 0.2297, + "step": 79254 + }, + { + "epoch": 2.03, + "learning_rate": 4.987464444728037e-07, + "loss": 0.4536, + "step": 79255 + }, + { + "epoch": 2.03, + "learning_rate": 4.98722501408423e-07, + "loss": 0.4269, + "step": 79256 + }, + { + "epoch": 2.03, + "learning_rate": 4.986985587278477e-07, + "loss": 0.4233, + "step": 79257 + }, + { + "epoch": 2.03, + "learning_rate": 4.986746164310955e-07, + "loss": 0.458, + "step": 79258 + }, + { + "epoch": 2.03, + "learning_rate": 4.986506745181852e-07, + "loss": 0.54, + "step": 79259 + }, + { + "epoch": 2.03, + "learning_rate": 4.98626732989135e-07, + "loss": 0.4937, + "step": 79260 + }, + { + "epoch": 2.03, + "learning_rate": 4.986027918439634e-07, + "loss": 0.4976, + "step": 79261 + }, + { + "epoch": 2.03, + "learning_rate": 4.98578851082689e-07, + "loss": 0.4404, + "step": 79262 + }, + { + "epoch": 2.03, + "learning_rate": 4.98554910705329e-07, + "loss": 0.3605, + "step": 79263 + }, + { + "epoch": 2.03, + "learning_rate": 4.985309707119026e-07, + "loss": 0.2917, + "step": 79264 + }, + { + "epoch": 2.03, + "learning_rate": 4.985070311024283e-07, + "loss": 0.3784, + "step": 79265 + }, + { + "epoch": 2.03, + "learning_rate": 4.984830918769237e-07, + "loss": 0.418, + "step": 79266 + }, + { + "epoch": 2.03, + "learning_rate": 4.984591530354076e-07, + "loss": 0.4404, + "step": 79267 + }, + { + "epoch": 2.03, + "learning_rate": 4.984352145778983e-07, + "loss": 0.481, + "step": 79268 + }, + { + "epoch": 2.03, + "learning_rate": 4.984112765044144e-07, + "loss": 0.3794, + "step": 79269 + }, + { + "epoch": 2.03, + "learning_rate": 4.983873388149735e-07, + "loss": 0.3821, + "step": 79270 + }, + { + "epoch": 2.03, + "learning_rate": 4.983634015095948e-07, + "loss": 0.4136, + "step": 79271 + }, + { + "epoch": 2.03, + "learning_rate": 4.983394645882958e-07, + "loss": 0.421, + "step": 79272 + }, + { + "epoch": 2.03, + "learning_rate": 4.983155280510952e-07, + "loss": 0.3586, + "step": 79273 + }, + { + "epoch": 2.03, + "learning_rate": 4.982915918980118e-07, + "loss": 0.4033, + "step": 79274 + }, + { + "epoch": 2.03, + "learning_rate": 4.982676561290629e-07, + "loss": 0.4526, + "step": 79275 + }, + { + "epoch": 2.03, + "learning_rate": 4.982437207442675e-07, + "loss": 0.4708, + "step": 79276 + }, + { + "epoch": 2.03, + "learning_rate": 4.982197857436437e-07, + "loss": 0.4414, + "step": 79277 + }, + { + "epoch": 2.03, + "learning_rate": 4.981958511272104e-07, + "loss": 0.3428, + "step": 79278 + }, + { + "epoch": 2.03, + "learning_rate": 4.981719168949851e-07, + "loss": 0.4966, + "step": 79279 + }, + { + "epoch": 2.03, + "learning_rate": 4.981479830469864e-07, + "loss": 0.3438, + "step": 79280 + }, + { + "epoch": 2.03, + "learning_rate": 4.981240495832333e-07, + "loss": 0.3818, + "step": 79281 + }, + { + "epoch": 2.03, + "learning_rate": 4.981001165037433e-07, + "loss": 0.4709, + "step": 79282 + }, + { + "epoch": 2.03, + "learning_rate": 4.980761838085348e-07, + "loss": 0.4409, + "step": 79283 + }, + { + "epoch": 2.03, + "learning_rate": 4.980522514976261e-07, + "loss": 0.3965, + "step": 79284 + }, + { + "epoch": 2.03, + "learning_rate": 4.980283195710358e-07, + "loss": 0.4263, + "step": 79285 + }, + { + "epoch": 2.03, + "learning_rate": 4.980043880287826e-07, + "loss": 0.4399, + "step": 79286 + }, + { + "epoch": 2.03, + "learning_rate": 4.979804568708838e-07, + "loss": 0.4199, + "step": 79287 + }, + { + "epoch": 2.03, + "learning_rate": 4.979565260973583e-07, + "loss": 0.3557, + "step": 79288 + }, + { + "epoch": 2.03, + "learning_rate": 4.979325957082245e-07, + "loss": 0.458, + "step": 79289 + }, + { + "epoch": 2.03, + "learning_rate": 4.97908665703501e-07, + "loss": 0.2637, + "step": 79290 + }, + { + "epoch": 2.03, + "learning_rate": 4.978847360832057e-07, + "loss": 0.4756, + "step": 79291 + }, + { + "epoch": 2.03, + "learning_rate": 4.978608068473566e-07, + "loss": 0.4614, + "step": 79292 + }, + { + "epoch": 2.03, + "learning_rate": 4.978368779959724e-07, + "loss": 0.206, + "step": 79293 + }, + { + "epoch": 2.03, + "learning_rate": 4.978129495290714e-07, + "loss": 0.3862, + "step": 79294 + }, + { + "epoch": 2.03, + "learning_rate": 4.977890214466722e-07, + "loss": 0.3696, + "step": 79295 + }, + { + "epoch": 2.03, + "learning_rate": 4.977650937487927e-07, + "loss": 0.4138, + "step": 79296 + }, + { + "epoch": 2.03, + "learning_rate": 4.977411664354512e-07, + "loss": 0.3521, + "step": 79297 + }, + { + "epoch": 2.03, + "learning_rate": 4.977172395066663e-07, + "loss": 0.4165, + "step": 79298 + }, + { + "epoch": 2.03, + "learning_rate": 4.976933129624565e-07, + "loss": 0.3799, + "step": 79299 + }, + { + "epoch": 2.03, + "learning_rate": 4.976693868028396e-07, + "loss": 0.3347, + "step": 79300 + }, + { + "epoch": 2.03, + "learning_rate": 4.976454610278344e-07, + "loss": 0.375, + "step": 79301 + }, + { + "epoch": 2.03, + "learning_rate": 4.976215356374587e-07, + "loss": 0.4746, + "step": 79302 + }, + { + "epoch": 2.03, + "learning_rate": 4.975976106317314e-07, + "loss": 0.3401, + "step": 79303 + }, + { + "epoch": 2.03, + "learning_rate": 4.9757368601067e-07, + "loss": 0.4038, + "step": 79304 + }, + { + "epoch": 2.03, + "learning_rate": 4.975497617742936e-07, + "loss": 0.3777, + "step": 79305 + }, + { + "epoch": 2.03, + "learning_rate": 4.975258379226201e-07, + "loss": 0.3906, + "step": 79306 + }, + { + "epoch": 2.03, + "learning_rate": 4.975019144556682e-07, + "loss": 0.4644, + "step": 79307 + }, + { + "epoch": 2.03, + "learning_rate": 4.974779913734558e-07, + "loss": 0.3887, + "step": 79308 + }, + { + "epoch": 2.03, + "learning_rate": 4.974540686760014e-07, + "loss": 0.3073, + "step": 79309 + }, + { + "epoch": 2.03, + "learning_rate": 4.974301463633232e-07, + "loss": 0.4326, + "step": 79310 + }, + { + "epoch": 2.03, + "learning_rate": 4.974062244354401e-07, + "loss": 0.3242, + "step": 79311 + }, + { + "epoch": 2.03, + "learning_rate": 4.973823028923699e-07, + "loss": 0.3555, + "step": 79312 + }, + { + "epoch": 2.03, + "learning_rate": 4.973583817341306e-07, + "loss": 0.4316, + "step": 79313 + }, + { + "epoch": 2.03, + "learning_rate": 4.973344609607408e-07, + "loss": 0.3943, + "step": 79314 + }, + { + "epoch": 2.03, + "learning_rate": 4.97310540572219e-07, + "loss": 0.4893, + "step": 79315 + }, + { + "epoch": 2.03, + "learning_rate": 4.972866205685837e-07, + "loss": 0.314, + "step": 79316 + }, + { + "epoch": 2.03, + "learning_rate": 4.972627009498526e-07, + "loss": 0.4795, + "step": 79317 + }, + { + "epoch": 2.03, + "learning_rate": 4.972387817160443e-07, + "loss": 0.5, + "step": 79318 + }, + { + "epoch": 2.03, + "learning_rate": 4.972148628671775e-07, + "loss": 0.3784, + "step": 79319 + }, + { + "epoch": 2.03, + "learning_rate": 4.971909444032698e-07, + "loss": 0.46, + "step": 79320 + }, + { + "epoch": 2.03, + "learning_rate": 4.971670263243403e-07, + "loss": 0.2705, + "step": 79321 + }, + { + "epoch": 2.03, + "learning_rate": 4.971431086304066e-07, + "loss": 0.364, + "step": 79322 + }, + { + "epoch": 2.03, + "learning_rate": 4.97119191321487e-07, + "loss": 0.4028, + "step": 79323 + }, + { + "epoch": 2.03, + "learning_rate": 4.970952743976008e-07, + "loss": 0.4565, + "step": 79324 + }, + { + "epoch": 2.03, + "learning_rate": 4.97071357858765e-07, + "loss": 0.5225, + "step": 79325 + }, + { + "epoch": 2.03, + "learning_rate": 4.970474417049987e-07, + "loss": 0.4192, + "step": 79326 + }, + { + "epoch": 2.03, + "learning_rate": 4.9702352593632e-07, + "loss": 0.3655, + "step": 79327 + }, + { + "epoch": 2.03, + "learning_rate": 4.969996105527477e-07, + "loss": 0.3843, + "step": 79328 + }, + { + "epoch": 2.03, + "learning_rate": 4.969756955542992e-07, + "loss": 0.3252, + "step": 79329 + }, + { + "epoch": 2.03, + "learning_rate": 4.969517809409932e-07, + "loss": 0.562, + "step": 79330 + }, + { + "epoch": 2.03, + "learning_rate": 4.969278667128486e-07, + "loss": 0.4365, + "step": 79331 + }, + { + "epoch": 2.03, + "learning_rate": 4.969039528698828e-07, + "loss": 0.4502, + "step": 79332 + }, + { + "epoch": 2.03, + "learning_rate": 4.968800394121148e-07, + "loss": 0.3181, + "step": 79333 + }, + { + "epoch": 2.03, + "learning_rate": 4.968561263395624e-07, + "loss": 0.4407, + "step": 79334 + }, + { + "epoch": 2.03, + "learning_rate": 4.968322136522441e-07, + "loss": 0.3535, + "step": 79335 + }, + { + "epoch": 2.03, + "learning_rate": 4.968083013501786e-07, + "loss": 0.4277, + "step": 79336 + }, + { + "epoch": 2.03, + "learning_rate": 4.967843894333834e-07, + "loss": 0.5371, + "step": 79337 + }, + { + "epoch": 2.03, + "learning_rate": 4.967604779018772e-07, + "loss": 0.4771, + "step": 79338 + }, + { + "epoch": 2.03, + "learning_rate": 4.967365667556786e-07, + "loss": 0.4395, + "step": 79339 + }, + { + "epoch": 2.03, + "learning_rate": 4.967126559948058e-07, + "loss": 0.3794, + "step": 79340 + }, + { + "epoch": 2.03, + "learning_rate": 4.966887456192771e-07, + "loss": 0.3464, + "step": 79341 + }, + { + "epoch": 2.03, + "learning_rate": 4.966648356291103e-07, + "loss": 0.3755, + "step": 79342 + }, + { + "epoch": 2.03, + "learning_rate": 4.966409260243241e-07, + "loss": 0.2068, + "step": 79343 + }, + { + "epoch": 2.03, + "learning_rate": 4.966170168049367e-07, + "loss": 0.2556, + "step": 79344 + }, + { + "epoch": 2.03, + "learning_rate": 4.96593107970967e-07, + "loss": 0.4041, + "step": 79345 + }, + { + "epoch": 2.03, + "learning_rate": 4.965691995224325e-07, + "loss": 0.4229, + "step": 79346 + }, + { + "epoch": 2.03, + "learning_rate": 4.965452914593517e-07, + "loss": 0.3582, + "step": 79347 + }, + { + "epoch": 2.03, + "learning_rate": 4.965213837817429e-07, + "loss": 0.4121, + "step": 79348 + }, + { + "epoch": 2.03, + "learning_rate": 4.964974764896252e-07, + "loss": 0.3511, + "step": 79349 + }, + { + "epoch": 2.03, + "learning_rate": 4.964735695830156e-07, + "loss": 0.4507, + "step": 79350 + }, + { + "epoch": 2.03, + "learning_rate": 4.964496630619334e-07, + "loss": 0.4033, + "step": 79351 + }, + { + "epoch": 2.03, + "learning_rate": 4.964257569263963e-07, + "loss": 0.2864, + "step": 79352 + }, + { + "epoch": 2.03, + "learning_rate": 4.964018511764232e-07, + "loss": 0.3652, + "step": 79353 + }, + { + "epoch": 2.03, + "learning_rate": 4.963779458120316e-07, + "loss": 0.4031, + "step": 79354 + }, + { + "epoch": 2.03, + "learning_rate": 4.963540408332404e-07, + "loss": 0.4932, + "step": 79355 + }, + { + "epoch": 2.03, + "learning_rate": 4.963301362400676e-07, + "loss": 0.481, + "step": 79356 + }, + { + "epoch": 2.03, + "learning_rate": 4.963062320325321e-07, + "loss": 0.4087, + "step": 79357 + }, + { + "epoch": 2.03, + "learning_rate": 4.962823282106513e-07, + "loss": 0.23, + "step": 79358 + }, + { + "epoch": 2.03, + "learning_rate": 4.962584247744441e-07, + "loss": 0.5635, + "step": 79359 + }, + { + "epoch": 2.03, + "learning_rate": 4.962345217239285e-07, + "loss": 0.3905, + "step": 79360 + }, + { + "epoch": 2.03, + "learning_rate": 4.962106190591235e-07, + "loss": 0.2839, + "step": 79361 + }, + { + "epoch": 2.03, + "learning_rate": 4.961867167800467e-07, + "loss": 0.3682, + "step": 79362 + }, + { + "epoch": 2.03, + "learning_rate": 4.961628148867164e-07, + "loss": 0.3267, + "step": 79363 + }, + { + "epoch": 2.03, + "learning_rate": 4.961389133791509e-07, + "loss": 0.3682, + "step": 79364 + }, + { + "epoch": 2.03, + "learning_rate": 4.961150122573688e-07, + "loss": 0.5068, + "step": 79365 + }, + { + "epoch": 2.03, + "learning_rate": 4.960911115213885e-07, + "loss": 0.4487, + "step": 79366 + }, + { + "epoch": 2.03, + "learning_rate": 4.960672111712278e-07, + "loss": 0.3857, + "step": 79367 + }, + { + "epoch": 2.03, + "learning_rate": 4.960433112069051e-07, + "loss": 0.5044, + "step": 79368 + }, + { + "epoch": 2.03, + "learning_rate": 4.960194116284389e-07, + "loss": 0.5786, + "step": 79369 + }, + { + "epoch": 2.03, + "learning_rate": 4.95995512435848e-07, + "loss": 0.3027, + "step": 79370 + }, + { + "epoch": 2.03, + "learning_rate": 4.959716136291501e-07, + "loss": 0.4692, + "step": 79371 + }, + { + "epoch": 2.03, + "learning_rate": 4.959477152083631e-07, + "loss": 0.3972, + "step": 79372 + }, + { + "epoch": 2.03, + "learning_rate": 4.959238171735058e-07, + "loss": 0.3085, + "step": 79373 + }, + { + "epoch": 2.03, + "learning_rate": 4.958999195245968e-07, + "loss": 0.4878, + "step": 79374 + }, + { + "epoch": 2.03, + "learning_rate": 4.958760222616538e-07, + "loss": 0.4121, + "step": 79375 + }, + { + "epoch": 2.03, + "learning_rate": 4.958521253846952e-07, + "loss": 0.4048, + "step": 79376 + }, + { + "epoch": 2.03, + "learning_rate": 4.958282288937395e-07, + "loss": 0.3848, + "step": 79377 + }, + { + "epoch": 2.03, + "learning_rate": 4.958043327888054e-07, + "loss": 0.5508, + "step": 79378 + }, + { + "epoch": 2.03, + "learning_rate": 4.957804370699102e-07, + "loss": 0.439, + "step": 79379 + }, + { + "epoch": 2.03, + "learning_rate": 4.957565417370729e-07, + "loss": 0.4565, + "step": 79380 + }, + { + "epoch": 2.03, + "learning_rate": 4.957326467903119e-07, + "loss": 0.4316, + "step": 79381 + }, + { + "epoch": 2.03, + "learning_rate": 4.957087522296449e-07, + "loss": 0.4517, + "step": 79382 + }, + { + "epoch": 2.03, + "learning_rate": 4.95684858055091e-07, + "loss": 0.4456, + "step": 79383 + }, + { + "epoch": 2.03, + "learning_rate": 4.956609642666675e-07, + "loss": 0.5371, + "step": 79384 + }, + { + "epoch": 2.03, + "learning_rate": 4.956370708643932e-07, + "loss": 0.3523, + "step": 79385 + }, + { + "epoch": 2.03, + "learning_rate": 4.956131778482864e-07, + "loss": 0.3502, + "step": 79386 + }, + { + "epoch": 2.03, + "learning_rate": 4.955892852183659e-07, + "loss": 0.3015, + "step": 79387 + }, + { + "epoch": 2.03, + "learning_rate": 4.955653929746489e-07, + "loss": 0.4971, + "step": 79388 + }, + { + "epoch": 2.03, + "learning_rate": 4.955415011171544e-07, + "loss": 0.3207, + "step": 79389 + }, + { + "epoch": 2.03, + "learning_rate": 4.95517609645901e-07, + "loss": 0.3926, + "step": 79390 + }, + { + "epoch": 2.03, + "learning_rate": 4.954937185609065e-07, + "loss": 0.4604, + "step": 79391 + }, + { + "epoch": 2.03, + "learning_rate": 4.954698278621889e-07, + "loss": 0.5571, + "step": 79392 + }, + { + "epoch": 2.03, + "learning_rate": 4.95445937549767e-07, + "loss": 0.2381, + "step": 79393 + }, + { + "epoch": 2.03, + "learning_rate": 4.954220476236587e-07, + "loss": 0.345, + "step": 79394 + }, + { + "epoch": 2.03, + "learning_rate": 4.953981580838831e-07, + "loss": 0.4595, + "step": 79395 + }, + { + "epoch": 2.03, + "learning_rate": 4.953742689304574e-07, + "loss": 0.4141, + "step": 79396 + }, + { + "epoch": 2.03, + "learning_rate": 4.953503801634005e-07, + "loss": 0.3691, + "step": 79397 + }, + { + "epoch": 2.04, + "learning_rate": 4.953264917827307e-07, + "loss": 0.2675, + "step": 79398 + }, + { + "epoch": 2.04, + "learning_rate": 4.953026037884664e-07, + "loss": 0.457, + "step": 79399 + }, + { + "epoch": 2.04, + "learning_rate": 4.952787161806255e-07, + "loss": 0.4429, + "step": 79400 + }, + { + "epoch": 2.04, + "learning_rate": 4.952548289592267e-07, + "loss": 0.5244, + "step": 79401 + }, + { + "epoch": 2.04, + "learning_rate": 4.952309421242877e-07, + "loss": 0.4829, + "step": 79402 + }, + { + "epoch": 2.04, + "learning_rate": 4.952070556758272e-07, + "loss": 0.3447, + "step": 79403 + }, + { + "epoch": 2.04, + "learning_rate": 4.951831696138638e-07, + "loss": 0.3168, + "step": 79404 + }, + { + "epoch": 2.04, + "learning_rate": 4.951592839384151e-07, + "loss": 0.5513, + "step": 79405 + }, + { + "epoch": 2.04, + "learning_rate": 4.951353986494997e-07, + "loss": 0.4702, + "step": 79406 + }, + { + "epoch": 2.04, + "learning_rate": 4.95111513747136e-07, + "loss": 0.4053, + "step": 79407 + }, + { + "epoch": 2.04, + "learning_rate": 4.950876292313425e-07, + "loss": 0.4502, + "step": 79408 + }, + { + "epoch": 2.04, + "learning_rate": 4.950637451021367e-07, + "loss": 0.3899, + "step": 79409 + }, + { + "epoch": 2.04, + "learning_rate": 4.950398613595375e-07, + "loss": 0.376, + "step": 79410 + }, + { + "epoch": 2.04, + "learning_rate": 4.950159780035634e-07, + "loss": 0.3843, + "step": 79411 + }, + { + "epoch": 2.04, + "learning_rate": 4.949920950342325e-07, + "loss": 0.3293, + "step": 79412 + }, + { + "epoch": 2.04, + "learning_rate": 4.949682124515624e-07, + "loss": 0.4551, + "step": 79413 + }, + { + "epoch": 2.04, + "learning_rate": 4.94944330255572e-07, + "loss": 0.3389, + "step": 79414 + }, + { + "epoch": 2.04, + "learning_rate": 4.949204484462793e-07, + "loss": 0.3174, + "step": 79415 + }, + { + "epoch": 2.04, + "learning_rate": 4.948965670237033e-07, + "loss": 0.4966, + "step": 79416 + }, + { + "epoch": 2.04, + "learning_rate": 4.948726859878613e-07, + "loss": 0.5581, + "step": 79417 + }, + { + "epoch": 2.04, + "learning_rate": 4.948488053387722e-07, + "loss": 0.3721, + "step": 79418 + }, + { + "epoch": 2.04, + "learning_rate": 4.948249250764542e-07, + "loss": 0.3232, + "step": 79419 + }, + { + "epoch": 2.04, + "learning_rate": 4.948010452009258e-07, + "loss": 0.6028, + "step": 79420 + }, + { + "epoch": 2.04, + "learning_rate": 4.94777165712205e-07, + "loss": 0.4521, + "step": 79421 + }, + { + "epoch": 2.04, + "learning_rate": 4.947532866103096e-07, + "loss": 0.3718, + "step": 79422 + }, + { + "epoch": 2.04, + "learning_rate": 4.947294078952586e-07, + "loss": 0.245, + "step": 79423 + }, + { + "epoch": 2.04, + "learning_rate": 4.9470552956707e-07, + "loss": 0.4736, + "step": 79424 + }, + { + "epoch": 2.04, + "learning_rate": 4.946816516257625e-07, + "loss": 0.3513, + "step": 79425 + }, + { + "epoch": 2.04, + "learning_rate": 4.946577740713536e-07, + "loss": 0.3912, + "step": 79426 + }, + { + "epoch": 2.04, + "learning_rate": 4.94633896903862e-07, + "loss": 0.4897, + "step": 79427 + }, + { + "epoch": 2.04, + "learning_rate": 4.946100201233064e-07, + "loss": 0.4155, + "step": 79428 + }, + { + "epoch": 2.04, + "learning_rate": 4.945861437297043e-07, + "loss": 0.4287, + "step": 79429 + }, + { + "epoch": 2.04, + "learning_rate": 4.945622677230742e-07, + "loss": 0.311, + "step": 79430 + }, + { + "epoch": 2.04, + "learning_rate": 4.945383921034351e-07, + "loss": 0.3926, + "step": 79431 + }, + { + "epoch": 2.04, + "learning_rate": 4.945145168708043e-07, + "loss": 0.5488, + "step": 79432 + }, + { + "epoch": 2.04, + "learning_rate": 4.94490642025201e-07, + "loss": 0.4536, + "step": 79433 + }, + { + "epoch": 2.04, + "learning_rate": 4.944667675666424e-07, + "loss": 0.5254, + "step": 79434 + }, + { + "epoch": 2.04, + "learning_rate": 4.944428934951473e-07, + "loss": 0.4082, + "step": 79435 + }, + { + "epoch": 2.04, + "learning_rate": 4.944190198107342e-07, + "loss": 0.3524, + "step": 79436 + }, + { + "epoch": 2.04, + "learning_rate": 4.943951465134216e-07, + "loss": 0.52, + "step": 79437 + }, + { + "epoch": 2.04, + "learning_rate": 4.943712736032269e-07, + "loss": 0.4243, + "step": 79438 + }, + { + "epoch": 2.04, + "learning_rate": 4.943474010801688e-07, + "loss": 0.3708, + "step": 79439 + }, + { + "epoch": 2.04, + "learning_rate": 4.943235289442657e-07, + "loss": 0.4565, + "step": 79440 + }, + { + "epoch": 2.04, + "learning_rate": 4.942996571955364e-07, + "loss": 0.4722, + "step": 79441 + }, + { + "epoch": 2.04, + "learning_rate": 4.942757858339983e-07, + "loss": 0.3533, + "step": 79442 + }, + { + "epoch": 2.04, + "learning_rate": 4.942519148596698e-07, + "loss": 0.5801, + "step": 79443 + }, + { + "epoch": 2.04, + "learning_rate": 4.942280442725692e-07, + "loss": 0.4531, + "step": 79444 + }, + { + "epoch": 2.04, + "learning_rate": 4.942041740727154e-07, + "loss": 0.3157, + "step": 79445 + }, + { + "epoch": 2.04, + "learning_rate": 4.941803042601259e-07, + "loss": 0.4658, + "step": 79446 + }, + { + "epoch": 2.04, + "learning_rate": 4.941564348348192e-07, + "loss": 0.4365, + "step": 79447 + }, + { + "epoch": 2.04, + "learning_rate": 4.941325657968138e-07, + "loss": 0.4448, + "step": 79448 + }, + { + "epoch": 2.04, + "learning_rate": 4.941086971461279e-07, + "loss": 0.4451, + "step": 79449 + }, + { + "epoch": 2.04, + "learning_rate": 4.940848288827796e-07, + "loss": 0.2884, + "step": 79450 + }, + { + "epoch": 2.04, + "learning_rate": 4.940609610067875e-07, + "loss": 0.3097, + "step": 79451 + }, + { + "epoch": 2.04, + "learning_rate": 4.940370935181694e-07, + "loss": 0.3396, + "step": 79452 + }, + { + "epoch": 2.04, + "learning_rate": 4.940132264169438e-07, + "loss": 0.5122, + "step": 79453 + }, + { + "epoch": 2.04, + "learning_rate": 4.939893597031294e-07, + "loss": 0.4663, + "step": 79454 + }, + { + "epoch": 2.04, + "learning_rate": 4.939654933767437e-07, + "loss": 0.5486, + "step": 79455 + }, + { + "epoch": 2.04, + "learning_rate": 4.939416274378052e-07, + "loss": 0.4761, + "step": 79456 + }, + { + "epoch": 2.04, + "learning_rate": 4.939177618863325e-07, + "loss": 0.5088, + "step": 79457 + }, + { + "epoch": 2.04, + "learning_rate": 4.93893896722344e-07, + "loss": 0.4673, + "step": 79458 + }, + { + "epoch": 2.04, + "learning_rate": 4.938700319458574e-07, + "loss": 0.3958, + "step": 79459 + }, + { + "epoch": 2.04, + "learning_rate": 4.938461675568911e-07, + "loss": 0.2576, + "step": 79460 + }, + { + "epoch": 2.04, + "learning_rate": 4.938223035554639e-07, + "loss": 0.4873, + "step": 79461 + }, + { + "epoch": 2.04, + "learning_rate": 4.937984399415939e-07, + "loss": 0.3787, + "step": 79462 + }, + { + "epoch": 2.04, + "learning_rate": 4.937745767152985e-07, + "loss": 0.4634, + "step": 79463 + }, + { + "epoch": 2.04, + "learning_rate": 4.937507138765968e-07, + "loss": 0.564, + "step": 79464 + }, + { + "epoch": 2.04, + "learning_rate": 4.937268514255068e-07, + "loss": 0.4922, + "step": 79465 + }, + { + "epoch": 2.04, + "learning_rate": 4.937029893620475e-07, + "loss": 0.4199, + "step": 79466 + }, + { + "epoch": 2.04, + "learning_rate": 4.936791276862358e-07, + "loss": 0.4265, + "step": 79467 + }, + { + "epoch": 2.04, + "learning_rate": 4.93655266398091e-07, + "loss": 0.3398, + "step": 79468 + }, + { + "epoch": 2.04, + "learning_rate": 4.936314054976309e-07, + "loss": 0.406, + "step": 79469 + }, + { + "epoch": 2.04, + "learning_rate": 4.936075449848744e-07, + "loss": 0.3894, + "step": 79470 + }, + { + "epoch": 2.04, + "learning_rate": 4.935836848598394e-07, + "loss": 0.4597, + "step": 79471 + }, + { + "epoch": 2.04, + "learning_rate": 4.935598251225435e-07, + "loss": 0.4097, + "step": 79472 + }, + { + "epoch": 2.04, + "learning_rate": 4.935359657730057e-07, + "loss": 0.4014, + "step": 79473 + }, + { + "epoch": 2.04, + "learning_rate": 4.935121068112441e-07, + "loss": 0.4297, + "step": 79474 + }, + { + "epoch": 2.04, + "learning_rate": 4.934882482372774e-07, + "loss": 0.5454, + "step": 79475 + }, + { + "epoch": 2.04, + "learning_rate": 4.93464390051123e-07, + "loss": 0.3933, + "step": 79476 + }, + { + "epoch": 2.04, + "learning_rate": 4.934405322527997e-07, + "loss": 0.3945, + "step": 79477 + }, + { + "epoch": 2.04, + "learning_rate": 4.934166748423256e-07, + "loss": 0.4419, + "step": 79478 + }, + { + "epoch": 2.04, + "learning_rate": 4.933928178197195e-07, + "loss": 0.2797, + "step": 79479 + }, + { + "epoch": 2.04, + "learning_rate": 4.93368961184999e-07, + "loss": 0.3782, + "step": 79480 + }, + { + "epoch": 2.04, + "learning_rate": 4.933451049381827e-07, + "loss": 0.3718, + "step": 79481 + }, + { + "epoch": 2.04, + "learning_rate": 4.933212490792885e-07, + "loss": 0.4922, + "step": 79482 + }, + { + "epoch": 2.04, + "learning_rate": 4.932973936083353e-07, + "loss": 0.3381, + "step": 79483 + }, + { + "epoch": 2.04, + "learning_rate": 4.932735385253406e-07, + "loss": 0.4438, + "step": 79484 + }, + { + "epoch": 2.04, + "learning_rate": 4.93249683830323e-07, + "loss": 0.4819, + "step": 79485 + }, + { + "epoch": 2.04, + "learning_rate": 4.93225829523301e-07, + "loss": 0.4248, + "step": 79486 + }, + { + "epoch": 2.04, + "learning_rate": 4.932019756042929e-07, + "loss": 0.3604, + "step": 79487 + }, + { + "epoch": 2.04, + "learning_rate": 4.931781220733164e-07, + "loss": 0.5249, + "step": 79488 + }, + { + "epoch": 2.04, + "learning_rate": 4.9315426893039e-07, + "loss": 0.3329, + "step": 79489 + }, + { + "epoch": 2.04, + "learning_rate": 4.931304161755323e-07, + "loss": 0.4688, + "step": 79490 + }, + { + "epoch": 2.04, + "learning_rate": 4.931065638087615e-07, + "loss": 0.436, + "step": 79491 + }, + { + "epoch": 2.04, + "learning_rate": 4.930827118300958e-07, + "loss": 0.4707, + "step": 79492 + }, + { + "epoch": 2.04, + "learning_rate": 4.93058860239553e-07, + "loss": 0.4346, + "step": 79493 + }, + { + "epoch": 2.04, + "learning_rate": 4.930350090371516e-07, + "loss": 0.3633, + "step": 79494 + }, + { + "epoch": 2.04, + "learning_rate": 4.930111582229102e-07, + "loss": 0.6035, + "step": 79495 + }, + { + "epoch": 2.04, + "learning_rate": 4.929873077968471e-07, + "loss": 0.3816, + "step": 79496 + }, + { + "epoch": 2.04, + "learning_rate": 4.929634577589798e-07, + "loss": 0.4399, + "step": 79497 + }, + { + "epoch": 2.04, + "learning_rate": 4.929396081093273e-07, + "loss": 0.4062, + "step": 79498 + }, + { + "epoch": 2.04, + "learning_rate": 4.929157588479078e-07, + "loss": 0.3752, + "step": 79499 + }, + { + "epoch": 2.04, + "learning_rate": 4.928919099747395e-07, + "loss": 0.4507, + "step": 79500 + }, + { + "epoch": 2.04, + "learning_rate": 4.928680614898402e-07, + "loss": 0.2661, + "step": 79501 + }, + { + "epoch": 2.04, + "learning_rate": 4.928442133932283e-07, + "loss": 0.45, + "step": 79502 + }, + { + "epoch": 2.04, + "learning_rate": 4.928203656849224e-07, + "loss": 0.3602, + "step": 79503 + }, + { + "epoch": 2.04, + "learning_rate": 4.927965183649412e-07, + "loss": 0.52, + "step": 79504 + }, + { + "epoch": 2.04, + "learning_rate": 4.927726714333016e-07, + "loss": 0.3542, + "step": 79505 + }, + { + "epoch": 2.04, + "learning_rate": 4.92748824890023e-07, + "loss": 0.3542, + "step": 79506 + }, + { + "epoch": 2.04, + "learning_rate": 4.927249787351232e-07, + "loss": 0.3661, + "step": 79507 + }, + { + "epoch": 2.04, + "learning_rate": 4.92701132968621e-07, + "loss": 0.4453, + "step": 79508 + }, + { + "epoch": 2.04, + "learning_rate": 4.926772875905336e-07, + "loss": 0.3373, + "step": 79509 + }, + { + "epoch": 2.04, + "learning_rate": 4.926534426008805e-07, + "loss": 0.4697, + "step": 79510 + }, + { + "epoch": 2.04, + "learning_rate": 4.926295979996787e-07, + "loss": 0.4165, + "step": 79511 + }, + { + "epoch": 2.04, + "learning_rate": 4.926057537869474e-07, + "loss": 0.5171, + "step": 79512 + }, + { + "epoch": 2.04, + "learning_rate": 4.925819099627047e-07, + "loss": 0.4316, + "step": 79513 + }, + { + "epoch": 2.04, + "learning_rate": 4.925580665269684e-07, + "loss": 0.3118, + "step": 79514 + }, + { + "epoch": 2.04, + "learning_rate": 4.92534223479757e-07, + "loss": 0.3448, + "step": 79515 + }, + { + "epoch": 2.04, + "learning_rate": 4.925103808210892e-07, + "loss": 0.3127, + "step": 79516 + }, + { + "epoch": 2.04, + "learning_rate": 4.924865385509826e-07, + "loss": 0.415, + "step": 79517 + }, + { + "epoch": 2.04, + "learning_rate": 4.924626966694556e-07, + "loss": 0.3618, + "step": 79518 + }, + { + "epoch": 2.04, + "learning_rate": 4.924388551765266e-07, + "loss": 0.4746, + "step": 79519 + }, + { + "epoch": 2.04, + "learning_rate": 4.924150140722142e-07, + "loss": 0.4346, + "step": 79520 + }, + { + "epoch": 2.04, + "learning_rate": 4.923911733565364e-07, + "loss": 0.3628, + "step": 79521 + }, + { + "epoch": 2.04, + "learning_rate": 4.923673330295108e-07, + "loss": 0.4248, + "step": 79522 + }, + { + "epoch": 2.04, + "learning_rate": 4.923434930911561e-07, + "loss": 0.3481, + "step": 79523 + }, + { + "epoch": 2.04, + "learning_rate": 4.92319653541491e-07, + "loss": 0.4497, + "step": 79524 + }, + { + "epoch": 2.04, + "learning_rate": 4.922958143805335e-07, + "loss": 0.4675, + "step": 79525 + }, + { + "epoch": 2.04, + "learning_rate": 4.922719756083015e-07, + "loss": 0.3623, + "step": 79526 + }, + { + "epoch": 2.04, + "learning_rate": 4.922481372248134e-07, + "loss": 0.2687, + "step": 79527 + }, + { + "epoch": 2.04, + "learning_rate": 4.922242992300876e-07, + "loss": 0.3953, + "step": 79528 + }, + { + "epoch": 2.04, + "learning_rate": 4.922004616241427e-07, + "loss": 0.3955, + "step": 79529 + }, + { + "epoch": 2.04, + "learning_rate": 4.921766244069965e-07, + "loss": 0.2925, + "step": 79530 + }, + { + "epoch": 2.04, + "learning_rate": 4.921527875786669e-07, + "loss": 0.3394, + "step": 79531 + }, + { + "epoch": 2.04, + "learning_rate": 4.921289511391727e-07, + "loss": 0.4214, + "step": 79532 + }, + { + "epoch": 2.04, + "learning_rate": 4.921051150885324e-07, + "loss": 0.4536, + "step": 79533 + }, + { + "epoch": 2.04, + "learning_rate": 4.920812794267633e-07, + "loss": 0.2861, + "step": 79534 + }, + { + "epoch": 2.04, + "learning_rate": 4.920574441538844e-07, + "loss": 0.2394, + "step": 79535 + }, + { + "epoch": 2.04, + "learning_rate": 4.920336092699137e-07, + "loss": 0.3516, + "step": 79536 + }, + { + "epoch": 2.04, + "learning_rate": 4.920097747748699e-07, + "loss": 0.3381, + "step": 79537 + }, + { + "epoch": 2.04, + "learning_rate": 4.919859406687704e-07, + "loss": 0.4219, + "step": 79538 + }, + { + "epoch": 2.04, + "learning_rate": 4.919621069516339e-07, + "loss": 0.4182, + "step": 79539 + }, + { + "epoch": 2.04, + "learning_rate": 4.919382736234791e-07, + "loss": 0.3025, + "step": 79540 + }, + { + "epoch": 2.04, + "learning_rate": 4.919144406843234e-07, + "loss": 0.377, + "step": 79541 + }, + { + "epoch": 2.04, + "learning_rate": 4.918906081341858e-07, + "loss": 0.3752, + "step": 79542 + }, + { + "epoch": 2.04, + "learning_rate": 4.918667759730838e-07, + "loss": 0.3486, + "step": 79543 + }, + { + "epoch": 2.04, + "learning_rate": 4.918429442010361e-07, + "loss": 0.5542, + "step": 79544 + }, + { + "epoch": 2.04, + "learning_rate": 4.918191128180609e-07, + "loss": 0.3599, + "step": 79545 + }, + { + "epoch": 2.04, + "learning_rate": 4.917952818241769e-07, + "loss": 0.481, + "step": 79546 + }, + { + "epoch": 2.04, + "learning_rate": 4.917714512194013e-07, + "loss": 0.4165, + "step": 79547 + }, + { + "epoch": 2.04, + "learning_rate": 4.917476210037531e-07, + "loss": 0.5503, + "step": 79548 + }, + { + "epoch": 2.04, + "learning_rate": 4.917237911772502e-07, + "loss": 0.498, + "step": 79549 + }, + { + "epoch": 2.04, + "learning_rate": 4.91699961739912e-07, + "loss": 0.3799, + "step": 79550 + }, + { + "epoch": 2.04, + "learning_rate": 4.916761326917549e-07, + "loss": 0.3892, + "step": 79551 + }, + { + "epoch": 2.04, + "learning_rate": 4.91652304032798e-07, + "loss": 0.4421, + "step": 79552 + }, + { + "epoch": 2.04, + "learning_rate": 4.916284757630595e-07, + "loss": 0.4761, + "step": 79553 + }, + { + "epoch": 2.04, + "learning_rate": 4.916046478825583e-07, + "loss": 0.4673, + "step": 79554 + }, + { + "epoch": 2.04, + "learning_rate": 4.915808203913114e-07, + "loss": 0.4941, + "step": 79555 + }, + { + "epoch": 2.04, + "learning_rate": 4.915569932893378e-07, + "loss": 0.3926, + "step": 79556 + }, + { + "epoch": 2.04, + "learning_rate": 4.915331665766557e-07, + "loss": 0.4233, + "step": 79557 + }, + { + "epoch": 2.04, + "learning_rate": 4.915093402532836e-07, + "loss": 0.4229, + "step": 79558 + }, + { + "epoch": 2.04, + "learning_rate": 4.91485514319239e-07, + "loss": 0.3726, + "step": 79559 + }, + { + "epoch": 2.04, + "learning_rate": 4.914616887745409e-07, + "loss": 0.3557, + "step": 79560 + }, + { + "epoch": 2.04, + "learning_rate": 4.91437863619207e-07, + "loss": 0.4033, + "step": 79561 + }, + { + "epoch": 2.04, + "learning_rate": 4.914140388532556e-07, + "loss": 0.418, + "step": 79562 + }, + { + "epoch": 2.04, + "learning_rate": 4.913902144767055e-07, + "loss": 0.4912, + "step": 79563 + }, + { + "epoch": 2.04, + "learning_rate": 4.913663904895742e-07, + "loss": 0.4434, + "step": 79564 + }, + { + "epoch": 2.04, + "learning_rate": 4.913425668918802e-07, + "loss": 0.3, + "step": 79565 + }, + { + "epoch": 2.04, + "learning_rate": 4.913187436836417e-07, + "loss": 0.4336, + "step": 79566 + }, + { + "epoch": 2.04, + "learning_rate": 4.912949208648777e-07, + "loss": 0.3121, + "step": 79567 + }, + { + "epoch": 2.04, + "learning_rate": 4.912710984356053e-07, + "loss": 0.4253, + "step": 79568 + }, + { + "epoch": 2.04, + "learning_rate": 4.912472763958431e-07, + "loss": 0.4722, + "step": 79569 + }, + { + "epoch": 2.04, + "learning_rate": 4.912234547456099e-07, + "loss": 0.3373, + "step": 79570 + }, + { + "epoch": 2.04, + "learning_rate": 4.911996334849235e-07, + "loss": 0.3716, + "step": 79571 + }, + { + "epoch": 2.04, + "learning_rate": 4.911758126138019e-07, + "loss": 0.324, + "step": 79572 + }, + { + "epoch": 2.04, + "learning_rate": 4.911519921322634e-07, + "loss": 0.3545, + "step": 79573 + }, + { + "epoch": 2.04, + "learning_rate": 4.911281720403267e-07, + "loss": 0.4883, + "step": 79574 + }, + { + "epoch": 2.04, + "learning_rate": 4.911043523380098e-07, + "loss": 0.3237, + "step": 79575 + }, + { + "epoch": 2.04, + "learning_rate": 4.910805330253307e-07, + "loss": 0.4092, + "step": 79576 + }, + { + "epoch": 2.04, + "learning_rate": 4.910567141023078e-07, + "loss": 0.5005, + "step": 79577 + }, + { + "epoch": 2.04, + "learning_rate": 4.910328955689595e-07, + "loss": 0.4858, + "step": 79578 + }, + { + "epoch": 2.04, + "learning_rate": 4.910090774253041e-07, + "loss": 0.5317, + "step": 79579 + }, + { + "epoch": 2.04, + "learning_rate": 4.909852596713596e-07, + "loss": 0.5479, + "step": 79580 + }, + { + "epoch": 2.04, + "learning_rate": 4.909614423071441e-07, + "loss": 0.4531, + "step": 79581 + }, + { + "epoch": 2.04, + "learning_rate": 4.909376253326759e-07, + "loss": 0.3828, + "step": 79582 + }, + { + "epoch": 2.04, + "learning_rate": 4.909138087479734e-07, + "loss": 0.48, + "step": 79583 + }, + { + "epoch": 2.04, + "learning_rate": 4.908899925530552e-07, + "loss": 0.4028, + "step": 79584 + }, + { + "epoch": 2.04, + "learning_rate": 4.908661767479386e-07, + "loss": 0.4321, + "step": 79585 + }, + { + "epoch": 2.04, + "learning_rate": 4.908423613326425e-07, + "loss": 0.5117, + "step": 79586 + }, + { + "epoch": 2.04, + "learning_rate": 4.908185463071849e-07, + "loss": 0.5542, + "step": 79587 + }, + { + "epoch": 2.04, + "learning_rate": 4.907947316715845e-07, + "loss": 0.522, + "step": 79588 + }, + { + "epoch": 2.04, + "learning_rate": 4.907709174258588e-07, + "loss": 0.4644, + "step": 79589 + }, + { + "epoch": 2.04, + "learning_rate": 4.907471035700269e-07, + "loss": 0.4243, + "step": 79590 + }, + { + "epoch": 2.04, + "learning_rate": 4.907232901041061e-07, + "loss": 0.3909, + "step": 79591 + }, + { + "epoch": 2.04, + "learning_rate": 4.906994770281153e-07, + "loss": 0.4614, + "step": 79592 + }, + { + "epoch": 2.04, + "learning_rate": 4.906756643420723e-07, + "loss": 0.5122, + "step": 79593 + }, + { + "epoch": 2.04, + "learning_rate": 4.906518520459953e-07, + "loss": 0.3591, + "step": 79594 + }, + { + "epoch": 2.04, + "learning_rate": 4.90628040139903e-07, + "loss": 0.2665, + "step": 79595 + }, + { + "epoch": 2.04, + "learning_rate": 4.906042286238136e-07, + "loss": 0.3735, + "step": 79596 + }, + { + "epoch": 2.04, + "learning_rate": 4.905804174977448e-07, + "loss": 0.4736, + "step": 79597 + }, + { + "epoch": 2.04, + "learning_rate": 4.905566067617152e-07, + "loss": 0.4304, + "step": 79598 + }, + { + "epoch": 2.04, + "learning_rate": 4.905327964157429e-07, + "loss": 0.3252, + "step": 79599 + }, + { + "epoch": 2.04, + "learning_rate": 4.905089864598467e-07, + "loss": 0.3525, + "step": 79600 + }, + { + "epoch": 2.04, + "learning_rate": 4.904851768940441e-07, + "loss": 0.3516, + "step": 79601 + }, + { + "epoch": 2.04, + "learning_rate": 4.904613677183534e-07, + "loss": 0.3804, + "step": 79602 + }, + { + "epoch": 2.04, + "learning_rate": 4.904375589327929e-07, + "loss": 0.4606, + "step": 79603 + }, + { + "epoch": 2.04, + "learning_rate": 4.90413750537381e-07, + "loss": 0.3254, + "step": 79604 + }, + { + "epoch": 2.04, + "learning_rate": 4.903899425321363e-07, + "loss": 0.4158, + "step": 79605 + }, + { + "epoch": 2.04, + "learning_rate": 4.903661349170761e-07, + "loss": 0.3477, + "step": 79606 + }, + { + "epoch": 2.04, + "learning_rate": 4.903423276922192e-07, + "loss": 0.5186, + "step": 79607 + }, + { + "epoch": 2.04, + "learning_rate": 4.90318520857584e-07, + "loss": 0.4883, + "step": 79608 + }, + { + "epoch": 2.04, + "learning_rate": 4.902947144131882e-07, + "loss": 0.4717, + "step": 79609 + }, + { + "epoch": 2.04, + "learning_rate": 4.902709083590506e-07, + "loss": 0.4917, + "step": 79610 + }, + { + "epoch": 2.04, + "learning_rate": 4.902471026951888e-07, + "loss": 0.4399, + "step": 79611 + }, + { + "epoch": 2.04, + "learning_rate": 4.902232974216213e-07, + "loss": 0.5098, + "step": 79612 + }, + { + "epoch": 2.04, + "learning_rate": 4.901994925383669e-07, + "loss": 0.4268, + "step": 79613 + }, + { + "epoch": 2.04, + "learning_rate": 4.901756880454428e-07, + "loss": 0.5684, + "step": 79614 + }, + { + "epoch": 2.04, + "learning_rate": 4.901518839428678e-07, + "loss": 0.4189, + "step": 79615 + }, + { + "epoch": 2.04, + "learning_rate": 4.9012808023066e-07, + "loss": 0.468, + "step": 79616 + }, + { + "epoch": 2.04, + "learning_rate": 4.90104276908838e-07, + "loss": 0.4127, + "step": 79617 + }, + { + "epoch": 2.04, + "learning_rate": 4.900804739774195e-07, + "loss": 0.4683, + "step": 79618 + }, + { + "epoch": 2.04, + "learning_rate": 4.900566714364229e-07, + "loss": 0.4609, + "step": 79619 + }, + { + "epoch": 2.04, + "learning_rate": 4.900328692858667e-07, + "loss": 0.2561, + "step": 79620 + }, + { + "epoch": 2.04, + "learning_rate": 4.900090675257686e-07, + "loss": 0.4194, + "step": 79621 + }, + { + "epoch": 2.04, + "learning_rate": 4.899852661561475e-07, + "loss": 0.4785, + "step": 79622 + }, + { + "epoch": 2.04, + "learning_rate": 4.899614651770208e-07, + "loss": 0.4004, + "step": 79623 + }, + { + "epoch": 2.04, + "learning_rate": 4.899376645884072e-07, + "loss": 0.4453, + "step": 79624 + }, + { + "epoch": 2.04, + "learning_rate": 4.899138643903253e-07, + "loss": 0.3639, + "step": 79625 + }, + { + "epoch": 2.04, + "learning_rate": 4.898900645827925e-07, + "loss": 0.5063, + "step": 79626 + }, + { + "epoch": 2.04, + "learning_rate": 4.898662651658274e-07, + "loss": 0.3625, + "step": 79627 + }, + { + "epoch": 2.04, + "learning_rate": 4.898424661394481e-07, + "loss": 0.416, + "step": 79628 + }, + { + "epoch": 2.04, + "learning_rate": 4.898186675036735e-07, + "loss": 0.5259, + "step": 79629 + }, + { + "epoch": 2.04, + "learning_rate": 4.897948692585213e-07, + "loss": 0.4277, + "step": 79630 + }, + { + "epoch": 2.04, + "learning_rate": 4.897710714040093e-07, + "loss": 0.359, + "step": 79631 + }, + { + "epoch": 2.04, + "learning_rate": 4.897472739401562e-07, + "loss": 0.3308, + "step": 79632 + }, + { + "epoch": 2.04, + "learning_rate": 4.8972347686698e-07, + "loss": 0.3716, + "step": 79633 + }, + { + "epoch": 2.04, + "learning_rate": 4.896996801844996e-07, + "loss": 0.1527, + "step": 79634 + }, + { + "epoch": 2.04, + "learning_rate": 4.896758838927322e-07, + "loss": 0.4639, + "step": 79635 + }, + { + "epoch": 2.04, + "learning_rate": 4.896520879916965e-07, + "loss": 0.4395, + "step": 79636 + }, + { + "epoch": 2.04, + "learning_rate": 4.896282924814108e-07, + "loss": 0.3206, + "step": 79637 + }, + { + "epoch": 2.04, + "learning_rate": 4.896044973618936e-07, + "loss": 0.4436, + "step": 79638 + }, + { + "epoch": 2.04, + "learning_rate": 4.895807026331624e-07, + "loss": 0.4136, + "step": 79639 + }, + { + "epoch": 2.04, + "learning_rate": 4.895569082952362e-07, + "loss": 0.458, + "step": 79640 + }, + { + "epoch": 2.04, + "learning_rate": 4.895331143481324e-07, + "loss": 0.4155, + "step": 79641 + }, + { + "epoch": 2.04, + "learning_rate": 4.895093207918699e-07, + "loss": 0.4219, + "step": 79642 + }, + { + "epoch": 2.04, + "learning_rate": 4.894855276264664e-07, + "loss": 0.35, + "step": 79643 + }, + { + "epoch": 2.04, + "learning_rate": 4.894617348519403e-07, + "loss": 0.2891, + "step": 79644 + }, + { + "epoch": 2.04, + "learning_rate": 4.894379424683098e-07, + "loss": 0.5137, + "step": 79645 + }, + { + "epoch": 2.04, + "learning_rate": 4.894141504755938e-07, + "loss": 0.3407, + "step": 79646 + }, + { + "epoch": 2.04, + "learning_rate": 4.893903588738093e-07, + "loss": 0.4756, + "step": 79647 + }, + { + "epoch": 2.04, + "learning_rate": 4.893665676629751e-07, + "loss": 0.5107, + "step": 79648 + }, + { + "epoch": 2.04, + "learning_rate": 4.893427768431097e-07, + "loss": 0.4131, + "step": 79649 + }, + { + "epoch": 2.04, + "learning_rate": 4.893189864142312e-07, + "loss": 0.4448, + "step": 79650 + }, + { + "epoch": 2.04, + "learning_rate": 4.892951963763578e-07, + "loss": 0.3799, + "step": 79651 + }, + { + "epoch": 2.04, + "learning_rate": 4.892714067295071e-07, + "loss": 0.4941, + "step": 79652 + }, + { + "epoch": 2.04, + "learning_rate": 4.892476174736978e-07, + "loss": 0.3085, + "step": 79653 + }, + { + "epoch": 2.04, + "learning_rate": 4.892238286089481e-07, + "loss": 0.3079, + "step": 79654 + }, + { + "epoch": 2.04, + "learning_rate": 4.892000401352768e-07, + "loss": 0.4067, + "step": 79655 + }, + { + "epoch": 2.04, + "learning_rate": 4.89176252052701e-07, + "loss": 0.4316, + "step": 79656 + }, + { + "epoch": 2.04, + "learning_rate": 4.891524643612395e-07, + "loss": 0.4287, + "step": 79657 + }, + { + "epoch": 2.04, + "learning_rate": 4.891286770609104e-07, + "loss": 0.3906, + "step": 79658 + }, + { + "epoch": 2.04, + "learning_rate": 4.891048901517325e-07, + "loss": 0.4102, + "step": 79659 + }, + { + "epoch": 2.04, + "learning_rate": 4.890811036337234e-07, + "loss": 0.521, + "step": 79660 + }, + { + "epoch": 2.04, + "learning_rate": 4.89057317506901e-07, + "loss": 0.4941, + "step": 79661 + }, + { + "epoch": 2.04, + "learning_rate": 4.89033531771284e-07, + "loss": 0.5073, + "step": 79662 + }, + { + "epoch": 2.04, + "learning_rate": 4.890097464268908e-07, + "loss": 0.5908, + "step": 79663 + }, + { + "epoch": 2.04, + "learning_rate": 4.889859614737391e-07, + "loss": 0.4043, + "step": 79664 + }, + { + "epoch": 2.04, + "learning_rate": 4.889621769118473e-07, + "loss": 0.4082, + "step": 79665 + }, + { + "epoch": 2.04, + "learning_rate": 4.889383927412336e-07, + "loss": 0.4761, + "step": 79666 + }, + { + "epoch": 2.04, + "learning_rate": 4.889146089619167e-07, + "loss": 0.4976, + "step": 79667 + }, + { + "epoch": 2.04, + "learning_rate": 4.88890825573914e-07, + "loss": 0.4365, + "step": 79668 + }, + { + "epoch": 2.04, + "learning_rate": 4.888670425772441e-07, + "loss": 0.3171, + "step": 79669 + }, + { + "epoch": 2.04, + "learning_rate": 4.888432599719256e-07, + "loss": 0.3091, + "step": 79670 + }, + { + "epoch": 2.04, + "learning_rate": 4.888194777579759e-07, + "loss": 0.4092, + "step": 79671 + }, + { + "epoch": 2.04, + "learning_rate": 4.88795695935414e-07, + "loss": 0.3794, + "step": 79672 + }, + { + "epoch": 2.04, + "learning_rate": 4.887719145042574e-07, + "loss": 0.4048, + "step": 79673 + }, + { + "epoch": 2.04, + "learning_rate": 4.887481334645246e-07, + "loss": 0.4688, + "step": 79674 + }, + { + "epoch": 2.04, + "learning_rate": 4.887243528162338e-07, + "loss": 0.4546, + "step": 79675 + }, + { + "epoch": 2.04, + "learning_rate": 4.887005725594038e-07, + "loss": 0.5425, + "step": 79676 + }, + { + "epoch": 2.04, + "learning_rate": 4.886767926940517e-07, + "loss": 0.2775, + "step": 79677 + }, + { + "epoch": 2.04, + "learning_rate": 4.886530132201964e-07, + "loss": 0.3247, + "step": 79678 + }, + { + "epoch": 2.04, + "learning_rate": 4.886292341378561e-07, + "loss": 0.4167, + "step": 79679 + }, + { + "epoch": 2.04, + "learning_rate": 4.886054554470492e-07, + "loss": 0.185, + "step": 79680 + }, + { + "epoch": 2.04, + "learning_rate": 4.885816771477931e-07, + "loss": 0.4561, + "step": 79681 + }, + { + "epoch": 2.04, + "learning_rate": 4.885578992401063e-07, + "loss": 0.4272, + "step": 79682 + }, + { + "epoch": 2.04, + "learning_rate": 4.885341217240075e-07, + "loss": 0.4736, + "step": 79683 + }, + { + "epoch": 2.04, + "learning_rate": 4.885103445995149e-07, + "loss": 0.4253, + "step": 79684 + }, + { + "epoch": 2.04, + "learning_rate": 4.884865678666459e-07, + "loss": 0.4238, + "step": 79685 + }, + { + "epoch": 2.04, + "learning_rate": 4.884627915254194e-07, + "loss": 0.4204, + "step": 79686 + }, + { + "epoch": 2.04, + "learning_rate": 4.884390155758533e-07, + "loss": 0.2114, + "step": 79687 + }, + { + "epoch": 2.04, + "learning_rate": 4.884152400179663e-07, + "loss": 0.5347, + "step": 79688 + }, + { + "epoch": 2.04, + "learning_rate": 4.883914648517758e-07, + "loss": 0.3599, + "step": 79689 + }, + { + "epoch": 2.04, + "learning_rate": 4.883676900773009e-07, + "loss": 0.3037, + "step": 79690 + }, + { + "epoch": 2.04, + "learning_rate": 4.88343915694559e-07, + "loss": 0.3513, + "step": 79691 + }, + { + "epoch": 2.04, + "learning_rate": 4.883201417035685e-07, + "loss": 0.2686, + "step": 79692 + }, + { + "epoch": 2.04, + "learning_rate": 4.882963681043482e-07, + "loss": 0.4531, + "step": 79693 + }, + { + "epoch": 2.04, + "learning_rate": 4.882725948969155e-07, + "loss": 0.5132, + "step": 79694 + }, + { + "epoch": 2.04, + "learning_rate": 4.882488220812889e-07, + "loss": 0.4051, + "step": 79695 + }, + { + "epoch": 2.04, + "learning_rate": 4.88225049657487e-07, + "loss": 0.4062, + "step": 79696 + }, + { + "epoch": 2.04, + "learning_rate": 4.882012776255273e-07, + "loss": 0.3367, + "step": 79697 + }, + { + "epoch": 2.04, + "learning_rate": 4.881775059854284e-07, + "loss": 0.499, + "step": 79698 + }, + { + "epoch": 2.04, + "learning_rate": 4.881537347372084e-07, + "loss": 0.3916, + "step": 79699 + }, + { + "epoch": 2.04, + "learning_rate": 4.881299638808859e-07, + "loss": 0.3215, + "step": 79700 + }, + { + "epoch": 2.04, + "learning_rate": 4.881061934164787e-07, + "loss": 0.3032, + "step": 79701 + }, + { + "epoch": 2.04, + "learning_rate": 4.880824233440048e-07, + "loss": 0.349, + "step": 79702 + }, + { + "epoch": 2.04, + "learning_rate": 4.880586536634826e-07, + "loss": 0.4182, + "step": 79703 + }, + { + "epoch": 2.04, + "learning_rate": 4.880348843749304e-07, + "loss": 0.5332, + "step": 79704 + }, + { + "epoch": 2.04, + "learning_rate": 4.880111154783666e-07, + "loss": 0.4365, + "step": 79705 + }, + { + "epoch": 2.04, + "learning_rate": 4.879873469738089e-07, + "loss": 0.4639, + "step": 79706 + }, + { + "epoch": 2.04, + "learning_rate": 4.879635788612756e-07, + "loss": 0.4341, + "step": 79707 + }, + { + "epoch": 2.04, + "learning_rate": 4.87939811140785e-07, + "loss": 0.4604, + "step": 79708 + }, + { + "epoch": 2.04, + "learning_rate": 4.879160438123559e-07, + "loss": 0.4436, + "step": 79709 + }, + { + "epoch": 2.04, + "learning_rate": 4.87892276876006e-07, + "loss": 0.459, + "step": 79710 + }, + { + "epoch": 2.04, + "learning_rate": 4.878685103317529e-07, + "loss": 0.4001, + "step": 79711 + }, + { + "epoch": 2.04, + "learning_rate": 4.878447441796154e-07, + "loss": 0.4175, + "step": 79712 + }, + { + "epoch": 2.04, + "learning_rate": 4.87820978419612e-07, + "loss": 0.374, + "step": 79713 + }, + { + "epoch": 2.04, + "learning_rate": 4.877972130517601e-07, + "loss": 0.5747, + "step": 79714 + }, + { + "epoch": 2.04, + "learning_rate": 4.877734480760783e-07, + "loss": 0.4167, + "step": 79715 + }, + { + "epoch": 2.04, + "learning_rate": 4.877496834925849e-07, + "loss": 0.5034, + "step": 79716 + }, + { + "epoch": 2.04, + "learning_rate": 4.877259193012983e-07, + "loss": 0.4717, + "step": 79717 + }, + { + "epoch": 2.04, + "learning_rate": 4.877021555022361e-07, + "loss": 0.4888, + "step": 79718 + }, + { + "epoch": 2.04, + "learning_rate": 4.876783920954169e-07, + "loss": 0.375, + "step": 79719 + }, + { + "epoch": 2.04, + "learning_rate": 4.876546290808591e-07, + "loss": 0.4639, + "step": 79720 + }, + { + "epoch": 2.04, + "learning_rate": 4.876308664585801e-07, + "loss": 0.478, + "step": 79721 + }, + { + "epoch": 2.04, + "learning_rate": 4.876071042285991e-07, + "loss": 0.4707, + "step": 79722 + }, + { + "epoch": 2.04, + "learning_rate": 4.875833423909334e-07, + "loss": 0.5356, + "step": 79723 + }, + { + "epoch": 2.04, + "learning_rate": 4.875595809456014e-07, + "loss": 0.4155, + "step": 79724 + }, + { + "epoch": 2.04, + "learning_rate": 4.875358198926218e-07, + "loss": 0.3975, + "step": 79725 + }, + { + "epoch": 2.04, + "learning_rate": 4.875120592320126e-07, + "loss": 0.6172, + "step": 79726 + }, + { + "epoch": 2.04, + "learning_rate": 4.874882989637914e-07, + "loss": 0.4028, + "step": 79727 + }, + { + "epoch": 2.04, + "learning_rate": 4.874645390879769e-07, + "loss": 0.439, + "step": 79728 + }, + { + "epoch": 2.04, + "learning_rate": 4.874407796045873e-07, + "loss": 0.2925, + "step": 79729 + }, + { + "epoch": 2.04, + "learning_rate": 4.874170205136415e-07, + "loss": 0.5352, + "step": 79730 + }, + { + "epoch": 2.04, + "learning_rate": 4.873932618151561e-07, + "loss": 0.3418, + "step": 79731 + }, + { + "epoch": 2.04, + "learning_rate": 4.873695035091502e-07, + "loss": 0.4722, + "step": 79732 + }, + { + "epoch": 2.04, + "learning_rate": 4.873457455956418e-07, + "loss": 0.4673, + "step": 79733 + }, + { + "epoch": 2.04, + "learning_rate": 4.873219880746497e-07, + "loss": 0.3787, + "step": 79734 + }, + { + "epoch": 2.04, + "learning_rate": 4.872982309461911e-07, + "loss": 0.3042, + "step": 79735 + }, + { + "epoch": 2.04, + "learning_rate": 4.872744742102845e-07, + "loss": 0.5117, + "step": 79736 + }, + { + "epoch": 2.04, + "learning_rate": 4.872507178669485e-07, + "loss": 0.3127, + "step": 79737 + }, + { + "epoch": 2.04, + "learning_rate": 4.872269619162014e-07, + "loss": 0.4233, + "step": 79738 + }, + { + "epoch": 2.04, + "learning_rate": 4.872032063580607e-07, + "loss": 0.3766, + "step": 79739 + }, + { + "epoch": 2.04, + "learning_rate": 4.871794511925451e-07, + "loss": 0.3586, + "step": 79740 + }, + { + "epoch": 2.04, + "learning_rate": 4.871556964196724e-07, + "loss": 0.4014, + "step": 79741 + }, + { + "epoch": 2.04, + "learning_rate": 4.871319420394609e-07, + "loss": 0.5493, + "step": 79742 + }, + { + "epoch": 2.04, + "learning_rate": 4.871081880519294e-07, + "loss": 0.4717, + "step": 79743 + }, + { + "epoch": 2.04, + "learning_rate": 4.870844344570951e-07, + "loss": 0.4053, + "step": 79744 + }, + { + "epoch": 2.04, + "learning_rate": 4.870606812549767e-07, + "loss": 0.3286, + "step": 79745 + }, + { + "epoch": 2.04, + "learning_rate": 4.870369284455925e-07, + "loss": 0.3928, + "step": 79746 + }, + { + "epoch": 2.04, + "learning_rate": 4.870131760289607e-07, + "loss": 0.48, + "step": 79747 + }, + { + "epoch": 2.04, + "learning_rate": 4.86989424005099e-07, + "loss": 0.3706, + "step": 79748 + }, + { + "epoch": 2.04, + "learning_rate": 4.869656723740259e-07, + "loss": 0.4434, + "step": 79749 + }, + { + "epoch": 2.04, + "learning_rate": 4.8694192113576e-07, + "loss": 0.4575, + "step": 79750 + }, + { + "epoch": 2.04, + "learning_rate": 4.86918170290319e-07, + "loss": 0.5039, + "step": 79751 + }, + { + "epoch": 2.04, + "learning_rate": 4.868944198377208e-07, + "loss": 0.2842, + "step": 79752 + }, + { + "epoch": 2.04, + "learning_rate": 4.86870669777984e-07, + "loss": 0.4644, + "step": 79753 + }, + { + "epoch": 2.04, + "learning_rate": 4.868469201111268e-07, + "loss": 0.5132, + "step": 79754 + }, + { + "epoch": 2.04, + "learning_rate": 4.868231708371676e-07, + "loss": 0.4658, + "step": 79755 + }, + { + "epoch": 2.04, + "learning_rate": 4.86799421956124e-07, + "loss": 0.4436, + "step": 79756 + }, + { + "epoch": 2.04, + "learning_rate": 4.867756734680144e-07, + "loss": 0.6001, + "step": 79757 + }, + { + "epoch": 2.04, + "learning_rate": 4.867519253728572e-07, + "loss": 0.3306, + "step": 79758 + }, + { + "epoch": 2.04, + "learning_rate": 4.867281776706708e-07, + "loss": 0.328, + "step": 79759 + }, + { + "epoch": 2.04, + "learning_rate": 4.867044303614729e-07, + "loss": 0.499, + "step": 79760 + }, + { + "epoch": 2.04, + "learning_rate": 4.866806834452815e-07, + "loss": 0.4436, + "step": 79761 + }, + { + "epoch": 2.04, + "learning_rate": 4.866569369221151e-07, + "loss": 0.5127, + "step": 79762 + }, + { + "epoch": 2.04, + "learning_rate": 4.866331907919918e-07, + "loss": 0.4189, + "step": 79763 + }, + { + "epoch": 2.04, + "learning_rate": 4.866094450549304e-07, + "loss": 0.3916, + "step": 79764 + }, + { + "epoch": 2.04, + "learning_rate": 4.865856997109481e-07, + "loss": 0.3892, + "step": 79765 + }, + { + "epoch": 2.04, + "learning_rate": 4.865619547600636e-07, + "loss": 0.3682, + "step": 79766 + }, + { + "epoch": 2.04, + "learning_rate": 4.865382102022948e-07, + "loss": 0.394, + "step": 79767 + }, + { + "epoch": 2.04, + "learning_rate": 4.865144660376607e-07, + "loss": 0.2832, + "step": 79768 + }, + { + "epoch": 2.04, + "learning_rate": 4.864907222661782e-07, + "loss": 0.3228, + "step": 79769 + }, + { + "epoch": 2.04, + "learning_rate": 4.864669788878668e-07, + "loss": 0.3499, + "step": 79770 + }, + { + "epoch": 2.04, + "learning_rate": 4.864432359027435e-07, + "loss": 0.4072, + "step": 79771 + }, + { + "epoch": 2.04, + "learning_rate": 4.864194933108274e-07, + "loss": 0.5293, + "step": 79772 + }, + { + "epoch": 2.04, + "learning_rate": 4.863957511121359e-07, + "loss": 0.481, + "step": 79773 + }, + { + "epoch": 2.04, + "learning_rate": 4.863720093066876e-07, + "loss": 0.3118, + "step": 79774 + }, + { + "epoch": 2.04, + "learning_rate": 4.863482678945005e-07, + "loss": 0.4663, + "step": 79775 + }, + { + "epoch": 2.04, + "learning_rate": 4.863245268755935e-07, + "loss": 0.3896, + "step": 79776 + }, + { + "epoch": 2.04, + "learning_rate": 4.863007862499836e-07, + "loss": 0.3506, + "step": 79777 + }, + { + "epoch": 2.04, + "learning_rate": 4.862770460176897e-07, + "loss": 0.3599, + "step": 79778 + }, + { + "epoch": 2.04, + "learning_rate": 4.862533061787298e-07, + "loss": 0.4187, + "step": 79779 + }, + { + "epoch": 2.04, + "learning_rate": 4.862295667331226e-07, + "loss": 0.4314, + "step": 79780 + }, + { + "epoch": 2.04, + "learning_rate": 4.862058276808856e-07, + "loss": 0.4214, + "step": 79781 + }, + { + "epoch": 2.04, + "learning_rate": 4.86182089022037e-07, + "loss": 0.4229, + "step": 79782 + }, + { + "epoch": 2.04, + "learning_rate": 4.861583507565949e-07, + "loss": 0.3242, + "step": 79783 + }, + { + "epoch": 2.04, + "learning_rate": 4.861346128845779e-07, + "loss": 0.3557, + "step": 79784 + }, + { + "epoch": 2.04, + "learning_rate": 4.861108754060043e-07, + "loss": 0.479, + "step": 79785 + }, + { + "epoch": 2.04, + "learning_rate": 4.860871383208918e-07, + "loss": 0.4717, + "step": 79786 + }, + { + "epoch": 2.04, + "learning_rate": 4.860634016292586e-07, + "loss": 0.4707, + "step": 79787 + }, + { + "epoch": 2.05, + "learning_rate": 4.860396653311234e-07, + "loss": 0.3567, + "step": 79788 + }, + { + "epoch": 2.05, + "learning_rate": 4.860159294265036e-07, + "loss": 0.5137, + "step": 79789 + }, + { + "epoch": 2.05, + "learning_rate": 4.859921939154181e-07, + "loss": 0.5098, + "step": 79790 + }, + { + "epoch": 2.05, + "learning_rate": 4.859684587978844e-07, + "loss": 0.5049, + "step": 79791 + }, + { + "epoch": 2.05, + "learning_rate": 4.859447240739211e-07, + "loss": 0.4956, + "step": 79792 + }, + { + "epoch": 2.05, + "learning_rate": 4.859209897435466e-07, + "loss": 0.4468, + "step": 79793 + }, + { + "epoch": 2.05, + "learning_rate": 4.858972558067783e-07, + "loss": 0.5356, + "step": 79794 + }, + { + "epoch": 2.05, + "learning_rate": 4.858735222636349e-07, + "loss": 0.437, + "step": 79795 + }, + { + "epoch": 2.05, + "learning_rate": 4.858497891141347e-07, + "loss": 0.3267, + "step": 79796 + }, + { + "epoch": 2.05, + "learning_rate": 4.858260563582957e-07, + "loss": 0.4902, + "step": 79797 + }, + { + "epoch": 2.05, + "learning_rate": 4.85802323996136e-07, + "loss": 0.237, + "step": 79798 + }, + { + "epoch": 2.05, + "learning_rate": 4.85778592027674e-07, + "loss": 0.4343, + "step": 79799 + }, + { + "epoch": 2.05, + "learning_rate": 4.857548604529274e-07, + "loss": 0.2676, + "step": 79800 + }, + { + "epoch": 2.05, + "learning_rate": 4.857311292719145e-07, + "loss": 0.4531, + "step": 79801 + }, + { + "epoch": 2.05, + "learning_rate": 4.857073984846542e-07, + "loss": 0.4055, + "step": 79802 + }, + { + "epoch": 2.05, + "learning_rate": 4.856836680911635e-07, + "loss": 0.4048, + "step": 79803 + }, + { + "epoch": 2.05, + "learning_rate": 4.856599380914614e-07, + "loss": 0.4551, + "step": 79804 + }, + { + "epoch": 2.05, + "learning_rate": 4.856362084855661e-07, + "loss": 0.46, + "step": 79805 + }, + { + "epoch": 2.05, + "learning_rate": 4.856124792734951e-07, + "loss": 0.4438, + "step": 79806 + }, + { + "epoch": 2.05, + "learning_rate": 4.85588750455267e-07, + "loss": 0.4165, + "step": 79807 + }, + { + "epoch": 2.05, + "learning_rate": 4.855650220309e-07, + "loss": 0.4517, + "step": 79808 + }, + { + "epoch": 2.05, + "learning_rate": 4.855412940004125e-07, + "loss": 0.3223, + "step": 79809 + }, + { + "epoch": 2.05, + "learning_rate": 4.855175663638225e-07, + "loss": 0.377, + "step": 79810 + }, + { + "epoch": 2.05, + "learning_rate": 4.854938391211475e-07, + "loss": 0.3975, + "step": 79811 + }, + { + "epoch": 2.05, + "learning_rate": 4.854701122724063e-07, + "loss": 0.2061, + "step": 79812 + }, + { + "epoch": 2.05, + "learning_rate": 4.85446385817617e-07, + "loss": 0.4189, + "step": 79813 + }, + { + "epoch": 2.05, + "learning_rate": 4.854226597567981e-07, + "loss": 0.5015, + "step": 79814 + }, + { + "epoch": 2.05, + "learning_rate": 4.853989340899671e-07, + "loss": 0.3643, + "step": 79815 + }, + { + "epoch": 2.05, + "learning_rate": 4.853752088171422e-07, + "loss": 0.3346, + "step": 79816 + }, + { + "epoch": 2.05, + "learning_rate": 4.853514839383422e-07, + "loss": 0.3643, + "step": 79817 + }, + { + "epoch": 2.05, + "learning_rate": 4.853277594535849e-07, + "loss": 0.3982, + "step": 79818 + }, + { + "epoch": 2.05, + "learning_rate": 4.853040353628888e-07, + "loss": 0.4668, + "step": 79819 + }, + { + "epoch": 2.05, + "learning_rate": 4.852803116662712e-07, + "loss": 0.4043, + "step": 79820 + }, + { + "epoch": 2.05, + "learning_rate": 4.852565883637508e-07, + "loss": 0.3069, + "step": 79821 + }, + { + "epoch": 2.05, + "learning_rate": 4.852328654553462e-07, + "loss": 0.5425, + "step": 79822 + }, + { + "epoch": 2.05, + "learning_rate": 4.852091429410747e-07, + "loss": 0.3896, + "step": 79823 + }, + { + "epoch": 2.05, + "learning_rate": 4.851854208209549e-07, + "loss": 0.4946, + "step": 79824 + }, + { + "epoch": 2.05, + "learning_rate": 4.85161699095005e-07, + "loss": 0.3542, + "step": 79825 + }, + { + "epoch": 2.05, + "learning_rate": 4.851379777632435e-07, + "loss": 0.5552, + "step": 79826 + }, + { + "epoch": 2.05, + "learning_rate": 4.851142568256878e-07, + "loss": 0.3892, + "step": 79827 + }, + { + "epoch": 2.05, + "learning_rate": 4.850905362823563e-07, + "loss": 0.2218, + "step": 79828 + }, + { + "epoch": 2.05, + "learning_rate": 4.850668161332679e-07, + "loss": 0.4136, + "step": 79829 + }, + { + "epoch": 2.05, + "learning_rate": 4.850430963784396e-07, + "loss": 0.3217, + "step": 79830 + }, + { + "epoch": 2.05, + "learning_rate": 4.850193770178905e-07, + "loss": 0.4407, + "step": 79831 + }, + { + "epoch": 2.05, + "learning_rate": 4.84995658051638e-07, + "loss": 0.4478, + "step": 79832 + }, + { + "epoch": 2.05, + "learning_rate": 4.849719394797007e-07, + "loss": 0.5654, + "step": 79833 + }, + { + "epoch": 2.05, + "learning_rate": 4.849482213020968e-07, + "loss": 0.4614, + "step": 79834 + }, + { + "epoch": 2.05, + "learning_rate": 4.849245035188446e-07, + "loss": 0.4531, + "step": 79835 + }, + { + "epoch": 2.05, + "learning_rate": 4.849007861299616e-07, + "loss": 0.4907, + "step": 79836 + }, + { + "epoch": 2.05, + "learning_rate": 4.848770691354666e-07, + "loss": 0.4194, + "step": 79837 + }, + { + "epoch": 2.05, + "learning_rate": 4.848533525353774e-07, + "loss": 0.4873, + "step": 79838 + }, + { + "epoch": 2.05, + "learning_rate": 4.848296363297131e-07, + "loss": 0.3784, + "step": 79839 + }, + { + "epoch": 2.05, + "learning_rate": 4.848059205184902e-07, + "loss": 0.3579, + "step": 79840 + }, + { + "epoch": 2.05, + "learning_rate": 4.847822051017278e-07, + "loss": 0.3696, + "step": 79841 + }, + { + "epoch": 2.05, + "learning_rate": 4.84758490079444e-07, + "loss": 0.4104, + "step": 79842 + }, + { + "epoch": 2.05, + "learning_rate": 4.847347754516573e-07, + "loss": 0.4648, + "step": 79843 + }, + { + "epoch": 2.05, + "learning_rate": 4.847110612183851e-07, + "loss": 0.3838, + "step": 79844 + }, + { + "epoch": 2.05, + "learning_rate": 4.846873473796459e-07, + "loss": 0.3811, + "step": 79845 + }, + { + "epoch": 2.05, + "learning_rate": 4.84663633935458e-07, + "loss": 0.356, + "step": 79846 + }, + { + "epoch": 2.05, + "learning_rate": 4.846399208858398e-07, + "loss": 0.4082, + "step": 79847 + }, + { + "epoch": 2.05, + "learning_rate": 4.846162082308088e-07, + "loss": 0.3806, + "step": 79848 + }, + { + "epoch": 2.05, + "learning_rate": 4.845924959703837e-07, + "loss": 0.4033, + "step": 79849 + }, + { + "epoch": 2.05, + "learning_rate": 4.845687841045821e-07, + "loss": 0.4036, + "step": 79850 + }, + { + "epoch": 2.05, + "learning_rate": 4.845450726334225e-07, + "loss": 0.5581, + "step": 79851 + }, + { + "epoch": 2.05, + "learning_rate": 4.845213615569234e-07, + "loss": 0.4536, + "step": 79852 + }, + { + "epoch": 2.05, + "learning_rate": 4.844976508751022e-07, + "loss": 0.2458, + "step": 79853 + }, + { + "epoch": 2.05, + "learning_rate": 4.844739405879776e-07, + "loss": 0.4526, + "step": 79854 + }, + { + "epoch": 2.05, + "learning_rate": 4.844502306955673e-07, + "loss": 0.3564, + "step": 79855 + }, + { + "epoch": 2.05, + "learning_rate": 4.844265211978904e-07, + "loss": 0.3051, + "step": 79856 + }, + { + "epoch": 2.05, + "learning_rate": 4.844028120949639e-07, + "loss": 0.5732, + "step": 79857 + }, + { + "epoch": 2.05, + "learning_rate": 4.843791033868066e-07, + "loss": 0.3945, + "step": 79858 + }, + { + "epoch": 2.05, + "learning_rate": 4.843553950734368e-07, + "loss": 0.3579, + "step": 79859 + }, + { + "epoch": 2.05, + "learning_rate": 4.843316871548723e-07, + "loss": 0.2959, + "step": 79860 + }, + { + "epoch": 2.05, + "learning_rate": 4.843079796311309e-07, + "loss": 0.3752, + "step": 79861 + }, + { + "epoch": 2.05, + "learning_rate": 4.842842725022312e-07, + "loss": 0.4697, + "step": 79862 + }, + { + "epoch": 2.05, + "learning_rate": 4.842605657681914e-07, + "loss": 0.5005, + "step": 79863 + }, + { + "epoch": 2.05, + "learning_rate": 4.8423685942903e-07, + "loss": 0.3915, + "step": 79864 + }, + { + "epoch": 2.05, + "learning_rate": 4.842131534847642e-07, + "loss": 0.5, + "step": 79865 + }, + { + "epoch": 2.05, + "learning_rate": 4.841894479354127e-07, + "loss": 0.2767, + "step": 79866 + }, + { + "epoch": 2.05, + "learning_rate": 4.841657427809938e-07, + "loss": 0.4956, + "step": 79867 + }, + { + "epoch": 2.05, + "learning_rate": 4.841420380215256e-07, + "loss": 0.4209, + "step": 79868 + }, + { + "epoch": 2.05, + "learning_rate": 4.841183336570263e-07, + "loss": 0.4404, + "step": 79869 + }, + { + "epoch": 2.05, + "learning_rate": 4.840946296875134e-07, + "loss": 0.4878, + "step": 79870 + }, + { + "epoch": 2.05, + "learning_rate": 4.840709261130055e-07, + "loss": 0.3748, + "step": 79871 + }, + { + "epoch": 2.05, + "learning_rate": 4.840472229335209e-07, + "loss": 0.366, + "step": 79872 + }, + { + "epoch": 2.05, + "learning_rate": 4.840235201490779e-07, + "loss": 0.3994, + "step": 79873 + }, + { + "epoch": 2.05, + "learning_rate": 4.839998177596939e-07, + "loss": 0.2949, + "step": 79874 + }, + { + "epoch": 2.05, + "learning_rate": 4.839761157653877e-07, + "loss": 0.4502, + "step": 79875 + }, + { + "epoch": 2.05, + "learning_rate": 4.839524141661775e-07, + "loss": 0.415, + "step": 79876 + }, + { + "epoch": 2.05, + "learning_rate": 4.839287129620808e-07, + "loss": 0.4927, + "step": 79877 + }, + { + "epoch": 2.05, + "learning_rate": 4.839050121531162e-07, + "loss": 0.3391, + "step": 79878 + }, + { + "epoch": 2.05, + "learning_rate": 4.838813117393022e-07, + "loss": 0.3398, + "step": 79879 + }, + { + "epoch": 2.05, + "learning_rate": 4.838576117206563e-07, + "loss": 0.4221, + "step": 79880 + }, + { + "epoch": 2.05, + "learning_rate": 4.838339120971972e-07, + "loss": 0.3984, + "step": 79881 + }, + { + "epoch": 2.05, + "learning_rate": 4.838102128689422e-07, + "loss": 0.3687, + "step": 79882 + }, + { + "epoch": 2.05, + "learning_rate": 4.837865140359101e-07, + "loss": 0.3999, + "step": 79883 + }, + { + "epoch": 2.05, + "learning_rate": 4.837628155981189e-07, + "loss": 0.3621, + "step": 79884 + }, + { + "epoch": 2.05, + "learning_rate": 4.837391175555873e-07, + "loss": 0.4727, + "step": 79885 + }, + { + "epoch": 2.05, + "learning_rate": 4.837154199083323e-07, + "loss": 0.3538, + "step": 79886 + }, + { + "epoch": 2.05, + "learning_rate": 4.836917226563728e-07, + "loss": 0.3689, + "step": 79887 + }, + { + "epoch": 2.05, + "learning_rate": 4.836680257997269e-07, + "loss": 0.4849, + "step": 79888 + }, + { + "epoch": 2.05, + "learning_rate": 4.836443293384128e-07, + "loss": 0.3916, + "step": 79889 + }, + { + "epoch": 2.05, + "learning_rate": 4.836206332724487e-07, + "loss": 0.4766, + "step": 79890 + }, + { + "epoch": 2.05, + "learning_rate": 4.835969376018521e-07, + "loss": 0.3424, + "step": 79891 + }, + { + "epoch": 2.05, + "learning_rate": 4.835732423266416e-07, + "loss": 0.4039, + "step": 79892 + }, + { + "epoch": 2.05, + "learning_rate": 4.835495474468356e-07, + "loss": 0.4214, + "step": 79893 + }, + { + "epoch": 2.05, + "learning_rate": 4.835258529624516e-07, + "loss": 0.4326, + "step": 79894 + }, + { + "epoch": 2.05, + "learning_rate": 4.835021588735082e-07, + "loss": 0.3818, + "step": 79895 + }, + { + "epoch": 2.05, + "learning_rate": 4.834784651800233e-07, + "loss": 0.4243, + "step": 79896 + }, + { + "epoch": 2.05, + "learning_rate": 4.834547718820157e-07, + "loss": 0.4468, + "step": 79897 + }, + { + "epoch": 2.05, + "learning_rate": 4.834310789795026e-07, + "loss": 0.4419, + "step": 79898 + }, + { + "epoch": 2.05, + "learning_rate": 4.83407386472503e-07, + "loss": 0.4023, + "step": 79899 + }, + { + "epoch": 2.05, + "learning_rate": 4.833836943610342e-07, + "loss": 0.4854, + "step": 79900 + }, + { + "epoch": 2.05, + "learning_rate": 4.833600026451148e-07, + "loss": 0.3462, + "step": 79901 + }, + { + "epoch": 2.05, + "learning_rate": 4.833363113247631e-07, + "loss": 0.2418, + "step": 79902 + }, + { + "epoch": 2.05, + "learning_rate": 4.833126203999968e-07, + "loss": 0.4246, + "step": 79903 + }, + { + "epoch": 2.05, + "learning_rate": 4.832889298708342e-07, + "loss": 0.3193, + "step": 79904 + }, + { + "epoch": 2.05, + "learning_rate": 4.832652397372936e-07, + "loss": 0.4185, + "step": 79905 + }, + { + "epoch": 2.05, + "learning_rate": 4.832415499993934e-07, + "loss": 0.4517, + "step": 79906 + }, + { + "epoch": 2.05, + "learning_rate": 4.83217860657151e-07, + "loss": 0.4141, + "step": 79907 + }, + { + "epoch": 2.05, + "learning_rate": 4.831941717105849e-07, + "loss": 0.4346, + "step": 79908 + }, + { + "epoch": 2.05, + "learning_rate": 4.831704831597135e-07, + "loss": 0.4351, + "step": 79909 + }, + { + "epoch": 2.05, + "learning_rate": 4.831467950045545e-07, + "loss": 0.3402, + "step": 79910 + }, + { + "epoch": 2.05, + "learning_rate": 4.831231072451266e-07, + "loss": 0.5142, + "step": 79911 + }, + { + "epoch": 2.05, + "learning_rate": 4.83099419881447e-07, + "loss": 0.5415, + "step": 79912 + }, + { + "epoch": 2.05, + "learning_rate": 4.830757329135346e-07, + "loss": 0.5542, + "step": 79913 + }, + { + "epoch": 2.05, + "learning_rate": 4.830520463414077e-07, + "loss": 0.3496, + "step": 79914 + }, + { + "epoch": 2.05, + "learning_rate": 4.830283601650838e-07, + "loss": 0.3735, + "step": 79915 + }, + { + "epoch": 2.05, + "learning_rate": 4.830046743845811e-07, + "loss": 0.3975, + "step": 79916 + }, + { + "epoch": 2.05, + "learning_rate": 4.829809889999181e-07, + "loss": 0.5156, + "step": 79917 + }, + { + "epoch": 2.05, + "learning_rate": 4.829573040111132e-07, + "loss": 0.4465, + "step": 79918 + }, + { + "epoch": 2.05, + "learning_rate": 4.829336194181839e-07, + "loss": 0.4126, + "step": 79919 + }, + { + "epoch": 2.05, + "learning_rate": 4.829099352211483e-07, + "loss": 0.3245, + "step": 79920 + }, + { + "epoch": 2.05, + "learning_rate": 4.828862514200249e-07, + "loss": 0.396, + "step": 79921 + }, + { + "epoch": 2.05, + "learning_rate": 4.828625680148315e-07, + "loss": 0.3105, + "step": 79922 + }, + { + "epoch": 2.05, + "learning_rate": 4.828388850055869e-07, + "loss": 0.4526, + "step": 79923 + }, + { + "epoch": 2.05, + "learning_rate": 4.828152023923084e-07, + "loss": 0.4268, + "step": 79924 + }, + { + "epoch": 2.05, + "learning_rate": 4.827915201750147e-07, + "loss": 0.3818, + "step": 79925 + }, + { + "epoch": 2.05, + "learning_rate": 4.827678383537236e-07, + "loss": 0.3823, + "step": 79926 + }, + { + "epoch": 2.05, + "learning_rate": 4.827441569284537e-07, + "loss": 0.2917, + "step": 79927 + }, + { + "epoch": 2.05, + "learning_rate": 4.827204758992225e-07, + "loss": 0.3882, + "step": 79928 + }, + { + "epoch": 2.05, + "learning_rate": 4.826967952660489e-07, + "loss": 0.2955, + "step": 79929 + }, + { + "epoch": 2.05, + "learning_rate": 4.826731150289501e-07, + "loss": 0.3923, + "step": 79930 + }, + { + "epoch": 2.05, + "learning_rate": 4.826494351879451e-07, + "loss": 0.3752, + "step": 79931 + }, + { + "epoch": 2.05, + "learning_rate": 4.826257557430513e-07, + "loss": 0.4746, + "step": 79932 + }, + { + "epoch": 2.05, + "learning_rate": 4.826020766942872e-07, + "loss": 0.3347, + "step": 79933 + }, + { + "epoch": 2.05, + "learning_rate": 4.825783980416708e-07, + "loss": 0.2912, + "step": 79934 + }, + { + "epoch": 2.05, + "learning_rate": 4.825547197852207e-07, + "loss": 0.4526, + "step": 79935 + }, + { + "epoch": 2.05, + "learning_rate": 4.825310419249545e-07, + "loss": 0.4697, + "step": 79936 + }, + { + "epoch": 2.05, + "learning_rate": 4.825073644608903e-07, + "loss": 0.481, + "step": 79937 + }, + { + "epoch": 2.05, + "learning_rate": 4.824836873930463e-07, + "loss": 0.4558, + "step": 79938 + }, + { + "epoch": 2.05, + "learning_rate": 4.824600107214414e-07, + "loss": 0.4399, + "step": 79939 + }, + { + "epoch": 2.05, + "learning_rate": 4.824363344460929e-07, + "loss": 0.4902, + "step": 79940 + }, + { + "epoch": 2.05, + "learning_rate": 4.824126585670188e-07, + "loss": 0.4116, + "step": 79941 + }, + { + "epoch": 2.05, + "learning_rate": 4.823889830842375e-07, + "loss": 0.4497, + "step": 79942 + }, + { + "epoch": 2.05, + "learning_rate": 4.823653079977671e-07, + "loss": 0.3672, + "step": 79943 + }, + { + "epoch": 2.05, + "learning_rate": 4.823416333076262e-07, + "loss": 0.4678, + "step": 79944 + }, + { + "epoch": 2.05, + "learning_rate": 4.823179590138321e-07, + "loss": 0.415, + "step": 79945 + }, + { + "epoch": 2.05, + "learning_rate": 4.822942851164033e-07, + "loss": 0.4785, + "step": 79946 + }, + { + "epoch": 2.05, + "learning_rate": 4.822706116153581e-07, + "loss": 0.2102, + "step": 79947 + }, + { + "epoch": 2.05, + "learning_rate": 4.822469385107148e-07, + "loss": 0.3667, + "step": 79948 + }, + { + "epoch": 2.05, + "learning_rate": 4.822232658024912e-07, + "loss": 0.3724, + "step": 79949 + }, + { + "epoch": 2.05, + "learning_rate": 4.821995934907051e-07, + "loss": 0.4067, + "step": 79950 + }, + { + "epoch": 2.05, + "learning_rate": 4.821759215753749e-07, + "loss": 0.2727, + "step": 79951 + }, + { + "epoch": 2.05, + "learning_rate": 4.821522500565191e-07, + "loss": 0.3127, + "step": 79952 + }, + { + "epoch": 2.05, + "learning_rate": 4.821285789341554e-07, + "loss": 0.3257, + "step": 79953 + }, + { + "epoch": 2.05, + "learning_rate": 4.821049082083017e-07, + "loss": 0.5283, + "step": 79954 + }, + { + "epoch": 2.05, + "learning_rate": 4.820812378789767e-07, + "loss": 0.3691, + "step": 79955 + }, + { + "epoch": 2.05, + "learning_rate": 4.820575679461985e-07, + "loss": 0.4351, + "step": 79956 + }, + { + "epoch": 2.05, + "learning_rate": 4.820338984099847e-07, + "loss": 0.353, + "step": 79957 + }, + { + "epoch": 2.05, + "learning_rate": 4.820102292703538e-07, + "loss": 0.5107, + "step": 79958 + }, + { + "epoch": 2.05, + "learning_rate": 4.819865605273242e-07, + "loss": 0.2261, + "step": 79959 + }, + { + "epoch": 2.05, + "learning_rate": 4.819628921809133e-07, + "loss": 0.5256, + "step": 79960 + }, + { + "epoch": 2.05, + "learning_rate": 4.819392242311398e-07, + "loss": 0.3765, + "step": 79961 + }, + { + "epoch": 2.05, + "learning_rate": 4.819155566780214e-07, + "loss": 0.5815, + "step": 79962 + }, + { + "epoch": 2.05, + "learning_rate": 4.818918895215764e-07, + "loss": 0.3735, + "step": 79963 + }, + { + "epoch": 2.05, + "learning_rate": 4.818682227618229e-07, + "loss": 0.5073, + "step": 79964 + }, + { + "epoch": 2.05, + "learning_rate": 4.818445563987797e-07, + "loss": 0.519, + "step": 79965 + }, + { + "epoch": 2.05, + "learning_rate": 4.818208904324636e-07, + "loss": 0.4321, + "step": 79966 + }, + { + "epoch": 2.05, + "learning_rate": 4.817972248628935e-07, + "loss": 0.4668, + "step": 79967 + }, + { + "epoch": 2.05, + "learning_rate": 4.817735596900879e-07, + "loss": 0.4624, + "step": 79968 + }, + { + "epoch": 2.05, + "learning_rate": 4.817498949140645e-07, + "loss": 0.2599, + "step": 79969 + }, + { + "epoch": 2.05, + "learning_rate": 4.817262305348409e-07, + "loss": 0.5098, + "step": 79970 + }, + { + "epoch": 2.05, + "learning_rate": 4.817025665524357e-07, + "loss": 0.5605, + "step": 79971 + }, + { + "epoch": 2.05, + "learning_rate": 4.816789029668669e-07, + "loss": 0.2808, + "step": 79972 + }, + { + "epoch": 2.05, + "learning_rate": 4.816552397781533e-07, + "loss": 0.4282, + "step": 79973 + }, + { + "epoch": 2.05, + "learning_rate": 4.816315769863121e-07, + "loss": 0.4062, + "step": 79974 + }, + { + "epoch": 2.05, + "learning_rate": 4.816079145913616e-07, + "loss": 0.4429, + "step": 79975 + }, + { + "epoch": 2.05, + "learning_rate": 4.815842525933201e-07, + "loss": 0.4131, + "step": 79976 + }, + { + "epoch": 2.05, + "learning_rate": 4.815605909922063e-07, + "loss": 0.4766, + "step": 79977 + }, + { + "epoch": 2.05, + "learning_rate": 4.815369297880371e-07, + "loss": 0.2898, + "step": 79978 + }, + { + "epoch": 2.05, + "learning_rate": 4.815132689808317e-07, + "loss": 0.4771, + "step": 79979 + }, + { + "epoch": 2.05, + "learning_rate": 4.814896085706073e-07, + "loss": 0.3019, + "step": 79980 + }, + { + "epoch": 2.05, + "learning_rate": 4.814659485573825e-07, + "loss": 0.478, + "step": 79981 + }, + { + "epoch": 2.05, + "learning_rate": 4.814422889411757e-07, + "loss": 0.4014, + "step": 79982 + }, + { + "epoch": 2.05, + "learning_rate": 4.814186297220045e-07, + "loss": 0.3464, + "step": 79983 + }, + { + "epoch": 2.05, + "learning_rate": 4.813949708998871e-07, + "loss": 0.4478, + "step": 79984 + }, + { + "epoch": 2.05, + "learning_rate": 4.813713124748422e-07, + "loss": 0.2253, + "step": 79985 + }, + { + "epoch": 2.05, + "learning_rate": 4.81347654446887e-07, + "loss": 0.458, + "step": 79986 + }, + { + "epoch": 2.05, + "learning_rate": 4.8132399681604e-07, + "loss": 0.4058, + "step": 79987 + }, + { + "epoch": 2.05, + "learning_rate": 4.813003395823193e-07, + "loss": 0.4341, + "step": 79988 + }, + { + "epoch": 2.05, + "learning_rate": 4.812766827457435e-07, + "loss": 0.5054, + "step": 79989 + }, + { + "epoch": 2.05, + "learning_rate": 4.812530263063303e-07, + "loss": 0.417, + "step": 79990 + }, + { + "epoch": 2.05, + "learning_rate": 4.812293702640976e-07, + "loss": 0.3774, + "step": 79991 + }, + { + "epoch": 2.05, + "learning_rate": 4.812057146190636e-07, + "loss": 0.4565, + "step": 79992 + }, + { + "epoch": 2.05, + "learning_rate": 4.811820593712465e-07, + "loss": 0.5327, + "step": 79993 + }, + { + "epoch": 2.05, + "learning_rate": 4.811584045206648e-07, + "loss": 0.3313, + "step": 79994 + }, + { + "epoch": 2.05, + "learning_rate": 4.811347500673359e-07, + "loss": 0.3779, + "step": 79995 + }, + { + "epoch": 2.05, + "learning_rate": 4.811110960112783e-07, + "loss": 0.3782, + "step": 79996 + }, + { + "epoch": 2.05, + "learning_rate": 4.810874423525099e-07, + "loss": 0.3647, + "step": 79997 + }, + { + "epoch": 2.05, + "learning_rate": 4.810637890910496e-07, + "loss": 0.4595, + "step": 79998 + }, + { + "epoch": 2.05, + "learning_rate": 4.810401362269149e-07, + "loss": 0.4429, + "step": 79999 + }, + { + "epoch": 2.05, + "learning_rate": 4.810164837601233e-07, + "loss": 0.2094, + "step": 80000 + }, + { + "epoch": 2.05, + "learning_rate": 4.809928316906937e-07, + "loss": 0.478, + "step": 80001 + }, + { + "epoch": 2.05, + "learning_rate": 4.809691800186444e-07, + "loss": 0.3979, + "step": 80002 + }, + { + "epoch": 2.05, + "learning_rate": 4.809455287439927e-07, + "loss": 0.4854, + "step": 80003 + }, + { + "epoch": 2.05, + "learning_rate": 4.80921877866757e-07, + "loss": 0.3679, + "step": 80004 + }, + { + "epoch": 2.05, + "learning_rate": 4.808982273869558e-07, + "loss": 0.3752, + "step": 80005 + }, + { + "epoch": 2.05, + "learning_rate": 4.808745773046073e-07, + "loss": 0.3575, + "step": 80006 + }, + { + "epoch": 2.05, + "learning_rate": 4.808509276197288e-07, + "loss": 0.3848, + "step": 80007 + }, + { + "epoch": 2.05, + "learning_rate": 4.808272783323389e-07, + "loss": 0.5474, + "step": 80008 + }, + { + "epoch": 2.05, + "learning_rate": 4.80803629442456e-07, + "loss": 0.3726, + "step": 80009 + }, + { + "epoch": 2.05, + "learning_rate": 4.807799809500975e-07, + "loss": 0.4082, + "step": 80010 + }, + { + "epoch": 2.05, + "learning_rate": 4.807563328552824e-07, + "loss": 0.394, + "step": 80011 + }, + { + "epoch": 2.05, + "learning_rate": 4.807326851580279e-07, + "loss": 0.3645, + "step": 80012 + }, + { + "epoch": 2.05, + "learning_rate": 4.807090378583523e-07, + "loss": 0.3838, + "step": 80013 + }, + { + "epoch": 2.05, + "learning_rate": 4.806853909562742e-07, + "loss": 0.4473, + "step": 80014 + }, + { + "epoch": 2.05, + "learning_rate": 4.806617444518117e-07, + "loss": 0.2947, + "step": 80015 + }, + { + "epoch": 2.05, + "learning_rate": 4.806380983449822e-07, + "loss": 0.4424, + "step": 80016 + }, + { + "epoch": 2.05, + "learning_rate": 4.806144526358042e-07, + "loss": 0.4253, + "step": 80017 + }, + { + "epoch": 2.05, + "learning_rate": 4.805908073242959e-07, + "loss": 0.2925, + "step": 80018 + }, + { + "epoch": 2.05, + "learning_rate": 4.805671624104761e-07, + "loss": 0.4191, + "step": 80019 + }, + { + "epoch": 2.05, + "learning_rate": 4.805435178943613e-07, + "loss": 0.2361, + "step": 80020 + }, + { + "epoch": 2.05, + "learning_rate": 4.805198737759705e-07, + "loss": 0.3389, + "step": 80021 + }, + { + "epoch": 2.05, + "learning_rate": 4.804962300553217e-07, + "loss": 0.5381, + "step": 80022 + }, + { + "epoch": 2.05, + "learning_rate": 4.804725867324335e-07, + "loss": 0.3413, + "step": 80023 + }, + { + "epoch": 2.05, + "learning_rate": 4.804489438073232e-07, + "loss": 0.3723, + "step": 80024 + }, + { + "epoch": 2.05, + "learning_rate": 4.804253012800092e-07, + "loss": 0.3683, + "step": 80025 + }, + { + "epoch": 2.05, + "learning_rate": 4.804016591505096e-07, + "loss": 0.2881, + "step": 80026 + }, + { + "epoch": 2.05, + "learning_rate": 4.803780174188429e-07, + "loss": 0.4253, + "step": 80027 + }, + { + "epoch": 2.05, + "learning_rate": 4.803543760850266e-07, + "loss": 0.417, + "step": 80028 + }, + { + "epoch": 2.05, + "learning_rate": 4.803307351490795e-07, + "loss": 0.302, + "step": 80029 + }, + { + "epoch": 2.05, + "learning_rate": 4.803070946110187e-07, + "loss": 0.5156, + "step": 80030 + }, + { + "epoch": 2.05, + "learning_rate": 4.802834544708631e-07, + "loss": 0.3745, + "step": 80031 + }, + { + "epoch": 2.05, + "learning_rate": 4.802598147286307e-07, + "loss": 0.4135, + "step": 80032 + }, + { + "epoch": 2.05, + "learning_rate": 4.802361753843391e-07, + "loss": 0.4531, + "step": 80033 + }, + { + "epoch": 2.05, + "learning_rate": 4.802125364380069e-07, + "loss": 0.4663, + "step": 80034 + }, + { + "epoch": 2.05, + "learning_rate": 4.80188897889652e-07, + "loss": 0.3912, + "step": 80035 + }, + { + "epoch": 2.05, + "learning_rate": 4.801652597392928e-07, + "loss": 0.459, + "step": 80036 + }, + { + "epoch": 2.05, + "learning_rate": 4.801416219869471e-07, + "loss": 0.4771, + "step": 80037 + }, + { + "epoch": 2.05, + "learning_rate": 4.801179846326328e-07, + "loss": 0.3088, + "step": 80038 + }, + { + "epoch": 2.05, + "learning_rate": 4.800943476763687e-07, + "loss": 0.3079, + "step": 80039 + }, + { + "epoch": 2.05, + "learning_rate": 4.800707111181724e-07, + "loss": 0.354, + "step": 80040 + }, + { + "epoch": 2.05, + "learning_rate": 4.800470749580617e-07, + "loss": 0.3778, + "step": 80041 + }, + { + "epoch": 2.05, + "learning_rate": 4.800234391960552e-07, + "loss": 0.4673, + "step": 80042 + }, + { + "epoch": 2.05, + "learning_rate": 4.799998038321707e-07, + "loss": 0.3024, + "step": 80043 + }, + { + "epoch": 2.05, + "learning_rate": 4.799761688664267e-07, + "loss": 0.364, + "step": 80044 + }, + { + "epoch": 2.05, + "learning_rate": 4.799525342988409e-07, + "loss": 0.4585, + "step": 80045 + }, + { + "epoch": 2.05, + "learning_rate": 4.799289001294315e-07, + "loss": 0.4849, + "step": 80046 + }, + { + "epoch": 2.05, + "learning_rate": 4.799052663582165e-07, + "loss": 0.4038, + "step": 80047 + }, + { + "epoch": 2.05, + "learning_rate": 4.798816329852145e-07, + "loss": 0.3892, + "step": 80048 + }, + { + "epoch": 2.05, + "learning_rate": 4.798580000104433e-07, + "loss": 0.3818, + "step": 80049 + }, + { + "epoch": 2.05, + "learning_rate": 4.798343674339205e-07, + "loss": 0.5532, + "step": 80050 + }, + { + "epoch": 2.05, + "learning_rate": 4.798107352556646e-07, + "loss": 0.3816, + "step": 80051 + }, + { + "epoch": 2.05, + "learning_rate": 4.797871034756938e-07, + "loss": 0.5444, + "step": 80052 + }, + { + "epoch": 2.05, + "learning_rate": 4.797634720940264e-07, + "loss": 0.4199, + "step": 80053 + }, + { + "epoch": 2.05, + "learning_rate": 4.797398411106797e-07, + "loss": 0.3523, + "step": 80054 + }, + { + "epoch": 2.05, + "learning_rate": 4.797162105256723e-07, + "loss": 0.3094, + "step": 80055 + }, + { + "epoch": 2.05, + "learning_rate": 4.796925803390228e-07, + "loss": 0.4492, + "step": 80056 + }, + { + "epoch": 2.05, + "learning_rate": 4.796689505507483e-07, + "loss": 0.5449, + "step": 80057 + }, + { + "epoch": 2.05, + "learning_rate": 4.796453211608674e-07, + "loss": 0.4302, + "step": 80058 + }, + { + "epoch": 2.05, + "learning_rate": 4.796216921693985e-07, + "loss": 0.3945, + "step": 80059 + }, + { + "epoch": 2.05, + "learning_rate": 4.79598063576359e-07, + "loss": 0.3857, + "step": 80060 + }, + { + "epoch": 2.05, + "learning_rate": 4.795744353817676e-07, + "loss": 0.5581, + "step": 80061 + }, + { + "epoch": 2.05, + "learning_rate": 4.79550807585642e-07, + "loss": 0.4536, + "step": 80062 + }, + { + "epoch": 2.05, + "learning_rate": 4.795271801880001e-07, + "loss": 0.3765, + "step": 80063 + }, + { + "epoch": 2.05, + "learning_rate": 4.795035531888605e-07, + "loss": 0.4146, + "step": 80064 + }, + { + "epoch": 2.05, + "learning_rate": 4.794799265882415e-07, + "loss": 0.4507, + "step": 80065 + }, + { + "epoch": 2.05, + "learning_rate": 4.794563003861602e-07, + "loss": 0.5078, + "step": 80066 + }, + { + "epoch": 2.05, + "learning_rate": 4.794326745826355e-07, + "loss": 0.3967, + "step": 80067 + }, + { + "epoch": 2.05, + "learning_rate": 4.794090491776851e-07, + "loss": 0.356, + "step": 80068 + }, + { + "epoch": 2.05, + "learning_rate": 4.793854241713277e-07, + "loss": 0.2376, + "step": 80069 + }, + { + "epoch": 2.05, + "learning_rate": 4.79361799563581e-07, + "loss": 0.3418, + "step": 80070 + }, + { + "epoch": 2.05, + "learning_rate": 4.793381753544626e-07, + "loss": 0.5186, + "step": 80071 + }, + { + "epoch": 2.05, + "learning_rate": 4.79314551543991e-07, + "loss": 0.3401, + "step": 80072 + }, + { + "epoch": 2.05, + "learning_rate": 4.792909281321843e-07, + "loss": 0.302, + "step": 80073 + }, + { + "epoch": 2.05, + "learning_rate": 4.79267305119061e-07, + "loss": 0.4336, + "step": 80074 + }, + { + "epoch": 2.05, + "learning_rate": 4.792436825046385e-07, + "loss": 0.3428, + "step": 80075 + }, + { + "epoch": 2.05, + "learning_rate": 4.79220060288935e-07, + "loss": 0.48, + "step": 80076 + }, + { + "epoch": 2.05, + "learning_rate": 4.791964384719692e-07, + "loss": 0.4268, + "step": 80077 + }, + { + "epoch": 2.05, + "learning_rate": 4.791728170537583e-07, + "loss": 0.4648, + "step": 80078 + }, + { + "epoch": 2.05, + "learning_rate": 4.791491960343214e-07, + "loss": 0.4951, + "step": 80079 + }, + { + "epoch": 2.05, + "learning_rate": 4.791255754136753e-07, + "loss": 0.3103, + "step": 80080 + }, + { + "epoch": 2.05, + "learning_rate": 4.791019551918392e-07, + "loss": 0.4893, + "step": 80081 + }, + { + "epoch": 2.05, + "learning_rate": 4.790783353688309e-07, + "loss": 0.3643, + "step": 80082 + }, + { + "epoch": 2.05, + "learning_rate": 4.79054715944668e-07, + "loss": 0.3325, + "step": 80083 + }, + { + "epoch": 2.05, + "learning_rate": 4.790310969193691e-07, + "loss": 0.3306, + "step": 80084 + }, + { + "epoch": 2.05, + "learning_rate": 4.79007478292952e-07, + "loss": 0.4189, + "step": 80085 + }, + { + "epoch": 2.05, + "learning_rate": 4.789838600654352e-07, + "loss": 0.2318, + "step": 80086 + }, + { + "epoch": 2.05, + "learning_rate": 4.789602422368363e-07, + "loss": 0.4419, + "step": 80087 + }, + { + "epoch": 2.05, + "learning_rate": 4.789366248071735e-07, + "loss": 0.3582, + "step": 80088 + }, + { + "epoch": 2.05, + "learning_rate": 4.789130077764654e-07, + "loss": 0.4907, + "step": 80089 + }, + { + "epoch": 2.05, + "learning_rate": 4.788893911447293e-07, + "loss": 0.2634, + "step": 80090 + }, + { + "epoch": 2.05, + "learning_rate": 4.788657749119839e-07, + "loss": 0.4492, + "step": 80091 + }, + { + "epoch": 2.05, + "learning_rate": 4.788421590782467e-07, + "loss": 0.2969, + "step": 80092 + }, + { + "epoch": 2.05, + "learning_rate": 4.788185436435361e-07, + "loss": 0.3945, + "step": 80093 + }, + { + "epoch": 2.05, + "learning_rate": 4.787949286078705e-07, + "loss": 0.3868, + "step": 80094 + }, + { + "epoch": 2.05, + "learning_rate": 4.787713139712674e-07, + "loss": 0.4021, + "step": 80095 + }, + { + "epoch": 2.05, + "learning_rate": 4.787476997337449e-07, + "loss": 0.4985, + "step": 80096 + }, + { + "epoch": 2.05, + "learning_rate": 4.787240858953215e-07, + "loss": 0.4341, + "step": 80097 + }, + { + "epoch": 2.05, + "learning_rate": 4.787004724560155e-07, + "loss": 0.3706, + "step": 80098 + }, + { + "epoch": 2.05, + "learning_rate": 4.786768594158446e-07, + "loss": 0.5161, + "step": 80099 + }, + { + "epoch": 2.05, + "learning_rate": 4.786532467748264e-07, + "loss": 0.2827, + "step": 80100 + }, + { + "epoch": 2.05, + "learning_rate": 4.786296345329795e-07, + "loss": 0.5195, + "step": 80101 + }, + { + "epoch": 2.05, + "learning_rate": 4.786060226903218e-07, + "loss": 0.4146, + "step": 80102 + }, + { + "epoch": 2.05, + "learning_rate": 4.785824112468719e-07, + "loss": 0.3562, + "step": 80103 + }, + { + "epoch": 2.05, + "learning_rate": 4.785588002026471e-07, + "loss": 0.4536, + "step": 80104 + }, + { + "epoch": 2.05, + "learning_rate": 4.78535189557666e-07, + "loss": 0.3647, + "step": 80105 + }, + { + "epoch": 2.05, + "learning_rate": 4.785115793119464e-07, + "loss": 0.3726, + "step": 80106 + }, + { + "epoch": 2.05, + "learning_rate": 4.784879694655069e-07, + "loss": 0.4346, + "step": 80107 + }, + { + "epoch": 2.05, + "learning_rate": 4.784643600183651e-07, + "loss": 0.4011, + "step": 80108 + }, + { + "epoch": 2.05, + "learning_rate": 4.784407509705389e-07, + "loss": 0.4277, + "step": 80109 + }, + { + "epoch": 2.05, + "learning_rate": 4.784171423220466e-07, + "loss": 0.3547, + "step": 80110 + }, + { + "epoch": 2.05, + "learning_rate": 4.783935340729067e-07, + "loss": 0.4397, + "step": 80111 + }, + { + "epoch": 2.05, + "learning_rate": 4.783699262231364e-07, + "loss": 0.4044, + "step": 80112 + }, + { + "epoch": 2.05, + "learning_rate": 4.783463187727544e-07, + "loss": 0.478, + "step": 80113 + }, + { + "epoch": 2.05, + "learning_rate": 4.783227117217786e-07, + "loss": 0.4097, + "step": 80114 + }, + { + "epoch": 2.05, + "learning_rate": 4.782991050702274e-07, + "loss": 0.2642, + "step": 80115 + }, + { + "epoch": 2.05, + "learning_rate": 4.782754988181183e-07, + "loss": 0.5137, + "step": 80116 + }, + { + "epoch": 2.05, + "learning_rate": 4.782518929654698e-07, + "loss": 0.4199, + "step": 80117 + }, + { + "epoch": 2.05, + "learning_rate": 4.782282875123e-07, + "loss": 0.3872, + "step": 80118 + }, + { + "epoch": 2.05, + "learning_rate": 4.782046824586265e-07, + "loss": 0.4927, + "step": 80119 + }, + { + "epoch": 2.05, + "learning_rate": 4.781810778044681e-07, + "loss": 0.3596, + "step": 80120 + }, + { + "epoch": 2.05, + "learning_rate": 4.781574735498419e-07, + "loss": 0.293, + "step": 80121 + }, + { + "epoch": 2.05, + "learning_rate": 4.781338696947667e-07, + "loss": 0.365, + "step": 80122 + }, + { + "epoch": 2.05, + "learning_rate": 4.781102662392603e-07, + "loss": 0.2646, + "step": 80123 + }, + { + "epoch": 2.05, + "learning_rate": 4.780866631833414e-07, + "loss": 0.5059, + "step": 80124 + }, + { + "epoch": 2.05, + "learning_rate": 4.78063060527027e-07, + "loss": 0.4106, + "step": 80125 + }, + { + "epoch": 2.05, + "learning_rate": 4.780394582703358e-07, + "loss": 0.3108, + "step": 80126 + }, + { + "epoch": 2.05, + "learning_rate": 4.780158564132858e-07, + "loss": 0.4185, + "step": 80127 + }, + { + "epoch": 2.05, + "learning_rate": 4.779922549558958e-07, + "loss": 0.375, + "step": 80128 + }, + { + "epoch": 2.05, + "learning_rate": 4.779686538981823e-07, + "loss": 0.46, + "step": 80129 + }, + { + "epoch": 2.05, + "learning_rate": 4.779450532401643e-07, + "loss": 0.4371, + "step": 80130 + }, + { + "epoch": 2.05, + "learning_rate": 4.779214529818597e-07, + "loss": 0.4629, + "step": 80131 + }, + { + "epoch": 2.05, + "learning_rate": 4.77897853123287e-07, + "loss": 0.5186, + "step": 80132 + }, + { + "epoch": 2.05, + "learning_rate": 4.778742536644637e-07, + "loss": 0.5005, + "step": 80133 + }, + { + "epoch": 2.05, + "learning_rate": 4.778506546054078e-07, + "loss": 0.4419, + "step": 80134 + }, + { + "epoch": 2.05, + "learning_rate": 4.778270559461378e-07, + "loss": 0.3047, + "step": 80135 + }, + { + "epoch": 2.05, + "learning_rate": 4.778034576866721e-07, + "loss": 0.3857, + "step": 80136 + }, + { + "epoch": 2.05, + "learning_rate": 4.777798598270277e-07, + "loss": 0.3215, + "step": 80137 + }, + { + "epoch": 2.05, + "learning_rate": 4.777562623672238e-07, + "loss": 0.4526, + "step": 80138 + }, + { + "epoch": 2.05, + "learning_rate": 4.777326653072774e-07, + "loss": 0.501, + "step": 80139 + }, + { + "epoch": 2.05, + "learning_rate": 4.777090686472071e-07, + "loss": 0.4614, + "step": 80140 + }, + { + "epoch": 2.05, + "learning_rate": 4.776854723870314e-07, + "loss": 0.4482, + "step": 80141 + }, + { + "epoch": 2.05, + "learning_rate": 4.776618765267674e-07, + "loss": 0.3604, + "step": 80142 + }, + { + "epoch": 2.05, + "learning_rate": 4.776382810664339e-07, + "loss": 0.4099, + "step": 80143 + }, + { + "epoch": 2.05, + "learning_rate": 4.776146860060486e-07, + "loss": 0.3979, + "step": 80144 + }, + { + "epoch": 2.05, + "learning_rate": 4.775910913456302e-07, + "loss": 0.3364, + "step": 80145 + }, + { + "epoch": 2.05, + "learning_rate": 4.775674970851958e-07, + "loss": 0.4951, + "step": 80146 + }, + { + "epoch": 2.05, + "learning_rate": 4.775439032247639e-07, + "loss": 0.4414, + "step": 80147 + }, + { + "epoch": 2.05, + "learning_rate": 4.775203097643531e-07, + "loss": 0.5229, + "step": 80148 + }, + { + "epoch": 2.05, + "learning_rate": 4.77496716703981e-07, + "loss": 0.4194, + "step": 80149 + }, + { + "epoch": 2.05, + "learning_rate": 4.774731240436651e-07, + "loss": 0.4248, + "step": 80150 + }, + { + "epoch": 2.05, + "learning_rate": 4.774495317834241e-07, + "loss": 0.2455, + "step": 80151 + }, + { + "epoch": 2.05, + "learning_rate": 4.774259399232759e-07, + "loss": 0.4951, + "step": 80152 + }, + { + "epoch": 2.05, + "learning_rate": 4.774023484632393e-07, + "loss": 0.3459, + "step": 80153 + }, + { + "epoch": 2.05, + "learning_rate": 4.77378757403331e-07, + "loss": 0.3735, + "step": 80154 + }, + { + "epoch": 2.05, + "learning_rate": 4.773551667435697e-07, + "loss": 0.3853, + "step": 80155 + }, + { + "epoch": 2.05, + "learning_rate": 4.773315764839738e-07, + "loss": 0.311, + "step": 80156 + }, + { + "epoch": 2.05, + "learning_rate": 4.773079866245613e-07, + "loss": 0.3423, + "step": 80157 + }, + { + "epoch": 2.05, + "learning_rate": 4.772843971653501e-07, + "loss": 0.2499, + "step": 80158 + }, + { + "epoch": 2.05, + "learning_rate": 4.772608081063577e-07, + "loss": 0.4019, + "step": 80159 + }, + { + "epoch": 2.05, + "learning_rate": 4.772372194476028e-07, + "loss": 0.373, + "step": 80160 + }, + { + "epoch": 2.05, + "learning_rate": 4.772136311891032e-07, + "loss": 0.4214, + "step": 80161 + }, + { + "epoch": 2.05, + "learning_rate": 4.771900433308775e-07, + "loss": 0.3262, + "step": 80162 + }, + { + "epoch": 2.05, + "learning_rate": 4.77166455872943e-07, + "loss": 0.4226, + "step": 80163 + }, + { + "epoch": 2.05, + "learning_rate": 4.771428688153182e-07, + "loss": 0.4099, + "step": 80164 + }, + { + "epoch": 2.05, + "learning_rate": 4.771192821580213e-07, + "loss": 0.4419, + "step": 80165 + }, + { + "epoch": 2.05, + "learning_rate": 4.770956959010698e-07, + "loss": 0.2192, + "step": 80166 + }, + { + "epoch": 2.05, + "learning_rate": 4.770721100444821e-07, + "loss": 0.4839, + "step": 80167 + }, + { + "epoch": 2.05, + "learning_rate": 4.770485245882766e-07, + "loss": 0.3728, + "step": 80168 + }, + { + "epoch": 2.05, + "learning_rate": 4.770249395324706e-07, + "loss": 0.4019, + "step": 80169 + }, + { + "epoch": 2.05, + "learning_rate": 4.770013548770829e-07, + "loss": 0.3574, + "step": 80170 + }, + { + "epoch": 2.05, + "learning_rate": 4.769777706221309e-07, + "loss": 0.2683, + "step": 80171 + }, + { + "epoch": 2.05, + "learning_rate": 4.76954186767633e-07, + "loss": 0.3575, + "step": 80172 + }, + { + "epoch": 2.05, + "learning_rate": 4.769306033136072e-07, + "loss": 0.3289, + "step": 80173 + }, + { + "epoch": 2.05, + "learning_rate": 4.769070202600719e-07, + "loss": 0.4668, + "step": 80174 + }, + { + "epoch": 2.05, + "learning_rate": 4.768834376070446e-07, + "loss": 0.5957, + "step": 80175 + }, + { + "epoch": 2.05, + "learning_rate": 4.768598553545434e-07, + "loss": 0.4255, + "step": 80176 + }, + { + "epoch": 2.05, + "learning_rate": 4.768362735025866e-07, + "loss": 0.3986, + "step": 80177 + }, + { + "epoch": 2.06, + "learning_rate": 4.768126920511927e-07, + "loss": 0.4287, + "step": 80178 + }, + { + "epoch": 2.06, + "learning_rate": 4.7678911100037923e-07, + "loss": 0.355, + "step": 80179 + }, + { + "epoch": 2.06, + "learning_rate": 4.767655303501639e-07, + "loss": 0.5361, + "step": 80180 + }, + { + "epoch": 2.06, + "learning_rate": 4.7674195010056504e-07, + "loss": 0.397, + "step": 80181 + }, + { + "epoch": 2.06, + "learning_rate": 4.7671837025160136e-07, + "loss": 0.4019, + "step": 80182 + }, + { + "epoch": 2.06, + "learning_rate": 4.766947908032899e-07, + "loss": 0.394, + "step": 80183 + }, + { + "epoch": 2.06, + "learning_rate": 4.7667121175564915e-07, + "loss": 0.4468, + "step": 80184 + }, + { + "epoch": 2.06, + "learning_rate": 4.7664763310869726e-07, + "loss": 0.502, + "step": 80185 + }, + { + "epoch": 2.06, + "learning_rate": 4.7662405486245247e-07, + "loss": 0.4419, + "step": 80186 + }, + { + "epoch": 2.06, + "learning_rate": 4.766004770169323e-07, + "loss": 0.3311, + "step": 80187 + }, + { + "epoch": 2.06, + "learning_rate": 4.7657689957215543e-07, + "loss": 0.3149, + "step": 80188 + }, + { + "epoch": 2.06, + "learning_rate": 4.7655332252813917e-07, + "loss": 0.5168, + "step": 80189 + }, + { + "epoch": 2.06, + "learning_rate": 4.76529745884902e-07, + "loss": 0.2542, + "step": 80190 + }, + { + "epoch": 2.06, + "learning_rate": 4.7650616964246226e-07, + "loss": 0.3669, + "step": 80191 + }, + { + "epoch": 2.06, + "learning_rate": 4.7648259380083733e-07, + "loss": 0.4656, + "step": 80192 + }, + { + "epoch": 2.06, + "learning_rate": 4.7645901836004565e-07, + "loss": 0.4629, + "step": 80193 + }, + { + "epoch": 2.06, + "learning_rate": 4.764354433201052e-07, + "loss": 0.4597, + "step": 80194 + }, + { + "epoch": 2.06, + "learning_rate": 4.7641186868103436e-07, + "loss": 0.4482, + "step": 80195 + }, + { + "epoch": 2.06, + "learning_rate": 4.763882944428506e-07, + "loss": 0.3779, + "step": 80196 + }, + { + "epoch": 2.06, + "learning_rate": 4.763647206055722e-07, + "loss": 0.5029, + "step": 80197 + }, + { + "epoch": 2.06, + "learning_rate": 4.7634114716921756e-07, + "loss": 0.3911, + "step": 80198 + }, + { + "epoch": 2.06, + "learning_rate": 4.763175741338046e-07, + "loss": 0.4375, + "step": 80199 + }, + { + "epoch": 2.06, + "learning_rate": 4.7629400149935064e-07, + "loss": 0.4048, + "step": 80200 + }, + { + "epoch": 2.06, + "learning_rate": 4.7627042926587436e-07, + "loss": 0.3374, + "step": 80201 + }, + { + "epoch": 2.06, + "learning_rate": 4.7624685743339375e-07, + "loss": 0.3098, + "step": 80202 + }, + { + "epoch": 2.06, + "learning_rate": 4.762232860019272e-07, + "loss": 0.2904, + "step": 80203 + }, + { + "epoch": 2.06, + "learning_rate": 4.76199714971492e-07, + "loss": 0.3193, + "step": 80204 + }, + { + "epoch": 2.06, + "learning_rate": 4.761761443421066e-07, + "loss": 0.4253, + "step": 80205 + }, + { + "epoch": 2.06, + "learning_rate": 4.761525741137891e-07, + "loss": 0.3275, + "step": 80206 + }, + { + "epoch": 2.06, + "learning_rate": 4.7612900428655776e-07, + "loss": 0.4277, + "step": 80207 + }, + { + "epoch": 2.06, + "learning_rate": 4.761054348604304e-07, + "loss": 0.4414, + "step": 80208 + }, + { + "epoch": 2.06, + "learning_rate": 4.760818658354246e-07, + "loss": 0.4098, + "step": 80209 + }, + { + "epoch": 2.06, + "learning_rate": 4.7605829721155887e-07, + "loss": 0.4785, + "step": 80210 + }, + { + "epoch": 2.06, + "learning_rate": 4.760347289888512e-07, + "loss": 0.3868, + "step": 80211 + }, + { + "epoch": 2.06, + "learning_rate": 4.760111611673201e-07, + "loss": 0.2522, + "step": 80212 + }, + { + "epoch": 2.06, + "learning_rate": 4.759875937469827e-07, + "loss": 0.5254, + "step": 80213 + }, + { + "epoch": 2.06, + "learning_rate": 4.759640267278575e-07, + "loss": 0.4028, + "step": 80214 + }, + { + "epoch": 2.06, + "learning_rate": 4.759404601099626e-07, + "loss": 0.4854, + "step": 80215 + }, + { + "epoch": 2.06, + "learning_rate": 4.7591689389331636e-07, + "loss": 0.4751, + "step": 80216 + }, + { + "epoch": 2.06, + "learning_rate": 4.7589332807793604e-07, + "loss": 0.4824, + "step": 80217 + }, + { + "epoch": 2.06, + "learning_rate": 4.758697626638405e-07, + "loss": 0.3042, + "step": 80218 + }, + { + "epoch": 2.06, + "learning_rate": 4.758461976510469e-07, + "loss": 0.3916, + "step": 80219 + }, + { + "epoch": 2.06, + "learning_rate": 4.758226330395744e-07, + "loss": 0.481, + "step": 80220 + }, + { + "epoch": 2.06, + "learning_rate": 4.757990688294398e-07, + "loss": 0.606, + "step": 80221 + }, + { + "epoch": 2.06, + "learning_rate": 4.757755050206619e-07, + "loss": 0.4658, + "step": 80222 + }, + { + "epoch": 2.06, + "learning_rate": 4.757519416132585e-07, + "loss": 0.4043, + "step": 80223 + }, + { + "epoch": 2.06, + "learning_rate": 4.757283786072481e-07, + "loss": 0.3833, + "step": 80224 + }, + { + "epoch": 2.06, + "learning_rate": 4.75704816002648e-07, + "loss": 0.4062, + "step": 80225 + }, + { + "epoch": 2.06, + "learning_rate": 4.756812537994767e-07, + "loss": 0.4185, + "step": 80226 + }, + { + "epoch": 2.06, + "learning_rate": 4.756576919977521e-07, + "loss": 0.4614, + "step": 80227 + }, + { + "epoch": 2.06, + "learning_rate": 4.7563413059749257e-07, + "loss": 0.5098, + "step": 80228 + }, + { + "epoch": 2.06, + "learning_rate": 4.7561056959871604e-07, + "loss": 0.4204, + "step": 80229 + }, + { + "epoch": 2.06, + "learning_rate": 4.755870090014399e-07, + "loss": 0.5205, + "step": 80230 + }, + { + "epoch": 2.06, + "learning_rate": 4.7556344880568267e-07, + "loss": 0.416, + "step": 80231 + }, + { + "epoch": 2.06, + "learning_rate": 4.755398890114625e-07, + "loss": 0.3735, + "step": 80232 + }, + { + "epoch": 2.06, + "learning_rate": 4.7551632961879763e-07, + "loss": 0.3716, + "step": 80233 + }, + { + "epoch": 2.06, + "learning_rate": 4.7549277062770543e-07, + "loss": 0.5229, + "step": 80234 + }, + { + "epoch": 2.06, + "learning_rate": 4.754692120382042e-07, + "loss": 0.3818, + "step": 80235 + }, + { + "epoch": 2.06, + "learning_rate": 4.7544565385031223e-07, + "loss": 0.4104, + "step": 80236 + }, + { + "epoch": 2.06, + "learning_rate": 4.754220960640477e-07, + "loss": 0.2992, + "step": 80237 + }, + { + "epoch": 2.06, + "learning_rate": 4.7539853867942834e-07, + "loss": 0.3342, + "step": 80238 + }, + { + "epoch": 2.06, + "learning_rate": 4.7537498169647185e-07, + "loss": 0.4185, + "step": 80239 + }, + { + "epoch": 2.06, + "learning_rate": 4.7535142511519655e-07, + "loss": 0.5151, + "step": 80240 + }, + { + "epoch": 2.06, + "learning_rate": 4.7532786893562106e-07, + "loss": 0.4658, + "step": 80241 + }, + { + "epoch": 2.06, + "learning_rate": 4.7530431315776243e-07, + "loss": 0.4443, + "step": 80242 + }, + { + "epoch": 2.06, + "learning_rate": 4.7528075778163914e-07, + "loss": 0.4102, + "step": 80243 + }, + { + "epoch": 2.06, + "learning_rate": 4.752572028072692e-07, + "loss": 0.3901, + "step": 80244 + }, + { + "epoch": 2.06, + "learning_rate": 4.7523364823467117e-07, + "loss": 0.4888, + "step": 80245 + }, + { + "epoch": 2.06, + "learning_rate": 4.7521009406386216e-07, + "loss": 0.4629, + "step": 80246 + }, + { + "epoch": 2.06, + "learning_rate": 4.751865402948607e-07, + "loss": 0.4756, + "step": 80247 + }, + { + "epoch": 2.06, + "learning_rate": 4.751629869276852e-07, + "loss": 0.4507, + "step": 80248 + }, + { + "epoch": 2.06, + "learning_rate": 4.751394339623528e-07, + "loss": 0.3386, + "step": 80249 + }, + { + "epoch": 2.06, + "learning_rate": 4.7511588139888234e-07, + "loss": 0.4565, + "step": 80250 + }, + { + "epoch": 2.06, + "learning_rate": 4.7509232923729123e-07, + "loss": 0.5078, + "step": 80251 + }, + { + "epoch": 2.06, + "learning_rate": 4.7506877747759777e-07, + "loss": 0.313, + "step": 80252 + }, + { + "epoch": 2.06, + "learning_rate": 4.7504522611982e-07, + "loss": 0.2368, + "step": 80253 + }, + { + "epoch": 2.06, + "learning_rate": 4.750216751639764e-07, + "loss": 0.5381, + "step": 80254 + }, + { + "epoch": 2.06, + "learning_rate": 4.7499812461008403e-07, + "loss": 0.4678, + "step": 80255 + }, + { + "epoch": 2.06, + "learning_rate": 4.749745744581616e-07, + "loss": 0.3357, + "step": 80256 + }, + { + "epoch": 2.06, + "learning_rate": 4.7495102470822734e-07, + "loss": 0.28, + "step": 80257 + }, + { + "epoch": 2.06, + "learning_rate": 4.74927475360299e-07, + "loss": 0.2958, + "step": 80258 + }, + { + "epoch": 2.06, + "learning_rate": 4.7490392641439403e-07, + "loss": 0.1877, + "step": 80259 + }, + { + "epoch": 2.06, + "learning_rate": 4.7488037787053104e-07, + "loss": 0.3604, + "step": 80260 + }, + { + "epoch": 2.06, + "learning_rate": 4.74856829728728e-07, + "loss": 0.4482, + "step": 80261 + }, + { + "epoch": 2.06, + "learning_rate": 4.748332819890033e-07, + "loss": 0.4453, + "step": 80262 + }, + { + "epoch": 2.06, + "learning_rate": 4.748097346513743e-07, + "loss": 0.5068, + "step": 80263 + }, + { + "epoch": 2.06, + "learning_rate": 4.747861877158593e-07, + "loss": 0.5337, + "step": 80264 + }, + { + "epoch": 2.06, + "learning_rate": 4.7476264118247636e-07, + "loss": 0.3755, + "step": 80265 + }, + { + "epoch": 2.06, + "learning_rate": 4.747390950512439e-07, + "loss": 0.4241, + "step": 80266 + }, + { + "epoch": 2.06, + "learning_rate": 4.7471554932217915e-07, + "loss": 0.4404, + "step": 80267 + }, + { + "epoch": 2.06, + "learning_rate": 4.7469200399530097e-07, + "loss": 0.4189, + "step": 80268 + }, + { + "epoch": 2.06, + "learning_rate": 4.746684590706266e-07, + "loss": 0.3662, + "step": 80269 + }, + { + "epoch": 2.06, + "learning_rate": 4.7464491454817437e-07, + "loss": 0.4966, + "step": 80270 + }, + { + "epoch": 2.06, + "learning_rate": 4.746213704279628e-07, + "loss": 0.3196, + "step": 80271 + }, + { + "epoch": 2.06, + "learning_rate": 4.7459782671000904e-07, + "loss": 0.3066, + "step": 80272 + }, + { + "epoch": 2.06, + "learning_rate": 4.745742833943316e-07, + "loss": 0.4849, + "step": 80273 + }, + { + "epoch": 2.06, + "learning_rate": 4.745507404809489e-07, + "loss": 0.3438, + "step": 80274 + }, + { + "epoch": 2.06, + "learning_rate": 4.745271979698782e-07, + "loss": 0.449, + "step": 80275 + }, + { + "epoch": 2.06, + "learning_rate": 4.7450365586113773e-07, + "loss": 0.4663, + "step": 80276 + }, + { + "epoch": 2.06, + "learning_rate": 4.7448011415474576e-07, + "loss": 0.3755, + "step": 80277 + }, + { + "epoch": 2.06, + "learning_rate": 4.744565728507205e-07, + "loss": 0.3191, + "step": 80278 + }, + { + "epoch": 2.06, + "learning_rate": 4.744330319490797e-07, + "loss": 0.3424, + "step": 80279 + }, + { + "epoch": 2.06, + "learning_rate": 4.74409491449841e-07, + "loss": 0.3442, + "step": 80280 + }, + { + "epoch": 2.06, + "learning_rate": 4.743859513530228e-07, + "loss": 0.4556, + "step": 80281 + }, + { + "epoch": 2.06, + "learning_rate": 4.743624116586431e-07, + "loss": 0.3761, + "step": 80282 + }, + { + "epoch": 2.06, + "learning_rate": 4.743388723667203e-07, + "loss": 0.4421, + "step": 80283 + }, + { + "epoch": 2.06, + "learning_rate": 4.743153334772717e-07, + "loss": 0.4336, + "step": 80284 + }, + { + "epoch": 2.06, + "learning_rate": 4.7429179499031555e-07, + "loss": 0.4021, + "step": 80285 + }, + { + "epoch": 2.06, + "learning_rate": 4.7426825690587013e-07, + "loss": 0.4956, + "step": 80286 + }, + { + "epoch": 2.06, + "learning_rate": 4.742447192239537e-07, + "loss": 0.3994, + "step": 80287 + }, + { + "epoch": 2.06, + "learning_rate": 4.7422118194458395e-07, + "loss": 0.4268, + "step": 80288 + }, + { + "epoch": 2.06, + "learning_rate": 4.741976450677784e-07, + "loss": 0.436, + "step": 80289 + }, + { + "epoch": 2.06, + "learning_rate": 4.741741085935556e-07, + "loss": 0.3447, + "step": 80290 + }, + { + "epoch": 2.06, + "learning_rate": 4.741505725219338e-07, + "loss": 0.3643, + "step": 80291 + }, + { + "epoch": 2.06, + "learning_rate": 4.7412703685293043e-07, + "loss": 0.4673, + "step": 80292 + }, + { + "epoch": 2.06, + "learning_rate": 4.7410350158656374e-07, + "loss": 0.3918, + "step": 80293 + }, + { + "epoch": 2.06, + "learning_rate": 4.740799667228519e-07, + "loss": 0.4133, + "step": 80294 + }, + { + "epoch": 2.06, + "learning_rate": 4.7405643226181314e-07, + "loss": 0.4446, + "step": 80295 + }, + { + "epoch": 2.06, + "learning_rate": 4.7403289820346493e-07, + "loss": 0.4478, + "step": 80296 + }, + { + "epoch": 2.06, + "learning_rate": 4.7400936454782546e-07, + "loss": 0.4158, + "step": 80297 + }, + { + "epoch": 2.06, + "learning_rate": 4.739858312949132e-07, + "loss": 0.423, + "step": 80298 + }, + { + "epoch": 2.06, + "learning_rate": 4.7396229844474546e-07, + "loss": 0.5928, + "step": 80299 + }, + { + "epoch": 2.06, + "learning_rate": 4.7393876599734094e-07, + "loss": 0.4038, + "step": 80300 + }, + { + "epoch": 2.06, + "learning_rate": 4.7391523395271695e-07, + "loss": 0.2812, + "step": 80301 + }, + { + "epoch": 2.06, + "learning_rate": 4.7389170231089195e-07, + "loss": 0.3796, + "step": 80302 + }, + { + "epoch": 2.06, + "learning_rate": 4.738681710718837e-07, + "loss": 0.4756, + "step": 80303 + }, + { + "epoch": 2.06, + "learning_rate": 4.738446402357109e-07, + "loss": 0.3287, + "step": 80304 + }, + { + "epoch": 2.06, + "learning_rate": 4.7382110980239075e-07, + "loss": 0.436, + "step": 80305 + }, + { + "epoch": 2.06, + "learning_rate": 4.7379757977194144e-07, + "loss": 0.4395, + "step": 80306 + }, + { + "epoch": 2.06, + "learning_rate": 4.7377405014438133e-07, + "loss": 0.4092, + "step": 80307 + }, + { + "epoch": 2.06, + "learning_rate": 4.737505209197288e-07, + "loss": 0.3999, + "step": 80308 + }, + { + "epoch": 2.06, + "learning_rate": 4.737269920980006e-07, + "loss": 0.4214, + "step": 80309 + }, + { + "epoch": 2.06, + "learning_rate": 4.737034636792154e-07, + "loss": 0.4041, + "step": 80310 + }, + { + "epoch": 2.06, + "learning_rate": 4.7367993566339135e-07, + "loss": 0.3923, + "step": 80311 + }, + { + "epoch": 2.06, + "learning_rate": 4.7365640805054676e-07, + "loss": 0.4214, + "step": 80312 + }, + { + "epoch": 2.06, + "learning_rate": 4.7363288084069873e-07, + "loss": 0.3541, + "step": 80313 + }, + { + "epoch": 2.06, + "learning_rate": 4.736093540338659e-07, + "loss": 0.5264, + "step": 80314 + }, + { + "epoch": 2.06, + "learning_rate": 4.7358582763006625e-07, + "loss": 0.267, + "step": 80315 + }, + { + "epoch": 2.06, + "learning_rate": 4.73562301629318e-07, + "loss": 0.4771, + "step": 80316 + }, + { + "epoch": 2.06, + "learning_rate": 4.735387760316386e-07, + "loss": 0.3402, + "step": 80317 + }, + { + "epoch": 2.06, + "learning_rate": 4.735152508370467e-07, + "loss": 0.4893, + "step": 80318 + }, + { + "epoch": 2.06, + "learning_rate": 4.734917260455595e-07, + "loss": 0.4287, + "step": 80319 + }, + { + "epoch": 2.06, + "learning_rate": 4.734682016571956e-07, + "loss": 0.5054, + "step": 80320 + }, + { + "epoch": 2.06, + "learning_rate": 4.7344467767197316e-07, + "loss": 0.3735, + "step": 80321 + }, + { + "epoch": 2.06, + "learning_rate": 4.7342115408990955e-07, + "loss": 0.3667, + "step": 80322 + }, + { + "epoch": 2.06, + "learning_rate": 4.7339763091102324e-07, + "loss": 0.3496, + "step": 80323 + }, + { + "epoch": 2.06, + "learning_rate": 4.733741081353321e-07, + "loss": 0.4482, + "step": 80324 + }, + { + "epoch": 2.06, + "learning_rate": 4.733505857628545e-07, + "loss": 0.4341, + "step": 80325 + }, + { + "epoch": 2.06, + "learning_rate": 4.733270637936079e-07, + "loss": 0.4021, + "step": 80326 + }, + { + "epoch": 2.06, + "learning_rate": 4.7330354222761037e-07, + "loss": 0.417, + "step": 80327 + }, + { + "epoch": 2.06, + "learning_rate": 4.7328002106488064e-07, + "loss": 0.48, + "step": 80328 + }, + { + "epoch": 2.06, + "learning_rate": 4.7325650030543606e-07, + "loss": 0.4233, + "step": 80329 + }, + { + "epoch": 2.06, + "learning_rate": 4.7323297994929446e-07, + "loss": 0.3828, + "step": 80330 + }, + { + "epoch": 2.06, + "learning_rate": 4.732094599964742e-07, + "loss": 0.2794, + "step": 80331 + }, + { + "epoch": 2.06, + "learning_rate": 4.731859404469931e-07, + "loss": 0.3293, + "step": 80332 + }, + { + "epoch": 2.06, + "learning_rate": 4.731624213008698e-07, + "loss": 0.3716, + "step": 80333 + }, + { + "epoch": 2.06, + "learning_rate": 4.731389025581213e-07, + "loss": 0.3745, + "step": 80334 + }, + { + "epoch": 2.06, + "learning_rate": 4.731153842187662e-07, + "loss": 0.3914, + "step": 80335 + }, + { + "epoch": 2.06, + "learning_rate": 4.730918662828224e-07, + "loss": 0.4551, + "step": 80336 + }, + { + "epoch": 2.06, + "learning_rate": 4.730683487503083e-07, + "loss": 0.3625, + "step": 80337 + }, + { + "epoch": 2.06, + "learning_rate": 4.7304483162124166e-07, + "loss": 0.3638, + "step": 80338 + }, + { + "epoch": 2.06, + "learning_rate": 4.730213148956398e-07, + "loss": 0.3635, + "step": 80339 + }, + { + "epoch": 2.06, + "learning_rate": 4.729977985735214e-07, + "loss": 0.4355, + "step": 80340 + }, + { + "epoch": 2.06, + "learning_rate": 4.7297428265490433e-07, + "loss": 0.4253, + "step": 80341 + }, + { + "epoch": 2.06, + "learning_rate": 4.7295076713980696e-07, + "loss": 0.4165, + "step": 80342 + }, + { + "epoch": 2.06, + "learning_rate": 4.7292725202824656e-07, + "loss": 0.3462, + "step": 80343 + }, + { + "epoch": 2.06, + "learning_rate": 4.7290373732024157e-07, + "loss": 0.418, + "step": 80344 + }, + { + "epoch": 2.06, + "learning_rate": 4.7288022301581045e-07, + "loss": 0.4365, + "step": 80345 + }, + { + "epoch": 2.06, + "learning_rate": 4.728567091149701e-07, + "loss": 0.4556, + "step": 80346 + }, + { + "epoch": 2.06, + "learning_rate": 4.7283319561773925e-07, + "loss": 0.319, + "step": 80347 + }, + { + "epoch": 2.06, + "learning_rate": 4.7280968252413623e-07, + "loss": 0.4517, + "step": 80348 + }, + { + "epoch": 2.06, + "learning_rate": 4.7278616983417807e-07, + "loss": 0.5044, + "step": 80349 + }, + { + "epoch": 2.06, + "learning_rate": 4.727626575478838e-07, + "loss": 0.3696, + "step": 80350 + }, + { + "epoch": 2.06, + "learning_rate": 4.727391456652704e-07, + "loss": 0.4702, + "step": 80351 + }, + { + "epoch": 2.06, + "learning_rate": 4.727156341863565e-07, + "loss": 0.3506, + "step": 80352 + }, + { + "epoch": 2.06, + "learning_rate": 4.7269212311116e-07, + "loss": 0.4673, + "step": 80353 + }, + { + "epoch": 2.06, + "learning_rate": 4.7266861243969925e-07, + "loss": 0.4294, + "step": 80354 + }, + { + "epoch": 2.06, + "learning_rate": 4.726451021719915e-07, + "loss": 0.3323, + "step": 80355 + }, + { + "epoch": 2.06, + "learning_rate": 4.726215923080552e-07, + "loss": 0.3459, + "step": 80356 + }, + { + "epoch": 2.06, + "learning_rate": 4.7259808284790826e-07, + "loss": 0.254, + "step": 80357 + }, + { + "epoch": 2.06, + "learning_rate": 4.7257457379156904e-07, + "loss": 0.4019, + "step": 80358 + }, + { + "epoch": 2.06, + "learning_rate": 4.725510651390553e-07, + "loss": 0.3945, + "step": 80359 + }, + { + "epoch": 2.06, + "learning_rate": 4.725275568903845e-07, + "loss": 0.4441, + "step": 80360 + }, + { + "epoch": 2.06, + "learning_rate": 4.725040490455752e-07, + "loss": 0.5366, + "step": 80361 + }, + { + "epoch": 2.06, + "learning_rate": 4.724805416046456e-07, + "loss": 0.277, + "step": 80362 + }, + { + "epoch": 2.06, + "learning_rate": 4.72457034567613e-07, + "loss": 0.4902, + "step": 80363 + }, + { + "epoch": 2.06, + "learning_rate": 4.7243352793449586e-07, + "loss": 0.3479, + "step": 80364 + }, + { + "epoch": 2.06, + "learning_rate": 4.7241002170531206e-07, + "loss": 0.417, + "step": 80365 + }, + { + "epoch": 2.06, + "learning_rate": 4.7238651588008006e-07, + "loss": 0.2025, + "step": 80366 + }, + { + "epoch": 2.06, + "learning_rate": 4.72363010458817e-07, + "loss": 0.4858, + "step": 80367 + }, + { + "epoch": 2.06, + "learning_rate": 4.7233950544154177e-07, + "loss": 0.3989, + "step": 80368 + }, + { + "epoch": 2.06, + "learning_rate": 4.723160008282715e-07, + "loss": 0.3579, + "step": 80369 + }, + { + "epoch": 2.06, + "learning_rate": 4.722924966190246e-07, + "loss": 0.5205, + "step": 80370 + }, + { + "epoch": 2.06, + "learning_rate": 4.722689928138195e-07, + "loss": 0.4485, + "step": 80371 + }, + { + "epoch": 2.06, + "learning_rate": 4.722454894126733e-07, + "loss": 0.4429, + "step": 80372 + }, + { + "epoch": 2.06, + "learning_rate": 4.7222198641560453e-07, + "loss": 0.3838, + "step": 80373 + }, + { + "epoch": 2.06, + "learning_rate": 4.7219848382263105e-07, + "loss": 0.35, + "step": 80374 + }, + { + "epoch": 2.06, + "learning_rate": 4.7217498163377143e-07, + "loss": 0.4214, + "step": 80375 + }, + { + "epoch": 2.06, + "learning_rate": 4.721514798490427e-07, + "loss": 0.4756, + "step": 80376 + }, + { + "epoch": 2.06, + "learning_rate": 4.7212797846846333e-07, + "loss": 0.582, + "step": 80377 + }, + { + "epoch": 2.06, + "learning_rate": 4.7210447749205164e-07, + "loss": 0.4219, + "step": 80378 + }, + { + "epoch": 2.06, + "learning_rate": 4.720809769198253e-07, + "loss": 0.4771, + "step": 80379 + }, + { + "epoch": 2.06, + "learning_rate": 4.7205747675180184e-07, + "loss": 0.3098, + "step": 80380 + }, + { + "epoch": 2.06, + "learning_rate": 4.720339769879997e-07, + "loss": 0.5288, + "step": 80381 + }, + { + "epoch": 2.06, + "learning_rate": 4.72010477628437e-07, + "loss": 0.4619, + "step": 80382 + }, + { + "epoch": 2.06, + "learning_rate": 4.7198697867313187e-07, + "loss": 0.4204, + "step": 80383 + }, + { + "epoch": 2.06, + "learning_rate": 4.7196348012210173e-07, + "loss": 0.457, + "step": 80384 + }, + { + "epoch": 2.06, + "learning_rate": 4.7193998197536475e-07, + "loss": 0.3643, + "step": 80385 + }, + { + "epoch": 2.06, + "learning_rate": 4.7191648423293915e-07, + "loss": 0.3167, + "step": 80386 + }, + { + "epoch": 2.06, + "learning_rate": 4.7189298689484314e-07, + "loss": 0.3396, + "step": 80387 + }, + { + "epoch": 2.06, + "learning_rate": 4.7186948996109446e-07, + "loss": 0.4714, + "step": 80388 + }, + { + "epoch": 2.06, + "learning_rate": 4.718459934317106e-07, + "loss": 0.418, + "step": 80389 + }, + { + "epoch": 2.06, + "learning_rate": 4.7182249730671e-07, + "loss": 0.4756, + "step": 80390 + }, + { + "epoch": 2.06, + "learning_rate": 4.7179900158611054e-07, + "loss": 0.54, + "step": 80391 + }, + { + "epoch": 2.06, + "learning_rate": 4.717755062699308e-07, + "loss": 0.3877, + "step": 80392 + }, + { + "epoch": 2.06, + "learning_rate": 4.7175201135818775e-07, + "loss": 0.4126, + "step": 80393 + }, + { + "epoch": 2.06, + "learning_rate": 4.717285168509e-07, + "loss": 0.502, + "step": 80394 + }, + { + "epoch": 2.06, + "learning_rate": 4.7170502274808544e-07, + "loss": 0.3877, + "step": 80395 + }, + { + "epoch": 2.06, + "learning_rate": 4.7168152904976243e-07, + "loss": 0.4683, + "step": 80396 + }, + { + "epoch": 2.06, + "learning_rate": 4.716580357559485e-07, + "loss": 0.4331, + "step": 80397 + }, + { + "epoch": 2.06, + "learning_rate": 4.7163454286666135e-07, + "loss": 0.3176, + "step": 80398 + }, + { + "epoch": 2.06, + "learning_rate": 4.716110503819194e-07, + "loss": 0.5029, + "step": 80399 + }, + { + "epoch": 2.06, + "learning_rate": 4.715875583017409e-07, + "loss": 0.2347, + "step": 80400 + }, + { + "epoch": 2.06, + "learning_rate": 4.715640666261432e-07, + "loss": 0.3994, + "step": 80401 + }, + { + "epoch": 2.06, + "learning_rate": 4.715405753551446e-07, + "loss": 0.3955, + "step": 80402 + }, + { + "epoch": 2.06, + "learning_rate": 4.7151708448876304e-07, + "loss": 0.4666, + "step": 80403 + }, + { + "epoch": 2.06, + "learning_rate": 4.714935940270168e-07, + "loss": 0.4463, + "step": 80404 + }, + { + "epoch": 2.06, + "learning_rate": 4.714701039699235e-07, + "loss": 0.4272, + "step": 80405 + }, + { + "epoch": 2.06, + "learning_rate": 4.71446614317501e-07, + "loss": 0.3694, + "step": 80406 + }, + { + "epoch": 2.06, + "learning_rate": 4.71423125069768e-07, + "loss": 0.4248, + "step": 80407 + }, + { + "epoch": 2.06, + "learning_rate": 4.713996362267416e-07, + "loss": 0.4648, + "step": 80408 + }, + { + "epoch": 2.06, + "learning_rate": 4.713761477884407e-07, + "loss": 0.2157, + "step": 80409 + }, + { + "epoch": 2.06, + "learning_rate": 4.7135265975488223e-07, + "loss": 0.4517, + "step": 80410 + }, + { + "epoch": 2.06, + "learning_rate": 4.713291721260848e-07, + "loss": 0.4014, + "step": 80411 + }, + { + "epoch": 2.06, + "learning_rate": 4.7130568490206634e-07, + "loss": 0.4893, + "step": 80412 + }, + { + "epoch": 2.06, + "learning_rate": 4.7128219808284506e-07, + "loss": 0.3275, + "step": 80413 + }, + { + "epoch": 2.06, + "learning_rate": 4.7125871166843847e-07, + "loss": 0.4355, + "step": 80414 + }, + { + "epoch": 2.06, + "learning_rate": 4.7123522565886476e-07, + "loss": 0.3041, + "step": 80415 + }, + { + "epoch": 2.06, + "learning_rate": 4.7121174005414177e-07, + "loss": 0.4004, + "step": 80416 + }, + { + "epoch": 2.06, + "learning_rate": 4.7118825485428846e-07, + "loss": 0.4019, + "step": 80417 + }, + { + "epoch": 2.06, + "learning_rate": 4.711647700593213e-07, + "loss": 0.3081, + "step": 80418 + }, + { + "epoch": 2.06, + "learning_rate": 4.711412856692589e-07, + "loss": 0.3931, + "step": 80419 + }, + { + "epoch": 2.06, + "learning_rate": 4.711178016841194e-07, + "loss": 0.6548, + "step": 80420 + }, + { + "epoch": 2.06, + "learning_rate": 4.7109431810392095e-07, + "loss": 0.542, + "step": 80421 + }, + { + "epoch": 2.06, + "learning_rate": 4.7107083492868094e-07, + "loss": 0.4958, + "step": 80422 + }, + { + "epoch": 2.06, + "learning_rate": 4.710473521584176e-07, + "loss": 0.4497, + "step": 80423 + }, + { + "epoch": 2.06, + "learning_rate": 4.71023869793149e-07, + "loss": 0.4028, + "step": 80424 + }, + { + "epoch": 2.06, + "learning_rate": 4.7100038783289353e-07, + "loss": 0.417, + "step": 80425 + }, + { + "epoch": 2.06, + "learning_rate": 4.709769062776683e-07, + "loss": 0.5435, + "step": 80426 + }, + { + "epoch": 2.06, + "learning_rate": 4.709534251274921e-07, + "loss": 0.3552, + "step": 80427 + }, + { + "epoch": 2.06, + "learning_rate": 4.7092994438238233e-07, + "loss": 0.4629, + "step": 80428 + }, + { + "epoch": 2.06, + "learning_rate": 4.70906464042357e-07, + "loss": 0.4463, + "step": 80429 + }, + { + "epoch": 2.06, + "learning_rate": 4.7088298410743466e-07, + "loss": 0.3906, + "step": 80430 + }, + { + "epoch": 2.06, + "learning_rate": 4.7085950457763255e-07, + "loss": 0.4814, + "step": 80431 + }, + { + "epoch": 2.06, + "learning_rate": 4.7083602545296895e-07, + "loss": 0.355, + "step": 80432 + }, + { + "epoch": 2.06, + "learning_rate": 4.708125467334619e-07, + "loss": 0.4722, + "step": 80433 + }, + { + "epoch": 2.06, + "learning_rate": 4.707890684191297e-07, + "loss": 0.4771, + "step": 80434 + }, + { + "epoch": 2.06, + "learning_rate": 4.7076559050998966e-07, + "loss": 0.4326, + "step": 80435 + }, + { + "epoch": 2.06, + "learning_rate": 4.7074211300606e-07, + "loss": 0.541, + "step": 80436 + }, + { + "epoch": 2.06, + "learning_rate": 4.7071863590735916e-07, + "loss": 0.5435, + "step": 80437 + }, + { + "epoch": 2.06, + "learning_rate": 4.706951592139048e-07, + "loss": 0.51, + "step": 80438 + }, + { + "epoch": 2.06, + "learning_rate": 4.7067168292571435e-07, + "loss": 0.2495, + "step": 80439 + }, + { + "epoch": 2.06, + "learning_rate": 4.706482070428063e-07, + "loss": 0.4434, + "step": 80440 + }, + { + "epoch": 2.06, + "learning_rate": 4.7062473156519853e-07, + "loss": 0.5259, + "step": 80441 + }, + { + "epoch": 2.06, + "learning_rate": 4.706012564929095e-07, + "loss": 0.4253, + "step": 80442 + }, + { + "epoch": 2.06, + "learning_rate": 4.705777818259563e-07, + "loss": 0.3523, + "step": 80443 + }, + { + "epoch": 2.06, + "learning_rate": 4.7055430756435745e-07, + "loss": 0.355, + "step": 80444 + }, + { + "epoch": 2.06, + "learning_rate": 4.7053083370813074e-07, + "loss": 0.4526, + "step": 80445 + }, + { + "epoch": 2.06, + "learning_rate": 4.705073602572946e-07, + "loss": 0.457, + "step": 80446 + }, + { + "epoch": 2.06, + "learning_rate": 4.704838872118666e-07, + "loss": 0.3628, + "step": 80447 + }, + { + "epoch": 2.06, + "learning_rate": 4.7046041457186446e-07, + "loss": 0.4077, + "step": 80448 + }, + { + "epoch": 2.06, + "learning_rate": 4.7043694233730635e-07, + "loss": 0.4209, + "step": 80449 + }, + { + "epoch": 2.06, + "learning_rate": 4.704134705082103e-07, + "loss": 0.5015, + "step": 80450 + }, + { + "epoch": 2.06, + "learning_rate": 4.703899990845949e-07, + "loss": 0.5322, + "step": 80451 + }, + { + "epoch": 2.06, + "learning_rate": 4.703665280664769e-07, + "loss": 0.356, + "step": 80452 + }, + { + "epoch": 2.06, + "learning_rate": 4.70343057453875e-07, + "loss": 0.4036, + "step": 80453 + }, + { + "epoch": 2.06, + "learning_rate": 4.7031958724680743e-07, + "loss": 0.343, + "step": 80454 + }, + { + "epoch": 2.06, + "learning_rate": 4.7029611744529143e-07, + "loss": 0.3672, + "step": 80455 + }, + { + "epoch": 2.06, + "learning_rate": 4.702726480493453e-07, + "loss": 0.293, + "step": 80456 + }, + { + "epoch": 2.06, + "learning_rate": 4.7024917905898743e-07, + "loss": 0.4515, + "step": 80457 + }, + { + "epoch": 2.06, + "learning_rate": 4.702257104742351e-07, + "loss": 0.2966, + "step": 80458 + }, + { + "epoch": 2.06, + "learning_rate": 4.7020224229510686e-07, + "loss": 0.3381, + "step": 80459 + }, + { + "epoch": 2.06, + "learning_rate": 4.7017877452162014e-07, + "loss": 0.4844, + "step": 80460 + }, + { + "epoch": 2.06, + "learning_rate": 4.70155307153793e-07, + "loss": 0.3989, + "step": 80461 + }, + { + "epoch": 2.06, + "learning_rate": 4.7013184019164374e-07, + "loss": 0.2706, + "step": 80462 + }, + { + "epoch": 2.06, + "learning_rate": 4.7010837363519053e-07, + "loss": 0.3347, + "step": 80463 + }, + { + "epoch": 2.06, + "learning_rate": 4.700849074844505e-07, + "loss": 0.437, + "step": 80464 + }, + { + "epoch": 2.06, + "learning_rate": 4.700614417394422e-07, + "loss": 0.4595, + "step": 80465 + }, + { + "epoch": 2.06, + "learning_rate": 4.7003797640018337e-07, + "loss": 0.3106, + "step": 80466 + }, + { + "epoch": 2.06, + "learning_rate": 4.7001451146669257e-07, + "loss": 0.3523, + "step": 80467 + }, + { + "epoch": 2.06, + "learning_rate": 4.699910469389872e-07, + "loss": 0.332, + "step": 80468 + }, + { + "epoch": 2.06, + "learning_rate": 4.69967582817085e-07, + "loss": 0.5073, + "step": 80469 + }, + { + "epoch": 2.06, + "learning_rate": 4.699441191010042e-07, + "loss": 0.4565, + "step": 80470 + }, + { + "epoch": 2.06, + "learning_rate": 4.6992065579076323e-07, + "loss": 0.5483, + "step": 80471 + }, + { + "epoch": 2.06, + "learning_rate": 4.698971928863793e-07, + "loss": 0.4375, + "step": 80472 + }, + { + "epoch": 2.06, + "learning_rate": 4.698737303878707e-07, + "loss": 0.2845, + "step": 80473 + }, + { + "epoch": 2.06, + "learning_rate": 4.698502682952553e-07, + "loss": 0.3923, + "step": 80474 + }, + { + "epoch": 2.06, + "learning_rate": 4.698268066085517e-07, + "loss": 0.2846, + "step": 80475 + }, + { + "epoch": 2.06, + "learning_rate": 4.6980334532777686e-07, + "loss": 0.3479, + "step": 80476 + }, + { + "epoch": 2.06, + "learning_rate": 4.6977988445294967e-07, + "loss": 0.3416, + "step": 80477 + }, + { + "epoch": 2.06, + "learning_rate": 4.697564239840872e-07, + "loss": 0.499, + "step": 80478 + }, + { + "epoch": 2.06, + "learning_rate": 4.6973296392120785e-07, + "loss": 0.6392, + "step": 80479 + }, + { + "epoch": 2.06, + "learning_rate": 4.6970950426432996e-07, + "loss": 0.4084, + "step": 80480 + }, + { + "epoch": 2.06, + "learning_rate": 4.6968604501347086e-07, + "loss": 0.4678, + "step": 80481 + }, + { + "epoch": 2.06, + "learning_rate": 4.696625861686486e-07, + "loss": 0.4316, + "step": 80482 + }, + { + "epoch": 2.06, + "learning_rate": 4.6963912772988143e-07, + "loss": 0.3696, + "step": 80483 + }, + { + "epoch": 2.06, + "learning_rate": 4.696156696971876e-07, + "loss": 0.3916, + "step": 80484 + }, + { + "epoch": 2.06, + "learning_rate": 4.695922120705842e-07, + "loss": 0.4434, + "step": 80485 + }, + { + "epoch": 2.06, + "learning_rate": 4.6956875485008965e-07, + "loss": 0.4263, + "step": 80486 + }, + { + "epoch": 2.06, + "learning_rate": 4.695452980357223e-07, + "loss": 0.5264, + "step": 80487 + }, + { + "epoch": 2.06, + "learning_rate": 4.6952184162749973e-07, + "loss": 0.4678, + "step": 80488 + }, + { + "epoch": 2.06, + "learning_rate": 4.6949838562543963e-07, + "loss": 0.3901, + "step": 80489 + }, + { + "epoch": 2.06, + "learning_rate": 4.6947493002956004e-07, + "loss": 0.4189, + "step": 80490 + }, + { + "epoch": 2.06, + "learning_rate": 4.6945147483987924e-07, + "loss": 0.418, + "step": 80491 + }, + { + "epoch": 2.06, + "learning_rate": 4.6942802005641537e-07, + "loss": 0.2683, + "step": 80492 + }, + { + "epoch": 2.06, + "learning_rate": 4.6940456567918574e-07, + "loss": 0.3092, + "step": 80493 + }, + { + "epoch": 2.06, + "learning_rate": 4.693811117082086e-07, + "loss": 0.392, + "step": 80494 + }, + { + "epoch": 2.06, + "learning_rate": 4.6935765814350193e-07, + "loss": 0.4563, + "step": 80495 + }, + { + "epoch": 2.06, + "learning_rate": 4.69334204985084e-07, + "loss": 0.4062, + "step": 80496 + }, + { + "epoch": 2.06, + "learning_rate": 4.693107522329726e-07, + "loss": 0.2913, + "step": 80497 + }, + { + "epoch": 2.06, + "learning_rate": 4.692872998871852e-07, + "loss": 0.3079, + "step": 80498 + }, + { + "epoch": 2.06, + "learning_rate": 4.6926384794773996e-07, + "loss": 0.4326, + "step": 80499 + }, + { + "epoch": 2.06, + "learning_rate": 4.6924039641465507e-07, + "loss": 0.373, + "step": 80500 + }, + { + "epoch": 2.06, + "learning_rate": 4.6921694528794874e-07, + "loss": 0.4209, + "step": 80501 + }, + { + "epoch": 2.06, + "learning_rate": 4.6919349456763834e-07, + "loss": 0.376, + "step": 80502 + }, + { + "epoch": 2.06, + "learning_rate": 4.6917004425374197e-07, + "loss": 0.4011, + "step": 80503 + }, + { + "epoch": 2.06, + "learning_rate": 4.691465943462777e-07, + "loss": 0.4556, + "step": 80504 + }, + { + "epoch": 2.06, + "learning_rate": 4.6912314484526384e-07, + "loss": 0.2974, + "step": 80505 + }, + { + "epoch": 2.06, + "learning_rate": 4.690996957507176e-07, + "loss": 0.2841, + "step": 80506 + }, + { + "epoch": 2.06, + "learning_rate": 4.690762470626578e-07, + "loss": 0.3005, + "step": 80507 + }, + { + "epoch": 2.06, + "learning_rate": 4.6905279878110135e-07, + "loss": 0.2868, + "step": 80508 + }, + { + "epoch": 2.06, + "learning_rate": 4.690293509060672e-07, + "loss": 0.5352, + "step": 80509 + }, + { + "epoch": 2.06, + "learning_rate": 4.690059034375725e-07, + "loss": 0.3318, + "step": 80510 + }, + { + "epoch": 2.06, + "learning_rate": 4.6898245637563563e-07, + "loss": 0.382, + "step": 80511 + }, + { + "epoch": 2.06, + "learning_rate": 4.6895900972027446e-07, + "loss": 0.4258, + "step": 80512 + }, + { + "epoch": 2.06, + "learning_rate": 4.689355634715072e-07, + "loss": 0.3972, + "step": 80513 + }, + { + "epoch": 2.06, + "learning_rate": 4.6891211762935134e-07, + "loss": 0.4302, + "step": 80514 + }, + { + "epoch": 2.06, + "learning_rate": 4.6888867219382497e-07, + "loss": 0.3828, + "step": 80515 + }, + { + "epoch": 2.06, + "learning_rate": 4.6886522716494615e-07, + "loss": 0.408, + "step": 80516 + }, + { + "epoch": 2.06, + "learning_rate": 4.688417825427331e-07, + "loss": 0.4653, + "step": 80517 + }, + { + "epoch": 2.06, + "learning_rate": 4.6881833832720363e-07, + "loss": 0.2723, + "step": 80518 + }, + { + "epoch": 2.06, + "learning_rate": 4.687948945183751e-07, + "loss": 0.5146, + "step": 80519 + }, + { + "epoch": 2.06, + "learning_rate": 4.687714511162658e-07, + "loss": 0.376, + "step": 80520 + }, + { + "epoch": 2.06, + "learning_rate": 4.687480081208939e-07, + "loss": 0.4771, + "step": 80521 + }, + { + "epoch": 2.06, + "learning_rate": 4.687245655322775e-07, + "loss": 0.4072, + "step": 80522 + }, + { + "epoch": 2.06, + "learning_rate": 4.687011233504339e-07, + "loss": 0.4153, + "step": 80523 + }, + { + "epoch": 2.06, + "learning_rate": 4.686776815753815e-07, + "loss": 0.3346, + "step": 80524 + }, + { + "epoch": 2.06, + "learning_rate": 4.686542402071384e-07, + "loss": 0.3843, + "step": 80525 + }, + { + "epoch": 2.06, + "learning_rate": 4.686307992457221e-07, + "loss": 0.4258, + "step": 80526 + }, + { + "epoch": 2.06, + "learning_rate": 4.686073586911511e-07, + "loss": 0.4526, + "step": 80527 + }, + { + "epoch": 2.06, + "learning_rate": 4.685839185434426e-07, + "loss": 0.4873, + "step": 80528 + }, + { + "epoch": 2.06, + "learning_rate": 4.6856047880261496e-07, + "loss": 0.4653, + "step": 80529 + }, + { + "epoch": 2.06, + "learning_rate": 4.685370394686865e-07, + "loss": 0.4058, + "step": 80530 + }, + { + "epoch": 2.06, + "learning_rate": 4.6851360054167443e-07, + "loss": 0.429, + "step": 80531 + }, + { + "epoch": 2.06, + "learning_rate": 4.684901620215971e-07, + "loss": 0.3804, + "step": 80532 + }, + { + "epoch": 2.06, + "learning_rate": 4.684667239084723e-07, + "loss": 0.4189, + "step": 80533 + }, + { + "epoch": 2.06, + "learning_rate": 4.684432862023185e-07, + "loss": 0.4402, + "step": 80534 + }, + { + "epoch": 2.06, + "learning_rate": 4.684198489031529e-07, + "loss": 0.426, + "step": 80535 + }, + { + "epoch": 2.06, + "learning_rate": 4.683964120109938e-07, + "loss": 0.3142, + "step": 80536 + }, + { + "epoch": 2.06, + "learning_rate": 4.6837297552585954e-07, + "loss": 0.4985, + "step": 80537 + }, + { + "epoch": 2.06, + "learning_rate": 4.6834953944776714e-07, + "loss": 0.4487, + "step": 80538 + }, + { + "epoch": 2.06, + "learning_rate": 4.683261037767354e-07, + "loss": 0.3567, + "step": 80539 + }, + { + "epoch": 2.06, + "learning_rate": 4.6830266851278164e-07, + "loss": 0.5342, + "step": 80540 + }, + { + "epoch": 2.06, + "learning_rate": 4.6827923365592413e-07, + "loss": 0.3447, + "step": 80541 + }, + { + "epoch": 2.06, + "learning_rate": 4.682557992061811e-07, + "loss": 0.3879, + "step": 80542 + }, + { + "epoch": 2.06, + "learning_rate": 4.682323651635698e-07, + "loss": 0.3772, + "step": 80543 + }, + { + "epoch": 2.06, + "learning_rate": 4.682089315281084e-07, + "loss": 0.2927, + "step": 80544 + }, + { + "epoch": 2.06, + "learning_rate": 4.6818549829981503e-07, + "loss": 0.3882, + "step": 80545 + }, + { + "epoch": 2.06, + "learning_rate": 4.68162065478708e-07, + "loss": 0.5327, + "step": 80546 + }, + { + "epoch": 2.06, + "learning_rate": 4.681386330648048e-07, + "loss": 0.418, + "step": 80547 + }, + { + "epoch": 2.06, + "learning_rate": 4.6811520105812297e-07, + "loss": 0.4233, + "step": 80548 + }, + { + "epoch": 2.06, + "learning_rate": 4.680917694586809e-07, + "loss": 0.4697, + "step": 80549 + }, + { + "epoch": 2.06, + "learning_rate": 4.680683382664965e-07, + "loss": 0.4683, + "step": 80550 + }, + { + "epoch": 2.06, + "learning_rate": 4.680449074815881e-07, + "loss": 0.4507, + "step": 80551 + }, + { + "epoch": 2.06, + "learning_rate": 4.6802147710397286e-07, + "loss": 0.3691, + "step": 80552 + }, + { + "epoch": 2.06, + "learning_rate": 4.679980471336692e-07, + "loss": 0.4443, + "step": 80553 + }, + { + "epoch": 2.06, + "learning_rate": 4.679746175706949e-07, + "loss": 0.5732, + "step": 80554 + }, + { + "epoch": 2.06, + "learning_rate": 4.679511884150683e-07, + "loss": 0.3762, + "step": 80555 + }, + { + "epoch": 2.06, + "learning_rate": 4.6792775966680674e-07, + "loss": 0.3867, + "step": 80556 + }, + { + "epoch": 2.06, + "learning_rate": 4.679043313259288e-07, + "loss": 0.3286, + "step": 80557 + }, + { + "epoch": 2.06, + "learning_rate": 4.6788090339245156e-07, + "loss": 0.4242, + "step": 80558 + }, + { + "epoch": 2.06, + "learning_rate": 4.678574758663939e-07, + "loss": 0.5059, + "step": 80559 + }, + { + "epoch": 2.06, + "learning_rate": 4.6783404874777286e-07, + "loss": 0.2932, + "step": 80560 + }, + { + "epoch": 2.06, + "learning_rate": 4.6781062203660695e-07, + "loss": 0.4634, + "step": 80561 + }, + { + "epoch": 2.06, + "learning_rate": 4.677871957329139e-07, + "loss": 0.3843, + "step": 80562 + }, + { + "epoch": 2.06, + "learning_rate": 4.677637698367121e-07, + "loss": 0.4658, + "step": 80563 + }, + { + "epoch": 2.06, + "learning_rate": 4.677403443480187e-07, + "loss": 0.4556, + "step": 80564 + }, + { + "epoch": 2.06, + "learning_rate": 4.6771691926685207e-07, + "loss": 0.4082, + "step": 80565 + }, + { + "epoch": 2.06, + "learning_rate": 4.6769349459323016e-07, + "loss": 0.4154, + "step": 80566 + }, + { + "epoch": 2.06, + "learning_rate": 4.676700703271712e-07, + "loss": 0.356, + "step": 80567 + }, + { + "epoch": 2.06, + "learning_rate": 4.676466464686928e-07, + "loss": 0.4624, + "step": 80568 + }, + { + "epoch": 2.07, + "learning_rate": 4.6762322301781257e-07, + "loss": 0.3276, + "step": 80569 + }, + { + "epoch": 2.07, + "learning_rate": 4.6759979997454856e-07, + "loss": 0.41, + "step": 80570 + }, + { + "epoch": 2.07, + "learning_rate": 4.675763773389191e-07, + "loss": 0.3401, + "step": 80571 + }, + { + "epoch": 2.07, + "learning_rate": 4.6755295511094215e-07, + "loss": 0.3887, + "step": 80572 + }, + { + "epoch": 2.07, + "learning_rate": 4.6752953329063517e-07, + "loss": 0.3756, + "step": 80573 + }, + { + "epoch": 2.07, + "learning_rate": 4.6750611187801636e-07, + "loss": 0.324, + "step": 80574 + }, + { + "epoch": 2.07, + "learning_rate": 4.6748269087310353e-07, + "loss": 0.447, + "step": 80575 + }, + { + "epoch": 2.07, + "learning_rate": 4.6745927027591514e-07, + "loss": 0.3464, + "step": 80576 + }, + { + "epoch": 2.07, + "learning_rate": 4.6743585008646866e-07, + "loss": 0.4248, + "step": 80577 + }, + { + "epoch": 2.07, + "learning_rate": 4.6741243030478183e-07, + "loss": 0.4897, + "step": 80578 + }, + { + "epoch": 2.07, + "learning_rate": 4.673890109308727e-07, + "loss": 0.4346, + "step": 80579 + }, + { + "epoch": 2.07, + "learning_rate": 4.6736559196475965e-07, + "loss": 0.5088, + "step": 80580 + }, + { + "epoch": 2.07, + "learning_rate": 4.6734217340646e-07, + "loss": 0.5288, + "step": 80581 + }, + { + "epoch": 2.07, + "learning_rate": 4.6731875525599185e-07, + "loss": 0.5278, + "step": 80582 + }, + { + "epoch": 2.07, + "learning_rate": 4.6729533751337336e-07, + "loss": 0.3762, + "step": 80583 + }, + { + "epoch": 2.07, + "learning_rate": 4.672719201786226e-07, + "loss": 0.436, + "step": 80584 + }, + { + "epoch": 2.07, + "learning_rate": 4.672485032517569e-07, + "loss": 0.4463, + "step": 80585 + }, + { + "epoch": 2.07, + "learning_rate": 4.672250867327946e-07, + "loss": 0.2716, + "step": 80586 + }, + { + "epoch": 2.07, + "learning_rate": 4.6720167062175387e-07, + "loss": 0.3486, + "step": 80587 + }, + { + "epoch": 2.07, + "learning_rate": 4.671782549186519e-07, + "loss": 0.3511, + "step": 80588 + }, + { + "epoch": 2.07, + "learning_rate": 4.6715483962350744e-07, + "loss": 0.4109, + "step": 80589 + }, + { + "epoch": 2.07, + "learning_rate": 4.671314247363376e-07, + "loss": 0.4221, + "step": 80590 + }, + { + "epoch": 2.07, + "learning_rate": 4.6710801025716083e-07, + "loss": 0.4692, + "step": 80591 + }, + { + "epoch": 2.07, + "learning_rate": 4.6708459618599496e-07, + "loss": 0.3616, + "step": 80592 + }, + { + "epoch": 2.07, + "learning_rate": 4.670611825228582e-07, + "loss": 0.5137, + "step": 80593 + }, + { + "epoch": 2.07, + "learning_rate": 4.6703776926776785e-07, + "loss": 0.3918, + "step": 80594 + }, + { + "epoch": 2.07, + "learning_rate": 4.6701435642074215e-07, + "loss": 0.3948, + "step": 80595 + }, + { + "epoch": 2.07, + "learning_rate": 4.6699094398179907e-07, + "loss": 0.3687, + "step": 80596 + }, + { + "epoch": 2.07, + "learning_rate": 4.6696753195095716e-07, + "loss": 0.3135, + "step": 80597 + }, + { + "epoch": 2.07, + "learning_rate": 4.6694412032823304e-07, + "loss": 0.4646, + "step": 80598 + }, + { + "epoch": 2.07, + "learning_rate": 4.6692070911364533e-07, + "loss": 0.3003, + "step": 80599 + }, + { + "epoch": 2.07, + "learning_rate": 4.6689729830721194e-07, + "loss": 0.499, + "step": 80600 + }, + { + "epoch": 2.07, + "learning_rate": 4.668738879089511e-07, + "loss": 0.4434, + "step": 80601 + }, + { + "epoch": 2.07, + "learning_rate": 4.668504779188801e-07, + "loss": 0.3584, + "step": 80602 + }, + { + "epoch": 2.07, + "learning_rate": 4.668270683370171e-07, + "loss": 0.3315, + "step": 80603 + }, + { + "epoch": 2.07, + "learning_rate": 4.6680365916338007e-07, + "loss": 0.415, + "step": 80604 + }, + { + "epoch": 2.07, + "learning_rate": 4.667802503979874e-07, + "loss": 0.3853, + "step": 80605 + }, + { + "epoch": 2.07, + "learning_rate": 4.6675684204085617e-07, + "loss": 0.344, + "step": 80606 + }, + { + "epoch": 2.07, + "learning_rate": 4.6673343409200516e-07, + "loss": 0.2678, + "step": 80607 + }, + { + "epoch": 2.07, + "learning_rate": 4.667100265514513e-07, + "loss": 0.4746, + "step": 80608 + }, + { + "epoch": 2.07, + "learning_rate": 4.6668661941921315e-07, + "loss": 0.376, + "step": 80609 + }, + { + "epoch": 2.07, + "learning_rate": 4.6666321269530894e-07, + "loss": 0.3442, + "step": 80610 + }, + { + "epoch": 2.07, + "learning_rate": 4.6663980637975577e-07, + "loss": 0.415, + "step": 80611 + }, + { + "epoch": 2.07, + "learning_rate": 4.66616400472572e-07, + "loss": 0.4126, + "step": 80612 + }, + { + "epoch": 2.07, + "learning_rate": 4.6659299497377555e-07, + "loss": 0.4795, + "step": 80613 + }, + { + "epoch": 2.07, + "learning_rate": 4.6656958988338455e-07, + "loss": 0.2474, + "step": 80614 + }, + { + "epoch": 2.07, + "learning_rate": 4.6654618520141653e-07, + "loss": 0.3984, + "step": 80615 + }, + { + "epoch": 2.07, + "learning_rate": 4.6652278092788944e-07, + "loss": 0.4309, + "step": 80616 + }, + { + "epoch": 2.07, + "learning_rate": 4.664993770628217e-07, + "loss": 0.4224, + "step": 80617 + }, + { + "epoch": 2.07, + "learning_rate": 4.6647597360623083e-07, + "loss": 0.4336, + "step": 80618 + }, + { + "epoch": 2.07, + "learning_rate": 4.6645257055813447e-07, + "loss": 0.4233, + "step": 80619 + }, + { + "epoch": 2.07, + "learning_rate": 4.664291679185508e-07, + "loss": 0.4397, + "step": 80620 + }, + { + "epoch": 2.07, + "learning_rate": 4.664057656874978e-07, + "loss": 0.272, + "step": 80621 + }, + { + "epoch": 2.07, + "learning_rate": 4.663823638649937e-07, + "loss": 0.3748, + "step": 80622 + }, + { + "epoch": 2.07, + "learning_rate": 4.663589624510558e-07, + "loss": 0.4443, + "step": 80623 + }, + { + "epoch": 2.07, + "learning_rate": 4.663355614457023e-07, + "loss": 0.4248, + "step": 80624 + }, + { + "epoch": 2.07, + "learning_rate": 4.66312160848951e-07, + "loss": 0.3757, + "step": 80625 + }, + { + "epoch": 2.07, + "learning_rate": 4.6628876066082046e-07, + "loss": 0.4712, + "step": 80626 + }, + { + "epoch": 2.07, + "learning_rate": 4.6626536088132794e-07, + "loss": 0.3354, + "step": 80627 + }, + { + "epoch": 2.07, + "learning_rate": 4.6624196151049124e-07, + "loss": 0.4106, + "step": 80628 + }, + { + "epoch": 2.07, + "learning_rate": 4.662185625483285e-07, + "loss": 0.5088, + "step": 80629 + }, + { + "epoch": 2.07, + "learning_rate": 4.6619516399485757e-07, + "loss": 0.2471, + "step": 80630 + }, + { + "epoch": 2.07, + "learning_rate": 4.6617176585009687e-07, + "loss": 0.3997, + "step": 80631 + }, + { + "epoch": 2.07, + "learning_rate": 4.6614836811406356e-07, + "loss": 0.396, + "step": 80632 + }, + { + "epoch": 2.07, + "learning_rate": 4.6612497078677595e-07, + "loss": 0.3589, + "step": 80633 + }, + { + "epoch": 2.07, + "learning_rate": 4.661015738682522e-07, + "loss": 0.3318, + "step": 80634 + }, + { + "epoch": 2.07, + "learning_rate": 4.660781773585095e-07, + "loss": 0.3618, + "step": 80635 + }, + { + "epoch": 2.07, + "learning_rate": 4.6605478125756636e-07, + "loss": 0.4194, + "step": 80636 + }, + { + "epoch": 2.07, + "learning_rate": 4.6603138556544075e-07, + "loss": 0.5244, + "step": 80637 + }, + { + "epoch": 2.07, + "learning_rate": 4.6600799028215e-07, + "loss": 0.4072, + "step": 80638 + }, + { + "epoch": 2.07, + "learning_rate": 4.6598459540771284e-07, + "loss": 0.4702, + "step": 80639 + }, + { + "epoch": 2.07, + "learning_rate": 4.659612009421463e-07, + "loss": 0.3528, + "step": 80640 + }, + { + "epoch": 2.07, + "learning_rate": 4.659378068854687e-07, + "loss": 0.4673, + "step": 80641 + }, + { + "epoch": 2.07, + "learning_rate": 4.65914413237698e-07, + "loss": 0.4004, + "step": 80642 + }, + { + "epoch": 2.07, + "learning_rate": 4.6589101999885237e-07, + "loss": 0.3755, + "step": 80643 + }, + { + "epoch": 2.07, + "learning_rate": 4.6586762716894914e-07, + "loss": 0.2965, + "step": 80644 + }, + { + "epoch": 2.07, + "learning_rate": 4.658442347480064e-07, + "loss": 0.3486, + "step": 80645 + }, + { + "epoch": 2.07, + "learning_rate": 4.6582084273604226e-07, + "loss": 0.4302, + "step": 80646 + }, + { + "epoch": 2.07, + "learning_rate": 4.657974511330749e-07, + "loss": 0.3289, + "step": 80647 + }, + { + "epoch": 2.07, + "learning_rate": 4.6577405993912176e-07, + "loss": 0.4526, + "step": 80648 + }, + { + "epoch": 2.07, + "learning_rate": 4.657506691542006e-07, + "loss": 0.4692, + "step": 80649 + }, + { + "epoch": 2.07, + "learning_rate": 4.6572727877832963e-07, + "loss": 0.5186, + "step": 80650 + }, + { + "epoch": 2.07, + "learning_rate": 4.65703888811527e-07, + "loss": 0.5312, + "step": 80651 + }, + { + "epoch": 2.07, + "learning_rate": 4.656804992538099e-07, + "loss": 0.3261, + "step": 80652 + }, + { + "epoch": 2.07, + "learning_rate": 4.6565711010519683e-07, + "loss": 0.353, + "step": 80653 + }, + { + "epoch": 2.07, + "learning_rate": 4.6563372136570544e-07, + "loss": 0.542, + "step": 80654 + }, + { + "epoch": 2.07, + "learning_rate": 4.6561033303535414e-07, + "loss": 0.4761, + "step": 80655 + }, + { + "epoch": 2.07, + "learning_rate": 4.655869451141601e-07, + "loss": 0.438, + "step": 80656 + }, + { + "epoch": 2.07, + "learning_rate": 4.6556355760214194e-07, + "loss": 0.3494, + "step": 80657 + }, + { + "epoch": 2.07, + "learning_rate": 4.655401704993167e-07, + "loss": 0.3691, + "step": 80658 + }, + { + "epoch": 2.07, + "learning_rate": 4.655167838057029e-07, + "loss": 0.4971, + "step": 80659 + }, + { + "epoch": 2.07, + "learning_rate": 4.6549339752131867e-07, + "loss": 0.3667, + "step": 80660 + }, + { + "epoch": 2.07, + "learning_rate": 4.6547001164618114e-07, + "loss": 0.3503, + "step": 80661 + }, + { + "epoch": 2.07, + "learning_rate": 4.654466261803087e-07, + "loss": 0.2986, + "step": 80662 + }, + { + "epoch": 2.07, + "learning_rate": 4.654232411237191e-07, + "loss": 0.4824, + "step": 80663 + }, + { + "epoch": 2.07, + "learning_rate": 4.6539985647643087e-07, + "loss": 0.3887, + "step": 80664 + }, + { + "epoch": 2.07, + "learning_rate": 4.6537647223846086e-07, + "loss": 0.4346, + "step": 80665 + }, + { + "epoch": 2.07, + "learning_rate": 4.653530884098277e-07, + "loss": 0.4131, + "step": 80666 + }, + { + "epoch": 2.07, + "learning_rate": 4.653297049905494e-07, + "loss": 0.5298, + "step": 80667 + }, + { + "epoch": 2.07, + "learning_rate": 4.6530632198064347e-07, + "loss": 0.5049, + "step": 80668 + }, + { + "epoch": 2.07, + "learning_rate": 4.6528293938012754e-07, + "loss": 0.4294, + "step": 80669 + }, + { + "epoch": 2.07, + "learning_rate": 4.6525955718901986e-07, + "loss": 0.2806, + "step": 80670 + }, + { + "epoch": 2.07, + "learning_rate": 4.652361754073384e-07, + "loss": 0.4385, + "step": 80671 + }, + { + "epoch": 2.07, + "learning_rate": 4.652127940351014e-07, + "loss": 0.2031, + "step": 80672 + }, + { + "epoch": 2.07, + "learning_rate": 4.6518941307232596e-07, + "loss": 0.3877, + "step": 80673 + }, + { + "epoch": 2.07, + "learning_rate": 4.6516603251903043e-07, + "loss": 0.4551, + "step": 80674 + }, + { + "epoch": 2.07, + "learning_rate": 4.6514265237523266e-07, + "loss": 0.3467, + "step": 80675 + }, + { + "epoch": 2.07, + "learning_rate": 4.65119272640951e-07, + "loss": 0.3833, + "step": 80676 + }, + { + "epoch": 2.07, + "learning_rate": 4.650958933162028e-07, + "loss": 0.3313, + "step": 80677 + }, + { + "epoch": 2.07, + "learning_rate": 4.650725144010058e-07, + "loss": 0.3032, + "step": 80678 + }, + { + "epoch": 2.07, + "learning_rate": 4.650491358953782e-07, + "loss": 0.519, + "step": 80679 + }, + { + "epoch": 2.07, + "learning_rate": 4.6502575779933773e-07, + "loss": 0.4192, + "step": 80680 + }, + { + "epoch": 2.07, + "learning_rate": 4.6500238011290293e-07, + "loss": 0.4236, + "step": 80681 + }, + { + "epoch": 2.07, + "learning_rate": 4.649790028360908e-07, + "loss": 0.4414, + "step": 80682 + }, + { + "epoch": 2.07, + "learning_rate": 4.649556259689197e-07, + "loss": 0.5122, + "step": 80683 + }, + { + "epoch": 2.07, + "learning_rate": 4.649322495114074e-07, + "loss": 0.521, + "step": 80684 + }, + { + "epoch": 2.07, + "learning_rate": 4.6490887346357233e-07, + "loss": 0.3597, + "step": 80685 + }, + { + "epoch": 2.07, + "learning_rate": 4.6488549782543186e-07, + "loss": 0.3801, + "step": 80686 + }, + { + "epoch": 2.07, + "learning_rate": 4.6486212259700366e-07, + "loss": 0.4175, + "step": 80687 + }, + { + "epoch": 2.07, + "learning_rate": 4.648387477783058e-07, + "loss": 0.4531, + "step": 80688 + }, + { + "epoch": 2.07, + "learning_rate": 4.648153733693568e-07, + "loss": 0.2231, + "step": 80689 + }, + { + "epoch": 2.07, + "learning_rate": 4.6479199937017364e-07, + "loss": 0.3516, + "step": 80690 + }, + { + "epoch": 2.07, + "learning_rate": 4.647686257807746e-07, + "loss": 0.4517, + "step": 80691 + }, + { + "epoch": 2.07, + "learning_rate": 4.647452526011777e-07, + "loss": 0.4219, + "step": 80692 + }, + { + "epoch": 2.07, + "learning_rate": 4.647218798314011e-07, + "loss": 0.306, + "step": 80693 + }, + { + "epoch": 2.07, + "learning_rate": 4.646985074714619e-07, + "loss": 0.374, + "step": 80694 + }, + { + "epoch": 2.07, + "learning_rate": 4.646751355213785e-07, + "loss": 0.3781, + "step": 80695 + }, + { + "epoch": 2.07, + "learning_rate": 4.64651763981169e-07, + "loss": 0.4854, + "step": 80696 + }, + { + "epoch": 2.07, + "learning_rate": 4.646283928508508e-07, + "loss": 0.3572, + "step": 80697 + }, + { + "epoch": 2.07, + "learning_rate": 4.646050221304423e-07, + "loss": 0.5146, + "step": 80698 + }, + { + "epoch": 2.07, + "learning_rate": 4.6458165181996077e-07, + "loss": 0.3651, + "step": 80699 + }, + { + "epoch": 2.07, + "learning_rate": 4.645582819194245e-07, + "loss": 0.4395, + "step": 80700 + }, + { + "epoch": 2.07, + "learning_rate": 4.645349124288513e-07, + "loss": 0.4824, + "step": 80701 + }, + { + "epoch": 2.07, + "learning_rate": 4.6451154334825946e-07, + "loss": 0.4702, + "step": 80702 + }, + { + "epoch": 2.07, + "learning_rate": 4.644881746776661e-07, + "loss": 0.4546, + "step": 80703 + }, + { + "epoch": 2.07, + "learning_rate": 4.6446480641708965e-07, + "loss": 0.5107, + "step": 80704 + }, + { + "epoch": 2.07, + "learning_rate": 4.644414385665482e-07, + "loss": 0.28, + "step": 80705 + }, + { + "epoch": 2.07, + "learning_rate": 4.644180711260592e-07, + "loss": 0.3843, + "step": 80706 + }, + { + "epoch": 2.07, + "learning_rate": 4.643947040956403e-07, + "loss": 0.5649, + "step": 80707 + }, + { + "epoch": 2.07, + "learning_rate": 4.643713374753099e-07, + "loss": 0.418, + "step": 80708 + }, + { + "epoch": 2.07, + "learning_rate": 4.6434797126508563e-07, + "loss": 0.4043, + "step": 80709 + }, + { + "epoch": 2.07, + "learning_rate": 4.643246054649859e-07, + "loss": 0.5298, + "step": 80710 + }, + { + "epoch": 2.07, + "learning_rate": 4.643012400750277e-07, + "loss": 0.4458, + "step": 80711 + }, + { + "epoch": 2.07, + "learning_rate": 4.642778750952295e-07, + "loss": 0.3994, + "step": 80712 + }, + { + "epoch": 2.07, + "learning_rate": 4.6425451052560914e-07, + "loss": 0.3606, + "step": 80713 + }, + { + "epoch": 2.07, + "learning_rate": 4.642311463661848e-07, + "loss": 0.4883, + "step": 80714 + }, + { + "epoch": 2.07, + "learning_rate": 4.6420778261697356e-07, + "loss": 0.3994, + "step": 80715 + }, + { + "epoch": 2.07, + "learning_rate": 4.6418441927799437e-07, + "loss": 0.3623, + "step": 80716 + }, + { + "epoch": 2.07, + "learning_rate": 4.6416105634926394e-07, + "loss": 0.2247, + "step": 80717 + }, + { + "epoch": 2.07, + "learning_rate": 4.641376938308009e-07, + "loss": 0.4409, + "step": 80718 + }, + { + "epoch": 2.07, + "learning_rate": 4.6411433172262327e-07, + "loss": 0.4736, + "step": 80719 + }, + { + "epoch": 2.07, + "learning_rate": 4.640909700247484e-07, + "loss": 0.257, + "step": 80720 + }, + { + "epoch": 2.07, + "learning_rate": 4.640676087371943e-07, + "loss": 0.2482, + "step": 80721 + }, + { + "epoch": 2.07, + "learning_rate": 4.6404424785997944e-07, + "loss": 0.2606, + "step": 80722 + }, + { + "epoch": 2.07, + "learning_rate": 4.6402088739312084e-07, + "loss": 0.4817, + "step": 80723 + }, + { + "epoch": 2.07, + "learning_rate": 4.639975273366369e-07, + "loss": 0.3417, + "step": 80724 + }, + { + "epoch": 2.07, + "learning_rate": 4.639741676905453e-07, + "loss": 0.3174, + "step": 80725 + }, + { + "epoch": 2.07, + "learning_rate": 4.6395080845486446e-07, + "loss": 0.3706, + "step": 80726 + }, + { + "epoch": 2.07, + "learning_rate": 4.6392744962961183e-07, + "loss": 0.4175, + "step": 80727 + }, + { + "epoch": 2.07, + "learning_rate": 4.639040912148049e-07, + "loss": 0.3975, + "step": 80728 + }, + { + "epoch": 2.07, + "learning_rate": 4.6388073321046197e-07, + "loss": 0.4614, + "step": 80729 + }, + { + "epoch": 2.07, + "learning_rate": 4.638573756166009e-07, + "loss": 0.3364, + "step": 80730 + }, + { + "epoch": 2.07, + "learning_rate": 4.6383401843324e-07, + "loss": 0.3884, + "step": 80731 + }, + { + "epoch": 2.07, + "learning_rate": 4.6381066166039626e-07, + "loss": 0.4766, + "step": 80732 + }, + { + "epoch": 2.07, + "learning_rate": 4.6378730529808817e-07, + "loss": 0.3218, + "step": 80733 + }, + { + "epoch": 2.07, + "learning_rate": 4.6376394934633345e-07, + "loss": 0.4121, + "step": 80734 + }, + { + "epoch": 2.07, + "learning_rate": 4.637405938051504e-07, + "loss": 0.3412, + "step": 80735 + }, + { + "epoch": 2.07, + "learning_rate": 4.6371723867455646e-07, + "loss": 0.5586, + "step": 80736 + }, + { + "epoch": 2.07, + "learning_rate": 4.6369388395456923e-07, + "loss": 0.4351, + "step": 80737 + }, + { + "epoch": 2.07, + "learning_rate": 4.636705296452069e-07, + "loss": 0.4312, + "step": 80738 + }, + { + "epoch": 2.07, + "learning_rate": 4.6364717574648746e-07, + "loss": 0.4204, + "step": 80739 + }, + { + "epoch": 2.07, + "learning_rate": 4.6362382225842913e-07, + "loss": 0.4575, + "step": 80740 + }, + { + "epoch": 2.07, + "learning_rate": 4.636004691810489e-07, + "loss": 0.5269, + "step": 80741 + }, + { + "epoch": 2.07, + "learning_rate": 4.6357711651436514e-07, + "loss": 0.4453, + "step": 80742 + }, + { + "epoch": 2.07, + "learning_rate": 4.6355376425839607e-07, + "loss": 0.4492, + "step": 80743 + }, + { + "epoch": 2.07, + "learning_rate": 4.6353041241315883e-07, + "loss": 0.4553, + "step": 80744 + }, + { + "epoch": 2.07, + "learning_rate": 4.6350706097867174e-07, + "loss": 0.2825, + "step": 80745 + }, + { + "epoch": 2.07, + "learning_rate": 4.63483709954953e-07, + "loss": 0.5254, + "step": 80746 + }, + { + "epoch": 2.07, + "learning_rate": 4.6346035934201976e-07, + "loss": 0.4238, + "step": 80747 + }, + { + "epoch": 2.07, + "learning_rate": 4.634370091398906e-07, + "loss": 0.3601, + "step": 80748 + }, + { + "epoch": 2.07, + "learning_rate": 4.634136593485827e-07, + "loss": 0.2351, + "step": 80749 + }, + { + "epoch": 2.07, + "learning_rate": 4.633903099681142e-07, + "loss": 0.4065, + "step": 80750 + }, + { + "epoch": 2.07, + "learning_rate": 4.633669609985031e-07, + "loss": 0.3481, + "step": 80751 + }, + { + "epoch": 2.07, + "learning_rate": 4.633436124397676e-07, + "loss": 0.4436, + "step": 80752 + }, + { + "epoch": 2.07, + "learning_rate": 4.6332026429192493e-07, + "loss": 0.3896, + "step": 80753 + }, + { + "epoch": 2.07, + "learning_rate": 4.6329691655499325e-07, + "loss": 0.4468, + "step": 80754 + }, + { + "epoch": 2.07, + "learning_rate": 4.632735692289904e-07, + "loss": 0.3218, + "step": 80755 + }, + { + "epoch": 2.07, + "learning_rate": 4.6325022231393464e-07, + "loss": 0.3779, + "step": 80756 + }, + { + "epoch": 2.07, + "learning_rate": 4.6322687580984353e-07, + "loss": 0.395, + "step": 80757 + }, + { + "epoch": 2.07, + "learning_rate": 4.632035297167346e-07, + "loss": 0.438, + "step": 80758 + }, + { + "epoch": 2.07, + "learning_rate": 4.63180184034626e-07, + "loss": 0.4194, + "step": 80759 + }, + { + "epoch": 2.07, + "learning_rate": 4.63156838763536e-07, + "loss": 0.2635, + "step": 80760 + }, + { + "epoch": 2.07, + "learning_rate": 4.631334939034818e-07, + "loss": 0.4214, + "step": 80761 + }, + { + "epoch": 2.07, + "learning_rate": 4.6311014945448154e-07, + "loss": 0.479, + "step": 80762 + }, + { + "epoch": 2.07, + "learning_rate": 4.6308680541655323e-07, + "loss": 0.3833, + "step": 80763 + }, + { + "epoch": 2.07, + "learning_rate": 4.63063461789715e-07, + "loss": 0.5195, + "step": 80764 + }, + { + "epoch": 2.07, + "learning_rate": 4.6304011857398394e-07, + "loss": 0.2659, + "step": 80765 + }, + { + "epoch": 2.07, + "learning_rate": 4.630167757693788e-07, + "loss": 0.5066, + "step": 80766 + }, + { + "epoch": 2.07, + "learning_rate": 4.6299343337591667e-07, + "loss": 0.4053, + "step": 80767 + }, + { + "epoch": 2.07, + "learning_rate": 4.6297009139361577e-07, + "loss": 0.3593, + "step": 80768 + }, + { + "epoch": 2.07, + "learning_rate": 4.6294674982249436e-07, + "loss": 0.4207, + "step": 80769 + }, + { + "epoch": 2.07, + "learning_rate": 4.629234086625695e-07, + "loss": 0.3367, + "step": 80770 + }, + { + "epoch": 2.07, + "learning_rate": 4.629000679138596e-07, + "loss": 0.1906, + "step": 80771 + }, + { + "epoch": 2.07, + "learning_rate": 4.6287672757638243e-07, + "loss": 0.3358, + "step": 80772 + }, + { + "epoch": 2.07, + "learning_rate": 4.628533876501561e-07, + "loss": 0.5586, + "step": 80773 + }, + { + "epoch": 2.07, + "learning_rate": 4.628300481351979e-07, + "loss": 0.3108, + "step": 80774 + }, + { + "epoch": 2.07, + "learning_rate": 4.6280670903152606e-07, + "loss": 0.2964, + "step": 80775 + }, + { + "epoch": 2.07, + "learning_rate": 4.6278337033915884e-07, + "loss": 0.4136, + "step": 80776 + }, + { + "epoch": 2.07, + "learning_rate": 4.6276003205811356e-07, + "loss": 0.4746, + "step": 80777 + }, + { + "epoch": 2.07, + "learning_rate": 4.6273669418840787e-07, + "loss": 0.5283, + "step": 80778 + }, + { + "epoch": 2.07, + "learning_rate": 4.6271335673006007e-07, + "loss": 0.4189, + "step": 80779 + }, + { + "epoch": 2.07, + "learning_rate": 4.6269001968308796e-07, + "loss": 0.4497, + "step": 80780 + }, + { + "epoch": 2.07, + "learning_rate": 4.6266668304750964e-07, + "loss": 0.4692, + "step": 80781 + }, + { + "epoch": 2.07, + "learning_rate": 4.626433468233425e-07, + "loss": 0.4971, + "step": 80782 + }, + { + "epoch": 2.07, + "learning_rate": 4.6262001101060457e-07, + "loss": 0.3867, + "step": 80783 + }, + { + "epoch": 2.07, + "learning_rate": 4.625966756093138e-07, + "loss": 0.3268, + "step": 80784 + }, + { + "epoch": 2.07, + "learning_rate": 4.625733406194885e-07, + "loss": 0.3441, + "step": 80785 + }, + { + "epoch": 2.07, + "learning_rate": 4.625500060411459e-07, + "loss": 0.5679, + "step": 80786 + }, + { + "epoch": 2.07, + "learning_rate": 4.6252667187430386e-07, + "loss": 0.4321, + "step": 80787 + }, + { + "epoch": 2.07, + "learning_rate": 4.6250333811898034e-07, + "loss": 0.4302, + "step": 80788 + }, + { + "epoch": 2.07, + "learning_rate": 4.6248000477519334e-07, + "loss": 0.4463, + "step": 80789 + }, + { + "epoch": 2.07, + "learning_rate": 4.62456671842961e-07, + "loss": 0.3936, + "step": 80790 + }, + { + "epoch": 2.07, + "learning_rate": 4.6243333932230057e-07, + "loss": 0.4331, + "step": 80791 + }, + { + "epoch": 2.07, + "learning_rate": 4.624100072132301e-07, + "loss": 0.3784, + "step": 80792 + }, + { + "epoch": 2.07, + "learning_rate": 4.623866755157676e-07, + "loss": 0.2679, + "step": 80793 + }, + { + "epoch": 2.07, + "learning_rate": 4.623633442299314e-07, + "loss": 0.4868, + "step": 80794 + }, + { + "epoch": 2.07, + "learning_rate": 4.6234001335573837e-07, + "loss": 0.5508, + "step": 80795 + }, + { + "epoch": 2.07, + "learning_rate": 4.6231668289320726e-07, + "loss": 0.3494, + "step": 80796 + }, + { + "epoch": 2.07, + "learning_rate": 4.6229335284235513e-07, + "loss": 0.4985, + "step": 80797 + }, + { + "epoch": 2.07, + "learning_rate": 4.6227002320320077e-07, + "loss": 0.4272, + "step": 80798 + }, + { + "epoch": 2.07, + "learning_rate": 4.622466939757611e-07, + "loss": 0.3052, + "step": 80799 + }, + { + "epoch": 2.07, + "learning_rate": 4.6222336516005434e-07, + "loss": 0.377, + "step": 80800 + }, + { + "epoch": 2.07, + "learning_rate": 4.622000367560984e-07, + "loss": 0.4438, + "step": 80801 + }, + { + "epoch": 2.07, + "learning_rate": 4.621767087639117e-07, + "loss": 0.3521, + "step": 80802 + }, + { + "epoch": 2.07, + "learning_rate": 4.621533811835111e-07, + "loss": 0.4194, + "step": 80803 + }, + { + "epoch": 2.07, + "learning_rate": 4.621300540149149e-07, + "loss": 0.4414, + "step": 80804 + }, + { + "epoch": 2.07, + "learning_rate": 4.6210672725814095e-07, + "loss": 0.4067, + "step": 80805 + }, + { + "epoch": 2.07, + "learning_rate": 4.620834009132076e-07, + "loss": 0.4465, + "step": 80806 + }, + { + "epoch": 2.07, + "learning_rate": 4.620600749801322e-07, + "loss": 0.3618, + "step": 80807 + }, + { + "epoch": 2.07, + "learning_rate": 4.6203674945893234e-07, + "loss": 0.3979, + "step": 80808 + }, + { + "epoch": 2.07, + "learning_rate": 4.620134243496262e-07, + "loss": 0.418, + "step": 80809 + }, + { + "epoch": 2.07, + "learning_rate": 4.619900996522316e-07, + "loss": 0.4326, + "step": 80810 + }, + { + "epoch": 2.07, + "learning_rate": 4.6196677536676686e-07, + "loss": 0.4668, + "step": 80811 + }, + { + "epoch": 2.07, + "learning_rate": 4.61943451493249e-07, + "loss": 0.4644, + "step": 80812 + }, + { + "epoch": 2.07, + "learning_rate": 4.6192012803169633e-07, + "loss": 0.3978, + "step": 80813 + }, + { + "epoch": 2.07, + "learning_rate": 4.61896804982127e-07, + "loss": 0.3838, + "step": 80814 + }, + { + "epoch": 2.07, + "learning_rate": 4.6187348234455826e-07, + "loss": 0.3794, + "step": 80815 + }, + { + "epoch": 2.07, + "learning_rate": 4.618501601190086e-07, + "loss": 0.5713, + "step": 80816 + }, + { + "epoch": 2.07, + "learning_rate": 4.6182683830549516e-07, + "loss": 0.4038, + "step": 80817 + }, + { + "epoch": 2.07, + "learning_rate": 4.6180351690403616e-07, + "loss": 0.4373, + "step": 80818 + }, + { + "epoch": 2.07, + "learning_rate": 4.617801959146498e-07, + "loss": 0.4214, + "step": 80819 + }, + { + "epoch": 2.07, + "learning_rate": 4.617568753373532e-07, + "loss": 0.4031, + "step": 80820 + }, + { + "epoch": 2.07, + "learning_rate": 4.617335551721647e-07, + "loss": 0.4238, + "step": 80821 + }, + { + "epoch": 2.07, + "learning_rate": 4.6171023541910203e-07, + "loss": 0.2961, + "step": 80822 + }, + { + "epoch": 2.07, + "learning_rate": 4.6168691607818345e-07, + "loss": 0.429, + "step": 80823 + }, + { + "epoch": 2.07, + "learning_rate": 4.61663597149426e-07, + "loss": 0.2859, + "step": 80824 + }, + { + "epoch": 2.07, + "learning_rate": 4.6164027863284807e-07, + "loss": 0.354, + "step": 80825 + }, + { + "epoch": 2.07, + "learning_rate": 4.616169605284678e-07, + "loss": 0.3584, + "step": 80826 + }, + { + "epoch": 2.07, + "learning_rate": 4.615936428363022e-07, + "loss": 0.3611, + "step": 80827 + }, + { + "epoch": 2.07, + "learning_rate": 4.615703255563701e-07, + "loss": 0.2996, + "step": 80828 + }, + { + "epoch": 2.07, + "learning_rate": 4.6154700868868834e-07, + "loss": 0.3523, + "step": 80829 + }, + { + "epoch": 2.07, + "learning_rate": 4.615236922332754e-07, + "loss": 0.5054, + "step": 80830 + }, + { + "epoch": 2.07, + "learning_rate": 4.6150037619014925e-07, + "loss": 0.226, + "step": 80831 + }, + { + "epoch": 2.07, + "learning_rate": 4.6147706055932725e-07, + "loss": 0.5015, + "step": 80832 + }, + { + "epoch": 2.07, + "learning_rate": 4.614537453408275e-07, + "loss": 0.4216, + "step": 80833 + }, + { + "epoch": 2.07, + "learning_rate": 4.614304305346678e-07, + "loss": 0.4058, + "step": 80834 + }, + { + "epoch": 2.07, + "learning_rate": 4.6140711614086636e-07, + "loss": 0.4712, + "step": 80835 + }, + { + "epoch": 2.07, + "learning_rate": 4.613838021594408e-07, + "loss": 0.3433, + "step": 80836 + }, + { + "epoch": 2.07, + "learning_rate": 4.6136048859040856e-07, + "loss": 0.3823, + "step": 80837 + }, + { + "epoch": 2.07, + "learning_rate": 4.613371754337878e-07, + "loss": 0.4045, + "step": 80838 + }, + { + "epoch": 2.07, + "learning_rate": 4.613138626895964e-07, + "loss": 0.3506, + "step": 80839 + }, + { + "epoch": 2.07, + "learning_rate": 4.612905503578525e-07, + "loss": 0.4976, + "step": 80840 + }, + { + "epoch": 2.07, + "learning_rate": 4.612672384385734e-07, + "loss": 0.3965, + "step": 80841 + }, + { + "epoch": 2.07, + "learning_rate": 4.612439269317772e-07, + "loss": 0.3616, + "step": 80842 + }, + { + "epoch": 2.07, + "learning_rate": 4.612206158374816e-07, + "loss": 0.4233, + "step": 80843 + }, + { + "epoch": 2.07, + "learning_rate": 4.611973051557051e-07, + "loss": 0.5635, + "step": 80844 + }, + { + "epoch": 2.07, + "learning_rate": 4.611739948864647e-07, + "loss": 0.396, + "step": 80845 + }, + { + "epoch": 2.07, + "learning_rate": 4.6115068502977884e-07, + "loss": 0.3163, + "step": 80846 + }, + { + "epoch": 2.07, + "learning_rate": 4.6112737558566485e-07, + "loss": 0.5137, + "step": 80847 + }, + { + "epoch": 2.07, + "learning_rate": 4.6110406655414123e-07, + "loss": 0.4604, + "step": 80848 + }, + { + "epoch": 2.07, + "learning_rate": 4.6108075793522505e-07, + "loss": 0.415, + "step": 80849 + }, + { + "epoch": 2.07, + "learning_rate": 4.6105744972893457e-07, + "loss": 0.4561, + "step": 80850 + }, + { + "epoch": 2.07, + "learning_rate": 4.6103414193528757e-07, + "loss": 0.5278, + "step": 80851 + }, + { + "epoch": 2.07, + "learning_rate": 4.6101083455430236e-07, + "loss": 0.3506, + "step": 80852 + }, + { + "epoch": 2.07, + "learning_rate": 4.60987527585996e-07, + "loss": 0.3918, + "step": 80853 + }, + { + "epoch": 2.07, + "learning_rate": 4.609642210303867e-07, + "loss": 0.3303, + "step": 80854 + }, + { + "epoch": 2.07, + "learning_rate": 4.609409148874923e-07, + "loss": 0.3491, + "step": 80855 + }, + { + "epoch": 2.07, + "learning_rate": 4.60917609157331e-07, + "loss": 0.4551, + "step": 80856 + }, + { + "epoch": 2.07, + "learning_rate": 4.6089430383992034e-07, + "loss": 0.5986, + "step": 80857 + }, + { + "epoch": 2.07, + "learning_rate": 4.608709989352777e-07, + "loss": 0.4448, + "step": 80858 + }, + { + "epoch": 2.07, + "learning_rate": 4.6084769444342143e-07, + "loss": 0.3413, + "step": 80859 + }, + { + "epoch": 2.07, + "learning_rate": 4.608243903643693e-07, + "loss": 0.3478, + "step": 80860 + }, + { + "epoch": 2.07, + "learning_rate": 4.6080108669813945e-07, + "loss": 0.5654, + "step": 80861 + }, + { + "epoch": 2.07, + "learning_rate": 4.6077778344474903e-07, + "loss": 0.2997, + "step": 80862 + }, + { + "epoch": 2.07, + "learning_rate": 4.607544806042163e-07, + "loss": 0.4116, + "step": 80863 + }, + { + "epoch": 2.07, + "learning_rate": 4.6073117817655905e-07, + "loss": 0.3999, + "step": 80864 + }, + { + "epoch": 2.07, + "learning_rate": 4.607078761617955e-07, + "loss": 0.4351, + "step": 80865 + }, + { + "epoch": 2.07, + "learning_rate": 4.6068457455994314e-07, + "loss": 0.4253, + "step": 80866 + }, + { + "epoch": 2.07, + "learning_rate": 4.6066127337101945e-07, + "loss": 0.4038, + "step": 80867 + }, + { + "epoch": 2.07, + "learning_rate": 4.606379725950427e-07, + "loss": 0.396, + "step": 80868 + }, + { + "epoch": 2.07, + "learning_rate": 4.6061467223203086e-07, + "loss": 0.4424, + "step": 80869 + }, + { + "epoch": 2.07, + "learning_rate": 4.605913722820013e-07, + "loss": 0.4609, + "step": 80870 + }, + { + "epoch": 2.07, + "learning_rate": 4.605680727449721e-07, + "loss": 0.4956, + "step": 80871 + }, + { + "epoch": 2.07, + "learning_rate": 4.605447736209611e-07, + "loss": 0.2132, + "step": 80872 + }, + { + "epoch": 2.07, + "learning_rate": 4.605214749099866e-07, + "loss": 0.4443, + "step": 80873 + }, + { + "epoch": 2.07, + "learning_rate": 4.6049817661206556e-07, + "loss": 0.4287, + "step": 80874 + }, + { + "epoch": 2.07, + "learning_rate": 4.6047487872721633e-07, + "loss": 0.5801, + "step": 80875 + }, + { + "epoch": 2.07, + "learning_rate": 4.60451581255457e-07, + "loss": 0.3868, + "step": 80876 + }, + { + "epoch": 2.07, + "learning_rate": 4.604282841968047e-07, + "loss": 0.3496, + "step": 80877 + }, + { + "epoch": 2.07, + "learning_rate": 4.604049875512781e-07, + "loss": 0.2908, + "step": 80878 + }, + { + "epoch": 2.07, + "learning_rate": 4.6038169131889413e-07, + "loss": 0.5059, + "step": 80879 + }, + { + "epoch": 2.07, + "learning_rate": 4.6035839549967117e-07, + "loss": 0.3616, + "step": 80880 + }, + { + "epoch": 2.07, + "learning_rate": 4.6033510009362686e-07, + "loss": 0.4937, + "step": 80881 + }, + { + "epoch": 2.07, + "learning_rate": 4.603118051007796e-07, + "loss": 0.4839, + "step": 80882 + }, + { + "epoch": 2.07, + "learning_rate": 4.602885105211464e-07, + "loss": 0.5151, + "step": 80883 + }, + { + "epoch": 2.07, + "learning_rate": 4.602652163547455e-07, + "loss": 0.4729, + "step": 80884 + }, + { + "epoch": 2.07, + "learning_rate": 4.60241922601595e-07, + "loss": 0.4121, + "step": 80885 + }, + { + "epoch": 2.07, + "learning_rate": 4.602186292617124e-07, + "loss": 0.3458, + "step": 80886 + }, + { + "epoch": 2.07, + "learning_rate": 4.601953363351153e-07, + "loss": 0.4233, + "step": 80887 + }, + { + "epoch": 2.07, + "learning_rate": 4.6017204382182183e-07, + "loss": 0.4023, + "step": 80888 + }, + { + "epoch": 2.07, + "learning_rate": 4.6014875172184976e-07, + "loss": 0.5137, + "step": 80889 + }, + { + "epoch": 2.07, + "learning_rate": 4.6012546003521733e-07, + "loss": 0.4648, + "step": 80890 + }, + { + "epoch": 2.07, + "learning_rate": 4.6010216876194163e-07, + "loss": 0.519, + "step": 80891 + }, + { + "epoch": 2.07, + "learning_rate": 4.6007887790204094e-07, + "loss": 0.4155, + "step": 80892 + }, + { + "epoch": 2.07, + "learning_rate": 4.60055587455533e-07, + "loss": 0.3979, + "step": 80893 + }, + { + "epoch": 2.07, + "learning_rate": 4.6003229742243597e-07, + "loss": 0.5044, + "step": 80894 + }, + { + "epoch": 2.07, + "learning_rate": 4.6000900780276706e-07, + "loss": 0.3779, + "step": 80895 + }, + { + "epoch": 2.07, + "learning_rate": 4.599857185965448e-07, + "loss": 0.4521, + "step": 80896 + }, + { + "epoch": 2.07, + "learning_rate": 4.599624298037863e-07, + "loss": 0.5024, + "step": 80897 + }, + { + "epoch": 2.07, + "learning_rate": 4.5993914142450976e-07, + "loss": 0.3845, + "step": 80898 + }, + { + "epoch": 2.07, + "learning_rate": 4.599158534587333e-07, + "loss": 0.4038, + "step": 80899 + }, + { + "epoch": 2.07, + "learning_rate": 4.598925659064741e-07, + "loss": 0.4438, + "step": 80900 + }, + { + "epoch": 2.07, + "learning_rate": 4.5986927876775027e-07, + "loss": 0.4097, + "step": 80901 + }, + { + "epoch": 2.07, + "learning_rate": 4.5984599204257966e-07, + "loss": 0.3225, + "step": 80902 + }, + { + "epoch": 2.07, + "learning_rate": 4.598227057309806e-07, + "loss": 0.5103, + "step": 80903 + }, + { + "epoch": 2.07, + "learning_rate": 4.597994198329701e-07, + "loss": 0.5234, + "step": 80904 + }, + { + "epoch": 2.07, + "learning_rate": 4.5977613434856635e-07, + "loss": 0.3235, + "step": 80905 + }, + { + "epoch": 2.07, + "learning_rate": 4.5975284927778746e-07, + "loss": 0.5059, + "step": 80906 + }, + { + "epoch": 2.07, + "learning_rate": 4.5972956462065096e-07, + "loss": 0.5474, + "step": 80907 + }, + { + "epoch": 2.07, + "learning_rate": 4.597062803771744e-07, + "loss": 0.4023, + "step": 80908 + }, + { + "epoch": 2.07, + "learning_rate": 4.5968299654737584e-07, + "loss": 0.2737, + "step": 80909 + }, + { + "epoch": 2.07, + "learning_rate": 4.5965971313127326e-07, + "loss": 0.5342, + "step": 80910 + }, + { + "epoch": 2.07, + "learning_rate": 4.5963643012888466e-07, + "loss": 0.3239, + "step": 80911 + }, + { + "epoch": 2.07, + "learning_rate": 4.596131475402273e-07, + "loss": 0.2686, + "step": 80912 + }, + { + "epoch": 2.07, + "learning_rate": 4.595898653653193e-07, + "loss": 0.3743, + "step": 80913 + }, + { + "epoch": 2.07, + "learning_rate": 4.5956658360417846e-07, + "loss": 0.3608, + "step": 80914 + }, + { + "epoch": 2.07, + "learning_rate": 4.5954330225682294e-07, + "loss": 0.5435, + "step": 80915 + }, + { + "epoch": 2.07, + "learning_rate": 4.595200213232704e-07, + "loss": 0.4297, + "step": 80916 + }, + { + "epoch": 2.07, + "learning_rate": 4.5949674080353806e-07, + "loss": 0.438, + "step": 80917 + }, + { + "epoch": 2.07, + "learning_rate": 4.5947346069764426e-07, + "loss": 0.5293, + "step": 80918 + }, + { + "epoch": 2.07, + "learning_rate": 4.5945018100560675e-07, + "loss": 0.459, + "step": 80919 + }, + { + "epoch": 2.07, + "learning_rate": 4.594269017274437e-07, + "loss": 0.3491, + "step": 80920 + }, + { + "epoch": 2.07, + "learning_rate": 4.5940362286317237e-07, + "loss": 0.3215, + "step": 80921 + }, + { + "epoch": 2.07, + "learning_rate": 4.593803444128107e-07, + "loss": 0.4023, + "step": 80922 + }, + { + "epoch": 2.07, + "learning_rate": 4.593570663763772e-07, + "loss": 0.459, + "step": 80923 + }, + { + "epoch": 2.07, + "learning_rate": 4.593337887538886e-07, + "loss": 0.4312, + "step": 80924 + }, + { + "epoch": 2.07, + "learning_rate": 4.593105115453633e-07, + "loss": 0.4277, + "step": 80925 + }, + { + "epoch": 2.07, + "learning_rate": 4.5928723475081943e-07, + "loss": 0.3357, + "step": 80926 + }, + { + "epoch": 2.07, + "learning_rate": 4.592639583702741e-07, + "loss": 0.406, + "step": 80927 + }, + { + "epoch": 2.07, + "learning_rate": 4.592406824037459e-07, + "loss": 0.5366, + "step": 80928 + }, + { + "epoch": 2.07, + "learning_rate": 4.592174068512519e-07, + "loss": 0.4028, + "step": 80929 + }, + { + "epoch": 2.07, + "learning_rate": 4.591941317128102e-07, + "loss": 0.5957, + "step": 80930 + }, + { + "epoch": 2.07, + "learning_rate": 4.591708569884386e-07, + "loss": 0.3818, + "step": 80931 + }, + { + "epoch": 2.07, + "learning_rate": 4.591475826781556e-07, + "loss": 0.4238, + "step": 80932 + }, + { + "epoch": 2.07, + "learning_rate": 4.591243087819778e-07, + "loss": 0.49, + "step": 80933 + }, + { + "epoch": 2.07, + "learning_rate": 4.5910103529992386e-07, + "loss": 0.2736, + "step": 80934 + }, + { + "epoch": 2.07, + "learning_rate": 4.590777622320113e-07, + "loss": 0.4438, + "step": 80935 + }, + { + "epoch": 2.07, + "learning_rate": 4.5905448957825844e-07, + "loss": 0.3677, + "step": 80936 + }, + { + "epoch": 2.07, + "learning_rate": 4.5903121733868255e-07, + "loss": 0.397, + "step": 80937 + }, + { + "epoch": 2.07, + "learning_rate": 4.5900794551330137e-07, + "loss": 0.4302, + "step": 80938 + }, + { + "epoch": 2.07, + "learning_rate": 4.589846741021328e-07, + "loss": 0.4302, + "step": 80939 + }, + { + "epoch": 2.07, + "learning_rate": 4.589614031051953e-07, + "loss": 0.384, + "step": 80940 + }, + { + "epoch": 2.07, + "learning_rate": 4.5893813252250567e-07, + "loss": 0.4033, + "step": 80941 + }, + { + "epoch": 2.07, + "learning_rate": 4.589148623540824e-07, + "loss": 0.5205, + "step": 80942 + }, + { + "epoch": 2.07, + "learning_rate": 4.58891592599943e-07, + "loss": 0.3425, + "step": 80943 + }, + { + "epoch": 2.07, + "learning_rate": 4.588683232601058e-07, + "loss": 0.348, + "step": 80944 + }, + { + "epoch": 2.07, + "learning_rate": 4.58845054334588e-07, + "loss": 0.373, + "step": 80945 + }, + { + "epoch": 2.07, + "learning_rate": 4.588217858234079e-07, + "loss": 0.6011, + "step": 80946 + }, + { + "epoch": 2.07, + "learning_rate": 4.587985177265827e-07, + "loss": 0.3679, + "step": 80947 + }, + { + "epoch": 2.07, + "learning_rate": 4.5877525004413064e-07, + "loss": 0.3629, + "step": 80948 + }, + { + "epoch": 2.07, + "learning_rate": 4.5875198277606984e-07, + "loss": 0.3107, + "step": 80949 + }, + { + "epoch": 2.07, + "learning_rate": 4.587287159224175e-07, + "loss": 0.5347, + "step": 80950 + }, + { + "epoch": 2.07, + "learning_rate": 4.5870544948319144e-07, + "loss": 0.22, + "step": 80951 + }, + { + "epoch": 2.07, + "learning_rate": 4.586821834584099e-07, + "loss": 0.4033, + "step": 80952 + }, + { + "epoch": 2.07, + "learning_rate": 4.5865891784809083e-07, + "loss": 0.3657, + "step": 80953 + }, + { + "epoch": 2.07, + "learning_rate": 4.5863565265225146e-07, + "loss": 0.3245, + "step": 80954 + }, + { + "epoch": 2.07, + "learning_rate": 4.5861238787090983e-07, + "loss": 0.4209, + "step": 80955 + }, + { + "epoch": 2.07, + "learning_rate": 4.585891235040842e-07, + "loss": 0.3989, + "step": 80956 + }, + { + "epoch": 2.07, + "learning_rate": 4.5856585955179196e-07, + "loss": 0.415, + "step": 80957 + }, + { + "epoch": 2.07, + "learning_rate": 4.5854259601405055e-07, + "loss": 0.4126, + "step": 80958 + }, + { + "epoch": 2.08, + "learning_rate": 4.585193328908782e-07, + "loss": 0.3833, + "step": 80959 + }, + { + "epoch": 2.08, + "learning_rate": 4.5849607018229263e-07, + "loss": 0.4639, + "step": 80960 + }, + { + "epoch": 2.08, + "learning_rate": 4.584728078883122e-07, + "loss": 0.5322, + "step": 80961 + }, + { + "epoch": 2.08, + "learning_rate": 4.584495460089538e-07, + "loss": 0.4641, + "step": 80962 + }, + { + "epoch": 2.08, + "learning_rate": 4.584262845442357e-07, + "loss": 0.4868, + "step": 80963 + }, + { + "epoch": 2.08, + "learning_rate": 4.584030234941757e-07, + "loss": 0.4077, + "step": 80964 + }, + { + "epoch": 2.08, + "learning_rate": 4.58379762858792e-07, + "loss": 0.4209, + "step": 80965 + }, + { + "epoch": 2.08, + "learning_rate": 4.583565026381019e-07, + "loss": 0.4214, + "step": 80966 + }, + { + "epoch": 2.08, + "learning_rate": 4.5833324283212306e-07, + "loss": 0.502, + "step": 80967 + }, + { + "epoch": 2.08, + "learning_rate": 4.583099834408736e-07, + "loss": 0.3513, + "step": 80968 + }, + { + "epoch": 2.08, + "learning_rate": 4.5828672446437113e-07, + "loss": 0.4109, + "step": 80969 + }, + { + "epoch": 2.08, + "learning_rate": 4.58263465902634e-07, + "loss": 0.4414, + "step": 80970 + }, + { + "epoch": 2.08, + "learning_rate": 4.582402077556793e-07, + "loss": 0.4753, + "step": 80971 + }, + { + "epoch": 2.08, + "learning_rate": 4.582169500235252e-07, + "loss": 0.3408, + "step": 80972 + }, + { + "epoch": 2.08, + "learning_rate": 4.5819369270618937e-07, + "loss": 0.4417, + "step": 80973 + }, + { + "epoch": 2.08, + "learning_rate": 4.581704358036902e-07, + "loss": 0.4163, + "step": 80974 + }, + { + "epoch": 2.08, + "learning_rate": 4.581471793160445e-07, + "loss": 0.3525, + "step": 80975 + }, + { + "epoch": 2.08, + "learning_rate": 4.581239232432711e-07, + "loss": 0.3153, + "step": 80976 + }, + { + "epoch": 2.08, + "learning_rate": 4.581006675853869e-07, + "loss": 0.5103, + "step": 80977 + }, + { + "epoch": 2.08, + "learning_rate": 4.580774123424104e-07, + "loss": 0.4155, + "step": 80978 + }, + { + "epoch": 2.08, + "learning_rate": 4.5805415751435885e-07, + "loss": 0.4902, + "step": 80979 + }, + { + "epoch": 2.08, + "learning_rate": 4.5803090310125027e-07, + "loss": 0.4292, + "step": 80980 + }, + { + "epoch": 2.08, + "learning_rate": 4.580076491031024e-07, + "loss": 0.3821, + "step": 80981 + }, + { + "epoch": 2.08, + "learning_rate": 4.5798439551993364e-07, + "loss": 0.4482, + "step": 80982 + }, + { + "epoch": 2.08, + "learning_rate": 4.579611423517609e-07, + "loss": 0.3353, + "step": 80983 + }, + { + "epoch": 2.08, + "learning_rate": 4.5793788959860237e-07, + "loss": 0.3965, + "step": 80984 + }, + { + "epoch": 2.08, + "learning_rate": 4.579146372604763e-07, + "loss": 0.5205, + "step": 80985 + }, + { + "epoch": 2.08, + "learning_rate": 4.5789138533739956e-07, + "loss": 0.4192, + "step": 80986 + }, + { + "epoch": 2.08, + "learning_rate": 4.5786813382939096e-07, + "loss": 0.2108, + "step": 80987 + }, + { + "epoch": 2.08, + "learning_rate": 4.5784488273646736e-07, + "loss": 0.2762, + "step": 80988 + }, + { + "epoch": 2.08, + "learning_rate": 4.578216320586471e-07, + "loss": 0.4482, + "step": 80989 + }, + { + "epoch": 2.08, + "learning_rate": 4.577983817959479e-07, + "loss": 0.1984, + "step": 80990 + }, + { + "epoch": 2.08, + "learning_rate": 4.577751319483878e-07, + "loss": 0.3457, + "step": 80991 + }, + { + "epoch": 2.08, + "learning_rate": 4.5775188251598397e-07, + "loss": 0.5044, + "step": 80992 + }, + { + "epoch": 2.08, + "learning_rate": 4.577286334987547e-07, + "loss": 0.3745, + "step": 80993 + }, + { + "epoch": 2.08, + "learning_rate": 4.5770538489671797e-07, + "loss": 0.4868, + "step": 80994 + }, + { + "epoch": 2.08, + "learning_rate": 4.576821367098913e-07, + "loss": 0.3101, + "step": 80995 + }, + { + "epoch": 2.08, + "learning_rate": 4.576588889382922e-07, + "loss": 0.3082, + "step": 80996 + }, + { + "epoch": 2.08, + "learning_rate": 4.5763564158193866e-07, + "loss": 0.4463, + "step": 80997 + }, + { + "epoch": 2.08, + "learning_rate": 4.5761239464084854e-07, + "loss": 0.3945, + "step": 80998 + }, + { + "epoch": 2.08, + "learning_rate": 4.5758914811504014e-07, + "loss": 0.439, + "step": 80999 + }, + { + "epoch": 2.08, + "learning_rate": 4.5756590200453035e-07, + "loss": 0.4399, + "step": 81000 + }, + { + "epoch": 2.08, + "learning_rate": 4.575426563093374e-07, + "loss": 0.4028, + "step": 81001 + }, + { + "epoch": 2.08, + "learning_rate": 4.575194110294791e-07, + "loss": 0.3462, + "step": 81002 + }, + { + "epoch": 2.08, + "learning_rate": 4.5749616616497367e-07, + "loss": 0.4961, + "step": 81003 + }, + { + "epoch": 2.08, + "learning_rate": 4.5747292171583807e-07, + "loss": 0.5342, + "step": 81004 + }, + { + "epoch": 2.08, + "learning_rate": 4.5744967768209097e-07, + "loss": 0.4072, + "step": 81005 + }, + { + "epoch": 2.08, + "learning_rate": 4.5742643406374915e-07, + "loss": 0.5142, + "step": 81006 + }, + { + "epoch": 2.08, + "learning_rate": 4.574031908608311e-07, + "loss": 0.3945, + "step": 81007 + }, + { + "epoch": 2.08, + "learning_rate": 4.573799480733548e-07, + "loss": 0.3188, + "step": 81008 + }, + { + "epoch": 2.08, + "learning_rate": 4.573567057013373e-07, + "loss": 0.3711, + "step": 81009 + }, + { + "epoch": 2.08, + "learning_rate": 4.5733346374479697e-07, + "loss": 0.4585, + "step": 81010 + }, + { + "epoch": 2.08, + "learning_rate": 4.573102222037517e-07, + "loss": 0.3738, + "step": 81011 + }, + { + "epoch": 2.08, + "learning_rate": 4.572869810782187e-07, + "loss": 0.4846, + "step": 81012 + }, + { + "epoch": 2.08, + "learning_rate": 4.5726374036821615e-07, + "loss": 0.3333, + "step": 81013 + }, + { + "epoch": 2.08, + "learning_rate": 4.572405000737617e-07, + "loss": 0.5039, + "step": 81014 + }, + { + "epoch": 2.08, + "learning_rate": 4.572172601948737e-07, + "loss": 0.4023, + "step": 81015 + }, + { + "epoch": 2.08, + "learning_rate": 4.5719402073156944e-07, + "loss": 0.3481, + "step": 81016 + }, + { + "epoch": 2.08, + "learning_rate": 4.571707816838665e-07, + "loss": 0.4653, + "step": 81017 + }, + { + "epoch": 2.08, + "learning_rate": 4.571475430517828e-07, + "loss": 0.437, + "step": 81018 + }, + { + "epoch": 2.08, + "learning_rate": 4.5712430483533627e-07, + "loss": 0.3309, + "step": 81019 + }, + { + "epoch": 2.08, + "learning_rate": 4.571010670345451e-07, + "loss": 0.356, + "step": 81020 + }, + { + "epoch": 2.08, + "learning_rate": 4.5707782964942633e-07, + "loss": 0.3893, + "step": 81021 + }, + { + "epoch": 2.08, + "learning_rate": 4.57054592679998e-07, + "loss": 0.3689, + "step": 81022 + }, + { + "epoch": 2.08, + "learning_rate": 4.5703135612627817e-07, + "loss": 0.4429, + "step": 81023 + }, + { + "epoch": 2.08, + "learning_rate": 4.570081199882847e-07, + "loss": 0.4614, + "step": 81024 + }, + { + "epoch": 2.08, + "learning_rate": 4.569848842660352e-07, + "loss": 0.3315, + "step": 81025 + }, + { + "epoch": 2.08, + "learning_rate": 4.56961648959547e-07, + "loss": 0.4229, + "step": 81026 + }, + { + "epoch": 2.08, + "learning_rate": 4.569384140688384e-07, + "loss": 0.4829, + "step": 81027 + }, + { + "epoch": 2.08, + "learning_rate": 4.5691517959392735e-07, + "loss": 0.4022, + "step": 81028 + }, + { + "epoch": 2.08, + "learning_rate": 4.5689194553483103e-07, + "loss": 0.4285, + "step": 81029 + }, + { + "epoch": 2.08, + "learning_rate": 4.5686871189156763e-07, + "loss": 0.3672, + "step": 81030 + }, + { + "epoch": 2.08, + "learning_rate": 4.568454786641548e-07, + "loss": 0.2462, + "step": 81031 + }, + { + "epoch": 2.08, + "learning_rate": 4.5682224585261085e-07, + "loss": 0.2977, + "step": 81032 + }, + { + "epoch": 2.08, + "learning_rate": 4.567990134569527e-07, + "loss": 0.4434, + "step": 81033 + }, + { + "epoch": 2.08, + "learning_rate": 4.5677578147719866e-07, + "loss": 0.3784, + "step": 81034 + }, + { + "epoch": 2.08, + "learning_rate": 4.5675254991336663e-07, + "loss": 0.4878, + "step": 81035 + }, + { + "epoch": 2.08, + "learning_rate": 4.5672931876547395e-07, + "loss": 0.4844, + "step": 81036 + }, + { + "epoch": 2.08, + "learning_rate": 4.56706088033539e-07, + "loss": 0.4702, + "step": 81037 + }, + { + "epoch": 2.08, + "learning_rate": 4.5668285771757886e-07, + "loss": 0.4404, + "step": 81038 + }, + { + "epoch": 2.08, + "learning_rate": 4.5665962781761167e-07, + "loss": 0.3389, + "step": 81039 + }, + { + "epoch": 2.08, + "learning_rate": 4.5663639833365517e-07, + "loss": 0.4595, + "step": 81040 + }, + { + "epoch": 2.08, + "learning_rate": 4.566131692657276e-07, + "loss": 0.3373, + "step": 81041 + }, + { + "epoch": 2.08, + "learning_rate": 4.5658994061384603e-07, + "loss": 0.4893, + "step": 81042 + }, + { + "epoch": 2.08, + "learning_rate": 4.565667123780285e-07, + "loss": 0.3265, + "step": 81043 + }, + { + "epoch": 2.08, + "learning_rate": 4.5654348455829283e-07, + "loss": 0.3408, + "step": 81044 + }, + { + "epoch": 2.08, + "learning_rate": 4.5652025715465757e-07, + "loss": 0.3152, + "step": 81045 + }, + { + "epoch": 2.08, + "learning_rate": 4.5649703016713905e-07, + "loss": 0.0738, + "step": 81046 + }, + { + "epoch": 2.08, + "learning_rate": 4.564738035957557e-07, + "loss": 0.3961, + "step": 81047 + }, + { + "epoch": 2.08, + "learning_rate": 4.564505774405254e-07, + "loss": 0.52, + "step": 81048 + }, + { + "epoch": 2.08, + "learning_rate": 4.564273517014663e-07, + "loss": 0.3274, + "step": 81049 + }, + { + "epoch": 2.08, + "learning_rate": 4.564041263785954e-07, + "loss": 0.5005, + "step": 81050 + }, + { + "epoch": 2.08, + "learning_rate": 4.5638090147193087e-07, + "loss": 0.4487, + "step": 81051 + }, + { + "epoch": 2.08, + "learning_rate": 4.563576769814904e-07, + "loss": 0.3787, + "step": 81052 + }, + { + "epoch": 2.08, + "learning_rate": 4.563344529072923e-07, + "loss": 0.4873, + "step": 81053 + }, + { + "epoch": 2.08, + "learning_rate": 4.5631122924935363e-07, + "loss": 0.3833, + "step": 81054 + }, + { + "epoch": 2.08, + "learning_rate": 4.562880060076927e-07, + "loss": 0.3179, + "step": 81055 + }, + { + "epoch": 2.08, + "learning_rate": 4.562647831823268e-07, + "loss": 0.4272, + "step": 81056 + }, + { + "epoch": 2.08, + "learning_rate": 4.562415607732738e-07, + "loss": 0.4438, + "step": 81057 + }, + { + "epoch": 2.08, + "learning_rate": 4.5621833878055203e-07, + "loss": 0.4419, + "step": 81058 + }, + { + "epoch": 2.08, + "learning_rate": 4.561951172041786e-07, + "loss": 0.4344, + "step": 81059 + }, + { + "epoch": 2.08, + "learning_rate": 4.561718960441715e-07, + "loss": 0.3176, + "step": 81060 + }, + { + "epoch": 2.08, + "learning_rate": 4.5614867530054855e-07, + "loss": 0.3455, + "step": 81061 + }, + { + "epoch": 2.08, + "learning_rate": 4.56125454973328e-07, + "loss": 0.4795, + "step": 81062 + }, + { + "epoch": 2.08, + "learning_rate": 4.561022350625268e-07, + "loss": 0.266, + "step": 81063 + }, + { + "epoch": 2.08, + "learning_rate": 4.560790155681631e-07, + "loss": 0.405, + "step": 81064 + }, + { + "epoch": 2.08, + "learning_rate": 4.5605579649025496e-07, + "loss": 0.4434, + "step": 81065 + }, + { + "epoch": 2.08, + "learning_rate": 4.5603257782882e-07, + "loss": 0.326, + "step": 81066 + }, + { + "epoch": 2.08, + "learning_rate": 4.5600935958387545e-07, + "loss": 0.2787, + "step": 81067 + }, + { + "epoch": 2.08, + "learning_rate": 4.559861417554395e-07, + "loss": 0.3594, + "step": 81068 + }, + { + "epoch": 2.08, + "learning_rate": 4.5596292434353e-07, + "loss": 0.3599, + "step": 81069 + }, + { + "epoch": 2.08, + "learning_rate": 4.55939707348165e-07, + "loss": 0.333, + "step": 81070 + }, + { + "epoch": 2.08, + "learning_rate": 4.5591649076936166e-07, + "loss": 0.3982, + "step": 81071 + }, + { + "epoch": 2.08, + "learning_rate": 4.55893274607138e-07, + "loss": 0.3979, + "step": 81072 + }, + { + "epoch": 2.08, + "learning_rate": 4.558700588615119e-07, + "loss": 0.4375, + "step": 81073 + }, + { + "epoch": 2.08, + "learning_rate": 4.558468435325014e-07, + "loss": 0.4314, + "step": 81074 + }, + { + "epoch": 2.08, + "learning_rate": 4.558236286201238e-07, + "loss": 0.4448, + "step": 81075 + }, + { + "epoch": 2.08, + "learning_rate": 4.5580041412439686e-07, + "loss": 0.4785, + "step": 81076 + }, + { + "epoch": 2.08, + "learning_rate": 4.557772000453385e-07, + "loss": 0.3773, + "step": 81077 + }, + { + "epoch": 2.08, + "learning_rate": 4.5575398638296635e-07, + "loss": 0.4971, + "step": 81078 + }, + { + "epoch": 2.08, + "learning_rate": 4.557307731372989e-07, + "loss": 0.4023, + "step": 81079 + }, + { + "epoch": 2.08, + "learning_rate": 4.557075603083529e-07, + "loss": 0.5034, + "step": 81080 + }, + { + "epoch": 2.08, + "learning_rate": 4.556843478961466e-07, + "loss": 0.4312, + "step": 81081 + }, + { + "epoch": 2.08, + "learning_rate": 4.5566113590069786e-07, + "loss": 0.3787, + "step": 81082 + }, + { + "epoch": 2.08, + "learning_rate": 4.556379243220246e-07, + "loss": 0.4087, + "step": 81083 + }, + { + "epoch": 2.08, + "learning_rate": 4.556147131601441e-07, + "loss": 0.3533, + "step": 81084 + }, + { + "epoch": 2.08, + "learning_rate": 4.555915024150747e-07, + "loss": 0.3555, + "step": 81085 + }, + { + "epoch": 2.08, + "learning_rate": 4.5556829208683347e-07, + "loss": 0.3994, + "step": 81086 + }, + { + "epoch": 2.08, + "learning_rate": 4.5554508217543897e-07, + "loss": 0.4937, + "step": 81087 + }, + { + "epoch": 2.08, + "learning_rate": 4.5552187268090814e-07, + "loss": 0.366, + "step": 81088 + }, + { + "epoch": 2.08, + "learning_rate": 4.554986636032592e-07, + "loss": 0.3989, + "step": 81089 + }, + { + "epoch": 2.08, + "learning_rate": 4.5547545494250994e-07, + "loss": 0.3418, + "step": 81090 + }, + { + "epoch": 2.08, + "learning_rate": 4.554522466986784e-07, + "loss": 0.5239, + "step": 81091 + }, + { + "epoch": 2.08, + "learning_rate": 4.554290388717816e-07, + "loss": 0.5151, + "step": 81092 + }, + { + "epoch": 2.08, + "learning_rate": 4.554058314618379e-07, + "loss": 0.3779, + "step": 81093 + }, + { + "epoch": 2.08, + "learning_rate": 4.553826244688649e-07, + "loss": 0.4111, + "step": 81094 + }, + { + "epoch": 2.08, + "learning_rate": 4.553594178928807e-07, + "loss": 0.1779, + "step": 81095 + }, + { + "epoch": 2.08, + "learning_rate": 4.5533621173390266e-07, + "loss": 0.3248, + "step": 81096 + }, + { + "epoch": 2.08, + "learning_rate": 4.5531300599194833e-07, + "loss": 0.2855, + "step": 81097 + }, + { + "epoch": 2.08, + "learning_rate": 4.552898006670358e-07, + "loss": 0.3406, + "step": 81098 + }, + { + "epoch": 2.08, + "learning_rate": 4.5526659575918293e-07, + "loss": 0.4355, + "step": 81099 + }, + { + "epoch": 2.08, + "learning_rate": 4.552433912684076e-07, + "loss": 0.3799, + "step": 81100 + }, + { + "epoch": 2.08, + "learning_rate": 4.552201871947271e-07, + "loss": 0.4272, + "step": 81101 + }, + { + "epoch": 2.08, + "learning_rate": 4.551969835381594e-07, + "loss": 0.4829, + "step": 81102 + }, + { + "epoch": 2.08, + "learning_rate": 4.5517378029872265e-07, + "loss": 0.3234, + "step": 81103 + }, + { + "epoch": 2.08, + "learning_rate": 4.5515057747643393e-07, + "loss": 0.5107, + "step": 81104 + }, + { + "epoch": 2.08, + "learning_rate": 4.5512737507131174e-07, + "loss": 0.3079, + "step": 81105 + }, + { + "epoch": 2.08, + "learning_rate": 4.551041730833731e-07, + "loss": 0.3009, + "step": 81106 + }, + { + "epoch": 2.08, + "learning_rate": 4.5508097151263614e-07, + "loss": 0.5435, + "step": 81107 + }, + { + "epoch": 2.08, + "learning_rate": 4.5505777035911895e-07, + "loss": 0.3958, + "step": 81108 + }, + { + "epoch": 2.08, + "learning_rate": 4.550345696228387e-07, + "loss": 0.625, + "step": 81109 + }, + { + "epoch": 2.08, + "learning_rate": 4.5501136930381334e-07, + "loss": 0.3657, + "step": 81110 + }, + { + "epoch": 2.08, + "learning_rate": 4.5498816940206076e-07, + "loss": 0.5117, + "step": 81111 + }, + { + "epoch": 2.08, + "learning_rate": 4.54964969917599e-07, + "loss": 0.4023, + "step": 81112 + }, + { + "epoch": 2.08, + "learning_rate": 4.5494177085044515e-07, + "loss": 0.5376, + "step": 81113 + }, + { + "epoch": 2.08, + "learning_rate": 4.549185722006174e-07, + "loss": 0.3667, + "step": 81114 + }, + { + "epoch": 2.08, + "learning_rate": 4.548953739681337e-07, + "loss": 0.4116, + "step": 81115 + }, + { + "epoch": 2.08, + "learning_rate": 4.548721761530112e-07, + "loss": 0.3187, + "step": 81116 + }, + { + "epoch": 2.08, + "learning_rate": 4.548489787552685e-07, + "loss": 0.3555, + "step": 81117 + }, + { + "epoch": 2.08, + "learning_rate": 4.548257817749224e-07, + "loss": 0.3943, + "step": 81118 + }, + { + "epoch": 2.08, + "learning_rate": 4.548025852119911e-07, + "loss": 0.3984, + "step": 81119 + }, + { + "epoch": 2.08, + "learning_rate": 4.5477938906649283e-07, + "loss": 0.239, + "step": 81120 + }, + { + "epoch": 2.08, + "learning_rate": 4.547561933384444e-07, + "loss": 0.3975, + "step": 81121 + }, + { + "epoch": 2.08, + "learning_rate": 4.547329980278642e-07, + "loss": 0.2649, + "step": 81122 + }, + { + "epoch": 2.08, + "learning_rate": 4.5470980313476993e-07, + "loss": 0.4893, + "step": 81123 + }, + { + "epoch": 2.08, + "learning_rate": 4.546866086591795e-07, + "loss": 0.3909, + "step": 81124 + }, + { + "epoch": 2.08, + "learning_rate": 4.5466341460111056e-07, + "loss": 0.3452, + "step": 81125 + }, + { + "epoch": 2.08, + "learning_rate": 4.546402209605804e-07, + "loss": 0.3313, + "step": 81126 + }, + { + "epoch": 2.08, + "learning_rate": 4.5461702773760714e-07, + "loss": 0.5122, + "step": 81127 + }, + { + "epoch": 2.08, + "learning_rate": 4.545938349322085e-07, + "loss": 0.4199, + "step": 81128 + }, + { + "epoch": 2.08, + "learning_rate": 4.545706425444027e-07, + "loss": 0.3809, + "step": 81129 + }, + { + "epoch": 2.08, + "learning_rate": 4.545474505742067e-07, + "loss": 0.3672, + "step": 81130 + }, + { + "epoch": 2.08, + "learning_rate": 4.545242590216386e-07, + "loss": 0.4617, + "step": 81131 + }, + { + "epoch": 2.08, + "learning_rate": 4.545010678867163e-07, + "loss": 0.4307, + "step": 81132 + }, + { + "epoch": 2.08, + "learning_rate": 4.5447787716945773e-07, + "loss": 0.4348, + "step": 81133 + }, + { + "epoch": 2.08, + "learning_rate": 4.5445468686987997e-07, + "loss": 0.4262, + "step": 81134 + }, + { + "epoch": 2.08, + "learning_rate": 4.544314969880017e-07, + "loss": 0.479, + "step": 81135 + }, + { + "epoch": 2.08, + "learning_rate": 4.5440830752383964e-07, + "loss": 0.3804, + "step": 81136 + }, + { + "epoch": 2.08, + "learning_rate": 4.5438511847741234e-07, + "loss": 0.2686, + "step": 81137 + }, + { + "epoch": 2.08, + "learning_rate": 4.5436192984873703e-07, + "loss": 0.324, + "step": 81138 + }, + { + "epoch": 2.08, + "learning_rate": 4.543387416378317e-07, + "loss": 0.4751, + "step": 81139 + }, + { + "epoch": 2.08, + "learning_rate": 4.543155538447141e-07, + "loss": 0.3643, + "step": 81140 + }, + { + "epoch": 2.08, + "learning_rate": 4.542923664694023e-07, + "loss": 0.3207, + "step": 81141 + }, + { + "epoch": 2.08, + "learning_rate": 4.5426917951191335e-07, + "loss": 0.4902, + "step": 81142 + }, + { + "epoch": 2.08, + "learning_rate": 4.542459929722655e-07, + "loss": 0.3528, + "step": 81143 + }, + { + "epoch": 2.08, + "learning_rate": 4.542228068504763e-07, + "loss": 0.3887, + "step": 81144 + }, + { + "epoch": 2.08, + "learning_rate": 4.5419962114656405e-07, + "loss": 0.4521, + "step": 81145 + }, + { + "epoch": 2.08, + "learning_rate": 4.541764358605461e-07, + "loss": 0.2946, + "step": 81146 + }, + { + "epoch": 2.08, + "learning_rate": 4.541532509924396e-07, + "loss": 0.448, + "step": 81147 + }, + { + "epoch": 2.08, + "learning_rate": 4.5413006654226306e-07, + "loss": 0.3921, + "step": 81148 + }, + { + "epoch": 2.08, + "learning_rate": 4.5410688251003395e-07, + "loss": 0.5112, + "step": 81149 + }, + { + "epoch": 2.08, + "learning_rate": 4.5408369889577045e-07, + "loss": 0.4775, + "step": 81150 + }, + { + "epoch": 2.08, + "learning_rate": 4.5406051569948954e-07, + "loss": 0.4805, + "step": 81151 + }, + { + "epoch": 2.08, + "learning_rate": 4.540373329212095e-07, + "loss": 0.3934, + "step": 81152 + }, + { + "epoch": 2.08, + "learning_rate": 4.5401415056094793e-07, + "loss": 0.4731, + "step": 81153 + }, + { + "epoch": 2.08, + "learning_rate": 4.5399096861872286e-07, + "loss": 0.3423, + "step": 81154 + }, + { + "epoch": 2.08, + "learning_rate": 4.5396778709455196e-07, + "loss": 0.4316, + "step": 81155 + }, + { + "epoch": 2.08, + "learning_rate": 4.5394460598845243e-07, + "loss": 0.4648, + "step": 81156 + }, + { + "epoch": 2.08, + "learning_rate": 4.5392142530044244e-07, + "loss": 0.397, + "step": 81157 + }, + { + "epoch": 2.08, + "learning_rate": 4.5389824503054e-07, + "loss": 0.385, + "step": 81158 + }, + { + "epoch": 2.08, + "learning_rate": 4.5387506517876215e-07, + "loss": 0.3943, + "step": 81159 + }, + { + "epoch": 2.08, + "learning_rate": 4.538518857451271e-07, + "loss": 0.4219, + "step": 81160 + }, + { + "epoch": 2.08, + "learning_rate": 4.5382870672965255e-07, + "loss": 0.3501, + "step": 81161 + }, + { + "epoch": 2.08, + "learning_rate": 4.538055281323566e-07, + "loss": 0.4087, + "step": 81162 + }, + { + "epoch": 2.08, + "learning_rate": 4.5378234995325636e-07, + "loss": 0.4717, + "step": 81163 + }, + { + "epoch": 2.08, + "learning_rate": 4.5375917219236983e-07, + "loss": 0.4517, + "step": 81164 + }, + { + "epoch": 2.08, + "learning_rate": 4.5373599484971514e-07, + "loss": 0.3096, + "step": 81165 + }, + { + "epoch": 2.08, + "learning_rate": 4.537128179253092e-07, + "loss": 0.3406, + "step": 81166 + }, + { + "epoch": 2.08, + "learning_rate": 4.536896414191708e-07, + "loss": 0.4258, + "step": 81167 + }, + { + "epoch": 2.08, + "learning_rate": 4.5366646533131657e-07, + "loss": 0.3049, + "step": 81168 + }, + { + "epoch": 2.08, + "learning_rate": 4.536432896617649e-07, + "loss": 0.2534, + "step": 81169 + }, + { + "epoch": 2.08, + "learning_rate": 4.5362011441053336e-07, + "loss": 0.3369, + "step": 81170 + }, + { + "epoch": 2.08, + "learning_rate": 4.535969395776403e-07, + "loss": 0.4565, + "step": 81171 + }, + { + "epoch": 2.08, + "learning_rate": 4.535737651631024e-07, + "loss": 0.4717, + "step": 81172 + }, + { + "epoch": 2.08, + "learning_rate": 4.535505911669381e-07, + "loss": 0.4238, + "step": 81173 + }, + { + "epoch": 2.08, + "learning_rate": 4.535274175891652e-07, + "loss": 0.3491, + "step": 81174 + }, + { + "epoch": 2.08, + "learning_rate": 4.5350424442980137e-07, + "loss": 0.4429, + "step": 81175 + }, + { + "epoch": 2.08, + "learning_rate": 4.5348107168886387e-07, + "loss": 0.5044, + "step": 81176 + }, + { + "epoch": 2.08, + "learning_rate": 4.534578993663706e-07, + "loss": 0.3821, + "step": 81177 + }, + { + "epoch": 2.08, + "learning_rate": 4.534347274623396e-07, + "loss": 0.3945, + "step": 81178 + }, + { + "epoch": 2.08, + "learning_rate": 4.534115559767888e-07, + "loss": 0.2937, + "step": 81179 + }, + { + "epoch": 2.08, + "learning_rate": 4.5338838490973543e-07, + "loss": 0.4209, + "step": 81180 + }, + { + "epoch": 2.08, + "learning_rate": 4.533652142611972e-07, + "loss": 0.3181, + "step": 81181 + }, + { + "epoch": 2.08, + "learning_rate": 4.5334204403119226e-07, + "loss": 0.3687, + "step": 81182 + }, + { + "epoch": 2.08, + "learning_rate": 4.533188742197386e-07, + "loss": 0.3997, + "step": 81183 + }, + { + "epoch": 2.08, + "learning_rate": 4.5329570482685297e-07, + "loss": 0.4431, + "step": 81184 + }, + { + "epoch": 2.08, + "learning_rate": 4.532725358525542e-07, + "loss": 0.4824, + "step": 81185 + }, + { + "epoch": 2.08, + "learning_rate": 4.5324936729685915e-07, + "loss": 0.3035, + "step": 81186 + }, + { + "epoch": 2.08, + "learning_rate": 4.532261991597858e-07, + "loss": 0.3311, + "step": 81187 + }, + { + "epoch": 2.08, + "learning_rate": 4.5320303144135244e-07, + "loss": 0.4629, + "step": 81188 + }, + { + "epoch": 2.08, + "learning_rate": 4.5317986414157607e-07, + "loss": 0.4756, + "step": 81189 + }, + { + "epoch": 2.08, + "learning_rate": 4.531566972604747e-07, + "loss": 0.4893, + "step": 81190 + }, + { + "epoch": 2.08, + "learning_rate": 4.5313353079806637e-07, + "loss": 0.4956, + "step": 81191 + }, + { + "epoch": 2.08, + "learning_rate": 4.5311036475436824e-07, + "loss": 0.3508, + "step": 81192 + }, + { + "epoch": 2.08, + "learning_rate": 4.530871991293984e-07, + "loss": 0.4722, + "step": 81193 + }, + { + "epoch": 2.08, + "learning_rate": 4.530640339231745e-07, + "loss": 0.5303, + "step": 81194 + }, + { + "epoch": 2.08, + "learning_rate": 4.530408691357147e-07, + "loss": 0.3403, + "step": 81195 + }, + { + "epoch": 2.08, + "learning_rate": 4.530177047670364e-07, + "loss": 0.4844, + "step": 81196 + }, + { + "epoch": 2.08, + "learning_rate": 4.529945408171569e-07, + "loss": 0.3848, + "step": 81197 + }, + { + "epoch": 2.08, + "learning_rate": 4.5297137728609436e-07, + "loss": 0.4211, + "step": 81198 + }, + { + "epoch": 2.08, + "learning_rate": 4.529482141738664e-07, + "loss": 0.3257, + "step": 81199 + }, + { + "epoch": 2.08, + "learning_rate": 4.529250514804912e-07, + "loss": 0.2804, + "step": 81200 + }, + { + "epoch": 2.08, + "learning_rate": 4.529018892059858e-07, + "loss": 0.4702, + "step": 81201 + }, + { + "epoch": 2.08, + "learning_rate": 4.5287872735036835e-07, + "loss": 0.4648, + "step": 81202 + }, + { + "epoch": 2.08, + "learning_rate": 4.528555659136565e-07, + "loss": 0.3356, + "step": 81203 + }, + { + "epoch": 2.08, + "learning_rate": 4.5283240489586826e-07, + "loss": 0.3291, + "step": 81204 + }, + { + "epoch": 2.08, + "learning_rate": 4.5280924429702105e-07, + "loss": 0.4268, + "step": 81205 + }, + { + "epoch": 2.08, + "learning_rate": 4.527860841171324e-07, + "loss": 0.3575, + "step": 81206 + }, + { + "epoch": 2.08, + "learning_rate": 4.527629243562202e-07, + "loss": 0.4902, + "step": 81207 + }, + { + "epoch": 2.08, + "learning_rate": 4.527397650143027e-07, + "loss": 0.4727, + "step": 81208 + }, + { + "epoch": 2.08, + "learning_rate": 4.527166060913967e-07, + "loss": 0.4932, + "step": 81209 + }, + { + "epoch": 2.08, + "learning_rate": 4.526934475875205e-07, + "loss": 0.3394, + "step": 81210 + }, + { + "epoch": 2.08, + "learning_rate": 4.526702895026918e-07, + "loss": 0.4614, + "step": 81211 + }, + { + "epoch": 2.08, + "learning_rate": 4.526471318369286e-07, + "loss": 0.4092, + "step": 81212 + }, + { + "epoch": 2.08, + "learning_rate": 4.5262397459024803e-07, + "loss": 0.4761, + "step": 81213 + }, + { + "epoch": 2.08, + "learning_rate": 4.526008177626681e-07, + "loss": 0.4473, + "step": 81214 + }, + { + "epoch": 2.08, + "learning_rate": 4.525776613542068e-07, + "loss": 0.5039, + "step": 81215 + }, + { + "epoch": 2.08, + "learning_rate": 4.5255450536488135e-07, + "loss": 0.3896, + "step": 81216 + }, + { + "epoch": 2.08, + "learning_rate": 4.525313497947102e-07, + "loss": 0.3064, + "step": 81217 + }, + { + "epoch": 2.08, + "learning_rate": 4.5250819464371013e-07, + "loss": 0.3455, + "step": 81218 + }, + { + "epoch": 2.08, + "learning_rate": 4.5248503991189937e-07, + "loss": 0.3516, + "step": 81219 + }, + { + "epoch": 2.08, + "learning_rate": 4.5246188559929563e-07, + "loss": 0.324, + "step": 81220 + }, + { + "epoch": 2.08, + "learning_rate": 4.5243873170591704e-07, + "loss": 0.3624, + "step": 81221 + }, + { + "epoch": 2.08, + "learning_rate": 4.524155782317807e-07, + "loss": 0.3833, + "step": 81222 + }, + { + "epoch": 2.08, + "learning_rate": 4.5239242517690436e-07, + "loss": 0.3523, + "step": 81223 + }, + { + "epoch": 2.08, + "learning_rate": 4.5236927254130607e-07, + "loss": 0.5186, + "step": 81224 + }, + { + "epoch": 2.08, + "learning_rate": 4.5234612032500416e-07, + "loss": 0.4124, + "step": 81225 + }, + { + "epoch": 2.08, + "learning_rate": 4.5232296852801486e-07, + "loss": 0.3147, + "step": 81226 + }, + { + "epoch": 2.08, + "learning_rate": 4.5229981715035684e-07, + "loss": 0.4497, + "step": 81227 + }, + { + "epoch": 2.08, + "learning_rate": 4.522766661920475e-07, + "loss": 0.2792, + "step": 81228 + }, + { + "epoch": 2.08, + "learning_rate": 4.522535156531051e-07, + "loss": 0.2914, + "step": 81229 + }, + { + "epoch": 2.08, + "learning_rate": 4.5223036553354666e-07, + "loss": 0.4146, + "step": 81230 + }, + { + "epoch": 2.08, + "learning_rate": 4.5220721583339027e-07, + "loss": 0.5195, + "step": 81231 + }, + { + "epoch": 2.08, + "learning_rate": 4.5218406655265363e-07, + "loss": 0.3254, + "step": 81232 + }, + { + "epoch": 2.08, + "learning_rate": 4.521609176913549e-07, + "loss": 0.3103, + "step": 81233 + }, + { + "epoch": 2.08, + "learning_rate": 4.5213776924951084e-07, + "loss": 0.3335, + "step": 81234 + }, + { + "epoch": 2.08, + "learning_rate": 4.5211462122714017e-07, + "loss": 0.4219, + "step": 81235 + }, + { + "epoch": 2.08, + "learning_rate": 4.520914736242597e-07, + "loss": 0.406, + "step": 81236 + }, + { + "epoch": 2.08, + "learning_rate": 4.5206832644088765e-07, + "loss": 0.4038, + "step": 81237 + }, + { + "epoch": 2.08, + "learning_rate": 4.52045179677042e-07, + "loss": 0.4238, + "step": 81238 + }, + { + "epoch": 2.08, + "learning_rate": 4.520220333327399e-07, + "loss": 0.4966, + "step": 81239 + }, + { + "epoch": 2.08, + "learning_rate": 4.519988874079993e-07, + "loss": 0.5918, + "step": 81240 + }, + { + "epoch": 2.08, + "learning_rate": 4.519757419028379e-07, + "loss": 0.3304, + "step": 81241 + }, + { + "epoch": 2.08, + "learning_rate": 4.5195259681727394e-07, + "loss": 0.4609, + "step": 81242 + }, + { + "epoch": 2.08, + "learning_rate": 4.5192945215132415e-07, + "loss": 0.5195, + "step": 81243 + }, + { + "epoch": 2.08, + "learning_rate": 4.519063079050069e-07, + "loss": 0.5107, + "step": 81244 + }, + { + "epoch": 2.08, + "learning_rate": 4.5188316407834015e-07, + "loss": 0.2512, + "step": 81245 + }, + { + "epoch": 2.08, + "learning_rate": 4.518600206713412e-07, + "loss": 0.4526, + "step": 81246 + }, + { + "epoch": 2.08, + "learning_rate": 4.5183687768402744e-07, + "loss": 0.3308, + "step": 81247 + }, + { + "epoch": 2.08, + "learning_rate": 4.5181373511641707e-07, + "loss": 0.5073, + "step": 81248 + }, + { + "epoch": 2.08, + "learning_rate": 4.5179059296852773e-07, + "loss": 0.4165, + "step": 81249 + }, + { + "epoch": 2.08, + "learning_rate": 4.517674512403774e-07, + "loss": 0.4009, + "step": 81250 + }, + { + "epoch": 2.08, + "learning_rate": 4.517443099319832e-07, + "loss": 0.5098, + "step": 81251 + }, + { + "epoch": 2.08, + "learning_rate": 4.517211690433632e-07, + "loss": 0.3621, + "step": 81252 + }, + { + "epoch": 2.08, + "learning_rate": 4.51698028574535e-07, + "loss": 0.5952, + "step": 81253 + }, + { + "epoch": 2.08, + "learning_rate": 4.5167488852551683e-07, + "loss": 0.5713, + "step": 81254 + }, + { + "epoch": 2.08, + "learning_rate": 4.5165174889632607e-07, + "loss": 0.479, + "step": 81255 + }, + { + "epoch": 2.08, + "learning_rate": 4.516286096869798e-07, + "loss": 0.3732, + "step": 81256 + }, + { + "epoch": 2.08, + "learning_rate": 4.5160547089749645e-07, + "loss": 0.4507, + "step": 81257 + }, + { + "epoch": 2.08, + "learning_rate": 4.5158233252789345e-07, + "loss": 0.4346, + "step": 81258 + }, + { + "epoch": 2.08, + "learning_rate": 4.515591945781891e-07, + "loss": 0.4666, + "step": 81259 + }, + { + "epoch": 2.08, + "learning_rate": 4.515360570484003e-07, + "loss": 0.5093, + "step": 81260 + }, + { + "epoch": 2.08, + "learning_rate": 4.515129199385451e-07, + "loss": 0.4619, + "step": 81261 + }, + { + "epoch": 2.08, + "learning_rate": 4.5148978324864116e-07, + "loss": 0.4329, + "step": 81262 + }, + { + "epoch": 2.08, + "learning_rate": 4.514666469787067e-07, + "loss": 0.4908, + "step": 81263 + }, + { + "epoch": 2.08, + "learning_rate": 4.5144351112875864e-07, + "loss": 0.3843, + "step": 81264 + }, + { + "epoch": 2.08, + "learning_rate": 4.514203756988155e-07, + "loss": 0.5415, + "step": 81265 + }, + { + "epoch": 2.08, + "learning_rate": 4.5139724068889404e-07, + "loss": 0.4146, + "step": 81266 + }, + { + "epoch": 2.08, + "learning_rate": 4.5137410609901303e-07, + "loss": 0.3284, + "step": 81267 + }, + { + "epoch": 2.08, + "learning_rate": 4.5135097192918916e-07, + "loss": 0.3691, + "step": 81268 + }, + { + "epoch": 2.08, + "learning_rate": 4.5132783817944065e-07, + "loss": 0.4521, + "step": 81269 + }, + { + "epoch": 2.08, + "learning_rate": 4.513047048497851e-07, + "loss": 0.3281, + "step": 81270 + }, + { + "epoch": 2.08, + "learning_rate": 4.5128157194024075e-07, + "loss": 0.2812, + "step": 81271 + }, + { + "epoch": 2.08, + "learning_rate": 4.5125843945082453e-07, + "loss": 0.5186, + "step": 81272 + }, + { + "epoch": 2.08, + "learning_rate": 4.5123530738155444e-07, + "loss": 0.4077, + "step": 81273 + }, + { + "epoch": 2.08, + "learning_rate": 4.5121217573244864e-07, + "loss": 0.4966, + "step": 81274 + }, + { + "epoch": 2.08, + "learning_rate": 4.511890445035241e-07, + "loss": 0.3767, + "step": 81275 + }, + { + "epoch": 2.08, + "learning_rate": 4.511659136947992e-07, + "loss": 0.4132, + "step": 81276 + }, + { + "epoch": 2.08, + "learning_rate": 4.5114278330629096e-07, + "loss": 0.3499, + "step": 81277 + }, + { + "epoch": 2.08, + "learning_rate": 4.511196533380175e-07, + "loss": 0.4106, + "step": 81278 + }, + { + "epoch": 2.08, + "learning_rate": 4.510965237899964e-07, + "loss": 0.4956, + "step": 81279 + }, + { + "epoch": 2.08, + "learning_rate": 4.5107339466224583e-07, + "loss": 0.4712, + "step": 81280 + }, + { + "epoch": 2.08, + "learning_rate": 4.510502659547828e-07, + "loss": 0.3245, + "step": 81281 + }, + { + "epoch": 2.08, + "learning_rate": 4.5102713766762536e-07, + "loss": 0.3774, + "step": 81282 + }, + { + "epoch": 2.08, + "learning_rate": 4.5100400980079155e-07, + "loss": 0.3973, + "step": 81283 + }, + { + "epoch": 2.08, + "learning_rate": 4.5098088235429864e-07, + "loss": 0.3872, + "step": 81284 + }, + { + "epoch": 2.08, + "learning_rate": 4.5095775532816414e-07, + "loss": 0.4033, + "step": 81285 + }, + { + "epoch": 2.08, + "learning_rate": 4.5093462872240606e-07, + "loss": 0.3848, + "step": 81286 + }, + { + "epoch": 2.08, + "learning_rate": 4.50911502537042e-07, + "loss": 0.4771, + "step": 81287 + }, + { + "epoch": 2.08, + "learning_rate": 4.5088837677209025e-07, + "loss": 0.2858, + "step": 81288 + }, + { + "epoch": 2.08, + "learning_rate": 4.508652514275675e-07, + "loss": 0.4814, + "step": 81289 + }, + { + "epoch": 2.08, + "learning_rate": 4.5084212650349207e-07, + "loss": 0.3118, + "step": 81290 + }, + { + "epoch": 2.08, + "learning_rate": 4.5081900199988156e-07, + "loss": 0.4006, + "step": 81291 + }, + { + "epoch": 2.08, + "learning_rate": 4.507958779167541e-07, + "loss": 0.4111, + "step": 81292 + }, + { + "epoch": 2.08, + "learning_rate": 4.5077275425412655e-07, + "loss": 0.3433, + "step": 81293 + }, + { + "epoch": 2.08, + "learning_rate": 4.5074963101201746e-07, + "loss": 0.4546, + "step": 81294 + }, + { + "epoch": 2.08, + "learning_rate": 4.5072650819044366e-07, + "loss": 0.4351, + "step": 81295 + }, + { + "epoch": 2.08, + "learning_rate": 4.5070338578942346e-07, + "loss": 0.4175, + "step": 81296 + }, + { + "epoch": 2.08, + "learning_rate": 4.506802638089747e-07, + "loss": 0.3734, + "step": 81297 + }, + { + "epoch": 2.08, + "learning_rate": 4.5065714224911445e-07, + "loss": 0.3735, + "step": 81298 + }, + { + "epoch": 2.08, + "learning_rate": 4.506340211098607e-07, + "loss": 0.4634, + "step": 81299 + }, + { + "epoch": 2.08, + "learning_rate": 4.506109003912317e-07, + "loss": 0.4233, + "step": 81300 + }, + { + "epoch": 2.08, + "learning_rate": 4.5058778009324425e-07, + "loss": 0.4331, + "step": 81301 + }, + { + "epoch": 2.08, + "learning_rate": 4.5056466021591653e-07, + "loss": 0.4702, + "step": 81302 + }, + { + "epoch": 2.08, + "learning_rate": 4.505415407592661e-07, + "loss": 0.502, + "step": 81303 + }, + { + "epoch": 2.08, + "learning_rate": 4.505184217233111e-07, + "loss": 0.3389, + "step": 81304 + }, + { + "epoch": 2.08, + "learning_rate": 4.5049530310806904e-07, + "loss": 0.3994, + "step": 81305 + }, + { + "epoch": 2.08, + "learning_rate": 4.50472184913557e-07, + "loss": 0.4292, + "step": 81306 + }, + { + "epoch": 2.08, + "learning_rate": 4.50449067139793e-07, + "loss": 0.439, + "step": 81307 + }, + { + "epoch": 2.08, + "learning_rate": 4.5042594978679505e-07, + "loss": 0.5088, + "step": 81308 + }, + { + "epoch": 2.08, + "learning_rate": 4.5040283285458103e-07, + "loss": 0.4531, + "step": 81309 + }, + { + "epoch": 2.08, + "learning_rate": 4.5037971634316784e-07, + "loss": 0.3384, + "step": 81310 + }, + { + "epoch": 2.08, + "learning_rate": 4.503566002525737e-07, + "loss": 0.4922, + "step": 81311 + }, + { + "epoch": 2.08, + "learning_rate": 4.503334845828163e-07, + "loss": 0.3564, + "step": 81312 + }, + { + "epoch": 2.08, + "learning_rate": 4.5031036933391355e-07, + "loss": 0.3745, + "step": 81313 + }, + { + "epoch": 2.08, + "learning_rate": 4.502872545058829e-07, + "loss": 0.2004, + "step": 81314 + }, + { + "epoch": 2.08, + "learning_rate": 4.502641400987416e-07, + "loss": 0.4004, + "step": 81315 + }, + { + "epoch": 2.08, + "learning_rate": 4.502410261125078e-07, + "loss": 0.3385, + "step": 81316 + }, + { + "epoch": 2.08, + "learning_rate": 4.5021791254719955e-07, + "loss": 0.4238, + "step": 81317 + }, + { + "epoch": 2.08, + "learning_rate": 4.5019479940283376e-07, + "loss": 0.5112, + "step": 81318 + }, + { + "epoch": 2.08, + "learning_rate": 4.501716866794286e-07, + "loss": 0.3787, + "step": 81319 + }, + { + "epoch": 2.08, + "learning_rate": 4.501485743770017e-07, + "loss": 0.3015, + "step": 81320 + }, + { + "epoch": 2.08, + "learning_rate": 4.5012546249557105e-07, + "loss": 0.5796, + "step": 81321 + }, + { + "epoch": 2.08, + "learning_rate": 4.501023510351537e-07, + "loss": 0.3751, + "step": 81322 + }, + { + "epoch": 2.08, + "learning_rate": 4.500792399957678e-07, + "loss": 0.4004, + "step": 81323 + }, + { + "epoch": 2.08, + "learning_rate": 4.500561293774312e-07, + "loss": 0.4448, + "step": 81324 + }, + { + "epoch": 2.08, + "learning_rate": 4.50033019180161e-07, + "loss": 0.4272, + "step": 81325 + }, + { + "epoch": 2.08, + "learning_rate": 4.5000990940397556e-07, + "loss": 0.4453, + "step": 81326 + }, + { + "epoch": 2.08, + "learning_rate": 4.499868000488919e-07, + "loss": 0.3309, + "step": 81327 + }, + { + "epoch": 2.08, + "learning_rate": 4.4996369111492806e-07, + "loss": 0.4214, + "step": 81328 + }, + { + "epoch": 2.08, + "learning_rate": 4.499405826021018e-07, + "loss": 0.4751, + "step": 81329 + }, + { + "epoch": 2.08, + "learning_rate": 4.4991747451043094e-07, + "loss": 0.3054, + "step": 81330 + }, + { + "epoch": 2.08, + "learning_rate": 4.4989436683993277e-07, + "loss": 0.4292, + "step": 81331 + }, + { + "epoch": 2.08, + "learning_rate": 4.498712595906251e-07, + "loss": 0.4438, + "step": 81332 + }, + { + "epoch": 2.08, + "learning_rate": 4.4984815276252573e-07, + "loss": 0.4448, + "step": 81333 + }, + { + "epoch": 2.08, + "learning_rate": 4.498250463556531e-07, + "loss": 0.3936, + "step": 81334 + }, + { + "epoch": 2.08, + "learning_rate": 4.498019403700234e-07, + "loss": 0.4211, + "step": 81335 + }, + { + "epoch": 2.08, + "learning_rate": 4.49778834805655e-07, + "loss": 0.522, + "step": 81336 + }, + { + "epoch": 2.08, + "learning_rate": 4.497557296625657e-07, + "loss": 0.5591, + "step": 81337 + }, + { + "epoch": 2.08, + "learning_rate": 4.497326249407735e-07, + "loss": 0.3539, + "step": 81338 + }, + { + "epoch": 2.08, + "learning_rate": 4.497095206402953e-07, + "loss": 0.4358, + "step": 81339 + }, + { + "epoch": 2.08, + "learning_rate": 4.496864167611493e-07, + "loss": 0.4102, + "step": 81340 + }, + { + "epoch": 2.08, + "learning_rate": 4.4966331330335306e-07, + "loss": 0.3267, + "step": 81341 + }, + { + "epoch": 2.08, + "learning_rate": 4.4964021026692466e-07, + "loss": 0.3748, + "step": 81342 + }, + { + "epoch": 2.08, + "learning_rate": 4.496171076518811e-07, + "loss": 0.3785, + "step": 81343 + }, + { + "epoch": 2.08, + "learning_rate": 4.4959400545824076e-07, + "loss": 0.3853, + "step": 81344 + }, + { + "epoch": 2.08, + "learning_rate": 4.495709036860207e-07, + "loss": 0.353, + "step": 81345 + }, + { + "epoch": 2.08, + "learning_rate": 4.495478023352388e-07, + "loss": 0.395, + "step": 81346 + }, + { + "epoch": 2.08, + "learning_rate": 4.4952470140591325e-07, + "loss": 0.3508, + "step": 81347 + }, + { + "epoch": 2.08, + "learning_rate": 4.495016008980609e-07, + "loss": 0.4526, + "step": 81348 + }, + { + "epoch": 2.09, + "learning_rate": 4.494785008116999e-07, + "loss": 0.3813, + "step": 81349 + }, + { + "epoch": 2.09, + "learning_rate": 4.49455401146848e-07, + "loss": 0.5049, + "step": 81350 + }, + { + "epoch": 2.09, + "learning_rate": 4.49432301903523e-07, + "loss": 0.5049, + "step": 81351 + }, + { + "epoch": 2.09, + "learning_rate": 4.4940920308174203e-07, + "loss": 0.3628, + "step": 81352 + }, + { + "epoch": 2.09, + "learning_rate": 4.4938610468152316e-07, + "loss": 0.4402, + "step": 81353 + }, + { + "epoch": 2.09, + "learning_rate": 4.493630067028844e-07, + "loss": 0.4004, + "step": 81354 + }, + { + "epoch": 2.09, + "learning_rate": 4.493399091458431e-07, + "loss": 0.4429, + "step": 81355 + }, + { + "epoch": 2.09, + "learning_rate": 4.4931681201041647e-07, + "loss": 0.4037, + "step": 81356 + }, + { + "epoch": 2.09, + "learning_rate": 4.492937152966226e-07, + "loss": 0.3988, + "step": 81357 + }, + { + "epoch": 2.09, + "learning_rate": 4.492706190044793e-07, + "loss": 0.2332, + "step": 81358 + }, + { + "epoch": 2.09, + "learning_rate": 4.4924752313400447e-07, + "loss": 0.3516, + "step": 81359 + }, + { + "epoch": 2.09, + "learning_rate": 4.492244276852152e-07, + "loss": 0.4272, + "step": 81360 + }, + { + "epoch": 2.09, + "learning_rate": 4.4920133265812945e-07, + "loss": 0.4526, + "step": 81361 + }, + { + "epoch": 2.09, + "learning_rate": 4.4917823805276477e-07, + "loss": 0.4385, + "step": 81362 + }, + { + "epoch": 2.09, + "learning_rate": 4.4915514386913954e-07, + "loss": 0.4556, + "step": 81363 + }, + { + "epoch": 2.09, + "learning_rate": 4.491320501072707e-07, + "loss": 0.4717, + "step": 81364 + }, + { + "epoch": 2.09, + "learning_rate": 4.4910895676717595e-07, + "loss": 0.4443, + "step": 81365 + }, + { + "epoch": 2.09, + "learning_rate": 4.4908586384887305e-07, + "loss": 0.4048, + "step": 81366 + }, + { + "epoch": 2.09, + "learning_rate": 4.490627713523798e-07, + "loss": 0.311, + "step": 81367 + }, + { + "epoch": 2.09, + "learning_rate": 4.4903967927771415e-07, + "loss": 0.2778, + "step": 81368 + }, + { + "epoch": 2.09, + "learning_rate": 4.4901658762489314e-07, + "loss": 0.5142, + "step": 81369 + }, + { + "epoch": 2.09, + "learning_rate": 4.489934963939348e-07, + "loss": 0.2972, + "step": 81370 + }, + { + "epoch": 2.09, + "learning_rate": 4.489704055848572e-07, + "loss": 0.401, + "step": 81371 + }, + { + "epoch": 2.09, + "learning_rate": 4.489473151976773e-07, + "loss": 0.4246, + "step": 81372 + }, + { + "epoch": 2.09, + "learning_rate": 4.4892422523241303e-07, + "loss": 0.396, + "step": 81373 + }, + { + "epoch": 2.09, + "learning_rate": 4.489011356890825e-07, + "loss": 0.4141, + "step": 81374 + }, + { + "epoch": 2.09, + "learning_rate": 4.488780465677027e-07, + "loss": 0.3374, + "step": 81375 + }, + { + "epoch": 2.09, + "learning_rate": 4.4885495786829197e-07, + "loss": 0.481, + "step": 81376 + }, + { + "epoch": 2.09, + "learning_rate": 4.488318695908673e-07, + "loss": 0.353, + "step": 81377 + }, + { + "epoch": 2.09, + "learning_rate": 4.4880878173544676e-07, + "loss": 0.4038, + "step": 81378 + }, + { + "epoch": 2.09, + "learning_rate": 4.4878569430204796e-07, + "loss": 0.3562, + "step": 81379 + }, + { + "epoch": 2.09, + "learning_rate": 4.4876260729068893e-07, + "loss": 0.4688, + "step": 81380 + }, + { + "epoch": 2.09, + "learning_rate": 4.487395207013868e-07, + "loss": 0.3467, + "step": 81381 + }, + { + "epoch": 2.09, + "learning_rate": 4.487164345341593e-07, + "loss": 0.4409, + "step": 81382 + }, + { + "epoch": 2.09, + "learning_rate": 4.486933487890244e-07, + "loss": 0.4873, + "step": 81383 + }, + { + "epoch": 2.09, + "learning_rate": 4.48670263466e-07, + "loss": 0.436, + "step": 81384 + }, + { + "epoch": 2.09, + "learning_rate": 4.4864717856510334e-07, + "loss": 0.4414, + "step": 81385 + }, + { + "epoch": 2.09, + "learning_rate": 4.486240940863519e-07, + "loss": 0.3304, + "step": 81386 + }, + { + "epoch": 2.09, + "learning_rate": 4.4860101002976356e-07, + "loss": 0.4492, + "step": 81387 + }, + { + "epoch": 2.09, + "learning_rate": 4.4857792639535666e-07, + "loss": 0.4243, + "step": 81388 + }, + { + "epoch": 2.09, + "learning_rate": 4.485548431831476e-07, + "loss": 0.3771, + "step": 81389 + }, + { + "epoch": 2.09, + "learning_rate": 4.48531760393155e-07, + "loss": 0.4844, + "step": 81390 + }, + { + "epoch": 2.09, + "learning_rate": 4.4850867802539617e-07, + "loss": 0.387, + "step": 81391 + }, + { + "epoch": 2.09, + "learning_rate": 4.484855960798892e-07, + "loss": 0.2753, + "step": 81392 + }, + { + "epoch": 2.09, + "learning_rate": 4.484625145566512e-07, + "loss": 0.5161, + "step": 81393 + }, + { + "epoch": 2.09, + "learning_rate": 4.4843943345570036e-07, + "loss": 0.3867, + "step": 81394 + }, + { + "epoch": 2.09, + "learning_rate": 4.4841635277705383e-07, + "loss": 0.3936, + "step": 81395 + }, + { + "epoch": 2.09, + "learning_rate": 4.4839327252072946e-07, + "loss": 0.4097, + "step": 81396 + }, + { + "epoch": 2.09, + "learning_rate": 4.4837019268674535e-07, + "loss": 0.3335, + "step": 81397 + }, + { + "epoch": 2.09, + "learning_rate": 4.4834711327511844e-07, + "loss": 0.3999, + "step": 81398 + }, + { + "epoch": 2.09, + "learning_rate": 4.4832403428586685e-07, + "loss": 0.3813, + "step": 81399 + }, + { + "epoch": 2.09, + "learning_rate": 4.483009557190081e-07, + "loss": 0.4482, + "step": 81400 + }, + { + "epoch": 2.09, + "learning_rate": 4.4827787757456036e-07, + "loss": 0.4199, + "step": 81401 + }, + { + "epoch": 2.09, + "learning_rate": 4.4825479985254046e-07, + "loss": 0.3645, + "step": 81402 + }, + { + "epoch": 2.09, + "learning_rate": 4.482317225529666e-07, + "loss": 0.4204, + "step": 81403 + }, + { + "epoch": 2.09, + "learning_rate": 4.482086456758566e-07, + "loss": 0.3928, + "step": 81404 + }, + { + "epoch": 2.09, + "learning_rate": 4.4818556922122755e-07, + "loss": 0.3325, + "step": 81405 + }, + { + "epoch": 2.09, + "learning_rate": 4.4816249318909783e-07, + "loss": 0.5127, + "step": 81406 + }, + { + "epoch": 2.09, + "learning_rate": 4.4813941757948424e-07, + "loss": 0.3816, + "step": 81407 + }, + { + "epoch": 2.09, + "learning_rate": 4.4811634239240504e-07, + "loss": 0.4565, + "step": 81408 + }, + { + "epoch": 2.09, + "learning_rate": 4.48093267627878e-07, + "loss": 0.3542, + "step": 81409 + }, + { + "epoch": 2.09, + "learning_rate": 4.4807019328592034e-07, + "loss": 0.4326, + "step": 81410 + }, + { + "epoch": 2.09, + "learning_rate": 4.4804711936654993e-07, + "loss": 0.4546, + "step": 81411 + }, + { + "epoch": 2.09, + "learning_rate": 4.480240458697845e-07, + "loss": 0.4609, + "step": 81412 + }, + { + "epoch": 2.09, + "learning_rate": 4.48000972795642e-07, + "loss": 0.4648, + "step": 81413 + }, + { + "epoch": 2.09, + "learning_rate": 4.4797790014413973e-07, + "loss": 0.4761, + "step": 81414 + }, + { + "epoch": 2.09, + "learning_rate": 4.4795482791529504e-07, + "loss": 0.3789, + "step": 81415 + }, + { + "epoch": 2.09, + "learning_rate": 4.4793175610912604e-07, + "loss": 0.3513, + "step": 81416 + }, + { + "epoch": 2.09, + "learning_rate": 4.4790868472565025e-07, + "loss": 0.5059, + "step": 81417 + }, + { + "epoch": 2.09, + "learning_rate": 4.478856137648858e-07, + "loss": 0.4751, + "step": 81418 + }, + { + "epoch": 2.09, + "learning_rate": 4.4786254322684945e-07, + "loss": 0.3391, + "step": 81419 + }, + { + "epoch": 2.09, + "learning_rate": 4.4783947311155944e-07, + "loss": 0.4697, + "step": 81420 + }, + { + "epoch": 2.09, + "learning_rate": 4.4781640341903336e-07, + "loss": 0.3735, + "step": 81421 + }, + { + "epoch": 2.09, + "learning_rate": 4.4779333414928933e-07, + "loss": 0.3477, + "step": 81422 + }, + { + "epoch": 2.09, + "learning_rate": 4.4777026530234407e-07, + "loss": 0.4225, + "step": 81423 + }, + { + "epoch": 2.09, + "learning_rate": 4.4774719687821616e-07, + "loss": 0.3307, + "step": 81424 + }, + { + "epoch": 2.09, + "learning_rate": 4.4772412887692234e-07, + "loss": 0.4775, + "step": 81425 + }, + { + "epoch": 2.09, + "learning_rate": 4.477010612984813e-07, + "loss": 0.3936, + "step": 81426 + }, + { + "epoch": 2.09, + "learning_rate": 4.476779941429096e-07, + "loss": 0.29, + "step": 81427 + }, + { + "epoch": 2.09, + "learning_rate": 4.4765492741022573e-07, + "loss": 0.2347, + "step": 81428 + }, + { + "epoch": 2.09, + "learning_rate": 4.476318611004468e-07, + "loss": 0.501, + "step": 81429 + }, + { + "epoch": 2.09, + "learning_rate": 4.476087952135913e-07, + "loss": 0.4277, + "step": 81430 + }, + { + "epoch": 2.09, + "learning_rate": 4.475857297496759e-07, + "loss": 0.6162, + "step": 81431 + }, + { + "epoch": 2.09, + "learning_rate": 4.475626647087187e-07, + "loss": 0.3004, + "step": 81432 + }, + { + "epoch": 2.09, + "learning_rate": 4.475396000907374e-07, + "loss": 0.5615, + "step": 81433 + }, + { + "epoch": 2.09, + "learning_rate": 4.475165358957501e-07, + "loss": 0.4761, + "step": 81434 + }, + { + "epoch": 2.09, + "learning_rate": 4.4749347212377384e-07, + "loss": 0.322, + "step": 81435 + }, + { + "epoch": 2.09, + "learning_rate": 4.474704087748261e-07, + "loss": 0.3264, + "step": 81436 + }, + { + "epoch": 2.09, + "learning_rate": 4.4744734584892485e-07, + "loss": 0.3396, + "step": 81437 + }, + { + "epoch": 2.09, + "learning_rate": 4.4742428334608786e-07, + "loss": 0.4512, + "step": 81438 + }, + { + "epoch": 2.09, + "learning_rate": 4.4740122126633287e-07, + "loss": 0.4014, + "step": 81439 + }, + { + "epoch": 2.09, + "learning_rate": 4.473781596096771e-07, + "loss": 0.3647, + "step": 81440 + }, + { + "epoch": 2.09, + "learning_rate": 4.473550983761385e-07, + "loss": 0.313, + "step": 81441 + }, + { + "epoch": 2.09, + "learning_rate": 4.473320375657346e-07, + "loss": 0.3831, + "step": 81442 + }, + { + "epoch": 2.09, + "learning_rate": 4.473089771784835e-07, + "loss": 0.4565, + "step": 81443 + }, + { + "epoch": 2.09, + "learning_rate": 4.4728591721440256e-07, + "loss": 0.3329, + "step": 81444 + }, + { + "epoch": 2.09, + "learning_rate": 4.47262857673509e-07, + "loss": 0.3203, + "step": 81445 + }, + { + "epoch": 2.09, + "learning_rate": 4.4723979855582083e-07, + "loss": 0.3018, + "step": 81446 + }, + { + "epoch": 2.09, + "learning_rate": 4.472167398613562e-07, + "loss": 0.3965, + "step": 81447 + }, + { + "epoch": 2.09, + "learning_rate": 4.471936815901318e-07, + "loss": 0.4023, + "step": 81448 + }, + { + "epoch": 2.09, + "learning_rate": 4.4717062374216586e-07, + "loss": 0.3212, + "step": 81449 + }, + { + "epoch": 2.09, + "learning_rate": 4.47147566317476e-07, + "loss": 0.2191, + "step": 81450 + }, + { + "epoch": 2.09, + "learning_rate": 4.4712450931608e-07, + "loss": 0.3862, + "step": 81451 + }, + { + "epoch": 2.09, + "learning_rate": 4.4710145273799514e-07, + "loss": 0.4253, + "step": 81452 + }, + { + "epoch": 2.09, + "learning_rate": 4.470783965832392e-07, + "loss": 0.4429, + "step": 81453 + }, + { + "epoch": 2.09, + "learning_rate": 4.470553408518303e-07, + "loss": 0.2822, + "step": 81454 + }, + { + "epoch": 2.09, + "learning_rate": 4.4703228554378534e-07, + "loss": 0.4717, + "step": 81455 + }, + { + "epoch": 2.09, + "learning_rate": 4.4700923065912275e-07, + "loss": 0.4077, + "step": 81456 + }, + { + "epoch": 2.09, + "learning_rate": 4.469861761978593e-07, + "loss": 0.37, + "step": 81457 + }, + { + "epoch": 2.09, + "learning_rate": 4.469631221600132e-07, + "loss": 0.3718, + "step": 81458 + }, + { + "epoch": 2.09, + "learning_rate": 4.4694006854560197e-07, + "loss": 0.4702, + "step": 81459 + }, + { + "epoch": 2.09, + "learning_rate": 4.4691701535464365e-07, + "loss": 0.4805, + "step": 81460 + }, + { + "epoch": 2.09, + "learning_rate": 4.4689396258715516e-07, + "loss": 0.4351, + "step": 81461 + }, + { + "epoch": 2.09, + "learning_rate": 4.4687091024315446e-07, + "loss": 0.397, + "step": 81462 + }, + { + "epoch": 2.09, + "learning_rate": 4.468478583226598e-07, + "loss": 0.4722, + "step": 81463 + }, + { + "epoch": 2.09, + "learning_rate": 4.4682480682568824e-07, + "loss": 0.5327, + "step": 81464 + }, + { + "epoch": 2.09, + "learning_rate": 4.4680175575225707e-07, + "loss": 0.4136, + "step": 81465 + }, + { + "epoch": 2.09, + "learning_rate": 4.4677870510238447e-07, + "loss": 0.5015, + "step": 81466 + }, + { + "epoch": 2.09, + "learning_rate": 4.467556548760879e-07, + "loss": 0.3149, + "step": 81467 + }, + { + "epoch": 2.09, + "learning_rate": 4.467326050733854e-07, + "loss": 0.3428, + "step": 81468 + }, + { + "epoch": 2.09, + "learning_rate": 4.4670955569429404e-07, + "loss": 0.4639, + "step": 81469 + }, + { + "epoch": 2.09, + "learning_rate": 4.466865067388317e-07, + "loss": 0.4609, + "step": 81470 + }, + { + "epoch": 2.09, + "learning_rate": 4.46663458207016e-07, + "loss": 0.5894, + "step": 81471 + }, + { + "epoch": 2.09, + "learning_rate": 4.466404100988651e-07, + "loss": 0.2927, + "step": 81472 + }, + { + "epoch": 2.09, + "learning_rate": 4.4661736241439575e-07, + "loss": 0.5791, + "step": 81473 + }, + { + "epoch": 2.09, + "learning_rate": 4.4659431515362643e-07, + "loss": 0.2277, + "step": 81474 + }, + { + "epoch": 2.09, + "learning_rate": 4.465712683165741e-07, + "loss": 0.2753, + "step": 81475 + }, + { + "epoch": 2.09, + "learning_rate": 4.465482219032566e-07, + "loss": 0.4761, + "step": 81476 + }, + { + "epoch": 2.09, + "learning_rate": 4.465251759136921e-07, + "loss": 0.5137, + "step": 81477 + }, + { + "epoch": 2.09, + "learning_rate": 4.4650213034789743e-07, + "loss": 0.3904, + "step": 81478 + }, + { + "epoch": 2.09, + "learning_rate": 4.464790852058907e-07, + "loss": 0.4658, + "step": 81479 + }, + { + "epoch": 2.09, + "learning_rate": 4.4645604048768983e-07, + "loss": 0.4531, + "step": 81480 + }, + { + "epoch": 2.09, + "learning_rate": 4.4643299619331163e-07, + "loss": 0.354, + "step": 81481 + }, + { + "epoch": 2.09, + "learning_rate": 4.464099523227743e-07, + "loss": 0.4297, + "step": 81482 + }, + { + "epoch": 2.09, + "learning_rate": 4.463869088760955e-07, + "loss": 0.3225, + "step": 81483 + }, + { + "epoch": 2.09, + "learning_rate": 4.4636386585329313e-07, + "loss": 0.3657, + "step": 81484 + }, + { + "epoch": 2.09, + "learning_rate": 4.4634082325438436e-07, + "loss": 0.1786, + "step": 81485 + }, + { + "epoch": 2.09, + "learning_rate": 4.4631778107938677e-07, + "loss": 0.4231, + "step": 81486 + }, + { + "epoch": 2.09, + "learning_rate": 4.4629473932831806e-07, + "loss": 0.5391, + "step": 81487 + }, + { + "epoch": 2.09, + "learning_rate": 4.46271698001196e-07, + "loss": 0.4819, + "step": 81488 + }, + { + "epoch": 2.09, + "learning_rate": 4.4624865709803873e-07, + "loss": 0.3735, + "step": 81489 + }, + { + "epoch": 2.09, + "learning_rate": 4.4622561661886294e-07, + "loss": 0.334, + "step": 81490 + }, + { + "epoch": 2.09, + "learning_rate": 4.4620257656368675e-07, + "loss": 0.417, + "step": 81491 + }, + { + "epoch": 2.09, + "learning_rate": 4.4617953693252785e-07, + "loss": 0.3252, + "step": 81492 + }, + { + "epoch": 2.09, + "learning_rate": 4.461564977254041e-07, + "loss": 0.3335, + "step": 81493 + }, + { + "epoch": 2.09, + "learning_rate": 4.4613345894233287e-07, + "loss": 0.4224, + "step": 81494 + }, + { + "epoch": 2.09, + "learning_rate": 4.461104205833315e-07, + "loss": 0.4653, + "step": 81495 + }, + { + "epoch": 2.09, + "learning_rate": 4.4608738264841783e-07, + "loss": 0.4941, + "step": 81496 + }, + { + "epoch": 2.09, + "learning_rate": 4.460643451376099e-07, + "loss": 0.467, + "step": 81497 + }, + { + "epoch": 2.09, + "learning_rate": 4.4604130805092475e-07, + "loss": 0.3901, + "step": 81498 + }, + { + "epoch": 2.09, + "learning_rate": 4.460182713883802e-07, + "loss": 0.4175, + "step": 81499 + }, + { + "epoch": 2.09, + "learning_rate": 4.4599523514999415e-07, + "loss": 0.4634, + "step": 81500 + }, + { + "epoch": 2.09, + "learning_rate": 4.4597219933578435e-07, + "loss": 0.4697, + "step": 81501 + }, + { + "epoch": 2.09, + "learning_rate": 4.4594916394576774e-07, + "loss": 0.436, + "step": 81502 + }, + { + "epoch": 2.09, + "learning_rate": 4.459261289799625e-07, + "loss": 0.3926, + "step": 81503 + }, + { + "epoch": 2.09, + "learning_rate": 4.4590309443838634e-07, + "loss": 0.4253, + "step": 81504 + }, + { + "epoch": 2.09, + "learning_rate": 4.4588006032105653e-07, + "loss": 0.427, + "step": 81505 + }, + { + "epoch": 2.09, + "learning_rate": 4.458570266279912e-07, + "loss": 0.2946, + "step": 81506 + }, + { + "epoch": 2.09, + "learning_rate": 4.4583399335920724e-07, + "loss": 0.3418, + "step": 81507 + }, + { + "epoch": 2.09, + "learning_rate": 4.458109605147227e-07, + "loss": 0.318, + "step": 81508 + }, + { + "epoch": 2.09, + "learning_rate": 4.457879280945552e-07, + "loss": 0.4639, + "step": 81509 + }, + { + "epoch": 2.09, + "learning_rate": 4.457648960987228e-07, + "loss": 0.542, + "step": 81510 + }, + { + "epoch": 2.09, + "learning_rate": 4.457418645272424e-07, + "loss": 0.4746, + "step": 81511 + }, + { + "epoch": 2.09, + "learning_rate": 4.457188333801319e-07, + "loss": 0.4434, + "step": 81512 + }, + { + "epoch": 2.09, + "learning_rate": 4.4569580265740916e-07, + "loss": 0.5156, + "step": 81513 + }, + { + "epoch": 2.09, + "learning_rate": 4.456727723590923e-07, + "loss": 0.4971, + "step": 81514 + }, + { + "epoch": 2.09, + "learning_rate": 4.456497424851975e-07, + "loss": 0.4189, + "step": 81515 + }, + { + "epoch": 2.09, + "learning_rate": 4.456267130357433e-07, + "loss": 0.4214, + "step": 81516 + }, + { + "epoch": 2.09, + "learning_rate": 4.456036840107472e-07, + "loss": 0.3335, + "step": 81517 + }, + { + "epoch": 2.09, + "learning_rate": 4.4558065541022726e-07, + "loss": 0.4829, + "step": 81518 + }, + { + "epoch": 2.09, + "learning_rate": 4.455576272342003e-07, + "loss": 0.4165, + "step": 81519 + }, + { + "epoch": 2.09, + "learning_rate": 4.4553459948268437e-07, + "loss": 0.2367, + "step": 81520 + }, + { + "epoch": 2.09, + "learning_rate": 4.455115721556971e-07, + "loss": 0.5952, + "step": 81521 + }, + { + "epoch": 2.09, + "learning_rate": 4.454885452532565e-07, + "loss": 0.4355, + "step": 81522 + }, + { + "epoch": 2.09, + "learning_rate": 4.4546551877537954e-07, + "loss": 0.2894, + "step": 81523 + }, + { + "epoch": 2.09, + "learning_rate": 4.4544249272208445e-07, + "loss": 0.2942, + "step": 81524 + }, + { + "epoch": 2.09, + "learning_rate": 4.454194670933882e-07, + "loss": 0.5488, + "step": 81525 + }, + { + "epoch": 2.09, + "learning_rate": 4.453964418893087e-07, + "loss": 0.5454, + "step": 81526 + }, + { + "epoch": 2.09, + "learning_rate": 4.4537341710986396e-07, + "loss": 0.3343, + "step": 81527 + }, + { + "epoch": 2.09, + "learning_rate": 4.4535039275507105e-07, + "loss": 0.3584, + "step": 81528 + }, + { + "epoch": 2.09, + "learning_rate": 4.453273688249478e-07, + "loss": 0.3901, + "step": 81529 + }, + { + "epoch": 2.09, + "learning_rate": 4.453043453195119e-07, + "loss": 0.4565, + "step": 81530 + }, + { + "epoch": 2.09, + "learning_rate": 4.4528132223878124e-07, + "loss": 0.3994, + "step": 81531 + }, + { + "epoch": 2.09, + "learning_rate": 4.4525829958277283e-07, + "loss": 0.353, + "step": 81532 + }, + { + "epoch": 2.09, + "learning_rate": 4.452352773515047e-07, + "loss": 0.4692, + "step": 81533 + }, + { + "epoch": 2.09, + "learning_rate": 4.4521225554499474e-07, + "loss": 0.4091, + "step": 81534 + }, + { + "epoch": 2.09, + "learning_rate": 4.4518923416326026e-07, + "loss": 0.4106, + "step": 81535 + }, + { + "epoch": 2.09, + "learning_rate": 4.451662132063184e-07, + "loss": 0.4314, + "step": 81536 + }, + { + "epoch": 2.09, + "learning_rate": 4.451431926741874e-07, + "loss": 0.395, + "step": 81537 + }, + { + "epoch": 2.09, + "learning_rate": 4.4512017256688473e-07, + "loss": 0.239, + "step": 81538 + }, + { + "epoch": 2.09, + "learning_rate": 4.4509715288442826e-07, + "loss": 0.5, + "step": 81539 + }, + { + "epoch": 2.09, + "learning_rate": 4.450741336268352e-07, + "loss": 0.4678, + "step": 81540 + }, + { + "epoch": 2.09, + "learning_rate": 4.450511147941233e-07, + "loss": 0.417, + "step": 81541 + }, + { + "epoch": 2.09, + "learning_rate": 4.450280963863102e-07, + "loss": 0.3613, + "step": 81542 + }, + { + "epoch": 2.09, + "learning_rate": 4.4500507840341397e-07, + "loss": 0.4517, + "step": 81543 + }, + { + "epoch": 2.09, + "learning_rate": 4.4498206084545176e-07, + "loss": 0.5303, + "step": 81544 + }, + { + "epoch": 2.09, + "learning_rate": 4.4495904371244095e-07, + "loss": 0.3457, + "step": 81545 + }, + { + "epoch": 2.09, + "learning_rate": 4.449360270043995e-07, + "loss": 0.3483, + "step": 81546 + }, + { + "epoch": 2.09, + "learning_rate": 4.44913010721345e-07, + "loss": 0.5684, + "step": 81547 + }, + { + "epoch": 2.09, + "learning_rate": 4.448899948632955e-07, + "loss": 0.249, + "step": 81548 + }, + { + "epoch": 2.09, + "learning_rate": 4.4486697943026774e-07, + "loss": 0.321, + "step": 81549 + }, + { + "epoch": 2.09, + "learning_rate": 4.448439644222798e-07, + "loss": 0.3435, + "step": 81550 + }, + { + "epoch": 2.09, + "learning_rate": 4.448209498393498e-07, + "loss": 0.5645, + "step": 81551 + }, + { + "epoch": 2.09, + "learning_rate": 4.4479793568149437e-07, + "loss": 0.5029, + "step": 81552 + }, + { + "epoch": 2.09, + "learning_rate": 4.447749219487317e-07, + "loss": 0.4595, + "step": 81553 + }, + { + "epoch": 2.09, + "learning_rate": 4.447519086410797e-07, + "loss": 0.3794, + "step": 81554 + }, + { + "epoch": 2.09, + "learning_rate": 4.4472889575855533e-07, + "loss": 0.5117, + "step": 81555 + }, + { + "epoch": 2.09, + "learning_rate": 4.4470588330117676e-07, + "loss": 0.3228, + "step": 81556 + }, + { + "epoch": 2.09, + "learning_rate": 4.446828712689611e-07, + "loss": 0.4609, + "step": 81557 + }, + { + "epoch": 2.09, + "learning_rate": 4.446598596619262e-07, + "loss": 0.3779, + "step": 81558 + }, + { + "epoch": 2.09, + "learning_rate": 4.4463684848008964e-07, + "loss": 0.4263, + "step": 81559 + }, + { + "epoch": 2.09, + "learning_rate": 4.446138377234695e-07, + "loss": 0.3505, + "step": 81560 + }, + { + "epoch": 2.09, + "learning_rate": 4.4459082739208273e-07, + "loss": 0.4189, + "step": 81561 + }, + { + "epoch": 2.09, + "learning_rate": 4.445678174859472e-07, + "loss": 0.4399, + "step": 81562 + }, + { + "epoch": 2.09, + "learning_rate": 4.445448080050804e-07, + "loss": 0.4153, + "step": 81563 + }, + { + "epoch": 2.09, + "learning_rate": 4.445217989495007e-07, + "loss": 0.3848, + "step": 81564 + }, + { + "epoch": 2.09, + "learning_rate": 4.44498790319225e-07, + "loss": 0.3505, + "step": 81565 + }, + { + "epoch": 2.09, + "learning_rate": 4.4447578211427064e-07, + "loss": 0.3994, + "step": 81566 + }, + { + "epoch": 2.09, + "learning_rate": 4.4445277433465567e-07, + "loss": 0.4536, + "step": 81567 + }, + { + "epoch": 2.09, + "learning_rate": 4.4442976698039803e-07, + "loss": 0.3831, + "step": 81568 + }, + { + "epoch": 2.09, + "learning_rate": 4.444067600515146e-07, + "loss": 0.4277, + "step": 81569 + }, + { + "epoch": 2.09, + "learning_rate": 4.443837535480234e-07, + "loss": 0.4678, + "step": 81570 + }, + { + "epoch": 2.09, + "learning_rate": 4.4436074746994187e-07, + "loss": 0.3367, + "step": 81571 + }, + { + "epoch": 2.09, + "learning_rate": 4.4433774181728836e-07, + "loss": 0.3691, + "step": 81572 + }, + { + "epoch": 2.09, + "learning_rate": 4.443147365900797e-07, + "loss": 0.4204, + "step": 81573 + }, + { + "epoch": 2.09, + "learning_rate": 4.4429173178833335e-07, + "loss": 0.4312, + "step": 81574 + }, + { + "epoch": 2.09, + "learning_rate": 4.442687274120673e-07, + "loss": 0.3481, + "step": 81575 + }, + { + "epoch": 2.09, + "learning_rate": 4.442457234612992e-07, + "loss": 0.3989, + "step": 81576 + }, + { + "epoch": 2.09, + "learning_rate": 4.44222719936047e-07, + "loss": 0.4482, + "step": 81577 + }, + { + "epoch": 2.09, + "learning_rate": 4.441997168363274e-07, + "loss": 0.543, + "step": 81578 + }, + { + "epoch": 2.09, + "learning_rate": 4.441767141621585e-07, + "loss": 0.4438, + "step": 81579 + }, + { + "epoch": 2.09, + "learning_rate": 4.441537119135581e-07, + "loss": 0.3489, + "step": 81580 + }, + { + "epoch": 2.09, + "learning_rate": 4.4413071009054393e-07, + "loss": 0.479, + "step": 81581 + }, + { + "epoch": 2.09, + "learning_rate": 4.4410770869313285e-07, + "loss": 0.3533, + "step": 81582 + }, + { + "epoch": 2.09, + "learning_rate": 4.4408470772134344e-07, + "loss": 0.4419, + "step": 81583 + }, + { + "epoch": 2.09, + "learning_rate": 4.440617071751924e-07, + "loss": 0.3149, + "step": 81584 + }, + { + "epoch": 2.09, + "learning_rate": 4.440387070546977e-07, + "loss": 0.4023, + "step": 81585 + }, + { + "epoch": 2.09, + "learning_rate": 4.440157073598775e-07, + "loss": 0.415, + "step": 81586 + }, + { + "epoch": 2.09, + "learning_rate": 4.439927080907484e-07, + "loss": 0.459, + "step": 81587 + }, + { + "epoch": 2.09, + "learning_rate": 4.4396970924732857e-07, + "loss": 0.3149, + "step": 81588 + }, + { + "epoch": 2.09, + "learning_rate": 4.439467108296359e-07, + "loss": 0.478, + "step": 81589 + }, + { + "epoch": 2.09, + "learning_rate": 4.4392371283768735e-07, + "loss": 0.3521, + "step": 81590 + }, + { + "epoch": 2.09, + "learning_rate": 4.4390071527150074e-07, + "loss": 0.2952, + "step": 81591 + }, + { + "epoch": 2.09, + "learning_rate": 4.4387771813109387e-07, + "loss": 0.4702, + "step": 81592 + }, + { + "epoch": 2.09, + "learning_rate": 4.4385472141648464e-07, + "loss": 0.3232, + "step": 81593 + }, + { + "epoch": 2.09, + "learning_rate": 4.438317251276903e-07, + "loss": 0.3862, + "step": 81594 + }, + { + "epoch": 2.09, + "learning_rate": 4.43808729264728e-07, + "loss": 0.4575, + "step": 81595 + }, + { + "epoch": 2.09, + "learning_rate": 4.4378573382761573e-07, + "loss": 0.5381, + "step": 81596 + }, + { + "epoch": 2.09, + "learning_rate": 4.437627388163713e-07, + "loss": 0.4204, + "step": 81597 + }, + { + "epoch": 2.09, + "learning_rate": 4.4373974423101246e-07, + "loss": 0.3433, + "step": 81598 + }, + { + "epoch": 2.09, + "learning_rate": 4.437167500715562e-07, + "loss": 0.4316, + "step": 81599 + }, + { + "epoch": 2.09, + "learning_rate": 4.436937563380203e-07, + "loss": 0.3466, + "step": 81600 + }, + { + "epoch": 2.09, + "learning_rate": 4.4367076303042263e-07, + "loss": 0.3502, + "step": 81601 + }, + { + "epoch": 2.09, + "learning_rate": 4.4364777014878106e-07, + "loss": 0.4746, + "step": 81602 + }, + { + "epoch": 2.09, + "learning_rate": 4.436247776931128e-07, + "loss": 0.3845, + "step": 81603 + }, + { + "epoch": 2.09, + "learning_rate": 4.43601785663435e-07, + "loss": 0.4873, + "step": 81604 + }, + { + "epoch": 2.09, + "learning_rate": 4.435787940597658e-07, + "loss": 0.4648, + "step": 81605 + }, + { + "epoch": 2.09, + "learning_rate": 4.4355580288212314e-07, + "loss": 0.374, + "step": 81606 + }, + { + "epoch": 2.09, + "learning_rate": 4.4353281213052374e-07, + "loss": 0.3009, + "step": 81607 + }, + { + "epoch": 2.09, + "learning_rate": 4.4350982180498577e-07, + "loss": 0.4767, + "step": 81608 + }, + { + "epoch": 2.09, + "learning_rate": 4.434868319055267e-07, + "loss": 0.5103, + "step": 81609 + }, + { + "epoch": 2.09, + "learning_rate": 4.434638424321646e-07, + "loss": 0.4067, + "step": 81610 + }, + { + "epoch": 2.09, + "learning_rate": 4.434408533849162e-07, + "loss": 0.4355, + "step": 81611 + }, + { + "epoch": 2.09, + "learning_rate": 4.434178647637996e-07, + "loss": 0.5449, + "step": 81612 + }, + { + "epoch": 2.09, + "learning_rate": 4.4339487656883266e-07, + "loss": 0.2874, + "step": 81613 + }, + { + "epoch": 2.09, + "learning_rate": 4.433718888000324e-07, + "loss": 0.4131, + "step": 81614 + }, + { + "epoch": 2.09, + "learning_rate": 4.43348901457417e-07, + "loss": 0.4009, + "step": 81615 + }, + { + "epoch": 2.09, + "learning_rate": 4.433259145410033e-07, + "loss": 0.5405, + "step": 81616 + }, + { + "epoch": 2.09, + "learning_rate": 4.4330292805080947e-07, + "loss": 0.4316, + "step": 81617 + }, + { + "epoch": 2.09, + "learning_rate": 4.432799419868529e-07, + "loss": 0.4355, + "step": 81618 + }, + { + "epoch": 2.09, + "learning_rate": 4.4325695634915173e-07, + "loss": 0.4648, + "step": 81619 + }, + { + "epoch": 2.09, + "learning_rate": 4.432339711377228e-07, + "loss": 0.5752, + "step": 81620 + }, + { + "epoch": 2.09, + "learning_rate": 4.432109863525838e-07, + "loss": 0.3794, + "step": 81621 + }, + { + "epoch": 2.09, + "learning_rate": 4.431880019937527e-07, + "loss": 0.4346, + "step": 81622 + }, + { + "epoch": 2.09, + "learning_rate": 4.4316501806124773e-07, + "loss": 0.4907, + "step": 81623 + }, + { + "epoch": 2.09, + "learning_rate": 4.4314203455508483e-07, + "loss": 0.3351, + "step": 81624 + }, + { + "epoch": 2.09, + "learning_rate": 4.431190514752825e-07, + "loss": 0.4814, + "step": 81625 + }, + { + "epoch": 2.09, + "learning_rate": 4.4309606882185835e-07, + "loss": 0.356, + "step": 81626 + }, + { + "epoch": 2.09, + "learning_rate": 4.4307308659483035e-07, + "loss": 0.3756, + "step": 81627 + }, + { + "epoch": 2.09, + "learning_rate": 4.4305010479421525e-07, + "loss": 0.5332, + "step": 81628 + }, + { + "epoch": 2.09, + "learning_rate": 4.43027123420031e-07, + "loss": 0.4424, + "step": 81629 + }, + { + "epoch": 2.09, + "learning_rate": 4.4300414247229533e-07, + "loss": 0.3865, + "step": 81630 + }, + { + "epoch": 2.09, + "learning_rate": 4.429811619510262e-07, + "loss": 0.4453, + "step": 81631 + }, + { + "epoch": 2.09, + "learning_rate": 4.4295818185624036e-07, + "loss": 0.376, + "step": 81632 + }, + { + "epoch": 2.09, + "learning_rate": 4.429352021879562e-07, + "loss": 0.4546, + "step": 81633 + }, + { + "epoch": 2.09, + "learning_rate": 4.429122229461906e-07, + "loss": 0.4512, + "step": 81634 + }, + { + "epoch": 2.09, + "learning_rate": 4.4288924413096154e-07, + "loss": 0.4211, + "step": 81635 + }, + { + "epoch": 2.09, + "learning_rate": 4.428662657422868e-07, + "loss": 0.3411, + "step": 81636 + }, + { + "epoch": 2.09, + "learning_rate": 4.4284328778018344e-07, + "loss": 0.4146, + "step": 81637 + }, + { + "epoch": 2.09, + "learning_rate": 4.428203102446694e-07, + "loss": 0.4001, + "step": 81638 + }, + { + "epoch": 2.09, + "learning_rate": 4.4279733313576216e-07, + "loss": 0.4154, + "step": 81639 + }, + { + "epoch": 2.09, + "learning_rate": 4.427743564534798e-07, + "loss": 0.4141, + "step": 81640 + }, + { + "epoch": 2.09, + "learning_rate": 4.427513801978391e-07, + "loss": 0.4888, + "step": 81641 + }, + { + "epoch": 2.09, + "learning_rate": 4.4272840436885805e-07, + "loss": 0.4033, + "step": 81642 + }, + { + "epoch": 2.09, + "learning_rate": 4.427054289665546e-07, + "loss": 0.4424, + "step": 81643 + }, + { + "epoch": 2.09, + "learning_rate": 4.4268245399094596e-07, + "loss": 0.438, + "step": 81644 + }, + { + "epoch": 2.09, + "learning_rate": 4.426594794420494e-07, + "loss": 0.4009, + "step": 81645 + }, + { + "epoch": 2.09, + "learning_rate": 4.426365053198828e-07, + "loss": 0.4019, + "step": 81646 + }, + { + "epoch": 2.09, + "learning_rate": 4.426135316244639e-07, + "loss": 0.3704, + "step": 81647 + }, + { + "epoch": 2.09, + "learning_rate": 4.425905583558105e-07, + "loss": 0.4829, + "step": 81648 + }, + { + "epoch": 2.09, + "learning_rate": 4.4256758551393946e-07, + "loss": 0.3979, + "step": 81649 + }, + { + "epoch": 2.09, + "learning_rate": 4.425446130988689e-07, + "loss": 0.4585, + "step": 81650 + }, + { + "epoch": 2.09, + "learning_rate": 4.425216411106162e-07, + "loss": 0.5098, + "step": 81651 + }, + { + "epoch": 2.09, + "learning_rate": 4.424986695491995e-07, + "loss": 0.2915, + "step": 81652 + }, + { + "epoch": 2.09, + "learning_rate": 4.4247569841463585e-07, + "loss": 0.5264, + "step": 81653 + }, + { + "epoch": 2.09, + "learning_rate": 4.4245272770694263e-07, + "loss": 0.4023, + "step": 81654 + }, + { + "epoch": 2.09, + "learning_rate": 4.4242975742613766e-07, + "loss": 0.4292, + "step": 81655 + }, + { + "epoch": 2.09, + "learning_rate": 4.424067875722386e-07, + "loss": 0.3555, + "step": 81656 + }, + { + "epoch": 2.09, + "learning_rate": 4.423838181452634e-07, + "loss": 0.3916, + "step": 81657 + }, + { + "epoch": 2.09, + "learning_rate": 4.423608491452289e-07, + "loss": 0.3564, + "step": 81658 + }, + { + "epoch": 2.09, + "learning_rate": 4.4233788057215304e-07, + "loss": 0.2751, + "step": 81659 + }, + { + "epoch": 2.09, + "learning_rate": 4.423149124260538e-07, + "loss": 0.3892, + "step": 81660 + }, + { + "epoch": 2.09, + "learning_rate": 4.422919447069481e-07, + "loss": 0.4268, + "step": 81661 + }, + { + "epoch": 2.09, + "learning_rate": 4.422689774148537e-07, + "loss": 0.3158, + "step": 81662 + }, + { + "epoch": 2.09, + "learning_rate": 4.422460105497887e-07, + "loss": 0.5557, + "step": 81663 + }, + { + "epoch": 2.09, + "learning_rate": 4.422230441117699e-07, + "loss": 0.4746, + "step": 81664 + }, + { + "epoch": 2.09, + "learning_rate": 4.422000781008157e-07, + "loss": 0.3403, + "step": 81665 + }, + { + "epoch": 2.09, + "learning_rate": 4.421771125169429e-07, + "loss": 0.458, + "step": 81666 + }, + { + "epoch": 2.09, + "learning_rate": 4.421541473601693e-07, + "loss": 0.5435, + "step": 81667 + }, + { + "epoch": 2.09, + "learning_rate": 4.4213118263051275e-07, + "loss": 0.4092, + "step": 81668 + }, + { + "epoch": 2.09, + "learning_rate": 4.4210821832799104e-07, + "loss": 0.4556, + "step": 81669 + }, + { + "epoch": 2.09, + "learning_rate": 4.42085254452621e-07, + "loss": 0.4946, + "step": 81670 + }, + { + "epoch": 2.09, + "learning_rate": 4.420622910044206e-07, + "loss": 0.3322, + "step": 81671 + }, + { + "epoch": 2.09, + "learning_rate": 4.420393279834076e-07, + "loss": 0.3955, + "step": 81672 + }, + { + "epoch": 2.09, + "learning_rate": 4.420163653895996e-07, + "loss": 0.4241, + "step": 81673 + }, + { + "epoch": 2.09, + "learning_rate": 4.4199340322301415e-07, + "loss": 0.4453, + "step": 81674 + }, + { + "epoch": 2.09, + "learning_rate": 4.4197044148366835e-07, + "loss": 0.3589, + "step": 81675 + }, + { + "epoch": 2.09, + "learning_rate": 4.4194748017158e-07, + "loss": 0.2864, + "step": 81676 + }, + { + "epoch": 2.09, + "learning_rate": 4.419245192867672e-07, + "loss": 0.3843, + "step": 81677 + }, + { + "epoch": 2.09, + "learning_rate": 4.4190155882924684e-07, + "loss": 0.3652, + "step": 81678 + }, + { + "epoch": 2.09, + "learning_rate": 4.4187859879903676e-07, + "loss": 0.4438, + "step": 81679 + }, + { + "epoch": 2.09, + "learning_rate": 4.4185563919615454e-07, + "loss": 0.4458, + "step": 81680 + }, + { + "epoch": 2.09, + "learning_rate": 4.418326800206182e-07, + "loss": 0.2975, + "step": 81681 + }, + { + "epoch": 2.09, + "learning_rate": 4.4180972127244455e-07, + "loss": 0.3638, + "step": 81682 + }, + { + "epoch": 2.09, + "learning_rate": 4.4178676295165183e-07, + "loss": 0.4922, + "step": 81683 + }, + { + "epoch": 2.09, + "learning_rate": 4.4176380505825707e-07, + "loss": 0.4072, + "step": 81684 + }, + { + "epoch": 2.09, + "learning_rate": 4.4174084759227803e-07, + "loss": 0.3613, + "step": 81685 + }, + { + "epoch": 2.09, + "learning_rate": 4.4171789055373274e-07, + "loss": 0.5557, + "step": 81686 + }, + { + "epoch": 2.09, + "learning_rate": 4.41694933942638e-07, + "loss": 0.3262, + "step": 81687 + }, + { + "epoch": 2.09, + "learning_rate": 4.4167197775901175e-07, + "loss": 0.5879, + "step": 81688 + }, + { + "epoch": 2.09, + "learning_rate": 4.416490220028717e-07, + "loss": 0.3721, + "step": 81689 + }, + { + "epoch": 2.09, + "learning_rate": 4.416260666742355e-07, + "loss": 0.2849, + "step": 81690 + }, + { + "epoch": 2.09, + "learning_rate": 4.4160311177312037e-07, + "loss": 0.3721, + "step": 81691 + }, + { + "epoch": 2.09, + "learning_rate": 4.41580157299544e-07, + "loss": 0.3833, + "step": 81692 + }, + { + "epoch": 2.09, + "learning_rate": 4.415572032535243e-07, + "loss": 0.5684, + "step": 81693 + }, + { + "epoch": 2.09, + "learning_rate": 4.415342496350787e-07, + "loss": 0.4937, + "step": 81694 + }, + { + "epoch": 2.09, + "learning_rate": 4.4151129644422424e-07, + "loss": 0.3428, + "step": 81695 + }, + { + "epoch": 2.09, + "learning_rate": 4.4148834368097885e-07, + "loss": 0.3657, + "step": 81696 + }, + { + "epoch": 2.09, + "learning_rate": 4.414653913453602e-07, + "loss": 0.3301, + "step": 81697 + }, + { + "epoch": 2.09, + "learning_rate": 4.4144243943738624e-07, + "loss": 0.4194, + "step": 81698 + }, + { + "epoch": 2.09, + "learning_rate": 4.4141948795707363e-07, + "loss": 0.4756, + "step": 81699 + }, + { + "epoch": 2.09, + "learning_rate": 4.4139653690444045e-07, + "loss": 0.3967, + "step": 81700 + }, + { + "epoch": 2.09, + "learning_rate": 4.413735862795044e-07, + "loss": 0.5781, + "step": 81701 + }, + { + "epoch": 2.09, + "learning_rate": 4.4135063608228316e-07, + "loss": 0.3428, + "step": 81702 + }, + { + "epoch": 2.09, + "learning_rate": 4.4132768631279404e-07, + "loss": 0.4146, + "step": 81703 + }, + { + "epoch": 2.09, + "learning_rate": 4.413047369710543e-07, + "loss": 0.4316, + "step": 81704 + }, + { + "epoch": 2.09, + "learning_rate": 4.4128178805708183e-07, + "loss": 0.324, + "step": 81705 + }, + { + "epoch": 2.09, + "learning_rate": 4.4125883957089416e-07, + "loss": 0.4241, + "step": 81706 + }, + { + "epoch": 2.09, + "learning_rate": 4.4123589151250927e-07, + "loss": 0.3916, + "step": 81707 + }, + { + "epoch": 2.09, + "learning_rate": 4.412129438819441e-07, + "loss": 0.4277, + "step": 81708 + }, + { + "epoch": 2.09, + "learning_rate": 4.4118999667921643e-07, + "loss": 0.3252, + "step": 81709 + }, + { + "epoch": 2.09, + "learning_rate": 4.4116704990434385e-07, + "loss": 0.3779, + "step": 81710 + }, + { + "epoch": 2.09, + "learning_rate": 4.4114410355734434e-07, + "loss": 0.416, + "step": 81711 + }, + { + "epoch": 2.09, + "learning_rate": 4.4112115763823476e-07, + "loss": 0.4795, + "step": 81712 + }, + { + "epoch": 2.09, + "learning_rate": 4.4109821214703335e-07, + "loss": 0.4048, + "step": 81713 + }, + { + "epoch": 2.09, + "learning_rate": 4.4107526708375696e-07, + "loss": 0.4399, + "step": 81714 + }, + { + "epoch": 2.09, + "learning_rate": 4.4105232244842395e-07, + "loss": 0.2355, + "step": 81715 + }, + { + "epoch": 2.09, + "learning_rate": 4.41029378241051e-07, + "loss": 0.4399, + "step": 81716 + }, + { + "epoch": 2.09, + "learning_rate": 4.410064344616563e-07, + "loss": 0.4431, + "step": 81717 + }, + { + "epoch": 2.09, + "learning_rate": 4.4098349111025725e-07, + "loss": 0.4639, + "step": 81718 + }, + { + "epoch": 2.09, + "learning_rate": 4.409605481868717e-07, + "loss": 0.3293, + "step": 81719 + }, + { + "epoch": 2.09, + "learning_rate": 4.409376056915166e-07, + "loss": 0.4248, + "step": 81720 + }, + { + "epoch": 2.09, + "learning_rate": 4.4091466362420994e-07, + "loss": 0.5913, + "step": 81721 + }, + { + "epoch": 2.09, + "learning_rate": 4.4089172198496927e-07, + "loss": 0.3354, + "step": 81722 + }, + { + "epoch": 2.09, + "learning_rate": 4.4086878077381227e-07, + "loss": 0.4087, + "step": 81723 + }, + { + "epoch": 2.09, + "learning_rate": 4.408458399907565e-07, + "loss": 0.4395, + "step": 81724 + }, + { + "epoch": 2.09, + "learning_rate": 4.4082289963581896e-07, + "loss": 0.3555, + "step": 81725 + }, + { + "epoch": 2.09, + "learning_rate": 4.407999597090176e-07, + "loss": 0.3298, + "step": 81726 + }, + { + "epoch": 2.09, + "learning_rate": 4.4077702021037e-07, + "loss": 0.3828, + "step": 81727 + }, + { + "epoch": 2.09, + "learning_rate": 4.407540811398941e-07, + "loss": 0.4185, + "step": 81728 + }, + { + "epoch": 2.09, + "learning_rate": 4.407311424976067e-07, + "loss": 0.4434, + "step": 81729 + }, + { + "epoch": 2.09, + "learning_rate": 4.4070820428352573e-07, + "loss": 0.2829, + "step": 81730 + }, + { + "epoch": 2.09, + "learning_rate": 4.406852664976691e-07, + "loss": 0.5283, + "step": 81731 + }, + { + "epoch": 2.09, + "learning_rate": 4.4066232914005373e-07, + "loss": 0.4268, + "step": 81732 + }, + { + "epoch": 2.09, + "learning_rate": 4.406393922106979e-07, + "loss": 0.5244, + "step": 81733 + }, + { + "epoch": 2.09, + "learning_rate": 4.4061645570961836e-07, + "loss": 0.4128, + "step": 81734 + }, + { + "epoch": 2.09, + "learning_rate": 4.405935196368331e-07, + "loss": 0.2625, + "step": 81735 + }, + { + "epoch": 2.09, + "learning_rate": 4.4057058399236e-07, + "loss": 0.3403, + "step": 81736 + }, + { + "epoch": 2.09, + "learning_rate": 4.4054764877621597e-07, + "loss": 0.418, + "step": 81737 + }, + { + "epoch": 2.09, + "learning_rate": 4.405247139884188e-07, + "loss": 0.479, + "step": 81738 + }, + { + "epoch": 2.1, + "learning_rate": 4.405017796289863e-07, + "loss": 0.3071, + "step": 81739 + }, + { + "epoch": 2.1, + "learning_rate": 4.40478845697936e-07, + "loss": 0.3611, + "step": 81740 + }, + { + "epoch": 2.1, + "learning_rate": 4.404559121952851e-07, + "loss": 0.4204, + "step": 81741 + }, + { + "epoch": 2.1, + "learning_rate": 4.4043297912105127e-07, + "loss": 0.3423, + "step": 81742 + }, + { + "epoch": 2.1, + "learning_rate": 4.404100464752526e-07, + "loss": 0.5151, + "step": 81743 + }, + { + "epoch": 2.1, + "learning_rate": 4.4038711425790586e-07, + "loss": 0.4282, + "step": 81744 + }, + { + "epoch": 2.1, + "learning_rate": 4.403641824690294e-07, + "loss": 0.335, + "step": 81745 + }, + { + "epoch": 2.1, + "learning_rate": 4.4034125110863994e-07, + "loss": 0.4819, + "step": 81746 + }, + { + "epoch": 2.1, + "learning_rate": 4.403183201767554e-07, + "loss": 0.5112, + "step": 81747 + }, + { + "epoch": 2.1, + "learning_rate": 4.402953896733934e-07, + "loss": 0.4087, + "step": 81748 + }, + { + "epoch": 2.1, + "learning_rate": 4.4027245959857196e-07, + "loss": 0.3411, + "step": 81749 + }, + { + "epoch": 2.1, + "learning_rate": 4.402495299523077e-07, + "loss": 0.4346, + "step": 81750 + }, + { + "epoch": 2.1, + "learning_rate": 4.402266007346187e-07, + "loss": 0.2797, + "step": 81751 + }, + { + "epoch": 2.1, + "learning_rate": 4.402036719455228e-07, + "loss": 0.5371, + "step": 81752 + }, + { + "epoch": 2.1, + "learning_rate": 4.401807435850371e-07, + "loss": 0.4214, + "step": 81753 + }, + { + "epoch": 2.1, + "learning_rate": 4.40157815653179e-07, + "loss": 0.4014, + "step": 81754 + }, + { + "epoch": 2.1, + "learning_rate": 4.4013488814996624e-07, + "loss": 0.3663, + "step": 81755 + }, + { + "epoch": 2.1, + "learning_rate": 4.401119610754166e-07, + "loss": 0.3352, + "step": 81756 + }, + { + "epoch": 2.1, + "learning_rate": 4.4008903442954773e-07, + "loss": 0.5444, + "step": 81757 + }, + { + "epoch": 2.1, + "learning_rate": 4.4006610821237653e-07, + "loss": 0.4097, + "step": 81758 + }, + { + "epoch": 2.1, + "learning_rate": 4.400431824239211e-07, + "loss": 0.314, + "step": 81759 + }, + { + "epoch": 2.1, + "learning_rate": 4.4002025706419877e-07, + "loss": 0.5669, + "step": 81760 + }, + { + "epoch": 2.1, + "learning_rate": 4.399973321332277e-07, + "loss": 0.3416, + "step": 81761 + }, + { + "epoch": 2.1, + "learning_rate": 4.3997440763102434e-07, + "loss": 0.4072, + "step": 81762 + }, + { + "epoch": 2.1, + "learning_rate": 4.3995148355760724e-07, + "loss": 0.4263, + "step": 81763 + }, + { + "epoch": 2.1, + "learning_rate": 4.3992855991299327e-07, + "loss": 0.3624, + "step": 81764 + }, + { + "epoch": 2.1, + "learning_rate": 4.3990563669720015e-07, + "loss": 0.4175, + "step": 81765 + }, + { + "epoch": 2.1, + "learning_rate": 4.39882713910246e-07, + "loss": 0.5234, + "step": 81766 + }, + { + "epoch": 2.1, + "learning_rate": 4.398597915521475e-07, + "loss": 0.3218, + "step": 81767 + }, + { + "epoch": 2.1, + "learning_rate": 4.3983686962292256e-07, + "loss": 0.4551, + "step": 81768 + }, + { + "epoch": 2.1, + "learning_rate": 4.398139481225891e-07, + "loss": 0.3994, + "step": 81769 + }, + { + "epoch": 2.1, + "learning_rate": 4.397910270511641e-07, + "loss": 0.3501, + "step": 81770 + }, + { + "epoch": 2.1, + "learning_rate": 4.397681064086652e-07, + "loss": 0.3203, + "step": 81771 + }, + { + "epoch": 2.1, + "learning_rate": 4.3974518619511024e-07, + "loss": 0.4502, + "step": 81772 + }, + { + "epoch": 2.1, + "learning_rate": 4.397222664105169e-07, + "loss": 0.5146, + "step": 81773 + }, + { + "epoch": 2.1, + "learning_rate": 4.396993470549025e-07, + "loss": 0.3071, + "step": 81774 + }, + { + "epoch": 2.1, + "learning_rate": 4.396764281282842e-07, + "loss": 0.2755, + "step": 81775 + }, + { + "epoch": 2.1, + "learning_rate": 4.3965350963067995e-07, + "loss": 0.5283, + "step": 81776 + }, + { + "epoch": 2.1, + "learning_rate": 4.3963059156210716e-07, + "loss": 0.4873, + "step": 81777 + }, + { + "epoch": 2.1, + "learning_rate": 4.396076739225838e-07, + "loss": 0.395, + "step": 81778 + }, + { + "epoch": 2.1, + "learning_rate": 4.395847567121267e-07, + "loss": 0.4233, + "step": 81779 + }, + { + "epoch": 2.1, + "learning_rate": 4.395618399307538e-07, + "loss": 0.3511, + "step": 81780 + }, + { + "epoch": 2.1, + "learning_rate": 4.395389235784827e-07, + "loss": 0.4697, + "step": 81781 + }, + { + "epoch": 2.1, + "learning_rate": 4.3951600765533116e-07, + "loss": 0.2593, + "step": 81782 + }, + { + "epoch": 2.1, + "learning_rate": 4.394930921613165e-07, + "loss": 0.4414, + "step": 81783 + }, + { + "epoch": 2.1, + "learning_rate": 4.3947017709645583e-07, + "loss": 0.394, + "step": 81784 + }, + { + "epoch": 2.1, + "learning_rate": 4.39447262460767e-07, + "loss": 0.4316, + "step": 81785 + }, + { + "epoch": 2.1, + "learning_rate": 4.394243482542681e-07, + "loss": 0.3706, + "step": 81786 + }, + { + "epoch": 2.1, + "learning_rate": 4.3940143447697573e-07, + "loss": 0.457, + "step": 81787 + }, + { + "epoch": 2.1, + "learning_rate": 4.3937852112890803e-07, + "loss": 0.2739, + "step": 81788 + }, + { + "epoch": 2.1, + "learning_rate": 4.393556082100823e-07, + "loss": 0.4214, + "step": 81789 + }, + { + "epoch": 2.1, + "learning_rate": 4.3933269572051665e-07, + "loss": 0.436, + "step": 81790 + }, + { + "epoch": 2.1, + "learning_rate": 4.3930978366022776e-07, + "loss": 0.4688, + "step": 81791 + }, + { + "epoch": 2.1, + "learning_rate": 4.3928687202923364e-07, + "loss": 0.2868, + "step": 81792 + }, + { + "epoch": 2.1, + "learning_rate": 4.3926396082755214e-07, + "loss": 0.2986, + "step": 81793 + }, + { + "epoch": 2.1, + "learning_rate": 4.392410500552001e-07, + "loss": 0.2681, + "step": 81794 + }, + { + "epoch": 2.1, + "learning_rate": 4.392181397121957e-07, + "loss": 0.364, + "step": 81795 + }, + { + "epoch": 2.1, + "learning_rate": 4.3919522979855574e-07, + "loss": 0.4316, + "step": 81796 + }, + { + "epoch": 2.1, + "learning_rate": 4.391723203142983e-07, + "loss": 0.4907, + "step": 81797 + }, + { + "epoch": 2.1, + "learning_rate": 4.3914941125944084e-07, + "loss": 0.3945, + "step": 81798 + }, + { + "epoch": 2.1, + "learning_rate": 4.391265026340013e-07, + "loss": 0.4065, + "step": 81799 + }, + { + "epoch": 2.1, + "learning_rate": 4.3910359443799636e-07, + "loss": 0.4697, + "step": 81800 + }, + { + "epoch": 2.1, + "learning_rate": 4.3908068667144406e-07, + "loss": 0.373, + "step": 81801 + }, + { + "epoch": 2.1, + "learning_rate": 4.390577793343618e-07, + "loss": 0.3755, + "step": 81802 + }, + { + "epoch": 2.1, + "learning_rate": 4.3903487242676794e-07, + "loss": 0.4321, + "step": 81803 + }, + { + "epoch": 2.1, + "learning_rate": 4.3901196594867864e-07, + "loss": 0.3989, + "step": 81804 + }, + { + "epoch": 2.1, + "learning_rate": 4.38989059900112e-07, + "loss": 0.3833, + "step": 81805 + }, + { + "epoch": 2.1, + "learning_rate": 4.3896615428108576e-07, + "loss": 0.4746, + "step": 81806 + }, + { + "epoch": 2.1, + "learning_rate": 4.3894324909161764e-07, + "loss": 0.4395, + "step": 81807 + }, + { + "epoch": 2.1, + "learning_rate": 4.389203443317245e-07, + "loss": 0.4263, + "step": 81808 + }, + { + "epoch": 2.1, + "learning_rate": 4.3889744000142426e-07, + "loss": 0.498, + "step": 81809 + }, + { + "epoch": 2.1, + "learning_rate": 4.3887453610073445e-07, + "loss": 0.5801, + "step": 81810 + }, + { + "epoch": 2.1, + "learning_rate": 4.3885163262967294e-07, + "loss": 0.3821, + "step": 81811 + }, + { + "epoch": 2.1, + "learning_rate": 4.3882872958825656e-07, + "loss": 0.4419, + "step": 81812 + }, + { + "epoch": 2.1, + "learning_rate": 4.388058269765037e-07, + "loss": 0.3159, + "step": 81813 + }, + { + "epoch": 2.1, + "learning_rate": 4.387829247944309e-07, + "loss": 0.4678, + "step": 81814 + }, + { + "epoch": 2.1, + "learning_rate": 4.3876002304205627e-07, + "loss": 0.4192, + "step": 81815 + }, + { + "epoch": 2.1, + "learning_rate": 4.387371217193977e-07, + "loss": 0.48, + "step": 81816 + }, + { + "epoch": 2.1, + "learning_rate": 4.387142208264719e-07, + "loss": 0.5439, + "step": 81817 + }, + { + "epoch": 2.1, + "learning_rate": 4.386913203632968e-07, + "loss": 0.342, + "step": 81818 + }, + { + "epoch": 2.1, + "learning_rate": 4.3866842032988993e-07, + "loss": 0.3169, + "step": 81819 + }, + { + "epoch": 2.1, + "learning_rate": 4.3864552072626926e-07, + "loss": 0.345, + "step": 81820 + }, + { + "epoch": 2.1, + "learning_rate": 4.3862262155245154e-07, + "loss": 0.3807, + "step": 81821 + }, + { + "epoch": 2.1, + "learning_rate": 4.385997228084546e-07, + "loss": 0.3123, + "step": 81822 + }, + { + "epoch": 2.1, + "learning_rate": 4.3857682449429647e-07, + "loss": 0.4258, + "step": 81823 + }, + { + "epoch": 2.1, + "learning_rate": 4.3855392660999424e-07, + "loss": 0.3093, + "step": 81824 + }, + { + "epoch": 2.1, + "learning_rate": 4.3853102915556504e-07, + "loss": 0.2477, + "step": 81825 + }, + { + "epoch": 2.1, + "learning_rate": 4.3850813213102687e-07, + "loss": 0.5315, + "step": 81826 + }, + { + "epoch": 2.1, + "learning_rate": 4.3848523553639714e-07, + "loss": 0.3264, + "step": 81827 + }, + { + "epoch": 2.1, + "learning_rate": 4.3846233937169387e-07, + "loss": 0.4258, + "step": 81828 + }, + { + "epoch": 2.1, + "learning_rate": 4.384394436369337e-07, + "loss": 0.3511, + "step": 81829 + }, + { + "epoch": 2.1, + "learning_rate": 4.384165483321348e-07, + "loss": 0.373, + "step": 81830 + }, + { + "epoch": 2.1, + "learning_rate": 4.3839365345731437e-07, + "loss": 0.4512, + "step": 81831 + }, + { + "epoch": 2.1, + "learning_rate": 4.3837075901249053e-07, + "loss": 0.6045, + "step": 81832 + }, + { + "epoch": 2.1, + "learning_rate": 4.383478649976804e-07, + "loss": 0.2977, + "step": 81833 + }, + { + "epoch": 2.1, + "learning_rate": 4.3832497141290104e-07, + "loss": 0.4448, + "step": 81834 + }, + { + "epoch": 2.1, + "learning_rate": 4.383020782581706e-07, + "loss": 0.5083, + "step": 81835 + }, + { + "epoch": 2.1, + "learning_rate": 4.382791855335062e-07, + "loss": 0.3293, + "step": 81836 + }, + { + "epoch": 2.1, + "learning_rate": 4.382562932389261e-07, + "loss": 0.3843, + "step": 81837 + }, + { + "epoch": 2.1, + "learning_rate": 4.382334013744469e-07, + "loss": 0.342, + "step": 81838 + }, + { + "epoch": 2.1, + "learning_rate": 4.3821050994008656e-07, + "loss": 0.3762, + "step": 81839 + }, + { + "epoch": 2.1, + "learning_rate": 4.3818761893586296e-07, + "loss": 0.3945, + "step": 81840 + }, + { + "epoch": 2.1, + "learning_rate": 4.3816472836179297e-07, + "loss": 0.4214, + "step": 81841 + }, + { + "epoch": 2.1, + "learning_rate": 4.3814183821789444e-07, + "loss": 0.479, + "step": 81842 + }, + { + "epoch": 2.1, + "learning_rate": 4.381189485041852e-07, + "loss": 0.4395, + "step": 81843 + }, + { + "epoch": 2.1, + "learning_rate": 4.380960592206819e-07, + "loss": 0.3232, + "step": 81844 + }, + { + "epoch": 2.1, + "learning_rate": 4.380731703674032e-07, + "loss": 0.4032, + "step": 81845 + }, + { + "epoch": 2.1, + "learning_rate": 4.3805028194436555e-07, + "loss": 0.4331, + "step": 81846 + }, + { + "epoch": 2.1, + "learning_rate": 4.3802739395158707e-07, + "loss": 0.4673, + "step": 81847 + }, + { + "epoch": 2.1, + "learning_rate": 4.38004506389085e-07, + "loss": 0.4697, + "step": 81848 + }, + { + "epoch": 2.1, + "learning_rate": 4.379816192568776e-07, + "loss": 0.4575, + "step": 81849 + }, + { + "epoch": 2.1, + "learning_rate": 4.379587325549814e-07, + "loss": 0.5161, + "step": 81850 + }, + { + "epoch": 2.1, + "learning_rate": 4.379358462834143e-07, + "loss": 0.5234, + "step": 81851 + }, + { + "epoch": 2.1, + "learning_rate": 4.3791296044219395e-07, + "loss": 0.4565, + "step": 81852 + }, + { + "epoch": 2.1, + "learning_rate": 4.378900750313381e-07, + "loss": 0.4312, + "step": 81853 + }, + { + "epoch": 2.1, + "learning_rate": 4.37867190050864e-07, + "loss": 0.3591, + "step": 81854 + }, + { + "epoch": 2.1, + "learning_rate": 4.3784430550078876e-07, + "loss": 0.4932, + "step": 81855 + }, + { + "epoch": 2.1, + "learning_rate": 4.378214213811303e-07, + "loss": 0.3955, + "step": 81856 + }, + { + "epoch": 2.1, + "learning_rate": 4.3779853769190654e-07, + "loss": 0.2921, + "step": 81857 + }, + { + "epoch": 2.1, + "learning_rate": 4.377756544331341e-07, + "loss": 0.4265, + "step": 81858 + }, + { + "epoch": 2.1, + "learning_rate": 4.3775277160483113e-07, + "loss": 0.4297, + "step": 81859 + }, + { + "epoch": 2.1, + "learning_rate": 4.37729889207015e-07, + "loss": 0.4612, + "step": 81860 + }, + { + "epoch": 2.1, + "learning_rate": 4.3770700723970356e-07, + "loss": 0.5005, + "step": 81861 + }, + { + "epoch": 2.1, + "learning_rate": 4.376841257029136e-07, + "loss": 0.3412, + "step": 81862 + }, + { + "epoch": 2.1, + "learning_rate": 4.3766124459666354e-07, + "loss": 0.3938, + "step": 81863 + }, + { + "epoch": 2.1, + "learning_rate": 4.3763836392096986e-07, + "loss": 0.4263, + "step": 81864 + }, + { + "epoch": 2.1, + "learning_rate": 4.3761548367585076e-07, + "loss": 0.4951, + "step": 81865 + }, + { + "epoch": 2.1, + "learning_rate": 4.3759260386132404e-07, + "loss": 0.4043, + "step": 81866 + }, + { + "epoch": 2.1, + "learning_rate": 4.3756972447740627e-07, + "loss": 0.4451, + "step": 81867 + }, + { + "epoch": 2.1, + "learning_rate": 4.375468455241156e-07, + "loss": 0.4341, + "step": 81868 + }, + { + "epoch": 2.1, + "learning_rate": 4.3752396700146945e-07, + "loss": 0.2817, + "step": 81869 + }, + { + "epoch": 2.1, + "learning_rate": 4.3750108890948566e-07, + "loss": 0.4536, + "step": 81870 + }, + { + "epoch": 2.1, + "learning_rate": 4.3747821124818107e-07, + "loss": 0.3799, + "step": 81871 + }, + { + "epoch": 2.1, + "learning_rate": 4.3745533401757394e-07, + "loss": 0.3665, + "step": 81872 + }, + { + "epoch": 2.1, + "learning_rate": 4.3743245721768105e-07, + "loss": 0.4507, + "step": 81873 + }, + { + "epoch": 2.1, + "learning_rate": 4.3740958084852056e-07, + "loss": 0.4238, + "step": 81874 + }, + { + "epoch": 2.1, + "learning_rate": 4.373867049101093e-07, + "loss": 0.4766, + "step": 81875 + }, + { + "epoch": 2.1, + "learning_rate": 4.373638294024653e-07, + "loss": 0.5103, + "step": 81876 + }, + { + "epoch": 2.1, + "learning_rate": 4.373409543256058e-07, + "loss": 0.4336, + "step": 81877 + }, + { + "epoch": 2.1, + "learning_rate": 4.3731807967954893e-07, + "loss": 0.4858, + "step": 81878 + }, + { + "epoch": 2.1, + "learning_rate": 4.3729520546431133e-07, + "loss": 0.5317, + "step": 81879 + }, + { + "epoch": 2.1, + "learning_rate": 4.3727233167991095e-07, + "loss": 0.3926, + "step": 81880 + }, + { + "epoch": 2.1, + "learning_rate": 4.3724945832636515e-07, + "loss": 0.4268, + "step": 81881 + }, + { + "epoch": 2.1, + "learning_rate": 4.3722658540369204e-07, + "loss": 0.3923, + "step": 81882 + }, + { + "epoch": 2.1, + "learning_rate": 4.372037129119086e-07, + "loss": 0.4912, + "step": 81883 + }, + { + "epoch": 2.1, + "learning_rate": 4.3718084085103214e-07, + "loss": 0.4092, + "step": 81884 + }, + { + "epoch": 2.1, + "learning_rate": 4.371579692210804e-07, + "loss": 0.314, + "step": 81885 + }, + { + "epoch": 2.1, + "learning_rate": 4.3713509802207083e-07, + "loss": 0.4023, + "step": 81886 + }, + { + "epoch": 2.1, + "learning_rate": 4.3711222725402143e-07, + "loss": 0.3891, + "step": 81887 + }, + { + "epoch": 2.1, + "learning_rate": 4.3708935691694895e-07, + "loss": 0.3198, + "step": 81888 + }, + { + "epoch": 2.1, + "learning_rate": 4.3706648701087135e-07, + "loss": 0.5049, + "step": 81889 + }, + { + "epoch": 2.1, + "learning_rate": 4.37043617535806e-07, + "loss": 0.3833, + "step": 81890 + }, + { + "epoch": 2.1, + "learning_rate": 4.3702074849177075e-07, + "loss": 0.4072, + "step": 81891 + }, + { + "epoch": 2.1, + "learning_rate": 4.369978798787829e-07, + "loss": 0.3993, + "step": 81892 + }, + { + "epoch": 2.1, + "learning_rate": 4.3697501169685956e-07, + "loss": 0.3945, + "step": 81893 + }, + { + "epoch": 2.1, + "learning_rate": 4.3695214394601854e-07, + "loss": 0.3301, + "step": 81894 + }, + { + "epoch": 2.1, + "learning_rate": 4.3692927662627764e-07, + "loss": 0.4077, + "step": 81895 + }, + { + "epoch": 2.1, + "learning_rate": 4.369064097376539e-07, + "loss": 0.4025, + "step": 81896 + }, + { + "epoch": 2.1, + "learning_rate": 4.3688354328016495e-07, + "loss": 0.4546, + "step": 81897 + }, + { + "epoch": 2.1, + "learning_rate": 4.368606772538284e-07, + "loss": 0.425, + "step": 81898 + }, + { + "epoch": 2.1, + "learning_rate": 4.3683781165866207e-07, + "loss": 0.3999, + "step": 81899 + }, + { + "epoch": 2.1, + "learning_rate": 4.3681494649468275e-07, + "loss": 0.4268, + "step": 81900 + }, + { + "epoch": 2.1, + "learning_rate": 4.367920817619084e-07, + "loss": 0.3645, + "step": 81901 + }, + { + "epoch": 2.1, + "learning_rate": 4.3676921746035677e-07, + "loss": 0.3606, + "step": 81902 + }, + { + "epoch": 2.1, + "learning_rate": 4.3674635359004463e-07, + "loss": 0.3967, + "step": 81903 + }, + { + "epoch": 2.1, + "learning_rate": 4.367234901509904e-07, + "loss": 0.5176, + "step": 81904 + }, + { + "epoch": 2.1, + "learning_rate": 4.3670062714321065e-07, + "loss": 0.3181, + "step": 81905 + }, + { + "epoch": 2.1, + "learning_rate": 4.3667776456672333e-07, + "loss": 0.5127, + "step": 81906 + }, + { + "epoch": 2.1, + "learning_rate": 4.36654902421546e-07, + "loss": 0.412, + "step": 81907 + }, + { + "epoch": 2.1, + "learning_rate": 4.3663204070769645e-07, + "loss": 0.5024, + "step": 81908 + }, + { + "epoch": 2.1, + "learning_rate": 4.3660917942519135e-07, + "loss": 0.3887, + "step": 81909 + }, + { + "epoch": 2.1, + "learning_rate": 4.365863185740488e-07, + "loss": 0.312, + "step": 81910 + }, + { + "epoch": 2.1, + "learning_rate": 4.365634581542863e-07, + "loss": 0.3118, + "step": 81911 + }, + { + "epoch": 2.1, + "learning_rate": 4.365405981659218e-07, + "loss": 0.343, + "step": 81912 + }, + { + "epoch": 2.1, + "learning_rate": 4.365177386089717e-07, + "loss": 0.3181, + "step": 81913 + }, + { + "epoch": 2.1, + "learning_rate": 4.36494879483454e-07, + "loss": 0.4524, + "step": 81914 + }, + { + "epoch": 2.1, + "learning_rate": 4.3647202078938617e-07, + "loss": 0.3643, + "step": 81915 + }, + { + "epoch": 2.1, + "learning_rate": 4.364491625267862e-07, + "loss": 0.3511, + "step": 81916 + }, + { + "epoch": 2.1, + "learning_rate": 4.364263046956709e-07, + "loss": 0.3574, + "step": 81917 + }, + { + "epoch": 2.1, + "learning_rate": 4.3640344729605805e-07, + "loss": 0.415, + "step": 81918 + }, + { + "epoch": 2.1, + "learning_rate": 4.3638059032796514e-07, + "loss": 0.2694, + "step": 81919 + }, + { + "epoch": 2.1, + "learning_rate": 4.3635773379141005e-07, + "loss": 0.4609, + "step": 81920 + }, + { + "epoch": 2.1, + "learning_rate": 4.363348776864095e-07, + "loss": 0.4668, + "step": 81921 + }, + { + "epoch": 2.1, + "learning_rate": 4.363120220129819e-07, + "loss": 0.3755, + "step": 81922 + }, + { + "epoch": 2.1, + "learning_rate": 4.362891667711438e-07, + "loss": 0.4434, + "step": 81923 + }, + { + "epoch": 2.1, + "learning_rate": 4.3626631196091323e-07, + "loss": 0.3798, + "step": 81924 + }, + { + "epoch": 2.1, + "learning_rate": 4.36243457582308e-07, + "loss": 0.4009, + "step": 81925 + }, + { + "epoch": 2.1, + "learning_rate": 4.3622060363534484e-07, + "loss": 0.3492, + "step": 81926 + }, + { + "epoch": 2.1, + "learning_rate": 4.3619775012004166e-07, + "loss": 0.3634, + "step": 81927 + }, + { + "epoch": 2.1, + "learning_rate": 4.3617489703641585e-07, + "loss": 0.3507, + "step": 81928 + }, + { + "epoch": 2.1, + "learning_rate": 4.361520443844855e-07, + "loss": 0.3545, + "step": 81929 + }, + { + "epoch": 2.1, + "learning_rate": 4.361291921642671e-07, + "loss": 0.5527, + "step": 81930 + }, + { + "epoch": 2.1, + "learning_rate": 4.3610634037577877e-07, + "loss": 0.4019, + "step": 81931 + }, + { + "epoch": 2.1, + "learning_rate": 4.3608348901903826e-07, + "loss": 0.3911, + "step": 81932 + }, + { + "epoch": 2.1, + "learning_rate": 4.3606063809406257e-07, + "loss": 0.3159, + "step": 81933 + }, + { + "epoch": 2.1, + "learning_rate": 4.360377876008691e-07, + "loss": 0.5005, + "step": 81934 + }, + { + "epoch": 2.1, + "learning_rate": 4.360149375394754e-07, + "loss": 0.4185, + "step": 81935 + }, + { + "epoch": 2.1, + "learning_rate": 4.359920879098993e-07, + "loss": 0.425, + "step": 81936 + }, + { + "epoch": 2.1, + "learning_rate": 4.359692387121583e-07, + "loss": 0.4062, + "step": 81937 + }, + { + "epoch": 2.1, + "learning_rate": 4.3594638994626954e-07, + "loss": 0.3031, + "step": 81938 + }, + { + "epoch": 2.1, + "learning_rate": 4.3592354161225054e-07, + "loss": 0.4448, + "step": 81939 + }, + { + "epoch": 2.1, + "learning_rate": 4.359006937101191e-07, + "loss": 0.4414, + "step": 81940 + }, + { + "epoch": 2.1, + "learning_rate": 4.358778462398928e-07, + "loss": 0.313, + "step": 81941 + }, + { + "epoch": 2.1, + "learning_rate": 4.3585499920158887e-07, + "loss": 0.2969, + "step": 81942 + }, + { + "epoch": 2.1, + "learning_rate": 4.3583215259522453e-07, + "loss": 0.4255, + "step": 81943 + }, + { + "epoch": 2.1, + "learning_rate": 4.3580930642081757e-07, + "loss": 0.3621, + "step": 81944 + }, + { + "epoch": 2.1, + "learning_rate": 4.3578646067838555e-07, + "loss": 0.3906, + "step": 81945 + }, + { + "epoch": 2.1, + "learning_rate": 4.3576361536794615e-07, + "loss": 0.4043, + "step": 81946 + }, + { + "epoch": 2.1, + "learning_rate": 4.3574077048951627e-07, + "loss": 0.4463, + "step": 81947 + }, + { + "epoch": 2.1, + "learning_rate": 4.3571792604311375e-07, + "loss": 0.4653, + "step": 81948 + }, + { + "epoch": 2.1, + "learning_rate": 4.3569508202875647e-07, + "loss": 0.519, + "step": 81949 + }, + { + "epoch": 2.1, + "learning_rate": 4.3567223844646106e-07, + "loss": 0.2714, + "step": 81950 + }, + { + "epoch": 2.1, + "learning_rate": 4.356493952962456e-07, + "loss": 0.4243, + "step": 81951 + }, + { + "epoch": 2.1, + "learning_rate": 4.3562655257812765e-07, + "loss": 0.4219, + "step": 81952 + }, + { + "epoch": 2.1, + "learning_rate": 4.3560371029212427e-07, + "loss": 0.5439, + "step": 81953 + }, + { + "epoch": 2.1, + "learning_rate": 4.355808684382535e-07, + "loss": 0.365, + "step": 81954 + }, + { + "epoch": 2.1, + "learning_rate": 4.355580270165321e-07, + "loss": 0.366, + "step": 81955 + }, + { + "epoch": 2.1, + "learning_rate": 4.3553518602697805e-07, + "loss": 0.3887, + "step": 81956 + }, + { + "epoch": 2.1, + "learning_rate": 4.3551234546960867e-07, + "loss": 0.3979, + "step": 81957 + }, + { + "epoch": 2.1, + "learning_rate": 4.3548950534444197e-07, + "loss": 0.458, + "step": 81958 + }, + { + "epoch": 2.1, + "learning_rate": 4.354666656514945e-07, + "loss": 0.375, + "step": 81959 + }, + { + "epoch": 2.1, + "learning_rate": 4.3544382639078436e-07, + "loss": 0.4907, + "step": 81960 + }, + { + "epoch": 2.1, + "learning_rate": 4.354209875623289e-07, + "loss": 0.3574, + "step": 81961 + }, + { + "epoch": 2.1, + "learning_rate": 4.3539814916614605e-07, + "loss": 0.2478, + "step": 81962 + }, + { + "epoch": 2.1, + "learning_rate": 4.353753112022528e-07, + "loss": 0.3018, + "step": 81963 + }, + { + "epoch": 2.1, + "learning_rate": 4.353524736706663e-07, + "loss": 0.3929, + "step": 81964 + }, + { + "epoch": 2.1, + "learning_rate": 4.3532963657140453e-07, + "loss": 0.3774, + "step": 81965 + }, + { + "epoch": 2.1, + "learning_rate": 4.3530679990448527e-07, + "loss": 0.4067, + "step": 81966 + }, + { + "epoch": 2.1, + "learning_rate": 4.3528396366992523e-07, + "loss": 0.4116, + "step": 81967 + }, + { + "epoch": 2.1, + "learning_rate": 4.352611278677423e-07, + "loss": 0.481, + "step": 81968 + }, + { + "epoch": 2.1, + "learning_rate": 4.3523829249795396e-07, + "loss": 0.4695, + "step": 81969 + }, + { + "epoch": 2.1, + "learning_rate": 4.35215457560578e-07, + "loss": 0.4546, + "step": 81970 + }, + { + "epoch": 2.1, + "learning_rate": 4.3519262305563133e-07, + "loss": 0.3656, + "step": 81971 + }, + { + "epoch": 2.1, + "learning_rate": 4.3516978898313195e-07, + "loss": 0.4897, + "step": 81972 + }, + { + "epoch": 2.1, + "learning_rate": 4.351469553430969e-07, + "loss": 0.3989, + "step": 81973 + }, + { + "epoch": 2.1, + "learning_rate": 4.351241221355437e-07, + "loss": 0.4629, + "step": 81974 + }, + { + "epoch": 2.1, + "learning_rate": 4.351012893604904e-07, + "loss": 0.562, + "step": 81975 + }, + { + "epoch": 2.1, + "learning_rate": 4.350784570179537e-07, + "loss": 0.4702, + "step": 81976 + }, + { + "epoch": 2.1, + "learning_rate": 4.350556251079515e-07, + "loss": 0.3723, + "step": 81977 + }, + { + "epoch": 2.1, + "learning_rate": 4.3503279363050106e-07, + "loss": 0.4824, + "step": 81978 + }, + { + "epoch": 2.1, + "learning_rate": 4.350099625856205e-07, + "loss": 0.4465, + "step": 81979 + }, + { + "epoch": 2.1, + "learning_rate": 4.349871319733266e-07, + "loss": 0.4308, + "step": 81980 + }, + { + "epoch": 2.1, + "learning_rate": 4.3496430179363685e-07, + "loss": 0.4951, + "step": 81981 + }, + { + "epoch": 2.1, + "learning_rate": 4.349414720465695e-07, + "loss": 0.4102, + "step": 81982 + }, + { + "epoch": 2.1, + "learning_rate": 4.3491864273214143e-07, + "loss": 0.3772, + "step": 81983 + }, + { + "epoch": 2.1, + "learning_rate": 4.348958138503698e-07, + "loss": 0.5127, + "step": 81984 + }, + { + "epoch": 2.1, + "learning_rate": 4.348729854012724e-07, + "loss": 0.3254, + "step": 81985 + }, + { + "epoch": 2.1, + "learning_rate": 4.348501573848667e-07, + "loss": 0.459, + "step": 81986 + }, + { + "epoch": 2.1, + "learning_rate": 4.3482732980117086e-07, + "loss": 0.395, + "step": 81987 + }, + { + "epoch": 2.1, + "learning_rate": 4.348045026502012e-07, + "loss": 0.5405, + "step": 81988 + }, + { + "epoch": 2.1, + "learning_rate": 4.347816759319758e-07, + "loss": 0.3989, + "step": 81989 + }, + { + "epoch": 2.1, + "learning_rate": 4.347588496465121e-07, + "loss": 0.4307, + "step": 81990 + }, + { + "epoch": 2.1, + "learning_rate": 4.347360237938279e-07, + "loss": 0.5132, + "step": 81991 + }, + { + "epoch": 2.1, + "learning_rate": 4.347131983739403e-07, + "loss": 0.2974, + "step": 81992 + }, + { + "epoch": 2.1, + "learning_rate": 4.3469037338686654e-07, + "loss": 0.4402, + "step": 81993 + }, + { + "epoch": 2.1, + "learning_rate": 4.3466754883262424e-07, + "loss": 0.3707, + "step": 81994 + }, + { + "epoch": 2.1, + "learning_rate": 4.3464472471123103e-07, + "loss": 0.4668, + "step": 81995 + }, + { + "epoch": 2.1, + "learning_rate": 4.346219010227048e-07, + "loss": 0.4287, + "step": 81996 + }, + { + "epoch": 2.1, + "learning_rate": 4.3459907776706216e-07, + "loss": 0.4595, + "step": 81997 + }, + { + "epoch": 2.1, + "learning_rate": 4.34576254944321e-07, + "loss": 0.4307, + "step": 81998 + }, + { + "epoch": 2.1, + "learning_rate": 4.3455343255449894e-07, + "loss": 0.5122, + "step": 81999 + }, + { + "epoch": 2.1, + "learning_rate": 4.345306105976135e-07, + "loss": 0.4087, + "step": 82000 + }, + { + "epoch": 2.1, + "learning_rate": 4.3450778907368167e-07, + "loss": 0.4067, + "step": 82001 + }, + { + "epoch": 2.1, + "learning_rate": 4.344849679827216e-07, + "loss": 0.3677, + "step": 82002 + }, + { + "epoch": 2.1, + "learning_rate": 4.3446214732475004e-07, + "loss": 0.4243, + "step": 82003 + }, + { + "epoch": 2.1, + "learning_rate": 4.3443932709978515e-07, + "loss": 0.4839, + "step": 82004 + }, + { + "epoch": 2.1, + "learning_rate": 4.344165073078437e-07, + "loss": 0.4458, + "step": 82005 + }, + { + "epoch": 2.1, + "learning_rate": 4.343936879489436e-07, + "loss": 0.4072, + "step": 82006 + }, + { + "epoch": 2.1, + "learning_rate": 4.3437086902310216e-07, + "loss": 0.2474, + "step": 82007 + }, + { + "epoch": 2.1, + "learning_rate": 4.3434805053033727e-07, + "loss": 0.375, + "step": 82008 + }, + { + "epoch": 2.1, + "learning_rate": 4.343252324706658e-07, + "loss": 0.5015, + "step": 82009 + }, + { + "epoch": 2.1, + "learning_rate": 4.343024148441055e-07, + "loss": 0.2089, + "step": 82010 + }, + { + "epoch": 2.1, + "learning_rate": 4.342795976506737e-07, + "loss": 0.4897, + "step": 82011 + }, + { + "epoch": 2.1, + "learning_rate": 4.342567808903884e-07, + "loss": 0.4316, + "step": 82012 + }, + { + "epoch": 2.1, + "learning_rate": 4.3423396456326677e-07, + "loss": 0.4785, + "step": 82013 + }, + { + "epoch": 2.1, + "learning_rate": 4.3421114866932576e-07, + "loss": 0.4062, + "step": 82014 + }, + { + "epoch": 2.1, + "learning_rate": 4.341883332085832e-07, + "loss": 0.3679, + "step": 82015 + }, + { + "epoch": 2.1, + "learning_rate": 4.341655181810566e-07, + "loss": 0.5864, + "step": 82016 + }, + { + "epoch": 2.1, + "learning_rate": 4.34142703586764e-07, + "loss": 0.3621, + "step": 82017 + }, + { + "epoch": 2.1, + "learning_rate": 4.3411988942572177e-07, + "loss": 0.3455, + "step": 82018 + }, + { + "epoch": 2.1, + "learning_rate": 4.34097075697948e-07, + "loss": 0.4795, + "step": 82019 + }, + { + "epoch": 2.1, + "learning_rate": 4.3407426240346035e-07, + "loss": 0.4272, + "step": 82020 + }, + { + "epoch": 2.1, + "learning_rate": 4.340514495422757e-07, + "loss": 0.3164, + "step": 82021 + }, + { + "epoch": 2.1, + "learning_rate": 4.340286371144122e-07, + "loss": 0.4868, + "step": 82022 + }, + { + "epoch": 2.1, + "learning_rate": 4.340058251198866e-07, + "loss": 0.5, + "step": 82023 + }, + { + "epoch": 2.1, + "learning_rate": 4.339830135587167e-07, + "loss": 0.3604, + "step": 82024 + }, + { + "epoch": 2.1, + "learning_rate": 4.3396020243092033e-07, + "loss": 0.4204, + "step": 82025 + }, + { + "epoch": 2.1, + "learning_rate": 4.3393739173651436e-07, + "loss": 0.3672, + "step": 82026 + }, + { + "epoch": 2.1, + "learning_rate": 4.339145814755163e-07, + "loss": 0.4868, + "step": 82027 + }, + { + "epoch": 2.1, + "learning_rate": 4.33891771647944e-07, + "loss": 0.3092, + "step": 82028 + }, + { + "epoch": 2.1, + "learning_rate": 4.3386896225381496e-07, + "loss": 0.499, + "step": 82029 + }, + { + "epoch": 2.1, + "learning_rate": 4.338461532931461e-07, + "loss": 0.3621, + "step": 82030 + }, + { + "epoch": 2.1, + "learning_rate": 4.338233447659553e-07, + "loss": 0.417, + "step": 82031 + }, + { + "epoch": 2.1, + "learning_rate": 4.3380053667226026e-07, + "loss": 0.4785, + "step": 82032 + }, + { + "epoch": 2.1, + "learning_rate": 4.3377772901207766e-07, + "loss": 0.4258, + "step": 82033 + }, + { + "epoch": 2.1, + "learning_rate": 4.3375492178542585e-07, + "loss": 0.3726, + "step": 82034 + }, + { + "epoch": 2.1, + "learning_rate": 4.3373211499232154e-07, + "loss": 0.4712, + "step": 82035 + }, + { + "epoch": 2.1, + "learning_rate": 4.3370930863278244e-07, + "loss": 0.2783, + "step": 82036 + }, + { + "epoch": 2.1, + "learning_rate": 4.3368650270682637e-07, + "loss": 0.3645, + "step": 82037 + }, + { + "epoch": 2.1, + "learning_rate": 4.336636972144703e-07, + "loss": 0.3412, + "step": 82038 + }, + { + "epoch": 2.1, + "learning_rate": 4.3364089215573184e-07, + "loss": 0.5117, + "step": 82039 + }, + { + "epoch": 2.1, + "learning_rate": 4.3361808753062843e-07, + "loss": 0.4038, + "step": 82040 + }, + { + "epoch": 2.1, + "learning_rate": 4.3359528333917805e-07, + "loss": 0.4658, + "step": 82041 + }, + { + "epoch": 2.1, + "learning_rate": 4.335724795813978e-07, + "loss": 0.3435, + "step": 82042 + }, + { + "epoch": 2.1, + "learning_rate": 4.335496762573045e-07, + "loss": 0.4307, + "step": 82043 + }, + { + "epoch": 2.1, + "learning_rate": 4.335268733669163e-07, + "loss": 0.3525, + "step": 82044 + }, + { + "epoch": 2.1, + "learning_rate": 4.3350407091025057e-07, + "loss": 0.4487, + "step": 82045 + }, + { + "epoch": 2.1, + "learning_rate": 4.3348126888732496e-07, + "loss": 0.4746, + "step": 82046 + }, + { + "epoch": 2.1, + "learning_rate": 4.334584672981564e-07, + "loss": 0.564, + "step": 82047 + }, + { + "epoch": 2.1, + "learning_rate": 4.3343566614276264e-07, + "loss": 0.3049, + "step": 82048 + }, + { + "epoch": 2.1, + "learning_rate": 4.3341286542116106e-07, + "loss": 0.4434, + "step": 82049 + }, + { + "epoch": 2.1, + "learning_rate": 4.3339006513336964e-07, + "loss": 0.3294, + "step": 82050 + }, + { + "epoch": 2.1, + "learning_rate": 4.3336726527940504e-07, + "loss": 0.3794, + "step": 82051 + }, + { + "epoch": 2.1, + "learning_rate": 4.333444658592854e-07, + "loss": 0.4126, + "step": 82052 + }, + { + "epoch": 2.1, + "learning_rate": 4.333216668730275e-07, + "loss": 0.4678, + "step": 82053 + }, + { + "epoch": 2.1, + "learning_rate": 4.3329886832064953e-07, + "loss": 0.438, + "step": 82054 + }, + { + "epoch": 2.1, + "learning_rate": 4.3327607020216814e-07, + "loss": 0.521, + "step": 82055 + }, + { + "epoch": 2.1, + "learning_rate": 4.3325327251760124e-07, + "loss": 0.3794, + "step": 82056 + }, + { + "epoch": 2.1, + "learning_rate": 4.332304752669662e-07, + "loss": 0.4805, + "step": 82057 + }, + { + "epoch": 2.1, + "learning_rate": 4.3320767845028096e-07, + "loss": 0.5708, + "step": 82058 + }, + { + "epoch": 2.1, + "learning_rate": 4.331848820675621e-07, + "loss": 0.3173, + "step": 82059 + }, + { + "epoch": 2.1, + "learning_rate": 4.3316208611882754e-07, + "loss": 0.3507, + "step": 82060 + }, + { + "epoch": 2.1, + "learning_rate": 4.3313929060409473e-07, + "loss": 0.3901, + "step": 82061 + }, + { + "epoch": 2.1, + "learning_rate": 4.331164955233815e-07, + "loss": 0.4629, + "step": 82062 + }, + { + "epoch": 2.1, + "learning_rate": 4.330937008767048e-07, + "loss": 0.4834, + "step": 82063 + }, + { + "epoch": 2.1, + "learning_rate": 4.33070906664082e-07, + "loss": 0.3613, + "step": 82064 + }, + { + "epoch": 2.1, + "learning_rate": 4.3304811288553055e-07, + "loss": 0.3048, + "step": 82065 + }, + { + "epoch": 2.1, + "learning_rate": 4.3302531954106815e-07, + "loss": 0.3394, + "step": 82066 + }, + { + "epoch": 2.1, + "learning_rate": 4.3300252663071257e-07, + "loss": 0.3481, + "step": 82067 + }, + { + "epoch": 2.1, + "learning_rate": 4.3297973415448054e-07, + "loss": 0.3896, + "step": 82068 + }, + { + "epoch": 2.1, + "learning_rate": 4.3295694211238974e-07, + "loss": 0.376, + "step": 82069 + }, + { + "epoch": 2.1, + "learning_rate": 4.329341505044579e-07, + "loss": 0.3811, + "step": 82070 + }, + { + "epoch": 2.1, + "learning_rate": 4.3291135933070256e-07, + "loss": 0.4717, + "step": 82071 + }, + { + "epoch": 2.1, + "learning_rate": 4.3288856859114096e-07, + "loss": 0.4722, + "step": 82072 + }, + { + "epoch": 2.1, + "learning_rate": 4.328657782857902e-07, + "loss": 0.4697, + "step": 82073 + }, + { + "epoch": 2.1, + "learning_rate": 4.3284298841466793e-07, + "loss": 0.397, + "step": 82074 + }, + { + "epoch": 2.1, + "learning_rate": 4.328201989777921e-07, + "loss": 0.3763, + "step": 82075 + }, + { + "epoch": 2.1, + "learning_rate": 4.3279740997517943e-07, + "loss": 0.4033, + "step": 82076 + }, + { + "epoch": 2.1, + "learning_rate": 4.327746214068477e-07, + "loss": 0.3585, + "step": 82077 + }, + { + "epoch": 2.1, + "learning_rate": 4.3275183327281426e-07, + "loss": 0.5527, + "step": 82078 + }, + { + "epoch": 2.1, + "learning_rate": 4.327290455730972e-07, + "loss": 0.3403, + "step": 82079 + }, + { + "epoch": 2.1, + "learning_rate": 4.327062583077129e-07, + "loss": 0.4287, + "step": 82080 + }, + { + "epoch": 2.1, + "learning_rate": 4.326834714766795e-07, + "loss": 0.4404, + "step": 82081 + }, + { + "epoch": 2.1, + "learning_rate": 4.326606850800145e-07, + "loss": 0.3576, + "step": 82082 + }, + { + "epoch": 2.1, + "learning_rate": 4.3263789911773487e-07, + "loss": 0.2698, + "step": 82083 + }, + { + "epoch": 2.1, + "learning_rate": 4.326151135898586e-07, + "loss": 0.4072, + "step": 82084 + }, + { + "epoch": 2.1, + "learning_rate": 4.325923284964025e-07, + "loss": 0.3523, + "step": 82085 + }, + { + "epoch": 2.1, + "learning_rate": 4.325695438373843e-07, + "loss": 0.3105, + "step": 82086 + }, + { + "epoch": 2.1, + "learning_rate": 4.325467596128216e-07, + "loss": 0.4792, + "step": 82087 + }, + { + "epoch": 2.1, + "learning_rate": 4.32523975822732e-07, + "loss": 0.4543, + "step": 82088 + }, + { + "epoch": 2.1, + "learning_rate": 4.3250119246713245e-07, + "loss": 0.4727, + "step": 82089 + }, + { + "epoch": 2.1, + "learning_rate": 4.3247840954604065e-07, + "loss": 0.4272, + "step": 82090 + }, + { + "epoch": 2.1, + "learning_rate": 4.32455627059474e-07, + "loss": 0.4224, + "step": 82091 + }, + { + "epoch": 2.1, + "learning_rate": 4.3243284500745067e-07, + "loss": 0.3804, + "step": 82092 + }, + { + "epoch": 2.1, + "learning_rate": 4.3241006338998674e-07, + "loss": 0.5371, + "step": 82093 + }, + { + "epoch": 2.1, + "learning_rate": 4.323872822071004e-07, + "loss": 0.5073, + "step": 82094 + }, + { + "epoch": 2.1, + "learning_rate": 4.3236450145880885e-07, + "loss": 0.3984, + "step": 82095 + }, + { + "epoch": 2.1, + "learning_rate": 4.323417211451302e-07, + "loss": 0.2361, + "step": 82096 + }, + { + "epoch": 2.1, + "learning_rate": 4.32318941266081e-07, + "loss": 0.2567, + "step": 82097 + }, + { + "epoch": 2.1, + "learning_rate": 4.3229616182167905e-07, + "loss": 0.2469, + "step": 82098 + }, + { + "epoch": 2.1, + "learning_rate": 4.3227338281194183e-07, + "loss": 0.5024, + "step": 82099 + }, + { + "epoch": 2.1, + "learning_rate": 4.322506042368872e-07, + "loss": 0.2769, + "step": 82100 + }, + { + "epoch": 2.1, + "learning_rate": 4.3222782609653174e-07, + "loss": 0.395, + "step": 82101 + }, + { + "epoch": 2.1, + "learning_rate": 4.3220504839089365e-07, + "loss": 0.3564, + "step": 82102 + }, + { + "epoch": 2.1, + "learning_rate": 4.321822711199897e-07, + "loss": 0.3584, + "step": 82103 + }, + { + "epoch": 2.1, + "learning_rate": 4.321594942838378e-07, + "loss": 0.3033, + "step": 82104 + }, + { + "epoch": 2.1, + "learning_rate": 4.3213671788245555e-07, + "loss": 0.5078, + "step": 82105 + }, + { + "epoch": 2.1, + "learning_rate": 4.321139419158597e-07, + "loss": 0.4067, + "step": 82106 + }, + { + "epoch": 2.1, + "learning_rate": 4.320911663840682e-07, + "loss": 0.3726, + "step": 82107 + }, + { + "epoch": 2.1, + "learning_rate": 4.320683912870983e-07, + "loss": 0.5308, + "step": 82108 + }, + { + "epoch": 2.1, + "learning_rate": 4.3204561662496784e-07, + "loss": 0.4307, + "step": 82109 + }, + { + "epoch": 2.1, + "learning_rate": 4.320228423976936e-07, + "loss": 0.48, + "step": 82110 + }, + { + "epoch": 2.1, + "learning_rate": 4.320000686052934e-07, + "loss": 0.2898, + "step": 82111 + }, + { + "epoch": 2.1, + "learning_rate": 4.3197729524778505e-07, + "loss": 0.3497, + "step": 82112 + }, + { + "epoch": 2.1, + "learning_rate": 4.3195452232518547e-07, + "loss": 0.4805, + "step": 82113 + }, + { + "epoch": 2.1, + "learning_rate": 4.319317498375118e-07, + "loss": 0.4053, + "step": 82114 + }, + { + "epoch": 2.1, + "learning_rate": 4.3190897778478196e-07, + "loss": 0.459, + "step": 82115 + }, + { + "epoch": 2.1, + "learning_rate": 4.3188620616701323e-07, + "loss": 0.4336, + "step": 82116 + }, + { + "epoch": 2.1, + "learning_rate": 4.318634349842235e-07, + "loss": 0.418, + "step": 82117 + }, + { + "epoch": 2.1, + "learning_rate": 4.318406642364294e-07, + "loss": 0.3164, + "step": 82118 + }, + { + "epoch": 2.1, + "learning_rate": 4.3181789392364887e-07, + "loss": 0.4644, + "step": 82119 + }, + { + "epoch": 2.1, + "learning_rate": 4.317951240458991e-07, + "loss": 0.2532, + "step": 82120 + }, + { + "epoch": 2.1, + "learning_rate": 4.317723546031983e-07, + "loss": 0.4619, + "step": 82121 + }, + { + "epoch": 2.1, + "learning_rate": 4.3174958559556307e-07, + "loss": 0.3735, + "step": 82122 + }, + { + "epoch": 2.1, + "learning_rate": 4.317268170230107e-07, + "loss": 0.4546, + "step": 82123 + }, + { + "epoch": 2.1, + "learning_rate": 4.31704048885559e-07, + "loss": 0.3057, + "step": 82124 + }, + { + "epoch": 2.1, + "learning_rate": 4.3168128118322546e-07, + "loss": 0.5654, + "step": 82125 + }, + { + "epoch": 2.1, + "learning_rate": 4.316585139160277e-07, + "loss": 0.4424, + "step": 82126 + }, + { + "epoch": 2.1, + "learning_rate": 4.316357470839825e-07, + "loss": 0.2769, + "step": 82127 + }, + { + "epoch": 2.1, + "learning_rate": 4.3161298068710783e-07, + "loss": 0.5625, + "step": 82128 + }, + { + "epoch": 2.11, + "learning_rate": 4.3159021472542125e-07, + "loss": 0.4131, + "step": 82129 + }, + { + "epoch": 2.11, + "learning_rate": 4.315674491989395e-07, + "loss": 0.4541, + "step": 82130 + }, + { + "epoch": 2.11, + "learning_rate": 4.315446841076804e-07, + "loss": 0.4282, + "step": 82131 + }, + { + "epoch": 2.11, + "learning_rate": 4.315219194516618e-07, + "loss": 0.2381, + "step": 82132 + }, + { + "epoch": 2.11, + "learning_rate": 4.314991552309004e-07, + "loss": 0.3429, + "step": 82133 + }, + { + "epoch": 2.11, + "learning_rate": 4.3147639144541427e-07, + "loss": 0.4453, + "step": 82134 + }, + { + "epoch": 2.11, + "learning_rate": 4.314536280952201e-07, + "loss": 0.3371, + "step": 82135 + }, + { + "epoch": 2.11, + "learning_rate": 4.314308651803359e-07, + "loss": 0.3572, + "step": 82136 + }, + { + "epoch": 2.11, + "learning_rate": 4.3140810270077886e-07, + "loss": 0.2562, + "step": 82137 + }, + { + "epoch": 2.11, + "learning_rate": 4.313853406565668e-07, + "loss": 0.3823, + "step": 82138 + }, + { + "epoch": 2.11, + "learning_rate": 4.3136257904771655e-07, + "loss": 0.2991, + "step": 82139 + }, + { + "epoch": 2.11, + "learning_rate": 4.313398178742459e-07, + "loss": 0.5137, + "step": 82140 + }, + { + "epoch": 2.11, + "learning_rate": 4.313170571361721e-07, + "loss": 0.4531, + "step": 82141 + }, + { + "epoch": 2.11, + "learning_rate": 4.3129429683351304e-07, + "loss": 0.394, + "step": 82142 + }, + { + "epoch": 2.11, + "learning_rate": 4.312715369662858e-07, + "loss": 0.4937, + "step": 82143 + }, + { + "epoch": 2.11, + "learning_rate": 4.312487775345074e-07, + "loss": 0.2415, + "step": 82144 + }, + { + "epoch": 2.11, + "learning_rate": 4.312260185381957e-07, + "loss": 0.3362, + "step": 82145 + }, + { + "epoch": 2.11, + "learning_rate": 4.312032599773685e-07, + "loss": 0.4634, + "step": 82146 + }, + { + "epoch": 2.11, + "learning_rate": 4.3118050185204234e-07, + "loss": 0.4448, + "step": 82147 + }, + { + "epoch": 2.11, + "learning_rate": 4.3115774416223516e-07, + "loss": 0.4424, + "step": 82148 + }, + { + "epoch": 2.11, + "learning_rate": 4.3113498690796437e-07, + "loss": 0.3174, + "step": 82149 + }, + { + "epoch": 2.11, + "learning_rate": 4.3111223008924767e-07, + "loss": 0.5156, + "step": 82150 + }, + { + "epoch": 2.11, + "learning_rate": 4.3108947370610183e-07, + "loss": 0.4785, + "step": 82151 + }, + { + "epoch": 2.11, + "learning_rate": 4.3106671775854496e-07, + "loss": 0.4644, + "step": 82152 + }, + { + "epoch": 2.11, + "learning_rate": 4.310439622465939e-07, + "loss": 0.429, + "step": 82153 + }, + { + "epoch": 2.11, + "learning_rate": 4.3102120717026626e-07, + "loss": 0.4775, + "step": 82154 + }, + { + "epoch": 2.11, + "learning_rate": 4.309984525295798e-07, + "loss": 0.439, + "step": 82155 + }, + { + "epoch": 2.11, + "learning_rate": 4.309756983245514e-07, + "loss": 0.335, + "step": 82156 + }, + { + "epoch": 2.11, + "learning_rate": 4.309529445551987e-07, + "loss": 0.3657, + "step": 82157 + }, + { + "epoch": 2.11, + "learning_rate": 4.3093019122153915e-07, + "loss": 0.4861, + "step": 82158 + }, + { + "epoch": 2.11, + "learning_rate": 4.309074383235906e-07, + "loss": 0.499, + "step": 82159 + }, + { + "epoch": 2.11, + "learning_rate": 4.308846858613696e-07, + "loss": 0.38, + "step": 82160 + }, + { + "epoch": 2.11, + "learning_rate": 4.3086193383489444e-07, + "loss": 0.3828, + "step": 82161 + }, + { + "epoch": 2.11, + "learning_rate": 4.308391822441818e-07, + "loss": 0.4683, + "step": 82162 + }, + { + "epoch": 2.11, + "learning_rate": 4.308164310892497e-07, + "loss": 0.3556, + "step": 82163 + }, + { + "epoch": 2.11, + "learning_rate": 4.30793680370115e-07, + "loss": 0.2393, + "step": 82164 + }, + { + "epoch": 2.11, + "learning_rate": 4.3077093008679544e-07, + "loss": 0.2894, + "step": 82165 + }, + { + "epoch": 2.11, + "learning_rate": 4.307481802393084e-07, + "loss": 0.3464, + "step": 82166 + }, + { + "epoch": 2.11, + "learning_rate": 4.3072543082767156e-07, + "loss": 0.4341, + "step": 82167 + }, + { + "epoch": 2.11, + "learning_rate": 4.3070268185190174e-07, + "loss": 0.3445, + "step": 82168 + }, + { + "epoch": 2.11, + "learning_rate": 4.3067993331201677e-07, + "loss": 0.4497, + "step": 82169 + }, + { + "epoch": 2.11, + "learning_rate": 4.3065718520803396e-07, + "loss": 0.3394, + "step": 82170 + }, + { + "epoch": 2.11, + "learning_rate": 4.306344375399712e-07, + "loss": 0.3813, + "step": 82171 + }, + { + "epoch": 2.11, + "learning_rate": 4.306116903078454e-07, + "loss": 0.3016, + "step": 82172 + }, + { + "epoch": 2.11, + "learning_rate": 4.305889435116736e-07, + "loss": 0.6045, + "step": 82173 + }, + { + "epoch": 2.11, + "learning_rate": 4.305661971514738e-07, + "loss": 0.4575, + "step": 82174 + }, + { + "epoch": 2.11, + "learning_rate": 4.305434512272632e-07, + "loss": 0.5288, + "step": 82175 + }, + { + "epoch": 2.11, + "learning_rate": 4.3052070573905973e-07, + "loss": 0.5366, + "step": 82176 + }, + { + "epoch": 2.11, + "learning_rate": 4.3049796068687994e-07, + "loss": 0.3804, + "step": 82177 + }, + { + "epoch": 2.11, + "learning_rate": 4.304752160707418e-07, + "loss": 0.4443, + "step": 82178 + }, + { + "epoch": 2.11, + "learning_rate": 4.3045247189066246e-07, + "loss": 0.5044, + "step": 82179 + }, + { + "epoch": 2.11, + "learning_rate": 4.304297281466599e-07, + "loss": 0.3955, + "step": 82180 + }, + { + "epoch": 2.11, + "learning_rate": 4.3040698483875105e-07, + "loss": 0.4307, + "step": 82181 + }, + { + "epoch": 2.11, + "learning_rate": 4.303842419669531e-07, + "loss": 0.3475, + "step": 82182 + }, + { + "epoch": 2.11, + "learning_rate": 4.3036149953128366e-07, + "loss": 0.3716, + "step": 82183 + }, + { + "epoch": 2.11, + "learning_rate": 4.3033875753176063e-07, + "loss": 0.5103, + "step": 82184 + }, + { + "epoch": 2.11, + "learning_rate": 4.303160159684007e-07, + "loss": 0.4011, + "step": 82185 + }, + { + "epoch": 2.11, + "learning_rate": 4.302932748412216e-07, + "loss": 0.3867, + "step": 82186 + }, + { + "epoch": 2.11, + "learning_rate": 4.302705341502406e-07, + "loss": 0.4341, + "step": 82187 + }, + { + "epoch": 2.11, + "learning_rate": 4.3024779389547573e-07, + "loss": 0.4673, + "step": 82188 + }, + { + "epoch": 2.11, + "learning_rate": 4.3022505407694353e-07, + "loss": 0.4272, + "step": 82189 + }, + { + "epoch": 2.11, + "learning_rate": 4.3020231469466184e-07, + "loss": 0.3938, + "step": 82190 + }, + { + "epoch": 2.11, + "learning_rate": 4.301795757486485e-07, + "loss": 0.4219, + "step": 82191 + }, + { + "epoch": 2.11, + "learning_rate": 4.3015683723891993e-07, + "loss": 0.3213, + "step": 82192 + }, + { + "epoch": 2.11, + "learning_rate": 4.3013409916549446e-07, + "loss": 0.394, + "step": 82193 + }, + { + "epoch": 2.11, + "learning_rate": 4.301113615283888e-07, + "loss": 0.4829, + "step": 82194 + }, + { + "epoch": 2.11, + "learning_rate": 4.300886243276206e-07, + "loss": 0.4355, + "step": 82195 + }, + { + "epoch": 2.11, + "learning_rate": 4.300658875632074e-07, + "loss": 0.3472, + "step": 82196 + }, + { + "epoch": 2.11, + "learning_rate": 4.300431512351669e-07, + "loss": 0.3687, + "step": 82197 + }, + { + "epoch": 2.11, + "learning_rate": 4.3002041534351575e-07, + "loss": 0.4678, + "step": 82198 + }, + { + "epoch": 2.11, + "learning_rate": 4.2999767988827187e-07, + "loss": 0.3406, + "step": 82199 + }, + { + "epoch": 2.11, + "learning_rate": 4.2997494486945276e-07, + "loss": 0.2095, + "step": 82200 + }, + { + "epoch": 2.11, + "learning_rate": 4.2995221028707575e-07, + "loss": 0.4009, + "step": 82201 + }, + { + "epoch": 2.11, + "learning_rate": 4.299294761411576e-07, + "loss": 0.3246, + "step": 82202 + }, + { + "epoch": 2.11, + "learning_rate": 4.2990674243171644e-07, + "loss": 0.3227, + "step": 82203 + }, + { + "epoch": 2.11, + "learning_rate": 4.298840091587693e-07, + "loss": 0.4741, + "step": 82204 + }, + { + "epoch": 2.11, + "learning_rate": 4.2986127632233424e-07, + "loss": 0.4648, + "step": 82205 + }, + { + "epoch": 2.11, + "learning_rate": 4.298385439224278e-07, + "loss": 0.4739, + "step": 82206 + }, + { + "epoch": 2.11, + "learning_rate": 4.298158119590677e-07, + "loss": 0.3182, + "step": 82207 + }, + { + "epoch": 2.11, + "learning_rate": 4.2979308043227145e-07, + "loss": 0.4165, + "step": 82208 + }, + { + "epoch": 2.11, + "learning_rate": 4.297703493420568e-07, + "loss": 0.355, + "step": 82209 + }, + { + "epoch": 2.11, + "learning_rate": 4.2974761868844046e-07, + "loss": 0.4502, + "step": 82210 + }, + { + "epoch": 2.11, + "learning_rate": 4.297248884714404e-07, + "loss": 0.3701, + "step": 82211 + }, + { + "epoch": 2.11, + "learning_rate": 4.297021586910735e-07, + "loss": 0.3657, + "step": 82212 + }, + { + "epoch": 2.11, + "learning_rate": 4.2967942934735737e-07, + "loss": 0.4094, + "step": 82213 + }, + { + "epoch": 2.11, + "learning_rate": 4.296567004403099e-07, + "loss": 0.3279, + "step": 82214 + }, + { + "epoch": 2.11, + "learning_rate": 4.2963397196994767e-07, + "loss": 0.4282, + "step": 82215 + }, + { + "epoch": 2.11, + "learning_rate": 4.2961124393628846e-07, + "loss": 0.375, + "step": 82216 + }, + { + "epoch": 2.11, + "learning_rate": 4.2958851633935013e-07, + "loss": 0.4253, + "step": 82217 + }, + { + "epoch": 2.11, + "learning_rate": 4.295657891791492e-07, + "loss": 0.3381, + "step": 82218 + }, + { + "epoch": 2.11, + "learning_rate": 4.295430624557036e-07, + "loss": 0.3972, + "step": 82219 + }, + { + "epoch": 2.11, + "learning_rate": 4.295203361690305e-07, + "loss": 0.4104, + "step": 82220 + }, + { + "epoch": 2.11, + "learning_rate": 4.2949761031914797e-07, + "loss": 0.4307, + "step": 82221 + }, + { + "epoch": 2.11, + "learning_rate": 4.2947488490607276e-07, + "loss": 0.4937, + "step": 82222 + }, + { + "epoch": 2.11, + "learning_rate": 4.294521599298222e-07, + "loss": 0.4873, + "step": 82223 + }, + { + "epoch": 2.11, + "learning_rate": 4.2942943539041375e-07, + "loss": 0.3152, + "step": 82224 + }, + { + "epoch": 2.11, + "learning_rate": 4.29406711287865e-07, + "loss": 0.4071, + "step": 82225 + }, + { + "epoch": 2.11, + "learning_rate": 4.293839876221936e-07, + "loss": 0.4165, + "step": 82226 + }, + { + "epoch": 2.11, + "learning_rate": 4.2936126439341637e-07, + "loss": 0.439, + "step": 82227 + }, + { + "epoch": 2.11, + "learning_rate": 4.293385416015509e-07, + "loss": 0.4189, + "step": 82228 + }, + { + "epoch": 2.11, + "learning_rate": 4.2931581924661466e-07, + "loss": 0.3992, + "step": 82229 + }, + { + "epoch": 2.11, + "learning_rate": 4.292930973286255e-07, + "loss": 0.3171, + "step": 82230 + }, + { + "epoch": 2.11, + "learning_rate": 4.2927037584760026e-07, + "loss": 0.4075, + "step": 82231 + }, + { + "epoch": 2.11, + "learning_rate": 4.292476548035562e-07, + "loss": 0.3381, + "step": 82232 + }, + { + "epoch": 2.11, + "learning_rate": 4.2922493419651093e-07, + "loss": 0.4492, + "step": 82233 + }, + { + "epoch": 2.11, + "learning_rate": 4.2920221402648226e-07, + "loss": 0.2314, + "step": 82234 + }, + { + "epoch": 2.11, + "learning_rate": 4.2917949429348686e-07, + "loss": 0.3567, + "step": 82235 + }, + { + "epoch": 2.11, + "learning_rate": 4.2915677499754245e-07, + "loss": 0.4199, + "step": 82236 + }, + { + "epoch": 2.11, + "learning_rate": 4.2913405613866636e-07, + "loss": 0.4517, + "step": 82237 + }, + { + "epoch": 2.11, + "learning_rate": 4.291113377168766e-07, + "loss": 0.4485, + "step": 82238 + }, + { + "epoch": 2.11, + "learning_rate": 4.290886197321896e-07, + "loss": 0.502, + "step": 82239 + }, + { + "epoch": 2.11, + "learning_rate": 4.2906590218462314e-07, + "loss": 0.4014, + "step": 82240 + }, + { + "epoch": 2.11, + "learning_rate": 4.290431850741951e-07, + "loss": 0.4707, + "step": 82241 + }, + { + "epoch": 2.11, + "learning_rate": 4.29020468400922e-07, + "loss": 0.519, + "step": 82242 + }, + { + "epoch": 2.11, + "learning_rate": 4.2899775216482217e-07, + "loss": 0.3723, + "step": 82243 + }, + { + "epoch": 2.11, + "learning_rate": 4.2897503636591205e-07, + "loss": 0.4401, + "step": 82244 + }, + { + "epoch": 2.11, + "learning_rate": 4.289523210042094e-07, + "loss": 0.4722, + "step": 82245 + }, + { + "epoch": 2.11, + "learning_rate": 4.289296060797318e-07, + "loss": 0.4004, + "step": 82246 + }, + { + "epoch": 2.11, + "learning_rate": 4.2890689159249694e-07, + "loss": 0.4175, + "step": 82247 + }, + { + "epoch": 2.11, + "learning_rate": 4.288841775425215e-07, + "loss": 0.4297, + "step": 82248 + }, + { + "epoch": 2.11, + "learning_rate": 4.28861463929823e-07, + "loss": 0.4497, + "step": 82249 + }, + { + "epoch": 2.11, + "learning_rate": 4.288387507544192e-07, + "loss": 0.314, + "step": 82250 + }, + { + "epoch": 2.11, + "learning_rate": 4.288160380163276e-07, + "loss": 0.3215, + "step": 82251 + }, + { + "epoch": 2.11, + "learning_rate": 4.2879332571556524e-07, + "loss": 0.3999, + "step": 82252 + }, + { + "epoch": 2.11, + "learning_rate": 4.287706138521493e-07, + "loss": 0.4292, + "step": 82253 + }, + { + "epoch": 2.11, + "learning_rate": 4.2874790242609737e-07, + "loss": 0.3955, + "step": 82254 + }, + { + "epoch": 2.11, + "learning_rate": 4.2872519143742727e-07, + "loss": 0.5166, + "step": 82255 + }, + { + "epoch": 2.11, + "learning_rate": 4.2870248088615567e-07, + "loss": 0.2712, + "step": 82256 + }, + { + "epoch": 2.11, + "learning_rate": 4.286797707723002e-07, + "loss": 0.4531, + "step": 82257 + }, + { + "epoch": 2.11, + "learning_rate": 4.286570610958785e-07, + "loss": 0.4668, + "step": 82258 + }, + { + "epoch": 2.11, + "learning_rate": 4.2863435185690824e-07, + "loss": 0.3813, + "step": 82259 + }, + { + "epoch": 2.11, + "learning_rate": 4.2861164305540586e-07, + "loss": 0.4678, + "step": 82260 + }, + { + "epoch": 2.11, + "learning_rate": 4.285889346913897e-07, + "loss": 0.3442, + "step": 82261 + }, + { + "epoch": 2.11, + "learning_rate": 4.285662267648764e-07, + "loss": 0.4575, + "step": 82262 + }, + { + "epoch": 2.11, + "learning_rate": 4.285435192758836e-07, + "loss": 0.5356, + "step": 82263 + }, + { + "epoch": 2.11, + "learning_rate": 4.2852081222442917e-07, + "loss": 0.3396, + "step": 82264 + }, + { + "epoch": 2.11, + "learning_rate": 4.2849810561052966e-07, + "loss": 0.2955, + "step": 82265 + }, + { + "epoch": 2.11, + "learning_rate": 4.284753994342029e-07, + "loss": 0.46, + "step": 82266 + }, + { + "epoch": 2.11, + "learning_rate": 4.284526936954662e-07, + "loss": 0.2488, + "step": 82267 + }, + { + "epoch": 2.11, + "learning_rate": 4.284299883943374e-07, + "loss": 0.4346, + "step": 82268 + }, + { + "epoch": 2.11, + "learning_rate": 4.284072835308331e-07, + "loss": 0.5625, + "step": 82269 + }, + { + "epoch": 2.11, + "learning_rate": 4.2838457910497117e-07, + "loss": 0.4443, + "step": 82270 + }, + { + "epoch": 2.11, + "learning_rate": 4.2836187511676913e-07, + "loss": 0.4163, + "step": 82271 + }, + { + "epoch": 2.11, + "learning_rate": 4.283391715662441e-07, + "loss": 0.3682, + "step": 82272 + }, + { + "epoch": 2.11, + "learning_rate": 4.283164684534132e-07, + "loss": 0.438, + "step": 82273 + }, + { + "epoch": 2.11, + "learning_rate": 4.2829376577829403e-07, + "loss": 0.3813, + "step": 82274 + }, + { + "epoch": 2.11, + "learning_rate": 4.28271063540904e-07, + "loss": 0.4897, + "step": 82275 + }, + { + "epoch": 2.11, + "learning_rate": 4.28248361741261e-07, + "loss": 0.4458, + "step": 82276 + }, + { + "epoch": 2.11, + "learning_rate": 4.2822566037938145e-07, + "loss": 0.3389, + "step": 82277 + }, + { + "epoch": 2.11, + "learning_rate": 4.282029594552833e-07, + "loss": 0.4331, + "step": 82278 + }, + { + "epoch": 2.11, + "learning_rate": 4.2818025896898393e-07, + "loss": 0.4519, + "step": 82279 + }, + { + "epoch": 2.11, + "learning_rate": 4.2815755892050085e-07, + "loss": 0.2495, + "step": 82280 + }, + { + "epoch": 2.11, + "learning_rate": 4.281348593098513e-07, + "loss": 0.4526, + "step": 82281 + }, + { + "epoch": 2.11, + "learning_rate": 4.281121601370522e-07, + "loss": 0.406, + "step": 82282 + }, + { + "epoch": 2.11, + "learning_rate": 4.2808946140212145e-07, + "loss": 0.3585, + "step": 82283 + }, + { + "epoch": 2.11, + "learning_rate": 4.280667631050762e-07, + "loss": 0.4961, + "step": 82284 + }, + { + "epoch": 2.11, + "learning_rate": 4.2804406524593426e-07, + "loss": 0.4214, + "step": 82285 + }, + { + "epoch": 2.11, + "learning_rate": 4.2802136782471233e-07, + "loss": 0.2615, + "step": 82286 + }, + { + "epoch": 2.11, + "learning_rate": 4.2799867084142814e-07, + "loss": 0.3612, + "step": 82287 + }, + { + "epoch": 2.11, + "learning_rate": 4.279759742960991e-07, + "loss": 0.4482, + "step": 82288 + }, + { + "epoch": 2.11, + "learning_rate": 4.279532781887429e-07, + "loss": 0.415, + "step": 82289 + }, + { + "epoch": 2.11, + "learning_rate": 4.279305825193763e-07, + "loss": 0.4771, + "step": 82290 + }, + { + "epoch": 2.11, + "learning_rate": 4.279078872880172e-07, + "loss": 0.3945, + "step": 82291 + }, + { + "epoch": 2.11, + "learning_rate": 4.2788519249468247e-07, + "loss": 0.4482, + "step": 82292 + }, + { + "epoch": 2.11, + "learning_rate": 4.2786249813939e-07, + "loss": 0.1985, + "step": 82293 + }, + { + "epoch": 2.11, + "learning_rate": 4.278398042221566e-07, + "loss": 0.3542, + "step": 82294 + }, + { + "epoch": 2.11, + "learning_rate": 4.2781711074299986e-07, + "loss": 0.324, + "step": 82295 + }, + { + "epoch": 2.11, + "learning_rate": 4.2779441770193734e-07, + "loss": 0.3618, + "step": 82296 + }, + { + "epoch": 2.11, + "learning_rate": 4.2777172509898663e-07, + "loss": 0.3418, + "step": 82297 + }, + { + "epoch": 2.11, + "learning_rate": 4.277490329341645e-07, + "loss": 0.4258, + "step": 82298 + }, + { + "epoch": 2.11, + "learning_rate": 4.277263412074885e-07, + "loss": 0.3887, + "step": 82299 + }, + { + "epoch": 2.11, + "learning_rate": 4.277036499189763e-07, + "loss": 0.5103, + "step": 82300 + }, + { + "epoch": 2.11, + "learning_rate": 4.276809590686453e-07, + "loss": 0.3403, + "step": 82301 + }, + { + "epoch": 2.11, + "learning_rate": 4.2765826865651276e-07, + "loss": 0.3159, + "step": 82302 + }, + { + "epoch": 2.11, + "learning_rate": 4.276355786825957e-07, + "loss": 0.3525, + "step": 82303 + }, + { + "epoch": 2.11, + "learning_rate": 4.276128891469116e-07, + "loss": 0.4927, + "step": 82304 + }, + { + "epoch": 2.11, + "learning_rate": 4.275902000494781e-07, + "loss": 0.4536, + "step": 82305 + }, + { + "epoch": 2.11, + "learning_rate": 4.2756751139031276e-07, + "loss": 0.4155, + "step": 82306 + }, + { + "epoch": 2.11, + "learning_rate": 4.275448231694323e-07, + "loss": 0.4399, + "step": 82307 + }, + { + "epoch": 2.11, + "learning_rate": 4.275221353868544e-07, + "loss": 0.3555, + "step": 82308 + }, + { + "epoch": 2.11, + "learning_rate": 4.2749944804259696e-07, + "loss": 0.4307, + "step": 82309 + }, + { + "epoch": 2.11, + "learning_rate": 4.274767611366764e-07, + "loss": 0.4355, + "step": 82310 + }, + { + "epoch": 2.11, + "learning_rate": 4.2745407466911096e-07, + "loss": 0.3843, + "step": 82311 + }, + { + "epoch": 2.11, + "learning_rate": 4.2743138863991726e-07, + "loss": 0.4209, + "step": 82312 + }, + { + "epoch": 2.11, + "learning_rate": 4.2740870304911303e-07, + "loss": 0.3867, + "step": 82313 + }, + { + "epoch": 2.11, + "learning_rate": 4.273860178967159e-07, + "loss": 0.4438, + "step": 82314 + }, + { + "epoch": 2.11, + "learning_rate": 4.2736333318274276e-07, + "loss": 0.5005, + "step": 82315 + }, + { + "epoch": 2.11, + "learning_rate": 4.27340648907211e-07, + "loss": 0.312, + "step": 82316 + }, + { + "epoch": 2.11, + "learning_rate": 4.2731796507013827e-07, + "loss": 0.3936, + "step": 82317 + }, + { + "epoch": 2.11, + "learning_rate": 4.272952816715423e-07, + "loss": 0.4351, + "step": 82318 + }, + { + "epoch": 2.11, + "learning_rate": 4.272725987114395e-07, + "loss": 0.4624, + "step": 82319 + }, + { + "epoch": 2.11, + "learning_rate": 4.2724991618984775e-07, + "loss": 0.3962, + "step": 82320 + }, + { + "epoch": 2.11, + "learning_rate": 4.2722723410678483e-07, + "loss": 0.6025, + "step": 82321 + }, + { + "epoch": 2.11, + "learning_rate": 4.272045524622673e-07, + "loss": 0.3618, + "step": 82322 + }, + { + "epoch": 2.11, + "learning_rate": 4.2718187125631323e-07, + "loss": 0.4673, + "step": 82323 + }, + { + "epoch": 2.11, + "learning_rate": 4.2715919048893933e-07, + "loss": 0.4604, + "step": 82324 + }, + { + "epoch": 2.11, + "learning_rate": 4.271365101601633e-07, + "loss": 0.4336, + "step": 82325 + }, + { + "epoch": 2.11, + "learning_rate": 4.271138302700028e-07, + "loss": 0.3345, + "step": 82326 + }, + { + "epoch": 2.11, + "learning_rate": 4.270911508184746e-07, + "loss": 0.3916, + "step": 82327 + }, + { + "epoch": 2.11, + "learning_rate": 4.2706847180559634e-07, + "loss": 0.4336, + "step": 82328 + }, + { + "epoch": 2.11, + "learning_rate": 4.2704579323138546e-07, + "loss": 0.3467, + "step": 82329 + }, + { + "epoch": 2.11, + "learning_rate": 4.2702311509585956e-07, + "loss": 0.4902, + "step": 82330 + }, + { + "epoch": 2.11, + "learning_rate": 4.270004373990357e-07, + "loss": 0.4907, + "step": 82331 + }, + { + "epoch": 2.11, + "learning_rate": 4.26977760140931e-07, + "loss": 0.396, + "step": 82332 + }, + { + "epoch": 2.11, + "learning_rate": 4.2695508332156294e-07, + "loss": 0.4751, + "step": 82333 + }, + { + "epoch": 2.11, + "learning_rate": 4.269324069409491e-07, + "loss": 0.4287, + "step": 82334 + }, + { + "epoch": 2.11, + "learning_rate": 4.269097309991072e-07, + "loss": 0.4277, + "step": 82335 + }, + { + "epoch": 2.11, + "learning_rate": 4.2688705549605377e-07, + "loss": 0.4529, + "step": 82336 + }, + { + "epoch": 2.11, + "learning_rate": 4.268643804318065e-07, + "loss": 0.4263, + "step": 82337 + }, + { + "epoch": 2.11, + "learning_rate": 4.268417058063828e-07, + "loss": 0.3345, + "step": 82338 + }, + { + "epoch": 2.11, + "learning_rate": 4.2681903161980046e-07, + "loss": 0.3936, + "step": 82339 + }, + { + "epoch": 2.11, + "learning_rate": 4.267963578720761e-07, + "loss": 0.4219, + "step": 82340 + }, + { + "epoch": 2.11, + "learning_rate": 4.267736845632278e-07, + "loss": 0.3854, + "step": 82341 + }, + { + "epoch": 2.11, + "learning_rate": 4.267510116932721e-07, + "loss": 0.4102, + "step": 82342 + }, + { + "epoch": 2.11, + "learning_rate": 4.267283392622272e-07, + "loss": 0.6729, + "step": 82343 + }, + { + "epoch": 2.11, + "learning_rate": 4.267056672701097e-07, + "loss": 0.3865, + "step": 82344 + }, + { + "epoch": 2.11, + "learning_rate": 4.2668299571693723e-07, + "loss": 0.4277, + "step": 82345 + }, + { + "epoch": 2.11, + "learning_rate": 4.2666032460272725e-07, + "loss": 0.4351, + "step": 82346 + }, + { + "epoch": 2.11, + "learning_rate": 4.266376539274975e-07, + "loss": 0.3555, + "step": 82347 + }, + { + "epoch": 2.11, + "learning_rate": 4.266149836912646e-07, + "loss": 0.3401, + "step": 82348 + }, + { + "epoch": 2.11, + "learning_rate": 4.2659231389404617e-07, + "loss": 0.4331, + "step": 82349 + }, + { + "epoch": 2.11, + "learning_rate": 4.2656964453585964e-07, + "loss": 0.3652, + "step": 82350 + }, + { + "epoch": 2.11, + "learning_rate": 4.2654697561672284e-07, + "loss": 0.458, + "step": 82351 + }, + { + "epoch": 2.11, + "learning_rate": 4.2652430713665256e-07, + "loss": 0.405, + "step": 82352 + }, + { + "epoch": 2.11, + "learning_rate": 4.2650163909566584e-07, + "loss": 0.4678, + "step": 82353 + }, + { + "epoch": 2.11, + "learning_rate": 4.264789714937805e-07, + "loss": 0.4399, + "step": 82354 + }, + { + "epoch": 2.11, + "learning_rate": 4.2645630433101387e-07, + "loss": 0.4202, + "step": 82355 + }, + { + "epoch": 2.11, + "learning_rate": 4.264336376073836e-07, + "loss": 0.3535, + "step": 82356 + }, + { + "epoch": 2.11, + "learning_rate": 4.2641097132290637e-07, + "loss": 0.2379, + "step": 82357 + }, + { + "epoch": 2.11, + "learning_rate": 4.2638830547759983e-07, + "loss": 0.392, + "step": 82358 + }, + { + "epoch": 2.11, + "learning_rate": 4.2636564007148147e-07, + "loss": 0.3994, + "step": 82359 + }, + { + "epoch": 2.11, + "learning_rate": 4.2634297510456895e-07, + "loss": 0.3877, + "step": 82360 + }, + { + "epoch": 2.11, + "learning_rate": 4.2632031057687913e-07, + "loss": 0.385, + "step": 82361 + }, + { + "epoch": 2.11, + "learning_rate": 4.2629764648842914e-07, + "loss": 0.3916, + "step": 82362 + }, + { + "epoch": 2.11, + "learning_rate": 4.262749828392367e-07, + "loss": 0.4614, + "step": 82363 + }, + { + "epoch": 2.11, + "learning_rate": 4.2625231962931953e-07, + "loss": 0.4102, + "step": 82364 + }, + { + "epoch": 2.11, + "learning_rate": 4.2622965685869415e-07, + "loss": 0.3474, + "step": 82365 + }, + { + "epoch": 2.11, + "learning_rate": 4.262069945273783e-07, + "loss": 0.3238, + "step": 82366 + }, + { + "epoch": 2.11, + "learning_rate": 4.2618433263538944e-07, + "loss": 0.2572, + "step": 82367 + }, + { + "epoch": 2.11, + "learning_rate": 4.2616167118274516e-07, + "loss": 0.4395, + "step": 82368 + }, + { + "epoch": 2.11, + "learning_rate": 4.2613901016946216e-07, + "loss": 0.4028, + "step": 82369 + }, + { + "epoch": 2.11, + "learning_rate": 4.261163495955582e-07, + "loss": 0.4736, + "step": 82370 + }, + { + "epoch": 2.11, + "learning_rate": 4.2609368946105085e-07, + "loss": 0.4302, + "step": 82371 + }, + { + "epoch": 2.11, + "learning_rate": 4.260710297659568e-07, + "loss": 0.4009, + "step": 82372 + }, + { + "epoch": 2.11, + "learning_rate": 4.260483705102942e-07, + "loss": 0.3955, + "step": 82373 + }, + { + "epoch": 2.11, + "learning_rate": 4.260257116940795e-07, + "loss": 0.3794, + "step": 82374 + }, + { + "epoch": 2.11, + "learning_rate": 4.2600305331733066e-07, + "loss": 0.4331, + "step": 82375 + }, + { + "epoch": 2.11, + "learning_rate": 4.259803953800648e-07, + "loss": 0.448, + "step": 82376 + }, + { + "epoch": 2.11, + "learning_rate": 4.2595773788229973e-07, + "loss": 0.4268, + "step": 82377 + }, + { + "epoch": 2.11, + "learning_rate": 4.2593508082405205e-07, + "loss": 0.3442, + "step": 82378 + }, + { + "epoch": 2.11, + "learning_rate": 4.2591242420533957e-07, + "loss": 0.4487, + "step": 82379 + }, + { + "epoch": 2.11, + "learning_rate": 4.258897680261798e-07, + "loss": 0.4169, + "step": 82380 + }, + { + "epoch": 2.11, + "learning_rate": 4.258671122865899e-07, + "loss": 0.4639, + "step": 82381 + }, + { + "epoch": 2.11, + "learning_rate": 4.258444569865868e-07, + "loss": 0.3979, + "step": 82382 + }, + { + "epoch": 2.11, + "learning_rate": 4.258218021261881e-07, + "loss": 0.3135, + "step": 82383 + }, + { + "epoch": 2.11, + "learning_rate": 4.2579914770541136e-07, + "loss": 0.3531, + "step": 82384 + }, + { + "epoch": 2.11, + "learning_rate": 4.2577649372427413e-07, + "loss": 0.3779, + "step": 82385 + }, + { + "epoch": 2.11, + "learning_rate": 4.2575384018279317e-07, + "loss": 0.4834, + "step": 82386 + }, + { + "epoch": 2.11, + "learning_rate": 4.257311870809859e-07, + "loss": 0.363, + "step": 82387 + }, + { + "epoch": 2.11, + "learning_rate": 4.2570853441887e-07, + "loss": 0.5117, + "step": 82388 + }, + { + "epoch": 2.11, + "learning_rate": 4.25685882196463e-07, + "loss": 0.4155, + "step": 82389 + }, + { + "epoch": 2.11, + "learning_rate": 4.256632304137815e-07, + "loss": 0.377, + "step": 82390 + }, + { + "epoch": 2.11, + "learning_rate": 4.256405790708436e-07, + "loss": 0.4229, + "step": 82391 + }, + { + "epoch": 2.11, + "learning_rate": 4.2561792816766607e-07, + "loss": 0.2994, + "step": 82392 + }, + { + "epoch": 2.11, + "learning_rate": 4.255952777042664e-07, + "loss": 0.2295, + "step": 82393 + }, + { + "epoch": 2.11, + "learning_rate": 4.2557262768066225e-07, + "loss": 0.4648, + "step": 82394 + }, + { + "epoch": 2.11, + "learning_rate": 4.255499780968705e-07, + "loss": 0.3738, + "step": 82395 + }, + { + "epoch": 2.11, + "learning_rate": 4.2552732895290875e-07, + "loss": 0.376, + "step": 82396 + }, + { + "epoch": 2.11, + "learning_rate": 4.255046802487946e-07, + "loss": 0.3405, + "step": 82397 + }, + { + "epoch": 2.11, + "learning_rate": 4.254820319845448e-07, + "loss": 0.4175, + "step": 82398 + }, + { + "epoch": 2.11, + "learning_rate": 4.254593841601769e-07, + "loss": 0.4636, + "step": 82399 + }, + { + "epoch": 2.11, + "learning_rate": 4.254367367757085e-07, + "loss": 0.4346, + "step": 82400 + }, + { + "epoch": 2.11, + "learning_rate": 4.25414089831157e-07, + "loss": 0.2913, + "step": 82401 + }, + { + "epoch": 2.11, + "learning_rate": 4.2539144332653953e-07, + "loss": 0.3589, + "step": 82402 + }, + { + "epoch": 2.11, + "learning_rate": 4.2536879726187303e-07, + "loss": 0.5571, + "step": 82403 + }, + { + "epoch": 2.11, + "learning_rate": 4.2534615163717524e-07, + "loss": 0.4297, + "step": 82404 + }, + { + "epoch": 2.11, + "learning_rate": 4.253235064524635e-07, + "loss": 0.4033, + "step": 82405 + }, + { + "epoch": 2.11, + "learning_rate": 4.2530086170775546e-07, + "loss": 0.4277, + "step": 82406 + }, + { + "epoch": 2.11, + "learning_rate": 4.2527821740306767e-07, + "loss": 0.4966, + "step": 82407 + }, + { + "epoch": 2.11, + "learning_rate": 4.252555735384181e-07, + "loss": 0.4375, + "step": 82408 + }, + { + "epoch": 2.11, + "learning_rate": 4.2523293011382375e-07, + "loss": 0.4043, + "step": 82409 + }, + { + "epoch": 2.11, + "learning_rate": 4.252102871293026e-07, + "loss": 0.5044, + "step": 82410 + }, + { + "epoch": 2.11, + "learning_rate": 4.251876445848715e-07, + "loss": 0.3638, + "step": 82411 + }, + { + "epoch": 2.11, + "learning_rate": 4.2516500248054743e-07, + "loss": 0.3665, + "step": 82412 + }, + { + "epoch": 2.11, + "learning_rate": 4.25142360816348e-07, + "loss": 0.4395, + "step": 82413 + }, + { + "epoch": 2.11, + "learning_rate": 4.2511971959229067e-07, + "loss": 0.4297, + "step": 82414 + }, + { + "epoch": 2.11, + "learning_rate": 4.2509707880839316e-07, + "loss": 0.302, + "step": 82415 + }, + { + "epoch": 2.11, + "learning_rate": 4.2507443846467194e-07, + "loss": 0.417, + "step": 82416 + }, + { + "epoch": 2.11, + "learning_rate": 4.250517985611448e-07, + "loss": 0.4478, + "step": 82417 + }, + { + "epoch": 2.11, + "learning_rate": 4.2502915909782945e-07, + "loss": 0.5928, + "step": 82418 + }, + { + "epoch": 2.11, + "learning_rate": 4.2500652007474245e-07, + "loss": 0.4917, + "step": 82419 + }, + { + "epoch": 2.11, + "learning_rate": 4.2498388149190155e-07, + "loss": 0.4224, + "step": 82420 + }, + { + "epoch": 2.11, + "learning_rate": 4.2496124334932435e-07, + "loss": 0.415, + "step": 82421 + }, + { + "epoch": 2.11, + "learning_rate": 4.249386056470277e-07, + "loss": 0.3621, + "step": 82422 + }, + { + "epoch": 2.11, + "learning_rate": 4.249159683850293e-07, + "loss": 0.4639, + "step": 82423 + }, + { + "epoch": 2.11, + "learning_rate": 4.2489333156334594e-07, + "loss": 0.4131, + "step": 82424 + }, + { + "epoch": 2.11, + "learning_rate": 4.2487069518199535e-07, + "loss": 0.4558, + "step": 82425 + }, + { + "epoch": 2.11, + "learning_rate": 4.2484805924099485e-07, + "loss": 0.502, + "step": 82426 + }, + { + "epoch": 2.11, + "learning_rate": 4.248254237403621e-07, + "loss": 0.345, + "step": 82427 + }, + { + "epoch": 2.11, + "learning_rate": 4.2480278868011366e-07, + "loss": 0.4795, + "step": 82428 + }, + { + "epoch": 2.11, + "learning_rate": 4.2478015406026735e-07, + "loss": 0.3318, + "step": 82429 + }, + { + "epoch": 2.11, + "learning_rate": 4.247575198808404e-07, + "loss": 0.4609, + "step": 82430 + }, + { + "epoch": 2.11, + "learning_rate": 4.247348861418505e-07, + "loss": 0.2961, + "step": 82431 + }, + { + "epoch": 2.11, + "learning_rate": 4.247122528433147e-07, + "loss": 0.4441, + "step": 82432 + }, + { + "epoch": 2.11, + "learning_rate": 4.246896199852499e-07, + "loss": 0.4766, + "step": 82433 + }, + { + "epoch": 2.11, + "learning_rate": 4.2466698756767373e-07, + "loss": 0.3584, + "step": 82434 + }, + { + "epoch": 2.11, + "learning_rate": 4.246443555906041e-07, + "loss": 0.3921, + "step": 82435 + }, + { + "epoch": 2.11, + "learning_rate": 4.246217240540573e-07, + "loss": 0.3612, + "step": 82436 + }, + { + "epoch": 2.11, + "learning_rate": 4.245990929580513e-07, + "loss": 0.3955, + "step": 82437 + }, + { + "epoch": 2.11, + "learning_rate": 4.2457646230260325e-07, + "loss": 0.3787, + "step": 82438 + }, + { + "epoch": 2.11, + "learning_rate": 4.2455383208773096e-07, + "loss": 0.3059, + "step": 82439 + }, + { + "epoch": 2.11, + "learning_rate": 4.2453120231345097e-07, + "loss": 0.2856, + "step": 82440 + }, + { + "epoch": 2.11, + "learning_rate": 4.2450857297978137e-07, + "loss": 0.3103, + "step": 82441 + }, + { + "epoch": 2.11, + "learning_rate": 4.244859440867387e-07, + "loss": 0.4135, + "step": 82442 + }, + { + "epoch": 2.11, + "learning_rate": 4.244633156343407e-07, + "loss": 0.3385, + "step": 82443 + }, + { + "epoch": 2.11, + "learning_rate": 4.2444068762260496e-07, + "loss": 0.4038, + "step": 82444 + }, + { + "epoch": 2.11, + "learning_rate": 4.2441806005154824e-07, + "loss": 0.4487, + "step": 82445 + }, + { + "epoch": 2.11, + "learning_rate": 4.2439543292118805e-07, + "loss": 0.3982, + "step": 82446 + }, + { + "epoch": 2.11, + "learning_rate": 4.243728062315419e-07, + "loss": 0.3901, + "step": 82447 + }, + { + "epoch": 2.11, + "learning_rate": 4.2435017998262733e-07, + "loss": 0.4268, + "step": 82448 + }, + { + "epoch": 2.11, + "learning_rate": 4.243275541744611e-07, + "loss": 0.4883, + "step": 82449 + }, + { + "epoch": 2.11, + "learning_rate": 4.243049288070607e-07, + "loss": 0.3843, + "step": 82450 + }, + { + "epoch": 2.11, + "learning_rate": 4.242823038804439e-07, + "loss": 0.358, + "step": 82451 + }, + { + "epoch": 2.11, + "learning_rate": 4.242596793946277e-07, + "loss": 0.3162, + "step": 82452 + }, + { + "epoch": 2.11, + "learning_rate": 4.2423705534962905e-07, + "loss": 0.4238, + "step": 82453 + }, + { + "epoch": 2.11, + "learning_rate": 4.242144317454656e-07, + "loss": 0.4824, + "step": 82454 + }, + { + "epoch": 2.11, + "learning_rate": 4.2419180858215466e-07, + "loss": 0.4678, + "step": 82455 + }, + { + "epoch": 2.11, + "learning_rate": 4.2416918585971396e-07, + "loss": 0.5044, + "step": 82456 + }, + { + "epoch": 2.11, + "learning_rate": 4.2414656357816004e-07, + "loss": 0.3955, + "step": 82457 + }, + { + "epoch": 2.11, + "learning_rate": 4.2412394173751065e-07, + "loss": 0.5078, + "step": 82458 + }, + { + "epoch": 2.11, + "learning_rate": 4.24101320337783e-07, + "loss": 0.4097, + "step": 82459 + }, + { + "epoch": 2.11, + "learning_rate": 4.24078699378995e-07, + "loss": 0.4746, + "step": 82460 + }, + { + "epoch": 2.11, + "learning_rate": 4.240560788611633e-07, + "loss": 0.4683, + "step": 82461 + }, + { + "epoch": 2.11, + "learning_rate": 4.240334587843052e-07, + "loss": 0.2338, + "step": 82462 + }, + { + "epoch": 2.11, + "learning_rate": 4.2401083914843805e-07, + "loss": 0.3672, + "step": 82463 + }, + { + "epoch": 2.11, + "learning_rate": 4.2398821995357934e-07, + "loss": 0.5132, + "step": 82464 + }, + { + "epoch": 2.11, + "learning_rate": 4.2396560119974676e-07, + "loss": 0.4685, + "step": 82465 + }, + { + "epoch": 2.11, + "learning_rate": 4.2394298288695683e-07, + "loss": 0.4434, + "step": 82466 + }, + { + "epoch": 2.11, + "learning_rate": 4.239203650152273e-07, + "loss": 0.3609, + "step": 82467 + }, + { + "epoch": 2.11, + "learning_rate": 4.238977475845754e-07, + "loss": 0.4001, + "step": 82468 + }, + { + "epoch": 2.11, + "learning_rate": 4.23875130595019e-07, + "loss": 0.4353, + "step": 82469 + }, + { + "epoch": 2.11, + "learning_rate": 4.2385251404657484e-07, + "loss": 0.416, + "step": 82470 + }, + { + "epoch": 2.11, + "learning_rate": 4.2382989793925996e-07, + "loss": 0.4326, + "step": 82471 + }, + { + "epoch": 2.11, + "learning_rate": 4.23807282273092e-07, + "loss": 0.5464, + "step": 82472 + }, + { + "epoch": 2.11, + "learning_rate": 4.237846670480887e-07, + "loss": 0.4585, + "step": 82473 + }, + { + "epoch": 2.11, + "learning_rate": 4.2376205226426667e-07, + "loss": 0.3619, + "step": 82474 + }, + { + "epoch": 2.11, + "learning_rate": 4.2373943792164345e-07, + "loss": 0.3767, + "step": 82475 + }, + { + "epoch": 2.11, + "learning_rate": 4.2371682402023647e-07, + "loss": 0.4595, + "step": 82476 + }, + { + "epoch": 2.11, + "learning_rate": 4.236942105600634e-07, + "loss": 0.3804, + "step": 82477 + }, + { + "epoch": 2.11, + "learning_rate": 4.2367159754114077e-07, + "loss": 0.5088, + "step": 82478 + }, + { + "epoch": 2.11, + "learning_rate": 4.2364898496348646e-07, + "loss": 0.3232, + "step": 82479 + }, + { + "epoch": 2.11, + "learning_rate": 4.236263728271178e-07, + "loss": 0.5439, + "step": 82480 + }, + { + "epoch": 2.11, + "learning_rate": 4.2360376113205163e-07, + "loss": 0.5037, + "step": 82481 + }, + { + "epoch": 2.11, + "learning_rate": 4.2358114987830596e-07, + "loss": 0.5591, + "step": 82482 + }, + { + "epoch": 2.11, + "learning_rate": 4.235585390658972e-07, + "loss": 0.543, + "step": 82483 + }, + { + "epoch": 2.11, + "learning_rate": 4.2353592869484335e-07, + "loss": 0.4888, + "step": 82484 + }, + { + "epoch": 2.11, + "learning_rate": 4.2351331876516137e-07, + "loss": 0.3436, + "step": 82485 + }, + { + "epoch": 2.11, + "learning_rate": 4.2349070927686915e-07, + "loss": 0.4224, + "step": 82486 + }, + { + "epoch": 2.11, + "learning_rate": 4.2346810022998327e-07, + "loss": 0.3716, + "step": 82487 + }, + { + "epoch": 2.11, + "learning_rate": 4.2344549162452126e-07, + "loss": 0.4644, + "step": 82488 + }, + { + "epoch": 2.11, + "learning_rate": 4.2342288346050105e-07, + "loss": 0.3887, + "step": 82489 + }, + { + "epoch": 2.11, + "learning_rate": 4.234002757379392e-07, + "loss": 0.3633, + "step": 82490 + }, + { + "epoch": 2.11, + "learning_rate": 4.233776684568531e-07, + "loss": 0.3521, + "step": 82491 + }, + { + "epoch": 2.11, + "learning_rate": 4.233550616172601e-07, + "loss": 0.4497, + "step": 82492 + }, + { + "epoch": 2.11, + "learning_rate": 4.233324552191776e-07, + "loss": 0.3262, + "step": 82493 + }, + { + "epoch": 2.11, + "learning_rate": 4.2330984926262334e-07, + "loss": 0.5342, + "step": 82494 + }, + { + "epoch": 2.11, + "learning_rate": 4.232872437476138e-07, + "loss": 0.4185, + "step": 82495 + }, + { + "epoch": 2.11, + "learning_rate": 4.2326463867416674e-07, + "loss": 0.4331, + "step": 82496 + }, + { + "epoch": 2.11, + "learning_rate": 4.232420340422994e-07, + "loss": 0.4351, + "step": 82497 + }, + { + "epoch": 2.11, + "learning_rate": 4.2321942985202954e-07, + "loss": 0.3484, + "step": 82498 + }, + { + "epoch": 2.11, + "learning_rate": 4.231968261033736e-07, + "loss": 0.397, + "step": 82499 + }, + { + "epoch": 2.11, + "learning_rate": 4.2317422279634974e-07, + "loss": 0.4541, + "step": 82500 + }, + { + "epoch": 2.11, + "learning_rate": 4.2315161993097447e-07, + "loss": 0.3596, + "step": 82501 + }, + { + "epoch": 2.11, + "learning_rate": 4.2312901750726547e-07, + "loss": 0.4424, + "step": 82502 + }, + { + "epoch": 2.11, + "learning_rate": 4.231064155252404e-07, + "loss": 0.2982, + "step": 82503 + }, + { + "epoch": 2.11, + "learning_rate": 4.230838139849159e-07, + "loss": 0.2219, + "step": 82504 + }, + { + "epoch": 2.11, + "learning_rate": 4.230612128863096e-07, + "loss": 0.3444, + "step": 82505 + }, + { + "epoch": 2.11, + "learning_rate": 4.2303861222943915e-07, + "loss": 0.4009, + "step": 82506 + }, + { + "epoch": 2.11, + "learning_rate": 4.2301601201432113e-07, + "loss": 0.4434, + "step": 82507 + }, + { + "epoch": 2.11, + "learning_rate": 4.229934122409733e-07, + "loss": 0.4351, + "step": 82508 + }, + { + "epoch": 2.11, + "learning_rate": 4.229708129094127e-07, + "loss": 0.4814, + "step": 82509 + }, + { + "epoch": 2.11, + "learning_rate": 4.229482140196573e-07, + "loss": 0.3994, + "step": 82510 + }, + { + "epoch": 2.11, + "learning_rate": 4.229256155717239e-07, + "loss": 0.2307, + "step": 82511 + }, + { + "epoch": 2.11, + "learning_rate": 4.2290301756562954e-07, + "loss": 0.458, + "step": 82512 + }, + { + "epoch": 2.11, + "learning_rate": 4.228804200013917e-07, + "loss": 0.3064, + "step": 82513 + }, + { + "epoch": 2.11, + "learning_rate": 4.228578228790278e-07, + "loss": 0.4512, + "step": 82514 + }, + { + "epoch": 2.11, + "learning_rate": 4.228352261985555e-07, + "loss": 0.3716, + "step": 82515 + }, + { + "epoch": 2.11, + "learning_rate": 4.2281262995999143e-07, + "loss": 0.3789, + "step": 82516 + }, + { + "epoch": 2.11, + "learning_rate": 4.227900341633531e-07, + "loss": 0.3257, + "step": 82517 + }, + { + "epoch": 2.11, + "learning_rate": 4.2276743880865795e-07, + "loss": 0.4104, + "step": 82518 + }, + { + "epoch": 2.12, + "learning_rate": 4.2274484389592356e-07, + "loss": 0.3188, + "step": 82519 + }, + { + "epoch": 2.12, + "learning_rate": 4.22722249425167e-07, + "loss": 0.4751, + "step": 82520 + }, + { + "epoch": 2.12, + "learning_rate": 4.2269965539640497e-07, + "loss": 0.4346, + "step": 82521 + }, + { + "epoch": 2.12, + "learning_rate": 4.2267706180965535e-07, + "loss": 0.2236, + "step": 82522 + }, + { + "epoch": 2.12, + "learning_rate": 4.226544686649357e-07, + "loss": 0.4893, + "step": 82523 + }, + { + "epoch": 2.12, + "learning_rate": 4.2263187596226256e-07, + "loss": 0.438, + "step": 82524 + }, + { + "epoch": 2.12, + "learning_rate": 4.226092837016537e-07, + "loss": 0.3857, + "step": 82525 + }, + { + "epoch": 2.12, + "learning_rate": 4.2258669188312633e-07, + "loss": 0.5234, + "step": 82526 + }, + { + "epoch": 2.12, + "learning_rate": 4.225641005066982e-07, + "loss": 0.4526, + "step": 82527 + }, + { + "epoch": 2.12, + "learning_rate": 4.225415095723858e-07, + "loss": 0.3342, + "step": 82528 + }, + { + "epoch": 2.12, + "learning_rate": 4.2251891908020676e-07, + "loss": 0.3956, + "step": 82529 + }, + { + "epoch": 2.12, + "learning_rate": 4.2249632903017883e-07, + "loss": 0.3711, + "step": 82530 + }, + { + "epoch": 2.12, + "learning_rate": 4.2247373942231857e-07, + "loss": 0.4246, + "step": 82531 + }, + { + "epoch": 2.12, + "learning_rate": 4.22451150256644e-07, + "loss": 0.457, + "step": 82532 + }, + { + "epoch": 2.12, + "learning_rate": 4.2242856153317164e-07, + "loss": 0.4053, + "step": 82533 + }, + { + "epoch": 2.12, + "learning_rate": 4.2240597325191907e-07, + "loss": 0.3503, + "step": 82534 + }, + { + "epoch": 2.12, + "learning_rate": 4.2238338541290384e-07, + "loss": 0.3645, + "step": 82535 + }, + { + "epoch": 2.12, + "learning_rate": 4.2236079801614335e-07, + "loss": 0.4292, + "step": 82536 + }, + { + "epoch": 2.12, + "learning_rate": 4.2233821106165434e-07, + "loss": 0.3848, + "step": 82537 + }, + { + "epoch": 2.12, + "learning_rate": 4.2231562454945433e-07, + "loss": 0.3156, + "step": 82538 + }, + { + "epoch": 2.12, + "learning_rate": 4.222930384795608e-07, + "loss": 0.4399, + "step": 82539 + }, + { + "epoch": 2.12, + "learning_rate": 4.2227045285199146e-07, + "loss": 0.3418, + "step": 82540 + }, + { + "epoch": 2.12, + "learning_rate": 4.222478676667626e-07, + "loss": 0.5522, + "step": 82541 + }, + { + "epoch": 2.12, + "learning_rate": 4.222252829238918e-07, + "loss": 0.4678, + "step": 82542 + }, + { + "epoch": 2.12, + "learning_rate": 4.222026986233965e-07, + "loss": 0.5889, + "step": 82543 + }, + { + "epoch": 2.12, + "learning_rate": 4.2218011476529446e-07, + "loss": 0.214, + "step": 82544 + }, + { + "epoch": 2.12, + "learning_rate": 4.221575313496022e-07, + "loss": 0.3885, + "step": 82545 + }, + { + "epoch": 2.12, + "learning_rate": 4.2213494837633736e-07, + "loss": 0.2524, + "step": 82546 + }, + { + "epoch": 2.12, + "learning_rate": 4.2211236584551725e-07, + "loss": 0.4055, + "step": 82547 + }, + { + "epoch": 2.12, + "learning_rate": 4.220897837571594e-07, + "loss": 0.3539, + "step": 82548 + }, + { + "epoch": 2.12, + "learning_rate": 4.220672021112804e-07, + "loss": 0.4512, + "step": 82549 + }, + { + "epoch": 2.12, + "learning_rate": 4.220446209078985e-07, + "loss": 0.4316, + "step": 82550 + }, + { + "epoch": 2.12, + "learning_rate": 4.2202204014703005e-07, + "loss": 0.2832, + "step": 82551 + }, + { + "epoch": 2.12, + "learning_rate": 4.2199945982869266e-07, + "loss": 0.3761, + "step": 82552 + }, + { + "epoch": 2.12, + "learning_rate": 4.219768799529042e-07, + "loss": 0.4438, + "step": 82553 + }, + { + "epoch": 2.12, + "learning_rate": 4.2195430051968094e-07, + "loss": 0.3273, + "step": 82554 + }, + { + "epoch": 2.12, + "learning_rate": 4.2193172152904086e-07, + "loss": 0.3936, + "step": 82555 + }, + { + "epoch": 2.12, + "learning_rate": 4.21909142981001e-07, + "loss": 0.3618, + "step": 82556 + }, + { + "epoch": 2.12, + "learning_rate": 4.218865648755791e-07, + "loss": 0.4673, + "step": 82557 + }, + { + "epoch": 2.12, + "learning_rate": 4.2186398721279173e-07, + "loss": 0.4302, + "step": 82558 + }, + { + "epoch": 2.12, + "learning_rate": 4.218414099926565e-07, + "loss": 0.4062, + "step": 82559 + }, + { + "epoch": 2.12, + "learning_rate": 4.2181883321519105e-07, + "loss": 0.4521, + "step": 82560 + }, + { + "epoch": 2.12, + "learning_rate": 4.217962568804124e-07, + "loss": 0.4307, + "step": 82561 + }, + { + "epoch": 2.12, + "learning_rate": 4.217736809883373e-07, + "loss": 0.3745, + "step": 82562 + }, + { + "epoch": 2.12, + "learning_rate": 4.2175110553898365e-07, + "loss": 0.4541, + "step": 82563 + }, + { + "epoch": 2.12, + "learning_rate": 4.2172853053236843e-07, + "loss": 0.428, + "step": 82564 + }, + { + "epoch": 2.12, + "learning_rate": 4.2170595596850957e-07, + "loss": 0.3882, + "step": 82565 + }, + { + "epoch": 2.12, + "learning_rate": 4.2168338184742347e-07, + "loss": 0.4478, + "step": 82566 + }, + { + "epoch": 2.12, + "learning_rate": 4.2166080816912786e-07, + "loss": 0.4321, + "step": 82567 + }, + { + "epoch": 2.12, + "learning_rate": 4.216382349336399e-07, + "loss": 0.3508, + "step": 82568 + }, + { + "epoch": 2.12, + "learning_rate": 4.2161566214097733e-07, + "loss": 0.417, + "step": 82569 + }, + { + "epoch": 2.12, + "learning_rate": 4.2159308979115714e-07, + "loss": 0.2996, + "step": 82570 + }, + { + "epoch": 2.12, + "learning_rate": 4.2157051788419605e-07, + "loss": 0.3213, + "step": 82571 + }, + { + "epoch": 2.12, + "learning_rate": 4.215479464201118e-07, + "loss": 0.4243, + "step": 82572 + }, + { + "epoch": 2.12, + "learning_rate": 4.2152537539892176e-07, + "loss": 0.213, + "step": 82573 + }, + { + "epoch": 2.12, + "learning_rate": 4.215028048206435e-07, + "loss": 0.356, + "step": 82574 + }, + { + "epoch": 2.12, + "learning_rate": 4.214802346852936e-07, + "loss": 0.46, + "step": 82575 + }, + { + "epoch": 2.12, + "learning_rate": 4.214576649928897e-07, + "loss": 0.5615, + "step": 82576 + }, + { + "epoch": 2.12, + "learning_rate": 4.214350957434489e-07, + "loss": 0.303, + "step": 82577 + }, + { + "epoch": 2.12, + "learning_rate": 4.2141252693698913e-07, + "loss": 0.3389, + "step": 82578 + }, + { + "epoch": 2.12, + "learning_rate": 4.213899585735269e-07, + "loss": 0.4102, + "step": 82579 + }, + { + "epoch": 2.12, + "learning_rate": 4.2136739065308e-07, + "loss": 0.499, + "step": 82580 + }, + { + "epoch": 2.12, + "learning_rate": 4.213448231756652e-07, + "loss": 0.3623, + "step": 82581 + }, + { + "epoch": 2.12, + "learning_rate": 4.2132225614130034e-07, + "loss": 0.246, + "step": 82582 + }, + { + "epoch": 2.12, + "learning_rate": 4.212996895500022e-07, + "loss": 0.4644, + "step": 82583 + }, + { + "epoch": 2.12, + "learning_rate": 4.2127712340178814e-07, + "loss": 0.364, + "step": 82584 + }, + { + "epoch": 2.12, + "learning_rate": 4.212545576966756e-07, + "loss": 0.2921, + "step": 82585 + }, + { + "epoch": 2.12, + "learning_rate": 4.212319924346822e-07, + "loss": 0.3506, + "step": 82586 + }, + { + "epoch": 2.12, + "learning_rate": 4.2120942761582454e-07, + "loss": 0.4316, + "step": 82587 + }, + { + "epoch": 2.12, + "learning_rate": 4.211868632401202e-07, + "loss": 0.3386, + "step": 82588 + }, + { + "epoch": 2.12, + "learning_rate": 4.2116429930758643e-07, + "loss": 0.3967, + "step": 82589 + }, + { + "epoch": 2.12, + "learning_rate": 4.21141735818241e-07, + "loss": 0.5249, + "step": 82590 + }, + { + "epoch": 2.12, + "learning_rate": 4.211191727721006e-07, + "loss": 0.3345, + "step": 82591 + }, + { + "epoch": 2.12, + "learning_rate": 4.210966101691823e-07, + "loss": 0.397, + "step": 82592 + }, + { + "epoch": 2.12, + "learning_rate": 4.2107404800950373e-07, + "loss": 0.4536, + "step": 82593 + }, + { + "epoch": 2.12, + "learning_rate": 4.2105148629308205e-07, + "loss": 0.3462, + "step": 82594 + }, + { + "epoch": 2.12, + "learning_rate": 4.2102892501993516e-07, + "loss": 0.3171, + "step": 82595 + }, + { + "epoch": 2.12, + "learning_rate": 4.210063641900793e-07, + "loss": 0.4448, + "step": 82596 + }, + { + "epoch": 2.12, + "learning_rate": 4.209838038035323e-07, + "loss": 0.4902, + "step": 82597 + }, + { + "epoch": 2.12, + "learning_rate": 4.209612438603117e-07, + "loss": 0.3755, + "step": 82598 + }, + { + "epoch": 2.12, + "learning_rate": 4.209386843604342e-07, + "loss": 0.3837, + "step": 82599 + }, + { + "epoch": 2.12, + "learning_rate": 4.209161253039176e-07, + "loss": 0.478, + "step": 82600 + }, + { + "epoch": 2.12, + "learning_rate": 4.208935666907785e-07, + "loss": 0.3967, + "step": 82601 + }, + { + "epoch": 2.12, + "learning_rate": 4.208710085210346e-07, + "loss": 0.4058, + "step": 82602 + }, + { + "epoch": 2.12, + "learning_rate": 4.2084845079470357e-07, + "loss": 0.3732, + "step": 82603 + }, + { + "epoch": 2.12, + "learning_rate": 4.2082589351180173e-07, + "loss": 0.4175, + "step": 82604 + }, + { + "epoch": 2.12, + "learning_rate": 4.20803336672347e-07, + "loss": 0.3943, + "step": 82605 + }, + { + "epoch": 2.12, + "learning_rate": 4.2078078027635653e-07, + "loss": 0.3765, + "step": 82606 + }, + { + "epoch": 2.12, + "learning_rate": 4.207582243238479e-07, + "loss": 0.4536, + "step": 82607 + }, + { + "epoch": 2.12, + "learning_rate": 4.207356688148377e-07, + "loss": 0.3647, + "step": 82608 + }, + { + "epoch": 2.12, + "learning_rate": 4.207131137493436e-07, + "loss": 0.3469, + "step": 82609 + }, + { + "epoch": 2.12, + "learning_rate": 4.206905591273832e-07, + "loss": 0.4062, + "step": 82610 + }, + { + "epoch": 2.12, + "learning_rate": 4.206680049489729e-07, + "loss": 0.4834, + "step": 82611 + }, + { + "epoch": 2.12, + "learning_rate": 4.20645451214131e-07, + "loss": 0.3082, + "step": 82612 + }, + { + "epoch": 2.12, + "learning_rate": 4.206228979228739e-07, + "loss": 0.5039, + "step": 82613 + }, + { + "epoch": 2.12, + "learning_rate": 4.2060034507521904e-07, + "loss": 0.4072, + "step": 82614 + }, + { + "epoch": 2.12, + "learning_rate": 4.205777926711843e-07, + "loss": 0.3823, + "step": 82615 + }, + { + "epoch": 2.12, + "learning_rate": 4.205552407107862e-07, + "loss": 0.4653, + "step": 82616 + }, + { + "epoch": 2.12, + "learning_rate": 4.2053268919404215e-07, + "loss": 0.2732, + "step": 82617 + }, + { + "epoch": 2.12, + "learning_rate": 4.2051013812096967e-07, + "loss": 0.395, + "step": 82618 + }, + { + "epoch": 2.12, + "learning_rate": 4.2048758749158633e-07, + "loss": 0.4604, + "step": 82619 + }, + { + "epoch": 2.12, + "learning_rate": 4.2046503730590897e-07, + "loss": 0.3584, + "step": 82620 + }, + { + "epoch": 2.12, + "learning_rate": 4.2044248756395453e-07, + "loss": 0.4722, + "step": 82621 + }, + { + "epoch": 2.12, + "learning_rate": 4.2041993826574064e-07, + "loss": 0.3889, + "step": 82622 + }, + { + "epoch": 2.12, + "learning_rate": 4.2039738941128445e-07, + "loss": 0.3801, + "step": 82623 + }, + { + "epoch": 2.12, + "learning_rate": 4.203748410006038e-07, + "loss": 0.5107, + "step": 82624 + }, + { + "epoch": 2.12, + "learning_rate": 4.203522930337151e-07, + "loss": 0.3877, + "step": 82625 + }, + { + "epoch": 2.12, + "learning_rate": 4.203297455106359e-07, + "loss": 0.224, + "step": 82626 + }, + { + "epoch": 2.12, + "learning_rate": 4.2030719843138375e-07, + "loss": 0.4316, + "step": 82627 + }, + { + "epoch": 2.12, + "learning_rate": 4.2028465179597596e-07, + "loss": 0.4668, + "step": 82628 + }, + { + "epoch": 2.12, + "learning_rate": 4.202621056044292e-07, + "loss": 0.4434, + "step": 82629 + }, + { + "epoch": 2.12, + "learning_rate": 4.202395598567614e-07, + "loss": 0.4016, + "step": 82630 + }, + { + "epoch": 2.12, + "learning_rate": 4.202170145529893e-07, + "loss": 0.2842, + "step": 82631 + }, + { + "epoch": 2.12, + "learning_rate": 4.201944696931307e-07, + "loss": 0.3557, + "step": 82632 + }, + { + "epoch": 2.12, + "learning_rate": 4.2017192527720205e-07, + "loss": 0.3459, + "step": 82633 + }, + { + "epoch": 2.12, + "learning_rate": 4.2014938130522117e-07, + "loss": 0.5405, + "step": 82634 + }, + { + "epoch": 2.12, + "learning_rate": 4.2012683777720525e-07, + "loss": 0.3887, + "step": 82635 + }, + { + "epoch": 2.12, + "learning_rate": 4.2010429469317187e-07, + "loss": 0.406, + "step": 82636 + }, + { + "epoch": 2.12, + "learning_rate": 4.2008175205313765e-07, + "loss": 0.4688, + "step": 82637 + }, + { + "epoch": 2.12, + "learning_rate": 4.2005920985712016e-07, + "loss": 0.2112, + "step": 82638 + }, + { + "epoch": 2.12, + "learning_rate": 4.200366681051366e-07, + "loss": 0.418, + "step": 82639 + }, + { + "epoch": 2.12, + "learning_rate": 4.200141267972047e-07, + "loss": 0.4419, + "step": 82640 + }, + { + "epoch": 2.12, + "learning_rate": 4.199915859333414e-07, + "loss": 0.3616, + "step": 82641 + }, + { + "epoch": 2.12, + "learning_rate": 4.199690455135635e-07, + "loss": 0.2949, + "step": 82642 + }, + { + "epoch": 2.12, + "learning_rate": 4.1994650553788845e-07, + "loss": 0.4763, + "step": 82643 + }, + { + "epoch": 2.12, + "learning_rate": 4.1992396600633385e-07, + "loss": 0.3931, + "step": 82644 + }, + { + "epoch": 2.12, + "learning_rate": 4.1990142691891717e-07, + "loss": 0.4717, + "step": 82645 + }, + { + "epoch": 2.12, + "learning_rate": 4.1987888827565487e-07, + "loss": 0.5439, + "step": 82646 + }, + { + "epoch": 2.12, + "learning_rate": 4.1985635007656463e-07, + "loss": 0.5239, + "step": 82647 + }, + { + "epoch": 2.12, + "learning_rate": 4.198338123216637e-07, + "loss": 0.4307, + "step": 82648 + }, + { + "epoch": 2.12, + "learning_rate": 4.198112750109698e-07, + "loss": 0.4141, + "step": 82649 + }, + { + "epoch": 2.12, + "learning_rate": 4.1978873814449964e-07, + "loss": 0.3623, + "step": 82650 + }, + { + "epoch": 2.12, + "learning_rate": 4.1976620172227017e-07, + "loss": 0.5, + "step": 82651 + }, + { + "epoch": 2.12, + "learning_rate": 4.197436657442991e-07, + "loss": 0.3068, + "step": 82652 + }, + { + "epoch": 2.12, + "learning_rate": 4.1972113021060397e-07, + "loss": 0.3616, + "step": 82653 + }, + { + "epoch": 2.12, + "learning_rate": 4.1969859512120133e-07, + "loss": 0.2964, + "step": 82654 + }, + { + "epoch": 2.12, + "learning_rate": 4.196760604761088e-07, + "loss": 0.3719, + "step": 82655 + }, + { + "epoch": 2.12, + "learning_rate": 4.196535262753437e-07, + "loss": 0.4712, + "step": 82656 + }, + { + "epoch": 2.12, + "learning_rate": 4.196309925189234e-07, + "loss": 0.2635, + "step": 82657 + }, + { + "epoch": 2.12, + "learning_rate": 4.196084592068647e-07, + "loss": 0.4697, + "step": 82658 + }, + { + "epoch": 2.12, + "learning_rate": 4.195859263391851e-07, + "loss": 0.4492, + "step": 82659 + }, + { + "epoch": 2.12, + "learning_rate": 4.1956339391590224e-07, + "loss": 0.356, + "step": 82660 + }, + { + "epoch": 2.12, + "learning_rate": 4.1954086193703264e-07, + "loss": 0.519, + "step": 82661 + }, + { + "epoch": 2.12, + "learning_rate": 4.195183304025943e-07, + "loss": 0.2437, + "step": 82662 + }, + { + "epoch": 2.12, + "learning_rate": 4.1949579931260373e-07, + "loss": 0.4805, + "step": 82663 + }, + { + "epoch": 2.12, + "learning_rate": 4.1947326866707845e-07, + "loss": 0.3569, + "step": 82664 + }, + { + "epoch": 2.12, + "learning_rate": 4.194507384660358e-07, + "loss": 0.3838, + "step": 82665 + }, + { + "epoch": 2.12, + "learning_rate": 4.194282087094935e-07, + "loss": 0.5352, + "step": 82666 + }, + { + "epoch": 2.12, + "learning_rate": 4.1940567939746785e-07, + "loss": 0.4233, + "step": 82667 + }, + { + "epoch": 2.12, + "learning_rate": 4.1938315052997664e-07, + "loss": 0.4819, + "step": 82668 + }, + { + "epoch": 2.12, + "learning_rate": 4.193606221070374e-07, + "loss": 0.3668, + "step": 82669 + }, + { + "epoch": 2.12, + "learning_rate": 4.1933809412866697e-07, + "loss": 0.4331, + "step": 82670 + }, + { + "epoch": 2.12, + "learning_rate": 4.1931556659488244e-07, + "loss": 0.4448, + "step": 82671 + }, + { + "epoch": 2.12, + "learning_rate": 4.1929303950570117e-07, + "loss": 0.5693, + "step": 82672 + }, + { + "epoch": 2.12, + "learning_rate": 4.1927051286114047e-07, + "loss": 0.3572, + "step": 82673 + }, + { + "epoch": 2.12, + "learning_rate": 4.1924798666121806e-07, + "loss": 0.4136, + "step": 82674 + }, + { + "epoch": 2.12, + "learning_rate": 4.1922546090595047e-07, + "loss": 0.4736, + "step": 82675 + }, + { + "epoch": 2.12, + "learning_rate": 4.1920293559535516e-07, + "loss": 0.3136, + "step": 82676 + }, + { + "epoch": 2.12, + "learning_rate": 4.1918041072944956e-07, + "loss": 0.2109, + "step": 82677 + }, + { + "epoch": 2.12, + "learning_rate": 4.1915788630825097e-07, + "loss": 0.3084, + "step": 82678 + }, + { + "epoch": 2.12, + "learning_rate": 4.191353623317763e-07, + "loss": 0.2535, + "step": 82679 + }, + { + "epoch": 2.12, + "learning_rate": 4.1911283880004324e-07, + "loss": 0.3701, + "step": 82680 + }, + { + "epoch": 2.12, + "learning_rate": 4.190903157130685e-07, + "loss": 0.457, + "step": 82681 + }, + { + "epoch": 2.12, + "learning_rate": 4.190677930708695e-07, + "loss": 0.4365, + "step": 82682 + }, + { + "epoch": 2.12, + "learning_rate": 4.1904527087346395e-07, + "loss": 0.3896, + "step": 82683 + }, + { + "epoch": 2.12, + "learning_rate": 4.1902274912086845e-07, + "loss": 0.6333, + "step": 82684 + }, + { + "epoch": 2.12, + "learning_rate": 4.190002278131004e-07, + "loss": 0.4232, + "step": 82685 + }, + { + "epoch": 2.12, + "learning_rate": 4.1897770695017763e-07, + "loss": 0.4561, + "step": 82686 + }, + { + "epoch": 2.12, + "learning_rate": 4.1895518653211647e-07, + "loss": 0.3843, + "step": 82687 + }, + { + "epoch": 2.12, + "learning_rate": 4.189326665589347e-07, + "loss": 0.3477, + "step": 82688 + }, + { + "epoch": 2.12, + "learning_rate": 4.189101470306493e-07, + "loss": 0.3003, + "step": 82689 + }, + { + "epoch": 2.12, + "learning_rate": 4.1888762794727817e-07, + "loss": 0.5327, + "step": 82690 + }, + { + "epoch": 2.12, + "learning_rate": 4.188651093088381e-07, + "loss": 0.3892, + "step": 82691 + }, + { + "epoch": 2.12, + "learning_rate": 4.188425911153458e-07, + "loss": 0.4634, + "step": 82692 + }, + { + "epoch": 2.12, + "learning_rate": 4.1882007336681915e-07, + "loss": 0.4888, + "step": 82693 + }, + { + "epoch": 2.12, + "learning_rate": 4.1879755606327515e-07, + "loss": 0.4492, + "step": 82694 + }, + { + "epoch": 2.12, + "learning_rate": 4.1877503920473157e-07, + "loss": 0.4116, + "step": 82695 + }, + { + "epoch": 2.12, + "learning_rate": 4.1875252279120475e-07, + "loss": 0.366, + "step": 82696 + }, + { + "epoch": 2.12, + "learning_rate": 4.1873000682271253e-07, + "loss": 0.4976, + "step": 82697 + }, + { + "epoch": 2.12, + "learning_rate": 4.1870749129927185e-07, + "loss": 0.3777, + "step": 82698 + }, + { + "epoch": 2.12, + "learning_rate": 4.186849762209006e-07, + "loss": 0.3359, + "step": 82699 + }, + { + "epoch": 2.12, + "learning_rate": 4.1866246158761555e-07, + "loss": 0.3918, + "step": 82700 + }, + { + "epoch": 2.12, + "learning_rate": 4.1863994739943354e-07, + "loss": 0.3457, + "step": 82701 + }, + { + "epoch": 2.12, + "learning_rate": 4.1861743365637216e-07, + "loss": 0.3281, + "step": 82702 + }, + { + "epoch": 2.12, + "learning_rate": 4.18594920358449e-07, + "loss": 0.4111, + "step": 82703 + }, + { + "epoch": 2.12, + "learning_rate": 4.185724075056807e-07, + "loss": 0.342, + "step": 82704 + }, + { + "epoch": 2.12, + "learning_rate": 4.185498950980847e-07, + "loss": 0.4961, + "step": 82705 + }, + { + "epoch": 2.12, + "learning_rate": 4.185273831356784e-07, + "loss": 0.3665, + "step": 82706 + }, + { + "epoch": 2.12, + "learning_rate": 4.1850487161847925e-07, + "loss": 0.4941, + "step": 82707 + }, + { + "epoch": 2.12, + "learning_rate": 4.1848236054650376e-07, + "loss": 0.4189, + "step": 82708 + }, + { + "epoch": 2.12, + "learning_rate": 4.1845984991976966e-07, + "loss": 0.418, + "step": 82709 + }, + { + "epoch": 2.12, + "learning_rate": 4.184373397382944e-07, + "loss": 0.3555, + "step": 82710 + }, + { + "epoch": 2.12, + "learning_rate": 4.1841483000209466e-07, + "loss": 0.3841, + "step": 82711 + }, + { + "epoch": 2.12, + "learning_rate": 4.1839232071118837e-07, + "loss": 0.4961, + "step": 82712 + }, + { + "epoch": 2.12, + "learning_rate": 4.183698118655918e-07, + "loss": 0.3951, + "step": 82713 + }, + { + "epoch": 2.12, + "learning_rate": 4.183473034653228e-07, + "loss": 0.479, + "step": 82714 + }, + { + "epoch": 2.12, + "learning_rate": 4.183247955103986e-07, + "loss": 0.4141, + "step": 82715 + }, + { + "epoch": 2.12, + "learning_rate": 4.1830228800083657e-07, + "loss": 0.2834, + "step": 82716 + }, + { + "epoch": 2.12, + "learning_rate": 4.182797809366535e-07, + "loss": 0.3994, + "step": 82717 + }, + { + "epoch": 2.12, + "learning_rate": 4.1825727431786674e-07, + "loss": 0.4761, + "step": 82718 + }, + { + "epoch": 2.12, + "learning_rate": 4.1823476814449365e-07, + "loss": 0.457, + "step": 82719 + }, + { + "epoch": 2.12, + "learning_rate": 4.1821226241655226e-07, + "loss": 0.4189, + "step": 82720 + }, + { + "epoch": 2.12, + "learning_rate": 4.1818975713405824e-07, + "loss": 0.3533, + "step": 82721 + }, + { + "epoch": 2.12, + "learning_rate": 4.1816725229702955e-07, + "loss": 0.3308, + "step": 82722 + }, + { + "epoch": 2.12, + "learning_rate": 4.181447479054835e-07, + "loss": 0.394, + "step": 82723 + }, + { + "epoch": 2.12, + "learning_rate": 4.181222439594375e-07, + "loss": 0.3923, + "step": 82724 + }, + { + "epoch": 2.12, + "learning_rate": 4.180997404589083e-07, + "loss": 0.4299, + "step": 82725 + }, + { + "epoch": 2.12, + "learning_rate": 4.180772374039133e-07, + "loss": 0.4036, + "step": 82726 + }, + { + "epoch": 2.12, + "learning_rate": 4.180547347944698e-07, + "loss": 0.4111, + "step": 82727 + }, + { + "epoch": 2.12, + "learning_rate": 4.1803223263059537e-07, + "loss": 0.5005, + "step": 82728 + }, + { + "epoch": 2.12, + "learning_rate": 4.180097309123066e-07, + "loss": 0.4546, + "step": 82729 + }, + { + "epoch": 2.12, + "learning_rate": 4.179872296396214e-07, + "loss": 0.3779, + "step": 82730 + }, + { + "epoch": 2.12, + "learning_rate": 4.179647288125562e-07, + "loss": 0.4062, + "step": 82731 + }, + { + "epoch": 2.12, + "learning_rate": 4.179422284311287e-07, + "loss": 0.3447, + "step": 82732 + }, + { + "epoch": 2.12, + "learning_rate": 4.179197284953564e-07, + "loss": 0.373, + "step": 82733 + }, + { + "epoch": 2.12, + "learning_rate": 4.178972290052558e-07, + "loss": 0.4189, + "step": 82734 + }, + { + "epoch": 2.12, + "learning_rate": 4.178747299608445e-07, + "loss": 0.4243, + "step": 82735 + }, + { + "epoch": 2.12, + "learning_rate": 4.178522313621399e-07, + "loss": 0.5938, + "step": 82736 + }, + { + "epoch": 2.12, + "learning_rate": 4.178297332091593e-07, + "loss": 0.4204, + "step": 82737 + }, + { + "epoch": 2.12, + "learning_rate": 4.178072355019194e-07, + "loss": 0.4138, + "step": 82738 + }, + { + "epoch": 2.12, + "learning_rate": 4.177847382404377e-07, + "loss": 0.3682, + "step": 82739 + }, + { + "epoch": 2.12, + "learning_rate": 4.1776224142473184e-07, + "loss": 0.4253, + "step": 82740 + }, + { + "epoch": 2.12, + "learning_rate": 4.1773974505481866e-07, + "loss": 0.4214, + "step": 82741 + }, + { + "epoch": 2.12, + "learning_rate": 4.1771724913071506e-07, + "loss": 0.4338, + "step": 82742 + }, + { + "epoch": 2.12, + "learning_rate": 4.176947536524386e-07, + "loss": 0.4902, + "step": 82743 + }, + { + "epoch": 2.12, + "learning_rate": 4.1767225862000646e-07, + "loss": 0.4253, + "step": 82744 + }, + { + "epoch": 2.12, + "learning_rate": 4.1764976403343623e-07, + "loss": 0.3813, + "step": 82745 + }, + { + "epoch": 2.12, + "learning_rate": 4.176272698927443e-07, + "loss": 0.3247, + "step": 82746 + }, + { + "epoch": 2.12, + "learning_rate": 4.1760477619794863e-07, + "loss": 0.3989, + "step": 82747 + }, + { + "epoch": 2.12, + "learning_rate": 4.1758228294906604e-07, + "loss": 0.1436, + "step": 82748 + }, + { + "epoch": 2.12, + "learning_rate": 4.175597901461144e-07, + "loss": 0.4263, + "step": 82749 + }, + { + "epoch": 2.12, + "learning_rate": 4.175372977891104e-07, + "loss": 0.3298, + "step": 82750 + }, + { + "epoch": 2.12, + "learning_rate": 4.17514805878071e-07, + "loss": 0.2788, + "step": 82751 + }, + { + "epoch": 2.12, + "learning_rate": 4.174923144130136e-07, + "loss": 0.4163, + "step": 82752 + }, + { + "epoch": 2.12, + "learning_rate": 4.1746982339395564e-07, + "loss": 0.4006, + "step": 82753 + }, + { + "epoch": 2.12, + "learning_rate": 4.174473328209146e-07, + "loss": 0.3382, + "step": 82754 + }, + { + "epoch": 2.12, + "learning_rate": 4.17424842693907e-07, + "loss": 0.3911, + "step": 82755 + }, + { + "epoch": 2.12, + "learning_rate": 4.1740235301295037e-07, + "loss": 0.3402, + "step": 82756 + }, + { + "epoch": 2.12, + "learning_rate": 4.17379863778062e-07, + "loss": 0.3337, + "step": 82757 + }, + { + "epoch": 2.12, + "learning_rate": 4.173573749892595e-07, + "loss": 0.3152, + "step": 82758 + }, + { + "epoch": 2.12, + "learning_rate": 4.173348866465596e-07, + "loss": 0.3259, + "step": 82759 + }, + { + "epoch": 2.12, + "learning_rate": 4.1731239874997916e-07, + "loss": 0.3779, + "step": 82760 + }, + { + "epoch": 2.12, + "learning_rate": 4.1728991129953594e-07, + "loss": 0.3904, + "step": 82761 + }, + { + "epoch": 2.12, + "learning_rate": 4.172674242952473e-07, + "loss": 0.4312, + "step": 82762 + }, + { + "epoch": 2.12, + "learning_rate": 4.1724493773712985e-07, + "loss": 0.2676, + "step": 82763 + }, + { + "epoch": 2.12, + "learning_rate": 4.172224516252013e-07, + "loss": 0.4438, + "step": 82764 + }, + { + "epoch": 2.12, + "learning_rate": 4.171999659594786e-07, + "loss": 0.3815, + "step": 82765 + }, + { + "epoch": 2.12, + "learning_rate": 4.1717748073997947e-07, + "loss": 0.4741, + "step": 82766 + }, + { + "epoch": 2.12, + "learning_rate": 4.171549959667203e-07, + "loss": 0.4141, + "step": 82767 + }, + { + "epoch": 2.12, + "learning_rate": 4.1713251163971886e-07, + "loss": 0.3677, + "step": 82768 + }, + { + "epoch": 2.12, + "learning_rate": 4.171100277589926e-07, + "loss": 0.4658, + "step": 82769 + }, + { + "epoch": 2.12, + "learning_rate": 4.1708754432455806e-07, + "loss": 0.4453, + "step": 82770 + }, + { + "epoch": 2.12, + "learning_rate": 4.1706506133643306e-07, + "loss": 0.4736, + "step": 82771 + }, + { + "epoch": 2.12, + "learning_rate": 4.1704257879463423e-07, + "loss": 0.3296, + "step": 82772 + }, + { + "epoch": 2.12, + "learning_rate": 4.1702009669917905e-07, + "loss": 0.3657, + "step": 82773 + }, + { + "epoch": 2.12, + "learning_rate": 4.169976150500848e-07, + "loss": 0.3979, + "step": 82774 + }, + { + "epoch": 2.12, + "learning_rate": 4.1697513384736905e-07, + "loss": 0.4526, + "step": 82775 + }, + { + "epoch": 2.12, + "learning_rate": 4.1695265309104834e-07, + "loss": 0.4478, + "step": 82776 + }, + { + "epoch": 2.12, + "learning_rate": 4.169301727811401e-07, + "loss": 0.4155, + "step": 82777 + }, + { + "epoch": 2.12, + "learning_rate": 4.1690769291766193e-07, + "loss": 0.4583, + "step": 82778 + }, + { + "epoch": 2.12, + "learning_rate": 4.168852135006308e-07, + "loss": 0.4629, + "step": 82779 + }, + { + "epoch": 2.12, + "learning_rate": 4.168627345300634e-07, + "loss": 0.3276, + "step": 82780 + }, + { + "epoch": 2.12, + "learning_rate": 4.168402560059774e-07, + "loss": 0.4253, + "step": 82781 + }, + { + "epoch": 2.12, + "learning_rate": 4.168177779283901e-07, + "loss": 0.4922, + "step": 82782 + }, + { + "epoch": 2.12, + "learning_rate": 4.167953002973189e-07, + "loss": 0.3975, + "step": 82783 + }, + { + "epoch": 2.12, + "learning_rate": 4.167728231127804e-07, + "loss": 0.4082, + "step": 82784 + }, + { + "epoch": 2.12, + "learning_rate": 4.1675034637479213e-07, + "loss": 0.3335, + "step": 82785 + }, + { + "epoch": 2.12, + "learning_rate": 4.167278700833713e-07, + "loss": 0.4111, + "step": 82786 + }, + { + "epoch": 2.12, + "learning_rate": 4.1670539423853543e-07, + "loss": 0.3877, + "step": 82787 + }, + { + "epoch": 2.12, + "learning_rate": 4.1668291884030104e-07, + "loss": 0.4116, + "step": 82788 + }, + { + "epoch": 2.12, + "learning_rate": 4.1666044388868616e-07, + "loss": 0.3489, + "step": 82789 + }, + { + "epoch": 2.12, + "learning_rate": 4.166379693837072e-07, + "loss": 0.4546, + "step": 82790 + }, + { + "epoch": 2.12, + "learning_rate": 4.1661549532538167e-07, + "loss": 0.4189, + "step": 82791 + }, + { + "epoch": 2.12, + "learning_rate": 4.165930217137272e-07, + "loss": 0.3459, + "step": 82792 + }, + { + "epoch": 2.12, + "learning_rate": 4.165705485487603e-07, + "loss": 0.4287, + "step": 82793 + }, + { + "epoch": 2.12, + "learning_rate": 4.1654807583049845e-07, + "loss": 0.2396, + "step": 82794 + }, + { + "epoch": 2.12, + "learning_rate": 4.165256035589594e-07, + "loss": 0.3682, + "step": 82795 + }, + { + "epoch": 2.12, + "learning_rate": 4.165031317341593e-07, + "loss": 0.4844, + "step": 82796 + }, + { + "epoch": 2.12, + "learning_rate": 4.1648066035611604e-07, + "loss": 0.374, + "step": 82797 + }, + { + "epoch": 2.12, + "learning_rate": 4.164581894248468e-07, + "loss": 0.4458, + "step": 82798 + }, + { + "epoch": 2.12, + "learning_rate": 4.164357189403689e-07, + "loss": 0.4321, + "step": 82799 + }, + { + "epoch": 2.12, + "learning_rate": 4.1641324890269935e-07, + "loss": 0.2822, + "step": 82800 + }, + { + "epoch": 2.12, + "learning_rate": 4.163907793118551e-07, + "loss": 0.3342, + "step": 82801 + }, + { + "epoch": 2.12, + "learning_rate": 4.163683101678535e-07, + "loss": 0.2921, + "step": 82802 + }, + { + "epoch": 2.12, + "learning_rate": 4.163458414707118e-07, + "loss": 0.3314, + "step": 82803 + }, + { + "epoch": 2.12, + "learning_rate": 4.1632337322044775e-07, + "loss": 0.3582, + "step": 82804 + }, + { + "epoch": 2.12, + "learning_rate": 4.1630090541707753e-07, + "loss": 0.3638, + "step": 82805 + }, + { + "epoch": 2.12, + "learning_rate": 4.1627843806061904e-07, + "loss": 0.3028, + "step": 82806 + }, + { + "epoch": 2.12, + "learning_rate": 4.1625597115108923e-07, + "loss": 0.52, + "step": 82807 + }, + { + "epoch": 2.12, + "learning_rate": 4.162335046885057e-07, + "loss": 0.4897, + "step": 82808 + }, + { + "epoch": 2.12, + "learning_rate": 4.162110386728854e-07, + "loss": 0.5034, + "step": 82809 + }, + { + "epoch": 2.12, + "learning_rate": 4.1618857310424507e-07, + "loss": 0.4927, + "step": 82810 + }, + { + "epoch": 2.12, + "learning_rate": 4.1616610798260233e-07, + "loss": 0.2697, + "step": 82811 + }, + { + "epoch": 2.12, + "learning_rate": 4.1614364330797467e-07, + "loss": 0.3853, + "step": 82812 + }, + { + "epoch": 2.12, + "learning_rate": 4.161211790803787e-07, + "loss": 0.355, + "step": 82813 + }, + { + "epoch": 2.12, + "learning_rate": 4.1609871529983174e-07, + "loss": 0.3831, + "step": 82814 + }, + { + "epoch": 2.12, + "learning_rate": 4.160762519663513e-07, + "loss": 0.4009, + "step": 82815 + }, + { + "epoch": 2.12, + "learning_rate": 4.1605378907995467e-07, + "loss": 0.479, + "step": 82816 + }, + { + "epoch": 2.12, + "learning_rate": 4.1603132664065855e-07, + "loss": 0.4819, + "step": 82817 + }, + { + "epoch": 2.12, + "learning_rate": 4.160088646484804e-07, + "loss": 0.4243, + "step": 82818 + }, + { + "epoch": 2.12, + "learning_rate": 4.159864031034377e-07, + "loss": 0.459, + "step": 82819 + }, + { + "epoch": 2.12, + "learning_rate": 4.15963942005547e-07, + "loss": 0.3784, + "step": 82820 + }, + { + "epoch": 2.12, + "learning_rate": 4.159414813548262e-07, + "loss": 0.4468, + "step": 82821 + }, + { + "epoch": 2.12, + "learning_rate": 4.1591902115129187e-07, + "loss": 0.3994, + "step": 82822 + }, + { + "epoch": 2.12, + "learning_rate": 4.1589656139496144e-07, + "loss": 0.4441, + "step": 82823 + }, + { + "epoch": 2.12, + "learning_rate": 4.1587410208585206e-07, + "loss": 0.4294, + "step": 82824 + }, + { + "epoch": 2.12, + "learning_rate": 4.158516432239815e-07, + "loss": 0.3643, + "step": 82825 + }, + { + "epoch": 2.12, + "learning_rate": 4.158291848093661e-07, + "loss": 0.4502, + "step": 82826 + }, + { + "epoch": 2.12, + "learning_rate": 4.1580672684202343e-07, + "loss": 0.5098, + "step": 82827 + }, + { + "epoch": 2.12, + "learning_rate": 4.157842693219706e-07, + "loss": 0.4341, + "step": 82828 + }, + { + "epoch": 2.12, + "learning_rate": 4.157618122492258e-07, + "loss": 0.3916, + "step": 82829 + }, + { + "epoch": 2.12, + "learning_rate": 4.157393556238045e-07, + "loss": 0.479, + "step": 82830 + }, + { + "epoch": 2.12, + "learning_rate": 4.157168994457246e-07, + "loss": 0.5293, + "step": 82831 + }, + { + "epoch": 2.12, + "learning_rate": 4.156944437150035e-07, + "loss": 0.5757, + "step": 82832 + }, + { + "epoch": 2.12, + "learning_rate": 4.1567198843165876e-07, + "loss": 0.3542, + "step": 82833 + }, + { + "epoch": 2.12, + "learning_rate": 4.1564953359570667e-07, + "loss": 0.2935, + "step": 82834 + }, + { + "epoch": 2.12, + "learning_rate": 4.156270792071648e-07, + "loss": 0.3816, + "step": 82835 + }, + { + "epoch": 2.12, + "learning_rate": 4.1560462526605044e-07, + "loss": 0.3057, + "step": 82836 + }, + { + "epoch": 2.12, + "learning_rate": 4.155821717723811e-07, + "loss": 0.5869, + "step": 82837 + }, + { + "epoch": 2.12, + "learning_rate": 4.1555971872617324e-07, + "loss": 0.2991, + "step": 82838 + }, + { + "epoch": 2.12, + "learning_rate": 4.155372661274449e-07, + "loss": 0.5552, + "step": 82839 + }, + { + "epoch": 2.12, + "learning_rate": 4.1551481397621234e-07, + "loss": 0.3813, + "step": 82840 + }, + { + "epoch": 2.12, + "learning_rate": 4.1549236227249316e-07, + "loss": 0.5, + "step": 82841 + }, + { + "epoch": 2.12, + "learning_rate": 4.154699110163051e-07, + "loss": 0.4941, + "step": 82842 + }, + { + "epoch": 2.12, + "learning_rate": 4.154474602076644e-07, + "loss": 0.4692, + "step": 82843 + }, + { + "epoch": 2.12, + "learning_rate": 4.154250098465888e-07, + "loss": 0.4233, + "step": 82844 + }, + { + "epoch": 2.12, + "learning_rate": 4.1540255993309525e-07, + "loss": 0.4478, + "step": 82845 + }, + { + "epoch": 2.12, + "learning_rate": 4.1538011046720154e-07, + "loss": 0.4453, + "step": 82846 + }, + { + "epoch": 2.12, + "learning_rate": 4.1535766144892404e-07, + "loss": 0.3772, + "step": 82847 + }, + { + "epoch": 2.12, + "learning_rate": 4.153352128782802e-07, + "loss": 0.4526, + "step": 82848 + }, + { + "epoch": 2.12, + "learning_rate": 4.1531276475528774e-07, + "loss": 0.458, + "step": 82849 + }, + { + "epoch": 2.12, + "learning_rate": 4.1529031707996345e-07, + "loss": 0.3566, + "step": 82850 + }, + { + "epoch": 2.12, + "learning_rate": 4.152678698523241e-07, + "loss": 0.5703, + "step": 82851 + }, + { + "epoch": 2.12, + "learning_rate": 4.152454230723872e-07, + "loss": 0.3706, + "step": 82852 + }, + { + "epoch": 2.12, + "learning_rate": 4.1522297674017003e-07, + "loss": 0.4272, + "step": 82853 + }, + { + "epoch": 2.12, + "learning_rate": 4.152005308556901e-07, + "loss": 0.4238, + "step": 82854 + }, + { + "epoch": 2.12, + "learning_rate": 4.151780854189638e-07, + "loss": 0.3038, + "step": 82855 + }, + { + "epoch": 2.12, + "learning_rate": 4.1515564043000886e-07, + "loss": 0.4888, + "step": 82856 + }, + { + "epoch": 2.12, + "learning_rate": 4.151331958888423e-07, + "loss": 0.457, + "step": 82857 + }, + { + "epoch": 2.12, + "learning_rate": 4.151107517954817e-07, + "loss": 0.3403, + "step": 82858 + }, + { + "epoch": 2.12, + "learning_rate": 4.150883081499439e-07, + "loss": 0.343, + "step": 82859 + }, + { + "epoch": 2.12, + "learning_rate": 4.150658649522458e-07, + "loss": 0.215, + "step": 82860 + }, + { + "epoch": 2.12, + "learning_rate": 4.1504342220240484e-07, + "loss": 0.4377, + "step": 82861 + }, + { + "epoch": 2.12, + "learning_rate": 4.150209799004382e-07, + "loss": 0.3733, + "step": 82862 + }, + { + "epoch": 2.12, + "learning_rate": 4.1499853804636345e-07, + "loss": 0.3374, + "step": 82863 + }, + { + "epoch": 2.12, + "learning_rate": 4.149760966401971e-07, + "loss": 0.3901, + "step": 82864 + }, + { + "epoch": 2.12, + "learning_rate": 4.149536556819566e-07, + "loss": 0.3513, + "step": 82865 + }, + { + "epoch": 2.12, + "learning_rate": 4.1493121517165963e-07, + "loss": 0.4492, + "step": 82866 + }, + { + "epoch": 2.12, + "learning_rate": 4.149087751093225e-07, + "loss": 0.3215, + "step": 82867 + }, + { + "epoch": 2.12, + "learning_rate": 4.148863354949629e-07, + "loss": 0.4824, + "step": 82868 + }, + { + "epoch": 2.12, + "learning_rate": 4.148638963285982e-07, + "loss": 0.2946, + "step": 82869 + }, + { + "epoch": 2.12, + "learning_rate": 4.148414576102449e-07, + "loss": 0.2722, + "step": 82870 + }, + { + "epoch": 2.12, + "learning_rate": 4.1481901933992104e-07, + "loss": 0.2947, + "step": 82871 + }, + { + "epoch": 2.12, + "learning_rate": 4.14796581517643e-07, + "loss": 0.3589, + "step": 82872 + }, + { + "epoch": 2.12, + "learning_rate": 4.1477414414342825e-07, + "loss": 0.4492, + "step": 82873 + }, + { + "epoch": 2.12, + "learning_rate": 4.1475170721729416e-07, + "loss": 0.4233, + "step": 82874 + }, + { + "epoch": 2.12, + "learning_rate": 4.14729270739258e-07, + "loss": 0.2872, + "step": 82875 + }, + { + "epoch": 2.12, + "learning_rate": 4.1470683470933645e-07, + "loss": 0.5024, + "step": 82876 + }, + { + "epoch": 2.12, + "learning_rate": 4.1468439912754683e-07, + "loss": 0.5117, + "step": 82877 + }, + { + "epoch": 2.12, + "learning_rate": 4.146619639939066e-07, + "loss": 0.3579, + "step": 82878 + }, + { + "epoch": 2.12, + "learning_rate": 4.1463952930843307e-07, + "loss": 0.4858, + "step": 82879 + }, + { + "epoch": 2.12, + "learning_rate": 4.146170950711432e-07, + "loss": 0.405, + "step": 82880 + }, + { + "epoch": 2.12, + "learning_rate": 4.145946612820537e-07, + "loss": 0.415, + "step": 82881 + }, + { + "epoch": 2.12, + "learning_rate": 4.1457222794118205e-07, + "loss": 0.3696, + "step": 82882 + }, + { + "epoch": 2.12, + "learning_rate": 4.14549795048546e-07, + "loss": 0.4575, + "step": 82883 + }, + { + "epoch": 2.12, + "learning_rate": 4.14527362604162e-07, + "loss": 0.2693, + "step": 82884 + }, + { + "epoch": 2.12, + "learning_rate": 4.1450493060804726e-07, + "loss": 0.2902, + "step": 82885 + }, + { + "epoch": 2.12, + "learning_rate": 4.144824990602193e-07, + "loss": 0.4741, + "step": 82886 + }, + { + "epoch": 2.12, + "learning_rate": 4.1446006796069556e-07, + "loss": 0.222, + "step": 82887 + }, + { + "epoch": 2.12, + "learning_rate": 4.1443763730949234e-07, + "loss": 0.6152, + "step": 82888 + }, + { + "epoch": 2.12, + "learning_rate": 4.144152071066277e-07, + "loss": 0.3163, + "step": 82889 + }, + { + "epoch": 2.12, + "learning_rate": 4.1439277735211806e-07, + "loss": 0.4033, + "step": 82890 + }, + { + "epoch": 2.12, + "learning_rate": 4.1437034804598104e-07, + "loss": 0.4307, + "step": 82891 + }, + { + "epoch": 2.12, + "learning_rate": 4.14347919188234e-07, + "loss": 0.3992, + "step": 82892 + }, + { + "epoch": 2.12, + "learning_rate": 4.1432549077889336e-07, + "loss": 0.3835, + "step": 82893 + }, + { + "epoch": 2.12, + "learning_rate": 4.143030628179769e-07, + "loss": 0.3706, + "step": 82894 + }, + { + "epoch": 2.12, + "learning_rate": 4.142806353055016e-07, + "loss": 0.4746, + "step": 82895 + }, + { + "epoch": 2.12, + "learning_rate": 4.1425820824148503e-07, + "loss": 0.2032, + "step": 82896 + }, + { + "epoch": 2.12, + "learning_rate": 4.1423578162594377e-07, + "loss": 0.3481, + "step": 82897 + }, + { + "epoch": 2.12, + "learning_rate": 4.1421335545889513e-07, + "loss": 0.4908, + "step": 82898 + }, + { + "epoch": 2.12, + "learning_rate": 4.1419092974035673e-07, + "loss": 0.5044, + "step": 82899 + }, + { + "epoch": 2.12, + "learning_rate": 4.1416850447034547e-07, + "loss": 0.3345, + "step": 82900 + }, + { + "epoch": 2.12, + "learning_rate": 4.1414607964887806e-07, + "loss": 0.415, + "step": 82901 + }, + { + "epoch": 2.12, + "learning_rate": 4.1412365527597205e-07, + "loss": 0.4106, + "step": 82902 + }, + { + "epoch": 2.12, + "learning_rate": 4.1410123135164467e-07, + "loss": 0.502, + "step": 82903 + }, + { + "epoch": 2.12, + "learning_rate": 4.140788078759133e-07, + "loss": 0.4751, + "step": 82904 + }, + { + "epoch": 2.12, + "learning_rate": 4.1405638484879457e-07, + "loss": 0.3896, + "step": 82905 + }, + { + "epoch": 2.12, + "learning_rate": 4.140339622703058e-07, + "loss": 0.5156, + "step": 82906 + }, + { + "epoch": 2.12, + "learning_rate": 4.1401154014046444e-07, + "loss": 0.4858, + "step": 82907 + }, + { + "epoch": 2.12, + "learning_rate": 4.1398911845928773e-07, + "loss": 0.3875, + "step": 82908 + }, + { + "epoch": 2.12, + "learning_rate": 4.139666972267927e-07, + "loss": 0.2994, + "step": 82909 + }, + { + "epoch": 2.13, + "learning_rate": 4.13944276442996e-07, + "loss": 0.4351, + "step": 82910 + }, + { + "epoch": 2.13, + "learning_rate": 4.139218561079153e-07, + "loss": 0.3923, + "step": 82911 + }, + { + "epoch": 2.13, + "learning_rate": 4.1389943622156766e-07, + "loss": 0.4136, + "step": 82912 + }, + { + "epoch": 2.13, + "learning_rate": 4.138770167839706e-07, + "loss": 0.3403, + "step": 82913 + }, + { + "epoch": 2.13, + "learning_rate": 4.1385459779514065e-07, + "loss": 0.3325, + "step": 82914 + }, + { + "epoch": 2.13, + "learning_rate": 4.1383217925509515e-07, + "loss": 0.4351, + "step": 82915 + }, + { + "epoch": 2.13, + "learning_rate": 4.138097611638516e-07, + "loss": 0.498, + "step": 82916 + }, + { + "epoch": 2.13, + "learning_rate": 4.137873435214272e-07, + "loss": 0.4775, + "step": 82917 + }, + { + "epoch": 2.13, + "learning_rate": 4.1376492632783843e-07, + "loss": 0.2937, + "step": 82918 + }, + { + "epoch": 2.13, + "learning_rate": 4.137425095831034e-07, + "loss": 0.4292, + "step": 82919 + }, + { + "epoch": 2.13, + "learning_rate": 4.1372009328723834e-07, + "loss": 0.4453, + "step": 82920 + }, + { + "epoch": 2.13, + "learning_rate": 4.136976774402613e-07, + "loss": 0.5107, + "step": 82921 + }, + { + "epoch": 2.13, + "learning_rate": 4.136752620421885e-07, + "loss": 0.3464, + "step": 82922 + }, + { + "epoch": 2.13, + "learning_rate": 4.1365284709303773e-07, + "loss": 0.4917, + "step": 82923 + }, + { + "epoch": 2.13, + "learning_rate": 4.1363043259282593e-07, + "loss": 0.3379, + "step": 82924 + }, + { + "epoch": 2.13, + "learning_rate": 4.136080185415707e-07, + "loss": 0.3452, + "step": 82925 + }, + { + "epoch": 2.13, + "learning_rate": 4.135856049392885e-07, + "loss": 0.2823, + "step": 82926 + }, + { + "epoch": 2.13, + "learning_rate": 4.1356319178599685e-07, + "loss": 0.4922, + "step": 82927 + }, + { + "epoch": 2.13, + "learning_rate": 4.135407790817129e-07, + "loss": 0.415, + "step": 82928 + }, + { + "epoch": 2.13, + "learning_rate": 4.1351836682645414e-07, + "loss": 0.3604, + "step": 82929 + }, + { + "epoch": 2.13, + "learning_rate": 4.134959550202375e-07, + "loss": 0.4429, + "step": 82930 + }, + { + "epoch": 2.13, + "learning_rate": 4.134735436630795e-07, + "loss": 0.3984, + "step": 82931 + }, + { + "epoch": 2.13, + "learning_rate": 4.1345113275499796e-07, + "loss": 0.4849, + "step": 82932 + }, + { + "epoch": 2.13, + "learning_rate": 4.134287222960099e-07, + "loss": 0.436, + "step": 82933 + }, + { + "epoch": 2.13, + "learning_rate": 4.134063122861329e-07, + "loss": 0.4771, + "step": 82934 + }, + { + "epoch": 2.13, + "learning_rate": 4.1338390272538327e-07, + "loss": 0.375, + "step": 82935 + }, + { + "epoch": 2.13, + "learning_rate": 4.133614936137787e-07, + "loss": 0.3657, + "step": 82936 + }, + { + "epoch": 2.13, + "learning_rate": 4.133390849513362e-07, + "loss": 0.3765, + "step": 82937 + }, + { + "epoch": 2.13, + "learning_rate": 4.1331667673807334e-07, + "loss": 0.2132, + "step": 82938 + }, + { + "epoch": 2.13, + "learning_rate": 4.132942689740069e-07, + "loss": 0.3573, + "step": 82939 + }, + { + "epoch": 2.13, + "learning_rate": 4.1327186165915376e-07, + "loss": 0.4399, + "step": 82940 + }, + { + "epoch": 2.13, + "learning_rate": 4.1324945479353133e-07, + "loss": 0.4604, + "step": 82941 + }, + { + "epoch": 2.13, + "learning_rate": 4.132270483771573e-07, + "loss": 0.4214, + "step": 82942 + }, + { + "epoch": 2.13, + "learning_rate": 4.1320464241004783e-07, + "loss": 0.439, + "step": 82943 + }, + { + "epoch": 2.13, + "learning_rate": 4.1318223689222063e-07, + "loss": 0.2936, + "step": 82944 + }, + { + "epoch": 2.13, + "learning_rate": 4.1315983182369285e-07, + "loss": 0.3651, + "step": 82945 + }, + { + "epoch": 2.13, + "learning_rate": 4.1313742720448184e-07, + "loss": 0.3807, + "step": 82946 + }, + { + "epoch": 2.13, + "learning_rate": 4.1311502303460435e-07, + "loss": 0.4961, + "step": 82947 + }, + { + "epoch": 2.13, + "learning_rate": 4.1309261931407757e-07, + "loss": 0.4149, + "step": 82948 + }, + { + "epoch": 2.13, + "learning_rate": 4.1307021604291913e-07, + "loss": 0.4814, + "step": 82949 + }, + { + "epoch": 2.13, + "learning_rate": 4.1304781322114544e-07, + "loss": 0.4128, + "step": 82950 + }, + { + "epoch": 2.13, + "learning_rate": 4.130254108487745e-07, + "loss": 0.3241, + "step": 82951 + }, + { + "epoch": 2.13, + "learning_rate": 4.1300300892582275e-07, + "loss": 0.5166, + "step": 82952 + }, + { + "epoch": 2.13, + "learning_rate": 4.1298060745230746e-07, + "loss": 0.1882, + "step": 82953 + }, + { + "epoch": 2.13, + "learning_rate": 4.1295820642824595e-07, + "loss": 0.4702, + "step": 82954 + }, + { + "epoch": 2.13, + "learning_rate": 4.129358058536557e-07, + "loss": 0.5869, + "step": 82955 + }, + { + "epoch": 2.13, + "learning_rate": 4.1291340572855313e-07, + "loss": 0.3978, + "step": 82956 + }, + { + "epoch": 2.13, + "learning_rate": 4.128910060529559e-07, + "loss": 0.5542, + "step": 82957 + }, + { + "epoch": 2.13, + "learning_rate": 4.128686068268813e-07, + "loss": 0.4468, + "step": 82958 + }, + { + "epoch": 2.13, + "learning_rate": 4.128462080503462e-07, + "loss": 0.3953, + "step": 82959 + }, + { + "epoch": 2.13, + "learning_rate": 4.1282380972336737e-07, + "loss": 0.3376, + "step": 82960 + }, + { + "epoch": 2.13, + "learning_rate": 4.128014118459624e-07, + "loss": 0.4419, + "step": 82961 + }, + { + "epoch": 2.13, + "learning_rate": 4.1277901441814845e-07, + "loss": 0.5098, + "step": 82962 + }, + { + "epoch": 2.13, + "learning_rate": 4.1275661743994283e-07, + "loss": 0.3828, + "step": 82963 + }, + { + "epoch": 2.13, + "learning_rate": 4.127342209113622e-07, + "loss": 0.4604, + "step": 82964 + }, + { + "epoch": 2.13, + "learning_rate": 4.1271182483242395e-07, + "loss": 0.3823, + "step": 82965 + }, + { + "epoch": 2.13, + "learning_rate": 4.126894292031452e-07, + "loss": 0.3094, + "step": 82966 + }, + { + "epoch": 2.13, + "learning_rate": 4.1266703402354364e-07, + "loss": 0.3708, + "step": 82967 + }, + { + "epoch": 2.13, + "learning_rate": 4.1264463929363547e-07, + "loss": 0.4546, + "step": 82968 + }, + { + "epoch": 2.13, + "learning_rate": 4.126222450134387e-07, + "loss": 0.3735, + "step": 82969 + }, + { + "epoch": 2.13, + "learning_rate": 4.1259985118296956e-07, + "loss": 0.46, + "step": 82970 + }, + { + "epoch": 2.13, + "learning_rate": 4.1257745780224586e-07, + "loss": 0.4155, + "step": 82971 + }, + { + "epoch": 2.13, + "learning_rate": 4.125550648712849e-07, + "loss": 0.5103, + "step": 82972 + }, + { + "epoch": 2.13, + "learning_rate": 4.1253267239010325e-07, + "loss": 0.4565, + "step": 82973 + }, + { + "epoch": 2.13, + "learning_rate": 4.125102803587182e-07, + "loss": 0.436, + "step": 82974 + }, + { + "epoch": 2.13, + "learning_rate": 4.1248788877714735e-07, + "loss": 0.3591, + "step": 82975 + }, + { + "epoch": 2.13, + "learning_rate": 4.124654976454073e-07, + "loss": 0.3071, + "step": 82976 + }, + { + "epoch": 2.13, + "learning_rate": 4.124431069635153e-07, + "loss": 0.4487, + "step": 82977 + }, + { + "epoch": 2.13, + "learning_rate": 4.124207167314886e-07, + "loss": 0.4727, + "step": 82978 + }, + { + "epoch": 2.13, + "learning_rate": 4.123983269493447e-07, + "loss": 0.2476, + "step": 82979 + }, + { + "epoch": 2.13, + "learning_rate": 4.123759376171004e-07, + "loss": 0.3599, + "step": 82980 + }, + { + "epoch": 2.13, + "learning_rate": 4.1235354873477246e-07, + "loss": 0.3208, + "step": 82981 + }, + { + "epoch": 2.13, + "learning_rate": 4.1233116030237833e-07, + "loss": 0.3882, + "step": 82982 + }, + { + "epoch": 2.13, + "learning_rate": 4.123087723199353e-07, + "loss": 0.4487, + "step": 82983 + }, + { + "epoch": 2.13, + "learning_rate": 4.122863847874607e-07, + "loss": 0.3518, + "step": 82984 + }, + { + "epoch": 2.13, + "learning_rate": 4.1226399770497113e-07, + "loss": 0.4121, + "step": 82985 + }, + { + "epoch": 2.13, + "learning_rate": 4.122416110724839e-07, + "loss": 0.4482, + "step": 82986 + }, + { + "epoch": 2.13, + "learning_rate": 4.122192248900163e-07, + "loss": 0.397, + "step": 82987 + }, + { + "epoch": 2.13, + "learning_rate": 4.1219683915758574e-07, + "loss": 0.3525, + "step": 82988 + }, + { + "epoch": 2.13, + "learning_rate": 4.121744538752091e-07, + "loss": 0.2573, + "step": 82989 + }, + { + "epoch": 2.13, + "learning_rate": 4.12152069042903e-07, + "loss": 0.406, + "step": 82990 + }, + { + "epoch": 2.13, + "learning_rate": 4.121296846606851e-07, + "loss": 0.3861, + "step": 82991 + }, + { + "epoch": 2.13, + "learning_rate": 4.121073007285728e-07, + "loss": 0.4541, + "step": 82992 + }, + { + "epoch": 2.13, + "learning_rate": 4.120849172465825e-07, + "loss": 0.3799, + "step": 82993 + }, + { + "epoch": 2.13, + "learning_rate": 4.1206253421473183e-07, + "loss": 0.3867, + "step": 82994 + }, + { + "epoch": 2.13, + "learning_rate": 4.1204015163303774e-07, + "loss": 0.52, + "step": 82995 + }, + { + "epoch": 2.13, + "learning_rate": 4.120177695015179e-07, + "loss": 0.4785, + "step": 82996 + }, + { + "epoch": 2.13, + "learning_rate": 4.119953878201886e-07, + "loss": 0.3132, + "step": 82997 + }, + { + "epoch": 2.13, + "learning_rate": 4.1197300658906753e-07, + "loss": 0.4951, + "step": 82998 + }, + { + "epoch": 2.13, + "learning_rate": 4.1195062580817195e-07, + "loss": 0.5195, + "step": 82999 + }, + { + "epoch": 2.13, + "learning_rate": 4.1192824547751837e-07, + "loss": 0.417, + "step": 83000 + }, + { + "epoch": 2.13, + "learning_rate": 4.119058655971247e-07, + "loss": 0.4248, + "step": 83001 + }, + { + "epoch": 2.13, + "learning_rate": 4.118834861670073e-07, + "loss": 0.356, + "step": 83002 + }, + { + "epoch": 2.13, + "learning_rate": 4.1186110718718356e-07, + "loss": 0.3394, + "step": 83003 + }, + { + "epoch": 2.13, + "learning_rate": 4.118387286576709e-07, + "loss": 0.4407, + "step": 83004 + }, + { + "epoch": 2.13, + "learning_rate": 4.1181635057848654e-07, + "loss": 0.252, + "step": 83005 + }, + { + "epoch": 2.13, + "learning_rate": 4.1179397294964704e-07, + "loss": 0.4194, + "step": 83006 + }, + { + "epoch": 2.13, + "learning_rate": 4.117715957711698e-07, + "loss": 0.4136, + "step": 83007 + }, + { + "epoch": 2.13, + "learning_rate": 4.1174921904307204e-07, + "loss": 0.4292, + "step": 83008 + }, + { + "epoch": 2.13, + "learning_rate": 4.1172684276537164e-07, + "loss": 0.4368, + "step": 83009 + }, + { + "epoch": 2.13, + "learning_rate": 4.1170446693808413e-07, + "loss": 0.4556, + "step": 83010 + }, + { + "epoch": 2.13, + "learning_rate": 4.1168209156122747e-07, + "loss": 0.4736, + "step": 83011 + }, + { + "epoch": 2.13, + "learning_rate": 4.116597166348188e-07, + "loss": 0.3511, + "step": 83012 + }, + { + "epoch": 2.13, + "learning_rate": 4.116373421588756e-07, + "loss": 0.4658, + "step": 83013 + }, + { + "epoch": 2.13, + "learning_rate": 4.1161496813341424e-07, + "loss": 0.4292, + "step": 83014 + }, + { + "epoch": 2.13, + "learning_rate": 4.115925945584522e-07, + "loss": 0.3711, + "step": 83015 + }, + { + "epoch": 2.13, + "learning_rate": 4.1157022143400674e-07, + "loss": 0.3994, + "step": 83016 + }, + { + "epoch": 2.13, + "learning_rate": 4.1154784876009516e-07, + "loss": 0.4624, + "step": 83017 + }, + { + "epoch": 2.13, + "learning_rate": 4.115254765367341e-07, + "loss": 0.4202, + "step": 83018 + }, + { + "epoch": 2.13, + "learning_rate": 4.115031047639412e-07, + "loss": 0.4214, + "step": 83019 + }, + { + "epoch": 2.13, + "learning_rate": 4.1148073344173307e-07, + "loss": 0.3887, + "step": 83020 + }, + { + "epoch": 2.13, + "learning_rate": 4.11458362570127e-07, + "loss": 0.4282, + "step": 83021 + }, + { + "epoch": 2.13, + "learning_rate": 4.114359921491405e-07, + "loss": 0.4993, + "step": 83022 + }, + { + "epoch": 2.13, + "learning_rate": 4.1141362217879014e-07, + "loss": 0.4019, + "step": 83023 + }, + { + "epoch": 2.13, + "learning_rate": 4.1139125265909325e-07, + "loss": 0.347, + "step": 83024 + }, + { + "epoch": 2.13, + "learning_rate": 4.1136888359006706e-07, + "loss": 0.3547, + "step": 83025 + }, + { + "epoch": 2.13, + "learning_rate": 4.11346514971729e-07, + "loss": 0.395, + "step": 83026 + }, + { + "epoch": 2.13, + "learning_rate": 4.1132414680409543e-07, + "loss": 0.3541, + "step": 83027 + }, + { + "epoch": 2.13, + "learning_rate": 4.1130177908718386e-07, + "loss": 0.4331, + "step": 83028 + }, + { + "epoch": 2.13, + "learning_rate": 4.112794118210119e-07, + "loss": 0.3376, + "step": 83029 + }, + { + "epoch": 2.13, + "learning_rate": 4.112570450055962e-07, + "loss": 0.4209, + "step": 83030 + }, + { + "epoch": 2.13, + "learning_rate": 4.1123467864095363e-07, + "loss": 0.519, + "step": 83031 + }, + { + "epoch": 2.13, + "learning_rate": 4.1121231272710146e-07, + "loss": 0.3594, + "step": 83032 + }, + { + "epoch": 2.13, + "learning_rate": 4.11189947264057e-07, + "loss": 0.3245, + "step": 83033 + }, + { + "epoch": 2.13, + "learning_rate": 4.111675822518377e-07, + "loss": 0.4629, + "step": 83034 + }, + { + "epoch": 2.13, + "learning_rate": 4.1114521769045995e-07, + "loss": 0.4038, + "step": 83035 + }, + { + "epoch": 2.13, + "learning_rate": 4.1112285357994124e-07, + "loss": 0.3984, + "step": 83036 + }, + { + "epoch": 2.13, + "learning_rate": 4.1110048992029865e-07, + "loss": 0.4146, + "step": 83037 + }, + { + "epoch": 2.13, + "learning_rate": 4.1107812671154963e-07, + "loss": 0.457, + "step": 83038 + }, + { + "epoch": 2.13, + "learning_rate": 4.110557639537111e-07, + "loss": 0.4297, + "step": 83039 + }, + { + "epoch": 2.13, + "learning_rate": 4.1103340164679976e-07, + "loss": 0.4177, + "step": 83040 + }, + { + "epoch": 2.13, + "learning_rate": 4.11011039790833e-07, + "loss": 0.3159, + "step": 83041 + }, + { + "epoch": 2.13, + "learning_rate": 4.109886783858281e-07, + "loss": 0.4312, + "step": 83042 + }, + { + "epoch": 2.13, + "learning_rate": 4.109663174318023e-07, + "loss": 0.3975, + "step": 83043 + }, + { + "epoch": 2.13, + "learning_rate": 4.1094395692877216e-07, + "loss": 0.4468, + "step": 83044 + }, + { + "epoch": 2.13, + "learning_rate": 4.109215968767552e-07, + "loss": 0.447, + "step": 83045 + }, + { + "epoch": 2.13, + "learning_rate": 4.1089923727576893e-07, + "loss": 0.3708, + "step": 83046 + }, + { + "epoch": 2.13, + "learning_rate": 4.108768781258295e-07, + "loss": 0.407, + "step": 83047 + }, + { + "epoch": 2.13, + "learning_rate": 4.1085451942695504e-07, + "loss": 0.3679, + "step": 83048 + }, + { + "epoch": 2.13, + "learning_rate": 4.1083216117916175e-07, + "loss": 0.3955, + "step": 83049 + }, + { + "epoch": 2.13, + "learning_rate": 4.108098033824673e-07, + "loss": 0.4399, + "step": 83050 + }, + { + "epoch": 2.13, + "learning_rate": 4.1078744603688896e-07, + "loss": 0.3162, + "step": 83051 + }, + { + "epoch": 2.13, + "learning_rate": 4.1076508914244325e-07, + "loss": 0.4468, + "step": 83052 + }, + { + "epoch": 2.13, + "learning_rate": 4.107427326991475e-07, + "loss": 0.4585, + "step": 83053 + }, + { + "epoch": 2.13, + "learning_rate": 4.107203767070191e-07, + "loss": 0.4873, + "step": 83054 + }, + { + "epoch": 2.13, + "learning_rate": 4.1069802116607533e-07, + "loss": 0.2744, + "step": 83055 + }, + { + "epoch": 2.13, + "learning_rate": 4.106756660763325e-07, + "loss": 0.3135, + "step": 83056 + }, + { + "epoch": 2.13, + "learning_rate": 4.1065331143780844e-07, + "loss": 0.4741, + "step": 83057 + }, + { + "epoch": 2.13, + "learning_rate": 4.106309572505202e-07, + "loss": 0.4399, + "step": 83058 + }, + { + "epoch": 2.13, + "learning_rate": 4.1060860351448454e-07, + "loss": 0.519, + "step": 83059 + }, + { + "epoch": 2.13, + "learning_rate": 4.1058625022971907e-07, + "loss": 0.3208, + "step": 83060 + }, + { + "epoch": 2.13, + "learning_rate": 4.105638973962402e-07, + "loss": 0.458, + "step": 83061 + }, + { + "epoch": 2.13, + "learning_rate": 4.1054154501406547e-07, + "loss": 0.4646, + "step": 83062 + }, + { + "epoch": 2.13, + "learning_rate": 4.1051919308321234e-07, + "loss": 0.4038, + "step": 83063 + }, + { + "epoch": 2.13, + "learning_rate": 4.104968416036972e-07, + "loss": 0.3723, + "step": 83064 + }, + { + "epoch": 2.13, + "learning_rate": 4.1047449057553753e-07, + "loss": 0.4253, + "step": 83065 + }, + { + "epoch": 2.13, + "learning_rate": 4.1045213999875053e-07, + "loss": 0.2243, + "step": 83066 + }, + { + "epoch": 2.13, + "learning_rate": 4.104297898733534e-07, + "loss": 0.4423, + "step": 83067 + }, + { + "epoch": 2.13, + "learning_rate": 4.1040744019936314e-07, + "loss": 0.5171, + "step": 83068 + }, + { + "epoch": 2.13, + "learning_rate": 4.103850909767964e-07, + "loss": 0.2869, + "step": 83069 + }, + { + "epoch": 2.13, + "learning_rate": 4.103627422056708e-07, + "loss": 0.4048, + "step": 83070 + }, + { + "epoch": 2.13, + "learning_rate": 4.103403938860033e-07, + "loss": 0.3235, + "step": 83071 + }, + { + "epoch": 2.13, + "learning_rate": 4.103180460178113e-07, + "loss": 0.4075, + "step": 83072 + }, + { + "epoch": 2.13, + "learning_rate": 4.1029569860111136e-07, + "loss": 0.4497, + "step": 83073 + }, + { + "epoch": 2.13, + "learning_rate": 4.102733516359209e-07, + "loss": 0.5298, + "step": 83074 + }, + { + "epoch": 2.13, + "learning_rate": 4.102510051222571e-07, + "loss": 0.563, + "step": 83075 + }, + { + "epoch": 2.13, + "learning_rate": 4.1022865906013727e-07, + "loss": 0.3354, + "step": 83076 + }, + { + "epoch": 2.13, + "learning_rate": 4.102063134495778e-07, + "loss": 0.2767, + "step": 83077 + }, + { + "epoch": 2.13, + "learning_rate": 4.1018396829059665e-07, + "loss": 0.4043, + "step": 83078 + }, + { + "epoch": 2.13, + "learning_rate": 4.1016162358321027e-07, + "loss": 0.4723, + "step": 83079 + }, + { + "epoch": 2.13, + "learning_rate": 4.1013927932743586e-07, + "loss": 0.347, + "step": 83080 + }, + { + "epoch": 2.13, + "learning_rate": 4.101169355232911e-07, + "loss": 0.4775, + "step": 83081 + }, + { + "epoch": 2.13, + "learning_rate": 4.1009459217079236e-07, + "loss": 0.4385, + "step": 83082 + }, + { + "epoch": 2.13, + "learning_rate": 4.10072249269957e-07, + "loss": 0.4575, + "step": 83083 + }, + { + "epoch": 2.13, + "learning_rate": 4.1004990682080253e-07, + "loss": 0.501, + "step": 83084 + }, + { + "epoch": 2.13, + "learning_rate": 4.1002756482334544e-07, + "loss": 0.3926, + "step": 83085 + }, + { + "epoch": 2.13, + "learning_rate": 4.100052232776031e-07, + "loss": 0.4087, + "step": 83086 + }, + { + "epoch": 2.13, + "learning_rate": 4.099828821835926e-07, + "loss": 0.3324, + "step": 83087 + }, + { + "epoch": 2.13, + "learning_rate": 4.099605415413314e-07, + "loss": 0.4126, + "step": 83088 + }, + { + "epoch": 2.13, + "learning_rate": 4.0993820135083635e-07, + "loss": 0.498, + "step": 83089 + }, + { + "epoch": 2.13, + "learning_rate": 4.099158616121241e-07, + "loss": 0.4448, + "step": 83090 + }, + { + "epoch": 2.13, + "learning_rate": 4.0989352232521226e-07, + "loss": 0.3461, + "step": 83091 + }, + { + "epoch": 2.13, + "learning_rate": 4.098711834901176e-07, + "loss": 0.4683, + "step": 83092 + }, + { + "epoch": 2.13, + "learning_rate": 4.098488451068579e-07, + "loss": 0.4312, + "step": 83093 + }, + { + "epoch": 2.13, + "learning_rate": 4.0982650717544953e-07, + "loss": 0.4143, + "step": 83094 + }, + { + "epoch": 2.13, + "learning_rate": 4.098041696959098e-07, + "loss": 0.4707, + "step": 83095 + }, + { + "epoch": 2.13, + "learning_rate": 4.0978183266825583e-07, + "loss": 0.3738, + "step": 83096 + }, + { + "epoch": 2.13, + "learning_rate": 4.0975949609250517e-07, + "loss": 0.4666, + "step": 83097 + }, + { + "epoch": 2.13, + "learning_rate": 4.0973715996867453e-07, + "loss": 0.2965, + "step": 83098 + }, + { + "epoch": 2.13, + "learning_rate": 4.097148242967806e-07, + "loss": 0.2426, + "step": 83099 + }, + { + "epoch": 2.13, + "learning_rate": 4.0969248907684096e-07, + "loss": 0.4761, + "step": 83100 + }, + { + "epoch": 2.13, + "learning_rate": 4.0967015430887296e-07, + "loss": 0.3804, + "step": 83101 + }, + { + "epoch": 2.13, + "learning_rate": 4.09647819992893e-07, + "loss": 0.4668, + "step": 83102 + }, + { + "epoch": 2.13, + "learning_rate": 4.0962548612891866e-07, + "loss": 0.4102, + "step": 83103 + }, + { + "epoch": 2.13, + "learning_rate": 4.0960315271696687e-07, + "loss": 0.397, + "step": 83104 + }, + { + "epoch": 2.13, + "learning_rate": 4.095808197570552e-07, + "loss": 0.2809, + "step": 83105 + }, + { + "epoch": 2.13, + "learning_rate": 4.0955848724919983e-07, + "loss": 0.5127, + "step": 83106 + }, + { + "epoch": 2.13, + "learning_rate": 4.0953615519341857e-07, + "loss": 0.4001, + "step": 83107 + }, + { + "epoch": 2.13, + "learning_rate": 4.0951382358972855e-07, + "loss": 0.3174, + "step": 83108 + }, + { + "epoch": 2.13, + "learning_rate": 4.094914924381463e-07, + "loss": 0.46, + "step": 83109 + }, + { + "epoch": 2.13, + "learning_rate": 4.094691617386897e-07, + "loss": 0.3065, + "step": 83110 + }, + { + "epoch": 2.13, + "learning_rate": 4.0944683149137503e-07, + "loss": 0.4214, + "step": 83111 + }, + { + "epoch": 2.13, + "learning_rate": 4.094245016962197e-07, + "loss": 0.416, + "step": 83112 + }, + { + "epoch": 2.13, + "learning_rate": 4.0940217235324095e-07, + "loss": 0.4126, + "step": 83113 + }, + { + "epoch": 2.13, + "learning_rate": 4.0937984346245616e-07, + "loss": 0.4534, + "step": 83114 + }, + { + "epoch": 2.13, + "learning_rate": 4.093575150238816e-07, + "loss": 0.3156, + "step": 83115 + }, + { + "epoch": 2.13, + "learning_rate": 4.093351870375349e-07, + "loss": 0.4678, + "step": 83116 + }, + { + "epoch": 2.13, + "learning_rate": 4.093128595034331e-07, + "loss": 0.4238, + "step": 83117 + }, + { + "epoch": 2.13, + "learning_rate": 4.092905324215941e-07, + "loss": 0.4047, + "step": 83118 + }, + { + "epoch": 2.13, + "learning_rate": 4.0926820579203326e-07, + "loss": 0.4463, + "step": 83119 + }, + { + "epoch": 2.13, + "learning_rate": 4.0924587961476875e-07, + "loss": 0.4153, + "step": 83120 + }, + { + "epoch": 2.13, + "learning_rate": 4.0922355388981746e-07, + "loss": 0.3105, + "step": 83121 + }, + { + "epoch": 2.13, + "learning_rate": 4.0920122861719685e-07, + "loss": 0.4272, + "step": 83122 + }, + { + "epoch": 2.13, + "learning_rate": 4.0917890379692333e-07, + "loss": 0.4536, + "step": 83123 + }, + { + "epoch": 2.13, + "learning_rate": 4.091565794290144e-07, + "loss": 0.2917, + "step": 83124 + }, + { + "epoch": 2.13, + "learning_rate": 4.0913425551348714e-07, + "loss": 0.373, + "step": 83125 + }, + { + "epoch": 2.13, + "learning_rate": 4.0911193205035887e-07, + "loss": 0.4619, + "step": 83126 + }, + { + "epoch": 2.13, + "learning_rate": 4.0908960903964604e-07, + "loss": 0.4324, + "step": 83127 + }, + { + "epoch": 2.13, + "learning_rate": 4.090672864813667e-07, + "loss": 0.4084, + "step": 83128 + }, + { + "epoch": 2.13, + "learning_rate": 4.090449643755368e-07, + "loss": 0.3264, + "step": 83129 + }, + { + "epoch": 2.13, + "learning_rate": 4.0902264272217414e-07, + "loss": 0.4341, + "step": 83130 + }, + { + "epoch": 2.13, + "learning_rate": 4.090003215212959e-07, + "loss": 0.2644, + "step": 83131 + }, + { + "epoch": 2.13, + "learning_rate": 4.089780007729187e-07, + "loss": 0.3489, + "step": 83132 + }, + { + "epoch": 2.13, + "learning_rate": 4.0895568047705973e-07, + "loss": 0.3804, + "step": 83133 + }, + { + "epoch": 2.13, + "learning_rate": 4.089333606337363e-07, + "loss": 0.4524, + "step": 83134 + }, + { + "epoch": 2.13, + "learning_rate": 4.0891104124296583e-07, + "loss": 0.4888, + "step": 83135 + }, + { + "epoch": 2.13, + "learning_rate": 4.0888872230476455e-07, + "loss": 0.4517, + "step": 83136 + }, + { + "epoch": 2.13, + "learning_rate": 4.0886640381915006e-07, + "loss": 0.4458, + "step": 83137 + }, + { + "epoch": 2.13, + "learning_rate": 4.088440857861397e-07, + "loss": 0.3013, + "step": 83138 + }, + { + "epoch": 2.13, + "learning_rate": 4.088217682057502e-07, + "loss": 0.4229, + "step": 83139 + }, + { + "epoch": 2.13, + "learning_rate": 4.087994510779984e-07, + "loss": 0.3479, + "step": 83140 + }, + { + "epoch": 2.13, + "learning_rate": 4.087771344029016e-07, + "loss": 0.3872, + "step": 83141 + }, + { + "epoch": 2.13, + "learning_rate": 4.0875481818047706e-07, + "loss": 0.3605, + "step": 83142 + }, + { + "epoch": 2.13, + "learning_rate": 4.087325024107421e-07, + "loss": 0.5718, + "step": 83143 + }, + { + "epoch": 2.13, + "learning_rate": 4.087101870937131e-07, + "loss": 0.3655, + "step": 83144 + }, + { + "epoch": 2.13, + "learning_rate": 4.086878722294075e-07, + "loss": 0.3687, + "step": 83145 + }, + { + "epoch": 2.13, + "learning_rate": 4.086655578178425e-07, + "loss": 0.5435, + "step": 83146 + }, + { + "epoch": 2.13, + "learning_rate": 4.0864324385903535e-07, + "loss": 0.4272, + "step": 83147 + }, + { + "epoch": 2.13, + "learning_rate": 4.0862093035300294e-07, + "loss": 0.5083, + "step": 83148 + }, + { + "epoch": 2.13, + "learning_rate": 4.0859861729976184e-07, + "loss": 0.3706, + "step": 83149 + }, + { + "epoch": 2.13, + "learning_rate": 4.085763046993297e-07, + "loss": 0.293, + "step": 83150 + }, + { + "epoch": 2.13, + "learning_rate": 4.085539925517234e-07, + "loss": 0.4048, + "step": 83151 + }, + { + "epoch": 2.13, + "learning_rate": 4.0853168085696057e-07, + "loss": 0.3564, + "step": 83152 + }, + { + "epoch": 2.13, + "learning_rate": 4.0850936961505734e-07, + "loss": 0.3638, + "step": 83153 + }, + { + "epoch": 2.13, + "learning_rate": 4.084870588260314e-07, + "loss": 0.4292, + "step": 83154 + }, + { + "epoch": 2.13, + "learning_rate": 4.084647484899001e-07, + "loss": 0.3119, + "step": 83155 + }, + { + "epoch": 2.13, + "learning_rate": 4.084424386066797e-07, + "loss": 0.3955, + "step": 83156 + }, + { + "epoch": 2.13, + "learning_rate": 4.0842012917638767e-07, + "loss": 0.4263, + "step": 83157 + }, + { + "epoch": 2.13, + "learning_rate": 4.083978201990417e-07, + "loss": 0.5073, + "step": 83158 + }, + { + "epoch": 2.13, + "learning_rate": 4.083755116746578e-07, + "loss": 0.3506, + "step": 83159 + }, + { + "epoch": 2.13, + "learning_rate": 4.08353203603254e-07, + "loss": 0.4204, + "step": 83160 + }, + { + "epoch": 2.13, + "learning_rate": 4.083308959848465e-07, + "loss": 0.3601, + "step": 83161 + }, + { + "epoch": 2.13, + "learning_rate": 4.0830858881945286e-07, + "loss": 0.439, + "step": 83162 + }, + { + "epoch": 2.13, + "learning_rate": 4.0828628210709014e-07, + "loss": 0.3564, + "step": 83163 + }, + { + "epoch": 2.13, + "learning_rate": 4.0826397584777585e-07, + "loss": 0.3708, + "step": 83164 + }, + { + "epoch": 2.13, + "learning_rate": 4.082416700415262e-07, + "loss": 0.447, + "step": 83165 + }, + { + "epoch": 2.13, + "learning_rate": 4.082193646883586e-07, + "loss": 0.3799, + "step": 83166 + }, + { + "epoch": 2.13, + "learning_rate": 4.0819705978829035e-07, + "loss": 0.4565, + "step": 83167 + }, + { + "epoch": 2.13, + "learning_rate": 4.0817475534133874e-07, + "loss": 0.4678, + "step": 83168 + }, + { + "epoch": 2.13, + "learning_rate": 4.0815245134752053e-07, + "loss": 0.4376, + "step": 83169 + }, + { + "epoch": 2.13, + "learning_rate": 4.081301478068523e-07, + "loss": 0.3809, + "step": 83170 + }, + { + "epoch": 2.13, + "learning_rate": 4.0810784471935166e-07, + "loss": 0.3955, + "step": 83171 + }, + { + "epoch": 2.13, + "learning_rate": 4.08085542085036e-07, + "loss": 0.5132, + "step": 83172 + }, + { + "epoch": 2.13, + "learning_rate": 4.0806323990392165e-07, + "loss": 0.4077, + "step": 83173 + }, + { + "epoch": 2.13, + "learning_rate": 4.0804093817602616e-07, + "loss": 0.314, + "step": 83174 + }, + { + "epoch": 2.13, + "learning_rate": 4.080186369013664e-07, + "loss": 0.252, + "step": 83175 + }, + { + "epoch": 2.13, + "learning_rate": 4.0799633607995985e-07, + "loss": 0.5044, + "step": 83176 + }, + { + "epoch": 2.13, + "learning_rate": 4.07974035711823e-07, + "loss": 0.5347, + "step": 83177 + }, + { + "epoch": 2.13, + "learning_rate": 4.079517357969736e-07, + "loss": 0.3833, + "step": 83178 + }, + { + "epoch": 2.13, + "learning_rate": 4.07929436335428e-07, + "loss": 0.3999, + "step": 83179 + }, + { + "epoch": 2.13, + "learning_rate": 4.079071373272035e-07, + "loss": 0.3838, + "step": 83180 + }, + { + "epoch": 2.13, + "learning_rate": 4.078848387723176e-07, + "loss": 0.354, + "step": 83181 + }, + { + "epoch": 2.13, + "learning_rate": 4.0786254067078683e-07, + "loss": 0.3136, + "step": 83182 + }, + { + "epoch": 2.13, + "learning_rate": 4.0784024302262844e-07, + "loss": 0.3691, + "step": 83183 + }, + { + "epoch": 2.13, + "learning_rate": 4.078179458278596e-07, + "loss": 0.458, + "step": 83184 + }, + { + "epoch": 2.13, + "learning_rate": 4.0779564908649755e-07, + "loss": 0.386, + "step": 83185 + }, + { + "epoch": 2.13, + "learning_rate": 4.0777335279855883e-07, + "loss": 0.3672, + "step": 83186 + }, + { + "epoch": 2.13, + "learning_rate": 4.0775105696406087e-07, + "loss": 0.4619, + "step": 83187 + }, + { + "epoch": 2.13, + "learning_rate": 4.0772876158302105e-07, + "loss": 0.3092, + "step": 83188 + }, + { + "epoch": 2.13, + "learning_rate": 4.0770646665545615e-07, + "loss": 0.4294, + "step": 83189 + }, + { + "epoch": 2.13, + "learning_rate": 4.0768417218138274e-07, + "loss": 0.4463, + "step": 83190 + }, + { + "epoch": 2.13, + "learning_rate": 4.0766187816081833e-07, + "loss": 0.3696, + "step": 83191 + }, + { + "epoch": 2.13, + "learning_rate": 4.076395845937799e-07, + "loss": 0.4263, + "step": 83192 + }, + { + "epoch": 2.13, + "learning_rate": 4.07617291480285e-07, + "loss": 0.5293, + "step": 83193 + }, + { + "epoch": 2.13, + "learning_rate": 4.0759499882035007e-07, + "loss": 0.4844, + "step": 83194 + }, + { + "epoch": 2.13, + "learning_rate": 4.075727066139922e-07, + "loss": 0.3809, + "step": 83195 + }, + { + "epoch": 2.13, + "learning_rate": 4.075504148612289e-07, + "loss": 0.3264, + "step": 83196 + }, + { + "epoch": 2.13, + "learning_rate": 4.075281235620772e-07, + "loss": 0.3569, + "step": 83197 + }, + { + "epoch": 2.13, + "learning_rate": 4.0750583271655403e-07, + "loss": 0.3701, + "step": 83198 + }, + { + "epoch": 2.13, + "learning_rate": 4.0748354232467607e-07, + "loss": 0.4082, + "step": 83199 + }, + { + "epoch": 2.13, + "learning_rate": 4.074612523864607e-07, + "loss": 0.5229, + "step": 83200 + }, + { + "epoch": 2.13, + "learning_rate": 4.074389629019249e-07, + "loss": 0.363, + "step": 83201 + }, + { + "epoch": 2.13, + "learning_rate": 4.0741667387108633e-07, + "loss": 0.3264, + "step": 83202 + }, + { + "epoch": 2.13, + "learning_rate": 4.073943852939612e-07, + "loss": 0.4849, + "step": 83203 + }, + { + "epoch": 2.13, + "learning_rate": 4.073720971705669e-07, + "loss": 0.3733, + "step": 83204 + }, + { + "epoch": 2.13, + "learning_rate": 4.0734980950092046e-07, + "loss": 0.374, + "step": 83205 + }, + { + "epoch": 2.13, + "learning_rate": 4.0732752228503955e-07, + "loss": 0.3726, + "step": 83206 + }, + { + "epoch": 2.13, + "learning_rate": 4.073052355229402e-07, + "loss": 0.4221, + "step": 83207 + }, + { + "epoch": 2.13, + "learning_rate": 4.0728294921464035e-07, + "loss": 0.5073, + "step": 83208 + }, + { + "epoch": 2.13, + "learning_rate": 4.0726066336015643e-07, + "loss": 0.3848, + "step": 83209 + }, + { + "epoch": 2.13, + "learning_rate": 4.07238377959506e-07, + "loss": 0.4268, + "step": 83210 + }, + { + "epoch": 2.13, + "learning_rate": 4.0721609301270563e-07, + "loss": 0.3779, + "step": 83211 + }, + { + "epoch": 2.13, + "learning_rate": 4.071938085197726e-07, + "loss": 0.3662, + "step": 83212 + }, + { + "epoch": 2.13, + "learning_rate": 4.07171524480724e-07, + "loss": 0.4443, + "step": 83213 + }, + { + "epoch": 2.13, + "learning_rate": 4.0714924089557734e-07, + "loss": 0.3882, + "step": 83214 + }, + { + "epoch": 2.13, + "learning_rate": 4.071269577643488e-07, + "loss": 0.3184, + "step": 83215 + }, + { + "epoch": 2.13, + "learning_rate": 4.0710467508705593e-07, + "loss": 0.3633, + "step": 83216 + }, + { + "epoch": 2.13, + "learning_rate": 4.070823928637157e-07, + "loss": 0.4026, + "step": 83217 + }, + { + "epoch": 2.13, + "learning_rate": 4.070601110943457e-07, + "loss": 0.3416, + "step": 83218 + }, + { + "epoch": 2.13, + "learning_rate": 4.070378297789624e-07, + "loss": 0.4893, + "step": 83219 + }, + { + "epoch": 2.13, + "learning_rate": 4.070155489175826e-07, + "loss": 0.4351, + "step": 83220 + }, + { + "epoch": 2.13, + "learning_rate": 4.0699326851022376e-07, + "loss": 0.3874, + "step": 83221 + }, + { + "epoch": 2.13, + "learning_rate": 4.069709885569029e-07, + "loss": 0.3058, + "step": 83222 + }, + { + "epoch": 2.13, + "learning_rate": 4.0694870905763747e-07, + "loss": 0.3589, + "step": 83223 + }, + { + "epoch": 2.13, + "learning_rate": 4.0692643001244373e-07, + "loss": 0.4199, + "step": 83224 + }, + { + "epoch": 2.13, + "learning_rate": 4.0690415142133917e-07, + "loss": 0.446, + "step": 83225 + }, + { + "epoch": 2.13, + "learning_rate": 4.068818732843412e-07, + "loss": 0.321, + "step": 83226 + }, + { + "epoch": 2.13, + "learning_rate": 4.0685959560146623e-07, + "loss": 0.4458, + "step": 83227 + }, + { + "epoch": 2.13, + "learning_rate": 4.0683731837273184e-07, + "loss": 0.3337, + "step": 83228 + }, + { + "epoch": 2.13, + "learning_rate": 4.068150415981545e-07, + "loss": 0.5283, + "step": 83229 + }, + { + "epoch": 2.13, + "learning_rate": 4.0679276527775166e-07, + "loss": 0.282, + "step": 83230 + }, + { + "epoch": 2.13, + "learning_rate": 4.067704894115407e-07, + "loss": 0.375, + "step": 83231 + }, + { + "epoch": 2.13, + "learning_rate": 4.0674821399953783e-07, + "loss": 0.5376, + "step": 83232 + }, + { + "epoch": 2.13, + "learning_rate": 4.0672593904176066e-07, + "loss": 0.4426, + "step": 83233 + }, + { + "epoch": 2.13, + "learning_rate": 4.0670366453822613e-07, + "loss": 0.4236, + "step": 83234 + }, + { + "epoch": 2.13, + "learning_rate": 4.066813904889517e-07, + "loss": 0.3948, + "step": 83235 + }, + { + "epoch": 2.13, + "learning_rate": 4.066591168939536e-07, + "loss": 0.2944, + "step": 83236 + }, + { + "epoch": 2.13, + "learning_rate": 4.066368437532495e-07, + "loss": 0.4194, + "step": 83237 + }, + { + "epoch": 2.13, + "learning_rate": 4.066145710668565e-07, + "loss": 0.4263, + "step": 83238 + }, + { + "epoch": 2.13, + "learning_rate": 4.0659229883479117e-07, + "loss": 0.4531, + "step": 83239 + }, + { + "epoch": 2.13, + "learning_rate": 4.0657002705707113e-07, + "loss": 0.5151, + "step": 83240 + }, + { + "epoch": 2.13, + "learning_rate": 4.065477557337128e-07, + "loss": 0.3707, + "step": 83241 + }, + { + "epoch": 2.13, + "learning_rate": 4.065254848647336e-07, + "loss": 0.4321, + "step": 83242 + }, + { + "epoch": 2.13, + "learning_rate": 4.065032144501505e-07, + "loss": 0.4033, + "step": 83243 + }, + { + "epoch": 2.13, + "learning_rate": 4.0648094448998093e-07, + "loss": 0.4023, + "step": 83244 + }, + { + "epoch": 2.13, + "learning_rate": 4.0645867498424123e-07, + "loss": 0.3216, + "step": 83245 + }, + { + "epoch": 2.13, + "learning_rate": 4.0643640593294894e-07, + "loss": 0.3733, + "step": 83246 + }, + { + "epoch": 2.13, + "learning_rate": 4.064141373361213e-07, + "loss": 0.4014, + "step": 83247 + }, + { + "epoch": 2.13, + "learning_rate": 4.063918691937751e-07, + "loss": 0.4419, + "step": 83248 + }, + { + "epoch": 2.13, + "learning_rate": 4.0636960150592694e-07, + "loss": 0.2581, + "step": 83249 + }, + { + "epoch": 2.13, + "learning_rate": 4.0634733427259426e-07, + "loss": 0.4761, + "step": 83250 + }, + { + "epoch": 2.13, + "learning_rate": 4.0632506749379423e-07, + "loss": 0.4575, + "step": 83251 + }, + { + "epoch": 2.13, + "learning_rate": 4.0630280116954405e-07, + "loss": 0.4097, + "step": 83252 + }, + { + "epoch": 2.13, + "learning_rate": 4.062805352998603e-07, + "loss": 0.3047, + "step": 83253 + }, + { + "epoch": 2.13, + "learning_rate": 4.0625826988476007e-07, + "loss": 0.3608, + "step": 83254 + }, + { + "epoch": 2.13, + "learning_rate": 4.0623600492426067e-07, + "loss": 0.3574, + "step": 83255 + }, + { + "epoch": 2.13, + "learning_rate": 4.0621374041837943e-07, + "loss": 0.417, + "step": 83256 + }, + { + "epoch": 2.13, + "learning_rate": 4.061914763671326e-07, + "loss": 0.3225, + "step": 83257 + }, + { + "epoch": 2.13, + "learning_rate": 4.061692127705381e-07, + "loss": 0.3848, + "step": 83258 + }, + { + "epoch": 2.13, + "learning_rate": 4.0614694962861207e-07, + "loss": 0.3008, + "step": 83259 + }, + { + "epoch": 2.13, + "learning_rate": 4.0612468694137213e-07, + "loss": 0.4355, + "step": 83260 + }, + { + "epoch": 2.13, + "learning_rate": 4.0610242470883547e-07, + "loss": 0.4014, + "step": 83261 + }, + { + "epoch": 2.13, + "learning_rate": 4.0608016293101854e-07, + "loss": 0.4282, + "step": 83262 + }, + { + "epoch": 2.13, + "learning_rate": 4.060579016079387e-07, + "loss": 0.4868, + "step": 83263 + }, + { + "epoch": 2.13, + "learning_rate": 4.060356407396135e-07, + "loss": 0.2797, + "step": 83264 + }, + { + "epoch": 2.13, + "learning_rate": 4.0601338032605903e-07, + "loss": 0.3059, + "step": 83265 + }, + { + "epoch": 2.13, + "learning_rate": 4.059911203672929e-07, + "loss": 0.4172, + "step": 83266 + }, + { + "epoch": 2.13, + "learning_rate": 4.0596886086333195e-07, + "loss": 0.4502, + "step": 83267 + }, + { + "epoch": 2.13, + "learning_rate": 4.059466018141937e-07, + "loss": 0.4839, + "step": 83268 + }, + { + "epoch": 2.13, + "learning_rate": 4.059243432198948e-07, + "loss": 0.5562, + "step": 83269 + }, + { + "epoch": 2.13, + "learning_rate": 4.05902085080452e-07, + "loss": 0.5615, + "step": 83270 + }, + { + "epoch": 2.13, + "learning_rate": 4.0587982739588265e-07, + "loss": 0.3302, + "step": 83271 + }, + { + "epoch": 2.13, + "learning_rate": 4.0585757016620383e-07, + "loss": 0.4141, + "step": 83272 + }, + { + "epoch": 2.13, + "learning_rate": 4.0583531339143286e-07, + "loss": 0.3828, + "step": 83273 + }, + { + "epoch": 2.13, + "learning_rate": 4.0581305707158607e-07, + "loss": 0.2847, + "step": 83274 + }, + { + "epoch": 2.13, + "learning_rate": 4.05790801206681e-07, + "loss": 0.4131, + "step": 83275 + }, + { + "epoch": 2.13, + "learning_rate": 4.0576854579673457e-07, + "loss": 0.5278, + "step": 83276 + }, + { + "epoch": 2.13, + "learning_rate": 4.0574629084176417e-07, + "loss": 0.4187, + "step": 83277 + }, + { + "epoch": 2.13, + "learning_rate": 4.057240363417865e-07, + "loss": 0.4019, + "step": 83278 + }, + { + "epoch": 2.13, + "learning_rate": 4.057017822968183e-07, + "loss": 0.3721, + "step": 83279 + }, + { + "epoch": 2.13, + "learning_rate": 4.0567952870687684e-07, + "loss": 0.4102, + "step": 83280 + }, + { + "epoch": 2.13, + "learning_rate": 4.056572755719797e-07, + "loss": 0.2705, + "step": 83281 + }, + { + "epoch": 2.13, + "learning_rate": 4.0563502289214303e-07, + "loss": 0.4521, + "step": 83282 + }, + { + "epoch": 2.13, + "learning_rate": 4.0561277066738433e-07, + "loss": 0.4946, + "step": 83283 + }, + { + "epoch": 2.13, + "learning_rate": 4.0559051889772056e-07, + "loss": 0.4507, + "step": 83284 + }, + { + "epoch": 2.13, + "learning_rate": 4.055682675831692e-07, + "loss": 0.4375, + "step": 83285 + }, + { + "epoch": 2.13, + "learning_rate": 4.0554601672374643e-07, + "loss": 0.502, + "step": 83286 + }, + { + "epoch": 2.13, + "learning_rate": 4.0552376631946986e-07, + "loss": 0.3187, + "step": 83287 + }, + { + "epoch": 2.13, + "learning_rate": 4.055015163703567e-07, + "loss": 0.3848, + "step": 83288 + }, + { + "epoch": 2.13, + "learning_rate": 4.0547926687642334e-07, + "loss": 0.5356, + "step": 83289 + }, + { + "epoch": 2.13, + "learning_rate": 4.054570178376876e-07, + "loss": 0.3408, + "step": 83290 + }, + { + "epoch": 2.13, + "learning_rate": 4.0543476925416567e-07, + "loss": 0.481, + "step": 83291 + }, + { + "epoch": 2.13, + "learning_rate": 4.05412521125875e-07, + "loss": 0.4766, + "step": 83292 + }, + { + "epoch": 2.13, + "learning_rate": 4.053902734528325e-07, + "loss": 0.343, + "step": 83293 + }, + { + "epoch": 2.13, + "learning_rate": 4.0536802623505585e-07, + "loss": 0.4624, + "step": 83294 + }, + { + "epoch": 2.13, + "learning_rate": 4.053457794725611e-07, + "loss": 0.3701, + "step": 83295 + }, + { + "epoch": 2.13, + "learning_rate": 4.053235331653658e-07, + "loss": 0.4756, + "step": 83296 + }, + { + "epoch": 2.13, + "learning_rate": 4.05301287313487e-07, + "loss": 0.501, + "step": 83297 + }, + { + "epoch": 2.13, + "learning_rate": 4.052790419169423e-07, + "loss": 0.3893, + "step": 83298 + }, + { + "epoch": 2.13, + "learning_rate": 4.052567969757473e-07, + "loss": 0.4119, + "step": 83299 + }, + { + "epoch": 2.14, + "learning_rate": 4.0523455248991986e-07, + "loss": 0.4839, + "step": 83300 + }, + { + "epoch": 2.14, + "learning_rate": 4.0521230845947707e-07, + "loss": 0.376, + "step": 83301 + }, + { + "epoch": 2.14, + "learning_rate": 4.051900648844362e-07, + "loss": 0.3848, + "step": 83302 + }, + { + "epoch": 2.14, + "learning_rate": 4.051678217648136e-07, + "loss": 0.3245, + "step": 83303 + }, + { + "epoch": 2.14, + "learning_rate": 4.051455791006265e-07, + "loss": 0.3804, + "step": 83304 + }, + { + "epoch": 2.14, + "learning_rate": 4.051233368918923e-07, + "loss": 0.308, + "step": 83305 + }, + { + "epoch": 2.14, + "learning_rate": 4.05101095138628e-07, + "loss": 0.5176, + "step": 83306 + }, + { + "epoch": 2.14, + "learning_rate": 4.050788538408501e-07, + "loss": 0.4614, + "step": 83307 + }, + { + "epoch": 2.14, + "learning_rate": 4.050566129985763e-07, + "loss": 0.3486, + "step": 83308 + }, + { + "epoch": 2.14, + "learning_rate": 4.0503437261182307e-07, + "loss": 0.3419, + "step": 83309 + }, + { + "epoch": 2.14, + "learning_rate": 4.0501213268060755e-07, + "loss": 0.3076, + "step": 83310 + }, + { + "epoch": 2.14, + "learning_rate": 4.0498989320494726e-07, + "loss": 0.4609, + "step": 83311 + }, + { + "epoch": 2.14, + "learning_rate": 4.0496765418485855e-07, + "loss": 0.308, + "step": 83312 + }, + { + "epoch": 2.14, + "learning_rate": 4.0494541562035865e-07, + "loss": 0.4529, + "step": 83313 + }, + { + "epoch": 2.14, + "learning_rate": 4.049231775114648e-07, + "loss": 0.4263, + "step": 83314 + }, + { + "epoch": 2.14, + "learning_rate": 4.049009398581942e-07, + "loss": 0.3438, + "step": 83315 + }, + { + "epoch": 2.14, + "learning_rate": 4.048787026605631e-07, + "loss": 0.459, + "step": 83316 + }, + { + "epoch": 2.14, + "learning_rate": 4.0485646591858926e-07, + "loss": 0.3022, + "step": 83317 + }, + { + "epoch": 2.14, + "learning_rate": 4.0483422963228965e-07, + "loss": 0.4194, + "step": 83318 + }, + { + "epoch": 2.14, + "learning_rate": 4.048119938016812e-07, + "loss": 0.4596, + "step": 83319 + }, + { + "epoch": 2.14, + "learning_rate": 4.0478975842678044e-07, + "loss": 0.4785, + "step": 83320 + }, + { + "epoch": 2.14, + "learning_rate": 4.047675235076048e-07, + "loss": 0.3916, + "step": 83321 + }, + { + "epoch": 2.14, + "learning_rate": 4.0474528904417126e-07, + "loss": 0.3528, + "step": 83322 + }, + { + "epoch": 2.14, + "learning_rate": 4.047230550364973e-07, + "loss": 0.4727, + "step": 83323 + }, + { + "epoch": 2.14, + "learning_rate": 4.0470082148459907e-07, + "loss": 0.4976, + "step": 83324 + }, + { + "epoch": 2.14, + "learning_rate": 4.046785883884941e-07, + "loss": 0.4448, + "step": 83325 + }, + { + "epoch": 2.14, + "learning_rate": 4.0465635574819933e-07, + "loss": 0.2217, + "step": 83326 + }, + { + "epoch": 2.14, + "learning_rate": 4.0463412356373226e-07, + "loss": 0.5034, + "step": 83327 + }, + { + "epoch": 2.14, + "learning_rate": 4.046118918351095e-07, + "loss": 0.3962, + "step": 83328 + }, + { + "epoch": 2.14, + "learning_rate": 4.0458966056234754e-07, + "loss": 0.3594, + "step": 83329 + }, + { + "epoch": 2.14, + "learning_rate": 4.04567429745464e-07, + "loss": 0.3682, + "step": 83330 + }, + { + "epoch": 2.14, + "learning_rate": 4.0454519938447573e-07, + "loss": 0.3511, + "step": 83331 + }, + { + "epoch": 2.14, + "learning_rate": 4.045229694794002e-07, + "loss": 0.3728, + "step": 83332 + }, + { + "epoch": 2.14, + "learning_rate": 4.045007400302537e-07, + "loss": 0.5015, + "step": 83333 + }, + { + "epoch": 2.14, + "learning_rate": 4.0447851103705354e-07, + "loss": 0.478, + "step": 83334 + }, + { + "epoch": 2.14, + "learning_rate": 4.0445628249981733e-07, + "loss": 0.3931, + "step": 83335 + }, + { + "epoch": 2.14, + "learning_rate": 4.0443405441856103e-07, + "loss": 0.5327, + "step": 83336 + }, + { + "epoch": 2.14, + "learning_rate": 4.044118267933023e-07, + "loss": 0.3411, + "step": 83337 + }, + { + "epoch": 2.14, + "learning_rate": 4.0438959962405836e-07, + "loss": 0.3726, + "step": 83338 + }, + { + "epoch": 2.14, + "learning_rate": 4.0436737291084556e-07, + "loss": 0.4839, + "step": 83339 + }, + { + "epoch": 2.14, + "learning_rate": 4.043451466536816e-07, + "loss": 0.4722, + "step": 83340 + }, + { + "epoch": 2.14, + "learning_rate": 4.043229208525829e-07, + "loss": 0.4341, + "step": 83341 + }, + { + "epoch": 2.14, + "learning_rate": 4.043006955075666e-07, + "loss": 0.3055, + "step": 83342 + }, + { + "epoch": 2.14, + "learning_rate": 4.042784706186501e-07, + "loss": 0.4585, + "step": 83343 + }, + { + "epoch": 2.14, + "learning_rate": 4.042562461858503e-07, + "loss": 0.3916, + "step": 83344 + }, + { + "epoch": 2.14, + "learning_rate": 4.042340222091839e-07, + "loss": 0.344, + "step": 83345 + }, + { + "epoch": 2.14, + "learning_rate": 4.0421179868866807e-07, + "loss": 0.438, + "step": 83346 + }, + { + "epoch": 2.14, + "learning_rate": 4.041895756243202e-07, + "loss": 0.418, + "step": 83347 + }, + { + "epoch": 2.14, + "learning_rate": 4.0416735301615666e-07, + "loss": 0.4033, + "step": 83348 + }, + { + "epoch": 2.14, + "learning_rate": 4.041451308641951e-07, + "loss": 0.3691, + "step": 83349 + }, + { + "epoch": 2.14, + "learning_rate": 4.0412290916845184e-07, + "loss": 0.3205, + "step": 83350 + }, + { + "epoch": 2.14, + "learning_rate": 4.0410068792894434e-07, + "loss": 0.3793, + "step": 83351 + }, + { + "epoch": 2.14, + "learning_rate": 4.040784671456898e-07, + "loss": 0.4122, + "step": 83352 + }, + { + "epoch": 2.14, + "learning_rate": 4.0405624681870475e-07, + "loss": 0.3501, + "step": 83353 + }, + { + "epoch": 2.14, + "learning_rate": 4.0403402694800636e-07, + "loss": 0.3669, + "step": 83354 + }, + { + "epoch": 2.14, + "learning_rate": 4.0401180753361177e-07, + "loss": 0.3511, + "step": 83355 + }, + { + "epoch": 2.14, + "learning_rate": 4.0398958857553813e-07, + "loss": 0.4326, + "step": 83356 + }, + { + "epoch": 2.14, + "learning_rate": 4.0396737007380243e-07, + "loss": 0.4067, + "step": 83357 + }, + { + "epoch": 2.14, + "learning_rate": 4.0394515202842103e-07, + "loss": 0.4521, + "step": 83358 + }, + { + "epoch": 2.14, + "learning_rate": 4.039229344394115e-07, + "loss": 0.3966, + "step": 83359 + }, + { + "epoch": 2.14, + "learning_rate": 4.0390071730679074e-07, + "loss": 0.4058, + "step": 83360 + }, + { + "epoch": 2.14, + "learning_rate": 4.0387850063057616e-07, + "loss": 0.3055, + "step": 83361 + }, + { + "epoch": 2.14, + "learning_rate": 4.03856284410784e-07, + "loss": 0.3254, + "step": 83362 + }, + { + "epoch": 2.14, + "learning_rate": 4.038340686474317e-07, + "loss": 0.4185, + "step": 83363 + }, + { + "epoch": 2.14, + "learning_rate": 4.0381185334053627e-07, + "loss": 0.4448, + "step": 83364 + }, + { + "epoch": 2.14, + "learning_rate": 4.03789638490115e-07, + "loss": 0.4878, + "step": 83365 + }, + { + "epoch": 2.14, + "learning_rate": 4.0376742409618434e-07, + "loss": 0.377, + "step": 83366 + }, + { + "epoch": 2.14, + "learning_rate": 4.0374521015876186e-07, + "loss": 0.4106, + "step": 83367 + }, + { + "epoch": 2.14, + "learning_rate": 4.037229966778638e-07, + "loss": 0.3843, + "step": 83368 + }, + { + "epoch": 2.14, + "learning_rate": 4.03700783653508e-07, + "loss": 0.3779, + "step": 83369 + }, + { + "epoch": 2.14, + "learning_rate": 4.036785710857108e-07, + "loss": 0.4985, + "step": 83370 + }, + { + "epoch": 2.14, + "learning_rate": 4.0365635897448946e-07, + "loss": 0.4102, + "step": 83371 + }, + { + "epoch": 2.14, + "learning_rate": 4.036341473198611e-07, + "loss": 0.4595, + "step": 83372 + }, + { + "epoch": 2.14, + "learning_rate": 4.0361193612184297e-07, + "loss": 0.5005, + "step": 83373 + }, + { + "epoch": 2.14, + "learning_rate": 4.0358972538045134e-07, + "loss": 0.4507, + "step": 83374 + }, + { + "epoch": 2.14, + "learning_rate": 4.0356751509570376e-07, + "loss": 0.3896, + "step": 83375 + }, + { + "epoch": 2.14, + "learning_rate": 4.03545305267617e-07, + "loss": 0.4229, + "step": 83376 + }, + { + "epoch": 2.14, + "learning_rate": 4.0352309589620846e-07, + "loss": 0.4634, + "step": 83377 + }, + { + "epoch": 2.14, + "learning_rate": 4.03500886981495e-07, + "loss": 0.4644, + "step": 83378 + }, + { + "epoch": 2.14, + "learning_rate": 4.0347867852349313e-07, + "loss": 0.2947, + "step": 83379 + }, + { + "epoch": 2.14, + "learning_rate": 4.034564705222201e-07, + "loss": 0.4785, + "step": 83380 + }, + { + "epoch": 2.14, + "learning_rate": 4.0343426297769313e-07, + "loss": 0.3762, + "step": 83381 + }, + { + "epoch": 2.14, + "learning_rate": 4.034120558899294e-07, + "loss": 0.4276, + "step": 83382 + }, + { + "epoch": 2.14, + "learning_rate": 4.0338984925894527e-07, + "loss": 0.5078, + "step": 83383 + }, + { + "epoch": 2.14, + "learning_rate": 4.033676430847581e-07, + "loss": 0.4751, + "step": 83384 + }, + { + "epoch": 2.14, + "learning_rate": 4.033454373673849e-07, + "loss": 0.3233, + "step": 83385 + }, + { + "epoch": 2.14, + "learning_rate": 4.0332323210684305e-07, + "loss": 0.3662, + "step": 83386 + }, + { + "epoch": 2.14, + "learning_rate": 4.033010273031492e-07, + "loss": 0.3416, + "step": 83387 + }, + { + "epoch": 2.14, + "learning_rate": 4.032788229563199e-07, + "loss": 0.4272, + "step": 83388 + }, + { + "epoch": 2.14, + "learning_rate": 4.0325661906637254e-07, + "loss": 0.3394, + "step": 83389 + }, + { + "epoch": 2.14, + "learning_rate": 4.032344156333246e-07, + "loss": 0.3247, + "step": 83390 + }, + { + "epoch": 2.14, + "learning_rate": 4.0321221265719216e-07, + "loss": 0.3767, + "step": 83391 + }, + { + "epoch": 2.14, + "learning_rate": 4.031900101379928e-07, + "loss": 0.3245, + "step": 83392 + }, + { + "epoch": 2.14, + "learning_rate": 4.0316780807574335e-07, + "loss": 0.4751, + "step": 83393 + }, + { + "epoch": 2.14, + "learning_rate": 4.0314560647046116e-07, + "loss": 0.4392, + "step": 83394 + }, + { + "epoch": 2.14, + "learning_rate": 4.031234053221626e-07, + "loss": 0.4624, + "step": 83395 + }, + { + "epoch": 2.14, + "learning_rate": 4.0310120463086503e-07, + "loss": 0.3552, + "step": 83396 + }, + { + "epoch": 2.14, + "learning_rate": 4.030790043965858e-07, + "loss": 0.2489, + "step": 83397 + }, + { + "epoch": 2.14, + "learning_rate": 4.0305680461934124e-07, + "loss": 0.4917, + "step": 83398 + }, + { + "epoch": 2.14, + "learning_rate": 4.030346052991489e-07, + "loss": 0.385, + "step": 83399 + }, + { + "epoch": 2.14, + "learning_rate": 4.030124064360252e-07, + "loss": 0.3462, + "step": 83400 + }, + { + "epoch": 2.14, + "learning_rate": 4.029902080299874e-07, + "loss": 0.4663, + "step": 83401 + }, + { + "epoch": 2.14, + "learning_rate": 4.029680100810525e-07, + "loss": 0.4033, + "step": 83402 + }, + { + "epoch": 2.14, + "learning_rate": 4.02945812589238e-07, + "loss": 0.3517, + "step": 83403 + }, + { + "epoch": 2.14, + "learning_rate": 4.029236155545601e-07, + "loss": 0.4199, + "step": 83404 + }, + { + "epoch": 2.14, + "learning_rate": 4.02901418977036e-07, + "loss": 0.5518, + "step": 83405 + }, + { + "epoch": 2.14, + "learning_rate": 4.02879222856683e-07, + "loss": 0.3926, + "step": 83406 + }, + { + "epoch": 2.14, + "learning_rate": 4.0285702719351856e-07, + "loss": 0.3228, + "step": 83407 + }, + { + "epoch": 2.14, + "learning_rate": 4.028348319875583e-07, + "loss": 0.54, + "step": 83408 + }, + { + "epoch": 2.14, + "learning_rate": 4.0281263723881986e-07, + "loss": 0.3784, + "step": 83409 + }, + { + "epoch": 2.14, + "learning_rate": 4.0279044294732047e-07, + "loss": 0.4438, + "step": 83410 + }, + { + "epoch": 2.14, + "learning_rate": 4.0276824911307726e-07, + "loss": 0.4282, + "step": 83411 + }, + { + "epoch": 2.14, + "learning_rate": 4.0274605573610664e-07, + "loss": 0.3021, + "step": 83412 + }, + { + "epoch": 2.14, + "learning_rate": 4.027238628164259e-07, + "loss": 0.3901, + "step": 83413 + }, + { + "epoch": 2.14, + "learning_rate": 4.02701670354052e-07, + "loss": 0.4055, + "step": 83414 + }, + { + "epoch": 2.14, + "learning_rate": 4.026794783490023e-07, + "loss": 0.4561, + "step": 83415 + }, + { + "epoch": 2.14, + "learning_rate": 4.026572868012932e-07, + "loss": 0.4531, + "step": 83416 + }, + { + "epoch": 2.14, + "learning_rate": 4.0263509571094223e-07, + "loss": 0.5225, + "step": 83417 + }, + { + "epoch": 2.14, + "learning_rate": 4.0261290507796576e-07, + "loss": 0.5513, + "step": 83418 + }, + { + "epoch": 2.14, + "learning_rate": 4.0259071490238105e-07, + "loss": 0.2632, + "step": 83419 + }, + { + "epoch": 2.14, + "learning_rate": 4.025685251842056e-07, + "loss": 0.4678, + "step": 83420 + }, + { + "epoch": 2.14, + "learning_rate": 4.0254633592345555e-07, + "loss": 0.4189, + "step": 83421 + }, + { + "epoch": 2.14, + "learning_rate": 4.025241471201484e-07, + "loss": 0.5244, + "step": 83422 + }, + { + "epoch": 2.14, + "learning_rate": 4.0250195877430095e-07, + "loss": 0.4272, + "step": 83423 + }, + { + "epoch": 2.14, + "learning_rate": 4.0247977088593066e-07, + "loss": 0.4771, + "step": 83424 + }, + { + "epoch": 2.14, + "learning_rate": 4.0245758345505377e-07, + "loss": 0.3195, + "step": 83425 + }, + { + "epoch": 2.14, + "learning_rate": 4.0243539648168765e-07, + "loss": 0.3813, + "step": 83426 + }, + { + "epoch": 2.14, + "learning_rate": 4.024132099658496e-07, + "loss": 0.439, + "step": 83427 + }, + { + "epoch": 2.14, + "learning_rate": 4.023910239075563e-07, + "loss": 0.3892, + "step": 83428 + }, + { + "epoch": 2.14, + "learning_rate": 4.0236883830682433e-07, + "loss": 0.4111, + "step": 83429 + }, + { + "epoch": 2.14, + "learning_rate": 4.023466531636711e-07, + "loss": 0.4009, + "step": 83430 + }, + { + "epoch": 2.14, + "learning_rate": 4.0232446847811354e-07, + "loss": 0.4824, + "step": 83431 + }, + { + "epoch": 2.14, + "learning_rate": 4.02302284250169e-07, + "loss": 0.4299, + "step": 83432 + }, + { + "epoch": 2.14, + "learning_rate": 4.022801004798537e-07, + "loss": 0.4722, + "step": 83433 + }, + { + "epoch": 2.14, + "learning_rate": 4.0225791716718516e-07, + "loss": 0.4062, + "step": 83434 + }, + { + "epoch": 2.14, + "learning_rate": 4.0223573431218015e-07, + "loss": 0.3877, + "step": 83435 + }, + { + "epoch": 2.14, + "learning_rate": 4.0221355191485616e-07, + "loss": 0.3417, + "step": 83436 + }, + { + "epoch": 2.14, + "learning_rate": 4.021913699752297e-07, + "loss": 0.4607, + "step": 83437 + }, + { + "epoch": 2.14, + "learning_rate": 4.021691884933176e-07, + "loss": 0.4019, + "step": 83438 + }, + { + "epoch": 2.14, + "learning_rate": 4.02147007469137e-07, + "loss": 0.498, + "step": 83439 + }, + { + "epoch": 2.14, + "learning_rate": 4.0212482690270486e-07, + "loss": 0.3831, + "step": 83440 + }, + { + "epoch": 2.14, + "learning_rate": 4.021026467940387e-07, + "loss": 0.2504, + "step": 83441 + }, + { + "epoch": 2.14, + "learning_rate": 4.0208046714315467e-07, + "loss": 0.3143, + "step": 83442 + }, + { + "epoch": 2.14, + "learning_rate": 4.0205828795007013e-07, + "loss": 0.5215, + "step": 83443 + }, + { + "epoch": 2.14, + "learning_rate": 4.0203610921480246e-07, + "loss": 0.4473, + "step": 83444 + }, + { + "epoch": 2.14, + "learning_rate": 4.020139309373679e-07, + "loss": 0.384, + "step": 83445 + }, + { + "epoch": 2.14, + "learning_rate": 4.0199175311778366e-07, + "loss": 0.3191, + "step": 83446 + }, + { + "epoch": 2.14, + "learning_rate": 4.0196957575606726e-07, + "loss": 0.4009, + "step": 83447 + }, + { + "epoch": 2.14, + "learning_rate": 4.0194739885223495e-07, + "loss": 0.4102, + "step": 83448 + }, + { + "epoch": 2.14, + "learning_rate": 4.019252224063043e-07, + "loss": 0.3994, + "step": 83449 + }, + { + "epoch": 2.14, + "learning_rate": 4.0190304641829177e-07, + "loss": 0.3628, + "step": 83450 + }, + { + "epoch": 2.14, + "learning_rate": 4.0188087088821445e-07, + "loss": 0.4722, + "step": 83451 + }, + { + "epoch": 2.14, + "learning_rate": 4.0185869581608946e-07, + "loss": 0.3828, + "step": 83452 + }, + { + "epoch": 2.14, + "learning_rate": 4.018365212019341e-07, + "loss": 0.5024, + "step": 83453 + }, + { + "epoch": 2.14, + "learning_rate": 4.018143470457648e-07, + "loss": 0.4883, + "step": 83454 + }, + { + "epoch": 2.14, + "learning_rate": 4.0179217334759865e-07, + "loss": 0.4114, + "step": 83455 + }, + { + "epoch": 2.14, + "learning_rate": 4.0177000010745267e-07, + "loss": 0.3368, + "step": 83456 + }, + { + "epoch": 2.14, + "learning_rate": 4.017478273253443e-07, + "loss": 0.2852, + "step": 83457 + }, + { + "epoch": 2.14, + "learning_rate": 4.017256550012901e-07, + "loss": 0.4404, + "step": 83458 + }, + { + "epoch": 2.14, + "learning_rate": 4.017034831353068e-07, + "loss": 0.3838, + "step": 83459 + }, + { + "epoch": 2.14, + "learning_rate": 4.016813117274115e-07, + "loss": 0.3672, + "step": 83460 + }, + { + "epoch": 2.14, + "learning_rate": 4.0165914077762174e-07, + "loss": 0.2881, + "step": 83461 + }, + { + "epoch": 2.14, + "learning_rate": 4.0163697028595367e-07, + "loss": 0.4883, + "step": 83462 + }, + { + "epoch": 2.14, + "learning_rate": 4.0161480025242466e-07, + "loss": 0.3774, + "step": 83463 + }, + { + "epoch": 2.14, + "learning_rate": 4.0159263067705164e-07, + "loss": 0.4326, + "step": 83464 + }, + { + "epoch": 2.14, + "learning_rate": 4.015704615598521e-07, + "loss": 0.4253, + "step": 83465 + }, + { + "epoch": 2.14, + "learning_rate": 4.0154829290084214e-07, + "loss": 0.3566, + "step": 83466 + }, + { + "epoch": 2.14, + "learning_rate": 4.015261247000394e-07, + "loss": 0.3882, + "step": 83467 + }, + { + "epoch": 2.14, + "learning_rate": 4.015039569574603e-07, + "loss": 0.5488, + "step": 83468 + }, + { + "epoch": 2.14, + "learning_rate": 4.014817896731221e-07, + "loss": 0.3568, + "step": 83469 + }, + { + "epoch": 2.14, + "learning_rate": 4.0145962284704216e-07, + "loss": 0.3268, + "step": 83470 + }, + { + "epoch": 2.14, + "learning_rate": 4.0143745647923664e-07, + "loss": 0.4917, + "step": 83471 + }, + { + "epoch": 2.14, + "learning_rate": 4.01415290569723e-07, + "loss": 0.4717, + "step": 83472 + }, + { + "epoch": 2.14, + "learning_rate": 4.013931251185182e-07, + "loss": 0.4951, + "step": 83473 + }, + { + "epoch": 2.14, + "learning_rate": 4.0137096012563943e-07, + "loss": 0.3979, + "step": 83474 + }, + { + "epoch": 2.14, + "learning_rate": 4.01348795591103e-07, + "loss": 0.4146, + "step": 83475 + }, + { + "epoch": 2.14, + "learning_rate": 4.0132663151492627e-07, + "loss": 0.4961, + "step": 83476 + }, + { + "epoch": 2.14, + "learning_rate": 4.0130446789712667e-07, + "loss": 0.5059, + "step": 83477 + }, + { + "epoch": 2.14, + "learning_rate": 4.0128230473772064e-07, + "loss": 0.3936, + "step": 83478 + }, + { + "epoch": 2.14, + "learning_rate": 4.012601420367249e-07, + "loss": 0.3706, + "step": 83479 + }, + { + "epoch": 2.14, + "learning_rate": 4.0123797979415674e-07, + "loss": 0.4351, + "step": 83480 + }, + { + "epoch": 2.14, + "learning_rate": 4.01215818010033e-07, + "loss": 0.4888, + "step": 83481 + }, + { + "epoch": 2.14, + "learning_rate": 4.011936566843713e-07, + "loss": 0.1868, + "step": 83482 + }, + { + "epoch": 2.14, + "learning_rate": 4.011714958171877e-07, + "loss": 0.3472, + "step": 83483 + }, + { + "epoch": 2.14, + "learning_rate": 4.0114933540849946e-07, + "loss": 0.385, + "step": 83484 + }, + { + "epoch": 2.14, + "learning_rate": 4.0112717545832367e-07, + "loss": 0.4819, + "step": 83485 + }, + { + "epoch": 2.14, + "learning_rate": 4.0110501596667767e-07, + "loss": 0.4011, + "step": 83486 + }, + { + "epoch": 2.14, + "learning_rate": 4.0108285693357804e-07, + "loss": 0.2612, + "step": 83487 + }, + { + "epoch": 2.14, + "learning_rate": 4.0106069835904124e-07, + "loss": 0.2828, + "step": 83488 + }, + { + "epoch": 2.14, + "learning_rate": 4.010385402430848e-07, + "loss": 0.2788, + "step": 83489 + }, + { + "epoch": 2.14, + "learning_rate": 4.010163825857257e-07, + "loss": 0.4912, + "step": 83490 + }, + { + "epoch": 2.14, + "learning_rate": 4.00994225386981e-07, + "loss": 0.3597, + "step": 83491 + }, + { + "epoch": 2.14, + "learning_rate": 4.0097206864686726e-07, + "loss": 0.3494, + "step": 83492 + }, + { + "epoch": 2.14, + "learning_rate": 4.0094991236540154e-07, + "loss": 0.3535, + "step": 83493 + }, + { + "epoch": 2.14, + "learning_rate": 4.0092775654260104e-07, + "loss": 0.4146, + "step": 83494 + }, + { + "epoch": 2.14, + "learning_rate": 4.0090560117848296e-07, + "loss": 0.3125, + "step": 83495 + }, + { + "epoch": 2.14, + "learning_rate": 4.008834462730635e-07, + "loss": 0.3835, + "step": 83496 + }, + { + "epoch": 2.14, + "learning_rate": 4.008612918263604e-07, + "loss": 0.3828, + "step": 83497 + }, + { + "epoch": 2.14, + "learning_rate": 4.0083913783838996e-07, + "loss": 0.4194, + "step": 83498 + }, + { + "epoch": 2.14, + "learning_rate": 4.0081698430916976e-07, + "loss": 0.439, + "step": 83499 + }, + { + "epoch": 2.14, + "learning_rate": 4.0079483123871605e-07, + "loss": 0.5142, + "step": 83500 + }, + { + "epoch": 2.14, + "learning_rate": 4.0077267862704624e-07, + "loss": 0.4722, + "step": 83501 + }, + { + "epoch": 2.14, + "learning_rate": 4.007505264741772e-07, + "loss": 0.522, + "step": 83502 + }, + { + "epoch": 2.14, + "learning_rate": 4.0072837478012634e-07, + "loss": 0.3157, + "step": 83503 + }, + { + "epoch": 2.14, + "learning_rate": 4.007062235449098e-07, + "loss": 0.4583, + "step": 83504 + }, + { + "epoch": 2.14, + "learning_rate": 4.00684072768545e-07, + "loss": 0.3931, + "step": 83505 + }, + { + "epoch": 2.14, + "learning_rate": 4.006619224510488e-07, + "loss": 0.4526, + "step": 83506 + }, + { + "epoch": 2.14, + "learning_rate": 4.0063977259243855e-07, + "loss": 0.333, + "step": 83507 + }, + { + "epoch": 2.14, + "learning_rate": 4.0061762319273086e-07, + "loss": 0.4746, + "step": 83508 + }, + { + "epoch": 2.14, + "learning_rate": 4.005954742519424e-07, + "loss": 0.4639, + "step": 83509 + }, + { + "epoch": 2.14, + "learning_rate": 4.005733257700904e-07, + "loss": 0.4453, + "step": 83510 + }, + { + "epoch": 2.14, + "learning_rate": 4.005511777471918e-07, + "loss": 0.321, + "step": 83511 + }, + { + "epoch": 2.14, + "learning_rate": 4.00529030183264e-07, + "loss": 0.4663, + "step": 83512 + }, + { + "epoch": 2.14, + "learning_rate": 4.005068830783231e-07, + "loss": 0.4619, + "step": 83513 + }, + { + "epoch": 2.14, + "learning_rate": 4.004847364323867e-07, + "loss": 0.4565, + "step": 83514 + }, + { + "epoch": 2.14, + "learning_rate": 4.004625902454718e-07, + "loss": 0.5518, + "step": 83515 + }, + { + "epoch": 2.14, + "learning_rate": 4.0044044451759486e-07, + "loss": 0.4731, + "step": 83516 + }, + { + "epoch": 2.14, + "learning_rate": 4.0041829924877337e-07, + "loss": 0.3892, + "step": 83517 + }, + { + "epoch": 2.14, + "learning_rate": 4.003961544390237e-07, + "loss": 0.5098, + "step": 83518 + }, + { + "epoch": 2.14, + "learning_rate": 4.0037401008836313e-07, + "loss": 0.4814, + "step": 83519 + }, + { + "epoch": 2.14, + "learning_rate": 4.0035186619680895e-07, + "loss": 0.394, + "step": 83520 + }, + { + "epoch": 2.14, + "learning_rate": 4.003297227643775e-07, + "loss": 0.4731, + "step": 83521 + }, + { + "epoch": 2.14, + "learning_rate": 4.0030757979108586e-07, + "loss": 0.4976, + "step": 83522 + }, + { + "epoch": 2.14, + "learning_rate": 4.002854372769512e-07, + "loss": 0.4492, + "step": 83523 + }, + { + "epoch": 2.14, + "learning_rate": 4.0026329522199077e-07, + "loss": 0.2637, + "step": 83524 + }, + { + "epoch": 2.14, + "learning_rate": 4.002411536262208e-07, + "loss": 0.3438, + "step": 83525 + }, + { + "epoch": 2.14, + "learning_rate": 4.002190124896586e-07, + "loss": 0.4321, + "step": 83526 + }, + { + "epoch": 2.14, + "learning_rate": 4.001968718123215e-07, + "loss": 0.3823, + "step": 83527 + }, + { + "epoch": 2.14, + "learning_rate": 4.0017473159422567e-07, + "loss": 0.3208, + "step": 83528 + }, + { + "epoch": 2.14, + "learning_rate": 4.0015259183538886e-07, + "loss": 0.4309, + "step": 83529 + }, + { + "epoch": 2.14, + "learning_rate": 4.0013045253582724e-07, + "loss": 0.3113, + "step": 83530 + }, + { + "epoch": 2.14, + "learning_rate": 4.0010831369555817e-07, + "loss": 0.4702, + "step": 83531 + }, + { + "epoch": 2.14, + "learning_rate": 4.0008617531459897e-07, + "loss": 0.3762, + "step": 83532 + }, + { + "epoch": 2.14, + "learning_rate": 4.0006403739296577e-07, + "loss": 0.335, + "step": 83533 + }, + { + "epoch": 2.14, + "learning_rate": 4.0004189993067606e-07, + "loss": 0.4277, + "step": 83534 + }, + { + "epoch": 2.14, + "learning_rate": 4.0001976292774665e-07, + "loss": 0.4219, + "step": 83535 + }, + { + "epoch": 2.14, + "learning_rate": 3.9999762638419477e-07, + "loss": 0.3396, + "step": 83536 + }, + { + "epoch": 2.14, + "learning_rate": 3.999754903000372e-07, + "loss": 0.4341, + "step": 83537 + }, + { + "epoch": 2.14, + "learning_rate": 3.999533546752905e-07, + "loss": 0.4255, + "step": 83538 + }, + { + "epoch": 2.14, + "learning_rate": 3.999312195099718e-07, + "loss": 0.3752, + "step": 83539 + }, + { + "epoch": 2.14, + "learning_rate": 3.999090848040982e-07, + "loss": 0.4448, + "step": 83540 + }, + { + "epoch": 2.14, + "learning_rate": 3.9988695055768704e-07, + "loss": 0.4185, + "step": 83541 + }, + { + "epoch": 2.14, + "learning_rate": 3.9986481677075444e-07, + "loss": 0.5811, + "step": 83542 + }, + { + "epoch": 2.14, + "learning_rate": 3.9984268344331783e-07, + "loss": 0.4717, + "step": 83543 + }, + { + "epoch": 2.14, + "learning_rate": 3.99820550575394e-07, + "loss": 0.3445, + "step": 83544 + }, + { + "epoch": 2.14, + "learning_rate": 3.9979841816700043e-07, + "loss": 0.3735, + "step": 83545 + }, + { + "epoch": 2.14, + "learning_rate": 3.997762862181532e-07, + "loss": 0.395, + "step": 83546 + }, + { + "epoch": 2.14, + "learning_rate": 3.9975415472887e-07, + "loss": 0.437, + "step": 83547 + }, + { + "epoch": 2.14, + "learning_rate": 3.997320236991671e-07, + "loss": 0.5366, + "step": 83548 + }, + { + "epoch": 2.14, + "learning_rate": 3.997098931290621e-07, + "loss": 0.355, + "step": 83549 + }, + { + "epoch": 2.14, + "learning_rate": 3.9968776301857134e-07, + "loss": 0.4021, + "step": 83550 + }, + { + "epoch": 2.14, + "learning_rate": 3.996656333677121e-07, + "loss": 0.4336, + "step": 83551 + }, + { + "epoch": 2.14, + "learning_rate": 3.996435041765012e-07, + "loss": 0.2737, + "step": 83552 + }, + { + "epoch": 2.14, + "learning_rate": 3.99621375444956e-07, + "loss": 0.3611, + "step": 83553 + }, + { + "epoch": 2.14, + "learning_rate": 3.995992471730929e-07, + "loss": 0.2714, + "step": 83554 + }, + { + "epoch": 2.14, + "learning_rate": 3.9957711936092885e-07, + "loss": 0.5063, + "step": 83555 + }, + { + "epoch": 2.14, + "learning_rate": 3.995549920084811e-07, + "loss": 0.2288, + "step": 83556 + }, + { + "epoch": 2.14, + "learning_rate": 3.995328651157669e-07, + "loss": 0.3466, + "step": 83557 + }, + { + "epoch": 2.14, + "learning_rate": 3.995107386828026e-07, + "loss": 0.4375, + "step": 83558 + }, + { + "epoch": 2.14, + "learning_rate": 3.994886127096051e-07, + "loss": 0.3669, + "step": 83559 + }, + { + "epoch": 2.14, + "learning_rate": 3.994664871961916e-07, + "loss": 0.4907, + "step": 83560 + }, + { + "epoch": 2.14, + "learning_rate": 3.994443621425788e-07, + "loss": 0.3064, + "step": 83561 + }, + { + "epoch": 2.14, + "learning_rate": 3.9942223754878436e-07, + "loss": 0.4438, + "step": 83562 + }, + { + "epoch": 2.14, + "learning_rate": 3.9940011341482425e-07, + "loss": 0.3491, + "step": 83563 + }, + { + "epoch": 2.14, + "learning_rate": 3.993779897407159e-07, + "loss": 0.5103, + "step": 83564 + }, + { + "epoch": 2.14, + "learning_rate": 3.993558665264762e-07, + "loss": 0.3425, + "step": 83565 + }, + { + "epoch": 2.14, + "learning_rate": 3.9933374377212245e-07, + "loss": 0.4541, + "step": 83566 + }, + { + "epoch": 2.14, + "learning_rate": 3.9931162147767126e-07, + "loss": 0.3333, + "step": 83567 + }, + { + "epoch": 2.14, + "learning_rate": 3.992894996431392e-07, + "loss": 0.3062, + "step": 83568 + }, + { + "epoch": 2.14, + "learning_rate": 3.992673782685435e-07, + "loss": 0.2939, + "step": 83569 + }, + { + "epoch": 2.14, + "learning_rate": 3.9924525735390146e-07, + "loss": 0.3508, + "step": 83570 + }, + { + "epoch": 2.14, + "learning_rate": 3.992231368992295e-07, + "loss": 0.4771, + "step": 83571 + }, + { + "epoch": 2.14, + "learning_rate": 3.9920101690454464e-07, + "loss": 0.3489, + "step": 83572 + }, + { + "epoch": 2.14, + "learning_rate": 3.99178897369864e-07, + "loss": 0.4248, + "step": 83573 + }, + { + "epoch": 2.14, + "learning_rate": 3.991567782952047e-07, + "loss": 0.4561, + "step": 83574 + }, + { + "epoch": 2.14, + "learning_rate": 3.9913465968058315e-07, + "loss": 0.4487, + "step": 83575 + }, + { + "epoch": 2.14, + "learning_rate": 3.991125415260165e-07, + "loss": 0.4062, + "step": 83576 + }, + { + "epoch": 2.14, + "learning_rate": 3.9909042383152214e-07, + "loss": 0.4082, + "step": 83577 + }, + { + "epoch": 2.14, + "learning_rate": 3.9906830659711633e-07, + "loss": 0.501, + "step": 83578 + }, + { + "epoch": 2.14, + "learning_rate": 3.9904618982281655e-07, + "loss": 0.4061, + "step": 83579 + }, + { + "epoch": 2.14, + "learning_rate": 3.990240735086392e-07, + "loss": 0.5117, + "step": 83580 + }, + { + "epoch": 2.14, + "learning_rate": 3.990019576546014e-07, + "loss": 0.4258, + "step": 83581 + }, + { + "epoch": 2.14, + "learning_rate": 3.9897984226072013e-07, + "loss": 0.3556, + "step": 83582 + }, + { + "epoch": 2.14, + "learning_rate": 3.989577273270128e-07, + "loss": 0.4893, + "step": 83583 + }, + { + "epoch": 2.14, + "learning_rate": 3.989356128534955e-07, + "loss": 0.5054, + "step": 83584 + }, + { + "epoch": 2.14, + "learning_rate": 3.9891349884018564e-07, + "loss": 0.3708, + "step": 83585 + }, + { + "epoch": 2.14, + "learning_rate": 3.9889138528709995e-07, + "loss": 0.4668, + "step": 83586 + }, + { + "epoch": 2.14, + "learning_rate": 3.9886927219425634e-07, + "loss": 0.4849, + "step": 83587 + }, + { + "epoch": 2.14, + "learning_rate": 3.9884715956167016e-07, + "loss": 0.4858, + "step": 83588 + }, + { + "epoch": 2.14, + "learning_rate": 3.98825047389359e-07, + "loss": 0.5176, + "step": 83589 + }, + { + "epoch": 2.14, + "learning_rate": 3.988029356773398e-07, + "loss": 0.2875, + "step": 83590 + }, + { + "epoch": 2.14, + "learning_rate": 3.9878082442563e-07, + "loss": 0.3313, + "step": 83591 + }, + { + "epoch": 2.14, + "learning_rate": 3.987587136342457e-07, + "loss": 0.4521, + "step": 83592 + }, + { + "epoch": 2.14, + "learning_rate": 3.987366033032042e-07, + "loss": 0.3898, + "step": 83593 + }, + { + "epoch": 2.14, + "learning_rate": 3.987144934325225e-07, + "loss": 0.4771, + "step": 83594 + }, + { + "epoch": 2.14, + "learning_rate": 3.986923840222177e-07, + "loss": 0.438, + "step": 83595 + }, + { + "epoch": 2.14, + "learning_rate": 3.9867027507230623e-07, + "loss": 0.6152, + "step": 83596 + }, + { + "epoch": 2.14, + "learning_rate": 3.9864816658280563e-07, + "loss": 0.3892, + "step": 83597 + }, + { + "epoch": 2.14, + "learning_rate": 3.986260585537321e-07, + "loss": 0.2844, + "step": 83598 + }, + { + "epoch": 2.14, + "learning_rate": 3.9860395098510294e-07, + "loss": 0.4307, + "step": 83599 + }, + { + "epoch": 2.14, + "learning_rate": 3.985818438769354e-07, + "loss": 0.4678, + "step": 83600 + }, + { + "epoch": 2.14, + "learning_rate": 3.9855973722924575e-07, + "loss": 0.4287, + "step": 83601 + }, + { + "epoch": 2.14, + "learning_rate": 3.9853763104205127e-07, + "loss": 0.3955, + "step": 83602 + }, + { + "epoch": 2.14, + "learning_rate": 3.985155253153689e-07, + "loss": 0.2395, + "step": 83603 + }, + { + "epoch": 2.14, + "learning_rate": 3.9849342004921593e-07, + "loss": 0.3442, + "step": 83604 + }, + { + "epoch": 2.14, + "learning_rate": 3.984713152436084e-07, + "loss": 0.5049, + "step": 83605 + }, + { + "epoch": 2.14, + "learning_rate": 3.9844921089856386e-07, + "loss": 0.4971, + "step": 83606 + }, + { + "epoch": 2.14, + "learning_rate": 3.9842710701409933e-07, + "loss": 0.3708, + "step": 83607 + }, + { + "epoch": 2.14, + "learning_rate": 3.984050035902316e-07, + "loss": 0.4253, + "step": 83608 + }, + { + "epoch": 2.14, + "learning_rate": 3.983829006269771e-07, + "loss": 0.4707, + "step": 83609 + }, + { + "epoch": 2.14, + "learning_rate": 3.983607981243532e-07, + "loss": 0.3463, + "step": 83610 + }, + { + "epoch": 2.14, + "learning_rate": 3.983386960823767e-07, + "loss": 0.3098, + "step": 83611 + }, + { + "epoch": 2.14, + "learning_rate": 3.983165945010649e-07, + "loss": 0.4775, + "step": 83612 + }, + { + "epoch": 2.14, + "learning_rate": 3.982944933804342e-07, + "loss": 0.3489, + "step": 83613 + }, + { + "epoch": 2.14, + "learning_rate": 3.982723927205017e-07, + "loss": 0.3051, + "step": 83614 + }, + { + "epoch": 2.14, + "learning_rate": 3.9825029252128426e-07, + "loss": 0.436, + "step": 83615 + }, + { + "epoch": 2.14, + "learning_rate": 3.982281927827994e-07, + "loss": 0.3413, + "step": 83616 + }, + { + "epoch": 2.14, + "learning_rate": 3.982060935050635e-07, + "loss": 0.4771, + "step": 83617 + }, + { + "epoch": 2.14, + "learning_rate": 3.9818399468809316e-07, + "loss": 0.4292, + "step": 83618 + }, + { + "epoch": 2.14, + "learning_rate": 3.981618963319057e-07, + "loss": 0.2808, + "step": 83619 + }, + { + "epoch": 2.14, + "learning_rate": 3.981397984365179e-07, + "loss": 0.3892, + "step": 83620 + }, + { + "epoch": 2.14, + "learning_rate": 3.981177010019472e-07, + "loss": 0.4609, + "step": 83621 + }, + { + "epoch": 2.14, + "learning_rate": 3.9809560402820973e-07, + "loss": 0.4067, + "step": 83622 + }, + { + "epoch": 2.14, + "learning_rate": 3.9807350751532275e-07, + "loss": 0.3792, + "step": 83623 + }, + { + "epoch": 2.14, + "learning_rate": 3.9805141146330365e-07, + "loss": 0.3853, + "step": 83624 + }, + { + "epoch": 2.14, + "learning_rate": 3.9802931587216847e-07, + "loss": 0.4512, + "step": 83625 + }, + { + "epoch": 2.14, + "learning_rate": 3.980072207419346e-07, + "loss": 0.3281, + "step": 83626 + }, + { + "epoch": 2.14, + "learning_rate": 3.9798512607261924e-07, + "loss": 0.5308, + "step": 83627 + }, + { + "epoch": 2.14, + "learning_rate": 3.9796303186423876e-07, + "loss": 0.3643, + "step": 83628 + }, + { + "epoch": 2.14, + "learning_rate": 3.979409381168105e-07, + "loss": 0.542, + "step": 83629 + }, + { + "epoch": 2.14, + "learning_rate": 3.979188448303509e-07, + "loss": 0.3341, + "step": 83630 + }, + { + "epoch": 2.14, + "learning_rate": 3.9789675200487717e-07, + "loss": 0.501, + "step": 83631 + }, + { + "epoch": 2.14, + "learning_rate": 3.978746596404061e-07, + "loss": 0.384, + "step": 83632 + }, + { + "epoch": 2.14, + "learning_rate": 3.9785256773695517e-07, + "loss": 0.562, + "step": 83633 + }, + { + "epoch": 2.14, + "learning_rate": 3.978304762945406e-07, + "loss": 0.4404, + "step": 83634 + }, + { + "epoch": 2.14, + "learning_rate": 3.9780838531317937e-07, + "loss": 0.4053, + "step": 83635 + }, + { + "epoch": 2.14, + "learning_rate": 3.977862947928886e-07, + "loss": 0.4302, + "step": 83636 + }, + { + "epoch": 2.14, + "learning_rate": 3.977642047336855e-07, + "loss": 0.2266, + "step": 83637 + }, + { + "epoch": 2.14, + "learning_rate": 3.9774211513558674e-07, + "loss": 0.4238, + "step": 83638 + }, + { + "epoch": 2.14, + "learning_rate": 3.977200259986088e-07, + "loss": 0.424, + "step": 83639 + }, + { + "epoch": 2.14, + "learning_rate": 3.976979373227689e-07, + "loss": 0.4409, + "step": 83640 + }, + { + "epoch": 2.14, + "learning_rate": 3.976758491080844e-07, + "loss": 0.3806, + "step": 83641 + }, + { + "epoch": 2.14, + "learning_rate": 3.976537613545713e-07, + "loss": 0.4077, + "step": 83642 + }, + { + "epoch": 2.14, + "learning_rate": 3.9763167406224716e-07, + "loss": 0.4712, + "step": 83643 + }, + { + "epoch": 2.14, + "learning_rate": 3.9760958723112867e-07, + "loss": 0.3643, + "step": 83644 + }, + { + "epoch": 2.14, + "learning_rate": 3.975875008612333e-07, + "loss": 0.5508, + "step": 83645 + }, + { + "epoch": 2.14, + "learning_rate": 3.9756541495257735e-07, + "loss": 0.3643, + "step": 83646 + }, + { + "epoch": 2.14, + "learning_rate": 3.9754332950517755e-07, + "loss": 0.4478, + "step": 83647 + }, + { + "epoch": 2.14, + "learning_rate": 3.9752124451905114e-07, + "loss": 0.3287, + "step": 83648 + }, + { + "epoch": 2.14, + "learning_rate": 3.97499159994215e-07, + "loss": 0.4797, + "step": 83649 + }, + { + "epoch": 2.14, + "learning_rate": 3.9747707593068636e-07, + "loss": 0.5312, + "step": 83650 + }, + { + "epoch": 2.14, + "learning_rate": 3.9745499232848155e-07, + "loss": 0.5029, + "step": 83651 + }, + { + "epoch": 2.14, + "learning_rate": 3.9743290918761774e-07, + "loss": 0.3984, + "step": 83652 + }, + { + "epoch": 2.14, + "learning_rate": 3.9741082650811176e-07, + "loss": 0.272, + "step": 83653 + }, + { + "epoch": 2.14, + "learning_rate": 3.97388744289981e-07, + "loss": 0.5767, + "step": 83654 + }, + { + "epoch": 2.14, + "learning_rate": 3.973666625332416e-07, + "loss": 0.3306, + "step": 83655 + }, + { + "epoch": 2.14, + "learning_rate": 3.9734458123791126e-07, + "loss": 0.5435, + "step": 83656 + }, + { + "epoch": 2.14, + "learning_rate": 3.9732250040400605e-07, + "loss": 0.4766, + "step": 83657 + }, + { + "epoch": 2.14, + "learning_rate": 3.9730042003154364e-07, + "loss": 0.3237, + "step": 83658 + }, + { + "epoch": 2.14, + "learning_rate": 3.972783401205402e-07, + "loss": 0.4585, + "step": 83659 + }, + { + "epoch": 2.14, + "learning_rate": 3.9725626067101313e-07, + "loss": 0.5054, + "step": 83660 + }, + { + "epoch": 2.14, + "learning_rate": 3.9723418168297917e-07, + "loss": 0.3567, + "step": 83661 + }, + { + "epoch": 2.14, + "learning_rate": 3.972121031564556e-07, + "loss": 0.3018, + "step": 83662 + }, + { + "epoch": 2.14, + "learning_rate": 3.971900250914586e-07, + "loss": 0.3328, + "step": 83663 + }, + { + "epoch": 2.14, + "learning_rate": 3.9716794748800566e-07, + "loss": 0.4219, + "step": 83664 + }, + { + "epoch": 2.14, + "learning_rate": 3.9714587034611337e-07, + "loss": 0.3958, + "step": 83665 + }, + { + "epoch": 2.14, + "learning_rate": 3.971237936657992e-07, + "loss": 0.2384, + "step": 83666 + }, + { + "epoch": 2.14, + "learning_rate": 3.9710171744707956e-07, + "loss": 0.3124, + "step": 83667 + }, + { + "epoch": 2.14, + "learning_rate": 3.97079641689971e-07, + "loss": 0.4634, + "step": 83668 + }, + { + "epoch": 2.14, + "learning_rate": 3.970575663944909e-07, + "loss": 0.5449, + "step": 83669 + }, + { + "epoch": 2.14, + "learning_rate": 3.970354915606561e-07, + "loss": 0.3823, + "step": 83670 + }, + { + "epoch": 2.14, + "learning_rate": 3.9701341718848393e-07, + "loss": 0.3208, + "step": 83671 + }, + { + "epoch": 2.14, + "learning_rate": 3.9699134327799045e-07, + "loss": 0.4263, + "step": 83672 + }, + { + "epoch": 2.14, + "learning_rate": 3.969692698291929e-07, + "loss": 0.4355, + "step": 83673 + }, + { + "epoch": 2.14, + "learning_rate": 3.969471968421083e-07, + "loss": 0.342, + "step": 83674 + }, + { + "epoch": 2.14, + "learning_rate": 3.9692512431675384e-07, + "loss": 0.3845, + "step": 83675 + }, + { + "epoch": 2.14, + "learning_rate": 3.9690305225314614e-07, + "loss": 0.3276, + "step": 83676 + }, + { + "epoch": 2.14, + "learning_rate": 3.968809806513016e-07, + "loss": 0.353, + "step": 83677 + }, + { + "epoch": 2.14, + "learning_rate": 3.968589095112377e-07, + "loss": 0.3438, + "step": 83678 + }, + { + "epoch": 2.14, + "learning_rate": 3.9683683883297137e-07, + "loss": 0.5444, + "step": 83679 + }, + { + "epoch": 2.14, + "learning_rate": 3.968147686165191e-07, + "loss": 0.3008, + "step": 83680 + }, + { + "epoch": 2.14, + "learning_rate": 3.9679269886189805e-07, + "loss": 0.2686, + "step": 83681 + }, + { + "epoch": 2.14, + "learning_rate": 3.96770629569125e-07, + "loss": 0.3679, + "step": 83682 + }, + { + "epoch": 2.14, + "learning_rate": 3.967485607382174e-07, + "loss": 0.4551, + "step": 83683 + }, + { + "epoch": 2.14, + "learning_rate": 3.967264923691913e-07, + "loss": 0.3433, + "step": 83684 + }, + { + "epoch": 2.14, + "learning_rate": 3.96704424462064e-07, + "loss": 0.3589, + "step": 83685 + }, + { + "epoch": 2.14, + "learning_rate": 3.966823570168526e-07, + "loss": 0.4849, + "step": 83686 + }, + { + "epoch": 2.14, + "learning_rate": 3.966602900335736e-07, + "loss": 0.3306, + "step": 83687 + }, + { + "epoch": 2.14, + "learning_rate": 3.966382235122443e-07, + "loss": 0.3745, + "step": 83688 + }, + { + "epoch": 2.14, + "learning_rate": 3.9661615745288114e-07, + "loss": 0.4473, + "step": 83689 + }, + { + "epoch": 2.15, + "learning_rate": 3.965940918555012e-07, + "loss": 0.582, + "step": 83690 + }, + { + "epoch": 2.15, + "learning_rate": 3.9657202672012137e-07, + "loss": 0.3447, + "step": 83691 + }, + { + "epoch": 2.15, + "learning_rate": 3.9654996204675893e-07, + "loss": 0.4478, + "step": 83692 + }, + { + "epoch": 2.15, + "learning_rate": 3.9652789783543014e-07, + "loss": 0.5552, + "step": 83693 + }, + { + "epoch": 2.15, + "learning_rate": 3.965058340861521e-07, + "loss": 0.418, + "step": 83694 + }, + { + "epoch": 2.15, + "learning_rate": 3.9648377079894226e-07, + "loss": 0.4565, + "step": 83695 + }, + { + "epoch": 2.15, + "learning_rate": 3.9646170797381704e-07, + "loss": 0.5366, + "step": 83696 + }, + { + "epoch": 2.15, + "learning_rate": 3.964396456107929e-07, + "loss": 0.4302, + "step": 83697 + }, + { + "epoch": 2.15, + "learning_rate": 3.964175837098873e-07, + "loss": 0.4731, + "step": 83698 + }, + { + "epoch": 2.15, + "learning_rate": 3.963955222711168e-07, + "loss": 0.3505, + "step": 83699 + }, + { + "epoch": 2.15, + "learning_rate": 3.963734612944991e-07, + "loss": 0.2896, + "step": 83700 + }, + { + "epoch": 2.15, + "learning_rate": 3.963514007800499e-07, + "loss": 0.4893, + "step": 83701 + }, + { + "epoch": 2.15, + "learning_rate": 3.963293407277869e-07, + "loss": 0.5327, + "step": 83702 + }, + { + "epoch": 2.15, + "learning_rate": 3.963072811377266e-07, + "loss": 0.3616, + "step": 83703 + }, + { + "epoch": 2.15, + "learning_rate": 3.9628522200988645e-07, + "loss": 0.3638, + "step": 83704 + }, + { + "epoch": 2.15, + "learning_rate": 3.9626316334428254e-07, + "loss": 0.4229, + "step": 83705 + }, + { + "epoch": 2.15, + "learning_rate": 3.9624110514093267e-07, + "loss": 0.4438, + "step": 83706 + }, + { + "epoch": 2.15, + "learning_rate": 3.962190473998528e-07, + "loss": 0.438, + "step": 83707 + }, + { + "epoch": 2.15, + "learning_rate": 3.961969901210602e-07, + "loss": 0.3999, + "step": 83708 + }, + { + "epoch": 2.15, + "learning_rate": 3.9617493330457217e-07, + "loss": 0.3589, + "step": 83709 + }, + { + "epoch": 2.15, + "learning_rate": 3.961528769504049e-07, + "loss": 0.2773, + "step": 83710 + }, + { + "epoch": 2.15, + "learning_rate": 3.9613082105857556e-07, + "loss": 0.4302, + "step": 83711 + }, + { + "epoch": 2.15, + "learning_rate": 3.9610876562910147e-07, + "loss": 0.4307, + "step": 83712 + }, + { + "epoch": 2.15, + "learning_rate": 3.9608671066199873e-07, + "loss": 0.297, + "step": 83713 + }, + { + "epoch": 2.15, + "learning_rate": 3.9606465615728466e-07, + "loss": 0.5435, + "step": 83714 + }, + { + "epoch": 2.15, + "learning_rate": 3.960426021149762e-07, + "loss": 0.4824, + "step": 83715 + }, + { + "epoch": 2.15, + "learning_rate": 3.9602054853509035e-07, + "loss": 0.3425, + "step": 83716 + }, + { + "epoch": 2.15, + "learning_rate": 3.9599849541764383e-07, + "loss": 0.4624, + "step": 83717 + }, + { + "epoch": 2.15, + "learning_rate": 3.959764427626533e-07, + "loss": 0.4341, + "step": 83718 + }, + { + "epoch": 2.15, + "learning_rate": 3.959543905701357e-07, + "loss": 0.2916, + "step": 83719 + }, + { + "epoch": 2.15, + "learning_rate": 3.95932338840108e-07, + "loss": 0.2756, + "step": 83720 + }, + { + "epoch": 2.15, + "learning_rate": 3.959102875725876e-07, + "loss": 0.2732, + "step": 83721 + }, + { + "epoch": 2.15, + "learning_rate": 3.958882367675904e-07, + "loss": 0.5947, + "step": 83722 + }, + { + "epoch": 2.15, + "learning_rate": 3.9586618642513393e-07, + "loss": 0.4097, + "step": 83723 + }, + { + "epoch": 2.15, + "learning_rate": 3.9584413654523495e-07, + "loss": 0.354, + "step": 83724 + }, + { + "epoch": 2.15, + "learning_rate": 3.9582208712791066e-07, + "loss": 0.3955, + "step": 83725 + }, + { + "epoch": 2.15, + "learning_rate": 3.9580003817317765e-07, + "loss": 0.3005, + "step": 83726 + }, + { + "epoch": 2.15, + "learning_rate": 3.9577798968105237e-07, + "loss": 0.4001, + "step": 83727 + }, + { + "epoch": 2.15, + "learning_rate": 3.9575594165155213e-07, + "loss": 0.4673, + "step": 83728 + }, + { + "epoch": 2.15, + "learning_rate": 3.9573389408469403e-07, + "loss": 0.3354, + "step": 83729 + }, + { + "epoch": 2.15, + "learning_rate": 3.9571184698049444e-07, + "loss": 0.5034, + "step": 83730 + }, + { + "epoch": 2.15, + "learning_rate": 3.956898003389705e-07, + "loss": 0.3961, + "step": 83731 + }, + { + "epoch": 2.15, + "learning_rate": 3.956677541601391e-07, + "loss": 0.3647, + "step": 83732 + }, + { + "epoch": 2.15, + "learning_rate": 3.9564570844401744e-07, + "loss": 0.3574, + "step": 83733 + }, + { + "epoch": 2.15, + "learning_rate": 3.956236631906218e-07, + "loss": 0.4287, + "step": 83734 + }, + { + "epoch": 2.15, + "learning_rate": 3.956016183999692e-07, + "loss": 0.3948, + "step": 83735 + }, + { + "epoch": 2.15, + "learning_rate": 3.955795740720771e-07, + "loss": 0.5586, + "step": 83736 + }, + { + "epoch": 2.15, + "learning_rate": 3.955575302069616e-07, + "loss": 0.5054, + "step": 83737 + }, + { + "epoch": 2.15, + "learning_rate": 3.955354868046401e-07, + "loss": 0.4355, + "step": 83738 + }, + { + "epoch": 2.15, + "learning_rate": 3.955134438651291e-07, + "loss": 0.584, + "step": 83739 + }, + { + "epoch": 2.15, + "learning_rate": 3.954914013884456e-07, + "loss": 0.3718, + "step": 83740 + }, + { + "epoch": 2.15, + "learning_rate": 3.9546935937460645e-07, + "loss": 0.4746, + "step": 83741 + }, + { + "epoch": 2.15, + "learning_rate": 3.954473178236291e-07, + "loss": 0.522, + "step": 83742 + }, + { + "epoch": 2.15, + "learning_rate": 3.954252767355295e-07, + "loss": 0.3721, + "step": 83743 + }, + { + "epoch": 2.15, + "learning_rate": 3.95403236110325e-07, + "loss": 0.4893, + "step": 83744 + }, + { + "epoch": 2.15, + "learning_rate": 3.9538119594803245e-07, + "loss": 0.2104, + "step": 83745 + }, + { + "epoch": 2.15, + "learning_rate": 3.953591562486691e-07, + "loss": 0.2144, + "step": 83746 + }, + { + "epoch": 2.15, + "learning_rate": 3.9533711701225134e-07, + "loss": 0.4248, + "step": 83747 + }, + { + "epoch": 2.15, + "learning_rate": 3.9531507823879596e-07, + "loss": 0.3535, + "step": 83748 + }, + { + "epoch": 2.15, + "learning_rate": 3.9529303992831984e-07, + "loss": 0.4321, + "step": 83749 + }, + { + "epoch": 2.15, + "learning_rate": 3.952710020808405e-07, + "loss": 0.3394, + "step": 83750 + }, + { + "epoch": 2.15, + "learning_rate": 3.9524896469637405e-07, + "loss": 0.2925, + "step": 83751 + }, + { + "epoch": 2.15, + "learning_rate": 3.9522692777493747e-07, + "loss": 0.342, + "step": 83752 + }, + { + "epoch": 2.15, + "learning_rate": 3.95204891316548e-07, + "loss": 0.3311, + "step": 83753 + }, + { + "epoch": 2.15, + "learning_rate": 3.9518285532122253e-07, + "loss": 0.3721, + "step": 83754 + }, + { + "epoch": 2.15, + "learning_rate": 3.9516081978897753e-07, + "loss": 0.4229, + "step": 83755 + }, + { + "epoch": 2.15, + "learning_rate": 3.951387847198303e-07, + "loss": 0.3687, + "step": 83756 + }, + { + "epoch": 2.15, + "learning_rate": 3.951167501137973e-07, + "loss": 0.46, + "step": 83757 + }, + { + "epoch": 2.15, + "learning_rate": 3.950947159708955e-07, + "loss": 0.3511, + "step": 83758 + }, + { + "epoch": 2.15, + "learning_rate": 3.950726822911422e-07, + "loss": 0.5098, + "step": 83759 + }, + { + "epoch": 2.15, + "learning_rate": 3.9505064907455357e-07, + "loss": 0.4453, + "step": 83760 + }, + { + "epoch": 2.15, + "learning_rate": 3.950286163211468e-07, + "loss": 0.3264, + "step": 83761 + }, + { + "epoch": 2.15, + "learning_rate": 3.9500658403093887e-07, + "loss": 0.417, + "step": 83762 + }, + { + "epoch": 2.15, + "learning_rate": 3.94984552203947e-07, + "loss": 0.3921, + "step": 83763 + }, + { + "epoch": 2.15, + "learning_rate": 3.949625208401872e-07, + "loss": 0.4819, + "step": 83764 + }, + { + "epoch": 2.15, + "learning_rate": 3.949404899396768e-07, + "loss": 0.4614, + "step": 83765 + }, + { + "epoch": 2.15, + "learning_rate": 3.9491845950243296e-07, + "loss": 0.4004, + "step": 83766 + }, + { + "epoch": 2.15, + "learning_rate": 3.9489642952847236e-07, + "loss": 0.2859, + "step": 83767 + }, + { + "epoch": 2.15, + "learning_rate": 3.9487440001781126e-07, + "loss": 0.4087, + "step": 83768 + }, + { + "epoch": 2.15, + "learning_rate": 3.9485237097046697e-07, + "loss": 0.3672, + "step": 83769 + }, + { + "epoch": 2.15, + "learning_rate": 3.948303423864565e-07, + "loss": 0.46, + "step": 83770 + }, + { + "epoch": 2.15, + "learning_rate": 3.94808314265797e-07, + "loss": 0.4102, + "step": 83771 + }, + { + "epoch": 2.15, + "learning_rate": 3.947862866085044e-07, + "loss": 0.5527, + "step": 83772 + }, + { + "epoch": 2.15, + "learning_rate": 3.947642594145962e-07, + "loss": 0.4043, + "step": 83773 + }, + { + "epoch": 2.15, + "learning_rate": 3.947422326840894e-07, + "loss": 0.3432, + "step": 83774 + }, + { + "epoch": 2.15, + "learning_rate": 3.9472020641700066e-07, + "loss": 0.4551, + "step": 83775 + }, + { + "epoch": 2.15, + "learning_rate": 3.94698180613347e-07, + "loss": 0.3513, + "step": 83776 + }, + { + "epoch": 2.15, + "learning_rate": 3.946761552731448e-07, + "loss": 0.3279, + "step": 83777 + }, + { + "epoch": 2.15, + "learning_rate": 3.9465413039641116e-07, + "loss": 0.5303, + "step": 83778 + }, + { + "epoch": 2.15, + "learning_rate": 3.94632105983163e-07, + "loss": 0.478, + "step": 83779 + }, + { + "epoch": 2.15, + "learning_rate": 3.946100820334175e-07, + "loss": 0.394, + "step": 83780 + }, + { + "epoch": 2.15, + "learning_rate": 3.94588058547191e-07, + "loss": 0.3579, + "step": 83781 + }, + { + "epoch": 2.15, + "learning_rate": 3.945660355245005e-07, + "loss": 0.3547, + "step": 83782 + }, + { + "epoch": 2.15, + "learning_rate": 3.94544012965363e-07, + "loss": 0.397, + "step": 83783 + }, + { + "epoch": 2.15, + "learning_rate": 3.9452199086979567e-07, + "loss": 0.3828, + "step": 83784 + }, + { + "epoch": 2.15, + "learning_rate": 3.944999692378146e-07, + "loss": 0.4636, + "step": 83785 + }, + { + "epoch": 2.15, + "learning_rate": 3.944779480694375e-07, + "loss": 0.4927, + "step": 83786 + }, + { + "epoch": 2.15, + "learning_rate": 3.9445592736468034e-07, + "loss": 0.4438, + "step": 83787 + }, + { + "epoch": 2.15, + "learning_rate": 3.9443390712356083e-07, + "loss": 0.3662, + "step": 83788 + }, + { + "epoch": 2.15, + "learning_rate": 3.944118873460951e-07, + "loss": 0.522, + "step": 83789 + }, + { + "epoch": 2.15, + "learning_rate": 3.9438986803230035e-07, + "loss": 0.3921, + "step": 83790 + }, + { + "epoch": 2.15, + "learning_rate": 3.9436784918219333e-07, + "loss": 0.4653, + "step": 83791 + }, + { + "epoch": 2.15, + "learning_rate": 3.943458307957914e-07, + "loss": 0.4189, + "step": 83792 + }, + { + "epoch": 2.15, + "learning_rate": 3.9432381287311077e-07, + "loss": 0.3555, + "step": 83793 + }, + { + "epoch": 2.15, + "learning_rate": 3.9430179541416844e-07, + "loss": 0.3887, + "step": 83794 + }, + { + "epoch": 2.15, + "learning_rate": 3.942797784189814e-07, + "loss": 0.3787, + "step": 83795 + }, + { + "epoch": 2.15, + "learning_rate": 3.942577618875669e-07, + "loss": 0.3672, + "step": 83796 + }, + { + "epoch": 2.15, + "learning_rate": 3.942357458199412e-07, + "loss": 0.4458, + "step": 83797 + }, + { + "epoch": 2.15, + "learning_rate": 3.9421373021612116e-07, + "loss": 0.3945, + "step": 83798 + }, + { + "epoch": 2.15, + "learning_rate": 3.941917150761237e-07, + "loss": 0.425, + "step": 83799 + }, + { + "epoch": 2.15, + "learning_rate": 3.941697003999659e-07, + "loss": 0.3618, + "step": 83800 + }, + { + "epoch": 2.15, + "learning_rate": 3.941476861876648e-07, + "loss": 0.3433, + "step": 83801 + }, + { + "epoch": 2.15, + "learning_rate": 3.941256724392366e-07, + "loss": 0.4436, + "step": 83802 + }, + { + "epoch": 2.15, + "learning_rate": 3.9410365915469844e-07, + "loss": 0.416, + "step": 83803 + }, + { + "epoch": 2.15, + "learning_rate": 3.940816463340677e-07, + "loss": 0.4443, + "step": 83804 + }, + { + "epoch": 2.15, + "learning_rate": 3.940596339773604e-07, + "loss": 0.3076, + "step": 83805 + }, + { + "epoch": 2.15, + "learning_rate": 3.9403762208459424e-07, + "loss": 0.3711, + "step": 83806 + }, + { + "epoch": 2.15, + "learning_rate": 3.940156106557851e-07, + "loss": 0.4456, + "step": 83807 + }, + { + "epoch": 2.15, + "learning_rate": 3.9399359969095037e-07, + "loss": 0.4092, + "step": 83808 + }, + { + "epoch": 2.15, + "learning_rate": 3.939715891901073e-07, + "loss": 0.2858, + "step": 83809 + }, + { + "epoch": 2.15, + "learning_rate": 3.939495791532719e-07, + "loss": 0.3289, + "step": 83810 + }, + { + "epoch": 2.15, + "learning_rate": 3.9392756958046147e-07, + "loss": 0.5068, + "step": 83811 + }, + { + "epoch": 2.15, + "learning_rate": 3.9390556047169274e-07, + "loss": 0.3279, + "step": 83812 + }, + { + "epoch": 2.15, + "learning_rate": 3.938835518269832e-07, + "loss": 0.4531, + "step": 83813 + }, + { + "epoch": 2.15, + "learning_rate": 3.938615436463486e-07, + "loss": 0.3438, + "step": 83814 + }, + { + "epoch": 2.15, + "learning_rate": 3.9383953592980643e-07, + "loss": 0.4087, + "step": 83815 + }, + { + "epoch": 2.15, + "learning_rate": 3.9381752867737383e-07, + "loss": 0.2812, + "step": 83816 + }, + { + "epoch": 2.15, + "learning_rate": 3.9379552188906695e-07, + "loss": 0.314, + "step": 83817 + }, + { + "epoch": 2.15, + "learning_rate": 3.937735155649032e-07, + "loss": 0.3799, + "step": 83818 + }, + { + "epoch": 2.15, + "learning_rate": 3.9375150970489903e-07, + "loss": 0.2712, + "step": 83819 + }, + { + "epoch": 2.15, + "learning_rate": 3.937295043090713e-07, + "loss": 0.3096, + "step": 83820 + }, + { + "epoch": 2.15, + "learning_rate": 3.9370749937743743e-07, + "loss": 0.4404, + "step": 83821 + }, + { + "epoch": 2.15, + "learning_rate": 3.936854949100135e-07, + "loss": 0.3998, + "step": 83822 + }, + { + "epoch": 2.15, + "learning_rate": 3.936634909068166e-07, + "loss": 0.4355, + "step": 83823 + }, + { + "epoch": 2.15, + "learning_rate": 3.936414873678637e-07, + "loss": 0.4128, + "step": 83824 + }, + { + "epoch": 2.15, + "learning_rate": 3.9361948429317217e-07, + "loss": 0.3735, + "step": 83825 + }, + { + "epoch": 2.15, + "learning_rate": 3.935974816827582e-07, + "loss": 0.5117, + "step": 83826 + }, + { + "epoch": 2.15, + "learning_rate": 3.935754795366384e-07, + "loss": 0.4165, + "step": 83827 + }, + { + "epoch": 2.15, + "learning_rate": 3.935534778548299e-07, + "loss": 0.5024, + "step": 83828 + }, + { + "epoch": 2.15, + "learning_rate": 3.9353147663734974e-07, + "loss": 0.5259, + "step": 83829 + }, + { + "epoch": 2.15, + "learning_rate": 3.935094758842149e-07, + "loss": 0.2935, + "step": 83830 + }, + { + "epoch": 2.15, + "learning_rate": 3.934874755954417e-07, + "loss": 0.4688, + "step": 83831 + }, + { + "epoch": 2.15, + "learning_rate": 3.9346547577104714e-07, + "loss": 0.3982, + "step": 83832 + }, + { + "epoch": 2.15, + "learning_rate": 3.9344347641104827e-07, + "loss": 0.4219, + "step": 83833 + }, + { + "epoch": 2.15, + "learning_rate": 3.9342147751546216e-07, + "loss": 0.5024, + "step": 83834 + }, + { + "epoch": 2.15, + "learning_rate": 3.9339947908430506e-07, + "loss": 0.3916, + "step": 83835 + }, + { + "epoch": 2.15, + "learning_rate": 3.933774811175943e-07, + "loss": 0.4199, + "step": 83836 + }, + { + "epoch": 2.15, + "learning_rate": 3.933554836153462e-07, + "loss": 0.4512, + "step": 83837 + }, + { + "epoch": 2.15, + "learning_rate": 3.9333348657757825e-07, + "loss": 0.3325, + "step": 83838 + }, + { + "epoch": 2.15, + "learning_rate": 3.9331149000430676e-07, + "loss": 0.3337, + "step": 83839 + }, + { + "epoch": 2.15, + "learning_rate": 3.9328949389554857e-07, + "loss": 0.4585, + "step": 83840 + }, + { + "epoch": 2.15, + "learning_rate": 3.9326749825132077e-07, + "loss": 0.3546, + "step": 83841 + }, + { + "epoch": 2.15, + "learning_rate": 3.932455030716405e-07, + "loss": 0.3877, + "step": 83842 + }, + { + "epoch": 2.15, + "learning_rate": 3.9322350835652394e-07, + "loss": 0.3477, + "step": 83843 + }, + { + "epoch": 2.15, + "learning_rate": 3.932015141059882e-07, + "loss": 0.4121, + "step": 83844 + }, + { + "epoch": 2.15, + "learning_rate": 3.931795203200502e-07, + "loss": 0.4458, + "step": 83845 + }, + { + "epoch": 2.15, + "learning_rate": 3.9315752699872705e-07, + "loss": 0.3945, + "step": 83846 + }, + { + "epoch": 2.15, + "learning_rate": 3.931355341420354e-07, + "loss": 0.3135, + "step": 83847 + }, + { + "epoch": 2.15, + "learning_rate": 3.9311354174999144e-07, + "loss": 0.3926, + "step": 83848 + }, + { + "epoch": 2.15, + "learning_rate": 3.930915498226126e-07, + "loss": 0.3252, + "step": 83849 + }, + { + "epoch": 2.15, + "learning_rate": 3.9306955835991573e-07, + "loss": 0.4233, + "step": 83850 + }, + { + "epoch": 2.15, + "learning_rate": 3.930475673619178e-07, + "loss": 0.3442, + "step": 83851 + }, + { + "epoch": 2.15, + "learning_rate": 3.9302557682863524e-07, + "loss": 0.4109, + "step": 83852 + }, + { + "epoch": 2.15, + "learning_rate": 3.9300358676008493e-07, + "loss": 0.4971, + "step": 83853 + }, + { + "epoch": 2.15, + "learning_rate": 3.9298159715628397e-07, + "loss": 0.3725, + "step": 83854 + }, + { + "epoch": 2.15, + "learning_rate": 3.9295960801724935e-07, + "loss": 0.4492, + "step": 83855 + }, + { + "epoch": 2.15, + "learning_rate": 3.9293761934299775e-07, + "loss": 0.4517, + "step": 83856 + }, + { + "epoch": 2.15, + "learning_rate": 3.929156311335455e-07, + "loss": 0.3391, + "step": 83857 + }, + { + "epoch": 2.15, + "learning_rate": 3.9289364338890983e-07, + "loss": 0.4775, + "step": 83858 + }, + { + "epoch": 2.15, + "learning_rate": 3.92871656109108e-07, + "loss": 0.3984, + "step": 83859 + }, + { + "epoch": 2.15, + "learning_rate": 3.9284966929415606e-07, + "loss": 0.244, + "step": 83860 + }, + { + "epoch": 2.15, + "learning_rate": 3.9282768294407107e-07, + "loss": 0.4197, + "step": 83861 + }, + { + "epoch": 2.15, + "learning_rate": 3.928056970588702e-07, + "loss": 0.4146, + "step": 83862 + }, + { + "epoch": 2.15, + "learning_rate": 3.9278371163857037e-07, + "loss": 0.3281, + "step": 83863 + }, + { + "epoch": 2.15, + "learning_rate": 3.9276172668318776e-07, + "loss": 0.4175, + "step": 83864 + }, + { + "epoch": 2.15, + "learning_rate": 3.927397421927395e-07, + "loss": 0.3757, + "step": 83865 + }, + { + "epoch": 2.15, + "learning_rate": 3.9271775816724296e-07, + "loss": 0.3594, + "step": 83866 + }, + { + "epoch": 2.15, + "learning_rate": 3.926957746067141e-07, + "loss": 0.4746, + "step": 83867 + }, + { + "epoch": 2.15, + "learning_rate": 3.9267379151117054e-07, + "loss": 0.3667, + "step": 83868 + }, + { + "epoch": 2.15, + "learning_rate": 3.9265180888062845e-07, + "loss": 0.3892, + "step": 83869 + }, + { + "epoch": 2.15, + "learning_rate": 3.926298267151048e-07, + "loss": 0.4203, + "step": 83870 + }, + { + "epoch": 2.15, + "learning_rate": 3.9260784501461665e-07, + "loss": 0.4785, + "step": 83871 + }, + { + "epoch": 2.15, + "learning_rate": 3.9258586377918103e-07, + "loss": 0.396, + "step": 83872 + }, + { + "epoch": 2.15, + "learning_rate": 3.9256388300881414e-07, + "loss": 0.4263, + "step": 83873 + }, + { + "epoch": 2.15, + "learning_rate": 3.9254190270353324e-07, + "loss": 0.3364, + "step": 83874 + }, + { + "epoch": 2.15, + "learning_rate": 3.9251992286335544e-07, + "loss": 0.3142, + "step": 83875 + }, + { + "epoch": 2.15, + "learning_rate": 3.9249794348829713e-07, + "loss": 0.4487, + "step": 83876 + }, + { + "epoch": 2.15, + "learning_rate": 3.9247596457837485e-07, + "loss": 0.3912, + "step": 83877 + }, + { + "epoch": 2.15, + "learning_rate": 3.924539861336058e-07, + "loss": 0.4912, + "step": 83878 + }, + { + "epoch": 2.15, + "learning_rate": 3.924320081540068e-07, + "loss": 0.5146, + "step": 83879 + }, + { + "epoch": 2.15, + "learning_rate": 3.92410030639595e-07, + "loss": 0.5073, + "step": 83880 + }, + { + "epoch": 2.15, + "learning_rate": 3.9238805359038664e-07, + "loss": 0.3354, + "step": 83881 + }, + { + "epoch": 2.15, + "learning_rate": 3.9236607700639867e-07, + "loss": 0.3691, + "step": 83882 + }, + { + "epoch": 2.15, + "learning_rate": 3.9234410088764826e-07, + "loss": 0.3936, + "step": 83883 + }, + { + "epoch": 2.15, + "learning_rate": 3.923221252341522e-07, + "loss": 0.4111, + "step": 83884 + }, + { + "epoch": 2.15, + "learning_rate": 3.9230015004592687e-07, + "loss": 0.2786, + "step": 83885 + }, + { + "epoch": 2.15, + "learning_rate": 3.9227817532298966e-07, + "loss": 0.3496, + "step": 83886 + }, + { + "epoch": 2.15, + "learning_rate": 3.9225620106535683e-07, + "loss": 0.4771, + "step": 83887 + }, + { + "epoch": 2.15, + "learning_rate": 3.9223422727304546e-07, + "loss": 0.3921, + "step": 83888 + }, + { + "epoch": 2.15, + "learning_rate": 3.922122539460727e-07, + "loss": 0.4746, + "step": 83889 + }, + { + "epoch": 2.15, + "learning_rate": 3.9219028108445483e-07, + "loss": 0.3735, + "step": 83890 + }, + { + "epoch": 2.15, + "learning_rate": 3.921683086882088e-07, + "loss": 0.3959, + "step": 83891 + }, + { + "epoch": 2.15, + "learning_rate": 3.92146336757352e-07, + "loss": 0.4417, + "step": 83892 + }, + { + "epoch": 2.15, + "learning_rate": 3.921243652919004e-07, + "loss": 0.4277, + "step": 83893 + }, + { + "epoch": 2.15, + "learning_rate": 3.921023942918712e-07, + "loss": 0.4297, + "step": 83894 + }, + { + "epoch": 2.15, + "learning_rate": 3.9208042375728123e-07, + "loss": 0.2795, + "step": 83895 + }, + { + "epoch": 2.15, + "learning_rate": 3.920584536881477e-07, + "loss": 0.2692, + "step": 83896 + }, + { + "epoch": 2.15, + "learning_rate": 3.920364840844871e-07, + "loss": 0.4551, + "step": 83897 + }, + { + "epoch": 2.15, + "learning_rate": 3.920145149463158e-07, + "loss": 0.4697, + "step": 83898 + }, + { + "epoch": 2.15, + "learning_rate": 3.9199254627365107e-07, + "loss": 0.2656, + "step": 83899 + }, + { + "epoch": 2.15, + "learning_rate": 3.919705780665097e-07, + "loss": 0.4385, + "step": 83900 + }, + { + "epoch": 2.15, + "learning_rate": 3.9194861032490876e-07, + "loss": 0.3801, + "step": 83901 + }, + { + "epoch": 2.15, + "learning_rate": 3.919266430488646e-07, + "loss": 0.3735, + "step": 83902 + }, + { + "epoch": 2.15, + "learning_rate": 3.9190467623839417e-07, + "loss": 0.4556, + "step": 83903 + }, + { + "epoch": 2.15, + "learning_rate": 3.918827098935144e-07, + "loss": 0.3208, + "step": 83904 + }, + { + "epoch": 2.15, + "learning_rate": 3.918607440142423e-07, + "loss": 0.4163, + "step": 83905 + }, + { + "epoch": 2.15, + "learning_rate": 3.9183877860059465e-07, + "loss": 0.4382, + "step": 83906 + }, + { + "epoch": 2.15, + "learning_rate": 3.9181681365258754e-07, + "loss": 0.2817, + "step": 83907 + }, + { + "epoch": 2.15, + "learning_rate": 3.9179484917023854e-07, + "loss": 0.3208, + "step": 83908 + }, + { + "epoch": 2.15, + "learning_rate": 3.917728851535641e-07, + "loss": 0.3503, + "step": 83909 + }, + { + "epoch": 2.15, + "learning_rate": 3.917509216025816e-07, + "loss": 0.4316, + "step": 83910 + }, + { + "epoch": 2.15, + "learning_rate": 3.917289585173071e-07, + "loss": 0.4312, + "step": 83911 + }, + { + "epoch": 2.15, + "learning_rate": 3.917069958977578e-07, + "loss": 0.3469, + "step": 83912 + }, + { + "epoch": 2.15, + "learning_rate": 3.916850337439508e-07, + "loss": 0.3906, + "step": 83913 + }, + { + "epoch": 2.15, + "learning_rate": 3.916630720559023e-07, + "loss": 0.3577, + "step": 83914 + }, + { + "epoch": 2.15, + "learning_rate": 3.916411108336294e-07, + "loss": 0.4312, + "step": 83915 + }, + { + "epoch": 2.15, + "learning_rate": 3.916191500771492e-07, + "loss": 0.5381, + "step": 83916 + }, + { + "epoch": 2.15, + "learning_rate": 3.9159718978647793e-07, + "loss": 0.3645, + "step": 83917 + }, + { + "epoch": 2.15, + "learning_rate": 3.9157522996163303e-07, + "loss": 0.4424, + "step": 83918 + }, + { + "epoch": 2.15, + "learning_rate": 3.915532706026308e-07, + "loss": 0.4324, + "step": 83919 + }, + { + "epoch": 2.15, + "learning_rate": 3.9153131170948804e-07, + "loss": 0.5146, + "step": 83920 + }, + { + "epoch": 2.15, + "learning_rate": 3.915093532822219e-07, + "loss": 0.2793, + "step": 83921 + }, + { + "epoch": 2.15, + "learning_rate": 3.914873953208494e-07, + "loss": 0.4614, + "step": 83922 + }, + { + "epoch": 2.15, + "learning_rate": 3.9146543782538677e-07, + "loss": 0.4907, + "step": 83923 + }, + { + "epoch": 2.15, + "learning_rate": 3.9144348079585086e-07, + "loss": 0.3901, + "step": 83924 + }, + { + "epoch": 2.15, + "learning_rate": 3.9142152423225894e-07, + "loss": 0.5046, + "step": 83925 + }, + { + "epoch": 2.15, + "learning_rate": 3.913995681346277e-07, + "loss": 0.3724, + "step": 83926 + }, + { + "epoch": 2.15, + "learning_rate": 3.9137761250297396e-07, + "loss": 0.437, + "step": 83927 + }, + { + "epoch": 2.15, + "learning_rate": 3.9135565733731404e-07, + "loss": 0.5156, + "step": 83928 + }, + { + "epoch": 2.15, + "learning_rate": 3.9133370263766507e-07, + "loss": 0.4131, + "step": 83929 + }, + { + "epoch": 2.15, + "learning_rate": 3.9131174840404426e-07, + "loss": 0.4277, + "step": 83930 + }, + { + "epoch": 2.15, + "learning_rate": 3.912897946364677e-07, + "loss": 0.4917, + "step": 83931 + }, + { + "epoch": 2.15, + "learning_rate": 3.912678413349526e-07, + "loss": 0.3677, + "step": 83932 + }, + { + "epoch": 2.15, + "learning_rate": 3.912458884995157e-07, + "loss": 0.373, + "step": 83933 + }, + { + "epoch": 2.15, + "learning_rate": 3.912239361301741e-07, + "loss": 0.4355, + "step": 83934 + }, + { + "epoch": 2.15, + "learning_rate": 3.912019842269444e-07, + "loss": 0.3523, + "step": 83935 + }, + { + "epoch": 2.15, + "learning_rate": 3.91180032789843e-07, + "loss": 0.4012, + "step": 83936 + }, + { + "epoch": 2.15, + "learning_rate": 3.911580818188871e-07, + "loss": 0.377, + "step": 83937 + }, + { + "epoch": 2.15, + "learning_rate": 3.911361313140934e-07, + "loss": 0.5093, + "step": 83938 + }, + { + "epoch": 2.15, + "learning_rate": 3.9111418127547913e-07, + "loss": 0.2825, + "step": 83939 + }, + { + "epoch": 2.15, + "learning_rate": 3.9109223170306036e-07, + "loss": 0.3287, + "step": 83940 + }, + { + "epoch": 2.15, + "learning_rate": 3.910702825968543e-07, + "loss": 0.3926, + "step": 83941 + }, + { + "epoch": 2.15, + "learning_rate": 3.9104833395687775e-07, + "loss": 0.4082, + "step": 83942 + }, + { + "epoch": 2.15, + "learning_rate": 3.9102638578314786e-07, + "loss": 0.3625, + "step": 83943 + }, + { + "epoch": 2.15, + "learning_rate": 3.9100443807568065e-07, + "loss": 0.3101, + "step": 83944 + }, + { + "epoch": 2.15, + "learning_rate": 3.9098249083449363e-07, + "loss": 0.325, + "step": 83945 + }, + { + "epoch": 2.15, + "learning_rate": 3.909605440596031e-07, + "loss": 0.4031, + "step": 83946 + }, + { + "epoch": 2.15, + "learning_rate": 3.9093859775102634e-07, + "loss": 0.356, + "step": 83947 + }, + { + "epoch": 2.15, + "learning_rate": 3.909166519087795e-07, + "loss": 0.3555, + "step": 83948 + }, + { + "epoch": 2.15, + "learning_rate": 3.908947065328799e-07, + "loss": 0.3073, + "step": 83949 + }, + { + "epoch": 2.15, + "learning_rate": 3.9087276162334416e-07, + "loss": 0.3292, + "step": 83950 + }, + { + "epoch": 2.15, + "learning_rate": 3.908508171801895e-07, + "loss": 0.3663, + "step": 83951 + }, + { + "epoch": 2.15, + "learning_rate": 3.9082887320343206e-07, + "loss": 0.4053, + "step": 83952 + }, + { + "epoch": 2.15, + "learning_rate": 3.908069296930888e-07, + "loss": 0.2779, + "step": 83953 + }, + { + "epoch": 2.15, + "learning_rate": 3.907849866491768e-07, + "loss": 0.4048, + "step": 83954 + }, + { + "epoch": 2.15, + "learning_rate": 3.90763044071713e-07, + "loss": 0.5762, + "step": 83955 + }, + { + "epoch": 2.15, + "learning_rate": 3.9074110196071397e-07, + "loss": 0.395, + "step": 83956 + }, + { + "epoch": 2.15, + "learning_rate": 3.90719160316196e-07, + "loss": 0.4688, + "step": 83957 + }, + { + "epoch": 2.15, + "learning_rate": 3.9069721913817643e-07, + "loss": 0.2743, + "step": 83958 + }, + { + "epoch": 2.15, + "learning_rate": 3.90675278426672e-07, + "loss": 0.363, + "step": 83959 + }, + { + "epoch": 2.15, + "learning_rate": 3.906533381816999e-07, + "loss": 0.3369, + "step": 83960 + }, + { + "epoch": 2.15, + "learning_rate": 3.906313984032761e-07, + "loss": 0.3452, + "step": 83961 + }, + { + "epoch": 2.15, + "learning_rate": 3.9060945909141775e-07, + "loss": 0.4438, + "step": 83962 + }, + { + "epoch": 2.15, + "learning_rate": 3.9058752024614185e-07, + "loss": 0.2382, + "step": 83963 + }, + { + "epoch": 2.15, + "learning_rate": 3.9056558186746533e-07, + "loss": 0.3105, + "step": 83964 + }, + { + "epoch": 2.15, + "learning_rate": 3.9054364395540476e-07, + "loss": 0.356, + "step": 83965 + }, + { + "epoch": 2.15, + "learning_rate": 3.905217065099765e-07, + "loss": 0.4624, + "step": 83966 + }, + { + "epoch": 2.15, + "learning_rate": 3.904997695311978e-07, + "loss": 0.5181, + "step": 83967 + }, + { + "epoch": 2.15, + "learning_rate": 3.904778330190857e-07, + "loss": 0.3618, + "step": 83968 + }, + { + "epoch": 2.15, + "learning_rate": 3.9045589697365633e-07, + "loss": 0.4385, + "step": 83969 + }, + { + "epoch": 2.15, + "learning_rate": 3.904339613949269e-07, + "loss": 0.2594, + "step": 83970 + }, + { + "epoch": 2.15, + "learning_rate": 3.9041202628291414e-07, + "loss": 0.437, + "step": 83971 + }, + { + "epoch": 2.15, + "learning_rate": 3.9039009163763524e-07, + "loss": 0.4873, + "step": 83972 + }, + { + "epoch": 2.15, + "learning_rate": 3.903681574591062e-07, + "loss": 0.3872, + "step": 83973 + }, + { + "epoch": 2.15, + "learning_rate": 3.903462237473444e-07, + "loss": 0.4746, + "step": 83974 + }, + { + "epoch": 2.15, + "learning_rate": 3.903242905023666e-07, + "loss": 0.3799, + "step": 83975 + }, + { + "epoch": 2.15, + "learning_rate": 3.903023577241893e-07, + "loss": 0.4897, + "step": 83976 + }, + { + "epoch": 2.15, + "learning_rate": 3.902804254128297e-07, + "loss": 0.3011, + "step": 83977 + }, + { + "epoch": 2.15, + "learning_rate": 3.90258493568304e-07, + "loss": 0.4438, + "step": 83978 + }, + { + "epoch": 2.15, + "learning_rate": 3.9023656219062927e-07, + "loss": 0.4829, + "step": 83979 + }, + { + "epoch": 2.15, + "learning_rate": 3.902146312798225e-07, + "loss": 0.5605, + "step": 83980 + }, + { + "epoch": 2.15, + "learning_rate": 3.901927008359005e-07, + "loss": 0.4561, + "step": 83981 + }, + { + "epoch": 2.15, + "learning_rate": 3.901707708588797e-07, + "loss": 0.3809, + "step": 83982 + }, + { + "epoch": 2.15, + "learning_rate": 3.901488413487771e-07, + "loss": 0.4092, + "step": 83983 + }, + { + "epoch": 2.15, + "learning_rate": 3.901269123056098e-07, + "loss": 0.4297, + "step": 83984 + }, + { + "epoch": 2.15, + "learning_rate": 3.9010498372939437e-07, + "loss": 0.3945, + "step": 83985 + }, + { + "epoch": 2.15, + "learning_rate": 3.900830556201471e-07, + "loss": 0.4429, + "step": 83986 + }, + { + "epoch": 2.15, + "learning_rate": 3.9006112797788514e-07, + "loss": 0.4121, + "step": 83987 + }, + { + "epoch": 2.15, + "learning_rate": 3.900392008026254e-07, + "loss": 0.5039, + "step": 83988 + }, + { + "epoch": 2.15, + "learning_rate": 3.900172740943849e-07, + "loss": 0.4673, + "step": 83989 + }, + { + "epoch": 2.15, + "learning_rate": 3.899953478531798e-07, + "loss": 0.3221, + "step": 83990 + }, + { + "epoch": 2.15, + "learning_rate": 3.899734220790272e-07, + "loss": 0.3726, + "step": 83991 + }, + { + "epoch": 2.15, + "learning_rate": 3.8995149677194395e-07, + "loss": 0.459, + "step": 83992 + }, + { + "epoch": 2.15, + "learning_rate": 3.899295719319471e-07, + "loss": 0.4585, + "step": 83993 + }, + { + "epoch": 2.15, + "learning_rate": 3.899076475590527e-07, + "loss": 0.4526, + "step": 83994 + }, + { + "epoch": 2.15, + "learning_rate": 3.8988572365327845e-07, + "loss": 0.4351, + "step": 83995 + }, + { + "epoch": 2.15, + "learning_rate": 3.8986380021464015e-07, + "loss": 0.3823, + "step": 83996 + }, + { + "epoch": 2.15, + "learning_rate": 3.898418772431552e-07, + "loss": 0.3931, + "step": 83997 + }, + { + "epoch": 2.15, + "learning_rate": 3.8981995473884055e-07, + "loss": 0.4546, + "step": 83998 + }, + { + "epoch": 2.15, + "learning_rate": 3.897980327017124e-07, + "loss": 0.4695, + "step": 83999 + }, + { + "epoch": 2.15, + "learning_rate": 3.8977611113178786e-07, + "loss": 0.3994, + "step": 84000 + }, + { + "epoch": 2.15, + "learning_rate": 3.8975419002908395e-07, + "loss": 0.4224, + "step": 84001 + }, + { + "epoch": 2.15, + "learning_rate": 3.897322693936169e-07, + "loss": 0.4482, + "step": 84002 + }, + { + "epoch": 2.15, + "learning_rate": 3.897103492254038e-07, + "loss": 0.4507, + "step": 84003 + }, + { + "epoch": 2.15, + "learning_rate": 3.896884295244615e-07, + "loss": 0.4141, + "step": 84004 + }, + { + "epoch": 2.15, + "learning_rate": 3.8966651029080686e-07, + "loss": 0.3857, + "step": 84005 + }, + { + "epoch": 2.15, + "learning_rate": 3.896445915244567e-07, + "loss": 0.4248, + "step": 84006 + }, + { + "epoch": 2.15, + "learning_rate": 3.896226732254272e-07, + "loss": 0.5239, + "step": 84007 + }, + { + "epoch": 2.15, + "learning_rate": 3.896007553937355e-07, + "loss": 0.5049, + "step": 84008 + }, + { + "epoch": 2.15, + "learning_rate": 3.895788380293985e-07, + "loss": 0.436, + "step": 84009 + }, + { + "epoch": 2.15, + "learning_rate": 3.8955692113243323e-07, + "loss": 0.4658, + "step": 84010 + }, + { + "epoch": 2.15, + "learning_rate": 3.8953500470285583e-07, + "loss": 0.3501, + "step": 84011 + }, + { + "epoch": 2.15, + "learning_rate": 3.8951308874068333e-07, + "loss": 0.4116, + "step": 84012 + }, + { + "epoch": 2.15, + "learning_rate": 3.8949117324593273e-07, + "loss": 0.2777, + "step": 84013 + }, + { + "epoch": 2.15, + "learning_rate": 3.8946925821862086e-07, + "loss": 0.4331, + "step": 84014 + }, + { + "epoch": 2.15, + "learning_rate": 3.894473436587644e-07, + "loss": 0.4092, + "step": 84015 + }, + { + "epoch": 2.15, + "learning_rate": 3.894254295663797e-07, + "loss": 0.5278, + "step": 84016 + }, + { + "epoch": 2.15, + "learning_rate": 3.894035159414839e-07, + "loss": 0.4663, + "step": 84017 + }, + { + "epoch": 2.15, + "learning_rate": 3.8938160278409406e-07, + "loss": 0.4478, + "step": 84018 + }, + { + "epoch": 2.15, + "learning_rate": 3.893596900942262e-07, + "loss": 0.4509, + "step": 84019 + }, + { + "epoch": 2.15, + "learning_rate": 3.893377778718977e-07, + "loss": 0.3828, + "step": 84020 + }, + { + "epoch": 2.15, + "learning_rate": 3.893158661171251e-07, + "loss": 0.4185, + "step": 84021 + }, + { + "epoch": 2.15, + "learning_rate": 3.8929395482992554e-07, + "loss": 0.313, + "step": 84022 + }, + { + "epoch": 2.15, + "learning_rate": 3.892720440103153e-07, + "loss": 0.364, + "step": 84023 + }, + { + "epoch": 2.15, + "learning_rate": 3.892501336583114e-07, + "loss": 0.479, + "step": 84024 + }, + { + "epoch": 2.15, + "learning_rate": 3.8922822377393084e-07, + "loss": 0.3535, + "step": 84025 + }, + { + "epoch": 2.15, + "learning_rate": 3.8920631435718977e-07, + "loss": 0.3579, + "step": 84026 + }, + { + "epoch": 2.15, + "learning_rate": 3.891844054081057e-07, + "loss": 0.4819, + "step": 84027 + }, + { + "epoch": 2.15, + "learning_rate": 3.891624969266948e-07, + "loss": 0.3838, + "step": 84028 + }, + { + "epoch": 2.15, + "learning_rate": 3.8914058891297406e-07, + "loss": 0.3799, + "step": 84029 + }, + { + "epoch": 2.15, + "learning_rate": 3.8911868136696026e-07, + "loss": 0.4702, + "step": 84030 + }, + { + "epoch": 2.15, + "learning_rate": 3.890967742886705e-07, + "loss": 0.3787, + "step": 84031 + }, + { + "epoch": 2.15, + "learning_rate": 3.890748676781209e-07, + "loss": 0.282, + "step": 84032 + }, + { + "epoch": 2.15, + "learning_rate": 3.8905296153532863e-07, + "loss": 0.4263, + "step": 84033 + }, + { + "epoch": 2.15, + "learning_rate": 3.890310558603104e-07, + "loss": 0.2653, + "step": 84034 + }, + { + "epoch": 2.15, + "learning_rate": 3.890091506530837e-07, + "loss": 0.418, + "step": 84035 + }, + { + "epoch": 2.15, + "learning_rate": 3.8898724591366395e-07, + "loss": 0.4053, + "step": 84036 + }, + { + "epoch": 2.15, + "learning_rate": 3.889653416420685e-07, + "loss": 0.4141, + "step": 84037 + }, + { + "epoch": 2.15, + "learning_rate": 3.889434378383142e-07, + "loss": 0.4106, + "step": 84038 + }, + { + "epoch": 2.15, + "learning_rate": 3.8892153450241815e-07, + "loss": 0.4482, + "step": 84039 + }, + { + "epoch": 2.15, + "learning_rate": 3.8889963163439653e-07, + "loss": 0.4482, + "step": 84040 + }, + { + "epoch": 2.15, + "learning_rate": 3.8887772923426633e-07, + "loss": 0.4082, + "step": 84041 + }, + { + "epoch": 2.15, + "learning_rate": 3.888558273020442e-07, + "loss": 0.458, + "step": 84042 + }, + { + "epoch": 2.15, + "learning_rate": 3.888339258377475e-07, + "loss": 0.4585, + "step": 84043 + }, + { + "epoch": 2.15, + "learning_rate": 3.888120248413923e-07, + "loss": 0.4922, + "step": 84044 + }, + { + "epoch": 2.15, + "learning_rate": 3.8879012431299593e-07, + "loss": 0.4902, + "step": 84045 + }, + { + "epoch": 2.15, + "learning_rate": 3.887682242525745e-07, + "loss": 0.3845, + "step": 84046 + }, + { + "epoch": 2.15, + "learning_rate": 3.887463246601451e-07, + "loss": 0.4404, + "step": 84047 + }, + { + "epoch": 2.15, + "learning_rate": 3.8872442553572495e-07, + "loss": 0.2937, + "step": 84048 + }, + { + "epoch": 2.15, + "learning_rate": 3.8870252687933003e-07, + "loss": 0.3457, + "step": 84049 + }, + { + "epoch": 2.15, + "learning_rate": 3.886806286909774e-07, + "loss": 0.3435, + "step": 84050 + }, + { + "epoch": 2.15, + "learning_rate": 3.88658730970684e-07, + "loss": 0.4287, + "step": 84051 + }, + { + "epoch": 2.15, + "learning_rate": 3.8863683371846676e-07, + "loss": 0.4429, + "step": 84052 + }, + { + "epoch": 2.15, + "learning_rate": 3.8861493693434187e-07, + "loss": 0.394, + "step": 84053 + }, + { + "epoch": 2.15, + "learning_rate": 3.8859304061832656e-07, + "loss": 0.4851, + "step": 84054 + }, + { + "epoch": 2.15, + "learning_rate": 3.885711447704376e-07, + "loss": 0.4966, + "step": 84055 + }, + { + "epoch": 2.15, + "learning_rate": 3.8854924939069167e-07, + "loss": 0.4915, + "step": 84056 + }, + { + "epoch": 2.15, + "learning_rate": 3.885273544791051e-07, + "loss": 0.4561, + "step": 84057 + }, + { + "epoch": 2.15, + "learning_rate": 3.8850546003569505e-07, + "loss": 0.4229, + "step": 84058 + }, + { + "epoch": 2.15, + "learning_rate": 3.8848356606047817e-07, + "loss": 0.4829, + "step": 84059 + }, + { + "epoch": 2.15, + "learning_rate": 3.884616725534717e-07, + "loss": 0.4736, + "step": 84060 + }, + { + "epoch": 2.15, + "learning_rate": 3.8843977951469173e-07, + "loss": 0.394, + "step": 84061 + }, + { + "epoch": 2.15, + "learning_rate": 3.884178869441552e-07, + "loss": 0.4839, + "step": 84062 + }, + { + "epoch": 2.15, + "learning_rate": 3.88395994841879e-07, + "loss": 0.4941, + "step": 84063 + }, + { + "epoch": 2.15, + "learning_rate": 3.8837410320788035e-07, + "loss": 0.3828, + "step": 84064 + }, + { + "epoch": 2.15, + "learning_rate": 3.883522120421754e-07, + "loss": 0.4448, + "step": 84065 + }, + { + "epoch": 2.15, + "learning_rate": 3.883303213447806e-07, + "loss": 0.4038, + "step": 84066 + }, + { + "epoch": 2.15, + "learning_rate": 3.883084311157133e-07, + "loss": 0.4429, + "step": 84067 + }, + { + "epoch": 2.15, + "learning_rate": 3.8828654135499007e-07, + "loss": 0.415, + "step": 84068 + }, + { + "epoch": 2.15, + "learning_rate": 3.88264652062628e-07, + "loss": 0.3235, + "step": 84069 + }, + { + "epoch": 2.15, + "learning_rate": 3.882427632386432e-07, + "loss": 0.4468, + "step": 84070 + }, + { + "epoch": 2.15, + "learning_rate": 3.882208748830529e-07, + "loss": 0.3787, + "step": 84071 + }, + { + "epoch": 2.15, + "learning_rate": 3.881989869958736e-07, + "loss": 0.457, + "step": 84072 + }, + { + "epoch": 2.15, + "learning_rate": 3.8817709957712265e-07, + "loss": 0.3518, + "step": 84073 + }, + { + "epoch": 2.15, + "learning_rate": 3.881552126268161e-07, + "loss": 0.3569, + "step": 84074 + }, + { + "epoch": 2.15, + "learning_rate": 3.881333261449712e-07, + "loss": 0.3582, + "step": 84075 + }, + { + "epoch": 2.15, + "learning_rate": 3.881114401316041e-07, + "loss": 0.2848, + "step": 84076 + }, + { + "epoch": 2.15, + "learning_rate": 3.880895545867323e-07, + "loss": 0.4912, + "step": 84077 + }, + { + "epoch": 2.15, + "learning_rate": 3.8806766951037184e-07, + "loss": 0.3691, + "step": 84078 + }, + { + "epoch": 2.15, + "learning_rate": 3.880457849025399e-07, + "loss": 0.3809, + "step": 84079 + }, + { + "epoch": 2.16, + "learning_rate": 3.880239007632531e-07, + "loss": 0.416, + "step": 84080 + }, + { + "epoch": 2.16, + "learning_rate": 3.8800201709252865e-07, + "loss": 0.3635, + "step": 84081 + }, + { + "epoch": 2.16, + "learning_rate": 3.879801338903825e-07, + "loss": 0.2853, + "step": 84082 + }, + { + "epoch": 2.16, + "learning_rate": 3.879582511568319e-07, + "loss": 0.3396, + "step": 84083 + }, + { + "epoch": 2.16, + "learning_rate": 3.8793636889189353e-07, + "loss": 0.3779, + "step": 84084 + }, + { + "epoch": 2.16, + "learning_rate": 3.879144870955844e-07, + "loss": 0.5312, + "step": 84085 + }, + { + "epoch": 2.16, + "learning_rate": 3.8789260576792106e-07, + "loss": 0.3428, + "step": 84086 + }, + { + "epoch": 2.16, + "learning_rate": 3.878707249089198e-07, + "loss": 0.3549, + "step": 84087 + }, + { + "epoch": 2.16, + "learning_rate": 3.878488445185979e-07, + "loss": 0.4238, + "step": 84088 + }, + { + "epoch": 2.16, + "learning_rate": 3.8782696459697193e-07, + "loss": 0.4053, + "step": 84089 + }, + { + "epoch": 2.16, + "learning_rate": 3.8780508514405896e-07, + "loss": 0.311, + "step": 84090 + }, + { + "epoch": 2.16, + "learning_rate": 3.877832061598753e-07, + "loss": 0.3167, + "step": 84091 + }, + { + "epoch": 2.16, + "learning_rate": 3.8776132764443783e-07, + "loss": 0.5474, + "step": 84092 + }, + { + "epoch": 2.16, + "learning_rate": 3.877394495977636e-07, + "loss": 0.5249, + "step": 84093 + }, + { + "epoch": 2.16, + "learning_rate": 3.8771757201986887e-07, + "loss": 0.4272, + "step": 84094 + }, + { + "epoch": 2.16, + "learning_rate": 3.87695694910771e-07, + "loss": 0.4629, + "step": 84095 + }, + { + "epoch": 2.16, + "learning_rate": 3.8767381827048606e-07, + "loss": 0.3474, + "step": 84096 + }, + { + "epoch": 2.16, + "learning_rate": 3.876519420990311e-07, + "loss": 0.392, + "step": 84097 + }, + { + "epoch": 2.16, + "learning_rate": 3.8763006639642313e-07, + "loss": 0.3286, + "step": 84098 + }, + { + "epoch": 2.16, + "learning_rate": 3.876081911626784e-07, + "loss": 0.3979, + "step": 84099 + }, + { + "epoch": 2.16, + "learning_rate": 3.875863163978139e-07, + "loss": 0.3367, + "step": 84100 + }, + { + "epoch": 2.16, + "learning_rate": 3.875644421018465e-07, + "loss": 0.519, + "step": 84101 + }, + { + "epoch": 2.16, + "learning_rate": 3.8754256827479304e-07, + "loss": 0.4224, + "step": 84102 + }, + { + "epoch": 2.16, + "learning_rate": 3.8752069491666985e-07, + "loss": 0.4829, + "step": 84103 + }, + { + "epoch": 2.16, + "learning_rate": 3.8749882202749385e-07, + "loss": 0.436, + "step": 84104 + }, + { + "epoch": 2.16, + "learning_rate": 3.8747694960728215e-07, + "loss": 0.5405, + "step": 84105 + }, + { + "epoch": 2.16, + "learning_rate": 3.874550776560509e-07, + "loss": 0.3066, + "step": 84106 + }, + { + "epoch": 2.16, + "learning_rate": 3.8743320617381747e-07, + "loss": 0.4155, + "step": 84107 + }, + { + "epoch": 2.16, + "learning_rate": 3.874113351605979e-07, + "loss": 0.4868, + "step": 84108 + }, + { + "epoch": 2.16, + "learning_rate": 3.873894646164093e-07, + "loss": 0.3877, + "step": 84109 + }, + { + "epoch": 2.16, + "learning_rate": 3.873675945412688e-07, + "loss": 0.4849, + "step": 84110 + }, + { + "epoch": 2.16, + "learning_rate": 3.8734572493519233e-07, + "loss": 0.5166, + "step": 84111 + }, + { + "epoch": 2.16, + "learning_rate": 3.8732385579819717e-07, + "loss": 0.377, + "step": 84112 + }, + { + "epoch": 2.16, + "learning_rate": 3.873019871302998e-07, + "loss": 0.3536, + "step": 84113 + }, + { + "epoch": 2.16, + "learning_rate": 3.8728011893151767e-07, + "loss": 0.2193, + "step": 84114 + }, + { + "epoch": 2.16, + "learning_rate": 3.8725825120186695e-07, + "loss": 0.4253, + "step": 84115 + }, + { + "epoch": 2.16, + "learning_rate": 3.872363839413639e-07, + "loss": 0.4199, + "step": 84116 + }, + { + "epoch": 2.16, + "learning_rate": 3.8721451715002596e-07, + "loss": 0.437, + "step": 84117 + }, + { + "epoch": 2.16, + "learning_rate": 3.8719265082786956e-07, + "loss": 0.5093, + "step": 84118 + }, + { + "epoch": 2.16, + "learning_rate": 3.871707849749121e-07, + "loss": 0.478, + "step": 84119 + }, + { + "epoch": 2.16, + "learning_rate": 3.8714891959116925e-07, + "loss": 0.4072, + "step": 84120 + }, + { + "epoch": 2.16, + "learning_rate": 3.871270546766583e-07, + "loss": 0.312, + "step": 84121 + }, + { + "epoch": 2.16, + "learning_rate": 3.871051902313961e-07, + "loss": 0.4512, + "step": 84122 + }, + { + "epoch": 2.16, + "learning_rate": 3.8708332625539954e-07, + "loss": 0.4111, + "step": 84123 + }, + { + "epoch": 2.16, + "learning_rate": 3.870614627486848e-07, + "loss": 0.4702, + "step": 84124 + }, + { + "epoch": 2.16, + "learning_rate": 3.870395997112692e-07, + "loss": 0.3296, + "step": 84125 + }, + { + "epoch": 2.16, + "learning_rate": 3.870177371431689e-07, + "loss": 0.3599, + "step": 84126 + }, + { + "epoch": 2.16, + "learning_rate": 3.8699587504440123e-07, + "loss": 0.3357, + "step": 84127 + }, + { + "epoch": 2.16, + "learning_rate": 3.869740134149824e-07, + "loss": 0.3319, + "step": 84128 + }, + { + "epoch": 2.16, + "learning_rate": 3.8695215225492926e-07, + "loss": 0.3258, + "step": 84129 + }, + { + "epoch": 2.16, + "learning_rate": 3.869302915642587e-07, + "loss": 0.3745, + "step": 84130 + }, + { + "epoch": 2.16, + "learning_rate": 3.8690843134298777e-07, + "loss": 0.4321, + "step": 84131 + }, + { + "epoch": 2.16, + "learning_rate": 3.868865715911325e-07, + "loss": 0.4521, + "step": 84132 + }, + { + "epoch": 2.16, + "learning_rate": 3.8686471230871e-07, + "loss": 0.3521, + "step": 84133 + }, + { + "epoch": 2.16, + "learning_rate": 3.868428534957371e-07, + "loss": 0.2231, + "step": 84134 + }, + { + "epoch": 2.16, + "learning_rate": 3.8682099515223064e-07, + "loss": 0.3696, + "step": 84135 + }, + { + "epoch": 2.16, + "learning_rate": 3.867991372782072e-07, + "loss": 0.4092, + "step": 84136 + }, + { + "epoch": 2.16, + "learning_rate": 3.8677727987368315e-07, + "loss": 0.4321, + "step": 84137 + }, + { + "epoch": 2.16, + "learning_rate": 3.8675542293867547e-07, + "loss": 0.322, + "step": 84138 + }, + { + "epoch": 2.16, + "learning_rate": 3.86733566473201e-07, + "loss": 0.3213, + "step": 84139 + }, + { + "epoch": 2.16, + "learning_rate": 3.867117104772768e-07, + "loss": 0.4453, + "step": 84140 + }, + { + "epoch": 2.16, + "learning_rate": 3.8668985495091887e-07, + "loss": 0.3911, + "step": 84141 + }, + { + "epoch": 2.16, + "learning_rate": 3.8666799989414434e-07, + "loss": 0.2468, + "step": 84142 + }, + { + "epoch": 2.16, + "learning_rate": 3.866461453069699e-07, + "loss": 0.4648, + "step": 84143 + }, + { + "epoch": 2.16, + "learning_rate": 3.8662429118941267e-07, + "loss": 0.4775, + "step": 84144 + }, + { + "epoch": 2.16, + "learning_rate": 3.8660243754148903e-07, + "loss": 0.3755, + "step": 84145 + }, + { + "epoch": 2.16, + "learning_rate": 3.8658058436321526e-07, + "loss": 0.3895, + "step": 84146 + }, + { + "epoch": 2.16, + "learning_rate": 3.865587316546086e-07, + "loss": 0.4087, + "step": 84147 + }, + { + "epoch": 2.16, + "learning_rate": 3.8653687941568616e-07, + "loss": 0.4097, + "step": 84148 + }, + { + "epoch": 2.16, + "learning_rate": 3.865150276464637e-07, + "loss": 0.3828, + "step": 84149 + }, + { + "epoch": 2.16, + "learning_rate": 3.8649317634695856e-07, + "loss": 0.4023, + "step": 84150 + }, + { + "epoch": 2.16, + "learning_rate": 3.864713255171874e-07, + "loss": 0.4072, + "step": 84151 + }, + { + "epoch": 2.16, + "learning_rate": 3.864494751571673e-07, + "loss": 0.3999, + "step": 84152 + }, + { + "epoch": 2.16, + "learning_rate": 3.864276252669142e-07, + "loss": 0.2937, + "step": 84153 + }, + { + "epoch": 2.16, + "learning_rate": 3.8640577584644527e-07, + "loss": 0.2554, + "step": 84154 + }, + { + "epoch": 2.16, + "learning_rate": 3.8638392689577757e-07, + "loss": 0.3821, + "step": 84155 + }, + { + "epoch": 2.16, + "learning_rate": 3.863620784149272e-07, + "loss": 0.3945, + "step": 84156 + }, + { + "epoch": 2.16, + "learning_rate": 3.863402304039115e-07, + "loss": 0.356, + "step": 84157 + }, + { + "epoch": 2.16, + "learning_rate": 3.8631838286274656e-07, + "loss": 0.2657, + "step": 84158 + }, + { + "epoch": 2.16, + "learning_rate": 3.8629653579144926e-07, + "loss": 0.3125, + "step": 84159 + }, + { + "epoch": 2.16, + "learning_rate": 3.862746891900366e-07, + "loss": 0.4238, + "step": 84160 + }, + { + "epoch": 2.16, + "learning_rate": 3.862528430585256e-07, + "loss": 0.3542, + "step": 84161 + }, + { + "epoch": 2.16, + "learning_rate": 3.862309973969321e-07, + "loss": 0.4688, + "step": 84162 + }, + { + "epoch": 2.16, + "learning_rate": 3.862091522052734e-07, + "loss": 0.4048, + "step": 84163 + }, + { + "epoch": 2.16, + "learning_rate": 3.861873074835664e-07, + "loss": 0.3904, + "step": 84164 + }, + { + "epoch": 2.16, + "learning_rate": 3.8616546323182755e-07, + "loss": 0.2668, + "step": 84165 + }, + { + "epoch": 2.16, + "learning_rate": 3.861436194500732e-07, + "loss": 0.3872, + "step": 84166 + }, + { + "epoch": 2.16, + "learning_rate": 3.8612177613832064e-07, + "loss": 0.4146, + "step": 84167 + }, + { + "epoch": 2.16, + "learning_rate": 3.8609993329658617e-07, + "loss": 0.3656, + "step": 84168 + }, + { + "epoch": 2.16, + "learning_rate": 3.860780909248873e-07, + "loss": 0.1659, + "step": 84169 + }, + { + "epoch": 2.16, + "learning_rate": 3.8605624902323973e-07, + "loss": 0.4902, + "step": 84170 + }, + { + "epoch": 2.16, + "learning_rate": 3.8603440759166074e-07, + "loss": 0.3481, + "step": 84171 + }, + { + "epoch": 2.16, + "learning_rate": 3.860125666301669e-07, + "loss": 0.4047, + "step": 84172 + }, + { + "epoch": 2.16, + "learning_rate": 3.8599072613877546e-07, + "loss": 0.3826, + "step": 84173 + }, + { + "epoch": 2.16, + "learning_rate": 3.859688861175022e-07, + "loss": 0.4326, + "step": 84174 + }, + { + "epoch": 2.16, + "learning_rate": 3.859470465663648e-07, + "loss": 0.2064, + "step": 84175 + }, + { + "epoch": 2.16, + "learning_rate": 3.8592520748537915e-07, + "loss": 0.3818, + "step": 84176 + }, + { + "epoch": 2.16, + "learning_rate": 3.8590336887456233e-07, + "loss": 0.3674, + "step": 84177 + }, + { + "epoch": 2.16, + "learning_rate": 3.858815307339314e-07, + "loss": 0.4756, + "step": 84178 + }, + { + "epoch": 2.16, + "learning_rate": 3.858596930635023e-07, + "loss": 0.3796, + "step": 84179 + }, + { + "epoch": 2.16, + "learning_rate": 3.858378558632923e-07, + "loss": 0.3787, + "step": 84180 + }, + { + "epoch": 2.16, + "learning_rate": 3.858160191333183e-07, + "loss": 0.2665, + "step": 84181 + }, + { + "epoch": 2.16, + "learning_rate": 3.857941828735964e-07, + "loss": 0.4634, + "step": 84182 + }, + { + "epoch": 2.16, + "learning_rate": 3.8577234708414376e-07, + "loss": 0.4521, + "step": 84183 + }, + { + "epoch": 2.16, + "learning_rate": 3.8575051176497687e-07, + "loss": 0.3511, + "step": 84184 + }, + { + "epoch": 2.16, + "learning_rate": 3.85728676916113e-07, + "loss": 0.3774, + "step": 84185 + }, + { + "epoch": 2.16, + "learning_rate": 3.8570684253756836e-07, + "loss": 0.4287, + "step": 84186 + }, + { + "epoch": 2.16, + "learning_rate": 3.8568500862935935e-07, + "loss": 0.4263, + "step": 84187 + }, + { + "epoch": 2.16, + "learning_rate": 3.8566317519150314e-07, + "loss": 0.3887, + "step": 84188 + }, + { + "epoch": 2.16, + "learning_rate": 3.8564134222401645e-07, + "loss": 0.4502, + "step": 84189 + }, + { + "epoch": 2.16, + "learning_rate": 3.8561950972691626e-07, + "loss": 0.276, + "step": 84190 + }, + { + "epoch": 2.16, + "learning_rate": 3.855976777002186e-07, + "loss": 0.4351, + "step": 84191 + }, + { + "epoch": 2.16, + "learning_rate": 3.8557584614394055e-07, + "loss": 0.3682, + "step": 84192 + }, + { + "epoch": 2.16, + "learning_rate": 3.855540150580988e-07, + "loss": 0.3306, + "step": 84193 + }, + { + "epoch": 2.16, + "learning_rate": 3.855321844427104e-07, + "loss": 0.2659, + "step": 84194 + }, + { + "epoch": 2.16, + "learning_rate": 3.855103542977919e-07, + "loss": 0.3265, + "step": 84195 + }, + { + "epoch": 2.16, + "learning_rate": 3.854885246233593e-07, + "loss": 0.4409, + "step": 84196 + }, + { + "epoch": 2.16, + "learning_rate": 3.8546669541943e-07, + "loss": 0.3264, + "step": 84197 + }, + { + "epoch": 2.16, + "learning_rate": 3.8544486668602094e-07, + "loss": 0.3774, + "step": 84198 + }, + { + "epoch": 2.16, + "learning_rate": 3.8542303842314815e-07, + "loss": 0.4482, + "step": 84199 + }, + { + "epoch": 2.16, + "learning_rate": 3.8540121063082873e-07, + "loss": 0.4492, + "step": 84200 + }, + { + "epoch": 2.16, + "learning_rate": 3.8537938330907926e-07, + "loss": 0.3538, + "step": 84201 + }, + { + "epoch": 2.16, + "learning_rate": 3.853575564579169e-07, + "loss": 0.4058, + "step": 84202 + }, + { + "epoch": 2.16, + "learning_rate": 3.8533573007735767e-07, + "loss": 0.562, + "step": 84203 + }, + { + "epoch": 2.16, + "learning_rate": 3.853139041674186e-07, + "loss": 0.3722, + "step": 84204 + }, + { + "epoch": 2.16, + "learning_rate": 3.8529207872811677e-07, + "loss": 0.3877, + "step": 84205 + }, + { + "epoch": 2.16, + "learning_rate": 3.852702537594681e-07, + "loss": 0.4854, + "step": 84206 + }, + { + "epoch": 2.16, + "learning_rate": 3.8524842926149014e-07, + "loss": 0.436, + "step": 84207 + }, + { + "epoch": 2.16, + "learning_rate": 3.8522660523419893e-07, + "loss": 0.4888, + "step": 84208 + }, + { + "epoch": 2.16, + "learning_rate": 3.852047816776113e-07, + "loss": 0.3679, + "step": 84209 + }, + { + "epoch": 2.16, + "learning_rate": 3.851829585917442e-07, + "loss": 0.4048, + "step": 84210 + }, + { + "epoch": 2.16, + "learning_rate": 3.8516113597661446e-07, + "loss": 0.4272, + "step": 84211 + }, + { + "epoch": 2.16, + "learning_rate": 3.851393138322383e-07, + "loss": 0.4248, + "step": 84212 + }, + { + "epoch": 2.16, + "learning_rate": 3.8511749215863276e-07, + "loss": 0.3979, + "step": 84213 + }, + { + "epoch": 2.16, + "learning_rate": 3.850956709558144e-07, + "loss": 0.3203, + "step": 84214 + }, + { + "epoch": 2.16, + "learning_rate": 3.850738502238008e-07, + "loss": 0.3835, + "step": 84215 + }, + { + "epoch": 2.16, + "learning_rate": 3.85052029962607e-07, + "loss": 0.4102, + "step": 84216 + }, + { + "epoch": 2.16, + "learning_rate": 3.850302101722508e-07, + "loss": 0.4878, + "step": 84217 + }, + { + "epoch": 2.16, + "learning_rate": 3.850083908527485e-07, + "loss": 0.3857, + "step": 84218 + }, + { + "epoch": 2.16, + "learning_rate": 3.8498657200411744e-07, + "loss": 0.4873, + "step": 84219 + }, + { + "epoch": 2.16, + "learning_rate": 3.8496475362637357e-07, + "loss": 0.354, + "step": 84220 + }, + { + "epoch": 2.16, + "learning_rate": 3.8494293571953385e-07, + "loss": 0.3892, + "step": 84221 + }, + { + "epoch": 2.16, + "learning_rate": 3.8492111828361507e-07, + "loss": 0.3813, + "step": 84222 + }, + { + "epoch": 2.16, + "learning_rate": 3.848993013186342e-07, + "loss": 0.4187, + "step": 84223 + }, + { + "epoch": 2.16, + "learning_rate": 3.8487748482460735e-07, + "loss": 0.3774, + "step": 84224 + }, + { + "epoch": 2.16, + "learning_rate": 3.8485566880155186e-07, + "loss": 0.4526, + "step": 84225 + }, + { + "epoch": 2.16, + "learning_rate": 3.848338532494838e-07, + "loss": 0.4541, + "step": 84226 + }, + { + "epoch": 2.16, + "learning_rate": 3.848120381684201e-07, + "loss": 0.4839, + "step": 84227 + }, + { + "epoch": 2.16, + "learning_rate": 3.847902235583779e-07, + "loss": 0.4021, + "step": 84228 + }, + { + "epoch": 2.16, + "learning_rate": 3.847684094193733e-07, + "loss": 0.4072, + "step": 84229 + }, + { + "epoch": 2.16, + "learning_rate": 3.847465957514231e-07, + "loss": 0.2708, + "step": 84230 + }, + { + "epoch": 2.16, + "learning_rate": 3.847247825545442e-07, + "loss": 0.2715, + "step": 84231 + }, + { + "epoch": 2.16, + "learning_rate": 3.847029698287535e-07, + "loss": 0.4561, + "step": 84232 + }, + { + "epoch": 2.16, + "learning_rate": 3.8468115757406715e-07, + "loss": 0.2569, + "step": 84233 + }, + { + "epoch": 2.16, + "learning_rate": 3.846593457905026e-07, + "loss": 0.5361, + "step": 84234 + }, + { + "epoch": 2.16, + "learning_rate": 3.846375344780757e-07, + "loss": 0.4097, + "step": 84235 + }, + { + "epoch": 2.16, + "learning_rate": 3.846157236368038e-07, + "loss": 0.4106, + "step": 84236 + }, + { + "epoch": 2.16, + "learning_rate": 3.845939132667031e-07, + "loss": 0.3967, + "step": 84237 + }, + { + "epoch": 2.16, + "learning_rate": 3.8457210336779045e-07, + "loss": 0.478, + "step": 84238 + }, + { + "epoch": 2.16, + "learning_rate": 3.8455029394008263e-07, + "loss": 0.3999, + "step": 84239 + }, + { + "epoch": 2.16, + "learning_rate": 3.845284849835968e-07, + "loss": 0.3646, + "step": 84240 + }, + { + "epoch": 2.16, + "learning_rate": 3.8450667649834877e-07, + "loss": 0.3723, + "step": 84241 + }, + { + "epoch": 2.16, + "learning_rate": 3.844848684843558e-07, + "loss": 0.4331, + "step": 84242 + }, + { + "epoch": 2.16, + "learning_rate": 3.844630609416344e-07, + "loss": 0.3784, + "step": 84243 + }, + { + "epoch": 2.16, + "learning_rate": 3.8444125387020164e-07, + "loss": 0.438, + "step": 84244 + }, + { + "epoch": 2.16, + "learning_rate": 3.844194472700739e-07, + "loss": 0.437, + "step": 84245 + }, + { + "epoch": 2.16, + "learning_rate": 3.843976411412676e-07, + "loss": 0.3406, + "step": 84246 + }, + { + "epoch": 2.16, + "learning_rate": 3.843758354837997e-07, + "loss": 0.4204, + "step": 84247 + }, + { + "epoch": 2.16, + "learning_rate": 3.8435403029768685e-07, + "loss": 0.3081, + "step": 84248 + }, + { + "epoch": 2.16, + "learning_rate": 3.843322255829463e-07, + "loss": 0.4331, + "step": 84249 + }, + { + "epoch": 2.16, + "learning_rate": 3.843104213395938e-07, + "loss": 0.386, + "step": 84250 + }, + { + "epoch": 2.16, + "learning_rate": 3.842886175676465e-07, + "loss": 0.4028, + "step": 84251 + }, + { + "epoch": 2.16, + "learning_rate": 3.8426681426712113e-07, + "loss": 0.4663, + "step": 84252 + }, + { + "epoch": 2.16, + "learning_rate": 3.842450114380347e-07, + "loss": 0.4873, + "step": 84253 + }, + { + "epoch": 2.16, + "learning_rate": 3.842232090804035e-07, + "loss": 0.3774, + "step": 84254 + }, + { + "epoch": 2.16, + "learning_rate": 3.84201407194244e-07, + "loss": 0.3594, + "step": 84255 + }, + { + "epoch": 2.16, + "learning_rate": 3.841796057795731e-07, + "loss": 0.4937, + "step": 84256 + }, + { + "epoch": 2.16, + "learning_rate": 3.841578048364079e-07, + "loss": 0.3438, + "step": 84257 + }, + { + "epoch": 2.16, + "learning_rate": 3.841360043647645e-07, + "loss": 0.3179, + "step": 84258 + }, + { + "epoch": 2.16, + "learning_rate": 3.841142043646598e-07, + "loss": 0.3424, + "step": 84259 + }, + { + "epoch": 2.16, + "learning_rate": 3.840924048361105e-07, + "loss": 0.4575, + "step": 84260 + }, + { + "epoch": 2.16, + "learning_rate": 3.840706057791338e-07, + "loss": 0.3901, + "step": 84261 + }, + { + "epoch": 2.16, + "learning_rate": 3.840488071937453e-07, + "loss": 0.479, + "step": 84262 + }, + { + "epoch": 2.16, + "learning_rate": 3.8402700907996254e-07, + "loss": 0.479, + "step": 84263 + }, + { + "epoch": 2.16, + "learning_rate": 3.8400521143780216e-07, + "loss": 0.5093, + "step": 84264 + }, + { + "epoch": 2.16, + "learning_rate": 3.839834142672804e-07, + "loss": 0.3833, + "step": 84265 + }, + { + "epoch": 2.16, + "learning_rate": 3.839616175684146e-07, + "loss": 0.4897, + "step": 84266 + }, + { + "epoch": 2.16, + "learning_rate": 3.8393982134122073e-07, + "loss": 0.4707, + "step": 84267 + }, + { + "epoch": 2.16, + "learning_rate": 3.839180255857157e-07, + "loss": 0.3882, + "step": 84268 + }, + { + "epoch": 2.16, + "learning_rate": 3.8389623030191645e-07, + "loss": 0.4805, + "step": 84269 + }, + { + "epoch": 2.16, + "learning_rate": 3.838744354898398e-07, + "loss": 0.429, + "step": 84270 + }, + { + "epoch": 2.16, + "learning_rate": 3.838526411495018e-07, + "loss": 0.3398, + "step": 84271 + }, + { + "epoch": 2.16, + "learning_rate": 3.838308472809195e-07, + "loss": 0.5142, + "step": 84272 + }, + { + "epoch": 2.16, + "learning_rate": 3.8380905388411e-07, + "loss": 0.3932, + "step": 84273 + }, + { + "epoch": 2.16, + "learning_rate": 3.837872609590895e-07, + "loss": 0.4172, + "step": 84274 + }, + { + "epoch": 2.16, + "learning_rate": 3.837654685058744e-07, + "loss": 0.3262, + "step": 84275 + }, + { + "epoch": 2.16, + "learning_rate": 3.837436765244818e-07, + "loss": 0.418, + "step": 84276 + }, + { + "epoch": 2.16, + "learning_rate": 3.8372188501492843e-07, + "loss": 0.2736, + "step": 84277 + }, + { + "epoch": 2.16, + "learning_rate": 3.83700093977231e-07, + "loss": 0.3618, + "step": 84278 + }, + { + "epoch": 2.16, + "learning_rate": 3.8367830341140596e-07, + "loss": 0.323, + "step": 84279 + }, + { + "epoch": 2.16, + "learning_rate": 3.8365651331746995e-07, + "loss": 0.3608, + "step": 84280 + }, + { + "epoch": 2.16, + "learning_rate": 3.836347236954398e-07, + "loss": 0.4932, + "step": 84281 + }, + { + "epoch": 2.16, + "learning_rate": 3.836129345453326e-07, + "loss": 0.4487, + "step": 84282 + }, + { + "epoch": 2.16, + "learning_rate": 3.8359114586716425e-07, + "loss": 0.3433, + "step": 84283 + }, + { + "epoch": 2.16, + "learning_rate": 3.8356935766095223e-07, + "loss": 0.4009, + "step": 84284 + }, + { + "epoch": 2.16, + "learning_rate": 3.835475699267123e-07, + "loss": 0.328, + "step": 84285 + }, + { + "epoch": 2.16, + "learning_rate": 3.8352578266446187e-07, + "loss": 0.2615, + "step": 84286 + }, + { + "epoch": 2.16, + "learning_rate": 3.835039958742177e-07, + "loss": 0.4229, + "step": 84287 + }, + { + "epoch": 2.16, + "learning_rate": 3.8348220955599567e-07, + "loss": 0.3984, + "step": 84288 + }, + { + "epoch": 2.16, + "learning_rate": 3.8346042370981315e-07, + "loss": 0.4204, + "step": 84289 + }, + { + "epoch": 2.16, + "learning_rate": 3.834386383356868e-07, + "loss": 0.3882, + "step": 84290 + }, + { + "epoch": 2.16, + "learning_rate": 3.8341685343363295e-07, + "loss": 0.3834, + "step": 84291 + }, + { + "epoch": 2.16, + "learning_rate": 3.8339506900366835e-07, + "loss": 0.5098, + "step": 84292 + }, + { + "epoch": 2.16, + "learning_rate": 3.833732850458099e-07, + "loss": 0.3262, + "step": 84293 + }, + { + "epoch": 2.16, + "learning_rate": 3.8335150156007443e-07, + "loss": 0.3896, + "step": 84294 + }, + { + "epoch": 2.16, + "learning_rate": 3.8332971854647836e-07, + "loss": 0.3452, + "step": 84295 + }, + { + "epoch": 2.16, + "learning_rate": 3.833079360050381e-07, + "loss": 0.4727, + "step": 84296 + }, + { + "epoch": 2.16, + "learning_rate": 3.8328615393577056e-07, + "loss": 0.4517, + "step": 84297 + }, + { + "epoch": 2.16, + "learning_rate": 3.8326437233869235e-07, + "loss": 0.3682, + "step": 84298 + }, + { + "epoch": 2.16, + "learning_rate": 3.832425912138207e-07, + "loss": 0.2932, + "step": 84299 + }, + { + "epoch": 2.16, + "learning_rate": 3.832208105611715e-07, + "loss": 0.353, + "step": 84300 + }, + { + "epoch": 2.16, + "learning_rate": 3.831990303807617e-07, + "loss": 0.4316, + "step": 84301 + }, + { + "epoch": 2.16, + "learning_rate": 3.831772506726082e-07, + "loss": 0.3386, + "step": 84302 + }, + { + "epoch": 2.16, + "learning_rate": 3.831554714367278e-07, + "loss": 0.3462, + "step": 84303 + }, + { + "epoch": 2.16, + "learning_rate": 3.831336926731368e-07, + "loss": 0.48, + "step": 84304 + }, + { + "epoch": 2.16, + "learning_rate": 3.8311191438185167e-07, + "loss": 0.4585, + "step": 84305 + }, + { + "epoch": 2.16, + "learning_rate": 3.830901365628894e-07, + "loss": 0.344, + "step": 84306 + }, + { + "epoch": 2.16, + "learning_rate": 3.830683592162669e-07, + "loss": 0.3119, + "step": 84307 + }, + { + "epoch": 2.16, + "learning_rate": 3.8304658234200037e-07, + "loss": 0.4624, + "step": 84308 + }, + { + "epoch": 2.16, + "learning_rate": 3.830248059401067e-07, + "loss": 0.4058, + "step": 84309 + }, + { + "epoch": 2.16, + "learning_rate": 3.830030300106024e-07, + "loss": 0.3367, + "step": 84310 + }, + { + "epoch": 2.16, + "learning_rate": 3.8298125455350485e-07, + "loss": 0.2988, + "step": 84311 + }, + { + "epoch": 2.16, + "learning_rate": 3.829594795688298e-07, + "loss": 0.3341, + "step": 84312 + }, + { + "epoch": 2.16, + "learning_rate": 3.829377050565942e-07, + "loss": 0.3652, + "step": 84313 + }, + { + "epoch": 2.16, + "learning_rate": 3.829159310168152e-07, + "loss": 0.4761, + "step": 84314 + }, + { + "epoch": 2.16, + "learning_rate": 3.828941574495088e-07, + "loss": 0.4883, + "step": 84315 + }, + { + "epoch": 2.16, + "learning_rate": 3.828723843546924e-07, + "loss": 0.2949, + "step": 84316 + }, + { + "epoch": 2.16, + "learning_rate": 3.8285061173238175e-07, + "loss": 0.439, + "step": 84317 + }, + { + "epoch": 2.16, + "learning_rate": 3.8282883958259404e-07, + "loss": 0.3008, + "step": 84318 + }, + { + "epoch": 2.16, + "learning_rate": 3.828070679053459e-07, + "loss": 0.4746, + "step": 84319 + }, + { + "epoch": 2.16, + "learning_rate": 3.827852967006544e-07, + "loss": 0.502, + "step": 84320 + }, + { + "epoch": 2.16, + "learning_rate": 3.827635259685354e-07, + "loss": 0.4512, + "step": 84321 + }, + { + "epoch": 2.16, + "learning_rate": 3.8274175570900603e-07, + "loss": 0.2839, + "step": 84322 + }, + { + "epoch": 2.16, + "learning_rate": 3.82719985922083e-07, + "loss": 0.3569, + "step": 84323 + }, + { + "epoch": 2.16, + "learning_rate": 3.8269821660778345e-07, + "loss": 0.2767, + "step": 84324 + }, + { + "epoch": 2.16, + "learning_rate": 3.8267644776612284e-07, + "loss": 0.3823, + "step": 84325 + }, + { + "epoch": 2.16, + "learning_rate": 3.826546793971186e-07, + "loss": 0.48, + "step": 84326 + }, + { + "epoch": 2.16, + "learning_rate": 3.826329115007871e-07, + "loss": 0.4512, + "step": 84327 + }, + { + "epoch": 2.16, + "learning_rate": 3.8261114407714567e-07, + "loss": 0.3555, + "step": 84328 + }, + { + "epoch": 2.16, + "learning_rate": 3.825893771262101e-07, + "loss": 0.4399, + "step": 84329 + }, + { + "epoch": 2.16, + "learning_rate": 3.825676106479975e-07, + "loss": 0.3472, + "step": 84330 + }, + { + "epoch": 2.16, + "learning_rate": 3.8254584464252447e-07, + "loss": 0.4023, + "step": 84331 + }, + { + "epoch": 2.16, + "learning_rate": 3.82524079109808e-07, + "loss": 0.4951, + "step": 84332 + }, + { + "epoch": 2.16, + "learning_rate": 3.825023140498641e-07, + "loss": 0.4331, + "step": 84333 + }, + { + "epoch": 2.16, + "learning_rate": 3.824805494627102e-07, + "loss": 0.416, + "step": 84334 + }, + { + "epoch": 2.16, + "learning_rate": 3.824587853483622e-07, + "loss": 0.3064, + "step": 84335 + }, + { + "epoch": 2.16, + "learning_rate": 3.82437021706837e-07, + "loss": 0.4326, + "step": 84336 + }, + { + "epoch": 2.16, + "learning_rate": 3.824152585381518e-07, + "loss": 0.4487, + "step": 84337 + }, + { + "epoch": 2.16, + "learning_rate": 3.823934958423225e-07, + "loss": 0.4648, + "step": 84338 + }, + { + "epoch": 2.16, + "learning_rate": 3.8237173361936615e-07, + "loss": 0.4604, + "step": 84339 + }, + { + "epoch": 2.16, + "learning_rate": 3.823499718692993e-07, + "loss": 0.3467, + "step": 84340 + }, + { + "epoch": 2.16, + "learning_rate": 3.8232821059213906e-07, + "loss": 0.4546, + "step": 84341 + }, + { + "epoch": 2.16, + "learning_rate": 3.823064497879013e-07, + "loss": 0.4556, + "step": 84342 + }, + { + "epoch": 2.16, + "learning_rate": 3.822846894566031e-07, + "loss": 0.4673, + "step": 84343 + }, + { + "epoch": 2.16, + "learning_rate": 3.8226292959826156e-07, + "loss": 0.3625, + "step": 84344 + }, + { + "epoch": 2.16, + "learning_rate": 3.822411702128928e-07, + "loss": 0.46, + "step": 84345 + }, + { + "epoch": 2.16, + "learning_rate": 3.822194113005132e-07, + "loss": 0.3496, + "step": 84346 + }, + { + "epoch": 2.16, + "learning_rate": 3.8219765286113983e-07, + "loss": 0.4102, + "step": 84347 + }, + { + "epoch": 2.16, + "learning_rate": 3.821758948947893e-07, + "loss": 0.449, + "step": 84348 + }, + { + "epoch": 2.16, + "learning_rate": 3.821541374014786e-07, + "loss": 0.3338, + "step": 84349 + }, + { + "epoch": 2.16, + "learning_rate": 3.8213238038122375e-07, + "loss": 0.3125, + "step": 84350 + }, + { + "epoch": 2.16, + "learning_rate": 3.821106238340418e-07, + "loss": 0.3848, + "step": 84351 + }, + { + "epoch": 2.16, + "learning_rate": 3.820888677599492e-07, + "loss": 0.4443, + "step": 84352 + }, + { + "epoch": 2.16, + "learning_rate": 3.8206711215896314e-07, + "loss": 0.2826, + "step": 84353 + }, + { + "epoch": 2.16, + "learning_rate": 3.820453570311e-07, + "loss": 0.281, + "step": 84354 + }, + { + "epoch": 2.16, + "learning_rate": 3.820236023763758e-07, + "loss": 0.3745, + "step": 84355 + }, + { + "epoch": 2.16, + "learning_rate": 3.820018481948077e-07, + "loss": 0.3584, + "step": 84356 + }, + { + "epoch": 2.16, + "learning_rate": 3.8198009448641244e-07, + "loss": 0.3933, + "step": 84357 + }, + { + "epoch": 2.16, + "learning_rate": 3.81958341251207e-07, + "loss": 0.5293, + "step": 84358 + }, + { + "epoch": 2.16, + "learning_rate": 3.8193658848920727e-07, + "loss": 0.3752, + "step": 84359 + }, + { + "epoch": 2.16, + "learning_rate": 3.819148362004302e-07, + "loss": 0.2527, + "step": 84360 + }, + { + "epoch": 2.16, + "learning_rate": 3.81893084384893e-07, + "loss": 0.457, + "step": 84361 + }, + { + "epoch": 2.16, + "learning_rate": 3.818713330426113e-07, + "loss": 0.4912, + "step": 84362 + }, + { + "epoch": 2.16, + "learning_rate": 3.8184958217360243e-07, + "loss": 0.3926, + "step": 84363 + }, + { + "epoch": 2.16, + "learning_rate": 3.8182783177788323e-07, + "loss": 0.3691, + "step": 84364 + }, + { + "epoch": 2.16, + "learning_rate": 3.818060818554697e-07, + "loss": 0.478, + "step": 84365 + }, + { + "epoch": 2.16, + "learning_rate": 3.817843324063792e-07, + "loss": 0.4385, + "step": 84366 + }, + { + "epoch": 2.16, + "learning_rate": 3.8176258343062763e-07, + "loss": 0.4072, + "step": 84367 + }, + { + "epoch": 2.16, + "learning_rate": 3.8174083492823205e-07, + "loss": 0.3174, + "step": 84368 + }, + { + "epoch": 2.16, + "learning_rate": 3.8171908689920904e-07, + "loss": 0.4243, + "step": 84369 + }, + { + "epoch": 2.16, + "learning_rate": 3.8169733934357575e-07, + "loss": 0.4414, + "step": 84370 + }, + { + "epoch": 2.16, + "learning_rate": 3.8167559226134795e-07, + "loss": 0.396, + "step": 84371 + }, + { + "epoch": 2.16, + "learning_rate": 3.8165384565254265e-07, + "loss": 0.4272, + "step": 84372 + }, + { + "epoch": 2.16, + "learning_rate": 3.8163209951717667e-07, + "loss": 0.3478, + "step": 84373 + }, + { + "epoch": 2.16, + "learning_rate": 3.8161035385526685e-07, + "loss": 0.3782, + "step": 84374 + }, + { + "epoch": 2.16, + "learning_rate": 3.815886086668295e-07, + "loss": 0.5181, + "step": 84375 + }, + { + "epoch": 2.16, + "learning_rate": 3.8156686395188107e-07, + "loss": 0.5161, + "step": 84376 + }, + { + "epoch": 2.16, + "learning_rate": 3.8154511971043846e-07, + "loss": 0.3273, + "step": 84377 + }, + { + "epoch": 2.16, + "learning_rate": 3.815233759425186e-07, + "loss": 0.4141, + "step": 84378 + }, + { + "epoch": 2.16, + "learning_rate": 3.815016326481375e-07, + "loss": 0.3896, + "step": 84379 + }, + { + "epoch": 2.16, + "learning_rate": 3.814798898273122e-07, + "loss": 0.4136, + "step": 84380 + }, + { + "epoch": 2.16, + "learning_rate": 3.8145814748005934e-07, + "loss": 0.2812, + "step": 84381 + }, + { + "epoch": 2.16, + "learning_rate": 3.814364056063958e-07, + "loss": 0.3561, + "step": 84382 + }, + { + "epoch": 2.16, + "learning_rate": 3.814146642063376e-07, + "loss": 0.3828, + "step": 84383 + }, + { + "epoch": 2.16, + "learning_rate": 3.813929232799021e-07, + "loss": 0.2969, + "step": 84384 + }, + { + "epoch": 2.16, + "learning_rate": 3.8137118282710536e-07, + "loss": 0.4287, + "step": 84385 + }, + { + "epoch": 2.16, + "learning_rate": 3.813494428479642e-07, + "loss": 0.3525, + "step": 84386 + }, + { + "epoch": 2.16, + "learning_rate": 3.813277033424956e-07, + "loss": 0.3008, + "step": 84387 + }, + { + "epoch": 2.16, + "learning_rate": 3.813059643107157e-07, + "loss": 0.3318, + "step": 84388 + }, + { + "epoch": 2.16, + "learning_rate": 3.812842257526414e-07, + "loss": 0.4492, + "step": 84389 + }, + { + "epoch": 2.16, + "learning_rate": 3.812624876682892e-07, + "loss": 0.2203, + "step": 84390 + }, + { + "epoch": 2.16, + "learning_rate": 3.812407500576763e-07, + "loss": 0.418, + "step": 84391 + }, + { + "epoch": 2.16, + "learning_rate": 3.812190129208185e-07, + "loss": 0.2435, + "step": 84392 + }, + { + "epoch": 2.16, + "learning_rate": 3.8119727625773277e-07, + "loss": 0.3525, + "step": 84393 + }, + { + "epoch": 2.16, + "learning_rate": 3.8117554006843634e-07, + "loss": 0.4321, + "step": 84394 + }, + { + "epoch": 2.16, + "learning_rate": 3.811538043529453e-07, + "loss": 0.2795, + "step": 84395 + }, + { + "epoch": 2.16, + "learning_rate": 3.8113206911127595e-07, + "loss": 0.2905, + "step": 84396 + }, + { + "epoch": 2.16, + "learning_rate": 3.811103343434453e-07, + "loss": 0.2708, + "step": 84397 + }, + { + "epoch": 2.16, + "learning_rate": 3.810886000494701e-07, + "loss": 0.3076, + "step": 84398 + }, + { + "epoch": 2.16, + "learning_rate": 3.810668662293671e-07, + "loss": 0.4604, + "step": 84399 + }, + { + "epoch": 2.16, + "learning_rate": 3.8104513288315256e-07, + "loss": 0.3696, + "step": 84400 + }, + { + "epoch": 2.16, + "learning_rate": 3.810234000108432e-07, + "loss": 0.4302, + "step": 84401 + }, + { + "epoch": 2.16, + "learning_rate": 3.810016676124558e-07, + "loss": 0.4097, + "step": 84402 + }, + { + "epoch": 2.16, + "learning_rate": 3.8097993568800737e-07, + "loss": 0.3563, + "step": 84403 + }, + { + "epoch": 2.16, + "learning_rate": 3.80958204237514e-07, + "loss": 0.5146, + "step": 84404 + }, + { + "epoch": 2.16, + "learning_rate": 3.809364732609922e-07, + "loss": 0.3999, + "step": 84405 + }, + { + "epoch": 2.16, + "learning_rate": 3.809147427584589e-07, + "loss": 0.4065, + "step": 84406 + }, + { + "epoch": 2.16, + "learning_rate": 3.808930127299307e-07, + "loss": 0.4985, + "step": 84407 + }, + { + "epoch": 2.16, + "learning_rate": 3.808712831754245e-07, + "loss": 0.4106, + "step": 84408 + }, + { + "epoch": 2.16, + "learning_rate": 3.8084955409495647e-07, + "loss": 0.4321, + "step": 84409 + }, + { + "epoch": 2.16, + "learning_rate": 3.808278254885434e-07, + "loss": 0.353, + "step": 84410 + }, + { + "epoch": 2.16, + "learning_rate": 3.808060973562021e-07, + "loss": 0.4829, + "step": 84411 + }, + { + "epoch": 2.16, + "learning_rate": 3.8078436969794924e-07, + "loss": 0.5312, + "step": 84412 + }, + { + "epoch": 2.16, + "learning_rate": 3.8076264251380106e-07, + "loss": 0.4604, + "step": 84413 + }, + { + "epoch": 2.16, + "learning_rate": 3.8074091580377486e-07, + "loss": 0.395, + "step": 84414 + }, + { + "epoch": 2.16, + "learning_rate": 3.807191895678865e-07, + "loss": 0.3743, + "step": 84415 + }, + { + "epoch": 2.16, + "learning_rate": 3.806974638061533e-07, + "loss": 0.4053, + "step": 84416 + }, + { + "epoch": 2.16, + "learning_rate": 3.8067573851859125e-07, + "loss": 0.5068, + "step": 84417 + }, + { + "epoch": 2.16, + "learning_rate": 3.806540137052173e-07, + "loss": 0.323, + "step": 84418 + }, + { + "epoch": 2.16, + "learning_rate": 3.806322893660482e-07, + "loss": 0.4058, + "step": 84419 + }, + { + "epoch": 2.16, + "learning_rate": 3.806105655011007e-07, + "loss": 0.4346, + "step": 84420 + }, + { + "epoch": 2.16, + "learning_rate": 3.8058884211039087e-07, + "loss": 0.4287, + "step": 84421 + }, + { + "epoch": 2.16, + "learning_rate": 3.805671191939357e-07, + "loss": 0.215, + "step": 84422 + }, + { + "epoch": 2.16, + "learning_rate": 3.805453967517518e-07, + "loss": 0.3416, + "step": 84423 + }, + { + "epoch": 2.16, + "learning_rate": 3.8052367478385616e-07, + "loss": 0.4121, + "step": 84424 + }, + { + "epoch": 2.16, + "learning_rate": 3.80501953290265e-07, + "loss": 0.438, + "step": 84425 + }, + { + "epoch": 2.16, + "learning_rate": 3.8048023227099477e-07, + "loss": 0.4038, + "step": 84426 + }, + { + "epoch": 2.16, + "learning_rate": 3.8045851172606225e-07, + "loss": 0.2635, + "step": 84427 + }, + { + "epoch": 2.16, + "learning_rate": 3.8043679165548427e-07, + "loss": 0.522, + "step": 84428 + }, + { + "epoch": 2.16, + "learning_rate": 3.8041507205927757e-07, + "loss": 0.478, + "step": 84429 + }, + { + "epoch": 2.16, + "learning_rate": 3.8039335293745823e-07, + "loss": 0.5332, + "step": 84430 + }, + { + "epoch": 2.16, + "learning_rate": 3.8037163429004325e-07, + "loss": 0.3965, + "step": 84431 + }, + { + "epoch": 2.16, + "learning_rate": 3.8034991611704926e-07, + "loss": 0.4783, + "step": 84432 + }, + { + "epoch": 2.16, + "learning_rate": 3.803281984184932e-07, + "loss": 0.481, + "step": 84433 + }, + { + "epoch": 2.16, + "learning_rate": 3.8030648119439124e-07, + "loss": 0.3708, + "step": 84434 + }, + { + "epoch": 2.16, + "learning_rate": 3.802847644447598e-07, + "loss": 0.3208, + "step": 84435 + }, + { + "epoch": 2.16, + "learning_rate": 3.8026304816961584e-07, + "loss": 0.4463, + "step": 84436 + }, + { + "epoch": 2.16, + "learning_rate": 3.802413323689764e-07, + "loss": 0.3569, + "step": 84437 + }, + { + "epoch": 2.16, + "learning_rate": 3.802196170428572e-07, + "loss": 0.3711, + "step": 84438 + }, + { + "epoch": 2.16, + "learning_rate": 3.8019790219127533e-07, + "loss": 0.4185, + "step": 84439 + }, + { + "epoch": 2.16, + "learning_rate": 3.801761878142475e-07, + "loss": 0.4546, + "step": 84440 + }, + { + "epoch": 2.16, + "learning_rate": 3.801544739117906e-07, + "loss": 0.3613, + "step": 84441 + }, + { + "epoch": 2.16, + "learning_rate": 3.801327604839205e-07, + "loss": 0.4104, + "step": 84442 + }, + { + "epoch": 2.16, + "learning_rate": 3.8011104753065436e-07, + "loss": 0.4502, + "step": 84443 + }, + { + "epoch": 2.16, + "learning_rate": 3.80089335052009e-07, + "loss": 0.3201, + "step": 84444 + }, + { + "epoch": 2.16, + "learning_rate": 3.8006762304800035e-07, + "loss": 0.4172, + "step": 84445 + }, + { + "epoch": 2.16, + "learning_rate": 3.8004591151864575e-07, + "loss": 0.4683, + "step": 84446 + }, + { + "epoch": 2.16, + "learning_rate": 3.800242004639612e-07, + "loss": 0.4238, + "step": 84447 + }, + { + "epoch": 2.16, + "learning_rate": 3.800024898839636e-07, + "loss": 0.4121, + "step": 84448 + }, + { + "epoch": 2.16, + "learning_rate": 3.799807797786695e-07, + "loss": 0.4219, + "step": 84449 + }, + { + "epoch": 2.16, + "learning_rate": 3.79959070148096e-07, + "loss": 0.3511, + "step": 84450 + }, + { + "epoch": 2.16, + "learning_rate": 3.7993736099225903e-07, + "loss": 0.4312, + "step": 84451 + }, + { + "epoch": 2.16, + "learning_rate": 3.799156523111755e-07, + "loss": 0.4839, + "step": 84452 + }, + { + "epoch": 2.16, + "learning_rate": 3.798939441048624e-07, + "loss": 0.3479, + "step": 84453 + }, + { + "epoch": 2.16, + "learning_rate": 3.79872236373336e-07, + "loss": 0.3074, + "step": 84454 + }, + { + "epoch": 2.16, + "learning_rate": 3.798505291166125e-07, + "loss": 0.3755, + "step": 84455 + }, + { + "epoch": 2.16, + "learning_rate": 3.7982882233470893e-07, + "loss": 0.5366, + "step": 84456 + }, + { + "epoch": 2.16, + "learning_rate": 3.7980711602764205e-07, + "loss": 0.3506, + "step": 84457 + }, + { + "epoch": 2.16, + "learning_rate": 3.797854101954285e-07, + "loss": 0.3647, + "step": 84458 + }, + { + "epoch": 2.16, + "learning_rate": 3.797637048380845e-07, + "loss": 0.3625, + "step": 84459 + }, + { + "epoch": 2.16, + "learning_rate": 3.7974199995562695e-07, + "loss": 0.3369, + "step": 84460 + }, + { + "epoch": 2.16, + "learning_rate": 3.797202955480724e-07, + "loss": 0.3911, + "step": 84461 + }, + { + "epoch": 2.16, + "learning_rate": 3.7969859161543785e-07, + "loss": 0.3202, + "step": 84462 + }, + { + "epoch": 2.16, + "learning_rate": 3.7967688815773914e-07, + "loss": 0.4009, + "step": 84463 + }, + { + "epoch": 2.16, + "learning_rate": 3.7965518517499373e-07, + "loss": 0.498, + "step": 84464 + }, + { + "epoch": 2.16, + "learning_rate": 3.796334826672175e-07, + "loss": 0.3225, + "step": 84465 + }, + { + "epoch": 2.16, + "learning_rate": 3.7961178063442735e-07, + "loss": 0.1563, + "step": 84466 + }, + { + "epoch": 2.16, + "learning_rate": 3.795900790766402e-07, + "loss": 0.521, + "step": 84467 + }, + { + "epoch": 2.16, + "learning_rate": 3.795683779938722e-07, + "loss": 0.4233, + "step": 84468 + }, + { + "epoch": 2.16, + "learning_rate": 3.795466773861401e-07, + "loss": 0.4492, + "step": 84469 + }, + { + "epoch": 2.17, + "learning_rate": 3.795249772534609e-07, + "loss": 0.5039, + "step": 84470 + }, + { + "epoch": 2.17, + "learning_rate": 3.795032775958505e-07, + "loss": 0.5156, + "step": 84471 + }, + { + "epoch": 2.17, + "learning_rate": 3.7948157841332605e-07, + "loss": 0.4766, + "step": 84472 + }, + { + "epoch": 2.17, + "learning_rate": 3.79459879705904e-07, + "loss": 0.3071, + "step": 84473 + }, + { + "epoch": 2.17, + "learning_rate": 3.794381814736013e-07, + "loss": 0.4795, + "step": 84474 + }, + { + "epoch": 2.17, + "learning_rate": 3.794164837164342e-07, + "loss": 0.4761, + "step": 84475 + }, + { + "epoch": 2.17, + "learning_rate": 3.79394786434419e-07, + "loss": 0.2471, + "step": 84476 + }, + { + "epoch": 2.17, + "learning_rate": 3.7937308962757277e-07, + "loss": 0.355, + "step": 84477 + }, + { + "epoch": 2.17, + "learning_rate": 3.7935139329591206e-07, + "loss": 0.4022, + "step": 84478 + }, + { + "epoch": 2.17, + "learning_rate": 3.793296974394536e-07, + "loss": 0.4243, + "step": 84479 + }, + { + "epoch": 2.17, + "learning_rate": 3.793080020582137e-07, + "loss": 0.301, + "step": 84480 + }, + { + "epoch": 2.17, + "learning_rate": 3.792863071522091e-07, + "loss": 0.3804, + "step": 84481 + }, + { + "epoch": 2.17, + "learning_rate": 3.7926461272145637e-07, + "loss": 0.3289, + "step": 84482 + }, + { + "epoch": 2.17, + "learning_rate": 3.792429187659726e-07, + "loss": 0.417, + "step": 84483 + }, + { + "epoch": 2.17, + "learning_rate": 3.792212252857738e-07, + "loss": 0.3364, + "step": 84484 + }, + { + "epoch": 2.17, + "learning_rate": 3.7919953228087666e-07, + "loss": 0.3848, + "step": 84485 + }, + { + "epoch": 2.17, + "learning_rate": 3.7917783975129766e-07, + "loss": 0.4243, + "step": 84486 + }, + { + "epoch": 2.17, + "learning_rate": 3.791561476970542e-07, + "loss": 0.5098, + "step": 84487 + }, + { + "epoch": 2.17, + "learning_rate": 3.7913445611816184e-07, + "loss": 0.5591, + "step": 84488 + }, + { + "epoch": 2.17, + "learning_rate": 3.791127650146377e-07, + "loss": 0.4402, + "step": 84489 + }, + { + "epoch": 2.17, + "learning_rate": 3.7909107438649845e-07, + "loss": 0.448, + "step": 84490 + }, + { + "epoch": 2.17, + "learning_rate": 3.790693842337609e-07, + "loss": 0.3923, + "step": 84491 + }, + { + "epoch": 2.17, + "learning_rate": 3.7904769455644103e-07, + "loss": 0.3823, + "step": 84492 + }, + { + "epoch": 2.17, + "learning_rate": 3.7902600535455586e-07, + "loss": 0.4002, + "step": 84493 + }, + { + "epoch": 2.17, + "learning_rate": 3.7900431662812213e-07, + "loss": 0.3857, + "step": 84494 + }, + { + "epoch": 2.17, + "learning_rate": 3.78982628377156e-07, + "loss": 0.4094, + "step": 84495 + }, + { + "epoch": 2.17, + "learning_rate": 3.7896094060167463e-07, + "loss": 0.5796, + "step": 84496 + }, + { + "epoch": 2.17, + "learning_rate": 3.7893925330169394e-07, + "loss": 0.5063, + "step": 84497 + }, + { + "epoch": 2.17, + "learning_rate": 3.7891756647723093e-07, + "loss": 0.606, + "step": 84498 + }, + { + "epoch": 2.17, + "learning_rate": 3.788958801283022e-07, + "loss": 0.3701, + "step": 84499 + }, + { + "epoch": 2.17, + "learning_rate": 3.7887419425492475e-07, + "loss": 0.46, + "step": 84500 + }, + { + "epoch": 2.17, + "learning_rate": 3.788525088571143e-07, + "loss": 0.3066, + "step": 84501 + }, + { + "epoch": 2.17, + "learning_rate": 3.78830823934888e-07, + "loss": 0.4714, + "step": 84502 + }, + { + "epoch": 2.17, + "learning_rate": 3.7880913948826234e-07, + "loss": 0.4026, + "step": 84503 + }, + { + "epoch": 2.17, + "learning_rate": 3.7878745551725464e-07, + "loss": 0.3147, + "step": 84504 + }, + { + "epoch": 2.17, + "learning_rate": 3.787657720218801e-07, + "loss": 0.4409, + "step": 84505 + }, + { + "epoch": 2.17, + "learning_rate": 3.7874408900215604e-07, + "loss": 0.4893, + "step": 84506 + }, + { + "epoch": 2.17, + "learning_rate": 3.7872240645809917e-07, + "loss": 0.4814, + "step": 84507 + }, + { + "epoch": 2.17, + "learning_rate": 3.787007243897262e-07, + "loss": 0.3101, + "step": 84508 + }, + { + "epoch": 2.17, + "learning_rate": 3.786790427970533e-07, + "loss": 0.3357, + "step": 84509 + }, + { + "epoch": 2.17, + "learning_rate": 3.786573616800972e-07, + "loss": 0.4561, + "step": 84510 + }, + { + "epoch": 2.17, + "learning_rate": 3.7863568103887464e-07, + "loss": 0.374, + "step": 84511 + }, + { + "epoch": 2.17, + "learning_rate": 3.7861400087340244e-07, + "loss": 0.3665, + "step": 84512 + }, + { + "epoch": 2.17, + "learning_rate": 3.785923211836967e-07, + "loss": 0.3745, + "step": 84513 + }, + { + "epoch": 2.17, + "learning_rate": 3.785706419697745e-07, + "loss": 0.5669, + "step": 84514 + }, + { + "epoch": 2.17, + "learning_rate": 3.7854896323165187e-07, + "loss": 0.4404, + "step": 84515 + }, + { + "epoch": 2.17, + "learning_rate": 3.785272849693457e-07, + "loss": 0.46, + "step": 84516 + }, + { + "epoch": 2.17, + "learning_rate": 3.7850560718287295e-07, + "loss": 0.3757, + "step": 84517 + }, + { + "epoch": 2.17, + "learning_rate": 3.7848392987224964e-07, + "loss": 0.4243, + "step": 84518 + }, + { + "epoch": 2.17, + "learning_rate": 3.7846225303749247e-07, + "loss": 0.395, + "step": 84519 + }, + { + "epoch": 2.17, + "learning_rate": 3.784405766786183e-07, + "loss": 0.3293, + "step": 84520 + }, + { + "epoch": 2.17, + "learning_rate": 3.784189007956439e-07, + "loss": 0.4316, + "step": 84521 + }, + { + "epoch": 2.17, + "learning_rate": 3.783972253885851e-07, + "loss": 0.3052, + "step": 84522 + }, + { + "epoch": 2.17, + "learning_rate": 3.783755504574591e-07, + "loss": 0.5083, + "step": 84523 + }, + { + "epoch": 2.17, + "learning_rate": 3.783538760022826e-07, + "loss": 0.5322, + "step": 84524 + }, + { + "epoch": 2.17, + "learning_rate": 3.7833220202307203e-07, + "loss": 0.4165, + "step": 84525 + }, + { + "epoch": 2.17, + "learning_rate": 3.7831052851984356e-07, + "loss": 0.3866, + "step": 84526 + }, + { + "epoch": 2.17, + "learning_rate": 3.7828885549261415e-07, + "loss": 0.2363, + "step": 84527 + }, + { + "epoch": 2.17, + "learning_rate": 3.7826718294140037e-07, + "loss": 0.3796, + "step": 84528 + }, + { + "epoch": 2.17, + "learning_rate": 3.7824551086621915e-07, + "loss": 0.4355, + "step": 84529 + }, + { + "epoch": 2.17, + "learning_rate": 3.7822383926708633e-07, + "loss": 0.4736, + "step": 84530 + }, + { + "epoch": 2.17, + "learning_rate": 3.7820216814401907e-07, + "loss": 0.3982, + "step": 84531 + }, + { + "epoch": 2.17, + "learning_rate": 3.781804974970337e-07, + "loss": 0.3511, + "step": 84532 + }, + { + "epoch": 2.17, + "learning_rate": 3.7815882732614736e-07, + "loss": 0.4146, + "step": 84533 + }, + { + "epoch": 2.17, + "learning_rate": 3.781371576313761e-07, + "loss": 0.2974, + "step": 84534 + }, + { + "epoch": 2.17, + "learning_rate": 3.7811548841273644e-07, + "loss": 0.3965, + "step": 84535 + }, + { + "epoch": 2.17, + "learning_rate": 3.78093819670245e-07, + "loss": 0.541, + "step": 84536 + }, + { + "epoch": 2.17, + "learning_rate": 3.780721514039186e-07, + "loss": 0.3308, + "step": 84537 + }, + { + "epoch": 2.17, + "learning_rate": 3.7805048361377413e-07, + "loss": 0.5005, + "step": 84538 + }, + { + "epoch": 2.17, + "learning_rate": 3.780288162998274e-07, + "loss": 0.3833, + "step": 84539 + }, + { + "epoch": 2.17, + "learning_rate": 3.7800714946209545e-07, + "loss": 0.4849, + "step": 84540 + }, + { + "epoch": 2.17, + "learning_rate": 3.779854831005952e-07, + "loss": 0.3791, + "step": 84541 + }, + { + "epoch": 2.17, + "learning_rate": 3.779638172153424e-07, + "loss": 0.4009, + "step": 84542 + }, + { + "epoch": 2.17, + "learning_rate": 3.779421518063546e-07, + "loss": 0.3094, + "step": 84543 + }, + { + "epoch": 2.17, + "learning_rate": 3.779204868736474e-07, + "loss": 0.4482, + "step": 84544 + }, + { + "epoch": 2.17, + "learning_rate": 3.778988224172379e-07, + "loss": 0.3998, + "step": 84545 + }, + { + "epoch": 2.17, + "learning_rate": 3.778771584371432e-07, + "loss": 0.3789, + "step": 84546 + }, + { + "epoch": 2.17, + "learning_rate": 3.778554949333788e-07, + "loss": 0.2621, + "step": 84547 + }, + { + "epoch": 2.17, + "learning_rate": 3.7783383190596195e-07, + "loss": 0.3048, + "step": 84548 + }, + { + "epoch": 2.17, + "learning_rate": 3.7781216935490903e-07, + "loss": 0.3618, + "step": 84549 + }, + { + "epoch": 2.17, + "learning_rate": 3.777905072802371e-07, + "loss": 0.4453, + "step": 84550 + }, + { + "epoch": 2.17, + "learning_rate": 3.777688456819621e-07, + "loss": 0.3627, + "step": 84551 + }, + { + "epoch": 2.17, + "learning_rate": 3.777471845601008e-07, + "loss": 0.4082, + "step": 84552 + }, + { + "epoch": 2.17, + "learning_rate": 3.7772552391467027e-07, + "loss": 0.541, + "step": 84553 + }, + { + "epoch": 2.17, + "learning_rate": 3.777038637456863e-07, + "loss": 0.3506, + "step": 84554 + }, + { + "epoch": 2.17, + "learning_rate": 3.7768220405316633e-07, + "loss": 0.3296, + "step": 84555 + }, + { + "epoch": 2.17, + "learning_rate": 3.7766054483712597e-07, + "loss": 0.3494, + "step": 84556 + }, + { + "epoch": 2.17, + "learning_rate": 3.7763888609758245e-07, + "loss": 0.3412, + "step": 84557 + }, + { + "epoch": 2.17, + "learning_rate": 3.776172278345524e-07, + "loss": 0.3398, + "step": 84558 + }, + { + "epoch": 2.17, + "learning_rate": 3.77595570048052e-07, + "loss": 0.4255, + "step": 84559 + }, + { + "epoch": 2.17, + "learning_rate": 3.77573912738098e-07, + "loss": 0.2875, + "step": 84560 + }, + { + "epoch": 2.17, + "learning_rate": 3.7755225590470707e-07, + "loss": 0.4414, + "step": 84561 + }, + { + "epoch": 2.17, + "learning_rate": 3.7753059954789614e-07, + "loss": 0.3633, + "step": 84562 + }, + { + "epoch": 2.17, + "learning_rate": 3.7750894366768137e-07, + "loss": 0.3293, + "step": 84563 + }, + { + "epoch": 2.17, + "learning_rate": 3.774872882640791e-07, + "loss": 0.261, + "step": 84564 + }, + { + "epoch": 2.17, + "learning_rate": 3.7746563333710603e-07, + "loss": 0.5552, + "step": 84565 + }, + { + "epoch": 2.17, + "learning_rate": 3.77443978886779e-07, + "loss": 0.4829, + "step": 84566 + }, + { + "epoch": 2.17, + "learning_rate": 3.7742232491311487e-07, + "loss": 0.4292, + "step": 84567 + }, + { + "epoch": 2.17, + "learning_rate": 3.774006714161294e-07, + "loss": 0.3037, + "step": 84568 + }, + { + "epoch": 2.17, + "learning_rate": 3.773790183958396e-07, + "loss": 0.3801, + "step": 84569 + }, + { + "epoch": 2.17, + "learning_rate": 3.7735736585226217e-07, + "loss": 0.3481, + "step": 84570 + }, + { + "epoch": 2.17, + "learning_rate": 3.7733571378541387e-07, + "loss": 0.3711, + "step": 84571 + }, + { + "epoch": 2.17, + "learning_rate": 3.773140621953106e-07, + "loss": 0.3865, + "step": 84572 + }, + { + "epoch": 2.17, + "learning_rate": 3.7729241108196973e-07, + "loss": 0.4299, + "step": 84573 + }, + { + "epoch": 2.17, + "learning_rate": 3.772707604454071e-07, + "loss": 0.5508, + "step": 84574 + }, + { + "epoch": 2.17, + "learning_rate": 3.7724911028563986e-07, + "loss": 0.436, + "step": 84575 + }, + { + "epoch": 2.17, + "learning_rate": 3.7722746060268405e-07, + "loss": 0.4028, + "step": 84576 + }, + { + "epoch": 2.17, + "learning_rate": 3.772058113965565e-07, + "loss": 0.3977, + "step": 84577 + }, + { + "epoch": 2.17, + "learning_rate": 3.771841626672739e-07, + "loss": 0.4341, + "step": 84578 + }, + { + "epoch": 2.17, + "learning_rate": 3.77162514414853e-07, + "loss": 0.6299, + "step": 84579 + }, + { + "epoch": 2.17, + "learning_rate": 3.771408666393099e-07, + "loss": 0.5884, + "step": 84580 + }, + { + "epoch": 2.17, + "learning_rate": 3.7711921934066125e-07, + "loss": 0.4056, + "step": 84581 + }, + { + "epoch": 2.17, + "learning_rate": 3.770975725189239e-07, + "loss": 0.4712, + "step": 84582 + }, + { + "epoch": 2.17, + "learning_rate": 3.7707592617411453e-07, + "loss": 0.4609, + "step": 84583 + }, + { + "epoch": 2.17, + "learning_rate": 3.7705428030624965e-07, + "loss": 0.4155, + "step": 84584 + }, + { + "epoch": 2.17, + "learning_rate": 3.770326349153452e-07, + "loss": 0.4116, + "step": 84585 + }, + { + "epoch": 2.17, + "learning_rate": 3.770109900014182e-07, + "loss": 0.3977, + "step": 84586 + }, + { + "epoch": 2.17, + "learning_rate": 3.7698934556448525e-07, + "loss": 0.4039, + "step": 84587 + }, + { + "epoch": 2.17, + "learning_rate": 3.7696770160456325e-07, + "loss": 0.4114, + "step": 84588 + }, + { + "epoch": 2.17, + "learning_rate": 3.769460581216681e-07, + "loss": 0.3553, + "step": 84589 + }, + { + "epoch": 2.17, + "learning_rate": 3.7692441511581676e-07, + "loss": 0.3511, + "step": 84590 + }, + { + "epoch": 2.17, + "learning_rate": 3.7690277258702575e-07, + "loss": 0.2913, + "step": 84591 + }, + { + "epoch": 2.17, + "learning_rate": 3.768811305353119e-07, + "loss": 0.4023, + "step": 84592 + }, + { + "epoch": 2.17, + "learning_rate": 3.7685948896069153e-07, + "loss": 0.4185, + "step": 84593 + }, + { + "epoch": 2.17, + "learning_rate": 3.7683784786318084e-07, + "loss": 0.3792, + "step": 84594 + }, + { + "epoch": 2.17, + "learning_rate": 3.768162072427968e-07, + "loss": 0.3728, + "step": 84595 + }, + { + "epoch": 2.17, + "learning_rate": 3.7679456709955625e-07, + "loss": 0.3987, + "step": 84596 + }, + { + "epoch": 2.17, + "learning_rate": 3.7677292743347513e-07, + "loss": 0.3271, + "step": 84597 + }, + { + "epoch": 2.17, + "learning_rate": 3.767512882445704e-07, + "loss": 0.2659, + "step": 84598 + }, + { + "epoch": 2.17, + "learning_rate": 3.767296495328583e-07, + "loss": 0.325, + "step": 84599 + }, + { + "epoch": 2.17, + "learning_rate": 3.7670801129835627e-07, + "loss": 0.397, + "step": 84600 + }, + { + "epoch": 2.17, + "learning_rate": 3.7668637354107977e-07, + "loss": 0.4624, + "step": 84601 + }, + { + "epoch": 2.17, + "learning_rate": 3.766647362610459e-07, + "loss": 0.5234, + "step": 84602 + }, + { + "epoch": 2.17, + "learning_rate": 3.7664309945827143e-07, + "loss": 0.5015, + "step": 84603 + }, + { + "epoch": 2.17, + "learning_rate": 3.766214631327724e-07, + "loss": 0.4067, + "step": 84604 + }, + { + "epoch": 2.17, + "learning_rate": 3.765998272845661e-07, + "loss": 0.3562, + "step": 84605 + }, + { + "epoch": 2.17, + "learning_rate": 3.7657819191366813e-07, + "loss": 0.4109, + "step": 84606 + }, + { + "epoch": 2.17, + "learning_rate": 3.765565570200957e-07, + "loss": 0.2994, + "step": 84607 + }, + { + "epoch": 2.17, + "learning_rate": 3.765349226038652e-07, + "loss": 0.4009, + "step": 84608 + }, + { + "epoch": 2.17, + "learning_rate": 3.7651328866499354e-07, + "loss": 0.3679, + "step": 84609 + }, + { + "epoch": 2.17, + "learning_rate": 3.764916552034967e-07, + "loss": 0.4312, + "step": 84610 + }, + { + "epoch": 2.17, + "learning_rate": 3.764700222193915e-07, + "loss": 0.3489, + "step": 84611 + }, + { + "epoch": 2.17, + "learning_rate": 3.7644838971269457e-07, + "loss": 0.3726, + "step": 84612 + }, + { + "epoch": 2.17, + "learning_rate": 3.764267576834231e-07, + "loss": 0.4048, + "step": 84613 + }, + { + "epoch": 2.17, + "learning_rate": 3.7640512613159225e-07, + "loss": 0.4375, + "step": 84614 + }, + { + "epoch": 2.17, + "learning_rate": 3.7638349505721947e-07, + "loss": 0.5381, + "step": 84615 + }, + { + "epoch": 2.17, + "learning_rate": 3.76361864460321e-07, + "loss": 0.4058, + "step": 84616 + }, + { + "epoch": 2.17, + "learning_rate": 3.76340234340914e-07, + "loss": 0.3276, + "step": 84617 + }, + { + "epoch": 2.17, + "learning_rate": 3.763186046990142e-07, + "loss": 0.3284, + "step": 84618 + }, + { + "epoch": 2.17, + "learning_rate": 3.7629697553463866e-07, + "loss": 0.355, + "step": 84619 + }, + { + "epoch": 2.17, + "learning_rate": 3.7627534684780384e-07, + "loss": 0.4067, + "step": 84620 + }, + { + "epoch": 2.17, + "learning_rate": 3.762537186385266e-07, + "loss": 0.3448, + "step": 84621 + }, + { + "epoch": 2.17, + "learning_rate": 3.76232090906823e-07, + "loss": 0.4688, + "step": 84622 + }, + { + "epoch": 2.17, + "learning_rate": 3.762104636527099e-07, + "loss": 0.4268, + "step": 84623 + }, + { + "epoch": 2.17, + "learning_rate": 3.7618883687620365e-07, + "loss": 0.3193, + "step": 84624 + }, + { + "epoch": 2.17, + "learning_rate": 3.761672105773208e-07, + "loss": 0.5254, + "step": 84625 + }, + { + "epoch": 2.17, + "learning_rate": 3.761455847560784e-07, + "loss": 0.5107, + "step": 84626 + }, + { + "epoch": 2.17, + "learning_rate": 3.761239594124923e-07, + "loss": 0.2996, + "step": 84627 + }, + { + "epoch": 2.17, + "learning_rate": 3.761023345465794e-07, + "loss": 0.3818, + "step": 84628 + }, + { + "epoch": 2.17, + "learning_rate": 3.760807101583563e-07, + "loss": 0.3403, + "step": 84629 + }, + { + "epoch": 2.17, + "learning_rate": 3.760590862478398e-07, + "loss": 0.3234, + "step": 84630 + }, + { + "epoch": 2.17, + "learning_rate": 3.760374628150458e-07, + "loss": 0.4614, + "step": 84631 + }, + { + "epoch": 2.17, + "learning_rate": 3.760158398599913e-07, + "loss": 0.4917, + "step": 84632 + }, + { + "epoch": 2.17, + "learning_rate": 3.75994217382693e-07, + "loss": 0.2502, + "step": 84633 + }, + { + "epoch": 2.17, + "learning_rate": 3.759725953831674e-07, + "loss": 0.4272, + "step": 84634 + }, + { + "epoch": 2.17, + "learning_rate": 3.759509738614304e-07, + "loss": 0.2732, + "step": 84635 + }, + { + "epoch": 2.17, + "learning_rate": 3.7592935281749917e-07, + "loss": 0.4751, + "step": 84636 + }, + { + "epoch": 2.17, + "learning_rate": 3.759077322513901e-07, + "loss": 0.2689, + "step": 84637 + }, + { + "epoch": 2.17, + "learning_rate": 3.7588611216312006e-07, + "loss": 0.4087, + "step": 84638 + }, + { + "epoch": 2.17, + "learning_rate": 3.75864492552705e-07, + "loss": 0.4272, + "step": 84639 + }, + { + "epoch": 2.17, + "learning_rate": 3.7584287342016185e-07, + "loss": 0.3263, + "step": 84640 + }, + { + "epoch": 2.17, + "learning_rate": 3.7582125476550707e-07, + "loss": 0.478, + "step": 84641 + }, + { + "epoch": 2.17, + "learning_rate": 3.757996365887576e-07, + "loss": 0.564, + "step": 84642 + }, + { + "epoch": 2.17, + "learning_rate": 3.7577801888992966e-07, + "loss": 0.3547, + "step": 84643 + }, + { + "epoch": 2.17, + "learning_rate": 3.7575640166903945e-07, + "loss": 0.5049, + "step": 84644 + }, + { + "epoch": 2.17, + "learning_rate": 3.757347849261039e-07, + "loss": 0.3542, + "step": 84645 + }, + { + "epoch": 2.17, + "learning_rate": 3.7571316866113947e-07, + "loss": 0.3582, + "step": 84646 + }, + { + "epoch": 2.17, + "learning_rate": 3.756915528741631e-07, + "loss": 0.2747, + "step": 84647 + }, + { + "epoch": 2.17, + "learning_rate": 3.7566993756519074e-07, + "loss": 0.4648, + "step": 84648 + }, + { + "epoch": 2.17, + "learning_rate": 3.756483227342391e-07, + "loss": 0.3264, + "step": 84649 + }, + { + "epoch": 2.17, + "learning_rate": 3.7562670838132513e-07, + "loss": 0.4233, + "step": 84650 + }, + { + "epoch": 2.17, + "learning_rate": 3.756050945064648e-07, + "loss": 0.2933, + "step": 84651 + }, + { + "epoch": 2.17, + "learning_rate": 3.755834811096751e-07, + "loss": 0.259, + "step": 84652 + }, + { + "epoch": 2.17, + "learning_rate": 3.755618681909726e-07, + "loss": 0.4214, + "step": 84653 + }, + { + "epoch": 2.17, + "learning_rate": 3.755402557503733e-07, + "loss": 0.4346, + "step": 84654 + }, + { + "epoch": 2.17, + "learning_rate": 3.7551864378789445e-07, + "loss": 0.5557, + "step": 84655 + }, + { + "epoch": 2.17, + "learning_rate": 3.75497032303552e-07, + "loss": 0.3275, + "step": 84656 + }, + { + "epoch": 2.17, + "learning_rate": 3.7547542129736265e-07, + "loss": 0.3848, + "step": 84657 + }, + { + "epoch": 2.17, + "learning_rate": 3.7545381076934313e-07, + "loss": 0.4062, + "step": 84658 + }, + { + "epoch": 2.17, + "learning_rate": 3.754322007195103e-07, + "loss": 0.4712, + "step": 84659 + }, + { + "epoch": 2.17, + "learning_rate": 3.7541059114787985e-07, + "loss": 0.3774, + "step": 84660 + }, + { + "epoch": 2.17, + "learning_rate": 3.753889820544689e-07, + "loss": 0.2917, + "step": 84661 + }, + { + "epoch": 2.17, + "learning_rate": 3.753673734392938e-07, + "loss": 0.4016, + "step": 84662 + }, + { + "epoch": 2.17, + "learning_rate": 3.753457653023716e-07, + "loss": 0.3945, + "step": 84663 + }, + { + "epoch": 2.17, + "learning_rate": 3.753241576437184e-07, + "loss": 0.3799, + "step": 84664 + }, + { + "epoch": 2.17, + "learning_rate": 3.7530255046335044e-07, + "loss": 0.4167, + "step": 84665 + }, + { + "epoch": 2.17, + "learning_rate": 3.752809437612845e-07, + "loss": 0.3349, + "step": 84666 + }, + { + "epoch": 2.17, + "learning_rate": 3.752593375375377e-07, + "loss": 0.4351, + "step": 84667 + }, + { + "epoch": 2.17, + "learning_rate": 3.752377317921257e-07, + "loss": 0.3789, + "step": 84668 + }, + { + "epoch": 2.17, + "learning_rate": 3.752161265250654e-07, + "loss": 0.3486, + "step": 84669 + }, + { + "epoch": 2.17, + "learning_rate": 3.7519452173637334e-07, + "loss": 0.479, + "step": 84670 + }, + { + "epoch": 2.17, + "learning_rate": 3.751729174260666e-07, + "loss": 0.2671, + "step": 84671 + }, + { + "epoch": 2.17, + "learning_rate": 3.7515131359416076e-07, + "loss": 0.3613, + "step": 84672 + }, + { + "epoch": 2.17, + "learning_rate": 3.751297102406732e-07, + "loss": 0.5107, + "step": 84673 + }, + { + "epoch": 2.17, + "learning_rate": 3.751081073656198e-07, + "loss": 0.5649, + "step": 84674 + }, + { + "epoch": 2.17, + "learning_rate": 3.7508650496901726e-07, + "loss": 0.3904, + "step": 84675 + }, + { + "epoch": 2.17, + "learning_rate": 3.750649030508828e-07, + "loss": 0.36, + "step": 84676 + }, + { + "epoch": 2.17, + "learning_rate": 3.7504330161123185e-07, + "loss": 0.3782, + "step": 84677 + }, + { + "epoch": 2.17, + "learning_rate": 3.7502170065008165e-07, + "loss": 0.2546, + "step": 84678 + }, + { + "epoch": 2.17, + "learning_rate": 3.750001001674485e-07, + "loss": 0.3726, + "step": 84679 + }, + { + "epoch": 2.17, + "learning_rate": 3.749785001633494e-07, + "loss": 0.4072, + "step": 84680 + }, + { + "epoch": 2.17, + "learning_rate": 3.749569006378003e-07, + "loss": 0.5273, + "step": 84681 + }, + { + "epoch": 2.17, + "learning_rate": 3.7493530159081786e-07, + "loss": 0.458, + "step": 84682 + }, + { + "epoch": 2.17, + "learning_rate": 3.749137030224191e-07, + "loss": 0.4536, + "step": 84683 + }, + { + "epoch": 2.17, + "learning_rate": 3.748921049326201e-07, + "loss": 0.353, + "step": 84684 + }, + { + "epoch": 2.17, + "learning_rate": 3.748705073214372e-07, + "loss": 0.3923, + "step": 84685 + }, + { + "epoch": 2.17, + "learning_rate": 3.748489101888872e-07, + "loss": 0.4146, + "step": 84686 + }, + { + "epoch": 2.17, + "learning_rate": 3.748273135349865e-07, + "loss": 0.4106, + "step": 84687 + }, + { + "epoch": 2.17, + "learning_rate": 3.748057173597523e-07, + "loss": 0.3882, + "step": 84688 + }, + { + "epoch": 2.17, + "learning_rate": 3.7478412166320027e-07, + "loss": 0.4336, + "step": 84689 + }, + { + "epoch": 2.17, + "learning_rate": 3.747625264453472e-07, + "loss": 0.3655, + "step": 84690 + }, + { + "epoch": 2.17, + "learning_rate": 3.7474093170620977e-07, + "loss": 0.3457, + "step": 84691 + }, + { + "epoch": 2.17, + "learning_rate": 3.7471933744580476e-07, + "loss": 0.5137, + "step": 84692 + }, + { + "epoch": 2.17, + "learning_rate": 3.7469774366414853e-07, + "loss": 0.4209, + "step": 84693 + }, + { + "epoch": 2.17, + "learning_rate": 3.74676150361257e-07, + "loss": 0.4033, + "step": 84694 + }, + { + "epoch": 2.17, + "learning_rate": 3.7465455753714726e-07, + "loss": 0.4878, + "step": 84695 + }, + { + "epoch": 2.17, + "learning_rate": 3.7463296519183573e-07, + "loss": 0.3315, + "step": 84696 + }, + { + "epoch": 2.17, + "learning_rate": 3.746113733253393e-07, + "loss": 0.4995, + "step": 84697 + }, + { + "epoch": 2.17, + "learning_rate": 3.7458978193767386e-07, + "loss": 0.3379, + "step": 84698 + }, + { + "epoch": 2.17, + "learning_rate": 3.745681910288563e-07, + "loss": 0.479, + "step": 84699 + }, + { + "epoch": 2.17, + "learning_rate": 3.745466005989031e-07, + "loss": 0.323, + "step": 84700 + }, + { + "epoch": 2.17, + "learning_rate": 3.7452501064783114e-07, + "loss": 0.437, + "step": 84701 + }, + { + "epoch": 2.17, + "learning_rate": 3.7450342117565636e-07, + "loss": 0.4194, + "step": 84702 + }, + { + "epoch": 2.17, + "learning_rate": 3.744818321823958e-07, + "loss": 0.3352, + "step": 84703 + }, + { + "epoch": 2.17, + "learning_rate": 3.744602436680654e-07, + "loss": 0.2561, + "step": 84704 + }, + { + "epoch": 2.17, + "learning_rate": 3.744386556326824e-07, + "loss": 0.4741, + "step": 84705 + }, + { + "epoch": 2.17, + "learning_rate": 3.744170680762626e-07, + "loss": 0.416, + "step": 84706 + }, + { + "epoch": 2.17, + "learning_rate": 3.743954809988229e-07, + "loss": 0.4546, + "step": 84707 + }, + { + "epoch": 2.17, + "learning_rate": 3.743738944003798e-07, + "loss": 0.4565, + "step": 84708 + }, + { + "epoch": 2.17, + "learning_rate": 3.743523082809502e-07, + "loss": 0.3687, + "step": 84709 + }, + { + "epoch": 2.17, + "learning_rate": 3.743307226405499e-07, + "loss": 0.5786, + "step": 84710 + }, + { + "epoch": 2.17, + "learning_rate": 3.743091374791958e-07, + "loss": 0.4507, + "step": 84711 + }, + { + "epoch": 2.17, + "learning_rate": 3.742875527969045e-07, + "loss": 0.3911, + "step": 84712 + }, + { + "epoch": 2.17, + "learning_rate": 3.7426596859369277e-07, + "loss": 0.5259, + "step": 84713 + }, + { + "epoch": 2.17, + "learning_rate": 3.7424438486957664e-07, + "loss": 0.4092, + "step": 84714 + }, + { + "epoch": 2.17, + "learning_rate": 3.7422280162457263e-07, + "loss": 0.4072, + "step": 84715 + }, + { + "epoch": 2.17, + "learning_rate": 3.7420121885869746e-07, + "loss": 0.3657, + "step": 84716 + }, + { + "epoch": 2.17, + "learning_rate": 3.741796365719676e-07, + "loss": 0.4309, + "step": 84717 + }, + { + "epoch": 2.17, + "learning_rate": 3.741580547644e-07, + "loss": 0.3153, + "step": 84718 + }, + { + "epoch": 2.17, + "learning_rate": 3.741364734360104e-07, + "loss": 0.4834, + "step": 84719 + }, + { + "epoch": 2.17, + "learning_rate": 3.741148925868157e-07, + "loss": 0.5493, + "step": 84720 + }, + { + "epoch": 2.17, + "learning_rate": 3.7409331221683284e-07, + "loss": 0.3979, + "step": 84721 + }, + { + "epoch": 2.17, + "learning_rate": 3.7407173232607756e-07, + "loss": 0.459, + "step": 84722 + }, + { + "epoch": 2.17, + "learning_rate": 3.740501529145672e-07, + "loss": 0.439, + "step": 84723 + }, + { + "epoch": 2.17, + "learning_rate": 3.740285739823175e-07, + "loss": 0.4326, + "step": 84724 + }, + { + "epoch": 2.17, + "learning_rate": 3.7400699552934536e-07, + "loss": 0.3799, + "step": 84725 + }, + { + "epoch": 2.17, + "learning_rate": 3.739854175556676e-07, + "loss": 0.4227, + "step": 84726 + }, + { + "epoch": 2.17, + "learning_rate": 3.739638400613e-07, + "loss": 0.4502, + "step": 84727 + }, + { + "epoch": 2.17, + "learning_rate": 3.739422630462595e-07, + "loss": 0.3982, + "step": 84728 + }, + { + "epoch": 2.17, + "learning_rate": 3.7392068651056277e-07, + "loss": 0.4067, + "step": 84729 + }, + { + "epoch": 2.17, + "learning_rate": 3.738991104542264e-07, + "loss": 0.3618, + "step": 84730 + }, + { + "epoch": 2.17, + "learning_rate": 3.7387753487726637e-07, + "loss": 0.4321, + "step": 84731 + }, + { + "epoch": 2.17, + "learning_rate": 3.7385595977969954e-07, + "loss": 0.4082, + "step": 84732 + }, + { + "epoch": 2.17, + "learning_rate": 3.7383438516154277e-07, + "loss": 0.3065, + "step": 84733 + }, + { + "epoch": 2.17, + "learning_rate": 3.7381281102281183e-07, + "loss": 0.2838, + "step": 84734 + }, + { + "epoch": 2.17, + "learning_rate": 3.7379123736352404e-07, + "loss": 0.2582, + "step": 84735 + }, + { + "epoch": 2.17, + "learning_rate": 3.73769664183695e-07, + "loss": 0.2854, + "step": 84736 + }, + { + "epoch": 2.17, + "learning_rate": 3.7374809148334186e-07, + "loss": 0.2902, + "step": 84737 + }, + { + "epoch": 2.17, + "learning_rate": 3.7372651926248135e-07, + "loss": 0.4097, + "step": 84738 + }, + { + "epoch": 2.17, + "learning_rate": 3.7370494752112936e-07, + "loss": 0.4473, + "step": 84739 + }, + { + "epoch": 2.17, + "learning_rate": 3.736833762593026e-07, + "loss": 0.3267, + "step": 84740 + }, + { + "epoch": 2.17, + "learning_rate": 3.7366180547701773e-07, + "loss": 0.4414, + "step": 84741 + }, + { + "epoch": 2.17, + "learning_rate": 3.7364023517429154e-07, + "loss": 0.2566, + "step": 84742 + }, + { + "epoch": 2.17, + "learning_rate": 3.7361866535114016e-07, + "loss": 0.3716, + "step": 84743 + }, + { + "epoch": 2.17, + "learning_rate": 3.7359709600757995e-07, + "loss": 0.5322, + "step": 84744 + }, + { + "epoch": 2.17, + "learning_rate": 3.735755271436275e-07, + "loss": 0.5723, + "step": 84745 + }, + { + "epoch": 2.17, + "learning_rate": 3.735539587592996e-07, + "loss": 0.4658, + "step": 84746 + }, + { + "epoch": 2.17, + "learning_rate": 3.7353239085461286e-07, + "loss": 0.3896, + "step": 84747 + }, + { + "epoch": 2.17, + "learning_rate": 3.735108234295833e-07, + "loss": 0.3877, + "step": 84748 + }, + { + "epoch": 2.17, + "learning_rate": 3.734892564842277e-07, + "loss": 0.4604, + "step": 84749 + }, + { + "epoch": 2.17, + "learning_rate": 3.7346769001856247e-07, + "loss": 0.4194, + "step": 84750 + }, + { + "epoch": 2.17, + "learning_rate": 3.7344612403260465e-07, + "loss": 0.2966, + "step": 84751 + }, + { + "epoch": 2.17, + "learning_rate": 3.7342455852637e-07, + "loss": 0.377, + "step": 84752 + }, + { + "epoch": 2.17, + "learning_rate": 3.734029934998757e-07, + "loss": 0.4219, + "step": 84753 + }, + { + "epoch": 2.17, + "learning_rate": 3.733814289531375e-07, + "loss": 0.4924, + "step": 84754 + }, + { + "epoch": 2.17, + "learning_rate": 3.733598648861723e-07, + "loss": 0.4258, + "step": 84755 + }, + { + "epoch": 2.17, + "learning_rate": 3.7333830129899714e-07, + "loss": 0.3794, + "step": 84756 + }, + { + "epoch": 2.17, + "learning_rate": 3.733167381916276e-07, + "loss": 0.3882, + "step": 84757 + }, + { + "epoch": 2.17, + "learning_rate": 3.7329517556408054e-07, + "loss": 0.3195, + "step": 84758 + }, + { + "epoch": 2.17, + "learning_rate": 3.73273613416373e-07, + "loss": 0.4434, + "step": 84759 + }, + { + "epoch": 2.17, + "learning_rate": 3.732520517485206e-07, + "loss": 0.4277, + "step": 84760 + }, + { + "epoch": 2.17, + "learning_rate": 3.7323049056054035e-07, + "loss": 0.3767, + "step": 84761 + }, + { + "epoch": 2.17, + "learning_rate": 3.732089298524487e-07, + "loss": 0.5054, + "step": 84762 + }, + { + "epoch": 2.17, + "learning_rate": 3.7318736962426244e-07, + "loss": 0.4541, + "step": 84763 + }, + { + "epoch": 2.17, + "learning_rate": 3.7316580987599776e-07, + "loss": 0.2854, + "step": 84764 + }, + { + "epoch": 2.17, + "learning_rate": 3.7314425060767094e-07, + "loss": 0.5415, + "step": 84765 + }, + { + "epoch": 2.17, + "learning_rate": 3.7312269181929867e-07, + "loss": 0.3949, + "step": 84766 + }, + { + "epoch": 2.17, + "learning_rate": 3.7310113351089767e-07, + "loss": 0.3833, + "step": 84767 + }, + { + "epoch": 2.17, + "learning_rate": 3.730795756824845e-07, + "loss": 0.5723, + "step": 84768 + }, + { + "epoch": 2.17, + "learning_rate": 3.7305801833407524e-07, + "loss": 0.3901, + "step": 84769 + }, + { + "epoch": 2.17, + "learning_rate": 3.730364614656866e-07, + "loss": 0.4214, + "step": 84770 + }, + { + "epoch": 2.17, + "learning_rate": 3.7301490507733504e-07, + "loss": 0.3138, + "step": 84771 + }, + { + "epoch": 2.17, + "learning_rate": 3.729933491690375e-07, + "loss": 0.3546, + "step": 84772 + }, + { + "epoch": 2.17, + "learning_rate": 3.729717937408101e-07, + "loss": 0.3655, + "step": 84773 + }, + { + "epoch": 2.17, + "learning_rate": 3.729502387926692e-07, + "loss": 0.4648, + "step": 84774 + }, + { + "epoch": 2.17, + "learning_rate": 3.7292868432463134e-07, + "loss": 0.4897, + "step": 84775 + }, + { + "epoch": 2.17, + "learning_rate": 3.7290713033671337e-07, + "loss": 0.421, + "step": 84776 + }, + { + "epoch": 2.17, + "learning_rate": 3.728855768289314e-07, + "loss": 0.4048, + "step": 84777 + }, + { + "epoch": 2.17, + "learning_rate": 3.728640238013021e-07, + "loss": 0.3921, + "step": 84778 + }, + { + "epoch": 2.17, + "learning_rate": 3.728424712538419e-07, + "loss": 0.3896, + "step": 84779 + }, + { + "epoch": 2.17, + "learning_rate": 3.7282091918656777e-07, + "loss": 0.3877, + "step": 84780 + }, + { + "epoch": 2.17, + "learning_rate": 3.727993675994955e-07, + "loss": 0.2597, + "step": 84781 + }, + { + "epoch": 2.17, + "learning_rate": 3.7277781649264193e-07, + "loss": 0.3379, + "step": 84782 + }, + { + "epoch": 2.17, + "learning_rate": 3.727562658660238e-07, + "loss": 0.2605, + "step": 84783 + }, + { + "epoch": 2.17, + "learning_rate": 3.7273471571965707e-07, + "loss": 0.5, + "step": 84784 + }, + { + "epoch": 2.17, + "learning_rate": 3.7271316605355896e-07, + "loss": 0.4424, + "step": 84785 + }, + { + "epoch": 2.17, + "learning_rate": 3.726916168677451e-07, + "loss": 0.5049, + "step": 84786 + }, + { + "epoch": 2.17, + "learning_rate": 3.7267006816223243e-07, + "loss": 0.4224, + "step": 84787 + }, + { + "epoch": 2.17, + "learning_rate": 3.7264851993703736e-07, + "loss": 0.4663, + "step": 84788 + }, + { + "epoch": 2.17, + "learning_rate": 3.72626972192177e-07, + "loss": 0.4644, + "step": 84789 + }, + { + "epoch": 2.17, + "learning_rate": 3.726054249276668e-07, + "loss": 0.4321, + "step": 84790 + }, + { + "epoch": 2.17, + "learning_rate": 3.7258387814352386e-07, + "loss": 0.4438, + "step": 84791 + }, + { + "epoch": 2.17, + "learning_rate": 3.725623318397646e-07, + "loss": 0.4172, + "step": 84792 + }, + { + "epoch": 2.17, + "learning_rate": 3.7254078601640615e-07, + "loss": 0.4238, + "step": 84793 + }, + { + "epoch": 2.17, + "learning_rate": 3.725192406734637e-07, + "loss": 0.3722, + "step": 84794 + }, + { + "epoch": 2.17, + "learning_rate": 3.7249769581095446e-07, + "loss": 0.3252, + "step": 84795 + }, + { + "epoch": 2.17, + "learning_rate": 3.724761514288949e-07, + "loss": 0.4893, + "step": 84796 + }, + { + "epoch": 2.17, + "learning_rate": 3.7245460752730174e-07, + "loss": 0.4209, + "step": 84797 + }, + { + "epoch": 2.17, + "learning_rate": 3.7243306410619104e-07, + "loss": 0.5132, + "step": 84798 + }, + { + "epoch": 2.17, + "learning_rate": 3.7241152116557927e-07, + "loss": 0.3945, + "step": 84799 + }, + { + "epoch": 2.17, + "learning_rate": 3.723899787054833e-07, + "loss": 0.4844, + "step": 84800 + }, + { + "epoch": 2.17, + "learning_rate": 3.7236843672591977e-07, + "loss": 0.3821, + "step": 84801 + }, + { + "epoch": 2.17, + "learning_rate": 3.7234689522690454e-07, + "loss": 0.4197, + "step": 84802 + }, + { + "epoch": 2.17, + "learning_rate": 3.723253542084548e-07, + "loss": 0.3938, + "step": 84803 + }, + { + "epoch": 2.17, + "learning_rate": 3.723038136705863e-07, + "loss": 0.3706, + "step": 84804 + }, + { + "epoch": 2.17, + "learning_rate": 3.722822736133159e-07, + "loss": 0.4282, + "step": 84805 + }, + { + "epoch": 2.17, + "learning_rate": 3.7226073403666037e-07, + "loss": 0.3386, + "step": 84806 + }, + { + "epoch": 2.17, + "learning_rate": 3.722391949406356e-07, + "loss": 0.3064, + "step": 84807 + }, + { + "epoch": 2.17, + "learning_rate": 3.722176563252585e-07, + "loss": 0.3682, + "step": 84808 + }, + { + "epoch": 2.17, + "learning_rate": 3.721961181905455e-07, + "loss": 0.4443, + "step": 84809 + }, + { + "epoch": 2.17, + "learning_rate": 3.721745805365133e-07, + "loss": 0.3572, + "step": 84810 + }, + { + "epoch": 2.17, + "learning_rate": 3.7215304336317785e-07, + "loss": 0.2302, + "step": 84811 + }, + { + "epoch": 2.17, + "learning_rate": 3.7213150667055606e-07, + "loss": 0.3623, + "step": 84812 + }, + { + "epoch": 2.17, + "learning_rate": 3.7210997045866454e-07, + "loss": 0.4243, + "step": 84813 + }, + { + "epoch": 2.17, + "learning_rate": 3.720884347275195e-07, + "loss": 0.4727, + "step": 84814 + }, + { + "epoch": 2.17, + "learning_rate": 3.720668994771372e-07, + "loss": 0.3975, + "step": 84815 + }, + { + "epoch": 2.17, + "learning_rate": 3.720453647075343e-07, + "loss": 0.479, + "step": 84816 + }, + { + "epoch": 2.17, + "learning_rate": 3.7202383041872755e-07, + "loss": 0.311, + "step": 84817 + }, + { + "epoch": 2.17, + "learning_rate": 3.720022966107336e-07, + "loss": 0.3118, + "step": 84818 + }, + { + "epoch": 2.17, + "learning_rate": 3.719807632835682e-07, + "loss": 0.3784, + "step": 84819 + }, + { + "epoch": 2.17, + "learning_rate": 3.719592304372483e-07, + "loss": 0.3906, + "step": 84820 + }, + { + "epoch": 2.17, + "learning_rate": 3.719376980717903e-07, + "loss": 0.4502, + "step": 84821 + }, + { + "epoch": 2.17, + "learning_rate": 3.71916166187211e-07, + "loss": 0.4127, + "step": 84822 + }, + { + "epoch": 2.17, + "learning_rate": 3.7189463478352676e-07, + "loss": 0.3881, + "step": 84823 + }, + { + "epoch": 2.17, + "learning_rate": 3.7187310386075354e-07, + "loss": 0.4021, + "step": 84824 + }, + { + "epoch": 2.17, + "learning_rate": 3.7185157341890816e-07, + "loss": 0.3862, + "step": 84825 + }, + { + "epoch": 2.17, + "learning_rate": 3.718300434580072e-07, + "loss": 0.5664, + "step": 84826 + }, + { + "epoch": 2.17, + "learning_rate": 3.7180851397806735e-07, + "loss": 0.4604, + "step": 84827 + }, + { + "epoch": 2.17, + "learning_rate": 3.7178698497910454e-07, + "loss": 0.3279, + "step": 84828 + }, + { + "epoch": 2.17, + "learning_rate": 3.7176545646113546e-07, + "loss": 0.374, + "step": 84829 + }, + { + "epoch": 2.17, + "learning_rate": 3.7174392842417713e-07, + "loss": 0.3374, + "step": 84830 + }, + { + "epoch": 2.17, + "learning_rate": 3.7172240086824527e-07, + "loss": 0.416, + "step": 84831 + }, + { + "epoch": 2.17, + "learning_rate": 3.717008737933569e-07, + "loss": 0.5447, + "step": 84832 + }, + { + "epoch": 2.17, + "learning_rate": 3.716793471995281e-07, + "loss": 0.396, + "step": 84833 + }, + { + "epoch": 2.17, + "learning_rate": 3.7165782108677537e-07, + "loss": 0.3301, + "step": 84834 + }, + { + "epoch": 2.17, + "learning_rate": 3.7163629545511574e-07, + "loss": 0.3264, + "step": 84835 + }, + { + "epoch": 2.17, + "learning_rate": 3.71614770304565e-07, + "loss": 0.4302, + "step": 84836 + }, + { + "epoch": 2.17, + "learning_rate": 3.7159324563513995e-07, + "loss": 0.2568, + "step": 84837 + }, + { + "epoch": 2.17, + "learning_rate": 3.7157172144685714e-07, + "loss": 0.458, + "step": 84838 + }, + { + "epoch": 2.17, + "learning_rate": 3.715501977397332e-07, + "loss": 0.4526, + "step": 84839 + }, + { + "epoch": 2.17, + "learning_rate": 3.71528674513784e-07, + "loss": 0.4326, + "step": 84840 + }, + { + "epoch": 2.17, + "learning_rate": 3.7150715176902646e-07, + "loss": 0.4121, + "step": 84841 + }, + { + "epoch": 2.17, + "learning_rate": 3.7148562950547726e-07, + "loss": 0.3381, + "step": 84842 + }, + { + "epoch": 2.17, + "learning_rate": 3.714641077231524e-07, + "loss": 0.3418, + "step": 84843 + }, + { + "epoch": 2.17, + "learning_rate": 3.7144258642206885e-07, + "loss": 0.4111, + "step": 84844 + }, + { + "epoch": 2.17, + "learning_rate": 3.714210656022424e-07, + "loss": 0.3413, + "step": 84845 + }, + { + "epoch": 2.17, + "learning_rate": 3.7139954526369e-07, + "loss": 0.5479, + "step": 84846 + }, + { + "epoch": 2.17, + "learning_rate": 3.713780254064284e-07, + "loss": 0.3625, + "step": 84847 + }, + { + "epoch": 2.17, + "learning_rate": 3.7135650603047343e-07, + "loss": 0.4761, + "step": 84848 + }, + { + "epoch": 2.17, + "learning_rate": 3.7133498713584176e-07, + "loss": 0.4614, + "step": 84849 + }, + { + "epoch": 2.17, + "learning_rate": 3.713134687225501e-07, + "loss": 0.417, + "step": 84850 + }, + { + "epoch": 2.17, + "learning_rate": 3.7129195079061517e-07, + "loss": 0.4624, + "step": 84851 + }, + { + "epoch": 2.17, + "learning_rate": 3.71270433340053e-07, + "loss": 0.415, + "step": 84852 + }, + { + "epoch": 2.17, + "learning_rate": 3.7124891637087987e-07, + "loss": 0.4106, + "step": 84853 + }, + { + "epoch": 2.17, + "learning_rate": 3.712273998831125e-07, + "loss": 0.3723, + "step": 84854 + }, + { + "epoch": 2.17, + "learning_rate": 3.7120588387676745e-07, + "loss": 0.4312, + "step": 84855 + }, + { + "epoch": 2.17, + "learning_rate": 3.711843683518614e-07, + "loss": 0.5679, + "step": 84856 + }, + { + "epoch": 2.17, + "learning_rate": 3.711628533084102e-07, + "loss": 0.3704, + "step": 84857 + }, + { + "epoch": 2.17, + "learning_rate": 3.7114133874643085e-07, + "loss": 0.3945, + "step": 84858 + }, + { + "epoch": 2.17, + "learning_rate": 3.711198246659395e-07, + "loss": 0.3896, + "step": 84859 + }, + { + "epoch": 2.18, + "learning_rate": 3.7109831106695324e-07, + "loss": 0.3921, + "step": 84860 + }, + { + "epoch": 2.18, + "learning_rate": 3.7107679794948766e-07, + "loss": 0.3752, + "step": 84861 + }, + { + "epoch": 2.18, + "learning_rate": 3.710552853135601e-07, + "loss": 0.3501, + "step": 84862 + }, + { + "epoch": 2.18, + "learning_rate": 3.7103377315918617e-07, + "loss": 0.4297, + "step": 84863 + }, + { + "epoch": 2.18, + "learning_rate": 3.710122614863831e-07, + "loss": 0.31, + "step": 84864 + }, + { + "epoch": 2.18, + "learning_rate": 3.7099075029516667e-07, + "loss": 0.3501, + "step": 84865 + }, + { + "epoch": 2.18, + "learning_rate": 3.709692395855537e-07, + "loss": 0.4053, + "step": 84866 + }, + { + "epoch": 2.18, + "learning_rate": 3.709477293575607e-07, + "loss": 0.3428, + "step": 84867 + }, + { + "epoch": 2.18, + "learning_rate": 3.709262196112044e-07, + "loss": 0.3894, + "step": 84868 + }, + { + "epoch": 2.18, + "learning_rate": 3.709047103465006e-07, + "loss": 0.377, + "step": 84869 + }, + { + "epoch": 2.18, + "learning_rate": 3.708832015634662e-07, + "loss": 0.3558, + "step": 84870 + }, + { + "epoch": 2.18, + "learning_rate": 3.708616932621176e-07, + "loss": 0.3123, + "step": 84871 + }, + { + "epoch": 2.18, + "learning_rate": 3.7084018544247163e-07, + "loss": 0.3513, + "step": 84872 + }, + { + "epoch": 2.18, + "learning_rate": 3.7081867810454436e-07, + "loss": 0.365, + "step": 84873 + }, + { + "epoch": 2.18, + "learning_rate": 3.70797171248352e-07, + "loss": 0.3391, + "step": 84874 + }, + { + "epoch": 2.18, + "learning_rate": 3.707756648739113e-07, + "loss": 0.4174, + "step": 84875 + }, + { + "epoch": 2.18, + "learning_rate": 3.7075415898123876e-07, + "loss": 0.3152, + "step": 84876 + }, + { + "epoch": 2.18, + "learning_rate": 3.707326535703511e-07, + "loss": 0.4482, + "step": 84877 + }, + { + "epoch": 2.18, + "learning_rate": 3.707111486412642e-07, + "loss": 0.3678, + "step": 84878 + }, + { + "epoch": 2.18, + "learning_rate": 3.7068964419399487e-07, + "loss": 0.4893, + "step": 84879 + }, + { + "epoch": 2.18, + "learning_rate": 3.706681402285594e-07, + "loss": 0.4707, + "step": 84880 + }, + { + "epoch": 2.18, + "learning_rate": 3.706466367449749e-07, + "loss": 0.4961, + "step": 84881 + }, + { + "epoch": 2.18, + "learning_rate": 3.7062513374325733e-07, + "loss": 0.3752, + "step": 84882 + }, + { + "epoch": 2.18, + "learning_rate": 3.7060363122342277e-07, + "loss": 0.3481, + "step": 84883 + }, + { + "epoch": 2.18, + "learning_rate": 3.7058212918548806e-07, + "loss": 0.4912, + "step": 84884 + }, + { + "epoch": 2.18, + "learning_rate": 3.7056062762947005e-07, + "loss": 0.4458, + "step": 84885 + }, + { + "epoch": 2.18, + "learning_rate": 3.7053912655538446e-07, + "loss": 0.3611, + "step": 84886 + }, + { + "epoch": 2.18, + "learning_rate": 3.705176259632481e-07, + "loss": 0.5264, + "step": 84887 + }, + { + "epoch": 2.18, + "learning_rate": 3.7049612585307744e-07, + "loss": 0.3589, + "step": 84888 + }, + { + "epoch": 2.18, + "learning_rate": 3.704746262248893e-07, + "loss": 0.4805, + "step": 84889 + }, + { + "epoch": 2.18, + "learning_rate": 3.7045312707869947e-07, + "loss": 0.3997, + "step": 84890 + }, + { + "epoch": 2.18, + "learning_rate": 3.704316284145247e-07, + "loss": 0.3589, + "step": 84891 + }, + { + "epoch": 2.18, + "learning_rate": 3.704101302323819e-07, + "loss": 0.342, + "step": 84892 + }, + { + "epoch": 2.18, + "learning_rate": 3.703886325322867e-07, + "loss": 0.4712, + "step": 84893 + }, + { + "epoch": 2.18, + "learning_rate": 3.7036713531425635e-07, + "loss": 0.417, + "step": 84894 + }, + { + "epoch": 2.18, + "learning_rate": 3.703456385783066e-07, + "loss": 0.3735, + "step": 84895 + }, + { + "epoch": 2.18, + "learning_rate": 3.703241423244542e-07, + "loss": 0.3618, + "step": 84896 + }, + { + "epoch": 2.18, + "learning_rate": 3.703026465527157e-07, + "loss": 0.3984, + "step": 84897 + }, + { + "epoch": 2.18, + "learning_rate": 3.7028115126310775e-07, + "loss": 0.4702, + "step": 84898 + }, + { + "epoch": 2.18, + "learning_rate": 3.702596564556464e-07, + "loss": 0.479, + "step": 84899 + }, + { + "epoch": 2.18, + "learning_rate": 3.702381621303482e-07, + "loss": 0.3645, + "step": 84900 + }, + { + "epoch": 2.18, + "learning_rate": 3.7021666828722996e-07, + "loss": 0.5024, + "step": 84901 + }, + { + "epoch": 2.18, + "learning_rate": 3.701951749263079e-07, + "loss": 0.5166, + "step": 84902 + }, + { + "epoch": 2.18, + "learning_rate": 3.701736820475981e-07, + "loss": 0.4012, + "step": 84903 + }, + { + "epoch": 2.18, + "learning_rate": 3.7015218965111737e-07, + "loss": 0.4121, + "step": 84904 + }, + { + "epoch": 2.18, + "learning_rate": 3.701306977368821e-07, + "loss": 0.5027, + "step": 84905 + }, + { + "epoch": 2.18, + "learning_rate": 3.7010920630490915e-07, + "loss": 0.3196, + "step": 84906 + }, + { + "epoch": 2.18, + "learning_rate": 3.700877153552143e-07, + "loss": 0.4624, + "step": 84907 + }, + { + "epoch": 2.18, + "learning_rate": 3.7006622488781424e-07, + "loss": 0.3766, + "step": 84908 + }, + { + "epoch": 2.18, + "learning_rate": 3.700447349027256e-07, + "loss": 0.5195, + "step": 84909 + }, + { + "epoch": 2.18, + "learning_rate": 3.700232453999651e-07, + "loss": 0.418, + "step": 84910 + }, + { + "epoch": 2.18, + "learning_rate": 3.7000175637954844e-07, + "loss": 0.4624, + "step": 84911 + }, + { + "epoch": 2.18, + "learning_rate": 3.699802678414928e-07, + "loss": 0.4136, + "step": 84912 + }, + { + "epoch": 2.18, + "learning_rate": 3.6995877978581404e-07, + "loss": 0.3635, + "step": 84913 + }, + { + "epoch": 2.18, + "learning_rate": 3.699372922125288e-07, + "loss": 0.5186, + "step": 84914 + }, + { + "epoch": 2.18, + "learning_rate": 3.699158051216539e-07, + "loss": 0.4438, + "step": 84915 + }, + { + "epoch": 2.18, + "learning_rate": 3.6989431851320517e-07, + "loss": 0.4521, + "step": 84916 + }, + { + "epoch": 2.18, + "learning_rate": 3.698728323871995e-07, + "loss": 0.4766, + "step": 84917 + }, + { + "epoch": 2.18, + "learning_rate": 3.6985134674365316e-07, + "loss": 0.2822, + "step": 84918 + }, + { + "epoch": 2.18, + "learning_rate": 3.69829861582583e-07, + "loss": 0.5386, + "step": 84919 + }, + { + "epoch": 2.18, + "learning_rate": 3.698083769040048e-07, + "loss": 0.3784, + "step": 84920 + }, + { + "epoch": 2.18, + "learning_rate": 3.697868927079353e-07, + "loss": 0.4409, + "step": 84921 + }, + { + "epoch": 2.18, + "learning_rate": 3.6976540899439135e-07, + "loss": 0.344, + "step": 84922 + }, + { + "epoch": 2.18, + "learning_rate": 3.697439257633891e-07, + "loss": 0.4087, + "step": 84923 + }, + { + "epoch": 2.18, + "learning_rate": 3.697224430149446e-07, + "loss": 0.3525, + "step": 84924 + }, + { + "epoch": 2.18, + "learning_rate": 3.697009607490746e-07, + "loss": 0.3542, + "step": 84925 + }, + { + "epoch": 2.18, + "learning_rate": 3.6967947896579567e-07, + "loss": 0.3098, + "step": 84926 + }, + { + "epoch": 2.18, + "learning_rate": 3.696579976651245e-07, + "loss": 0.3613, + "step": 84927 + }, + { + "epoch": 2.18, + "learning_rate": 3.6963651684707687e-07, + "loss": 0.4019, + "step": 84928 + }, + { + "epoch": 2.18, + "learning_rate": 3.6961503651166956e-07, + "loss": 0.3691, + "step": 84929 + }, + { + "epoch": 2.18, + "learning_rate": 3.69593556658919e-07, + "loss": 0.502, + "step": 84930 + }, + { + "epoch": 2.18, + "learning_rate": 3.695720772888421e-07, + "loss": 0.4468, + "step": 84931 + }, + { + "epoch": 2.18, + "learning_rate": 3.6955059840145473e-07, + "loss": 0.2987, + "step": 84932 + }, + { + "epoch": 2.18, + "learning_rate": 3.6952911999677327e-07, + "loss": 0.4402, + "step": 84933 + }, + { + "epoch": 2.18, + "learning_rate": 3.6950764207481434e-07, + "loss": 0.4531, + "step": 84934 + }, + { + "epoch": 2.18, + "learning_rate": 3.694861646355943e-07, + "loss": 0.3845, + "step": 84935 + }, + { + "epoch": 2.18, + "learning_rate": 3.694646876791302e-07, + "loss": 0.4321, + "step": 84936 + }, + { + "epoch": 2.18, + "learning_rate": 3.6944321120543763e-07, + "loss": 0.4331, + "step": 84937 + }, + { + "epoch": 2.18, + "learning_rate": 3.6942173521453336e-07, + "loss": 0.2831, + "step": 84938 + }, + { + "epoch": 2.18, + "learning_rate": 3.6940025970643416e-07, + "loss": 0.3511, + "step": 84939 + }, + { + "epoch": 2.18, + "learning_rate": 3.69378784681156e-07, + "loss": 0.4456, + "step": 84940 + }, + { + "epoch": 2.18, + "learning_rate": 3.693573101387154e-07, + "loss": 0.4243, + "step": 84941 + }, + { + "epoch": 2.18, + "learning_rate": 3.693358360791292e-07, + "loss": 0.4131, + "step": 84942 + }, + { + "epoch": 2.18, + "learning_rate": 3.693143625024133e-07, + "loss": 0.3798, + "step": 84943 + }, + { + "epoch": 2.18, + "learning_rate": 3.692928894085847e-07, + "loss": 0.3855, + "step": 84944 + }, + { + "epoch": 2.18, + "learning_rate": 3.6927141679765926e-07, + "loss": 0.3765, + "step": 84945 + }, + { + "epoch": 2.18, + "learning_rate": 3.6924994466965367e-07, + "loss": 0.5146, + "step": 84946 + }, + { + "epoch": 2.18, + "learning_rate": 3.692284730245844e-07, + "loss": 0.395, + "step": 84947 + }, + { + "epoch": 2.18, + "learning_rate": 3.692070018624681e-07, + "loss": 0.6177, + "step": 84948 + }, + { + "epoch": 2.18, + "learning_rate": 3.6918553118332083e-07, + "loss": 0.3694, + "step": 84949 + }, + { + "epoch": 2.18, + "learning_rate": 3.691640609871591e-07, + "loss": 0.4844, + "step": 84950 + }, + { + "epoch": 2.18, + "learning_rate": 3.691425912739994e-07, + "loss": 0.3057, + "step": 84951 + }, + { + "epoch": 2.18, + "learning_rate": 3.691211220438586e-07, + "loss": 0.3988, + "step": 84952 + }, + { + "epoch": 2.18, + "learning_rate": 3.6909965329675275e-07, + "loss": 0.4539, + "step": 84953 + }, + { + "epoch": 2.18, + "learning_rate": 3.6907818503269796e-07, + "loss": 0.3652, + "step": 84954 + }, + { + "epoch": 2.18, + "learning_rate": 3.6905671725171103e-07, + "loss": 0.3398, + "step": 84955 + }, + { + "epoch": 2.18, + "learning_rate": 3.6903524995380865e-07, + "loss": 0.4668, + "step": 84956 + }, + { + "epoch": 2.18, + "learning_rate": 3.6901378313900653e-07, + "loss": 0.4346, + "step": 84957 + }, + { + "epoch": 2.18, + "learning_rate": 3.6899231680732167e-07, + "loss": 0.4066, + "step": 84958 + }, + { + "epoch": 2.18, + "learning_rate": 3.689708509587703e-07, + "loss": 0.4521, + "step": 84959 + }, + { + "epoch": 2.18, + "learning_rate": 3.689493855933694e-07, + "loss": 0.4141, + "step": 84960 + }, + { + "epoch": 2.18, + "learning_rate": 3.6892792071113454e-07, + "loss": 0.4863, + "step": 84961 + }, + { + "epoch": 2.18, + "learning_rate": 3.689064563120828e-07, + "loss": 0.5464, + "step": 84962 + }, + { + "epoch": 2.18, + "learning_rate": 3.6888499239623016e-07, + "loss": 0.4795, + "step": 84963 + }, + { + "epoch": 2.18, + "learning_rate": 3.6886352896359317e-07, + "loss": 0.4937, + "step": 84964 + }, + { + "epoch": 2.18, + "learning_rate": 3.6884206601418874e-07, + "loss": 0.4229, + "step": 84965 + }, + { + "epoch": 2.18, + "learning_rate": 3.6882060354803255e-07, + "loss": 0.3218, + "step": 84966 + }, + { + "epoch": 2.18, + "learning_rate": 3.6879914156514147e-07, + "loss": 0.292, + "step": 84967 + }, + { + "epoch": 2.18, + "learning_rate": 3.6877768006553176e-07, + "loss": 0.4419, + "step": 84968 + }, + { + "epoch": 2.18, + "learning_rate": 3.6875621904922037e-07, + "loss": 0.4185, + "step": 84969 + }, + { + "epoch": 2.18, + "learning_rate": 3.6873475851622306e-07, + "loss": 0.4927, + "step": 84970 + }, + { + "epoch": 2.18, + "learning_rate": 3.687132984665564e-07, + "loss": 0.395, + "step": 84971 + }, + { + "epoch": 2.18, + "learning_rate": 3.6869183890023726e-07, + "loss": 0.5894, + "step": 84972 + }, + { + "epoch": 2.18, + "learning_rate": 3.686703798172818e-07, + "loss": 0.3887, + "step": 84973 + }, + { + "epoch": 2.18, + "learning_rate": 3.6864892121770606e-07, + "loss": 0.46, + "step": 84974 + }, + { + "epoch": 2.18, + "learning_rate": 3.686274631015268e-07, + "loss": 0.3683, + "step": 84975 + }, + { + "epoch": 2.18, + "learning_rate": 3.686060054687604e-07, + "loss": 0.4087, + "step": 84976 + }, + { + "epoch": 2.18, + "learning_rate": 3.6858454831942376e-07, + "loss": 0.3707, + "step": 84977 + }, + { + "epoch": 2.18, + "learning_rate": 3.685630916535326e-07, + "loss": 0.4319, + "step": 84978 + }, + { + "epoch": 2.18, + "learning_rate": 3.685416354711035e-07, + "loss": 0.4243, + "step": 84979 + }, + { + "epoch": 2.18, + "learning_rate": 3.685201797721532e-07, + "loss": 0.303, + "step": 84980 + }, + { + "epoch": 2.18, + "learning_rate": 3.684987245566982e-07, + "loss": 0.333, + "step": 84981 + }, + { + "epoch": 2.18, + "learning_rate": 3.684772698247547e-07, + "loss": 0.4526, + "step": 84982 + }, + { + "epoch": 2.18, + "learning_rate": 3.6845581557633886e-07, + "loss": 0.3184, + "step": 84983 + }, + { + "epoch": 2.18, + "learning_rate": 3.6843436181146727e-07, + "loss": 0.3727, + "step": 84984 + }, + { + "epoch": 2.18, + "learning_rate": 3.684129085301565e-07, + "loss": 0.3406, + "step": 84985 + }, + { + "epoch": 2.18, + "learning_rate": 3.6839145573242326e-07, + "loss": 0.2668, + "step": 84986 + }, + { + "epoch": 2.18, + "learning_rate": 3.6837000341828326e-07, + "loss": 0.4746, + "step": 84987 + }, + { + "epoch": 2.18, + "learning_rate": 3.6834855158775333e-07, + "loss": 0.4458, + "step": 84988 + }, + { + "epoch": 2.18, + "learning_rate": 3.683271002408499e-07, + "loss": 0.4419, + "step": 84989 + }, + { + "epoch": 2.18, + "learning_rate": 3.683056493775896e-07, + "loss": 0.4014, + "step": 84990 + }, + { + "epoch": 2.18, + "learning_rate": 3.6828419899798835e-07, + "loss": 0.5601, + "step": 84991 + }, + { + "epoch": 2.18, + "learning_rate": 3.6826274910206324e-07, + "loss": 0.4678, + "step": 84992 + }, + { + "epoch": 2.18, + "learning_rate": 3.6824129968982985e-07, + "loss": 0.5112, + "step": 84993 + }, + { + "epoch": 2.18, + "learning_rate": 3.6821985076130547e-07, + "loss": 0.5312, + "step": 84994 + }, + { + "epoch": 2.18, + "learning_rate": 3.6819840231650567e-07, + "loss": 0.408, + "step": 84995 + }, + { + "epoch": 2.18, + "learning_rate": 3.681769543554474e-07, + "loss": 0.222, + "step": 84996 + }, + { + "epoch": 2.18, + "learning_rate": 3.681555068781469e-07, + "loss": 0.3833, + "step": 84997 + }, + { + "epoch": 2.18, + "learning_rate": 3.681340598846211e-07, + "loss": 0.5103, + "step": 84998 + }, + { + "epoch": 2.18, + "learning_rate": 3.6811261337488565e-07, + "loss": 0.4241, + "step": 84999 + }, + { + "epoch": 2.18, + "learning_rate": 3.680911673489572e-07, + "loss": 0.4688, + "step": 85000 + } + ], + "logging_steps": 1.0, + "max_steps": 117048, + "num_train_epochs": 3, + "save_steps": 5000, + "total_flos": 2207165233029120.0, + "trial_name": null, + "trial_params": null +}